1 /*
2 * Copyright (c) 2017, Mellanox Technologies. All rights reserved.
3 *
4 * This software is available to you under a choice of one of two
5 * licenses. You may choose to be licensed under the terms of the GNU
6 * General Public License (GPL) Version 2, available from the file
7 * COPYING in the main directory of this source tree, or the
8 * OpenIB.org BSD license below:
9 *
10 * Redistribution and use in source and binary forms, with or
11 * without modification, are permitted provided that the following
12 * conditions are met:
13 *
14 * - Redistributions of source code must retain the above
15 * copyright notice, this list of conditions and the following
16 * disclaimer.
17 *
18 * - Redistributions in binary form must reproduce the above
19 * copyright notice, this list of conditions and the following
20 * disclaimer in the documentation and/or other materials
21 * provided with the distribution.
22 *
23 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
24 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
25 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
26 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
27 * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
28 * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
29 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
30 * SOFTWARE.
31 */
32
33 #include <rdma/ib_verbs.h>
34 #include <linux/mlx5/fs.h>
35 #include "en.h"
36 #include "en/params.h"
37 #include "ipoib.h"
38 #include "en/fs_ethtool.h"
39
40 #define IB_DEFAULT_Q_KEY 0xb1b
41 #define MLX5I_PARAMS_DEFAULT_LOG_RQ_SIZE 9
42
43 static int mlx5i_open(struct net_device *netdev);
44 static int mlx5i_close(struct net_device *netdev);
45 static int mlx5i_change_mtu(struct net_device *netdev, int new_mtu);
46
47 static const struct net_device_ops mlx5i_netdev_ops = {
48 .ndo_open = mlx5i_open,
49 .ndo_stop = mlx5i_close,
50 .ndo_get_stats64 = mlx5i_get_stats,
51 .ndo_init = mlx5i_dev_init,
52 .ndo_uninit = mlx5i_dev_cleanup,
53 .ndo_change_mtu = mlx5i_change_mtu,
54 .ndo_eth_ioctl = mlx5i_ioctl,
55 };
56
57 /* IPoIB mlx5 netdev profile */
mlx5i_build_nic_params(struct mlx5_core_dev * mdev,struct mlx5e_params * params)58 static void mlx5i_build_nic_params(struct mlx5_core_dev *mdev,
59 struct mlx5e_params *params)
60 {
61 /* Override RQ params as IPoIB supports only LINKED LIST RQ for now */
62 MLX5E_SET_PFLAG(params, MLX5E_PFLAG_RX_STRIDING_RQ, false);
63 mlx5e_set_rq_type(mdev, params);
64 mlx5e_init_rq_type_params(mdev, params);
65
66 /* RQ size in ipoib by default is 512 */
67 params->log_rq_mtu_frames = is_kdump_kernel() ?
68 MLX5E_PARAMS_MINIMUM_LOG_RQ_SIZE :
69 MLX5I_PARAMS_DEFAULT_LOG_RQ_SIZE;
70
71 params->packet_merge.type = MLX5E_PACKET_MERGE_NONE;
72 params->hard_mtu = MLX5_IB_GRH_BYTES + MLX5_IPOIB_HARD_LEN;
73
74 /* CQE compression is not supported for IPoIB */
75 params->rx_cqe_compress_def = false;
76 MLX5E_SET_PFLAG(params, MLX5E_PFLAG_RX_CQE_COMPRESS, params->rx_cqe_compress_def);
77 }
78
79 /* Called directly after IPoIB netdevice was created to initialize SW structs */
mlx5i_init(struct mlx5_core_dev * mdev,struct net_device * netdev)80 int mlx5i_init(struct mlx5_core_dev *mdev, struct net_device *netdev)
81 {
82 struct mlx5e_priv *priv = mlx5i_epriv(netdev);
83
84 netif_carrier_off(netdev);
85 mlx5e_set_netdev_mtu_boundaries(priv);
86 netdev->mtu = netdev->max_mtu;
87
88 mlx5e_build_nic_params(priv, NULL, netdev->mtu);
89 mlx5i_build_nic_params(mdev, &priv->channels.params);
90
91 mlx5e_timestamp_init(priv);
92
93 /* netdev init */
94 netdev->hw_features |= NETIF_F_SG;
95 netdev->hw_features |= NETIF_F_IP_CSUM;
96 netdev->hw_features |= NETIF_F_IPV6_CSUM;
97 netdev->hw_features |= NETIF_F_GRO;
98 netdev->hw_features |= NETIF_F_TSO;
99 netdev->hw_features |= NETIF_F_TSO6;
100 netdev->hw_features |= NETIF_F_RXCSUM;
101 netdev->hw_features |= NETIF_F_RXHASH;
102
103 netdev->netdev_ops = &mlx5i_netdev_ops;
104 netdev->ethtool_ops = &mlx5i_ethtool_ops;
105
106 return 0;
107 }
108
109 /* Called directly before IPoIB netdevice is destroyed to cleanup SW structs */
mlx5i_cleanup(struct mlx5e_priv * priv)110 void mlx5i_cleanup(struct mlx5e_priv *priv)
111 {
112 mlx5e_priv_cleanup(priv);
113 }
114
mlx5i_grp_sw_update_stats(struct mlx5e_priv * priv)115 static void mlx5i_grp_sw_update_stats(struct mlx5e_priv *priv)
116 {
117 struct rtnl_link_stats64 s = {};
118 int i, j;
119
120 for (i = 0; i < priv->stats_nch; i++) {
121 struct mlx5e_channel_stats *channel_stats;
122 struct mlx5e_rq_stats *rq_stats;
123
124 channel_stats = priv->channel_stats[i];
125 rq_stats = &channel_stats->rq;
126
127 s.rx_packets += rq_stats->packets;
128 s.rx_bytes += rq_stats->bytes;
129
130 for (j = 0; j < priv->max_opened_tc; j++) {
131 struct mlx5e_sq_stats *sq_stats = &channel_stats->sq[j];
132
133 s.tx_packets += sq_stats->packets;
134 s.tx_bytes += sq_stats->bytes;
135 s.tx_dropped += sq_stats->dropped;
136 }
137 }
138
139 memset(&priv->stats.sw, 0, sizeof(s));
140
141 priv->stats.sw.rx_packets = s.rx_packets;
142 priv->stats.sw.rx_bytes = s.rx_bytes;
143 priv->stats.sw.tx_packets = s.tx_packets;
144 priv->stats.sw.tx_bytes = s.tx_bytes;
145 priv->stats.sw.tx_queue_dropped = s.tx_dropped;
146 }
147
mlx5i_get_stats(struct net_device * dev,struct rtnl_link_stats64 * stats)148 void mlx5i_get_stats(struct net_device *dev, struct rtnl_link_stats64 *stats)
149 {
150 struct mlx5e_priv *priv = mlx5i_epriv(dev);
151 struct mlx5e_sw_stats *sstats = &priv->stats.sw;
152
153 mlx5i_grp_sw_update_stats(priv);
154
155 stats->rx_packets = sstats->rx_packets;
156 stats->rx_bytes = sstats->rx_bytes;
157 stats->tx_packets = sstats->tx_packets;
158 stats->tx_bytes = sstats->tx_bytes;
159 stats->tx_dropped = sstats->tx_queue_dropped;
160 }
161
mlx5i_parent_get(struct net_device * netdev)162 struct net_device *mlx5i_parent_get(struct net_device *netdev)
163 {
164 struct mlx5e_priv *priv = mlx5i_epriv(netdev);
165 struct mlx5i_priv *ipriv, *parent_ipriv;
166 struct net_device *parent_dev;
167 int parent_ifindex;
168
169 ipriv = priv->ppriv;
170
171 parent_ifindex = netdev->netdev_ops->ndo_get_iflink(netdev);
172 parent_dev = dev_get_by_index(dev_net(netdev), parent_ifindex);
173 if (!parent_dev)
174 return NULL;
175
176 parent_ipriv = netdev_priv(parent_dev);
177
178 ASSERT_RTNL();
179 parent_ipriv->num_sub_interfaces++;
180
181 ipriv->parent_dev = parent_dev;
182
183 return parent_dev;
184 }
185
mlx5i_parent_put(struct net_device * netdev)186 void mlx5i_parent_put(struct net_device *netdev)
187 {
188 struct mlx5e_priv *priv = mlx5i_epriv(netdev);
189 struct mlx5i_priv *ipriv, *parent_ipriv;
190
191 ipriv = priv->ppriv;
192 parent_ipriv = netdev_priv(ipriv->parent_dev);
193
194 ASSERT_RTNL();
195 parent_ipriv->num_sub_interfaces--;
196
197 dev_put(ipriv->parent_dev);
198 }
199
mlx5i_init_underlay_qp(struct mlx5e_priv * priv)200 int mlx5i_init_underlay_qp(struct mlx5e_priv *priv)
201 {
202 struct mlx5_core_dev *mdev = priv->mdev;
203 struct mlx5i_priv *ipriv = priv->ppriv;
204 int ret;
205
206 {
207 u32 in[MLX5_ST_SZ_DW(rst2init_qp_in)] = {};
208 u32 *qpc;
209
210 qpc = MLX5_ADDR_OF(rst2init_qp_in, in, qpc);
211
212 MLX5_SET(qpc, qpc, pm_state, MLX5_QP_PM_MIGRATED);
213 MLX5_SET(qpc, qpc, primary_address_path.pkey_index,
214 ipriv->pkey_index);
215 MLX5_SET(qpc, qpc, primary_address_path.vhca_port_num, 1);
216 MLX5_SET(qpc, qpc, q_key, IB_DEFAULT_Q_KEY);
217
218 MLX5_SET(rst2init_qp_in, in, opcode, MLX5_CMD_OP_RST2INIT_QP);
219 MLX5_SET(rst2init_qp_in, in, qpn, ipriv->qpn);
220 ret = mlx5_cmd_exec_in(mdev, rst2init_qp, in);
221 if (ret)
222 goto err_qp_modify_to_err;
223 }
224 {
225 u32 in[MLX5_ST_SZ_DW(init2rtr_qp_in)] = {};
226
227 MLX5_SET(init2rtr_qp_in, in, opcode, MLX5_CMD_OP_INIT2RTR_QP);
228 MLX5_SET(init2rtr_qp_in, in, qpn, ipriv->qpn);
229 ret = mlx5_cmd_exec_in(mdev, init2rtr_qp, in);
230 if (ret)
231 goto err_qp_modify_to_err;
232 }
233 {
234 u32 in[MLX5_ST_SZ_DW(rtr2rts_qp_in)] = {};
235
236 MLX5_SET(rtr2rts_qp_in, in, opcode, MLX5_CMD_OP_RTR2RTS_QP);
237 MLX5_SET(rtr2rts_qp_in, in, qpn, ipriv->qpn);
238 ret = mlx5_cmd_exec_in(mdev, rtr2rts_qp, in);
239 if (ret)
240 goto err_qp_modify_to_err;
241 }
242 return 0;
243
244 err_qp_modify_to_err:
245 {
246 u32 in[MLX5_ST_SZ_DW(qp_2err_in)] = {};
247
248 MLX5_SET(qp_2err_in, in, opcode, MLX5_CMD_OP_2ERR_QP);
249 MLX5_SET(qp_2err_in, in, qpn, ipriv->qpn);
250 mlx5_cmd_exec_in(mdev, qp_2err, in);
251 }
252 return ret;
253 }
254
mlx5i_uninit_underlay_qp(struct mlx5e_priv * priv)255 void mlx5i_uninit_underlay_qp(struct mlx5e_priv *priv)
256 {
257 struct mlx5i_priv *ipriv = priv->ppriv;
258 struct mlx5_core_dev *mdev = priv->mdev;
259 u32 in[MLX5_ST_SZ_DW(qp_2rst_in)] = {};
260
261 MLX5_SET(qp_2rst_in, in, opcode, MLX5_CMD_OP_2RST_QP);
262 MLX5_SET(qp_2rst_in, in, qpn, ipriv->qpn);
263 mlx5_cmd_exec_in(mdev, qp_2rst, in);
264 }
265
266 #define MLX5_QP_ENHANCED_ULP_STATELESS_MODE 2
267
mlx5i_create_underlay_qp(struct mlx5e_priv * priv)268 int mlx5i_create_underlay_qp(struct mlx5e_priv *priv)
269 {
270 const unsigned char *dev_addr = priv->netdev->dev_addr;
271 u32 out[MLX5_ST_SZ_DW(create_qp_out)] = {};
272 u32 in[MLX5_ST_SZ_DW(create_qp_in)] = {};
273 struct mlx5i_priv *ipriv = priv->ppriv;
274 void *addr_path;
275 int qpn = 0;
276 int ret = 0;
277 void *qpc;
278
279 if (MLX5_CAP_GEN(priv->mdev, mkey_by_name)) {
280 qpn = (dev_addr[1] << 16) + (dev_addr[2] << 8) + dev_addr[3];
281 MLX5_SET(create_qp_in, in, input_qpn, qpn);
282 }
283
284 qpc = MLX5_ADDR_OF(create_qp_in, in, qpc);
285 MLX5_SET(qpc, qpc, ts_format, mlx5_get_qp_default_ts(priv->mdev));
286 MLX5_SET(qpc, qpc, st, MLX5_QP_ST_UD);
287 MLX5_SET(qpc, qpc, pm_state, MLX5_QP_PM_MIGRATED);
288 MLX5_SET(qpc, qpc, ulp_stateless_offload_mode,
289 MLX5_QP_ENHANCED_ULP_STATELESS_MODE);
290
291 addr_path = MLX5_ADDR_OF(qpc, qpc, primary_address_path);
292 MLX5_SET(ads, addr_path, vhca_port_num, 1);
293 MLX5_SET(ads, addr_path, grh, 1);
294
295 MLX5_SET(create_qp_in, in, opcode, MLX5_CMD_OP_CREATE_QP);
296 ret = mlx5_cmd_exec_inout(priv->mdev, create_qp, in, out);
297 if (ret)
298 return ret;
299
300 ipriv->qpn = MLX5_GET(create_qp_out, out, qpn);
301
302 return 0;
303 }
304
mlx5i_destroy_underlay_qp(struct mlx5_core_dev * mdev,u32 qpn)305 void mlx5i_destroy_underlay_qp(struct mlx5_core_dev *mdev, u32 qpn)
306 {
307 u32 in[MLX5_ST_SZ_DW(destroy_qp_in)] = {};
308
309 MLX5_SET(destroy_qp_in, in, opcode, MLX5_CMD_OP_DESTROY_QP);
310 MLX5_SET(destroy_qp_in, in, qpn, qpn);
311 mlx5_cmd_exec_in(mdev, destroy_qp, in);
312 }
313
mlx5i_update_nic_rx(struct mlx5e_priv * priv)314 int mlx5i_update_nic_rx(struct mlx5e_priv *priv)
315 {
316 return mlx5e_refresh_tirs(priv, true, true);
317 }
318
mlx5i_create_tis(struct mlx5_core_dev * mdev,u32 underlay_qpn,u32 * tisn)319 int mlx5i_create_tis(struct mlx5_core_dev *mdev, u32 underlay_qpn, u32 *tisn)
320 {
321 u32 in[MLX5_ST_SZ_DW(create_tis_in)] = {};
322 void *tisc;
323
324 tisc = MLX5_ADDR_OF(create_tis_in, in, ctx);
325
326 MLX5_SET(tisc, tisc, underlay_qpn, underlay_qpn);
327
328 return mlx5e_create_tis(mdev, in, tisn);
329 }
330
mlx5i_init_tx(struct mlx5e_priv * priv)331 static int mlx5i_init_tx(struct mlx5e_priv *priv)
332 {
333 struct mlx5i_priv *ipriv = priv->ppriv;
334 int err;
335
336 err = mlx5i_create_underlay_qp(priv);
337 if (err) {
338 mlx5_core_warn(priv->mdev, "create underlay QP failed, %d\n", err);
339 return err;
340 }
341
342 err = mlx5i_create_tis(priv->mdev, ipriv->qpn, &ipriv->tisn);
343 if (err) {
344 mlx5_core_warn(priv->mdev, "create tis failed, %d\n", err);
345 goto err_destroy_underlay_qp;
346 }
347
348 return 0;
349
350 err_destroy_underlay_qp:
351 mlx5i_destroy_underlay_qp(priv->mdev, ipriv->qpn);
352 return err;
353 }
354
mlx5i_cleanup_tx(struct mlx5e_priv * priv)355 static void mlx5i_cleanup_tx(struct mlx5e_priv *priv)
356 {
357 struct mlx5i_priv *ipriv = priv->ppriv;
358
359 mlx5e_destroy_tis(priv->mdev, ipriv->tisn);
360 mlx5i_destroy_underlay_qp(priv->mdev, ipriv->qpn);
361 }
362
mlx5i_create_flow_steering(struct mlx5e_priv * priv)363 static int mlx5i_create_flow_steering(struct mlx5e_priv *priv)
364 {
365 struct mlx5_flow_namespace *ns =
366 mlx5_get_flow_namespace(priv->mdev, MLX5_FLOW_NAMESPACE_KERNEL);
367 int err;
368
369
370 if (!ns)
371 return -EINVAL;
372
373 mlx5e_fs_set_ns(priv->fs, ns, false);
374 err = mlx5e_arfs_create_tables(priv->fs, priv->rx_res,
375 mlx5e_fs_has_arfs(priv->netdev));
376 if (err) {
377 netdev_err(priv->netdev, "Failed to create arfs tables, err=%d\n",
378 err);
379 priv->netdev->hw_features &= ~NETIF_F_NTUPLE;
380 }
381
382 err = mlx5e_create_ttc_table(priv->fs, priv->rx_res);
383 if (err) {
384 netdev_err(priv->netdev, "Failed to create ttc table, err=%d\n",
385 err);
386 goto err_destroy_arfs_tables;
387 }
388
389 mlx5e_ethtool_init_steering(priv->fs);
390
391 return 0;
392
393 err_destroy_arfs_tables:
394 mlx5e_arfs_destroy_tables(priv->fs, mlx5e_fs_has_arfs(priv->netdev));
395
396 return err;
397 }
398
mlx5i_destroy_flow_steering(struct mlx5e_priv * priv)399 static void mlx5i_destroy_flow_steering(struct mlx5e_priv *priv)
400 {
401 mlx5e_destroy_ttc_table(priv->fs);
402 mlx5e_arfs_destroy_tables(priv->fs, mlx5e_fs_has_arfs(priv->netdev));
403 mlx5e_ethtool_cleanup_steering(priv->fs);
404 }
405
mlx5i_init_rx(struct mlx5e_priv * priv)406 static int mlx5i_init_rx(struct mlx5e_priv *priv)
407 {
408 struct mlx5_core_dev *mdev = priv->mdev;
409 int err;
410
411 priv->fs = mlx5e_fs_init(priv->profile, mdev,
412 !test_bit(MLX5E_STATE_DESTROYING, &priv->state),
413 priv->dfs_root);
414 if (!priv->fs) {
415 netdev_err(priv->netdev, "FS allocation failed\n");
416 return -ENOMEM;
417 }
418
419 mlx5e_create_q_counters(priv);
420
421 err = mlx5e_open_drop_rq(priv, &priv->drop_rq);
422 if (err) {
423 mlx5_core_err(mdev, "open drop rq failed, %d\n", err);
424 goto err_destroy_q_counters;
425 }
426
427 priv->rx_res = mlx5e_rx_res_create(priv->mdev, 0, priv->max_nch, priv->drop_rq.rqn,
428 &priv->channels.params.packet_merge,
429 priv->channels.params.num_channels);
430 if (IS_ERR(priv->rx_res)) {
431 err = PTR_ERR(priv->rx_res);
432 goto err_close_drop_rq;
433 }
434
435 err = mlx5i_create_flow_steering(priv);
436 if (err)
437 goto err_destroy_rx_res;
438
439 return 0;
440
441 err_destroy_rx_res:
442 mlx5e_rx_res_destroy(priv->rx_res);
443 priv->rx_res = ERR_PTR(-EINVAL);
444 err_close_drop_rq:
445 mlx5e_close_drop_rq(&priv->drop_rq);
446 err_destroy_q_counters:
447 mlx5e_destroy_q_counters(priv);
448 mlx5e_fs_cleanup(priv->fs);
449 return err;
450 }
451
mlx5i_cleanup_rx(struct mlx5e_priv * priv)452 static void mlx5i_cleanup_rx(struct mlx5e_priv *priv)
453 {
454 mlx5i_destroy_flow_steering(priv);
455 mlx5e_rx_res_destroy(priv->rx_res);
456 priv->rx_res = ERR_PTR(-EINVAL);
457 mlx5e_close_drop_rq(&priv->drop_rq);
458 mlx5e_destroy_q_counters(priv);
459 mlx5e_fs_cleanup(priv->fs);
460 }
461
462 /* The stats groups order is opposite to the update_stats() order calls */
463 static mlx5e_stats_grp_t mlx5i_stats_grps[] = {
464 &MLX5E_STATS_GRP(sw),
465 &MLX5E_STATS_GRP(qcnt),
466 &MLX5E_STATS_GRP(vnic_env),
467 &MLX5E_STATS_GRP(vport),
468 &MLX5E_STATS_GRP(802_3),
469 &MLX5E_STATS_GRP(2863),
470 &MLX5E_STATS_GRP(2819),
471 &MLX5E_STATS_GRP(phy),
472 &MLX5E_STATS_GRP(pcie),
473 &MLX5E_STATS_GRP(per_prio),
474 &MLX5E_STATS_GRP(pme),
475 &MLX5E_STATS_GRP(channels),
476 &MLX5E_STATS_GRP(per_port_buff_congest),
477 };
478
mlx5i_stats_grps_num(struct mlx5e_priv * priv)479 static unsigned int mlx5i_stats_grps_num(struct mlx5e_priv *priv)
480 {
481 return ARRAY_SIZE(mlx5i_stats_grps);
482 }
483
mlx5i_get_tisn(struct mlx5_core_dev * mdev,struct mlx5e_priv * priv,u8 lag_port,u8 tc)484 u32 mlx5i_get_tisn(struct mlx5_core_dev *mdev, struct mlx5e_priv *priv, u8 lag_port, u8 tc)
485 {
486 struct mlx5i_priv *ipriv = priv->ppriv;
487
488 if (WARN(lag_port || tc,
489 "IPoIB unexpected non-zero value: lag_port (%u), tc (%u)\n",
490 lag_port, tc))
491 return 0;
492
493 return ipriv->tisn;
494 }
495
496 static const struct mlx5e_profile mlx5i_nic_profile = {
497 .init = mlx5i_init,
498 .cleanup = mlx5i_cleanup,
499 .init_tx = mlx5i_init_tx,
500 .cleanup_tx = mlx5i_cleanup_tx,
501 .init_rx = mlx5i_init_rx,
502 .cleanup_rx = mlx5i_cleanup_rx,
503 .enable = NULL, /* mlx5i_enable */
504 .disable = NULL, /* mlx5i_disable */
505 .update_rx = mlx5i_update_nic_rx,
506 .update_stats = NULL, /* mlx5i_update_stats */
507 .update_carrier = NULL, /* no HW update in IB link */
508 .rx_handlers = &mlx5i_rx_handlers,
509 .max_tc = MLX5I_MAX_NUM_TC,
510 .stats_grps = mlx5i_stats_grps,
511 .stats_grps_num = mlx5i_stats_grps_num,
512 .get_tisn = mlx5i_get_tisn,
513 };
514
515 /* mlx5i netdev NDos */
516
mlx5i_change_mtu(struct net_device * netdev,int new_mtu)517 static int mlx5i_change_mtu(struct net_device *netdev, int new_mtu)
518 {
519 struct mlx5e_priv *priv = mlx5i_epriv(netdev);
520 struct mlx5e_params new_params;
521 int err = 0;
522
523 mutex_lock(&priv->state_lock);
524
525 new_params = priv->channels.params;
526 new_params.sw_mtu = new_mtu;
527
528 err = mlx5e_safe_switch_params(priv, &new_params, NULL, NULL, true);
529 if (err)
530 goto out;
531
532 WRITE_ONCE(netdev->mtu, new_params.sw_mtu);
533
534 out:
535 mutex_unlock(&priv->state_lock);
536 return err;
537 }
538
mlx5i_dev_init(struct net_device * dev)539 int mlx5i_dev_init(struct net_device *dev)
540 {
541 struct mlx5e_priv *priv = mlx5i_epriv(dev);
542 struct mlx5i_priv *ipriv = priv->ppriv;
543 u8 addr_mod[3];
544
545 /* Set dev address using underlay QP */
546 addr_mod[0] = (ipriv->qpn >> 16) & 0xff;
547 addr_mod[1] = (ipriv->qpn >> 8) & 0xff;
548 addr_mod[2] = (ipriv->qpn) & 0xff;
549 dev_addr_mod(dev, 1, addr_mod, sizeof(addr_mod));
550
551 /* Add QPN to net-device mapping to HT */
552 mlx5i_pkey_add_qpn(dev, ipriv->qpn);
553
554 return 0;
555 }
556
mlx5i_ioctl(struct net_device * dev,struct ifreq * ifr,int cmd)557 int mlx5i_ioctl(struct net_device *dev, struct ifreq *ifr, int cmd)
558 {
559 struct mlx5e_priv *priv = mlx5i_epriv(dev);
560
561 switch (cmd) {
562 case SIOCSHWTSTAMP:
563 return mlx5e_hwstamp_set(priv, ifr);
564 case SIOCGHWTSTAMP:
565 return mlx5e_hwstamp_get(priv, ifr);
566 default:
567 return -EOPNOTSUPP;
568 }
569 }
570
mlx5i_dev_cleanup(struct net_device * dev)571 void mlx5i_dev_cleanup(struct net_device *dev)
572 {
573 struct mlx5e_priv *priv = mlx5i_epriv(dev);
574 struct mlx5i_priv *ipriv = priv->ppriv;
575
576 mlx5i_uninit_underlay_qp(priv);
577
578 /* Delete QPN to net-device mapping from HT */
579 mlx5i_pkey_del_qpn(dev, ipriv->qpn);
580 }
581
mlx5i_open(struct net_device * netdev)582 static int mlx5i_open(struct net_device *netdev)
583 {
584 struct mlx5e_priv *epriv = mlx5i_epriv(netdev);
585 struct mlx5i_priv *ipriv = epriv->ppriv;
586 struct mlx5_core_dev *mdev = epriv->mdev;
587 int err;
588
589 mutex_lock(&epriv->state_lock);
590
591 set_bit(MLX5E_STATE_OPENED, &epriv->state);
592
593 err = mlx5i_init_underlay_qp(epriv);
594 if (err) {
595 mlx5_core_warn(mdev, "prepare underlay qp state failed, %d\n", err);
596 goto err_clear_state_opened_flag;
597 }
598
599 err = mlx5_fs_add_rx_underlay_qpn(mdev, ipriv->qpn);
600 if (err) {
601 mlx5_core_warn(mdev, "attach underlay qp to ft failed, %d\n", err);
602 goto err_reset_qp;
603 }
604
605 err = mlx5e_open_channels(epriv, &epriv->channels);
606 if (err)
607 goto err_remove_fs_underlay_qp;
608
609 err = epriv->profile->update_rx(epriv);
610 if (err)
611 goto err_close_channels;
612
613 mlx5e_activate_priv_channels(epriv);
614
615 mutex_unlock(&epriv->state_lock);
616 return 0;
617
618 err_close_channels:
619 mlx5e_close_channels(&epriv->channels);
620 err_remove_fs_underlay_qp:
621 mlx5_fs_remove_rx_underlay_qpn(mdev, ipriv->qpn);
622 err_reset_qp:
623 mlx5i_uninit_underlay_qp(epriv);
624 err_clear_state_opened_flag:
625 clear_bit(MLX5E_STATE_OPENED, &epriv->state);
626 mutex_unlock(&epriv->state_lock);
627 return err;
628 }
629
mlx5i_close(struct net_device * netdev)630 static int mlx5i_close(struct net_device *netdev)
631 {
632 struct mlx5e_priv *epriv = mlx5i_epriv(netdev);
633 struct mlx5i_priv *ipriv = epriv->ppriv;
634 struct mlx5_core_dev *mdev = epriv->mdev;
635
636 /* May already be CLOSED in case a previous configuration operation
637 * (e.g RX/TX queue size change) that involves close&open failed.
638 */
639 mutex_lock(&epriv->state_lock);
640
641 if (!test_bit(MLX5E_STATE_OPENED, &epriv->state))
642 goto unlock;
643
644 clear_bit(MLX5E_STATE_OPENED, &epriv->state);
645
646 netif_carrier_off(epriv->netdev);
647 mlx5_fs_remove_rx_underlay_qpn(mdev, ipriv->qpn);
648 mlx5e_deactivate_priv_channels(epriv);
649 mlx5e_close_channels(&epriv->channels);
650 mlx5i_uninit_underlay_qp(epriv);
651 unlock:
652 mutex_unlock(&epriv->state_lock);
653 return 0;
654 }
655
656 /* IPoIB RDMA netdev callbacks */
mlx5i_attach_mcast(struct net_device * netdev,struct ib_device * hca,union ib_gid * gid,u16 lid,int set_qkey,u32 qkey)657 static int mlx5i_attach_mcast(struct net_device *netdev, struct ib_device *hca,
658 union ib_gid *gid, u16 lid, int set_qkey,
659 u32 qkey)
660 {
661 struct mlx5e_priv *epriv = mlx5i_epriv(netdev);
662 struct mlx5_core_dev *mdev = epriv->mdev;
663 struct mlx5i_priv *ipriv = epriv->ppriv;
664 int err;
665
666 mlx5_core_dbg(mdev, "attaching QPN 0x%x, MGID %pI6\n", ipriv->qpn,
667 gid->raw);
668 err = mlx5_core_attach_mcg(mdev, gid, ipriv->qpn);
669 if (err)
670 mlx5_core_warn(mdev, "failed attaching QPN 0x%x, MGID %pI6\n",
671 ipriv->qpn, gid->raw);
672
673 if (set_qkey) {
674 mlx5_core_dbg(mdev, "%s setting qkey 0x%x\n",
675 netdev->name, qkey);
676 ipriv->qkey = qkey;
677 }
678
679 return err;
680 }
681
mlx5i_detach_mcast(struct net_device * netdev,struct ib_device * hca,union ib_gid * gid,u16 lid)682 static int mlx5i_detach_mcast(struct net_device *netdev, struct ib_device *hca,
683 union ib_gid *gid, u16 lid)
684 {
685 struct mlx5e_priv *epriv = mlx5i_epriv(netdev);
686 struct mlx5_core_dev *mdev = epriv->mdev;
687 struct mlx5i_priv *ipriv = epriv->ppriv;
688 int err;
689
690 mlx5_core_dbg(mdev, "detaching QPN 0x%x, MGID %pI6\n", ipriv->qpn,
691 gid->raw);
692
693 err = mlx5_core_detach_mcg(mdev, gid, ipriv->qpn);
694 if (err)
695 mlx5_core_dbg(mdev, "failed detaching QPN 0x%x, MGID %pI6\n",
696 ipriv->qpn, gid->raw);
697
698 return err;
699 }
700
mlx5i_xmit(struct net_device * dev,struct sk_buff * skb,struct ib_ah * address,u32 dqpn)701 static int mlx5i_xmit(struct net_device *dev, struct sk_buff *skb,
702 struct ib_ah *address, u32 dqpn)
703 {
704 struct mlx5e_priv *epriv = mlx5i_epriv(dev);
705 struct mlx5e_txqsq *sq = epriv->txq2sq[skb_get_queue_mapping(skb)];
706 struct mlx5_ib_ah *mah = to_mah(address);
707 struct mlx5i_priv *ipriv = epriv->ppriv;
708
709 mlx5i_sq_xmit(sq, skb, &mah->av, dqpn, ipriv->qkey, netdev_xmit_more());
710
711 return NETDEV_TX_OK;
712 }
713
mlx5i_set_pkey_index(struct net_device * netdev,int id)714 static void mlx5i_set_pkey_index(struct net_device *netdev, int id)
715 {
716 struct mlx5i_priv *ipriv = netdev_priv(netdev);
717
718 ipriv->pkey_index = (u16)id;
719 }
720
mlx5i_check_required_hca_cap(struct mlx5_core_dev * mdev)721 static int mlx5i_check_required_hca_cap(struct mlx5_core_dev *mdev)
722 {
723 if (MLX5_CAP_GEN(mdev, port_type) != MLX5_CAP_PORT_TYPE_IB)
724 return -EOPNOTSUPP;
725
726 if (!MLX5_CAP_GEN(mdev, ipoib_enhanced_offloads)) {
727 mlx5_core_warn(mdev, "IPoIB enhanced offloads are not supported\n");
728 return -EOPNOTSUPP;
729 }
730
731 return 0;
732 }
733
mlx5_rdma_netdev_free(struct net_device * netdev)734 static void mlx5_rdma_netdev_free(struct net_device *netdev)
735 {
736 struct mlx5e_priv *priv = mlx5i_epriv(netdev);
737 struct mlx5_core_dev *mdev = priv->mdev;
738 struct mlx5i_priv *ipriv = priv->ppriv;
739 const struct mlx5e_profile *profile = priv->profile;
740
741 mlx5e_detach_netdev(priv);
742 profile->cleanup(priv);
743
744 if (!ipriv->sub_interface) {
745 mlx5i_pkey_qpn_ht_cleanup(netdev);
746 mlx5e_destroy_mdev_resources(mdev);
747 }
748 }
749
mlx5_is_sub_interface(struct mlx5_core_dev * mdev)750 static bool mlx5_is_sub_interface(struct mlx5_core_dev *mdev)
751 {
752 return mdev->mlx5e_res.hw_objs.pdn != 0;
753 }
754
mlx5_get_profile(struct mlx5_core_dev * mdev)755 static const struct mlx5e_profile *mlx5_get_profile(struct mlx5_core_dev *mdev)
756 {
757 if (mlx5_is_sub_interface(mdev))
758 return mlx5i_pkey_get_profile();
759 return &mlx5i_nic_profile;
760 }
761
mlx5_rdma_setup_rn(struct ib_device * ibdev,u32 port_num,struct net_device * netdev,void * param)762 static int mlx5_rdma_setup_rn(struct ib_device *ibdev, u32 port_num,
763 struct net_device *netdev, void *param)
764 {
765 struct mlx5_core_dev *mdev = (struct mlx5_core_dev *)param;
766 const struct mlx5e_profile *prof = mlx5_get_profile(mdev);
767 struct mlx5i_priv *ipriv;
768 struct mlx5e_priv *epriv;
769 struct rdma_netdev *rn;
770 int err;
771
772 ipriv = netdev_priv(netdev);
773 epriv = mlx5i_epriv(netdev);
774
775 ipriv->sub_interface = mlx5_is_sub_interface(mdev);
776 if (!ipriv->sub_interface) {
777 err = mlx5i_pkey_qpn_ht_init(netdev);
778 if (err) {
779 mlx5_core_warn(mdev, "allocate qpn_to_netdev ht failed\n");
780 return err;
781 }
782
783 /* This should only be called once per mdev */
784 err = mlx5e_create_mdev_resources(mdev, false);
785 if (err)
786 goto destroy_ht;
787 }
788
789 err = mlx5e_priv_init(epriv, prof, netdev, mdev);
790 if (err)
791 goto destroy_mdev_resources;
792
793 epriv->profile = prof;
794 epriv->ppriv = ipriv;
795
796 prof->init(mdev, netdev);
797
798 err = mlx5e_attach_netdev(epriv);
799 if (err)
800 goto detach;
801 netif_carrier_off(netdev);
802
803 /* set rdma_netdev func pointers */
804 rn = &ipriv->rn;
805 rn->hca = ibdev;
806 rn->send = mlx5i_xmit;
807 rn->attach_mcast = mlx5i_attach_mcast;
808 rn->detach_mcast = mlx5i_detach_mcast;
809 rn->set_id = mlx5i_set_pkey_index;
810
811 netdev->priv_destructor = mlx5_rdma_netdev_free;
812 netdev->needs_free_netdev = 1;
813
814 return 0;
815
816 detach:
817 prof->cleanup(epriv);
818 if (ipriv->sub_interface)
819 return err;
820 destroy_mdev_resources:
821 mlx5e_destroy_mdev_resources(mdev);
822 destroy_ht:
823 mlx5i_pkey_qpn_ht_cleanup(netdev);
824 return err;
825 }
826
mlx5_rdma_rn_get_params(struct mlx5_core_dev * mdev,struct ib_device * device,struct rdma_netdev_alloc_params * params)827 int mlx5_rdma_rn_get_params(struct mlx5_core_dev *mdev,
828 struct ib_device *device,
829 struct rdma_netdev_alloc_params *params)
830 {
831 int nch;
832 int rc;
833
834 rc = mlx5i_check_required_hca_cap(mdev);
835 if (rc)
836 return rc;
837
838 nch = mlx5e_get_max_num_channels(mdev);
839
840 *params = (struct rdma_netdev_alloc_params){
841 .sizeof_priv = sizeof(struct mlx5i_priv) +
842 sizeof(struct mlx5e_priv),
843 .txqs = nch * MLX5_MAX_NUM_TC,
844 .rxqs = nch,
845 .param = mdev,
846 .initialize_rdma_netdev = mlx5_rdma_setup_rn,
847 };
848
849 return 0;
850 }
851 EXPORT_SYMBOL(mlx5_rdma_rn_get_params);
852