xref: /linux/drivers/net/ethernet/mellanox/mlx5/core/ipoib/ipoib.c (revision ab93e0dd72c37d378dd936f031ffb83ff2bd87ce)
1 /*
2  * Copyright (c) 2017, Mellanox Technologies. All rights reserved.
3  *
4  * This software is available to you under a choice of one of two
5  * licenses.  You may choose to be licensed under the terms of the GNU
6  * General Public License (GPL) Version 2, available from the file
7  * COPYING in the main directory of this source tree, or the
8  * OpenIB.org BSD license below:
9  *
10  *     Redistribution and use in source and binary forms, with or
11  *     without modification, are permitted provided that the following
12  *     conditions are met:
13  *
14  *      - Redistributions of source code must retain the above
15  *        copyright notice, this list of conditions and the following
16  *        disclaimer.
17  *
18  *      - Redistributions in binary form must reproduce the above
19  *        copyright notice, this list of conditions and the following
20  *        disclaimer in the documentation and/or other materials
21  *        provided with the distribution.
22  *
23  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
24  * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
25  * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
26  * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
27  * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
28  * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
29  * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
30  * SOFTWARE.
31  */
32 
33 #include <rdma/ib_verbs.h>
34 #include <linux/mlx5/fs.h>
35 #include <net/netdev_lock.h>
36 #include "en.h"
37 #include "en/params.h"
38 #include "ipoib.h"
39 #include "en/fs_ethtool.h"
40 
41 #define IB_DEFAULT_Q_KEY   0xb1b
42 #define MLX5I_PARAMS_DEFAULT_LOG_RQ_SIZE 9
43 
44 static int mlx5i_open(struct net_device *netdev);
45 static int mlx5i_close(struct net_device *netdev);
46 static int mlx5i_change_mtu(struct net_device *netdev, int new_mtu);
47 
48 static const struct net_device_ops mlx5i_netdev_ops = {
49 	.ndo_open                = mlx5i_open,
50 	.ndo_stop                = mlx5i_close,
51 	.ndo_get_stats64         = mlx5i_get_stats,
52 	.ndo_init                = mlx5i_dev_init,
53 	.ndo_uninit              = mlx5i_dev_cleanup,
54 	.ndo_change_mtu          = mlx5i_change_mtu,
55 	.ndo_eth_ioctl            = mlx5i_ioctl,
56 };
57 
58 /* IPoIB mlx5 netdev profile */
mlx5i_build_nic_params(struct mlx5_core_dev * mdev,struct mlx5e_params * params)59 static void mlx5i_build_nic_params(struct mlx5_core_dev *mdev,
60 				   struct mlx5e_params *params)
61 {
62 	/* Override RQ params as IPoIB supports only LINKED LIST RQ for now */
63 	MLX5E_SET_PFLAG(params, MLX5E_PFLAG_RX_STRIDING_RQ, false);
64 	mlx5e_set_rq_type(mdev, params);
65 	mlx5e_init_rq_type_params(mdev, params);
66 
67 	/* RQ size in ipoib by default is 512 */
68 	params->log_rq_mtu_frames = is_kdump_kernel() ?
69 		MLX5E_PARAMS_MINIMUM_LOG_RQ_SIZE :
70 		MLX5I_PARAMS_DEFAULT_LOG_RQ_SIZE;
71 
72 	params->packet_merge.type = MLX5E_PACKET_MERGE_NONE;
73 	params->hard_mtu = MLX5_IB_GRH_BYTES + MLX5_IPOIB_HARD_LEN;
74 
75 	/* CQE compression is not supported for IPoIB */
76 	params->rx_cqe_compress_def = false;
77 	MLX5E_SET_PFLAG(params, MLX5E_PFLAG_RX_CQE_COMPRESS, params->rx_cqe_compress_def);
78 }
79 
80 /* Called directly after IPoIB netdevice was created to initialize SW structs */
mlx5i_init(struct mlx5_core_dev * mdev,struct net_device * netdev)81 int mlx5i_init(struct mlx5_core_dev *mdev, struct net_device *netdev)
82 {
83 	struct mlx5e_priv *priv  = mlx5i_epriv(netdev);
84 
85 	netif_carrier_off(netdev);
86 	mlx5e_set_netdev_mtu_boundaries(priv);
87 	netdev->mtu = netdev->max_mtu;
88 
89 	mlx5e_build_nic_params(priv, NULL, netdev->mtu);
90 	mlx5i_build_nic_params(mdev, &priv->channels.params);
91 
92 	mlx5e_timestamp_init(priv);
93 
94 	/* netdev init */
95 	netdev->hw_features    |= NETIF_F_SG;
96 	netdev->hw_features    |= NETIF_F_IP_CSUM;
97 	netdev->hw_features    |= NETIF_F_IPV6_CSUM;
98 	netdev->hw_features    |= NETIF_F_GRO;
99 	netdev->hw_features    |= NETIF_F_TSO;
100 	netdev->hw_features    |= NETIF_F_TSO6;
101 	netdev->hw_features    |= NETIF_F_RXCSUM;
102 	netdev->hw_features    |= NETIF_F_RXHASH;
103 
104 	netdev->netdev_ops = &mlx5i_netdev_ops;
105 	netdev->ethtool_ops = &mlx5i_ethtool_ops;
106 	netdev->request_ops_lock = true;
107 	netdev_lockdep_set_classes(netdev);
108 
109 	return 0;
110 }
111 
112 /* Called directly before IPoIB netdevice is destroyed to cleanup SW structs */
mlx5i_cleanup(struct mlx5e_priv * priv)113 void mlx5i_cleanup(struct mlx5e_priv *priv)
114 {
115 	mlx5e_priv_cleanup(priv);
116 }
117 
mlx5i_grp_sw_update_stats(struct mlx5e_priv * priv)118 static void mlx5i_grp_sw_update_stats(struct mlx5e_priv *priv)
119 {
120 	struct rtnl_link_stats64 s = {};
121 	int i, j;
122 
123 	for (i = 0; i < priv->stats_nch; i++) {
124 		struct mlx5e_channel_stats *channel_stats;
125 		struct mlx5e_rq_stats *rq_stats;
126 
127 		channel_stats = priv->channel_stats[i];
128 		rq_stats = &channel_stats->rq;
129 
130 		s.rx_packets += rq_stats->packets;
131 		s.rx_bytes   += rq_stats->bytes;
132 
133 		for (j = 0; j < priv->max_opened_tc; j++) {
134 			struct mlx5e_sq_stats *sq_stats = &channel_stats->sq[j];
135 
136 			s.tx_packets           += sq_stats->packets;
137 			s.tx_bytes             += sq_stats->bytes;
138 			s.tx_dropped           += sq_stats->dropped;
139 		}
140 	}
141 
142 	memset(&priv->stats.sw, 0, sizeof(s));
143 
144 	priv->stats.sw.rx_packets = s.rx_packets;
145 	priv->stats.sw.rx_bytes = s.rx_bytes;
146 	priv->stats.sw.tx_packets = s.tx_packets;
147 	priv->stats.sw.tx_bytes = s.tx_bytes;
148 	priv->stats.sw.tx_queue_dropped = s.tx_dropped;
149 }
150 
mlx5i_get_stats(struct net_device * dev,struct rtnl_link_stats64 * stats)151 void mlx5i_get_stats(struct net_device *dev, struct rtnl_link_stats64 *stats)
152 {
153 	struct mlx5e_priv     *priv   = mlx5i_epriv(dev);
154 	struct mlx5e_sw_stats *sstats = &priv->stats.sw;
155 
156 	mlx5i_grp_sw_update_stats(priv);
157 
158 	stats->rx_packets = sstats->rx_packets;
159 	stats->rx_bytes   = sstats->rx_bytes;
160 	stats->tx_packets = sstats->tx_packets;
161 	stats->tx_bytes   = sstats->tx_bytes;
162 	stats->tx_dropped = sstats->tx_queue_dropped;
163 }
164 
mlx5i_parent_get(struct net_device * netdev)165 struct net_device *mlx5i_parent_get(struct net_device *netdev)
166 {
167 	struct mlx5e_priv *priv = mlx5i_epriv(netdev);
168 	struct mlx5i_priv *ipriv, *parent_ipriv;
169 	struct net_device *parent_dev;
170 	int parent_ifindex;
171 
172 	ipriv = priv->ppriv;
173 
174 	parent_ifindex = netdev->netdev_ops->ndo_get_iflink(netdev);
175 	parent_dev = dev_get_by_index(dev_net(netdev), parent_ifindex);
176 	if (!parent_dev)
177 		return NULL;
178 
179 	parent_ipriv = netdev_priv(parent_dev);
180 
181 	ASSERT_RTNL();
182 	parent_ipriv->num_sub_interfaces++;
183 
184 	ipriv->parent_dev = parent_dev;
185 
186 	return parent_dev;
187 }
188 
mlx5i_parent_put(struct net_device * netdev)189 void mlx5i_parent_put(struct net_device *netdev)
190 {
191 	struct mlx5e_priv *priv = mlx5i_epriv(netdev);
192 	struct mlx5i_priv *ipriv, *parent_ipriv;
193 
194 	ipriv = priv->ppriv;
195 	parent_ipriv = netdev_priv(ipriv->parent_dev);
196 
197 	ASSERT_RTNL();
198 	parent_ipriv->num_sub_interfaces--;
199 
200 	dev_put(ipriv->parent_dev);
201 }
202 
mlx5i_init_underlay_qp(struct mlx5e_priv * priv)203 int mlx5i_init_underlay_qp(struct mlx5e_priv *priv)
204 {
205 	struct mlx5_core_dev *mdev = priv->mdev;
206 	struct mlx5i_priv *ipriv = priv->ppriv;
207 	int ret;
208 
209 	{
210 		u32 in[MLX5_ST_SZ_DW(rst2init_qp_in)] = {};
211 		u32 *qpc;
212 
213 		qpc = MLX5_ADDR_OF(rst2init_qp_in, in, qpc);
214 
215 		MLX5_SET(qpc, qpc, pm_state, MLX5_QP_PM_MIGRATED);
216 		MLX5_SET(qpc, qpc, primary_address_path.pkey_index,
217 			 ipriv->pkey_index);
218 		MLX5_SET(qpc, qpc, primary_address_path.vhca_port_num, 1);
219 		MLX5_SET(qpc, qpc, q_key, IB_DEFAULT_Q_KEY);
220 
221 		MLX5_SET(rst2init_qp_in, in, opcode, MLX5_CMD_OP_RST2INIT_QP);
222 		MLX5_SET(rst2init_qp_in, in, qpn, ipriv->qpn);
223 		ret = mlx5_cmd_exec_in(mdev, rst2init_qp, in);
224 		if (ret)
225 			goto err_qp_modify_to_err;
226 	}
227 	{
228 		u32 in[MLX5_ST_SZ_DW(init2rtr_qp_in)] = {};
229 
230 		MLX5_SET(init2rtr_qp_in, in, opcode, MLX5_CMD_OP_INIT2RTR_QP);
231 		MLX5_SET(init2rtr_qp_in, in, qpn, ipriv->qpn);
232 		ret = mlx5_cmd_exec_in(mdev, init2rtr_qp, in);
233 		if (ret)
234 			goto err_qp_modify_to_err;
235 	}
236 	{
237 		u32 in[MLX5_ST_SZ_DW(rtr2rts_qp_in)] = {};
238 
239 		MLX5_SET(rtr2rts_qp_in, in, opcode, MLX5_CMD_OP_RTR2RTS_QP);
240 		MLX5_SET(rtr2rts_qp_in, in, qpn, ipriv->qpn);
241 		ret = mlx5_cmd_exec_in(mdev, rtr2rts_qp, in);
242 		if (ret)
243 			goto err_qp_modify_to_err;
244 	}
245 	return 0;
246 
247 err_qp_modify_to_err:
248 	{
249 		u32 in[MLX5_ST_SZ_DW(qp_2err_in)] = {};
250 
251 		MLX5_SET(qp_2err_in, in, opcode, MLX5_CMD_OP_2ERR_QP);
252 		MLX5_SET(qp_2err_in, in, qpn, ipriv->qpn);
253 		mlx5_cmd_exec_in(mdev, qp_2err, in);
254 	}
255 	return ret;
256 }
257 
mlx5i_uninit_underlay_qp(struct mlx5e_priv * priv)258 void mlx5i_uninit_underlay_qp(struct mlx5e_priv *priv)
259 {
260 	struct mlx5i_priv *ipriv = priv->ppriv;
261 	struct mlx5_core_dev *mdev = priv->mdev;
262 	u32 in[MLX5_ST_SZ_DW(qp_2rst_in)] = {};
263 
264 	MLX5_SET(qp_2rst_in, in, opcode, MLX5_CMD_OP_2RST_QP);
265 	MLX5_SET(qp_2rst_in, in, qpn, ipriv->qpn);
266 	mlx5_cmd_exec_in(mdev, qp_2rst, in);
267 }
268 
269 #define MLX5_QP_ENHANCED_ULP_STATELESS_MODE 2
270 
mlx5i_create_underlay_qp(struct mlx5e_priv * priv)271 int mlx5i_create_underlay_qp(struct mlx5e_priv *priv)
272 {
273 	const unsigned char *dev_addr = priv->netdev->dev_addr;
274 	u32 out[MLX5_ST_SZ_DW(create_qp_out)] = {};
275 	u32 in[MLX5_ST_SZ_DW(create_qp_in)] = {};
276 	struct mlx5i_priv *ipriv = priv->ppriv;
277 	void *addr_path;
278 	int qpn = 0;
279 	int ret = 0;
280 	void *qpc;
281 
282 	if (MLX5_CAP_GEN(priv->mdev, mkey_by_name)) {
283 		qpn = (dev_addr[1] << 16) + (dev_addr[2] << 8) + dev_addr[3];
284 		MLX5_SET(create_qp_in, in, input_qpn, qpn);
285 	}
286 
287 	qpc = MLX5_ADDR_OF(create_qp_in, in, qpc);
288 	MLX5_SET(qpc, qpc, ts_format, mlx5_get_qp_default_ts(priv->mdev));
289 	MLX5_SET(qpc, qpc, st, MLX5_QP_ST_UD);
290 	MLX5_SET(qpc, qpc, pm_state, MLX5_QP_PM_MIGRATED);
291 	MLX5_SET(qpc, qpc, ulp_stateless_offload_mode,
292 		 MLX5_QP_ENHANCED_ULP_STATELESS_MODE);
293 
294 	addr_path = MLX5_ADDR_OF(qpc, qpc, primary_address_path);
295 	MLX5_SET(ads, addr_path, vhca_port_num, 1);
296 	MLX5_SET(ads, addr_path, grh, 1);
297 
298 	MLX5_SET(create_qp_in, in, opcode, MLX5_CMD_OP_CREATE_QP);
299 	ret = mlx5_cmd_exec_inout(priv->mdev, create_qp, in, out);
300 	if (ret)
301 		return ret;
302 
303 	ipriv->qpn = MLX5_GET(create_qp_out, out, qpn);
304 
305 	return 0;
306 }
307 
mlx5i_destroy_underlay_qp(struct mlx5_core_dev * mdev,u32 qpn)308 void mlx5i_destroy_underlay_qp(struct mlx5_core_dev *mdev, u32 qpn)
309 {
310 	u32 in[MLX5_ST_SZ_DW(destroy_qp_in)] = {};
311 
312 	MLX5_SET(destroy_qp_in, in, opcode, MLX5_CMD_OP_DESTROY_QP);
313 	MLX5_SET(destroy_qp_in, in, qpn, qpn);
314 	mlx5_cmd_exec_in(mdev, destroy_qp, in);
315 }
316 
mlx5i_update_nic_rx(struct mlx5e_priv * priv)317 int mlx5i_update_nic_rx(struct mlx5e_priv *priv)
318 {
319 	return mlx5e_refresh_tirs(priv, true, true);
320 }
321 
mlx5i_create_tis(struct mlx5_core_dev * mdev,u32 underlay_qpn,u32 * tisn)322 int mlx5i_create_tis(struct mlx5_core_dev *mdev, u32 underlay_qpn, u32 *tisn)
323 {
324 	u32 in[MLX5_ST_SZ_DW(create_tis_in)] = {};
325 	void *tisc;
326 
327 	tisc = MLX5_ADDR_OF(create_tis_in, in, ctx);
328 
329 	MLX5_SET(tisc, tisc, underlay_qpn, underlay_qpn);
330 
331 	return mlx5e_create_tis(mdev, in, tisn);
332 }
333 
mlx5i_init_tx(struct mlx5e_priv * priv)334 static int mlx5i_init_tx(struct mlx5e_priv *priv)
335 {
336 	struct mlx5i_priv *ipriv = priv->ppriv;
337 	int err;
338 
339 	err = mlx5i_create_underlay_qp(priv);
340 	if (err) {
341 		mlx5_core_warn(priv->mdev, "create underlay QP failed, %d\n", err);
342 		return err;
343 	}
344 
345 	err = mlx5i_create_tis(priv->mdev, ipriv->qpn, &ipriv->tisn);
346 	if (err) {
347 		mlx5_core_warn(priv->mdev, "create tis failed, %d\n", err);
348 		goto err_destroy_underlay_qp;
349 	}
350 
351 	return 0;
352 
353 err_destroy_underlay_qp:
354 	mlx5i_destroy_underlay_qp(priv->mdev, ipriv->qpn);
355 	return err;
356 }
357 
mlx5i_cleanup_tx(struct mlx5e_priv * priv)358 static void mlx5i_cleanup_tx(struct mlx5e_priv *priv)
359 {
360 	struct mlx5i_priv *ipriv = priv->ppriv;
361 
362 	mlx5e_destroy_tis(priv->mdev, ipriv->tisn);
363 	mlx5i_destroy_underlay_qp(priv->mdev, ipriv->qpn);
364 }
365 
mlx5i_create_flow_steering(struct mlx5e_priv * priv)366 static int mlx5i_create_flow_steering(struct mlx5e_priv *priv)
367 {
368 	struct mlx5_flow_namespace *ns =
369 		mlx5_get_flow_namespace(priv->mdev, MLX5_FLOW_NAMESPACE_KERNEL);
370 	int err;
371 
372 
373 	if (!ns)
374 		return -EINVAL;
375 
376 	mlx5e_fs_set_ns(priv->fs, ns, false);
377 	err = mlx5e_arfs_create_tables(priv->fs, priv->rx_res,
378 				       mlx5e_fs_has_arfs(priv->netdev));
379 	if (err) {
380 		netdev_err(priv->netdev, "Failed to create arfs tables, err=%d\n",
381 			   err);
382 		priv->netdev->hw_features &= ~NETIF_F_NTUPLE;
383 	}
384 
385 	err = mlx5e_create_ttc_table(priv->fs, priv->rx_res);
386 	if (err) {
387 		netdev_err(priv->netdev, "Failed to create ttc table, err=%d\n",
388 			   err);
389 		goto err_destroy_arfs_tables;
390 	}
391 
392 	mlx5e_ethtool_init_steering(priv->fs);
393 
394 	return 0;
395 
396 err_destroy_arfs_tables:
397 	mlx5e_arfs_destroy_tables(priv->fs, mlx5e_fs_has_arfs(priv->netdev));
398 
399 	return err;
400 }
401 
mlx5i_destroy_flow_steering(struct mlx5e_priv * priv)402 static void mlx5i_destroy_flow_steering(struct mlx5e_priv *priv)
403 {
404 	mlx5e_destroy_ttc_table(priv->fs);
405 	mlx5e_arfs_destroy_tables(priv->fs, mlx5e_fs_has_arfs(priv->netdev));
406 	mlx5e_ethtool_cleanup_steering(priv->fs);
407 }
408 
mlx5i_init_rx(struct mlx5e_priv * priv)409 static int mlx5i_init_rx(struct mlx5e_priv *priv)
410 {
411 	struct mlx5_core_dev *mdev = priv->mdev;
412 	int err;
413 
414 	priv->fs = mlx5e_fs_init(priv->profile, mdev,
415 				 !test_bit(MLX5E_STATE_DESTROYING, &priv->state),
416 				 priv->dfs_root);
417 	if (!priv->fs) {
418 		netdev_err(priv->netdev, "FS allocation failed\n");
419 		return -ENOMEM;
420 	}
421 
422 	mlx5e_create_q_counters(priv);
423 
424 	err = mlx5e_open_drop_rq(priv, &priv->drop_rq);
425 	if (err) {
426 		mlx5_core_err(mdev, "open drop rq failed, %d\n", err);
427 		goto err_destroy_q_counters;
428 	}
429 
430 	priv->rx_res = mlx5e_rx_res_create(priv->mdev, 0, priv->max_nch, priv->drop_rq.rqn,
431 					   &priv->channels.params.packet_merge,
432 					   priv->channels.params.num_channels);
433 	if (IS_ERR(priv->rx_res)) {
434 		err = PTR_ERR(priv->rx_res);
435 		goto err_close_drop_rq;
436 	}
437 
438 	err = mlx5i_create_flow_steering(priv);
439 	if (err)
440 		goto err_destroy_rx_res;
441 
442 	return 0;
443 
444 err_destroy_rx_res:
445 	mlx5e_rx_res_destroy(priv->rx_res);
446 	priv->rx_res = ERR_PTR(-EINVAL);
447 err_close_drop_rq:
448 	mlx5e_close_drop_rq(&priv->drop_rq);
449 err_destroy_q_counters:
450 	mlx5e_destroy_q_counters(priv);
451 	mlx5e_fs_cleanup(priv->fs);
452 	return err;
453 }
454 
mlx5i_cleanup_rx(struct mlx5e_priv * priv)455 static void mlx5i_cleanup_rx(struct mlx5e_priv *priv)
456 {
457 	mlx5i_destroy_flow_steering(priv);
458 	mlx5e_rx_res_destroy(priv->rx_res);
459 	priv->rx_res = ERR_PTR(-EINVAL);
460 	mlx5e_close_drop_rq(&priv->drop_rq);
461 	mlx5e_destroy_q_counters(priv);
462 	mlx5e_fs_cleanup(priv->fs);
463 }
464 
465 /* The stats groups order is opposite to the update_stats() order calls */
466 static mlx5e_stats_grp_t mlx5i_stats_grps[] = {
467 	&MLX5E_STATS_GRP(sw),
468 	&MLX5E_STATS_GRP(qcnt),
469 	&MLX5E_STATS_GRP(vnic_env),
470 	&MLX5E_STATS_GRP(vport),
471 	&MLX5E_STATS_GRP(802_3),
472 	&MLX5E_STATS_GRP(2863),
473 	&MLX5E_STATS_GRP(2819),
474 	&MLX5E_STATS_GRP(phy),
475 	&MLX5E_STATS_GRP(pcie),
476 	&MLX5E_STATS_GRP(per_prio),
477 	&MLX5E_STATS_GRP(pme),
478 	&MLX5E_STATS_GRP(channels),
479 	&MLX5E_STATS_GRP(per_port_buff_congest),
480 };
481 
mlx5i_stats_grps_num(struct mlx5e_priv * priv)482 static unsigned int mlx5i_stats_grps_num(struct mlx5e_priv *priv)
483 {
484 	return ARRAY_SIZE(mlx5i_stats_grps);
485 }
486 
mlx5i_get_tisn(struct mlx5_core_dev * mdev,struct mlx5e_priv * priv,u8 lag_port,u8 tc)487 u32 mlx5i_get_tisn(struct mlx5_core_dev *mdev, struct mlx5e_priv *priv, u8 lag_port, u8 tc)
488 {
489 	struct mlx5i_priv *ipriv = priv->ppriv;
490 
491 	if (WARN(lag_port || tc,
492 		 "IPoIB unexpected non-zero value: lag_port (%u), tc (%u)\n",
493 		 lag_port, tc))
494 		return 0;
495 
496 	return ipriv->tisn;
497 }
498 
499 static const struct mlx5e_profile mlx5i_nic_profile = {
500 	.init		   = mlx5i_init,
501 	.cleanup	   = mlx5i_cleanup,
502 	.init_tx	   = mlx5i_init_tx,
503 	.cleanup_tx	   = mlx5i_cleanup_tx,
504 	.init_rx	   = mlx5i_init_rx,
505 	.cleanup_rx	   = mlx5i_cleanup_rx,
506 	.enable		   = NULL, /* mlx5i_enable */
507 	.disable	   = NULL, /* mlx5i_disable */
508 	.update_rx	   = mlx5i_update_nic_rx,
509 	.update_stats	   = NULL, /* mlx5i_update_stats */
510 	.update_carrier    = NULL, /* no HW update in IB link */
511 	.rx_handlers       = &mlx5i_rx_handlers,
512 	.max_tc		   = MLX5I_MAX_NUM_TC,
513 	.stats_grps        = mlx5i_stats_grps,
514 	.stats_grps_num    = mlx5i_stats_grps_num,
515 	.get_tisn          = mlx5i_get_tisn,
516 };
517 
518 /* mlx5i netdev NDos */
519 
mlx5i_change_mtu(struct net_device * netdev,int new_mtu)520 static int mlx5i_change_mtu(struct net_device *netdev, int new_mtu)
521 {
522 	struct mlx5e_priv *priv = mlx5i_epriv(netdev);
523 	struct mlx5e_params new_params;
524 	int err = 0;
525 
526 	mutex_lock(&priv->state_lock);
527 
528 	new_params = priv->channels.params;
529 	new_params.sw_mtu = new_mtu;
530 
531 	err = mlx5e_safe_switch_params(priv, &new_params, NULL, NULL, true);
532 	if (err)
533 		goto out;
534 
535 	WRITE_ONCE(netdev->mtu, new_params.sw_mtu);
536 
537 out:
538 	mutex_unlock(&priv->state_lock);
539 	return err;
540 }
541 
mlx5i_dev_init(struct net_device * dev)542 int mlx5i_dev_init(struct net_device *dev)
543 {
544 	struct mlx5e_priv    *priv   = mlx5i_epriv(dev);
545 	struct mlx5i_priv    *ipriv  = priv->ppriv;
546 	u8 addr_mod[3];
547 
548 	/* Set dev address using underlay QP */
549 	addr_mod[0] = (ipriv->qpn >> 16) & 0xff;
550 	addr_mod[1] = (ipriv->qpn >>  8) & 0xff;
551 	addr_mod[2] = (ipriv->qpn) & 0xff;
552 	dev_addr_mod(dev, 1, addr_mod, sizeof(addr_mod));
553 
554 	/* Add QPN to net-device mapping to HT */
555 	mlx5i_pkey_add_qpn(dev, ipriv->qpn);
556 
557 	return 0;
558 }
559 
mlx5i_ioctl(struct net_device * dev,struct ifreq * ifr,int cmd)560 int mlx5i_ioctl(struct net_device *dev, struct ifreq *ifr, int cmd)
561 {
562 	struct mlx5e_priv *priv = mlx5i_epriv(dev);
563 
564 	switch (cmd) {
565 	case SIOCSHWTSTAMP:
566 		return mlx5e_hwstamp_set(priv, ifr);
567 	case SIOCGHWTSTAMP:
568 		return mlx5e_hwstamp_get(priv, ifr);
569 	default:
570 		return -EOPNOTSUPP;
571 	}
572 }
573 
mlx5i_dev_cleanup(struct net_device * dev)574 void mlx5i_dev_cleanup(struct net_device *dev)
575 {
576 	struct mlx5e_priv    *priv   = mlx5i_epriv(dev);
577 	struct mlx5i_priv    *ipriv = priv->ppriv;
578 
579 	mlx5i_uninit_underlay_qp(priv);
580 
581 	/* Delete QPN to net-device mapping from HT */
582 	mlx5i_pkey_del_qpn(dev, ipriv->qpn);
583 }
584 
mlx5i_open(struct net_device * netdev)585 static int mlx5i_open(struct net_device *netdev)
586 {
587 	struct mlx5e_priv *epriv = mlx5i_epriv(netdev);
588 	struct mlx5i_priv *ipriv = epriv->ppriv;
589 	struct mlx5_core_dev *mdev = epriv->mdev;
590 	int err;
591 
592 	mutex_lock(&epriv->state_lock);
593 
594 	set_bit(MLX5E_STATE_OPENED, &epriv->state);
595 
596 	err = mlx5i_init_underlay_qp(epriv);
597 	if (err) {
598 		mlx5_core_warn(mdev, "prepare underlay qp state failed, %d\n", err);
599 		goto err_clear_state_opened_flag;
600 	}
601 
602 	err = mlx5_fs_add_rx_underlay_qpn(mdev, ipriv->qpn);
603 	if (err) {
604 		mlx5_core_warn(mdev, "attach underlay qp to ft failed, %d\n", err);
605 		goto err_reset_qp;
606 	}
607 
608 	err = mlx5e_open_channels(epriv, &epriv->channels);
609 	if (err)
610 		goto err_remove_fs_underlay_qp;
611 
612 	err = epriv->profile->update_rx(epriv);
613 	if (err)
614 		goto err_close_channels;
615 
616 	mlx5e_activate_priv_channels(epriv);
617 
618 	mutex_unlock(&epriv->state_lock);
619 	return 0;
620 
621 err_close_channels:
622 	mlx5e_close_channels(&epriv->channels);
623 err_remove_fs_underlay_qp:
624 	mlx5_fs_remove_rx_underlay_qpn(mdev, ipriv->qpn);
625 err_reset_qp:
626 	mlx5i_uninit_underlay_qp(epriv);
627 err_clear_state_opened_flag:
628 	clear_bit(MLX5E_STATE_OPENED, &epriv->state);
629 	mutex_unlock(&epriv->state_lock);
630 	return err;
631 }
632 
mlx5i_close(struct net_device * netdev)633 static int mlx5i_close(struct net_device *netdev)
634 {
635 	struct mlx5e_priv *epriv = mlx5i_epriv(netdev);
636 	struct mlx5i_priv *ipriv = epriv->ppriv;
637 	struct mlx5_core_dev *mdev = epriv->mdev;
638 
639 	/* May already be CLOSED in case a previous configuration operation
640 	 * (e.g RX/TX queue size change) that involves close&open failed.
641 	 */
642 	mutex_lock(&epriv->state_lock);
643 
644 	if (!test_bit(MLX5E_STATE_OPENED, &epriv->state))
645 		goto unlock;
646 
647 	clear_bit(MLX5E_STATE_OPENED, &epriv->state);
648 
649 	netif_carrier_off(epriv->netdev);
650 	mlx5_fs_remove_rx_underlay_qpn(mdev, ipriv->qpn);
651 	mlx5e_deactivate_priv_channels(epriv);
652 	mlx5e_close_channels(&epriv->channels);
653 	mlx5i_uninit_underlay_qp(epriv);
654 unlock:
655 	mutex_unlock(&epriv->state_lock);
656 	return 0;
657 }
658 
659 /* IPoIB RDMA netdev callbacks */
mlx5i_attach_mcast(struct net_device * netdev,struct ib_device * hca,union ib_gid * gid,u16 lid,int set_qkey,u32 qkey)660 static int mlx5i_attach_mcast(struct net_device *netdev, struct ib_device *hca,
661 			      union ib_gid *gid, u16 lid, int set_qkey,
662 			      u32 qkey)
663 {
664 	struct mlx5e_priv    *epriv = mlx5i_epriv(netdev);
665 	struct mlx5_core_dev *mdev  = epriv->mdev;
666 	struct mlx5i_priv    *ipriv = epriv->ppriv;
667 	int err;
668 
669 	mlx5_core_dbg(mdev, "attaching QPN 0x%x, MGID %pI6\n", ipriv->qpn,
670 		      gid->raw);
671 	err = mlx5_core_attach_mcg(mdev, gid, ipriv->qpn);
672 	if (err)
673 		mlx5_core_warn(mdev, "failed attaching QPN 0x%x, MGID %pI6\n",
674 			       ipriv->qpn, gid->raw);
675 
676 	if (set_qkey) {
677 		mlx5_core_dbg(mdev, "%s setting qkey 0x%x\n",
678 			      netdev->name, qkey);
679 		ipriv->qkey = qkey;
680 	}
681 
682 	return err;
683 }
684 
mlx5i_detach_mcast(struct net_device * netdev,struct ib_device * hca,union ib_gid * gid,u16 lid)685 static int mlx5i_detach_mcast(struct net_device *netdev, struct ib_device *hca,
686 			      union ib_gid *gid, u16 lid)
687 {
688 	struct mlx5e_priv    *epriv = mlx5i_epriv(netdev);
689 	struct mlx5_core_dev *mdev  = epriv->mdev;
690 	struct mlx5i_priv    *ipriv = epriv->ppriv;
691 	int err;
692 
693 	mlx5_core_dbg(mdev, "detaching QPN 0x%x, MGID %pI6\n", ipriv->qpn,
694 		      gid->raw);
695 
696 	err = mlx5_core_detach_mcg(mdev, gid, ipriv->qpn);
697 	if (err)
698 		mlx5_core_dbg(mdev, "failed detaching QPN 0x%x, MGID %pI6\n",
699 			      ipriv->qpn, gid->raw);
700 
701 	return err;
702 }
703 
mlx5i_xmit(struct net_device * dev,struct sk_buff * skb,struct ib_ah * address,u32 dqpn)704 static int mlx5i_xmit(struct net_device *dev, struct sk_buff *skb,
705 		      struct ib_ah *address, u32 dqpn)
706 {
707 	struct mlx5e_priv *epriv = mlx5i_epriv(dev);
708 	struct mlx5e_txqsq *sq   = epriv->txq2sq[skb_get_queue_mapping(skb)];
709 	struct mlx5_ib_ah *mah   = to_mah(address);
710 	struct mlx5i_priv *ipriv = epriv->ppriv;
711 
712 	mlx5i_sq_xmit(sq, skb, &mah->av, dqpn, ipriv->qkey, netdev_xmit_more());
713 
714 	return NETDEV_TX_OK;
715 }
716 
mlx5i_set_pkey_index(struct net_device * netdev,int id)717 static void mlx5i_set_pkey_index(struct net_device *netdev, int id)
718 {
719 	struct mlx5i_priv *ipriv = netdev_priv(netdev);
720 
721 	ipriv->pkey_index = (u16)id;
722 }
723 
mlx5i_check_required_hca_cap(struct mlx5_core_dev * mdev)724 static int mlx5i_check_required_hca_cap(struct mlx5_core_dev *mdev)
725 {
726 	if (MLX5_CAP_GEN(mdev, port_type) != MLX5_CAP_PORT_TYPE_IB)
727 		return -EOPNOTSUPP;
728 
729 	if (!MLX5_CAP_GEN(mdev, ipoib_enhanced_offloads)) {
730 		mlx5_core_warn(mdev, "IPoIB enhanced offloads are not supported\n");
731 		return -EOPNOTSUPP;
732 	}
733 
734 	return 0;
735 }
736 
mlx5_rdma_netdev_free(struct net_device * netdev)737 static void mlx5_rdma_netdev_free(struct net_device *netdev)
738 {
739 	struct mlx5e_priv *priv = mlx5i_epriv(netdev);
740 	struct mlx5_core_dev *mdev = priv->mdev;
741 	struct mlx5i_priv *ipriv = priv->ppriv;
742 	const struct mlx5e_profile *profile = priv->profile;
743 
744 	mlx5e_detach_netdev(priv);
745 	profile->cleanup(priv);
746 
747 	if (!ipriv->sub_interface) {
748 		mlx5i_pkey_qpn_ht_cleanup(netdev);
749 		mlx5e_destroy_mdev_resources(mdev);
750 	}
751 }
752 
mlx5_is_sub_interface(struct mlx5_core_dev * mdev)753 static bool mlx5_is_sub_interface(struct mlx5_core_dev *mdev)
754 {
755 	return mdev->mlx5e_res.hw_objs.pdn != 0;
756 }
757 
mlx5_get_profile(struct mlx5_core_dev * mdev)758 static const struct mlx5e_profile *mlx5_get_profile(struct mlx5_core_dev *mdev)
759 {
760 	if (mlx5_is_sub_interface(mdev))
761 		return mlx5i_pkey_get_profile();
762 	return &mlx5i_nic_profile;
763 }
764 
mlx5_rdma_setup_rn(struct ib_device * ibdev,u32 port_num,struct net_device * netdev,void * param)765 static int mlx5_rdma_setup_rn(struct ib_device *ibdev, u32 port_num,
766 			      struct net_device *netdev, void *param)
767 {
768 	struct mlx5_core_dev *mdev = (struct mlx5_core_dev *)param;
769 	const struct mlx5e_profile *prof = mlx5_get_profile(mdev);
770 	struct mlx5i_priv *ipriv;
771 	struct mlx5e_priv *epriv;
772 	struct rdma_netdev *rn;
773 	int err;
774 
775 	ipriv = netdev_priv(netdev);
776 	epriv = mlx5i_epriv(netdev);
777 
778 	ipriv->sub_interface = mlx5_is_sub_interface(mdev);
779 	if (!ipriv->sub_interface) {
780 		err = mlx5i_pkey_qpn_ht_init(netdev);
781 		if (err) {
782 			mlx5_core_warn(mdev, "allocate qpn_to_netdev ht failed\n");
783 			return err;
784 		}
785 
786 		/* This should only be called once per mdev */
787 		err = mlx5e_create_mdev_resources(mdev, false);
788 		if (err)
789 			goto destroy_ht;
790 	}
791 
792 	err = mlx5e_priv_init(epriv, prof, netdev, mdev);
793 	if (err)
794 		goto destroy_mdev_resources;
795 
796 	epriv->profile = prof;
797 	epriv->ppriv = ipriv;
798 
799 	prof->init(mdev, netdev);
800 
801 	err = mlx5e_attach_netdev(epriv);
802 	if (err)
803 		goto detach;
804 	netif_carrier_off(netdev);
805 
806 	/* set rdma_netdev func pointers */
807 	rn = &ipriv->rn;
808 	rn->hca  = ibdev;
809 	rn->send = mlx5i_xmit;
810 	rn->attach_mcast = mlx5i_attach_mcast;
811 	rn->detach_mcast = mlx5i_detach_mcast;
812 	rn->set_id = mlx5i_set_pkey_index;
813 
814 	netdev->priv_destructor = mlx5_rdma_netdev_free;
815 	netdev->needs_free_netdev = 1;
816 
817 	return 0;
818 
819 detach:
820 	prof->cleanup(epriv);
821 	if (ipriv->sub_interface)
822 		return err;
823 destroy_mdev_resources:
824 	mlx5e_destroy_mdev_resources(mdev);
825 destroy_ht:
826 	mlx5i_pkey_qpn_ht_cleanup(netdev);
827 	return err;
828 }
829 
mlx5_rdma_rn_get_params(struct mlx5_core_dev * mdev,struct ib_device * device,struct rdma_netdev_alloc_params * params)830 int mlx5_rdma_rn_get_params(struct mlx5_core_dev *mdev,
831 			    struct ib_device *device,
832 			    struct rdma_netdev_alloc_params *params)
833 {
834 	int nch;
835 	int rc;
836 
837 	rc = mlx5i_check_required_hca_cap(mdev);
838 	if (rc)
839 		return rc;
840 
841 	nch = mlx5e_get_max_num_channels(mdev);
842 
843 	*params = (struct rdma_netdev_alloc_params){
844 		.sizeof_priv = sizeof(struct mlx5i_priv) +
845 			       sizeof(struct mlx5e_priv),
846 		.txqs = nch * MLX5_MAX_NUM_TC,
847 		.rxqs = nch,
848 		.param = mdev,
849 		.initialize_rdma_netdev = mlx5_rdma_setup_rn,
850 	};
851 
852 	return 0;
853 }
854 EXPORT_SYMBOL(mlx5_rdma_rn_get_params);
855