2 * Copyright (c) 2017, Mellanox Technologies. All rights reserved.
4 * This software is available to you under a choice of one of two
5 * licenses. You may choose to be licensed under the terms of the GNU
6 * General Public License (GPL) Version 2, available from the file
7 * COPYING in the main directory of this source tree, or the
8 * OpenIB.org BSD license below:
10 * Redistribution and use in source and binary forms, with or
11 * without modification, are permitted provided that the following
14 * - Redistributions of source code must retain the above
15 * copyright notice, this list of conditions and the following
18 * - Redistributions in binary form must reproduce the above
19 * copyright notice, this list of conditions and the following
20 * disclaimer in the documentation and/or other materials
21 * provided with the distribution.
23 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
24 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
25 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
26 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
27 * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
28 * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
29 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
33 #include <rdma/ib_verbs.h>
34 #include <linux/mlx5/fs.h>
38 #define IB_DEFAULT_Q_KEY 0xb1b
40 static int mlx5i_open(struct net_device
*netdev
);
41 static int mlx5i_close(struct net_device
*netdev
);
42 static int mlx5i_dev_init(struct net_device
*dev
);
43 static void mlx5i_dev_cleanup(struct net_device
*dev
);
45 static const struct net_device_ops mlx5i_netdev_ops
= {
46 .ndo_open
= mlx5i_open
,
47 .ndo_stop
= mlx5i_close
,
48 .ndo_init
= mlx5i_dev_init
,
49 .ndo_uninit
= mlx5i_dev_cleanup
,
52 /* IPoIB mlx5 netdev profile */
54 /* Called directly after IPoIB netdevice was created to initialize SW structs */
55 static void mlx5i_init(struct mlx5_core_dev
*mdev
,
56 struct net_device
*netdev
,
57 const struct mlx5e_profile
*profile
,
60 struct mlx5e_priv
*priv
= mlx5i_epriv(netdev
);
63 priv
->netdev
= netdev
;
64 priv
->profile
= profile
;
67 mlx5e_build_nic_params(mdev
, &priv
->channels
.params
, profile
->max_nch(mdev
));
69 mutex_init(&priv
->state_lock
);
71 netdev
->hw_features
|= NETIF_F_SG
;
72 netdev
->hw_features
|= NETIF_F_IP_CSUM
;
73 netdev
->hw_features
|= NETIF_F_IPV6_CSUM
;
74 netdev
->hw_features
|= NETIF_F_GRO
;
75 netdev
->hw_features
|= NETIF_F_TSO
;
76 netdev
->hw_features
|= NETIF_F_TSO6
;
77 netdev
->hw_features
|= NETIF_F_RXCSUM
;
78 netdev
->hw_features
|= NETIF_F_RXHASH
;
80 netdev
->netdev_ops
= &mlx5i_netdev_ops
;
83 /* Called directly before IPoIB netdevice is destroyed to cleanup SW structs */
84 static void mlx5i_cleanup(struct mlx5e_priv
*priv
)
89 #define MLX5_QP_ENHANCED_ULP_STATELESS_MODE 2
91 static int mlx5i_create_underlay_qp(struct mlx5_core_dev
*mdev
, struct mlx5_core_qp
*qp
)
93 struct mlx5_qp_context
*context
= NULL
;
100 inlen
= MLX5_ST_SZ_BYTES(create_qp_in
);
101 in
= mlx5_vzalloc(inlen
);
105 qpc
= MLX5_ADDR_OF(create_qp_in
, in
, qpc
);
106 MLX5_SET(qpc
, qpc
, st
, MLX5_QP_ST_UD
);
107 MLX5_SET(qpc
, qpc
, pm_state
, MLX5_QP_PM_MIGRATED
);
108 MLX5_SET(qpc
, qpc
, ulp_stateless_offload_mode
,
109 MLX5_QP_ENHANCED_ULP_STATELESS_MODE
);
111 addr_path
= MLX5_ADDR_OF(qpc
, qpc
, primary_address_path
);
112 MLX5_SET(ads
, addr_path
, port
, 1);
113 MLX5_SET(ads
, addr_path
, grh
, 1);
115 ret
= mlx5_core_create_qp(mdev
, qp
, in
, inlen
);
117 mlx5_core_err(mdev
, "Failed creating IPoIB QP err : %d\n", ret
);
122 context
= kzalloc(sizeof(*context
), GFP_KERNEL
);
128 context
->flags
= cpu_to_be32(MLX5_QP_PM_MIGRATED
<< 11);
129 context
->pri_path
.port
= 1;
130 context
->qkey
= cpu_to_be32(IB_DEFAULT_Q_KEY
);
132 ret
= mlx5_core_qp_modify(mdev
, MLX5_CMD_OP_RST2INIT_QP
, 0, context
, qp
);
134 mlx5_core_err(mdev
, "Failed to modify qp RST2INIT, err: %d\n", ret
);
137 memset(context
, 0, sizeof(*context
));
139 ret
= mlx5_core_qp_modify(mdev
, MLX5_CMD_OP_INIT2RTR_QP
, 0, context
, qp
);
141 mlx5_core_err(mdev
, "Failed to modify qp INIT2RTR, err: %d\n", ret
);
145 ret
= mlx5_core_qp_modify(mdev
, MLX5_CMD_OP_RTR2RTS_QP
, 0, context
, qp
);
147 mlx5_core_err(mdev
, "Failed to modify qp RTR2RTS, err: %d\n", ret
);
157 static void mlx5i_destroy_underlay_qp(struct mlx5_core_dev
*mdev
, struct mlx5_core_qp
*qp
)
159 mlx5_core_destroy_qp(mdev
, qp
);
162 static int mlx5i_init_tx(struct mlx5e_priv
*priv
)
164 struct mlx5i_priv
*ipriv
= priv
->ppriv
;
167 err
= mlx5i_create_underlay_qp(priv
->mdev
, &ipriv
->qp
);
169 mlx5_core_warn(priv
->mdev
, "create underlay QP failed, %d\n", err
);
173 err
= mlx5e_create_tis(priv
->mdev
, 0 /* tc */, ipriv
->qp
.qpn
, &priv
->tisn
[0]);
175 mlx5_core_warn(priv
->mdev
, "create tis failed, %d\n", err
);
182 static void mlx5i_cleanup_tx(struct mlx5e_priv
*priv
)
184 struct mlx5i_priv
*ipriv
= priv
->ppriv
;
186 mlx5e_destroy_tis(priv
->mdev
, priv
->tisn
[0]);
187 mlx5i_destroy_underlay_qp(priv
->mdev
, &ipriv
->qp
);
190 static int mlx5i_create_flow_steering(struct mlx5e_priv
*priv
)
192 struct mlx5i_priv
*ipriv
= priv
->ppriv
;
195 priv
->fs
.ns
= mlx5_get_flow_namespace(priv
->mdev
,
196 MLX5_FLOW_NAMESPACE_KERNEL
);
201 err
= mlx5e_arfs_create_tables(priv
);
203 netdev_err(priv
->netdev
, "Failed to create arfs tables, err=%d\n",
205 priv
->netdev
->hw_features
&= ~NETIF_F_NTUPLE
;
208 err
= mlx5e_create_ttc_table(priv
, ipriv
->qp
.qpn
);
210 netdev_err(priv
->netdev
, "Failed to create ttc table, err=%d\n",
212 goto err_destroy_arfs_tables
;
217 err_destroy_arfs_tables
:
218 mlx5e_arfs_destroy_tables(priv
);
223 static void mlx5i_destroy_flow_steering(struct mlx5e_priv
*priv
)
225 mlx5e_destroy_ttc_table(priv
);
226 mlx5e_arfs_destroy_tables(priv
);
229 static int mlx5i_init_rx(struct mlx5e_priv
*priv
)
233 err
= mlx5e_create_indirect_rqt(priv
);
237 err
= mlx5e_create_direct_rqts(priv
);
239 goto err_destroy_indirect_rqts
;
241 err
= mlx5e_create_indirect_tirs(priv
);
243 goto err_destroy_direct_rqts
;
245 err
= mlx5e_create_direct_tirs(priv
);
247 goto err_destroy_indirect_tirs
;
249 err
= mlx5i_create_flow_steering(priv
);
251 goto err_destroy_direct_tirs
;
255 err_destroy_direct_tirs
:
256 mlx5e_destroy_direct_tirs(priv
);
257 err_destroy_indirect_tirs
:
258 mlx5e_destroy_indirect_tirs(priv
);
259 err_destroy_direct_rqts
:
260 mlx5e_destroy_direct_rqts(priv
);
261 err_destroy_indirect_rqts
:
262 mlx5e_destroy_rqt(priv
, &priv
->indir_rqt
);
266 static void mlx5i_cleanup_rx(struct mlx5e_priv
*priv
)
268 mlx5i_destroy_flow_steering(priv
);
269 mlx5e_destroy_direct_tirs(priv
);
270 mlx5e_destroy_indirect_tirs(priv
);
271 mlx5e_destroy_direct_rqts(priv
);
272 mlx5e_destroy_rqt(priv
, &priv
->indir_rqt
);
275 static const struct mlx5e_profile mlx5i_nic_profile
= {
277 .cleanup
= mlx5i_cleanup
,
278 .init_tx
= mlx5i_init_tx
,
279 .cleanup_tx
= mlx5i_cleanup_tx
,
280 .init_rx
= mlx5i_init_rx
,
281 .cleanup_rx
= mlx5i_cleanup_rx
,
282 .enable
= NULL
, /* mlx5i_enable */
283 .disable
= NULL
, /* mlx5i_disable */
284 .update_stats
= NULL
, /* mlx5i_update_stats */
285 .max_nch
= mlx5e_get_max_num_channels
,
286 .rx_handlers
.handle_rx_cqe
= mlx5i_handle_rx_cqe
,
287 .rx_handlers
.handle_rx_cqe_mpwqe
= NULL
, /* Not supported */
288 .max_tc
= MLX5I_MAX_NUM_TC
,
291 /* mlx5i netdev NDos */
293 static int mlx5i_dev_init(struct net_device
*dev
)
295 struct mlx5e_priv
*priv
= mlx5i_epriv(dev
);
296 struct mlx5i_priv
*ipriv
= priv
->ppriv
;
298 /* Set dev address using underlay QP */
299 dev
->dev_addr
[1] = (ipriv
->qp
.qpn
>> 16) & 0xff;
300 dev
->dev_addr
[2] = (ipriv
->qp
.qpn
>> 8) & 0xff;
301 dev
->dev_addr
[3] = (ipriv
->qp
.qpn
) & 0xff;
306 static void mlx5i_dev_cleanup(struct net_device
*dev
)
308 struct mlx5e_priv
*priv
= mlx5i_epriv(dev
);
309 struct mlx5_core_dev
*mdev
= priv
->mdev
;
310 struct mlx5i_priv
*ipriv
= priv
->ppriv
;
311 struct mlx5_qp_context context
;
313 /* detach qp from flow-steering by reset it */
314 mlx5_core_qp_modify(mdev
, MLX5_CMD_OP_2RST_QP
, 0, &context
, &ipriv
->qp
);
317 static int mlx5i_open(struct net_device
*netdev
)
319 struct mlx5e_priv
*priv
= mlx5i_epriv(netdev
);
322 mutex_lock(&priv
->state_lock
);
324 set_bit(MLX5E_STATE_OPENED
, &priv
->state
);
326 err
= mlx5e_open_channels(priv
, &priv
->channels
);
328 goto err_clear_state_opened_flag
;
330 mlx5e_refresh_tirs(priv
, false);
331 mlx5e_activate_priv_channels(priv
);
332 mutex_unlock(&priv
->state_lock
);
335 err_clear_state_opened_flag
:
336 clear_bit(MLX5E_STATE_OPENED
, &priv
->state
);
337 mutex_unlock(&priv
->state_lock
);
341 static int mlx5i_close(struct net_device
*netdev
)
343 struct mlx5e_priv
*priv
= mlx5i_epriv(netdev
);
345 /* May already be CLOSED in case a previous configuration operation
346 * (e.g RX/TX queue size change) that involves close&open failed.
348 mutex_lock(&priv
->state_lock
);
350 if (!test_bit(MLX5E_STATE_OPENED
, &priv
->state
))
353 clear_bit(MLX5E_STATE_OPENED
, &priv
->state
);
355 netif_carrier_off(priv
->netdev
);
356 mlx5e_deactivate_priv_channels(priv
);
357 mlx5e_close_channels(&priv
->channels
);
359 mutex_unlock(&priv
->state_lock
);
363 /* IPoIB RDMA netdev callbacks */
364 static int mlx5i_attach_mcast(struct net_device
*netdev
, struct ib_device
*hca
,
365 union ib_gid
*gid
, u16 lid
, int set_qkey
,
368 struct mlx5e_priv
*epriv
= mlx5i_epriv(netdev
);
369 struct mlx5_core_dev
*mdev
= epriv
->mdev
;
370 struct mlx5i_priv
*ipriv
= epriv
->ppriv
;
373 mlx5_core_dbg(mdev
, "attaching QPN 0x%x, MGID %pI6\n", ipriv
->qp
.qpn
, gid
->raw
);
374 err
= mlx5_core_attach_mcg(mdev
, gid
, ipriv
->qp
.qpn
);
376 mlx5_core_warn(mdev
, "failed attaching QPN 0x%x, MGID %pI6\n",
377 ipriv
->qp
.qpn
, gid
->raw
);
380 mlx5_core_dbg(mdev
, "%s setting qkey 0x%x\n",
388 static int mlx5i_detach_mcast(struct net_device
*netdev
, struct ib_device
*hca
,
389 union ib_gid
*gid
, u16 lid
)
391 struct mlx5e_priv
*epriv
= mlx5i_epriv(netdev
);
392 struct mlx5_core_dev
*mdev
= epriv
->mdev
;
393 struct mlx5i_priv
*ipriv
= epriv
->ppriv
;
396 mlx5_core_dbg(mdev
, "detaching QPN 0x%x, MGID %pI6\n", ipriv
->qp
.qpn
, gid
->raw
);
398 err
= mlx5_core_detach_mcg(mdev
, gid
, ipriv
->qp
.qpn
);
400 mlx5_core_dbg(mdev
, "failed dettaching QPN 0x%x, MGID %pI6\n",
401 ipriv
->qp
.qpn
, gid
->raw
);
406 static int mlx5i_xmit(struct net_device
*dev
, struct sk_buff
*skb
,
407 struct ib_ah
*address
, u32 dqpn
)
409 struct mlx5e_priv
*epriv
= mlx5i_epriv(dev
);
410 struct mlx5e_txqsq
*sq
= epriv
->txq2sq
[skb_get_queue_mapping(skb
)];
411 struct mlx5_ib_ah
*mah
= to_mah(address
);
412 struct mlx5i_priv
*ipriv
= epriv
->ppriv
;
414 return mlx5i_sq_xmit(sq
, skb
, &mah
->av
, dqpn
, ipriv
->qkey
);
417 static int mlx5i_check_required_hca_cap(struct mlx5_core_dev
*mdev
)
419 if (MLX5_CAP_GEN(mdev
, port_type
) != MLX5_CAP_PORT_TYPE_IB
)
422 if (!MLX5_CAP_GEN(mdev
, ipoib_enhanced_offloads
)) {
423 mlx5_core_warn(mdev
, "IPoIB enhanced offloads are not supported\n");
430 struct net_device
*mlx5_rdma_netdev_alloc(struct mlx5_core_dev
*mdev
,
431 struct ib_device
*ibdev
,
433 void (*setup
)(struct net_device
*))
435 const struct mlx5e_profile
*profile
= &mlx5i_nic_profile
;
436 int nch
= profile
->max_nch(mdev
);
437 struct net_device
*netdev
;
438 struct mlx5i_priv
*ipriv
;
439 struct mlx5e_priv
*epriv
;
440 struct rdma_netdev
*rn
;
443 if (mlx5i_check_required_hca_cap(mdev
)) {
444 mlx5_core_warn(mdev
, "Accelerated mode is not supported\n");
445 return ERR_PTR(-EOPNOTSUPP
);
448 /* This function should only be called once per mdev */
449 err
= mlx5e_create_mdev_resources(mdev
);
453 netdev
= alloc_netdev_mqs(sizeof(struct mlx5i_priv
) + sizeof(struct mlx5e_priv
),
454 name
, NET_NAME_UNKNOWN
,
456 nch
* MLX5E_MAX_NUM_TC
,
459 mlx5_core_warn(mdev
, "alloc_netdev_mqs failed\n");
460 goto free_mdev_resources
;
463 ipriv
= netdev_priv(netdev
);
464 epriv
= mlx5i_epriv(netdev
);
466 epriv
->wq
= create_singlethread_workqueue("mlx5i");
468 goto err_free_netdev
;
470 profile
->init(mdev
, netdev
, profile
, ipriv
);
472 mlx5e_attach_netdev(epriv
);
473 netif_carrier_off(netdev
);
475 /* set rdma_netdev func pointers */
478 rn
->send
= mlx5i_xmit
;
479 rn
->attach_mcast
= mlx5i_attach_mcast
;
480 rn
->detach_mcast
= mlx5i_detach_mcast
;
487 mlx5e_destroy_mdev_resources(mdev
);
491 EXPORT_SYMBOL(mlx5_rdma_netdev_alloc
);
493 void mlx5_rdma_netdev_free(struct net_device
*netdev
)
495 struct mlx5e_priv
*priv
= mlx5i_epriv(netdev
);
496 const struct mlx5e_profile
*profile
= priv
->profile
;
498 mlx5e_detach_netdev(priv
);
499 profile
->cleanup(priv
);
500 destroy_workqueue(priv
->wq
);
503 mlx5e_destroy_mdev_resources(priv
->mdev
);
505 EXPORT_SYMBOL(mlx5_rdma_netdev_free
);