]> git.proxmox.com Git - mirror_ubuntu-bionic-kernel.git/blob - drivers/net/ethernet/mellanox/mlx5/core/en_main.c
net/mlx5e: Add support for RXFCS feature flag
[mirror_ubuntu-bionic-kernel.git] / drivers / net / ethernet / mellanox / mlx5 / core / en_main.c
1 /*
2 * Copyright (c) 2015-2016, Mellanox Technologies. All rights reserved.
3 *
4 * This software is available to you under a choice of one of two
5 * licenses. You may choose to be licensed under the terms of the GNU
6 * General Public License (GPL) Version 2, available from the file
7 * COPYING in the main directory of this source tree, or the
8 * OpenIB.org BSD license below:
9 *
10 * Redistribution and use in source and binary forms, with or
11 * without modification, are permitted provided that the following
12 * conditions are met:
13 *
14 * - Redistributions of source code must retain the above
15 * copyright notice, this list of conditions and the following
16 * disclaimer.
17 *
18 * - Redistributions in binary form must reproduce the above
19 * copyright notice, this list of conditions and the following
20 * disclaimer in the documentation and/or other materials
21 * provided with the distribution.
22 *
23 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
24 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
25 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
26 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
27 * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
28 * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
29 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
30 * SOFTWARE.
31 */
32
33 #include <net/tc_act/tc_gact.h>
34 #include <linux/crash_dump.h>
35 #include <net/pkt_cls.h>
36 #include <linux/mlx5/fs.h>
37 #include <net/vxlan.h>
38 #include <linux/bpf.h>
39 #include "en.h"
40 #include "en_tc.h"
41 #include "eswitch.h"
42 #include "vxlan.h"
43
44 struct mlx5e_rq_param {
45 u32 rqc[MLX5_ST_SZ_DW(rqc)];
46 struct mlx5_wq_param wq;
47 };
48
49 struct mlx5e_sq_param {
50 u32 sqc[MLX5_ST_SZ_DW(sqc)];
51 struct mlx5_wq_param wq;
52 };
53
54 struct mlx5e_cq_param {
55 u32 cqc[MLX5_ST_SZ_DW(cqc)];
56 struct mlx5_wq_param wq;
57 u16 eq_ix;
58 u8 cq_period_mode;
59 };
60
61 struct mlx5e_channel_param {
62 struct mlx5e_rq_param rq;
63 struct mlx5e_sq_param sq;
64 struct mlx5e_sq_param xdp_sq;
65 struct mlx5e_sq_param icosq;
66 struct mlx5e_cq_param rx_cq;
67 struct mlx5e_cq_param tx_cq;
68 struct mlx5e_cq_param icosq_cq;
69 };
70
71 static bool mlx5e_check_fragmented_striding_rq_cap(struct mlx5_core_dev *mdev)
72 {
73 return MLX5_CAP_GEN(mdev, striding_rq) &&
74 MLX5_CAP_GEN(mdev, umr_ptr_rlky) &&
75 MLX5_CAP_ETH(mdev, reg_umr_sq);
76 }
77
78 void mlx5e_set_rq_type_params(struct mlx5_core_dev *mdev,
79 struct mlx5e_params *params, u8 rq_type)
80 {
81 params->rq_wq_type = rq_type;
82 params->lro_wqe_sz = MLX5E_PARAMS_DEFAULT_LRO_WQE_SZ;
83 switch (params->rq_wq_type) {
84 case MLX5_WQ_TYPE_LINKED_LIST_STRIDING_RQ:
85 params->log_rq_size = is_kdump_kernel() ?
86 MLX5E_PARAMS_MINIMUM_LOG_RQ_SIZE_MPW :
87 MLX5E_PARAMS_DEFAULT_LOG_RQ_SIZE_MPW;
88 params->mpwqe_log_stride_sz =
89 MLX5E_GET_PFLAG(params, MLX5E_PFLAG_RX_CQE_COMPRESS) ?
90 MLX5_MPWRQ_CQE_CMPRS_LOG_STRIDE_SZ(mdev) :
91 MLX5_MPWRQ_DEF_LOG_STRIDE_SZ(mdev);
92 params->mpwqe_log_num_strides = MLX5_MPWRQ_LOG_WQE_SZ -
93 params->mpwqe_log_stride_sz;
94 break;
95 default: /* MLX5_WQ_TYPE_LINKED_LIST */
96 params->log_rq_size = is_kdump_kernel() ?
97 MLX5E_PARAMS_MINIMUM_LOG_RQ_SIZE :
98 MLX5E_PARAMS_DEFAULT_LOG_RQ_SIZE;
99
100 /* Extra room needed for build_skb */
101 params->lro_wqe_sz -= MLX5_RX_HEADROOM +
102 SKB_DATA_ALIGN(sizeof(struct skb_shared_info));
103 }
104
105 mlx5_core_info(mdev, "MLX5E: StrdRq(%d) RqSz(%ld) StrdSz(%ld) RxCqeCmprss(%d)\n",
106 params->rq_wq_type == MLX5_WQ_TYPE_LINKED_LIST_STRIDING_RQ,
107 BIT(params->log_rq_size),
108 BIT(params->mpwqe_log_stride_sz),
109 MLX5E_GET_PFLAG(params, MLX5E_PFLAG_RX_CQE_COMPRESS));
110 }
111
112 static void mlx5e_set_rq_params(struct mlx5_core_dev *mdev, struct mlx5e_params *params)
113 {
114 u8 rq_type = mlx5e_check_fragmented_striding_rq_cap(mdev) &&
115 !params->xdp_prog ?
116 MLX5_WQ_TYPE_LINKED_LIST_STRIDING_RQ :
117 MLX5_WQ_TYPE_LINKED_LIST;
118 mlx5e_set_rq_type_params(mdev, params, rq_type);
119 }
120
121 static void mlx5e_update_carrier(struct mlx5e_priv *priv)
122 {
123 struct mlx5_core_dev *mdev = priv->mdev;
124 u8 port_state;
125
126 port_state = mlx5_query_vport_state(mdev,
127 MLX5_QUERY_VPORT_STATE_IN_OP_MOD_VNIC_VPORT, 0);
128
129 if (port_state == VPORT_STATE_UP) {
130 netdev_info(priv->netdev, "Link up\n");
131 netif_carrier_on(priv->netdev);
132 } else {
133 netdev_info(priv->netdev, "Link down\n");
134 netif_carrier_off(priv->netdev);
135 }
136 }
137
138 static void mlx5e_update_carrier_work(struct work_struct *work)
139 {
140 struct mlx5e_priv *priv = container_of(work, struct mlx5e_priv,
141 update_carrier_work);
142
143 mutex_lock(&priv->state_lock);
144 if (test_bit(MLX5E_STATE_OPENED, &priv->state))
145 mlx5e_update_carrier(priv);
146 mutex_unlock(&priv->state_lock);
147 }
148
149 static void mlx5e_tx_timeout_work(struct work_struct *work)
150 {
151 struct mlx5e_priv *priv = container_of(work, struct mlx5e_priv,
152 tx_timeout_work);
153 int err;
154
155 rtnl_lock();
156 mutex_lock(&priv->state_lock);
157 if (!test_bit(MLX5E_STATE_OPENED, &priv->state))
158 goto unlock;
159 mlx5e_close_locked(priv->netdev);
160 err = mlx5e_open_locked(priv->netdev);
161 if (err)
162 netdev_err(priv->netdev, "mlx5e_open_locked failed recovering from a tx_timeout, err(%d).\n",
163 err);
164 unlock:
165 mutex_unlock(&priv->state_lock);
166 rtnl_unlock();
167 }
168
169 static void mlx5e_update_sw_counters(struct mlx5e_priv *priv)
170 {
171 struct mlx5e_sw_stats *s = &priv->stats.sw;
172 struct mlx5e_rq_stats *rq_stats;
173 struct mlx5e_sq_stats *sq_stats;
174 u64 tx_offload_none = 0;
175 int i, j;
176
177 memset(s, 0, sizeof(*s));
178 for (i = 0; i < priv->channels.num; i++) {
179 struct mlx5e_channel *c = priv->channels.c[i];
180
181 rq_stats = &c->rq.stats;
182
183 s->rx_packets += rq_stats->packets;
184 s->rx_bytes += rq_stats->bytes;
185 s->rx_lro_packets += rq_stats->lro_packets;
186 s->rx_lro_bytes += rq_stats->lro_bytes;
187 s->rx_csum_none += rq_stats->csum_none;
188 s->rx_csum_complete += rq_stats->csum_complete;
189 s->rx_csum_unnecessary_inner += rq_stats->csum_unnecessary_inner;
190 s->rx_xdp_drop += rq_stats->xdp_drop;
191 s->rx_xdp_tx += rq_stats->xdp_tx;
192 s->rx_xdp_tx_full += rq_stats->xdp_tx_full;
193 s->rx_wqe_err += rq_stats->wqe_err;
194 s->rx_mpwqe_filler += rq_stats->mpwqe_filler;
195 s->rx_buff_alloc_err += rq_stats->buff_alloc_err;
196 s->rx_cqe_compress_blks += rq_stats->cqe_compress_blks;
197 s->rx_cqe_compress_pkts += rq_stats->cqe_compress_pkts;
198 s->rx_cache_reuse += rq_stats->cache_reuse;
199 s->rx_cache_full += rq_stats->cache_full;
200 s->rx_cache_empty += rq_stats->cache_empty;
201 s->rx_cache_busy += rq_stats->cache_busy;
202
203 for (j = 0; j < priv->channels.params.num_tc; j++) {
204 sq_stats = &c->sq[j].stats;
205
206 s->tx_packets += sq_stats->packets;
207 s->tx_bytes += sq_stats->bytes;
208 s->tx_tso_packets += sq_stats->tso_packets;
209 s->tx_tso_bytes += sq_stats->tso_bytes;
210 s->tx_tso_inner_packets += sq_stats->tso_inner_packets;
211 s->tx_tso_inner_bytes += sq_stats->tso_inner_bytes;
212 s->tx_queue_stopped += sq_stats->stopped;
213 s->tx_queue_wake += sq_stats->wake;
214 s->tx_queue_dropped += sq_stats->dropped;
215 s->tx_xmit_more += sq_stats->xmit_more;
216 s->tx_csum_partial_inner += sq_stats->csum_partial_inner;
217 tx_offload_none += sq_stats->csum_none;
218 }
219 }
220
221 /* Update calculated offload counters */
222 s->tx_csum_partial = s->tx_packets - tx_offload_none - s->tx_csum_partial_inner;
223 s->rx_csum_unnecessary = s->rx_packets - s->rx_csum_none - s->rx_csum_complete;
224
225 s->link_down_events_phy = MLX5_GET(ppcnt_reg,
226 priv->stats.pport.phy_counters,
227 counter_set.phys_layer_cntrs.link_down_events);
228 }
229
230 static void mlx5e_update_vport_counters(struct mlx5e_priv *priv)
231 {
232 int outlen = MLX5_ST_SZ_BYTES(query_vport_counter_out);
233 u32 *out = (u32 *)priv->stats.vport.query_vport_out;
234 u32 in[MLX5_ST_SZ_DW(query_vport_counter_in)] = {0};
235 struct mlx5_core_dev *mdev = priv->mdev;
236
237 MLX5_SET(query_vport_counter_in, in, opcode,
238 MLX5_CMD_OP_QUERY_VPORT_COUNTER);
239 MLX5_SET(query_vport_counter_in, in, op_mod, 0);
240 MLX5_SET(query_vport_counter_in, in, other_vport, 0);
241
242 memset(out, 0, outlen);
243 mlx5_cmd_exec(mdev, in, sizeof(in), out, outlen);
244 }
245
246 static void mlx5e_update_pport_counters(struct mlx5e_priv *priv)
247 {
248 struct mlx5e_pport_stats *pstats = &priv->stats.pport;
249 struct mlx5_core_dev *mdev = priv->mdev;
250 int sz = MLX5_ST_SZ_BYTES(ppcnt_reg);
251 int prio;
252 void *out;
253 u32 *in;
254
255 in = mlx5_vzalloc(sz);
256 if (!in)
257 goto free_out;
258
259 MLX5_SET(ppcnt_reg, in, local_port, 1);
260
261 out = pstats->IEEE_802_3_counters;
262 MLX5_SET(ppcnt_reg, in, grp, MLX5_IEEE_802_3_COUNTERS_GROUP);
263 mlx5_core_access_reg(mdev, in, sz, out, sz, MLX5_REG_PPCNT, 0, 0);
264
265 out = pstats->RFC_2863_counters;
266 MLX5_SET(ppcnt_reg, in, grp, MLX5_RFC_2863_COUNTERS_GROUP);
267 mlx5_core_access_reg(mdev, in, sz, out, sz, MLX5_REG_PPCNT, 0, 0);
268
269 out = pstats->RFC_2819_counters;
270 MLX5_SET(ppcnt_reg, in, grp, MLX5_RFC_2819_COUNTERS_GROUP);
271 mlx5_core_access_reg(mdev, in, sz, out, sz, MLX5_REG_PPCNT, 0, 0);
272
273 out = pstats->phy_counters;
274 MLX5_SET(ppcnt_reg, in, grp, MLX5_PHYSICAL_LAYER_COUNTERS_GROUP);
275 mlx5_core_access_reg(mdev, in, sz, out, sz, MLX5_REG_PPCNT, 0, 0);
276
277 if (MLX5_CAP_PCAM_FEATURE(mdev, ppcnt_statistical_group)) {
278 out = pstats->phy_statistical_counters;
279 MLX5_SET(ppcnt_reg, in, grp, MLX5_PHYSICAL_LAYER_STATISTICAL_GROUP);
280 mlx5_core_access_reg(mdev, in, sz, out, sz, MLX5_REG_PPCNT, 0, 0);
281 }
282
283 MLX5_SET(ppcnt_reg, in, grp, MLX5_PER_PRIORITY_COUNTERS_GROUP);
284 for (prio = 0; prio < NUM_PPORT_PRIO; prio++) {
285 out = pstats->per_prio_counters[prio];
286 MLX5_SET(ppcnt_reg, in, prio_tc, prio);
287 mlx5_core_access_reg(mdev, in, sz, out, sz,
288 MLX5_REG_PPCNT, 0, 0);
289 }
290
291 free_out:
292 kvfree(in);
293 }
294
295 static void mlx5e_update_q_counter(struct mlx5e_priv *priv)
296 {
297 struct mlx5e_qcounter_stats *qcnt = &priv->stats.qcnt;
298
299 if (!priv->q_counter)
300 return;
301
302 mlx5_core_query_out_of_buffer(priv->mdev, priv->q_counter,
303 &qcnt->rx_out_of_buffer);
304 }
305
306 static void mlx5e_update_pcie_counters(struct mlx5e_priv *priv)
307 {
308 struct mlx5e_pcie_stats *pcie_stats = &priv->stats.pcie;
309 struct mlx5_core_dev *mdev = priv->mdev;
310 int sz = MLX5_ST_SZ_BYTES(mpcnt_reg);
311 void *out;
312 u32 *in;
313
314 if (!MLX5_CAP_MCAM_FEATURE(mdev, pcie_performance_group))
315 return;
316
317 in = mlx5_vzalloc(sz);
318 if (!in)
319 return;
320
321 out = pcie_stats->pcie_perf_counters;
322 MLX5_SET(mpcnt_reg, in, grp, MLX5_PCIE_PERFORMANCE_COUNTERS_GROUP);
323 mlx5_core_access_reg(mdev, in, sz, out, sz, MLX5_REG_MPCNT, 0, 0);
324
325 kvfree(in);
326 }
327
/* Refresh every statistics group kept in priv->stats.
 *
 * The software counters are updated last: that step reads the
 * physical-layer buffer filled by the pport update.
 */
void mlx5e_update_stats(struct mlx5e_priv *priv)
{
	/* device-sourced counters */
	mlx5e_update_pcie_counters(priv);
	mlx5e_update_pport_counters(priv);
	mlx5e_update_vport_counters(priv);
	mlx5e_update_q_counter(priv);

	/* driver-maintained aggregates */
	mlx5e_update_sw_counters(priv);
}
336
337 void mlx5e_update_stats_work(struct work_struct *work)
338 {
339 struct delayed_work *dwork = to_delayed_work(work);
340 struct mlx5e_priv *priv = container_of(dwork, struct mlx5e_priv,
341 update_stats_work);
342 mutex_lock(&priv->state_lock);
343 if (test_bit(MLX5E_STATE_OPENED, &priv->state)) {
344 priv->profile->update_stats(priv);
345 queue_delayed_work(priv->wq, dwork,
346 msecs_to_jiffies(MLX5E_UPDATE_STATS_INTERVAL));
347 }
348 mutex_unlock(&priv->state_lock);
349 }
350
351 static void mlx5e_async_event(struct mlx5_core_dev *mdev, void *vpriv,
352 enum mlx5_dev_event event, unsigned long param)
353 {
354 struct mlx5e_priv *priv = vpriv;
355 struct ptp_clock_event ptp_event;
356 struct mlx5_eqe *eqe = NULL;
357
358 if (!test_bit(MLX5E_STATE_ASYNC_EVENTS_ENABLED, &priv->state))
359 return;
360
361 switch (event) {
362 case MLX5_DEV_EVENT_PORT_UP:
363 case MLX5_DEV_EVENT_PORT_DOWN:
364 queue_work(priv->wq, &priv->update_carrier_work);
365 break;
366 case MLX5_DEV_EVENT_PPS:
367 eqe = (struct mlx5_eqe *)param;
368 ptp_event.type = PTP_CLOCK_EXTTS;
369 ptp_event.index = eqe->data.pps.pin;
370 ptp_event.timestamp =
371 timecounter_cyc2time(&priv->tstamp.clock,
372 be64_to_cpu(eqe->data.pps.time_stamp));
373 mlx5e_pps_event_handler(vpriv, &ptp_event);
374 break;
375 default:
376 break;
377 }
378 }
379
380 static void mlx5e_enable_async_events(struct mlx5e_priv *priv)
381 {
382 set_bit(MLX5E_STATE_ASYNC_EVENTS_ENABLED, &priv->state);
383 }
384
385 static void mlx5e_disable_async_events(struct mlx5e_priv *priv)
386 {
387 clear_bit(MLX5E_STATE_ASYNC_EVENTS_ENABLED, &priv->state);
388 synchronize_irq(mlx5_get_msix_vec(priv->mdev, MLX5_EQ_VEC_ASYNC));
389 }
390
391 static inline int mlx5e_get_wqe_mtt_sz(void)
392 {
393 /* UMR copies MTTs in units of MLX5_UMR_MTT_ALIGNMENT bytes.
394 * To avoid copying garbage after the mtt array, we allocate
395 * a little more.
396 */
397 return ALIGN(MLX5_MPWRQ_PAGES_PER_WQE * sizeof(__be64),
398 MLX5_UMR_MTT_ALIGNMENT);
399 }
400
401 static inline void mlx5e_build_umr_wqe(struct mlx5e_rq *rq,
402 struct mlx5e_icosq *sq,
403 struct mlx5e_umr_wqe *wqe,
404 u16 ix)
405 {
406 struct mlx5_wqe_ctrl_seg *cseg = &wqe->ctrl;
407 struct mlx5_wqe_umr_ctrl_seg *ucseg = &wqe->uctrl;
408 struct mlx5_wqe_data_seg *dseg = &wqe->data;
409 struct mlx5e_mpw_info *wi = &rq->mpwqe.info[ix];
410 u8 ds_cnt = DIV_ROUND_UP(sizeof(*wqe), MLX5_SEND_WQE_DS);
411 u32 umr_wqe_mtt_offset = mlx5e_get_wqe_mtt_offset(rq, ix);
412
413 cseg->qpn_ds = cpu_to_be32((sq->sqn << MLX5_WQE_CTRL_QPN_SHIFT) |
414 ds_cnt);
415 cseg->fm_ce_se = MLX5_WQE_CTRL_CQ_UPDATE;
416 cseg->imm = rq->mkey_be;
417
418 ucseg->flags = MLX5_UMR_TRANSLATION_OFFSET_EN;
419 ucseg->xlt_octowords =
420 cpu_to_be16(MLX5_MTT_OCTW(MLX5_MPWRQ_PAGES_PER_WQE));
421 ucseg->bsf_octowords =
422 cpu_to_be16(MLX5_MTT_OCTW(umr_wqe_mtt_offset));
423 ucseg->mkey_mask = cpu_to_be64(MLX5_MKEY_MASK_FREE);
424
425 dseg->lkey = sq->mkey_be;
426 dseg->addr = cpu_to_be64(wi->umr.mtt_addr);
427 }
428
429 static int mlx5e_rq_alloc_mpwqe_info(struct mlx5e_rq *rq,
430 struct mlx5e_channel *c)
431 {
432 int wq_sz = mlx5_wq_ll_get_size(&rq->wq);
433 int mtt_sz = mlx5e_get_wqe_mtt_sz();
434 int mtt_alloc = mtt_sz + MLX5_UMR_ALIGN - 1;
435 int i;
436
437 rq->mpwqe.info = kzalloc_node(wq_sz * sizeof(*rq->mpwqe.info),
438 GFP_KERNEL, cpu_to_node(c->cpu));
439 if (!rq->mpwqe.info)
440 goto err_out;
441
442 /* We allocate more than mtt_sz as we will align the pointer */
443 rq->mpwqe.mtt_no_align = kzalloc_node(mtt_alloc * wq_sz, GFP_KERNEL,
444 cpu_to_node(c->cpu));
445 if (unlikely(!rq->mpwqe.mtt_no_align))
446 goto err_free_wqe_info;
447
448 for (i = 0; i < wq_sz; i++) {
449 struct mlx5e_mpw_info *wi = &rq->mpwqe.info[i];
450
451 wi->umr.mtt = PTR_ALIGN(rq->mpwqe.mtt_no_align + i * mtt_alloc,
452 MLX5_UMR_ALIGN);
453 wi->umr.mtt_addr = dma_map_single(c->pdev, wi->umr.mtt, mtt_sz,
454 PCI_DMA_TODEVICE);
455 if (unlikely(dma_mapping_error(c->pdev, wi->umr.mtt_addr)))
456 goto err_unmap_mtts;
457
458 mlx5e_build_umr_wqe(rq, &c->icosq, &wi->umr.wqe, i);
459 }
460
461 return 0;
462
463 err_unmap_mtts:
464 while (--i >= 0) {
465 struct mlx5e_mpw_info *wi = &rq->mpwqe.info[i];
466
467 dma_unmap_single(c->pdev, wi->umr.mtt_addr, mtt_sz,
468 PCI_DMA_TODEVICE);
469 }
470 kfree(rq->mpwqe.mtt_no_align);
471 err_free_wqe_info:
472 kfree(rq->mpwqe.info);
473
474 err_out:
475 return -ENOMEM;
476 }
477
478 static void mlx5e_rq_free_mpwqe_info(struct mlx5e_rq *rq)
479 {
480 int wq_sz = mlx5_wq_ll_get_size(&rq->wq);
481 int mtt_sz = mlx5e_get_wqe_mtt_sz();
482 int i;
483
484 for (i = 0; i < wq_sz; i++) {
485 struct mlx5e_mpw_info *wi = &rq->mpwqe.info[i];
486
487 dma_unmap_single(rq->pdev, wi->umr.mtt_addr, mtt_sz,
488 PCI_DMA_TODEVICE);
489 }
490 kfree(rq->mpwqe.mtt_no_align);
491 kfree(rq->mpwqe.info);
492 }
493
494 static int mlx5e_create_umr_mkey(struct mlx5_core_dev *mdev,
495 u64 npages, u8 page_shift,
496 struct mlx5_core_mkey *umr_mkey)
497 {
498 int inlen = MLX5_ST_SZ_BYTES(create_mkey_in);
499 void *mkc;
500 u32 *in;
501 int err;
502
503 if (!MLX5E_VALID_NUM_MTTS(npages))
504 return -EINVAL;
505
506 in = mlx5_vzalloc(inlen);
507 if (!in)
508 return -ENOMEM;
509
510 mkc = MLX5_ADDR_OF(create_mkey_in, in, memory_key_mkey_entry);
511
512 MLX5_SET(mkc, mkc, free, 1);
513 MLX5_SET(mkc, mkc, umr_en, 1);
514 MLX5_SET(mkc, mkc, lw, 1);
515 MLX5_SET(mkc, mkc, lr, 1);
516 MLX5_SET(mkc, mkc, access_mode, MLX5_MKC_ACCESS_MODE_MTT);
517
518 MLX5_SET(mkc, mkc, qpn, 0xffffff);
519 MLX5_SET(mkc, mkc, pd, mdev->mlx5e_res.pdn);
520 MLX5_SET64(mkc, mkc, len, npages << page_shift);
521 MLX5_SET(mkc, mkc, translations_octword_size,
522 MLX5_MTT_OCTW(npages));
523 MLX5_SET(mkc, mkc, log_page_size, page_shift);
524
525 err = mlx5_core_create_mkey(mdev, umr_mkey, in, inlen);
526
527 kvfree(in);
528 return err;
529 }
530
531 static int mlx5e_create_rq_umr_mkey(struct mlx5_core_dev *mdev, struct mlx5e_rq *rq)
532 {
533 u64 num_mtts = MLX5E_REQUIRED_MTTS(mlx5_wq_ll_get_size(&rq->wq));
534
535 return mlx5e_create_umr_mkey(mdev, num_mtts, PAGE_SHIFT, &rq->umr_mkey);
536 }
537
538 static int mlx5e_alloc_rq(struct mlx5e_channel *c,
539 struct mlx5e_params *params,
540 struct mlx5e_rq_param *rqp,
541 struct mlx5e_rq *rq)
542 {
543 struct mlx5_core_dev *mdev = c->mdev;
544 void *rqc = rqp->rqc;
545 void *rqc_wq = MLX5_ADDR_OF(rqc, rqc, wq);
546 u32 byte_count;
547 u32 frag_sz;
548 int npages;
549 int wq_sz;
550 int err;
551 int i;
552
553 rqp->wq.db_numa_node = cpu_to_node(c->cpu);
554
555 err = mlx5_wq_ll_create(mdev, &rqp->wq, rqc_wq, &rq->wq,
556 &rq->wq_ctrl);
557 if (err)
558 return err;
559
560 rq->wq.db = &rq->wq.db[MLX5_RCV_DBR];
561
562 wq_sz = mlx5_wq_ll_get_size(&rq->wq);
563
564 rq->wq_type = params->rq_wq_type;
565 rq->pdev = c->pdev;
566 rq->netdev = c->netdev;
567 rq->tstamp = c->tstamp;
568 rq->channel = c;
569 rq->ix = c->ix;
570 rq->mdev = mdev;
571
572 rq->xdp_prog = params->xdp_prog ? bpf_prog_inc(params->xdp_prog) : NULL;
573 if (IS_ERR(rq->xdp_prog)) {
574 err = PTR_ERR(rq->xdp_prog);
575 rq->xdp_prog = NULL;
576 goto err_rq_wq_destroy;
577 }
578
579 if (rq->xdp_prog) {
580 rq->buff.map_dir = DMA_BIDIRECTIONAL;
581 rq->rx_headroom = XDP_PACKET_HEADROOM;
582 } else {
583 rq->buff.map_dir = DMA_FROM_DEVICE;
584 rq->rx_headroom = MLX5_RX_HEADROOM;
585 }
586
587 switch (rq->wq_type) {
588 case MLX5_WQ_TYPE_LINKED_LIST_STRIDING_RQ:
589 if (mlx5e_is_vf_vport_rep(c->priv)) {
590 err = -EINVAL;
591 goto err_rq_wq_destroy;
592 }
593
594 rq->handle_rx_cqe = mlx5e_handle_rx_cqe_mpwrq;
595 rq->alloc_wqe = mlx5e_alloc_rx_mpwqe;
596 rq->dealloc_wqe = mlx5e_dealloc_rx_mpwqe;
597
598 rq->mpwqe_stride_sz = BIT(params->mpwqe_log_stride_sz);
599 rq->mpwqe_num_strides = BIT(params->mpwqe_log_num_strides);
600
601 rq->buff.wqe_sz = rq->mpwqe_stride_sz * rq->mpwqe_num_strides;
602 byte_count = rq->buff.wqe_sz;
603
604 err = mlx5e_create_rq_umr_mkey(mdev, rq);
605 if (err)
606 goto err_rq_wq_destroy;
607 rq->mkey_be = cpu_to_be32(rq->umr_mkey.key);
608
609 err = mlx5e_rq_alloc_mpwqe_info(rq, c);
610 if (err)
611 goto err_destroy_umr_mkey;
612 break;
613 default: /* MLX5_WQ_TYPE_LINKED_LIST */
614 rq->dma_info = kzalloc_node(wq_sz * sizeof(*rq->dma_info),
615 GFP_KERNEL, cpu_to_node(c->cpu));
616 if (!rq->dma_info) {
617 err = -ENOMEM;
618 goto err_rq_wq_destroy;
619 }
620
621 if (mlx5e_is_vf_vport_rep(c->priv))
622 rq->handle_rx_cqe = mlx5e_handle_rx_cqe_rep;
623 else
624 rq->handle_rx_cqe = mlx5e_handle_rx_cqe;
625
626 rq->alloc_wqe = mlx5e_alloc_rx_wqe;
627 rq->dealloc_wqe = mlx5e_dealloc_rx_wqe;
628
629 rq->buff.wqe_sz = params->lro_en ?
630 params->lro_wqe_sz :
631 MLX5E_SW2HW_MTU(c->netdev->mtu);
632 byte_count = rq->buff.wqe_sz;
633
634 /* calc the required page order */
635 frag_sz = rq->rx_headroom +
636 byte_count /* packet data */ +
637 SKB_DATA_ALIGN(sizeof(struct skb_shared_info));
638 frag_sz = SKB_DATA_ALIGN(frag_sz);
639
640 npages = DIV_ROUND_UP(frag_sz, PAGE_SIZE);
641 rq->buff.page_order = order_base_2(npages);
642
643 byte_count |= MLX5_HW_START_PADDING;
644 rq->mkey_be = c->mkey_be;
645 }
646
647 for (i = 0; i < wq_sz; i++) {
648 struct mlx5e_rx_wqe *wqe = mlx5_wq_ll_get_wqe(&rq->wq, i);
649
650 wqe->data.byte_count = cpu_to_be32(byte_count);
651 wqe->data.lkey = rq->mkey_be;
652 }
653
654 INIT_WORK(&rq->am.work, mlx5e_rx_am_work);
655 rq->am.mode = params->rx_cq_period_mode;
656 rq->page_cache.head = 0;
657 rq->page_cache.tail = 0;
658
659 return 0;
660
661 err_destroy_umr_mkey:
662 mlx5_core_destroy_mkey(mdev, &rq->umr_mkey);
663
664 err_rq_wq_destroy:
665 if (rq->xdp_prog)
666 bpf_prog_put(rq->xdp_prog);
667 mlx5_wq_destroy(&rq->wq_ctrl);
668
669 return err;
670 }
671
672 static void mlx5e_free_rq(struct mlx5e_rq *rq)
673 {
674 int i;
675
676 if (rq->xdp_prog)
677 bpf_prog_put(rq->xdp_prog);
678
679 switch (rq->wq_type) {
680 case MLX5_WQ_TYPE_LINKED_LIST_STRIDING_RQ:
681 mlx5e_rq_free_mpwqe_info(rq);
682 mlx5_core_destroy_mkey(rq->mdev, &rq->umr_mkey);
683 break;
684 default: /* MLX5_WQ_TYPE_LINKED_LIST */
685 kfree(rq->dma_info);
686 }
687
688 for (i = rq->page_cache.head; i != rq->page_cache.tail;
689 i = (i + 1) & (MLX5E_CACHE_SIZE - 1)) {
690 struct mlx5e_dma_info *dma_info = &rq->page_cache.page_cache[i];
691
692 mlx5e_page_release(rq, dma_info, false);
693 }
694 mlx5_wq_destroy(&rq->wq_ctrl);
695 }
696
697 static int mlx5e_create_rq(struct mlx5e_rq *rq,
698 struct mlx5e_rq_param *param)
699 {
700 struct mlx5_core_dev *mdev = rq->mdev;
701
702 void *in;
703 void *rqc;
704 void *wq;
705 int inlen;
706 int err;
707
708 inlen = MLX5_ST_SZ_BYTES(create_rq_in) +
709 sizeof(u64) * rq->wq_ctrl.buf.npages;
710 in = mlx5_vzalloc(inlen);
711 if (!in)
712 return -ENOMEM;
713
714 rqc = MLX5_ADDR_OF(create_rq_in, in, ctx);
715 wq = MLX5_ADDR_OF(rqc, rqc, wq);
716
717 memcpy(rqc, param->rqc, sizeof(param->rqc));
718
719 MLX5_SET(rqc, rqc, cqn, rq->cq.mcq.cqn);
720 MLX5_SET(rqc, rqc, state, MLX5_RQC_STATE_RST);
721 MLX5_SET(wq, wq, log_wq_pg_sz, rq->wq_ctrl.buf.page_shift -
722 MLX5_ADAPTER_PAGE_SHIFT);
723 MLX5_SET64(wq, wq, dbr_addr, rq->wq_ctrl.db.dma);
724
725 mlx5_fill_page_array(&rq->wq_ctrl.buf,
726 (__be64 *)MLX5_ADDR_OF(wq, wq, pas));
727
728 err = mlx5_core_create_rq(mdev, in, inlen, &rq->rqn);
729
730 kvfree(in);
731
732 return err;
733 }
734
735 static int mlx5e_modify_rq_state(struct mlx5e_rq *rq, int curr_state,
736 int next_state)
737 {
738 struct mlx5e_channel *c = rq->channel;
739 struct mlx5_core_dev *mdev = c->mdev;
740
741 void *in;
742 void *rqc;
743 int inlen;
744 int err;
745
746 inlen = MLX5_ST_SZ_BYTES(modify_rq_in);
747 in = mlx5_vzalloc(inlen);
748 if (!in)
749 return -ENOMEM;
750
751 rqc = MLX5_ADDR_OF(modify_rq_in, in, ctx);
752
753 MLX5_SET(modify_rq_in, in, rq_state, curr_state);
754 MLX5_SET(rqc, rqc, state, next_state);
755
756 err = mlx5_core_modify_rq(mdev, rq->rqn, in, inlen);
757
758 kvfree(in);
759
760 return err;
761 }
762
763 static int mlx5e_modify_rq_scatter_fcs(struct mlx5e_rq *rq, bool enable)
764 {
765 struct mlx5e_channel *c = rq->channel;
766 struct mlx5e_priv *priv = c->priv;
767 struct mlx5_core_dev *mdev = priv->mdev;
768
769 void *in;
770 void *rqc;
771 int inlen;
772 int err;
773
774 inlen = MLX5_ST_SZ_BYTES(modify_rq_in);
775 in = mlx5_vzalloc(inlen);
776 if (!in)
777 return -ENOMEM;
778
779 rqc = MLX5_ADDR_OF(modify_rq_in, in, ctx);
780
781 MLX5_SET(modify_rq_in, in, rq_state, MLX5_RQC_STATE_RDY);
782 MLX5_SET64(modify_rq_in, in, modify_bitmask,
783 MLX5_MODIFY_RQ_IN_MODIFY_BITMASK_SCATTER_FCS);
784 MLX5_SET(rqc, rqc, scatter_fcs, enable);
785 MLX5_SET(rqc, rqc, state, MLX5_RQC_STATE_RDY);
786
787 err = mlx5_core_modify_rq(mdev, rq->rqn, in, inlen);
788
789 kvfree(in);
790
791 return err;
792 }
793
794 static int mlx5e_modify_rq_vsd(struct mlx5e_rq *rq, bool vsd)
795 {
796 struct mlx5e_channel *c = rq->channel;
797 struct mlx5_core_dev *mdev = c->mdev;
798 void *in;
799 void *rqc;
800 int inlen;
801 int err;
802
803 inlen = MLX5_ST_SZ_BYTES(modify_rq_in);
804 in = mlx5_vzalloc(inlen);
805 if (!in)
806 return -ENOMEM;
807
808 rqc = MLX5_ADDR_OF(modify_rq_in, in, ctx);
809
810 MLX5_SET(modify_rq_in, in, rq_state, MLX5_RQC_STATE_RDY);
811 MLX5_SET64(modify_rq_in, in, modify_bitmask,
812 MLX5_MODIFY_RQ_IN_MODIFY_BITMASK_VSD);
813 MLX5_SET(rqc, rqc, vsd, vsd);
814 MLX5_SET(rqc, rqc, state, MLX5_RQC_STATE_RDY);
815
816 err = mlx5_core_modify_rq(mdev, rq->rqn, in, inlen);
817
818 kvfree(in);
819
820 return err;
821 }
822
823 static void mlx5e_destroy_rq(struct mlx5e_rq *rq)
824 {
825 mlx5_core_destroy_rq(rq->mdev, rq->rqn);
826 }
827
828 static int mlx5e_wait_for_min_rx_wqes(struct mlx5e_rq *rq)
829 {
830 unsigned long exp_time = jiffies + msecs_to_jiffies(20000);
831 struct mlx5e_channel *c = rq->channel;
832
833 struct mlx5_wq_ll *wq = &rq->wq;
834 u16 min_wqes = mlx5_min_rx_wqes(rq->wq_type, mlx5_wq_ll_get_size(wq));
835
836 while (time_before(jiffies, exp_time)) {
837 if (wq->cur_sz >= min_wqes)
838 return 0;
839
840 msleep(20);
841 }
842
843 netdev_warn(c->netdev, "Failed to get min RX wqes on RQN[0x%x] wq cur_sz(%d) min_rx_wqes(%d)\n",
844 rq->rqn, wq->cur_sz, min_wqes);
845 return -ETIMEDOUT;
846 }
847
848 static void mlx5e_free_rx_descs(struct mlx5e_rq *rq)
849 {
850 struct mlx5_wq_ll *wq = &rq->wq;
851 struct mlx5e_rx_wqe *wqe;
852 __be16 wqe_ix_be;
853 u16 wqe_ix;
854
855 /* UMR WQE (if in progress) is always at wq->head */
856 if (test_bit(MLX5E_RQ_STATE_UMR_WQE_IN_PROGRESS, &rq->state))
857 mlx5e_free_rx_mpwqe(rq, &rq->mpwqe.info[wq->head]);
858
859 while (!mlx5_wq_ll_is_empty(wq)) {
860 wqe_ix_be = *wq->tail_next;
861 wqe_ix = be16_to_cpu(wqe_ix_be);
862 wqe = mlx5_wq_ll_get_wqe(&rq->wq, wqe_ix);
863 rq->dealloc_wqe(rq, wqe_ix);
864 mlx5_wq_ll_pop(&rq->wq, wqe_ix_be,
865 &wqe->next.next_wqe_index);
866 }
867 }
868
869 static int mlx5e_open_rq(struct mlx5e_channel *c,
870 struct mlx5e_params *params,
871 struct mlx5e_rq_param *param,
872 struct mlx5e_rq *rq)
873 {
874 int err;
875
876 err = mlx5e_alloc_rq(c, params, param, rq);
877 if (err)
878 return err;
879
880 err = mlx5e_create_rq(rq, param);
881 if (err)
882 goto err_free_rq;
883
884 err = mlx5e_modify_rq_state(rq, MLX5_RQC_STATE_RST, MLX5_RQC_STATE_RDY);
885 if (err)
886 goto err_destroy_rq;
887
888 if (params->rx_am_enabled)
889 set_bit(MLX5E_RQ_STATE_AM, &c->rq.state);
890
891 return 0;
892
893 err_destroy_rq:
894 mlx5e_destroy_rq(rq);
895 err_free_rq:
896 mlx5e_free_rq(rq);
897
898 return err;
899 }
900
901 static void mlx5e_activate_rq(struct mlx5e_rq *rq)
902 {
903 struct mlx5e_icosq *sq = &rq->channel->icosq;
904 u16 pi = sq->pc & sq->wq.sz_m1;
905 struct mlx5e_tx_wqe *nopwqe;
906
907 set_bit(MLX5E_RQ_STATE_ENABLED, &rq->state);
908 sq->db.ico_wqe[pi].opcode = MLX5_OPCODE_NOP;
909 sq->db.ico_wqe[pi].num_wqebbs = 1;
910 nopwqe = mlx5e_post_nop(&sq->wq, sq->sqn, &sq->pc);
911 mlx5e_notify_hw(&sq->wq, sq->pc, sq->uar_map, &nopwqe->ctrl);
912 }
913
914 static void mlx5e_deactivate_rq(struct mlx5e_rq *rq)
915 {
916 clear_bit(MLX5E_RQ_STATE_ENABLED, &rq->state);
917 napi_synchronize(&rq->channel->napi); /* prevent mlx5e_post_rx_wqes */
918 }
919
920 static void mlx5e_close_rq(struct mlx5e_rq *rq)
921 {
922 cancel_work_sync(&rq->am.work);
923 mlx5e_destroy_rq(rq);
924 mlx5e_free_rx_descs(rq);
925 mlx5e_free_rq(rq);
926 }
927
928 static void mlx5e_free_xdpsq_db(struct mlx5e_xdpsq *sq)
929 {
930 kfree(sq->db.di);
931 }
932
933 static int mlx5e_alloc_xdpsq_db(struct mlx5e_xdpsq *sq, int numa)
934 {
935 int wq_sz = mlx5_wq_cyc_get_size(&sq->wq);
936
937 sq->db.di = kzalloc_node(sizeof(*sq->db.di) * wq_sz,
938 GFP_KERNEL, numa);
939 if (!sq->db.di) {
940 mlx5e_free_xdpsq_db(sq);
941 return -ENOMEM;
942 }
943
944 return 0;
945 }
946
947 static int mlx5e_alloc_xdpsq(struct mlx5e_channel *c,
948 struct mlx5e_params *params,
949 struct mlx5e_sq_param *param,
950 struct mlx5e_xdpsq *sq)
951 {
952 void *sqc_wq = MLX5_ADDR_OF(sqc, param->sqc, wq);
953 struct mlx5_core_dev *mdev = c->mdev;
954 int err;
955
956 sq->pdev = c->pdev;
957 sq->mkey_be = c->mkey_be;
958 sq->channel = c;
959 sq->uar_map = mdev->mlx5e_res.bfreg.map;
960 sq->min_inline_mode = params->tx_min_inline_mode;
961
962 param->wq.db_numa_node = cpu_to_node(c->cpu);
963 err = mlx5_wq_cyc_create(mdev, &param->wq, sqc_wq, &sq->wq, &sq->wq_ctrl);
964 if (err)
965 return err;
966 sq->wq.db = &sq->wq.db[MLX5_SND_DBR];
967
968 err = mlx5e_alloc_xdpsq_db(sq, cpu_to_node(c->cpu));
969 if (err)
970 goto err_sq_wq_destroy;
971
972 return 0;
973
974 err_sq_wq_destroy:
975 mlx5_wq_destroy(&sq->wq_ctrl);
976
977 return err;
978 }
979
980 static void mlx5e_free_xdpsq(struct mlx5e_xdpsq *sq)
981 {
982 mlx5e_free_xdpsq_db(sq);
983 mlx5_wq_destroy(&sq->wq_ctrl);
984 }
985
986 static void mlx5e_free_icosq_db(struct mlx5e_icosq *sq)
987 {
988 kfree(sq->db.ico_wqe);
989 }
990
991 static int mlx5e_alloc_icosq_db(struct mlx5e_icosq *sq, int numa)
992 {
993 u8 wq_sz = mlx5_wq_cyc_get_size(&sq->wq);
994
995 sq->db.ico_wqe = kzalloc_node(sizeof(*sq->db.ico_wqe) * wq_sz,
996 GFP_KERNEL, numa);
997 if (!sq->db.ico_wqe)
998 return -ENOMEM;
999
1000 return 0;
1001 }
1002
1003 static int mlx5e_alloc_icosq(struct mlx5e_channel *c,
1004 struct mlx5e_sq_param *param,
1005 struct mlx5e_icosq *sq)
1006 {
1007 void *sqc_wq = MLX5_ADDR_OF(sqc, param->sqc, wq);
1008 struct mlx5_core_dev *mdev = c->mdev;
1009 int err;
1010
1011 sq->pdev = c->pdev;
1012 sq->mkey_be = c->mkey_be;
1013 sq->channel = c;
1014 sq->uar_map = mdev->mlx5e_res.bfreg.map;
1015
1016 param->wq.db_numa_node = cpu_to_node(c->cpu);
1017 err = mlx5_wq_cyc_create(mdev, &param->wq, sqc_wq, &sq->wq, &sq->wq_ctrl);
1018 if (err)
1019 return err;
1020 sq->wq.db = &sq->wq.db[MLX5_SND_DBR];
1021
1022 err = mlx5e_alloc_icosq_db(sq, cpu_to_node(c->cpu));
1023 if (err)
1024 goto err_sq_wq_destroy;
1025
1026 sq->edge = (sq->wq.sz_m1 + 1) - MLX5E_ICOSQ_MAX_WQEBBS;
1027
1028 return 0;
1029
1030 err_sq_wq_destroy:
1031 mlx5_wq_destroy(&sq->wq_ctrl);
1032
1033 return err;
1034 }
1035
1036 static void mlx5e_free_icosq(struct mlx5e_icosq *sq)
1037 {
1038 mlx5e_free_icosq_db(sq);
1039 mlx5_wq_destroy(&sq->wq_ctrl);
1040 }
1041
1042 static void mlx5e_free_txqsq_db(struct mlx5e_txqsq *sq)
1043 {
1044 kfree(sq->db.wqe_info);
1045 kfree(sq->db.dma_fifo);
1046 kfree(sq->db.skb);
1047 }
1048
1049 static int mlx5e_alloc_txqsq_db(struct mlx5e_txqsq *sq, int numa)
1050 {
1051 int wq_sz = mlx5_wq_cyc_get_size(&sq->wq);
1052 int df_sz = wq_sz * MLX5_SEND_WQEBB_NUM_DS;
1053
1054 sq->db.skb = kzalloc_node(wq_sz * sizeof(*sq->db.skb),
1055 GFP_KERNEL, numa);
1056 sq->db.dma_fifo = kzalloc_node(df_sz * sizeof(*sq->db.dma_fifo),
1057 GFP_KERNEL, numa);
1058 sq->db.wqe_info = kzalloc_node(wq_sz * sizeof(*sq->db.wqe_info),
1059 GFP_KERNEL, numa);
1060 if (!sq->db.skb || !sq->db.dma_fifo || !sq->db.wqe_info) {
1061 mlx5e_free_txqsq_db(sq);
1062 return -ENOMEM;
1063 }
1064
1065 sq->dma_fifo_mask = df_sz - 1;
1066
1067 return 0;
1068 }
1069
1070 static int mlx5e_alloc_txqsq(struct mlx5e_channel *c,
1071 int txq_ix,
1072 struct mlx5e_params *params,
1073 struct mlx5e_sq_param *param,
1074 struct mlx5e_txqsq *sq)
1075 {
1076 void *sqc_wq = MLX5_ADDR_OF(sqc, param->sqc, wq);
1077 struct mlx5_core_dev *mdev = c->mdev;
1078 int err;
1079
1080 sq->pdev = c->pdev;
1081 sq->tstamp = c->tstamp;
1082 sq->mkey_be = c->mkey_be;
1083 sq->channel = c;
1084 sq->txq_ix = txq_ix;
1085 sq->uar_map = mdev->mlx5e_res.bfreg.map;
1086 sq->max_inline = params->tx_max_inline;
1087 sq->min_inline_mode = params->tx_min_inline_mode;
1088
1089 param->wq.db_numa_node = cpu_to_node(c->cpu);
1090 err = mlx5_wq_cyc_create(mdev, &param->wq, sqc_wq, &sq->wq, &sq->wq_ctrl);
1091 if (err)
1092 return err;
1093 sq->wq.db = &sq->wq.db[MLX5_SND_DBR];
1094
1095 err = mlx5e_alloc_txqsq_db(sq, cpu_to_node(c->cpu));
1096 if (err)
1097 goto err_sq_wq_destroy;
1098
1099 sq->edge = (sq->wq.sz_m1 + 1) - MLX5_SEND_WQE_MAX_WQEBBS;
1100
1101 return 0;
1102
1103 err_sq_wq_destroy:
1104 mlx5_wq_destroy(&sq->wq_ctrl);
1105
1106 return err;
1107 }
1108
1109 static void mlx5e_free_txqsq(struct mlx5e_txqsq *sq)
1110 {
1111 mlx5e_free_txqsq_db(sq);
1112 mlx5_wq_destroy(&sq->wq_ctrl);
1113 }
1114
/* Per-SQ inputs consumed by mlx5e_create_sq() when filling the SQ context. */
struct mlx5e_create_sq_param {
	struct mlx5_wq_ctrl *wq_ctrl;	/* WQ buffer and doorbell of the SQ */
	u32 cqn;			/* written to sqc.cqn */
	u32 tisn;			/* written to sqc.tis_num_0 */
	u8 tis_lst_sz;			/* written to sqc.tis_lst_sz */
	u8 min_inline_mode;		/* written to sqc.min_wqe_inline_mode when applicable */
};
1122
1123 static int mlx5e_create_sq(struct mlx5_core_dev *mdev,
1124 struct mlx5e_sq_param *param,
1125 struct mlx5e_create_sq_param *csp,
1126 u32 *sqn)
1127 {
1128 void *in;
1129 void *sqc;
1130 void *wq;
1131 int inlen;
1132 int err;
1133
1134 inlen = MLX5_ST_SZ_BYTES(create_sq_in) +
1135 sizeof(u64) * csp->wq_ctrl->buf.npages;
1136 in = mlx5_vzalloc(inlen);
1137 if (!in)
1138 return -ENOMEM;
1139
1140 sqc = MLX5_ADDR_OF(create_sq_in, in, ctx);
1141 wq = MLX5_ADDR_OF(sqc, sqc, wq);
1142
1143 memcpy(sqc, param->sqc, sizeof(param->sqc));
1144 MLX5_SET(sqc, sqc, tis_lst_sz, csp->tis_lst_sz);
1145 MLX5_SET(sqc, sqc, tis_num_0, csp->tisn);
1146 MLX5_SET(sqc, sqc, cqn, csp->cqn);
1147
1148 if (MLX5_CAP_ETH(mdev, wqe_inline_mode) == MLX5_CAP_INLINE_MODE_VPORT_CONTEXT)
1149 MLX5_SET(sqc, sqc, min_wqe_inline_mode, csp->min_inline_mode);
1150
1151 MLX5_SET(sqc, sqc, state, MLX5_SQC_STATE_RST);
1152
1153 MLX5_SET(wq, wq, wq_type, MLX5_WQ_TYPE_CYCLIC);
1154 MLX5_SET(wq, wq, uar_page, mdev->mlx5e_res.bfreg.index);
1155 MLX5_SET(wq, wq, log_wq_pg_sz, csp->wq_ctrl->buf.page_shift -
1156 MLX5_ADAPTER_PAGE_SHIFT);
1157 MLX5_SET64(wq, wq, dbr_addr, csp->wq_ctrl->db.dma);
1158
1159 mlx5_fill_page_array(&csp->wq_ctrl->buf, (__be64 *)MLX5_ADDR_OF(wq, wq, pas));
1160
1161 err = mlx5_core_create_sq(mdev, in, inlen, sqn);
1162
1163 kvfree(in);
1164
1165 return err;
1166 }
1167
/* Inputs for mlx5e_modify_sq(): a state transition plus an optional rate-limit update. */
struct mlx5e_modify_sq_param {
	int curr_state;		/* written to modify_sq_in.sq_state */
	int next_state;		/* written to sqc.state */
	bool rl_update;		/* when set (and next_state is RDY), rl_index is applied */
	int rl_index;		/* written to sqc.packet_pacing_rate_limit_index */
};
1174
1175 static int mlx5e_modify_sq(struct mlx5_core_dev *mdev, u32 sqn,
1176 struct mlx5e_modify_sq_param *p)
1177 {
1178 void *in;
1179 void *sqc;
1180 int inlen;
1181 int err;
1182
1183 inlen = MLX5_ST_SZ_BYTES(modify_sq_in);
1184 in = mlx5_vzalloc(inlen);
1185 if (!in)
1186 return -ENOMEM;
1187
1188 sqc = MLX5_ADDR_OF(modify_sq_in, in, ctx);
1189
1190 MLX5_SET(modify_sq_in, in, sq_state, p->curr_state);
1191 MLX5_SET(sqc, sqc, state, p->next_state);
1192 if (p->rl_update && p->next_state == MLX5_SQC_STATE_RDY) {
1193 MLX5_SET64(modify_sq_in, in, modify_bitmask, 1);
1194 MLX5_SET(sqc, sqc, packet_pacing_rate_limit_index, p->rl_index);
1195 }
1196
1197 err = mlx5_core_modify_sq(mdev, sqn, in, inlen);
1198
1199 kvfree(in);
1200
1201 return err;
1202 }
1203
1204 static void mlx5e_destroy_sq(struct mlx5_core_dev *mdev, u32 sqn)
1205 {
1206 mlx5_core_destroy_sq(mdev, sqn);
1207 }
1208
1209 static int mlx5e_create_sq_rdy(struct mlx5_core_dev *mdev,
1210 struct mlx5e_sq_param *param,
1211 struct mlx5e_create_sq_param *csp,
1212 u32 *sqn)
1213 {
1214 struct mlx5e_modify_sq_param msp = {0};
1215 int err;
1216
1217 err = mlx5e_create_sq(mdev, param, csp, sqn);
1218 if (err)
1219 return err;
1220
1221 msp.curr_state = MLX5_SQC_STATE_RST;
1222 msp.next_state = MLX5_SQC_STATE_RDY;
1223 err = mlx5e_modify_sq(mdev, *sqn, &msp);
1224 if (err)
1225 mlx5e_destroy_sq(mdev, *sqn);
1226
1227 return err;
1228 }
1229
/* Forward declaration: mlx5e_open_txqsq() calls this before its definition. */
static int mlx5e_set_sq_maxrate(struct net_device *dev,
				struct mlx5e_txqsq *sq, u32 rate);
1232
1233 static int mlx5e_open_txqsq(struct mlx5e_channel *c,
1234 u32 tisn,
1235 int txq_ix,
1236 struct mlx5e_params *params,
1237 struct mlx5e_sq_param *param,
1238 struct mlx5e_txqsq *sq)
1239 {
1240 struct mlx5e_create_sq_param csp = {};
1241 u32 tx_rate;
1242 int err;
1243
1244 err = mlx5e_alloc_txqsq(c, txq_ix, params, param, sq);
1245 if (err)
1246 return err;
1247
1248 csp.tisn = tisn;
1249 csp.tis_lst_sz = 1;
1250 csp.cqn = sq->cq.mcq.cqn;
1251 csp.wq_ctrl = &sq->wq_ctrl;
1252 csp.min_inline_mode = sq->min_inline_mode;
1253 err = mlx5e_create_sq_rdy(c->mdev, param, &csp, &sq->sqn);
1254 if (err)
1255 goto err_free_txqsq;
1256
1257 tx_rate = c->priv->tx_rates[sq->txq_ix];
1258 if (tx_rate)
1259 mlx5e_set_sq_maxrate(c->netdev, sq, tx_rate);
1260
1261 return 0;
1262
1263 err_free_txqsq:
1264 clear_bit(MLX5E_SQ_STATE_ENABLED, &sq->state);
1265 mlx5e_free_txqsq(sq);
1266
1267 return err;
1268 }
1269
1270 static void mlx5e_activate_txqsq(struct mlx5e_txqsq *sq)
1271 {
1272 sq->txq = netdev_get_tx_queue(sq->channel->netdev, sq->txq_ix);
1273 set_bit(MLX5E_SQ_STATE_ENABLED, &sq->state);
1274 netdev_tx_reset_queue(sq->txq);
1275 netif_tx_start_queue(sq->txq);
1276 }
1277
/* Stop a single TX queue while holding its TX lock (BH-disabling variant). */
static inline void netif_tx_disable_queue(struct netdev_queue *txq)
{
	__netif_tx_lock_bh(txq);
	netif_tx_stop_queue(txq);
	__netif_tx_unlock_bh(txq);
}
1284
1285 static void mlx5e_deactivate_txqsq(struct mlx5e_txqsq *sq)
1286 {
1287 struct mlx5e_channel *c = sq->channel;
1288
1289 clear_bit(MLX5E_SQ_STATE_ENABLED, &sq->state);
1290 /* prevent netif_tx_wake_queue */
1291 napi_synchronize(&c->napi);
1292
1293 netif_tx_disable_queue(sq->txq);
1294
1295 /* last doorbell out, godspeed .. */
1296 if (mlx5e_wqc_has_room_for(&sq->wq, sq->cc, sq->pc, 1)) {
1297 struct mlx5e_tx_wqe *nop;
1298
1299 sq->db.skb[(sq->pc & sq->wq.sz_m1)] = NULL;
1300 nop = mlx5e_post_nop(&sq->wq, sq->sqn, &sq->pc);
1301 mlx5e_notify_hw(&sq->wq, sq->pc, sq->uar_map, &nop->ctrl);
1302 }
1303 }
1304
1305 static void mlx5e_close_txqsq(struct mlx5e_txqsq *sq)
1306 {
1307 struct mlx5e_channel *c = sq->channel;
1308 struct mlx5_core_dev *mdev = c->mdev;
1309
1310 mlx5e_destroy_sq(mdev, sq->sqn);
1311 if (sq->rate_limit)
1312 mlx5_rl_remove_rate(mdev, sq->rate_limit);
1313 mlx5e_free_txqsq_descs(sq);
1314 mlx5e_free_txqsq(sq);
1315 }
1316
1317 static int mlx5e_open_icosq(struct mlx5e_channel *c,
1318 struct mlx5e_params *params,
1319 struct mlx5e_sq_param *param,
1320 struct mlx5e_icosq *sq)
1321 {
1322 struct mlx5e_create_sq_param csp = {};
1323 int err;
1324
1325 err = mlx5e_alloc_icosq(c, param, sq);
1326 if (err)
1327 return err;
1328
1329 csp.cqn = sq->cq.mcq.cqn;
1330 csp.wq_ctrl = &sq->wq_ctrl;
1331 csp.min_inline_mode = params->tx_min_inline_mode;
1332 set_bit(MLX5E_SQ_STATE_ENABLED, &sq->state);
1333 err = mlx5e_create_sq_rdy(c->mdev, param, &csp, &sq->sqn);
1334 if (err)
1335 goto err_free_icosq;
1336
1337 return 0;
1338
1339 err_free_icosq:
1340 clear_bit(MLX5E_SQ_STATE_ENABLED, &sq->state);
1341 mlx5e_free_icosq(sq);
1342
1343 return err;
1344 }
1345
1346 static void mlx5e_close_icosq(struct mlx5e_icosq *sq)
1347 {
1348 struct mlx5e_channel *c = sq->channel;
1349
1350 clear_bit(MLX5E_SQ_STATE_ENABLED, &sq->state);
1351 napi_synchronize(&c->napi);
1352
1353 mlx5e_destroy_sq(c->mdev, sq->sqn);
1354 mlx5e_free_icosq(sq);
1355 }
1356
1357 static int mlx5e_open_xdpsq(struct mlx5e_channel *c,
1358 struct mlx5e_params *params,
1359 struct mlx5e_sq_param *param,
1360 struct mlx5e_xdpsq *sq)
1361 {
1362 unsigned int ds_cnt = MLX5E_XDP_TX_DS_COUNT;
1363 struct mlx5e_create_sq_param csp = {};
1364 unsigned int inline_hdr_sz = 0;
1365 int err;
1366 int i;
1367
1368 err = mlx5e_alloc_xdpsq(c, params, param, sq);
1369 if (err)
1370 return err;
1371
1372 csp.tis_lst_sz = 1;
1373 csp.tisn = c->priv->tisn[0]; /* tc = 0 */
1374 csp.cqn = sq->cq.mcq.cqn;
1375 csp.wq_ctrl = &sq->wq_ctrl;
1376 csp.min_inline_mode = sq->min_inline_mode;
1377 set_bit(MLX5E_SQ_STATE_ENABLED, &sq->state);
1378 err = mlx5e_create_sq_rdy(c->mdev, param, &csp, &sq->sqn);
1379 if (err)
1380 goto err_free_xdpsq;
1381
1382 if (sq->min_inline_mode != MLX5_INLINE_MODE_NONE) {
1383 inline_hdr_sz = MLX5E_XDP_MIN_INLINE;
1384 ds_cnt++;
1385 }
1386
1387 /* Pre initialize fixed WQE fields */
1388 for (i = 0; i < mlx5_wq_cyc_get_size(&sq->wq); i++) {
1389 struct mlx5e_tx_wqe *wqe = mlx5_wq_cyc_get_wqe(&sq->wq, i);
1390 struct mlx5_wqe_ctrl_seg *cseg = &wqe->ctrl;
1391 struct mlx5_wqe_eth_seg *eseg = &wqe->eth;
1392 struct mlx5_wqe_data_seg *dseg;
1393
1394 cseg->qpn_ds = cpu_to_be32((sq->sqn << 8) | ds_cnt);
1395 eseg->inline_hdr.sz = cpu_to_be16(inline_hdr_sz);
1396
1397 dseg = (struct mlx5_wqe_data_seg *)cseg + (ds_cnt - 1);
1398 dseg->lkey = sq->mkey_be;
1399 }
1400
1401 return 0;
1402
1403 err_free_xdpsq:
1404 clear_bit(MLX5E_SQ_STATE_ENABLED, &sq->state);
1405 mlx5e_free_xdpsq(sq);
1406
1407 return err;
1408 }
1409
1410 static void mlx5e_close_xdpsq(struct mlx5e_xdpsq *sq)
1411 {
1412 struct mlx5e_channel *c = sq->channel;
1413
1414 clear_bit(MLX5E_SQ_STATE_ENABLED, &sq->state);
1415 napi_synchronize(&c->napi);
1416
1417 mlx5e_destroy_sq(c->mdev, sq->sqn);
1418 mlx5e_free_xdpsq_descs(sq);
1419 mlx5e_free_xdpsq(sq);
1420 }
1421
1422 static int mlx5e_alloc_cq(struct mlx5e_channel *c,
1423 struct mlx5e_cq_param *param,
1424 struct mlx5e_cq *cq)
1425 {
1426 struct mlx5_core_dev *mdev = c->mdev;
1427 struct mlx5_core_cq *mcq = &cq->mcq;
1428 int eqn_not_used;
1429 unsigned int irqn;
1430 int err;
1431 u32 i;
1432
1433 param->wq.buf_numa_node = cpu_to_node(c->cpu);
1434 param->wq.db_numa_node = cpu_to_node(c->cpu);
1435 param->eq_ix = c->ix;
1436
1437 err = mlx5_cqwq_create(mdev, &param->wq, param->cqc, &cq->wq,
1438 &cq->wq_ctrl);
1439 if (err)
1440 return err;
1441
1442 mlx5_vector2eqn(mdev, param->eq_ix, &eqn_not_used, &irqn);
1443
1444 cq->napi = &c->napi;
1445
1446 mcq->cqe_sz = 64;
1447 mcq->set_ci_db = cq->wq_ctrl.db.db;
1448 mcq->arm_db = cq->wq_ctrl.db.db + 1;
1449 *mcq->set_ci_db = 0;
1450 *mcq->arm_db = 0;
1451 mcq->vector = param->eq_ix;
1452 mcq->comp = mlx5e_completion_event;
1453 mcq->event = mlx5e_cq_error_event;
1454 mcq->irqn = irqn;
1455
1456 for (i = 0; i < mlx5_cqwq_get_size(&cq->wq); i++) {
1457 struct mlx5_cqe64 *cqe = mlx5_cqwq_get_wqe(&cq->wq, i);
1458
1459 cqe->op_own = 0xf1;
1460 }
1461
1462 cq->channel = c;
1463 cq->mdev = mdev;
1464
1465 return 0;
1466 }
1467
1468 static void mlx5e_free_cq(struct mlx5e_cq *cq)
1469 {
1470 mlx5_cqwq_destroy(&cq->wq_ctrl);
1471 }
1472
1473 static int mlx5e_create_cq(struct mlx5e_cq *cq, struct mlx5e_cq_param *param)
1474 {
1475 struct mlx5_core_dev *mdev = cq->mdev;
1476 struct mlx5_core_cq *mcq = &cq->mcq;
1477
1478 void *in;
1479 void *cqc;
1480 int inlen;
1481 unsigned int irqn_not_used;
1482 int eqn;
1483 int err;
1484
1485 inlen = MLX5_ST_SZ_BYTES(create_cq_in) +
1486 sizeof(u64) * cq->wq_ctrl.frag_buf.npages;
1487 in = mlx5_vzalloc(inlen);
1488 if (!in)
1489 return -ENOMEM;
1490
1491 cqc = MLX5_ADDR_OF(create_cq_in, in, cq_context);
1492
1493 memcpy(cqc, param->cqc, sizeof(param->cqc));
1494
1495 mlx5_fill_page_frag_array(&cq->wq_ctrl.frag_buf,
1496 (__be64 *)MLX5_ADDR_OF(create_cq_in, in, pas));
1497
1498 mlx5_vector2eqn(mdev, param->eq_ix, &eqn, &irqn_not_used);
1499
1500 MLX5_SET(cqc, cqc, cq_period_mode, param->cq_period_mode);
1501 MLX5_SET(cqc, cqc, c_eqn, eqn);
1502 MLX5_SET(cqc, cqc, uar_page, mdev->priv.uar->index);
1503 MLX5_SET(cqc, cqc, log_page_size, cq->wq_ctrl.frag_buf.page_shift -
1504 MLX5_ADAPTER_PAGE_SHIFT);
1505 MLX5_SET64(cqc, cqc, dbr_addr, cq->wq_ctrl.db.dma);
1506
1507 err = mlx5_core_create_cq(mdev, mcq, in, inlen);
1508
1509 kvfree(in);
1510
1511 if (err)
1512 return err;
1513
1514 mlx5e_cq_arm(cq);
1515
1516 return 0;
1517 }
1518
1519 static void mlx5e_destroy_cq(struct mlx5e_cq *cq)
1520 {
1521 mlx5_core_destroy_cq(cq->mdev, &cq->mcq);
1522 }
1523
1524 static int mlx5e_open_cq(struct mlx5e_channel *c,
1525 struct mlx5e_cq_moder moder,
1526 struct mlx5e_cq_param *param,
1527 struct mlx5e_cq *cq)
1528 {
1529 struct mlx5_core_dev *mdev = c->mdev;
1530 int err;
1531
1532 err = mlx5e_alloc_cq(c, param, cq);
1533 if (err)
1534 return err;
1535
1536 err = mlx5e_create_cq(cq, param);
1537 if (err)
1538 goto err_free_cq;
1539
1540 if (MLX5_CAP_GEN(mdev, cq_moderation))
1541 mlx5_core_modify_cq_moderation(mdev, &cq->mcq, moder.usec, moder.pkts);
1542 return 0;
1543
1544 err_free_cq:
1545 mlx5e_free_cq(cq);
1546
1547 return err;
1548 }
1549
/* Reverse of mlx5e_open_cq(): destroy the firmware CQ, then free its WQ. */
static void mlx5e_close_cq(struct mlx5e_cq *cq)
{
	mlx5e_destroy_cq(cq);
	mlx5e_free_cq(cq);
}
1555
1556 static int mlx5e_get_cpu(struct mlx5e_priv *priv, int ix)
1557 {
1558 return cpumask_first(priv->mdev->priv.irq_info[ix].mask);
1559 }
1560
1561 static int mlx5e_open_tx_cqs(struct mlx5e_channel *c,
1562 struct mlx5e_params *params,
1563 struct mlx5e_channel_param *cparam)
1564 {
1565 int err;
1566 int tc;
1567
1568 for (tc = 0; tc < c->num_tc; tc++) {
1569 err = mlx5e_open_cq(c, params->tx_cq_moderation,
1570 &cparam->tx_cq, &c->sq[tc].cq);
1571 if (err)
1572 goto err_close_tx_cqs;
1573 }
1574
1575 return 0;
1576
1577 err_close_tx_cqs:
1578 for (tc--; tc >= 0; tc--)
1579 mlx5e_close_cq(&c->sq[tc].cq);
1580
1581 return err;
1582 }
1583
1584 static void mlx5e_close_tx_cqs(struct mlx5e_channel *c)
1585 {
1586 int tc;
1587
1588 for (tc = 0; tc < c->num_tc; tc++)
1589 mlx5e_close_cq(&c->sq[tc].cq);
1590 }
1591
1592 static int mlx5e_open_sqs(struct mlx5e_channel *c,
1593 struct mlx5e_params *params,
1594 struct mlx5e_channel_param *cparam)
1595 {
1596 int err;
1597 int tc;
1598
1599 for (tc = 0; tc < params->num_tc; tc++) {
1600 int txq_ix = c->ix + tc * params->num_channels;
1601
1602 err = mlx5e_open_txqsq(c, c->priv->tisn[tc], txq_ix,
1603 params, &cparam->sq, &c->sq[tc]);
1604 if (err)
1605 goto err_close_sqs;
1606 }
1607
1608 return 0;
1609
1610 err_close_sqs:
1611 for (tc--; tc >= 0; tc--)
1612 mlx5e_close_txqsq(&c->sq[tc]);
1613
1614 return err;
1615 }
1616
1617 static void mlx5e_close_sqs(struct mlx5e_channel *c)
1618 {
1619 int tc;
1620
1621 for (tc = 0; tc < c->num_tc; tc++)
1622 mlx5e_close_txqsq(&c->sq[tc]);
1623 }
1624
1625 static int mlx5e_set_sq_maxrate(struct net_device *dev,
1626 struct mlx5e_txqsq *sq, u32 rate)
1627 {
1628 struct mlx5e_priv *priv = netdev_priv(dev);
1629 struct mlx5_core_dev *mdev = priv->mdev;
1630 struct mlx5e_modify_sq_param msp = {0};
1631 u16 rl_index = 0;
1632 int err;
1633
1634 if (rate == sq->rate_limit)
1635 /* nothing to do */
1636 return 0;
1637
1638 if (sq->rate_limit)
1639 /* remove current rl index to free space to next ones */
1640 mlx5_rl_remove_rate(mdev, sq->rate_limit);
1641
1642 sq->rate_limit = 0;
1643
1644 if (rate) {
1645 err = mlx5_rl_add_rate(mdev, rate, &rl_index);
1646 if (err) {
1647 netdev_err(dev, "Failed configuring rate %u: %d\n",
1648 rate, err);
1649 return err;
1650 }
1651 }
1652
1653 msp.curr_state = MLX5_SQC_STATE_RDY;
1654 msp.next_state = MLX5_SQC_STATE_RDY;
1655 msp.rl_index = rl_index;
1656 msp.rl_update = true;
1657 err = mlx5e_modify_sq(mdev, sq->sqn, &msp);
1658 if (err) {
1659 netdev_err(dev, "Failed configuring rate %u: %d\n",
1660 rate, err);
1661 /* remove the rate from the table */
1662 if (rate)
1663 mlx5_rl_remove_rate(mdev, rate);
1664 return err;
1665 }
1666
1667 sq->rate_limit = rate;
1668 return 0;
1669 }
1670
1671 static int mlx5e_set_tx_maxrate(struct net_device *dev, int index, u32 rate)
1672 {
1673 struct mlx5e_priv *priv = netdev_priv(dev);
1674 struct mlx5_core_dev *mdev = priv->mdev;
1675 struct mlx5e_txqsq *sq = priv->txq2sq[index];
1676 int err = 0;
1677
1678 if (!mlx5_rl_is_supported(mdev)) {
1679 netdev_err(dev, "Rate limiting is not supported on this device\n");
1680 return -EINVAL;
1681 }
1682
1683 /* rate is given in Mb/sec, HW config is in Kb/sec */
1684 rate = rate << 10;
1685
1686 /* Check whether rate in valid range, 0 is always valid */
1687 if (rate && !mlx5_rl_is_in_range(mdev, rate)) {
1688 netdev_err(dev, "TX rate %u, is not in range\n", rate);
1689 return -ERANGE;
1690 }
1691
1692 mutex_lock(&priv->state_lock);
1693 if (test_bit(MLX5E_STATE_OPENED, &priv->state))
1694 err = mlx5e_set_sq_maxrate(dev, sq, rate);
1695 if (!err)
1696 priv->tx_rates[index] = rate;
1697 mutex_unlock(&priv->state_lock);
1698
1699 return err;
1700 }
1701
1702 static inline int mlx5e_get_max_num_channels(struct mlx5_core_dev *mdev)
1703 {
1704 return is_kdump_kernel() ?
1705 MLX5E_MIN_NUM_CHANNELS :
1706 min_t(int, mdev->priv.eq_table.num_comp_vectors,
1707 MLX5E_MAX_NUM_CHANNELS);
1708 }
1709
1710 static int mlx5e_open_channel(struct mlx5e_priv *priv, int ix,
1711 struct mlx5e_params *params,
1712 struct mlx5e_channel_param *cparam,
1713 struct mlx5e_channel **cp)
1714 {
1715 struct mlx5e_cq_moder icocq_moder = {0, 0};
1716 struct net_device *netdev = priv->netdev;
1717 int cpu = mlx5e_get_cpu(priv, ix);
1718 struct mlx5e_channel *c;
1719 int err;
1720
1721 c = kzalloc_node(sizeof(*c), GFP_KERNEL, cpu_to_node(cpu));
1722 if (!c)
1723 return -ENOMEM;
1724
1725 c->priv = priv;
1726 c->mdev = priv->mdev;
1727 c->tstamp = &priv->tstamp;
1728 c->ix = ix;
1729 c->cpu = cpu;
1730 c->pdev = &priv->mdev->pdev->dev;
1731 c->netdev = priv->netdev;
1732 c->mkey_be = cpu_to_be32(priv->mdev->mlx5e_res.mkey.key);
1733 c->num_tc = params->num_tc;
1734 c->xdp = !!params->xdp_prog;
1735
1736 netif_napi_add(netdev, &c->napi, mlx5e_napi_poll, 64);
1737
1738 err = mlx5e_open_cq(c, icocq_moder, &cparam->icosq_cq, &c->icosq.cq);
1739 if (err)
1740 goto err_napi_del;
1741
1742 err = mlx5e_open_tx_cqs(c, params, cparam);
1743 if (err)
1744 goto err_close_icosq_cq;
1745
1746 err = mlx5e_open_cq(c, params->rx_cq_moderation, &cparam->rx_cq, &c->rq.cq);
1747 if (err)
1748 goto err_close_tx_cqs;
1749
1750 /* XDP SQ CQ params are same as normal TXQ sq CQ params */
1751 err = c->xdp ? mlx5e_open_cq(c, params->tx_cq_moderation,
1752 &cparam->tx_cq, &c->rq.xdpsq.cq) : 0;
1753 if (err)
1754 goto err_close_rx_cq;
1755
1756 napi_enable(&c->napi);
1757
1758 err = mlx5e_open_icosq(c, params, &cparam->icosq, &c->icosq);
1759 if (err)
1760 goto err_disable_napi;
1761
1762 err = mlx5e_open_sqs(c, params, cparam);
1763 if (err)
1764 goto err_close_icosq;
1765
1766 err = c->xdp ? mlx5e_open_xdpsq(c, params, &cparam->xdp_sq, &c->rq.xdpsq) : 0;
1767 if (err)
1768 goto err_close_sqs;
1769
1770 err = mlx5e_open_rq(c, params, &cparam->rq, &c->rq);
1771 if (err)
1772 goto err_close_xdp_sq;
1773
1774 *cp = c;
1775
1776 return 0;
1777 err_close_xdp_sq:
1778 if (c->xdp)
1779 mlx5e_close_xdpsq(&c->rq.xdpsq);
1780
1781 err_close_sqs:
1782 mlx5e_close_sqs(c);
1783
1784 err_close_icosq:
1785 mlx5e_close_icosq(&c->icosq);
1786
1787 err_disable_napi:
1788 napi_disable(&c->napi);
1789 if (c->xdp)
1790 mlx5e_close_cq(&c->rq.xdpsq.cq);
1791
1792 err_close_rx_cq:
1793 mlx5e_close_cq(&c->rq.cq);
1794
1795 err_close_tx_cqs:
1796 mlx5e_close_tx_cqs(c);
1797
1798 err_close_icosq_cq:
1799 mlx5e_close_cq(&c->icosq.cq);
1800
1801 err_napi_del:
1802 netif_napi_del(&c->napi);
1803 kfree(c);
1804
1805 return err;
1806 }
1807
1808 static void mlx5e_activate_channel(struct mlx5e_channel *c)
1809 {
1810 int tc;
1811
1812 for (tc = 0; tc < c->num_tc; tc++)
1813 mlx5e_activate_txqsq(&c->sq[tc]);
1814 mlx5e_activate_rq(&c->rq);
1815 netif_set_xps_queue(c->netdev, get_cpu_mask(c->cpu), c->ix);
1816 }
1817
1818 static void mlx5e_deactivate_channel(struct mlx5e_channel *c)
1819 {
1820 int tc;
1821
1822 mlx5e_deactivate_rq(&c->rq);
1823 for (tc = 0; tc < c->num_tc; tc++)
1824 mlx5e_deactivate_txqsq(&c->sq[tc]);
1825 }
1826
1827 static void mlx5e_close_channel(struct mlx5e_channel *c)
1828 {
1829 mlx5e_close_rq(&c->rq);
1830 if (c->xdp)
1831 mlx5e_close_xdpsq(&c->rq.xdpsq);
1832 mlx5e_close_sqs(c);
1833 mlx5e_close_icosq(&c->icosq);
1834 napi_disable(&c->napi);
1835 if (c->xdp)
1836 mlx5e_close_cq(&c->rq.xdpsq.cq);
1837 mlx5e_close_cq(&c->rq.cq);
1838 mlx5e_close_tx_cqs(c);
1839 mlx5e_close_cq(&c->icosq.cq);
1840 netif_napi_del(&c->napi);
1841
1842 kfree(c);
1843 }
1844
1845 static void mlx5e_build_rq_param(struct mlx5e_priv *priv,
1846 struct mlx5e_params *params,
1847 struct mlx5e_rq_param *param)
1848 {
1849 void *rqc = param->rqc;
1850 void *wq = MLX5_ADDR_OF(rqc, rqc, wq);
1851
1852 switch (params->rq_wq_type) {
1853 case MLX5_WQ_TYPE_LINKED_LIST_STRIDING_RQ:
1854 MLX5_SET(wq, wq, log_wqe_num_of_strides, params->mpwqe_log_num_strides - 9);
1855 MLX5_SET(wq, wq, log_wqe_stride_size, params->mpwqe_log_stride_sz - 6);
1856 MLX5_SET(wq, wq, wq_type, MLX5_WQ_TYPE_LINKED_LIST_STRIDING_RQ);
1857 break;
1858 default: /* MLX5_WQ_TYPE_LINKED_LIST */
1859 MLX5_SET(wq, wq, wq_type, MLX5_WQ_TYPE_LINKED_LIST);
1860 }
1861
1862 MLX5_SET(wq, wq, end_padding_mode, MLX5_WQ_END_PAD_MODE_ALIGN);
1863 MLX5_SET(wq, wq, log_wq_stride, ilog2(sizeof(struct mlx5e_rx_wqe)));
1864 MLX5_SET(wq, wq, log_wq_sz, params->log_rq_size);
1865 MLX5_SET(wq, wq, pd, priv->mdev->mlx5e_res.pdn);
1866 MLX5_SET(rqc, rqc, counter_set_id, priv->q_counter);
1867 MLX5_SET(rqc, rqc, vsd, params->vlan_strip_disable);
1868 MLX5_SET(rqc, rqc, scatter_fcs, params->scatter_fcs_en);
1869
1870 param->wq.buf_numa_node = dev_to_node(&priv->mdev->pdev->dev);
1871 param->wq.linear = 1;
1872 }
1873
1874 static void mlx5e_build_drop_rq_param(struct mlx5e_rq_param *param)
1875 {
1876 void *rqc = param->rqc;
1877 void *wq = MLX5_ADDR_OF(rqc, rqc, wq);
1878
1879 MLX5_SET(wq, wq, wq_type, MLX5_WQ_TYPE_LINKED_LIST);
1880 MLX5_SET(wq, wq, log_wq_stride, ilog2(sizeof(struct mlx5e_rx_wqe)));
1881 }
1882
1883 static void mlx5e_build_sq_param_common(struct mlx5e_priv *priv,
1884 struct mlx5e_sq_param *param)
1885 {
1886 void *sqc = param->sqc;
1887 void *wq = MLX5_ADDR_OF(sqc, sqc, wq);
1888
1889 MLX5_SET(wq, wq, log_wq_stride, ilog2(MLX5_SEND_WQE_BB));
1890 MLX5_SET(wq, wq, pd, priv->mdev->mlx5e_res.pdn);
1891
1892 param->wq.buf_numa_node = dev_to_node(&priv->mdev->pdev->dev);
1893 }
1894
1895 static void mlx5e_build_sq_param(struct mlx5e_priv *priv,
1896 struct mlx5e_params *params,
1897 struct mlx5e_sq_param *param)
1898 {
1899 void *sqc = param->sqc;
1900 void *wq = MLX5_ADDR_OF(sqc, sqc, wq);
1901
1902 mlx5e_build_sq_param_common(priv, param);
1903 MLX5_SET(wq, wq, log_wq_sz, params->log_sq_size);
1904 }
1905
1906 static void mlx5e_build_common_cq_param(struct mlx5e_priv *priv,
1907 struct mlx5e_cq_param *param)
1908 {
1909 void *cqc = param->cqc;
1910
1911 MLX5_SET(cqc, cqc, uar_page, priv->mdev->priv.uar->index);
1912 }
1913
1914 static void mlx5e_build_rx_cq_param(struct mlx5e_priv *priv,
1915 struct mlx5e_params *params,
1916 struct mlx5e_cq_param *param)
1917 {
1918 void *cqc = param->cqc;
1919 u8 log_cq_size;
1920
1921 switch (params->rq_wq_type) {
1922 case MLX5_WQ_TYPE_LINKED_LIST_STRIDING_RQ:
1923 log_cq_size = params->log_rq_size + params->mpwqe_log_num_strides;
1924 break;
1925 default: /* MLX5_WQ_TYPE_LINKED_LIST */
1926 log_cq_size = params->log_rq_size;
1927 }
1928
1929 MLX5_SET(cqc, cqc, log_cq_size, log_cq_size);
1930 if (MLX5E_GET_PFLAG(params, MLX5E_PFLAG_RX_CQE_COMPRESS)) {
1931 MLX5_SET(cqc, cqc, mini_cqe_res_format, MLX5_CQE_FORMAT_CSUM);
1932 MLX5_SET(cqc, cqc, cqe_comp_en, 1);
1933 }
1934
1935 mlx5e_build_common_cq_param(priv, param);
1936
1937 if (params->rx_am_enabled)
1938 params->rx_cq_moderation =
1939 mlx5e_am_get_def_profile(params->rx_cq_period_mode);
1940 }
1941
1942 static void mlx5e_build_tx_cq_param(struct mlx5e_priv *priv,
1943 struct mlx5e_params *params,
1944 struct mlx5e_cq_param *param)
1945 {
1946 void *cqc = param->cqc;
1947
1948 MLX5_SET(cqc, cqc, log_cq_size, params->log_sq_size);
1949
1950 mlx5e_build_common_cq_param(priv, param);
1951
1952 param->cq_period_mode = MLX5_CQ_PERIOD_MODE_START_FROM_EQE;
1953 }
1954
1955 static void mlx5e_build_ico_cq_param(struct mlx5e_priv *priv,
1956 u8 log_wq_size,
1957 struct mlx5e_cq_param *param)
1958 {
1959 void *cqc = param->cqc;
1960
1961 MLX5_SET(cqc, cqc, log_cq_size, log_wq_size);
1962
1963 mlx5e_build_common_cq_param(priv, param);
1964
1965 param->cq_period_mode = MLX5_CQ_PERIOD_MODE_START_FROM_EQE;
1966 }
1967
1968 static void mlx5e_build_icosq_param(struct mlx5e_priv *priv,
1969 u8 log_wq_size,
1970 struct mlx5e_sq_param *param)
1971 {
1972 void *sqc = param->sqc;
1973 void *wq = MLX5_ADDR_OF(sqc, sqc, wq);
1974
1975 mlx5e_build_sq_param_common(priv, param);
1976
1977 MLX5_SET(wq, wq, log_wq_sz, log_wq_size);
1978 MLX5_SET(sqc, sqc, reg_umr, MLX5_CAP_ETH(priv->mdev, reg_umr_sq));
1979 }
1980
1981 static void mlx5e_build_xdpsq_param(struct mlx5e_priv *priv,
1982 struct mlx5e_params *params,
1983 struct mlx5e_sq_param *param)
1984 {
1985 void *sqc = param->sqc;
1986 void *wq = MLX5_ADDR_OF(sqc, sqc, wq);
1987
1988 mlx5e_build_sq_param_common(priv, param);
1989 MLX5_SET(wq, wq, log_wq_sz, params->log_sq_size);
1990 }
1991
1992 static void mlx5e_build_channel_param(struct mlx5e_priv *priv,
1993 struct mlx5e_params *params,
1994 struct mlx5e_channel_param *cparam)
1995 {
1996 u8 icosq_log_wq_sz = MLX5E_PARAMS_MINIMUM_LOG_SQ_SIZE;
1997
1998 mlx5e_build_rq_param(priv, params, &cparam->rq);
1999 mlx5e_build_sq_param(priv, params, &cparam->sq);
2000 mlx5e_build_xdpsq_param(priv, params, &cparam->xdp_sq);
2001 mlx5e_build_icosq_param(priv, icosq_log_wq_sz, &cparam->icosq);
2002 mlx5e_build_rx_cq_param(priv, params, &cparam->rx_cq);
2003 mlx5e_build_tx_cq_param(priv, params, &cparam->tx_cq);
2004 mlx5e_build_ico_cq_param(priv, icosq_log_wq_sz, &cparam->icosq_cq);
2005 }
2006
2007 int mlx5e_open_channels(struct mlx5e_priv *priv,
2008 struct mlx5e_channels *chs)
2009 {
2010 struct mlx5e_channel_param *cparam;
2011 int err = -ENOMEM;
2012 int i;
2013
2014 chs->num = chs->params.num_channels;
2015
2016 chs->c = kcalloc(chs->num, sizeof(struct mlx5e_channel *), GFP_KERNEL);
2017 cparam = kzalloc(sizeof(struct mlx5e_channel_param), GFP_KERNEL);
2018 if (!chs->c || !cparam)
2019 goto err_free;
2020
2021 mlx5e_build_channel_param(priv, &chs->params, cparam);
2022 for (i = 0; i < chs->num; i++) {
2023 err = mlx5e_open_channel(priv, i, &chs->params, cparam, &chs->c[i]);
2024 if (err)
2025 goto err_close_channels;
2026 }
2027
2028 kfree(cparam);
2029 return 0;
2030
2031 err_close_channels:
2032 for (i--; i >= 0; i--)
2033 mlx5e_close_channel(chs->c[i]);
2034
2035 err_free:
2036 kfree(chs->c);
2037 kfree(cparam);
2038 chs->num = 0;
2039 return err;
2040 }
2041
2042 static void mlx5e_activate_channels(struct mlx5e_channels *chs)
2043 {
2044 int i;
2045
2046 for (i = 0; i < chs->num; i++)
2047 mlx5e_activate_channel(chs->c[i]);
2048 }
2049
2050 static int mlx5e_wait_channels_min_rx_wqes(struct mlx5e_channels *chs)
2051 {
2052 int err = 0;
2053 int i;
2054
2055 for (i = 0; i < chs->num; i++) {
2056 err = mlx5e_wait_for_min_rx_wqes(&chs->c[i]->rq);
2057 if (err)
2058 break;
2059 }
2060
2061 return err;
2062 }
2063
2064 static void mlx5e_deactivate_channels(struct mlx5e_channels *chs)
2065 {
2066 int i;
2067
2068 for (i = 0; i < chs->num; i++)
2069 mlx5e_deactivate_channel(chs->c[i]);
2070 }
2071
2072 void mlx5e_close_channels(struct mlx5e_channels *chs)
2073 {
2074 int i;
2075
2076 for (i = 0; i < chs->num; i++)
2077 mlx5e_close_channel(chs->c[i]);
2078
2079 kfree(chs->c);
2080 chs->num = 0;
2081 }
2082
2083 static int
2084 mlx5e_create_rqt(struct mlx5e_priv *priv, int sz, struct mlx5e_rqt *rqt)
2085 {
2086 struct mlx5_core_dev *mdev = priv->mdev;
2087 void *rqtc;
2088 int inlen;
2089 int err;
2090 u32 *in;
2091 int i;
2092
2093 inlen = MLX5_ST_SZ_BYTES(create_rqt_in) + sizeof(u32) * sz;
2094 in = mlx5_vzalloc(inlen);
2095 if (!in)
2096 return -ENOMEM;
2097
2098 rqtc = MLX5_ADDR_OF(create_rqt_in, in, rqt_context);
2099
2100 MLX5_SET(rqtc, rqtc, rqt_actual_size, sz);
2101 MLX5_SET(rqtc, rqtc, rqt_max_size, sz);
2102
2103 for (i = 0; i < sz; i++)
2104 MLX5_SET(rqtc, rqtc, rq_num[i], priv->drop_rq.rqn);
2105
2106 err = mlx5_core_create_rqt(mdev, in, inlen, &rqt->rqtn);
2107 if (!err)
2108 rqt->enabled = true;
2109
2110 kvfree(in);
2111 return err;
2112 }
2113
2114 void mlx5e_destroy_rqt(struct mlx5e_priv *priv, struct mlx5e_rqt *rqt)
2115 {
2116 rqt->enabled = false;
2117 mlx5_core_destroy_rqt(priv->mdev, rqt->rqtn);
2118 }
2119
2120 static int mlx5e_create_indirect_rqts(struct mlx5e_priv *priv)
2121 {
2122 struct mlx5e_rqt *rqt = &priv->indir_rqt;
2123
2124 return mlx5e_create_rqt(priv, MLX5E_INDIR_RQT_SIZE, rqt);
2125 }
2126
2127 int mlx5e_create_direct_rqts(struct mlx5e_priv *priv)
2128 {
2129 struct mlx5e_rqt *rqt;
2130 int err;
2131 int ix;
2132
2133 for (ix = 0; ix < priv->profile->max_nch(priv->mdev); ix++) {
2134 rqt = &priv->direct_tir[ix].rqt;
2135 err = mlx5e_create_rqt(priv, 1 /*size */, rqt);
2136 if (err)
2137 goto err_destroy_rqts;
2138 }
2139
2140 return 0;
2141
2142 err_destroy_rqts:
2143 for (ix--; ix >= 0; ix--)
2144 mlx5e_destroy_rqt(priv, &priv->direct_tir[ix].rqt);
2145
2146 return err;
2147 }
2148
2149 static int mlx5e_rx_hash_fn(int hfunc)
2150 {
2151 return (hfunc == ETH_RSS_HASH_TOP) ?
2152 MLX5_RX_HASH_FN_TOEPLITZ :
2153 MLX5_RX_HASH_FN_INVERTED_XOR8;
2154 }
2155
/*
 * Reverse the order of the low @size bits of @a: bit (size - 1 - i) of the
 * input becomes bit i of the result. Higher input bits are ignored.
 */
static int mlx5e_bits_invert(unsigned long a, int size)
{
	int reversed = 0;
	int dst;

	for (dst = 0; dst < size; dst++) {
		int src = size - dst - 1;

		if (test_bit(src, &a))
			reversed |= 1 << dst;
	}

	return reversed;
}
2166
2167 static void mlx5e_fill_rqt_rqns(struct mlx5e_priv *priv, int sz,
2168 struct mlx5e_redirect_rqt_param rrp, void *rqtc)
2169 {
2170 int i;
2171
2172 for (i = 0; i < sz; i++) {
2173 u32 rqn;
2174
2175 if (rrp.is_rss) {
2176 int ix = i;
2177
2178 if (rrp.rss.hfunc == ETH_RSS_HASH_XOR)
2179 ix = mlx5e_bits_invert(i, ilog2(sz));
2180
2181 ix = priv->channels.params.indirection_rqt[ix];
2182 rqn = rrp.rss.channels->c[ix]->rq.rqn;
2183 } else {
2184 rqn = rrp.rqn;
2185 }
2186 MLX5_SET(rqtc, rqtc, rq_num[i], rqn);
2187 }
2188 }
2189
2190 int mlx5e_redirect_rqt(struct mlx5e_priv *priv, u32 rqtn, int sz,
2191 struct mlx5e_redirect_rqt_param rrp)
2192 {
2193 struct mlx5_core_dev *mdev = priv->mdev;
2194 void *rqtc;
2195 int inlen;
2196 u32 *in;
2197 int err;
2198
2199 inlen = MLX5_ST_SZ_BYTES(modify_rqt_in) + sizeof(u32) * sz;
2200 in = mlx5_vzalloc(inlen);
2201 if (!in)
2202 return -ENOMEM;
2203
2204 rqtc = MLX5_ADDR_OF(modify_rqt_in, in, ctx);
2205
2206 MLX5_SET(rqtc, rqtc, rqt_actual_size, sz);
2207 MLX5_SET(modify_rqt_in, in, bitmask.rqn_list, 1);
2208 mlx5e_fill_rqt_rqns(priv, sz, rrp, rqtc);
2209 err = mlx5_core_modify_rqt(mdev, rqtn, in, inlen);
2210
2211 kvfree(in);
2212 return err;
2213 }
2214
2215 static u32 mlx5e_get_direct_rqn(struct mlx5e_priv *priv, int ix,
2216 struct mlx5e_redirect_rqt_param rrp)
2217 {
2218 if (!rrp.is_rss)
2219 return rrp.rqn;
2220
2221 if (ix >= rrp.rss.channels->num)
2222 return priv->drop_rq.rqn;
2223
2224 return rrp.rss.channels->c[ix]->rq.rqn;
2225 }
2226
2227 static void mlx5e_redirect_rqts(struct mlx5e_priv *priv,
2228 struct mlx5e_redirect_rqt_param rrp)
2229 {
2230 u32 rqtn;
2231 int ix;
2232
2233 if (priv->indir_rqt.enabled) {
2234 /* RSS RQ table */
2235 rqtn = priv->indir_rqt.rqtn;
2236 mlx5e_redirect_rqt(priv, rqtn, MLX5E_INDIR_RQT_SIZE, rrp);
2237 }
2238
2239 for (ix = 0; ix < priv->profile->max_nch(priv->mdev); ix++) {
2240 struct mlx5e_redirect_rqt_param direct_rrp = {
2241 .is_rss = false,
2242 {
2243 .rqn = mlx5e_get_direct_rqn(priv, ix, rrp)
2244 },
2245 };
2246
2247 /* Direct RQ Tables */
2248 if (!priv->direct_tir[ix].rqt.enabled)
2249 continue;
2250
2251 rqtn = priv->direct_tir[ix].rqt.rqtn;
2252 mlx5e_redirect_rqt(priv, rqtn, 1, direct_rrp);
2253 }
2254 }
2255
2256 static void mlx5e_redirect_rqts_to_channels(struct mlx5e_priv *priv,
2257 struct mlx5e_channels *chs)
2258 {
2259 struct mlx5e_redirect_rqt_param rrp = {
2260 .is_rss = true,
2261 {
2262 .rss = {
2263 .channels = chs,
2264 .hfunc = chs->params.rss_hfunc,
2265 }
2266 },
2267 };
2268
2269 mlx5e_redirect_rqts(priv, rrp);
2270 }
2271
2272 static void mlx5e_redirect_rqts_to_drop(struct mlx5e_priv *priv)
2273 {
2274 struct mlx5e_redirect_rqt_param drop_rrp = {
2275 .is_rss = false,
2276 {
2277 .rqn = priv->drop_rq.rqn,
2278 },
2279 };
2280
2281 mlx5e_redirect_rqts(priv, drop_rrp);
2282 }
2283
2284 static void mlx5e_build_tir_ctx_lro(struct mlx5e_params *params, void *tirc)
2285 {
2286 if (!params->lro_en)
2287 return;
2288
2289 #define ROUGH_MAX_L2_L3_HDR_SZ 256
2290
2291 MLX5_SET(tirc, tirc, lro_enable_mask,
2292 MLX5_TIRC_LRO_ENABLE_MASK_IPV4_LRO |
2293 MLX5_TIRC_LRO_ENABLE_MASK_IPV6_LRO);
2294 MLX5_SET(tirc, tirc, lro_max_ip_payload_size,
2295 (params->lro_wqe_sz - ROUGH_MAX_L2_L3_HDR_SZ) >> 8);
2296 MLX5_SET(tirc, tirc, lro_timeout_period_usecs, params->lro_timeout);
2297 }
2298
2299 void mlx5e_build_indir_tir_ctx_hash(struct mlx5e_params *params,
2300 enum mlx5e_traffic_types tt,
2301 void *tirc)
2302 {
2303 void *hfso = MLX5_ADDR_OF(tirc, tirc, rx_hash_field_selector_outer);
2304
2305 #define MLX5_HASH_IP (MLX5_HASH_FIELD_SEL_SRC_IP |\
2306 MLX5_HASH_FIELD_SEL_DST_IP)
2307
2308 #define MLX5_HASH_IP_L4PORTS (MLX5_HASH_FIELD_SEL_SRC_IP |\
2309 MLX5_HASH_FIELD_SEL_DST_IP |\
2310 MLX5_HASH_FIELD_SEL_L4_SPORT |\
2311 MLX5_HASH_FIELD_SEL_L4_DPORT)
2312
2313 #define MLX5_HASH_IP_IPSEC_SPI (MLX5_HASH_FIELD_SEL_SRC_IP |\
2314 MLX5_HASH_FIELD_SEL_DST_IP |\
2315 MLX5_HASH_FIELD_SEL_IPSEC_SPI)
2316
2317 MLX5_SET(tirc, tirc, rx_hash_fn, mlx5e_rx_hash_fn(params->rss_hfunc));
2318 if (params->rss_hfunc == ETH_RSS_HASH_TOP) {
2319 void *rss_key = MLX5_ADDR_OF(tirc, tirc,
2320 rx_hash_toeplitz_key);
2321 size_t len = MLX5_FLD_SZ_BYTES(tirc,
2322 rx_hash_toeplitz_key);
2323
2324 MLX5_SET(tirc, tirc, rx_hash_symmetric, 1);
2325 memcpy(rss_key, params->toeplitz_hash_key, len);
2326 }
2327
2328 switch (tt) {
2329 case MLX5E_TT_IPV4_TCP:
2330 MLX5_SET(rx_hash_field_select, hfso, l3_prot_type,
2331 MLX5_L3_PROT_TYPE_IPV4);
2332 MLX5_SET(rx_hash_field_select, hfso, l4_prot_type,
2333 MLX5_L4_PROT_TYPE_TCP);
2334 MLX5_SET(rx_hash_field_select, hfso, selected_fields,
2335 MLX5_HASH_IP_L4PORTS);
2336 break;
2337
2338 case MLX5E_TT_IPV6_TCP:
2339 MLX5_SET(rx_hash_field_select, hfso, l3_prot_type,
2340 MLX5_L3_PROT_TYPE_IPV6);
2341 MLX5_SET(rx_hash_field_select, hfso, l4_prot_type,
2342 MLX5_L4_PROT_TYPE_TCP);
2343 MLX5_SET(rx_hash_field_select, hfso, selected_fields,
2344 MLX5_HASH_IP_L4PORTS);
2345 break;
2346
2347 case MLX5E_TT_IPV4_UDP:
2348 MLX5_SET(rx_hash_field_select, hfso, l3_prot_type,
2349 MLX5_L3_PROT_TYPE_IPV4);
2350 MLX5_SET(rx_hash_field_select, hfso, l4_prot_type,
2351 MLX5_L4_PROT_TYPE_UDP);
2352 MLX5_SET(rx_hash_field_select, hfso, selected_fields,
2353 MLX5_HASH_IP_L4PORTS);
2354 break;
2355
2356 case MLX5E_TT_IPV6_UDP:
2357 MLX5_SET(rx_hash_field_select, hfso, l3_prot_type,
2358 MLX5_L3_PROT_TYPE_IPV6);
2359 MLX5_SET(rx_hash_field_select, hfso, l4_prot_type,
2360 MLX5_L4_PROT_TYPE_UDP);
2361 MLX5_SET(rx_hash_field_select, hfso, selected_fields,
2362 MLX5_HASH_IP_L4PORTS);
2363 break;
2364
2365 case MLX5E_TT_IPV4_IPSEC_AH:
2366 MLX5_SET(rx_hash_field_select, hfso, l3_prot_type,
2367 MLX5_L3_PROT_TYPE_IPV4);
2368 MLX5_SET(rx_hash_field_select, hfso, selected_fields,
2369 MLX5_HASH_IP_IPSEC_SPI);
2370 break;
2371
2372 case MLX5E_TT_IPV6_IPSEC_AH:
2373 MLX5_SET(rx_hash_field_select, hfso, l3_prot_type,
2374 MLX5_L3_PROT_TYPE_IPV6);
2375 MLX5_SET(rx_hash_field_select, hfso, selected_fields,
2376 MLX5_HASH_IP_IPSEC_SPI);
2377 break;
2378
2379 case MLX5E_TT_IPV4_IPSEC_ESP:
2380 MLX5_SET(rx_hash_field_select, hfso, l3_prot_type,
2381 MLX5_L3_PROT_TYPE_IPV4);
2382 MLX5_SET(rx_hash_field_select, hfso, selected_fields,
2383 MLX5_HASH_IP_IPSEC_SPI);
2384 break;
2385
2386 case MLX5E_TT_IPV6_IPSEC_ESP:
2387 MLX5_SET(rx_hash_field_select, hfso, l3_prot_type,
2388 MLX5_L3_PROT_TYPE_IPV6);
2389 MLX5_SET(rx_hash_field_select, hfso, selected_fields,
2390 MLX5_HASH_IP_IPSEC_SPI);
2391 break;
2392
2393 case MLX5E_TT_IPV4:
2394 MLX5_SET(rx_hash_field_select, hfso, l3_prot_type,
2395 MLX5_L3_PROT_TYPE_IPV4);
2396 MLX5_SET(rx_hash_field_select, hfso, selected_fields,
2397 MLX5_HASH_IP);
2398 break;
2399
2400 case MLX5E_TT_IPV6:
2401 MLX5_SET(rx_hash_field_select, hfso, l3_prot_type,
2402 MLX5_L3_PROT_TYPE_IPV6);
2403 MLX5_SET(rx_hash_field_select, hfso, selected_fields,
2404 MLX5_HASH_IP);
2405 break;
2406 default:
2407 WARN_ONCE(true, "%s: bad traffic type!\n", __func__);
2408 }
2409 }
2410
2411 static int mlx5e_modify_tirs_lro(struct mlx5e_priv *priv)
2412 {
2413 struct mlx5_core_dev *mdev = priv->mdev;
2414
2415 void *in;
2416 void *tirc;
2417 int inlen;
2418 int err;
2419 int tt;
2420 int ix;
2421
2422 inlen = MLX5_ST_SZ_BYTES(modify_tir_in);
2423 in = mlx5_vzalloc(inlen);
2424 if (!in)
2425 return -ENOMEM;
2426
2427 MLX5_SET(modify_tir_in, in, bitmask.lro, 1);
2428 tirc = MLX5_ADDR_OF(modify_tir_in, in, ctx);
2429
2430 mlx5e_build_tir_ctx_lro(&priv->channels.params, tirc);
2431
2432 for (tt = 0; tt < MLX5E_NUM_INDIR_TIRS; tt++) {
2433 err = mlx5_core_modify_tir(mdev, priv->indir_tir[tt].tirn, in,
2434 inlen);
2435 if (err)
2436 goto free_in;
2437 }
2438
2439 for (ix = 0; ix < priv->profile->max_nch(priv->mdev); ix++) {
2440 err = mlx5_core_modify_tir(mdev, priv->direct_tir[ix].tirn,
2441 in, inlen);
2442 if (err)
2443 goto free_in;
2444 }
2445
2446 free_in:
2447 kvfree(in);
2448
2449 return err;
2450 }
2451
2452 static int mlx5e_set_mtu(struct mlx5e_priv *priv, u16 mtu)
2453 {
2454 struct mlx5_core_dev *mdev = priv->mdev;
2455 u16 hw_mtu = MLX5E_SW2HW_MTU(mtu);
2456 int err;
2457
2458 err = mlx5_set_port_mtu(mdev, hw_mtu, 1);
2459 if (err)
2460 return err;
2461
2462 /* Update vport context MTU */
2463 mlx5_modify_nic_vport_mtu(mdev, hw_mtu);
2464 return 0;
2465 }
2466
2467 static void mlx5e_query_mtu(struct mlx5e_priv *priv, u16 *mtu)
2468 {
2469 struct mlx5_core_dev *mdev = priv->mdev;
2470 u16 hw_mtu = 0;
2471 int err;
2472
2473 err = mlx5_query_nic_vport_mtu(mdev, &hw_mtu);
2474 if (err || !hw_mtu) /* fallback to port oper mtu */
2475 mlx5_query_port_oper_mtu(mdev, &hw_mtu, 1);
2476
2477 *mtu = MLX5E_HW2SW_MTU(hw_mtu);
2478 }
2479
2480 static int mlx5e_set_dev_port_mtu(struct mlx5e_priv *priv)
2481 {
2482 struct net_device *netdev = priv->netdev;
2483 u16 mtu;
2484 int err;
2485
2486 err = mlx5e_set_mtu(priv, netdev->mtu);
2487 if (err)
2488 return err;
2489
2490 mlx5e_query_mtu(priv, &mtu);
2491 if (mtu != netdev->mtu)
2492 netdev_warn(netdev, "%s: VPort MTU %d is different than netdev mtu %d\n",
2493 __func__, mtu, netdev->mtu);
2494
2495 netdev->mtu = mtu;
2496 return 0;
2497 }
2498
2499 static void mlx5e_netdev_set_tcs(struct net_device *netdev)
2500 {
2501 struct mlx5e_priv *priv = netdev_priv(netdev);
2502 int nch = priv->channels.params.num_channels;
2503 int ntc = priv->channels.params.num_tc;
2504 int tc;
2505
2506 netdev_reset_tc(netdev);
2507
2508 if (ntc == 1)
2509 return;
2510
2511 netdev_set_num_tc(netdev, ntc);
2512
2513 /* Map netdev TCs to offset 0
2514 * We have our own UP to TXQ mapping for QoS
2515 */
2516 for (tc = 0; tc < ntc; tc++)
2517 netdev_set_tc_queue(netdev, tc, nch, 0);
2518 }
2519
2520 static void mlx5e_build_channels_tx_maps(struct mlx5e_priv *priv)
2521 {
2522 struct mlx5e_channel *c;
2523 struct mlx5e_txqsq *sq;
2524 int i, tc;
2525
2526 for (i = 0; i < priv->channels.num; i++)
2527 for (tc = 0; tc < priv->profile->max_tc; tc++)
2528 priv->channel_tc2txq[i][tc] = i + tc * priv->channels.num;
2529
2530 for (i = 0; i < priv->channels.num; i++) {
2531 c = priv->channels.c[i];
2532 for (tc = 0; tc < c->num_tc; tc++) {
2533 sq = &c->sq[tc];
2534 priv->txq2sq[sq->txq_ix] = sq;
2535 }
2536 }
2537 }
2538
2539 static void mlx5e_activate_priv_channels(struct mlx5e_priv *priv)
2540 {
2541 int num_txqs = priv->channels.num * priv->channels.params.num_tc;
2542 struct net_device *netdev = priv->netdev;
2543
2544 mlx5e_netdev_set_tcs(netdev);
2545 netif_set_real_num_tx_queues(netdev, num_txqs);
2546 netif_set_real_num_rx_queues(netdev, priv->channels.num);
2547
2548 mlx5e_build_channels_tx_maps(priv);
2549 mlx5e_activate_channels(&priv->channels);
2550 netif_tx_start_all_queues(priv->netdev);
2551
2552 if (MLX5_CAP_GEN(priv->mdev, vport_group_manager))
2553 mlx5e_add_sqs_fwd_rules(priv);
2554
2555 mlx5e_wait_channels_min_rx_wqes(&priv->channels);
2556 mlx5e_redirect_rqts_to_channels(priv, &priv->channels);
2557 }
2558
2559 static void mlx5e_deactivate_priv_channels(struct mlx5e_priv *priv)
2560 {
2561 mlx5e_redirect_rqts_to_drop(priv);
2562
2563 if (MLX5_CAP_GEN(priv->mdev, vport_group_manager))
2564 mlx5e_remove_sqs_fwd_rules(priv);
2565
2566 /* FIXME: This is a W/A only for tx timeout watch dog false alarm when
2567 * polling for inactive tx queues.
2568 */
2569 netif_tx_stop_all_queues(priv->netdev);
2570 netif_tx_disable(priv->netdev);
2571 mlx5e_deactivate_channels(&priv->channels);
2572 }
2573
2574 void mlx5e_switch_priv_channels(struct mlx5e_priv *priv,
2575 struct mlx5e_channels *new_chs,
2576 mlx5e_fp_hw_modify hw_modify)
2577 {
2578 struct net_device *netdev = priv->netdev;
2579 int new_num_txqs;
2580
2581 new_num_txqs = new_chs->num * new_chs->params.num_tc;
2582
2583 netif_carrier_off(netdev);
2584
2585 if (new_num_txqs < netdev->real_num_tx_queues)
2586 netif_set_real_num_tx_queues(netdev, new_num_txqs);
2587
2588 mlx5e_deactivate_priv_channels(priv);
2589 mlx5e_close_channels(&priv->channels);
2590
2591 priv->channels = *new_chs;
2592
2593 /* New channels are ready to roll, modify HW settings if needed */
2594 if (hw_modify)
2595 hw_modify(priv);
2596
2597 mlx5e_refresh_tirs(priv, false);
2598 mlx5e_activate_priv_channels(priv);
2599
2600 mlx5e_update_carrier(priv);
2601 }
2602
2603 int mlx5e_open_locked(struct net_device *netdev)
2604 {
2605 struct mlx5e_priv *priv = netdev_priv(netdev);
2606 int err;
2607
2608 set_bit(MLX5E_STATE_OPENED, &priv->state);
2609
2610 err = mlx5e_open_channels(priv, &priv->channels);
2611 if (err)
2612 goto err_clear_state_opened_flag;
2613
2614 mlx5e_refresh_tirs(priv, false);
2615 mlx5e_activate_priv_channels(priv);
2616 mlx5e_update_carrier(priv);
2617 mlx5e_timestamp_init(priv);
2618
2619 if (priv->profile->update_stats)
2620 queue_delayed_work(priv->wq, &priv->update_stats_work, 0);
2621
2622 return 0;
2623
2624 err_clear_state_opened_flag:
2625 clear_bit(MLX5E_STATE_OPENED, &priv->state);
2626 return err;
2627 }
2628
2629 int mlx5e_open(struct net_device *netdev)
2630 {
2631 struct mlx5e_priv *priv = netdev_priv(netdev);
2632 int err;
2633
2634 mutex_lock(&priv->state_lock);
2635 err = mlx5e_open_locked(netdev);
2636 mutex_unlock(&priv->state_lock);
2637
2638 return err;
2639 }
2640
2641 int mlx5e_close_locked(struct net_device *netdev)
2642 {
2643 struct mlx5e_priv *priv = netdev_priv(netdev);
2644
2645 /* May already be CLOSED in case a previous configuration operation
2646 * (e.g RX/TX queue size change) that involves close&open failed.
2647 */
2648 if (!test_bit(MLX5E_STATE_OPENED, &priv->state))
2649 return 0;
2650
2651 clear_bit(MLX5E_STATE_OPENED, &priv->state);
2652
2653 mlx5e_timestamp_cleanup(priv);
2654 netif_carrier_off(priv->netdev);
2655 mlx5e_deactivate_priv_channels(priv);
2656 mlx5e_close_channels(&priv->channels);
2657
2658 return 0;
2659 }
2660
2661 int mlx5e_close(struct net_device *netdev)
2662 {
2663 struct mlx5e_priv *priv = netdev_priv(netdev);
2664 int err;
2665
2666 if (!netif_device_present(netdev))
2667 return -ENODEV;
2668
2669 mutex_lock(&priv->state_lock);
2670 err = mlx5e_close_locked(netdev);
2671 mutex_unlock(&priv->state_lock);
2672
2673 return err;
2674 }
2675
2676 static int mlx5e_alloc_drop_rq(struct mlx5_core_dev *mdev,
2677 struct mlx5e_rq *rq,
2678 struct mlx5e_rq_param *param)
2679 {
2680 void *rqc = param->rqc;
2681 void *rqc_wq = MLX5_ADDR_OF(rqc, rqc, wq);
2682 int err;
2683
2684 param->wq.db_numa_node = param->wq.buf_numa_node;
2685
2686 err = mlx5_wq_ll_create(mdev, &param->wq, rqc_wq, &rq->wq,
2687 &rq->wq_ctrl);
2688 if (err)
2689 return err;
2690
2691 rq->mdev = mdev;
2692
2693 return 0;
2694 }
2695
2696 static int mlx5e_alloc_drop_cq(struct mlx5_core_dev *mdev,
2697 struct mlx5e_cq *cq,
2698 struct mlx5e_cq_param *param)
2699 {
2700 struct mlx5_core_cq *mcq = &cq->mcq;
2701 int eqn_not_used;
2702 unsigned int irqn;
2703 int err;
2704
2705 err = mlx5_cqwq_create(mdev, &param->wq, param->cqc, &cq->wq,
2706 &cq->wq_ctrl);
2707 if (err)
2708 return err;
2709
2710 mlx5_vector2eqn(mdev, param->eq_ix, &eqn_not_used, &irqn);
2711
2712 mcq->cqe_sz = 64;
2713 mcq->set_ci_db = cq->wq_ctrl.db.db;
2714 mcq->arm_db = cq->wq_ctrl.db.db + 1;
2715 *mcq->set_ci_db = 0;
2716 *mcq->arm_db = 0;
2717 mcq->vector = param->eq_ix;
2718 mcq->comp = mlx5e_completion_event;
2719 mcq->event = mlx5e_cq_error_event;
2720 mcq->irqn = irqn;
2721
2722 cq->mdev = mdev;
2723
2724 return 0;
2725 }
2726
2727 static int mlx5e_open_drop_rq(struct mlx5_core_dev *mdev,
2728 struct mlx5e_rq *drop_rq)
2729 {
2730 struct mlx5e_cq_param cq_param = {};
2731 struct mlx5e_rq_param rq_param = {};
2732 struct mlx5e_cq *cq = &drop_rq->cq;
2733 int err;
2734
2735 mlx5e_build_drop_rq_param(&rq_param);
2736
2737 err = mlx5e_alloc_drop_cq(mdev, cq, &cq_param);
2738 if (err)
2739 return err;
2740
2741 err = mlx5e_create_cq(cq, &cq_param);
2742 if (err)
2743 goto err_free_cq;
2744
2745 err = mlx5e_alloc_drop_rq(mdev, drop_rq, &rq_param);
2746 if (err)
2747 goto err_destroy_cq;
2748
2749 err = mlx5e_create_rq(drop_rq, &rq_param);
2750 if (err)
2751 goto err_free_rq;
2752
2753 return 0;
2754
2755 err_free_rq:
2756 mlx5e_free_rq(drop_rq);
2757
2758 err_destroy_cq:
2759 mlx5e_destroy_cq(cq);
2760
2761 err_free_cq:
2762 mlx5e_free_cq(cq);
2763
2764 return err;
2765 }
2766
2767 static void mlx5e_close_drop_rq(struct mlx5e_rq *drop_rq)
2768 {
2769 mlx5e_destroy_rq(drop_rq);
2770 mlx5e_free_rq(drop_rq);
2771 mlx5e_destroy_cq(&drop_rq->cq);
2772 mlx5e_free_cq(&drop_rq->cq);
2773 }
2774
2775 static int mlx5e_create_tis(struct mlx5e_priv *priv, int tc)
2776 {
2777 struct mlx5_core_dev *mdev = priv->mdev;
2778 u32 in[MLX5_ST_SZ_DW(create_tis_in)] = {0};
2779 void *tisc = MLX5_ADDR_OF(create_tis_in, in, ctx);
2780
2781 MLX5_SET(tisc, tisc, prio, tc << 1);
2782 MLX5_SET(tisc, tisc, transport_domain, mdev->mlx5e_res.td.tdn);
2783
2784 if (mlx5_lag_is_lacp_owner(mdev))
2785 MLX5_SET(tisc, tisc, strict_lag_tx_port_affinity, 1);
2786
2787 return mlx5_core_create_tis(mdev, in, sizeof(in), &priv->tisn[tc]);
2788 }
2789
2790 static void mlx5e_destroy_tis(struct mlx5e_priv *priv, int tc)
2791 {
2792 mlx5_core_destroy_tis(priv->mdev, priv->tisn[tc]);
2793 }
2794
2795 int mlx5e_create_tises(struct mlx5e_priv *priv)
2796 {
2797 int err;
2798 int tc;
2799
2800 for (tc = 0; tc < priv->profile->max_tc; tc++) {
2801 err = mlx5e_create_tis(priv, tc);
2802 if (err)
2803 goto err_close_tises;
2804 }
2805
2806 return 0;
2807
2808 err_close_tises:
2809 for (tc--; tc >= 0; tc--)
2810 mlx5e_destroy_tis(priv, tc);
2811
2812 return err;
2813 }
2814
2815 void mlx5e_cleanup_nic_tx(struct mlx5e_priv *priv)
2816 {
2817 int tc;
2818
2819 for (tc = 0; tc < priv->profile->max_tc; tc++)
2820 mlx5e_destroy_tis(priv, tc);
2821 }
2822
2823 static void mlx5e_build_indir_tir_ctx(struct mlx5e_priv *priv,
2824 enum mlx5e_traffic_types tt,
2825 u32 *tirc)
2826 {
2827 MLX5_SET(tirc, tirc, transport_domain, priv->mdev->mlx5e_res.td.tdn);
2828
2829 mlx5e_build_tir_ctx_lro(&priv->channels.params, tirc);
2830
2831 MLX5_SET(tirc, tirc, disp_type, MLX5_TIRC_DISP_TYPE_INDIRECT);
2832 MLX5_SET(tirc, tirc, indirect_table, priv->indir_rqt.rqtn);
2833 mlx5e_build_indir_tir_ctx_hash(&priv->channels.params, tt, tirc);
2834 }
2835
2836 static void mlx5e_build_direct_tir_ctx(struct mlx5e_priv *priv, u32 rqtn, u32 *tirc)
2837 {
2838 MLX5_SET(tirc, tirc, transport_domain, priv->mdev->mlx5e_res.td.tdn);
2839
2840 mlx5e_build_tir_ctx_lro(&priv->channels.params, tirc);
2841
2842 MLX5_SET(tirc, tirc, disp_type, MLX5_TIRC_DISP_TYPE_INDIRECT);
2843 MLX5_SET(tirc, tirc, indirect_table, rqtn);
2844 MLX5_SET(tirc, tirc, rx_hash_fn, MLX5_RX_HASH_FN_INVERTED_XOR8);
2845 }
2846
2847 static int mlx5e_create_indirect_tirs(struct mlx5e_priv *priv)
2848 {
2849 struct mlx5e_tir *tir;
2850 void *tirc;
2851 int inlen;
2852 int err;
2853 u32 *in;
2854 int tt;
2855
2856 inlen = MLX5_ST_SZ_BYTES(create_tir_in);
2857 in = mlx5_vzalloc(inlen);
2858 if (!in)
2859 return -ENOMEM;
2860
2861 for (tt = 0; tt < MLX5E_NUM_INDIR_TIRS; tt++) {
2862 memset(in, 0, inlen);
2863 tir = &priv->indir_tir[tt];
2864 tirc = MLX5_ADDR_OF(create_tir_in, in, ctx);
2865 mlx5e_build_indir_tir_ctx(priv, tt, tirc);
2866 err = mlx5e_create_tir(priv->mdev, tir, in, inlen);
2867 if (err)
2868 goto err_destroy_tirs;
2869 }
2870
2871 kvfree(in);
2872
2873 return 0;
2874
2875 err_destroy_tirs:
2876 for (tt--; tt >= 0; tt--)
2877 mlx5e_destroy_tir(priv->mdev, &priv->indir_tir[tt]);
2878
2879 kvfree(in);
2880
2881 return err;
2882 }
2883
2884 int mlx5e_create_direct_tirs(struct mlx5e_priv *priv)
2885 {
2886 int nch = priv->profile->max_nch(priv->mdev);
2887 struct mlx5e_tir *tir;
2888 void *tirc;
2889 int inlen;
2890 int err;
2891 u32 *in;
2892 int ix;
2893
2894 inlen = MLX5_ST_SZ_BYTES(create_tir_in);
2895 in = mlx5_vzalloc(inlen);
2896 if (!in)
2897 return -ENOMEM;
2898
2899 for (ix = 0; ix < nch; ix++) {
2900 memset(in, 0, inlen);
2901 tir = &priv->direct_tir[ix];
2902 tirc = MLX5_ADDR_OF(create_tir_in, in, ctx);
2903 mlx5e_build_direct_tir_ctx(priv, priv->direct_tir[ix].rqt.rqtn, tirc);
2904 err = mlx5e_create_tir(priv->mdev, tir, in, inlen);
2905 if (err)
2906 goto err_destroy_ch_tirs;
2907 }
2908
2909 kvfree(in);
2910
2911 return 0;
2912
2913 err_destroy_ch_tirs:
2914 for (ix--; ix >= 0; ix--)
2915 mlx5e_destroy_tir(priv->mdev, &priv->direct_tir[ix]);
2916
2917 kvfree(in);
2918
2919 return err;
2920 }
2921
2922 static void mlx5e_destroy_indirect_tirs(struct mlx5e_priv *priv)
2923 {
2924 int i;
2925
2926 for (i = 0; i < MLX5E_NUM_INDIR_TIRS; i++)
2927 mlx5e_destroy_tir(priv->mdev, &priv->indir_tir[i]);
2928 }
2929
2930 void mlx5e_destroy_direct_tirs(struct mlx5e_priv *priv)
2931 {
2932 int nch = priv->profile->max_nch(priv->mdev);
2933 int i;
2934
2935 for (i = 0; i < nch; i++)
2936 mlx5e_destroy_tir(priv->mdev, &priv->direct_tir[i]);
2937 }
2938
2939 static int mlx5e_modify_channels_scatter_fcs(struct mlx5e_channels *chs, bool enable)
2940 {
2941 int err = 0;
2942 int i;
2943
2944 for (i = 0; i < chs->num; i++) {
2945 err = mlx5e_modify_rq_scatter_fcs(&chs->c[i]->rq, enable);
2946 if (err)
2947 return err;
2948 }
2949
2950 return 0;
2951 }
2952
2953 int mlx5e_modify_channels_vsd(struct mlx5e_channels *chs, bool vsd)
2954 {
2955 int err = 0;
2956 int i;
2957
2958 for (i = 0; i < chs->num; i++) {
2959 err = mlx5e_modify_rq_vsd(&chs->c[i]->rq, vsd);
2960 if (err)
2961 return err;
2962 }
2963
2964 return 0;
2965 }
2966
2967 static int mlx5e_setup_tc(struct net_device *netdev, u8 tc)
2968 {
2969 struct mlx5e_priv *priv = netdev_priv(netdev);
2970 struct mlx5e_channels new_channels = {};
2971 int err = 0;
2972
2973 if (tc && tc != MLX5E_MAX_NUM_TC)
2974 return -EINVAL;
2975
2976 mutex_lock(&priv->state_lock);
2977
2978 new_channels.params = priv->channels.params;
2979 new_channels.params.num_tc = tc ? tc : 1;
2980
2981 if (test_bit(MLX5E_STATE_OPENED, &priv->state)) {
2982 priv->channels.params = new_channels.params;
2983 goto out;
2984 }
2985
2986 err = mlx5e_open_channels(priv, &new_channels);
2987 if (err)
2988 goto out;
2989
2990 mlx5e_switch_priv_channels(priv, &new_channels, NULL);
2991 out:
2992 mutex_unlock(&priv->state_lock);
2993 return err;
2994 }
2995
2996 static int mlx5e_ndo_setup_tc(struct net_device *dev, u32 handle,
2997 __be16 proto, struct tc_to_netdev *tc)
2998 {
2999 struct mlx5e_priv *priv = netdev_priv(dev);
3000
3001 if (TC_H_MAJ(handle) != TC_H_MAJ(TC_H_INGRESS))
3002 goto mqprio;
3003
3004 switch (tc->type) {
3005 case TC_SETUP_CLSFLOWER:
3006 switch (tc->cls_flower->command) {
3007 case TC_CLSFLOWER_REPLACE:
3008 return mlx5e_configure_flower(priv, proto, tc->cls_flower);
3009 case TC_CLSFLOWER_DESTROY:
3010 return mlx5e_delete_flower(priv, tc->cls_flower);
3011 case TC_CLSFLOWER_STATS:
3012 return mlx5e_stats_flower(priv, tc->cls_flower);
3013 }
3014 default:
3015 return -EOPNOTSUPP;
3016 }
3017
3018 mqprio:
3019 if (tc->type != TC_SETUP_MQPRIO)
3020 return -EINVAL;
3021
3022 tc->mqprio->hw = TC_MQPRIO_HW_OFFLOAD_TCS;
3023
3024 return mlx5e_setup_tc(dev, tc->mqprio->num_tc);
3025 }
3026
3027 static void
3028 mlx5e_get_stats(struct net_device *dev, struct rtnl_link_stats64 *stats)
3029 {
3030 struct mlx5e_priv *priv = netdev_priv(dev);
3031 struct mlx5e_sw_stats *sstats = &priv->stats.sw;
3032 struct mlx5e_vport_stats *vstats = &priv->stats.vport;
3033 struct mlx5e_pport_stats *pstats = &priv->stats.pport;
3034
3035 if (mlx5e_is_uplink_rep(priv)) {
3036 stats->rx_packets = PPORT_802_3_GET(pstats, a_frames_received_ok);
3037 stats->rx_bytes = PPORT_802_3_GET(pstats, a_octets_received_ok);
3038 stats->tx_packets = PPORT_802_3_GET(pstats, a_frames_transmitted_ok);
3039 stats->tx_bytes = PPORT_802_3_GET(pstats, a_octets_transmitted_ok);
3040 } else {
3041 stats->rx_packets = sstats->rx_packets;
3042 stats->rx_bytes = sstats->rx_bytes;
3043 stats->tx_packets = sstats->tx_packets;
3044 stats->tx_bytes = sstats->tx_bytes;
3045 stats->tx_dropped = sstats->tx_queue_dropped;
3046 }
3047
3048 stats->rx_dropped = priv->stats.qcnt.rx_out_of_buffer;
3049
3050 stats->rx_length_errors =
3051 PPORT_802_3_GET(pstats, a_in_range_length_errors) +
3052 PPORT_802_3_GET(pstats, a_out_of_range_length_field) +
3053 PPORT_802_3_GET(pstats, a_frame_too_long_errors);
3054 stats->rx_crc_errors =
3055 PPORT_802_3_GET(pstats, a_frame_check_sequence_errors);
3056 stats->rx_frame_errors = PPORT_802_3_GET(pstats, a_alignment_errors);
3057 stats->tx_aborted_errors = PPORT_2863_GET(pstats, if_out_discards);
3058 stats->tx_carrier_errors =
3059 PPORT_802_3_GET(pstats, a_symbol_error_during_carrier);
3060 stats->rx_errors = stats->rx_length_errors + stats->rx_crc_errors +
3061 stats->rx_frame_errors;
3062 stats->tx_errors = stats->tx_aborted_errors + stats->tx_carrier_errors;
3063
3064 /* vport multicast also counts packets that are dropped due to steering
3065 * or rx out of buffer
3066 */
3067 stats->multicast =
3068 VPORT_COUNTER_GET(vstats, received_eth_multicast.packets);
3069
3070 }
3071
3072 static void mlx5e_set_rx_mode(struct net_device *dev)
3073 {
3074 struct mlx5e_priv *priv = netdev_priv(dev);
3075
3076 queue_work(priv->wq, &priv->set_rx_mode_work);
3077 }
3078
3079 static int mlx5e_set_mac(struct net_device *netdev, void *addr)
3080 {
3081 struct mlx5e_priv *priv = netdev_priv(netdev);
3082 struct sockaddr *saddr = addr;
3083
3084 if (!is_valid_ether_addr(saddr->sa_data))
3085 return -EADDRNOTAVAIL;
3086
3087 netif_addr_lock_bh(netdev);
3088 ether_addr_copy(netdev->dev_addr, saddr->sa_data);
3089 netif_addr_unlock_bh(netdev);
3090
3091 queue_work(priv->wq, &priv->set_rx_mode_work);
3092
3093 return 0;
3094 }
3095
/* Set (@enable true) or clear (@enable false) the bits of @feature in
 * @netdev->features.
 *
 * All arguments are parenthesized so that a compound mask such as
 * (A | B) is set or cleared as a whole; without the parentheses "~feature"
 * would complement only the first operand of the mask expression.
 */
#define MLX5E_SET_FEATURE(netdev, feature, enable)	\
	do {						\
		if (enable)				\
			(netdev)->features |= (feature);	\
		else					\
			(netdev)->features &= ~(feature);	\
	} while (0)

/* Per-feature callback used by mlx5e_handle_feature(): apply the new
 * @enable state for one feature on @netdev; returns 0 or an error code.
 */
typedef int (*mlx5e_feature_handler)(struct net_device *netdev, bool enable);
3105
3106 static int set_feature_lro(struct net_device *netdev, bool enable)
3107 {
3108 struct mlx5e_priv *priv = netdev_priv(netdev);
3109 struct mlx5e_channels new_channels = {};
3110 int err = 0;
3111 bool reset;
3112
3113 mutex_lock(&priv->state_lock);
3114
3115 reset = (priv->channels.params.rq_wq_type == MLX5_WQ_TYPE_LINKED_LIST);
3116 reset = reset && test_bit(MLX5E_STATE_OPENED, &priv->state);
3117
3118 new_channels.params = priv->channels.params;
3119 new_channels.params.lro_en = enable;
3120
3121 if (!reset) {
3122 priv->channels.params = new_channels.params;
3123 err = mlx5e_modify_tirs_lro(priv);
3124 goto out;
3125 }
3126
3127 err = mlx5e_open_channels(priv, &new_channels);
3128 if (err)
3129 goto out;
3130
3131 mlx5e_switch_priv_channels(priv, &new_channels, mlx5e_modify_tirs_lro);
3132 out:
3133 mutex_unlock(&priv->state_lock);
3134 return err;
3135 }
3136
3137 static int set_feature_vlan_filter(struct net_device *netdev, bool enable)
3138 {
3139 struct mlx5e_priv *priv = netdev_priv(netdev);
3140
3141 if (enable)
3142 mlx5e_enable_vlan_filter(priv);
3143 else
3144 mlx5e_disable_vlan_filter(priv);
3145
3146 return 0;
3147 }
3148
3149 static int set_feature_tc_num_filters(struct net_device *netdev, bool enable)
3150 {
3151 struct mlx5e_priv *priv = netdev_priv(netdev);
3152
3153 if (!enable && mlx5e_tc_num_filters(priv)) {
3154 netdev_err(netdev,
3155 "Active offloaded tc filters, can't turn hw_tc_offload off\n");
3156 return -EINVAL;
3157 }
3158
3159 return 0;
3160 }
3161
3162 static int set_feature_rx_all(struct net_device *netdev, bool enable)
3163 {
3164 struct mlx5e_priv *priv = netdev_priv(netdev);
3165 struct mlx5_core_dev *mdev = priv->mdev;
3166
3167 return mlx5_set_port_fcs(mdev, !enable);
3168 }
3169
3170 static int set_feature_rx_fcs(struct net_device *netdev, bool enable)
3171 {
3172 struct mlx5e_priv *priv = netdev_priv(netdev);
3173 int err;
3174
3175 mutex_lock(&priv->state_lock);
3176
3177 priv->channels.params.scatter_fcs_en = enable;
3178 err = mlx5e_modify_channels_scatter_fcs(&priv->channels, enable);
3179 if (err)
3180 priv->channels.params.scatter_fcs_en = !enable;
3181
3182 mutex_unlock(&priv->state_lock);
3183
3184 return err;
3185 }
3186
3187 static int set_feature_rx_vlan(struct net_device *netdev, bool enable)
3188 {
3189 struct mlx5e_priv *priv = netdev_priv(netdev);
3190 int err = 0;
3191
3192 mutex_lock(&priv->state_lock);
3193
3194 priv->channels.params.vlan_strip_disable = !enable;
3195 if (!test_bit(MLX5E_STATE_OPENED, &priv->state))
3196 goto unlock;
3197
3198 err = mlx5e_modify_channels_vsd(&priv->channels, !enable);
3199 if (err)
3200 priv->channels.params.vlan_strip_disable = enable;
3201
3202 unlock:
3203 mutex_unlock(&priv->state_lock);
3204
3205 return err;
3206 }
3207
#ifdef CONFIG_RFS_ACCEL
/* Feature handler for NETIF_F_NTUPLE: enables or disables aRFS and
 * returns the result of the corresponding mlx5e_arfs_*() call.
 */
static int set_feature_arfs(struct net_device *netdev, bool enable)
{
	struct mlx5e_priv *priv = netdev_priv(netdev);

	return enable ? mlx5e_arfs_enable(priv) : mlx5e_arfs_disable(priv);
}
#endif
3222
3223 static int mlx5e_handle_feature(struct net_device *netdev,
3224 netdev_features_t wanted_features,
3225 netdev_features_t feature,
3226 mlx5e_feature_handler feature_handler)
3227 {
3228 netdev_features_t changes = wanted_features ^ netdev->features;
3229 bool enable = !!(wanted_features & feature);
3230 int err;
3231
3232 if (!(changes & feature))
3233 return 0;
3234
3235 err = feature_handler(netdev, enable);
3236 if (err) {
3237 netdev_err(netdev, "%s feature 0x%llx failed err %d\n",
3238 enable ? "Enable" : "Disable", feature, err);
3239 return err;
3240 }
3241
3242 MLX5E_SET_FEATURE(netdev, feature, enable);
3243 return 0;
3244 }
3245
3246 static int mlx5e_set_features(struct net_device *netdev,
3247 netdev_features_t features)
3248 {
3249 int err;
3250
3251 err = mlx5e_handle_feature(netdev, features, NETIF_F_LRO,
3252 set_feature_lro);
3253 err |= mlx5e_handle_feature(netdev, features,
3254 NETIF_F_HW_VLAN_CTAG_FILTER,
3255 set_feature_vlan_filter);
3256 err |= mlx5e_handle_feature(netdev, features, NETIF_F_HW_TC,
3257 set_feature_tc_num_filters);
3258 err |= mlx5e_handle_feature(netdev, features, NETIF_F_RXALL,
3259 set_feature_rx_all);
3260 err |= mlx5e_handle_feature(netdev, features, NETIF_F_RXFCS,
3261 set_feature_rx_fcs);
3262 err |= mlx5e_handle_feature(netdev, features, NETIF_F_HW_VLAN_CTAG_RX,
3263 set_feature_rx_vlan);
3264 #ifdef CONFIG_RFS_ACCEL
3265 err |= mlx5e_handle_feature(netdev, features, NETIF_F_NTUPLE,
3266 set_feature_arfs);
3267 #endif
3268
3269 return err ? -EINVAL : 0;
3270 }
3271
3272 static int mlx5e_change_mtu(struct net_device *netdev, int new_mtu)
3273 {
3274 struct mlx5e_priv *priv = netdev_priv(netdev);
3275 struct mlx5e_channels new_channels = {};
3276 int curr_mtu;
3277 int err = 0;
3278 bool reset;
3279
3280 mutex_lock(&priv->state_lock);
3281
3282 reset = !priv->channels.params.lro_en &&
3283 (priv->channels.params.rq_wq_type !=
3284 MLX5_WQ_TYPE_LINKED_LIST_STRIDING_RQ);
3285
3286 reset = reset && test_bit(MLX5E_STATE_OPENED, &priv->state);
3287
3288 curr_mtu = netdev->mtu;
3289 netdev->mtu = new_mtu;
3290
3291 if (!reset) {
3292 mlx5e_set_dev_port_mtu(priv);
3293 goto out;
3294 }
3295
3296 new_channels.params = priv->channels.params;
3297 err = mlx5e_open_channels(priv, &new_channels);
3298 if (err) {
3299 netdev->mtu = curr_mtu;
3300 goto out;
3301 }
3302
3303 mlx5e_switch_priv_channels(priv, &new_channels, mlx5e_set_dev_port_mtu);
3304
3305 out:
3306 mutex_unlock(&priv->state_lock);
3307 return err;
3308 }
3309
3310 static int mlx5e_ioctl(struct net_device *dev, struct ifreq *ifr, int cmd)
3311 {
3312 switch (cmd) {
3313 case SIOCSHWTSTAMP:
3314 return mlx5e_hwstamp_set(dev, ifr);
3315 case SIOCGHWTSTAMP:
3316 return mlx5e_hwstamp_get(dev, ifr);
3317 default:
3318 return -EOPNOTSUPP;
3319 }
3320 }
3321
3322 static int mlx5e_set_vf_mac(struct net_device *dev, int vf, u8 *mac)
3323 {
3324 struct mlx5e_priv *priv = netdev_priv(dev);
3325 struct mlx5_core_dev *mdev = priv->mdev;
3326
3327 return mlx5_eswitch_set_vport_mac(mdev->priv.eswitch, vf + 1, mac);
3328 }
3329
3330 static int mlx5e_set_vf_vlan(struct net_device *dev, int vf, u16 vlan, u8 qos,
3331 __be16 vlan_proto)
3332 {
3333 struct mlx5e_priv *priv = netdev_priv(dev);
3334 struct mlx5_core_dev *mdev = priv->mdev;
3335
3336 if (vlan_proto != htons(ETH_P_8021Q))
3337 return -EPROTONOSUPPORT;
3338
3339 return mlx5_eswitch_set_vport_vlan(mdev->priv.eswitch, vf + 1,
3340 vlan, qos);
3341 }
3342
3343 static int mlx5e_set_vf_spoofchk(struct net_device *dev, int vf, bool setting)
3344 {
3345 struct mlx5e_priv *priv = netdev_priv(dev);
3346 struct mlx5_core_dev *mdev = priv->mdev;
3347
3348 return mlx5_eswitch_set_vport_spoofchk(mdev->priv.eswitch, vf + 1, setting);
3349 }
3350
3351 static int mlx5e_set_vf_trust(struct net_device *dev, int vf, bool setting)
3352 {
3353 struct mlx5e_priv *priv = netdev_priv(dev);
3354 struct mlx5_core_dev *mdev = priv->mdev;
3355
3356 return mlx5_eswitch_set_vport_trust(mdev->priv.eswitch, vf + 1, setting);
3357 }
3358
3359 static int mlx5e_set_vf_rate(struct net_device *dev, int vf, int min_tx_rate,
3360 int max_tx_rate)
3361 {
3362 struct mlx5e_priv *priv = netdev_priv(dev);
3363 struct mlx5_core_dev *mdev = priv->mdev;
3364
3365 return mlx5_eswitch_set_vport_rate(mdev->priv.eswitch, vf + 1,
3366 max_tx_rate, min_tx_rate);
3367 }
3368
3369 static int mlx5_vport_link2ifla(u8 esw_link)
3370 {
3371 switch (esw_link) {
3372 case MLX5_ESW_VPORT_ADMIN_STATE_DOWN:
3373 return IFLA_VF_LINK_STATE_DISABLE;
3374 case MLX5_ESW_VPORT_ADMIN_STATE_UP:
3375 return IFLA_VF_LINK_STATE_ENABLE;
3376 }
3377 return IFLA_VF_LINK_STATE_AUTO;
3378 }
3379
3380 static int mlx5_ifla_link2vport(u8 ifla_link)
3381 {
3382 switch (ifla_link) {
3383 case IFLA_VF_LINK_STATE_DISABLE:
3384 return MLX5_ESW_VPORT_ADMIN_STATE_DOWN;
3385 case IFLA_VF_LINK_STATE_ENABLE:
3386 return MLX5_ESW_VPORT_ADMIN_STATE_UP;
3387 }
3388 return MLX5_ESW_VPORT_ADMIN_STATE_AUTO;
3389 }
3390
3391 static int mlx5e_set_vf_link_state(struct net_device *dev, int vf,
3392 int link_state)
3393 {
3394 struct mlx5e_priv *priv = netdev_priv(dev);
3395 struct mlx5_core_dev *mdev = priv->mdev;
3396
3397 return mlx5_eswitch_set_vport_state(mdev->priv.eswitch, vf + 1,
3398 mlx5_ifla_link2vport(link_state));
3399 }
3400
3401 static int mlx5e_get_vf_config(struct net_device *dev,
3402 int vf, struct ifla_vf_info *ivi)
3403 {
3404 struct mlx5e_priv *priv = netdev_priv(dev);
3405 struct mlx5_core_dev *mdev = priv->mdev;
3406 int err;
3407
3408 err = mlx5_eswitch_get_vport_config(mdev->priv.eswitch, vf + 1, ivi);
3409 if (err)
3410 return err;
3411 ivi->linkstate = mlx5_vport_link2ifla(ivi->linkstate);
3412 return 0;
3413 }
3414
3415 static int mlx5e_get_vf_stats(struct net_device *dev,
3416 int vf, struct ifla_vf_stats *vf_stats)
3417 {
3418 struct mlx5e_priv *priv = netdev_priv(dev);
3419 struct mlx5_core_dev *mdev = priv->mdev;
3420
3421 return mlx5_eswitch_get_vport_stats(mdev->priv.eswitch, vf + 1,
3422 vf_stats);
3423 }
3424
3425 static void mlx5e_add_vxlan_port(struct net_device *netdev,
3426 struct udp_tunnel_info *ti)
3427 {
3428 struct mlx5e_priv *priv = netdev_priv(netdev);
3429
3430 if (ti->type != UDP_TUNNEL_TYPE_VXLAN)
3431 return;
3432
3433 if (!mlx5e_vxlan_allowed(priv->mdev))
3434 return;
3435
3436 mlx5e_vxlan_queue_work(priv, ti->sa_family, be16_to_cpu(ti->port), 1);
3437 }
3438
3439 static void mlx5e_del_vxlan_port(struct net_device *netdev,
3440 struct udp_tunnel_info *ti)
3441 {
3442 struct mlx5e_priv *priv = netdev_priv(netdev);
3443
3444 if (ti->type != UDP_TUNNEL_TYPE_VXLAN)
3445 return;
3446
3447 if (!mlx5e_vxlan_allowed(priv->mdev))
3448 return;
3449
3450 mlx5e_vxlan_queue_work(priv, ti->sa_family, be16_to_cpu(ti->port), 0);
3451 }
3452
3453 static netdev_features_t mlx5e_vxlan_features_check(struct mlx5e_priv *priv,
3454 struct sk_buff *skb,
3455 netdev_features_t features)
3456 {
3457 struct udphdr *udph;
3458 u16 proto;
3459 u16 port = 0;
3460
3461 switch (vlan_get_protocol(skb)) {
3462 case htons(ETH_P_IP):
3463 proto = ip_hdr(skb)->protocol;
3464 break;
3465 case htons(ETH_P_IPV6):
3466 proto = ipv6_hdr(skb)->nexthdr;
3467 break;
3468 default:
3469 goto out;
3470 }
3471
3472 if (proto == IPPROTO_UDP) {
3473 udph = udp_hdr(skb);
3474 port = be16_to_cpu(udph->dest);
3475 }
3476
3477 /* Verify if UDP port is being offloaded by HW */
3478 if (port && mlx5e_vxlan_lookup_port(priv, port))
3479 return features;
3480
3481 out:
3482 /* Disable CSUM and GSO if the udp dport is not offloaded by HW */
3483 return features & ~(NETIF_F_CSUM_MASK | NETIF_F_GSO_MASK);
3484 }
3485
3486 static netdev_features_t mlx5e_features_check(struct sk_buff *skb,
3487 struct net_device *netdev,
3488 netdev_features_t features)
3489 {
3490 struct mlx5e_priv *priv = netdev_priv(netdev);
3491
3492 features = vlan_features_check(skb, features);
3493 features = vxlan_features_check(skb, features);
3494
3495 /* Validate if the tunneled packet is being offloaded by HW */
3496 if (skb->encapsulation &&
3497 (features & NETIF_F_CSUM_MASK || features & NETIF_F_GSO_MASK))
3498 return mlx5e_vxlan_features_check(priv, skb, features);
3499
3500 return features;
3501 }
3502
3503 static void mlx5e_tx_timeout(struct net_device *dev)
3504 {
3505 struct mlx5e_priv *priv = netdev_priv(dev);
3506 bool sched_work = false;
3507 int i;
3508
3509 netdev_err(dev, "TX timeout detected\n");
3510
3511 for (i = 0; i < priv->channels.num * priv->channels.params.num_tc; i++) {
3512 struct mlx5e_txqsq *sq = priv->txq2sq[i];
3513
3514 if (!netif_xmit_stopped(netdev_get_tx_queue(dev, i)))
3515 continue;
3516 sched_work = true;
3517 clear_bit(MLX5E_SQ_STATE_ENABLED, &sq->state);
3518 netdev_err(dev, "TX timeout on queue: %d, SQ: 0x%x, CQ: 0x%x, SQ Cons: 0x%x SQ Prod: 0x%x\n",
3519 i, sq->sqn, sq->cq.mcq.cqn, sq->cc, sq->pc);
3520 }
3521
3522 if (sched_work && test_bit(MLX5E_STATE_OPENED, &priv->state))
3523 schedule_work(&priv->tx_timeout_work);
3524 }
3525
3526 static int mlx5e_xdp_set(struct net_device *netdev, struct bpf_prog *prog)
3527 {
3528 struct mlx5e_priv *priv = netdev_priv(netdev);
3529 struct bpf_prog *old_prog;
3530 int err = 0;
3531 bool reset, was_opened;
3532 int i;
3533
3534 mutex_lock(&priv->state_lock);
3535
3536 if ((netdev->features & NETIF_F_LRO) && prog) {
3537 netdev_warn(netdev, "can't set XDP while LRO is on, disable LRO first\n");
3538 err = -EINVAL;
3539 goto unlock;
3540 }
3541
3542 was_opened = test_bit(MLX5E_STATE_OPENED, &priv->state);
3543 /* no need for full reset when exchanging programs */
3544 reset = (!priv->channels.params.xdp_prog || !prog);
3545
3546 if (was_opened && reset)
3547 mlx5e_close_locked(netdev);
3548 if (was_opened && !reset) {
3549 /* num_channels is invariant here, so we can take the
3550 * batched reference right upfront.
3551 */
3552 prog = bpf_prog_add(prog, priv->channels.num);
3553 if (IS_ERR(prog)) {
3554 err = PTR_ERR(prog);
3555 goto unlock;
3556 }
3557 }
3558
3559 /* exchange programs, extra prog reference we got from caller
3560 * as long as we don't fail from this point onwards.
3561 */
3562 old_prog = xchg(&priv->channels.params.xdp_prog, prog);
3563 if (old_prog)
3564 bpf_prog_put(old_prog);
3565
3566 if (reset) /* change RQ type according to priv->xdp_prog */
3567 mlx5e_set_rq_params(priv->mdev, &priv->channels.params);
3568
3569 if (was_opened && reset)
3570 mlx5e_open_locked(netdev);
3571
3572 if (!test_bit(MLX5E_STATE_OPENED, &priv->state) || reset)
3573 goto unlock;
3574
3575 /* exchanging programs w/o reset, we update ref counts on behalf
3576 * of the channels RQs here.
3577 */
3578 for (i = 0; i < priv->channels.num; i++) {
3579 struct mlx5e_channel *c = priv->channels.c[i];
3580
3581 clear_bit(MLX5E_RQ_STATE_ENABLED, &c->rq.state);
3582 napi_synchronize(&c->napi);
3583 /* prevent mlx5e_poll_rx_cq from accessing rq->xdp_prog */
3584
3585 old_prog = xchg(&c->rq.xdp_prog, prog);
3586
3587 set_bit(MLX5E_RQ_STATE_ENABLED, &c->rq.state);
3588 /* napi_schedule in case we have missed anything */
3589 set_bit(MLX5E_CHANNEL_NAPI_SCHED, &c->flags);
3590 napi_schedule(&c->napi);
3591
3592 if (old_prog)
3593 bpf_prog_put(old_prog);
3594 }
3595
3596 unlock:
3597 mutex_unlock(&priv->state_lock);
3598 return err;
3599 }
3600
3601 static bool mlx5e_xdp_attached(struct net_device *dev)
3602 {
3603 struct mlx5e_priv *priv = netdev_priv(dev);
3604
3605 return !!priv->channels.params.xdp_prog;
3606 }
3607
3608 static int mlx5e_xdp(struct net_device *dev, struct netdev_xdp *xdp)
3609 {
3610 switch (xdp->command) {
3611 case XDP_SETUP_PROG:
3612 return mlx5e_xdp_set(dev, xdp->prog);
3613 case XDP_QUERY_PROG:
3614 xdp->prog_attached = mlx5e_xdp_attached(dev);
3615 return 0;
3616 default:
3617 return -EINVAL;
3618 }
3619 }
3620
3621 #ifdef CONFIG_NET_POLL_CONTROLLER
3622 /* Fake "interrupt" called by netpoll (eg netconsole) to send skbs without
3623 * reenabling interrupts.
3624 */
3625 static void mlx5e_netpoll(struct net_device *dev)
3626 {
3627 struct mlx5e_priv *priv = netdev_priv(dev);
3628 struct mlx5e_channels *chs = &priv->channels;
3629
3630 int i;
3631
3632 for (i = 0; i < chs->num; i++)
3633 napi_schedule(&chs->c[i]->napi);
3634 }
3635 #endif
3636
3637 static const struct net_device_ops mlx5e_netdev_ops_basic = {
3638 .ndo_open = mlx5e_open,
3639 .ndo_stop = mlx5e_close,
3640 .ndo_start_xmit = mlx5e_xmit,
3641 .ndo_setup_tc = mlx5e_ndo_setup_tc,
3642 .ndo_select_queue = mlx5e_select_queue,
3643 .ndo_get_stats64 = mlx5e_get_stats,
3644 .ndo_set_rx_mode = mlx5e_set_rx_mode,
3645 .ndo_set_mac_address = mlx5e_set_mac,
3646 .ndo_vlan_rx_add_vid = mlx5e_vlan_rx_add_vid,
3647 .ndo_vlan_rx_kill_vid = mlx5e_vlan_rx_kill_vid,
3648 .ndo_set_features = mlx5e_set_features,
3649 .ndo_change_mtu = mlx5e_change_mtu,
3650 .ndo_do_ioctl = mlx5e_ioctl,
3651 .ndo_set_tx_maxrate = mlx5e_set_tx_maxrate,
3652 #ifdef CONFIG_RFS_ACCEL
3653 .ndo_rx_flow_steer = mlx5e_rx_flow_steer,
3654 #endif
3655 .ndo_tx_timeout = mlx5e_tx_timeout,
3656 .ndo_xdp = mlx5e_xdp,
3657 #ifdef CONFIG_NET_POLL_CONTROLLER
3658 .ndo_poll_controller = mlx5e_netpoll,
3659 #endif
3660 };
3661
3662 static const struct net_device_ops mlx5e_netdev_ops_sriov = {
3663 .ndo_open = mlx5e_open,
3664 .ndo_stop = mlx5e_close,
3665 .ndo_start_xmit = mlx5e_xmit,
3666 .ndo_setup_tc = mlx5e_ndo_setup_tc,
3667 .ndo_select_queue = mlx5e_select_queue,
3668 .ndo_get_stats64 = mlx5e_get_stats,
3669 .ndo_set_rx_mode = mlx5e_set_rx_mode,
3670 .ndo_set_mac_address = mlx5e_set_mac,
3671 .ndo_vlan_rx_add_vid = mlx5e_vlan_rx_add_vid,
3672 .ndo_vlan_rx_kill_vid = mlx5e_vlan_rx_kill_vid,
3673 .ndo_set_features = mlx5e_set_features,
3674 .ndo_change_mtu = mlx5e_change_mtu,
3675 .ndo_do_ioctl = mlx5e_ioctl,
3676 .ndo_udp_tunnel_add = mlx5e_add_vxlan_port,
3677 .ndo_udp_tunnel_del = mlx5e_del_vxlan_port,
3678 .ndo_set_tx_maxrate = mlx5e_set_tx_maxrate,
3679 .ndo_features_check = mlx5e_features_check,
3680 #ifdef CONFIG_RFS_ACCEL
3681 .ndo_rx_flow_steer = mlx5e_rx_flow_steer,
3682 #endif
3683 .ndo_set_vf_mac = mlx5e_set_vf_mac,
3684 .ndo_set_vf_vlan = mlx5e_set_vf_vlan,
3685 .ndo_set_vf_spoofchk = mlx5e_set_vf_spoofchk,
3686 .ndo_set_vf_trust = mlx5e_set_vf_trust,
3687 .ndo_set_vf_rate = mlx5e_set_vf_rate,
3688 .ndo_get_vf_config = mlx5e_get_vf_config,
3689 .ndo_set_vf_link_state = mlx5e_set_vf_link_state,
3690 .ndo_get_vf_stats = mlx5e_get_vf_stats,
3691 .ndo_tx_timeout = mlx5e_tx_timeout,
3692 .ndo_xdp = mlx5e_xdp,
3693 #ifdef CONFIG_NET_POLL_CONTROLLER
3694 .ndo_poll_controller = mlx5e_netpoll,
3695 #endif
3696 .ndo_has_offload_stats = mlx5e_has_offload_stats,
3697 .ndo_get_offload_stats = mlx5e_get_offload_stats,
3698 };
3699
3700 static int mlx5e_check_required_hca_cap(struct mlx5_core_dev *mdev)
3701 {
3702 if (MLX5_CAP_GEN(mdev, port_type) != MLX5_CAP_PORT_TYPE_ETH)
3703 return -EOPNOTSUPP;
3704 if (!MLX5_CAP_GEN(mdev, eth_net_offloads) ||
3705 !MLX5_CAP_GEN(mdev, nic_flow_table) ||
3706 !MLX5_CAP_ETH(mdev, csum_cap) ||
3707 !MLX5_CAP_ETH(mdev, max_lso_cap) ||
3708 !MLX5_CAP_ETH(mdev, vlan_cap) ||
3709 !MLX5_CAP_ETH(mdev, rss_ind_tbl_cap) ||
3710 MLX5_CAP_FLOWTABLE(mdev,
3711 flow_table_properties_nic_receive.max_ft_level)
3712 < 3) {
3713 mlx5_core_warn(mdev,
3714 "Not creating net device, some required device capabilities are missing\n");
3715 return -EOPNOTSUPP;
3716 }
3717 if (!MLX5_CAP_ETH(mdev, self_lb_en_modifiable))
3718 mlx5_core_warn(mdev, "Self loop back prevention is not supported\n");
3719 if (!MLX5_CAP_GEN(mdev, cq_moderation))
3720 mlx5_core_warn(mdev, "CQ modiration is not supported\n");
3721
3722 return 0;
3723 }
3724
3725 u16 mlx5e_get_max_inline_cap(struct mlx5_core_dev *mdev)
3726 {
3727 int bf_buf_size = (1 << MLX5_CAP_GEN(mdev, log_bf_reg_size)) / 2;
3728
3729 return bf_buf_size -
3730 sizeof(struct mlx5e_tx_wqe) +
3731 2 /*sizeof(mlx5e_tx_wqe.inline_hdr_start)*/;
3732 }
3733
3734 void mlx5e_build_default_indir_rqt(struct mlx5_core_dev *mdev,
3735 u32 *indirection_rqt, int len,
3736 int num_channels)
3737 {
3738 int node = mdev->priv.numa_node;
3739 int node_num_of_cores;
3740 int i;
3741
3742 if (node == -1)
3743 node = first_online_node;
3744
3745 node_num_of_cores = cpumask_weight(cpumask_of_node(node));
3746
3747 if (node_num_of_cores)
3748 num_channels = min_t(int, num_channels, node_num_of_cores);
3749
3750 for (i = 0; i < len; i++)
3751 indirection_rqt[i] = i % num_channels;
3752 }
3753
3754 static int mlx5e_get_pci_bw(struct mlx5_core_dev *mdev, u32 *pci_bw)
3755 {
3756 enum pcie_link_width width;
3757 enum pci_bus_speed speed;
3758 int err = 0;
3759
3760 err = pcie_get_minimum_link(mdev->pdev, &speed, &width);
3761 if (err)
3762 return err;
3763
3764 if (speed == PCI_SPEED_UNKNOWN || width == PCIE_LNK_WIDTH_UNKNOWN)
3765 return -EINVAL;
3766
3767 switch (speed) {
3768 case PCIE_SPEED_2_5GT:
3769 *pci_bw = 2500 * width;
3770 break;
3771 case PCIE_SPEED_5_0GT:
3772 *pci_bw = 5000 * width;
3773 break;
3774 case PCIE_SPEED_8_0GT:
3775 *pci_bw = 8000 * width;
3776 break;
3777 default:
3778 return -EINVAL;
3779 }
3780
3781 return 0;
3782 }
3783
3784 static bool cqe_compress_heuristic(u32 link_speed, u32 pci_bw)
3785 {
3786 return (link_speed && pci_bw &&
3787 (pci_bw < 40000) && (pci_bw < link_speed));
3788 }
3789
3790 void mlx5e_set_rx_cq_mode_params(struct mlx5e_params *params, u8 cq_period_mode)
3791 {
3792 params->rx_cq_period_mode = cq_period_mode;
3793
3794 params->rx_cq_moderation.pkts =
3795 MLX5E_PARAMS_DEFAULT_RX_CQ_MODERATION_PKTS;
3796 params->rx_cq_moderation.usec =
3797 MLX5E_PARAMS_DEFAULT_RX_CQ_MODERATION_USEC;
3798
3799 if (cq_period_mode == MLX5_CQ_PERIOD_MODE_START_FROM_CQE)
3800 params->rx_cq_moderation.usec =
3801 MLX5E_PARAMS_DEFAULT_RX_CQ_MODERATION_USEC_FROM_CQE;
3802
3803 MLX5E_SET_PFLAG(params, MLX5E_PFLAG_RX_CQE_BASED_MODER,
3804 params->rx_cq_period_mode == MLX5_CQ_PERIOD_MODE_START_FROM_CQE);
3805 }
3806
3807 u32 mlx5e_choose_lro_timeout(struct mlx5_core_dev *mdev, u32 wanted_timeout)
3808 {
3809 int i;
3810
3811 /* The supported periods are organized in ascending order */
3812 for (i = 0; i < MLX5E_LRO_TIMEOUT_ARR_SIZE - 1; i++)
3813 if (MLX5_CAP_ETH(mdev, lro_timer_supported_periods[i]) >= wanted_timeout)
3814 break;
3815
3816 return MLX5_CAP_ETH(mdev, lro_timer_supported_periods[i]);
3817 }
3818
3819 static void mlx5e_build_nic_params(struct mlx5_core_dev *mdev,
3820 struct mlx5e_params *params,
3821 u16 max_channels)
3822 {
3823 u8 cq_period_mode = 0;
3824 u32 link_speed = 0;
3825 u32 pci_bw = 0;
3826
3827 params->num_channels = max_channels;
3828 params->num_tc = 1;
3829
3830 /* SQ */
3831 params->log_sq_size = is_kdump_kernel() ?
3832 MLX5E_PARAMS_MINIMUM_LOG_SQ_SIZE :
3833 MLX5E_PARAMS_DEFAULT_LOG_SQ_SIZE;
3834
3835 /* set CQE compression */
3836 params->rx_cqe_compress_def = false;
3837 if (MLX5_CAP_GEN(mdev, cqe_compression) &&
3838 MLX5_CAP_GEN(mdev, vport_group_manager)) {
3839 mlx5e_get_max_linkspeed(mdev, &link_speed);
3840 mlx5e_get_pci_bw(mdev, &pci_bw);
3841 mlx5_core_dbg(mdev, "Max link speed = %d, PCI BW = %d\n",
3842 link_speed, pci_bw);
3843 params->rx_cqe_compress_def = cqe_compress_heuristic(link_speed, pci_bw);
3844 }
3845 MLX5E_SET_PFLAG(params, MLX5E_PFLAG_RX_CQE_COMPRESS, params->rx_cqe_compress_def);
3846
3847 /* RQ */
3848 mlx5e_set_rq_params(mdev, params);
3849
3850 /* HW LRO */
3851 if (params->rq_wq_type == MLX5_WQ_TYPE_LINKED_LIST_STRIDING_RQ)
3852 params->lro_en = true;
3853 params->lro_timeout = mlx5e_choose_lro_timeout(mdev, MLX5E_DEFAULT_LRO_TIMEOUT);
3854
3855 /* CQ moderation params */
3856 cq_period_mode = MLX5_CAP_GEN(mdev, cq_period_start_from_cqe) ?
3857 MLX5_CQ_PERIOD_MODE_START_FROM_CQE :
3858 MLX5_CQ_PERIOD_MODE_START_FROM_EQE;
3859 params->rx_am_enabled = MLX5_CAP_GEN(mdev, cq_moderation);
3860 mlx5e_set_rx_cq_mode_params(params, cq_period_mode);
3861
3862 params->tx_cq_moderation.usec = MLX5E_PARAMS_DEFAULT_TX_CQ_MODERATION_USEC;
3863 params->tx_cq_moderation.pkts = MLX5E_PARAMS_DEFAULT_TX_CQ_MODERATION_PKTS;
3864
3865 /* TX inline */
3866 params->tx_max_inline = mlx5e_get_max_inline_cap(mdev);
3867 mlx5_query_min_inline(mdev, &params->tx_min_inline_mode);
3868 if (params->tx_min_inline_mode == MLX5_INLINE_MODE_NONE &&
3869 !MLX5_CAP_ETH(mdev, wqe_vlan_insert))
3870 params->tx_min_inline_mode = MLX5_INLINE_MODE_L2;
3871
3872 /* RSS */
3873 params->rss_hfunc = ETH_RSS_HASH_XOR;
3874 netdev_rss_key_fill(params->toeplitz_hash_key, sizeof(params->toeplitz_hash_key));
3875 mlx5e_build_default_indir_rqt(mdev, params->indirection_rqt,
3876 MLX5E_INDIR_RQT_SIZE, max_channels);
3877 }
3878
3879 static void mlx5e_build_nic_netdev_priv(struct mlx5_core_dev *mdev,
3880 struct net_device *netdev,
3881 const struct mlx5e_profile *profile,
3882 void *ppriv)
3883 {
3884 struct mlx5e_priv *priv = netdev_priv(netdev);
3885
3886 priv->mdev = mdev;
3887 priv->netdev = netdev;
3888 priv->profile = profile;
3889 priv->ppriv = ppriv;
3890
3891 mlx5e_build_nic_params(mdev, &priv->channels.params, profile->max_nch(mdev));
3892
3893 mutex_init(&priv->state_lock);
3894
3895 INIT_WORK(&priv->update_carrier_work, mlx5e_update_carrier_work);
3896 INIT_WORK(&priv->set_rx_mode_work, mlx5e_set_rx_mode_work);
3897 INIT_WORK(&priv->tx_timeout_work, mlx5e_tx_timeout_work);
3898 INIT_DELAYED_WORK(&priv->update_stats_work, mlx5e_update_stats_work);
3899 }
3900
3901 static void mlx5e_set_netdev_dev_addr(struct net_device *netdev)
3902 {
3903 struct mlx5e_priv *priv = netdev_priv(netdev);
3904
3905 mlx5_query_nic_vport_mac_address(priv->mdev, 0, netdev->dev_addr);
3906 if (is_zero_ether_addr(netdev->dev_addr) &&
3907 !MLX5_CAP_GEN(priv->mdev, vport_group_manager)) {
3908 eth_hw_addr_random(netdev);
3909 mlx5_core_info(priv->mdev, "Assigned random MAC address %pM\n", netdev->dev_addr);
3910 }
3911 }
3912
3913 static const struct switchdev_ops mlx5e_switchdev_ops = {
3914 .switchdev_port_attr_get = mlx5e_attr_get,
3915 };
3916
3917 static void mlx5e_build_nic_netdev(struct net_device *netdev)
3918 {
3919 struct mlx5e_priv *priv = netdev_priv(netdev);
3920 struct mlx5_core_dev *mdev = priv->mdev;
3921 bool fcs_supported;
3922 bool fcs_enabled;
3923
3924 SET_NETDEV_DEV(netdev, &mdev->pdev->dev);
3925
3926 if (MLX5_CAP_GEN(mdev, vport_group_manager)) {
3927 netdev->netdev_ops = &mlx5e_netdev_ops_sriov;
3928 #ifdef CONFIG_MLX5_CORE_EN_DCB
3929 if (MLX5_CAP_GEN(mdev, qos))
3930 netdev->dcbnl_ops = &mlx5e_dcbnl_ops;
3931 #endif
3932 } else {
3933 netdev->netdev_ops = &mlx5e_netdev_ops_basic;
3934 }
3935
3936 netdev->watchdog_timeo = 15 * HZ;
3937
3938 netdev->ethtool_ops = &mlx5e_ethtool_ops;
3939
3940 netdev->vlan_features |= NETIF_F_SG;
3941 netdev->vlan_features |= NETIF_F_IP_CSUM;
3942 netdev->vlan_features |= NETIF_F_IPV6_CSUM;
3943 netdev->vlan_features |= NETIF_F_GRO;
3944 netdev->vlan_features |= NETIF_F_TSO;
3945 netdev->vlan_features |= NETIF_F_TSO6;
3946 netdev->vlan_features |= NETIF_F_RXCSUM;
3947 netdev->vlan_features |= NETIF_F_RXHASH;
3948
3949 if (!!MLX5_CAP_ETH(mdev, lro_cap))
3950 netdev->vlan_features |= NETIF_F_LRO;
3951
3952 netdev->hw_features = netdev->vlan_features;
3953 netdev->hw_features |= NETIF_F_HW_VLAN_CTAG_TX;
3954 netdev->hw_features |= NETIF_F_HW_VLAN_CTAG_RX;
3955 netdev->hw_features |= NETIF_F_HW_VLAN_CTAG_FILTER;
3956
3957 if (mlx5e_vxlan_allowed(mdev)) {
3958 netdev->hw_features |= NETIF_F_GSO_UDP_TUNNEL |
3959 NETIF_F_GSO_UDP_TUNNEL_CSUM |
3960 NETIF_F_GSO_PARTIAL;
3961 netdev->hw_enc_features |= NETIF_F_IP_CSUM;
3962 netdev->hw_enc_features |= NETIF_F_IPV6_CSUM;
3963 netdev->hw_enc_features |= NETIF_F_TSO;
3964 netdev->hw_enc_features |= NETIF_F_TSO6;
3965 netdev->hw_enc_features |= NETIF_F_GSO_UDP_TUNNEL;
3966 netdev->hw_enc_features |= NETIF_F_GSO_UDP_TUNNEL_CSUM |
3967 NETIF_F_GSO_PARTIAL;
3968 netdev->gso_partial_features = NETIF_F_GSO_UDP_TUNNEL_CSUM;
3969 }
3970
3971 mlx5_query_port_fcs(mdev, &fcs_supported, &fcs_enabled);
3972
3973 if (fcs_supported)
3974 netdev->hw_features |= NETIF_F_RXALL;
3975
3976 if (MLX5_CAP_ETH(mdev, scatter_fcs))
3977 netdev->hw_features |= NETIF_F_RXFCS;
3978
3979 netdev->features = netdev->hw_features;
3980 if (!priv->channels.params.lro_en)
3981 netdev->features &= ~NETIF_F_LRO;
3982
3983 if (fcs_enabled)
3984 netdev->features &= ~NETIF_F_RXALL;
3985
3986 if (!priv->channels.params.scatter_fcs_en)
3987 netdev->features &= ~NETIF_F_RXFCS;
3988
3989 #define FT_CAP(f) MLX5_CAP_FLOWTABLE(mdev, flow_table_properties_nic_receive.f)
3990 if (FT_CAP(flow_modify_en) &&
3991 FT_CAP(modify_root) &&
3992 FT_CAP(identified_miss_table_mode) &&
3993 FT_CAP(flow_table_modify)) {
3994 netdev->hw_features |= NETIF_F_HW_TC;
3995 #ifdef CONFIG_RFS_ACCEL
3996 netdev->hw_features |= NETIF_F_NTUPLE;
3997 #endif
3998 }
3999
4000 netdev->features |= NETIF_F_HIGHDMA;
4001
4002 netdev->priv_flags |= IFF_UNICAST_FLT;
4003
4004 mlx5e_set_netdev_dev_addr(netdev);
4005
4006 #ifdef CONFIG_NET_SWITCHDEV
4007 if (MLX5_CAP_GEN(mdev, vport_group_manager))
4008 netdev->switchdev_ops = &mlx5e_switchdev_ops;
4009 #endif
4010 }
4011
4012 static void mlx5e_create_q_counter(struct mlx5e_priv *priv)
4013 {
4014 struct mlx5_core_dev *mdev = priv->mdev;
4015 int err;
4016
4017 err = mlx5_core_alloc_q_counter(mdev, &priv->q_counter);
4018 if (err) {
4019 mlx5_core_warn(mdev, "alloc queue counter failed, %d\n", err);
4020 priv->q_counter = 0;
4021 }
4022 }
4023
4024 static void mlx5e_destroy_q_counter(struct mlx5e_priv *priv)
4025 {
4026 if (!priv->q_counter)
4027 return;
4028
4029 mlx5_core_dealloc_q_counter(priv->mdev, priv->q_counter);
4030 }
4031
/* NIC profile .init hook: build the private data, then the net_device
 * fields, then initialise the VXLAN state.
 */
static void mlx5e_nic_init(struct mlx5_core_dev *mdev,
			   struct net_device *netdev,
			   const struct mlx5e_profile *profile,
			   void *ppriv)
{
	mlx5e_build_nic_netdev_priv(mdev, netdev, profile, ppriv);
	mlx5e_build_nic_netdev(netdev);
	mlx5e_vxlan_init(netdev_priv(netdev));
}
4043
4044 static void mlx5e_nic_cleanup(struct mlx5e_priv *priv)
4045 {
4046 mlx5e_vxlan_cleanup(priv);
4047
4048 if (priv->channels.params.xdp_prog)
4049 bpf_prog_put(priv->channels.params.xdp_prog);
4050 }
4051
4052 static int mlx5e_init_nic_rx(struct mlx5e_priv *priv)
4053 {
4054 struct mlx5_core_dev *mdev = priv->mdev;
4055 int err;
4056 int i;
4057
4058 err = mlx5e_create_indirect_rqts(priv);
4059 if (err) {
4060 mlx5_core_warn(mdev, "create indirect rqts failed, %d\n", err);
4061 return err;
4062 }
4063
4064 err = mlx5e_create_direct_rqts(priv);
4065 if (err) {
4066 mlx5_core_warn(mdev, "create direct rqts failed, %d\n", err);
4067 goto err_destroy_indirect_rqts;
4068 }
4069
4070 err = mlx5e_create_indirect_tirs(priv);
4071 if (err) {
4072 mlx5_core_warn(mdev, "create indirect tirs failed, %d\n", err);
4073 goto err_destroy_direct_rqts;
4074 }
4075
4076 err = mlx5e_create_direct_tirs(priv);
4077 if (err) {
4078 mlx5_core_warn(mdev, "create direct tirs failed, %d\n", err);
4079 goto err_destroy_indirect_tirs;
4080 }
4081
4082 err = mlx5e_create_flow_steering(priv);
4083 if (err) {
4084 mlx5_core_warn(mdev, "create flow steering failed, %d\n", err);
4085 goto err_destroy_direct_tirs;
4086 }
4087
4088 err = mlx5e_tc_init(priv);
4089 if (err)
4090 goto err_destroy_flow_steering;
4091
4092 return 0;
4093
4094 err_destroy_flow_steering:
4095 mlx5e_destroy_flow_steering(priv);
4096 err_destroy_direct_tirs:
4097 mlx5e_destroy_direct_tirs(priv);
4098 err_destroy_indirect_tirs:
4099 mlx5e_destroy_indirect_tirs(priv);
4100 err_destroy_direct_rqts:
4101 for (i = 0; i < priv->profile->max_nch(mdev); i++)
4102 mlx5e_destroy_rqt(priv, &priv->direct_tir[i].rqt);
4103 err_destroy_indirect_rqts:
4104 mlx5e_destroy_rqt(priv, &priv->indir_rqt);
4105 return err;
4106 }
4107
4108 static void mlx5e_cleanup_nic_rx(struct mlx5e_priv *priv)
4109 {
4110 int i;
4111
4112 mlx5e_tc_cleanup(priv);
4113 mlx5e_destroy_flow_steering(priv);
4114 mlx5e_destroy_direct_tirs(priv);
4115 mlx5e_destroy_indirect_tirs(priv);
4116 for (i = 0; i < priv->profile->max_nch(priv->mdev); i++)
4117 mlx5e_destroy_rqt(priv, &priv->direct_tir[i].rqt);
4118 mlx5e_destroy_rqt(priv, &priv->indir_rqt);
4119 }
4120
4121 static int mlx5e_init_nic_tx(struct mlx5e_priv *priv)
4122 {
4123 int err;
4124
4125 err = mlx5e_create_tises(priv);
4126 if (err) {
4127 mlx5_core_warn(priv->mdev, "create tises failed, %d\n", err);
4128 return err;
4129 }
4130
4131 #ifdef CONFIG_MLX5_CORE_EN_DCB
4132 mlx5e_dcbnl_initialize(priv);
4133 #endif
4134 return 0;
4135 }
4136
4137 static void mlx5e_nic_enable(struct mlx5e_priv *priv)
4138 {
4139 struct net_device *netdev = priv->netdev;
4140 struct mlx5_core_dev *mdev = priv->mdev;
4141 struct mlx5_eswitch *esw = mdev->priv.eswitch;
4142 struct mlx5_eswitch_rep rep;
4143
4144 mlx5_lag_add(mdev, netdev);
4145
4146 mlx5e_enable_async_events(priv);
4147
4148 if (MLX5_CAP_GEN(mdev, vport_group_manager)) {
4149 mlx5_query_nic_vport_mac_address(mdev, 0, rep.hw_id);
4150 rep.load = mlx5e_nic_rep_load;
4151 rep.unload = mlx5e_nic_rep_unload;
4152 rep.vport = FDB_UPLINK_VPORT;
4153 rep.netdev = netdev;
4154 mlx5_eswitch_register_vport_rep(esw, 0, &rep);
4155 }
4156
4157 if (netdev->reg_state != NETREG_REGISTERED)
4158 return;
4159
4160 /* Device already registered: sync netdev system state */
4161 if (mlx5e_vxlan_allowed(mdev)) {
4162 rtnl_lock();
4163 udp_tunnel_get_rx_info(netdev);
4164 rtnl_unlock();
4165 }
4166
4167 queue_work(priv->wq, &priv->set_rx_mode_work);
4168 }
4169
4170 static void mlx5e_nic_disable(struct mlx5e_priv *priv)
4171 {
4172 struct mlx5_core_dev *mdev = priv->mdev;
4173 struct mlx5_eswitch *esw = mdev->priv.eswitch;
4174
4175 queue_work(priv->wq, &priv->set_rx_mode_work);
4176 if (MLX5_CAP_GEN(mdev, vport_group_manager))
4177 mlx5_eswitch_unregister_vport_rep(esw, 0);
4178 mlx5e_disable_async_events(priv);
4179 mlx5_lag_remove(mdev);
4180 }
4181
4182 static const struct mlx5e_profile mlx5e_nic_profile = {
4183 .init = mlx5e_nic_init,
4184 .cleanup = mlx5e_nic_cleanup,
4185 .init_rx = mlx5e_init_nic_rx,
4186 .cleanup_rx = mlx5e_cleanup_nic_rx,
4187 .init_tx = mlx5e_init_nic_tx,
4188 .cleanup_tx = mlx5e_cleanup_nic_tx,
4189 .enable = mlx5e_nic_enable,
4190 .disable = mlx5e_nic_disable,
4191 .update_stats = mlx5e_update_stats,
4192 .max_nch = mlx5e_get_max_num_channels,
4193 .max_tc = MLX5E_MAX_NUM_TC,
4194 };
4195
4196 struct net_device *mlx5e_create_netdev(struct mlx5_core_dev *mdev,
4197 const struct mlx5e_profile *profile,
4198 void *ppriv)
4199 {
4200 int nch = profile->max_nch(mdev);
4201 struct net_device *netdev;
4202 struct mlx5e_priv *priv;
4203
4204 netdev = alloc_etherdev_mqs(sizeof(struct mlx5e_priv),
4205 nch * profile->max_tc,
4206 nch);
4207 if (!netdev) {
4208 mlx5_core_err(mdev, "alloc_etherdev_mqs() failed\n");
4209 return NULL;
4210 }
4211
4212 #ifdef CONFIG_RFS_ACCEL
4213 netdev->rx_cpu_rmap = mdev->rmap;
4214 #endif
4215
4216 profile->init(mdev, netdev, profile, ppriv);
4217
4218 netif_carrier_off(netdev);
4219
4220 priv = netdev_priv(netdev);
4221
4222 priv->wq = create_singlethread_workqueue("mlx5e");
4223 if (!priv->wq)
4224 goto err_cleanup_nic;
4225
4226 return netdev;
4227
4228 err_cleanup_nic:
4229 profile->cleanup(priv);
4230 free_netdev(netdev);
4231
4232 return NULL;
4233 }
4234
4235 int mlx5e_attach_netdev(struct mlx5_core_dev *mdev, struct net_device *netdev)
4236 {
4237 const struct mlx5e_profile *profile;
4238 struct mlx5e_priv *priv;
4239 u16 max_mtu;
4240 int err;
4241
4242 priv = netdev_priv(netdev);
4243 profile = priv->profile;
4244 clear_bit(MLX5E_STATE_DESTROYING, &priv->state);
4245
4246 err = profile->init_tx(priv);
4247 if (err)
4248 goto out;
4249
4250 err = mlx5e_open_drop_rq(mdev, &priv->drop_rq);
4251 if (err) {
4252 mlx5_core_err(mdev, "open drop rq failed, %d\n", err);
4253 goto err_cleanup_tx;
4254 }
4255
4256 err = profile->init_rx(priv);
4257 if (err)
4258 goto err_close_drop_rq;
4259
4260 mlx5e_create_q_counter(priv);
4261
4262 mlx5e_init_l2_addr(priv);
4263
4264 /* MTU range: 68 - hw-specific max */
4265 netdev->min_mtu = ETH_MIN_MTU;
4266 mlx5_query_port_max_mtu(priv->mdev, &max_mtu, 1);
4267 netdev->max_mtu = MLX5E_HW2SW_MTU(max_mtu);
4268
4269 mlx5e_set_dev_port_mtu(priv);
4270
4271 if (profile->enable)
4272 profile->enable(priv);
4273
4274 rtnl_lock();
4275 if (netif_running(netdev))
4276 mlx5e_open(netdev);
4277 netif_device_attach(netdev);
4278 rtnl_unlock();
4279
4280 return 0;
4281
4282 err_close_drop_rq:
4283 mlx5e_close_drop_rq(&priv->drop_rq);
4284
4285 err_cleanup_tx:
4286 profile->cleanup_tx(priv);
4287
4288 out:
4289 return err;
4290 }
4291
4292 static void mlx5e_register_vport_rep(struct mlx5_core_dev *mdev)
4293 {
4294 struct mlx5_eswitch *esw = mdev->priv.eswitch;
4295 int total_vfs = MLX5_TOTAL_VPORTS(mdev);
4296 int vport;
4297 u8 mac[ETH_ALEN];
4298
4299 if (!MLX5_CAP_GEN(mdev, vport_group_manager))
4300 return;
4301
4302 mlx5_query_nic_vport_mac_address(mdev, 0, mac);
4303
4304 for (vport = 1; vport < total_vfs; vport++) {
4305 struct mlx5_eswitch_rep rep;
4306
4307 rep.load = mlx5e_vport_rep_load;
4308 rep.unload = mlx5e_vport_rep_unload;
4309 rep.vport = vport;
4310 ether_addr_copy(rep.hw_id, mac);
4311 mlx5_eswitch_register_vport_rep(esw, vport, &rep);
4312 }
4313 }
4314
4315 static void mlx5e_unregister_vport_rep(struct mlx5_core_dev *mdev)
4316 {
4317 struct mlx5_eswitch *esw = mdev->priv.eswitch;
4318 int total_vfs = MLX5_TOTAL_VPORTS(mdev);
4319 int vport;
4320
4321 if (!MLX5_CAP_GEN(mdev, vport_group_manager))
4322 return;
4323
4324 for (vport = 1; vport < total_vfs; vport++)
4325 mlx5_eswitch_unregister_vport_rep(esw, vport);
4326 }
4327
4328 void mlx5e_detach_netdev(struct mlx5_core_dev *mdev, struct net_device *netdev)
4329 {
4330 struct mlx5e_priv *priv = netdev_priv(netdev);
4331 const struct mlx5e_profile *profile = priv->profile;
4332
4333 set_bit(MLX5E_STATE_DESTROYING, &priv->state);
4334
4335 rtnl_lock();
4336 if (netif_running(netdev))
4337 mlx5e_close(netdev);
4338 netif_device_detach(netdev);
4339 rtnl_unlock();
4340
4341 if (profile->disable)
4342 profile->disable(priv);
4343 flush_workqueue(priv->wq);
4344
4345 mlx5e_destroy_q_counter(priv);
4346 profile->cleanup_rx(priv);
4347 mlx5e_close_drop_rq(&priv->drop_rq);
4348 profile->cleanup_tx(priv);
4349 cancel_delayed_work_sync(&priv->update_stats_work);
4350 }
4351
4352 /* mlx5e_attach and mlx5e_detach scope should be only creating/destroying
4353 * hardware contexts and to connect it to the current netdev.
4354 */
4355 static int mlx5e_attach(struct mlx5_core_dev *mdev, void *vpriv)
4356 {
4357 struct mlx5e_priv *priv = vpriv;
4358 struct net_device *netdev = priv->netdev;
4359 int err;
4360
4361 if (netif_device_present(netdev))
4362 return 0;
4363
4364 err = mlx5e_create_mdev_resources(mdev);
4365 if (err)
4366 return err;
4367
4368 err = mlx5e_attach_netdev(mdev, netdev);
4369 if (err) {
4370 mlx5e_destroy_mdev_resources(mdev);
4371 return err;
4372 }
4373
4374 mlx5e_register_vport_rep(mdev);
4375 return 0;
4376 }
4377
4378 static void mlx5e_detach(struct mlx5_core_dev *mdev, void *vpriv)
4379 {
4380 struct mlx5e_priv *priv = vpriv;
4381 struct net_device *netdev = priv->netdev;
4382
4383 if (!netif_device_present(netdev))
4384 return;
4385
4386 mlx5e_unregister_vport_rep(mdev);
4387 mlx5e_detach_netdev(mdev, netdev);
4388 mlx5e_destroy_mdev_resources(mdev);
4389 }
4390
4391 static void *mlx5e_add(struct mlx5_core_dev *mdev)
4392 {
4393 struct mlx5_eswitch *esw = mdev->priv.eswitch;
4394 int total_vfs = MLX5_TOTAL_VPORTS(mdev);
4395 void *ppriv = NULL;
4396 void *priv;
4397 int vport;
4398 int err;
4399 struct net_device *netdev;
4400
4401 err = mlx5e_check_required_hca_cap(mdev);
4402 if (err)
4403 return NULL;
4404
4405 if (MLX5_CAP_GEN(mdev, vport_group_manager))
4406 ppriv = &esw->offloads.vport_reps[0];
4407
4408 netdev = mlx5e_create_netdev(mdev, &mlx5e_nic_profile, ppriv);
4409 if (!netdev) {
4410 mlx5_core_err(mdev, "mlx5e_create_netdev failed\n");
4411 goto err_unregister_reps;
4412 }
4413
4414 priv = netdev_priv(netdev);
4415
4416 err = mlx5e_attach(mdev, priv);
4417 if (err) {
4418 mlx5_core_err(mdev, "mlx5e_attach failed, %d\n", err);
4419 goto err_destroy_netdev;
4420 }
4421
4422 err = register_netdev(netdev);
4423 if (err) {
4424 mlx5_core_err(mdev, "register_netdev failed, %d\n", err);
4425 goto err_detach;
4426 }
4427
4428 return priv;
4429
4430 err_detach:
4431 mlx5e_detach(mdev, priv);
4432
4433 err_destroy_netdev:
4434 mlx5e_destroy_netdev(mdev, priv);
4435
4436 err_unregister_reps:
4437 for (vport = 1; vport < total_vfs; vport++)
4438 mlx5_eswitch_unregister_vport_rep(esw, vport);
4439
4440 return NULL;
4441 }
4442
4443 void mlx5e_destroy_netdev(struct mlx5_core_dev *mdev, struct mlx5e_priv *priv)
4444 {
4445 const struct mlx5e_profile *profile = priv->profile;
4446 struct net_device *netdev = priv->netdev;
4447
4448 destroy_workqueue(priv->wq);
4449 if (profile->cleanup)
4450 profile->cleanup(priv);
4451 free_netdev(netdev);
4452 }
4453
4454 static void mlx5e_remove(struct mlx5_core_dev *mdev, void *vpriv)
4455 {
4456 struct mlx5e_priv *priv = vpriv;
4457
4458 unregister_netdev(priv->netdev);
4459 mlx5e_detach(mdev, vpriv);
4460 mlx5e_destroy_netdev(mdev, priv);
4461 }
4462
4463 static void *mlx5e_get_netdev(void *vpriv)
4464 {
4465 struct mlx5e_priv *priv = vpriv;
4466
4467 return priv->netdev;
4468 }
4469
4470 static struct mlx5_interface mlx5e_interface = {
4471 .add = mlx5e_add,
4472 .remove = mlx5e_remove,
4473 .attach = mlx5e_attach,
4474 .detach = mlx5e_detach,
4475 .event = mlx5e_async_event,
4476 .protocol = MLX5_INTERFACE_PROTOCOL_ETH,
4477 .get_dev = mlx5e_get_netdev,
4478 };
4479
4480 void mlx5e_init(void)
4481 {
4482 mlx5e_build_ptys2ethtool_map();
4483 mlx5_register_interface(&mlx5e_interface);
4484 }
4485
4486 void mlx5e_cleanup(void)
4487 {
4488 mlx5_unregister_interface(&mlx5e_interface);
4489 }