2 * Copyright (c) 2007 Mellanox Technologies. All rights reserved.
4 * This software is available to you under a choice of one of two
5 * licenses. You may choose to be licensed under the terms of the GNU
6 * General Public License (GPL) Version 2, available from the file
7 * COPYING in the main directory of this source tree, or the
8 * OpenIB.org BSD license below:
10 * Redistribution and use in source and binary forms, with or
11 * without modification, are permitted provided that the following
14 * - Redistributions of source code must retain the above
15 * copyright notice, this list of conditions and the following
18 * - Redistributions in binary form must reproduce the above
19 * copyright notice, this list of conditions and the following
20 * disclaimer in the documentation and/or other materials
21 * provided with the distribution.
23 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
24 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
25 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
26 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
27 * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
28 * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
29 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
34 #include <linux/bpf.h>
35 #include <linux/etherdevice.h>
36 #include <linux/tcp.h>
37 #include <linux/if_vlan.h>
38 #include <linux/delay.h>
39 #include <linux/slab.h>
40 #include <linux/hash.h>
42 #include <net/busy_poll.h>
43 #include <net/vxlan.h>
44 #include <net/devlink.h>
46 #include <linux/mlx4/driver.h>
47 #include <linux/mlx4/device.h>
48 #include <linux/mlx4/cmd.h>
49 #include <linux/mlx4/cq.h>
54 #define MLX4_EN_MAX_XDP_MTU ((int)(PAGE_SIZE - ETH_HLEN - (2 * VLAN_HLEN) - \
57 int mlx4_en_setup_tc(struct net_device
*dev
, u8 up
)
59 struct mlx4_en_priv
*priv
= netdev_priv(dev
);
61 unsigned int offset
= 0;
63 if (up
&& up
!= MLX4_EN_NUM_UP
)
66 netdev_set_num_tc(dev
, up
);
68 /* Partition Tx queues evenly amongst UP's */
69 for (i
= 0; i
< up
; i
++) {
70 netdev_set_tc_queue(dev
, i
, priv
->num_tx_rings_p_up
, offset
);
71 offset
+= priv
->num_tx_rings_p_up
;
74 #ifdef CONFIG_MLX4_EN_DCB
75 if (!mlx4_is_slave(priv
->mdev
->dev
)) {
78 priv
->flags
|= MLX4_EN_FLAG_DCB_ENABLED
;
80 priv
->flags
&= ~MLX4_EN_FLAG_DCB_ENABLED
;
81 priv
->cee_config
.pfc_state
= false;
84 #endif /* CONFIG_MLX4_EN_DCB */
89 static int __mlx4_en_setup_tc(struct net_device
*dev
, u32 handle
, __be16 proto
,
90 struct tc_to_netdev
*tc
)
92 if (tc
->type
!= TC_SETUP_MQPRIO
)
95 return mlx4_en_setup_tc(dev
, tc
->tc
);
98 #ifdef CONFIG_RFS_ACCEL
100 struct mlx4_en_filter
{
101 struct list_head next
;
102 struct work_struct work
;
111 struct mlx4_en_priv
*priv
;
112 u32 flow_id
; /* RFS infrastructure id */
113 int id
; /* mlx4_en driver id */
114 u64 reg_id
; /* Flow steering API id */
115 u8 activated
; /* Used to prevent expiry before filter
118 struct hlist_node filter_chain
;
121 static void mlx4_en_filter_rfs_expire(struct mlx4_en_priv
*priv
);
123 static enum mlx4_net_trans_rule_id
mlx4_ip_proto_to_trans_rule_id(u8 ip_proto
)
127 return MLX4_NET_TRANS_RULE_ID_UDP
;
129 return MLX4_NET_TRANS_RULE_ID_TCP
;
131 return MLX4_NET_TRANS_RULE_NUM
;
135 /* Must not acquire state_lock, as its corresponding work_sync
138 static void mlx4_en_filter_work(struct work_struct
*work
)
140 struct mlx4_en_filter
*filter
= container_of(work
,
141 struct mlx4_en_filter
,
143 struct mlx4_en_priv
*priv
= filter
->priv
;
144 struct mlx4_spec_list spec_tcp_udp
= {
145 .id
= mlx4_ip_proto_to_trans_rule_id(filter
->ip_proto
),
148 .dst_port
= filter
->dst_port
,
149 .dst_port_msk
= (__force __be16
)-1,
150 .src_port
= filter
->src_port
,
151 .src_port_msk
= (__force __be16
)-1,
155 struct mlx4_spec_list spec_ip
= {
156 .id
= MLX4_NET_TRANS_RULE_ID_IPV4
,
159 .dst_ip
= filter
->dst_ip
,
160 .dst_ip_msk
= (__force __be32
)-1,
161 .src_ip
= filter
->src_ip
,
162 .src_ip_msk
= (__force __be32
)-1,
166 struct mlx4_spec_list spec_eth
= {
167 .id
= MLX4_NET_TRANS_RULE_ID_ETH
,
169 struct mlx4_net_trans_rule rule
= {
170 .list
= LIST_HEAD_INIT(rule
.list
),
171 .queue_mode
= MLX4_NET_TRANS_Q_LIFO
,
174 .promisc_mode
= MLX4_FS_REGULAR
,
176 .priority
= MLX4_DOMAIN_RFS
,
179 __be64 mac_mask
= cpu_to_be64(MLX4_MAC_MASK
<< 16);
181 if (spec_tcp_udp
.id
>= MLX4_NET_TRANS_RULE_NUM
) {
182 en_warn(priv
, "RFS: ignoring unsupported ip protocol (%d)\n",
186 list_add_tail(&spec_eth
.list
, &rule
.list
);
187 list_add_tail(&spec_ip
.list
, &rule
.list
);
188 list_add_tail(&spec_tcp_udp
.list
, &rule
.list
);
190 rule
.qpn
= priv
->rss_map
.qps
[filter
->rxq_index
].qpn
;
191 memcpy(spec_eth
.eth
.dst_mac
, priv
->dev
->dev_addr
, ETH_ALEN
);
192 memcpy(spec_eth
.eth
.dst_mac_msk
, &mac_mask
, ETH_ALEN
);
194 filter
->activated
= 0;
196 if (filter
->reg_id
) {
197 rc
= mlx4_flow_detach(priv
->mdev
->dev
, filter
->reg_id
);
198 if (rc
&& rc
!= -ENOENT
)
199 en_err(priv
, "Error detaching flow. rc = %d\n", rc
);
202 rc
= mlx4_flow_attach(priv
->mdev
->dev
, &rule
, &filter
->reg_id
);
204 en_err(priv
, "Error attaching flow. err = %d\n", rc
);
207 mlx4_en_filter_rfs_expire(priv
);
209 filter
->activated
= 1;
212 static inline struct hlist_head
*
213 filter_hash_bucket(struct mlx4_en_priv
*priv
, __be32 src_ip
, __be32 dst_ip
,
214 __be16 src_port
, __be16 dst_port
)
219 l
= (__force
unsigned long)src_port
|
220 ((__force
unsigned long)dst_port
<< 2);
221 l
^= (__force
unsigned long)(src_ip
^ dst_ip
);
223 bucket_idx
= hash_long(l
, MLX4_EN_FILTER_HASH_SHIFT
);
225 return &priv
->filter_hash
[bucket_idx
];
228 static struct mlx4_en_filter
*
229 mlx4_en_filter_alloc(struct mlx4_en_priv
*priv
, int rxq_index
, __be32 src_ip
,
230 __be32 dst_ip
, u8 ip_proto
, __be16 src_port
,
231 __be16 dst_port
, u32 flow_id
)
233 struct mlx4_en_filter
*filter
= NULL
;
235 filter
= kzalloc(sizeof(struct mlx4_en_filter
), GFP_ATOMIC
);
240 filter
->rxq_index
= rxq_index
;
241 INIT_WORK(&filter
->work
, mlx4_en_filter_work
);
243 filter
->src_ip
= src_ip
;
244 filter
->dst_ip
= dst_ip
;
245 filter
->ip_proto
= ip_proto
;
246 filter
->src_port
= src_port
;
247 filter
->dst_port
= dst_port
;
249 filter
->flow_id
= flow_id
;
251 filter
->id
= priv
->last_filter_id
++ % RPS_NO_FILTER
;
253 list_add_tail(&filter
->next
, &priv
->filters
);
254 hlist_add_head(&filter
->filter_chain
,
255 filter_hash_bucket(priv
, src_ip
, dst_ip
, src_port
,
261 static void mlx4_en_filter_free(struct mlx4_en_filter
*filter
)
263 struct mlx4_en_priv
*priv
= filter
->priv
;
266 list_del(&filter
->next
);
268 rc
= mlx4_flow_detach(priv
->mdev
->dev
, filter
->reg_id
);
269 if (rc
&& rc
!= -ENOENT
)
270 en_err(priv
, "Error detaching flow. rc = %d\n", rc
);
275 static inline struct mlx4_en_filter
*
276 mlx4_en_filter_find(struct mlx4_en_priv
*priv
, __be32 src_ip
, __be32 dst_ip
,
277 u8 ip_proto
, __be16 src_port
, __be16 dst_port
)
279 struct mlx4_en_filter
*filter
;
280 struct mlx4_en_filter
*ret
= NULL
;
282 hlist_for_each_entry(filter
,
283 filter_hash_bucket(priv
, src_ip
, dst_ip
,
286 if (filter
->src_ip
== src_ip
&&
287 filter
->dst_ip
== dst_ip
&&
288 filter
->ip_proto
== ip_proto
&&
289 filter
->src_port
== src_port
&&
290 filter
->dst_port
== dst_port
) {
300 mlx4_en_filter_rfs(struct net_device
*net_dev
, const struct sk_buff
*skb
,
301 u16 rxq_index
, u32 flow_id
)
303 struct mlx4_en_priv
*priv
= netdev_priv(net_dev
);
304 struct mlx4_en_filter
*filter
;
305 const struct iphdr
*ip
;
312 int nhoff
= skb_network_offset(skb
);
315 if (skb
->protocol
!= htons(ETH_P_IP
))
316 return -EPROTONOSUPPORT
;
318 ip
= (const struct iphdr
*)(skb
->data
+ nhoff
);
319 if (ip_is_fragment(ip
))
320 return -EPROTONOSUPPORT
;
322 if ((ip
->protocol
!= IPPROTO_TCP
) && (ip
->protocol
!= IPPROTO_UDP
))
323 return -EPROTONOSUPPORT
;
324 ports
= (const __be16
*)(skb
->data
+ nhoff
+ 4 * ip
->ihl
);
326 ip_proto
= ip
->protocol
;
332 spin_lock_bh(&priv
->filters_lock
);
333 filter
= mlx4_en_filter_find(priv
, src_ip
, dst_ip
, ip_proto
,
336 if (filter
->rxq_index
== rxq_index
)
339 filter
->rxq_index
= rxq_index
;
341 filter
= mlx4_en_filter_alloc(priv
, rxq_index
,
342 src_ip
, dst_ip
, ip_proto
,
343 src_port
, dst_port
, flow_id
);
350 queue_work(priv
->mdev
->workqueue
, &filter
->work
);
355 spin_unlock_bh(&priv
->filters_lock
);
360 void mlx4_en_cleanup_filters(struct mlx4_en_priv
*priv
)
362 struct mlx4_en_filter
*filter
, *tmp
;
365 spin_lock_bh(&priv
->filters_lock
);
366 list_for_each_entry_safe(filter
, tmp
, &priv
->filters
, next
) {
367 list_move(&filter
->next
, &del_list
);
368 hlist_del(&filter
->filter_chain
);
370 spin_unlock_bh(&priv
->filters_lock
);
372 list_for_each_entry_safe(filter
, tmp
, &del_list
, next
) {
373 cancel_work_sync(&filter
->work
);
374 mlx4_en_filter_free(filter
);
378 static void mlx4_en_filter_rfs_expire(struct mlx4_en_priv
*priv
)
380 struct mlx4_en_filter
*filter
= NULL
, *tmp
, *last_filter
= NULL
;
384 spin_lock_bh(&priv
->filters_lock
);
385 list_for_each_entry_safe(filter
, tmp
, &priv
->filters
, next
) {
386 if (i
> MLX4_EN_FILTER_EXPIRY_QUOTA
)
389 if (filter
->activated
&&
390 !work_pending(&filter
->work
) &&
391 rps_may_expire_flow(priv
->dev
,
392 filter
->rxq_index
, filter
->flow_id
,
394 list_move(&filter
->next
, &del_list
);
395 hlist_del(&filter
->filter_chain
);
397 last_filter
= filter
;
402 if (last_filter
&& (&last_filter
->next
!= priv
->filters
.next
))
403 list_move(&priv
->filters
, &last_filter
->next
);
405 spin_unlock_bh(&priv
->filters_lock
);
407 list_for_each_entry_safe(filter
, tmp
, &del_list
, next
)
408 mlx4_en_filter_free(filter
);
412 static int mlx4_en_vlan_rx_add_vid(struct net_device
*dev
,
413 __be16 proto
, u16 vid
)
415 struct mlx4_en_priv
*priv
= netdev_priv(dev
);
416 struct mlx4_en_dev
*mdev
= priv
->mdev
;
420 en_dbg(HW
, priv
, "adding VLAN:%d\n", vid
);
422 set_bit(vid
, priv
->active_vlans
);
424 /* Add VID to port VLAN filter */
425 mutex_lock(&mdev
->state_lock
);
426 if (mdev
->device_up
&& priv
->port_up
) {
427 err
= mlx4_SET_VLAN_FLTR(mdev
->dev
, priv
);
429 en_err(priv
, "Failed configuring VLAN filter\n");
433 err
= mlx4_register_vlan(mdev
->dev
, priv
->port
, vid
, &idx
);
435 en_dbg(HW
, priv
, "Failed adding vlan %d\n", vid
);
438 mutex_unlock(&mdev
->state_lock
);
442 static int mlx4_en_vlan_rx_kill_vid(struct net_device
*dev
,
443 __be16 proto
, u16 vid
)
445 struct mlx4_en_priv
*priv
= netdev_priv(dev
);
446 struct mlx4_en_dev
*mdev
= priv
->mdev
;
449 en_dbg(HW
, priv
, "Killing VID:%d\n", vid
);
451 clear_bit(vid
, priv
->active_vlans
);
453 /* Remove VID from port VLAN filter */
454 mutex_lock(&mdev
->state_lock
);
455 mlx4_unregister_vlan(mdev
->dev
, priv
->port
, vid
);
457 if (mdev
->device_up
&& priv
->port_up
) {
458 err
= mlx4_SET_VLAN_FLTR(mdev
->dev
, priv
);
460 en_err(priv
, "Failed configuring VLAN filter\n");
462 mutex_unlock(&mdev
->state_lock
);
467 static void mlx4_en_u64_to_mac(unsigned char dst_mac
[ETH_ALEN
+ 2], u64 src_mac
)
470 for (i
= ETH_ALEN
- 1; i
>= 0; --i
) {
471 dst_mac
[i
] = src_mac
& 0xff;
474 memset(&dst_mac
[ETH_ALEN
], 0, 2);
478 static int mlx4_en_tunnel_steer_add(struct mlx4_en_priv
*priv
, unsigned char *addr
,
479 int qpn
, u64
*reg_id
)
483 if (priv
->mdev
->dev
->caps
.tunnel_offload_mode
!= MLX4_TUNNEL_OFFLOAD_MODE_VXLAN
||
484 priv
->mdev
->dev
->caps
.dmfs_high_steer_mode
== MLX4_STEERING_DMFS_A0_STATIC
)
485 return 0; /* do nothing */
487 err
= mlx4_tunnel_steer_add(priv
->mdev
->dev
, addr
, priv
->port
, qpn
,
488 MLX4_DOMAIN_NIC
, reg_id
);
490 en_err(priv
, "failed to add vxlan steering rule, err %d\n", err
);
493 en_dbg(DRV
, priv
, "added vxlan steering rule, mac %pM reg_id %llx\n", addr
, *reg_id
);
498 static int mlx4_en_uc_steer_add(struct mlx4_en_priv
*priv
,
499 unsigned char *mac
, int *qpn
, u64
*reg_id
)
501 struct mlx4_en_dev
*mdev
= priv
->mdev
;
502 struct mlx4_dev
*dev
= mdev
->dev
;
505 switch (dev
->caps
.steering_mode
) {
506 case MLX4_STEERING_MODE_B0
: {
511 memcpy(&gid
[10], mac
, ETH_ALEN
);
514 err
= mlx4_unicast_attach(dev
, &qp
, gid
, 0, MLX4_PROT_ETH
);
517 case MLX4_STEERING_MODE_DEVICE_MANAGED
: {
518 struct mlx4_spec_list spec_eth
= { {NULL
} };
519 __be64 mac_mask
= cpu_to_be64(MLX4_MAC_MASK
<< 16);
521 struct mlx4_net_trans_rule rule
= {
522 .queue_mode
= MLX4_NET_TRANS_Q_FIFO
,
525 .promisc_mode
= MLX4_FS_REGULAR
,
526 .priority
= MLX4_DOMAIN_NIC
,
529 rule
.port
= priv
->port
;
531 INIT_LIST_HEAD(&rule
.list
);
533 spec_eth
.id
= MLX4_NET_TRANS_RULE_ID_ETH
;
534 memcpy(spec_eth
.eth
.dst_mac
, mac
, ETH_ALEN
);
535 memcpy(spec_eth
.eth
.dst_mac_msk
, &mac_mask
, ETH_ALEN
);
536 list_add_tail(&spec_eth
.list
, &rule
.list
);
538 err
= mlx4_flow_attach(dev
, &rule
, reg_id
);
545 en_warn(priv
, "Failed Attaching Unicast\n");
550 static void mlx4_en_uc_steer_release(struct mlx4_en_priv
*priv
,
551 unsigned char *mac
, int qpn
, u64 reg_id
)
553 struct mlx4_en_dev
*mdev
= priv
->mdev
;
554 struct mlx4_dev
*dev
= mdev
->dev
;
556 switch (dev
->caps
.steering_mode
) {
557 case MLX4_STEERING_MODE_B0
: {
562 memcpy(&gid
[10], mac
, ETH_ALEN
);
565 mlx4_unicast_detach(dev
, &qp
, gid
, MLX4_PROT_ETH
);
568 case MLX4_STEERING_MODE_DEVICE_MANAGED
: {
569 mlx4_flow_detach(dev
, reg_id
);
573 en_err(priv
, "Invalid steering mode.\n");
577 static int mlx4_en_get_qp(struct mlx4_en_priv
*priv
)
579 struct mlx4_en_dev
*mdev
= priv
->mdev
;
580 struct mlx4_dev
*dev
= mdev
->dev
;
583 int *qpn
= &priv
->base_qpn
;
584 u64 mac
= mlx4_mac_to_u64(priv
->dev
->dev_addr
);
586 en_dbg(DRV
, priv
, "Registering MAC: %pM for adding\n",
587 priv
->dev
->dev_addr
);
588 index
= mlx4_register_mac(dev
, priv
->port
, mac
);
591 en_err(priv
, "Failed adding MAC: %pM\n",
592 priv
->dev
->dev_addr
);
596 if (dev
->caps
.steering_mode
== MLX4_STEERING_MODE_A0
) {
597 int base_qpn
= mlx4_get_base_qpn(dev
, priv
->port
);
598 *qpn
= base_qpn
+ index
;
602 err
= mlx4_qp_reserve_range(dev
, 1, 1, qpn
, MLX4_RESERVE_A0_QP
);
603 en_dbg(DRV
, priv
, "Reserved qp %d\n", *qpn
);
605 en_err(priv
, "Failed to reserve qp for mac registration\n");
606 mlx4_unregister_mac(dev
, priv
->port
, mac
);
613 static void mlx4_en_put_qp(struct mlx4_en_priv
*priv
)
615 struct mlx4_en_dev
*mdev
= priv
->mdev
;
616 struct mlx4_dev
*dev
= mdev
->dev
;
617 int qpn
= priv
->base_qpn
;
619 if (dev
->caps
.steering_mode
== MLX4_STEERING_MODE_A0
) {
620 u64 mac
= mlx4_mac_to_u64(priv
->dev
->dev_addr
);
621 en_dbg(DRV
, priv
, "Registering MAC: %pM for deleting\n",
622 priv
->dev
->dev_addr
);
623 mlx4_unregister_mac(dev
, priv
->port
, mac
);
625 en_dbg(DRV
, priv
, "Releasing qp: port %d, qpn %d\n",
627 mlx4_qp_release_range(dev
, qpn
, 1);
628 priv
->flags
&= ~MLX4_EN_FLAG_FORCE_PROMISC
;
632 static int mlx4_en_replace_mac(struct mlx4_en_priv
*priv
, int qpn
,
633 unsigned char *new_mac
, unsigned char *prev_mac
)
635 struct mlx4_en_dev
*mdev
= priv
->mdev
;
636 struct mlx4_dev
*dev
= mdev
->dev
;
638 u64 new_mac_u64
= mlx4_mac_to_u64(new_mac
);
640 if (dev
->caps
.steering_mode
!= MLX4_STEERING_MODE_A0
) {
641 struct hlist_head
*bucket
;
642 unsigned int mac_hash
;
643 struct mlx4_mac_entry
*entry
;
644 struct hlist_node
*tmp
;
645 u64 prev_mac_u64
= mlx4_mac_to_u64(prev_mac
);
647 bucket
= &priv
->mac_hash
[prev_mac
[MLX4_EN_MAC_HASH_IDX
]];
648 hlist_for_each_entry_safe(entry
, tmp
, bucket
, hlist
) {
649 if (ether_addr_equal_64bits(entry
->mac
, prev_mac
)) {
650 mlx4_en_uc_steer_release(priv
, entry
->mac
,
652 mlx4_unregister_mac(dev
, priv
->port
,
654 hlist_del_rcu(&entry
->hlist
);
656 memcpy(entry
->mac
, new_mac
, ETH_ALEN
);
658 mac_hash
= new_mac
[MLX4_EN_MAC_HASH_IDX
];
659 hlist_add_head_rcu(&entry
->hlist
,
660 &priv
->mac_hash
[mac_hash
]);
661 mlx4_register_mac(dev
, priv
->port
, new_mac_u64
);
662 err
= mlx4_en_uc_steer_add(priv
, new_mac
,
667 if (priv
->tunnel_reg_id
) {
668 mlx4_flow_detach(priv
->mdev
->dev
, priv
->tunnel_reg_id
);
669 priv
->tunnel_reg_id
= 0;
671 err
= mlx4_en_tunnel_steer_add(priv
, new_mac
, qpn
,
672 &priv
->tunnel_reg_id
);
679 return __mlx4_replace_mac(dev
, priv
->port
, qpn
, new_mac_u64
);
682 static int mlx4_en_do_set_mac(struct mlx4_en_priv
*priv
,
683 unsigned char new_mac
[ETH_ALEN
+ 2])
688 /* Remove old MAC and insert the new one */
689 err
= mlx4_en_replace_mac(priv
, priv
->base_qpn
,
690 new_mac
, priv
->current_mac
);
692 en_err(priv
, "Failed changing HW MAC address\n");
694 en_dbg(HW
, priv
, "Port is down while registering mac, exiting...\n");
697 memcpy(priv
->current_mac
, new_mac
, sizeof(priv
->current_mac
));
702 static int mlx4_en_set_mac(struct net_device
*dev
, void *addr
)
704 struct mlx4_en_priv
*priv
= netdev_priv(dev
);
705 struct mlx4_en_dev
*mdev
= priv
->mdev
;
706 struct sockaddr
*saddr
= addr
;
707 unsigned char new_mac
[ETH_ALEN
+ 2];
710 if (!is_valid_ether_addr(saddr
->sa_data
))
711 return -EADDRNOTAVAIL
;
713 mutex_lock(&mdev
->state_lock
);
714 memcpy(new_mac
, saddr
->sa_data
, ETH_ALEN
);
715 err
= mlx4_en_do_set_mac(priv
, new_mac
);
717 memcpy(dev
->dev_addr
, saddr
->sa_data
, ETH_ALEN
);
718 mutex_unlock(&mdev
->state_lock
);
723 static void mlx4_en_clear_list(struct net_device
*dev
)
725 struct mlx4_en_priv
*priv
= netdev_priv(dev
);
726 struct mlx4_en_mc_list
*tmp
, *mc_to_del
;
728 list_for_each_entry_safe(mc_to_del
, tmp
, &priv
->mc_list
, list
) {
729 list_del(&mc_to_del
->list
);
734 static void mlx4_en_cache_mclist(struct net_device
*dev
)
736 struct mlx4_en_priv
*priv
= netdev_priv(dev
);
737 struct netdev_hw_addr
*ha
;
738 struct mlx4_en_mc_list
*tmp
;
740 mlx4_en_clear_list(dev
);
741 netdev_for_each_mc_addr(ha
, dev
) {
742 tmp
= kzalloc(sizeof(struct mlx4_en_mc_list
), GFP_ATOMIC
);
744 mlx4_en_clear_list(dev
);
747 memcpy(tmp
->addr
, ha
->addr
, ETH_ALEN
);
748 list_add_tail(&tmp
->list
, &priv
->mc_list
);
752 static void update_mclist_flags(struct mlx4_en_priv
*priv
,
753 struct list_head
*dst
,
754 struct list_head
*src
)
756 struct mlx4_en_mc_list
*dst_tmp
, *src_tmp
, *new_mc
;
759 /* Find all the entries that should be removed from dst,
760 * These are the entries that are not found in src
762 list_for_each_entry(dst_tmp
, dst
, list
) {
764 list_for_each_entry(src_tmp
, src
, list
) {
765 if (ether_addr_equal(dst_tmp
->addr
, src_tmp
->addr
)) {
771 dst_tmp
->action
= MCLIST_REM
;
774 /* Add entries that exist in src but not in dst
775 * and mark them as needing to be added
777 list_for_each_entry(src_tmp
, src
, list
) {
779 list_for_each_entry(dst_tmp
, dst
, list
) {
780 if (ether_addr_equal(dst_tmp
->addr
, src_tmp
->addr
)) {
781 dst_tmp
->action
= MCLIST_NONE
;
787 new_mc
= kmemdup(src_tmp
,
788 sizeof(struct mlx4_en_mc_list
),
793 new_mc
->action
= MCLIST_ADD
;
794 list_add_tail(&new_mc
->list
, dst
);
799 static void mlx4_en_set_rx_mode(struct net_device
*dev
)
801 struct mlx4_en_priv
*priv
= netdev_priv(dev
);
806 queue_work(priv
->mdev
->workqueue
, &priv
->rx_mode_task
);
809 static void mlx4_en_set_promisc_mode(struct mlx4_en_priv
*priv
,
810 struct mlx4_en_dev
*mdev
)
814 if (!(priv
->flags
& MLX4_EN_FLAG_PROMISC
)) {
815 if (netif_msg_rx_status(priv
))
816 en_warn(priv
, "Entering promiscuous mode\n");
817 priv
->flags
|= MLX4_EN_FLAG_PROMISC
;
819 /* Enable promiscuous mode */
820 switch (mdev
->dev
->caps
.steering_mode
) {
821 case MLX4_STEERING_MODE_DEVICE_MANAGED
:
822 err
= mlx4_flow_steer_promisc_add(mdev
->dev
,
825 MLX4_FS_ALL_DEFAULT
);
827 en_err(priv
, "Failed enabling promiscuous mode\n");
828 priv
->flags
|= MLX4_EN_FLAG_MC_PROMISC
;
831 case MLX4_STEERING_MODE_B0
:
832 err
= mlx4_unicast_promisc_add(mdev
->dev
,
836 en_err(priv
, "Failed enabling unicast promiscuous mode\n");
838 /* Add the default qp number as multicast
841 if (!(priv
->flags
& MLX4_EN_FLAG_MC_PROMISC
)) {
842 err
= mlx4_multicast_promisc_add(mdev
->dev
,
846 en_err(priv
, "Failed enabling multicast promiscuous mode\n");
847 priv
->flags
|= MLX4_EN_FLAG_MC_PROMISC
;
851 case MLX4_STEERING_MODE_A0
:
852 err
= mlx4_SET_PORT_qpn_calc(mdev
->dev
,
857 en_err(priv
, "Failed enabling promiscuous mode\n");
861 /* Disable port multicast filter (unconditionally) */
862 err
= mlx4_SET_MCAST_FLTR(mdev
->dev
, priv
->port
, 0,
863 0, MLX4_MCAST_DISABLE
);
865 en_err(priv
, "Failed disabling multicast filter\n");
869 static void mlx4_en_clear_promisc_mode(struct mlx4_en_priv
*priv
,
870 struct mlx4_en_dev
*mdev
)
874 if (netif_msg_rx_status(priv
))
875 en_warn(priv
, "Leaving promiscuous mode\n");
876 priv
->flags
&= ~MLX4_EN_FLAG_PROMISC
;
878 /* Disable promiscuous mode */
879 switch (mdev
->dev
->caps
.steering_mode
) {
880 case MLX4_STEERING_MODE_DEVICE_MANAGED
:
881 err
= mlx4_flow_steer_promisc_remove(mdev
->dev
,
883 MLX4_FS_ALL_DEFAULT
);
885 en_err(priv
, "Failed disabling promiscuous mode\n");
886 priv
->flags
&= ~MLX4_EN_FLAG_MC_PROMISC
;
889 case MLX4_STEERING_MODE_B0
:
890 err
= mlx4_unicast_promisc_remove(mdev
->dev
,
894 en_err(priv
, "Failed disabling unicast promiscuous mode\n");
895 /* Disable Multicast promisc */
896 if (priv
->flags
& MLX4_EN_FLAG_MC_PROMISC
) {
897 err
= mlx4_multicast_promisc_remove(mdev
->dev
,
901 en_err(priv
, "Failed disabling multicast promiscuous mode\n");
902 priv
->flags
&= ~MLX4_EN_FLAG_MC_PROMISC
;
906 case MLX4_STEERING_MODE_A0
:
907 err
= mlx4_SET_PORT_qpn_calc(mdev
->dev
,
911 en_err(priv
, "Failed disabling promiscuous mode\n");
916 static void mlx4_en_do_multicast(struct mlx4_en_priv
*priv
,
917 struct net_device
*dev
,
918 struct mlx4_en_dev
*mdev
)
920 struct mlx4_en_mc_list
*mclist
, *tmp
;
922 u8 mc_list
[16] = {0};
925 /* Enable/disable the multicast filter according to IFF_ALLMULTI */
926 if (dev
->flags
& IFF_ALLMULTI
) {
927 err
= mlx4_SET_MCAST_FLTR(mdev
->dev
, priv
->port
, 0,
928 0, MLX4_MCAST_DISABLE
);
930 en_err(priv
, "Failed disabling multicast filter\n");
932 /* Add the default qp number as multicast promisc */
933 if (!(priv
->flags
& MLX4_EN_FLAG_MC_PROMISC
)) {
934 switch (mdev
->dev
->caps
.steering_mode
) {
935 case MLX4_STEERING_MODE_DEVICE_MANAGED
:
936 err
= mlx4_flow_steer_promisc_add(mdev
->dev
,
942 case MLX4_STEERING_MODE_B0
:
943 err
= mlx4_multicast_promisc_add(mdev
->dev
,
948 case MLX4_STEERING_MODE_A0
:
952 en_err(priv
, "Failed entering multicast promisc mode\n");
953 priv
->flags
|= MLX4_EN_FLAG_MC_PROMISC
;
956 /* Disable Multicast promisc */
957 if (priv
->flags
& MLX4_EN_FLAG_MC_PROMISC
) {
958 switch (mdev
->dev
->caps
.steering_mode
) {
959 case MLX4_STEERING_MODE_DEVICE_MANAGED
:
960 err
= mlx4_flow_steer_promisc_remove(mdev
->dev
,
965 case MLX4_STEERING_MODE_B0
:
966 err
= mlx4_multicast_promisc_remove(mdev
->dev
,
971 case MLX4_STEERING_MODE_A0
:
975 en_err(priv
, "Failed disabling multicast promiscuous mode\n");
976 priv
->flags
&= ~MLX4_EN_FLAG_MC_PROMISC
;
979 err
= mlx4_SET_MCAST_FLTR(mdev
->dev
, priv
->port
, 0,
980 0, MLX4_MCAST_DISABLE
);
982 en_err(priv
, "Failed disabling multicast filter\n");
984 /* Flush mcast filter and init it with broadcast address */
985 mlx4_SET_MCAST_FLTR(mdev
->dev
, priv
->port
, ETH_BCAST
,
986 1, MLX4_MCAST_CONFIG
);
988 /* Update multicast list - we cache all addresses so they won't
989 * change while HW is updated holding the command semaphore */
990 netif_addr_lock_bh(dev
);
991 mlx4_en_cache_mclist(dev
);
992 netif_addr_unlock_bh(dev
);
993 list_for_each_entry(mclist
, &priv
->mc_list
, list
) {
994 mcast_addr
= mlx4_mac_to_u64(mclist
->addr
);
995 mlx4_SET_MCAST_FLTR(mdev
->dev
, priv
->port
,
996 mcast_addr
, 0, MLX4_MCAST_CONFIG
);
998 err
= mlx4_SET_MCAST_FLTR(mdev
->dev
, priv
->port
, 0,
999 0, MLX4_MCAST_ENABLE
);
1001 en_err(priv
, "Failed enabling multicast filter\n");
1003 update_mclist_flags(priv
, &priv
->curr_list
, &priv
->mc_list
);
1004 list_for_each_entry_safe(mclist
, tmp
, &priv
->curr_list
, list
) {
1005 if (mclist
->action
== MCLIST_REM
) {
1006 /* detach this address and delete from list */
1007 memcpy(&mc_list
[10], mclist
->addr
, ETH_ALEN
);
1008 mc_list
[5] = priv
->port
;
1009 err
= mlx4_multicast_detach(mdev
->dev
,
1010 &priv
->rss_map
.indir_qp
,
1015 en_err(priv
, "Fail to detach multicast address\n");
1017 if (mclist
->tunnel_reg_id
) {
1018 err
= mlx4_flow_detach(priv
->mdev
->dev
, mclist
->tunnel_reg_id
);
1020 en_err(priv
, "Failed to detach multicast address\n");
1023 /* remove from list */
1024 list_del(&mclist
->list
);
1026 } else if (mclist
->action
== MCLIST_ADD
) {
1027 /* attach the address */
1028 memcpy(&mc_list
[10], mclist
->addr
, ETH_ALEN
);
1029 /* needed for B0 steering support */
1030 mc_list
[5] = priv
->port
;
1031 err
= mlx4_multicast_attach(mdev
->dev
,
1032 &priv
->rss_map
.indir_qp
,
1038 en_err(priv
, "Fail to attach multicast address\n");
1040 err
= mlx4_en_tunnel_steer_add(priv
, &mc_list
[10], priv
->base_qpn
,
1041 &mclist
->tunnel_reg_id
);
1043 en_err(priv
, "Failed to attach multicast address\n");
1049 static void mlx4_en_do_uc_filter(struct mlx4_en_priv
*priv
,
1050 struct net_device
*dev
,
1051 struct mlx4_en_dev
*mdev
)
1053 struct netdev_hw_addr
*ha
;
1054 struct mlx4_mac_entry
*entry
;
1055 struct hlist_node
*tmp
;
1059 struct hlist_head
*bucket
;
1064 /* Note that we do not need to protect our mac_hash traversal with rcu,
1065 * since all modification code is protected by mdev->state_lock
1068 /* find what to remove */
1069 for (i
= 0; i
< MLX4_EN_MAC_HASH_SIZE
; ++i
) {
1070 bucket
= &priv
->mac_hash
[i
];
1071 hlist_for_each_entry_safe(entry
, tmp
, bucket
, hlist
) {
1073 netdev_for_each_uc_addr(ha
, dev
) {
1074 if (ether_addr_equal_64bits(entry
->mac
,
1081 /* MAC address of the port is not in uc list */
1082 if (ether_addr_equal_64bits(entry
->mac
,
1087 mac
= mlx4_mac_to_u64(entry
->mac
);
1088 mlx4_en_uc_steer_release(priv
, entry
->mac
,
1091 mlx4_unregister_mac(mdev
->dev
, priv
->port
, mac
);
1093 hlist_del_rcu(&entry
->hlist
);
1094 kfree_rcu(entry
, rcu
);
1095 en_dbg(DRV
, priv
, "Removed MAC %pM on port:%d\n",
1096 entry
->mac
, priv
->port
);
1102 /* if we didn't remove anything, there is no use in trying to add
1103 * again once we are in a forced promisc mode state
1105 if ((priv
->flags
& MLX4_EN_FLAG_FORCE_PROMISC
) && 0 == removed
)
1108 prev_flags
= priv
->flags
;
1109 priv
->flags
&= ~MLX4_EN_FLAG_FORCE_PROMISC
;
1111 /* find what to add */
1112 netdev_for_each_uc_addr(ha
, dev
) {
1114 bucket
= &priv
->mac_hash
[ha
->addr
[MLX4_EN_MAC_HASH_IDX
]];
1115 hlist_for_each_entry(entry
, bucket
, hlist
) {
1116 if (ether_addr_equal_64bits(entry
->mac
, ha
->addr
)) {
1123 entry
= kmalloc(sizeof(*entry
), GFP_KERNEL
);
1125 en_err(priv
, "Failed adding MAC %pM on port:%d (out of memory)\n",
1126 ha
->addr
, priv
->port
);
1127 priv
->flags
|= MLX4_EN_FLAG_FORCE_PROMISC
;
1130 mac
= mlx4_mac_to_u64(ha
->addr
);
1131 memcpy(entry
->mac
, ha
->addr
, ETH_ALEN
);
1132 err
= mlx4_register_mac(mdev
->dev
, priv
->port
, mac
);
1134 en_err(priv
, "Failed registering MAC %pM on port %d: %d\n",
1135 ha
->addr
, priv
->port
, err
);
1137 priv
->flags
|= MLX4_EN_FLAG_FORCE_PROMISC
;
1140 err
= mlx4_en_uc_steer_add(priv
, ha
->addr
,
1144 en_err(priv
, "Failed adding MAC %pM on port %d: %d\n",
1145 ha
->addr
, priv
->port
, err
);
1146 mlx4_unregister_mac(mdev
->dev
, priv
->port
, mac
);
1148 priv
->flags
|= MLX4_EN_FLAG_FORCE_PROMISC
;
1151 unsigned int mac_hash
;
1152 en_dbg(DRV
, priv
, "Added MAC %pM on port:%d\n",
1153 ha
->addr
, priv
->port
);
1154 mac_hash
= ha
->addr
[MLX4_EN_MAC_HASH_IDX
];
1155 bucket
= &priv
->mac_hash
[mac_hash
];
1156 hlist_add_head_rcu(&entry
->hlist
, bucket
);
1161 if (priv
->flags
& MLX4_EN_FLAG_FORCE_PROMISC
) {
1162 en_warn(priv
, "Forcing promiscuous mode on port:%d\n",
1164 } else if (prev_flags
& MLX4_EN_FLAG_FORCE_PROMISC
) {
1165 en_warn(priv
, "Stop forcing promiscuous mode on port:%d\n",
1170 static void mlx4_en_do_set_rx_mode(struct work_struct
*work
)
1172 struct mlx4_en_priv
*priv
= container_of(work
, struct mlx4_en_priv
,
1174 struct mlx4_en_dev
*mdev
= priv
->mdev
;
1175 struct net_device
*dev
= priv
->dev
;
1177 mutex_lock(&mdev
->state_lock
);
1178 if (!mdev
->device_up
) {
1179 en_dbg(HW
, priv
, "Card is not up, ignoring rx mode change.\n");
1182 if (!priv
->port_up
) {
1183 en_dbg(HW
, priv
, "Port is down, ignoring rx mode change.\n");
1187 if (!netif_carrier_ok(dev
)) {
1188 if (!mlx4_en_QUERY_PORT(mdev
, priv
->port
)) {
1189 if (priv
->port_state
.link_state
) {
1190 priv
->last_link_state
= MLX4_DEV_EVENT_PORT_UP
;
1191 netif_carrier_on(dev
);
1192 en_dbg(LINK
, priv
, "Link Up\n");
1197 if (dev
->priv_flags
& IFF_UNICAST_FLT
)
1198 mlx4_en_do_uc_filter(priv
, dev
, mdev
);
1200 /* Promiscuous mode: disable all filters */
1201 if ((dev
->flags
& IFF_PROMISC
) ||
1202 (priv
->flags
& MLX4_EN_FLAG_FORCE_PROMISC
)) {
1203 mlx4_en_set_promisc_mode(priv
, mdev
);
1207 /* Not in promiscuous mode */
1208 if (priv
->flags
& MLX4_EN_FLAG_PROMISC
)
1209 mlx4_en_clear_promisc_mode(priv
, mdev
);
1211 mlx4_en_do_multicast(priv
, dev
, mdev
);
1213 mutex_unlock(&mdev
->state_lock
);
1216 #ifdef CONFIG_NET_POLL_CONTROLLER
1217 static void mlx4_en_netpoll(struct net_device
*dev
)
1219 struct mlx4_en_priv
*priv
= netdev_priv(dev
);
1220 struct mlx4_en_cq
*cq
;
1223 for (i
= 0; i
< priv
->tx_ring_num
[TX
]; i
++) {
1224 cq
= priv
->tx_cq
[TX
][i
];
1225 napi_schedule(&cq
->napi
);
1230 static int mlx4_en_set_rss_steer_rules(struct mlx4_en_priv
*priv
)
1234 int *qpn
= &priv
->base_qpn
;
1235 struct mlx4_mac_entry
*entry
;
1237 err
= mlx4_en_uc_steer_add(priv
, priv
->dev
->dev_addr
, qpn
, ®_id
);
1241 err
= mlx4_en_tunnel_steer_add(priv
, priv
->dev
->dev_addr
, *qpn
,
1242 &priv
->tunnel_reg_id
);
1246 entry
= kmalloc(sizeof(*entry
), GFP_KERNEL
);
1252 memcpy(entry
->mac
, priv
->dev
->dev_addr
, sizeof(entry
->mac
));
1253 memcpy(priv
->current_mac
, entry
->mac
, sizeof(priv
->current_mac
));
1254 entry
->reg_id
= reg_id
;
1255 hlist_add_head_rcu(&entry
->hlist
,
1256 &priv
->mac_hash
[entry
->mac
[MLX4_EN_MAC_HASH_IDX
]]);
1261 if (priv
->tunnel_reg_id
)
1262 mlx4_flow_detach(priv
->mdev
->dev
, priv
->tunnel_reg_id
);
1265 mlx4_en_uc_steer_release(priv
, priv
->dev
->dev_addr
, *qpn
, reg_id
);
1269 static void mlx4_en_delete_rss_steer_rules(struct mlx4_en_priv
*priv
)
1273 int qpn
= priv
->base_qpn
;
1274 struct hlist_head
*bucket
;
1275 struct hlist_node
*tmp
;
1276 struct mlx4_mac_entry
*entry
;
1278 for (i
= 0; i
< MLX4_EN_MAC_HASH_SIZE
; ++i
) {
1279 bucket
= &priv
->mac_hash
[i
];
1280 hlist_for_each_entry_safe(entry
, tmp
, bucket
, hlist
) {
1281 mac
= mlx4_mac_to_u64(entry
->mac
);
1282 en_dbg(DRV
, priv
, "Registering MAC:%pM for deleting\n",
1284 mlx4_en_uc_steer_release(priv
, entry
->mac
,
1285 qpn
, entry
->reg_id
);
1287 mlx4_unregister_mac(priv
->mdev
->dev
, priv
->port
, mac
);
1288 hlist_del_rcu(&entry
->hlist
);
1289 kfree_rcu(entry
, rcu
);
1293 if (priv
->tunnel_reg_id
) {
1294 mlx4_flow_detach(priv
->mdev
->dev
, priv
->tunnel_reg_id
);
1295 priv
->tunnel_reg_id
= 0;
1299 static void mlx4_en_tx_timeout(struct net_device
*dev
)
1301 struct mlx4_en_priv
*priv
= netdev_priv(dev
);
1302 struct mlx4_en_dev
*mdev
= priv
->mdev
;
1305 if (netif_msg_timer(priv
))
1306 en_warn(priv
, "Tx timeout called on port:%d\n", priv
->port
);
1308 for (i
= 0; i
< priv
->tx_ring_num
[TX
]; i
++) {
1309 struct mlx4_en_tx_ring
*tx_ring
= priv
->tx_ring
[TX
][i
];
1311 if (!netif_tx_queue_stopped(netdev_get_tx_queue(dev
, i
)))
1313 en_warn(priv
, "TX timeout on queue: %d, QP: 0x%x, CQ: 0x%x, Cons: 0x%x, Prod: 0x%x\n",
1314 i
, tx_ring
->qpn
, tx_ring
->sp_cqn
,
1315 tx_ring
->cons
, tx_ring
->prod
);
1318 priv
->port_stats
.tx_timeout
++;
1319 en_dbg(DRV
, priv
, "Scheduling watchdog\n");
1320 queue_work(mdev
->workqueue
, &priv
->watchdog_task
);
1325 mlx4_en_get_stats64(struct net_device
*dev
, struct rtnl_link_stats64
*stats
)
1327 struct mlx4_en_priv
*priv
= netdev_priv(dev
);
1329 spin_lock_bh(&priv
->stats_lock
);
1330 mlx4_en_fold_software_stats(dev
);
1331 netdev_stats_to_stats64(stats
, &dev
->stats
);
1332 spin_unlock_bh(&priv
->stats_lock
);
1335 static void mlx4_en_set_default_moderation(struct mlx4_en_priv
*priv
)
1337 struct mlx4_en_cq
*cq
;
1340 /* If we haven't received a specific coalescing setting
1341 * (module param), we set the moderation parameters as follows:
1342 * - moder_cnt is set to the number of mtu sized packets to
1343 * satisfy our coalescing target.
1344 * - moder_time is set to a fixed value.
1346 priv
->rx_frames
= MLX4_EN_RX_COAL_TARGET
;
1347 priv
->rx_usecs
= MLX4_EN_RX_COAL_TIME
;
1348 priv
->tx_frames
= MLX4_EN_TX_COAL_PKTS
;
1349 priv
->tx_usecs
= MLX4_EN_TX_COAL_TIME
;
1350 en_dbg(INTR
, priv
, "Default coalesing params for mtu:%d - rx_frames:%d rx_usecs:%d\n",
1351 priv
->dev
->mtu
, priv
->rx_frames
, priv
->rx_usecs
);
1353 /* Setup cq moderation params */
1354 for (i
= 0; i
< priv
->rx_ring_num
; i
++) {
1355 cq
= priv
->rx_cq
[i
];
1356 cq
->moder_cnt
= priv
->rx_frames
;
1357 cq
->moder_time
= priv
->rx_usecs
;
1358 priv
->last_moder_time
[i
] = MLX4_EN_AUTO_CONF
;
1359 priv
->last_moder_packets
[i
] = 0;
1360 priv
->last_moder_bytes
[i
] = 0;
1363 for (t
= 0 ; t
< MLX4_EN_NUM_TX_TYPES
; t
++) {
1364 for (i
= 0; i
< priv
->tx_ring_num
[t
]; i
++) {
1365 cq
= priv
->tx_cq
[t
][i
];
1366 cq
->moder_cnt
= priv
->tx_frames
;
1367 cq
->moder_time
= priv
->tx_usecs
;
1371 /* Reset auto-moderation params */
1372 priv
->pkt_rate_low
= MLX4_EN_RX_RATE_LOW
;
1373 priv
->rx_usecs_low
= MLX4_EN_RX_COAL_TIME_LOW
;
1374 priv
->pkt_rate_high
= MLX4_EN_RX_RATE_HIGH
;
1375 priv
->rx_usecs_high
= MLX4_EN_RX_COAL_TIME_HIGH
;
1376 priv
->sample_interval
= MLX4_EN_SAMPLE_INTERVAL
;
1377 priv
->adaptive_rx_coal
= 1;
1378 priv
->last_moder_jiffies
= 0;
1379 priv
->last_moder_tx_packets
= 0;
1382 static void mlx4_en_auto_moderation(struct mlx4_en_priv
*priv
)
1384 unsigned long period
= (unsigned long) (jiffies
- priv
->last_moder_jiffies
);
1385 struct mlx4_en_cq
*cq
;
1386 unsigned long packets
;
1388 unsigned long avg_pkt_size
;
1389 unsigned long rx_packets
;
1390 unsigned long rx_bytes
;
1391 unsigned long rx_pkt_diff
;
1395 if (!priv
->adaptive_rx_coal
|| period
< priv
->sample_interval
* HZ
)
1398 for (ring
= 0; ring
< priv
->rx_ring_num
; ring
++) {
1399 rx_packets
= READ_ONCE(priv
->rx_ring
[ring
]->packets
);
1400 rx_bytes
= READ_ONCE(priv
->rx_ring
[ring
]->bytes
);
1402 rx_pkt_diff
= ((unsigned long) (rx_packets
-
1403 priv
->last_moder_packets
[ring
]));
1404 packets
= rx_pkt_diff
;
1405 rate
= packets
* HZ
/ period
;
1406 avg_pkt_size
= packets
? ((unsigned long) (rx_bytes
-
1407 priv
->last_moder_bytes
[ring
])) / packets
: 0;
1409 /* Apply auto-moderation only when packet rate
1410 * exceeds a rate that it matters */
1411 if (rate
> (MLX4_EN_RX_RATE_THRESH
/ priv
->rx_ring_num
) &&
1412 avg_pkt_size
> MLX4_EN_AVG_PKT_SMALL
) {
1413 if (rate
< priv
->pkt_rate_low
)
1414 moder_time
= priv
->rx_usecs_low
;
1415 else if (rate
> priv
->pkt_rate_high
)
1416 moder_time
= priv
->rx_usecs_high
;
1418 moder_time
= (rate
- priv
->pkt_rate_low
) *
1419 (priv
->rx_usecs_high
- priv
->rx_usecs_low
) /
1420 (priv
->pkt_rate_high
- priv
->pkt_rate_low
) +
1423 moder_time
= priv
->rx_usecs_low
;
1426 if (moder_time
!= priv
->last_moder_time
[ring
]) {
1427 priv
->last_moder_time
[ring
] = moder_time
;
1428 cq
= priv
->rx_cq
[ring
];
1429 cq
->moder_time
= moder_time
;
1430 cq
->moder_cnt
= priv
->rx_frames
;
1431 err
= mlx4_en_set_cq_moder(priv
, cq
);
1433 en_err(priv
, "Failed modifying moderation for cq:%d\n",
1436 priv
->last_moder_packets
[ring
] = rx_packets
;
1437 priv
->last_moder_bytes
[ring
] = rx_bytes
;
1440 priv
->last_moder_jiffies
= jiffies
;
1443 static void mlx4_en_do_get_stats(struct work_struct
*work
)
1445 struct delayed_work
*delay
= to_delayed_work(work
);
1446 struct mlx4_en_priv
*priv
= container_of(delay
, struct mlx4_en_priv
,
1448 struct mlx4_en_dev
*mdev
= priv
->mdev
;
1451 mutex_lock(&mdev
->state_lock
);
1452 if (mdev
->device_up
) {
1453 if (priv
->port_up
) {
1454 err
= mlx4_en_DUMP_ETH_STATS(mdev
, priv
->port
, 0);
1456 en_dbg(HW
, priv
, "Could not update stats\n");
1458 mlx4_en_auto_moderation(priv
);
1461 queue_delayed_work(mdev
->workqueue
, &priv
->stats_task
, STATS_DELAY
);
1463 if (mdev
->mac_removed
[MLX4_MAX_PORTS
+ 1 - priv
->port
]) {
1464 mlx4_en_do_set_mac(priv
, priv
->current_mac
);
1465 mdev
->mac_removed
[MLX4_MAX_PORTS
+ 1 - priv
->port
] = 0;
1467 mutex_unlock(&mdev
->state_lock
);
1470 /* mlx4_en_service_task - Run service task for tasks that needed to be done
1473 static void mlx4_en_service_task(struct work_struct
*work
)
1475 struct delayed_work
*delay
= to_delayed_work(work
);
1476 struct mlx4_en_priv
*priv
= container_of(delay
, struct mlx4_en_priv
,
1478 struct mlx4_en_dev
*mdev
= priv
->mdev
;
1480 mutex_lock(&mdev
->state_lock
);
1481 if (mdev
->device_up
) {
1482 if (mdev
->dev
->caps
.flags2
& MLX4_DEV_CAP_FLAG2_TS
)
1483 mlx4_en_ptp_overflow_check(mdev
);
1485 mlx4_en_recover_from_oom(priv
);
1486 queue_delayed_work(mdev
->workqueue
, &priv
->service_task
,
1487 SERVICE_TASK_DELAY
);
1489 mutex_unlock(&mdev
->state_lock
);
1492 static void mlx4_en_linkstate(struct work_struct
*work
)
1494 struct mlx4_en_priv
*priv
= container_of(work
, struct mlx4_en_priv
,
1496 struct mlx4_en_dev
*mdev
= priv
->mdev
;
1497 int linkstate
= priv
->link_state
;
1499 mutex_lock(&mdev
->state_lock
);
1500 /* If observable port state changed set carrier state and
1501 * report to system log */
1502 if (priv
->last_link_state
!= linkstate
) {
1503 if (linkstate
== MLX4_DEV_EVENT_PORT_DOWN
) {
1504 en_info(priv
, "Link Down\n");
1505 netif_carrier_off(priv
->dev
);
1507 en_info(priv
, "Link Up\n");
1508 netif_carrier_on(priv
->dev
);
1511 priv
->last_link_state
= linkstate
;
1512 mutex_unlock(&mdev
->state_lock
);
1515 static int mlx4_en_init_affinity_hint(struct mlx4_en_priv
*priv
, int ring_idx
)
1517 struct mlx4_en_rx_ring
*ring
= priv
->rx_ring
[ring_idx
];
1518 int numa_node
= priv
->mdev
->dev
->numa_node
;
1520 if (!zalloc_cpumask_var(&ring
->affinity_mask
, GFP_KERNEL
))
1523 cpumask_set_cpu(cpumask_local_spread(ring_idx
, numa_node
),
1524 ring
->affinity_mask
);
1528 static void mlx4_en_free_affinity_hint(struct mlx4_en_priv
*priv
, int ring_idx
)
1530 free_cpumask_var(priv
->rx_ring
[ring_idx
]->affinity_mask
);
1533 static void mlx4_en_init_recycle_ring(struct mlx4_en_priv
*priv
,
1536 struct mlx4_en_tx_ring
*tx_ring
= priv
->tx_ring
[TX_XDP
][tx_ring_idx
];
1537 int rr_index
= tx_ring_idx
;
1539 tx_ring
->free_tx_desc
= mlx4_en_recycle_tx_desc
;
1540 tx_ring
->recycle_ring
= priv
->rx_ring
[rr_index
];
1541 en_dbg(DRV
, priv
, "Set tx_ring[%d][%d]->recycle_ring = rx_ring[%d]\n",
1542 TX_XDP
, tx_ring_idx
, rr_index
);
1545 int mlx4_en_start_port(struct net_device
*dev
)
1547 struct mlx4_en_priv
*priv
= netdev_priv(dev
);
1548 struct mlx4_en_dev
*mdev
= priv
->mdev
;
1549 struct mlx4_en_cq
*cq
;
1550 struct mlx4_en_tx_ring
*tx_ring
;
1555 u8 mc_list
[16] = {0};
1557 if (priv
->port_up
) {
1558 en_dbg(DRV
, priv
, "start port called while port already up\n");
1562 INIT_LIST_HEAD(&priv
->mc_list
);
1563 INIT_LIST_HEAD(&priv
->curr_list
);
1564 INIT_LIST_HEAD(&priv
->ethtool_list
);
1565 memset(&priv
->ethtool_rules
[0], 0,
1566 sizeof(struct ethtool_flow_id
) * MAX_NUM_OF_FS_RULES
);
1568 /* Calculate Rx buf size */
1569 dev
->mtu
= min(dev
->mtu
, priv
->max_mtu
);
1570 mlx4_en_calc_rx_buf(dev
);
1571 en_dbg(DRV
, priv
, "Rx buf size:%d\n", priv
->rx_skb_size
);
1573 /* Configure rx cq's and rings */
1574 err
= mlx4_en_activate_rx_rings(priv
);
1576 en_err(priv
, "Failed to activate RX rings\n");
1579 for (i
= 0; i
< priv
->rx_ring_num
; i
++) {
1580 cq
= priv
->rx_cq
[i
];
1582 err
= mlx4_en_init_affinity_hint(priv
, i
);
1584 en_err(priv
, "Failed preparing IRQ affinity hint\n");
1588 err
= mlx4_en_activate_cq(priv
, cq
, i
);
1590 en_err(priv
, "Failed activating Rx CQ\n");
1591 mlx4_en_free_affinity_hint(priv
, i
);
1595 for (j
= 0; j
< cq
->size
; j
++) {
1596 struct mlx4_cqe
*cqe
= NULL
;
1598 cqe
= mlx4_en_get_cqe(cq
->buf
, j
, priv
->cqe_size
) +
1600 cqe
->owner_sr_opcode
= MLX4_CQE_OWNER_MASK
;
1603 err
= mlx4_en_set_cq_moder(priv
, cq
);
1605 en_err(priv
, "Failed setting cq moderation parameters\n");
1606 mlx4_en_deactivate_cq(priv
, cq
);
1607 mlx4_en_free_affinity_hint(priv
, i
);
1610 mlx4_en_arm_cq(priv
, cq
);
1611 priv
->rx_ring
[i
]->cqn
= cq
->mcq
.cqn
;
1616 en_dbg(DRV
, priv
, "Getting qp number for port %d\n", priv
->port
);
1617 err
= mlx4_en_get_qp(priv
);
1619 en_err(priv
, "Failed getting eth qp\n");
1622 mdev
->mac_removed
[priv
->port
] = 0;
1624 priv
->counter_index
=
1625 mlx4_get_default_counter_index(mdev
->dev
, priv
->port
);
1627 err
= mlx4_en_config_rss_steer(priv
);
1629 en_err(priv
, "Failed configuring rss steering\n");
1633 err
= mlx4_en_create_drop_qp(priv
);
1637 /* Configure tx cq's and rings */
1638 for (t
= 0 ; t
< MLX4_EN_NUM_TX_TYPES
; t
++) {
1639 u8 num_tx_rings_p_up
= t
== TX
?
1640 priv
->num_tx_rings_p_up
: priv
->tx_ring_num
[t
];
1642 for (i
= 0; i
< priv
->tx_ring_num
[t
]; i
++) {
1644 cq
= priv
->tx_cq
[t
][i
];
1645 err
= mlx4_en_activate_cq(priv
, cq
, i
);
1647 en_err(priv
, "Failed allocating Tx CQ\n");
1650 err
= mlx4_en_set_cq_moder(priv
, cq
);
1652 en_err(priv
, "Failed setting cq moderation parameters\n");
1653 mlx4_en_deactivate_cq(priv
, cq
);
1657 "Resetting index of collapsed CQ:%d to -1\n", i
);
1658 cq
->buf
->wqe_index
= cpu_to_be16(0xffff);
1660 /* Configure ring */
1661 tx_ring
= priv
->tx_ring
[t
][i
];
1662 err
= mlx4_en_activate_tx_ring(priv
, tx_ring
,
1664 i
/ num_tx_rings_p_up
);
1666 en_err(priv
, "Failed allocating Tx ring\n");
1667 mlx4_en_deactivate_cq(priv
, cq
);
1671 tx_ring
->tx_queue
= netdev_get_tx_queue(dev
, i
);
1672 tx_ring
->recycle_ring
= NULL
;
1674 mlx4_en_init_recycle_ring(priv
, i
);
1677 /* Arm CQ for TX completions */
1678 mlx4_en_arm_cq(priv
, cq
);
1680 /* Set initial ownership of all Tx TXBBs to SW (1) */
1681 for (j
= 0; j
< tx_ring
->buf_size
; j
+= STAMP_STRIDE
)
1682 *((u32
*)(tx_ring
->buf
+ j
)) = 0xffffffff;
1686 /* Configure port */
1687 err
= mlx4_SET_PORT_general(mdev
->dev
, priv
->port
,
1688 priv
->rx_skb_size
+ ETH_FCS_LEN
,
1689 priv
->prof
->tx_pause
,
1691 priv
->prof
->rx_pause
,
1692 priv
->prof
->rx_ppp
);
1694 en_err(priv
, "Failed setting port general configurations for port %d, with error %d\n",
1698 /* Set default qp number */
1699 err
= mlx4_SET_PORT_qpn_calc(mdev
->dev
, priv
->port
, priv
->base_qpn
, 0);
1701 en_err(priv
, "Failed setting default qp numbers\n");
1705 if (mdev
->dev
->caps
.tunnel_offload_mode
== MLX4_TUNNEL_OFFLOAD_MODE_VXLAN
) {
1706 err
= mlx4_SET_PORT_VXLAN(mdev
->dev
, priv
->port
, VXLAN_STEER_BY_OUTER_MAC
, 1);
1708 en_err(priv
, "Failed setting port L2 tunnel configuration, err %d\n",
1715 en_dbg(HW
, priv
, "Initializing port\n");
1716 err
= mlx4_INIT_PORT(mdev
->dev
, priv
->port
);
1718 en_err(priv
, "Failed Initializing port\n");
1722 /* Set Unicast and VXLAN steering rules */
1723 if (mdev
->dev
->caps
.steering_mode
!= MLX4_STEERING_MODE_A0
&&
1724 mlx4_en_set_rss_steer_rules(priv
))
1725 mlx4_warn(mdev
, "Failed setting steering rules\n");
1727 /* Attach rx QP to bradcast address */
1728 eth_broadcast_addr(&mc_list
[10]);
1729 mc_list
[5] = priv
->port
; /* needed for B0 steering support */
1730 if (mlx4_multicast_attach(mdev
->dev
, &priv
->rss_map
.indir_qp
, mc_list
,
1731 priv
->port
, 0, MLX4_PROT_ETH
,
1732 &priv
->broadcast_id
))
1733 mlx4_warn(mdev
, "Failed Attaching Broadcast\n");
1735 /* Must redo promiscuous mode setup. */
1736 priv
->flags
&= ~(MLX4_EN_FLAG_PROMISC
| MLX4_EN_FLAG_MC_PROMISC
);
1738 /* Schedule multicast task to populate multicast list */
1739 queue_work(mdev
->workqueue
, &priv
->rx_mode_task
);
1741 if (priv
->mdev
->dev
->caps
.tunnel_offload_mode
== MLX4_TUNNEL_OFFLOAD_MODE_VXLAN
)
1742 udp_tunnel_get_rx_info(dev
);
1744 priv
->port_up
= true;
1746 /* Process all completions if exist to prevent
1747 * the queues freezing if they are full
1749 for (i
= 0; i
< priv
->rx_ring_num
; i
++) {
1751 napi_schedule(&priv
->rx_cq
[i
]->napi
);
1755 netif_tx_start_all_queues(dev
);
1756 netif_device_attach(dev
);
1761 if (t
== MLX4_EN_NUM_TX_TYPES
) {
1763 i
= priv
->tx_ring_num
[t
];
1767 mlx4_en_deactivate_tx_ring(priv
, priv
->tx_ring
[t
][i
]);
1768 mlx4_en_deactivate_cq(priv
, priv
->tx_cq
[t
][i
]);
1772 i
= priv
->tx_ring_num
[t
];
1774 mlx4_en_destroy_drop_qp(priv
);
1776 mlx4_en_release_rss_steer(priv
);
1778 mlx4_en_put_qp(priv
);
1780 while (rx_index
--) {
1781 mlx4_en_deactivate_cq(priv
, priv
->rx_cq
[rx_index
]);
1782 mlx4_en_free_affinity_hint(priv
, rx_index
);
1784 for (i
= 0; i
< priv
->rx_ring_num
; i
++)
1785 mlx4_en_deactivate_rx_ring(priv
, priv
->rx_ring
[i
]);
1787 return err
; /* need to close devices */
1791 void mlx4_en_stop_port(struct net_device
*dev
, int detach
)
1793 struct mlx4_en_priv
*priv
= netdev_priv(dev
);
1794 struct mlx4_en_dev
*mdev
= priv
->mdev
;
1795 struct mlx4_en_mc_list
*mclist
, *tmp
;
1796 struct ethtool_flow_id
*flow
, *tmp_flow
;
1798 u8 mc_list
[16] = {0};
1800 if (!priv
->port_up
) {
1801 en_dbg(DRV
, priv
, "stop port called while port already down\n");
1806 mlx4_CLOSE_PORT(mdev
->dev
, priv
->port
);
1808 /* Synchronize with tx routine */
1809 netif_tx_lock_bh(dev
);
1811 netif_device_detach(dev
);
1812 netif_tx_stop_all_queues(dev
);
1813 netif_tx_unlock_bh(dev
);
1815 netif_tx_disable(dev
);
1817 spin_lock_bh(&priv
->stats_lock
);
1818 mlx4_en_fold_software_stats(dev
);
1819 /* Set port as not active */
1820 priv
->port_up
= false;
1821 spin_unlock_bh(&priv
->stats_lock
);
1823 priv
->counter_index
= MLX4_SINK_COUNTER_INDEX(mdev
->dev
);
1825 /* Promsicuous mode */
1826 if (mdev
->dev
->caps
.steering_mode
==
1827 MLX4_STEERING_MODE_DEVICE_MANAGED
) {
1828 priv
->flags
&= ~(MLX4_EN_FLAG_PROMISC
|
1829 MLX4_EN_FLAG_MC_PROMISC
);
1830 mlx4_flow_steer_promisc_remove(mdev
->dev
,
1832 MLX4_FS_ALL_DEFAULT
);
1833 mlx4_flow_steer_promisc_remove(mdev
->dev
,
1835 MLX4_FS_MC_DEFAULT
);
1836 } else if (priv
->flags
& MLX4_EN_FLAG_PROMISC
) {
1837 priv
->flags
&= ~MLX4_EN_FLAG_PROMISC
;
1839 /* Disable promiscouos mode */
1840 mlx4_unicast_promisc_remove(mdev
->dev
, priv
->base_qpn
,
1843 /* Disable Multicast promisc */
1844 if (priv
->flags
& MLX4_EN_FLAG_MC_PROMISC
) {
1845 mlx4_multicast_promisc_remove(mdev
->dev
, priv
->base_qpn
,
1847 priv
->flags
&= ~MLX4_EN_FLAG_MC_PROMISC
;
1851 /* Detach All multicasts */
1852 eth_broadcast_addr(&mc_list
[10]);
1853 mc_list
[5] = priv
->port
; /* needed for B0 steering support */
1854 mlx4_multicast_detach(mdev
->dev
, &priv
->rss_map
.indir_qp
, mc_list
,
1855 MLX4_PROT_ETH
, priv
->broadcast_id
);
1856 list_for_each_entry(mclist
, &priv
->curr_list
, list
) {
1857 memcpy(&mc_list
[10], mclist
->addr
, ETH_ALEN
);
1858 mc_list
[5] = priv
->port
;
1859 mlx4_multicast_detach(mdev
->dev
, &priv
->rss_map
.indir_qp
,
1860 mc_list
, MLX4_PROT_ETH
, mclist
->reg_id
);
1861 if (mclist
->tunnel_reg_id
)
1862 mlx4_flow_detach(mdev
->dev
, mclist
->tunnel_reg_id
);
1864 mlx4_en_clear_list(dev
);
1865 list_for_each_entry_safe(mclist
, tmp
, &priv
->curr_list
, list
) {
1866 list_del(&mclist
->list
);
1870 /* Flush multicast filter */
1871 mlx4_SET_MCAST_FLTR(mdev
->dev
, priv
->port
, 0, 1, MLX4_MCAST_CONFIG
);
1873 /* Remove flow steering rules for the port*/
1874 if (mdev
->dev
->caps
.steering_mode
==
1875 MLX4_STEERING_MODE_DEVICE_MANAGED
) {
1877 list_for_each_entry_safe(flow
, tmp_flow
,
1878 &priv
->ethtool_list
, list
) {
1879 mlx4_flow_detach(mdev
->dev
, flow
->id
);
1880 list_del(&flow
->list
);
1884 mlx4_en_destroy_drop_qp(priv
);
1887 for (t
= 0; t
< MLX4_EN_NUM_TX_TYPES
; t
++) {
1888 for (i
= 0; i
< priv
->tx_ring_num
[t
]; i
++) {
1889 mlx4_en_deactivate_tx_ring(priv
, priv
->tx_ring
[t
][i
]);
1890 mlx4_en_deactivate_cq(priv
, priv
->tx_cq
[t
][i
]);
1895 for (t
= 0; t
< MLX4_EN_NUM_TX_TYPES
; t
++)
1896 for (i
= 0; i
< priv
->tx_ring_num
[t
]; i
++)
1897 mlx4_en_free_tx_buf(dev
, priv
->tx_ring
[t
][i
]);
1899 if (mdev
->dev
->caps
.steering_mode
!= MLX4_STEERING_MODE_A0
)
1900 mlx4_en_delete_rss_steer_rules(priv
);
1903 mlx4_en_release_rss_steer(priv
);
1905 /* Unregister Mac address for the port */
1906 mlx4_en_put_qp(priv
);
1907 if (!(mdev
->dev
->caps
.flags2
& MLX4_DEV_CAP_FLAG2_REASSIGN_MAC_EN
))
1908 mdev
->mac_removed
[priv
->port
] = 1;
1911 for (i
= 0; i
< priv
->rx_ring_num
; i
++) {
1912 struct mlx4_en_cq
*cq
= priv
->rx_cq
[i
];
1914 napi_synchronize(&cq
->napi
);
1915 mlx4_en_deactivate_rx_ring(priv
, priv
->rx_ring
[i
]);
1916 mlx4_en_deactivate_cq(priv
, cq
);
1918 mlx4_en_free_affinity_hint(priv
, i
);
1922 static void mlx4_en_restart(struct work_struct
*work
)
1924 struct mlx4_en_priv
*priv
= container_of(work
, struct mlx4_en_priv
,
1926 struct mlx4_en_dev
*mdev
= priv
->mdev
;
1927 struct net_device
*dev
= priv
->dev
;
1929 en_dbg(DRV
, priv
, "Watchdog task called for port %d\n", priv
->port
);
1932 mutex_lock(&mdev
->state_lock
);
1933 if (priv
->port_up
) {
1934 mlx4_en_stop_port(dev
, 1);
1935 if (mlx4_en_start_port(dev
))
1936 en_err(priv
, "Failed restarting port %d\n", priv
->port
);
1938 mutex_unlock(&mdev
->state_lock
);
1942 static void mlx4_en_clear_stats(struct net_device
*dev
)
1944 struct mlx4_en_priv
*priv
= netdev_priv(dev
);
1945 struct mlx4_en_dev
*mdev
= priv
->mdev
;
1946 struct mlx4_en_tx_ring
**tx_ring
;
1949 if (!mlx4_is_slave(mdev
->dev
))
1950 if (mlx4_en_DUMP_ETH_STATS(mdev
, priv
->port
, 1))
1951 en_dbg(HW
, priv
, "Failed dumping statistics\n");
1953 memset(&priv
->pstats
, 0, sizeof(priv
->pstats
));
1954 memset(&priv
->pkstats
, 0, sizeof(priv
->pkstats
));
1955 memset(&priv
->port_stats
, 0, sizeof(priv
->port_stats
));
1956 memset(&priv
->rx_flowstats
, 0, sizeof(priv
->rx_flowstats
));
1957 memset(&priv
->tx_flowstats
, 0, sizeof(priv
->tx_flowstats
));
1958 memset(&priv
->rx_priority_flowstats
, 0,
1959 sizeof(priv
->rx_priority_flowstats
));
1960 memset(&priv
->tx_priority_flowstats
, 0,
1961 sizeof(priv
->tx_priority_flowstats
));
1962 memset(&priv
->pf_stats
, 0, sizeof(priv
->pf_stats
));
1964 tx_ring
= priv
->tx_ring
[TX
];
1965 for (i
= 0; i
< priv
->tx_ring_num
[TX
]; i
++) {
1966 tx_ring
[i
]->bytes
= 0;
1967 tx_ring
[i
]->packets
= 0;
1968 tx_ring
[i
]->tx_csum
= 0;
1969 tx_ring
[i
]->tx_dropped
= 0;
1970 tx_ring
[i
]->queue_stopped
= 0;
1971 tx_ring
[i
]->wake_queue
= 0;
1972 tx_ring
[i
]->tso_packets
= 0;
1973 tx_ring
[i
]->xmit_more
= 0;
1975 for (i
= 0; i
< priv
->rx_ring_num
; i
++) {
1976 priv
->rx_ring
[i
]->bytes
= 0;
1977 priv
->rx_ring
[i
]->packets
= 0;
1978 priv
->rx_ring
[i
]->csum_ok
= 0;
1979 priv
->rx_ring
[i
]->csum_none
= 0;
1980 priv
->rx_ring
[i
]->csum_complete
= 0;
1984 static int mlx4_en_open(struct net_device
*dev
)
1986 struct mlx4_en_priv
*priv
= netdev_priv(dev
);
1987 struct mlx4_en_dev
*mdev
= priv
->mdev
;
1990 mutex_lock(&mdev
->state_lock
);
1992 if (!mdev
->device_up
) {
1993 en_err(priv
, "Cannot open - device down/disabled\n");
1998 /* Reset HW statistics and SW counters */
1999 mlx4_en_clear_stats(dev
);
2001 err
= mlx4_en_start_port(dev
);
2003 en_err(priv
, "Failed starting port:%d\n", priv
->port
);
2006 mutex_unlock(&mdev
->state_lock
);
2011 static int mlx4_en_close(struct net_device
*dev
)
2013 struct mlx4_en_priv
*priv
= netdev_priv(dev
);
2014 struct mlx4_en_dev
*mdev
= priv
->mdev
;
2016 en_dbg(IFDOWN
, priv
, "Close port called\n");
2018 mutex_lock(&mdev
->state_lock
);
2020 mlx4_en_stop_port(dev
, 0);
2021 netif_carrier_off(dev
);
2023 mutex_unlock(&mdev
->state_lock
);
2027 static void mlx4_en_free_resources(struct mlx4_en_priv
*priv
)
2031 #ifdef CONFIG_RFS_ACCEL
2032 priv
->dev
->rx_cpu_rmap
= NULL
;
2035 for (t
= 0; t
< MLX4_EN_NUM_TX_TYPES
; t
++) {
2036 for (i
= 0; i
< priv
->tx_ring_num
[t
]; i
++) {
2037 if (priv
->tx_ring
[t
] && priv
->tx_ring
[t
][i
])
2038 mlx4_en_destroy_tx_ring(priv
,
2039 &priv
->tx_ring
[t
][i
]);
2040 if (priv
->tx_cq
[t
] && priv
->tx_cq
[t
][i
])
2041 mlx4_en_destroy_cq(priv
, &priv
->tx_cq
[t
][i
]);
2045 for (i
= 0; i
< priv
->rx_ring_num
; i
++) {
2046 if (priv
->rx_ring
[i
])
2047 mlx4_en_destroy_rx_ring(priv
, &priv
->rx_ring
[i
],
2048 priv
->prof
->rx_ring_size
, priv
->stride
);
2050 mlx4_en_destroy_cq(priv
, &priv
->rx_cq
[i
]);
2055 static int mlx4_en_alloc_resources(struct mlx4_en_priv
*priv
)
2057 struct mlx4_en_port_profile
*prof
= priv
->prof
;
2061 /* Create tx Rings */
2062 for (t
= 0; t
< MLX4_EN_NUM_TX_TYPES
; t
++) {
2063 for (i
= 0; i
< priv
->tx_ring_num
[t
]; i
++) {
2064 node
= cpu_to_node(i
% num_online_cpus());
2065 if (mlx4_en_create_cq(priv
, &priv
->tx_cq
[t
][i
],
2066 prof
->tx_ring_size
, i
, t
, node
))
2069 if (mlx4_en_create_tx_ring(priv
, &priv
->tx_ring
[t
][i
],
2071 TXBB_SIZE
, node
, i
))
2076 /* Create rx Rings */
2077 for (i
= 0; i
< priv
->rx_ring_num
; i
++) {
2078 node
= cpu_to_node(i
% num_online_cpus());
2079 if (mlx4_en_create_cq(priv
, &priv
->rx_cq
[i
],
2080 prof
->rx_ring_size
, i
, RX
, node
))
2083 if (mlx4_en_create_rx_ring(priv
, &priv
->rx_ring
[i
],
2084 prof
->rx_ring_size
, priv
->stride
,
2089 #ifdef CONFIG_RFS_ACCEL
2090 priv
->dev
->rx_cpu_rmap
= mlx4_get_cpu_rmap(priv
->mdev
->dev
, priv
->port
);
2096 en_err(priv
, "Failed to allocate NIC resources\n");
2097 for (i
= 0; i
< priv
->rx_ring_num
; i
++) {
2098 if (priv
->rx_ring
[i
])
2099 mlx4_en_destroy_rx_ring(priv
, &priv
->rx_ring
[i
],
2103 mlx4_en_destroy_cq(priv
, &priv
->rx_cq
[i
]);
2105 for (t
= 0; t
< MLX4_EN_NUM_TX_TYPES
; t
++) {
2106 for (i
= 0; i
< priv
->tx_ring_num
[t
]; i
++) {
2107 if (priv
->tx_ring
[t
][i
])
2108 mlx4_en_destroy_tx_ring(priv
,
2109 &priv
->tx_ring
[t
][i
]);
2110 if (priv
->tx_cq
[t
][i
])
2111 mlx4_en_destroy_cq(priv
, &priv
->tx_cq
[t
][i
]);
2118 static int mlx4_en_copy_priv(struct mlx4_en_priv
*dst
,
2119 struct mlx4_en_priv
*src
,
2120 struct mlx4_en_port_profile
*prof
)
2124 memcpy(&dst
->hwtstamp_config
, &prof
->hwtstamp_config
,
2125 sizeof(dst
->hwtstamp_config
));
2126 dst
->num_tx_rings_p_up
= src
->mdev
->profile
.num_tx_rings_p_up
;
2127 dst
->rx_ring_num
= prof
->rx_ring_num
;
2128 dst
->flags
= prof
->flags
;
2129 dst
->mdev
= src
->mdev
;
2130 dst
->port
= src
->port
;
2131 dst
->dev
= src
->dev
;
2133 dst
->stride
= roundup_pow_of_two(sizeof(struct mlx4_en_rx_desc
) +
2134 DS_SIZE
* MLX4_EN_MAX_RX_FRAGS
);
2136 for (t
= 0; t
< MLX4_EN_NUM_TX_TYPES
; t
++) {
2137 dst
->tx_ring_num
[t
] = prof
->tx_ring_num
[t
];
2138 if (!dst
->tx_ring_num
[t
])
2141 dst
->tx_ring
[t
] = kzalloc(sizeof(struct mlx4_en_tx_ring
*) *
2142 MAX_TX_RINGS
, GFP_KERNEL
);
2143 if (!dst
->tx_ring
[t
])
2146 dst
->tx_cq
[t
] = kzalloc(sizeof(struct mlx4_en_cq
*) *
2147 MAX_TX_RINGS
, GFP_KERNEL
);
2148 if (!dst
->tx_cq
[t
]) {
2149 kfree(dst
->tx_ring
[t
]);
2158 kfree(dst
->tx_ring
[t
]);
2159 kfree(dst
->tx_cq
[t
]);
2164 static void mlx4_en_update_priv(struct mlx4_en_priv
*dst
,
2165 struct mlx4_en_priv
*src
)
2168 memcpy(dst
->rx_ring
, src
->rx_ring
,
2169 sizeof(struct mlx4_en_rx_ring
*) * src
->rx_ring_num
);
2170 memcpy(dst
->rx_cq
, src
->rx_cq
,
2171 sizeof(struct mlx4_en_cq
*) * src
->rx_ring_num
);
2172 memcpy(&dst
->hwtstamp_config
, &src
->hwtstamp_config
,
2173 sizeof(dst
->hwtstamp_config
));
2174 for (t
= 0; t
< MLX4_EN_NUM_TX_TYPES
; t
++) {
2175 dst
->tx_ring_num
[t
] = src
->tx_ring_num
[t
];
2176 dst
->tx_ring
[t
] = src
->tx_ring
[t
];
2177 dst
->tx_cq
[t
] = src
->tx_cq
[t
];
2179 dst
->rx_ring_num
= src
->rx_ring_num
;
2180 memcpy(dst
->prof
, src
->prof
, sizeof(struct mlx4_en_port_profile
));
2183 int mlx4_en_try_alloc_resources(struct mlx4_en_priv
*priv
,
2184 struct mlx4_en_priv
*tmp
,
2185 struct mlx4_en_port_profile
*prof
)
2189 mlx4_en_copy_priv(tmp
, priv
, prof
);
2191 if (mlx4_en_alloc_resources(tmp
)) {
2193 "%s: Resource allocation failed, using previous configuration\n",
2195 for (t
= 0; t
< MLX4_EN_NUM_TX_TYPES
; t
++) {
2196 kfree(tmp
->tx_ring
[t
]);
2197 kfree(tmp
->tx_cq
[t
]);
2204 void mlx4_en_safe_replace_resources(struct mlx4_en_priv
*priv
,
2205 struct mlx4_en_priv
*tmp
)
2207 mlx4_en_free_resources(priv
);
2208 mlx4_en_update_priv(priv
, tmp
);
2211 void mlx4_en_destroy_netdev(struct net_device
*dev
)
2213 struct mlx4_en_priv
*priv
= netdev_priv(dev
);
2214 struct mlx4_en_dev
*mdev
= priv
->mdev
;
2217 en_dbg(DRV
, priv
, "Destroying netdev on port:%d\n", priv
->port
);
2219 /* Unregister device - this will close the port if it was up */
2220 if (priv
->registered
) {
2221 devlink_port_type_clear(mlx4_get_devlink_port(mdev
->dev
,
2223 unregister_netdev(dev
);
2226 if (priv
->allocated
)
2227 mlx4_free_hwq_res(mdev
->dev
, &priv
->res
, MLX4_EN_PAGE_SIZE
);
2229 cancel_delayed_work(&priv
->stats_task
);
2230 cancel_delayed_work(&priv
->service_task
);
2231 /* flush any pending task for this netdev */
2232 flush_workqueue(mdev
->workqueue
);
2234 if (mdev
->dev
->caps
.flags2
& MLX4_DEV_CAP_FLAG2_TS
)
2235 mlx4_en_remove_timestamp(mdev
);
2237 /* Detach the netdev so tasks would not attempt to access it */
2238 mutex_lock(&mdev
->state_lock
);
2239 mdev
->pndev
[priv
->port
] = NULL
;
2240 mdev
->upper
[priv
->port
] = NULL
;
2242 #ifdef CONFIG_RFS_ACCEL
2243 mlx4_en_cleanup_filters(priv
);
2246 mlx4_en_free_resources(priv
);
2247 mutex_unlock(&mdev
->state_lock
);
2249 for (t
= 0; t
< MLX4_EN_NUM_TX_TYPES
; t
++) {
2250 kfree(priv
->tx_ring
[t
]);
2251 kfree(priv
->tx_cq
[t
]);
2257 static bool mlx4_en_check_xdp_mtu(struct net_device
*dev
, int mtu
)
2259 struct mlx4_en_priv
*priv
= netdev_priv(dev
);
2261 if (mtu
> MLX4_EN_MAX_XDP_MTU
) {
2262 en_err(priv
, "mtu:%d > max:%d when XDP prog is attached\n",
2263 mtu
, MLX4_EN_MAX_XDP_MTU
);
2270 static int mlx4_en_change_mtu(struct net_device
*dev
, int new_mtu
)
2272 struct mlx4_en_priv
*priv
= netdev_priv(dev
);
2273 struct mlx4_en_dev
*mdev
= priv
->mdev
;
2276 en_dbg(DRV
, priv
, "Change MTU called - current:%d new:%d\n",
2279 if (priv
->tx_ring_num
[TX_XDP
] &&
2280 !mlx4_en_check_xdp_mtu(dev
, new_mtu
))
2285 if (netif_running(dev
)) {
2286 mutex_lock(&mdev
->state_lock
);
2287 if (!mdev
->device_up
) {
2288 /* NIC is probably restarting - let watchdog task reset
2290 en_dbg(DRV
, priv
, "Change MTU called with card down!?\n");
2292 mlx4_en_stop_port(dev
, 1);
2293 err
= mlx4_en_start_port(dev
);
2295 en_err(priv
, "Failed restarting port:%d\n",
2297 queue_work(mdev
->workqueue
, &priv
->watchdog_task
);
2300 mutex_unlock(&mdev
->state_lock
);
2305 static int mlx4_en_hwtstamp_set(struct net_device
*dev
, struct ifreq
*ifr
)
2307 struct mlx4_en_priv
*priv
= netdev_priv(dev
);
2308 struct mlx4_en_dev
*mdev
= priv
->mdev
;
2309 struct hwtstamp_config config
;
2311 if (copy_from_user(&config
, ifr
->ifr_data
, sizeof(config
)))
2314 /* reserved for future extensions */
2318 /* device doesn't support time stamping */
2319 if (!(mdev
->dev
->caps
.flags2
& MLX4_DEV_CAP_FLAG2_TS
))
2322 /* TX HW timestamp */
2323 switch (config
.tx_type
) {
2324 case HWTSTAMP_TX_OFF
:
2325 case HWTSTAMP_TX_ON
:
2331 /* RX HW timestamp */
2332 switch (config
.rx_filter
) {
2333 case HWTSTAMP_FILTER_NONE
:
2335 case HWTSTAMP_FILTER_ALL
:
2336 case HWTSTAMP_FILTER_SOME
:
2337 case HWTSTAMP_FILTER_PTP_V1_L4_EVENT
:
2338 case HWTSTAMP_FILTER_PTP_V1_L4_SYNC
:
2339 case HWTSTAMP_FILTER_PTP_V1_L4_DELAY_REQ
:
2340 case HWTSTAMP_FILTER_PTP_V2_L4_EVENT
:
2341 case HWTSTAMP_FILTER_PTP_V2_L4_SYNC
:
2342 case HWTSTAMP_FILTER_PTP_V2_L4_DELAY_REQ
:
2343 case HWTSTAMP_FILTER_PTP_V2_L2_EVENT
:
2344 case HWTSTAMP_FILTER_PTP_V2_L2_SYNC
:
2345 case HWTSTAMP_FILTER_PTP_V2_L2_DELAY_REQ
:
2346 case HWTSTAMP_FILTER_PTP_V2_EVENT
:
2347 case HWTSTAMP_FILTER_PTP_V2_SYNC
:
2348 case HWTSTAMP_FILTER_PTP_V2_DELAY_REQ
:
2349 config
.rx_filter
= HWTSTAMP_FILTER_ALL
;
2355 if (mlx4_en_reset_config(dev
, config
, dev
->features
)) {
2356 config
.tx_type
= HWTSTAMP_TX_OFF
;
2357 config
.rx_filter
= HWTSTAMP_FILTER_NONE
;
2360 return copy_to_user(ifr
->ifr_data
, &config
,
2361 sizeof(config
)) ? -EFAULT
: 0;
2364 static int mlx4_en_hwtstamp_get(struct net_device
*dev
, struct ifreq
*ifr
)
2366 struct mlx4_en_priv
*priv
= netdev_priv(dev
);
2368 return copy_to_user(ifr
->ifr_data
, &priv
->hwtstamp_config
,
2369 sizeof(priv
->hwtstamp_config
)) ? -EFAULT
: 0;
2372 static int mlx4_en_ioctl(struct net_device
*dev
, struct ifreq
*ifr
, int cmd
)
2376 return mlx4_en_hwtstamp_set(dev
, ifr
);
2378 return mlx4_en_hwtstamp_get(dev
, ifr
);
2384 static netdev_features_t
mlx4_en_fix_features(struct net_device
*netdev
,
2385 netdev_features_t features
)
2387 struct mlx4_en_priv
*en_priv
= netdev_priv(netdev
);
2388 struct mlx4_en_dev
*mdev
= en_priv
->mdev
;
2390 /* Since there is no support for separate RX C-TAG/S-TAG vlan accel
2391 * enable/disable make sure S-TAG flag is always in same state as
2394 if (features
& NETIF_F_HW_VLAN_CTAG_RX
&&
2395 !(mdev
->dev
->caps
.flags2
& MLX4_DEV_CAP_FLAG2_SKIP_OUTER_VLAN
))
2396 features
|= NETIF_F_HW_VLAN_STAG_RX
;
2398 features
&= ~NETIF_F_HW_VLAN_STAG_RX
;
2403 static int mlx4_en_set_features(struct net_device
*netdev
,
2404 netdev_features_t features
)
2406 struct mlx4_en_priv
*priv
= netdev_priv(netdev
);
2410 if (DEV_FEATURE_CHANGED(netdev
, features
, NETIF_F_RXFCS
)) {
2411 en_info(priv
, "Turn %s RX-FCS\n",
2412 (features
& NETIF_F_RXFCS
) ? "ON" : "OFF");
2416 if (DEV_FEATURE_CHANGED(netdev
, features
, NETIF_F_RXALL
)) {
2417 u8 ignore_fcs_value
= (features
& NETIF_F_RXALL
) ? 1 : 0;
2419 en_info(priv
, "Turn %s RX-ALL\n",
2420 ignore_fcs_value
? "ON" : "OFF");
2421 ret
= mlx4_SET_PORT_fcs_check(priv
->mdev
->dev
,
2422 priv
->port
, ignore_fcs_value
);
2427 if (DEV_FEATURE_CHANGED(netdev
, features
, NETIF_F_HW_VLAN_CTAG_RX
)) {
2428 en_info(priv
, "Turn %s RX vlan strip offload\n",
2429 (features
& NETIF_F_HW_VLAN_CTAG_RX
) ? "ON" : "OFF");
2433 if (DEV_FEATURE_CHANGED(netdev
, features
, NETIF_F_HW_VLAN_CTAG_TX
))
2434 en_info(priv
, "Turn %s TX vlan strip offload\n",
2435 (features
& NETIF_F_HW_VLAN_CTAG_TX
) ? "ON" : "OFF");
2437 if (DEV_FEATURE_CHANGED(netdev
, features
, NETIF_F_HW_VLAN_STAG_TX
))
2438 en_info(priv
, "Turn %s TX S-VLAN strip offload\n",
2439 (features
& NETIF_F_HW_VLAN_STAG_TX
) ? "ON" : "OFF");
2441 if (DEV_FEATURE_CHANGED(netdev
, features
, NETIF_F_LOOPBACK
)) {
2442 en_info(priv
, "Turn %s loopback\n",
2443 (features
& NETIF_F_LOOPBACK
) ? "ON" : "OFF");
2444 mlx4_en_update_loopback_state(netdev
, features
);
2448 ret
= mlx4_en_reset_config(netdev
, priv
->hwtstamp_config
,
2457 static int mlx4_en_set_vf_mac(struct net_device
*dev
, int queue
, u8
*mac
)
2459 struct mlx4_en_priv
*en_priv
= netdev_priv(dev
);
2460 struct mlx4_en_dev
*mdev
= en_priv
->mdev
;
2461 u64 mac_u64
= mlx4_mac_to_u64(mac
);
2463 if (is_multicast_ether_addr(mac
))
2466 return mlx4_set_vf_mac(mdev
->dev
, en_priv
->port
, queue
, mac_u64
);
2469 static int mlx4_en_set_vf_vlan(struct net_device
*dev
, int vf
, u16 vlan
, u8 qos
,
2472 struct mlx4_en_priv
*en_priv
= netdev_priv(dev
);
2473 struct mlx4_en_dev
*mdev
= en_priv
->mdev
;
2475 return mlx4_set_vf_vlan(mdev
->dev
, en_priv
->port
, vf
, vlan
, qos
,
2479 static int mlx4_en_set_vf_rate(struct net_device
*dev
, int vf
, int min_tx_rate
,
2482 struct mlx4_en_priv
*en_priv
= netdev_priv(dev
);
2483 struct mlx4_en_dev
*mdev
= en_priv
->mdev
;
2485 return mlx4_set_vf_rate(mdev
->dev
, en_priv
->port
, vf
, min_tx_rate
,
2489 static int mlx4_en_set_vf_spoofchk(struct net_device
*dev
, int vf
, bool setting
)
2491 struct mlx4_en_priv
*en_priv
= netdev_priv(dev
);
2492 struct mlx4_en_dev
*mdev
= en_priv
->mdev
;
2494 return mlx4_set_vf_spoofchk(mdev
->dev
, en_priv
->port
, vf
, setting
);
2497 static int mlx4_en_get_vf_config(struct net_device
*dev
, int vf
, struct ifla_vf_info
*ivf
)
2499 struct mlx4_en_priv
*en_priv
= netdev_priv(dev
);
2500 struct mlx4_en_dev
*mdev
= en_priv
->mdev
;
2502 return mlx4_get_vf_config(mdev
->dev
, en_priv
->port
, vf
, ivf
);
2505 static int mlx4_en_set_vf_link_state(struct net_device
*dev
, int vf
, int link_state
)
2507 struct mlx4_en_priv
*en_priv
= netdev_priv(dev
);
2508 struct mlx4_en_dev
*mdev
= en_priv
->mdev
;
2510 return mlx4_set_vf_link_state(mdev
->dev
, en_priv
->port
, vf
, link_state
);
2513 static int mlx4_en_get_vf_stats(struct net_device
*dev
, int vf
,
2514 struct ifla_vf_stats
*vf_stats
)
2516 struct mlx4_en_priv
*en_priv
= netdev_priv(dev
);
2517 struct mlx4_en_dev
*mdev
= en_priv
->mdev
;
2519 return mlx4_get_vf_stats(mdev
->dev
, en_priv
->port
, vf
, vf_stats
);
/*
 * PORT_ID_BYTE_LEN is the number of bytes of ppid->id[] that
 * mlx4_en_get_phys_port_id() fills.
 *
 * mlx4_en_get_phys_port_id() is the ndo_get_phys_port_id handler. It reads
 * caps.phys_port_id[] for this netdev's port, sets ppid->id_len to
 * sizeof(phys_port_id), and walks ppid->id[] from index
 * PORT_ID_BYTE_LEN - 1 down to 0, storing the low byte of phys_port_id.
 *
 * NOTE(review): the declaration of i, any validity check on phys_port_id,
 * the statement that advances phys_port_id between iterations, and the
 * return statements are not visible in this excerpt.
 */
2522 #define PORT_ID_BYTE_LEN 8
2523 static int mlx4_en_get_phys_port_id(struct net_device
*dev
,
2524 struct netdev_phys_item_id
*ppid
)
2526 struct mlx4_en_priv
*priv
= netdev_priv(dev
);
2527 struct mlx4_dev
*mdev
= priv
->mdev
->dev
;
2529 u64 phys_port_id
= mdev
->caps
.phys_port_id
[priv
->port
];
2534 ppid
->id_len
= sizeof(phys_port_id
);
2535 for (i
= PORT_ID_BYTE_LEN
- 1; i
>= 0; --i
) {
2536 ppid
->id
[i
] = phys_port_id
& 0xff;
/*
 * Work handler bound to priv->vxlan_add_task (see INIT_WORK in
 * mlx4_en_init_netdev()).
 *
 * Visible steps, in order:
 *  1. mlx4_config_vxlan_port() with priv->vxlan_port;
 *  2. mlx4_SET_PORT_VXLAN() with VXLAN_STEER_BY_OUTER_MAC and enable = 1;
 *     an en_err() message reports a failure of the tunnel configuration;
 *  3. checksum, TSO and UDP-tunnel GSO bits are OR-ed into
 *     priv->dev->hw_enc_features.
 *
 * NOTE(review): the declaration of ret and the conditionals/exits between
 * these steps are not visible in this excerpt.
 */
2542 static void mlx4_en_add_vxlan_offloads(struct work_struct
*work
)
2545 struct mlx4_en_priv
*priv
= container_of(work
, struct mlx4_en_priv
,
2548 ret
= mlx4_config_vxlan_port(priv
->mdev
->dev
, priv
->vxlan_port
);
2552 ret
= mlx4_SET_PORT_VXLAN(priv
->mdev
->dev
, priv
->port
,
2553 VXLAN_STEER_BY_OUTER_MAC
, 1);
2556 en_err(priv
, "failed setting L2 tunnel configuration ret %d\n", ret
);
2561 priv
->dev
->hw_enc_features
|= NETIF_F_IP_CSUM
| NETIF_F_IPV6_CSUM
|
2563 NETIF_F_TSO
| NETIF_F_TSO6
|
2564 NETIF_F_GSO_UDP_TUNNEL
|
2565 NETIF_F_GSO_UDP_TUNNEL_CSUM
|
2566 NETIF_F_GSO_PARTIAL
;
/*
 * Work handler bound to priv->vxlan_del_task (see INIT_WORK in
 * mlx4_en_init_netdev()); the reverse of mlx4_en_add_vxlan_offloads().
 *
 * Visible steps, in order:
 *  1. the checksum, TSO and UDP-tunnel GSO bits are cleared from
 *     priv->dev->hw_enc_features;
 *  2. mlx4_SET_PORT_VXLAN() is called with VXLAN_STEER_BY_OUTER_MAC and
 *     enable = 0; an en_err() message reports a failure;
 *  3. priv->vxlan_port is reset to 0.
 *
 * NOTE(review): the declaration of ret and the condition guarding the
 * en_err() call are not visible in this excerpt.
 */
2569 static void mlx4_en_del_vxlan_offloads(struct work_struct
*work
)
2572 struct mlx4_en_priv
*priv
= container_of(work
, struct mlx4_en_priv
,
2574 /* unset offloads */
2575 priv
->dev
->hw_enc_features
&= ~(NETIF_F_IP_CSUM
| NETIF_F_IPV6_CSUM
|
2577 NETIF_F_TSO
| NETIF_F_TSO6
|
2578 NETIF_F_GSO_UDP_TUNNEL
|
2579 NETIF_F_GSO_UDP_TUNNEL_CSUM
|
2580 NETIF_F_GSO_PARTIAL
);
2582 ret
= mlx4_SET_PORT_VXLAN(priv
->mdev
->dev
, priv
->port
,
2583 VXLAN_STEER_BY_OUTER_MAC
, 0);
2585 en_err(priv
, "failed setting L2 tunnel configuration ret %d\n", ret
);
2587 priv
->vxlan_port
= 0;
/*
 * ndo_udp_tunnel_add handler.
 *
 * Tests, in order: ti->type against UDP_TUNNEL_TYPE_VXLAN, ti->sa_family
 * against AF_INET, and the device's tunnel_offload_mode against
 * MLX4_TUNNEL_OFFLOAD_MODE_VXLAN. If a different non-zero port is already
 * stored in priv->vxlan_port, a warning is logged. Otherwise ti->port
 * (network byte order) is stored in priv->vxlan_port and
 * priv->vxlan_add_task is queued on the mdev workqueue.
 *
 * NOTE(review): the statements guarded by each test are not visible in
 * this excerpt -- presumably early returns; confirm against the full source.
 */
2590 static void mlx4_en_add_vxlan_port(struct net_device
*dev
,
2591 struct udp_tunnel_info
*ti
)
2593 struct mlx4_en_priv
*priv
= netdev_priv(dev
);
2594 __be16 port
= ti
->port
;
2595 __be16 current_port
;
2597 if (ti
->type
!= UDP_TUNNEL_TYPE_VXLAN
)
2600 if (ti
->sa_family
!= AF_INET
)
2603 if (priv
->mdev
->dev
->caps
.tunnel_offload_mode
!= MLX4_TUNNEL_OFFLOAD_MODE_VXLAN
)
2606 current_port
= priv
->vxlan_port
;
2607 if (current_port
&& current_port
!= port
) {
2608 en_warn(priv
, "vxlan port %d configured, can't add port %d\n",
2609 ntohs(current_port
), ntohs(port
));
2613 priv
->vxlan_port
= port
;
2614 queue_work(priv
->mdev
->workqueue
, &priv
->vxlan_add_task
);
/*
 * ndo_udp_tunnel_del handler.
 *
 * Applies the same three tests as mlx4_en_add_vxlan_port() (tunnel type,
 * address family, device tunnel offload mode). If ti->port differs from
 * the port stored in priv->vxlan_port, a debug message is logged.
 * Otherwise priv->vxlan_del_task is queued on the mdev workqueue.
 *
 * NOTE(review): the statements guarded by each test are not visible in
 * this excerpt -- presumably early returns; confirm against the full source.
 */
2617 static void mlx4_en_del_vxlan_port(struct net_device
*dev
,
2618 struct udp_tunnel_info
*ti
)
2620 struct mlx4_en_priv
*priv
= netdev_priv(dev
);
2621 __be16 port
= ti
->port
;
2622 __be16 current_port
;
2624 if (ti
->type
!= UDP_TUNNEL_TYPE_VXLAN
)
2627 if (ti
->sa_family
!= AF_INET
)
2630 if (priv
->mdev
->dev
->caps
.tunnel_offload_mode
!= MLX4_TUNNEL_OFFLOAD_MODE_VXLAN
)
2633 current_port
= priv
->vxlan_port
;
2634 if (current_port
!= port
) {
2635 en_dbg(DRV
, priv
, "vxlan port %d isn't configured, ignoring\n", ntohs(port
));
2639 queue_work(priv
->mdev
->workqueue
, &priv
->vxlan_del_task
);
/*
 * ndo_features_check handler: narrows @features for one outgoing @skb.
 *
 * @features is first filtered through vlan_features_check() and
 * vxlan_features_check(). Then, for an encapsulated skb with
 * ip_summed == CHECKSUM_PARTIAL, NETIF_F_CSUM_MASK and NETIF_F_GSO_MASK are
 * cleared when any of these holds:
 *  - no VXLAN port is configured (priv->vxlan_port == 0),
 *  - ip_hdr(skb)->version is not 4,
 *  - udp_hdr(skb)->dest differs from priv->vxlan_port.
 *
 * NOTE(review): the return statement is not visible in this excerpt;
 * presumably the filtered feature set is returned.
 */
2642 static netdev_features_t
mlx4_en_features_check(struct sk_buff
*skb
,
2643 struct net_device
*dev
,
2644 netdev_features_t features
)
2646 features
= vlan_features_check(skb
, features
);
2647 features
= vxlan_features_check(skb
, features
);
2649 /* The ConnectX-3 doesn't support outer IPv6 checksums but it does
2650 * support inner IPv6 checksums and segmentation so we need to
2651 * strip that feature if this is an IPv6 encapsulated frame.
2653 if (skb
->encapsulation
&&
2654 (skb
->ip_summed
== CHECKSUM_PARTIAL
)) {
2655 struct mlx4_en_priv
*priv
= netdev_priv(dev
);
2657 if (!priv
->vxlan_port
||
2658 (ip_hdr(skb
)->version
!= 4) ||
2659 (udp_hdr(skb
)->dest
!= priv
->vxlan_port
))
2660 features
&= ~(NETIF_F_CSUM_MASK
| NETIF_F_GSO_MASK
);
/*
 * ndo_set_tx_maxrate handler: program a rate limit on the QP of regular
 * TX ring @queue_index.
 *
 * The device must advertise MLX4_DEV_CAP_FLAG2_QP_RATE_LIMIT.
 * @maxrate is encoded into params as follows:
 *  - any bit at or above bit 12 set: unit MLX4_QP_RATE_LIMIT_GBS,
 *    value maxrate / 1000 (integer division, remainder dropped);
 *  - otherwise non-zero: unit MLX4_QP_RATE_LIMIT_MBS, value maxrate;
 *  - zero: unit 0 and value 0, which revokes the limit.
 * The result is applied with mlx4_update_qp(..., MLX4_UPDATE_QP_RATE_LIMIT, ...).
 *
 * NOTE(review): the declaration of err, the statement taken when the
 * capability is missing, the last mlx4_update_qp() argument and the return
 * are not visible in this excerpt.
 */
2666 static int mlx4_en_set_tx_maxrate(struct net_device
*dev
, int queue_index
, u32 maxrate
)
2668 struct mlx4_en_priv
*priv
= netdev_priv(dev
);
2669 struct mlx4_en_tx_ring
*tx_ring
= priv
->tx_ring
[TX
][queue_index
];
2670 struct mlx4_update_qp_params params
;
2673 if (!(priv
->mdev
->dev
->caps
.flags2
& MLX4_DEV_CAP_FLAG2_QP_RATE_LIMIT
))
2676 /* rate provided to us in Mbs, check if it fits into 12 bits, if not use Gbs */
2677 if (maxrate
>> 12) {
2678 params
.rate_unit
= MLX4_QP_RATE_LIMIT_GBS
;
2679 params
.rate_val
= maxrate
/ 1000;
2680 } else if (maxrate
) {
2681 params
.rate_unit
= MLX4_QP_RATE_LIMIT_MBS
;
2682 params
.rate_val
= maxrate
;
2683 } else { /* zero serves to revoke the QP rate-limitation */
2684 params
.rate_unit
= 0;
2685 params
.rate_val
= 0;
2688 err
= mlx4_update_qp(priv
->mdev
->dev
, tx_ring
->qpn
, MLX4_UPDATE_QP_RATE_LIMIT
,
/*
 * Attach, replace or detach the XDP program @prog on every RX ring of @dev
 * (called from mlx4_xdp() for XDP_SETUP_PROG).
 *
 * xdp_ring_num is priv->rx_ring_num when @prog is non-NULL and 0 otherwise.
 *
 * Fast path -- tx_ring_num[TX_XDP] already equals xdp_ring_num:
 *   bpf_prog_add(prog, rx_ring_num - 1) is called, then under
 *   mdev->state_lock each ring's xdp_prog pointer is replaced with
 *   rcu_assign_pointer() and the old program is dropped with
 *   bpf_prog_put().
 *
 * Slow path -- the number of XDP TX rings changes:
 *   the current MTU is checked with mlx4_en_check_xdp_mtu(), a scratch
 *   mlx4_en_priv is allocated, and bpf_prog_add() is called as above.
 *   Under mdev->state_lock a copy of the port profile receives the new XDP
 *   ring count; if regular + XDP TX rings would exceed MAX_TX_RINGS, the
 *   regular count is reduced and a warning is logged.
 *   mlx4_en_try_alloc_resources() then allocates the new resources. If the
 *   port is up it is stopped. The resources are swapped in with
 *   mlx4_en_safe_replace_resources(), the real TX queue count is updated,
 *   the program is installed on every RX ring, and mlx4_en_start_port() is
 *   called.
 *   An en_err() message and a queue_work() of priv->watchdog_task follow
 *   the restart, presumably only on failure.
 *
 * NOTE(review): local declarations, the conditions guarding the error
 * paths, the bpf_prog_sub() call and the port restart, and the returns are
 * only partly visible in this excerpt.
 */
2693 static int mlx4_xdp_set(struct net_device
*dev
, struct bpf_prog
*prog
)
2695 struct mlx4_en_priv
*priv
= netdev_priv(dev
);
2696 struct mlx4_en_dev
*mdev
= priv
->mdev
;
2697 struct mlx4_en_port_profile new_prof
;
2698 struct bpf_prog
*old_prog
;
2699 struct mlx4_en_priv
*tmp
;
2706 xdp_ring_num
= prog
? priv
->rx_ring_num
: 0;
2708 /* No need to reconfigure buffers when simply swapping the
2709 * program for a new one.
2711 if (priv
->tx_ring_num
[TX_XDP
] == xdp_ring_num
) {
2713 prog
= bpf_prog_add(prog
, priv
->rx_ring_num
- 1);
2715 return PTR_ERR(prog
);
2717 mutex_lock(&mdev
->state_lock
);
2718 for (i
= 0; i
< priv
->rx_ring_num
; i
++) {
2719 old_prog
= rcu_dereference_protected(
2720 priv
->rx_ring
[i
]->xdp_prog
,
2721 lockdep_is_held(&mdev
->state_lock
));
2722 rcu_assign_pointer(priv
->rx_ring
[i
]->xdp_prog
, prog
);
2724 bpf_prog_put(old_prog
);
2726 mutex_unlock(&mdev
->state_lock
);
2730 if (!mlx4_en_check_xdp_mtu(dev
, dev
->mtu
))
2733 tmp
= kzalloc(sizeof(*tmp
), GFP_KERNEL
);
2738 prog
= bpf_prog_add(prog
, priv
->rx_ring_num
- 1);
2740 err
= PTR_ERR(prog
);
2745 mutex_lock(&mdev
->state_lock
);
2746 memcpy(&new_prof
, priv
->prof
, sizeof(struct mlx4_en_port_profile
));
2747 new_prof
.tx_ring_num
[TX_XDP
] = xdp_ring_num
;
2749 if (priv
->tx_ring_num
[TX
] + xdp_ring_num
> MAX_TX_RINGS
) {
2751 new_prof
.tx_ring_num
[TX
] =
2752 MAX_TX_RINGS
- ALIGN(xdp_ring_num
, MLX4_EN_NUM_UP
);
2753 en_warn(priv
, "Reducing the number of TX rings, to not exceed the max total rings number.\n");
2756 err
= mlx4_en_try_alloc_resources(priv
, tmp
, &new_prof
);
2759 bpf_prog_sub(prog
, priv
->rx_ring_num
- 1);
2763 if (priv
->port_up
) {
2765 mlx4_en_stop_port(dev
, 1);
2768 mlx4_en_safe_replace_resources(priv
, tmp
);
2770 netif_set_real_num_tx_queues(dev
, priv
->tx_ring_num
[TX
]);
2772 for (i
= 0; i
< priv
->rx_ring_num
; i
++) {
2773 old_prog
= rcu_dereference_protected(
2774 priv
->rx_ring
[i
]->xdp_prog
,
2775 lockdep_is_held(&mdev
->state_lock
));
2776 rcu_assign_pointer(priv
->rx_ring
[i
]->xdp_prog
, prog
);
2778 bpf_prog_put(old_prog
);
2782 err
= mlx4_en_start_port(dev
);
2784 en_err(priv
, "Failed starting port %d for XDP change\n",
2786 queue_work(mdev
->workqueue
, &priv
->watchdog_task
);
2791 mutex_unlock(&mdev
->state_lock
);
2797 static bool mlx4_xdp_attached(struct net_device
*dev
)
2799 struct mlx4_en_priv
*priv
= netdev_priv(dev
);
2801 return !!priv
->tx_ring_num
[TX_XDP
];
/*
 * ndo_xdp entry point: dispatches on xdp->command.
 *
 *  - XDP_SETUP_PROG: returns the result of mlx4_xdp_set(dev, xdp->prog).
 *  - XDP_QUERY_PROG: stores mlx4_xdp_attached(dev) in xdp->prog_attached.
 *
 * NOTE(review): the return for XDP_QUERY_PROG and the handling of other
 * commands are not visible in this excerpt.
 */
2804 static int mlx4_xdp(struct net_device
*dev
, struct netdev_xdp
*xdp
)
2806 switch (xdp
->command
) {
2807 case XDP_SETUP_PROG
:
2808 return mlx4_xdp_set(dev
, xdp
->prog
);
2809 case XDP_QUERY_PROG
:
2810 xdp
->prog_attached
= mlx4_xdp_attached(dev
);
/*
 * net_device_ops table that mlx4_en_init_netdev() installs when
 * mlx4_is_master() is false for the device.
 *
 * Unlike mlx4_netdev_ops_master it has no ndo_*_vf_* callbacks, and it is
 * the only one of the two tables that sets ndo_do_ioctl.
 * The poll-controller and RFS entries are compiled in only under
 * CONFIG_NET_POLL_CONTROLLER and CONFIG_RFS_ACCEL respectively.
 */
2817 static const struct net_device_ops mlx4_netdev_ops
= {
2818 .ndo_open
= mlx4_en_open
,
2819 .ndo_stop
= mlx4_en_close
,
2820 .ndo_start_xmit
= mlx4_en_xmit
,
2821 .ndo_select_queue
= mlx4_en_select_queue
,
2822 .ndo_get_stats64
= mlx4_en_get_stats64
,
2823 .ndo_set_rx_mode
= mlx4_en_set_rx_mode
,
2824 .ndo_set_mac_address
= mlx4_en_set_mac
,
2825 .ndo_validate_addr
= eth_validate_addr
,
2826 .ndo_change_mtu
= mlx4_en_change_mtu
,
2827 .ndo_do_ioctl
= mlx4_en_ioctl
,
2828 .ndo_tx_timeout
= mlx4_en_tx_timeout
,
2829 .ndo_vlan_rx_add_vid
= mlx4_en_vlan_rx_add_vid
,
2830 .ndo_vlan_rx_kill_vid
= mlx4_en_vlan_rx_kill_vid
,
2831 #ifdef CONFIG_NET_POLL_CONTROLLER
2832 .ndo_poll_controller
= mlx4_en_netpoll
,
2834 .ndo_set_features
= mlx4_en_set_features
,
2835 .ndo_fix_features
= mlx4_en_fix_features
,
2836 .ndo_setup_tc
= __mlx4_en_setup_tc
,
2837 #ifdef CONFIG_RFS_ACCEL
2838 .ndo_rx_flow_steer
= mlx4_en_filter_rfs
,
2840 .ndo_get_phys_port_id
= mlx4_en_get_phys_port_id
,
2841 .ndo_udp_tunnel_add
= mlx4_en_add_vxlan_port
,
2842 .ndo_udp_tunnel_del
= mlx4_en_del_vxlan_port
,
2843 .ndo_features_check
= mlx4_en_features_check
,
2844 .ndo_set_tx_maxrate
= mlx4_en_set_tx_maxrate
,
2845 .ndo_xdp
= mlx4_xdp
,
/*
 * net_device_ops table that mlx4_en_init_netdev() installs when
 * mlx4_is_master() is true for the device.
 *
 * It carries the VF management callbacks (ndo_set_vf_mac, ndo_set_vf_vlan,
 * ndo_set_vf_rate, ndo_set_vf_spoofchk, ndo_set_vf_link_state,
 * ndo_get_vf_stats, ndo_get_vf_config) that mlx4_netdev_ops lacks.
 * No ndo_do_ioctl entry is set here.
 * The poll-controller and RFS entries are compiled in only under
 * CONFIG_NET_POLL_CONTROLLER and CONFIG_RFS_ACCEL respectively.
 */
2848 static const struct net_device_ops mlx4_netdev_ops_master
= {
2849 .ndo_open
= mlx4_en_open
,
2850 .ndo_stop
= mlx4_en_close
,
2851 .ndo_start_xmit
= mlx4_en_xmit
,
2852 .ndo_select_queue
= mlx4_en_select_queue
,
2853 .ndo_get_stats64
= mlx4_en_get_stats64
,
2854 .ndo_set_rx_mode
= mlx4_en_set_rx_mode
,
2855 .ndo_set_mac_address
= mlx4_en_set_mac
,
2856 .ndo_validate_addr
= eth_validate_addr
,
2857 .ndo_change_mtu
= mlx4_en_change_mtu
,
2858 .ndo_tx_timeout
= mlx4_en_tx_timeout
,
2859 .ndo_vlan_rx_add_vid
= mlx4_en_vlan_rx_add_vid
,
2860 .ndo_vlan_rx_kill_vid
= mlx4_en_vlan_rx_kill_vid
,
2861 .ndo_set_vf_mac
= mlx4_en_set_vf_mac
,
2862 .ndo_set_vf_vlan
= mlx4_en_set_vf_vlan
,
2863 .ndo_set_vf_rate
= mlx4_en_set_vf_rate
,
2864 .ndo_set_vf_spoofchk
= mlx4_en_set_vf_spoofchk
,
2865 .ndo_set_vf_link_state
= mlx4_en_set_vf_link_state
,
2866 .ndo_get_vf_stats
= mlx4_en_get_vf_stats
,
2867 .ndo_get_vf_config
= mlx4_en_get_vf_config
,
2868 #ifdef CONFIG_NET_POLL_CONTROLLER
2869 .ndo_poll_controller
= mlx4_en_netpoll
,
2871 .ndo_set_features
= mlx4_en_set_features
,
2872 .ndo_fix_features
= mlx4_en_fix_features
,
2873 .ndo_setup_tc
= __mlx4_en_setup_tc
,
2874 #ifdef CONFIG_RFS_ACCEL
2875 .ndo_rx_flow_steer
= mlx4_en_filter_rfs
,
2877 .ndo_get_phys_port_id
= mlx4_en_get_phys_port_id
,
2878 .ndo_udp_tunnel_add
= mlx4_en_add_vxlan_port
,
2879 .ndo_udp_tunnel_del
= mlx4_en_del_vxlan_port
,
2880 .ndo_features_check
= mlx4_en_features_check
,
2881 .ndo_set_tx_maxrate
= mlx4_en_set_tx_maxrate
,
2882 .ndo_xdp
= mlx4_xdp
,
/*
 * One deferred bonding request, allocated by mlx4_en_queue_bond_work() and
 * processed by mlx4_en_bond_work().
 *
 *  work     - work item queued on the mdev workqueue
 *  priv     - netdev private data the request belongs to
 *  port_map - virtual-to-physical port mapping to apply
 *
 * NOTE(review): both functions also use an is_bonded member whose
 * declaration is not visible in this excerpt.
 */
2885 struct mlx4_en_bond
{
2886 struct work_struct work
;
2887 struct mlx4_en_priv
*priv
;
2889 struct mlx4_port_map port_map
;
/*
 * Work handler for a struct mlx4_en_bond request.
 *
 * When bond->is_bonded is set: mlx4_bond() is called if the device is not
 * yet bonded, and the requested port map is applied with
 * mlx4_port_map_set().
 * When it is clear and the device is currently bonded: mlx4_unbond() is
 * called.
 * en_err() messages report failures of these calls.
 * dev_put() then drops the netdev reference taken by
 * mlx4_en_queue_bond_work().
 *
 * NOTE(review): the declaration of err, the conditions around the error
 * messages and the release of @bond are not visible in this excerpt.
 */
2892 static void mlx4_en_bond_work(struct work_struct
*work
)
2894 struct mlx4_en_bond
*bond
= container_of(work
,
2895 struct mlx4_en_bond
,
2898 struct mlx4_dev
*dev
= bond
->priv
->mdev
->dev
;
2900 if (bond
->is_bonded
) {
2901 if (!mlx4_is_bonded(dev
)) {
2902 err
= mlx4_bond(dev
);
2904 en_err(bond
->priv
, "Fail to bond device\n");
2907 err
= mlx4_port_map_set(dev
, &bond
->port_map
);
2909 en_err(bond
->priv
, "Fail to set port map [%d][%d]: %d\n",
2910 bond
->port_map
.port1
,
2911 bond
->port_map
.port2
,
2914 } else if (mlx4_is_bonded(dev
)) {
2915 err
= mlx4_unbond(dev
);
2917 en_err(bond
->priv
, "Fail to unbond device\n");
2919 dev_put(bond
->priv
->dev
);
/*
 * Package a bonding request and defer it to the mdev workqueue.
 *
 * A struct mlx4_en_bond is allocated with GFP_ATOMIC and filled with
 * @is_bonded and the virtual-to-physical mapping (@v2p_p1, @v2p_p2).
 * dev_hold() takes a reference on the netdev; the matching dev_put() is in
 * mlx4_en_bond_work(). The work item is then queued.
 *
 * NOTE(review): the allocation-failure path, the assignment of
 * bond->priv and the return value are not visible in this excerpt.
 */
2923 static int mlx4_en_queue_bond_work(struct mlx4_en_priv
*priv
, int is_bonded
,
2924 u8 v2p_p1
, u8 v2p_p2
)
2926 struct mlx4_en_bond
*bond
= NULL
;
2928 bond
= kzalloc(sizeof(*bond
), GFP_ATOMIC
);
2932 INIT_WORK(&bond
->work
, mlx4_en_bond_work
);
2934 bond
->is_bonded
= is_bonded
;
2935 bond
->port_map
.port1
= v2p_p1
;
2936 bond
->port_map
.port2
= v2p_p2
;
2937 dev_hold(priv
->dev
);
2938 queue_work(priv
->mdev
->workqueue
, &bond
->work
);
/*
 * Netdevice notifier callback for an mlx4_en_dev (recovered from @this via
 * its nb member).
 *
 * Events for devices outside init_net are filtered first. The function
 * then walks the Ethernet ports of the device, refreshes mdev->upper[]
 * with each port netdev's master upper device, and decides whether bonding
 * should be active (do_bond). Bonding requires that the port netdevs are
 * slaves, that they share the same master, and that there are exactly two
 * Ethernet ports.
 *
 * Only events carrying enough information are processed further
 * (NETDEV_BONDING_INFO when do_bond is set, and a matched port).
 * From the bonding info the function requires mode active-backup, XOR or
 * 802.3ad and exactly two slaves. It derives the virtual-to-physical port
 * mapping from the slave state (active-backup) or link state
 * (active-active) and queues the request with mlx4_en_queue_bond_work().
 *
 * NOTE(review): many statements (the port/v2p_port declarations and
 * assignments, the early exits, the return values) are not visible in this
 * excerpt.
 * NOTE(review): the token "¬ifier_info" below looks like a mis-encoded
 * address-of expression on notifier_info -- confirm against the pristine
 * source.
 */
2942 int mlx4_en_netdev_event(struct notifier_block
*this,
2943 unsigned long event
, void *ptr
)
2945 struct net_device
*ndev
= netdev_notifier_info_to_dev(ptr
);
2947 struct mlx4_en_dev
*mdev
;
2948 struct mlx4_dev
*dev
;
2949 int i
, num_eth_ports
= 0;
2950 bool do_bond
= true;
2951 struct mlx4_en_priv
*priv
;
2955 if (!net_eq(dev_net(ndev
), &init_net
))
2958 mdev
= container_of(this, struct mlx4_en_dev
, nb
);
2961 /* Go into this mode only when two network devices set on two ports
2962 * of the same mlx4 device are slaves of the same bonding master
2964 mlx4_foreach_port(i
, dev
, MLX4_PORT_TYPE_ETH
) {
2966 if (!port
&& (mdev
->pndev
[i
] == ndev
))
2968 mdev
->upper
[i
] = mdev
->pndev
[i
] ?
2969 netdev_master_upper_dev_get(mdev
->pndev
[i
]) : NULL
;
2970 /* condition not met: network device is a slave */
2971 if (!mdev
->upper
[i
])
2973 if (num_eth_ports
< 2)
2975 /* condition not met: same master */
2976 if (mdev
->upper
[i
] != mdev
->upper
[i
-1])
2979 /* condition not met: 2 slaves */
2980 do_bond
= (num_eth_ports
== 2) ? do_bond
: false;
2982 /* handle only events that come with enough info */
2983 if ((do_bond
&& (event
!= NETDEV_BONDING_INFO
)) || !port
)
2986 priv
= netdev_priv(ndev
);
2988 struct netdev_notifier_bonding_info
*notifier_info
= ptr
;
2989 struct netdev_bonding_info
*bonding_info
=
2990 ¬ifier_info
->bonding_info
;
2992 /* required mode 1, 2 or 4 */
2993 if ((bonding_info
->master
.bond_mode
!= BOND_MODE_ACTIVEBACKUP
) &&
2994 (bonding_info
->master
.bond_mode
!= BOND_MODE_XOR
) &&
2995 (bonding_info
->master
.bond_mode
!= BOND_MODE_8023AD
))
2998 /* require exactly 2 slaves */
2999 if (bonding_info
->master
.num_slaves
!= 2)
3004 if (bonding_info
->master
.bond_mode
==
3005 BOND_MODE_ACTIVEBACKUP
) {
3006 /* in active-backup mode virtual ports are
3007 * mapped to the physical port of the active
3009 if (bonding_info
->slave
.state
==
3010 BOND_STATE_BACKUP
) {
3018 } else { /* BOND_STATE_ACTIVE */
3027 } else { /* Active-Active */
3028 /* in active-active mode a virtual port is
3029 * mapped to the native physical port if and only
3030 * if the physical port is up */
3031 __s8 link
= bonding_info
->slave
.link
;
3037 if ((link
== BOND_LINK_UP
) ||
3038 (link
== BOND_LINK_FAIL
)) {
3043 } else { /* BOND_LINK_DOWN || BOND_LINK_BACK */
3053 mlx4_en_queue_bond_work(priv
, do_bond
,
3054 v2p_port1
, v2p_port2
);
/*
 * Recompute the flow-control section of @stats_bitmap from the current
 * pause (@rx_pause, @tx_pause) and per-priority pause (@rx_ppp, @tx_ppp)
 * settings.
 *
 * Nothing is done on slave functions or when the device lacks
 * MLX4_DEV_CAP_FLAG2_FLOWSTATS_EN. Otherwise, under stats_bitmap->mutex,
 * the NUM_FLOW_STATS bits starting at offset
 * NUM_MAIN_STATS + NUM_PORT_STATS + NUM_PF_STATS are cleared. The RX
 * per-priority, RX global, TX per-priority and TX global groups are then
 * set in that order, with last_i advanced past each group.
 * The global-pause groups are set only when pause is enabled and
 * per-priority pause is not.
 *
 * NOTE(review): the conditions guarding the per-priority groups and the
 * bit counts of the global groups are not visible in this excerpt.
 */
3059 void mlx4_en_update_pfc_stats_bitmap(struct mlx4_dev
*dev
,
3060 struct mlx4_en_stats_bitmap
*stats_bitmap
,
3061 u8 rx_ppp
, u8 rx_pause
,
3062 u8 tx_ppp
, u8 tx_pause
)
3064 int last_i
= NUM_MAIN_STATS
+ NUM_PORT_STATS
+ NUM_PF_STATS
;
3066 if (!mlx4_is_slave(dev
) &&
3067 (dev
->caps
.flags2
& MLX4_DEV_CAP_FLAG2_FLOWSTATS_EN
)) {
3068 mutex_lock(&stats_bitmap
->mutex
);
3069 bitmap_clear(stats_bitmap
->bitmap
, last_i
, NUM_FLOW_STATS
);
3072 bitmap_set(stats_bitmap
->bitmap
, last_i
,
3073 NUM_FLOW_PRIORITY_STATS_RX
);
3074 last_i
+= NUM_FLOW_PRIORITY_STATS_RX
;
3076 if (rx_pause
&& !(rx_ppp
))
3077 bitmap_set(stats_bitmap
->bitmap
, last_i
,
3079 last_i
+= NUM_FLOW_STATS_RX
;
3082 bitmap_set(stats_bitmap
->bitmap
, last_i
,
3083 NUM_FLOW_PRIORITY_STATS_TX
);
3084 last_i
+= NUM_FLOW_PRIORITY_STATS_TX
;
3086 if (tx_pause
&& !(tx_ppp
))
3087 bitmap_set(stats_bitmap
->bitmap
, last_i
,
3089 last_i
+= NUM_FLOW_STATS_TX
;
3091 mutex_unlock(&stats_bitmap
->mutex
);
/*
 * Initialise @stats_bitmap: set up its mutex, zero all NUM_ALL_STATS bits
 * and then enable the statistic groups that apply to this function.
 *
 * Groups are laid out consecutively and last_i tracks the running offset:
 *  - main stats: on a slave only rx/tx packets, bytes and dropped are
 *    enabled; the whole NUM_MAIN_STATS range is also set (presumably in the
 *    non-slave branch -- the else line is not visible);
 *  - port stats: NUM_PORT_STATS bits are set;
 *  - PF stats: set only when mlx4_is_master();
 *  - flow-control stats: delegated to mlx4_en_update_pfc_stats_bitmap();
 *  - packet stats: set unless the function is a slave;
 *  - XDP stats: NUM_XDP_STATS bits are set.
 *
 * NOTE(review): the declaration/initial value of last_i and a few
 * conditionals are not visible in this excerpt.
 */
3095 void mlx4_en_set_stats_bitmap(struct mlx4_dev
*dev
,
3096 struct mlx4_en_stats_bitmap
*stats_bitmap
,
3097 u8 rx_ppp
, u8 rx_pause
,
3098 u8 tx_ppp
, u8 tx_pause
)
3102 mutex_init(&stats_bitmap
->mutex
);
3103 bitmap_zero(stats_bitmap
->bitmap
, NUM_ALL_STATS
);
3105 if (mlx4_is_slave(dev
)) {
3106 bitmap_set(stats_bitmap
->bitmap
, last_i
+
3107 MLX4_FIND_NETDEV_STAT(rx_packets
), 1);
3108 bitmap_set(stats_bitmap
->bitmap
, last_i
+
3109 MLX4_FIND_NETDEV_STAT(tx_packets
), 1);
3110 bitmap_set(stats_bitmap
->bitmap
, last_i
+
3111 MLX4_FIND_NETDEV_STAT(rx_bytes
), 1);
3112 bitmap_set(stats_bitmap
->bitmap
, last_i
+
3113 MLX4_FIND_NETDEV_STAT(tx_bytes
), 1);
3114 bitmap_set(stats_bitmap
->bitmap
, last_i
+
3115 MLX4_FIND_NETDEV_STAT(rx_dropped
), 1);
3116 bitmap_set(stats_bitmap
->bitmap
, last_i
+
3117 MLX4_FIND_NETDEV_STAT(tx_dropped
), 1);
3119 bitmap_set(stats_bitmap
->bitmap
, last_i
, NUM_MAIN_STATS
);
3121 last_i
+= NUM_MAIN_STATS
;
3123 bitmap_set(stats_bitmap
->bitmap
, last_i
, NUM_PORT_STATS
);
3124 last_i
+= NUM_PORT_STATS
;
3126 if (mlx4_is_master(dev
))
3127 bitmap_set(stats_bitmap
->bitmap
, last_i
,
3129 last_i
+= NUM_PF_STATS
;
3131 mlx4_en_update_pfc_stats_bitmap(dev
, stats_bitmap
,
3134 last_i
+= NUM_FLOW_STATS
;
3136 if (!mlx4_is_slave(dev
))
3137 bitmap_set(stats_bitmap
->bitmap
, last_i
, NUM_PKT_STATS
);
3138 last_i
+= NUM_PKT_STATS
;
3140 bitmap_set(stats_bitmap
->bitmap
, last_i
, NUM_XDP_STATS
);
3141 last_i
+= NUM_XDP_STATS
;
/*
 * Allocate, configure and register the Ethernet net_device for @port of
 * @mdev, using the ring counts and flow-control settings in @prof.
 *
 * Visible steps, in order:
 *  - alloc_etherdev_mqs() sized for MAX_TX_RINGS / MAX_RX_RINGS; the real
 *    queue counts are then set from @prof;
 *  - the private area is zeroed and its locks, work items (rx_mode,
 *    watchdog, linkstate, stats, service, vxlan add/del) and defaults
 *    (flags, pflags, ctrl_flags, tx_work_limit, rss_key) are initialised;
 *  - for each TX type with a non-zero ring count, arrays of MAX_TX_RINGS
 *    ring pointers and CQ pointers are allocated;
 *  - under CONFIG_MLX4_EN_DCB, on non-slave functions, DCBX capabilities
 *    are set and either the full or the PFC-only dcbnl ops are chosen from
 *    MLX4_DEV_CAP_FLAG2_ETS_CFG;
 *  - max MTU and the default MAC come from the device caps; an invalid MAC
 *    is reported with en_err(); a slave with a randomly assigned MAC is
 *    marked NET_ADDR_RANDOM;
 *  - ring resources (mlx4_en_alloc_resources) and the RX QP page
 *    (mlx4_alloc_hwq_res) are allocated;
 *  - netdev_ops (master or regular table), ethtool_ops, features,
 *    hw_features, vlan_features and the RSS hash function are derived from
 *    the device capabilities;
 *  - the port is configured (mlx4_SET_PORT_general, optionally
 *    mlx4_SET_PORT_VXLAN, mlx4_INIT_PORT), the stats and service delayed
 *    works are queued, timestamping is initialised when supported, the
 *    stats bitmap is built, and register_netdev() is called;
 *  - the tail frees the per-type tx_ring/tx_cq arrays and calls
 *    mlx4_en_destroy_netdev(), presumably as the error unwind path.
 *
 * NOTE(review): local declarations, several assignments (e.g. priv->dev,
 * priv->mdev, priv->port), the error checks and the return statements are
 * not visible in this excerpt, so return values are not documented here.
 */
3144 int mlx4_en_init_netdev(struct mlx4_en_dev
*mdev
, int port
,
3145 struct mlx4_en_port_profile
*prof
)
3147 struct net_device
*dev
;
3148 struct mlx4_en_priv
*priv
;
3152 dev
= alloc_etherdev_mqs(sizeof(struct mlx4_en_priv
),
3153 MAX_TX_RINGS
, MAX_RX_RINGS
);
3157 netif_set_real_num_tx_queues(dev
, prof
->tx_ring_num
[TX
]);
3158 netif_set_real_num_rx_queues(dev
, prof
->rx_ring_num
);
3160 SET_NETDEV_DEV(dev
, &mdev
->dev
->persist
->pdev
->dev
);
3161 dev
->dev_port
= port
- 1;
3164 * Initialize driver private data
3167 priv
= netdev_priv(dev
);
3168 memset(priv
, 0, sizeof(struct mlx4_en_priv
));
3169 priv
->counter_index
= MLX4_SINK_COUNTER_INDEX(mdev
->dev
);
3170 spin_lock_init(&priv
->stats_lock
);
3171 INIT_WORK(&priv
->rx_mode_task
, mlx4_en_do_set_rx_mode
);
3172 INIT_WORK(&priv
->watchdog_task
, mlx4_en_restart
);
3173 INIT_WORK(&priv
->linkstate_task
, mlx4_en_linkstate
);
3174 INIT_DELAYED_WORK(&priv
->stats_task
, mlx4_en_do_get_stats
);
3175 INIT_DELAYED_WORK(&priv
->service_task
, mlx4_en_service_task
);
3176 INIT_WORK(&priv
->vxlan_add_task
, mlx4_en_add_vxlan_offloads
);
3177 INIT_WORK(&priv
->vxlan_del_task
, mlx4_en_del_vxlan_offloads
);
3178 #ifdef CONFIG_RFS_ACCEL
3179 INIT_LIST_HEAD(&priv
->filters
);
3180 spin_lock_init(&priv
->filters_lock
);
3185 priv
->ddev
= &mdev
->pdev
->dev
;
3188 priv
->port_up
= false;
3189 priv
->flags
= prof
->flags
;
3190 priv
->pflags
= MLX4_EN_PRIV_FLAGS_BLUEFLAME
;
3191 priv
->ctrl_flags
= cpu_to_be32(MLX4_WQE_CTRL_CQ_UPDATE
|
3192 MLX4_WQE_CTRL_SOLICITED
);
3193 priv
->num_tx_rings_p_up
= mdev
->profile
.num_tx_rings_p_up
;
3194 priv
->tx_work_limit
= MLX4_EN_DEFAULT_TX_WORK
;
3195 netdev_rss_key_fill(priv
->rss_key
, sizeof(priv
->rss_key
));
3197 for (t
= 0; t
< MLX4_EN_NUM_TX_TYPES
; t
++) {
3198 priv
->tx_ring_num
[t
] = prof
->tx_ring_num
[t
];
3199 if (!priv
->tx_ring_num
[t
])
3202 priv
->tx_ring
[t
] = kzalloc(sizeof(struct mlx4_en_tx_ring
*) *
3203 MAX_TX_RINGS
, GFP_KERNEL
);
3204 if (!priv
->tx_ring
[t
]) {
3208 priv
->tx_cq
[t
] = kzalloc(sizeof(struct mlx4_en_cq
*) *
3209 MAX_TX_RINGS
, GFP_KERNEL
);
3210 if (!priv
->tx_cq
[t
]) {
3211 kfree(priv
->tx_ring
[t
]);
3216 priv
->rx_ring_num
= prof
->rx_ring_num
;
3217 priv
->cqe_factor
= (mdev
->dev
->caps
.cqe_size
== 64) ? 1 : 0;
3218 priv
->cqe_size
= mdev
->dev
->caps
.cqe_size
;
3219 priv
->mac_index
= -1;
3220 priv
->msg_enable
= MLX4_EN_MSG_LEVEL
;
3221 #ifdef CONFIG_MLX4_EN_DCB
3222 if (!mlx4_is_slave(priv
->mdev
->dev
)) {
3223 priv
->dcbx_cap
= DCB_CAP_DCBX_VER_CEE
| DCB_CAP_DCBX_HOST
|
3224 DCB_CAP_DCBX_VER_IEEE
;
3225 priv
->flags
|= MLX4_EN_DCB_ENABLED
;
3226 priv
->cee_config
.pfc_state
= false;
3228 for (i
= 0; i
< MLX4_EN_NUM_UP
; i
++)
3229 priv
->cee_config
.dcb_pfc
[i
] = pfc_disabled
;
3231 if (mdev
->dev
->caps
.flags2
& MLX4_DEV_CAP_FLAG2_ETS_CFG
) {
3232 dev
->dcbnl_ops
= &mlx4_en_dcbnl_ops
;
3234 en_info(priv
, "enabling only PFC DCB ops\n");
3235 dev
->dcbnl_ops
= &mlx4_en_dcbnl_pfc_ops
;
3240 for (i
= 0; i
< MLX4_EN_MAC_HASH_SIZE
; ++i
)
3241 INIT_HLIST_HEAD(&priv
->mac_hash
[i
]);
3243 /* Query for default mac and max mtu */
3244 priv
->max_mtu
= mdev
->dev
->caps
.eth_mtu_cap
[priv
->port
];
3246 if (mdev
->dev
->caps
.rx_checksum_flags_port
[priv
->port
] &
3247 MLX4_RX_CSUM_MODE_VAL_NON_TCP_UDP
)
3248 priv
->flags
|= MLX4_EN_FLAG_RX_CSUM_NON_TCP_UDP
;
3250 /* Set default MAC */
3251 dev
->addr_len
= ETH_ALEN
;
3252 mlx4_en_u64_to_mac(dev
->dev_addr
, mdev
->dev
->caps
.def_mac
[priv
->port
]);
3253 if (!is_valid_ether_addr(dev
->dev_addr
)) {
3254 en_err(priv
, "Port: %d, invalid mac burned: %pM, quiting\n",
3255 priv
->port
, dev
->dev_addr
);
3258 } else if (mlx4_is_slave(priv
->mdev
->dev
) &&
3259 (priv
->mdev
->dev
->port_random_macs
& 1 << priv
->port
)) {
3260 /* Random MAC was assigned in mlx4_slave_cap
3261 * in mlx4_core module
3263 dev
->addr_assign_type
|= NET_ADDR_RANDOM
;
3264 en_warn(priv
, "Assigned random MAC address %pM\n", dev
->dev_addr
);
3267 memcpy(priv
->current_mac
, dev
->dev_addr
, sizeof(priv
->current_mac
));
3269 priv
->stride
= roundup_pow_of_two(sizeof(struct mlx4_en_rx_desc
) +
3270 DS_SIZE
* MLX4_EN_MAX_RX_FRAGS
);
3271 err
= mlx4_en_alloc_resources(priv
);
3275 /* Initialize time stamping config */
3276 priv
->hwtstamp_config
.flags
= 0;
3277 priv
->hwtstamp_config
.tx_type
= HWTSTAMP_TX_OFF
;
3278 priv
->hwtstamp_config
.rx_filter
= HWTSTAMP_FILTER_NONE
;
3280 /* Allocate page for receive rings */
3281 err
= mlx4_alloc_hwq_res(mdev
->dev
, &priv
->res
,
3284 en_err(priv
, "Failed to allocate page for rx qps\n");
3287 priv
->allocated
= 1;
3290 * Initialize netdev entry points
3292 if (mlx4_is_master(priv
->mdev
->dev
))
3293 dev
->netdev_ops
= &mlx4_netdev_ops_master
;
3295 dev
->netdev_ops
= &mlx4_netdev_ops
;
3296 dev
->watchdog_timeo
= MLX4_EN_WATCHDOG_TIMEOUT
;
3297 netif_set_real_num_tx_queues(dev
, priv
->tx_ring_num
[TX
]);
3298 netif_set_real_num_rx_queues(dev
, priv
->rx_ring_num
);
3300 dev
->ethtool_ops
= &mlx4_en_ethtool_ops
;
3303 * Set driver features
3305 dev
->hw_features
= NETIF_F_SG
| NETIF_F_IP_CSUM
| NETIF_F_IPV6_CSUM
;
3306 if (mdev
->LSO_support
)
3307 dev
->hw_features
|= NETIF_F_TSO
| NETIF_F_TSO6
;
3309 dev
->vlan_features
= dev
->hw_features
;
3311 dev
->hw_features
|= NETIF_F_RXCSUM
| NETIF_F_RXHASH
;
3312 dev
->features
= dev
->hw_features
| NETIF_F_HIGHDMA
|
3313 NETIF_F_HW_VLAN_CTAG_TX
| NETIF_F_HW_VLAN_CTAG_RX
|
3314 NETIF_F_HW_VLAN_CTAG_FILTER
;
3315 dev
->hw_features
|= NETIF_F_LOOPBACK
|
3316 NETIF_F_HW_VLAN_CTAG_TX
| NETIF_F_HW_VLAN_CTAG_RX
;
3318 if (!(mdev
->dev
->caps
.flags2
& MLX4_DEV_CAP_FLAG2_SKIP_OUTER_VLAN
)) {
3319 dev
->features
|= NETIF_F_HW_VLAN_STAG_RX
|
3320 NETIF_F_HW_VLAN_STAG_FILTER
;
3321 dev
->hw_features
|= NETIF_F_HW_VLAN_STAG_RX
;
3324 if (mlx4_is_slave(mdev
->dev
)) {
3325 bool vlan_offload_disabled
;
3328 err
= get_phv_bit(mdev
->dev
, port
, &phv
);
3330 dev
->hw_features
|= NETIF_F_HW_VLAN_STAG_TX
;
3331 priv
->pflags
|= MLX4_EN_PRIV_FLAGS_PHV
;
3333 err
= mlx4_get_is_vlan_offload_disabled(mdev
->dev
, port
,
3334 &vlan_offload_disabled
);
3335 if (!err
&& vlan_offload_disabled
) {
3336 dev
->hw_features
&= ~(NETIF_F_HW_VLAN_CTAG_TX
|
3337 NETIF_F_HW_VLAN_CTAG_RX
|
3338 NETIF_F_HW_VLAN_STAG_TX
|
3339 NETIF_F_HW_VLAN_STAG_RX
);
3340 dev
->features
&= ~(NETIF_F_HW_VLAN_CTAG_TX
|
3341 NETIF_F_HW_VLAN_CTAG_RX
|
3342 NETIF_F_HW_VLAN_STAG_TX
|
3343 NETIF_F_HW_VLAN_STAG_RX
);
3346 if (mdev
->dev
->caps
.flags2
& MLX4_DEV_CAP_FLAG2_PHV_EN
&&
3347 !(mdev
->dev
->caps
.flags2
&
3348 MLX4_DEV_CAP_FLAG2_SKIP_OUTER_VLAN
))
3349 dev
->hw_features
|= NETIF_F_HW_VLAN_STAG_TX
;
3352 if (mdev
->dev
->caps
.flags
& MLX4_DEV_CAP_FLAG_FCS_KEEP
)
3353 dev
->hw_features
|= NETIF_F_RXFCS
;
3355 if (mdev
->dev
->caps
.flags2
& MLX4_DEV_CAP_FLAG2_IGNORE_FCS
)
3356 dev
->hw_features
|= NETIF_F_RXALL
;
3358 if (mdev
->dev
->caps
.steering_mode
==
3359 MLX4_STEERING_MODE_DEVICE_MANAGED
&&
3360 mdev
->dev
->caps
.dmfs_high_steer_mode
!= MLX4_STEERING_DMFS_A0_STATIC
)
3361 dev
->hw_features
|= NETIF_F_NTUPLE
;
3363 if (mdev
->dev
->caps
.steering_mode
!= MLX4_STEERING_MODE_A0
)
3364 dev
->priv_flags
|= IFF_UNICAST_FLT
;
3366 /* Setting a default hash function value */
3367 if (mdev
->dev
->caps
.flags2
& MLX4_DEV_CAP_FLAG2_RSS_TOP
) {
3368 priv
->rss_hash_fn
= ETH_RSS_HASH_TOP
;
3369 } else if (mdev
->dev
->caps
.flags2
& MLX4_DEV_CAP_FLAG2_RSS_XOR
) {
3370 priv
->rss_hash_fn
= ETH_RSS_HASH_XOR
;
3373 "No RSS hash capabilities exposed, using Toeplitz\n");
3374 priv
->rss_hash_fn
= ETH_RSS_HASH_TOP
;
3377 if (mdev
->dev
->caps
.tunnel_offload_mode
== MLX4_TUNNEL_OFFLOAD_MODE_VXLAN
) {
3378 dev
->hw_features
|= NETIF_F_GSO_UDP_TUNNEL
|
3379 NETIF_F_GSO_UDP_TUNNEL_CSUM
|
3380 NETIF_F_GSO_PARTIAL
;
3381 dev
->features
|= NETIF_F_GSO_UDP_TUNNEL
|
3382 NETIF_F_GSO_UDP_TUNNEL_CSUM
|
3383 NETIF_F_GSO_PARTIAL
;
3384 dev
->gso_partial_features
= NETIF_F_GSO_UDP_TUNNEL_CSUM
;
3387 /* MTU range: 46 - hw-specific max */
3388 dev
->min_mtu
= MLX4_EN_MIN_MTU
;
3389 dev
->max_mtu
= priv
->max_mtu
;
3391 mdev
->pndev
[port
] = dev
;
3392 mdev
->upper
[port
] = NULL
;
3394 netif_carrier_off(dev
);
3395 mlx4_en_set_default_moderation(priv
);
3397 en_warn(priv
, "Using %d TX rings\n", prof
->tx_ring_num
[TX
]);
3398 en_warn(priv
, "Using %d RX rings\n", prof
->rx_ring_num
);
3400 mlx4_en_update_loopback_state(priv
->dev
, priv
->dev
->features
);
3402 /* Configure port */
3403 mlx4_en_calc_rx_buf(dev
);
3404 err
= mlx4_SET_PORT_general(mdev
->dev
, priv
->port
,
3405 priv
->rx_skb_size
+ ETH_FCS_LEN
,
3406 prof
->tx_pause
, prof
->tx_ppp
,
3407 prof
->rx_pause
, prof
->rx_ppp
);
3409 en_err(priv
, "Failed setting port general configurations for port %d, with error %d\n",
3414 if (mdev
->dev
->caps
.tunnel_offload_mode
== MLX4_TUNNEL_OFFLOAD_MODE_VXLAN
) {
3415 err
= mlx4_SET_PORT_VXLAN(mdev
->dev
, priv
->port
, VXLAN_STEER_BY_OUTER_MAC
, 1);
3417 en_err(priv
, "Failed setting port L2 tunnel configuration, err %d\n",
3424 en_warn(priv
, "Initializing port\n");
3425 err
= mlx4_INIT_PORT(mdev
->dev
, priv
->port
);
3427 en_err(priv
, "Failed Initializing port\n");
3430 queue_delayed_work(mdev
->workqueue
, &priv
->stats_task
, STATS_DELAY
);
3432 /* Initialize time stamp mechanism */
3433 if (mdev
->dev
->caps
.flags2
& MLX4_DEV_CAP_FLAG2_TS
)
3434 mlx4_en_init_timestamp(mdev
);
3436 queue_delayed_work(mdev
->workqueue
, &priv
->service_task
,
3437 SERVICE_TASK_DELAY
);
3439 mlx4_en_set_stats_bitmap(mdev
->dev
, &priv
->stats_bitmap
,
3440 mdev
->profile
.prof
[priv
->port
].rx_ppp
,
3441 mdev
->profile
.prof
[priv
->port
].rx_pause
,
3442 mdev
->profile
.prof
[priv
->port
].tx_ppp
,
3443 mdev
->profile
.prof
[priv
->port
].tx_pause
);
3445 err
= register_netdev(dev
);
3447 en_err(priv
, "Netdev registration failed for port %d\n", port
);
3451 priv
->registered
= 1;
3452 devlink_port_type_eth_set(mlx4_get_devlink_port(mdev
->dev
, priv
->port
),
3459 kfree(priv
->tx_ring
[t
]);
3460 kfree(priv
->tx_cq
[t
]);
3463 mlx4_en_destroy_netdev(dev
);
/*
 * Apply a new hardware time-stamping configuration (@ts_config) and/or a
 * change of the NETIF_F_HW_VLAN_CTAG_RX / NETIF_F_RXFCS bits in @features.
 * Ring resources are re-allocated and the port is restarted if it was up.
 *
 * Returns 0 immediately when tx_type, rx_filter and both feature bits are
 * unchanged. Turning RX VLAN offload on while an RX time-stamping filter
 * is active is refused with a warning.
 *
 * Otherwise a scratch mlx4_en_priv is allocated. Under mdev->state_lock a
 * copy of the port profile receives @ts_config and new resources are
 * allocated with mlx4_en_try_alloc_resources(). The port is stopped if it
 * was up, and the resources are swapped in with
 * mlx4_en_safe_replace_resources().
 *
 * dev->features is then updated:
 *  - CTAG_RX follows @features when that bit changed; otherwise, when RX
 *    time-stamping is off, it follows dev->wanted_features;
 *  - RXFCS follows @features when that bit changed;
 *  - CTAG_RX is cleared whenever an RX time-stamping filter is active,
 *    since the two cannot co-exist.
 * Finally mlx4_en_start_port() and netdev_features_change() are called;
 * the conditions guarding them are among the lines not visible.
 *
 * NOTE(review): local declarations, the error paths, the conditions around
 * the port restart and the end of the function (return value, release of
 * the scratch priv) are not visible in this excerpt.
 */
3467 int mlx4_en_reset_config(struct net_device
*dev
,
3468 struct hwtstamp_config ts_config
,
3469 netdev_features_t features
)
3471 struct mlx4_en_priv
*priv
= netdev_priv(dev
);
3472 struct mlx4_en_dev
*mdev
= priv
->mdev
;
3473 struct mlx4_en_port_profile new_prof
;
3474 struct mlx4_en_priv
*tmp
;
3478 if (priv
->hwtstamp_config
.tx_type
== ts_config
.tx_type
&&
3479 priv
->hwtstamp_config
.rx_filter
== ts_config
.rx_filter
&&
3480 !DEV_FEATURE_CHANGED(dev
, features
, NETIF_F_HW_VLAN_CTAG_RX
) &&
3481 !DEV_FEATURE_CHANGED(dev
, features
, NETIF_F_RXFCS
))
3482 return 0; /* Nothing to change */
3484 if (DEV_FEATURE_CHANGED(dev
, features
, NETIF_F_HW_VLAN_CTAG_RX
) &&
3485 (features
& NETIF_F_HW_VLAN_CTAG_RX
) &&
3486 (priv
->hwtstamp_config
.rx_filter
!= HWTSTAMP_FILTER_NONE
)) {
3487 en_warn(priv
, "Can't turn ON rx vlan offload while time-stamping rx filter is ON\n");
3491 tmp
= kzalloc(sizeof(*tmp
), GFP_KERNEL
);
3495 mutex_lock(&mdev
->state_lock
);
3497 memcpy(&new_prof
, priv
->prof
, sizeof(struct mlx4_en_port_profile
));
3498 memcpy(&new_prof
.hwtstamp_config
, &ts_config
, sizeof(ts_config
));
3500 err
= mlx4_en_try_alloc_resources(priv
, tmp
, &new_prof
);
3504 if (priv
->port_up
) {
3506 mlx4_en_stop_port(dev
, 1);
3509 en_warn(priv
, "Changing device configuration rx filter(%x) rx vlan(%x)\n",
3510 ts_config
.rx_filter
,
3511 !!(features
& NETIF_F_HW_VLAN_CTAG_RX
));
3513 mlx4_en_safe_replace_resources(priv
, tmp
);
3515 if (DEV_FEATURE_CHANGED(dev
, features
, NETIF_F_HW_VLAN_CTAG_RX
)) {
3516 if (features
& NETIF_F_HW_VLAN_CTAG_RX
)
3517 dev
->features
|= NETIF_F_HW_VLAN_CTAG_RX
;
3519 dev
->features
&= ~NETIF_F_HW_VLAN_CTAG_RX
;
3520 } else if (ts_config
.rx_filter
== HWTSTAMP_FILTER_NONE
) {
3521 /* RX time-stamping is OFF, update the RX vlan offload
3522 * to the latest wanted state
3524 if (dev
->wanted_features
& NETIF_F_HW_VLAN_CTAG_RX
)
3525 dev
->features
|= NETIF_F_HW_VLAN_CTAG_RX
;
3527 dev
->features
&= ~NETIF_F_HW_VLAN_CTAG_RX
;
3530 if (DEV_FEATURE_CHANGED(dev
, features
, NETIF_F_RXFCS
)) {
3531 if (features
& NETIF_F_RXFCS
)
3532 dev
->features
|= NETIF_F_RXFCS
;
3534 dev
->features
&= ~NETIF_F_RXFCS
;
3537 /* RX vlan offload and RX time-stamping can't co-exist !
3538 * Regardless of the caller's choice,
3539 * Turn Off RX vlan offload in case of time-stamping is ON
3541 if (ts_config
.rx_filter
!= HWTSTAMP_FILTER_NONE
) {
3542 if (dev
->features
& NETIF_F_HW_VLAN_CTAG_RX
)
3543 en_warn(priv
, "Turning off RX vlan offload since RX time-stamping is ON\n");
3544 dev
->features
&= ~NETIF_F_HW_VLAN_CTAG_RX
;
3548 err
= mlx4_en_start_port(dev
);
3550 en_err(priv
, "Failed starting port\n");
3554 mutex_unlock(&mdev
->state_lock
);
3557 netdev_features_change(dev
);