2 * Copyright (c) 2016 Mellanox Technologies, Ltd.
4 * Licensed under the Apache License, Version 2.0 (the "License");
5 * you may not use this file except in compliance with the License.
6 * You may obtain a copy of the License at:
8 * http://www.apache.org/licenses/LICENSE-2.0
10 * Unless required by applicable law or agreed to in writing, software
11 * distributed under the License is distributed on an "AS IS" BASIS,
12 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13 * See the License for the specific language governing permissions and
14 * limitations under the License.
18 #include "netdev-tc-offloads.h"
21 #include <linux/if_ether.h>
25 #include "openvswitch/hmap.h"
26 #include "openvswitch/match.h"
27 #include "openvswitch/ofpbuf.h"
28 #include "openvswitch/thread.h"
29 #include "openvswitch/types.h"
30 #include "openvswitch/util.h"
31 #include "openvswitch/vlog.h"
32 #include "netdev-linux.h"
34 #include "netlink-socket.h"
35 #include "odp-netlink.h"
38 #include "unaligned.h"
/* File-scope state for this module: the vlog module registration, a
 * rate limiter ('error_rl', initialised with 60, 5) that is passed to the
 * VLOG_ERR_RL() calls below, and 'ufid_tc', the hash map that the
 * *_ufid_tc_mapping() helpers and find_ufid() insert into and search. */
41 VLOG_DEFINE_THIS_MODULE(netdev_tc_offloads
);
43 static struct vlog_rate_limit error_rl
= VLOG_RATE_LIMIT_INIT(60, 5);
45 static struct hmap ufid_tc
= HMAP_INITIALIZER(&ufid_tc
);
/* One field mapping, used as the element type of set_flower_map.  The code
 * in this file reads three members from it: 'offset', 'flower_offset' and
 * 'size'.
 * NOTE(review): the member declarations themselves are not visible in this
 * listing; confirm their types against the full source. */
47 struct netlink_field
{
/* Table indexed by OVS_KEY_ATTR_* type; each row holds up to three
 * struct netlink_field entries.  Every visible entry pairs an offsetof()
 * into an OVS key struct (ovs_key_ipv4, ovs_key_ipv6, ovs_key_ethernet,
 * ovs_key_tcp, ovs_key_udp) with the offsetof() and MEMBER_SIZEOF() of a
 * member of struct tc_flower_key.  Note that ipv4_ttl is paired with
 * ipv4.rewrite_ttl rather than with a same-named member.
 *
 * The table is walked by parse_flower_rewrite_to_netlink_action() and by
 * parse_put_flow_set_masked_action(), which treat a row whose first entry
 * has size 0 as an unsupported attribute type.
 *
 * NOTE(review): for OVS_KEY_ATTR_ETHERTYPE only the tc_flower_key side
 * (eth_type) is visible; the first initializer of that entry sits on a line
 * this listing skips. */
53 static struct netlink_field set_flower_map
[][3] = {
54 [OVS_KEY_ATTR_IPV4
] = {
55 { offsetof(struct ovs_key_ipv4
, ipv4_src
),
56 offsetof(struct tc_flower_key
, ipv4
.ipv4_src
),
57 MEMBER_SIZEOF(struct tc_flower_key
, ipv4
.ipv4_src
)
59 { offsetof(struct ovs_key_ipv4
, ipv4_dst
),
60 offsetof(struct tc_flower_key
, ipv4
.ipv4_dst
),
61 MEMBER_SIZEOF(struct tc_flower_key
, ipv4
.ipv4_dst
)
63 { offsetof(struct ovs_key_ipv4
, ipv4_ttl
),
64 offsetof(struct tc_flower_key
, ipv4
.rewrite_ttl
),
65 MEMBER_SIZEOF(struct tc_flower_key
, ipv4
.rewrite_ttl
)
68 [OVS_KEY_ATTR_IPV6
] = {
69 { offsetof(struct ovs_key_ipv6
, ipv6_src
),
70 offsetof(struct tc_flower_key
, ipv6
.ipv6_src
),
71 MEMBER_SIZEOF(struct tc_flower_key
, ipv6
.ipv6_src
)
73 { offsetof(struct ovs_key_ipv6
, ipv6_dst
),
74 offsetof(struct tc_flower_key
, ipv6
.ipv6_dst
),
75 MEMBER_SIZEOF(struct tc_flower_key
, ipv6
.ipv6_dst
)
78 [OVS_KEY_ATTR_ETHERNET
] = {
79 { offsetof(struct ovs_key_ethernet
, eth_src
),
80 offsetof(struct tc_flower_key
, src_mac
),
81 MEMBER_SIZEOF(struct tc_flower_key
, src_mac
)
83 { offsetof(struct ovs_key_ethernet
, eth_dst
),
84 offsetof(struct tc_flower_key
, dst_mac
),
85 MEMBER_SIZEOF(struct tc_flower_key
, dst_mac
)
88 [OVS_KEY_ATTR_ETHERTYPE
] = {
90 offsetof(struct tc_flower_key
, eth_type
),
91 MEMBER_SIZEOF(struct tc_flower_key
, eth_type
)
94 [OVS_KEY_ATTR_TCP
] = {
95 { offsetof(struct ovs_key_tcp
, tcp_src
),
96 offsetof(struct tc_flower_key
, tcp_src
),
97 MEMBER_SIZEOF(struct tc_flower_key
, tcp_src
)
99 { offsetof(struct ovs_key_tcp
, tcp_dst
),
100 offsetof(struct tc_flower_key
, tcp_dst
),
101 MEMBER_SIZEOF(struct tc_flower_key
, tcp_dst
)
104 [OVS_KEY_ATTR_UDP
] = {
105 { offsetof(struct ovs_key_udp
, udp_src
),
106 offsetof(struct tc_flower_key
, udp_src
),
107 MEMBER_SIZEOF(struct tc_flower_key
, udp_src
)
109 { offsetof(struct ovs_key_udp
, udp_dst
),
110 offsetof(struct tc_flower_key
, udp_dst
),
111 MEMBER_SIZEOF(struct tc_flower_key
, udp_dst
)
/* Mutex held around every visible insertion into, removal from and search
 * of the 'ufid_tc' hash map. */
116 static struct ovs_mutex ufid_lock
= OVS_MUTEX_INITIALIZER
;
119 * struct ufid_tc_data - data entry for ufid_tc hmap.
120 * @ufid_node: Element in @ufid_tc hash table by ufid key.
121 * @tc_node: Element in @ufid_tc hash table by prio/handle/ifindex key.
122 * @ufid: ufid assigned to the flow
125 * @ifindex: netdev ifindex.
126 * @netdev: netdev associated with the tc rule
/* Entry stored in 'ufid_tc'.  It carries two hmap nodes so the same entry
 * can be found by ufid hash (ufid_node) or by the prio/handle/ifindex hash
 * (tc_node), plus the netdev pointer on which add_ufid_tc_mapping() takes a
 * reference.
 * NOTE(review): add_ufid_tc_mapping() also assigns 'ufid', 'prio', 'handle'
 * and 'ifindex' members; their declarations are on lines this listing
 * skips. */
128 struct ufid_tc_data
{
129 struct hmap_node ufid_node
;
130 struct hmap_node tc_node
;
135 struct netdev
*netdev
;
/* del_ufid_tc_mapping(ufid)
 *
 * Hashes '*ufid' with hash_bytes(), then, holding ufid_lock, walks the
 * matching ufid_node bucket of 'ufid_tc' looking for an entry whose ufid
 * equals '*ufid'.  The visible tail unlinks both hmap nodes of the entry
 * (ufid_node and tc_node), drops the entry's netdev reference with
 * netdev_close() and releases the lock.
 *
 * NOTE(review): two ovs_mutex_unlock() calls are visible; the first
 * presumably belongs to a not-found early exit, but the lines carrying that
 * condition, the return type, the return statements and any release of the
 * entry's memory are not in this listing -- confirm against the full
 * source. */
138 /* Remove matching ufid entry from ufid_tc hashmap. */
140 del_ufid_tc_mapping(const ovs_u128
*ufid
)
142 size_t ufid_hash
= hash_bytes(ufid
, sizeof *ufid
, 0);
143 struct ufid_tc_data
*data
;
145 ovs_mutex_lock(&ufid_lock
);
146 HMAP_FOR_EACH_WITH_HASH(data
, ufid_node
, ufid_hash
, &ufid_tc
) {
147 if (ovs_u128_equals(*ufid
, data
->ufid
)) {
153 ovs_mutex_unlock(&ufid_lock
);
157 hmap_remove(&ufid_tc
, &data
->ufid_node
);
158 hmap_remove(&ufid_tc
, &data
->tc_node
);
159 netdev_close(data
->netdev
);
161 ovs_mutex_unlock(&ufid_lock
);
/* add_ufid_tc_mapping(ufid, prio, handle, netdev, ifindex)
 *
 * Records that flow 'ufid' is backed by the tc filter identified by
 * prio/handle on the device with 'ifindex'.
 *
 * Steps visible here:
 *   - compute the ufid hash (hash_bytes over *ufid) and the tc hash
 *     (hash_int(hash_int(prio, handle), ifindex));
 *   - allocate a zeroed entry with xzalloc();
 *   - call del_ufid_tc_mapping(ufid) so an existing entry for the same ufid
 *     is dropped first;
 *   - fill in the entry, taking a reference on 'netdev' via netdev_ref();
 *   - under ufid_lock, insert the entry into 'ufid_tc' twice: once through
 *     ufid_node with the ufid hash and once through tc_node with the tc
 *     hash.
 *
 * NOTE(review): both nodes are inserted into the same hmap, while lookups
 * iterate it by one specific member (ufid_node or tc_node).  Confirm that a
 * hash collision between the two key spaces cannot make a lookup interpret
 * a node through the wrong member.
 * NOTE(review): the delete and the insert happen in separate lock sections,
 * so the replace is not atomic with respect to other threads -- confirm
 * that callers do not rely on it being atomic. */
164 /* Add ufid entry to ufid_tc hashmap.
165 * If entry exists already it will be replaced. */
167 add_ufid_tc_mapping(const ovs_u128
*ufid
, int prio
, int handle
,
168 struct netdev
*netdev
, int ifindex
)
170 size_t ufid_hash
= hash_bytes(ufid
, sizeof *ufid
, 0);
171 size_t tc_hash
= hash_int(hash_int(prio
, handle
), ifindex
);
172 struct ufid_tc_data
*new_data
= xzalloc(sizeof *new_data
);
174 del_ufid_tc_mapping(ufid
);
176 new_data
->ufid
= *ufid
;
177 new_data
->prio
= prio
;
178 new_data
->handle
= handle
;
179 new_data
->netdev
= netdev_ref(netdev
);
180 new_data
->ifindex
= ifindex
;
182 ovs_mutex_lock(&ufid_lock
);
183 hmap_insert(&ufid_tc
, &new_data
->ufid_node
, ufid_hash
);
184 hmap_insert(&ufid_tc
, &new_data
->tc_node
, tc_hash
);
185 ovs_mutex_unlock(&ufid_lock
);
/* get_ufid_tc_mapping(ufid, prio, netdev)
 *
 * Looks up the 'ufid_tc' entry for '*ufid'.  Visible steps: hash the ufid
 * with hash_bytes(), take ufid_lock, walk the ufid_node bucket, and on a
 * ufid match store a new reference to the entry's netdev in '*netdev' and
 * copy the entry's handle into the local 'handle'; then release the lock.
 *
 * NOTE(review): the lines that test 'netdev' for NULL, store '*prio',
 * declare 'handle' and return it are not in this listing.
 * netdev_tc_flow_put() passes NULL for 'netdev', so confirm that the store
 * to '*netdev' is guarded in the full source. */
188 /* Get ufid from ufid_tc hashmap.
190 * If netdev output param is not NULL then the function will return
191 * associated netdev on success and a refcount is taken on that netdev.
192 * The caller is then responsible to close the netdev.
194 * Returns handle if successful and fill prio and netdev for that ufid.
195 * Otherwise returns 0.
198 get_ufid_tc_mapping(const ovs_u128
*ufid
, int *prio
, struct netdev
**netdev
)
200 size_t ufid_hash
= hash_bytes(ufid
, sizeof *ufid
, 0);
201 struct ufid_tc_data
*data
;
204 ovs_mutex_lock(&ufid_lock
);
205 HMAP_FOR_EACH_WITH_HASH(data
, ufid_node
, ufid_hash
, &ufid_tc
) {
206 if (ovs_u128_equals(*ufid
, data
->ufid
)) {
211 *netdev
= netdev_ref(data
->netdev
);
213 handle
= data
->handle
;
217 ovs_mutex_unlock(&ufid_lock
);
/* find_ufid(prio, handle, netdev, ufid)
 *
 * Reverse lookup: obtains the ifindex of 'netdev' with
 * netdev_get_ifindex(), builds the same tc hash that add_ufid_tc_mapping()
 * uses (hash_int(hash_int(prio, handle), ifindex)) and, under ufid_lock,
 * walks the tc_node bucket of 'ufid_tc' for an entry whose prio, handle and
 * ifindex all match.  The result is reported as (data != NULL).
 *
 * NOTE(review): the return value relies on 'data' being NULL when the loop
 * finishes without a match.  tc_node is not the first member of
 * struct ufid_tc_data, so whether the iterator is NULL at loop exit depends
 * on how HMAP_FOR_EACH_WITH_HASH is implemented -- verify.
 * NOTE(review): other callers in this file treat a negative
 * netdev_get_ifindex() result as an error; no such check is visible here.
 * The line that copies the found ufid to '*ufid' is also not visible. */
222 /* Find ufid entry in ufid_tc hashmap using prio, handle and netdev.
223 * The result is saved in ufid.
225 * Returns true on success.
228 find_ufid(int prio
, int handle
, struct netdev
*netdev
, ovs_u128
*ufid
)
230 int ifindex
= netdev_get_ifindex(netdev
);
231 struct ufid_tc_data
*data
;
232 size_t tc_hash
= hash_int(hash_int(prio
, handle
), ifindex
);
234 ovs_mutex_lock(&ufid_lock
);
235 HMAP_FOR_EACH_WITH_HASH(data
, tc_node
, tc_hash
, &ufid_tc
) {
236 if (data
->prio
== prio
&& data
->handle
== handle
237 && data
->ifindex
== ifindex
) {
242 ovs_mutex_unlock(&ufid_lock
);
244 return (data
!= NULL
);
/* Entry of the 'prios' map kept inside get_prio_for_tc_flower(): an hmap
 * node plus a copy of the flower mask the priority was allocated for.
 * NOTE(review): get_prio_for_tc_flower() also reads and writes 'prio' and
 * 'protocol' members; their declarations are on lines this listing
 * skips. */
247 struct prio_map_data
{
248 struct hmap_node node
;
249 struct tc_flower_key mask
;
/* get_prio_for_tc_flower(flower)
 *
 * Maps a (mask, eth_type) combination to a tc priority, allocating a new
 * one on first use.  State lives in function-local statics: the 'prios'
 * hmap, the 'prios_lock' mutex guarding it, and the 'last_prio' counter
 * (uint16_t, starts at 0).
 *
 * Visible steps:
 *   - hash the raw bytes of flower->mask, seeded with flower->key.eth_type;
 *   - under prios_lock, search the bucket for an entry whose mask compares
 *     equal with memcmp() and whose protocol equals the eth_type;
 *   - if none is found and last_prio has reached UINT16_MAX, unlock (the
 *     header comment says 0 is returned when out of prios);
 *   - otherwise allocate an entry, give it ++last_prio, insert it, unlock
 *     and return the new prio.
 *
 * NOTE(review): the mask is hashed and compared as raw bytes, so callers
 * presumably need a fully zero-initialised struct tc_flower for padding
 * bytes to compare equal; netdev_tc_flow_put() does memset() its flower.
 * NOTE(review): no removal from 'prios' is visible in this listing, and the
 * return statements on the hit and exhausted paths are on skipped lines. */
254 /* Get free prio for tc flower
255 * If prio is already allocated for mask/eth_type combination then return it.
256 * If not assign new prio.
258 * Return prio on success or 0 if we are out of prios.
261 get_prio_for_tc_flower(struct tc_flower
*flower
)
263 static struct hmap prios
= HMAP_INITIALIZER(&prios
);
264 static struct ovs_mutex prios_lock
= OVS_MUTEX_INITIALIZER
;
265 static uint16_t last_prio
= 0;
266 size_t key_len
= sizeof(struct tc_flower_key
);
267 size_t hash
= hash_bytes(&flower
->mask
, key_len
,
268 (OVS_FORCE
uint32_t) flower
->key
.eth_type
);
269 struct prio_map_data
*data
;
270 struct prio_map_data
*new_data
;
272 /* We can use the same prio for same mask/eth combination but must have
273 * different prio if not. Flower classifier will reject same prio for
274 * different mask/eth combination. */
275 ovs_mutex_lock(&prios_lock
);
276 HMAP_FOR_EACH_WITH_HASH(data
, node
, hash
, &prios
) {
277 if (!memcmp(&flower
->mask
, &data
->mask
, key_len
)
278 && data
->protocol
== flower
->key
.eth_type
) {
279 ovs_mutex_unlock(&prios_lock
);
284 if (last_prio
== UINT16_MAX
) {
285 /* last_prio can overflow if there will be many different kinds of
286 * flows which shouldn't happen organically. */
287 ovs_mutex_unlock(&prios_lock
);
291 new_data
= xzalloc(sizeof *new_data
);
292 memcpy(&new_data
->mask
, &flower
->mask
, key_len
);
293 new_data
->prio
= ++last_prio
;
294 new_data
->protocol
= flower
->key
.eth_type
;
295 hmap_insert(&prios
, &new_data
->node
, hash
);
296 ovs_mutex_unlock(&prios_lock
);
298 return new_data
->prio
;
/* netdev_tc_flow_flush(netdev)
 *
 * Resolves the ifindex of 'netdev' and returns the result of
 * tc_flush(ifindex).  A rate-limited error naming the device is logged when
 * the ifindex cannot be obtained; the message passes -ifindex to
 * ovs_strerror(), i.e. a failed lookup is reported as a negative errno.
 * NOTE(review): the condition guarding the error log and that path's return
 * value are on lines this listing skips. */
302 netdev_tc_flow_flush(struct netdev
*netdev
)
304 int ifindex
= netdev_get_ifindex(netdev
);
307 VLOG_ERR_RL(&error_rl
, "flow_flush: failed to get ifindex for %s: %s",
308 netdev_get_name(netdev
), ovs_strerror(-ifindex
));
312 return tc_flush(ifindex
);
/* netdev_tc_flow_dump_create(netdev, dump_out)
 *
 * Starts a dump of the tc flower filters on 'netdev'.  Visible steps:
 * resolve the ifindex (logging a rate-limited error on failure), allocate a
 * zeroed struct netdev_flow_dump and its nl_dump with xzalloc(), take a
 * reference on 'netdev' and call tc_dump_flower_start(ifindex,
 * dump->nl_dump).
 * The nl_dump and the netdev reference are released by
 * netdev_tc_flow_dump_destroy().
 * NOTE(review): the store to '*dump_out', the error condition and the
 * return statements are on lines this listing skips. */
316 netdev_tc_flow_dump_create(struct netdev
*netdev
,
317 struct netdev_flow_dump
**dump_out
)
319 struct netdev_flow_dump
*dump
;
322 ifindex
= netdev_get_ifindex(netdev
);
324 VLOG_ERR_RL(&error_rl
, "dump_create: failed to get ifindex for %s: %s",
325 netdev_get_name(netdev
), ovs_strerror(-ifindex
));
329 dump
= xzalloc(sizeof *dump
);
330 dump
->nl_dump
= xzalloc(sizeof *dump
->nl_dump
);
331 dump
->netdev
= netdev_ref(netdev
);
332 tc_dump_flower_start(ifindex
, dump
->nl_dump
);
/* netdev_tc_flow_dump_destroy(dump)
 *
 * Finishes the netlink dump with nl_dump_done() and drops the netdev
 * reference taken in netdev_tc_flow_dump_create().
 * NOTE(review): freeing of dump->nl_dump and 'dump' itself, and the return
 * value, are not visible in this listing -- confirm in the full source. */
340 netdev_tc_flow_dump_destroy(struct netdev_flow_dump
*dump
)
342 nl_dump_done(dump
->nl_dump
);
343 netdev_close(dump
->netdev
);
/* parse_flower_rewrite_to_netlink_action(buf, flower)
 *
 * Converts flower->rewrite (a key/mask pair viewed as raw bytes) back into
 * OVS_ACTION_ATTR_SET_MASKED actions appended to 'buf'.
 *
 * For each attribute type in set_flower_map and each field of that row, a
 * field counts as rewritten when its bytes in the rewrite mask are not all
 * zero.  For such a field the code opens a nested
 * OVS_ACTION_ATTR_SET_MASKED attribute, reserves a zero-filled attribute of
 * 2 * len bytes (len taken from ovs_flow_key_attr_lens[type].len), copies
 * the rewrite value to put + f->offset and the rewrite mask to
 * put + len + f->offset, i.e. value first, mask second.  The nested
 * attribute is closed with nl_msg_end_nested().
 *
 * NOTE(review): the lines that skip unsupported rows or fields, and those
 * that make sure the nested attribute is opened only once per type, are not
 * visible in this listing. */
350 parse_flower_rewrite_to_netlink_action(struct ofpbuf
*buf
,
351 struct tc_flower
*flower
)
353 char *mask
= (char *) &flower
->rewrite
.mask
;
354 char *data
= (char *) &flower
->rewrite
.key
;
356 for (int type
= 0; type
< ARRAY_SIZE(set_flower_map
); type
++) {
359 int len
= ovs_flow_key_attr_lens
[type
].len
;
365 for (int j
= 0; j
< ARRAY_SIZE(set_flower_map
[type
]); j
++) {
366 struct netlink_field
*f
= &set_flower_map
[type
][j
];
372 if (!is_all_zeros(mask
+ f
->flower_offset
, f
->size
)) {
374 nested
= nl_msg_start_nested(buf
,
375 OVS_ACTION_ATTR_SET_MASKED
);
376 put
= nl_msg_put_unspec_zero(buf
, type
, len
* 2);
379 memcpy(put
+ f
->offset
, data
+ f
->flower_offset
, f
->size
);
380 memcpy(put
+ len
+ f
->offset
,
381 mask
+ f
->flower_offset
, f
->size
);
386 nl_msg_end_nested(buf
, nested
);
/* parse_tc_flower_to_match(flower, match, actions, stats, buf)
 *
 * Translates a parsed tc flower filter back into OVS terms:
 *   - 'match' receives the key/mask (Ethernet addresses, VLAN, eth type, IP
 *     protocol, TTL, IPv4/IPv6 addresses, TCP/UDP/SCTP ports, TCP flags and
 *     tunnel fields);
 *   - 'buf' receives a nested OVS_FLOW_ATTR_ACTIONS attribute containing, in
 *     this order, pop-vlan, push-vlan, masked set actions (rewrite), a
 *     tunnel set action and an output action, each only if the flower
 *     requests it;
 *   - '*actions' is pointed at the nlattr header of that nested attribute
 *     inside 'buf';
 *   - 'stats' is zeroed and then filled from flower->stats and
 *     flower->lastused.
 *
 * The output port is resolved from flower->ifindex_out with
 * netdev_ifindex_to_odp_port() before anything is written.
 *
 * NOTE(review): the 'match' parameter declaration and several conditions
 * (for example the ones selecting the IPv4 versus IPv6 address setters) are
 * on lines this listing skips.
 * NOTE(review): ifindex_out is tested once for non-zero and once for > 0;
 * confirm whether a negative value can reach this function. */
392 parse_tc_flower_to_match(struct tc_flower
*flower
,
394 struct nlattr
**actions
,
395 struct dpif_flow_stats
*stats
,
396 struct ofpbuf
*buf
) {
398 struct tc_flower_key
*key
= &flower
->key
;
399 struct tc_flower_key
*mask
= &flower
->mask
;
400 odp_port_t outport
= 0;
402 if (flower
->ifindex_out
) {
403 outport
= netdev_ifindex_to_odp_port(flower
->ifindex_out
);
/* Reset 'match' with match_init_catchall() before adding fields. */
411 match_init_catchall(match
);
412 match_set_dl_src_masked(match
, key
->src_mac
, mask
->src_mac
);
413 match_set_dl_dst_masked(match
, key
->dst_mac
, mask
->dst_mac
);
/* For a VLAN filter the real ethertype is carried in encap_eth_type. */
415 if (key
->eth_type
== htons(ETH_TYPE_VLAN
)) {
416 match_set_dl_vlan(match
, htons(key
->vlan_id
));
417 match_set_dl_vlan_pcp(match
, key
->vlan_prio
);
418 match_set_dl_type(match
, key
->encap_eth_type
);
419 flow_fix_vlan_tpid(&match
->flow
);
421 match_set_dl_type(match
, key
->eth_type
);
424 if (is_ip_any(&match
->flow
)) {
426 match_set_nw_proto(match
, key
->ip_proto
);
429 match_set_nw_ttl_masked(match
, key
->ip_ttl
, mask
->ip_ttl
);
431 match_set_nw_src_masked(match
, key
->ipv4
.ipv4_src
, mask
->ipv4
.ipv4_src
);
432 match_set_nw_dst_masked(match
, key
->ipv4
.ipv4_dst
, mask
->ipv4
.ipv4_dst
);
434 match_set_ipv6_src_masked(match
,
435 &key
->ipv6
.ipv6_src
, &mask
->ipv6
.ipv6_src
);
436 match_set_ipv6_dst_masked(match
,
437 &key
->ipv6
.ipv6_dst
, &mask
->ipv6
.ipv6_dst
);
439 if (key
->ip_proto
== IPPROTO_TCP
) {
440 match_set_tp_dst_masked(match
, key
->tcp_dst
, mask
->tcp_dst
);
441 match_set_tp_src_masked(match
, key
->tcp_src
, mask
->tcp_src
);
442 match_set_tcp_flags_masked(match
, key
->tcp_flags
, mask
->tcp_flags
);
443 } else if (key
->ip_proto
== IPPROTO_UDP
) {
444 match_set_tp_dst_masked(match
, key
->udp_dst
, mask
->udp_dst
);
445 match_set_tp_src_masked(match
, key
->udp_src
, mask
->udp_src
);
446 } else if (key
->ip_proto
== IPPROTO_SCTP
) {
447 match_set_tp_dst_masked(match
, key
->sctp_dst
, mask
->sctp_dst
);
448 match_set_tp_src_masked(match
, key
->sctp_src
, mask
->sctp_src
);
/* Tunnel match: the IPv4 addresses are used when the IPv4 destination is
 * non-zero, otherwise the IPv6 addresses when the IPv6 destination is
 * non-zero. */
452 if (flower
->tunnel
.tunnel
) {
453 match_set_tun_id(match
, flower
->tunnel
.id
);
454 if (flower
->tunnel
.ipv4
.ipv4_dst
) {
455 match_set_tun_src(match
, flower
->tunnel
.ipv4
.ipv4_src
);
456 match_set_tun_dst(match
, flower
->tunnel
.ipv4
.ipv4_dst
);
457 } else if (!is_all_zeros(&flower
->tunnel
.ipv6
.ipv6_dst
,
458 sizeof flower
->tunnel
.ipv6
.ipv6_dst
)) {
459 match_set_tun_ipv6_src(match
, &flower
->tunnel
.ipv6
.ipv6_src
);
460 match_set_tun_ipv6_dst(match
, &flower
->tunnel
.ipv6
.ipv6_dst
);
462 if (flower
->tunnel
.tp_dst
) {
463 match_set_tun_tp_dst(match
, flower
->tunnel
.tp_dst
);
/* Everything appended from here until nl_msg_end_nested(buf, act_off) is
 * nested inside a single OVS_FLOW_ATTR_ACTIONS attribute. */
467 act_off
= nl_msg_start_nested(buf
, OVS_FLOW_ATTR_ACTIONS
);
469 if (flower
->vlan_pop
) {
470 nl_msg_put_flag(buf
, OVS_ACTION_ATTR_POP_VLAN
);
473 if (flower
->vlan_push_id
|| flower
->vlan_push_prio
) {
474 struct ovs_action_push_vlan
*push
;
475 push
= nl_msg_put_unspec_zero(buf
, OVS_ACTION_ATTR_PUSH_VLAN
,
478 push
->vlan_tpid
= htons(ETH_TYPE_VLAN
);
479 push
->vlan_tci
= htons(flower
->vlan_push_id
480 | (flower
->vlan_push_prio
<< 13)
484 if (flower
->rewrite
.rewrite
) {
485 parse_flower_rewrite_to_netlink_action(buf
, flower
);
/* Tunnel encapsulation: SET { TUNNEL { id, addresses, tp_dst } }.  Address
 * attributes are emitted only for non-zero addresses. */
488 if (flower
->set
.set
) {
489 size_t set_offset
= nl_msg_start_nested(buf
, OVS_ACTION_ATTR_SET
);
490 size_t tunnel_offset
=
491 nl_msg_start_nested(buf
, OVS_KEY_ATTR_TUNNEL
);
493 nl_msg_put_be64(buf
, OVS_TUNNEL_KEY_ATTR_ID
, flower
->set
.id
);
494 if (flower
->set
.ipv4
.ipv4_src
) {
495 nl_msg_put_be32(buf
, OVS_TUNNEL_KEY_ATTR_IPV4_SRC
,
496 flower
->set
.ipv4
.ipv4_src
);
498 if (flower
->set
.ipv4
.ipv4_dst
) {
499 nl_msg_put_be32(buf
, OVS_TUNNEL_KEY_ATTR_IPV4_DST
,
500 flower
->set
.ipv4
.ipv4_dst
);
502 if (!is_all_zeros(&flower
->set
.ipv6
.ipv6_src
,
503 sizeof flower
->set
.ipv6
.ipv6_src
)) {
504 nl_msg_put_in6_addr(buf
, OVS_TUNNEL_KEY_ATTR_IPV6_SRC
,
505 &flower
->set
.ipv6
.ipv6_src
);
507 if (!is_all_zeros(&flower
->set
.ipv6
.ipv6_dst
,
508 sizeof flower
->set
.ipv6
.ipv6_dst
)) {
509 nl_msg_put_in6_addr(buf
, OVS_TUNNEL_KEY_ATTR_IPV6_DST
,
510 &flower
->set
.ipv6
.ipv6_dst
);
512 nl_msg_put_be16(buf
, OVS_TUNNEL_KEY_ATTR_TP_DST
,
515 nl_msg_end_nested(buf
, tunnel_offset
);
516 nl_msg_end_nested(buf
, set_offset
);
519 if (flower
->ifindex_out
> 0) {
520 nl_msg_put_u32(buf
, OVS_ACTION_ATTR_OUTPUT
, odp_to_u32(outport
));
524 nl_msg_end_nested(buf
, act_off
);
/* Hand back a pointer to the nested attribute header stored in 'buf'. */
526 *actions
= ofpbuf_at_assert(buf
, act_off
, sizeof(struct nlattr
));
/* Stats: zero everything, then copy the packet and byte counters and the
 * last-used time from the flower. */
529 memset(stats
, 0, sizeof *stats
);
530 stats
->n_packets
= get_32aligned_u64(&flower
->stats
.n_packets
);
531 stats
->n_bytes
= get_32aligned_u64(&flower
->stats
.n_bytes
);
532 stats
->used
= flower
->lastused
;
/* netdev_tc_flow_dump_next(dump, match, actions, stats, ..., ufid, rbuffer,
 *                          wbuffer)
 *
 * Fetches netlink replies from dump->nl_dump with nl_dump_next() (using
 * 'rbuffer' as receive buffer).  For each reply it:
 *   - parses it into a struct tc_flower with parse_netlink_to_tc_flower();
 *   - converts the flower with parse_tc_flower_to_match();
 *   - determines the ufid: copied from the filter's action cookie when
 *     flower.act_cookie.len is non-zero, otherwise looked up with
 *     find_ufid() from prio/handle/netdev;
 *   - forces an exact match on in_port and sets it to dump->port.
 *
 * NOTE(review): the cookie is read through an ovs_u128 pointer cast with
 * only a non-zero length check visible; confirm that the length and
 * alignment are validated elsewhere.
 * NOTE(review): the 'match' and 'ufid' parameter lines, the
 * continue/return statements and the remaining arguments of the
 * parse_tc_flower_to_match() call are on lines this listing skips. */
539 netdev_tc_flow_dump_next(struct netdev_flow_dump
*dump
,
541 struct nlattr
**actions
,
542 struct dpif_flow_stats
*stats
,
544 struct ofpbuf
*rbuffer
,
545 struct ofpbuf
*wbuffer
)
547 struct ofpbuf nl_flow
;
549 while (nl_dump_next(dump
->nl_dump
, &nl_flow
, rbuffer
)) {
550 struct tc_flower flower
;
551 struct netdev
*netdev
= dump
->netdev
;
553 if (parse_netlink_to_tc_flower(&nl_flow
, &flower
)) {
557 if (parse_tc_flower_to_match(&flower
, match
, actions
, stats
,
562 if (flower
.act_cookie
.len
) {
563 *ufid
= *((ovs_u128
*) flower
.act_cookie
.data
);
564 } else if (!find_ufid(flower
.prio
, flower
.handle
, netdev
, ufid
)) {
568 match
->wc
.masks
.in_port
.odp_port
= u32_to_odp(UINT32_MAX
);
569 match
->flow
.in_port
.odp_port
= dump
->port
;
/* parse_put_flow_set_masked_action(flower, set, set_len, hasmask)
 *
 * Translates one OVS set action (optionally masked) into the flower's
 * rewrite key/mask.
 *
 * The attribute is first copied into a local ofpbuf backed by a 1024-byte
 * stack stub so that mask bytes can be cleared as fields are consumed.  The
 * payload is treated as two halves: value at 'set_data' and mask at
 * 'set_data + size', where size is half the attribute payload size.
 *
 * An attribute type outside set_flower_map, or whose first map entry has
 * size 0, is logged as unsupported.  Otherwise, for every field of the
 * row, each byte is copied as (value & maskval) into rewrite.key and
 * maskval into rewrite.mask, with maskval being the supplied mask byte when
 * 'hasmask' is set and 0xFF otherwise; the consumed mask bytes are then
 * zeroed.
 *
 * Afterwards rewrite.rewrite is set when the rewrite struct is not all
 * zeros, and any mask bits still set (with 'hasmask') are logged as an
 * unsupported sub attribute.  The local buffer is uninitialised on every
 * visible exit path.
 *
 * NOTE(review): 'size' is halved regardless of 'hasmask'; confirm what
 * layout callers pass when hasmask is false.  The conditions guarding the
 * per-field copy and the memset(), the remaining parameter lines and the
 * return values are on lines this listing skips. */
578 parse_put_flow_set_masked_action(struct tc_flower
*flower
,
579 const struct nlattr
*set
,
583 static struct vlog_rate_limit rl
= VLOG_RATE_LIMIT_INIT(5, 20);
584 uint64_t set_stub
[1024 / 8];
585 struct ofpbuf set_buf
= OFPBUF_STUB_INITIALIZER(set_stub
);
586 char *set_data
, *set_mask
;
587 char *key
= (char *) &flower
->rewrite
.key
;
588 char *mask
= (char *) &flower
->rewrite
.mask
;
589 const struct nlattr
*attr
;
593 /* copy so we can set attr mask to 0 for used ovs key struct members */
594 attr
= ofpbuf_put(&set_buf
, set
, set_len
);
596 type
= nl_attr_type(attr
);
597 size
= nl_attr_get_size(attr
) / 2;
598 set_data
= CONST_CAST(char *, nl_attr_get(attr
));
599 set_mask
= set_data
+ size
;
601 if (type
>= ARRAY_SIZE(set_flower_map
)
602 || !set_flower_map
[type
][0].size
) {
603 VLOG_DBG_RL(&rl
, "unsupported set action type: %d", type
);
604 ofpbuf_uninit(&set_buf
);
608 for (i
= 0; i
< ARRAY_SIZE(set_flower_map
[type
]); i
++) {
609 struct netlink_field
*f
= &set_flower_map
[type
][i
];
615 /* copy masked value */
616 for (j
= 0; j
< f
->size
; j
++) {
617 char maskval
= hasmask
? set_mask
[f
->offset
+ j
] : 0xFF;
619 key
[f
->flower_offset
+ j
] = maskval
& set_data
[f
->offset
+ j
];
620 mask
[f
->flower_offset
+ j
] = maskval
;
624 /* set its mask to 0 to show it's been used. */
626 memset(set_mask
+ f
->offset
, 0, f
->size
);
630 if (!is_all_zeros(&flower
->rewrite
, sizeof flower
->rewrite
)) {
631 flower
->rewrite
.rewrite
= true;
634 if (hasmask
&& !is_all_zeros(set_mask
, size
)) {
635 VLOG_DBG_RL(&rl
, "unsupported sub attribute of set action type %d",
637 ofpbuf_uninit(&set_buf
);
641 ofpbuf_uninit(&set_buf
);
/* parse_put_flow_set_action(flower, set, set_len)
 *
 * Handles an OVS_ACTION_ATTR_SET action.  Any key type other than
 * OVS_KEY_ATTR_TUNNEL is delegated to parse_put_flow_set_masked_action().
 * For a tunnel key, flower->set.set is raised and the nested tunnel
 * attributes are walked with NL_ATTR_FOR_EACH_UNSAFE, copying id, IPv4
 * source/destination, IPv6 source/destination and transport
 * source/destination ports into flower->set.
 *
 * NOTE(review): the NL_ATTR_FOR_EACH_UNSAFE name suggests that attribute
 * bounds are not validated during iteration -- confirm the input has been
 * validated upstream.  The break statements, any default case, the trailing
 * arguments of the delegated call and the return value are on lines this
 * listing skips. */
646 parse_put_flow_set_action(struct tc_flower
*flower
, const struct nlattr
*set
,
649 const struct nlattr
*tunnel
;
650 const struct nlattr
*tun_attr
;
651 size_t tun_left
, tunnel_len
;
653 if (nl_attr_type(set
) != OVS_KEY_ATTR_TUNNEL
) {
654 return parse_put_flow_set_masked_action(flower
, set
, set_len
,
658 tunnel
= nl_attr_get(set
);
659 tunnel_len
= nl_attr_get_size(set
);
661 flower
->set
.set
= true;
662 NL_ATTR_FOR_EACH_UNSAFE(tun_attr
, tun_left
, tunnel
, tunnel_len
) {
663 switch (nl_attr_type(tun_attr
)) {
664 case OVS_TUNNEL_KEY_ATTR_ID
: {
665 flower
->set
.id
= nl_attr_get_be64(tun_attr
);
668 case OVS_TUNNEL_KEY_ATTR_IPV4_SRC
: {
669 flower
->set
.ipv4
.ipv4_src
= nl_attr_get_be32(tun_attr
);
672 case OVS_TUNNEL_KEY_ATTR_IPV4_DST
: {
673 flower
->set
.ipv4
.ipv4_dst
= nl_attr_get_be32(tun_attr
);
676 case OVS_TUNNEL_KEY_ATTR_IPV6_SRC
: {
677 flower
->set
.ipv6
.ipv6_src
=
678 nl_attr_get_in6_addr(tun_attr
);
681 case OVS_TUNNEL_KEY_ATTR_IPV6_DST
: {
682 flower
->set
.ipv6
.ipv6_dst
=
683 nl_attr_get_in6_addr(tun_attr
);
686 case OVS_TUNNEL_KEY_ATTR_TP_SRC
: {
687 flower
->set
.tp_src
= nl_attr_get_be16(tun_attr
);
690 case OVS_TUNNEL_KEY_ATTR_TP_DST
: {
691 flower
->set
.tp_dst
= nl_attr_get_be16(tun_attr
);
/* test_key_and_mask(match)
 *
 * Checks that 'match' asks for nothing that cannot be offloaded.  It is
 * called by netdev_tc_flow_put() after that function has copied the
 * supported fields into the flower and zeroed them in match->wc.masks.
 *
 * Each visible check looks at one mask field (pkt_mark, recirc_id,
 * skb_priority, actset_output, ct_state, packet_type, ct_label, metadata,
 * mpls_lse[], ...) and logs a rate-limited debug message naming the
 * unsupported attribute.  recirc_id and packet_type are only rejected when
 * the key value is non-zero as well.  packet_type is cleared in the mask
 * afterwards.  ICMP, IGMP and ICMPv6 flows get dedicated type/code
 * messages.  The last check rejects any mask that is still not all zeros as
 * an "unknown attribute".
 *
 * Side effect: 'match->wc.masks' is modified.
 *
 * NOTE(review): the conditions for several messages (dp_hash, conj_id,
 * ct_zone, ct_mark, regs[], nw_tos, nw_frag, icmp/igmp type and code), any
 * further mask clearing and all return statements are on lines this listing
 * skips. */
701 test_key_and_mask(struct match
*match
)
703 static struct vlog_rate_limit rl
= VLOG_RATE_LIMIT_INIT(5, 20);
704 const struct flow
*key
= &match
->flow
;
705 struct flow
*mask
= &match
->wc
.masks
;
707 if (mask
->pkt_mark
) {
708 VLOG_DBG_RL(&rl
, "offloading attribute pkt_mark isn't supported");
712 if (mask
->recirc_id
&& key
->recirc_id
) {
713 VLOG_DBG_RL(&rl
, "offloading attribute recirc_id isn't supported");
719 VLOG_DBG_RL(&rl
, "offloading attribute dp_hash isn't supported");
724 VLOG_DBG_RL(&rl
, "offloading attribute conj_id isn't supported");
728 if (mask
->skb_priority
) {
729 VLOG_DBG_RL(&rl
, "offloading attribute skb_priority isn't supported");
733 if (mask
->actset_output
) {
735 "offloading attribute actset_output isn't supported");
739 if (mask
->ct_state
) {
740 VLOG_DBG_RL(&rl
, "offloading attribute ct_state isn't supported");
745 VLOG_DBG_RL(&rl
, "offloading attribute ct_zone isn't supported");
750 VLOG_DBG_RL(&rl
, "offloading attribute ct_mark isn't supported");
754 if (mask
->packet_type
&& key
->packet_type
) {
755 VLOG_DBG_RL(&rl
, "offloading attribute packet_type isn't supported");
758 mask
->packet_type
= 0;
760 if (!ovs_u128_is_zero(mask
->ct_label
)) {
761 VLOG_DBG_RL(&rl
, "offloading attribute ct_label isn't supported");
765 for (int i
= 0; i
< FLOW_N_REGS
; i
++) {
768 "offloading attribute regs[%d] isn't supported", i
);
773 if (mask
->metadata
) {
774 VLOG_DBG_RL(&rl
, "offloading attribute metadata isn't supported");
779 VLOG_DBG_RL(&rl
, "offloading attribute nw_tos isn't supported");
784 VLOG_DBG_RL(&rl
, "offloading attribute nw_frag isn't supported");
788 for (int i
= 0; i
< FLOW_MAX_MPLS_LABELS
; i
++) {
789 if (mask
->mpls_lse
[i
]) {
790 VLOG_DBG_RL(&rl
, "offloading attribute mpls_lse isn't supported");
795 if (key
->dl_type
== htons(ETH_TYPE_IP
) &&
796 key
->nw_proto
== IPPROTO_ICMP
) {
799 "offloading attribute icmp_type isn't supported");
804 "offloading attribute icmp_code isn't supported");
807 } else if (key
->dl_type
== htons(ETH_TYPE_IP
) &&
808 key
->nw_proto
== IPPROTO_IGMP
) {
811 "offloading attribute igmp_type isn't supported");
816 "offloading attribute igmp_code isn't supported");
819 } else if (key
->dl_type
== htons(ETH_TYPE_IPV6
) &&
820 key
->nw_proto
== IPPROTO_ICMPV6
) {
823 "offloading attribute icmp_type isn't supported");
828 "offloading attribute icmp_code isn't supported");
833 if (!is_all_zeros(mask
, sizeof *mask
)) {
834 VLOG_DBG_RL(&rl
, "offloading isn't supported, unknown attribute");
/* netdev_tc_flow_put(netdev, match, actions, actions_len, ufid, info, stats)
 *
 * Installs (or replaces) the OVS flow 'match' + 'actions' as a tc flower
 * filter on 'netdev'.  'stats' is unused.
 *
 * Visible flow of control:
 *   1. Resolve the ifindex of 'netdev'; a failure is logged.
 *   2. Zero a local struct tc_flower and fill its key/mask from 'match':
 *      tunnel fields (when a tunnel destination is set), eth type, VLAN
 *      id/priority, MAC addresses, IP protocol and TTL, TCP/UDP/SCTP ports,
 *      TCP flags and IPv4/IPv6 addresses.  Several copied fields are zeroed
 *      in match->wc.masks (tunnel, vlans, dl_dst, dl_src, in_port and the
 *      IPv6 addresses are visible) so that only unsupported bits remain.
 *   3. Call test_key_and_mask() to reject leftover, unsupported bits.
 *   4. Translate the actions: OUTPUT (resolve the out device's ifindex and
 *      record info->tp_dst_port), PUSH_VLAN, POP_VLAN, SET and SET_MASKED;
 *      anything else is logged as unsupported.
 *   5. If this ufid already has a tc mapping, delete the old filter.
 *   6. Obtain a priority from get_prio_for_tc_flower(); failure is logged
 *      with ENOSPC.
 *   7. Store the ufid as the filter's action cookie, call
 *      tc_replace_flower() and record the ufid -> prio/handle/ifindex
 *      mapping.
 *
 * Side effect: 'match->wc.masks' is modified.
 *
 * NOTE(review): 'outdev' returned by netdev_ports_get() is passed to
 * netdev_get_ifindex() and netdev_close() with no NULL check visible here,
 * and the resulting ifindex_out is not visibly checked for a negative
 * value.
 * NOTE(review): get_ufid_tc_mapping() is called with a NULL netdev
 * out-parameter; confirm that it guards its store to '*netdev'.
 * NOTE(review): error checks after most calls, several else branches and
 * all return statements are on lines this listing skips. */
842 netdev_tc_flow_put(struct netdev
*netdev
, struct match
*match
,
843 struct nlattr
*actions
, size_t actions_len
,
844 const ovs_u128
*ufid
, struct offload_info
*info
,
845 struct dpif_flow_stats
*stats OVS_UNUSED
)
847 static struct vlog_rate_limit rl
= VLOG_RATE_LIMIT_INIT(5, 20);
848 struct tc_flower flower
;
849 const struct flow
*key
= &match
->flow
;
850 struct flow
*mask
= &match
->wc
.masks
;
851 const struct flow_tnl
*tnl
= &match
->flow
.tunnel
;
859 ifindex
= netdev_get_ifindex(netdev
);
861 VLOG_ERR_RL(&error_rl
, "flow_put: failed to get ifindex for %s: %s",
862 netdev_get_name(netdev
), ovs_strerror(-ifindex
));
/* Start from an all-zero flower; get_prio_for_tc_flower() later hashes and
 * compares flower.mask as raw bytes. */
866 memset(&flower
, 0, sizeof flower
);
868 if (flow_tnl_dst_is_set(&key
->tunnel
)) {
870 "tunnel: id %#" PRIx64
" src " IP_FMT
871 " dst " IP_FMT
" tp_src %d tp_dst %d",
873 IP_ARGS(tnl
->ip_src
), IP_ARGS(tnl
->ip_dst
),
874 ntohs(tnl
->tp_src
), ntohs(tnl
->tp_dst
));
875 flower
.tunnel
.id
= tnl
->tun_id
;
876 flower
.tunnel
.ipv4
.ipv4_src
= tnl
->ip_src
;
877 flower
.tunnel
.ipv4
.ipv4_dst
= tnl
->ip_dst
;
878 flower
.tunnel
.ipv6
.ipv6_src
= tnl
->ipv6_src
;
879 flower
.tunnel
.ipv6
.ipv6_dst
= tnl
->ipv6_dst
;
880 flower
.tunnel
.tp_src
= tnl
->tp_src
;
881 flower
.tunnel
.tp_dst
= tnl
->tp_dst
;
882 flower
.tunnel
.tunnel
= true;
884 memset(&mask
->tunnel
, 0, sizeof mask
->tunnel
);
886 flower
.key
.eth_type
= key
->dl_type
;
887 flower
.mask
.eth_type
= mask
->dl_type
;
/* VLAN: the first branch accepts only masks where VID and PCP are each
 * either fully wildcarded or fully matched (at least one of them matched)
 * and the CFI bit is set in both mask and key. */
889 if (mask
->vlans
[0].tci
) {
890 ovs_be16 vid_mask
= mask
->vlans
[0].tci
& htons(VLAN_VID_MASK
);
891 ovs_be16 pcp_mask
= mask
->vlans
[0].tci
& htons(VLAN_PCP_MASK
);
892 ovs_be16 cfi
= mask
->vlans
[0].tci
& htons(VLAN_CFI
);
894 if (cfi
&& key
->vlans
[0].tci
& htons(VLAN_CFI
)
895 && (!vid_mask
|| vid_mask
== htons(VLAN_VID_MASK
))
896 && (!pcp_mask
|| pcp_mask
== htons(VLAN_PCP_MASK
))
897 && (vid_mask
|| pcp_mask
)) {
899 flower
.key
.vlan_id
= vlan_tci_to_vid(key
->vlans
[0].tci
);
900 VLOG_DBG_RL(&rl
, "vlan_id: %d\n", flower
.key
.vlan_id
);
903 flower
.key
.vlan_prio
= vlan_tci_to_pcp(key
->vlans
[0].tci
);
904 VLOG_DBG_RL(&rl
, "vlan_prio: %d\n", flower
.key
.vlan_prio
);
906 flower
.key
.encap_eth_type
= flower
.key
.eth_type
;
907 flower
.key
.eth_type
= htons(ETH_TYPE_VLAN
);
908 } else if (mask
->vlans
[0].tci
== htons(0xffff) &&
909 ntohs(key
->vlans
[0].tci
) == 0) {
910 /* exact && no vlan */
915 } else if (mask
->vlans
[1].tci
) {
918 memset(mask
->vlans
, 0, sizeof mask
->vlans
);
920 flower
.key
.dst_mac
= key
->dl_dst
;
921 flower
.mask
.dst_mac
= mask
->dl_dst
;
922 flower
.key
.src_mac
= key
->dl_src
;
923 flower
.mask
.src_mac
= mask
->dl_src
;
924 memset(&mask
->dl_dst
, 0, sizeof mask
->dl_dst
);
925 memset(&mask
->dl_src
, 0, sizeof mask
->dl_src
);
927 mask
->in_port
.odp_port
= 0;
929 if (is_ip_any(key
)) {
930 flower
.key
.ip_proto
= key
->nw_proto
;
931 flower
.mask
.ip_proto
= mask
->nw_proto
;
932 flower
.key
.ip_ttl
= key
->nw_ttl
;
933 flower
.mask
.ip_ttl
= mask
->nw_ttl
;
935 if (key
->nw_proto
== IPPROTO_TCP
) {
936 flower
.key
.tcp_dst
= key
->tp_dst
;
937 flower
.mask
.tcp_dst
= mask
->tp_dst
;
938 flower
.key
.tcp_src
= key
->tp_src
;
939 flower
.mask
.tcp_src
= mask
->tp_src
;
940 flower
.key
.tcp_flags
= key
->tcp_flags
;
941 flower
.mask
.tcp_flags
= mask
->tcp_flags
;
945 } else if (key
->nw_proto
== IPPROTO_UDP
) {
946 flower
.key
.udp_dst
= key
->tp_dst
;
947 flower
.mask
.udp_dst
= mask
->tp_dst
;
948 flower
.key
.udp_src
= key
->tp_src
;
949 flower
.mask
.udp_src
= mask
->tp_src
;
952 } else if (key
->nw_proto
== IPPROTO_SCTP
) {
953 flower
.key
.sctp_dst
= key
->tp_dst
;
954 flower
.mask
.sctp_dst
= mask
->tp_dst
;
955 flower
.key
.sctp_src
= key
->tp_src
;
956 flower
.mask
.sctp_src
= mask
->tp_src
;
966 if (key
->dl_type
== htons(ETH_P_IP
)) {
967 flower
.key
.ipv4
.ipv4_src
= key
->nw_src
;
968 flower
.mask
.ipv4
.ipv4_src
= mask
->nw_src
;
969 flower
.key
.ipv4
.ipv4_dst
= key
->nw_dst
;
970 flower
.mask
.ipv4
.ipv4_dst
= mask
->nw_dst
;
973 } else if (key
->dl_type
== htons(ETH_P_IPV6
)) {
974 flower
.key
.ipv6
.ipv6_src
= key
->ipv6_src
;
975 flower
.mask
.ipv6
.ipv6_src
= mask
->ipv6_src
;
976 flower
.key
.ipv6
.ipv6_dst
= key
->ipv6_dst
;
977 flower
.mask
.ipv6
.ipv6_dst
= mask
->ipv6_dst
;
978 memset(&mask
->ipv6_src
, 0, sizeof mask
->ipv6_src
);
979 memset(&mask
->ipv6_dst
, 0, sizeof mask
->ipv6_dst
);
/* Whatever is still set in the mask at this point has not been copied into
 * the flower; test_key_and_mask() checks those leftovers. */
983 err
= test_key_and_mask(match
);
/* Translate the OVS actions one attribute at a time. */
988 NL_ATTR_FOR_EACH(nla
, left
, actions
, actions_len
) {
989 if (nl_attr_type(nla
) == OVS_ACTION_ATTR_OUTPUT
) {
990 odp_port_t port
= nl_attr_get_odp_port(nla
);
991 struct netdev
*outdev
= netdev_ports_get(port
, info
->dpif_class
);
993 flower
.ifindex_out
= netdev_get_ifindex(outdev
);
994 flower
.set
.tp_dst
= info
->tp_dst_port
;
995 netdev_close(outdev
);
996 } else if (nl_attr_type(nla
) == OVS_ACTION_ATTR_PUSH_VLAN
) {
997 const struct ovs_action_push_vlan
*vlan_push
= nl_attr_get(nla
);
999 flower
.vlan_push_id
= vlan_tci_to_vid(vlan_push
->vlan_tci
);
1000 flower
.vlan_push_prio
= vlan_tci_to_pcp(vlan_push
->vlan_tci
);
1001 } else if (nl_attr_type(nla
) == OVS_ACTION_ATTR_POP_VLAN
) {
1002 flower
.vlan_pop
= 1;
1003 } else if (nl_attr_type(nla
) == OVS_ACTION_ATTR_SET
) {
1004 const struct nlattr
*set
= nl_attr_get(nla
);
1005 const size_t set_len
= nl_attr_get_size(nla
);
1007 err
= parse_put_flow_set_action(&flower
, set
, set_len
);
1011 } else if (nl_attr_type(nla
) == OVS_ACTION_ATTR_SET_MASKED
) {
1012 const struct nlattr
*set
= nl_attr_get(nla
);
1013 const size_t set_len
= nl_attr_get_size(nla
);
1015 err
= parse_put_flow_set_masked_action(&flower
, set
, set_len
,
1021 VLOG_DBG_RL(&rl
, "unsupported put action type: %d",
/* An existing mapping for this ufid means the flow is being updated: the
 * old filter is deleted before a new priority is chosen. */
1027 handle
= get_ufid_tc_mapping(ufid
, &prio
, NULL
);
1028 if (handle
&& prio
) {
1029 VLOG_DBG_RL(&rl
, "updating old handle: %d prio: %d", handle
, prio
);
1030 tc_del_filter(ifindex
, prio
, handle
);
1034 prio
= get_prio_for_tc_flower(&flower
);
1036 VLOG_ERR_RL(&rl
, "couldn't get tc prio: %s", ovs_strerror(ENOSPC
));
/* The ufid travels with the filter as its action cookie;
 * netdev_tc_flow_dump_next() reads it back from there. */
1041 flower
.act_cookie
.data
= ufid
;
1042 flower
.act_cookie
.len
= sizeof *ufid
;
1044 err
= tc_replace_flower(ifindex
, prio
, handle
, &flower
);
1046 add_ufid_tc_mapping(ufid
, flower
.prio
, flower
.handle
, netdev
, ifindex
);
/* netdev_tc_flow_get(netdev, match, actions, ufid, stats, ..., buf)
 *
 * Fetches the tc filter backing flow 'ufid' and converts it back into OVS
 * form.  The 'netdev' argument is unused; the device comes from the ufid
 * mapping instead.
 *
 * Visible steps: look up handle, prio and device with
 * get_ufid_tc_mapping(); resolve the device's ifindex (failure is logged);
 * read the filter with tc_get_flower() (failure is logged with its error
 * string); convert it with parse_tc_flower_to_match(); then force an exact
 * match on in_port, set to the odp port derived from the ifindex.
 *
 * NOTE(review): get_ufid_tc_mapping() documents that the caller must close
 * the returned netdev; no netdev_close(dev) is visible in this listing --
 * confirm that every path releases it.  The not-found check on 'handle',
 * the remaining parameter lines and the return statements are on skipped
 * lines. */
1053 netdev_tc_flow_get(struct netdev
*netdev OVS_UNUSED
,
1054 struct match
*match
,
1055 struct nlattr
**actions
,
1056 const ovs_u128
*ufid
,
1057 struct dpif_flow_stats
*stats
,
1060 static struct vlog_rate_limit rl
= VLOG_RATE_LIMIT_INIT(5, 20);
1062 struct tc_flower flower
;
1069 handle
= get_ufid_tc_mapping(ufid
, &prio
, &dev
);
1074 ifindex
= netdev_get_ifindex(dev
);
1076 VLOG_ERR_RL(&error_rl
, "flow_get: failed to get ifindex for %s: %s",
1077 netdev_get_name(dev
), ovs_strerror(-ifindex
));
1082 VLOG_DBG_RL(&rl
, "flow get (dev %s prio %d handle %d)",
1083 netdev_get_name(dev
), prio
, handle
);
1084 err
= tc_get_flower(ifindex
, prio
, handle
, &flower
);
1087 VLOG_ERR_RL(&error_rl
, "flow get failed (dev %s prio %d handle %d): %s",
1088 netdev_get_name(dev
), prio
, handle
, ovs_strerror(err
));
1092 in_port
= netdev_ifindex_to_odp_port(ifindex
);
1093 parse_tc_flower_to_match(&flower
, match
, actions
, stats
, buf
);
1095 match
->wc
.masks
.in_port
.odp_port
= u32_to_odp(UINT32_MAX
);
1096 match
->flow
.in_port
.odp_port
= in_port
;
/* netdev_tc_flow_del(netdev, ufid, stats)
 *
 * Removes the tc filter backing flow 'ufid'.  The 'netdev' argument is
 * unused; the device comes from the ufid mapping.
 *
 * Visible steps: look up handle, prio and device with
 * get_ufid_tc_mapping(); resolve the device's ifindex (failure is logged);
 * zero 'stats' and, if tc_get_flower() succeeds (returns 0), fill in the
 * final packet and byte counters and last-used time; delete the filter with
 * tc_del_filter(); finally drop the ufid mapping with
 * del_ufid_tc_mapping().
 *
 * NOTE(review): whether the stats block is guarded by a NULL check on
 * 'stats' is not visible here.  As in netdev_tc_flow_get(), no
 * netdev_close(dev) is visible for the reference taken by
 * get_ufid_tc_mapping() -- confirm.  The return statements are on skipped
 * lines. */
1102 netdev_tc_flow_del(struct netdev
*netdev OVS_UNUSED
,
1103 const ovs_u128
*ufid
,
1104 struct dpif_flow_stats
*stats
)
1106 struct tc_flower flower
;
1113 handle
= get_ufid_tc_mapping(ufid
, &prio
, &dev
);
1118 ifindex
= netdev_get_ifindex(dev
);
1120 VLOG_ERR_RL(&error_rl
, "flow_del: failed to get ifindex for %s: %s",
1121 netdev_get_name(dev
), ovs_strerror(-ifindex
));
1127 memset(stats
, 0, sizeof *stats
);
1128 if (!tc_get_flower(ifindex
, prio
, handle
, &flower
)) {
1129 stats
->n_packets
= get_32aligned_u64(&flower
.stats
.n_packets
);
1130 stats
->n_bytes
= get_32aligned_u64(&flower
.stats
.n_bytes
);
1131 stats
->used
= flower
.lastused
;
1135 error
= tc_del_filter(ifindex
, prio
, handle
);
1136 del_ufid_tc_mapping(ufid
);
/* netdev_tc_init_flow_api(netdev)
 *
 * Prepares 'netdev' for tc offloading.  It resolves the device's ifindex
 * (failure is logged) and calls tc_add_del_ingress_qdisc(ifindex, true),
 * which the error message below describes as adding the ingress qdisc
 * required for offloading.  An EEXIST result is not treated as a failure;
 * any other error is logged.  An informational message is logged for the
 * device at the end.
 * NOTE(review): the return statements, and whether the final VLOG_INFO is
 * also reached on the EEXIST path, are not visible in this listing. */
1144 netdev_tc_init_flow_api(struct netdev
*netdev
)
1149 ifindex
= netdev_get_ifindex(netdev
);
1151 VLOG_ERR_RL(&error_rl
, "init: failed to get ifindex for %s: %s",
1152 netdev_get_name(netdev
), ovs_strerror(-ifindex
));
1156 error
= tc_add_del_ingress_qdisc(ifindex
, true);
1158 if (error
&& error
!= EEXIST
) {
1159 VLOG_ERR("failed adding ingress qdisc required for offloading: %s",
1160 ovs_strerror(error
));
1164 VLOG_INFO("added ingress qdisc to %s", netdev_get_name(netdev
));