/*
 * Copyright (c) 2007-2009 Patrick McHardy <kaber@trash.net>
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License version 2 as
 * published by the Free Software Foundation.
 *
 * Development of this code funded by Astaro AG (http://www.astaro.com/)
 */
11 #include <linux/module.h>
12 #include <linux/init.h>
13 #include <linux/list.h>
14 #include <linux/skbuff.h>
15 #include <linux/netlink.h>
16 #include <linux/vmalloc.h>
17 #include <linux/netfilter.h>
18 #include <linux/netfilter/nfnetlink.h>
19 #include <linux/netfilter/nf_tables.h>
20 #include <net/netfilter/nf_flow_table.h>
21 #include <net/netfilter/nf_tables_core.h>
22 #include <net/netfilter/nf_tables.h>
23 #include <net/net_namespace.h>
/* File-scope list heads for expressions, objects and flowtables. */
static LIST_HEAD(nf_tables_expressions);
static LIST_HEAD(nf_tables_objects);
static LIST_HEAD(nf_tables_flowtables);
31 * nft_register_afinfo - register nf_tables address family info
33 * @afi: address family info to register
35 * Register the address family for use with nf_tables. Returns zero on
36 * success or a negative errno code otherwise.
38 int nft_register_afinfo(struct net
*net
, struct nft_af_info
*afi
)
40 INIT_LIST_HEAD(&afi
->tables
);
41 nfnl_lock(NFNL_SUBSYS_NFTABLES
);
42 list_add_tail_rcu(&afi
->list
, &net
->nft
.af_info
);
43 nfnl_unlock(NFNL_SUBSYS_NFTABLES
);
46 EXPORT_SYMBOL_GPL(nft_register_afinfo
);
48 static void __nft_release_afinfo(struct net
*net
, struct nft_af_info
*afi
);
51 * nft_unregister_afinfo - unregister nf_tables address family info
53 * @afi: address family info to unregister
55 * Unregister the address family for use with nf_tables.
57 void nft_unregister_afinfo(struct net
*net
, struct nft_af_info
*afi
)
59 nfnl_lock(NFNL_SUBSYS_NFTABLES
);
60 __nft_release_afinfo(net
, afi
);
61 list_del_rcu(&afi
->list
);
62 nfnl_unlock(NFNL_SUBSYS_NFTABLES
);
64 EXPORT_SYMBOL_GPL(nft_unregister_afinfo
);
66 static struct nft_af_info
*nft_afinfo_lookup(struct net
*net
, int family
)
68 struct nft_af_info
*afi
;
70 list_for_each_entry(afi
, &net
->nft
.af_info
, list
) {
71 if (afi
->family
== family
)
77 static struct nft_af_info
*
78 nf_tables_afinfo_lookup(struct net
*net
, int family
, bool autoload
)
80 struct nft_af_info
*afi
;
82 afi
= nft_afinfo_lookup(net
, family
);
87 nfnl_unlock(NFNL_SUBSYS_NFTABLES
);
88 request_module("nft-afinfo-%u", family
);
89 nfnl_lock(NFNL_SUBSYS_NFTABLES
);
90 afi
= nft_afinfo_lookup(net
, family
);
92 return ERR_PTR(-EAGAIN
);
95 return ERR_PTR(-EAFNOSUPPORT
);
98 static void nft_ctx_init(struct nft_ctx
*ctx
,
100 const struct sk_buff
*skb
,
101 const struct nlmsghdr
*nlh
,
102 struct nft_af_info
*afi
,
103 struct nft_table
*table
,
104 struct nft_chain
*chain
,
105 const struct nlattr
* const *nla
)
112 ctx
->portid
= NETLINK_CB(skb
).portid
;
113 ctx
->report
= nlmsg_report(nlh
);
114 ctx
->seq
= nlh
->nlmsg_seq
;
117 static struct nft_trans
*nft_trans_alloc_gfp(const struct nft_ctx
*ctx
,
118 int msg_type
, u32 size
, gfp_t gfp
)
120 struct nft_trans
*trans
;
122 trans
= kzalloc(sizeof(struct nft_trans
) + size
, gfp
);
126 trans
->msg_type
= msg_type
;
132 static struct nft_trans
*nft_trans_alloc(const struct nft_ctx
*ctx
,
133 int msg_type
, u32 size
)
135 return nft_trans_alloc_gfp(ctx
, msg_type
, size
, GFP_KERNEL
);
138 static void nft_trans_destroy(struct nft_trans
*trans
)
140 list_del(&trans
->list
);
144 static int nf_tables_register_hook(struct net
*net
,
145 const struct nft_table
*table
,
146 struct nft_chain
*chain
)
148 if (table
->flags
& NFT_TABLE_F_DORMANT
||
149 !nft_is_base_chain(chain
))
152 return nf_register_net_hook(net
, &nft_base_chain(chain
)->ops
);
155 static void nf_tables_unregister_hook(struct net
*net
,
156 const struct nft_table
*table
,
157 struct nft_chain
*chain
)
159 if (table
->flags
& NFT_TABLE_F_DORMANT
||
160 !nft_is_base_chain(chain
))
163 nf_unregister_net_hook(net
, &nft_base_chain(chain
)->ops
);
166 static int nft_trans_table_add(struct nft_ctx
*ctx
, int msg_type
)
168 struct nft_trans
*trans
;
170 trans
= nft_trans_alloc(ctx
, msg_type
, sizeof(struct nft_trans_table
));
174 if (msg_type
== NFT_MSG_NEWTABLE
)
175 nft_activate_next(ctx
->net
, ctx
->table
);
177 list_add_tail(&trans
->list
, &ctx
->net
->nft
.commit_list
);
181 static int nft_deltable(struct nft_ctx
*ctx
)
185 err
= nft_trans_table_add(ctx
, NFT_MSG_DELTABLE
);
189 nft_deactivate_next(ctx
->net
, ctx
->table
);
193 static int nft_trans_chain_add(struct nft_ctx
*ctx
, int msg_type
)
195 struct nft_trans
*trans
;
197 trans
= nft_trans_alloc(ctx
, msg_type
, sizeof(struct nft_trans_chain
));
201 if (msg_type
== NFT_MSG_NEWCHAIN
)
202 nft_activate_next(ctx
->net
, ctx
->chain
);
204 list_add_tail(&trans
->list
, &ctx
->net
->nft
.commit_list
);
208 static int nft_delchain(struct nft_ctx
*ctx
)
212 err
= nft_trans_chain_add(ctx
, NFT_MSG_DELCHAIN
);
217 nft_deactivate_next(ctx
->net
, ctx
->chain
);
223 nf_tables_delrule_deactivate(struct nft_ctx
*ctx
, struct nft_rule
*rule
)
225 /* You cannot delete the same rule twice */
226 if (nft_is_active_next(ctx
->net
, rule
)) {
227 nft_deactivate_next(ctx
->net
, rule
);
234 static struct nft_trans
*nft_trans_rule_add(struct nft_ctx
*ctx
, int msg_type
,
235 struct nft_rule
*rule
)
237 struct nft_trans
*trans
;
239 trans
= nft_trans_alloc(ctx
, msg_type
, sizeof(struct nft_trans_rule
));
243 if (msg_type
== NFT_MSG_NEWRULE
&& ctx
->nla
[NFTA_RULE_ID
] != NULL
) {
244 nft_trans_rule_id(trans
) =
245 ntohl(nla_get_be32(ctx
->nla
[NFTA_RULE_ID
]));
247 nft_trans_rule(trans
) = rule
;
248 list_add_tail(&trans
->list
, &ctx
->net
->nft
.commit_list
);
253 static int nft_delrule(struct nft_ctx
*ctx
, struct nft_rule
*rule
)
255 struct nft_trans
*trans
;
258 trans
= nft_trans_rule_add(ctx
, NFT_MSG_DELRULE
, rule
);
262 err
= nf_tables_delrule_deactivate(ctx
, rule
);
264 nft_trans_destroy(trans
);
271 static int nft_delrule_by_chain(struct nft_ctx
*ctx
)
273 struct nft_rule
*rule
;
276 list_for_each_entry(rule
, &ctx
->chain
->rules
, list
) {
277 err
= nft_delrule(ctx
, rule
);
284 static int nft_trans_set_add(struct nft_ctx
*ctx
, int msg_type
,
287 struct nft_trans
*trans
;
289 trans
= nft_trans_alloc(ctx
, msg_type
, sizeof(struct nft_trans_set
));
293 if (msg_type
== NFT_MSG_NEWSET
&& ctx
->nla
[NFTA_SET_ID
] != NULL
) {
294 nft_trans_set_id(trans
) =
295 ntohl(nla_get_be32(ctx
->nla
[NFTA_SET_ID
]));
296 nft_activate_next(ctx
->net
, set
);
298 nft_trans_set(trans
) = set
;
299 list_add_tail(&trans
->list
, &ctx
->net
->nft
.commit_list
);
304 static int nft_delset(struct nft_ctx
*ctx
, struct nft_set
*set
)
308 err
= nft_trans_set_add(ctx
, NFT_MSG_DELSET
, set
);
312 nft_deactivate_next(ctx
->net
, set
);
318 static int nft_trans_obj_add(struct nft_ctx
*ctx
, int msg_type
,
319 struct nft_object
*obj
)
321 struct nft_trans
*trans
;
323 trans
= nft_trans_alloc(ctx
, msg_type
, sizeof(struct nft_trans_obj
));
327 if (msg_type
== NFT_MSG_NEWOBJ
)
328 nft_activate_next(ctx
->net
, obj
);
330 nft_trans_obj(trans
) = obj
;
331 list_add_tail(&trans
->list
, &ctx
->net
->nft
.commit_list
);
336 static int nft_delobj(struct nft_ctx
*ctx
, struct nft_object
*obj
)
340 err
= nft_trans_obj_add(ctx
, NFT_MSG_DELOBJ
, obj
);
344 nft_deactivate_next(ctx
->net
, obj
);
350 static int nft_trans_flowtable_add(struct nft_ctx
*ctx
, int msg_type
,
351 struct nft_flowtable
*flowtable
)
353 struct nft_trans
*trans
;
355 trans
= nft_trans_alloc(ctx
, msg_type
,
356 sizeof(struct nft_trans_flowtable
));
360 if (msg_type
== NFT_MSG_NEWFLOWTABLE
)
361 nft_activate_next(ctx
->net
, flowtable
);
363 nft_trans_flowtable(trans
) = flowtable
;
364 list_add_tail(&trans
->list
, &ctx
->net
->nft
.commit_list
);
369 static int nft_delflowtable(struct nft_ctx
*ctx
,
370 struct nft_flowtable
*flowtable
)
374 err
= nft_trans_flowtable_add(ctx
, NFT_MSG_DELFLOWTABLE
, flowtable
);
378 nft_deactivate_next(ctx
->net
, flowtable
);
388 static struct nft_table
*nft_table_lookup(const struct nft_af_info
*afi
,
389 const struct nlattr
*nla
,
392 struct nft_table
*table
;
394 list_for_each_entry(table
, &afi
->tables
, list
) {
395 if (!nla_strcmp(nla
, table
->name
) &&
396 nft_active_genmask(table
, genmask
))
402 static struct nft_table
*nf_tables_table_lookup(const struct nft_af_info
*afi
,
403 const struct nlattr
*nla
,
406 struct nft_table
*table
;
409 return ERR_PTR(-EINVAL
);
411 table
= nft_table_lookup(afi
, nla
, genmask
);
415 return ERR_PTR(-ENOENT
);
418 static inline u64
nf_tables_alloc_handle(struct nft_table
*table
)
420 return ++table
->hgenerator
;
423 static const struct nf_chain_type
*chain_type
[NFPROTO_NUMPROTO
][NFT_CHAIN_T_MAX
];
425 static const struct nf_chain_type
*
426 __nf_tables_chain_type_lookup(int family
, const struct nlattr
*nla
)
430 for (i
= 0; i
< NFT_CHAIN_T_MAX
; i
++) {
431 if (chain_type
[family
][i
] != NULL
&&
432 !nla_strcmp(nla
, chain_type
[family
][i
]->name
))
433 return chain_type
[family
][i
];
438 static const struct nf_chain_type
*
439 nf_tables_chain_type_lookup(const struct nft_af_info
*afi
,
440 const struct nlattr
*nla
,
443 const struct nf_chain_type
*type
;
445 type
= __nf_tables_chain_type_lookup(afi
->family
, nla
);
448 #ifdef CONFIG_MODULES
450 nfnl_unlock(NFNL_SUBSYS_NFTABLES
);
451 request_module("nft-chain-%u-%.*s", afi
->family
,
452 nla_len(nla
), (const char *)nla_data(nla
));
453 nfnl_lock(NFNL_SUBSYS_NFTABLES
);
454 type
= __nf_tables_chain_type_lookup(afi
->family
, nla
);
456 return ERR_PTR(-EAGAIN
);
459 return ERR_PTR(-ENOENT
);
462 static const struct nla_policy nft_table_policy
[NFTA_TABLE_MAX
+ 1] = {
463 [NFTA_TABLE_NAME
] = { .type
= NLA_STRING
,
464 .len
= NFT_TABLE_MAXNAMELEN
- 1 },
465 [NFTA_TABLE_FLAGS
] = { .type
= NLA_U32
},
468 static int nf_tables_fill_table_info(struct sk_buff
*skb
, struct net
*net
,
469 u32 portid
, u32 seq
, int event
, u32 flags
,
470 int family
, const struct nft_table
*table
)
472 struct nlmsghdr
*nlh
;
473 struct nfgenmsg
*nfmsg
;
475 event
= nfnl_msg_type(NFNL_SUBSYS_NFTABLES
, event
);
476 nlh
= nlmsg_put(skb
, portid
, seq
, event
, sizeof(struct nfgenmsg
), flags
);
478 goto nla_put_failure
;
480 nfmsg
= nlmsg_data(nlh
);
481 nfmsg
->nfgen_family
= family
;
482 nfmsg
->version
= NFNETLINK_V0
;
483 nfmsg
->res_id
= htons(net
->nft
.base_seq
& 0xffff);
485 if (nla_put_string(skb
, NFTA_TABLE_NAME
, table
->name
) ||
486 nla_put_be32(skb
, NFTA_TABLE_FLAGS
, htonl(table
->flags
)) ||
487 nla_put_be32(skb
, NFTA_TABLE_USE
, htonl(table
->use
)))
488 goto nla_put_failure
;
494 nlmsg_trim(skb
, nlh
);
498 static void nf_tables_table_notify(const struct nft_ctx
*ctx
, int event
)
504 !nfnetlink_has_listeners(ctx
->net
, NFNLGRP_NFTABLES
))
507 skb
= nlmsg_new(NLMSG_GOODSIZE
, GFP_KERNEL
);
511 err
= nf_tables_fill_table_info(skb
, ctx
->net
, ctx
->portid
, ctx
->seq
,
512 event
, 0, ctx
->afi
->family
, ctx
->table
);
518 nfnetlink_send(skb
, ctx
->net
, ctx
->portid
, NFNLGRP_NFTABLES
,
519 ctx
->report
, GFP_KERNEL
);
522 nfnetlink_set_err(ctx
->net
, ctx
->portid
, NFNLGRP_NFTABLES
, -ENOBUFS
);
525 static int nf_tables_dump_tables(struct sk_buff
*skb
,
526 struct netlink_callback
*cb
)
528 const struct nfgenmsg
*nfmsg
= nlmsg_data(cb
->nlh
);
529 const struct nft_af_info
*afi
;
530 const struct nft_table
*table
;
531 unsigned int idx
= 0, s_idx
= cb
->args
[0];
532 struct net
*net
= sock_net(skb
->sk
);
533 int family
= nfmsg
->nfgen_family
;
536 cb
->seq
= net
->nft
.base_seq
;
538 list_for_each_entry_rcu(afi
, &net
->nft
.af_info
, list
) {
539 if (family
!= NFPROTO_UNSPEC
&& family
!= afi
->family
)
542 list_for_each_entry_rcu(table
, &afi
->tables
, list
) {
546 memset(&cb
->args
[1], 0,
547 sizeof(cb
->args
) - sizeof(cb
->args
[0]));
548 if (!nft_is_active(net
, table
))
550 if (nf_tables_fill_table_info(skb
, net
,
551 NETLINK_CB(cb
->skb
).portid
,
555 afi
->family
, table
) < 0)
558 nl_dump_check_consistent(cb
, nlmsg_hdr(skb
));
569 static int nf_tables_gettable(struct net
*net
, struct sock
*nlsk
,
570 struct sk_buff
*skb
, const struct nlmsghdr
*nlh
,
571 const struct nlattr
* const nla
[],
572 struct netlink_ext_ack
*extack
)
574 const struct nfgenmsg
*nfmsg
= nlmsg_data(nlh
);
575 u8 genmask
= nft_genmask_cur(net
);
576 const struct nft_af_info
*afi
;
577 const struct nft_table
*table
;
578 struct sk_buff
*skb2
;
579 int family
= nfmsg
->nfgen_family
;
582 if (nlh
->nlmsg_flags
& NLM_F_DUMP
) {
583 struct netlink_dump_control c
= {
584 .dump
= nf_tables_dump_tables
,
586 return netlink_dump_start(nlsk
, skb
, nlh
, &c
);
589 afi
= nf_tables_afinfo_lookup(net
, family
, false);
593 table
= nf_tables_table_lookup(afi
, nla
[NFTA_TABLE_NAME
], genmask
);
595 return PTR_ERR(table
);
597 skb2
= alloc_skb(NLMSG_GOODSIZE
, GFP_KERNEL
);
601 err
= nf_tables_fill_table_info(skb2
, net
, NETLINK_CB(skb
).portid
,
602 nlh
->nlmsg_seq
, NFT_MSG_NEWTABLE
, 0,
607 return nlmsg_unicast(nlsk
, skb2
, NETLINK_CB(skb
).portid
);
614 static void _nf_tables_table_disable(struct net
*net
,
615 const struct nft_af_info
*afi
,
616 struct nft_table
*table
,
619 struct nft_chain
*chain
;
622 list_for_each_entry(chain
, &table
->chains
, list
) {
623 if (!nft_is_active_next(net
, chain
))
625 if (!nft_is_base_chain(chain
))
628 if (cnt
&& i
++ == cnt
)
631 nf_unregister_net_hook(net
, &nft_base_chain(chain
)->ops
);
635 static int nf_tables_table_enable(struct net
*net
,
636 const struct nft_af_info
*afi
,
637 struct nft_table
*table
)
639 struct nft_chain
*chain
;
642 list_for_each_entry(chain
, &table
->chains
, list
) {
643 if (!nft_is_active_next(net
, chain
))
645 if (!nft_is_base_chain(chain
))
648 err
= nf_register_net_hook(net
, &nft_base_chain(chain
)->ops
);
657 _nf_tables_table_disable(net
, afi
, table
, i
);
/* Unregister the hooks of all active base chains of @table. */
static void nf_tables_table_disable(struct net *net,
				    const struct nft_af_info *afi,
				    struct nft_table *table)
{
	_nf_tables_table_disable(net, afi, table, 0);
}
668 static int nf_tables_updtable(struct nft_ctx
*ctx
)
670 struct nft_trans
*trans
;
674 if (!ctx
->nla
[NFTA_TABLE_FLAGS
])
677 flags
= ntohl(nla_get_be32(ctx
->nla
[NFTA_TABLE_FLAGS
]));
678 if (flags
& ~NFT_TABLE_F_DORMANT
)
681 if (flags
== ctx
->table
->flags
)
684 trans
= nft_trans_alloc(ctx
, NFT_MSG_NEWTABLE
,
685 sizeof(struct nft_trans_table
));
689 if ((flags
& NFT_TABLE_F_DORMANT
) &&
690 !(ctx
->table
->flags
& NFT_TABLE_F_DORMANT
)) {
691 nft_trans_table_enable(trans
) = false;
692 } else if (!(flags
& NFT_TABLE_F_DORMANT
) &&
693 ctx
->table
->flags
& NFT_TABLE_F_DORMANT
) {
694 ret
= nf_tables_table_enable(ctx
->net
, ctx
->afi
, ctx
->table
);
696 ctx
->table
->flags
&= ~NFT_TABLE_F_DORMANT
;
697 nft_trans_table_enable(trans
) = true;
703 nft_trans_table_update(trans
) = true;
704 list_add_tail(&trans
->list
, &ctx
->net
->nft
.commit_list
);
707 nft_trans_destroy(trans
);
711 static int nf_tables_newtable(struct net
*net
, struct sock
*nlsk
,
712 struct sk_buff
*skb
, const struct nlmsghdr
*nlh
,
713 const struct nlattr
* const nla
[],
714 struct netlink_ext_ack
*extack
)
716 const struct nfgenmsg
*nfmsg
= nlmsg_data(nlh
);
717 u8 genmask
= nft_genmask_next(net
);
718 const struct nlattr
*name
;
719 struct nft_af_info
*afi
;
720 struct nft_table
*table
;
721 int family
= nfmsg
->nfgen_family
;
726 afi
= nf_tables_afinfo_lookup(net
, family
, true);
730 name
= nla
[NFTA_TABLE_NAME
];
731 table
= nf_tables_table_lookup(afi
, name
, genmask
);
733 if (PTR_ERR(table
) != -ENOENT
)
734 return PTR_ERR(table
);
736 if (nlh
->nlmsg_flags
& NLM_F_EXCL
)
738 if (nlh
->nlmsg_flags
& NLM_F_REPLACE
)
741 nft_ctx_init(&ctx
, net
, skb
, nlh
, afi
, table
, NULL
, nla
);
742 return nf_tables_updtable(&ctx
);
745 if (nla
[NFTA_TABLE_FLAGS
]) {
746 flags
= ntohl(nla_get_be32(nla
[NFTA_TABLE_FLAGS
]));
747 if (flags
& ~NFT_TABLE_F_DORMANT
)
752 if (!try_module_get(afi
->owner
))
756 table
= kzalloc(sizeof(*table
), GFP_KERNEL
);
760 table
->name
= nla_strdup(name
, GFP_KERNEL
);
761 if (table
->name
== NULL
)
764 INIT_LIST_HEAD(&table
->chains
);
765 INIT_LIST_HEAD(&table
->sets
);
766 INIT_LIST_HEAD(&table
->objects
);
767 INIT_LIST_HEAD(&table
->flowtables
);
768 table
->flags
= flags
;
770 nft_ctx_init(&ctx
, net
, skb
, nlh
, afi
, table
, NULL
, nla
);
771 err
= nft_trans_table_add(&ctx
, NFT_MSG_NEWTABLE
);
775 list_add_tail_rcu(&table
->list
, &afi
->tables
);
782 module_put(afi
->owner
);
787 static int nft_flush_table(struct nft_ctx
*ctx
)
789 struct nft_flowtable
*flowtable
, *nft
;
790 struct nft_chain
*chain
, *nc
;
791 struct nft_object
*obj
, *ne
;
792 struct nft_set
*set
, *ns
;
795 list_for_each_entry(chain
, &ctx
->table
->chains
, list
) {
796 if (!nft_is_active_next(ctx
->net
, chain
))
801 err
= nft_delrule_by_chain(ctx
);
806 list_for_each_entry_safe(set
, ns
, &ctx
->table
->sets
, list
) {
807 if (!nft_is_active_next(ctx
->net
, set
))
810 if (nft_set_is_anonymous(set
) &&
811 !list_empty(&set
->bindings
))
814 err
= nft_delset(ctx
, set
);
819 list_for_each_entry_safe(flowtable
, nft
, &ctx
->table
->flowtables
, list
) {
820 err
= nft_delflowtable(ctx
, flowtable
);
825 list_for_each_entry_safe(obj
, ne
, &ctx
->table
->objects
, list
) {
826 err
= nft_delobj(ctx
, obj
);
831 list_for_each_entry_safe(chain
, nc
, &ctx
->table
->chains
, list
) {
832 if (!nft_is_active_next(ctx
->net
, chain
))
837 err
= nft_delchain(ctx
);
842 err
= nft_deltable(ctx
);
847 static int nft_flush(struct nft_ctx
*ctx
, int family
)
849 struct nft_af_info
*afi
;
850 struct nft_table
*table
, *nt
;
851 const struct nlattr
* const *nla
= ctx
->nla
;
854 list_for_each_entry(afi
, &ctx
->net
->nft
.af_info
, list
) {
855 if (family
!= AF_UNSPEC
&& afi
->family
!= family
)
859 list_for_each_entry_safe(table
, nt
, &afi
->tables
, list
) {
860 if (!nft_is_active_next(ctx
->net
, table
))
863 if (nla
[NFTA_TABLE_NAME
] &&
864 nla_strcmp(nla
[NFTA_TABLE_NAME
], table
->name
) != 0)
869 err
= nft_flush_table(ctx
);
878 static int nf_tables_deltable(struct net
*net
, struct sock
*nlsk
,
879 struct sk_buff
*skb
, const struct nlmsghdr
*nlh
,
880 const struct nlattr
* const nla
[],
881 struct netlink_ext_ack
*extack
)
883 const struct nfgenmsg
*nfmsg
= nlmsg_data(nlh
);
884 u8 genmask
= nft_genmask_next(net
);
885 struct nft_af_info
*afi
;
886 struct nft_table
*table
;
887 int family
= nfmsg
->nfgen_family
;
890 nft_ctx_init(&ctx
, net
, skb
, nlh
, NULL
, NULL
, NULL
, nla
);
891 if (family
== AF_UNSPEC
|| nla
[NFTA_TABLE_NAME
] == NULL
)
892 return nft_flush(&ctx
, family
);
894 afi
= nf_tables_afinfo_lookup(net
, family
, false);
898 table
= nf_tables_table_lookup(afi
, nla
[NFTA_TABLE_NAME
], genmask
);
900 return PTR_ERR(table
);
902 if (nlh
->nlmsg_flags
& NLM_F_NONREC
&&
909 return nft_flush_table(&ctx
);
912 static void nf_tables_table_destroy(struct nft_ctx
*ctx
)
914 BUG_ON(ctx
->table
->use
> 0);
916 kfree(ctx
->table
->name
);
918 module_put(ctx
->afi
->owner
);
921 int nft_register_chain_type(const struct nf_chain_type
*ctype
)
925 if (WARN_ON(ctype
->family
>= NFPROTO_NUMPROTO
))
928 nfnl_lock(NFNL_SUBSYS_NFTABLES
);
929 if (chain_type
[ctype
->family
][ctype
->type
] != NULL
) {
933 chain_type
[ctype
->family
][ctype
->type
] = ctype
;
935 nfnl_unlock(NFNL_SUBSYS_NFTABLES
);
938 EXPORT_SYMBOL_GPL(nft_register_chain_type
);
940 void nft_unregister_chain_type(const struct nf_chain_type
*ctype
)
942 nfnl_lock(NFNL_SUBSYS_NFTABLES
);
943 chain_type
[ctype
->family
][ctype
->type
] = NULL
;
944 nfnl_unlock(NFNL_SUBSYS_NFTABLES
);
946 EXPORT_SYMBOL_GPL(nft_unregister_chain_type
);
952 static struct nft_chain
*
953 nf_tables_chain_lookup_byhandle(const struct nft_table
*table
, u64 handle
,
956 struct nft_chain
*chain
;
958 list_for_each_entry(chain
, &table
->chains
, list
) {
959 if (chain
->handle
== handle
&&
960 nft_active_genmask(chain
, genmask
))
964 return ERR_PTR(-ENOENT
);
967 static struct nft_chain
*nf_tables_chain_lookup(const struct nft_table
*table
,
968 const struct nlattr
*nla
,
971 struct nft_chain
*chain
;
974 return ERR_PTR(-EINVAL
);
976 list_for_each_entry(chain
, &table
->chains
, list
) {
977 if (!nla_strcmp(nla
, chain
->name
) &&
978 nft_active_genmask(chain
, genmask
))
982 return ERR_PTR(-ENOENT
);
985 static const struct nla_policy nft_chain_policy
[NFTA_CHAIN_MAX
+ 1] = {
986 [NFTA_CHAIN_TABLE
] = { .type
= NLA_STRING
,
987 .len
= NFT_TABLE_MAXNAMELEN
- 1 },
988 [NFTA_CHAIN_HANDLE
] = { .type
= NLA_U64
},
989 [NFTA_CHAIN_NAME
] = { .type
= NLA_STRING
,
990 .len
= NFT_CHAIN_MAXNAMELEN
- 1 },
991 [NFTA_CHAIN_HOOK
] = { .type
= NLA_NESTED
},
992 [NFTA_CHAIN_POLICY
] = { .type
= NLA_U32
},
993 [NFTA_CHAIN_TYPE
] = { .type
= NLA_STRING
},
994 [NFTA_CHAIN_COUNTERS
] = { .type
= NLA_NESTED
},
997 static const struct nla_policy nft_hook_policy
[NFTA_HOOK_MAX
+ 1] = {
998 [NFTA_HOOK_HOOKNUM
] = { .type
= NLA_U32
},
999 [NFTA_HOOK_PRIORITY
] = { .type
= NLA_U32
},
1000 [NFTA_HOOK_DEV
] = { .type
= NLA_STRING
,
1001 .len
= IFNAMSIZ
- 1 },
1004 static int nft_dump_stats(struct sk_buff
*skb
, struct nft_stats __percpu
*stats
)
1006 struct nft_stats
*cpu_stats
, total
;
1007 struct nlattr
*nest
;
1012 memset(&total
, 0, sizeof(total
));
1013 for_each_possible_cpu(cpu
) {
1014 cpu_stats
= per_cpu_ptr(stats
, cpu
);
1016 seq
= u64_stats_fetch_begin_irq(&cpu_stats
->syncp
);
1017 pkts
= cpu_stats
->pkts
;
1018 bytes
= cpu_stats
->bytes
;
1019 } while (u64_stats_fetch_retry_irq(&cpu_stats
->syncp
, seq
));
1021 total
.bytes
+= bytes
;
1023 nest
= nla_nest_start(skb
, NFTA_CHAIN_COUNTERS
);
1025 goto nla_put_failure
;
1027 if (nla_put_be64(skb
, NFTA_COUNTER_PACKETS
, cpu_to_be64(total
.pkts
),
1028 NFTA_COUNTER_PAD
) ||
1029 nla_put_be64(skb
, NFTA_COUNTER_BYTES
, cpu_to_be64(total
.bytes
),
1031 goto nla_put_failure
;
1033 nla_nest_end(skb
, nest
);
1040 static int nf_tables_fill_chain_info(struct sk_buff
*skb
, struct net
*net
,
1041 u32 portid
, u32 seq
, int event
, u32 flags
,
1042 int family
, const struct nft_table
*table
,
1043 const struct nft_chain
*chain
)
1045 struct nlmsghdr
*nlh
;
1046 struct nfgenmsg
*nfmsg
;
1048 event
= nfnl_msg_type(NFNL_SUBSYS_NFTABLES
, event
);
1049 nlh
= nlmsg_put(skb
, portid
, seq
, event
, sizeof(struct nfgenmsg
), flags
);
1051 goto nla_put_failure
;
1053 nfmsg
= nlmsg_data(nlh
);
1054 nfmsg
->nfgen_family
= family
;
1055 nfmsg
->version
= NFNETLINK_V0
;
1056 nfmsg
->res_id
= htons(net
->nft
.base_seq
& 0xffff);
1058 if (nla_put_string(skb
, NFTA_CHAIN_TABLE
, table
->name
))
1059 goto nla_put_failure
;
1060 if (nla_put_be64(skb
, NFTA_CHAIN_HANDLE
, cpu_to_be64(chain
->handle
),
1062 goto nla_put_failure
;
1063 if (nla_put_string(skb
, NFTA_CHAIN_NAME
, chain
->name
))
1064 goto nla_put_failure
;
1066 if (nft_is_base_chain(chain
)) {
1067 const struct nft_base_chain
*basechain
= nft_base_chain(chain
);
1068 const struct nf_hook_ops
*ops
= &basechain
->ops
;
1069 struct nlattr
*nest
;
1071 nest
= nla_nest_start(skb
, NFTA_CHAIN_HOOK
);
1073 goto nla_put_failure
;
1074 if (nla_put_be32(skb
, NFTA_HOOK_HOOKNUM
, htonl(ops
->hooknum
)))
1075 goto nla_put_failure
;
1076 if (nla_put_be32(skb
, NFTA_HOOK_PRIORITY
, htonl(ops
->priority
)))
1077 goto nla_put_failure
;
1078 if (basechain
->dev_name
[0] &&
1079 nla_put_string(skb
, NFTA_HOOK_DEV
, basechain
->dev_name
))
1080 goto nla_put_failure
;
1081 nla_nest_end(skb
, nest
);
1083 if (nla_put_be32(skb
, NFTA_CHAIN_POLICY
,
1084 htonl(basechain
->policy
)))
1085 goto nla_put_failure
;
1087 if (nla_put_string(skb
, NFTA_CHAIN_TYPE
, basechain
->type
->name
))
1088 goto nla_put_failure
;
1090 if (basechain
->stats
&& nft_dump_stats(skb
, basechain
->stats
))
1091 goto nla_put_failure
;
1094 if (nla_put_be32(skb
, NFTA_CHAIN_USE
, htonl(chain
->use
)))
1095 goto nla_put_failure
;
1097 nlmsg_end(skb
, nlh
);
1101 nlmsg_trim(skb
, nlh
);
1105 static void nf_tables_chain_notify(const struct nft_ctx
*ctx
, int event
)
1107 struct sk_buff
*skb
;
1111 !nfnetlink_has_listeners(ctx
->net
, NFNLGRP_NFTABLES
))
1114 skb
= nlmsg_new(NLMSG_GOODSIZE
, GFP_KERNEL
);
1118 err
= nf_tables_fill_chain_info(skb
, ctx
->net
, ctx
->portid
, ctx
->seq
,
1119 event
, 0, ctx
->afi
->family
, ctx
->table
,
1126 nfnetlink_send(skb
, ctx
->net
, ctx
->portid
, NFNLGRP_NFTABLES
,
1127 ctx
->report
, GFP_KERNEL
);
1130 nfnetlink_set_err(ctx
->net
, ctx
->portid
, NFNLGRP_NFTABLES
, -ENOBUFS
);
1133 static int nf_tables_dump_chains(struct sk_buff
*skb
,
1134 struct netlink_callback
*cb
)
1136 const struct nfgenmsg
*nfmsg
= nlmsg_data(cb
->nlh
);
1137 const struct nft_af_info
*afi
;
1138 const struct nft_table
*table
;
1139 const struct nft_chain
*chain
;
1140 unsigned int idx
= 0, s_idx
= cb
->args
[0];
1141 struct net
*net
= sock_net(skb
->sk
);
1142 int family
= nfmsg
->nfgen_family
;
1145 cb
->seq
= net
->nft
.base_seq
;
1147 list_for_each_entry_rcu(afi
, &net
->nft
.af_info
, list
) {
1148 if (family
!= NFPROTO_UNSPEC
&& family
!= afi
->family
)
1151 list_for_each_entry_rcu(table
, &afi
->tables
, list
) {
1152 list_for_each_entry_rcu(chain
, &table
->chains
, list
) {
1156 memset(&cb
->args
[1], 0,
1157 sizeof(cb
->args
) - sizeof(cb
->args
[0]));
1158 if (!nft_is_active(net
, chain
))
1160 if (nf_tables_fill_chain_info(skb
, net
,
1161 NETLINK_CB(cb
->skb
).portid
,
1165 afi
->family
, table
, chain
) < 0)
1168 nl_dump_check_consistent(cb
, nlmsg_hdr(skb
));
1180 static int nf_tables_getchain(struct net
*net
, struct sock
*nlsk
,
1181 struct sk_buff
*skb
, const struct nlmsghdr
*nlh
,
1182 const struct nlattr
* const nla
[],
1183 struct netlink_ext_ack
*extack
)
1185 const struct nfgenmsg
*nfmsg
= nlmsg_data(nlh
);
1186 u8 genmask
= nft_genmask_cur(net
);
1187 const struct nft_af_info
*afi
;
1188 const struct nft_table
*table
;
1189 const struct nft_chain
*chain
;
1190 struct sk_buff
*skb2
;
1191 int family
= nfmsg
->nfgen_family
;
1194 if (nlh
->nlmsg_flags
& NLM_F_DUMP
) {
1195 struct netlink_dump_control c
= {
1196 .dump
= nf_tables_dump_chains
,
1198 return netlink_dump_start(nlsk
, skb
, nlh
, &c
);
1201 afi
= nf_tables_afinfo_lookup(net
, family
, false);
1203 return PTR_ERR(afi
);
1205 table
= nf_tables_table_lookup(afi
, nla
[NFTA_CHAIN_TABLE
], genmask
);
1207 return PTR_ERR(table
);
1209 chain
= nf_tables_chain_lookup(table
, nla
[NFTA_CHAIN_NAME
], genmask
);
1211 return PTR_ERR(chain
);
1213 skb2
= alloc_skb(NLMSG_GOODSIZE
, GFP_KERNEL
);
1217 err
= nf_tables_fill_chain_info(skb2
, net
, NETLINK_CB(skb
).portid
,
1218 nlh
->nlmsg_seq
, NFT_MSG_NEWCHAIN
, 0,
1219 family
, table
, chain
);
1223 return nlmsg_unicast(nlsk
, skb2
, NETLINK_CB(skb
).portid
);
1230 static const struct nla_policy nft_counter_policy
[NFTA_COUNTER_MAX
+ 1] = {
1231 [NFTA_COUNTER_PACKETS
] = { .type
= NLA_U64
},
1232 [NFTA_COUNTER_BYTES
] = { .type
= NLA_U64
},
1235 static struct nft_stats __percpu
*nft_stats_alloc(const struct nlattr
*attr
)
1237 struct nlattr
*tb
[NFTA_COUNTER_MAX
+1];
1238 struct nft_stats __percpu
*newstats
;
1239 struct nft_stats
*stats
;
1242 err
= nla_parse_nested(tb
, NFTA_COUNTER_MAX
, attr
, nft_counter_policy
,
1245 return ERR_PTR(err
);
1247 if (!tb
[NFTA_COUNTER_BYTES
] || !tb
[NFTA_COUNTER_PACKETS
])
1248 return ERR_PTR(-EINVAL
);
1250 newstats
= netdev_alloc_pcpu_stats(struct nft_stats
);
1251 if (newstats
== NULL
)
1252 return ERR_PTR(-ENOMEM
);
1254 /* Restore old counters on this cpu, no problem. Per-cpu statistics
1255 * are not exposed to userspace.
1258 stats
= this_cpu_ptr(newstats
);
1259 stats
->bytes
= be64_to_cpu(nla_get_be64(tb
[NFTA_COUNTER_BYTES
]));
1260 stats
->pkts
= be64_to_cpu(nla_get_be64(tb
[NFTA_COUNTER_PACKETS
]));
1266 static void nft_chain_stats_replace(struct nft_base_chain
*chain
,
1267 struct nft_stats __percpu
*newstats
)
1269 struct nft_stats __percpu
*oldstats
;
1271 if (newstats
== NULL
)
1275 oldstats
= nfnl_dereference(chain
->stats
, NFNL_SUBSYS_NFTABLES
);
1276 rcu_assign_pointer(chain
->stats
, newstats
);
1278 free_percpu(oldstats
);
1280 rcu_assign_pointer(chain
->stats
, newstats
);
1283 static void nf_tables_chain_destroy(struct nft_chain
*chain
)
1285 BUG_ON(chain
->use
> 0);
1287 if (nft_is_base_chain(chain
)) {
1288 struct nft_base_chain
*basechain
= nft_base_chain(chain
);
1290 module_put(basechain
->type
->owner
);
1291 free_percpu(basechain
->stats
);
1292 if (basechain
->stats
)
1293 static_branch_dec(&nft_counters_enabled
);
1294 if (basechain
->ops
.dev
!= NULL
)
1295 dev_put(basechain
->ops
.dev
);
1304 struct nft_chain_hook
{
1307 const struct nf_chain_type
*type
;
1308 struct net_device
*dev
;
1311 static int nft_chain_parse_hook(struct net
*net
,
1312 const struct nlattr
* const nla
[],
1313 struct nft_af_info
*afi
,
1314 struct nft_chain_hook
*hook
, bool create
)
1316 struct nlattr
*ha
[NFTA_HOOK_MAX
+ 1];
1317 const struct nf_chain_type
*type
;
1318 struct net_device
*dev
;
1321 err
= nla_parse_nested(ha
, NFTA_HOOK_MAX
, nla
[NFTA_CHAIN_HOOK
],
1322 nft_hook_policy
, NULL
);
1326 if (ha
[NFTA_HOOK_HOOKNUM
] == NULL
||
1327 ha
[NFTA_HOOK_PRIORITY
] == NULL
)
1330 hook
->num
= ntohl(nla_get_be32(ha
[NFTA_HOOK_HOOKNUM
]));
1331 if (hook
->num
>= afi
->nhooks
)
1334 hook
->priority
= ntohl(nla_get_be32(ha
[NFTA_HOOK_PRIORITY
]));
1336 type
= chain_type
[afi
->family
][NFT_CHAIN_T_DEFAULT
];
1337 if (nla
[NFTA_CHAIN_TYPE
]) {
1338 type
= nf_tables_chain_type_lookup(afi
, nla
[NFTA_CHAIN_TYPE
],
1341 return PTR_ERR(type
);
1343 if (!(type
->hook_mask
& (1 << hook
->num
)))
1346 if (type
->type
== NFT_CHAIN_T_NAT
&&
1347 hook
->priority
<= NF_IP_PRI_CONNTRACK
)
1350 if (!try_module_get(type
->owner
))
1356 if (afi
->flags
& NFT_AF_NEEDS_DEV
) {
1357 char ifname
[IFNAMSIZ
];
1359 if (!ha
[NFTA_HOOK_DEV
]) {
1360 module_put(type
->owner
);
1364 nla_strlcpy(ifname
, ha
[NFTA_HOOK_DEV
], IFNAMSIZ
);
1365 dev
= dev_get_by_name(net
, ifname
);
1367 module_put(type
->owner
);
1371 } else if (ha
[NFTA_HOOK_DEV
]) {
1372 module_put(type
->owner
);
1379 static void nft_chain_release_hook(struct nft_chain_hook
*hook
)
1381 module_put(hook
->type
->owner
);
1382 if (hook
->dev
!= NULL
)
1386 static int nf_tables_addchain(struct nft_ctx
*ctx
, u8 family
, u8 genmask
,
1387 u8 policy
, bool create
)
1389 const struct nlattr
* const *nla
= ctx
->nla
;
1390 struct nft_table
*table
= ctx
->table
;
1391 struct nft_af_info
*afi
= ctx
->afi
;
1392 struct nft_base_chain
*basechain
;
1393 struct nft_stats __percpu
*stats
;
1394 struct net
*net
= ctx
->net
;
1395 struct nft_chain
*chain
;
1398 if (table
->use
== UINT_MAX
)
1401 if (nla
[NFTA_CHAIN_HOOK
]) {
1402 struct nft_chain_hook hook
;
1403 struct nf_hook_ops
*ops
;
1405 err
= nft_chain_parse_hook(net
, nla
, afi
, &hook
, create
);
1409 basechain
= kzalloc(sizeof(*basechain
), GFP_KERNEL
);
1410 if (basechain
== NULL
) {
1411 nft_chain_release_hook(&hook
);
1415 if (hook
.dev
!= NULL
)
1416 strncpy(basechain
->dev_name
, hook
.dev
->name
, IFNAMSIZ
);
1418 if (nla
[NFTA_CHAIN_COUNTERS
]) {
1419 stats
= nft_stats_alloc(nla
[NFTA_CHAIN_COUNTERS
]);
1420 if (IS_ERR(stats
)) {
1421 nft_chain_release_hook(&hook
);
1423 return PTR_ERR(stats
);
1425 basechain
->stats
= stats
;
1426 static_branch_inc(&nft_counters_enabled
);
1429 basechain
->type
= hook
.type
;
1430 chain
= &basechain
->chain
;
1432 ops
= &basechain
->ops
;
1434 ops
->hooknum
= hook
.num
;
1435 ops
->priority
= hook
.priority
;
1437 ops
->hook
= hook
.type
->hooks
[ops
->hooknum
];
1438 ops
->dev
= hook
.dev
;
1440 if (basechain
->type
->type
== NFT_CHAIN_T_NAT
)
1441 ops
->nat_hook
= true;
1443 chain
->flags
|= NFT_BASE_CHAIN
;
1444 basechain
->policy
= policy
;
1446 chain
= kzalloc(sizeof(*chain
), GFP_KERNEL
);
1450 INIT_LIST_HEAD(&chain
->rules
);
1451 chain
->handle
= nf_tables_alloc_handle(table
);
1452 chain
->table
= table
;
1453 chain
->name
= nla_strdup(nla
[NFTA_CHAIN_NAME
], GFP_KERNEL
);
1459 err
= nf_tables_register_hook(net
, table
, chain
);
1464 err
= nft_trans_chain_add(ctx
, NFT_MSG_NEWCHAIN
);
1469 list_add_tail_rcu(&chain
->list
, &table
->chains
);
1473 nf_tables_unregister_hook(net
, table
, chain
);
1475 nf_tables_chain_destroy(chain
);
1480 static int nf_tables_updchain(struct nft_ctx
*ctx
, u8 genmask
, u8 policy
,
1483 const struct nlattr
* const *nla
= ctx
->nla
;
1484 struct nft_table
*table
= ctx
->table
;
1485 struct nft_chain
*chain
= ctx
->chain
;
1486 struct nft_base_chain
*basechain
;
1487 struct nft_stats
*stats
= NULL
;
1488 struct nft_chain_hook hook
;
1489 const struct nlattr
*name
;
1490 struct nf_hook_ops
*ops
;
1491 struct nft_trans
*trans
;
1494 if (nla
[NFTA_CHAIN_HOOK
]) {
1495 if (!nft_is_base_chain(chain
))
1498 err
= nft_chain_parse_hook(ctx
->net
, nla
, ctx
->afi
, &hook
,
1503 basechain
= nft_base_chain(chain
);
1504 if (basechain
->type
!= hook
.type
) {
1505 nft_chain_release_hook(&hook
);
1509 ops
= &basechain
->ops
;
1510 if (ops
->hooknum
!= hook
.num
||
1511 ops
->priority
!= hook
.priority
||
1512 ops
->dev
!= hook
.dev
) {
1513 nft_chain_release_hook(&hook
);
1516 nft_chain_release_hook(&hook
);
1519 if (nla
[NFTA_CHAIN_HANDLE
] &&
1520 nla
[NFTA_CHAIN_NAME
]) {
1521 struct nft_chain
*chain2
;
1523 chain2
= nf_tables_chain_lookup(table
, nla
[NFTA_CHAIN_NAME
],
1525 if (!IS_ERR(chain2
))
1529 if (nla
[NFTA_CHAIN_COUNTERS
]) {
1530 if (!nft_is_base_chain(chain
))
1533 stats
= nft_stats_alloc(nla
[NFTA_CHAIN_COUNTERS
]);
1535 return PTR_ERR(stats
);
1538 trans
= nft_trans_alloc(ctx
, NFT_MSG_NEWCHAIN
,
1539 sizeof(struct nft_trans_chain
));
1540 if (trans
== NULL
) {
1545 nft_trans_chain_stats(trans
) = stats
;
1546 nft_trans_chain_update(trans
) = true;
1548 if (nla
[NFTA_CHAIN_POLICY
])
1549 nft_trans_chain_policy(trans
) = policy
;
1551 nft_trans_chain_policy(trans
) = -1;
1553 name
= nla
[NFTA_CHAIN_NAME
];
1554 if (nla
[NFTA_CHAIN_HANDLE
] && name
) {
1555 nft_trans_chain_name(trans
) =
1556 nla_strdup(name
, GFP_KERNEL
);
1557 if (!nft_trans_chain_name(trans
)) {
1563 list_add_tail(&trans
->list
, &ctx
->net
->nft
.commit_list
);
1568 static int nf_tables_newchain(struct net
*net
, struct sock
*nlsk
,
1569 struct sk_buff
*skb
, const struct nlmsghdr
*nlh
,
1570 const struct nlattr
* const nla
[],
1571 struct netlink_ext_ack
*extack
)
1573 const struct nfgenmsg
*nfmsg
= nlmsg_data(nlh
);
1574 const struct nlattr
* uninitialized_var(name
);
1575 u8 genmask
= nft_genmask_next(net
);
1576 int family
= nfmsg
->nfgen_family
;
1577 struct nft_af_info
*afi
;
1578 struct nft_table
*table
;
1579 struct nft_chain
*chain
;
1580 u8 policy
= NF_ACCEPT
;
1585 create
= nlh
->nlmsg_flags
& NLM_F_CREATE
? true : false;
1587 afi
= nf_tables_afinfo_lookup(net
, family
, true);
1589 return PTR_ERR(afi
);
1591 table
= nf_tables_table_lookup(afi
, nla
[NFTA_CHAIN_TABLE
], genmask
);
1593 return PTR_ERR(table
);
1596 name
= nla
[NFTA_CHAIN_NAME
];
1598 if (nla
[NFTA_CHAIN_HANDLE
]) {
1599 handle
= be64_to_cpu(nla_get_be64(nla
[NFTA_CHAIN_HANDLE
]));
1600 chain
= nf_tables_chain_lookup_byhandle(table
, handle
, genmask
);
1602 return PTR_ERR(chain
);
1604 chain
= nf_tables_chain_lookup(table
, name
, genmask
);
1605 if (IS_ERR(chain
)) {
1606 if (PTR_ERR(chain
) != -ENOENT
)
1607 return PTR_ERR(chain
);
1612 if (nla
[NFTA_CHAIN_POLICY
]) {
1613 if (chain
!= NULL
&&
1614 !nft_is_base_chain(chain
))
1617 if (chain
== NULL
&&
1618 nla
[NFTA_CHAIN_HOOK
] == NULL
)
1621 policy
= ntohl(nla_get_be32(nla
[NFTA_CHAIN_POLICY
]));
1631 nft_ctx_init(&ctx
, net
, skb
, nlh
, afi
, table
, chain
, nla
);
1633 if (chain
!= NULL
) {
1634 if (nlh
->nlmsg_flags
& NLM_F_EXCL
)
1636 if (nlh
->nlmsg_flags
& NLM_F_REPLACE
)
1639 return nf_tables_updchain(&ctx
, genmask
, policy
, create
);
1642 return nf_tables_addchain(&ctx
, family
, genmask
, policy
, create
);
1645 static int nf_tables_delchain(struct net
*net
, struct sock
*nlsk
,
1646 struct sk_buff
*skb
, const struct nlmsghdr
*nlh
,
1647 const struct nlattr
* const nla
[],
1648 struct netlink_ext_ack
*extack
)
1650 const struct nfgenmsg
*nfmsg
= nlmsg_data(nlh
);
1651 u8 genmask
= nft_genmask_next(net
);
1652 struct nft_af_info
*afi
;
1653 struct nft_table
*table
;
1654 struct nft_chain
*chain
;
1655 struct nft_rule
*rule
;
1656 int family
= nfmsg
->nfgen_family
;
1661 afi
= nf_tables_afinfo_lookup(net
, family
, false);
1663 return PTR_ERR(afi
);
1665 table
= nf_tables_table_lookup(afi
, nla
[NFTA_CHAIN_TABLE
], genmask
);
1667 return PTR_ERR(table
);
1669 chain
= nf_tables_chain_lookup(table
, nla
[NFTA_CHAIN_NAME
], genmask
);
1671 return PTR_ERR(chain
);
1673 if (nlh
->nlmsg_flags
& NLM_F_NONREC
&&
1677 nft_ctx_init(&ctx
, net
, skb
, nlh
, afi
, table
, chain
, nla
);
1680 list_for_each_entry(rule
, &chain
->rules
, list
) {
1681 if (!nft_is_active_next(net
, rule
))
1685 err
= nft_delrule(&ctx
, rule
);
1690 /* There are rules and elements that are still holding references to us,
1691 * so we cannot do a recursive removal in this case.
1696 return nft_delchain(&ctx
);
1704 * nft_register_expr - register nf_tables expr type
1707 * Registers the expr type for use with nf_tables. Returns zero on
1708 * success or a negative errno code otherwise.
1710 int nft_register_expr(struct nft_expr_type
*type
)
1712 nfnl_lock(NFNL_SUBSYS_NFTABLES
);
1713 if (type
->family
== NFPROTO_UNSPEC
)
1714 list_add_tail_rcu(&type
->list
, &nf_tables_expressions
);
1716 list_add_rcu(&type
->list
, &nf_tables_expressions
);
1717 nfnl_unlock(NFNL_SUBSYS_NFTABLES
);
1720 EXPORT_SYMBOL_GPL(nft_register_expr
);
1723 * nft_unregister_expr - unregister nf_tables expr type
1726 * Unregisters the expr type for use with nf_tables.
1728 void nft_unregister_expr(struct nft_expr_type
*type
)
1730 nfnl_lock(NFNL_SUBSYS_NFTABLES
);
1731 list_del_rcu(&type
->list
);
1732 nfnl_unlock(NFNL_SUBSYS_NFTABLES
);
1734 EXPORT_SYMBOL_GPL(nft_unregister_expr
);
1736 static const struct nft_expr_type
*__nft_expr_type_get(u8 family
,
1739 const struct nft_expr_type
*type
;
1741 list_for_each_entry(type
, &nf_tables_expressions
, list
) {
1742 if (!nla_strcmp(nla
, type
->name
) &&
1743 (!type
->family
|| type
->family
== family
))
1749 static const struct nft_expr_type
*nft_expr_type_get(u8 family
,
1752 const struct nft_expr_type
*type
;
1755 return ERR_PTR(-EINVAL
);
1757 type
= __nft_expr_type_get(family
, nla
);
1758 if (type
!= NULL
&& try_module_get(type
->owner
))
1761 #ifdef CONFIG_MODULES
1763 nfnl_unlock(NFNL_SUBSYS_NFTABLES
);
1764 request_module("nft-expr-%u-%.*s", family
,
1765 nla_len(nla
), (char *)nla_data(nla
));
1766 nfnl_lock(NFNL_SUBSYS_NFTABLES
);
1767 if (__nft_expr_type_get(family
, nla
))
1768 return ERR_PTR(-EAGAIN
);
1770 nfnl_unlock(NFNL_SUBSYS_NFTABLES
);
1771 request_module("nft-expr-%.*s",
1772 nla_len(nla
), (char *)nla_data(nla
));
1773 nfnl_lock(NFNL_SUBSYS_NFTABLES
);
1774 if (__nft_expr_type_get(family
, nla
))
1775 return ERR_PTR(-EAGAIN
);
1778 return ERR_PTR(-ENOENT
);
1781 static const struct nla_policy nft_expr_policy
[NFTA_EXPR_MAX
+ 1] = {
1782 [NFTA_EXPR_NAME
] = { .type
= NLA_STRING
},
1783 [NFTA_EXPR_DATA
] = { .type
= NLA_NESTED
},
1786 static int nf_tables_fill_expr_info(struct sk_buff
*skb
,
1787 const struct nft_expr
*expr
)
1789 if (nla_put_string(skb
, NFTA_EXPR_NAME
, expr
->ops
->type
->name
))
1790 goto nla_put_failure
;
1792 if (expr
->ops
->dump
) {
1793 struct nlattr
*data
= nla_nest_start(skb
, NFTA_EXPR_DATA
);
1795 goto nla_put_failure
;
1796 if (expr
->ops
->dump(skb
, expr
) < 0)
1797 goto nla_put_failure
;
1798 nla_nest_end(skb
, data
);
1807 int nft_expr_dump(struct sk_buff
*skb
, unsigned int attr
,
1808 const struct nft_expr
*expr
)
1810 struct nlattr
*nest
;
1812 nest
= nla_nest_start(skb
, attr
);
1814 goto nla_put_failure
;
1815 if (nf_tables_fill_expr_info(skb
, expr
) < 0)
1816 goto nla_put_failure
;
1817 nla_nest_end(skb
, nest
);
1824 struct nft_expr_info
{
1825 const struct nft_expr_ops
*ops
;
1826 struct nlattr
*tb
[NFT_EXPR_MAXATTR
+ 1];
1829 static int nf_tables_expr_parse(const struct nft_ctx
*ctx
,
1830 const struct nlattr
*nla
,
1831 struct nft_expr_info
*info
)
1833 const struct nft_expr_type
*type
;
1834 const struct nft_expr_ops
*ops
;
1835 struct nlattr
*tb
[NFTA_EXPR_MAX
+ 1];
1838 err
= nla_parse_nested(tb
, NFTA_EXPR_MAX
, nla
, nft_expr_policy
, NULL
);
1842 type
= nft_expr_type_get(ctx
->afi
->family
, tb
[NFTA_EXPR_NAME
]);
1844 return PTR_ERR(type
);
1846 if (tb
[NFTA_EXPR_DATA
]) {
1847 err
= nla_parse_nested(info
->tb
, type
->maxattr
,
1848 tb
[NFTA_EXPR_DATA
], type
->policy
, NULL
);
1852 memset(info
->tb
, 0, sizeof(info
->tb
[0]) * (type
->maxattr
+ 1));
1854 if (type
->select_ops
!= NULL
) {
1855 ops
= type
->select_ops(ctx
,
1856 (const struct nlattr
* const *)info
->tb
);
1868 module_put(type
->owner
);
1872 static int nf_tables_newexpr(const struct nft_ctx
*ctx
,
1873 const struct nft_expr_info
*info
,
1874 struct nft_expr
*expr
)
1876 const struct nft_expr_ops
*ops
= info
->ops
;
1881 err
= ops
->init(ctx
, expr
, (const struct nlattr
**)info
->tb
);
1886 if (ops
->validate
) {
1887 const struct nft_data
*data
= NULL
;
1889 err
= ops
->validate(ctx
, expr
, &data
);
1898 ops
->destroy(ctx
, expr
);
/*
 * Tear down a single expression: call the expression's ->destroy callback
 * if its ops provide one, then drop the reference held on the module that
 * owns the expression type.
 */
1904 static void nf_tables_expr_destroy(const struct nft_ctx
*ctx
,
1905 struct nft_expr
*expr
)
/* ->destroy is optional, so only call it when it is set */
1907 if (expr
->ops
->destroy
)
1908 expr
->ops
->destroy(ctx
, expr
);
1909 module_put(expr
->ops
->type
->owner
);
1912 struct nft_expr
*nft_expr_init(const struct nft_ctx
*ctx
,
1913 const struct nlattr
*nla
)
1915 struct nft_expr_info info
;
1916 struct nft_expr
*expr
;
1919 err
= nf_tables_expr_parse(ctx
, nla
, &info
);
1924 expr
= kzalloc(info
.ops
->size
, GFP_KERNEL
);
1928 err
= nf_tables_newexpr(ctx
, &info
, expr
);
1936 module_put(info
.ops
->type
->owner
);
1938 return ERR_PTR(err
);
1941 void nft_expr_destroy(const struct nft_ctx
*ctx
, struct nft_expr
*expr
)
1943 nf_tables_expr_destroy(ctx
, expr
);
1951 static struct nft_rule
*__nf_tables_rule_lookup(const struct nft_chain
*chain
,
1954 struct nft_rule
*rule
;
1956 // FIXME: this is a linear search over every rule in the chain
1957 list_for_each_entry(rule
, &chain
->rules
, list
) {
1958 if (handle
== rule
->handle
)
1962 return ERR_PTR(-ENOENT
);
1965 static struct nft_rule
*nf_tables_rule_lookup(const struct nft_chain
*chain
,
1966 const struct nlattr
*nla
)
1969 return ERR_PTR(-EINVAL
);
1971 return __nf_tables_rule_lookup(chain
, be64_to_cpu(nla_get_be64(nla
)));
1974 static const struct nla_policy nft_rule_policy
[NFTA_RULE_MAX
+ 1] = {
1975 [NFTA_RULE_TABLE
] = { .type
= NLA_STRING
,
1976 .len
= NFT_TABLE_MAXNAMELEN
- 1 },
1977 [NFTA_RULE_CHAIN
] = { .type
= NLA_STRING
,
1978 .len
= NFT_CHAIN_MAXNAMELEN
- 1 },
1979 [NFTA_RULE_HANDLE
] = { .type
= NLA_U64
},
1980 [NFTA_RULE_EXPRESSIONS
] = { .type
= NLA_NESTED
},
1981 [NFTA_RULE_COMPAT
] = { .type
= NLA_NESTED
},
1982 [NFTA_RULE_POSITION
] = { .type
= NLA_U64
},
1983 [NFTA_RULE_USERDATA
] = { .type
= NLA_BINARY
,
1984 .len
= NFT_USERDATA_MAXLEN
},
1987 static int nf_tables_fill_rule_info(struct sk_buff
*skb
, struct net
*net
,
1988 u32 portid
, u32 seq
, int event
,
1989 u32 flags
, int family
,
1990 const struct nft_table
*table
,
1991 const struct nft_chain
*chain
,
1992 const struct nft_rule
*rule
)
1994 struct nlmsghdr
*nlh
;
1995 struct nfgenmsg
*nfmsg
;
1996 const struct nft_expr
*expr
, *next
;
1997 struct nlattr
*list
;
1998 const struct nft_rule
*prule
;
1999 u16 type
= nfnl_msg_type(NFNL_SUBSYS_NFTABLES
, event
);
2001 nlh
= nlmsg_put(skb
, portid
, seq
, type
, sizeof(struct nfgenmsg
), flags
);
2003 goto nla_put_failure
;
2005 nfmsg
= nlmsg_data(nlh
);
2006 nfmsg
->nfgen_family
= family
;
2007 nfmsg
->version
= NFNETLINK_V0
;
2008 nfmsg
->res_id
= htons(net
->nft
.base_seq
& 0xffff);
2010 if (nla_put_string(skb
, NFTA_RULE_TABLE
, table
->name
))
2011 goto nla_put_failure
;
2012 if (nla_put_string(skb
, NFTA_RULE_CHAIN
, chain
->name
))
2013 goto nla_put_failure
;
2014 if (nla_put_be64(skb
, NFTA_RULE_HANDLE
, cpu_to_be64(rule
->handle
),
2016 goto nla_put_failure
;
2018 if ((event
!= NFT_MSG_DELRULE
) && (rule
->list
.prev
!= &chain
->rules
)) {
2019 prule
= list_prev_entry(rule
, list
);
2020 if (nla_put_be64(skb
, NFTA_RULE_POSITION
,
2021 cpu_to_be64(prule
->handle
),
2023 goto nla_put_failure
;
2026 list
= nla_nest_start(skb
, NFTA_RULE_EXPRESSIONS
);
2028 goto nla_put_failure
;
2029 nft_rule_for_each_expr(expr
, next
, rule
) {
2030 if (nft_expr_dump(skb
, NFTA_LIST_ELEM
, expr
) < 0)
2031 goto nla_put_failure
;
2033 nla_nest_end(skb
, list
);
2036 struct nft_userdata
*udata
= nft_userdata(rule
);
2037 if (nla_put(skb
, NFTA_RULE_USERDATA
, udata
->len
+ 1,
2039 goto nla_put_failure
;
2042 nlmsg_end(skb
, nlh
);
2046 nlmsg_trim(skb
, nlh
);
2050 static void nf_tables_rule_notify(const struct nft_ctx
*ctx
,
2051 const struct nft_rule
*rule
, int event
)
2053 struct sk_buff
*skb
;
2057 !nfnetlink_has_listeners(ctx
->net
, NFNLGRP_NFTABLES
))
2060 skb
= nlmsg_new(NLMSG_GOODSIZE
, GFP_KERNEL
);
2064 err
= nf_tables_fill_rule_info(skb
, ctx
->net
, ctx
->portid
, ctx
->seq
,
2065 event
, 0, ctx
->afi
->family
, ctx
->table
,
2072 nfnetlink_send(skb
, ctx
->net
, ctx
->portid
, NFNLGRP_NFTABLES
,
2073 ctx
->report
, GFP_KERNEL
);
2076 nfnetlink_set_err(ctx
->net
, ctx
->portid
, NFNLGRP_NFTABLES
, -ENOBUFS
);
2079 struct nft_rule_dump_ctx
{
2084 static int nf_tables_dump_rules(struct sk_buff
*skb
,
2085 struct netlink_callback
*cb
)
2087 const struct nfgenmsg
*nfmsg
= nlmsg_data(cb
->nlh
);
2088 const struct nft_rule_dump_ctx
*ctx
= cb
->data
;
2089 const struct nft_af_info
*afi
;
2090 const struct nft_table
*table
;
2091 const struct nft_chain
*chain
;
2092 const struct nft_rule
*rule
;
2093 unsigned int idx
= 0, s_idx
= cb
->args
[0];
2094 struct net
*net
= sock_net(skb
->sk
);
2095 int family
= nfmsg
->nfgen_family
;
2098 cb
->seq
= net
->nft
.base_seq
;
2100 list_for_each_entry_rcu(afi
, &net
->nft
.af_info
, list
) {
2101 if (family
!= NFPROTO_UNSPEC
&& family
!= afi
->family
)
2104 list_for_each_entry_rcu(table
, &afi
->tables
, list
) {
2105 if (ctx
&& ctx
->table
&&
2106 strcmp(ctx
->table
, table
->name
) != 0)
2109 list_for_each_entry_rcu(chain
, &table
->chains
, list
) {
2110 if (ctx
&& ctx
->chain
[0] &&
2111 strcmp(ctx
->chain
, chain
->name
) != 0)
2114 list_for_each_entry_rcu(rule
, &chain
->rules
, list
) {
2115 if (!nft_is_active(net
, rule
))
2120 memset(&cb
->args
[1], 0,
2121 sizeof(cb
->args
) - sizeof(cb
->args
[0]));
2122 if (nf_tables_fill_rule_info(skb
, net
, NETLINK_CB(cb
->skb
).portid
,
2125 NLM_F_MULTI
| NLM_F_APPEND
,
2126 afi
->family
, table
, chain
, rule
) < 0)
2129 nl_dump_check_consistent(cb
, nlmsg_hdr(skb
));
2143 static int nf_tables_dump_rules_done(struct netlink_callback
*cb
)
2145 struct nft_rule_dump_ctx
*ctx
= cb
->data
;
2155 static int nf_tables_getrule(struct net
*net
, struct sock
*nlsk
,
2156 struct sk_buff
*skb
, const struct nlmsghdr
*nlh
,
2157 const struct nlattr
* const nla
[],
2158 struct netlink_ext_ack
*extack
)
2160 const struct nfgenmsg
*nfmsg
= nlmsg_data(nlh
);
2161 u8 genmask
= nft_genmask_cur(net
);
2162 const struct nft_af_info
*afi
;
2163 const struct nft_table
*table
;
2164 const struct nft_chain
*chain
;
2165 const struct nft_rule
*rule
;
2166 struct sk_buff
*skb2
;
2167 int family
= nfmsg
->nfgen_family
;
2170 if (nlh
->nlmsg_flags
& NLM_F_DUMP
) {
2171 struct netlink_dump_control c
= {
2172 .dump
= nf_tables_dump_rules
,
2173 .done
= nf_tables_dump_rules_done
,
2176 if (nla
[NFTA_RULE_TABLE
] || nla
[NFTA_RULE_CHAIN
]) {
2177 struct nft_rule_dump_ctx
*ctx
;
2179 ctx
= kzalloc(sizeof(*ctx
), GFP_KERNEL
);
2183 if (nla
[NFTA_RULE_TABLE
]) {
2184 ctx
->table
= nla_strdup(nla
[NFTA_RULE_TABLE
],
2191 if (nla
[NFTA_RULE_CHAIN
]) {
2192 ctx
->chain
= nla_strdup(nla
[NFTA_RULE_CHAIN
],
2203 return netlink_dump_start(nlsk
, skb
, nlh
, &c
);
2206 afi
= nf_tables_afinfo_lookup(net
, family
, false);
2208 return PTR_ERR(afi
);
2210 table
= nf_tables_table_lookup(afi
, nla
[NFTA_RULE_TABLE
], genmask
);
2212 return PTR_ERR(table
);
2214 chain
= nf_tables_chain_lookup(table
, nla
[NFTA_RULE_CHAIN
], genmask
);
2216 return PTR_ERR(chain
);
2218 rule
= nf_tables_rule_lookup(chain
, nla
[NFTA_RULE_HANDLE
]);
2220 return PTR_ERR(rule
);
2222 skb2
= alloc_skb(NLMSG_GOODSIZE
, GFP_KERNEL
);
2226 err
= nf_tables_fill_rule_info(skb2
, net
, NETLINK_CB(skb
).portid
,
2227 nlh
->nlmsg_seq
, NFT_MSG_NEWRULE
, 0,
2228 family
, table
, chain
, rule
);
2232 return nlmsg_unicast(nlsk
, skb2
, NETLINK_CB(skb
).portid
);
2239 static void nf_tables_rule_destroy(const struct nft_ctx
*ctx
,
2240 struct nft_rule
*rule
)
2242 struct nft_expr
*expr
;
2245 * Careful: some expressions might not be initialized in case this
2246 * is called on error from nf_tables_newrule().
2248 expr
= nft_expr_first(rule
);
2249 while (expr
!= nft_expr_last(rule
) && expr
->ops
) {
2250 nf_tables_expr_destroy(ctx
, expr
);
2251 expr
= nft_expr_next(expr
);
2256 #define NFT_RULE_MAXEXPRS 128
2258 static struct nft_expr_info
*info
;
2260 static int nf_tables_newrule(struct net
*net
, struct sock
*nlsk
,
2261 struct sk_buff
*skb
, const struct nlmsghdr
*nlh
,
2262 const struct nlattr
* const nla
[],
2263 struct netlink_ext_ack
*extack
)
2265 const struct nfgenmsg
*nfmsg
= nlmsg_data(nlh
);
2266 u8 genmask
= nft_genmask_next(net
);
2267 struct nft_af_info
*afi
;
2268 struct nft_table
*table
;
2269 struct nft_chain
*chain
;
2270 struct nft_rule
*rule
, *old_rule
= NULL
;
2271 struct nft_userdata
*udata
;
2272 struct nft_trans
*trans
= NULL
;
2273 struct nft_expr
*expr
;
2276 unsigned int size
, i
, n
, ulen
= 0, usize
= 0;
2279 u64 handle
, pos_handle
;
2281 create
= nlh
->nlmsg_flags
& NLM_F_CREATE
? true : false;
2283 afi
= nf_tables_afinfo_lookup(net
, nfmsg
->nfgen_family
, create
);
2285 return PTR_ERR(afi
);
2287 table
= nf_tables_table_lookup(afi
, nla
[NFTA_RULE_TABLE
], genmask
);
2289 return PTR_ERR(table
);
2291 chain
= nf_tables_chain_lookup(table
, nla
[NFTA_RULE_CHAIN
], genmask
);
2293 return PTR_ERR(chain
);
2295 if (nla
[NFTA_RULE_HANDLE
]) {
2296 handle
= be64_to_cpu(nla_get_be64(nla
[NFTA_RULE_HANDLE
]));
2297 rule
= __nf_tables_rule_lookup(chain
, handle
);
2299 return PTR_ERR(rule
);
2301 if (nlh
->nlmsg_flags
& NLM_F_EXCL
)
2303 if (nlh
->nlmsg_flags
& NLM_F_REPLACE
)
2308 if (!create
|| nlh
->nlmsg_flags
& NLM_F_REPLACE
)
2310 handle
= nf_tables_alloc_handle(table
);
2312 if (chain
->use
== UINT_MAX
)
2316 if (nla
[NFTA_RULE_POSITION
]) {
2317 if (!(nlh
->nlmsg_flags
& NLM_F_CREATE
))
2320 pos_handle
= be64_to_cpu(nla_get_be64(nla
[NFTA_RULE_POSITION
]));
2321 old_rule
= __nf_tables_rule_lookup(chain
, pos_handle
);
2322 if (IS_ERR(old_rule
))
2323 return PTR_ERR(old_rule
);
2326 nft_ctx_init(&ctx
, net
, skb
, nlh
, afi
, table
, chain
, nla
);
2330 if (nla
[NFTA_RULE_EXPRESSIONS
]) {
2331 nla_for_each_nested(tmp
, nla
[NFTA_RULE_EXPRESSIONS
], rem
) {
2333 if (nla_type(tmp
) != NFTA_LIST_ELEM
)
2335 if (n
== NFT_RULE_MAXEXPRS
)
2337 err
= nf_tables_expr_parse(&ctx
, tmp
, &info
[n
]);
2340 size
+= info
[n
].ops
->size
;
2344 /* Check for overflow of dlen field */
2346 if (size
>= 1 << 12)
2349 if (nla
[NFTA_RULE_USERDATA
]) {
2350 ulen
= nla_len(nla
[NFTA_RULE_USERDATA
]);
2352 usize
= sizeof(struct nft_userdata
) + ulen
;
2356 rule
= kzalloc(sizeof(*rule
) + size
+ usize
, GFP_KERNEL
);
2360 nft_activate_next(net
, rule
);
2362 rule
->handle
= handle
;
2364 rule
->udata
= ulen
? 1 : 0;
2367 udata
= nft_userdata(rule
);
2368 udata
->len
= ulen
- 1;
2369 nla_memcpy(udata
->data
, nla
[NFTA_RULE_USERDATA
], ulen
);
2372 expr
= nft_expr_first(rule
);
2373 for (i
= 0; i
< n
; i
++) {
2374 err
= nf_tables_newexpr(&ctx
, &info
[i
], expr
);
2378 expr
= nft_expr_next(expr
);
2381 if (nlh
->nlmsg_flags
& NLM_F_REPLACE
) {
2382 if (nft_is_active_next(net
, old_rule
)) {
2383 trans
= nft_trans_rule_add(&ctx
, NFT_MSG_DELRULE
,
2385 if (trans
== NULL
) {
2389 nft_deactivate_next(net
, old_rule
);
2391 list_add_tail_rcu(&rule
->list
, &old_rule
->list
);
2396 } else if (nlh
->nlmsg_flags
& NLM_F_APPEND
)
2398 list_add_rcu(&rule
->list
, &old_rule
->list
);
2400 list_add_tail_rcu(&rule
->list
, &chain
->rules
);
2403 list_add_tail_rcu(&rule
->list
, &old_rule
->list
);
2405 list_add_rcu(&rule
->list
, &chain
->rules
);
2408 if (nft_trans_rule_add(&ctx
, NFT_MSG_NEWRULE
, rule
) == NULL
) {
2416 list_del_rcu(&rule
->list
);
2418 nf_tables_rule_destroy(&ctx
, rule
);
2420 for (i
= 0; i
< n
; i
++) {
2421 if (info
[i
].ops
!= NULL
)
2422 module_put(info
[i
].ops
->type
->owner
);
2427 static struct nft_rule
*nft_rule_lookup_byid(const struct net
*net
,
2428 const struct nlattr
*nla
)
2430 u32 id
= ntohl(nla_get_be32(nla
));
2431 struct nft_trans
*trans
;
2433 list_for_each_entry(trans
, &net
->nft
.commit_list
, list
) {
2434 struct nft_rule
*rule
= nft_trans_rule(trans
);
2436 if (trans
->msg_type
== NFT_MSG_NEWRULE
&&
2437 id
== nft_trans_rule_id(trans
))
2440 return ERR_PTR(-ENOENT
);
2443 static int nf_tables_delrule(struct net
*net
, struct sock
*nlsk
,
2444 struct sk_buff
*skb
, const struct nlmsghdr
*nlh
,
2445 const struct nlattr
* const nla
[],
2446 struct netlink_ext_ack
*extack
)
2448 const struct nfgenmsg
*nfmsg
= nlmsg_data(nlh
);
2449 u8 genmask
= nft_genmask_next(net
);
2450 struct nft_af_info
*afi
;
2451 struct nft_table
*table
;
2452 struct nft_chain
*chain
= NULL
;
2453 struct nft_rule
*rule
;
2454 int family
= nfmsg
->nfgen_family
, err
= 0;
2457 afi
= nf_tables_afinfo_lookup(net
, family
, false);
2459 return PTR_ERR(afi
);
2461 table
= nf_tables_table_lookup(afi
, nla
[NFTA_RULE_TABLE
], genmask
);
2463 return PTR_ERR(table
);
2465 if (nla
[NFTA_RULE_CHAIN
]) {
2466 chain
= nf_tables_chain_lookup(table
, nla
[NFTA_RULE_CHAIN
],
2469 return PTR_ERR(chain
);
2472 nft_ctx_init(&ctx
, net
, skb
, nlh
, afi
, table
, chain
, nla
);
2475 if (nla
[NFTA_RULE_HANDLE
]) {
2476 rule
= nf_tables_rule_lookup(chain
,
2477 nla
[NFTA_RULE_HANDLE
]);
2479 return PTR_ERR(rule
);
2481 err
= nft_delrule(&ctx
, rule
);
2482 } else if (nla
[NFTA_RULE_ID
]) {
2483 rule
= nft_rule_lookup_byid(net
, nla
[NFTA_RULE_ID
]);
2485 return PTR_ERR(rule
);
2487 err
= nft_delrule(&ctx
, rule
);
2489 err
= nft_delrule_by_chain(&ctx
);
2492 list_for_each_entry(chain
, &table
->chains
, list
) {
2493 if (!nft_is_active_next(net
, chain
))
2497 err
= nft_delrule_by_chain(&ctx
);
2510 static LIST_HEAD(nf_tables_set_types
);
/*
 * Register a set type: append @type to the nf_tables_set_types list while
 * holding the NFNL_SUBSYS_NFTABLES nfnetlink lock.
 */
2512 int nft_register_set(struct nft_set_type
*type
)
2514 nfnl_lock(NFNL_SUBSYS_NFTABLES
);
2515 list_add_tail_rcu(&type
->list
, &nf_tables_set_types
);
2516 nfnl_unlock(NFNL_SUBSYS_NFTABLES
);
2519 EXPORT_SYMBOL_GPL(nft_register_set
);
/*
 * Unregister a set type: remove @type from the list it is linked on while
 * holding the NFNL_SUBSYS_NFTABLES nfnetlink lock.
 */
2521 void nft_unregister_set(struct nft_set_type
*type
)
2523 nfnl_lock(NFNL_SUBSYS_NFTABLES
);
2524 list_del_rcu(&type
->list
);
2525 nfnl_unlock(NFNL_SUBSYS_NFTABLES
);
2527 EXPORT_SYMBOL_GPL(nft_unregister_set
);
2529 #define NFT_SET_FEATURES (NFT_SET_INTERVAL | NFT_SET_MAP | \
2530 NFT_SET_TIMEOUT | NFT_SET_OBJECT)
/*
 * Decide whether @ops is a candidate for the requested @flags.
 *
 * Returns true when the flag bits that @ops advertises in ->features
 * (flags & ops->features) are exactly the feature bits requested by the
 * caller (flags & NFT_SET_FEATURES), and false otherwise.
 */
2532 static bool nft_set_ops_candidate(const struct nft_set_ops
*ops
, u32 flags
)
2534 return (flags
& ops
->features
) == (flags
& NFT_SET_FEATURES
);
2538 * Select a set implementation based on the data characteristics and the
2539 * given policy. The total memory use might not be known if no size is
2540 * given; in that case the amount of memory per element is used.
2542 static const struct nft_set_ops
*
2543 nft_select_set_ops(const struct nft_ctx
*ctx
,
2544 const struct nlattr
* const nla
[],
2545 const struct nft_set_desc
*desc
,
2546 enum nft_set_policies policy
)
2548 const struct nft_set_ops
*ops
, *bops
;
2549 struct nft_set_estimate est
, best
;
2550 const struct nft_set_type
*type
;
2553 #ifdef CONFIG_MODULES
2554 if (list_empty(&nf_tables_set_types
)) {
2555 nfnl_unlock(NFNL_SUBSYS_NFTABLES
);
2556 request_module("nft-set");
2557 nfnl_lock(NFNL_SUBSYS_NFTABLES
);
2558 if (!list_empty(&nf_tables_set_types
))
2559 return ERR_PTR(-EAGAIN
);
2562 if (nla
[NFTA_SET_FLAGS
] != NULL
)
2563 flags
= ntohl(nla_get_be32(nla
[NFTA_SET_FLAGS
]));
2570 list_for_each_entry(type
, &nf_tables_set_types
, list
) {
2571 if (!type
->select_ops
)
2574 ops
= type
->select_ops(ctx
, desc
, flags
);
2578 if (!nft_set_ops_candidate(ops
, flags
))
2580 if (!ops
->estimate(desc
, flags
, &est
))
2584 case NFT_SET_POL_PERFORMANCE
:
2585 if (est
.lookup
< best
.lookup
)
2587 if (est
.lookup
== best
.lookup
&&
2588 est
.space
< best
.space
)
2591 case NFT_SET_POL_MEMORY
:
2593 if (est
.space
< best
.space
)
2595 if (est
.space
== best
.space
&&
2596 est
.lookup
< best
.lookup
)
2598 } else if (est
.size
< best
.size
) {
2606 if (!try_module_get(type
->owner
))
2609 module_put(bops
->type
->owner
);
2618 return ERR_PTR(-EOPNOTSUPP
);
2621 static const struct nla_policy nft_set_policy
[NFTA_SET_MAX
+ 1] = {
2622 [NFTA_SET_TABLE
] = { .type
= NLA_STRING
,
2623 .len
= NFT_TABLE_MAXNAMELEN
- 1 },
2624 [NFTA_SET_NAME
] = { .type
= NLA_STRING
,
2625 .len
= NFT_SET_MAXNAMELEN
- 1 },
2626 [NFTA_SET_FLAGS
] = { .type
= NLA_U32
},
2627 [NFTA_SET_KEY_TYPE
] = { .type
= NLA_U32
},
2628 [NFTA_SET_KEY_LEN
] = { .type
= NLA_U32
},
2629 [NFTA_SET_DATA_TYPE
] = { .type
= NLA_U32
},
2630 [NFTA_SET_DATA_LEN
] = { .type
= NLA_U32
},
2631 [NFTA_SET_POLICY
] = { .type
= NLA_U32
},
2632 [NFTA_SET_DESC
] = { .type
= NLA_NESTED
},
2633 [NFTA_SET_ID
] = { .type
= NLA_U32
},
2634 [NFTA_SET_TIMEOUT
] = { .type
= NLA_U64
},
2635 [NFTA_SET_GC_INTERVAL
] = { .type
= NLA_U32
},
2636 [NFTA_SET_USERDATA
] = { .type
= NLA_BINARY
,
2637 .len
= NFT_USERDATA_MAXLEN
},
2638 [NFTA_SET_OBJ_TYPE
] = { .type
= NLA_U32
},
2641 static const struct nla_policy nft_set_desc_policy
[NFTA_SET_DESC_MAX
+ 1] = {
2642 [NFTA_SET_DESC_SIZE
] = { .type
= NLA_U32
},
2645 static int nft_ctx_init_from_setattr(struct nft_ctx
*ctx
, struct net
*net
,
2646 const struct sk_buff
*skb
,
2647 const struct nlmsghdr
*nlh
,
2648 const struct nlattr
* const nla
[],
2651 const struct nfgenmsg
*nfmsg
= nlmsg_data(nlh
);
2652 struct nft_af_info
*afi
= NULL
;
2653 struct nft_table
*table
= NULL
;
2655 if (nfmsg
->nfgen_family
!= NFPROTO_UNSPEC
) {
2656 afi
= nf_tables_afinfo_lookup(net
, nfmsg
->nfgen_family
, false);
2658 return PTR_ERR(afi
);
2661 if (nla
[NFTA_SET_TABLE
] != NULL
) {
2663 return -EAFNOSUPPORT
;
2665 table
= nf_tables_table_lookup(afi
, nla
[NFTA_SET_TABLE
],
2668 return PTR_ERR(table
);
2671 nft_ctx_init(ctx
, net
, skb
, nlh
, afi
, table
, NULL
, nla
);
2675 static struct nft_set
*nf_tables_set_lookup(const struct nft_table
*table
,
2676 const struct nlattr
*nla
, u8 genmask
)
2678 struct nft_set
*set
;
2681 return ERR_PTR(-EINVAL
);
2683 list_for_each_entry(set
, &table
->sets
, list
) {
2684 if (!nla_strcmp(nla
, set
->name
) &&
2685 nft_active_genmask(set
, genmask
))
2688 return ERR_PTR(-ENOENT
);
2691 static struct nft_set
*nf_tables_set_lookup_byid(const struct net
*net
,
2692 const struct nlattr
*nla
,
2695 struct nft_trans
*trans
;
2696 u32 id
= ntohl(nla_get_be32(nla
));
2698 list_for_each_entry(trans
, &net
->nft
.commit_list
, list
) {
2699 struct nft_set
*set
= nft_trans_set(trans
);
2701 if (trans
->msg_type
== NFT_MSG_NEWSET
&&
2702 id
== nft_trans_set_id(trans
) &&
2703 nft_active_genmask(set
, genmask
))
2706 return ERR_PTR(-ENOENT
);
2709 struct nft_set
*nft_set_lookup(const struct net
*net
,
2710 const struct nft_table
*table
,
2711 const struct nlattr
*nla_set_name
,
2712 const struct nlattr
*nla_set_id
,
2715 struct nft_set
*set
;
2717 set
= nf_tables_set_lookup(table
, nla_set_name
, genmask
);
2722 set
= nf_tables_set_lookup_byid(net
, nla_set_id
, genmask
);
2726 EXPORT_SYMBOL_GPL(nft_set_lookup
);
2728 static int nf_tables_set_alloc_name(struct nft_ctx
*ctx
, struct nft_set
*set
,
2731 const struct nft_set
*i
;
2733 unsigned long *inuse
;
2734 unsigned int n
= 0, min
= 0;
2736 p
= strchr(name
, '%');
2738 if (p
[1] != 'd' || strchr(p
+ 2, '%'))
2741 inuse
= (unsigned long *)get_zeroed_page(GFP_KERNEL
);
2745 list_for_each_entry(i
, &ctx
->table
->sets
, list
) {
2748 if (!nft_is_active_next(ctx
->net
, set
))
2750 if (!sscanf(i
->name
, name
, &tmp
))
2752 if (tmp
< min
|| tmp
>= min
+ BITS_PER_BYTE
* PAGE_SIZE
)
2755 set_bit(tmp
- min
, inuse
);
2758 n
= find_first_zero_bit(inuse
, BITS_PER_BYTE
* PAGE_SIZE
);
2759 if (n
>= BITS_PER_BYTE
* PAGE_SIZE
) {
2760 min
+= BITS_PER_BYTE
* PAGE_SIZE
;
2761 memset(inuse
, 0, PAGE_SIZE
);
2764 free_page((unsigned long)inuse
);
2767 set
->name
= kasprintf(GFP_KERNEL
, name
, min
+ n
);
2771 list_for_each_entry(i
, &ctx
->table
->sets
, list
) {
2772 if (!nft_is_active_next(ctx
->net
, i
))
2774 if (!strcmp(set
->name
, i
->name
)) {
2782 static int nf_tables_fill_set(struct sk_buff
*skb
, const struct nft_ctx
*ctx
,
2783 const struct nft_set
*set
, u16 event
, u16 flags
)
2785 struct nfgenmsg
*nfmsg
;
2786 struct nlmsghdr
*nlh
;
2787 struct nlattr
*desc
;
2788 u32 portid
= ctx
->portid
;
2791 event
= nfnl_msg_type(NFNL_SUBSYS_NFTABLES
, event
);
2792 nlh
= nlmsg_put(skb
, portid
, seq
, event
, sizeof(struct nfgenmsg
),
2795 goto nla_put_failure
;
2797 nfmsg
= nlmsg_data(nlh
);
2798 nfmsg
->nfgen_family
= ctx
->afi
->family
;
2799 nfmsg
->version
= NFNETLINK_V0
;
2800 nfmsg
->res_id
= htons(ctx
->net
->nft
.base_seq
& 0xffff);
2802 if (nla_put_string(skb
, NFTA_SET_TABLE
, ctx
->table
->name
))
2803 goto nla_put_failure
;
2804 if (nla_put_string(skb
, NFTA_SET_NAME
, set
->name
))
2805 goto nla_put_failure
;
2806 if (set
->flags
!= 0)
2807 if (nla_put_be32(skb
, NFTA_SET_FLAGS
, htonl(set
->flags
)))
2808 goto nla_put_failure
;
2810 if (nla_put_be32(skb
, NFTA_SET_KEY_TYPE
, htonl(set
->ktype
)))
2811 goto nla_put_failure
;
2812 if (nla_put_be32(skb
, NFTA_SET_KEY_LEN
, htonl(set
->klen
)))
2813 goto nla_put_failure
;
2814 if (set
->flags
& NFT_SET_MAP
) {
2815 if (nla_put_be32(skb
, NFTA_SET_DATA_TYPE
, htonl(set
->dtype
)))
2816 goto nla_put_failure
;
2817 if (nla_put_be32(skb
, NFTA_SET_DATA_LEN
, htonl(set
->dlen
)))
2818 goto nla_put_failure
;
2820 if (set
->flags
& NFT_SET_OBJECT
&&
2821 nla_put_be32(skb
, NFTA_SET_OBJ_TYPE
, htonl(set
->objtype
)))
2822 goto nla_put_failure
;
2825 nla_put_be64(skb
, NFTA_SET_TIMEOUT
,
2826 cpu_to_be64(jiffies_to_msecs(set
->timeout
)),
2828 goto nla_put_failure
;
2830 nla_put_be32(skb
, NFTA_SET_GC_INTERVAL
, htonl(set
->gc_int
)))
2831 goto nla_put_failure
;
2833 if (set
->policy
!= NFT_SET_POL_PERFORMANCE
) {
2834 if (nla_put_be32(skb
, NFTA_SET_POLICY
, htonl(set
->policy
)))
2835 goto nla_put_failure
;
2838 if (nla_put(skb
, NFTA_SET_USERDATA
, set
->udlen
, set
->udata
))
2839 goto nla_put_failure
;
2841 desc
= nla_nest_start(skb
, NFTA_SET_DESC
);
2843 goto nla_put_failure
;
2845 nla_put_be32(skb
, NFTA_SET_DESC_SIZE
, htonl(set
->size
)))
2846 goto nla_put_failure
;
2847 nla_nest_end(skb
, desc
);
2849 nlmsg_end(skb
, nlh
);
2853 nlmsg_trim(skb
, nlh
);
2857 static void nf_tables_set_notify(const struct nft_ctx
*ctx
,
2858 const struct nft_set
*set
, int event
,
2861 struct sk_buff
*skb
;
2862 u32 portid
= ctx
->portid
;
2866 !nfnetlink_has_listeners(ctx
->net
, NFNLGRP_NFTABLES
))
2869 skb
= nlmsg_new(NLMSG_GOODSIZE
, gfp_flags
);
2873 err
= nf_tables_fill_set(skb
, ctx
, set
, event
, 0);
2879 nfnetlink_send(skb
, ctx
->net
, portid
, NFNLGRP_NFTABLES
, ctx
->report
,
2883 nfnetlink_set_err(ctx
->net
, portid
, NFNLGRP_NFTABLES
, -ENOBUFS
);
2886 static int nf_tables_dump_sets(struct sk_buff
*skb
, struct netlink_callback
*cb
)
2888 const struct nft_set
*set
;
2889 unsigned int idx
, s_idx
= cb
->args
[0];
2890 struct nft_af_info
*afi
;
2891 struct nft_table
*table
, *cur_table
= (struct nft_table
*)cb
->args
[2];
2892 struct net
*net
= sock_net(skb
->sk
);
2893 int cur_family
= cb
->args
[3];
2894 struct nft_ctx
*ctx
= cb
->data
, ctx_set
;
2900 cb
->seq
= net
->nft
.base_seq
;
2902 list_for_each_entry_rcu(afi
, &net
->nft
.af_info
, list
) {
2903 if (ctx
->afi
&& ctx
->afi
!= afi
)
2907 if (afi
->family
!= cur_family
)
2912 list_for_each_entry_rcu(table
, &afi
->tables
, list
) {
2913 if (ctx
->table
&& ctx
->table
!= table
)
2917 if (cur_table
!= table
)
2923 list_for_each_entry_rcu(set
, &table
->sets
, list
) {
2926 if (!nft_is_active(net
, set
))
2930 ctx_set
.table
= table
;
2932 if (nf_tables_fill_set(skb
, &ctx_set
, set
,
2936 cb
->args
[2] = (unsigned long) table
;
2937 cb
->args
[3] = afi
->family
;
2940 nl_dump_check_consistent(cb
, nlmsg_hdr(skb
));
2954 static int nf_tables_dump_sets_done(struct netlink_callback
*cb
)
2960 static int nf_tables_getset(struct net
*net
, struct sock
*nlsk
,
2961 struct sk_buff
*skb
, const struct nlmsghdr
*nlh
,
2962 const struct nlattr
* const nla
[],
2963 struct netlink_ext_ack
*extack
)
2965 u8 genmask
= nft_genmask_cur(net
);
2966 const struct nft_set
*set
;
2968 struct sk_buff
*skb2
;
2969 const struct nfgenmsg
*nfmsg
= nlmsg_data(nlh
);
2972 /* Verify existence before starting dump */
2973 err
= nft_ctx_init_from_setattr(&ctx
, net
, skb
, nlh
, nla
, genmask
);
2977 if (nlh
->nlmsg_flags
& NLM_F_DUMP
) {
2978 struct netlink_dump_control c
= {
2979 .dump
= nf_tables_dump_sets
,
2980 .done
= nf_tables_dump_sets_done
,
2982 struct nft_ctx
*ctx_dump
;
2984 ctx_dump
= kmalloc(sizeof(*ctx_dump
), GFP_KERNEL
);
2985 if (ctx_dump
== NULL
)
2991 return netlink_dump_start(nlsk
, skb
, nlh
, &c
);
2994 /* Only accept unspec with dump */
2995 if (nfmsg
->nfgen_family
== NFPROTO_UNSPEC
)
2996 return -EAFNOSUPPORT
;
2997 if (!nla
[NFTA_SET_TABLE
])
3000 set
= nf_tables_set_lookup(ctx
.table
, nla
[NFTA_SET_NAME
], genmask
);
3002 return PTR_ERR(set
);
3004 skb2
= alloc_skb(NLMSG_GOODSIZE
, GFP_KERNEL
);
3008 err
= nf_tables_fill_set(skb2
, &ctx
, set
, NFT_MSG_NEWSET
, 0);
3012 return nlmsg_unicast(nlsk
, skb2
, NETLINK_CB(skb
).portid
);
3019 static int nf_tables_set_desc_parse(const struct nft_ctx
*ctx
,
3020 struct nft_set_desc
*desc
,
3021 const struct nlattr
*nla
)
3023 struct nlattr
*da
[NFTA_SET_DESC_MAX
+ 1];
3026 err
= nla_parse_nested(da
, NFTA_SET_DESC_MAX
, nla
,
3027 nft_set_desc_policy
, NULL
);
3031 if (da
[NFTA_SET_DESC_SIZE
] != NULL
)
3032 desc
->size
= ntohl(nla_get_be32(da
[NFTA_SET_DESC_SIZE
]));
3037 static int nf_tables_newset(struct net
*net
, struct sock
*nlsk
,
3038 struct sk_buff
*skb
, const struct nlmsghdr
*nlh
,
3039 const struct nlattr
* const nla
[],
3040 struct netlink_ext_ack
*extack
)
3042 const struct nfgenmsg
*nfmsg
= nlmsg_data(nlh
);
3043 u8 genmask
= nft_genmask_next(net
);
3044 const struct nft_set_ops
*ops
;
3045 struct nft_af_info
*afi
;
3046 struct nft_table
*table
;
3047 struct nft_set
*set
;
3053 u32 ktype
, dtype
, flags
, policy
, gc_int
, objtype
;
3054 struct nft_set_desc desc
;
3055 unsigned char *udata
;
3059 if (nla
[NFTA_SET_TABLE
] == NULL
||
3060 nla
[NFTA_SET_NAME
] == NULL
||
3061 nla
[NFTA_SET_KEY_LEN
] == NULL
||
3062 nla
[NFTA_SET_ID
] == NULL
)
3065 memset(&desc
, 0, sizeof(desc
));
3067 ktype
= NFT_DATA_VALUE
;
3068 if (nla
[NFTA_SET_KEY_TYPE
] != NULL
) {
3069 ktype
= ntohl(nla_get_be32(nla
[NFTA_SET_KEY_TYPE
]));
3070 if ((ktype
& NFT_DATA_RESERVED_MASK
) == NFT_DATA_RESERVED_MASK
)
3074 desc
.klen
= ntohl(nla_get_be32(nla
[NFTA_SET_KEY_LEN
]));
3075 if (desc
.klen
== 0 || desc
.klen
> NFT_DATA_VALUE_MAXLEN
)
3079 if (nla
[NFTA_SET_FLAGS
] != NULL
) {
3080 flags
= ntohl(nla_get_be32(nla
[NFTA_SET_FLAGS
]));
3081 if (flags
& ~(NFT_SET_ANONYMOUS
| NFT_SET_CONSTANT
|
3082 NFT_SET_INTERVAL
| NFT_SET_TIMEOUT
|
3083 NFT_SET_MAP
| NFT_SET_EVAL
|
3086 /* Only one of these operations is supported */
3087 if ((flags
& (NFT_SET_MAP
| NFT_SET_EVAL
| NFT_SET_OBJECT
)) ==
3088 (NFT_SET_MAP
| NFT_SET_EVAL
| NFT_SET_OBJECT
))
3093 if (nla
[NFTA_SET_DATA_TYPE
] != NULL
) {
3094 if (!(flags
& NFT_SET_MAP
))
3097 dtype
= ntohl(nla_get_be32(nla
[NFTA_SET_DATA_TYPE
]));
3098 if ((dtype
& NFT_DATA_RESERVED_MASK
) == NFT_DATA_RESERVED_MASK
&&
3099 dtype
!= NFT_DATA_VERDICT
)
3102 if (dtype
!= NFT_DATA_VERDICT
) {
3103 if (nla
[NFTA_SET_DATA_LEN
] == NULL
)
3105 desc
.dlen
= ntohl(nla_get_be32(nla
[NFTA_SET_DATA_LEN
]));
3106 if (desc
.dlen
== 0 || desc
.dlen
> NFT_DATA_VALUE_MAXLEN
)
3109 desc
.dlen
= sizeof(struct nft_verdict
);
3110 } else if (flags
& NFT_SET_MAP
)
3113 if (nla
[NFTA_SET_OBJ_TYPE
] != NULL
) {
3114 if (!(flags
& NFT_SET_OBJECT
))
3117 objtype
= ntohl(nla_get_be32(nla
[NFTA_SET_OBJ_TYPE
]));
3118 if (objtype
== NFT_OBJECT_UNSPEC
||
3119 objtype
> NFT_OBJECT_MAX
)
3121 } else if (flags
& NFT_SET_OBJECT
)
3124 objtype
= NFT_OBJECT_UNSPEC
;
3127 if (nla
[NFTA_SET_TIMEOUT
] != NULL
) {
3128 if (!(flags
& NFT_SET_TIMEOUT
))
3130 timeout
= msecs_to_jiffies(be64_to_cpu(nla_get_be64(
3131 nla
[NFTA_SET_TIMEOUT
])));
3134 if (nla
[NFTA_SET_GC_INTERVAL
] != NULL
) {
3135 if (!(flags
& NFT_SET_TIMEOUT
))
3137 gc_int
= ntohl(nla_get_be32(nla
[NFTA_SET_GC_INTERVAL
]));
3140 policy
= NFT_SET_POL_PERFORMANCE
;
3141 if (nla
[NFTA_SET_POLICY
] != NULL
)
3142 policy
= ntohl(nla_get_be32(nla
[NFTA_SET_POLICY
]));
3144 if (nla
[NFTA_SET_DESC
] != NULL
) {
3145 err
= nf_tables_set_desc_parse(&ctx
, &desc
, nla
[NFTA_SET_DESC
]);
3150 create
= nlh
->nlmsg_flags
& NLM_F_CREATE
? true : false;
3152 afi
= nf_tables_afinfo_lookup(net
, nfmsg
->nfgen_family
, create
);
3154 return PTR_ERR(afi
);
3156 table
= nf_tables_table_lookup(afi
, nla
[NFTA_SET_TABLE
], genmask
);
3158 return PTR_ERR(table
);
3160 nft_ctx_init(&ctx
, net
, skb
, nlh
, afi
, table
, NULL
, nla
);
3162 set
= nf_tables_set_lookup(table
, nla
[NFTA_SET_NAME
], genmask
);
3164 if (PTR_ERR(set
) != -ENOENT
)
3165 return PTR_ERR(set
);
3167 if (nlh
->nlmsg_flags
& NLM_F_EXCL
)
3169 if (nlh
->nlmsg_flags
& NLM_F_REPLACE
)
3174 if (!(nlh
->nlmsg_flags
& NLM_F_CREATE
))
3177 ops
= nft_select_set_ops(&ctx
, nla
, &desc
, policy
);
3179 return PTR_ERR(ops
);
3182 if (nla
[NFTA_SET_USERDATA
])
3183 udlen
= nla_len(nla
[NFTA_SET_USERDATA
]);
3186 if (ops
->privsize
!= NULL
)
3187 size
= ops
->privsize(nla
, &desc
);
3189 set
= kvzalloc(sizeof(*set
) + size
+ udlen
, GFP_KERNEL
);
3195 name
= nla_strdup(nla
[NFTA_SET_NAME
], GFP_KERNEL
);
3201 err
= nf_tables_set_alloc_name(&ctx
, set
, name
);
3208 udata
= set
->data
+ size
;
3209 nla_memcpy(udata
, nla
[NFTA_SET_USERDATA
], udlen
);
3212 INIT_LIST_HEAD(&set
->bindings
);
3215 set
->klen
= desc
.klen
;
3217 set
->objtype
= objtype
;
3218 set
->dlen
= desc
.dlen
;
3220 set
->size
= desc
.size
;
3221 set
->policy
= policy
;
3224 set
->timeout
= timeout
;
3225 set
->gc_int
= gc_int
;
3227 err
= ops
->init(set
, &desc
, nla
);
3231 err
= nft_trans_set_add(&ctx
, NFT_MSG_NEWSET
, set
);
3235 list_add_tail_rcu(&set
->list
, &table
->sets
);
3244 module_put(ops
->type
->owner
);
3248 static void nft_set_destroy(struct nft_set
*set
)
3250 set
->ops
->destroy(set
);
3251 module_put(set
->ops
->type
->owner
);
3256 static void nf_tables_set_destroy(const struct nft_ctx
*ctx
, struct nft_set
*set
)
3258 list_del_rcu(&set
->list
);
3259 nf_tables_set_notify(ctx
, set
, NFT_MSG_DELSET
, GFP_ATOMIC
);
3260 nft_set_destroy(set
);
3263 static int nf_tables_delset(struct net
*net
, struct sock
*nlsk
,
3264 struct sk_buff
*skb
, const struct nlmsghdr
*nlh
,
3265 const struct nlattr
* const nla
[],
3266 struct netlink_ext_ack
*extack
)
3268 const struct nfgenmsg
*nfmsg
= nlmsg_data(nlh
);
3269 u8 genmask
= nft_genmask_next(net
);
3270 struct nft_set
*set
;
3274 if (nfmsg
->nfgen_family
== NFPROTO_UNSPEC
)
3275 return -EAFNOSUPPORT
;
3276 if (nla
[NFTA_SET_TABLE
] == NULL
)
3279 err
= nft_ctx_init_from_setattr(&ctx
, net
, skb
, nlh
, nla
, genmask
);
3283 set
= nf_tables_set_lookup(ctx
.table
, nla
[NFTA_SET_NAME
], genmask
);
3285 return PTR_ERR(set
);
3287 if (!list_empty(&set
->bindings
) ||
3288 (nlh
->nlmsg_flags
& NLM_F_NONREC
&& atomic_read(&set
->nelems
) > 0))
3291 return nft_delset(&ctx
, set
);
3294 static int nf_tables_bind_check_setelem(const struct nft_ctx
*ctx
,
3295 struct nft_set
*set
,
3296 const struct nft_set_iter
*iter
,
3297 struct nft_set_elem
*elem
)
3299 const struct nft_set_ext
*ext
= nft_set_elem_ext(set
, elem
->priv
);
3300 enum nft_registers dreg
;
3302 dreg
= nft_type_to_reg(set
->dtype
);
3303 return nft_validate_register_store(ctx
, dreg
, nft_set_ext_data(ext
),
3304 set
->dtype
== NFT_DATA_VERDICT
?
3305 NFT_DATA_VERDICT
: NFT_DATA_VALUE
,
3309 int nf_tables_bind_set(const struct nft_ctx
*ctx
, struct nft_set
*set
,
3310 struct nft_set_binding
*binding
)
3312 struct nft_set_binding
*i
;
3313 struct nft_set_iter iter
;
3315 if (!list_empty(&set
->bindings
) && nft_set_is_anonymous(set
))
3318 if (binding
->flags
& NFT_SET_MAP
) {
3319 /* If the set is already bound to the same chain all
3320 * jumps are already validated for that chain.
3322 list_for_each_entry(i
, &set
->bindings
, list
) {
3323 if (i
->flags
& NFT_SET_MAP
&&
3324 i
->chain
== binding
->chain
)
3328 iter
.genmask
= nft_genmask_next(ctx
->net
);
3332 iter
.fn
= nf_tables_bind_check_setelem
;
3334 set
->ops
->walk(ctx
, set
, &iter
);
3339 binding
->chain
= ctx
->chain
;
3340 list_add_tail_rcu(&binding
->list
, &set
->bindings
);
3343 EXPORT_SYMBOL_GPL(nf_tables_bind_set
);
3345 void nf_tables_unbind_set(const struct nft_ctx
*ctx
, struct nft_set
*set
,
3346 struct nft_set_binding
*binding
)
3348 list_del_rcu(&binding
->list
);
3350 if (list_empty(&set
->bindings
) && nft_set_is_anonymous(set
) &&
3351 nft_is_active(ctx
->net
, set
))
3352 nf_tables_set_destroy(ctx
, set
);
3354 EXPORT_SYMBOL_GPL(nf_tables_unbind_set
);
3356 const struct nft_set_ext_type nft_set_ext_types
[] = {
3357 [NFT_SET_EXT_KEY
] = {
3358 .align
= __alignof__(u32
),
3360 [NFT_SET_EXT_DATA
] = {
3361 .align
= __alignof__(u32
),
3363 [NFT_SET_EXT_EXPR
] = {
3364 .align
= __alignof__(struct nft_expr
),
3366 [NFT_SET_EXT_OBJREF
] = {
3367 .len
= sizeof(struct nft_object
*),
3368 .align
= __alignof__(struct nft_object
*),
3370 [NFT_SET_EXT_FLAGS
] = {
3372 .align
= __alignof__(u8
),
3374 [NFT_SET_EXT_TIMEOUT
] = {
3376 .align
= __alignof__(u64
),
3378 [NFT_SET_EXT_EXPIRATION
] = {
3379 .len
= sizeof(unsigned long),
3380 .align
= __alignof__(unsigned long),
3382 [NFT_SET_EXT_USERDATA
] = {
3383 .len
= sizeof(struct nft_userdata
),
3384 .align
= __alignof__(struct nft_userdata
),
3387 EXPORT_SYMBOL_GPL(nft_set_ext_types
);
3393 static const struct nla_policy nft_set_elem_policy
[NFTA_SET_ELEM_MAX
+ 1] = {
3394 [NFTA_SET_ELEM_KEY
] = { .type
= NLA_NESTED
},
3395 [NFTA_SET_ELEM_DATA
] = { .type
= NLA_NESTED
},
3396 [NFTA_SET_ELEM_FLAGS
] = { .type
= NLA_U32
},
3397 [NFTA_SET_ELEM_TIMEOUT
] = { .type
= NLA_U64
},
3398 [NFTA_SET_ELEM_USERDATA
] = { .type
= NLA_BINARY
,
3399 .len
= NFT_USERDATA_MAXLEN
},
3402 static const struct nla_policy nft_set_elem_list_policy
[NFTA_SET_ELEM_LIST_MAX
+ 1] = {
3403 [NFTA_SET_ELEM_LIST_TABLE
] = { .type
= NLA_STRING
,
3404 .len
= NFT_TABLE_MAXNAMELEN
- 1 },
3405 [NFTA_SET_ELEM_LIST_SET
] = { .type
= NLA_STRING
,
3406 .len
= NFT_SET_MAXNAMELEN
- 1 },
3407 [NFTA_SET_ELEM_LIST_ELEMENTS
] = { .type
= NLA_NESTED
},
3408 [NFTA_SET_ELEM_LIST_SET_ID
] = { .type
= NLA_U32
},
3411 static int nft_ctx_init_from_elemattr(struct nft_ctx
*ctx
, struct net
*net
,
3412 const struct sk_buff
*skb
,
3413 const struct nlmsghdr
*nlh
,
3414 const struct nlattr
* const nla
[],
3417 const struct nfgenmsg
*nfmsg
= nlmsg_data(nlh
);
3418 struct nft_af_info
*afi
;
3419 struct nft_table
*table
;
3421 afi
= nf_tables_afinfo_lookup(net
, nfmsg
->nfgen_family
, false);
3423 return PTR_ERR(afi
);
3425 table
= nf_tables_table_lookup(afi
, nla
[NFTA_SET_ELEM_LIST_TABLE
],
3428 return PTR_ERR(table
);
3430 nft_ctx_init(ctx
, net
, skb
, nlh
, afi
, table
, NULL
, nla
);
3434 static int nf_tables_fill_setelem(struct sk_buff
*skb
,
3435 const struct nft_set
*set
,
3436 const struct nft_set_elem
*elem
)
3438 const struct nft_set_ext
*ext
= nft_set_elem_ext(set
, elem
->priv
);
3439 unsigned char *b
= skb_tail_pointer(skb
);
3440 struct nlattr
*nest
;
3442 nest
= nla_nest_start(skb
, NFTA_LIST_ELEM
);
3444 goto nla_put_failure
;
3446 if (nft_data_dump(skb
, NFTA_SET_ELEM_KEY
, nft_set_ext_key(ext
),
3447 NFT_DATA_VALUE
, set
->klen
) < 0)
3448 goto nla_put_failure
;
3450 if (nft_set_ext_exists(ext
, NFT_SET_EXT_DATA
) &&
3451 nft_data_dump(skb
, NFTA_SET_ELEM_DATA
, nft_set_ext_data(ext
),
3452 set
->dtype
== NFT_DATA_VERDICT
? NFT_DATA_VERDICT
: NFT_DATA_VALUE
,
3454 goto nla_put_failure
;
3456 if (nft_set_ext_exists(ext
, NFT_SET_EXT_EXPR
) &&
3457 nft_expr_dump(skb
, NFTA_SET_ELEM_EXPR
, nft_set_ext_expr(ext
)) < 0)
3458 goto nla_put_failure
;
3460 if (nft_set_ext_exists(ext
, NFT_SET_EXT_OBJREF
) &&
3461 nla_put_string(skb
, NFTA_SET_ELEM_OBJREF
,
3462 (*nft_set_ext_obj(ext
))->name
) < 0)
3463 goto nla_put_failure
;
3465 if (nft_set_ext_exists(ext
, NFT_SET_EXT_FLAGS
) &&
3466 nla_put_be32(skb
, NFTA_SET_ELEM_FLAGS
,
3467 htonl(*nft_set_ext_flags(ext
))))
3468 goto nla_put_failure
;
3470 if (nft_set_ext_exists(ext
, NFT_SET_EXT_TIMEOUT
) &&
3471 nla_put_be64(skb
, NFTA_SET_ELEM_TIMEOUT
,
3472 cpu_to_be64(jiffies_to_msecs(
3473 *nft_set_ext_timeout(ext
))),
3475 goto nla_put_failure
;
3477 if (nft_set_ext_exists(ext
, NFT_SET_EXT_EXPIRATION
)) {
3478 unsigned long expires
, now
= jiffies
;
3480 expires
= *nft_set_ext_expiration(ext
);
3481 if (time_before(now
, expires
))
3486 if (nla_put_be64(skb
, NFTA_SET_ELEM_EXPIRATION
,
3487 cpu_to_be64(jiffies_to_msecs(expires
)),
3489 goto nla_put_failure
;
3492 if (nft_set_ext_exists(ext
, NFT_SET_EXT_USERDATA
)) {
3493 struct nft_userdata
*udata
;
3495 udata
= nft_set_ext_userdata(ext
);
3496 if (nla_put(skb
, NFTA_SET_ELEM_USERDATA
,
3497 udata
->len
+ 1, udata
->data
))
3498 goto nla_put_failure
;
3501 nla_nest_end(skb
, nest
);
3509 struct nft_set_dump_args
{
3510 const struct netlink_callback
*cb
;
3511 struct nft_set_iter iter
;
3512 struct sk_buff
*skb
;
3515 static int nf_tables_dump_setelem(const struct nft_ctx
*ctx
,
3516 struct nft_set
*set
,
3517 const struct nft_set_iter
*iter
,
3518 struct nft_set_elem
*elem
)
3520 struct nft_set_dump_args
*args
;
3522 args
= container_of(iter
, struct nft_set_dump_args
, iter
);
3523 return nf_tables_fill_setelem(args
->skb
, set
, elem
);
3526 struct nft_set_dump_ctx
{
3527 const struct nft_set
*set
;
3531 static int nf_tables_dump_set(struct sk_buff
*skb
, struct netlink_callback
*cb
)
3533 struct nft_set_dump_ctx
*dump_ctx
= cb
->data
;
3534 struct net
*net
= sock_net(skb
->sk
);
3535 struct nft_af_info
*afi
;
3536 struct nft_table
*table
;
3537 struct nft_set
*set
;
3538 struct nft_set_dump_args args
;
3539 bool set_found
= false;
3540 struct nfgenmsg
*nfmsg
;
3541 struct nlmsghdr
*nlh
;
3542 struct nlattr
*nest
;
3547 list_for_each_entry_rcu(afi
, &net
->nft
.af_info
, list
) {
3548 if (afi
!= dump_ctx
->ctx
.afi
)
3551 list_for_each_entry_rcu(table
, &afi
->tables
, list
) {
3552 if (table
!= dump_ctx
->ctx
.table
)
3555 list_for_each_entry_rcu(set
, &table
->sets
, list
) {
3556 if (set
== dump_ctx
->set
) {
3571 event
= nfnl_msg_type(NFNL_SUBSYS_NFTABLES
, NFT_MSG_NEWSETELEM
);
3572 portid
= NETLINK_CB(cb
->skb
).portid
;
3573 seq
= cb
->nlh
->nlmsg_seq
;
3575 nlh
= nlmsg_put(skb
, portid
, seq
, event
, sizeof(struct nfgenmsg
),
3578 goto nla_put_failure
;
3580 nfmsg
= nlmsg_data(nlh
);
3581 nfmsg
->nfgen_family
= afi
->family
;
3582 nfmsg
->version
= NFNETLINK_V0
;
3583 nfmsg
->res_id
= htons(net
->nft
.base_seq
& 0xffff);
3585 if (nla_put_string(skb
, NFTA_SET_ELEM_LIST_TABLE
, table
->name
))
3586 goto nla_put_failure
;
3587 if (nla_put_string(skb
, NFTA_SET_ELEM_LIST_SET
, set
->name
))
3588 goto nla_put_failure
;
3590 nest
= nla_nest_start(skb
, NFTA_SET_ELEM_LIST_ELEMENTS
);
3592 goto nla_put_failure
;
3596 args
.iter
.genmask
= nft_genmask_cur(net
);
3597 args
.iter
.skip
= cb
->args
[0];
3598 args
.iter
.count
= 0;
3600 args
.iter
.fn
= nf_tables_dump_setelem
;
3601 set
->ops
->walk(&dump_ctx
->ctx
, set
, &args
.iter
);
3604 nla_nest_end(skb
, nest
);
3605 nlmsg_end(skb
, nlh
);
3607 if (args
.iter
.err
&& args
.iter
.err
!= -EMSGSIZE
)
3608 return args
.iter
.err
;
3609 if (args
.iter
.count
== cb
->args
[0])
3612 cb
->args
[0] = args
.iter
.count
;
3620 static int nf_tables_dump_set_done(struct netlink_callback
*cb
)
3626 static int nf_tables_fill_setelem_info(struct sk_buff
*skb
,
3627 const struct nft_ctx
*ctx
, u32 seq
,
3628 u32 portid
, int event
, u16 flags
,
3629 const struct nft_set
*set
,
3630 const struct nft_set_elem
*elem
)
3632 struct nfgenmsg
*nfmsg
;
3633 struct nlmsghdr
*nlh
;
3634 struct nlattr
*nest
;
3637 event
= nfnl_msg_type(NFNL_SUBSYS_NFTABLES
, event
);
3638 nlh
= nlmsg_put(skb
, portid
, seq
, event
, sizeof(struct nfgenmsg
),
3641 goto nla_put_failure
;
3643 nfmsg
= nlmsg_data(nlh
);
3644 nfmsg
->nfgen_family
= ctx
->afi
->family
;
3645 nfmsg
->version
= NFNETLINK_V0
;
3646 nfmsg
->res_id
= htons(ctx
->net
->nft
.base_seq
& 0xffff);
3648 if (nla_put_string(skb
, NFTA_SET_TABLE
, ctx
->table
->name
))
3649 goto nla_put_failure
;
3650 if (nla_put_string(skb
, NFTA_SET_NAME
, set
->name
))
3651 goto nla_put_failure
;
3653 nest
= nla_nest_start(skb
, NFTA_SET_ELEM_LIST_ELEMENTS
);
3655 goto nla_put_failure
;
3657 err
= nf_tables_fill_setelem(skb
, set
, elem
);
3659 goto nla_put_failure
;
3661 nla_nest_end(skb
, nest
);
3663 nlmsg_end(skb
, nlh
);
3667 nlmsg_trim(skb
, nlh
);
3671 static int nft_setelem_parse_flags(const struct nft_set
*set
,
3672 const struct nlattr
*attr
, u32
*flags
)
3677 *flags
= ntohl(nla_get_be32(attr
));
3678 if (*flags
& ~NFT_SET_ELEM_INTERVAL_END
)
3680 if (!(set
->flags
& NFT_SET_INTERVAL
) &&
3681 *flags
& NFT_SET_ELEM_INTERVAL_END
)
3687 static int nft_get_set_elem(struct nft_ctx
*ctx
, struct nft_set
*set
,
3688 const struct nlattr
*attr
)
3690 struct nlattr
*nla
[NFTA_SET_ELEM_MAX
+ 1];
3691 const struct nft_set_ext
*ext
;
3692 struct nft_data_desc desc
;
3693 struct nft_set_elem elem
;
3694 struct sk_buff
*skb
;
3699 err
= nla_parse_nested(nla
, NFTA_SET_ELEM_MAX
, attr
,
3700 nft_set_elem_policy
, NULL
);
3704 if (!nla
[NFTA_SET_ELEM_KEY
])
3707 err
= nft_setelem_parse_flags(set
, nla
[NFTA_SET_ELEM_FLAGS
], &flags
);
3711 err
= nft_data_init(ctx
, &elem
.key
.val
, sizeof(elem
.key
), &desc
,
3712 nla
[NFTA_SET_ELEM_KEY
]);
3717 if (desc
.type
!= NFT_DATA_VALUE
|| desc
.len
!= set
->klen
)
3720 priv
= set
->ops
->get(ctx
->net
, set
, &elem
, flags
);
3722 return PTR_ERR(priv
);
3725 ext
= nft_set_elem_ext(set
, &elem
);
3728 skb
= nlmsg_new(NLMSG_GOODSIZE
, GFP_KERNEL
);
3732 err
= nf_tables_fill_setelem_info(skb
, ctx
, ctx
->seq
, ctx
->portid
,
3733 NFT_MSG_NEWSETELEM
, 0, set
, &elem
);
3737 err
= nfnetlink_unicast(skb
, ctx
->net
, ctx
->portid
, MSG_DONTWAIT
);
3738 /* This avoids a loop in nfnetlink. */
3746 /* this avoids a loop in nfnetlink. */
3747 return err
== -EAGAIN
? -ENOBUFS
: err
;
3750 static int nf_tables_getsetelem(struct net
*net
, struct sock
*nlsk
,
3751 struct sk_buff
*skb
, const struct nlmsghdr
*nlh
,
3752 const struct nlattr
* const nla
[],
3753 struct netlink_ext_ack
*extack
)
3755 u8 genmask
= nft_genmask_cur(net
);
3756 struct nft_set
*set
;
3757 struct nlattr
*attr
;
3761 err
= nft_ctx_init_from_elemattr(&ctx
, net
, skb
, nlh
, nla
, genmask
);
3765 set
= nf_tables_set_lookup(ctx
.table
, nla
[NFTA_SET_ELEM_LIST_SET
],
3768 return PTR_ERR(set
);
3770 if (nlh
->nlmsg_flags
& NLM_F_DUMP
) {
3771 struct netlink_dump_control c
= {
3772 .dump
= nf_tables_dump_set
,
3773 .done
= nf_tables_dump_set_done
,
3775 struct nft_set_dump_ctx
*dump_ctx
;
3777 dump_ctx
= kmalloc(sizeof(*dump_ctx
), GFP_KERNEL
);
3781 dump_ctx
->set
= set
;
3782 dump_ctx
->ctx
= ctx
;
3785 return netlink_dump_start(nlsk
, skb
, nlh
, &c
);
3788 if (!nla
[NFTA_SET_ELEM_LIST_ELEMENTS
])
3791 nla_for_each_nested(attr
, nla
[NFTA_SET_ELEM_LIST_ELEMENTS
], rem
) {
3792 err
= nft_get_set_elem(&ctx
, set
, attr
);
3800 static void nf_tables_setelem_notify(const struct nft_ctx
*ctx
,
3801 const struct nft_set
*set
,
3802 const struct nft_set_elem
*elem
,
3803 int event
, u16 flags
)
3805 struct net
*net
= ctx
->net
;
3806 u32 portid
= ctx
->portid
;
3807 struct sk_buff
*skb
;
3810 if (!ctx
->report
&& !nfnetlink_has_listeners(net
, NFNLGRP_NFTABLES
))
3813 skb
= nlmsg_new(NLMSG_GOODSIZE
, GFP_KERNEL
);
3817 err
= nf_tables_fill_setelem_info(skb
, ctx
, 0, portid
, event
, flags
,
3824 nfnetlink_send(skb
, net
, portid
, NFNLGRP_NFTABLES
, ctx
->report
,
3828 nfnetlink_set_err(net
, portid
, NFNLGRP_NFTABLES
, -ENOBUFS
);
3831 static struct nft_trans
*nft_trans_elem_alloc(struct nft_ctx
*ctx
,
3833 struct nft_set
*set
)
3835 struct nft_trans
*trans
;
3837 trans
= nft_trans_alloc(ctx
, msg_type
, sizeof(struct nft_trans_elem
));
3841 nft_trans_elem_set(trans
) = set
;
3845 void *nft_set_elem_init(const struct nft_set
*set
,
3846 const struct nft_set_ext_tmpl
*tmpl
,
3847 const u32
*key
, const u32
*data
,
3848 u64 timeout
, gfp_t gfp
)
3850 struct nft_set_ext
*ext
;
3853 elem
= kzalloc(set
->ops
->elemsize
+ tmpl
->len
, gfp
);
3857 ext
= nft_set_elem_ext(set
, elem
);
3858 nft_set_ext_init(ext
, tmpl
);
3860 memcpy(nft_set_ext_key(ext
), key
, set
->klen
);
3861 if (nft_set_ext_exists(ext
, NFT_SET_EXT_DATA
))
3862 memcpy(nft_set_ext_data(ext
), data
, set
->dlen
);
3863 if (nft_set_ext_exists(ext
, NFT_SET_EXT_EXPIRATION
))
3864 *nft_set_ext_expiration(ext
) =
3866 if (nft_set_ext_exists(ext
, NFT_SET_EXT_TIMEOUT
))
3867 *nft_set_ext_timeout(ext
) = timeout
;
3872 void nft_set_elem_destroy(const struct nft_set
*set
, void *elem
,
3875 struct nft_set_ext
*ext
= nft_set_elem_ext(set
, elem
);
3877 nft_data_release(nft_set_ext_key(ext
), NFT_DATA_VALUE
);
3878 if (nft_set_ext_exists(ext
, NFT_SET_EXT_DATA
))
3879 nft_data_release(nft_set_ext_data(ext
), set
->dtype
);
3880 if (destroy_expr
&& nft_set_ext_exists(ext
, NFT_SET_EXT_EXPR
))
3881 nf_tables_expr_destroy(NULL
, nft_set_ext_expr(ext
));
3882 if (nft_set_ext_exists(ext
, NFT_SET_EXT_OBJREF
))
3883 (*nft_set_ext_obj(ext
))->use
--;
3886 EXPORT_SYMBOL_GPL(nft_set_elem_destroy
);
/* Only called from the commit path; nft_set_elem_deactivate() already deals
 * with the refcounting from the preparation phase.
 */
3891 static void nf_tables_set_elem_destroy(const struct nft_set
*set
, void *elem
)
3893 struct nft_set_ext
*ext
= nft_set_elem_ext(set
, elem
);
3895 if (nft_set_ext_exists(ext
, NFT_SET_EXT_EXPR
))
3896 nf_tables_expr_destroy(NULL
, nft_set_ext_expr(ext
));
3900 static int nft_add_set_elem(struct nft_ctx
*ctx
, struct nft_set
*set
,
3901 const struct nlattr
*attr
, u32 nlmsg_flags
)
3903 struct nlattr
*nla
[NFTA_SET_ELEM_MAX
+ 1];
3904 u8 genmask
= nft_genmask_next(ctx
->net
);
3905 struct nft_data_desc d1
, d2
;
3906 struct nft_set_ext_tmpl tmpl
;
3907 struct nft_set_ext
*ext
, *ext2
;
3908 struct nft_set_elem elem
;
3909 struct nft_set_binding
*binding
;
3910 struct nft_object
*obj
= NULL
;
3911 struct nft_userdata
*udata
;
3912 struct nft_data data
;
3913 enum nft_registers dreg
;
3914 struct nft_trans
*trans
;
3920 err
= nla_parse_nested(nla
, NFTA_SET_ELEM_MAX
, attr
,
3921 nft_set_elem_policy
, NULL
);
3925 if (nla
[NFTA_SET_ELEM_KEY
] == NULL
)
3928 nft_set_ext_prepare(&tmpl
);
3930 err
= nft_setelem_parse_flags(set
, nla
[NFTA_SET_ELEM_FLAGS
], &flags
);
3934 nft_set_ext_add(&tmpl
, NFT_SET_EXT_FLAGS
);
3936 if (set
->flags
& NFT_SET_MAP
) {
3937 if (nla
[NFTA_SET_ELEM_DATA
] == NULL
&&
3938 !(flags
& NFT_SET_ELEM_INTERVAL_END
))
3940 if (nla
[NFTA_SET_ELEM_DATA
] != NULL
&&
3941 flags
& NFT_SET_ELEM_INTERVAL_END
)
3944 if (nla
[NFTA_SET_ELEM_DATA
] != NULL
)
3949 if (nla
[NFTA_SET_ELEM_TIMEOUT
] != NULL
) {
3950 if (!(set
->flags
& NFT_SET_TIMEOUT
))
3952 timeout
= msecs_to_jiffies(be64_to_cpu(nla_get_be64(
3953 nla
[NFTA_SET_ELEM_TIMEOUT
])));
3954 } else if (set
->flags
& NFT_SET_TIMEOUT
) {
3955 timeout
= set
->timeout
;
3958 err
= nft_data_init(ctx
, &elem
.key
.val
, sizeof(elem
.key
), &d1
,
3959 nla
[NFTA_SET_ELEM_KEY
]);
3963 if (d1
.type
!= NFT_DATA_VALUE
|| d1
.len
!= set
->klen
)
3966 nft_set_ext_add_length(&tmpl
, NFT_SET_EXT_KEY
, d1
.len
);
3968 nft_set_ext_add(&tmpl
, NFT_SET_EXT_EXPIRATION
);
3969 if (timeout
!= set
->timeout
)
3970 nft_set_ext_add(&tmpl
, NFT_SET_EXT_TIMEOUT
);
3973 if (nla
[NFTA_SET_ELEM_OBJREF
] != NULL
) {
3974 if (!(set
->flags
& NFT_SET_OBJECT
)) {
3978 obj
= nf_tables_obj_lookup(ctx
->table
, nla
[NFTA_SET_ELEM_OBJREF
],
3979 set
->objtype
, genmask
);
3984 nft_set_ext_add(&tmpl
, NFT_SET_EXT_OBJREF
);
3987 if (nla
[NFTA_SET_ELEM_DATA
] != NULL
) {
3988 err
= nft_data_init(ctx
, &data
, sizeof(data
), &d2
,
3989 nla
[NFTA_SET_ELEM_DATA
]);
3994 if (set
->dtype
!= NFT_DATA_VERDICT
&& d2
.len
!= set
->dlen
)
3997 dreg
= nft_type_to_reg(set
->dtype
);
3998 list_for_each_entry(binding
, &set
->bindings
, list
) {
3999 struct nft_ctx bind_ctx
= {
4002 .table
= ctx
->table
,
4003 .chain
= (struct nft_chain
*)binding
->chain
,
4006 if (!(binding
->flags
& NFT_SET_MAP
))
4009 err
= nft_validate_register_store(&bind_ctx
, dreg
,
4016 nft_set_ext_add_length(&tmpl
, NFT_SET_EXT_DATA
, d2
.len
);
	/* The full maximum length of userdata can exceed the maximum
	 * offset value (U8_MAX) for following extensions, therefore it
	 * must be the last extension added.
	 */
4024 if (nla
[NFTA_SET_ELEM_USERDATA
] != NULL
) {
4025 ulen
= nla_len(nla
[NFTA_SET_ELEM_USERDATA
]);
4027 nft_set_ext_add_length(&tmpl
, NFT_SET_EXT_USERDATA
,
4032 elem
.priv
= nft_set_elem_init(set
, &tmpl
, elem
.key
.val
.data
, data
.data
,
4033 timeout
, GFP_KERNEL
);
4034 if (elem
.priv
== NULL
)
4037 ext
= nft_set_elem_ext(set
, elem
.priv
);
4039 *nft_set_ext_flags(ext
) = flags
;
4041 udata
= nft_set_ext_userdata(ext
);
4042 udata
->len
= ulen
- 1;
4043 nla_memcpy(&udata
->data
, nla
[NFTA_SET_ELEM_USERDATA
], ulen
);
4046 *nft_set_ext_obj(ext
) = obj
;
4050 trans
= nft_trans_elem_alloc(ctx
, NFT_MSG_NEWSETELEM
, set
);
4054 ext
->genmask
= nft_genmask_cur(ctx
->net
) | NFT_SET_ELEM_BUSY_MASK
;
4055 err
= set
->ops
->insert(ctx
->net
, set
, &elem
, &ext2
);
4057 if (err
== -EEXIST
) {
4058 if (nft_set_ext_exists(ext
, NFT_SET_EXT_DATA
) ^
4059 nft_set_ext_exists(ext2
, NFT_SET_EXT_DATA
) ||
4060 nft_set_ext_exists(ext
, NFT_SET_EXT_OBJREF
) ^
4061 nft_set_ext_exists(ext2
, NFT_SET_EXT_OBJREF
))
4063 if ((nft_set_ext_exists(ext
, NFT_SET_EXT_DATA
) &&
4064 nft_set_ext_exists(ext2
, NFT_SET_EXT_DATA
) &&
4065 memcmp(nft_set_ext_data(ext
),
4066 nft_set_ext_data(ext2
), set
->dlen
) != 0) ||
4067 (nft_set_ext_exists(ext
, NFT_SET_EXT_OBJREF
) &&
4068 nft_set_ext_exists(ext2
, NFT_SET_EXT_OBJREF
) &&
4069 *nft_set_ext_obj(ext
) != *nft_set_ext_obj(ext2
)))
4071 else if (!(nlmsg_flags
& NLM_F_EXCL
))
4078 !atomic_add_unless(&set
->nelems
, 1, set
->size
+ set
->ndeact
)) {
4083 nft_trans_elem(trans
) = elem
;
4084 list_add_tail(&trans
->list
, &ctx
->net
->nft
.commit_list
);
4088 set
->ops
->remove(ctx
->net
, set
, &elem
);
4094 if (nla
[NFTA_SET_ELEM_DATA
] != NULL
)
4095 nft_data_release(&data
, d2
.type
);
4097 nft_data_release(&elem
.key
.val
, d1
.type
);
4102 static int nf_tables_newsetelem(struct net
*net
, struct sock
*nlsk
,
4103 struct sk_buff
*skb
, const struct nlmsghdr
*nlh
,
4104 const struct nlattr
* const nla
[],
4105 struct netlink_ext_ack
*extack
)
4107 u8 genmask
= nft_genmask_next(net
);
4108 const struct nlattr
*attr
;
4109 struct nft_set
*set
;
4113 if (nla
[NFTA_SET_ELEM_LIST_ELEMENTS
] == NULL
)
4116 err
= nft_ctx_init_from_elemattr(&ctx
, net
, skb
, nlh
, nla
, genmask
);
4120 set
= nf_tables_set_lookup(ctx
.table
, nla
[NFTA_SET_ELEM_LIST_SET
],
4123 if (nla
[NFTA_SET_ELEM_LIST_SET_ID
]) {
4124 set
= nf_tables_set_lookup_byid(net
,
4125 nla
[NFTA_SET_ELEM_LIST_SET_ID
],
4129 return PTR_ERR(set
);
4132 if (!list_empty(&set
->bindings
) && set
->flags
& NFT_SET_CONSTANT
)
4135 nla_for_each_nested(attr
, nla
[NFTA_SET_ELEM_LIST_ELEMENTS
], rem
) {
4136 err
= nft_add_set_elem(&ctx
, set
, attr
, nlh
->nlmsg_flags
);
4144 * nft_data_hold - hold a nft_data item
4146 * @data: struct nft_data to release
4147 * @type: type of data
4149 * Hold a nft_data item. NFT_DATA_VALUE types can be silently discarded,
4150 * NFT_DATA_VERDICT bumps the reference to chains in case of NFT_JUMP and
4151 * NFT_GOTO verdicts. This function must be called on active data objects
4152 * from the second phase of the commit protocol.
4154 static void nft_data_hold(const struct nft_data
*data
, enum nft_data_types type
)
4156 if (type
== NFT_DATA_VERDICT
) {
4157 switch (data
->verdict
.code
) {
4160 data
->verdict
.chain
->use
++;
4166 static void nft_set_elem_activate(const struct net
*net
,
4167 const struct nft_set
*set
,
4168 struct nft_set_elem
*elem
)
4170 const struct nft_set_ext
*ext
= nft_set_elem_ext(set
, elem
->priv
);
4172 if (nft_set_ext_exists(ext
, NFT_SET_EXT_DATA
))
4173 nft_data_hold(nft_set_ext_data(ext
), set
->dtype
);
4174 if (nft_set_ext_exists(ext
, NFT_SET_EXT_OBJREF
))
4175 (*nft_set_ext_obj(ext
))->use
++;
4178 static void nft_set_elem_deactivate(const struct net
*net
,
4179 const struct nft_set
*set
,
4180 struct nft_set_elem
*elem
)
4182 const struct nft_set_ext
*ext
= nft_set_elem_ext(set
, elem
->priv
);
4184 if (nft_set_ext_exists(ext
, NFT_SET_EXT_DATA
))
4185 nft_data_release(nft_set_ext_data(ext
), set
->dtype
);
4186 if (nft_set_ext_exists(ext
, NFT_SET_EXT_OBJREF
))
4187 (*nft_set_ext_obj(ext
))->use
--;
4190 static int nft_del_setelem(struct nft_ctx
*ctx
, struct nft_set
*set
,
4191 const struct nlattr
*attr
)
4193 struct nlattr
*nla
[NFTA_SET_ELEM_MAX
+ 1];
4194 struct nft_set_ext_tmpl tmpl
;
4195 struct nft_data_desc desc
;
4196 struct nft_set_elem elem
;
4197 struct nft_set_ext
*ext
;
4198 struct nft_trans
*trans
;
4203 err
= nla_parse_nested(nla
, NFTA_SET_ELEM_MAX
, attr
,
4204 nft_set_elem_policy
, NULL
);
4209 if (nla
[NFTA_SET_ELEM_KEY
] == NULL
)
4212 nft_set_ext_prepare(&tmpl
);
4214 err
= nft_setelem_parse_flags(set
, nla
[NFTA_SET_ELEM_FLAGS
], &flags
);
4218 nft_set_ext_add(&tmpl
, NFT_SET_EXT_FLAGS
);
4220 err
= nft_data_init(ctx
, &elem
.key
.val
, sizeof(elem
.key
), &desc
,
4221 nla
[NFTA_SET_ELEM_KEY
]);
4226 if (desc
.type
!= NFT_DATA_VALUE
|| desc
.len
!= set
->klen
)
4229 nft_set_ext_add_length(&tmpl
, NFT_SET_EXT_KEY
, desc
.len
);
4232 elem
.priv
= nft_set_elem_init(set
, &tmpl
, elem
.key
.val
.data
, NULL
, 0,
4234 if (elem
.priv
== NULL
)
4237 ext
= nft_set_elem_ext(set
, elem
.priv
);
4239 *nft_set_ext_flags(ext
) = flags
;
4241 trans
= nft_trans_elem_alloc(ctx
, NFT_MSG_DELSETELEM
, set
);
4242 if (trans
== NULL
) {
4247 priv
= set
->ops
->deactivate(ctx
->net
, set
, &elem
);
4255 nft_set_elem_deactivate(ctx
->net
, set
, &elem
);
4257 nft_trans_elem(trans
) = elem
;
4258 list_add_tail(&trans
->list
, &ctx
->net
->nft
.commit_list
);
4266 nft_data_release(&elem
.key
.val
, desc
.type
);
4271 static int nft_flush_set(const struct nft_ctx
*ctx
,
4272 struct nft_set
*set
,
4273 const struct nft_set_iter
*iter
,
4274 struct nft_set_elem
*elem
)
4276 struct nft_trans
*trans
;
4279 trans
= nft_trans_alloc_gfp(ctx
, NFT_MSG_DELSETELEM
,
4280 sizeof(struct nft_trans_elem
), GFP_ATOMIC
);
4284 if (!set
->ops
->flush(ctx
->net
, set
, elem
->priv
)) {
4290 nft_trans_elem_set(trans
) = set
;
4291 nft_trans_elem(trans
) = *elem
;
4292 list_add_tail(&trans
->list
, &ctx
->net
->nft
.commit_list
);
4300 static int nf_tables_delsetelem(struct net
*net
, struct sock
*nlsk
,
4301 struct sk_buff
*skb
, const struct nlmsghdr
*nlh
,
4302 const struct nlattr
* const nla
[],
4303 struct netlink_ext_ack
*extack
)
4305 u8 genmask
= nft_genmask_next(net
);
4306 const struct nlattr
*attr
;
4307 struct nft_set
*set
;
4311 err
= nft_ctx_init_from_elemattr(&ctx
, net
, skb
, nlh
, nla
, genmask
);
4315 set
= nf_tables_set_lookup(ctx
.table
, nla
[NFTA_SET_ELEM_LIST_SET
],
4318 return PTR_ERR(set
);
4319 if (!list_empty(&set
->bindings
) && set
->flags
& NFT_SET_CONSTANT
)
4322 if (nla
[NFTA_SET_ELEM_LIST_ELEMENTS
] == NULL
) {
4323 struct nft_set_iter iter
= {
4325 .fn
= nft_flush_set
,
4327 set
->ops
->walk(&ctx
, set
, &iter
);
4332 nla_for_each_nested(attr
, nla
[NFTA_SET_ELEM_LIST_ELEMENTS
], rem
) {
4333 err
= nft_del_setelem(&ctx
, set
, attr
);
4342 void nft_set_gc_batch_release(struct rcu_head
*rcu
)
4344 struct nft_set_gc_batch
*gcb
;
4347 gcb
= container_of(rcu
, struct nft_set_gc_batch
, head
.rcu
);
4348 for (i
= 0; i
< gcb
->head
.cnt
; i
++)
4349 nft_set_elem_destroy(gcb
->head
.set
, gcb
->elems
[i
], true);
4352 EXPORT_SYMBOL_GPL(nft_set_gc_batch_release
);
4354 struct nft_set_gc_batch
*nft_set_gc_batch_alloc(const struct nft_set
*set
,
4357 struct nft_set_gc_batch
*gcb
;
4359 gcb
= kzalloc(sizeof(*gcb
), gfp
);
4362 gcb
->head
.set
= set
;
4365 EXPORT_SYMBOL_GPL(nft_set_gc_batch_alloc
);
4372 * nft_register_obj- register nf_tables stateful object type
4375 * Registers the object type for use with nf_tables. Returns zero on
4376 * success or a negative errno code otherwise.
4378 int nft_register_obj(struct nft_object_type
*obj_type
)
4380 if (obj_type
->type
== NFT_OBJECT_UNSPEC
)
4383 nfnl_lock(NFNL_SUBSYS_NFTABLES
);
4384 list_add_rcu(&obj_type
->list
, &nf_tables_objects
);
4385 nfnl_unlock(NFNL_SUBSYS_NFTABLES
);
4388 EXPORT_SYMBOL_GPL(nft_register_obj
);
4391 * nft_unregister_obj - unregister nf_tables object type
4394 * Unregisters the object type for use with nf_tables.
4396 void nft_unregister_obj(struct nft_object_type
*obj_type
)
4398 nfnl_lock(NFNL_SUBSYS_NFTABLES
);
4399 list_del_rcu(&obj_type
->list
);
4400 nfnl_unlock(NFNL_SUBSYS_NFTABLES
);
4402 EXPORT_SYMBOL_GPL(nft_unregister_obj
);
4404 struct nft_object
*nf_tables_obj_lookup(const struct nft_table
*table
,
4405 const struct nlattr
*nla
,
4406 u32 objtype
, u8 genmask
)
4408 struct nft_object
*obj
;
4410 list_for_each_entry(obj
, &table
->objects
, list
) {
4411 if (!nla_strcmp(nla
, obj
->name
) &&
4412 objtype
== obj
->ops
->type
->type
&&
4413 nft_active_genmask(obj
, genmask
))
4416 return ERR_PTR(-ENOENT
);
4418 EXPORT_SYMBOL_GPL(nf_tables_obj_lookup
);
4420 static const struct nla_policy nft_obj_policy
[NFTA_OBJ_MAX
+ 1] = {
4421 [NFTA_OBJ_TABLE
] = { .type
= NLA_STRING
,
4422 .len
= NFT_TABLE_MAXNAMELEN
- 1 },
4423 [NFTA_OBJ_NAME
] = { .type
= NLA_STRING
,
4424 .len
= NFT_OBJ_MAXNAMELEN
- 1 },
4425 [NFTA_OBJ_TYPE
] = { .type
= NLA_U32
},
4426 [NFTA_OBJ_DATA
] = { .type
= NLA_NESTED
},
4429 static struct nft_object
*nft_obj_init(const struct nft_ctx
*ctx
,
4430 const struct nft_object_type
*type
,
4431 const struct nlattr
*attr
)
4433 struct nlattr
*tb
[type
->maxattr
+ 1];
4434 const struct nft_object_ops
*ops
;
4435 struct nft_object
*obj
;
4439 err
= nla_parse_nested(tb
, type
->maxattr
, attr
, type
->policy
,
4444 memset(tb
, 0, sizeof(tb
[0]) * (type
->maxattr
+ 1));
4447 if (type
->select_ops
) {
4448 ops
= type
->select_ops(ctx
, (const struct nlattr
* const *)tb
);
4458 obj
= kzalloc(sizeof(*obj
) + ops
->size
, GFP_KERNEL
);
4462 err
= ops
->init(ctx
, (const struct nlattr
* const *)tb
, obj
);
4472 return ERR_PTR(err
);
4475 static int nft_object_dump(struct sk_buff
*skb
, unsigned int attr
,
4476 struct nft_object
*obj
, bool reset
)
4478 struct nlattr
*nest
;
4480 nest
= nla_nest_start(skb
, attr
);
4482 goto nla_put_failure
;
4483 if (obj
->ops
->dump(skb
, obj
, reset
) < 0)
4484 goto nla_put_failure
;
4485 nla_nest_end(skb
, nest
);
4492 static const struct nft_object_type
*__nft_obj_type_get(u32 objtype
)
4494 const struct nft_object_type
*type
;
4496 list_for_each_entry(type
, &nf_tables_objects
, list
) {
4497 if (objtype
== type
->type
)
4503 static const struct nft_object_type
*nft_obj_type_get(u32 objtype
)
4505 const struct nft_object_type
*type
;
4507 type
= __nft_obj_type_get(objtype
);
4508 if (type
!= NULL
&& try_module_get(type
->owner
))
4511 #ifdef CONFIG_MODULES
4513 nfnl_unlock(NFNL_SUBSYS_NFTABLES
);
4514 request_module("nft-obj-%u", objtype
);
4515 nfnl_lock(NFNL_SUBSYS_NFTABLES
);
4516 if (__nft_obj_type_get(objtype
))
4517 return ERR_PTR(-EAGAIN
);
4520 return ERR_PTR(-ENOENT
);
4523 static int nf_tables_newobj(struct net
*net
, struct sock
*nlsk
,
4524 struct sk_buff
*skb
, const struct nlmsghdr
*nlh
,
4525 const struct nlattr
* const nla
[],
4526 struct netlink_ext_ack
*extack
)
4528 const struct nfgenmsg
*nfmsg
= nlmsg_data(nlh
);
4529 const struct nft_object_type
*type
;
4530 u8 genmask
= nft_genmask_next(net
);
4531 int family
= nfmsg
->nfgen_family
;
4532 struct nft_af_info
*afi
;
4533 struct nft_table
*table
;
4534 struct nft_object
*obj
;
4539 if (!nla
[NFTA_OBJ_TYPE
] ||
4540 !nla
[NFTA_OBJ_NAME
] ||
4541 !nla
[NFTA_OBJ_DATA
])
4544 afi
= nf_tables_afinfo_lookup(net
, family
, true);
4546 return PTR_ERR(afi
);
4548 table
= nf_tables_table_lookup(afi
, nla
[NFTA_OBJ_TABLE
], genmask
);
4550 return PTR_ERR(table
);
4552 objtype
= ntohl(nla_get_be32(nla
[NFTA_OBJ_TYPE
]));
4553 obj
= nf_tables_obj_lookup(table
, nla
[NFTA_OBJ_NAME
], objtype
, genmask
);
4560 if (nlh
->nlmsg_flags
& NLM_F_EXCL
)
4566 nft_ctx_init(&ctx
, net
, skb
, nlh
, afi
, table
, NULL
, nla
);
4568 type
= nft_obj_type_get(objtype
);
4570 return PTR_ERR(type
);
4572 obj
= nft_obj_init(&ctx
, type
, nla
[NFTA_OBJ_DATA
]);
4578 obj
->name
= nla_strdup(nla
[NFTA_OBJ_NAME
], GFP_KERNEL
);
4584 err
= nft_trans_obj_add(&ctx
, NFT_MSG_NEWOBJ
, obj
);
4588 list_add_tail_rcu(&obj
->list
, &table
->objects
);
4594 if (obj
->ops
->destroy
)
4595 obj
->ops
->destroy(obj
);
4598 module_put(type
->owner
);
4602 static int nf_tables_fill_obj_info(struct sk_buff
*skb
, struct net
*net
,
4603 u32 portid
, u32 seq
, int event
, u32 flags
,
4604 int family
, const struct nft_table
*table
,
4605 struct nft_object
*obj
, bool reset
)
4607 struct nfgenmsg
*nfmsg
;
4608 struct nlmsghdr
*nlh
;
4610 event
= nfnl_msg_type(NFNL_SUBSYS_NFTABLES
, event
);
4611 nlh
= nlmsg_put(skb
, portid
, seq
, event
, sizeof(struct nfgenmsg
), flags
);
4613 goto nla_put_failure
;
4615 nfmsg
= nlmsg_data(nlh
);
4616 nfmsg
->nfgen_family
= family
;
4617 nfmsg
->version
= NFNETLINK_V0
;
4618 nfmsg
->res_id
= htons(net
->nft
.base_seq
& 0xffff);
4620 if (nla_put_string(skb
, NFTA_OBJ_TABLE
, table
->name
) ||
4621 nla_put_string(skb
, NFTA_OBJ_NAME
, obj
->name
) ||
4622 nla_put_be32(skb
, NFTA_OBJ_TYPE
, htonl(obj
->ops
->type
->type
)) ||
4623 nla_put_be32(skb
, NFTA_OBJ_USE
, htonl(obj
->use
)) ||
4624 nft_object_dump(skb
, NFTA_OBJ_DATA
, obj
, reset
))
4625 goto nla_put_failure
;
4627 nlmsg_end(skb
, nlh
);
4631 nlmsg_trim(skb
, nlh
);
4635 struct nft_obj_filter
{
4640 static int nf_tables_dump_obj(struct sk_buff
*skb
, struct netlink_callback
*cb
)
4642 const struct nfgenmsg
*nfmsg
= nlmsg_data(cb
->nlh
);
4643 const struct nft_af_info
*afi
;
4644 const struct nft_table
*table
;
4645 unsigned int idx
= 0, s_idx
= cb
->args
[0];
4646 struct nft_obj_filter
*filter
= cb
->data
;
4647 struct net
*net
= sock_net(skb
->sk
);
4648 int family
= nfmsg
->nfgen_family
;
4649 struct nft_object
*obj
;
4652 if (NFNL_MSG_TYPE(cb
->nlh
->nlmsg_type
) == NFT_MSG_GETOBJ_RESET
)
4656 cb
->seq
= net
->nft
.base_seq
;
4658 list_for_each_entry_rcu(afi
, &net
->nft
.af_info
, list
) {
4659 if (family
!= NFPROTO_UNSPEC
&& family
!= afi
->family
)
4662 list_for_each_entry_rcu(table
, &afi
->tables
, list
) {
4663 list_for_each_entry_rcu(obj
, &table
->objects
, list
) {
4664 if (!nft_is_active(net
, obj
))
4669 memset(&cb
->args
[1], 0,
4670 sizeof(cb
->args
) - sizeof(cb
->args
[0]));
4671 if (filter
&& filter
->table
[0] &&
4672 strcmp(filter
->table
, table
->name
))
4675 filter
->type
!= NFT_OBJECT_UNSPEC
&&
4676 obj
->ops
->type
->type
!= filter
->type
)
4679 if (nf_tables_fill_obj_info(skb
, net
, NETLINK_CB(cb
->skb
).portid
,
4682 NLM_F_MULTI
| NLM_F_APPEND
,
4683 afi
->family
, table
, obj
, reset
) < 0)
4686 nl_dump_check_consistent(cb
, nlmsg_hdr(skb
));
4699 static int nf_tables_dump_obj_done(struct netlink_callback
*cb
)
4701 struct nft_obj_filter
*filter
= cb
->data
;
4703 kfree(filter
->table
);
4709 static struct nft_obj_filter
*
4710 nft_obj_filter_alloc(const struct nlattr
* const nla
[])
4712 struct nft_obj_filter
*filter
;
4714 filter
= kzalloc(sizeof(*filter
), GFP_KERNEL
);
4716 return ERR_PTR(-ENOMEM
);
4718 if (nla
[NFTA_OBJ_TABLE
]) {
4719 filter
->table
= nla_strdup(nla
[NFTA_OBJ_TABLE
], GFP_KERNEL
);
4720 if (!filter
->table
) {
4722 return ERR_PTR(-ENOMEM
);
4725 if (nla
[NFTA_OBJ_TYPE
])
4726 filter
->type
= ntohl(nla_get_be32(nla
[NFTA_OBJ_TYPE
]));
4731 static int nf_tables_getobj(struct net
*net
, struct sock
*nlsk
,
4732 struct sk_buff
*skb
, const struct nlmsghdr
*nlh
,
4733 const struct nlattr
* const nla
[],
4734 struct netlink_ext_ack
*extack
)
4736 const struct nfgenmsg
*nfmsg
= nlmsg_data(nlh
);
4737 u8 genmask
= nft_genmask_cur(net
);
4738 int family
= nfmsg
->nfgen_family
;
4739 const struct nft_af_info
*afi
;
4740 const struct nft_table
*table
;
4741 struct nft_object
*obj
;
4742 struct sk_buff
*skb2
;
4747 if (nlh
->nlmsg_flags
& NLM_F_DUMP
) {
4748 struct netlink_dump_control c
= {
4749 .dump
= nf_tables_dump_obj
,
4750 .done
= nf_tables_dump_obj_done
,
4753 if (nla
[NFTA_OBJ_TABLE
] ||
4754 nla
[NFTA_OBJ_TYPE
]) {
4755 struct nft_obj_filter
*filter
;
4757 filter
= nft_obj_filter_alloc(nla
);
4763 return netlink_dump_start(nlsk
, skb
, nlh
, &c
);
4766 if (!nla
[NFTA_OBJ_NAME
] ||
4767 !nla
[NFTA_OBJ_TYPE
])
4770 afi
= nf_tables_afinfo_lookup(net
, family
, false);
4772 return PTR_ERR(afi
);
4774 table
= nf_tables_table_lookup(afi
, nla
[NFTA_OBJ_TABLE
], genmask
);
4776 return PTR_ERR(table
);
4778 objtype
= ntohl(nla_get_be32(nla
[NFTA_OBJ_TYPE
]));
4779 obj
= nf_tables_obj_lookup(table
, nla
[NFTA_OBJ_NAME
], objtype
, genmask
);
4781 return PTR_ERR(obj
);
4783 skb2
= alloc_skb(NLMSG_GOODSIZE
, GFP_KERNEL
);
4787 if (NFNL_MSG_TYPE(nlh
->nlmsg_type
) == NFT_MSG_GETOBJ_RESET
)
4790 err
= nf_tables_fill_obj_info(skb2
, net
, NETLINK_CB(skb
).portid
,
4791 nlh
->nlmsg_seq
, NFT_MSG_NEWOBJ
, 0,
4792 family
, table
, obj
, reset
);
4796 return nlmsg_unicast(nlsk
, skb2
, NETLINK_CB(skb
).portid
);
4802 static void nft_obj_destroy(struct nft_object
*obj
)
4804 if (obj
->ops
->destroy
)
4805 obj
->ops
->destroy(obj
);
4807 module_put(obj
->ops
->type
->owner
);
4812 static int nf_tables_delobj(struct net
*net
, struct sock
*nlsk
,
4813 struct sk_buff
*skb
, const struct nlmsghdr
*nlh
,
4814 const struct nlattr
* const nla
[],
4815 struct netlink_ext_ack
*extack
)
4817 const struct nfgenmsg
*nfmsg
= nlmsg_data(nlh
);
4818 u8 genmask
= nft_genmask_next(net
);
4819 int family
= nfmsg
->nfgen_family
;
4820 struct nft_af_info
*afi
;
4821 struct nft_table
*table
;
4822 struct nft_object
*obj
;
4826 if (!nla
[NFTA_OBJ_TYPE
] ||
4827 !nla
[NFTA_OBJ_NAME
])
4830 afi
= nf_tables_afinfo_lookup(net
, family
, true);
4832 return PTR_ERR(afi
);
4834 table
= nf_tables_table_lookup(afi
, nla
[NFTA_OBJ_TABLE
], genmask
);
4836 return PTR_ERR(table
);
4838 objtype
= ntohl(nla_get_be32(nla
[NFTA_OBJ_TYPE
]));
4839 obj
= nf_tables_obj_lookup(table
, nla
[NFTA_OBJ_NAME
], objtype
, genmask
);
4841 return PTR_ERR(obj
);
4845 nft_ctx_init(&ctx
, net
, skb
, nlh
, afi
, table
, NULL
, nla
);
4847 return nft_delobj(&ctx
, obj
);
4850 void nft_obj_notify(struct net
*net
, struct nft_table
*table
,
4851 struct nft_object
*obj
, u32 portid
, u32 seq
, int event
,
4852 int family
, int report
, gfp_t gfp
)
4854 struct sk_buff
*skb
;
4858 !nfnetlink_has_listeners(net
, NFNLGRP_NFTABLES
))
4861 skb
= nlmsg_new(NLMSG_GOODSIZE
, gfp
);
4865 err
= nf_tables_fill_obj_info(skb
, net
, portid
, seq
, event
, 0, family
,
4872 nfnetlink_send(skb
, net
, portid
, NFNLGRP_NFTABLES
, report
, gfp
);
4875 nfnetlink_set_err(net
, portid
, NFNLGRP_NFTABLES
, -ENOBUFS
);
4877 EXPORT_SYMBOL_GPL(nft_obj_notify
);
4879 static void nf_tables_obj_notify(const struct nft_ctx
*ctx
,
4880 struct nft_object
*obj
, int event
)
4882 nft_obj_notify(ctx
->net
, ctx
->table
, obj
, ctx
->portid
, ctx
->seq
, event
,
4883 ctx
->afi
->family
, ctx
->report
, GFP_KERNEL
);
4889 void nft_register_flowtable_type(struct nf_flowtable_type
*type
)
4891 nfnl_lock(NFNL_SUBSYS_NFTABLES
);
4892 list_add_tail_rcu(&type
->list
, &nf_tables_flowtables
);
4893 nfnl_unlock(NFNL_SUBSYS_NFTABLES
);
4895 EXPORT_SYMBOL_GPL(nft_register_flowtable_type
);
4897 void nft_unregister_flowtable_type(struct nf_flowtable_type
*type
)
4899 nfnl_lock(NFNL_SUBSYS_NFTABLES
);
4900 list_del_rcu(&type
->list
);
4901 nfnl_unlock(NFNL_SUBSYS_NFTABLES
);
4903 EXPORT_SYMBOL_GPL(nft_unregister_flowtable_type
);
4905 static const struct nla_policy nft_flowtable_policy
[NFTA_FLOWTABLE_MAX
+ 1] = {
4906 [NFTA_FLOWTABLE_TABLE
] = { .type
= NLA_STRING
,
4907 .len
= NFT_NAME_MAXLEN
- 1 },
4908 [NFTA_FLOWTABLE_NAME
] = { .type
= NLA_STRING
,
4909 .len
= NFT_NAME_MAXLEN
- 1 },
4910 [NFTA_FLOWTABLE_HOOK
] = { .type
= NLA_NESTED
},
4913 struct nft_flowtable
*nf_tables_flowtable_lookup(const struct nft_table
*table
,
4914 const struct nlattr
*nla
,
4917 struct nft_flowtable
*flowtable
;
4919 list_for_each_entry(flowtable
, &table
->flowtables
, list
) {
4920 if (!nla_strcmp(nla
, flowtable
->name
) &&
4921 nft_active_genmask(flowtable
, genmask
))
4924 return ERR_PTR(-ENOENT
);
4926 EXPORT_SYMBOL_GPL(nf_tables_flowtable_lookup
);
4928 #define NFT_FLOWTABLE_DEVICE_MAX 8
4930 static int nf_tables_parse_devices(const struct nft_ctx
*ctx
,
4931 const struct nlattr
*attr
,
4932 struct net_device
*dev_array
[], int *len
)
4934 const struct nlattr
*tmp
;
4935 struct net_device
*dev
;
4936 char ifname
[IFNAMSIZ
];
4937 int rem
, n
= 0, err
;
4939 nla_for_each_nested(tmp
, attr
, rem
) {
4940 if (nla_type(tmp
) != NFTA_DEVICE_NAME
) {
4945 nla_strlcpy(ifname
, tmp
, IFNAMSIZ
);
4946 dev
= dev_get_by_name(ctx
->net
, ifname
);
4952 dev_array
[n
++] = dev
;
4953 if (n
== NFT_FLOWTABLE_DEVICE_MAX
) {
4967 static const struct nla_policy nft_flowtable_hook_policy
[NFTA_FLOWTABLE_HOOK_MAX
+ 1] = {
4968 [NFTA_FLOWTABLE_HOOK_NUM
] = { .type
= NLA_U32
},
4969 [NFTA_FLOWTABLE_HOOK_PRIORITY
] = { .type
= NLA_U32
},
4970 [NFTA_FLOWTABLE_HOOK_DEVS
] = { .type
= NLA_NESTED
},
4973 static int nf_tables_flowtable_parse_hook(const struct nft_ctx
*ctx
,
4974 const struct nlattr
*attr
,
4975 struct nft_flowtable
*flowtable
)
4977 struct net_device
*dev_array
[NFT_FLOWTABLE_DEVICE_MAX
];
4978 struct nlattr
*tb
[NFTA_FLOWTABLE_HOOK_MAX
+ 1];
4979 struct nf_hook_ops
*ops
;
4980 int hooknum
, priority
;
4983 err
= nla_parse_nested(tb
, NFTA_FLOWTABLE_HOOK_MAX
, attr
,
4984 nft_flowtable_hook_policy
, NULL
);
4988 if (!tb
[NFTA_FLOWTABLE_HOOK_NUM
] ||
4989 !tb
[NFTA_FLOWTABLE_HOOK_PRIORITY
] ||
4990 !tb
[NFTA_FLOWTABLE_HOOK_DEVS
])
4993 hooknum
= ntohl(nla_get_be32(tb
[NFTA_FLOWTABLE_HOOK_NUM
]));
4994 if (hooknum
>= ctx
->afi
->nhooks
)
4997 priority
= ntohl(nla_get_be32(tb
[NFTA_FLOWTABLE_HOOK_PRIORITY
]));
4999 err
= nf_tables_parse_devices(ctx
, tb
[NFTA_FLOWTABLE_HOOK_DEVS
],
5004 ops
= kzalloc(sizeof(struct nf_hook_ops
) * n
, GFP_KERNEL
);
5010 flowtable
->ops
= ops
;
5011 flowtable
->ops_len
= n
;
5013 for (i
= 0; i
< n
; i
++) {
5014 flowtable
->ops
[i
].pf
= NFPROTO_NETDEV
;
5015 flowtable
->ops
[i
].hooknum
= hooknum
;
5016 flowtable
->ops
[i
].priority
= priority
;
5017 flowtable
->ops
[i
].priv
= &flowtable
->data
.rhashtable
;
5018 flowtable
->ops
[i
].hook
= flowtable
->data
.type
->hook
;
5019 flowtable
->ops
[i
].dev
= dev_array
[i
];
5024 for (i
= 0; i
< n
; i
++)
5025 dev_put(dev_array
[i
]);
5030 static const struct nf_flowtable_type
*
5031 __nft_flowtable_type_get(const struct nft_af_info
*afi
)
5033 const struct nf_flowtable_type
*type
;
5035 list_for_each_entry(type
, &nf_tables_flowtables
, list
) {
5036 if (afi
->family
== type
->family
)
5042 static const struct nf_flowtable_type
*
5043 nft_flowtable_type_get(const struct nft_af_info
*afi
)
5045 const struct nf_flowtable_type
*type
;
5047 type
= __nft_flowtable_type_get(afi
);
5048 if (type
!= NULL
&& try_module_get(type
->owner
))
5051 #ifdef CONFIG_MODULES
5053 nfnl_unlock(NFNL_SUBSYS_NFTABLES
);
5054 request_module("nf-flowtable-%u", afi
->family
);
5055 nfnl_lock(NFNL_SUBSYS_NFTABLES
);
5056 if (__nft_flowtable_type_get(afi
))
5057 return ERR_PTR(-EAGAIN
);
5060 return ERR_PTR(-ENOENT
);
5063 void nft_flow_table_iterate(struct net
*net
,
5064 void (*iter
)(struct nf_flowtable
*flowtable
, void *data
),
5067 struct nft_flowtable
*flowtable
;
5068 const struct nft_af_info
*afi
;
5069 const struct nft_table
*table
;
5072 list_for_each_entry_rcu(afi
, &net
->nft
.af_info
, list
) {
5073 list_for_each_entry_rcu(table
, &afi
->tables
, list
) {
5074 list_for_each_entry_rcu(flowtable
, &table
->flowtables
, list
) {
5075 iter(&flowtable
->data
, data
);
5081 EXPORT_SYMBOL_GPL(nft_flow_table_iterate
);
5083 static void nft_unregister_flowtable_net_hooks(struct net
*net
,
5084 struct nft_flowtable
*flowtable
)
5088 for (i
= 0; i
< flowtable
->ops_len
; i
++) {
5089 if (!flowtable
->ops
[i
].dev
)
5092 nf_unregister_net_hook(net
, &flowtable
->ops
[i
]);
5096 static int nf_tables_newflowtable(struct net
*net
, struct sock
*nlsk
,
5097 struct sk_buff
*skb
,
5098 const struct nlmsghdr
*nlh
,
5099 const struct nlattr
* const nla
[],
5100 struct netlink_ext_ack
*extack
)
5102 const struct nfgenmsg
*nfmsg
= nlmsg_data(nlh
);
5103 const struct nf_flowtable_type
*type
;
5104 u8 genmask
= nft_genmask_next(net
);
5105 int family
= nfmsg
->nfgen_family
;
5106 struct nft_flowtable
*flowtable
;
5107 struct nft_af_info
*afi
;
5108 struct nft_table
*table
;
5112 if (!nla
[NFTA_FLOWTABLE_TABLE
] ||
5113 !nla
[NFTA_FLOWTABLE_NAME
] ||
5114 !nla
[NFTA_FLOWTABLE_HOOK
])
5117 afi
= nf_tables_afinfo_lookup(net
, family
, true);
5119 return PTR_ERR(afi
);
5121 table
= nf_tables_table_lookup(afi
, nla
[NFTA_FLOWTABLE_TABLE
], genmask
);
5123 return PTR_ERR(table
);
5125 flowtable
= nf_tables_flowtable_lookup(table
, nla
[NFTA_FLOWTABLE_NAME
],
5127 if (IS_ERR(flowtable
)) {
5128 err
= PTR_ERR(flowtable
);
5132 if (nlh
->nlmsg_flags
& NLM_F_EXCL
)
5138 nft_ctx_init(&ctx
, net
, skb
, nlh
, afi
, table
, NULL
, nla
);
5140 flowtable
= kzalloc(sizeof(*flowtable
), GFP_KERNEL
);
5144 flowtable
->table
= table
;
5145 flowtable
->name
= nla_strdup(nla
[NFTA_FLOWTABLE_NAME
], GFP_KERNEL
);
5146 if (!flowtable
->name
) {
5151 type
= nft_flowtable_type_get(afi
);
5153 err
= PTR_ERR(type
);
5157 flowtable
->data
.type
= type
;
5158 err
= rhashtable_init(&flowtable
->data
.rhashtable
, type
->params
);
5162 err
= nf_tables_flowtable_parse_hook(&ctx
, nla
[NFTA_FLOWTABLE_HOOK
],
5167 for (i
= 0; i
< flowtable
->ops_len
; i
++) {
5168 err
= nf_register_net_hook(net
, &flowtable
->ops
[i
]);
5173 err
= nft_trans_flowtable_add(&ctx
, NFT_MSG_NEWFLOWTABLE
, flowtable
);
5177 INIT_DEFERRABLE_WORK(&flowtable
->data
.gc_work
, type
->gc
);
5178 queue_delayed_work(system_power_efficient_wq
,
5179 &flowtable
->data
.gc_work
, HZ
);
5181 list_add_tail_rcu(&flowtable
->list
, &table
->flowtables
);
5186 i
= flowtable
->ops_len
;
5188 for (k
= i
- 1; k
>= 0; k
--)
5189 nf_unregister_net_hook(net
, &flowtable
->ops
[i
]);
5191 kfree(flowtable
->ops
);
5193 module_put(type
->owner
);
5195 kfree(flowtable
->name
);
5201 static int nf_tables_delflowtable(struct net
*net
, struct sock
*nlsk
,
5202 struct sk_buff
*skb
,
5203 const struct nlmsghdr
*nlh
,
5204 const struct nlattr
* const nla
[],
5205 struct netlink_ext_ack
*extack
)
5207 const struct nfgenmsg
*nfmsg
= nlmsg_data(nlh
);
5208 u8 genmask
= nft_genmask_next(net
);
5209 int family
= nfmsg
->nfgen_family
;
5210 struct nft_flowtable
*flowtable
;
5211 struct nft_af_info
*afi
;
5212 struct nft_table
*table
;
5215 afi
= nf_tables_afinfo_lookup(net
, family
, true);
5217 return PTR_ERR(afi
);
5219 table
= nf_tables_table_lookup(afi
, nla
[NFTA_FLOWTABLE_TABLE
], genmask
);
5221 return PTR_ERR(table
);
5223 flowtable
= nf_tables_flowtable_lookup(table
, nla
[NFTA_FLOWTABLE_NAME
],
5225 if (IS_ERR(flowtable
))
5226 return PTR_ERR(flowtable
);
5227 if (flowtable
->use
> 0)
5230 nft_ctx_init(&ctx
, net
, skb
, nlh
, afi
, table
, NULL
, nla
);
5232 return nft_delflowtable(&ctx
, flowtable
);
5235 static int nf_tables_fill_flowtable_info(struct sk_buff
*skb
, struct net
*net
,
5236 u32 portid
, u32 seq
, int event
,
5237 u32 flags
, int family
,
5238 struct nft_flowtable
*flowtable
)
5240 struct nlattr
*nest
, *nest_devs
;
5241 struct nfgenmsg
*nfmsg
;
5242 struct nlmsghdr
*nlh
;
5245 event
= nfnl_msg_type(NFNL_SUBSYS_NFTABLES
, event
);
5246 nlh
= nlmsg_put(skb
, portid
, seq
, event
, sizeof(struct nfgenmsg
), flags
);
5248 goto nla_put_failure
;
5250 nfmsg
= nlmsg_data(nlh
);
5251 nfmsg
->nfgen_family
= family
;
5252 nfmsg
->version
= NFNETLINK_V0
;
5253 nfmsg
->res_id
= htons(net
->nft
.base_seq
& 0xffff);
5255 if (nla_put_string(skb
, NFTA_FLOWTABLE_TABLE
, flowtable
->table
->name
) ||
5256 nla_put_string(skb
, NFTA_FLOWTABLE_NAME
, flowtable
->name
) ||
5257 nla_put_be32(skb
, NFTA_FLOWTABLE_USE
, htonl(flowtable
->use
)))
5258 goto nla_put_failure
;
5260 nest
= nla_nest_start(skb
, NFTA_FLOWTABLE_HOOK
);
5261 if (nla_put_be32(skb
, NFTA_FLOWTABLE_HOOK_NUM
, htonl(flowtable
->hooknum
)) ||
5262 nla_put_be32(skb
, NFTA_FLOWTABLE_HOOK_PRIORITY
, htonl(flowtable
->priority
)))
5263 goto nla_put_failure
;
5265 nest_devs
= nla_nest_start(skb
, NFTA_FLOWTABLE_HOOK_DEVS
);
5267 goto nla_put_failure
;
5269 for (i
= 0; i
< flowtable
->ops_len
; i
++) {
5270 if (flowtable
->ops
[i
].dev
&&
5271 nla_put_string(skb
, NFTA_DEVICE_NAME
,
5272 flowtable
->ops
[i
].dev
->name
))
5273 goto nla_put_failure
;
5275 nla_nest_end(skb
, nest_devs
);
5276 nla_nest_end(skb
, nest
);
5278 nlmsg_end(skb
, nlh
);
5282 nlmsg_trim(skb
, nlh
);
5286 struct nft_flowtable_filter
{
5290 static int nf_tables_dump_flowtable(struct sk_buff
*skb
,
5291 struct netlink_callback
*cb
)
5293 const struct nfgenmsg
*nfmsg
= nlmsg_data(cb
->nlh
);
5294 struct nft_flowtable_filter
*filter
= cb
->data
;
5295 unsigned int idx
= 0, s_idx
= cb
->args
[0];
5296 struct net
*net
= sock_net(skb
->sk
);
5297 int family
= nfmsg
->nfgen_family
;
5298 struct nft_flowtable
*flowtable
;
5299 const struct nft_af_info
*afi
;
5300 const struct nft_table
*table
;
5303 cb
->seq
= net
->nft
.base_seq
;
5305 list_for_each_entry_rcu(afi
, &net
->nft
.af_info
, list
) {
5306 if (family
!= NFPROTO_UNSPEC
&& family
!= afi
->family
)
5309 list_for_each_entry_rcu(table
, &afi
->tables
, list
) {
5310 list_for_each_entry_rcu(flowtable
, &table
->flowtables
, list
) {
5311 if (!nft_is_active(net
, flowtable
))
5316 memset(&cb
->args
[1], 0,
5317 sizeof(cb
->args
) - sizeof(cb
->args
[0]));
5318 if (filter
&& filter
->table
[0] &&
5319 strcmp(filter
->table
, table
->name
))
5322 if (nf_tables_fill_flowtable_info(skb
, net
, NETLINK_CB(cb
->skb
).portid
,
5324 NFT_MSG_NEWFLOWTABLE
,
5325 NLM_F_MULTI
| NLM_F_APPEND
,
5326 afi
->family
, flowtable
) < 0)
5329 nl_dump_check_consistent(cb
, nlmsg_hdr(skb
));
5342 static int nf_tables_dump_flowtable_done(struct netlink_callback
*cb
)
5344 struct nft_flowtable_filter
*filter
= cb
->data
;
5349 kfree(filter
->table
);
5355 static struct nft_flowtable_filter
*
5356 nft_flowtable_filter_alloc(const struct nlattr
* const nla
[])
5358 struct nft_flowtable_filter
*filter
;
5360 filter
= kzalloc(sizeof(*filter
), GFP_KERNEL
);
5362 return ERR_PTR(-ENOMEM
);
5364 if (nla
[NFTA_FLOWTABLE_TABLE
]) {
5365 filter
->table
= nla_strdup(nla
[NFTA_FLOWTABLE_TABLE
],
5367 if (!filter
->table
) {
5369 return ERR_PTR(-ENOMEM
);
5375 static int nf_tables_getflowtable(struct net
*net
, struct sock
*nlsk
,
5376 struct sk_buff
*skb
,
5377 const struct nlmsghdr
*nlh
,
5378 const struct nlattr
* const nla
[],
5379 struct netlink_ext_ack
*extack
)
5381 const struct nfgenmsg
*nfmsg
= nlmsg_data(nlh
);
5382 u8 genmask
= nft_genmask_cur(net
);
5383 int family
= nfmsg
->nfgen_family
;
5384 struct nft_flowtable
*flowtable
;
5385 const struct nft_af_info
*afi
;
5386 const struct nft_table
*table
;
5387 struct sk_buff
*skb2
;
5390 if (nlh
->nlmsg_flags
& NLM_F_DUMP
) {
5391 struct netlink_dump_control c
= {
5392 .dump
= nf_tables_dump_flowtable
,
5393 .done
= nf_tables_dump_flowtable_done
,
5396 if (nla
[NFTA_FLOWTABLE_TABLE
]) {
5397 struct nft_flowtable_filter
*filter
;
5399 filter
= nft_flowtable_filter_alloc(nla
);
5405 return netlink_dump_start(nlsk
, skb
, nlh
, &c
);
5408 if (!nla
[NFTA_FLOWTABLE_NAME
])
5411 afi
= nf_tables_afinfo_lookup(net
, family
, false);
5413 return PTR_ERR(afi
);
5415 table
= nf_tables_table_lookup(afi
, nla
[NFTA_FLOWTABLE_TABLE
], genmask
);
5417 return PTR_ERR(table
);
5419 flowtable
= nf_tables_flowtable_lookup(table
, nla
[NFTA_FLOWTABLE_NAME
],
5422 return PTR_ERR(flowtable
);
5424 skb2
= alloc_skb(NLMSG_GOODSIZE
, GFP_KERNEL
);
5428 err
= nf_tables_fill_flowtable_info(skb2
, net
, NETLINK_CB(skb
).portid
,
5430 NFT_MSG_NEWFLOWTABLE
, 0, family
,
5435 return nlmsg_unicast(nlsk
, skb2
, NETLINK_CB(skb
).portid
);
5441 static void nf_tables_flowtable_notify(struct nft_ctx
*ctx
,
5442 struct nft_flowtable
*flowtable
,
5445 struct sk_buff
*skb
;
5449 !nfnetlink_has_listeners(ctx
->net
, NFNLGRP_NFTABLES
))
5452 skb
= nlmsg_new(NLMSG_GOODSIZE
, GFP_KERNEL
);
5456 err
= nf_tables_fill_flowtable_info(skb
, ctx
->net
, ctx
->portid
,
5458 ctx
->afi
->family
, flowtable
);
5464 nfnetlink_send(skb
, ctx
->net
, ctx
->portid
, NFNLGRP_NFTABLES
,
5465 ctx
->report
, GFP_KERNEL
);
5468 nfnetlink_set_err(ctx
->net
, ctx
->portid
, NFNLGRP_NFTABLES
, -ENOBUFS
);
/*
 * Per-entry free callback passed to rhashtable_free_and_destroy():
 * releases the entry with kfree(). @arg is unused.
 */
static void nft_flowtable_destroy(void *ptr, void *arg)
{
	kfree(ptr);
}
5476 static void nf_tables_flowtable_destroy(struct nft_flowtable
*flowtable
)
5478 cancel_delayed_work_sync(&flowtable
->data
.gc_work
);
5479 kfree(flowtable
->name
);
5480 rhashtable_free_and_destroy(&flowtable
->data
.rhashtable
,
5481 nft_flowtable_destroy
, NULL
);
5482 module_put(flowtable
->data
.type
->owner
);
5485 static int nf_tables_fill_gen_info(struct sk_buff
*skb
, struct net
*net
,
5486 u32 portid
, u32 seq
)
5488 struct nlmsghdr
*nlh
;
5489 struct nfgenmsg
*nfmsg
;
5490 char buf
[TASK_COMM_LEN
];
5491 int event
= nfnl_msg_type(NFNL_SUBSYS_NFTABLES
, NFT_MSG_NEWGEN
);
5493 nlh
= nlmsg_put(skb
, portid
, seq
, event
, sizeof(struct nfgenmsg
), 0);
5495 goto nla_put_failure
;
5497 nfmsg
= nlmsg_data(nlh
);
5498 nfmsg
->nfgen_family
= AF_UNSPEC
;
5499 nfmsg
->version
= NFNETLINK_V0
;
5500 nfmsg
->res_id
= htons(net
->nft
.base_seq
& 0xffff);
5502 if (nla_put_be32(skb
, NFTA_GEN_ID
, htonl(net
->nft
.base_seq
)) ||
5503 nla_put_be32(skb
, NFTA_GEN_PROC_PID
, htonl(task_pid_nr(current
))) ||
5504 nla_put_string(skb
, NFTA_GEN_PROC_NAME
, get_task_comm(buf
, current
)))
5505 goto nla_put_failure
;
5507 nlmsg_end(skb
, nlh
);
5511 nlmsg_trim(skb
, nlh
);
5515 static void nft_flowtable_event(unsigned long event
, struct net_device
*dev
,
5516 struct nft_flowtable
*flowtable
)
5520 for (i
= 0; i
< flowtable
->ops_len
; i
++) {
5521 if (flowtable
->ops
[i
].dev
!= dev
)
5524 nf_unregister_net_hook(dev_net(dev
), &flowtable
->ops
[i
]);
5525 flowtable
->ops
[i
].dev
= NULL
;
5530 static int nf_tables_flowtable_event(struct notifier_block
*this,
5531 unsigned long event
, void *ptr
)
5533 struct net_device
*dev
= netdev_notifier_info_to_dev(ptr
);
5534 struct nft_flowtable
*flowtable
;
5535 struct nft_table
*table
;
5536 struct nft_af_info
*afi
;
5538 if (event
!= NETDEV_UNREGISTER
)
5541 nfnl_lock(NFNL_SUBSYS_NFTABLES
);
5542 list_for_each_entry(afi
, &dev_net(dev
)->nft
.af_info
, list
) {
5543 list_for_each_entry(table
, &afi
->tables
, list
) {
5544 list_for_each_entry(flowtable
, &table
->flowtables
, list
) {
5545 nft_flowtable_event(event
, dev
, flowtable
);
5549 nfnl_unlock(NFNL_SUBSYS_NFTABLES
);
5554 static struct notifier_block nf_tables_flowtable_notifier
= {
5555 .notifier_call
= nf_tables_flowtable_event
,
5558 static void nf_tables_gen_notify(struct net
*net
, struct sk_buff
*skb
,
5561 struct nlmsghdr
*nlh
= nlmsg_hdr(skb
);
5562 struct sk_buff
*skb2
;
5565 if (nlmsg_report(nlh
) &&
5566 !nfnetlink_has_listeners(net
, NFNLGRP_NFTABLES
))
5569 skb2
= nlmsg_new(NLMSG_GOODSIZE
, GFP_KERNEL
);
5573 err
= nf_tables_fill_gen_info(skb2
, net
, NETLINK_CB(skb
).portid
,
5580 nfnetlink_send(skb2
, net
, NETLINK_CB(skb
).portid
, NFNLGRP_NFTABLES
,
5581 nlmsg_report(nlh
), GFP_KERNEL
);
5584 nfnetlink_set_err(net
, NETLINK_CB(skb
).portid
, NFNLGRP_NFTABLES
,
5588 static int nf_tables_getgen(struct net
*net
, struct sock
*nlsk
,
5589 struct sk_buff
*skb
, const struct nlmsghdr
*nlh
,
5590 const struct nlattr
* const nla
[],
5591 struct netlink_ext_ack
*extack
)
5593 struct sk_buff
*skb2
;
5596 skb2
= alloc_skb(NLMSG_GOODSIZE
, GFP_KERNEL
);
5600 err
= nf_tables_fill_gen_info(skb2
, net
, NETLINK_CB(skb
).portid
,
5605 return nlmsg_unicast(nlsk
, skb2
, NETLINK_CB(skb
).portid
);
5611 static const struct nfnl_callback nf_tables_cb
[NFT_MSG_MAX
] = {
5612 [NFT_MSG_NEWTABLE
] = {
5613 .call_batch
= nf_tables_newtable
,
5614 .attr_count
= NFTA_TABLE_MAX
,
5615 .policy
= nft_table_policy
,
5617 [NFT_MSG_GETTABLE
] = {
5618 .call
= nf_tables_gettable
,
5619 .attr_count
= NFTA_TABLE_MAX
,
5620 .policy
= nft_table_policy
,
5622 [NFT_MSG_DELTABLE
] = {
5623 .call_batch
= nf_tables_deltable
,
5624 .attr_count
= NFTA_TABLE_MAX
,
5625 .policy
= nft_table_policy
,
5627 [NFT_MSG_NEWCHAIN
] = {
5628 .call_batch
= nf_tables_newchain
,
5629 .attr_count
= NFTA_CHAIN_MAX
,
5630 .policy
= nft_chain_policy
,
5632 [NFT_MSG_GETCHAIN
] = {
5633 .call
= nf_tables_getchain
,
5634 .attr_count
= NFTA_CHAIN_MAX
,
5635 .policy
= nft_chain_policy
,
5637 [NFT_MSG_DELCHAIN
] = {
5638 .call_batch
= nf_tables_delchain
,
5639 .attr_count
= NFTA_CHAIN_MAX
,
5640 .policy
= nft_chain_policy
,
5642 [NFT_MSG_NEWRULE
] = {
5643 .call_batch
= nf_tables_newrule
,
5644 .attr_count
= NFTA_RULE_MAX
,
5645 .policy
= nft_rule_policy
,
5647 [NFT_MSG_GETRULE
] = {
5648 .call
= nf_tables_getrule
,
5649 .attr_count
= NFTA_RULE_MAX
,
5650 .policy
= nft_rule_policy
,
5652 [NFT_MSG_DELRULE
] = {
5653 .call_batch
= nf_tables_delrule
,
5654 .attr_count
= NFTA_RULE_MAX
,
5655 .policy
= nft_rule_policy
,
5657 [NFT_MSG_NEWSET
] = {
5658 .call_batch
= nf_tables_newset
,
5659 .attr_count
= NFTA_SET_MAX
,
5660 .policy
= nft_set_policy
,
5662 [NFT_MSG_GETSET
] = {
5663 .call
= nf_tables_getset
,
5664 .attr_count
= NFTA_SET_MAX
,
5665 .policy
= nft_set_policy
,
5667 [NFT_MSG_DELSET
] = {
5668 .call_batch
= nf_tables_delset
,
5669 .attr_count
= NFTA_SET_MAX
,
5670 .policy
= nft_set_policy
,
5672 [NFT_MSG_NEWSETELEM
] = {
5673 .call_batch
= nf_tables_newsetelem
,
5674 .attr_count
= NFTA_SET_ELEM_LIST_MAX
,
5675 .policy
= nft_set_elem_list_policy
,
5677 [NFT_MSG_GETSETELEM
] = {
5678 .call
= nf_tables_getsetelem
,
5679 .attr_count
= NFTA_SET_ELEM_LIST_MAX
,
5680 .policy
= nft_set_elem_list_policy
,
5682 [NFT_MSG_DELSETELEM
] = {
5683 .call_batch
= nf_tables_delsetelem
,
5684 .attr_count
= NFTA_SET_ELEM_LIST_MAX
,
5685 .policy
= nft_set_elem_list_policy
,
5687 [NFT_MSG_GETGEN
] = {
5688 .call
= nf_tables_getgen
,
5690 [NFT_MSG_NEWOBJ
] = {
5691 .call_batch
= nf_tables_newobj
,
5692 .attr_count
= NFTA_OBJ_MAX
,
5693 .policy
= nft_obj_policy
,
5695 [NFT_MSG_GETOBJ
] = {
5696 .call
= nf_tables_getobj
,
5697 .attr_count
= NFTA_OBJ_MAX
,
5698 .policy
= nft_obj_policy
,
5700 [NFT_MSG_DELOBJ
] = {
5701 .call_batch
= nf_tables_delobj
,
5702 .attr_count
= NFTA_OBJ_MAX
,
5703 .policy
= nft_obj_policy
,
5705 [NFT_MSG_GETOBJ_RESET
] = {
5706 .call
= nf_tables_getobj
,
5707 .attr_count
= NFTA_OBJ_MAX
,
5708 .policy
= nft_obj_policy
,
5710 [NFT_MSG_NEWFLOWTABLE
] = {
5711 .call_batch
= nf_tables_newflowtable
,
5712 .attr_count
= NFTA_FLOWTABLE_MAX
,
5713 .policy
= nft_flowtable_policy
,
5715 [NFT_MSG_GETFLOWTABLE
] = {
5716 .call
= nf_tables_getflowtable
,
5717 .attr_count
= NFTA_FLOWTABLE_MAX
,
5718 .policy
= nft_flowtable_policy
,
5720 [NFT_MSG_DELFLOWTABLE
] = {
5721 .call_batch
= nf_tables_delflowtable
,
5722 .attr_count
= NFTA_FLOWTABLE_MAX
,
5723 .policy
= nft_flowtable_policy
,
5727 static void nft_chain_commit_update(struct nft_trans
*trans
)
5729 struct nft_base_chain
*basechain
;
5731 if (nft_trans_chain_name(trans
))
5732 strcpy(trans
->ctx
.chain
->name
, nft_trans_chain_name(trans
));
5734 if (!nft_is_base_chain(trans
->ctx
.chain
))
5737 basechain
= nft_base_chain(trans
->ctx
.chain
);
5738 nft_chain_stats_replace(basechain
, nft_trans_chain_stats(trans
));
5740 switch (nft_trans_chain_policy(trans
)) {
5743 basechain
->policy
= nft_trans_chain_policy(trans
);
/*
 * nf_tables_commit_release - destroy the object a committed delete
 * transaction refers to.
 *
 * Switches on trans->msg_type. Every visible case is an NFT_MSG_DEL* type
 * and calls the matching destructor: table, chain, rule, set, set element,
 * stateful object or flowtable.
 *
 * NOTE(review): whatever follows the switch (e.g. releasing @trans itself)
 * is not visible in this excerpt.
 */
5748 static void nf_tables_commit_release(struct nft_trans
*trans
)
5750 switch (trans
->msg_type
) {
5751 case NFT_MSG_DELTABLE
:
5752 nf_tables_table_destroy(&trans
->ctx
);
5754 case NFT_MSG_DELCHAIN
:
5755 nf_tables_chain_destroy(trans
->ctx
.chain
);
5757 case NFT_MSG_DELRULE
:
5758 nf_tables_rule_destroy(&trans
->ctx
, nft_trans_rule(trans
));
5760 case NFT_MSG_DELSET
:
5761 nft_set_destroy(nft_trans_set(trans
));
5763 case NFT_MSG_DELSETELEM
:
5764 nf_tables_set_elem_destroy(nft_trans_elem_set(trans
),
5765 nft_trans_elem(trans
).priv
);
5767 case NFT_MSG_DELOBJ
:
5768 nft_obj_destroy(nft_trans_obj(trans
));
5770 case NFT_MSG_DELFLOWTABLE
:
5771 nf_tables_flowtable_destroy(nft_trans_flowtable(trans
));
/*
 * nf_tables_commit - commit every transaction queued on
 * net->nft.commit_list.
 *
 * Visible flow:
 *  1. net->nft.base_seq is incremented, skipping the value 0, and
 *     net->nft.gencursor is advanced with nft_gencursor_next().
 *  2. First pass over commit_list, switching on trans->msg_type:
 *     - NEW* types activate their object (nft_clear(), or
 *       set->ops->activate() for set elements), send the matching
 *       notification and release the transaction with nft_trans_destroy().
 *       A table update with the enable flag clear disables the table and
 *       sets NFT_TABLE_F_DORMANT; a chain update goes through
 *       nft_chain_commit_update().
 *     - DEL* types unlink the object with list_del_rcu() (set elements use
 *       set->ops->remove() and decrement set->nelems) and notify. No
 *       nft_trans_destroy() call is visible for them.
 *  3. Second pass: each remaining transaction is unlinked with list_del()
 *     and passed to nf_tables_commit_release().
 *  4. nf_tables_gen_notify() announces NFT_MSG_NEWGEN.
 *
 * NOTE(review): several original lines (break statements, some call
 * arguments, the statement following the "previous generation" comment and
 * the return) are not visible in this excerpt.
 */
5777 static int nf_tables_commit(struct net
*net
, struct sk_buff
*skb
)
5779 struct nft_trans
*trans
, *next
;
5780 struct nft_trans_elem
*te
;
5782 /* Bump generation counter, invalidate any dump in progress */
5783 while (++net
->nft
.base_seq
== 0);
5785 /* A new generation has just started */
5786 net
->nft
.gencursor
= nft_gencursor_next(net
);
5788 /* Make sure all packets have left the previous generation before
5789 * purging old rules.
5793 list_for_each_entry_safe(trans
, next
, &net
->nft
.commit_list
, list
) {
5794 switch (trans
->msg_type
) {
5795 case NFT_MSG_NEWTABLE
:
5796 if (nft_trans_table_update(trans
)) {
5797 if (!nft_trans_table_enable(trans
)) {
5798 nf_tables_table_disable(net
,
5801 trans
->ctx
.table
->flags
|= NFT_TABLE_F_DORMANT
;
5804 nft_clear(net
, trans
->ctx
.table
);
5806 nf_tables_table_notify(&trans
->ctx
, NFT_MSG_NEWTABLE
);
5807 nft_trans_destroy(trans
);
5809 case NFT_MSG_DELTABLE
:
5810 list_del_rcu(&trans
->ctx
.table
->list
);
5811 nf_tables_table_notify(&trans
->ctx
, NFT_MSG_DELTABLE
);
5813 case NFT_MSG_NEWCHAIN
:
5814 if (nft_trans_chain_update(trans
))
5815 nft_chain_commit_update(trans
);
5817 nft_clear(net
, trans
->ctx
.chain
);
5819 nf_tables_chain_notify(&trans
->ctx
, NFT_MSG_NEWCHAIN
);
5820 nft_trans_destroy(trans
);
5822 case NFT_MSG_DELCHAIN
:
5823 list_del_rcu(&trans
->ctx
.chain
->list
);
5824 nf_tables_chain_notify(&trans
->ctx
, NFT_MSG_DELCHAIN
);
5825 nf_tables_unregister_hook(trans
->ctx
.net
,
5829 case NFT_MSG_NEWRULE
:
5830 nft_clear(trans
->ctx
.net
, nft_trans_rule(trans
));
5831 nf_tables_rule_notify(&trans
->ctx
,
5832 nft_trans_rule(trans
),
5834 nft_trans_destroy(trans
);
5836 case NFT_MSG_DELRULE
:
5837 list_del_rcu(&nft_trans_rule(trans
)->list
);
5838 nf_tables_rule_notify(&trans
->ctx
,
5839 nft_trans_rule(trans
),
5842 case NFT_MSG_NEWSET
:
5843 nft_clear(net
, nft_trans_set(trans
));
5844 /* This avoids hitting -EBUSY when deleting the table
5845 * from the transaction.
5847 if (nft_set_is_anonymous(nft_trans_set(trans
)) &&
5848 !list_empty(&nft_trans_set(trans
)->bindings
))
5849 trans
->ctx
.table
->use
--;
5851 nf_tables_set_notify(&trans
->ctx
, nft_trans_set(trans
),
5852 NFT_MSG_NEWSET
, GFP_KERNEL
);
5853 nft_trans_destroy(trans
);
5855 case NFT_MSG_DELSET
:
5856 list_del_rcu(&nft_trans_set(trans
)->list
);
5857 nf_tables_set_notify(&trans
->ctx
, nft_trans_set(trans
),
5858 NFT_MSG_DELSET
, GFP_KERNEL
);
5860 case NFT_MSG_NEWSETELEM
:
5861 te
= (struct nft_trans_elem
*)trans
->data
;
5863 te
->set
->ops
->activate(net
, te
->set
, &te
->elem
);
5864 nf_tables_setelem_notify(&trans
->ctx
, te
->set
,
5866 NFT_MSG_NEWSETELEM
, 0);
5867 nft_trans_destroy(trans
);
5869 case NFT_MSG_DELSETELEM
:
5870 te
= (struct nft_trans_elem
*)trans
->data
;
5872 nf_tables_setelem_notify(&trans
->ctx
, te
->set
,
5874 NFT_MSG_DELSETELEM
, 0);
5875 te
->set
->ops
->remove(net
, te
->set
, &te
->elem
);
5876 atomic_dec(&te
->set
->nelems
);
5879 case NFT_MSG_NEWOBJ
:
5880 nft_clear(net
, nft_trans_obj(trans
));
5881 nf_tables_obj_notify(&trans
->ctx
, nft_trans_obj(trans
),
5883 nft_trans_destroy(trans
);
5885 case NFT_MSG_DELOBJ
:
5886 list_del_rcu(&nft_trans_obj(trans
)->list
);
5887 nf_tables_obj_notify(&trans
->ctx
, nft_trans_obj(trans
),
5890 case NFT_MSG_NEWFLOWTABLE
:
5891 nft_clear(net
, nft_trans_flowtable(trans
));
5892 nf_tables_flowtable_notify(&trans
->ctx
,
5893 nft_trans_flowtable(trans
),
5894 NFT_MSG_NEWFLOWTABLE
);
5895 nft_trans_destroy(trans
);
5897 case NFT_MSG_DELFLOWTABLE
:
5898 list_del_rcu(&nft_trans_flowtable(trans
)->list
);
5899 nf_tables_flowtable_notify(&trans
->ctx
,
5900 nft_trans_flowtable(trans
),
5901 NFT_MSG_DELFLOWTABLE
);
5902 nft_unregister_flowtable_net_hooks(net
,
5903 nft_trans_flowtable(trans
));
5910 list_for_each_entry_safe(trans
, next
, &net
->nft
.commit_list
, list
) {
5911 list_del(&trans
->list
);
5912 nf_tables_commit_release(trans
);
5915 nf_tables_gen_notify(net
, skb
, NFT_MSG_NEWGEN
);
/*
 * nf_tables_abort_release - destroy the object an aborted "new" transaction
 * had created.
 *
 * Switches on trans->msg_type. Every visible case is an NFT_MSG_NEW* type
 * and calls the matching destructor: table, chain, rule, set, set element
 * (nft_set_elem_destroy() with its last argument true), stateful object or
 * flowtable.
 *
 * NOTE(review): whatever follows the switch (e.g. releasing @trans itself)
 * is not visible in this excerpt.
 */
5920 static void nf_tables_abort_release(struct nft_trans
*trans
)
5922 switch (trans
->msg_type
) {
5923 case NFT_MSG_NEWTABLE
:
5924 nf_tables_table_destroy(&trans
->ctx
);
5926 case NFT_MSG_NEWCHAIN
:
5927 nf_tables_chain_destroy(trans
->ctx
.chain
);
5929 case NFT_MSG_NEWRULE
:
5930 nf_tables_rule_destroy(&trans
->ctx
, nft_trans_rule(trans
));
5932 case NFT_MSG_NEWSET
:
5933 nft_set_destroy(nft_trans_set(trans
));
5935 case NFT_MSG_NEWSETELEM
:
5936 nft_set_elem_destroy(nft_trans_elem_set(trans
),
5937 nft_trans_elem(trans
).priv
, true);
5939 case NFT_MSG_NEWOBJ
:
5940 nft_obj_destroy(nft_trans_obj(trans
));
5942 case NFT_MSG_NEWFLOWTABLE
:
5943 nf_tables_flowtable_destroy(nft_trans_flowtable(trans
));
/*
 * nf_tables_abort - roll back every transaction queued on
 * net->nft.commit_list.
 *
 * Visible flow:
 *  1. The list is walked in reverse, switching on trans->msg_type:
 *     - NEW* types undo the addition: the owner's use counter is
 *       decremented and the object is unlinked with list_del_rcu() (set
 *       elements use set->ops->remove() and decrement set->nelems; new
 *       chains and flowtables also unregister their hooks). A table update
 *       whose enable flag is set disables the table again and sets
 *       NFT_TABLE_F_DORMANT; a chain update frees the pending per-cpu
 *       stats. Update transactions are released with nft_trans_destroy().
 *     - DEL* types undo the removal: the owner's use counter is incremented
 *       (not for tables or set elements), the object is re-activated
 *       (nft_clear(), or nft_set_elem_activate() plus set->ops->activate()
 *       for set elements) and the transaction is released with
 *       nft_trans_destroy().
 *  2. A second reverse walk unlinks whatever is left with list_del() and
 *     hands it to nf_tables_abort_release().
 *
 * NOTE(review): several original lines (break statements, else branches,
 * some call arguments, anything between the two loops, and the return) are
 * not visible in this excerpt.
 */
5949 static int nf_tables_abort(struct net
*net
, struct sk_buff
*skb
)
5951 struct nft_trans
*trans
, *next
;
5952 struct nft_trans_elem
*te
;
5954 list_for_each_entry_safe_reverse(trans
, next
, &net
->nft
.commit_list
,
5956 switch (trans
->msg_type
) {
5957 case NFT_MSG_NEWTABLE
:
5958 if (nft_trans_table_update(trans
)) {
5959 if (nft_trans_table_enable(trans
)) {
5960 nf_tables_table_disable(net
,
5963 trans
->ctx
.table
->flags
|= NFT_TABLE_F_DORMANT
;
5965 nft_trans_destroy(trans
);
5967 list_del_rcu(&trans
->ctx
.table
->list
);
5970 case NFT_MSG_DELTABLE
:
5971 nft_clear(trans
->ctx
.net
, trans
->ctx
.table
);
5972 nft_trans_destroy(trans
);
5974 case NFT_MSG_NEWCHAIN
:
5975 if (nft_trans_chain_update(trans
)) {
5976 free_percpu(nft_trans_chain_stats(trans
));
5978 nft_trans_destroy(trans
);
5980 trans
->ctx
.table
->use
--;
5981 list_del_rcu(&trans
->ctx
.chain
->list
);
5982 nf_tables_unregister_hook(trans
->ctx
.net
,
5987 case NFT_MSG_DELCHAIN
:
5988 trans
->ctx
.table
->use
++;
5989 nft_clear(trans
->ctx
.net
, trans
->ctx
.chain
);
5990 nft_trans_destroy(trans
);
5992 case NFT_MSG_NEWRULE
:
5993 trans
->ctx
.chain
->use
--;
5994 list_del_rcu(&nft_trans_rule(trans
)->list
);
5996 case NFT_MSG_DELRULE
:
5997 trans
->ctx
.chain
->use
++;
5998 nft_clear(trans
->ctx
.net
, nft_trans_rule(trans
));
5999 nft_trans_destroy(trans
);
6001 case NFT_MSG_NEWSET
:
6002 trans
->ctx
.table
->use
--;
6003 list_del_rcu(&nft_trans_set(trans
)->list
);
6005 case NFT_MSG_DELSET
:
6006 trans
->ctx
.table
->use
++;
6007 nft_clear(trans
->ctx
.net
, nft_trans_set(trans
));
6008 nft_trans_destroy(trans
);
6010 case NFT_MSG_NEWSETELEM
:
6011 te
= (struct nft_trans_elem
*)trans
->data
;
6013 te
->set
->ops
->remove(net
, te
->set
, &te
->elem
);
6014 atomic_dec(&te
->set
->nelems
);
6016 case NFT_MSG_DELSETELEM
:
6017 te
= (struct nft_trans_elem
*)trans
->data
;
6019 nft_set_elem_activate(net
, te
->set
, &te
->elem
);
6020 te
->set
->ops
->activate(net
, te
->set
, &te
->elem
);
6023 nft_trans_destroy(trans
);
6025 case NFT_MSG_NEWOBJ
:
6026 trans
->ctx
.table
->use
--;
6027 list_del_rcu(&nft_trans_obj(trans
)->list
);
6029 case NFT_MSG_DELOBJ
:
6030 trans
->ctx
.table
->use
++;
6031 nft_clear(trans
->ctx
.net
, nft_trans_obj(trans
));
6032 nft_trans_destroy(trans
);
6034 case NFT_MSG_NEWFLOWTABLE
:
6035 trans
->ctx
.table
->use
--;
6036 list_del_rcu(&nft_trans_flowtable(trans
)->list
);
6037 nft_unregister_flowtable_net_hooks(net
,
6038 nft_trans_flowtable(trans
));
6040 case NFT_MSG_DELFLOWTABLE
:
6041 trans
->ctx
.table
->use
++;
6042 nft_clear(trans
->ctx
.net
, nft_trans_flowtable(trans
));
6043 nft_trans_destroy(trans
);
6050 list_for_each_entry_safe_reverse(trans
, next
,
6051 &net
->nft
.commit_list
, list
) {
6052 list_del(&trans
->list
);
6053 nf_tables_abort_release(trans
);
6059 static bool nf_tables_valid_genid(struct net
*net
, u32 genid
)
6061 return net
->nft
.base_seq
== genid
;
/*
 * nfnetlink subsystem descriptor for nf_tables: names the subsystem, binds
 * it to NFNL_SUBSYS_NFTABLES, sizes the callback table with NFT_MSG_MAX and
 * installs the batch commit/abort handlers and the generation-id validator.
 *
 * NOTE(review): not every initializer line of the original is visible in
 * this excerpt.
 */
6064 static const struct nfnetlink_subsystem nf_tables_subsys
= {
6065 .name
= "nf_tables",
6066 .subsys_id
= NFNL_SUBSYS_NFTABLES
,
6067 .cb_count
= NFT_MSG_MAX
,
6069 .commit
= nf_tables_commit
,
6070 .abort
= nf_tables_abort
,
6071 .valid_genid
= nf_tables_valid_genid
,
/*
 * nft_chain_validate_dependency - check a chain against a required chain
 * type.
 *
 * Only base chains are inspected: the base chain's type->type is compared
 * with @type. Exported with EXPORT_SYMBOL_GPL.
 *
 * NOTE(review): the return statements are not visible in this excerpt, so
 * the exact error code on a mismatch cannot be stated from here.
 */
6074 int nft_chain_validate_dependency(const struct nft_chain
*chain
,
6075 enum nft_chain_type type
)
6077 const struct nft_base_chain
*basechain
;
6079 if (nft_is_base_chain(chain
)) {
6080 basechain
= nft_base_chain(chain
);
6081 if (basechain
->type
->type
!= type
)
6086 EXPORT_SYMBOL_GPL(nft_chain_validate_dependency
);
/*
 * nft_chain_validate_hooks - check a base chain's hook against a bitmask.
 *
 * Only base chains are inspected: bit (1 << basechain->ops.hooknum) is
 * tested against @hook_flags, so @hook_flags is a mask with one bit per
 * hook number. Exported with EXPORT_SYMBOL_GPL.
 *
 * NOTE(review): the return statements are not visible in this excerpt.
 */
6088 int nft_chain_validate_hooks(const struct nft_chain
*chain
,
6089 unsigned int hook_flags
)
6091 struct nft_base_chain
*basechain
;
6093 if (nft_is_base_chain(chain
)) {
6094 basechain
= nft_base_chain(chain
);
6096 if ((1 << basechain
->ops
.hooknum
) & hook_flags
)
6104 EXPORT_SYMBOL_GPL(nft_chain_validate_hooks
);
6107 * Loop detection - walk through the ruleset beginning at the destination chain
6108 * of a new jump until either the source chain is reached (loop) or all
6109 * reachable chains have been traversed.
6111 * The loop check is performed whenever a new jump verdict is added to an
6112 * expression or verdict map or a verdict map is bound to a new chain.
/*
 * Forward declaration of nf_tables_check_loops(), followed by
 * nf_tables_loop_check_setelem(), the per-element callback used while
 * walking a set during loop detection.
 *
 * The callback fetches the element's extension area, tests for elements
 * that carry the flags extension with NFT_SET_ELEM_INTERVAL_END set, then
 * reads the element's data and switches on data->verdict.code; the visible
 * branch recurses into nf_tables_check_loops() with the verdict's chain.
 *
 * NOTE(review): the statement taken for interval-end elements, the case
 * labels of the switch and the default return are not visible in this
 * excerpt.
 */
6115 static int nf_tables_check_loops(const struct nft_ctx
*ctx
,
6116 const struct nft_chain
*chain
);
6118 static int nf_tables_loop_check_setelem(const struct nft_ctx
*ctx
,
6119 struct nft_set
*set
,
6120 const struct nft_set_iter
*iter
,
6121 struct nft_set_elem
*elem
)
6123 const struct nft_set_ext
*ext
= nft_set_elem_ext(set
, elem
->priv
);
6124 const struct nft_data
*data
;
6126 if (nft_set_ext_exists(ext
, NFT_SET_EXT_FLAGS
) &&
6127 *nft_set_ext_flags(ext
) & NFT_SET_ELEM_INTERVAL_END
)
6130 data
= nft_set_ext_data(ext
);
6131 switch (data
->verdict
.code
) {
6134 return nf_tables_check_loops(ctx
, data
->verdict
.chain
);
/*
 * nf_tables_check_loops - recursive part of the loop detection.
 *
 * Visible flow:
 *  1. @chain is compared with ctx->chain, the chain the walk started from.
 *  2. Every expression of every rule in @chain that provides an
 *     ops->validate() callback is asked for its data; the resulting
 *     data->verdict.code is switched on and the visible branch recurses
 *     into data->verdict.chain.
 *  3. Every set of ctx->table that is active in the next generation, is
 *     flagged NFT_SET_MAP and has dtype NFT_DATA_VERDICT is examined: for
 *     each binding flagged NFT_SET_MAP whose chain is @chain, the set is
 *     walked with nf_tables_loop_check_setelem() as iterator callback,
 *     using the next-generation genmask.
 *
 * NOTE(review): the return values (including the one used when a loop is
 * found), the error checks after validate()/walk(), the case labels and
 * the remaining iterator fields are not visible in this excerpt.
 */
6140 static int nf_tables_check_loops(const struct nft_ctx
*ctx
,
6141 const struct nft_chain
*chain
)
6143 const struct nft_rule
*rule
;
6144 const struct nft_expr
*expr
, *last
;
6145 struct nft_set
*set
;
6146 struct nft_set_binding
*binding
;
6147 struct nft_set_iter iter
;
6149 if (ctx
->chain
== chain
)
6152 list_for_each_entry(rule
, &chain
->rules
, list
) {
6153 nft_rule_for_each_expr(expr
, last
, rule
) {
6154 const struct nft_data
*data
= NULL
;
6157 if (!expr
->ops
->validate
)
6160 err
= expr
->ops
->validate(ctx
, expr
, &data
);
6167 switch (data
->verdict
.code
) {
6170 err
= nf_tables_check_loops(ctx
,
6171 data
->verdict
.chain
);
6180 list_for_each_entry(set
, &ctx
->table
->sets
, list
) {
6181 if (!nft_is_active_next(ctx
->net
, set
))
6183 if (!(set
->flags
& NFT_SET_MAP
) ||
6184 set
->dtype
!= NFT_DATA_VERDICT
)
6187 list_for_each_entry(binding
, &set
->bindings
, list
) {
6188 if (!(binding
->flags
& NFT_SET_MAP
) ||
6189 binding
->chain
!= chain
)
6192 iter
.genmask
= nft_genmask_next(ctx
->net
);
6196 iter
.fn
= nf_tables_loop_check_setelem
;
6198 set
->ops
->walk(ctx
, set
, &iter
);
6208 * nft_parse_u32_check - fetch u32 attribute and check for maximum value
6210 * @attr: netlink attribute to fetch value from
6211 * @max: maximum value to be stored in dest
6212 * @dest: pointer to the variable
6214 * Parse, check and store a given u32 netlink attribute into variable.
6215 * This function returns -ERANGE if the value goes over maximum value.
6216 * Otherwise a 0 is returned and the attribute value is stored in the
6217 * destination variable.
/*
 * Implementation note: the attribute payload is read as a big-endian 32-bit
 * value and converted to host order with ntohl() before it is checked.
 *
 * NOTE(review): @max is declared as int while the parsed value is u32; the
 * comparison itself is not visible in this excerpt - confirm callers never
 * pass a negative @max.
 */
6219 int nft_parse_u32_check(const struct nlattr
*attr
, int max
, u32
*dest
)
6223 val
= ntohl(nla_get_be32(attr
));
6230 EXPORT_SYMBOL_GPL(nft_parse_u32_check
);
6233 * nft_parse_register - parse a register value from a netlink attribute
6235 * @attr: netlink attribute
6237 * Parse and translate a register value from a netlink attribute.
6238 * Registers used to be 128 bit wide, these register numbers will be
6239 * mapped to the corresponding 32 bit register numbers.
/*
 * Implementation note: the register number is read as a big-endian 32-bit
 * value. Numbers in the range NFT_REG_VERDICT...NFT_REG_4 are scaled by
 * NFT_REG_SIZE / NFT_REG32_SIZE; the other visible return rebases the
 * number from NFT_REG32_00 onto the slot NFT_REG_SIZE / NFT_REG32_SIZE.
 *
 * NOTE(review): the switch statement line and the label of the second
 * return are not visible in this excerpt.
 */
6241 unsigned int nft_parse_register(const struct nlattr
*attr
)
6245 reg
= ntohl(nla_get_be32(attr
));
6247 case NFT_REG_VERDICT
...NFT_REG_4
:
6248 return reg
* NFT_REG_SIZE
/ NFT_REG32_SIZE
;
6250 return reg
+ NFT_REG_SIZE
/ NFT_REG32_SIZE
- NFT_REG32_00
;
6253 EXPORT_SYMBOL_GPL(nft_parse_register
);
6256 * nft_dump_register - dump a register value to a netlink attribute
6258 * @skb: socket buffer
6259 * @attr: attribute number
6260 * @reg: register number
6262 * Construct a netlink attribute containing the register number. For
6263 * compatibility reasons, register numbers being a multiple of 4 are
6264 * translated to the corresponding 128 bit register numbers.
/*
 * Implementation note: this is the inverse of the mapping done when a
 * register attribute is parsed. A register index that is a multiple of
 * NFT_REG_SIZE / NFT_REG32_SIZE is divided by that factor; the other
 * visible assignment rebases the index onto NFT_REG32_00. The result is
 * emitted as a big-endian 32-bit attribute, and the function returns
 * whatever nla_put_be32() returns.
 *
 * NOTE(review): the keyword joining the two assignments (presumably else)
 * is not visible in this excerpt.
 */
6266 int nft_dump_register(struct sk_buff
*skb
, unsigned int attr
, unsigned int reg
)
6268 if (reg
% (NFT_REG_SIZE
/ NFT_REG32_SIZE
) == 0)
6269 reg
= reg
/ (NFT_REG_SIZE
/ NFT_REG32_SIZE
);
6271 reg
= reg
- NFT_REG_SIZE
/ NFT_REG32_SIZE
+ NFT_REG32_00
;
6273 return nla_put_be32(skb
, attr
, htonl(reg
));
6275 EXPORT_SYMBOL_GPL(nft_dump_register
);
6278 * nft_validate_register_load - validate a load from a register
6280 * @reg: the register number
6281 * @len: the length of the data
6283 * Validate that the input register is one of the general purpose
6284 * registers and that the length of the load is within the bounds.
/*
 * Implementation note: two checks are visible. The first tests for a
 * register index below NFT_REG_1 * NFT_REG_SIZE / NFT_REG32_SIZE, i.e. the
 * slots in front of the first general purpose register. The second tests
 * whether the byte range starting at reg * NFT_REG32_SIZE and spanning @len
 * bytes runs past the size of the data field of struct nft_regs.
 *
 * NOTE(review): the return statements (and therefore the error codes) are
 * not visible in this excerpt.
 */
6286 int nft_validate_register_load(enum nft_registers reg
, unsigned int len
)
6288 if (reg
< NFT_REG_1
* NFT_REG_SIZE
/ NFT_REG32_SIZE
)
6292 if (reg
* NFT_REG32_SIZE
+ len
> FIELD_SIZEOF(struct nft_regs
, data
))
6297 EXPORT_SYMBOL_GPL(nft_validate_register_load
);
6300 * nft_validate_register_store - validate an expression's register store
6302 * @ctx: context of the expression performing the load
6303 * @reg: the destination register number
6304 * @data: the data to load
6305 * @type: the data type
6306 * @len: the length of the data
6308 * Validate that a data load uses the appropriate data type for
6309 * the destination register and the length is within the bounds.
6310 * A value of NULL for the data means that it is runtime gathered
/*
 * Implementation note: for NFT_REG_VERDICT the data type is compared with
 * NFT_DATA_VERDICT; for NFT_GOTO / NFT_JUMP verdicts the target chain is run
 * through nf_tables_check_loops(), and when ctx->chain->level + 1 exceeds
 * the target chain's level the target's level is raised to that value,
 * with a test against NFT_JUMP_STACK_SIZE beforehand. For the remaining
 * registers three checks are visible: an index below the first general
 * purpose register, a byte range running past the data field of
 * struct nft_regs, and non-NULL data whose type is not NFT_DATA_VALUE.
 *
 * NOTE(review): this function writes to data->verdict.chain->level, so it
 * is not a pure validation. The switch line, the first half of the
 * GOTO/JUMP condition and all return statements are not visible in this
 * excerpt.
 */
6313 int nft_validate_register_store(const struct nft_ctx
*ctx
,
6314 enum nft_registers reg
,
6315 const struct nft_data
*data
,
6316 enum nft_data_types type
, unsigned int len
)
6321 case NFT_REG_VERDICT
:
6322 if (type
!= NFT_DATA_VERDICT
)
6326 (data
->verdict
.code
== NFT_GOTO
||
6327 data
->verdict
.code
== NFT_JUMP
)) {
6328 err
= nf_tables_check_loops(ctx
, data
->verdict
.chain
);
6332 if (ctx
->chain
->level
+ 1 >
6333 data
->verdict
.chain
->level
) {
6334 if (ctx
->chain
->level
+ 1 == NFT_JUMP_STACK_SIZE
)
6336 data
->verdict
.chain
->level
= ctx
->chain
->level
+ 1;
6342 if (reg
< NFT_REG_1
* NFT_REG_SIZE
/ NFT_REG32_SIZE
)
6346 if (reg
* NFT_REG32_SIZE
+ len
>
6347 FIELD_SIZEOF(struct nft_regs
, data
))
6350 if (data
!= NULL
&& type
!= NFT_DATA_VALUE
)
6355 EXPORT_SYMBOL_GPL(nft_validate_register_store
);
/*
 * Netlink attribute policy for nested verdict attributes: the verdict code
 * is a 32-bit value and the chain name is a string of at most
 * NFT_CHAIN_MAXNAMELEN - 1 bytes.
 */
6357 static const struct nla_policy nft_verdict_policy
[NFTA_VERDICT_MAX
+ 1] = {
6358 [NFTA_VERDICT_CODE
] = { .type
= NLA_U32
},
6359 [NFTA_VERDICT_CHAIN
] = { .type
= NLA_STRING
,
6360 .len
= NFT_CHAIN_MAXNAMELEN
- 1 },
/*
 * nft_verdict_init - fill @data and @desc from a nested verdict attribute.
 *
 * Visible flow: @nla is parsed against nft_verdict_policy; the presence of
 * NFTA_VERDICT_CODE is tested and its value is stored in host byte order in
 * data->verdict.code. A switch on the code (with an inner switch on
 * code & NF_VERDICT_MASK) follows. On the chain-carrying path the presence
 * of NFTA_VERDICT_CHAIN is tested, the chain is looked up in ctx->table
 * using the next-generation genmask, a lookup error is returned through
 * PTR_ERR(), the chain is tested with nft_is_base_chain(), and the chain
 * pointer is stored in data->verdict.chain. Finally desc->len is set to
 * sizeof(data->verdict) and desc->type to NFT_DATA_VERDICT.
 *
 * NOTE(review): the case labels, the statements guarded by the visible
 * tests and any reference counting on the chain are not visible in this
 * excerpt.
 */
6363 static int nft_verdict_init(const struct nft_ctx
*ctx
, struct nft_data
*data
,
6364 struct nft_data_desc
*desc
, const struct nlattr
*nla
)
6366 u8 genmask
= nft_genmask_next(ctx
->net
);
6367 struct nlattr
*tb
[NFTA_VERDICT_MAX
+ 1];
6368 struct nft_chain
*chain
;
6371 err
= nla_parse_nested(tb
, NFTA_VERDICT_MAX
, nla
, nft_verdict_policy
,
6376 if (!tb
[NFTA_VERDICT_CODE
])
6378 data
->verdict
.code
= ntohl(nla_get_be32(tb
[NFTA_VERDICT_CODE
]));
6380 switch (data
->verdict
.code
) {
6382 switch (data
->verdict
.code
& NF_VERDICT_MASK
) {
6397 if (!tb
[NFTA_VERDICT_CHAIN
])
6399 chain
= nf_tables_chain_lookup(ctx
->table
,
6400 tb
[NFTA_VERDICT_CHAIN
], genmask
);
6402 return PTR_ERR(chain
);
6403 if (nft_is_base_chain(chain
))
6407 data
->verdict
.chain
= chain
;
6411 desc
->len
= sizeof(data
->verdict
);
6412 desc
->type
= NFT_DATA_VERDICT
;
/*
 * nft_verdict_uninit - drop the chain reference held by a verdict.
 *
 * Switches on data->verdict.code; the visible branch decrements the use
 * counter of the chain the verdict points to.
 *
 * NOTE(review): the case labels selecting that branch are not visible in
 * this excerpt.
 */
6416 static void nft_verdict_uninit(const struct nft_data
*data
)
6418 switch (data
->verdict
.code
) {
6421 data
->verdict
.chain
->use
--;
/*
 * nft_verdict_dump - emit verdict @v as a nested attribute of type @type.
 *
 * Opens a nest, writes the verdict code as a big-endian 32-bit
 * NFTA_VERDICT_CODE attribute, writes an NFTA_VERDICT_CHAIN string on the
 * chain-carrying path, and closes the nest. Every failing put jumps to the
 * nla_put_failure label.
 *
 * NOTE(review): the condition selecting the chain path, the string passed
 * for the chain name and the return values are not visible in this excerpt.
 */
6426 int nft_verdict_dump(struct sk_buff
*skb
, int type
, const struct nft_verdict
*v
)
6428 struct nlattr
*nest
;
6430 nest
= nla_nest_start(skb
, type
);
6432 goto nla_put_failure
;
6434 if (nla_put_be32(skb
, NFTA_VERDICT_CODE
, htonl(v
->code
)))
6435 goto nla_put_failure
;
6440 if (nla_put_string(skb
, NFTA_VERDICT_CHAIN
,
6442 goto nla_put_failure
;
6444 nla_nest_end(skb
, nest
);
/*
 * nft_value_init - copy a raw value attribute into @data.
 *
 * The visible statements copy len bytes of @nla's payload into data->data
 * with nla_memcpy() and set desc->type to NFT_DATA_VALUE.
 *
 * NOTE(review): how len is derived and validated against @size, the
 * remaining desc fields and the return value are not visible in this
 * excerpt.
 */
6451 static int nft_value_init(const struct nft_ctx
*ctx
,
6452 struct nft_data
*data
, unsigned int size
,
6453 struct nft_data_desc
*desc
, const struct nlattr
*nla
)
6463 nla_memcpy(data
->data
, nla
, len
);
6464 desc
->type
= NFT_DATA_VALUE
;
/*
 * nft_value_dump - emit len bytes of data->data as an NFTA_DATA_VALUE
 * attribute; returns whatever nla_put() returns.
 *
 * NOTE(review): the remainder of the parameter list is not visible in this
 * excerpt.
 */
6469 static int nft_value_dump(struct sk_buff
*skb
, const struct nft_data
*data
,
6472 return nla_put(skb
, NFTA_DATA_VALUE
, len
, data
->data
);
/*
 * Netlink attribute policy for data attributes: a value is opaque binary
 * data, a verdict is a nested attribute.
 */
6475 static const struct nla_policy nft_data_policy
[NFTA_DATA_MAX
+ 1] = {
6476 [NFTA_DATA_VALUE
] = { .type
= NLA_BINARY
},
6477 [NFTA_DATA_VERDICT
] = { .type
= NLA_NESTED
},
6481 * nft_data_init - parse nf_tables data netlink attributes
6483 * @ctx: context of the expression using the data
6484 * @data: destination struct nft_data
6485 * @size: maximum data length
6486 * @desc: data description
6487 * @nla: netlink attribute containing data
6489 * Parse the netlink data attributes and initialize a struct nft_data.
6490 * The type and length of data are returned in the data description.
6492 * The caller can indicate that it only wants to accept data of type
6493 * NFT_DATA_VALUE by passing NULL for the ctx argument.
/*
 * Implementation note: @nla is parsed against nft_data_policy. A present
 * NFTA_DATA_VALUE is handled by nft_value_init(); otherwise a present
 * NFTA_DATA_VERDICT is handled by nft_verdict_init(), but only when @ctx is
 * non-NULL. The value attribute is tested first, so it takes precedence
 * when both are supplied.
 *
 * NOTE(review): the error check after parsing and the final return are not
 * visible in this excerpt.
 */
6495 int nft_data_init(const struct nft_ctx
*ctx
,
6496 struct nft_data
*data
, unsigned int size
,
6497 struct nft_data_desc
*desc
, const struct nlattr
*nla
)
6499 struct nlattr
*tb
[NFTA_DATA_MAX
+ 1];
6502 err
= nla_parse_nested(tb
, NFTA_DATA_MAX
, nla
, nft_data_policy
, NULL
);
6506 if (tb
[NFTA_DATA_VALUE
])
6507 return nft_value_init(ctx
, data
, size
, desc
,
6508 tb
[NFTA_DATA_VALUE
]);
6509 if (tb
[NFTA_DATA_VERDICT
] && ctx
!= NULL
)
6510 return nft_verdict_init(ctx
, data
, desc
, tb
[NFTA_DATA_VERDICT
]);
6513 EXPORT_SYMBOL_GPL(nft_data_init
);
6516 * nft_data_release - release a nft_data item
6518 * @data: struct nft_data to release
6519 * @type: type of data
6521 * Release a nft_data item. NFT_DATA_VALUE types can be silently discarded,
6522 * all others need to be released by calling this function.
/*
 * Implementation note: types ordered before NFT_DATA_VERDICT are tested
 * first; NFT_DATA_VERDICT is forwarded to nft_verdict_uninit().
 *
 * NOTE(review): the statement guarded by the first test, the switch line
 * and any default branch are not visible in this excerpt.
 */
6524 void nft_data_release(const struct nft_data
*data
, enum nft_data_types type
)
6526 if (type
< NFT_DATA_VERDICT
)
6529 case NFT_DATA_VERDICT
:
6530 return nft_verdict_uninit(data
);
6535 EXPORT_SYMBOL_GPL(nft_data_release
);
/*
 * nft_data_dump - emit @data as a nested attribute of type @attr.
 *
 * Opens a nest, then dispatches on the data type: NFT_DATA_VALUE goes
 * through nft_value_dump() with @len, NFT_DATA_VERDICT goes through
 * nft_verdict_dump() as NFTA_DATA_VERDICT. The nest is closed afterwards.
 * Exported with EXPORT_SYMBOL_GPL.
 *
 * NOTE(review): the failure check after nla_nest_start(), the switch line,
 * any default branch and the return are not visible in this excerpt.
 */
6537 int nft_data_dump(struct sk_buff
*skb
, int attr
, const struct nft_data
*data
,
6538 enum nft_data_types type
, unsigned int len
)
6540 struct nlattr
*nest
;
6543 nest
= nla_nest_start(skb
, attr
);
6548 case NFT_DATA_VALUE
:
6549 err
= nft_value_dump(skb
, data
, len
);
6551 case NFT_DATA_VERDICT
:
6552 err
= nft_verdict_dump(skb
, NFTA_DATA_VERDICT
, &data
->verdict
);
6559 nla_nest_end(skb
, nest
);
6562 EXPORT_SYMBOL_GPL(nft_data_dump
);
/*
 * nf_tables_init_net - per-netns constructor.
 *
 * Initialises the address family list and the transaction commit list of
 * @net as empty and starts the generation sequence at 1.
 *
 * NOTE(review): the return statement is not visible in this excerpt.
 */
6564 static int __net_init
nf_tables_init_net(struct net
*net
)
6566 INIT_LIST_HEAD(&net
->nft
.af_info
);
6567 INIT_LIST_HEAD(&net
->nft
.commit_list
);
6568 net
->nft
.base_seq
= 1;
6572 static void __net_exit
nf_tables_exit_net(struct net
*net
)
6574 WARN_ON_ONCE(!list_empty(&net
->nft
.af_info
));
6575 WARN_ON_ONCE(!list_empty(&net
->nft
.commit_list
));
/*
 * __nft_release_basechain - tear down the base chain referenced by @ctx.
 *
 * BUG()s if ctx->chain is not a base chain. Otherwise the chain's hook is
 * unregistered, every rule is unlinked from the chain and destroyed, and
 * finally the chain itself is unlinked and destroyed. Exported with
 * EXPORT_SYMBOL_GPL.
 *
 * NOTE(review): use-counter updates and the return value are not visible
 * in this excerpt.
 */
6578 int __nft_release_basechain(struct nft_ctx
*ctx
)
6580 struct nft_rule
*rule
, *nr
;
6582 BUG_ON(!nft_is_base_chain(ctx
->chain
));
6584 nf_tables_unregister_hook(ctx
->net
, ctx
->chain
->table
, ctx
->chain
);
6585 list_for_each_entry_safe(rule
, nr
, &ctx
->chain
->rules
, list
) {
6586 list_del(&rule
->list
);
6588 nf_tables_rule_destroy(ctx
, rule
);
6590 list_del(&ctx
->chain
->list
);
6592 nf_tables_chain_destroy(ctx
->chain
);
6596 EXPORT_SYMBOL_GPL(__nft_release_basechain
);
6598 /* Called by nft_unregister_afinfo() from __net_exit path, nfnl_lock is held. */
/*
 * __nft_release_afinfo - destroy every table that belongs to @afi.
 *
 * For each table on afi->tables, in this order:
 *  1. unregister the hooks of all chains and of all flowtables;
 *  2. unlink and destroy every rule of every chain;
 *  3. unlink and destroy flowtables, then sets, then stateful objects,
 *     then chains;
 *  4. unlink the table and destroy it through the local nft_ctx.
 *
 * Hooks are removed before anything is freed, which is what the inline
 * "No packets are walking on these chains anymore" comment relies on.
 *
 * NOTE(review): the nft_ctx initializer, the per-table/per-chain ctx
 * assignments and the use-counter updates are not visible in this excerpt.
 */
6599 static void __nft_release_afinfo(struct net
*net
, struct nft_af_info
*afi
)
6601 struct nft_flowtable
*flowtable
, *nf
;
6602 struct nft_table
*table
, *nt
;
6603 struct nft_chain
*chain
, *nc
;
6604 struct nft_object
*obj
, *ne
;
6605 struct nft_rule
*rule
, *nr
;
6606 struct nft_set
*set
, *ns
;
6607 struct nft_ctx ctx
= {
6612 list_for_each_entry_safe(table
, nt
, &afi
->tables
, list
) {
6613 list_for_each_entry(chain
, &table
->chains
, list
)
6614 nf_tables_unregister_hook(net
, table
, chain
);
6615 list_for_each_entry(flowtable
, &table
->flowtables
, list
)
6616 nf_unregister_net_hooks(net
, flowtable
->ops
,
6617 flowtable
->ops_len
);
6618 /* No packets are walking on these chains anymore. */
6620 list_for_each_entry(chain
, &table
->chains
, list
) {
6622 list_for_each_entry_safe(rule
, nr
, &chain
->rules
, list
) {
6623 list_del(&rule
->list
);
6625 nf_tables_rule_destroy(&ctx
, rule
);
6628 list_for_each_entry_safe(flowtable
, nf
, &table
->flowtables
, list
) {
6629 list_del(&flowtable
->list
);
6631 nf_tables_flowtable_destroy(flowtable
);
6633 list_for_each_entry_safe(set
, ns
, &table
->sets
, list
) {
6634 list_del(&set
->list
);
6636 nft_set_destroy(set
);
6638 list_for_each_entry_safe(obj
, ne
, &table
->objects
, list
) {
6639 list_del(&obj
->list
);
6641 nft_obj_destroy(obj
);
6643 list_for_each_entry_safe(chain
, nc
, &table
->chains
, list
) {
6644 list_del(&chain
->list
);
6646 nf_tables_chain_destroy(chain
);
6648 list_del(&table
->list
);
6649 nf_tables_table_destroy(&ctx
);
/*
 * Per-network-namespace hooks: nf_tables_init_net() runs when a namespace
 * is set up, nf_tables_exit_net() when it is torn down.
 */
6653 static struct pernet_operations nf_tables_net_ops
= {
6654 .init
= nf_tables_init_net
,
6655 .exit
= nf_tables_exit_net
,
6658 static int __init
nf_tables_module_init(void)
6662 info
= kmalloc(sizeof(struct nft_expr_info
) * NFT_RULE_MAXEXPRS
,
6669 err
= nf_tables_core_module_init();
6673 err
= nfnetlink_subsys_register(&nf_tables_subsys
);
6677 register_netdevice_notifier(&nf_tables_flowtable_notifier
);
6679 pr_info("nf_tables: (c) 2007-2009 Patrick McHardy <kaber@trash.net>\n");
6680 return register_pernet_subsys(&nf_tables_net_ops
);
6682 nf_tables_core_module_exit();
/*
 * nf_tables_module_exit - module teardown.
 *
 * Visible order: unregister the per-netns operations, the nfnetlink
 * subsystem and the flowtable netdevice notifier, then shut down the core
 * module.
 *
 * NOTE(review): some original lines of this function are not visible in
 * this excerpt (for instance anything between the notifier removal and the
 * core module exit, and anything after it).
 */
6689 static void __exit
nf_tables_module_exit(void)
6691 unregister_pernet_subsys(&nf_tables_net_ops
);
6692 nfnetlink_subsys_unregister(&nf_tables_subsys
);
6693 unregister_netdevice_notifier(&nf_tables_flowtable_notifier
);
6695 nf_tables_core_module_exit();
/*
 * Module boilerplate: entry/exit points, licence, author, and the alias
 * that ties this module to the NFNL_SUBSYS_NFTABLES nfnetlink subsystem.
 */
6699 module_init(nf_tables_module_init
);
6700 module_exit(nf_tables_module_exit
);
6702 MODULE_LICENSE("GPL");
6703 MODULE_AUTHOR("Patrick McHardy <kaber@trash.net>");
6704 MODULE_ALIAS_NFNL_SUBSYS(NFNL_SUBSYS_NFTABLES
);