/*
 * Copyright (c) 2007-2009 Patrick McHardy <kaber@trash.net>
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License version 2 as
 * published by the Free Software Foundation.
 *
 * Development of this code funded by Astaro AG (http://www.astaro.com/)
 */
11 #include <linux/module.h>
12 #include <linux/init.h>
13 #include <linux/list.h>
14 #include <linux/skbuff.h>
15 #include <linux/netlink.h>
16 #include <linux/vmalloc.h>
17 #include <linux/netfilter.h>
18 #include <linux/netfilter/nfnetlink.h>
19 #include <linux/netfilter/nf_tables.h>
20 #include <net/netfilter/nf_tables_core.h>
21 #include <net/netfilter/nf_tables.h>
22 #include <net/net_namespace.h>
/* File-local list heads for nf_tables expressions and objects. */
static LIST_HEAD(nf_tables_expressions);
static LIST_HEAD(nf_tables_objects);
29 * nft_register_afinfo - register nf_tables address family info
31 * @afi: address family info to register
33 * Register the address family for use with nf_tables. Returns zero on
34 * success or a negative errno code otherwise.
36 int nft_register_afinfo(struct net
*net
, struct nft_af_info
*afi
)
38 INIT_LIST_HEAD(&afi
->tables
);
39 nfnl_lock(NFNL_SUBSYS_NFTABLES
);
40 list_add_tail_rcu(&afi
->list
, &net
->nft
.af_info
);
41 nfnl_unlock(NFNL_SUBSYS_NFTABLES
);
44 EXPORT_SYMBOL_GPL(nft_register_afinfo
);
46 static void __nft_release_afinfo(struct net
*net
, struct nft_af_info
*afi
);
49 * nft_unregister_afinfo - unregister nf_tables address family info
51 * @afi: address family info to unregister
53 * Unregister the address family for use with nf_tables.
55 void nft_unregister_afinfo(struct net
*net
, struct nft_af_info
*afi
)
57 nfnl_lock(NFNL_SUBSYS_NFTABLES
);
58 __nft_release_afinfo(net
, afi
);
59 list_del_rcu(&afi
->list
);
60 nfnl_unlock(NFNL_SUBSYS_NFTABLES
);
62 EXPORT_SYMBOL_GPL(nft_unregister_afinfo
);
64 static struct nft_af_info
*nft_afinfo_lookup(struct net
*net
, int family
)
66 struct nft_af_info
*afi
;
68 list_for_each_entry(afi
, &net
->nft
.af_info
, list
) {
69 if (afi
->family
== family
)
75 static struct nft_af_info
*
76 nf_tables_afinfo_lookup(struct net
*net
, int family
, bool autoload
)
78 struct nft_af_info
*afi
;
80 afi
= nft_afinfo_lookup(net
, family
);
85 nfnl_unlock(NFNL_SUBSYS_NFTABLES
);
86 request_module("nft-afinfo-%u", family
);
87 nfnl_lock(NFNL_SUBSYS_NFTABLES
);
88 afi
= nft_afinfo_lookup(net
, family
);
90 return ERR_PTR(-EAGAIN
);
93 return ERR_PTR(-EAFNOSUPPORT
);
96 static void nft_ctx_init(struct nft_ctx
*ctx
,
98 const struct sk_buff
*skb
,
99 const struct nlmsghdr
*nlh
,
100 struct nft_af_info
*afi
,
101 struct nft_table
*table
,
102 struct nft_chain
*chain
,
103 const struct nlattr
* const *nla
)
110 ctx
->portid
= NETLINK_CB(skb
).portid
;
111 ctx
->report
= nlmsg_report(nlh
);
112 ctx
->seq
= nlh
->nlmsg_seq
;
115 static struct nft_trans
*nft_trans_alloc_gfp(const struct nft_ctx
*ctx
,
116 int msg_type
, u32 size
, gfp_t gfp
)
118 struct nft_trans
*trans
;
120 trans
= kzalloc(sizeof(struct nft_trans
) + size
, gfp
);
124 trans
->msg_type
= msg_type
;
130 static struct nft_trans
*nft_trans_alloc(const struct nft_ctx
*ctx
,
131 int msg_type
, u32 size
)
133 return nft_trans_alloc_gfp(ctx
, msg_type
, size
, GFP_KERNEL
);
136 static void nft_trans_destroy(struct nft_trans
*trans
)
138 list_del(&trans
->list
);
142 static int nf_tables_register_hooks(struct net
*net
,
143 const struct nft_table
*table
,
144 struct nft_chain
*chain
,
145 unsigned int hook_nops
)
147 if (table
->flags
& NFT_TABLE_F_DORMANT
||
148 !nft_is_base_chain(chain
))
151 return nf_register_net_hooks(net
, nft_base_chain(chain
)->ops
,
155 static void nf_tables_unregister_hooks(struct net
*net
,
156 const struct nft_table
*table
,
157 struct nft_chain
*chain
,
158 unsigned int hook_nops
)
160 if (table
->flags
& NFT_TABLE_F_DORMANT
||
161 !nft_is_base_chain(chain
))
164 nf_unregister_net_hooks(net
, nft_base_chain(chain
)->ops
, hook_nops
);
167 static int nft_trans_table_add(struct nft_ctx
*ctx
, int msg_type
)
169 struct nft_trans
*trans
;
171 trans
= nft_trans_alloc(ctx
, msg_type
, sizeof(struct nft_trans_table
));
175 if (msg_type
== NFT_MSG_NEWTABLE
)
176 nft_activate_next(ctx
->net
, ctx
->table
);
178 list_add_tail(&trans
->list
, &ctx
->net
->nft
.commit_list
);
182 static int nft_deltable(struct nft_ctx
*ctx
)
186 err
= nft_trans_table_add(ctx
, NFT_MSG_DELTABLE
);
190 nft_deactivate_next(ctx
->net
, ctx
->table
);
194 static int nft_trans_chain_add(struct nft_ctx
*ctx
, int msg_type
)
196 struct nft_trans
*trans
;
198 trans
= nft_trans_alloc(ctx
, msg_type
, sizeof(struct nft_trans_chain
));
202 if (msg_type
== NFT_MSG_NEWCHAIN
)
203 nft_activate_next(ctx
->net
, ctx
->chain
);
205 list_add_tail(&trans
->list
, &ctx
->net
->nft
.commit_list
);
209 static int nft_delchain(struct nft_ctx
*ctx
)
213 err
= nft_trans_chain_add(ctx
, NFT_MSG_DELCHAIN
);
218 nft_deactivate_next(ctx
->net
, ctx
->chain
);
224 nf_tables_delrule_deactivate(struct nft_ctx
*ctx
, struct nft_rule
*rule
)
226 /* You cannot delete the same rule twice */
227 if (nft_is_active_next(ctx
->net
, rule
)) {
228 nft_deactivate_next(ctx
->net
, rule
);
235 static struct nft_trans
*nft_trans_rule_add(struct nft_ctx
*ctx
, int msg_type
,
236 struct nft_rule
*rule
)
238 struct nft_trans
*trans
;
240 trans
= nft_trans_alloc(ctx
, msg_type
, sizeof(struct nft_trans_rule
));
244 if (msg_type
== NFT_MSG_NEWRULE
&& ctx
->nla
[NFTA_RULE_ID
] != NULL
) {
245 nft_trans_rule_id(trans
) =
246 ntohl(nla_get_be32(ctx
->nla
[NFTA_RULE_ID
]));
248 nft_trans_rule(trans
) = rule
;
249 list_add_tail(&trans
->list
, &ctx
->net
->nft
.commit_list
);
254 static int nft_delrule(struct nft_ctx
*ctx
, struct nft_rule
*rule
)
256 struct nft_trans
*trans
;
259 trans
= nft_trans_rule_add(ctx
, NFT_MSG_DELRULE
, rule
);
263 err
= nf_tables_delrule_deactivate(ctx
, rule
);
265 nft_trans_destroy(trans
);
272 static int nft_delrule_by_chain(struct nft_ctx
*ctx
)
274 struct nft_rule
*rule
;
277 list_for_each_entry(rule
, &ctx
->chain
->rules
, list
) {
278 err
= nft_delrule(ctx
, rule
);
285 static int nft_trans_set_add(struct nft_ctx
*ctx
, int msg_type
,
288 struct nft_trans
*trans
;
290 trans
= nft_trans_alloc(ctx
, msg_type
, sizeof(struct nft_trans_set
));
294 if (msg_type
== NFT_MSG_NEWSET
&& ctx
->nla
[NFTA_SET_ID
] != NULL
) {
295 nft_trans_set_id(trans
) =
296 ntohl(nla_get_be32(ctx
->nla
[NFTA_SET_ID
]));
297 nft_activate_next(ctx
->net
, set
);
299 nft_trans_set(trans
) = set
;
300 list_add_tail(&trans
->list
, &ctx
->net
->nft
.commit_list
);
305 static int nft_delset(struct nft_ctx
*ctx
, struct nft_set
*set
)
309 err
= nft_trans_set_add(ctx
, NFT_MSG_DELSET
, set
);
313 nft_deactivate_next(ctx
->net
, set
);
319 static int nft_trans_obj_add(struct nft_ctx
*ctx
, int msg_type
,
320 struct nft_object
*obj
)
322 struct nft_trans
*trans
;
324 trans
= nft_trans_alloc(ctx
, msg_type
, sizeof(struct nft_trans_obj
));
328 if (msg_type
== NFT_MSG_NEWOBJ
)
329 nft_activate_next(ctx
->net
, obj
);
331 nft_trans_obj(trans
) = obj
;
332 list_add_tail(&trans
->list
, &ctx
->net
->nft
.commit_list
);
337 static int nft_delobj(struct nft_ctx
*ctx
, struct nft_object
*obj
)
341 err
= nft_trans_obj_add(ctx
, NFT_MSG_DELOBJ
, obj
);
345 nft_deactivate_next(ctx
->net
, obj
);
355 static struct nft_table
*nft_table_lookup(const struct nft_af_info
*afi
,
356 const struct nlattr
*nla
,
359 struct nft_table
*table
;
361 list_for_each_entry(table
, &afi
->tables
, list
) {
362 if (!nla_strcmp(nla
, table
->name
) &&
363 nft_active_genmask(table
, genmask
))
369 static struct nft_table
*nf_tables_table_lookup(const struct nft_af_info
*afi
,
370 const struct nlattr
*nla
,
373 struct nft_table
*table
;
376 return ERR_PTR(-EINVAL
);
378 table
= nft_table_lookup(afi
, nla
, genmask
);
382 return ERR_PTR(-ENOENT
);
385 static inline u64
nf_tables_alloc_handle(struct nft_table
*table
)
387 return ++table
->hgenerator
;
390 static const struct nf_chain_type
*chain_type
[NFPROTO_NUMPROTO
][NFT_CHAIN_T_MAX
];
392 static const struct nf_chain_type
*
393 __nf_tables_chain_type_lookup(int family
, const struct nlattr
*nla
)
397 for (i
= 0; i
< NFT_CHAIN_T_MAX
; i
++) {
398 if (chain_type
[family
][i
] != NULL
&&
399 !nla_strcmp(nla
, chain_type
[family
][i
]->name
))
400 return chain_type
[family
][i
];
405 static const struct nf_chain_type
*
406 nf_tables_chain_type_lookup(const struct nft_af_info
*afi
,
407 const struct nlattr
*nla
,
410 const struct nf_chain_type
*type
;
412 type
= __nf_tables_chain_type_lookup(afi
->family
, nla
);
415 #ifdef CONFIG_MODULES
417 nfnl_unlock(NFNL_SUBSYS_NFTABLES
);
418 request_module("nft-chain-%u-%.*s", afi
->family
,
419 nla_len(nla
), (const char *)nla_data(nla
));
420 nfnl_lock(NFNL_SUBSYS_NFTABLES
);
421 type
= __nf_tables_chain_type_lookup(afi
->family
, nla
);
423 return ERR_PTR(-EAGAIN
);
426 return ERR_PTR(-ENOENT
);
429 static const struct nla_policy nft_table_policy
[NFTA_TABLE_MAX
+ 1] = {
430 [NFTA_TABLE_NAME
] = { .type
= NLA_STRING
,
431 .len
= NFT_TABLE_MAXNAMELEN
- 1 },
432 [NFTA_TABLE_FLAGS
] = { .type
= NLA_U32
},
435 static int nf_tables_fill_table_info(struct sk_buff
*skb
, struct net
*net
,
436 u32 portid
, u32 seq
, int event
, u32 flags
,
437 int family
, const struct nft_table
*table
)
439 struct nlmsghdr
*nlh
;
440 struct nfgenmsg
*nfmsg
;
442 event
= nfnl_msg_type(NFNL_SUBSYS_NFTABLES
, event
);
443 nlh
= nlmsg_put(skb
, portid
, seq
, event
, sizeof(struct nfgenmsg
), flags
);
445 goto nla_put_failure
;
447 nfmsg
= nlmsg_data(nlh
);
448 nfmsg
->nfgen_family
= family
;
449 nfmsg
->version
= NFNETLINK_V0
;
450 nfmsg
->res_id
= htons(net
->nft
.base_seq
& 0xffff);
452 if (nla_put_string(skb
, NFTA_TABLE_NAME
, table
->name
) ||
453 nla_put_be32(skb
, NFTA_TABLE_FLAGS
, htonl(table
->flags
)) ||
454 nla_put_be32(skb
, NFTA_TABLE_USE
, htonl(table
->use
)))
455 goto nla_put_failure
;
461 nlmsg_trim(skb
, nlh
);
465 static void nf_tables_table_notify(const struct nft_ctx
*ctx
, int event
)
471 !nfnetlink_has_listeners(ctx
->net
, NFNLGRP_NFTABLES
))
474 skb
= nlmsg_new(NLMSG_GOODSIZE
, GFP_KERNEL
);
478 err
= nf_tables_fill_table_info(skb
, ctx
->net
, ctx
->portid
, ctx
->seq
,
479 event
, 0, ctx
->afi
->family
, ctx
->table
);
485 nfnetlink_send(skb
, ctx
->net
, ctx
->portid
, NFNLGRP_NFTABLES
,
486 ctx
->report
, GFP_KERNEL
);
489 nfnetlink_set_err(ctx
->net
, ctx
->portid
, NFNLGRP_NFTABLES
, -ENOBUFS
);
492 static int nf_tables_dump_tables(struct sk_buff
*skb
,
493 struct netlink_callback
*cb
)
495 const struct nfgenmsg
*nfmsg
= nlmsg_data(cb
->nlh
);
496 const struct nft_af_info
*afi
;
497 const struct nft_table
*table
;
498 unsigned int idx
= 0, s_idx
= cb
->args
[0];
499 struct net
*net
= sock_net(skb
->sk
);
500 int family
= nfmsg
->nfgen_family
;
503 cb
->seq
= net
->nft
.base_seq
;
505 list_for_each_entry_rcu(afi
, &net
->nft
.af_info
, list
) {
506 if (family
!= NFPROTO_UNSPEC
&& family
!= afi
->family
)
509 list_for_each_entry_rcu(table
, &afi
->tables
, list
) {
513 memset(&cb
->args
[1], 0,
514 sizeof(cb
->args
) - sizeof(cb
->args
[0]));
515 if (!nft_is_active(net
, table
))
517 if (nf_tables_fill_table_info(skb
, net
,
518 NETLINK_CB(cb
->skb
).portid
,
522 afi
->family
, table
) < 0)
525 nl_dump_check_consistent(cb
, nlmsg_hdr(skb
));
536 static int nf_tables_gettable(struct net
*net
, struct sock
*nlsk
,
537 struct sk_buff
*skb
, const struct nlmsghdr
*nlh
,
538 const struct nlattr
* const nla
[],
539 struct netlink_ext_ack
*extack
)
541 const struct nfgenmsg
*nfmsg
= nlmsg_data(nlh
);
542 u8 genmask
= nft_genmask_cur(net
);
543 const struct nft_af_info
*afi
;
544 const struct nft_table
*table
;
545 struct sk_buff
*skb2
;
546 int family
= nfmsg
->nfgen_family
;
549 if (nlh
->nlmsg_flags
& NLM_F_DUMP
) {
550 struct netlink_dump_control c
= {
551 .dump
= nf_tables_dump_tables
,
553 return netlink_dump_start(nlsk
, skb
, nlh
, &c
);
556 afi
= nf_tables_afinfo_lookup(net
, family
, false);
560 table
= nf_tables_table_lookup(afi
, nla
[NFTA_TABLE_NAME
], genmask
);
562 return PTR_ERR(table
);
564 skb2
= alloc_skb(NLMSG_GOODSIZE
, GFP_KERNEL
);
568 err
= nf_tables_fill_table_info(skb2
, net
, NETLINK_CB(skb
).portid
,
569 nlh
->nlmsg_seq
, NFT_MSG_NEWTABLE
, 0,
574 return nlmsg_unicast(nlsk
, skb2
, NETLINK_CB(skb
).portid
);
581 static void _nf_tables_table_disable(struct net
*net
,
582 const struct nft_af_info
*afi
,
583 struct nft_table
*table
,
586 struct nft_chain
*chain
;
589 list_for_each_entry(chain
, &table
->chains
, list
) {
590 if (!nft_is_active_next(net
, chain
))
592 if (!nft_is_base_chain(chain
))
595 if (cnt
&& i
++ == cnt
)
598 nf_unregister_net_hooks(net
, nft_base_chain(chain
)->ops
,
603 static int nf_tables_table_enable(struct net
*net
,
604 const struct nft_af_info
*afi
,
605 struct nft_table
*table
)
607 struct nft_chain
*chain
;
610 list_for_each_entry(chain
, &table
->chains
, list
) {
611 if (!nft_is_active_next(net
, chain
))
613 if (!nft_is_base_chain(chain
))
616 err
= nf_register_net_hooks(net
, nft_base_chain(chain
)->ops
,
626 _nf_tables_table_disable(net
, afi
, table
, i
);
/*
 * Disable @table by delegating to _nf_tables_table_disable() with a
 * count of 0, which makes that helper's "cnt && i++ == cnt" cutoff test
 * always false.
 */
static void nf_tables_table_disable(struct net *net,
				    const struct nft_af_info *afi,
				    struct nft_table *table)
{
	_nf_tables_table_disable(net, afi, table, 0);
}
637 static int nf_tables_updtable(struct nft_ctx
*ctx
)
639 struct nft_trans
*trans
;
643 if (!ctx
->nla
[NFTA_TABLE_FLAGS
])
646 flags
= ntohl(nla_get_be32(ctx
->nla
[NFTA_TABLE_FLAGS
]));
647 if (flags
& ~NFT_TABLE_F_DORMANT
)
650 if (flags
== ctx
->table
->flags
)
653 trans
= nft_trans_alloc(ctx
, NFT_MSG_NEWTABLE
,
654 sizeof(struct nft_trans_table
));
658 if ((flags
& NFT_TABLE_F_DORMANT
) &&
659 !(ctx
->table
->flags
& NFT_TABLE_F_DORMANT
)) {
660 nft_trans_table_enable(trans
) = false;
661 } else if (!(flags
& NFT_TABLE_F_DORMANT
) &&
662 ctx
->table
->flags
& NFT_TABLE_F_DORMANT
) {
663 ret
= nf_tables_table_enable(ctx
->net
, ctx
->afi
, ctx
->table
);
665 ctx
->table
->flags
&= ~NFT_TABLE_F_DORMANT
;
666 nft_trans_table_enable(trans
) = true;
672 nft_trans_table_update(trans
) = true;
673 list_add_tail(&trans
->list
, &ctx
->net
->nft
.commit_list
);
676 nft_trans_destroy(trans
);
680 static int nf_tables_newtable(struct net
*net
, struct sock
*nlsk
,
681 struct sk_buff
*skb
, const struct nlmsghdr
*nlh
,
682 const struct nlattr
* const nla
[],
683 struct netlink_ext_ack
*extack
)
685 const struct nfgenmsg
*nfmsg
= nlmsg_data(nlh
);
686 u8 genmask
= nft_genmask_next(net
);
687 const struct nlattr
*name
;
688 struct nft_af_info
*afi
;
689 struct nft_table
*table
;
690 int family
= nfmsg
->nfgen_family
;
695 afi
= nf_tables_afinfo_lookup(net
, family
, true);
699 name
= nla
[NFTA_TABLE_NAME
];
700 table
= nf_tables_table_lookup(afi
, name
, genmask
);
702 if (PTR_ERR(table
) != -ENOENT
)
703 return PTR_ERR(table
);
705 if (nlh
->nlmsg_flags
& NLM_F_EXCL
)
707 if (nlh
->nlmsg_flags
& NLM_F_REPLACE
)
710 nft_ctx_init(&ctx
, net
, skb
, nlh
, afi
, table
, NULL
, nla
);
711 return nf_tables_updtable(&ctx
);
714 if (nla
[NFTA_TABLE_FLAGS
]) {
715 flags
= ntohl(nla_get_be32(nla
[NFTA_TABLE_FLAGS
]));
716 if (flags
& ~NFT_TABLE_F_DORMANT
)
721 if (!try_module_get(afi
->owner
))
725 table
= kzalloc(sizeof(*table
), GFP_KERNEL
);
729 table
->name
= nla_strdup(name
, GFP_KERNEL
);
730 if (table
->name
== NULL
)
733 INIT_LIST_HEAD(&table
->chains
);
734 INIT_LIST_HEAD(&table
->sets
);
735 INIT_LIST_HEAD(&table
->objects
);
736 table
->flags
= flags
;
738 nft_ctx_init(&ctx
, net
, skb
, nlh
, afi
, table
, NULL
, nla
);
739 err
= nft_trans_table_add(&ctx
, NFT_MSG_NEWTABLE
);
743 list_add_tail_rcu(&table
->list
, &afi
->tables
);
750 module_put(afi
->owner
);
755 static int nft_flush_table(struct nft_ctx
*ctx
)
758 struct nft_chain
*chain
, *nc
;
759 struct nft_object
*obj
, *ne
;
760 struct nft_set
*set
, *ns
;
762 list_for_each_entry(chain
, &ctx
->table
->chains
, list
) {
763 if (!nft_is_active_next(ctx
->net
, chain
))
768 err
= nft_delrule_by_chain(ctx
);
773 list_for_each_entry_safe(set
, ns
, &ctx
->table
->sets
, list
) {
774 if (!nft_is_active_next(ctx
->net
, set
))
777 if (set
->flags
& NFT_SET_ANONYMOUS
&&
778 !list_empty(&set
->bindings
))
781 err
= nft_delset(ctx
, set
);
786 list_for_each_entry_safe(obj
, ne
, &ctx
->table
->objects
, list
) {
787 err
= nft_delobj(ctx
, obj
);
792 list_for_each_entry_safe(chain
, nc
, &ctx
->table
->chains
, list
) {
793 if (!nft_is_active_next(ctx
->net
, chain
))
798 err
= nft_delchain(ctx
);
803 err
= nft_deltable(ctx
);
808 static int nft_flush(struct nft_ctx
*ctx
, int family
)
810 struct nft_af_info
*afi
;
811 struct nft_table
*table
, *nt
;
812 const struct nlattr
* const *nla
= ctx
->nla
;
815 list_for_each_entry(afi
, &ctx
->net
->nft
.af_info
, list
) {
816 if (family
!= AF_UNSPEC
&& afi
->family
!= family
)
820 list_for_each_entry_safe(table
, nt
, &afi
->tables
, list
) {
821 if (!nft_is_active_next(ctx
->net
, table
))
824 if (nla
[NFTA_TABLE_NAME
] &&
825 nla_strcmp(nla
[NFTA_TABLE_NAME
], table
->name
) != 0)
830 err
= nft_flush_table(ctx
);
839 static int nf_tables_deltable(struct net
*net
, struct sock
*nlsk
,
840 struct sk_buff
*skb
, const struct nlmsghdr
*nlh
,
841 const struct nlattr
* const nla
[],
842 struct netlink_ext_ack
*extack
)
844 const struct nfgenmsg
*nfmsg
= nlmsg_data(nlh
);
845 u8 genmask
= nft_genmask_next(net
);
846 struct nft_af_info
*afi
;
847 struct nft_table
*table
;
848 int family
= nfmsg
->nfgen_family
;
851 nft_ctx_init(&ctx
, net
, skb
, nlh
, NULL
, NULL
, NULL
, nla
);
852 if (family
== AF_UNSPEC
|| nla
[NFTA_TABLE_NAME
] == NULL
)
853 return nft_flush(&ctx
, family
);
855 afi
= nf_tables_afinfo_lookup(net
, family
, false);
859 table
= nf_tables_table_lookup(afi
, nla
[NFTA_TABLE_NAME
], genmask
);
861 return PTR_ERR(table
);
863 if (nlh
->nlmsg_flags
& NLM_F_NONREC
&&
870 return nft_flush_table(&ctx
);
873 static void nf_tables_table_destroy(struct nft_ctx
*ctx
)
875 BUG_ON(ctx
->table
->use
> 0);
877 kfree(ctx
->table
->name
);
879 module_put(ctx
->afi
->owner
);
882 int nft_register_chain_type(const struct nf_chain_type
*ctype
)
886 if (WARN_ON(ctype
->family
>= NFPROTO_NUMPROTO
))
889 nfnl_lock(NFNL_SUBSYS_NFTABLES
);
890 if (chain_type
[ctype
->family
][ctype
->type
] != NULL
) {
894 chain_type
[ctype
->family
][ctype
->type
] = ctype
;
896 nfnl_unlock(NFNL_SUBSYS_NFTABLES
);
899 EXPORT_SYMBOL_GPL(nft_register_chain_type
);
901 void nft_unregister_chain_type(const struct nf_chain_type
*ctype
)
903 nfnl_lock(NFNL_SUBSYS_NFTABLES
);
904 chain_type
[ctype
->family
][ctype
->type
] = NULL
;
905 nfnl_unlock(NFNL_SUBSYS_NFTABLES
);
907 EXPORT_SYMBOL_GPL(nft_unregister_chain_type
);
913 static struct nft_chain
*
914 nf_tables_chain_lookup_byhandle(const struct nft_table
*table
, u64 handle
,
917 struct nft_chain
*chain
;
919 list_for_each_entry(chain
, &table
->chains
, list
) {
920 if (chain
->handle
== handle
&&
921 nft_active_genmask(chain
, genmask
))
925 return ERR_PTR(-ENOENT
);
928 static struct nft_chain
*nf_tables_chain_lookup(const struct nft_table
*table
,
929 const struct nlattr
*nla
,
932 struct nft_chain
*chain
;
935 return ERR_PTR(-EINVAL
);
937 list_for_each_entry(chain
, &table
->chains
, list
) {
938 if (!nla_strcmp(nla
, chain
->name
) &&
939 nft_active_genmask(chain
, genmask
))
943 return ERR_PTR(-ENOENT
);
946 static const struct nla_policy nft_chain_policy
[NFTA_CHAIN_MAX
+ 1] = {
947 [NFTA_CHAIN_TABLE
] = { .type
= NLA_STRING
,
948 .len
= NFT_TABLE_MAXNAMELEN
- 1 },
949 [NFTA_CHAIN_HANDLE
] = { .type
= NLA_U64
},
950 [NFTA_CHAIN_NAME
] = { .type
= NLA_STRING
,
951 .len
= NFT_CHAIN_MAXNAMELEN
- 1 },
952 [NFTA_CHAIN_HOOK
] = { .type
= NLA_NESTED
},
953 [NFTA_CHAIN_POLICY
] = { .type
= NLA_U32
},
954 [NFTA_CHAIN_TYPE
] = { .type
= NLA_STRING
},
955 [NFTA_CHAIN_COUNTERS
] = { .type
= NLA_NESTED
},
958 static const struct nla_policy nft_hook_policy
[NFTA_HOOK_MAX
+ 1] = {
959 [NFTA_HOOK_HOOKNUM
] = { .type
= NLA_U32
},
960 [NFTA_HOOK_PRIORITY
] = { .type
= NLA_U32
},
961 [NFTA_HOOK_DEV
] = { .type
= NLA_STRING
,
962 .len
= IFNAMSIZ
- 1 },
965 static int nft_dump_stats(struct sk_buff
*skb
, struct nft_stats __percpu
*stats
)
967 struct nft_stats
*cpu_stats
, total
;
973 memset(&total
, 0, sizeof(total
));
974 for_each_possible_cpu(cpu
) {
975 cpu_stats
= per_cpu_ptr(stats
, cpu
);
977 seq
= u64_stats_fetch_begin_irq(&cpu_stats
->syncp
);
978 pkts
= cpu_stats
->pkts
;
979 bytes
= cpu_stats
->bytes
;
980 } while (u64_stats_fetch_retry_irq(&cpu_stats
->syncp
, seq
));
982 total
.bytes
+= bytes
;
984 nest
= nla_nest_start(skb
, NFTA_CHAIN_COUNTERS
);
986 goto nla_put_failure
;
988 if (nla_put_be64(skb
, NFTA_COUNTER_PACKETS
, cpu_to_be64(total
.pkts
),
990 nla_put_be64(skb
, NFTA_COUNTER_BYTES
, cpu_to_be64(total
.bytes
),
992 goto nla_put_failure
;
994 nla_nest_end(skb
, nest
);
1001 static int nf_tables_fill_chain_info(struct sk_buff
*skb
, struct net
*net
,
1002 u32 portid
, u32 seq
, int event
, u32 flags
,
1003 int family
, const struct nft_table
*table
,
1004 const struct nft_chain
*chain
)
1006 struct nlmsghdr
*nlh
;
1007 struct nfgenmsg
*nfmsg
;
1009 event
= nfnl_msg_type(NFNL_SUBSYS_NFTABLES
, event
);
1010 nlh
= nlmsg_put(skb
, portid
, seq
, event
, sizeof(struct nfgenmsg
), flags
);
1012 goto nla_put_failure
;
1014 nfmsg
= nlmsg_data(nlh
);
1015 nfmsg
->nfgen_family
= family
;
1016 nfmsg
->version
= NFNETLINK_V0
;
1017 nfmsg
->res_id
= htons(net
->nft
.base_seq
& 0xffff);
1019 if (nla_put_string(skb
, NFTA_CHAIN_TABLE
, table
->name
))
1020 goto nla_put_failure
;
1021 if (nla_put_be64(skb
, NFTA_CHAIN_HANDLE
, cpu_to_be64(chain
->handle
),
1023 goto nla_put_failure
;
1024 if (nla_put_string(skb
, NFTA_CHAIN_NAME
, chain
->name
))
1025 goto nla_put_failure
;
1027 if (nft_is_base_chain(chain
)) {
1028 const struct nft_base_chain
*basechain
= nft_base_chain(chain
);
1029 const struct nf_hook_ops
*ops
= &basechain
->ops
[0];
1030 struct nlattr
*nest
;
1032 nest
= nla_nest_start(skb
, NFTA_CHAIN_HOOK
);
1034 goto nla_put_failure
;
1035 if (nla_put_be32(skb
, NFTA_HOOK_HOOKNUM
, htonl(ops
->hooknum
)))
1036 goto nla_put_failure
;
1037 if (nla_put_be32(skb
, NFTA_HOOK_PRIORITY
, htonl(ops
->priority
)))
1038 goto nla_put_failure
;
1039 if (basechain
->dev_name
[0] &&
1040 nla_put_string(skb
, NFTA_HOOK_DEV
, basechain
->dev_name
))
1041 goto nla_put_failure
;
1042 nla_nest_end(skb
, nest
);
1044 if (nla_put_be32(skb
, NFTA_CHAIN_POLICY
,
1045 htonl(basechain
->policy
)))
1046 goto nla_put_failure
;
1048 if (nla_put_string(skb
, NFTA_CHAIN_TYPE
, basechain
->type
->name
))
1049 goto nla_put_failure
;
1051 if (basechain
->stats
&& nft_dump_stats(skb
, basechain
->stats
))
1052 goto nla_put_failure
;
1055 if (nla_put_be32(skb
, NFTA_CHAIN_USE
, htonl(chain
->use
)))
1056 goto nla_put_failure
;
1058 nlmsg_end(skb
, nlh
);
1062 nlmsg_trim(skb
, nlh
);
1066 static void nf_tables_chain_notify(const struct nft_ctx
*ctx
, int event
)
1068 struct sk_buff
*skb
;
1072 !nfnetlink_has_listeners(ctx
->net
, NFNLGRP_NFTABLES
))
1075 skb
= nlmsg_new(NLMSG_GOODSIZE
, GFP_KERNEL
);
1079 err
= nf_tables_fill_chain_info(skb
, ctx
->net
, ctx
->portid
, ctx
->seq
,
1080 event
, 0, ctx
->afi
->family
, ctx
->table
,
1087 nfnetlink_send(skb
, ctx
->net
, ctx
->portid
, NFNLGRP_NFTABLES
,
1088 ctx
->report
, GFP_KERNEL
);
1091 nfnetlink_set_err(ctx
->net
, ctx
->portid
, NFNLGRP_NFTABLES
, -ENOBUFS
);
1094 static int nf_tables_dump_chains(struct sk_buff
*skb
,
1095 struct netlink_callback
*cb
)
1097 const struct nfgenmsg
*nfmsg
= nlmsg_data(cb
->nlh
);
1098 const struct nft_af_info
*afi
;
1099 const struct nft_table
*table
;
1100 const struct nft_chain
*chain
;
1101 unsigned int idx
= 0, s_idx
= cb
->args
[0];
1102 struct net
*net
= sock_net(skb
->sk
);
1103 int family
= nfmsg
->nfgen_family
;
1106 cb
->seq
= net
->nft
.base_seq
;
1108 list_for_each_entry_rcu(afi
, &net
->nft
.af_info
, list
) {
1109 if (family
!= NFPROTO_UNSPEC
&& family
!= afi
->family
)
1112 list_for_each_entry_rcu(table
, &afi
->tables
, list
) {
1113 list_for_each_entry_rcu(chain
, &table
->chains
, list
) {
1117 memset(&cb
->args
[1], 0,
1118 sizeof(cb
->args
) - sizeof(cb
->args
[0]));
1119 if (!nft_is_active(net
, chain
))
1121 if (nf_tables_fill_chain_info(skb
, net
,
1122 NETLINK_CB(cb
->skb
).portid
,
1126 afi
->family
, table
, chain
) < 0)
1129 nl_dump_check_consistent(cb
, nlmsg_hdr(skb
));
1141 static int nf_tables_getchain(struct net
*net
, struct sock
*nlsk
,
1142 struct sk_buff
*skb
, const struct nlmsghdr
*nlh
,
1143 const struct nlattr
* const nla
[],
1144 struct netlink_ext_ack
*extack
)
1146 const struct nfgenmsg
*nfmsg
= nlmsg_data(nlh
);
1147 u8 genmask
= nft_genmask_cur(net
);
1148 const struct nft_af_info
*afi
;
1149 const struct nft_table
*table
;
1150 const struct nft_chain
*chain
;
1151 struct sk_buff
*skb2
;
1152 int family
= nfmsg
->nfgen_family
;
1155 if (nlh
->nlmsg_flags
& NLM_F_DUMP
) {
1156 struct netlink_dump_control c
= {
1157 .dump
= nf_tables_dump_chains
,
1159 return netlink_dump_start(nlsk
, skb
, nlh
, &c
);
1162 afi
= nf_tables_afinfo_lookup(net
, family
, false);
1164 return PTR_ERR(afi
);
1166 table
= nf_tables_table_lookup(afi
, nla
[NFTA_CHAIN_TABLE
], genmask
);
1168 return PTR_ERR(table
);
1170 chain
= nf_tables_chain_lookup(table
, nla
[NFTA_CHAIN_NAME
], genmask
);
1172 return PTR_ERR(chain
);
1174 skb2
= alloc_skb(NLMSG_GOODSIZE
, GFP_KERNEL
);
1178 err
= nf_tables_fill_chain_info(skb2
, net
, NETLINK_CB(skb
).portid
,
1179 nlh
->nlmsg_seq
, NFT_MSG_NEWCHAIN
, 0,
1180 family
, table
, chain
);
1184 return nlmsg_unicast(nlsk
, skb2
, NETLINK_CB(skb
).portid
);
1191 static const struct nla_policy nft_counter_policy
[NFTA_COUNTER_MAX
+ 1] = {
1192 [NFTA_COUNTER_PACKETS
] = { .type
= NLA_U64
},
1193 [NFTA_COUNTER_BYTES
] = { .type
= NLA_U64
},
1196 static struct nft_stats __percpu
*nft_stats_alloc(const struct nlattr
*attr
)
1198 struct nlattr
*tb
[NFTA_COUNTER_MAX
+1];
1199 struct nft_stats __percpu
*newstats
;
1200 struct nft_stats
*stats
;
1203 err
= nla_parse_nested(tb
, NFTA_COUNTER_MAX
, attr
, nft_counter_policy
,
1206 return ERR_PTR(err
);
1208 if (!tb
[NFTA_COUNTER_BYTES
] || !tb
[NFTA_COUNTER_PACKETS
])
1209 return ERR_PTR(-EINVAL
);
1211 newstats
= netdev_alloc_pcpu_stats(struct nft_stats
);
1212 if (newstats
== NULL
)
1213 return ERR_PTR(-ENOMEM
);
1215 /* Restore old counters on this cpu, no problem. Per-cpu statistics
1216 * are not exposed to userspace.
1219 stats
= this_cpu_ptr(newstats
);
1220 stats
->bytes
= be64_to_cpu(nla_get_be64(tb
[NFTA_COUNTER_BYTES
]));
1221 stats
->pkts
= be64_to_cpu(nla_get_be64(tb
[NFTA_COUNTER_PACKETS
]));
1227 static void nft_chain_stats_replace(struct nft_base_chain
*chain
,
1228 struct nft_stats __percpu
*newstats
)
1230 if (newstats
== NULL
)
1234 struct nft_stats __percpu
*oldstats
=
1235 nft_dereference(chain
->stats
);
1237 rcu_assign_pointer(chain
->stats
, newstats
);
1239 free_percpu(oldstats
);
1241 rcu_assign_pointer(chain
->stats
, newstats
);
1244 static void nf_tables_chain_destroy(struct nft_chain
*chain
)
1246 BUG_ON(chain
->use
> 0);
1248 if (nft_is_base_chain(chain
)) {
1249 struct nft_base_chain
*basechain
= nft_base_chain(chain
);
1251 module_put(basechain
->type
->owner
);
1252 free_percpu(basechain
->stats
);
1253 if (basechain
->stats
)
1254 static_branch_dec(&nft_counters_enabled
);
1255 if (basechain
->ops
[0].dev
!= NULL
)
1256 dev_put(basechain
->ops
[0].dev
);
1265 struct nft_chain_hook
{
1268 const struct nf_chain_type
*type
;
1269 struct net_device
*dev
;
1272 static int nft_chain_parse_hook(struct net
*net
,
1273 const struct nlattr
* const nla
[],
1274 struct nft_af_info
*afi
,
1275 struct nft_chain_hook
*hook
, bool create
)
1277 struct nlattr
*ha
[NFTA_HOOK_MAX
+ 1];
1278 const struct nf_chain_type
*type
;
1279 struct net_device
*dev
;
1282 err
= nla_parse_nested(ha
, NFTA_HOOK_MAX
, nla
[NFTA_CHAIN_HOOK
],
1283 nft_hook_policy
, NULL
);
1287 if (ha
[NFTA_HOOK_HOOKNUM
] == NULL
||
1288 ha
[NFTA_HOOK_PRIORITY
] == NULL
)
1291 hook
->num
= ntohl(nla_get_be32(ha
[NFTA_HOOK_HOOKNUM
]));
1292 if (hook
->num
>= afi
->nhooks
)
1295 hook
->priority
= ntohl(nla_get_be32(ha
[NFTA_HOOK_PRIORITY
]));
1297 type
= chain_type
[afi
->family
][NFT_CHAIN_T_DEFAULT
];
1298 if (nla
[NFTA_CHAIN_TYPE
]) {
1299 type
= nf_tables_chain_type_lookup(afi
, nla
[NFTA_CHAIN_TYPE
],
1302 return PTR_ERR(type
);
1304 if (!(type
->hook_mask
& (1 << hook
->num
)))
1306 if (!try_module_get(type
->owner
))
1312 if (afi
->flags
& NFT_AF_NEEDS_DEV
) {
1313 char ifname
[IFNAMSIZ
];
1315 if (!ha
[NFTA_HOOK_DEV
]) {
1316 module_put(type
->owner
);
1320 nla_strlcpy(ifname
, ha
[NFTA_HOOK_DEV
], IFNAMSIZ
);
1321 dev
= dev_get_by_name(net
, ifname
);
1323 module_put(type
->owner
);
1327 } else if (ha
[NFTA_HOOK_DEV
]) {
1328 module_put(type
->owner
);
1335 static void nft_chain_release_hook(struct nft_chain_hook
*hook
)
1337 module_put(hook
->type
->owner
);
1338 if (hook
->dev
!= NULL
)
1342 static int nf_tables_addchain(struct nft_ctx
*ctx
, u8 family
, u8 genmask
,
1343 u8 policy
, bool create
)
1345 const struct nlattr
* const *nla
= ctx
->nla
;
1346 struct nft_table
*table
= ctx
->table
;
1347 struct nft_af_info
*afi
= ctx
->afi
;
1348 struct nft_base_chain
*basechain
;
1349 struct nft_stats __percpu
*stats
;
1350 struct net
*net
= ctx
->net
;
1351 struct nft_chain
*chain
;
1355 if (table
->use
== UINT_MAX
)
1358 if (nla
[NFTA_CHAIN_HOOK
]) {
1359 struct nft_chain_hook hook
;
1360 struct nf_hook_ops
*ops
;
1363 err
= nft_chain_parse_hook(net
, nla
, afi
, &hook
, create
);
1367 basechain
= kzalloc(sizeof(*basechain
), GFP_KERNEL
);
1368 if (basechain
== NULL
) {
1369 nft_chain_release_hook(&hook
);
1373 if (hook
.dev
!= NULL
)
1374 strncpy(basechain
->dev_name
, hook
.dev
->name
, IFNAMSIZ
);
1376 if (nla
[NFTA_CHAIN_COUNTERS
]) {
1377 stats
= nft_stats_alloc(nla
[NFTA_CHAIN_COUNTERS
]);
1378 if (IS_ERR(stats
)) {
1379 nft_chain_release_hook(&hook
);
1381 return PTR_ERR(stats
);
1383 basechain
->stats
= stats
;
1384 static_branch_inc(&nft_counters_enabled
);
1387 hookfn
= hook
.type
->hooks
[hook
.num
];
1388 basechain
->type
= hook
.type
;
1389 chain
= &basechain
->chain
;
1391 for (i
= 0; i
< afi
->nops
; i
++) {
1392 ops
= &basechain
->ops
[i
];
1394 ops
->hooknum
= hook
.num
;
1395 ops
->priority
= hook
.priority
;
1397 ops
->hook
= afi
->hooks
[ops
->hooknum
];
1398 ops
->dev
= hook
.dev
;
1401 if (afi
->hook_ops_init
)
1402 afi
->hook_ops_init(ops
, i
);
1405 chain
->flags
|= NFT_BASE_CHAIN
;
1406 basechain
->policy
= policy
;
1408 chain
= kzalloc(sizeof(*chain
), GFP_KERNEL
);
1412 INIT_LIST_HEAD(&chain
->rules
);
1413 chain
->handle
= nf_tables_alloc_handle(table
);
1414 chain
->table
= table
;
1415 chain
->name
= nla_strdup(nla
[NFTA_CHAIN_NAME
], GFP_KERNEL
);
1421 err
= nf_tables_register_hooks(net
, table
, chain
, afi
->nops
);
1426 err
= nft_trans_chain_add(ctx
, NFT_MSG_NEWCHAIN
);
1431 list_add_tail_rcu(&chain
->list
, &table
->chains
);
1435 nf_tables_unregister_hooks(net
, table
, chain
, afi
->nops
);
1437 nf_tables_chain_destroy(chain
);
1442 static int nf_tables_updchain(struct nft_ctx
*ctx
, u8 genmask
, u8 policy
,
1445 const struct nlattr
* const *nla
= ctx
->nla
;
1446 struct nft_table
*table
= ctx
->table
;
1447 struct nft_chain
*chain
= ctx
->chain
;
1448 struct nft_af_info
*afi
= ctx
->afi
;
1449 struct nft_base_chain
*basechain
;
1450 struct nft_stats
*stats
= NULL
;
1451 struct nft_chain_hook hook
;
1452 const struct nlattr
*name
;
1453 struct nf_hook_ops
*ops
;
1454 struct nft_trans
*trans
;
1457 if (nla
[NFTA_CHAIN_HOOK
]) {
1458 if (!nft_is_base_chain(chain
))
1461 err
= nft_chain_parse_hook(ctx
->net
, nla
, ctx
->afi
, &hook
,
1466 basechain
= nft_base_chain(chain
);
1467 if (basechain
->type
!= hook
.type
) {
1468 nft_chain_release_hook(&hook
);
1472 for (i
= 0; i
< afi
->nops
; i
++) {
1473 ops
= &basechain
->ops
[i
];
1474 if (ops
->hooknum
!= hook
.num
||
1475 ops
->priority
!= hook
.priority
||
1476 ops
->dev
!= hook
.dev
) {
1477 nft_chain_release_hook(&hook
);
1481 nft_chain_release_hook(&hook
);
1484 if (nla
[NFTA_CHAIN_HANDLE
] &&
1485 nla
[NFTA_CHAIN_NAME
]) {
1486 struct nft_chain
*chain2
;
1488 chain2
= nf_tables_chain_lookup(table
, nla
[NFTA_CHAIN_NAME
],
1490 if (!IS_ERR(chain2
))
1494 if (nla
[NFTA_CHAIN_COUNTERS
]) {
1495 if (!nft_is_base_chain(chain
))
1498 stats
= nft_stats_alloc(nla
[NFTA_CHAIN_COUNTERS
]);
1500 return PTR_ERR(stats
);
1503 trans
= nft_trans_alloc(ctx
, NFT_MSG_NEWCHAIN
,
1504 sizeof(struct nft_trans_chain
));
1505 if (trans
== NULL
) {
1510 nft_trans_chain_stats(trans
) = stats
;
1511 nft_trans_chain_update(trans
) = true;
1513 if (nla
[NFTA_CHAIN_POLICY
])
1514 nft_trans_chain_policy(trans
) = policy
;
1516 nft_trans_chain_policy(trans
) = -1;
1518 name
= nla
[NFTA_CHAIN_NAME
];
1519 if (nla
[NFTA_CHAIN_HANDLE
] && name
) {
1520 nft_trans_chain_name(trans
) =
1521 nla_strdup(name
, GFP_KERNEL
);
1522 if (!nft_trans_chain_name(trans
)) {
1528 list_add_tail(&trans
->list
, &ctx
->net
->nft
.commit_list
);
1533 static int nf_tables_newchain(struct net
*net
, struct sock
*nlsk
,
1534 struct sk_buff
*skb
, const struct nlmsghdr
*nlh
,
1535 const struct nlattr
* const nla
[],
1536 struct netlink_ext_ack
*extack
)
1538 const struct nfgenmsg
*nfmsg
= nlmsg_data(nlh
);
1539 const struct nlattr
* uninitialized_var(name
);
1540 u8 genmask
= nft_genmask_next(net
);
1541 int family
= nfmsg
->nfgen_family
;
1542 struct nft_af_info
*afi
;
1543 struct nft_table
*table
;
1544 struct nft_chain
*chain
;
1545 u8 policy
= NF_ACCEPT
;
1550 create
= nlh
->nlmsg_flags
& NLM_F_CREATE
? true : false;
1552 afi
= nf_tables_afinfo_lookup(net
, family
, true);
1554 return PTR_ERR(afi
);
1556 table
= nf_tables_table_lookup(afi
, nla
[NFTA_CHAIN_TABLE
], genmask
);
1558 return PTR_ERR(table
);
1561 name
= nla
[NFTA_CHAIN_NAME
];
1563 if (nla
[NFTA_CHAIN_HANDLE
]) {
1564 handle
= be64_to_cpu(nla_get_be64(nla
[NFTA_CHAIN_HANDLE
]));
1565 chain
= nf_tables_chain_lookup_byhandle(table
, handle
, genmask
);
1567 return PTR_ERR(chain
);
1569 chain
= nf_tables_chain_lookup(table
, name
, genmask
);
1570 if (IS_ERR(chain
)) {
1571 if (PTR_ERR(chain
) != -ENOENT
)
1572 return PTR_ERR(chain
);
1577 if (nla
[NFTA_CHAIN_POLICY
]) {
1578 if (chain
!= NULL
&&
1579 !nft_is_base_chain(chain
))
1582 if (chain
== NULL
&&
1583 nla
[NFTA_CHAIN_HOOK
] == NULL
)
1586 policy
= ntohl(nla_get_be32(nla
[NFTA_CHAIN_POLICY
]));
1596 nft_ctx_init(&ctx
, net
, skb
, nlh
, afi
, table
, chain
, nla
);
1598 if (chain
!= NULL
) {
1599 if (nlh
->nlmsg_flags
& NLM_F_EXCL
)
1601 if (nlh
->nlmsg_flags
& NLM_F_REPLACE
)
1604 return nf_tables_updchain(&ctx
, genmask
, policy
, create
);
1607 return nf_tables_addchain(&ctx
, family
, genmask
, policy
, create
);
1610 static int nf_tables_delchain(struct net
*net
, struct sock
*nlsk
,
1611 struct sk_buff
*skb
, const struct nlmsghdr
*nlh
,
1612 const struct nlattr
* const nla
[],
1613 struct netlink_ext_ack
*extack
)
1615 const struct nfgenmsg
*nfmsg
= nlmsg_data(nlh
);
1616 u8 genmask
= nft_genmask_next(net
);
1617 struct nft_af_info
*afi
;
1618 struct nft_table
*table
;
1619 struct nft_chain
*chain
;
1620 struct nft_rule
*rule
;
1621 int family
= nfmsg
->nfgen_family
;
1626 afi
= nf_tables_afinfo_lookup(net
, family
, false);
1628 return PTR_ERR(afi
);
1630 table
= nf_tables_table_lookup(afi
, nla
[NFTA_CHAIN_TABLE
], genmask
);
1632 return PTR_ERR(table
);
1634 chain
= nf_tables_chain_lookup(table
, nla
[NFTA_CHAIN_NAME
], genmask
);
1636 return PTR_ERR(chain
);
1638 if (nlh
->nlmsg_flags
& NLM_F_NONREC
&&
1642 nft_ctx_init(&ctx
, net
, skb
, nlh
, afi
, table
, chain
, nla
);
1645 list_for_each_entry(rule
, &chain
->rules
, list
) {
1646 if (!nft_is_active_next(net
, rule
))
1650 err
= nft_delrule(&ctx
, rule
);
1655 /* There are rules and elements that are still holding references to us,
1656 * we cannot do a recursive removal in this case.
1661 return nft_delchain(&ctx
);
1669 * nft_register_expr - register nf_tables expr type
1672 * Registers the expr type for use with nf_tables. Returns zero on
1673 * success or a negative errno code otherwise.
1675 int nft_register_expr(struct nft_expr_type
*type
)
1677 nfnl_lock(NFNL_SUBSYS_NFTABLES
);
1678 if (type
->family
== NFPROTO_UNSPEC
)
1679 list_add_tail_rcu(&type
->list
, &nf_tables_expressions
);
1681 list_add_rcu(&type
->list
, &nf_tables_expressions
);
1682 nfnl_unlock(NFNL_SUBSYS_NFTABLES
);
1685 EXPORT_SYMBOL_GPL(nft_register_expr
);
1688 * nft_unregister_expr - unregister nf_tables expr type
1691 * Unregisters the expr type for use with nf_tables.
1693 void nft_unregister_expr(struct nft_expr_type
*type
)
1695 nfnl_lock(NFNL_SUBSYS_NFTABLES
);
1696 list_del_rcu(&type
->list
);
1697 nfnl_unlock(NFNL_SUBSYS_NFTABLES
);
1699 EXPORT_SYMBOL_GPL(nft_unregister_expr
);
1701 static const struct nft_expr_type
*__nft_expr_type_get(u8 family
,
1704 const struct nft_expr_type
*type
;
1706 list_for_each_entry(type
, &nf_tables_expressions
, list
) {
1707 if (!nla_strcmp(nla
, type
->name
) &&
1708 (!type
->family
|| type
->family
== family
))
1714 static const struct nft_expr_type
*nft_expr_type_get(u8 family
,
1717 const struct nft_expr_type
*type
;
1720 return ERR_PTR(-EINVAL
);
1722 type
= __nft_expr_type_get(family
, nla
);
1723 if (type
!= NULL
&& try_module_get(type
->owner
))
1726 #ifdef CONFIG_MODULES
1728 nfnl_unlock(NFNL_SUBSYS_NFTABLES
);
1729 request_module("nft-expr-%u-%.*s", family
,
1730 nla_len(nla
), (char *)nla_data(nla
));
1731 nfnl_lock(NFNL_SUBSYS_NFTABLES
);
1732 if (__nft_expr_type_get(family
, nla
))
1733 return ERR_PTR(-EAGAIN
);
1735 nfnl_unlock(NFNL_SUBSYS_NFTABLES
);
1736 request_module("nft-expr-%.*s",
1737 nla_len(nla
), (char *)nla_data(nla
));
1738 nfnl_lock(NFNL_SUBSYS_NFTABLES
);
1739 if (__nft_expr_type_get(family
, nla
))
1740 return ERR_PTR(-EAGAIN
);
1743 return ERR_PTR(-ENOENT
);
1746 static const struct nla_policy nft_expr_policy
[NFTA_EXPR_MAX
+ 1] = {
1747 [NFTA_EXPR_NAME
] = { .type
= NLA_STRING
},
1748 [NFTA_EXPR_DATA
] = { .type
= NLA_NESTED
},
1751 static int nf_tables_fill_expr_info(struct sk_buff
*skb
,
1752 const struct nft_expr
*expr
)
1754 if (nla_put_string(skb
, NFTA_EXPR_NAME
, expr
->ops
->type
->name
))
1755 goto nla_put_failure
;
1757 if (expr
->ops
->dump
) {
1758 struct nlattr
*data
= nla_nest_start(skb
, NFTA_EXPR_DATA
);
1760 goto nla_put_failure
;
1761 if (expr
->ops
->dump(skb
, expr
) < 0)
1762 goto nla_put_failure
;
1763 nla_nest_end(skb
, data
);
1772 int nft_expr_dump(struct sk_buff
*skb
, unsigned int attr
,
1773 const struct nft_expr
*expr
)
1775 struct nlattr
*nest
;
1777 nest
= nla_nest_start(skb
, attr
);
1779 goto nla_put_failure
;
1780 if (nf_tables_fill_expr_info(skb
, expr
) < 0)
1781 goto nla_put_failure
;
1782 nla_nest_end(skb
, nest
);
1789 struct nft_expr_info
{
1790 const struct nft_expr_ops
*ops
;
1791 struct nlattr
*tb
[NFT_EXPR_MAXATTR
+ 1];
1794 static int nf_tables_expr_parse(const struct nft_ctx
*ctx
,
1795 const struct nlattr
*nla
,
1796 struct nft_expr_info
*info
)
1798 const struct nft_expr_type
*type
;
1799 const struct nft_expr_ops
*ops
;
1800 struct nlattr
*tb
[NFTA_EXPR_MAX
+ 1];
1803 err
= nla_parse_nested(tb
, NFTA_EXPR_MAX
, nla
, nft_expr_policy
, NULL
);
1807 type
= nft_expr_type_get(ctx
->afi
->family
, tb
[NFTA_EXPR_NAME
]);
1809 return PTR_ERR(type
);
1811 if (tb
[NFTA_EXPR_DATA
]) {
1812 err
= nla_parse_nested(info
->tb
, type
->maxattr
,
1813 tb
[NFTA_EXPR_DATA
], type
->policy
, NULL
);
1817 memset(info
->tb
, 0, sizeof(info
->tb
[0]) * (type
->maxattr
+ 1));
1819 if (type
->select_ops
!= NULL
) {
1820 ops
= type
->select_ops(ctx
,
1821 (const struct nlattr
* const *)info
->tb
);
1833 module_put(type
->owner
);
1837 static int nf_tables_newexpr(const struct nft_ctx
*ctx
,
1838 const struct nft_expr_info
*info
,
1839 struct nft_expr
*expr
)
1841 const struct nft_expr_ops
*ops
= info
->ops
;
1846 err
= ops
->init(ctx
, expr
, (const struct nlattr
**)info
->tb
);
1851 if (ops
->validate
) {
1852 const struct nft_data
*data
= NULL
;
1854 err
= ops
->validate(ctx
, expr
, &data
);
1863 ops
->destroy(ctx
, expr
);
1869 static void nf_tables_expr_destroy(const struct nft_ctx
*ctx
,
1870 struct nft_expr
*expr
)
1872 if (expr
->ops
->destroy
)
1873 expr
->ops
->destroy(ctx
, expr
);
1874 module_put(expr
->ops
->type
->owner
);
1877 struct nft_expr
*nft_expr_init(const struct nft_ctx
*ctx
,
1878 const struct nlattr
*nla
)
1880 struct nft_expr_info info
;
1881 struct nft_expr
*expr
;
1884 err
= nf_tables_expr_parse(ctx
, nla
, &info
);
1889 expr
= kzalloc(info
.ops
->size
, GFP_KERNEL
);
1893 err
= nf_tables_newexpr(ctx
, &info
, expr
);
1901 module_put(info
.ops
->type
->owner
);
1903 return ERR_PTR(err
);
1906 void nft_expr_destroy(const struct nft_ctx
*ctx
, struct nft_expr
*expr
)
1908 nf_tables_expr_destroy(ctx
, expr
);
1916 static struct nft_rule
*__nf_tables_rule_lookup(const struct nft_chain
*chain
,
1919 struct nft_rule
*rule
;
1921 // FIXME: this sucks
1922 list_for_each_entry(rule
, &chain
->rules
, list
) {
1923 if (handle
== rule
->handle
)
1927 return ERR_PTR(-ENOENT
);
1930 static struct nft_rule
*nf_tables_rule_lookup(const struct nft_chain
*chain
,
1931 const struct nlattr
*nla
)
1934 return ERR_PTR(-EINVAL
);
1936 return __nf_tables_rule_lookup(chain
, be64_to_cpu(nla_get_be64(nla
)));
1939 static const struct nla_policy nft_rule_policy
[NFTA_RULE_MAX
+ 1] = {
1940 [NFTA_RULE_TABLE
] = { .type
= NLA_STRING
,
1941 .len
= NFT_TABLE_MAXNAMELEN
- 1 },
1942 [NFTA_RULE_CHAIN
] = { .type
= NLA_STRING
,
1943 .len
= NFT_CHAIN_MAXNAMELEN
- 1 },
1944 [NFTA_RULE_HANDLE
] = { .type
= NLA_U64
},
1945 [NFTA_RULE_EXPRESSIONS
] = { .type
= NLA_NESTED
},
1946 [NFTA_RULE_COMPAT
] = { .type
= NLA_NESTED
},
1947 [NFTA_RULE_POSITION
] = { .type
= NLA_U64
},
1948 [NFTA_RULE_USERDATA
] = { .type
= NLA_BINARY
,
1949 .len
= NFT_USERDATA_MAXLEN
},
1952 static int nf_tables_fill_rule_info(struct sk_buff
*skb
, struct net
*net
,
1953 u32 portid
, u32 seq
, int event
,
1954 u32 flags
, int family
,
1955 const struct nft_table
*table
,
1956 const struct nft_chain
*chain
,
1957 const struct nft_rule
*rule
)
1959 struct nlmsghdr
*nlh
;
1960 struct nfgenmsg
*nfmsg
;
1961 const struct nft_expr
*expr
, *next
;
1962 struct nlattr
*list
;
1963 const struct nft_rule
*prule
;
1964 u16 type
= nfnl_msg_type(NFNL_SUBSYS_NFTABLES
, event
);
1966 nlh
= nlmsg_put(skb
, portid
, seq
, type
, sizeof(struct nfgenmsg
), flags
);
1968 goto nla_put_failure
;
1970 nfmsg
= nlmsg_data(nlh
);
1971 nfmsg
->nfgen_family
= family
;
1972 nfmsg
->version
= NFNETLINK_V0
;
1973 nfmsg
->res_id
= htons(net
->nft
.base_seq
& 0xffff);
1975 if (nla_put_string(skb
, NFTA_RULE_TABLE
, table
->name
))
1976 goto nla_put_failure
;
1977 if (nla_put_string(skb
, NFTA_RULE_CHAIN
, chain
->name
))
1978 goto nla_put_failure
;
1979 if (nla_put_be64(skb
, NFTA_RULE_HANDLE
, cpu_to_be64(rule
->handle
),
1981 goto nla_put_failure
;
1983 if ((event
!= NFT_MSG_DELRULE
) && (rule
->list
.prev
!= &chain
->rules
)) {
1984 prule
= list_prev_entry(rule
, list
);
1985 if (nla_put_be64(skb
, NFTA_RULE_POSITION
,
1986 cpu_to_be64(prule
->handle
),
1988 goto nla_put_failure
;
1991 list
= nla_nest_start(skb
, NFTA_RULE_EXPRESSIONS
);
1993 goto nla_put_failure
;
1994 nft_rule_for_each_expr(expr
, next
, rule
) {
1995 if (nft_expr_dump(skb
, NFTA_LIST_ELEM
, expr
) < 0)
1996 goto nla_put_failure
;
1998 nla_nest_end(skb
, list
);
2001 struct nft_userdata
*udata
= nft_userdata(rule
);
2002 if (nla_put(skb
, NFTA_RULE_USERDATA
, udata
->len
+ 1,
2004 goto nla_put_failure
;
2007 nlmsg_end(skb
, nlh
);
2011 nlmsg_trim(skb
, nlh
);
2015 static void nf_tables_rule_notify(const struct nft_ctx
*ctx
,
2016 const struct nft_rule
*rule
, int event
)
2018 struct sk_buff
*skb
;
2022 !nfnetlink_has_listeners(ctx
->net
, NFNLGRP_NFTABLES
))
2025 skb
= nlmsg_new(NLMSG_GOODSIZE
, GFP_KERNEL
);
2029 err
= nf_tables_fill_rule_info(skb
, ctx
->net
, ctx
->portid
, ctx
->seq
,
2030 event
, 0, ctx
->afi
->family
, ctx
->table
,
2037 nfnetlink_send(skb
, ctx
->net
, ctx
->portid
, NFNLGRP_NFTABLES
,
2038 ctx
->report
, GFP_KERNEL
);
2041 nfnetlink_set_err(ctx
->net
, ctx
->portid
, NFNLGRP_NFTABLES
, -ENOBUFS
);
2044 struct nft_rule_dump_ctx
{
2049 static int nf_tables_dump_rules(struct sk_buff
*skb
,
2050 struct netlink_callback
*cb
)
2052 const struct nfgenmsg
*nfmsg
= nlmsg_data(cb
->nlh
);
2053 const struct nft_rule_dump_ctx
*ctx
= cb
->data
;
2054 const struct nft_af_info
*afi
;
2055 const struct nft_table
*table
;
2056 const struct nft_chain
*chain
;
2057 const struct nft_rule
*rule
;
2058 unsigned int idx
= 0, s_idx
= cb
->args
[0];
2059 struct net
*net
= sock_net(skb
->sk
);
2060 int family
= nfmsg
->nfgen_family
;
2063 cb
->seq
= net
->nft
.base_seq
;
2065 list_for_each_entry_rcu(afi
, &net
->nft
.af_info
, list
) {
2066 if (family
!= NFPROTO_UNSPEC
&& family
!= afi
->family
)
2069 list_for_each_entry_rcu(table
, &afi
->tables
, list
) {
2070 if (ctx
&& ctx
->table
&&
2071 strcmp(ctx
->table
, table
->name
) != 0)
2074 list_for_each_entry_rcu(chain
, &table
->chains
, list
) {
2075 if (ctx
&& ctx
->chain
[0] &&
2076 strcmp(ctx
->chain
, chain
->name
) != 0)
2079 list_for_each_entry_rcu(rule
, &chain
->rules
, list
) {
2080 if (!nft_is_active(net
, rule
))
2085 memset(&cb
->args
[1], 0,
2086 sizeof(cb
->args
) - sizeof(cb
->args
[0]));
2087 if (nf_tables_fill_rule_info(skb
, net
, NETLINK_CB(cb
->skb
).portid
,
2090 NLM_F_MULTI
| NLM_F_APPEND
,
2091 afi
->family
, table
, chain
, rule
) < 0)
2094 nl_dump_check_consistent(cb
, nlmsg_hdr(skb
));
2108 static int nf_tables_dump_rules_done(struct netlink_callback
*cb
)
2110 struct nft_rule_dump_ctx
*ctx
= cb
->data
;
2120 static int nf_tables_getrule(struct net
*net
, struct sock
*nlsk
,
2121 struct sk_buff
*skb
, const struct nlmsghdr
*nlh
,
2122 const struct nlattr
* const nla
[],
2123 struct netlink_ext_ack
*extack
)
2125 const struct nfgenmsg
*nfmsg
= nlmsg_data(nlh
);
2126 u8 genmask
= nft_genmask_cur(net
);
2127 const struct nft_af_info
*afi
;
2128 const struct nft_table
*table
;
2129 const struct nft_chain
*chain
;
2130 const struct nft_rule
*rule
;
2131 struct sk_buff
*skb2
;
2132 int family
= nfmsg
->nfgen_family
;
2135 if (nlh
->nlmsg_flags
& NLM_F_DUMP
) {
2136 struct netlink_dump_control c
= {
2137 .dump
= nf_tables_dump_rules
,
2138 .done
= nf_tables_dump_rules_done
,
2141 if (nla
[NFTA_RULE_TABLE
] || nla
[NFTA_RULE_CHAIN
]) {
2142 struct nft_rule_dump_ctx
*ctx
;
2144 ctx
= kzalloc(sizeof(*ctx
), GFP_KERNEL
);
2148 if (nla
[NFTA_RULE_TABLE
]) {
2149 ctx
->table
= nla_strdup(nla
[NFTA_RULE_TABLE
],
2156 if (nla
[NFTA_RULE_CHAIN
]) {
2157 ctx
->chain
= nla_strdup(nla
[NFTA_RULE_CHAIN
],
2168 return netlink_dump_start(nlsk
, skb
, nlh
, &c
);
2171 afi
= nf_tables_afinfo_lookup(net
, family
, false);
2173 return PTR_ERR(afi
);
2175 table
= nf_tables_table_lookup(afi
, nla
[NFTA_RULE_TABLE
], genmask
);
2177 return PTR_ERR(table
);
2179 chain
= nf_tables_chain_lookup(table
, nla
[NFTA_RULE_CHAIN
], genmask
);
2181 return PTR_ERR(chain
);
2183 rule
= nf_tables_rule_lookup(chain
, nla
[NFTA_RULE_HANDLE
]);
2185 return PTR_ERR(rule
);
2187 skb2
= alloc_skb(NLMSG_GOODSIZE
, GFP_KERNEL
);
2191 err
= nf_tables_fill_rule_info(skb2
, net
, NETLINK_CB(skb
).portid
,
2192 nlh
->nlmsg_seq
, NFT_MSG_NEWRULE
, 0,
2193 family
, table
, chain
, rule
);
2197 return nlmsg_unicast(nlsk
, skb2
, NETLINK_CB(skb
).portid
);
2204 static void nf_tables_rule_destroy(const struct nft_ctx
*ctx
,
2205 struct nft_rule
*rule
)
2207 struct nft_expr
*expr
;
2210 * Careful: some expressions might not be initialized in case this
2211 * is called on error from nf_tables_newrule().
2213 expr
= nft_expr_first(rule
);
2214 while (expr
!= nft_expr_last(rule
) && expr
->ops
) {
2215 nf_tables_expr_destroy(ctx
, expr
);
2216 expr
= nft_expr_next(expr
);
2221 #define NFT_RULE_MAXEXPRS 128
2223 static struct nft_expr_info
*info
;
2225 static int nf_tables_newrule(struct net
*net
, struct sock
*nlsk
,
2226 struct sk_buff
*skb
, const struct nlmsghdr
*nlh
,
2227 const struct nlattr
* const nla
[],
2228 struct netlink_ext_ack
*extack
)
2230 const struct nfgenmsg
*nfmsg
= nlmsg_data(nlh
);
2231 u8 genmask
= nft_genmask_next(net
);
2232 struct nft_af_info
*afi
;
2233 struct nft_table
*table
;
2234 struct nft_chain
*chain
;
2235 struct nft_rule
*rule
, *old_rule
= NULL
;
2236 struct nft_userdata
*udata
;
2237 struct nft_trans
*trans
= NULL
;
2238 struct nft_expr
*expr
;
2241 unsigned int size
, i
, n
, ulen
= 0, usize
= 0;
2244 u64 handle
, pos_handle
;
2246 create
= nlh
->nlmsg_flags
& NLM_F_CREATE
? true : false;
2248 afi
= nf_tables_afinfo_lookup(net
, nfmsg
->nfgen_family
, create
);
2250 return PTR_ERR(afi
);
2252 table
= nf_tables_table_lookup(afi
, nla
[NFTA_RULE_TABLE
], genmask
);
2254 return PTR_ERR(table
);
2256 chain
= nf_tables_chain_lookup(table
, nla
[NFTA_RULE_CHAIN
], genmask
);
2258 return PTR_ERR(chain
);
2260 if (nla
[NFTA_RULE_HANDLE
]) {
2261 handle
= be64_to_cpu(nla_get_be64(nla
[NFTA_RULE_HANDLE
]));
2262 rule
= __nf_tables_rule_lookup(chain
, handle
);
2264 return PTR_ERR(rule
);
2266 if (nlh
->nlmsg_flags
& NLM_F_EXCL
)
2268 if (nlh
->nlmsg_flags
& NLM_F_REPLACE
)
2273 if (!create
|| nlh
->nlmsg_flags
& NLM_F_REPLACE
)
2275 handle
= nf_tables_alloc_handle(table
);
2277 if (chain
->use
== UINT_MAX
)
2281 if (nla
[NFTA_RULE_POSITION
]) {
2282 if (!(nlh
->nlmsg_flags
& NLM_F_CREATE
))
2285 pos_handle
= be64_to_cpu(nla_get_be64(nla
[NFTA_RULE_POSITION
]));
2286 old_rule
= __nf_tables_rule_lookup(chain
, pos_handle
);
2287 if (IS_ERR(old_rule
))
2288 return PTR_ERR(old_rule
);
2291 nft_ctx_init(&ctx
, net
, skb
, nlh
, afi
, table
, chain
, nla
);
2295 if (nla
[NFTA_RULE_EXPRESSIONS
]) {
2296 nla_for_each_nested(tmp
, nla
[NFTA_RULE_EXPRESSIONS
], rem
) {
2298 if (nla_type(tmp
) != NFTA_LIST_ELEM
)
2300 if (n
== NFT_RULE_MAXEXPRS
)
2302 err
= nf_tables_expr_parse(&ctx
, tmp
, &info
[n
]);
2305 size
+= info
[n
].ops
->size
;
2309 /* Check for overflow of dlen field */
2311 if (size
>= 1 << 12)
2314 if (nla
[NFTA_RULE_USERDATA
]) {
2315 ulen
= nla_len(nla
[NFTA_RULE_USERDATA
]);
2317 usize
= sizeof(struct nft_userdata
) + ulen
;
2321 rule
= kzalloc(sizeof(*rule
) + size
+ usize
, GFP_KERNEL
);
2325 nft_activate_next(net
, rule
);
2327 rule
->handle
= handle
;
2329 rule
->udata
= ulen
? 1 : 0;
2332 udata
= nft_userdata(rule
);
2333 udata
->len
= ulen
- 1;
2334 nla_memcpy(udata
->data
, nla
[NFTA_RULE_USERDATA
], ulen
);
2337 expr
= nft_expr_first(rule
);
2338 for (i
= 0; i
< n
; i
++) {
2339 err
= nf_tables_newexpr(&ctx
, &info
[i
], expr
);
2343 expr
= nft_expr_next(expr
);
2346 if (nlh
->nlmsg_flags
& NLM_F_REPLACE
) {
2347 if (nft_is_active_next(net
, old_rule
)) {
2348 trans
= nft_trans_rule_add(&ctx
, NFT_MSG_DELRULE
,
2350 if (trans
== NULL
) {
2354 nft_deactivate_next(net
, old_rule
);
2356 list_add_tail_rcu(&rule
->list
, &old_rule
->list
);
2361 } else if (nlh
->nlmsg_flags
& NLM_F_APPEND
)
2363 list_add_rcu(&rule
->list
, &old_rule
->list
);
2365 list_add_tail_rcu(&rule
->list
, &chain
->rules
);
2368 list_add_tail_rcu(&rule
->list
, &old_rule
->list
);
2370 list_add_rcu(&rule
->list
, &chain
->rules
);
2373 if (nft_trans_rule_add(&ctx
, NFT_MSG_NEWRULE
, rule
) == NULL
) {
2381 list_del_rcu(&rule
->list
);
2383 nf_tables_rule_destroy(&ctx
, rule
);
2385 for (i
= 0; i
< n
; i
++) {
2386 if (info
[i
].ops
!= NULL
)
2387 module_put(info
[i
].ops
->type
->owner
);
2392 static struct nft_rule
*nft_rule_lookup_byid(const struct net
*net
,
2393 const struct nlattr
*nla
)
2395 u32 id
= ntohl(nla_get_be32(nla
));
2396 struct nft_trans
*trans
;
2398 list_for_each_entry(trans
, &net
->nft
.commit_list
, list
) {
2399 struct nft_rule
*rule
= nft_trans_rule(trans
);
2401 if (trans
->msg_type
== NFT_MSG_NEWRULE
&&
2402 id
== nft_trans_rule_id(trans
))
2405 return ERR_PTR(-ENOENT
);
2408 static int nf_tables_delrule(struct net
*net
, struct sock
*nlsk
,
2409 struct sk_buff
*skb
, const struct nlmsghdr
*nlh
,
2410 const struct nlattr
* const nla
[],
2411 struct netlink_ext_ack
*extack
)
2413 const struct nfgenmsg
*nfmsg
= nlmsg_data(nlh
);
2414 u8 genmask
= nft_genmask_next(net
);
2415 struct nft_af_info
*afi
;
2416 struct nft_table
*table
;
2417 struct nft_chain
*chain
= NULL
;
2418 struct nft_rule
*rule
;
2419 int family
= nfmsg
->nfgen_family
, err
= 0;
2422 afi
= nf_tables_afinfo_lookup(net
, family
, false);
2424 return PTR_ERR(afi
);
2426 table
= nf_tables_table_lookup(afi
, nla
[NFTA_RULE_TABLE
], genmask
);
2428 return PTR_ERR(table
);
2430 if (nla
[NFTA_RULE_CHAIN
]) {
2431 chain
= nf_tables_chain_lookup(table
, nla
[NFTA_RULE_CHAIN
],
2434 return PTR_ERR(chain
);
2437 nft_ctx_init(&ctx
, net
, skb
, nlh
, afi
, table
, chain
, nla
);
2440 if (nla
[NFTA_RULE_HANDLE
]) {
2441 rule
= nf_tables_rule_lookup(chain
,
2442 nla
[NFTA_RULE_HANDLE
]);
2444 return PTR_ERR(rule
);
2446 err
= nft_delrule(&ctx
, rule
);
2447 } else if (nla
[NFTA_RULE_ID
]) {
2448 rule
= nft_rule_lookup_byid(net
, nla
[NFTA_RULE_ID
]);
2450 return PTR_ERR(rule
);
2452 err
= nft_delrule(&ctx
, rule
);
2454 err
= nft_delrule_by_chain(&ctx
);
2457 list_for_each_entry(chain
, &table
->chains
, list
) {
2458 if (!nft_is_active_next(net
, chain
))
2462 err
= nft_delrule_by_chain(&ctx
);
2475 static LIST_HEAD(nf_tables_set_types
);
2477 int nft_register_set(struct nft_set_type
*type
)
2479 nfnl_lock(NFNL_SUBSYS_NFTABLES
);
2480 list_add_tail_rcu(&type
->list
, &nf_tables_set_types
);
2481 nfnl_unlock(NFNL_SUBSYS_NFTABLES
);
2484 EXPORT_SYMBOL_GPL(nft_register_set
);
2486 void nft_unregister_set(struct nft_set_type
*type
)
2488 nfnl_lock(NFNL_SUBSYS_NFTABLES
);
2489 list_del_rcu(&type
->list
);
2490 nfnl_unlock(NFNL_SUBSYS_NFTABLES
);
2492 EXPORT_SYMBOL_GPL(nft_unregister_set
);
2494 #define NFT_SET_FEATURES (NFT_SET_INTERVAL | NFT_SET_MAP | \
2495 NFT_SET_TIMEOUT | NFT_SET_OBJECT)
2497 static bool nft_set_ops_candidate(const struct nft_set_ops
*ops
, u32 flags
)
2499 return (flags
& ops
->features
) == (flags
& NFT_SET_FEATURES
);
2503 * Select a set implementation based on the data characteristics and the
2504 * given policy. The total memory use might not be known if no size is
2505 * given, in that case the amount of memory per element is used.
2507 static const struct nft_set_ops
*
2508 nft_select_set_ops(const struct nft_ctx
*ctx
,
2509 const struct nlattr
* const nla
[],
2510 const struct nft_set_desc
*desc
,
2511 enum nft_set_policies policy
)
2513 const struct nft_set_ops
*ops
, *bops
;
2514 struct nft_set_estimate est
, best
;
2515 const struct nft_set_type
*type
;
2518 #ifdef CONFIG_MODULES
2519 if (list_empty(&nf_tables_set_types
)) {
2520 nfnl_unlock(NFNL_SUBSYS_NFTABLES
);
2521 request_module("nft-set");
2522 nfnl_lock(NFNL_SUBSYS_NFTABLES
);
2523 if (!list_empty(&nf_tables_set_types
))
2524 return ERR_PTR(-EAGAIN
);
2527 if (nla
[NFTA_SET_FLAGS
] != NULL
)
2528 flags
= ntohl(nla_get_be32(nla
[NFTA_SET_FLAGS
]));
2535 list_for_each_entry(type
, &nf_tables_set_types
, list
) {
2536 if (!type
->select_ops
)
2539 ops
= type
->select_ops(ctx
, desc
, flags
);
2543 if (!nft_set_ops_candidate(ops
, flags
))
2545 if (!ops
->estimate(desc
, flags
, &est
))
2549 case NFT_SET_POL_PERFORMANCE
:
2550 if (est
.lookup
< best
.lookup
)
2552 if (est
.lookup
== best
.lookup
&&
2553 est
.space
< best
.space
)
2556 case NFT_SET_POL_MEMORY
:
2558 if (est
.space
< best
.space
)
2560 if (est
.space
== best
.space
&&
2561 est
.lookup
< best
.lookup
)
2563 } else if (est
.size
< best
.size
) {
2571 if (!try_module_get(type
->owner
))
2574 module_put(bops
->type
->owner
);
2583 return ERR_PTR(-EOPNOTSUPP
);
2586 static const struct nla_policy nft_set_policy
[NFTA_SET_MAX
+ 1] = {
2587 [NFTA_SET_TABLE
] = { .type
= NLA_STRING
,
2588 .len
= NFT_TABLE_MAXNAMELEN
- 1 },
2589 [NFTA_SET_NAME
] = { .type
= NLA_STRING
,
2590 .len
= NFT_SET_MAXNAMELEN
- 1 },
2591 [NFTA_SET_FLAGS
] = { .type
= NLA_U32
},
2592 [NFTA_SET_KEY_TYPE
] = { .type
= NLA_U32
},
2593 [NFTA_SET_KEY_LEN
] = { .type
= NLA_U32
},
2594 [NFTA_SET_DATA_TYPE
] = { .type
= NLA_U32
},
2595 [NFTA_SET_DATA_LEN
] = { .type
= NLA_U32
},
2596 [NFTA_SET_POLICY
] = { .type
= NLA_U32
},
2597 [NFTA_SET_DESC
] = { .type
= NLA_NESTED
},
2598 [NFTA_SET_ID
] = { .type
= NLA_U32
},
2599 [NFTA_SET_TIMEOUT
] = { .type
= NLA_U64
},
2600 [NFTA_SET_GC_INTERVAL
] = { .type
= NLA_U32
},
2601 [NFTA_SET_USERDATA
] = { .type
= NLA_BINARY
,
2602 .len
= NFT_USERDATA_MAXLEN
},
2603 [NFTA_SET_OBJ_TYPE
] = { .type
= NLA_U32
},
2606 static const struct nla_policy nft_set_desc_policy
[NFTA_SET_DESC_MAX
+ 1] = {
2607 [NFTA_SET_DESC_SIZE
] = { .type
= NLA_U32
},
2610 static int nft_ctx_init_from_setattr(struct nft_ctx
*ctx
, struct net
*net
,
2611 const struct sk_buff
*skb
,
2612 const struct nlmsghdr
*nlh
,
2613 const struct nlattr
* const nla
[],
2616 const struct nfgenmsg
*nfmsg
= nlmsg_data(nlh
);
2617 struct nft_af_info
*afi
= NULL
;
2618 struct nft_table
*table
= NULL
;
2620 if (nfmsg
->nfgen_family
!= NFPROTO_UNSPEC
) {
2621 afi
= nf_tables_afinfo_lookup(net
, nfmsg
->nfgen_family
, false);
2623 return PTR_ERR(afi
);
2626 if (nla
[NFTA_SET_TABLE
] != NULL
) {
2628 return -EAFNOSUPPORT
;
2630 table
= nf_tables_table_lookup(afi
, nla
[NFTA_SET_TABLE
],
2633 return PTR_ERR(table
);
2636 nft_ctx_init(ctx
, net
, skb
, nlh
, afi
, table
, NULL
, nla
);
2640 static struct nft_set
*nf_tables_set_lookup(const struct nft_table
*table
,
2641 const struct nlattr
*nla
, u8 genmask
)
2643 struct nft_set
*set
;
2646 return ERR_PTR(-EINVAL
);
2648 list_for_each_entry(set
, &table
->sets
, list
) {
2649 if (!nla_strcmp(nla
, set
->name
) &&
2650 nft_active_genmask(set
, genmask
))
2653 return ERR_PTR(-ENOENT
);
2656 static struct nft_set
*nf_tables_set_lookup_byid(const struct net
*net
,
2657 const struct nlattr
*nla
,
2660 struct nft_trans
*trans
;
2661 u32 id
= ntohl(nla_get_be32(nla
));
2663 list_for_each_entry(trans
, &net
->nft
.commit_list
, list
) {
2664 struct nft_set
*set
= nft_trans_set(trans
);
2666 if (trans
->msg_type
== NFT_MSG_NEWSET
&&
2667 id
== nft_trans_set_id(trans
) &&
2668 nft_active_genmask(set
, genmask
))
2671 return ERR_PTR(-ENOENT
);
2674 struct nft_set
*nft_set_lookup(const struct net
*net
,
2675 const struct nft_table
*table
,
2676 const struct nlattr
*nla_set_name
,
2677 const struct nlattr
*nla_set_id
,
2680 struct nft_set
*set
;
2682 set
= nf_tables_set_lookup(table
, nla_set_name
, genmask
);
2687 set
= nf_tables_set_lookup_byid(net
, nla_set_id
, genmask
);
2691 EXPORT_SYMBOL_GPL(nft_set_lookup
);
2693 static int nf_tables_set_alloc_name(struct nft_ctx
*ctx
, struct nft_set
*set
,
2696 const struct nft_set
*i
;
2698 unsigned long *inuse
;
2699 unsigned int n
= 0, min
= 0;
2701 p
= strchr(name
, '%');
2703 if (p
[1] != 'd' || strchr(p
+ 2, '%'))
2706 inuse
= (unsigned long *)get_zeroed_page(GFP_KERNEL
);
2710 list_for_each_entry(i
, &ctx
->table
->sets
, list
) {
2713 if (!nft_is_active_next(ctx
->net
, set
))
2715 if (!sscanf(i
->name
, name
, &tmp
))
2717 if (tmp
< min
|| tmp
>= min
+ BITS_PER_BYTE
* PAGE_SIZE
)
2720 set_bit(tmp
- min
, inuse
);
2723 n
= find_first_zero_bit(inuse
, BITS_PER_BYTE
* PAGE_SIZE
);
2724 if (n
>= BITS_PER_BYTE
* PAGE_SIZE
) {
2725 min
+= BITS_PER_BYTE
* PAGE_SIZE
;
2726 memset(inuse
, 0, PAGE_SIZE
);
2729 free_page((unsigned long)inuse
);
2732 set
->name
= kasprintf(GFP_KERNEL
, name
, min
+ n
);
2736 list_for_each_entry(i
, &ctx
->table
->sets
, list
) {
2737 if (!nft_is_active_next(ctx
->net
, i
))
2739 if (!strcmp(set
->name
, i
->name
)) {
2747 static int nf_tables_fill_set(struct sk_buff
*skb
, const struct nft_ctx
*ctx
,
2748 const struct nft_set
*set
, u16 event
, u16 flags
)
2750 struct nfgenmsg
*nfmsg
;
2751 struct nlmsghdr
*nlh
;
2752 struct nlattr
*desc
;
2753 u32 portid
= ctx
->portid
;
2756 event
= nfnl_msg_type(NFNL_SUBSYS_NFTABLES
, event
);
2757 nlh
= nlmsg_put(skb
, portid
, seq
, event
, sizeof(struct nfgenmsg
),
2760 goto nla_put_failure
;
2762 nfmsg
= nlmsg_data(nlh
);
2763 nfmsg
->nfgen_family
= ctx
->afi
->family
;
2764 nfmsg
->version
= NFNETLINK_V0
;
2765 nfmsg
->res_id
= htons(ctx
->net
->nft
.base_seq
& 0xffff);
2767 if (nla_put_string(skb
, NFTA_SET_TABLE
, ctx
->table
->name
))
2768 goto nla_put_failure
;
2769 if (nla_put_string(skb
, NFTA_SET_NAME
, set
->name
))
2770 goto nla_put_failure
;
2771 if (set
->flags
!= 0)
2772 if (nla_put_be32(skb
, NFTA_SET_FLAGS
, htonl(set
->flags
)))
2773 goto nla_put_failure
;
2775 if (nla_put_be32(skb
, NFTA_SET_KEY_TYPE
, htonl(set
->ktype
)))
2776 goto nla_put_failure
;
2777 if (nla_put_be32(skb
, NFTA_SET_KEY_LEN
, htonl(set
->klen
)))
2778 goto nla_put_failure
;
2779 if (set
->flags
& NFT_SET_MAP
) {
2780 if (nla_put_be32(skb
, NFTA_SET_DATA_TYPE
, htonl(set
->dtype
)))
2781 goto nla_put_failure
;
2782 if (nla_put_be32(skb
, NFTA_SET_DATA_LEN
, htonl(set
->dlen
)))
2783 goto nla_put_failure
;
2785 if (set
->flags
& NFT_SET_OBJECT
&&
2786 nla_put_be32(skb
, NFTA_SET_OBJ_TYPE
, htonl(set
->objtype
)))
2787 goto nla_put_failure
;
2790 nla_put_be64(skb
, NFTA_SET_TIMEOUT
,
2791 cpu_to_be64(jiffies_to_msecs(set
->timeout
)),
2793 goto nla_put_failure
;
2795 nla_put_be32(skb
, NFTA_SET_GC_INTERVAL
, htonl(set
->gc_int
)))
2796 goto nla_put_failure
;
2798 if (set
->policy
!= NFT_SET_POL_PERFORMANCE
) {
2799 if (nla_put_be32(skb
, NFTA_SET_POLICY
, htonl(set
->policy
)))
2800 goto nla_put_failure
;
2803 if (nla_put(skb
, NFTA_SET_USERDATA
, set
->udlen
, set
->udata
))
2804 goto nla_put_failure
;
2806 desc
= nla_nest_start(skb
, NFTA_SET_DESC
);
2808 goto nla_put_failure
;
2810 nla_put_be32(skb
, NFTA_SET_DESC_SIZE
, htonl(set
->size
)))
2811 goto nla_put_failure
;
2812 nla_nest_end(skb
, desc
);
2814 nlmsg_end(skb
, nlh
);
2818 nlmsg_trim(skb
, nlh
);
2822 static void nf_tables_set_notify(const struct nft_ctx
*ctx
,
2823 const struct nft_set
*set
, int event
,
2826 struct sk_buff
*skb
;
2827 u32 portid
= ctx
->portid
;
2831 !nfnetlink_has_listeners(ctx
->net
, NFNLGRP_NFTABLES
))
2834 skb
= nlmsg_new(NLMSG_GOODSIZE
, gfp_flags
);
2838 err
= nf_tables_fill_set(skb
, ctx
, set
, event
, 0);
2844 nfnetlink_send(skb
, ctx
->net
, portid
, NFNLGRP_NFTABLES
, ctx
->report
,
2848 nfnetlink_set_err(ctx
->net
, portid
, NFNLGRP_NFTABLES
, -ENOBUFS
);
2851 static int nf_tables_dump_sets(struct sk_buff
*skb
, struct netlink_callback
*cb
)
2853 const struct nft_set
*set
;
2854 unsigned int idx
, s_idx
= cb
->args
[0];
2855 struct nft_af_info
*afi
;
2856 struct nft_table
*table
, *cur_table
= (struct nft_table
*)cb
->args
[2];
2857 struct net
*net
= sock_net(skb
->sk
);
2858 int cur_family
= cb
->args
[3];
2859 struct nft_ctx
*ctx
= cb
->data
, ctx_set
;
2865 cb
->seq
= net
->nft
.base_seq
;
2867 list_for_each_entry_rcu(afi
, &net
->nft
.af_info
, list
) {
2868 if (ctx
->afi
&& ctx
->afi
!= afi
)
2872 if (afi
->family
!= cur_family
)
2877 list_for_each_entry_rcu(table
, &afi
->tables
, list
) {
2878 if (ctx
->table
&& ctx
->table
!= table
)
2882 if (cur_table
!= table
)
2888 list_for_each_entry_rcu(set
, &table
->sets
, list
) {
2891 if (!nft_is_active(net
, set
))
2895 ctx_set
.table
= table
;
2897 if (nf_tables_fill_set(skb
, &ctx_set
, set
,
2901 cb
->args
[2] = (unsigned long) table
;
2902 cb
->args
[3] = afi
->family
;
2905 nl_dump_check_consistent(cb
, nlmsg_hdr(skb
));
2919 static int nf_tables_dump_sets_done(struct netlink_callback
*cb
)
2925 static int nf_tables_getset(struct net
*net
, struct sock
*nlsk
,
2926 struct sk_buff
*skb
, const struct nlmsghdr
*nlh
,
2927 const struct nlattr
* const nla
[],
2928 struct netlink_ext_ack
*extack
)
2930 u8 genmask
= nft_genmask_cur(net
);
2931 const struct nft_set
*set
;
2933 struct sk_buff
*skb2
;
2934 const struct nfgenmsg
*nfmsg
= nlmsg_data(nlh
);
2937 /* Verify existence before starting dump */
2938 err
= nft_ctx_init_from_setattr(&ctx
, net
, skb
, nlh
, nla
, genmask
);
2942 if (nlh
->nlmsg_flags
& NLM_F_DUMP
) {
2943 struct netlink_dump_control c
= {
2944 .dump
= nf_tables_dump_sets
,
2945 .done
= nf_tables_dump_sets_done
,
2947 struct nft_ctx
*ctx_dump
;
2949 ctx_dump
= kmalloc(sizeof(*ctx_dump
), GFP_KERNEL
);
2950 if (ctx_dump
== NULL
)
2956 return netlink_dump_start(nlsk
, skb
, nlh
, &c
);
2959 /* Only accept unspec with dump */
2960 if (nfmsg
->nfgen_family
== NFPROTO_UNSPEC
)
2961 return -EAFNOSUPPORT
;
2962 if (!nla
[NFTA_SET_TABLE
])
2965 set
= nf_tables_set_lookup(ctx
.table
, nla
[NFTA_SET_NAME
], genmask
);
2967 return PTR_ERR(set
);
2969 skb2
= alloc_skb(NLMSG_GOODSIZE
, GFP_KERNEL
);
2973 err
= nf_tables_fill_set(skb2
, &ctx
, set
, NFT_MSG_NEWSET
, 0);
2977 return nlmsg_unicast(nlsk
, skb2
, NETLINK_CB(skb
).portid
);
2984 static int nf_tables_set_desc_parse(const struct nft_ctx
*ctx
,
2985 struct nft_set_desc
*desc
,
2986 const struct nlattr
*nla
)
2988 struct nlattr
*da
[NFTA_SET_DESC_MAX
+ 1];
2991 err
= nla_parse_nested(da
, NFTA_SET_DESC_MAX
, nla
,
2992 nft_set_desc_policy
, NULL
);
2996 if (da
[NFTA_SET_DESC_SIZE
] != NULL
)
2997 desc
->size
= ntohl(nla_get_be32(da
[NFTA_SET_DESC_SIZE
]));
3002 static int nf_tables_newset(struct net
*net
, struct sock
*nlsk
,
3003 struct sk_buff
*skb
, const struct nlmsghdr
*nlh
,
3004 const struct nlattr
* const nla
[],
3005 struct netlink_ext_ack
*extack
)
3007 const struct nfgenmsg
*nfmsg
= nlmsg_data(nlh
);
3008 u8 genmask
= nft_genmask_next(net
);
3009 const struct nft_set_ops
*ops
;
3010 struct nft_af_info
*afi
;
3011 struct nft_table
*table
;
3012 struct nft_set
*set
;
3018 u32 ktype
, dtype
, flags
, policy
, gc_int
, objtype
;
3019 struct nft_set_desc desc
;
3020 unsigned char *udata
;
3024 if (nla
[NFTA_SET_TABLE
] == NULL
||
3025 nla
[NFTA_SET_NAME
] == NULL
||
3026 nla
[NFTA_SET_KEY_LEN
] == NULL
||
3027 nla
[NFTA_SET_ID
] == NULL
)
3030 memset(&desc
, 0, sizeof(desc
));
3032 ktype
= NFT_DATA_VALUE
;
3033 if (nla
[NFTA_SET_KEY_TYPE
] != NULL
) {
3034 ktype
= ntohl(nla_get_be32(nla
[NFTA_SET_KEY_TYPE
]));
3035 if ((ktype
& NFT_DATA_RESERVED_MASK
) == NFT_DATA_RESERVED_MASK
)
3039 desc
.klen
= ntohl(nla_get_be32(nla
[NFTA_SET_KEY_LEN
]));
3040 if (desc
.klen
== 0 || desc
.klen
> NFT_DATA_VALUE_MAXLEN
)
3044 if (nla
[NFTA_SET_FLAGS
] != NULL
) {
3045 flags
= ntohl(nla_get_be32(nla
[NFTA_SET_FLAGS
]));
3046 if (flags
& ~(NFT_SET_ANONYMOUS
| NFT_SET_CONSTANT
|
3047 NFT_SET_INTERVAL
| NFT_SET_TIMEOUT
|
3048 NFT_SET_MAP
| NFT_SET_EVAL
|
3051 /* Only one of these operations is supported */
3052 if ((flags
& (NFT_SET_MAP
| NFT_SET_EVAL
| NFT_SET_OBJECT
)) ==
3053 (NFT_SET_MAP
| NFT_SET_EVAL
| NFT_SET_OBJECT
))
3058 if (nla
[NFTA_SET_DATA_TYPE
] != NULL
) {
3059 if (!(flags
& NFT_SET_MAP
))
3062 dtype
= ntohl(nla_get_be32(nla
[NFTA_SET_DATA_TYPE
]));
3063 if ((dtype
& NFT_DATA_RESERVED_MASK
) == NFT_DATA_RESERVED_MASK
&&
3064 dtype
!= NFT_DATA_VERDICT
)
3067 if (dtype
!= NFT_DATA_VERDICT
) {
3068 if (nla
[NFTA_SET_DATA_LEN
] == NULL
)
3070 desc
.dlen
= ntohl(nla_get_be32(nla
[NFTA_SET_DATA_LEN
]));
3071 if (desc
.dlen
== 0 || desc
.dlen
> NFT_DATA_VALUE_MAXLEN
)
3074 desc
.dlen
= sizeof(struct nft_verdict
);
3075 } else if (flags
& NFT_SET_MAP
)
3078 if (nla
[NFTA_SET_OBJ_TYPE
] != NULL
) {
3079 if (!(flags
& NFT_SET_OBJECT
))
3082 objtype
= ntohl(nla_get_be32(nla
[NFTA_SET_OBJ_TYPE
]));
3083 if (objtype
== NFT_OBJECT_UNSPEC
||
3084 objtype
> NFT_OBJECT_MAX
)
3086 } else if (flags
& NFT_SET_OBJECT
)
3089 objtype
= NFT_OBJECT_UNSPEC
;
3092 if (nla
[NFTA_SET_TIMEOUT
] != NULL
) {
3093 if (!(flags
& NFT_SET_TIMEOUT
))
3095 timeout
= msecs_to_jiffies(be64_to_cpu(nla_get_be64(
3096 nla
[NFTA_SET_TIMEOUT
])));
3099 if (nla
[NFTA_SET_GC_INTERVAL
] != NULL
) {
3100 if (!(flags
& NFT_SET_TIMEOUT
))
3102 gc_int
= ntohl(nla_get_be32(nla
[NFTA_SET_GC_INTERVAL
]));
3105 policy
= NFT_SET_POL_PERFORMANCE
;
3106 if (nla
[NFTA_SET_POLICY
] != NULL
)
3107 policy
= ntohl(nla_get_be32(nla
[NFTA_SET_POLICY
]));
3109 if (nla
[NFTA_SET_DESC
] != NULL
) {
3110 err
= nf_tables_set_desc_parse(&ctx
, &desc
, nla
[NFTA_SET_DESC
]);
3115 create
= nlh
->nlmsg_flags
& NLM_F_CREATE
? true : false;
3117 afi
= nf_tables_afinfo_lookup(net
, nfmsg
->nfgen_family
, create
);
3119 return PTR_ERR(afi
);
3121 table
= nf_tables_table_lookup(afi
, nla
[NFTA_SET_TABLE
], genmask
);
3123 return PTR_ERR(table
);
3125 nft_ctx_init(&ctx
, net
, skb
, nlh
, afi
, table
, NULL
, nla
);
3127 set
= nf_tables_set_lookup(table
, nla
[NFTA_SET_NAME
], genmask
);
3129 if (PTR_ERR(set
) != -ENOENT
)
3130 return PTR_ERR(set
);
3132 if (nlh
->nlmsg_flags
& NLM_F_EXCL
)
3134 if (nlh
->nlmsg_flags
& NLM_F_REPLACE
)
3139 if (!(nlh
->nlmsg_flags
& NLM_F_CREATE
))
3142 ops
= nft_select_set_ops(&ctx
, nla
, &desc
, policy
);
3144 return PTR_ERR(ops
);
3147 if (nla
[NFTA_SET_USERDATA
])
3148 udlen
= nla_len(nla
[NFTA_SET_USERDATA
]);
3151 if (ops
->privsize
!= NULL
)
3152 size
= ops
->privsize(nla
, &desc
);
3154 set
= kvzalloc(sizeof(*set
) + size
+ udlen
, GFP_KERNEL
);
3160 name
= nla_strdup(nla
[NFTA_SET_NAME
], GFP_KERNEL
);
3166 err
= nf_tables_set_alloc_name(&ctx
, set
, name
);
3173 udata
= set
->data
+ size
;
3174 nla_memcpy(udata
, nla
[NFTA_SET_USERDATA
], udlen
);
3177 INIT_LIST_HEAD(&set
->bindings
);
3180 set
->klen
= desc
.klen
;
3182 set
->objtype
= objtype
;
3183 set
->dlen
= desc
.dlen
;
3185 set
->size
= desc
.size
;
3186 set
->policy
= policy
;
3189 set
->timeout
= timeout
;
3190 set
->gc_int
= gc_int
;
3192 err
= ops
->init(set
, &desc
, nla
);
3196 err
= nft_trans_set_add(&ctx
, NFT_MSG_NEWSET
, set
);
3200 list_add_tail_rcu(&set
->list
, &table
->sets
);
3209 module_put(ops
->type
->owner
);
3213 static void nft_set_destroy(struct nft_set
*set
)
3215 set
->ops
->destroy(set
);
3216 module_put(set
->ops
->type
->owner
);
3221 static void nf_tables_set_destroy(const struct nft_ctx
*ctx
, struct nft_set
*set
)
3223 list_del_rcu(&set
->list
);
3224 nf_tables_set_notify(ctx
, set
, NFT_MSG_DELSET
, GFP_ATOMIC
);
3225 nft_set_destroy(set
);
3228 static int nf_tables_delset(struct net
*net
, struct sock
*nlsk
,
3229 struct sk_buff
*skb
, const struct nlmsghdr
*nlh
,
3230 const struct nlattr
* const nla
[],
3231 struct netlink_ext_ack
*extack
)
3233 const struct nfgenmsg
*nfmsg
= nlmsg_data(nlh
);
3234 u8 genmask
= nft_genmask_next(net
);
3235 struct nft_set
*set
;
3239 if (nfmsg
->nfgen_family
== NFPROTO_UNSPEC
)
3240 return -EAFNOSUPPORT
;
3241 if (nla
[NFTA_SET_TABLE
] == NULL
)
3244 err
= nft_ctx_init_from_setattr(&ctx
, net
, skb
, nlh
, nla
, genmask
);
3248 set
= nf_tables_set_lookup(ctx
.table
, nla
[NFTA_SET_NAME
], genmask
);
3250 return PTR_ERR(set
);
3252 if (!list_empty(&set
->bindings
) ||
3253 (nlh
->nlmsg_flags
& NLM_F_NONREC
&& atomic_read(&set
->nelems
) > 0))
3256 return nft_delset(&ctx
, set
);
3259 static int nf_tables_bind_check_setelem(const struct nft_ctx
*ctx
,
3260 struct nft_set
*set
,
3261 const struct nft_set_iter
*iter
,
3262 struct nft_set_elem
*elem
)
3264 const struct nft_set_ext
*ext
= nft_set_elem_ext(set
, elem
->priv
);
3265 enum nft_registers dreg
;
3267 dreg
= nft_type_to_reg(set
->dtype
);
3268 return nft_validate_register_store(ctx
, dreg
, nft_set_ext_data(ext
),
3269 set
->dtype
== NFT_DATA_VERDICT
?
3270 NFT_DATA_VERDICT
: NFT_DATA_VALUE
,
3274 int nf_tables_bind_set(const struct nft_ctx
*ctx
, struct nft_set
*set
,
3275 struct nft_set_binding
*binding
)
3277 struct nft_set_binding
*i
;
3278 struct nft_set_iter iter
;
3280 if (!list_empty(&set
->bindings
) && set
->flags
& NFT_SET_ANONYMOUS
)
3283 if (binding
->flags
& NFT_SET_MAP
) {
3284 /* If the set is already bound to the same chain all
3285 * jumps are already validated for that chain.
3287 list_for_each_entry(i
, &set
->bindings
, list
) {
3288 if (i
->flags
& NFT_SET_MAP
&&
3289 i
->chain
== binding
->chain
)
3293 iter
.genmask
= nft_genmask_next(ctx
->net
);
3297 iter
.fn
= nf_tables_bind_check_setelem
;
3299 set
->ops
->walk(ctx
, set
, &iter
);
3304 binding
->chain
= ctx
->chain
;
3305 list_add_tail_rcu(&binding
->list
, &set
->bindings
);
3308 EXPORT_SYMBOL_GPL(nf_tables_bind_set
);
3310 void nf_tables_unbind_set(const struct nft_ctx
*ctx
, struct nft_set
*set
,
3311 struct nft_set_binding
*binding
)
3313 list_del_rcu(&binding
->list
);
3315 if (list_empty(&set
->bindings
) && set
->flags
& NFT_SET_ANONYMOUS
&&
3316 nft_is_active(ctx
->net
, set
))
3317 nf_tables_set_destroy(ctx
, set
);
3319 EXPORT_SYMBOL_GPL(nf_tables_unbind_set
);
3321 const struct nft_set_ext_type nft_set_ext_types
[] = {
3322 [NFT_SET_EXT_KEY
] = {
3323 .align
= __alignof__(u32
),
3325 [NFT_SET_EXT_DATA
] = {
3326 .align
= __alignof__(u32
),
3328 [NFT_SET_EXT_EXPR
] = {
3329 .align
= __alignof__(struct nft_expr
),
3331 [NFT_SET_EXT_OBJREF
] = {
3332 .len
= sizeof(struct nft_object
*),
3333 .align
= __alignof__(struct nft_object
*),
3335 [NFT_SET_EXT_FLAGS
] = {
3337 .align
= __alignof__(u8
),
3339 [NFT_SET_EXT_TIMEOUT
] = {
3341 .align
= __alignof__(u64
),
3343 [NFT_SET_EXT_EXPIRATION
] = {
3344 .len
= sizeof(unsigned long),
3345 .align
= __alignof__(unsigned long),
3347 [NFT_SET_EXT_USERDATA
] = {
3348 .len
= sizeof(struct nft_userdata
),
3349 .align
= __alignof__(struct nft_userdata
),
3352 EXPORT_SYMBOL_GPL(nft_set_ext_types
);
3358 static const struct nla_policy nft_set_elem_policy
[NFTA_SET_ELEM_MAX
+ 1] = {
3359 [NFTA_SET_ELEM_KEY
] = { .type
= NLA_NESTED
},
3360 [NFTA_SET_ELEM_DATA
] = { .type
= NLA_NESTED
},
3361 [NFTA_SET_ELEM_FLAGS
] = { .type
= NLA_U32
},
3362 [NFTA_SET_ELEM_TIMEOUT
] = { .type
= NLA_U64
},
3363 [NFTA_SET_ELEM_USERDATA
] = { .type
= NLA_BINARY
,
3364 .len
= NFT_USERDATA_MAXLEN
},
3367 static const struct nla_policy nft_set_elem_list_policy
[NFTA_SET_ELEM_LIST_MAX
+ 1] = {
3368 [NFTA_SET_ELEM_LIST_TABLE
] = { .type
= NLA_STRING
,
3369 .len
= NFT_TABLE_MAXNAMELEN
- 1 },
3370 [NFTA_SET_ELEM_LIST_SET
] = { .type
= NLA_STRING
,
3371 .len
= NFT_SET_MAXNAMELEN
- 1 },
3372 [NFTA_SET_ELEM_LIST_ELEMENTS
] = { .type
= NLA_NESTED
},
3373 [NFTA_SET_ELEM_LIST_SET_ID
] = { .type
= NLA_U32
},
3376 static int nft_ctx_init_from_elemattr(struct nft_ctx
*ctx
, struct net
*net
,
3377 const struct sk_buff
*skb
,
3378 const struct nlmsghdr
*nlh
,
3379 const struct nlattr
* const nla
[],
3382 const struct nfgenmsg
*nfmsg
= nlmsg_data(nlh
);
3383 struct nft_af_info
*afi
;
3384 struct nft_table
*table
;
3386 afi
= nf_tables_afinfo_lookup(net
, nfmsg
->nfgen_family
, false);
3388 return PTR_ERR(afi
);
3390 table
= nf_tables_table_lookup(afi
, nla
[NFTA_SET_ELEM_LIST_TABLE
],
3393 return PTR_ERR(table
);
3395 nft_ctx_init(ctx
, net
, skb
, nlh
, afi
, table
, NULL
, nla
);
3399 static int nf_tables_fill_setelem(struct sk_buff
*skb
,
3400 const struct nft_set
*set
,
3401 const struct nft_set_elem
*elem
)
3403 const struct nft_set_ext
*ext
= nft_set_elem_ext(set
, elem
->priv
);
3404 unsigned char *b
= skb_tail_pointer(skb
);
3405 struct nlattr
*nest
;
3407 nest
= nla_nest_start(skb
, NFTA_LIST_ELEM
);
3409 goto nla_put_failure
;
3411 if (nft_data_dump(skb
, NFTA_SET_ELEM_KEY
, nft_set_ext_key(ext
),
3412 NFT_DATA_VALUE
, set
->klen
) < 0)
3413 goto nla_put_failure
;
3415 if (nft_set_ext_exists(ext
, NFT_SET_EXT_DATA
) &&
3416 nft_data_dump(skb
, NFTA_SET_ELEM_DATA
, nft_set_ext_data(ext
),
3417 set
->dtype
== NFT_DATA_VERDICT
? NFT_DATA_VERDICT
: NFT_DATA_VALUE
,
3419 goto nla_put_failure
;
3421 if (nft_set_ext_exists(ext
, NFT_SET_EXT_EXPR
) &&
3422 nft_expr_dump(skb
, NFTA_SET_ELEM_EXPR
, nft_set_ext_expr(ext
)) < 0)
3423 goto nla_put_failure
;
3425 if (nft_set_ext_exists(ext
, NFT_SET_EXT_OBJREF
) &&
3426 nla_put_string(skb
, NFTA_SET_ELEM_OBJREF
,
3427 (*nft_set_ext_obj(ext
))->name
) < 0)
3428 goto nla_put_failure
;
3430 if (nft_set_ext_exists(ext
, NFT_SET_EXT_FLAGS
) &&
3431 nla_put_be32(skb
, NFTA_SET_ELEM_FLAGS
,
3432 htonl(*nft_set_ext_flags(ext
))))
3433 goto nla_put_failure
;
3435 if (nft_set_ext_exists(ext
, NFT_SET_EXT_TIMEOUT
) &&
3436 nla_put_be64(skb
, NFTA_SET_ELEM_TIMEOUT
,
3437 cpu_to_be64(jiffies_to_msecs(
3438 *nft_set_ext_timeout(ext
))),
3440 goto nla_put_failure
;
3442 if (nft_set_ext_exists(ext
, NFT_SET_EXT_EXPIRATION
)) {
3443 unsigned long expires
, now
= jiffies
;
3445 expires
= *nft_set_ext_expiration(ext
);
3446 if (time_before(now
, expires
))
3451 if (nla_put_be64(skb
, NFTA_SET_ELEM_EXPIRATION
,
3452 cpu_to_be64(jiffies_to_msecs(expires
)),
3454 goto nla_put_failure
;
3457 if (nft_set_ext_exists(ext
, NFT_SET_EXT_USERDATA
)) {
3458 struct nft_userdata
*udata
;
3460 udata
= nft_set_ext_userdata(ext
);
3461 if (nla_put(skb
, NFTA_SET_ELEM_USERDATA
,
3462 udata
->len
+ 1, udata
->data
))
3463 goto nla_put_failure
;
3466 nla_nest_end(skb
, nest
);
3474 struct nft_set_dump_args
{
3475 const struct netlink_callback
*cb
;
3476 struct nft_set_iter iter
;
3477 struct sk_buff
*skb
;
3480 static int nf_tables_dump_setelem(const struct nft_ctx
*ctx
,
3481 struct nft_set
*set
,
3482 const struct nft_set_iter
*iter
,
3483 struct nft_set_elem
*elem
)
3485 struct nft_set_dump_args
*args
;
3487 args
= container_of(iter
, struct nft_set_dump_args
, iter
);
3488 return nf_tables_fill_setelem(args
->skb
, set
, elem
);
3491 struct nft_set_dump_ctx
{
3492 const struct nft_set
*set
;
3496 static int nf_tables_dump_set(struct sk_buff
*skb
, struct netlink_callback
*cb
)
3498 struct nft_set_dump_ctx
*dump_ctx
= cb
->data
;
3499 struct net
*net
= sock_net(skb
->sk
);
3500 struct nft_af_info
*afi
;
3501 struct nft_table
*table
;
3502 struct nft_set
*set
;
3503 struct nft_set_dump_args args
;
3504 bool set_found
= false;
3505 struct nfgenmsg
*nfmsg
;
3506 struct nlmsghdr
*nlh
;
3507 struct nlattr
*nest
;
3512 list_for_each_entry_rcu(afi
, &net
->nft
.af_info
, list
) {
3513 if (afi
!= dump_ctx
->ctx
.afi
)
3516 list_for_each_entry_rcu(table
, &afi
->tables
, list
) {
3517 if (table
!= dump_ctx
->ctx
.table
)
3520 list_for_each_entry_rcu(set
, &table
->sets
, list
) {
3521 if (set
== dump_ctx
->set
) {
3536 event
= nfnl_msg_type(NFNL_SUBSYS_NFTABLES
, NFT_MSG_NEWSETELEM
);
3537 portid
= NETLINK_CB(cb
->skb
).portid
;
3538 seq
= cb
->nlh
->nlmsg_seq
;
3540 nlh
= nlmsg_put(skb
, portid
, seq
, event
, sizeof(struct nfgenmsg
),
3543 goto nla_put_failure
;
3545 nfmsg
= nlmsg_data(nlh
);
3546 nfmsg
->nfgen_family
= afi
->family
;
3547 nfmsg
->version
= NFNETLINK_V0
;
3548 nfmsg
->res_id
= htons(net
->nft
.base_seq
& 0xffff);
3550 if (nla_put_string(skb
, NFTA_SET_ELEM_LIST_TABLE
, table
->name
))
3551 goto nla_put_failure
;
3552 if (nla_put_string(skb
, NFTA_SET_ELEM_LIST_SET
, set
->name
))
3553 goto nla_put_failure
;
3555 nest
= nla_nest_start(skb
, NFTA_SET_ELEM_LIST_ELEMENTS
);
3557 goto nla_put_failure
;
3561 args
.iter
.genmask
= nft_genmask_cur(net
);
3562 args
.iter
.skip
= cb
->args
[0];
3563 args
.iter
.count
= 0;
3565 args
.iter
.fn
= nf_tables_dump_setelem
;
3566 set
->ops
->walk(&dump_ctx
->ctx
, set
, &args
.iter
);
3569 nla_nest_end(skb
, nest
);
3570 nlmsg_end(skb
, nlh
);
3572 if (args
.iter
.err
&& args
.iter
.err
!= -EMSGSIZE
)
3573 return args
.iter
.err
;
3574 if (args
.iter
.count
== cb
->args
[0])
3577 cb
->args
[0] = args
.iter
.count
;
3585 static int nf_tables_dump_set_done(struct netlink_callback
*cb
)
3591 static int nf_tables_fill_setelem_info(struct sk_buff
*skb
,
3592 const struct nft_ctx
*ctx
, u32 seq
,
3593 u32 portid
, int event
, u16 flags
,
3594 const struct nft_set
*set
,
3595 const struct nft_set_elem
*elem
)
3597 struct nfgenmsg
*nfmsg
;
3598 struct nlmsghdr
*nlh
;
3599 struct nlattr
*nest
;
3602 event
= nfnl_msg_type(NFNL_SUBSYS_NFTABLES
, event
);
3603 nlh
= nlmsg_put(skb
, portid
, seq
, event
, sizeof(struct nfgenmsg
),
3606 goto nla_put_failure
;
3608 nfmsg
= nlmsg_data(nlh
);
3609 nfmsg
->nfgen_family
= ctx
->afi
->family
;
3610 nfmsg
->version
= NFNETLINK_V0
;
3611 nfmsg
->res_id
= htons(ctx
->net
->nft
.base_seq
& 0xffff);
3613 if (nla_put_string(skb
, NFTA_SET_TABLE
, ctx
->table
->name
))
3614 goto nla_put_failure
;
3615 if (nla_put_string(skb
, NFTA_SET_NAME
, set
->name
))
3616 goto nla_put_failure
;
3618 nest
= nla_nest_start(skb
, NFTA_SET_ELEM_LIST_ELEMENTS
);
3620 goto nla_put_failure
;
3622 err
= nf_tables_fill_setelem(skb
, set
, elem
);
3624 goto nla_put_failure
;
3626 nla_nest_end(skb
, nest
);
3628 nlmsg_end(skb
, nlh
);
3632 nlmsg_trim(skb
, nlh
);
3636 static int nft_setelem_parse_flags(const struct nft_set
*set
,
3637 const struct nlattr
*attr
, u32
*flags
)
3642 *flags
= ntohl(nla_get_be32(attr
));
3643 if (*flags
& ~NFT_SET_ELEM_INTERVAL_END
)
3645 if (!(set
->flags
& NFT_SET_INTERVAL
) &&
3646 *flags
& NFT_SET_ELEM_INTERVAL_END
)
3652 static int nft_get_set_elem(struct nft_ctx
*ctx
, struct nft_set
*set
,
3653 const struct nlattr
*attr
)
3655 struct nlattr
*nla
[NFTA_SET_ELEM_MAX
+ 1];
3656 const struct nft_set_ext
*ext
;
3657 struct nft_data_desc desc
;
3658 struct nft_set_elem elem
;
3659 struct sk_buff
*skb
;
3664 err
= nla_parse_nested(nla
, NFTA_SET_ELEM_MAX
, attr
,
3665 nft_set_elem_policy
, NULL
);
3669 if (!nla
[NFTA_SET_ELEM_KEY
])
3672 err
= nft_setelem_parse_flags(set
, nla
[NFTA_SET_ELEM_FLAGS
], &flags
);
3676 err
= nft_data_init(ctx
, &elem
.key
.val
, sizeof(elem
.key
), &desc
,
3677 nla
[NFTA_SET_ELEM_KEY
]);
3682 if (desc
.type
!= NFT_DATA_VALUE
|| desc
.len
!= set
->klen
)
3685 priv
= set
->ops
->get(ctx
->net
, set
, &elem
, flags
);
3687 return PTR_ERR(priv
);
3690 ext
= nft_set_elem_ext(set
, &elem
);
3693 skb
= nlmsg_new(NLMSG_GOODSIZE
, GFP_KERNEL
);
3697 err
= nf_tables_fill_setelem_info(skb
, ctx
, ctx
->seq
, ctx
->portid
,
3698 NFT_MSG_NEWSETELEM
, 0, set
, &elem
);
3702 err
= nfnetlink_unicast(skb
, ctx
->net
, ctx
->portid
, MSG_DONTWAIT
);
3703 /* This avoids a loop in nfnetlink. */
3711 /* this avoids a loop in nfnetlink. */
3712 return err
== -EAGAIN
? -ENOBUFS
: err
;
3715 static int nf_tables_getsetelem(struct net
*net
, struct sock
*nlsk
,
3716 struct sk_buff
*skb
, const struct nlmsghdr
*nlh
,
3717 const struct nlattr
* const nla
[],
3718 struct netlink_ext_ack
*extack
)
3720 u8 genmask
= nft_genmask_cur(net
);
3721 struct nft_set
*set
;
3722 struct nlattr
*attr
;
3726 err
= nft_ctx_init_from_elemattr(&ctx
, net
, skb
, nlh
, nla
, genmask
);
3730 set
= nf_tables_set_lookup(ctx
.table
, nla
[NFTA_SET_ELEM_LIST_SET
],
3733 return PTR_ERR(set
);
3735 if (nlh
->nlmsg_flags
& NLM_F_DUMP
) {
3736 struct netlink_dump_control c
= {
3737 .dump
= nf_tables_dump_set
,
3738 .done
= nf_tables_dump_set_done
,
3740 struct nft_set_dump_ctx
*dump_ctx
;
3742 dump_ctx
= kmalloc(sizeof(*dump_ctx
), GFP_KERNEL
);
3746 dump_ctx
->set
= set
;
3747 dump_ctx
->ctx
= ctx
;
3750 return netlink_dump_start(nlsk
, skb
, nlh
, &c
);
3753 if (!nla
[NFTA_SET_ELEM_LIST_ELEMENTS
])
3756 nla_for_each_nested(attr
, nla
[NFTA_SET_ELEM_LIST_ELEMENTS
], rem
) {
3757 err
= nft_get_set_elem(&ctx
, set
, attr
);
3765 static void nf_tables_setelem_notify(const struct nft_ctx
*ctx
,
3766 const struct nft_set
*set
,
3767 const struct nft_set_elem
*elem
,
3768 int event
, u16 flags
)
3770 struct net
*net
= ctx
->net
;
3771 u32 portid
= ctx
->portid
;
3772 struct sk_buff
*skb
;
3775 if (!ctx
->report
&& !nfnetlink_has_listeners(net
, NFNLGRP_NFTABLES
))
3778 skb
= nlmsg_new(NLMSG_GOODSIZE
, GFP_KERNEL
);
3782 err
= nf_tables_fill_setelem_info(skb
, ctx
, 0, portid
, event
, flags
,
3789 nfnetlink_send(skb
, net
, portid
, NFNLGRP_NFTABLES
, ctx
->report
,
3793 nfnetlink_set_err(net
, portid
, NFNLGRP_NFTABLES
, -ENOBUFS
);
3796 static struct nft_trans
*nft_trans_elem_alloc(struct nft_ctx
*ctx
,
3798 struct nft_set
*set
)
3800 struct nft_trans
*trans
;
3802 trans
= nft_trans_alloc(ctx
, msg_type
, sizeof(struct nft_trans_elem
));
3806 nft_trans_elem_set(trans
) = set
;
3810 void *nft_set_elem_init(const struct nft_set
*set
,
3811 const struct nft_set_ext_tmpl
*tmpl
,
3812 const u32
*key
, const u32
*data
,
3813 u64 timeout
, gfp_t gfp
)
3815 struct nft_set_ext
*ext
;
3818 elem
= kzalloc(set
->ops
->elemsize
+ tmpl
->len
, gfp
);
3822 ext
= nft_set_elem_ext(set
, elem
);
3823 nft_set_ext_init(ext
, tmpl
);
3825 memcpy(nft_set_ext_key(ext
), key
, set
->klen
);
3826 if (nft_set_ext_exists(ext
, NFT_SET_EXT_DATA
))
3827 memcpy(nft_set_ext_data(ext
), data
, set
->dlen
);
3828 if (nft_set_ext_exists(ext
, NFT_SET_EXT_EXPIRATION
))
3829 *nft_set_ext_expiration(ext
) =
3831 if (nft_set_ext_exists(ext
, NFT_SET_EXT_TIMEOUT
))
3832 *nft_set_ext_timeout(ext
) = timeout
;
3837 void nft_set_elem_destroy(const struct nft_set
*set
, void *elem
,
3840 struct nft_set_ext
*ext
= nft_set_elem_ext(set
, elem
);
3842 nft_data_release(nft_set_ext_key(ext
), NFT_DATA_VALUE
);
3843 if (nft_set_ext_exists(ext
, NFT_SET_EXT_DATA
))
3844 nft_data_release(nft_set_ext_data(ext
), set
->dtype
);
3845 if (destroy_expr
&& nft_set_ext_exists(ext
, NFT_SET_EXT_EXPR
))
3846 nf_tables_expr_destroy(NULL
, nft_set_ext_expr(ext
));
3847 if (nft_set_ext_exists(ext
, NFT_SET_EXT_OBJREF
))
3848 (*nft_set_ext_obj(ext
))->use
--;
3851 EXPORT_SYMBOL_GPL(nft_set_elem_destroy
);
3853 /* Only called from commit path, nft_set_elem_deactivate() already deals with
3854 * the refcounting from the preparation phase.
3856 static void nf_tables_set_elem_destroy(const struct nft_set
*set
, void *elem
)
3858 struct nft_set_ext
*ext
= nft_set_elem_ext(set
, elem
);
3860 if (nft_set_ext_exists(ext
, NFT_SET_EXT_EXPR
))
3861 nf_tables_expr_destroy(NULL
, nft_set_ext_expr(ext
));
3865 static int nft_add_set_elem(struct nft_ctx
*ctx
, struct nft_set
*set
,
3866 const struct nlattr
*attr
, u32 nlmsg_flags
)
3868 struct nlattr
*nla
[NFTA_SET_ELEM_MAX
+ 1];
3869 u8 genmask
= nft_genmask_next(ctx
->net
);
3870 struct nft_data_desc d1
, d2
;
3871 struct nft_set_ext_tmpl tmpl
;
3872 struct nft_set_ext
*ext
, *ext2
;
3873 struct nft_set_elem elem
;
3874 struct nft_set_binding
*binding
;
3875 struct nft_object
*obj
= NULL
;
3876 struct nft_userdata
*udata
;
3877 struct nft_data data
;
3878 enum nft_registers dreg
;
3879 struct nft_trans
*trans
;
3885 err
= nla_parse_nested(nla
, NFTA_SET_ELEM_MAX
, attr
,
3886 nft_set_elem_policy
, NULL
);
3890 if (nla
[NFTA_SET_ELEM_KEY
] == NULL
)
3893 nft_set_ext_prepare(&tmpl
);
3895 err
= nft_setelem_parse_flags(set
, nla
[NFTA_SET_ELEM_FLAGS
], &flags
);
3899 nft_set_ext_add(&tmpl
, NFT_SET_EXT_FLAGS
);
3901 if (set
->flags
& NFT_SET_MAP
) {
3902 if (nla
[NFTA_SET_ELEM_DATA
] == NULL
&&
3903 !(flags
& NFT_SET_ELEM_INTERVAL_END
))
3905 if (nla
[NFTA_SET_ELEM_DATA
] != NULL
&&
3906 flags
& NFT_SET_ELEM_INTERVAL_END
)
3909 if (nla
[NFTA_SET_ELEM_DATA
] != NULL
)
3914 if (nla
[NFTA_SET_ELEM_TIMEOUT
] != NULL
) {
3915 if (!(set
->flags
& NFT_SET_TIMEOUT
))
3917 timeout
= msecs_to_jiffies(be64_to_cpu(nla_get_be64(
3918 nla
[NFTA_SET_ELEM_TIMEOUT
])));
3919 } else if (set
->flags
& NFT_SET_TIMEOUT
) {
3920 timeout
= set
->timeout
;
3923 err
= nft_data_init(ctx
, &elem
.key
.val
, sizeof(elem
.key
), &d1
,
3924 nla
[NFTA_SET_ELEM_KEY
]);
3928 if (d1
.type
!= NFT_DATA_VALUE
|| d1
.len
!= set
->klen
)
3931 nft_set_ext_add_length(&tmpl
, NFT_SET_EXT_KEY
, d1
.len
);
3933 nft_set_ext_add(&tmpl
, NFT_SET_EXT_EXPIRATION
);
3934 if (timeout
!= set
->timeout
)
3935 nft_set_ext_add(&tmpl
, NFT_SET_EXT_TIMEOUT
);
3938 if (nla
[NFTA_SET_ELEM_OBJREF
] != NULL
) {
3939 if (!(set
->flags
& NFT_SET_OBJECT
)) {
3943 obj
= nf_tables_obj_lookup(ctx
->table
, nla
[NFTA_SET_ELEM_OBJREF
],
3944 set
->objtype
, genmask
);
3949 nft_set_ext_add(&tmpl
, NFT_SET_EXT_OBJREF
);
3952 if (nla
[NFTA_SET_ELEM_DATA
] != NULL
) {
3953 err
= nft_data_init(ctx
, &data
, sizeof(data
), &d2
,
3954 nla
[NFTA_SET_ELEM_DATA
]);
3959 if (set
->dtype
!= NFT_DATA_VERDICT
&& d2
.len
!= set
->dlen
)
3962 dreg
= nft_type_to_reg(set
->dtype
);
3963 list_for_each_entry(binding
, &set
->bindings
, list
) {
3964 struct nft_ctx bind_ctx
= {
3967 .table
= ctx
->table
,
3968 .chain
= (struct nft_chain
*)binding
->chain
,
3971 if (!(binding
->flags
& NFT_SET_MAP
))
3974 err
= nft_validate_register_store(&bind_ctx
, dreg
,
3981 nft_set_ext_add_length(&tmpl
, NFT_SET_EXT_DATA
, d2
.len
);
3984 /* The full maximum length of userdata can exceed the maximum
3985 * offset value (U8_MAX) for following extensions, therefore it
3986 * must be the last extension added.
3989 if (nla
[NFTA_SET_ELEM_USERDATA
] != NULL
) {
3990 ulen
= nla_len(nla
[NFTA_SET_ELEM_USERDATA
]);
3992 nft_set_ext_add_length(&tmpl
, NFT_SET_EXT_USERDATA
,
3997 elem
.priv
= nft_set_elem_init(set
, &tmpl
, elem
.key
.val
.data
, data
.data
,
3998 timeout
, GFP_KERNEL
);
3999 if (elem
.priv
== NULL
)
4002 ext
= nft_set_elem_ext(set
, elem
.priv
);
4004 *nft_set_ext_flags(ext
) = flags
;
4006 udata
= nft_set_ext_userdata(ext
);
4007 udata
->len
= ulen
- 1;
4008 nla_memcpy(&udata
->data
, nla
[NFTA_SET_ELEM_USERDATA
], ulen
);
4011 *nft_set_ext_obj(ext
) = obj
;
4015 trans
= nft_trans_elem_alloc(ctx
, NFT_MSG_NEWSETELEM
, set
);
4019 ext
->genmask
= nft_genmask_cur(ctx
->net
) | NFT_SET_ELEM_BUSY_MASK
;
4020 err
= set
->ops
->insert(ctx
->net
, set
, &elem
, &ext2
);
4022 if (err
== -EEXIST
) {
4023 if (nft_set_ext_exists(ext
, NFT_SET_EXT_DATA
) ^
4024 nft_set_ext_exists(ext2
, NFT_SET_EXT_DATA
) ||
4025 nft_set_ext_exists(ext
, NFT_SET_EXT_OBJREF
) ^
4026 nft_set_ext_exists(ext2
, NFT_SET_EXT_OBJREF
))
4028 if ((nft_set_ext_exists(ext
, NFT_SET_EXT_DATA
) &&
4029 nft_set_ext_exists(ext2
, NFT_SET_EXT_DATA
) &&
4030 memcmp(nft_set_ext_data(ext
),
4031 nft_set_ext_data(ext2
), set
->dlen
) != 0) ||
4032 (nft_set_ext_exists(ext
, NFT_SET_EXT_OBJREF
) &&
4033 nft_set_ext_exists(ext2
, NFT_SET_EXT_OBJREF
) &&
4034 *nft_set_ext_obj(ext
) != *nft_set_ext_obj(ext2
)))
4036 else if (!(nlmsg_flags
& NLM_F_EXCL
))
4043 !atomic_add_unless(&set
->nelems
, 1, set
->size
+ set
->ndeact
)) {
4048 nft_trans_elem(trans
) = elem
;
4049 list_add_tail(&trans
->list
, &ctx
->net
->nft
.commit_list
);
4053 set
->ops
->remove(ctx
->net
, set
, &elem
);
4059 if (nla
[NFTA_SET_ELEM_DATA
] != NULL
)
4060 nft_data_release(&data
, d2
.type
);
4062 nft_data_release(&elem
.key
.val
, d1
.type
);
4067 static int nf_tables_newsetelem(struct net
*net
, struct sock
*nlsk
,
4068 struct sk_buff
*skb
, const struct nlmsghdr
*nlh
,
4069 const struct nlattr
* const nla
[],
4070 struct netlink_ext_ack
*extack
)
4072 u8 genmask
= nft_genmask_next(net
);
4073 const struct nlattr
*attr
;
4074 struct nft_set
*set
;
4078 if (nla
[NFTA_SET_ELEM_LIST_ELEMENTS
] == NULL
)
4081 err
= nft_ctx_init_from_elemattr(&ctx
, net
, skb
, nlh
, nla
, genmask
);
4085 set
= nf_tables_set_lookup(ctx
.table
, nla
[NFTA_SET_ELEM_LIST_SET
],
4088 if (nla
[NFTA_SET_ELEM_LIST_SET_ID
]) {
4089 set
= nf_tables_set_lookup_byid(net
,
4090 nla
[NFTA_SET_ELEM_LIST_SET_ID
],
4094 return PTR_ERR(set
);
4097 if (!list_empty(&set
->bindings
) && set
->flags
& NFT_SET_CONSTANT
)
4100 nla_for_each_nested(attr
, nla
[NFTA_SET_ELEM_LIST_ELEMENTS
], rem
) {
4101 err
= nft_add_set_elem(&ctx
, set
, attr
, nlh
->nlmsg_flags
);
4109 * nft_data_hold - hold a nft_data item
4111 * @data: struct nft_data to hold
4112 * @type: type of data
4114 * Hold a nft_data item. NFT_DATA_VALUE types can be silently discarded,
4115 * NFT_DATA_VERDICT bumps the reference to chains in case of NFT_JUMP and
4116 * NFT_GOTO verdicts. This function must be called on active data objects
4117 * from the second phase of the commit protocol.
4119 static void nft_data_hold(const struct nft_data
*data
, enum nft_data_types type
)
4121 if (type
== NFT_DATA_VERDICT
) {
4122 switch (data
->verdict
.code
) {
4125 data
->verdict
.chain
->use
++;
4131 static void nft_set_elem_activate(const struct net
*net
,
4132 const struct nft_set
*set
,
4133 struct nft_set_elem
*elem
)
4135 const struct nft_set_ext
*ext
= nft_set_elem_ext(set
, elem
->priv
);
4137 if (nft_set_ext_exists(ext
, NFT_SET_EXT_DATA
))
4138 nft_data_hold(nft_set_ext_data(ext
), set
->dtype
);
4139 if (nft_set_ext_exists(ext
, NFT_SET_EXT_OBJREF
))
4140 (*nft_set_ext_obj(ext
))->use
++;
4143 static void nft_set_elem_deactivate(const struct net
*net
,
4144 const struct nft_set
*set
,
4145 struct nft_set_elem
*elem
)
4147 const struct nft_set_ext
*ext
= nft_set_elem_ext(set
, elem
->priv
);
4149 if (nft_set_ext_exists(ext
, NFT_SET_EXT_DATA
))
4150 nft_data_release(nft_set_ext_data(ext
), set
->dtype
);
4151 if (nft_set_ext_exists(ext
, NFT_SET_EXT_OBJREF
))
4152 (*nft_set_ext_obj(ext
))->use
--;
4155 static int nft_del_setelem(struct nft_ctx
*ctx
, struct nft_set
*set
,
4156 const struct nlattr
*attr
)
4158 struct nlattr
*nla
[NFTA_SET_ELEM_MAX
+ 1];
4159 struct nft_set_ext_tmpl tmpl
;
4160 struct nft_data_desc desc
;
4161 struct nft_set_elem elem
;
4162 struct nft_set_ext
*ext
;
4163 struct nft_trans
*trans
;
4168 err
= nla_parse_nested(nla
, NFTA_SET_ELEM_MAX
, attr
,
4169 nft_set_elem_policy
, NULL
);
4174 if (nla
[NFTA_SET_ELEM_KEY
] == NULL
)
4177 nft_set_ext_prepare(&tmpl
);
4179 err
= nft_setelem_parse_flags(set
, nla
[NFTA_SET_ELEM_FLAGS
], &flags
);
4183 nft_set_ext_add(&tmpl
, NFT_SET_EXT_FLAGS
);
4185 err
= nft_data_init(ctx
, &elem
.key
.val
, sizeof(elem
.key
), &desc
,
4186 nla
[NFTA_SET_ELEM_KEY
]);
4191 if (desc
.type
!= NFT_DATA_VALUE
|| desc
.len
!= set
->klen
)
4194 nft_set_ext_add_length(&tmpl
, NFT_SET_EXT_KEY
, desc
.len
);
4197 elem
.priv
= nft_set_elem_init(set
, &tmpl
, elem
.key
.val
.data
, NULL
, 0,
4199 if (elem
.priv
== NULL
)
4202 ext
= nft_set_elem_ext(set
, elem
.priv
);
4204 *nft_set_ext_flags(ext
) = flags
;
4206 trans
= nft_trans_elem_alloc(ctx
, NFT_MSG_DELSETELEM
, set
);
4207 if (trans
== NULL
) {
4212 priv
= set
->ops
->deactivate(ctx
->net
, set
, &elem
);
4220 nft_set_elem_deactivate(ctx
->net
, set
, &elem
);
4222 nft_trans_elem(trans
) = elem
;
4223 list_add_tail(&trans
->list
, &ctx
->net
->nft
.commit_list
);
4231 nft_data_release(&elem
.key
.val
, desc
.type
);
4236 static int nft_flush_set(const struct nft_ctx
*ctx
,
4237 struct nft_set
*set
,
4238 const struct nft_set_iter
*iter
,
4239 struct nft_set_elem
*elem
)
4241 struct nft_trans
*trans
;
4244 trans
= nft_trans_alloc_gfp(ctx
, NFT_MSG_DELSETELEM
,
4245 sizeof(struct nft_trans_elem
), GFP_ATOMIC
);
4249 if (!set
->ops
->flush(ctx
->net
, set
, elem
->priv
)) {
4255 nft_trans_elem_set(trans
) = set
;
4256 nft_trans_elem(trans
) = *elem
;
4257 list_add_tail(&trans
->list
, &ctx
->net
->nft
.commit_list
);
4265 static int nf_tables_delsetelem(struct net
*net
, struct sock
*nlsk
,
4266 struct sk_buff
*skb
, const struct nlmsghdr
*nlh
,
4267 const struct nlattr
* const nla
[],
4268 struct netlink_ext_ack
*extack
)
4270 u8 genmask
= nft_genmask_next(net
);
4271 const struct nlattr
*attr
;
4272 struct nft_set
*set
;
4276 err
= nft_ctx_init_from_elemattr(&ctx
, net
, skb
, nlh
, nla
, genmask
);
4280 set
= nf_tables_set_lookup(ctx
.table
, nla
[NFTA_SET_ELEM_LIST_SET
],
4283 return PTR_ERR(set
);
4284 if (!list_empty(&set
->bindings
) && set
->flags
& NFT_SET_CONSTANT
)
4287 if (nla
[NFTA_SET_ELEM_LIST_ELEMENTS
] == NULL
) {
4288 struct nft_set_iter iter
= {
4290 .fn
= nft_flush_set
,
4292 set
->ops
->walk(&ctx
, set
, &iter
);
4297 nla_for_each_nested(attr
, nla
[NFTA_SET_ELEM_LIST_ELEMENTS
], rem
) {
4298 err
= nft_del_setelem(&ctx
, set
, attr
);
4307 void nft_set_gc_batch_release(struct rcu_head
*rcu
)
4309 struct nft_set_gc_batch
*gcb
;
4312 gcb
= container_of(rcu
, struct nft_set_gc_batch
, head
.rcu
);
4313 for (i
= 0; i
< gcb
->head
.cnt
; i
++)
4314 nft_set_elem_destroy(gcb
->head
.set
, gcb
->elems
[i
], true);
4317 EXPORT_SYMBOL_GPL(nft_set_gc_batch_release
);
4319 struct nft_set_gc_batch
*nft_set_gc_batch_alloc(const struct nft_set
*set
,
4322 struct nft_set_gc_batch
*gcb
;
4324 gcb
= kzalloc(sizeof(*gcb
), gfp
);
4327 gcb
->head
.set
= set
;
4330 EXPORT_SYMBOL_GPL(nft_set_gc_batch_alloc
);
4337 * nft_register_obj - register nf_tables stateful object type
4340 * Registers the object type for use with nf_tables. Returns zero on
4341 * success or a negative errno code otherwise.
4343 int nft_register_obj(struct nft_object_type
*obj_type
)
4345 if (obj_type
->type
== NFT_OBJECT_UNSPEC
)
4348 nfnl_lock(NFNL_SUBSYS_NFTABLES
);
4349 list_add_rcu(&obj_type
->list
, &nf_tables_objects
);
4350 nfnl_unlock(NFNL_SUBSYS_NFTABLES
);
4353 EXPORT_SYMBOL_GPL(nft_register_obj
);
4356 * nft_unregister_obj - unregister nf_tables object type
4359 * Unregisters the object type for use with nf_tables.
4361 void nft_unregister_obj(struct nft_object_type
*obj_type
)
4363 nfnl_lock(NFNL_SUBSYS_NFTABLES
);
4364 list_del_rcu(&obj_type
->list
);
4365 nfnl_unlock(NFNL_SUBSYS_NFTABLES
);
4367 EXPORT_SYMBOL_GPL(nft_unregister_obj
);
4369 struct nft_object
*nf_tables_obj_lookup(const struct nft_table
*table
,
4370 const struct nlattr
*nla
,
4371 u32 objtype
, u8 genmask
)
4373 struct nft_object
*obj
;
4375 list_for_each_entry(obj
, &table
->objects
, list
) {
4376 if (!nla_strcmp(nla
, obj
->name
) &&
4377 objtype
== obj
->ops
->type
->type
&&
4378 nft_active_genmask(obj
, genmask
))
4381 return ERR_PTR(-ENOENT
);
4383 EXPORT_SYMBOL_GPL(nf_tables_obj_lookup
);
4385 static const struct nla_policy nft_obj_policy
[NFTA_OBJ_MAX
+ 1] = {
4386 [NFTA_OBJ_TABLE
] = { .type
= NLA_STRING
,
4387 .len
= NFT_TABLE_MAXNAMELEN
- 1 },
4388 [NFTA_OBJ_NAME
] = { .type
= NLA_STRING
,
4389 .len
= NFT_OBJ_MAXNAMELEN
- 1 },
4390 [NFTA_OBJ_TYPE
] = { .type
= NLA_U32
},
4391 [NFTA_OBJ_DATA
] = { .type
= NLA_NESTED
},
4394 static struct nft_object
*nft_obj_init(const struct nft_ctx
*ctx
,
4395 const struct nft_object_type
*type
,
4396 const struct nlattr
*attr
)
4398 struct nlattr
*tb
[type
->maxattr
+ 1];
4399 const struct nft_object_ops
*ops
;
4400 struct nft_object
*obj
;
4404 err
= nla_parse_nested(tb
, type
->maxattr
, attr
, type
->policy
,
4409 memset(tb
, 0, sizeof(tb
[0]) * (type
->maxattr
+ 1));
4412 if (type
->select_ops
) {
4413 ops
= type
->select_ops(ctx
, (const struct nlattr
* const *)tb
);
4423 obj
= kzalloc(sizeof(*obj
) + ops
->size
, GFP_KERNEL
);
4427 err
= ops
->init(ctx
, (const struct nlattr
* const *)tb
, obj
);
4437 return ERR_PTR(err
);
4440 static int nft_object_dump(struct sk_buff
*skb
, unsigned int attr
,
4441 struct nft_object
*obj
, bool reset
)
4443 struct nlattr
*nest
;
4445 nest
= nla_nest_start(skb
, attr
);
4447 goto nla_put_failure
;
4448 if (obj
->ops
->dump(skb
, obj
, reset
) < 0)
4449 goto nla_put_failure
;
4450 nla_nest_end(skb
, nest
);
4457 static const struct nft_object_type
*__nft_obj_type_get(u32 objtype
)
4459 const struct nft_object_type
*type
;
4461 list_for_each_entry(type
, &nf_tables_objects
, list
) {
4462 if (objtype
== type
->type
)
4468 static const struct nft_object_type
*nft_obj_type_get(u32 objtype
)
4470 const struct nft_object_type
*type
;
4472 type
= __nft_obj_type_get(objtype
);
4473 if (type
!= NULL
&& try_module_get(type
->owner
))
4476 #ifdef CONFIG_MODULES
4478 nfnl_unlock(NFNL_SUBSYS_NFTABLES
);
4479 request_module("nft-obj-%u", objtype
);
4480 nfnl_lock(NFNL_SUBSYS_NFTABLES
);
4481 if (__nft_obj_type_get(objtype
))
4482 return ERR_PTR(-EAGAIN
);
4485 return ERR_PTR(-ENOENT
);
4488 static int nf_tables_newobj(struct net
*net
, struct sock
*nlsk
,
4489 struct sk_buff
*skb
, const struct nlmsghdr
*nlh
,
4490 const struct nlattr
* const nla
[],
4491 struct netlink_ext_ack
*extack
)
4493 const struct nfgenmsg
*nfmsg
= nlmsg_data(nlh
);
4494 const struct nft_object_type
*type
;
4495 u8 genmask
= nft_genmask_next(net
);
4496 int family
= nfmsg
->nfgen_family
;
4497 struct nft_af_info
*afi
;
4498 struct nft_table
*table
;
4499 struct nft_object
*obj
;
4504 if (!nla
[NFTA_OBJ_TYPE
] ||
4505 !nla
[NFTA_OBJ_NAME
] ||
4506 !nla
[NFTA_OBJ_DATA
])
4509 afi
= nf_tables_afinfo_lookup(net
, family
, true);
4511 return PTR_ERR(afi
);
4513 table
= nf_tables_table_lookup(afi
, nla
[NFTA_OBJ_TABLE
], genmask
);
4515 return PTR_ERR(table
);
4517 objtype
= ntohl(nla_get_be32(nla
[NFTA_OBJ_TYPE
]));
4518 obj
= nf_tables_obj_lookup(table
, nla
[NFTA_OBJ_NAME
], objtype
, genmask
);
4525 if (nlh
->nlmsg_flags
& NLM_F_EXCL
)
4531 nft_ctx_init(&ctx
, net
, skb
, nlh
, afi
, table
, NULL
, nla
);
4533 type
= nft_obj_type_get(objtype
);
4535 return PTR_ERR(type
);
4537 obj
= nft_obj_init(&ctx
, type
, nla
[NFTA_OBJ_DATA
]);
4543 obj
->name
= nla_strdup(nla
[NFTA_OBJ_NAME
], GFP_KERNEL
);
4549 err
= nft_trans_obj_add(&ctx
, NFT_MSG_NEWOBJ
, obj
);
4553 list_add_tail_rcu(&obj
->list
, &table
->objects
);
4559 if (obj
->ops
->destroy
)
4560 obj
->ops
->destroy(obj
);
4563 module_put(type
->owner
);
4567 static int nf_tables_fill_obj_info(struct sk_buff
*skb
, struct net
*net
,
4568 u32 portid
, u32 seq
, int event
, u32 flags
,
4569 int family
, const struct nft_table
*table
,
4570 struct nft_object
*obj
, bool reset
)
4572 struct nfgenmsg
*nfmsg
;
4573 struct nlmsghdr
*nlh
;
4575 event
= nfnl_msg_type(NFNL_SUBSYS_NFTABLES
, event
);
4576 nlh
= nlmsg_put(skb
, portid
, seq
, event
, sizeof(struct nfgenmsg
), flags
);
4578 goto nla_put_failure
;
4580 nfmsg
= nlmsg_data(nlh
);
4581 nfmsg
->nfgen_family
= family
;
4582 nfmsg
->version
= NFNETLINK_V0
;
4583 nfmsg
->res_id
= htons(net
->nft
.base_seq
& 0xffff);
4585 if (nla_put_string(skb
, NFTA_OBJ_TABLE
, table
->name
) ||
4586 nla_put_string(skb
, NFTA_OBJ_NAME
, obj
->name
) ||
4587 nla_put_be32(skb
, NFTA_OBJ_TYPE
, htonl(obj
->ops
->type
->type
)) ||
4588 nla_put_be32(skb
, NFTA_OBJ_USE
, htonl(obj
->use
)) ||
4589 nft_object_dump(skb
, NFTA_OBJ_DATA
, obj
, reset
))
4590 goto nla_put_failure
;
4592 nlmsg_end(skb
, nlh
);
4596 nlmsg_trim(skb
, nlh
);
4600 struct nft_obj_filter
{
4605 static int nf_tables_dump_obj(struct sk_buff
*skb
, struct netlink_callback
*cb
)
4607 const struct nfgenmsg
*nfmsg
= nlmsg_data(cb
->nlh
);
4608 const struct nft_af_info
*afi
;
4609 const struct nft_table
*table
;
4610 unsigned int idx
= 0, s_idx
= cb
->args
[0];
4611 struct nft_obj_filter
*filter
= cb
->data
;
4612 struct net
*net
= sock_net(skb
->sk
);
4613 int family
= nfmsg
->nfgen_family
;
4614 struct nft_object
*obj
;
4617 if (NFNL_MSG_TYPE(cb
->nlh
->nlmsg_type
) == NFT_MSG_GETOBJ_RESET
)
4621 cb
->seq
= net
->nft
.base_seq
;
4623 list_for_each_entry_rcu(afi
, &net
->nft
.af_info
, list
) {
4624 if (family
!= NFPROTO_UNSPEC
&& family
!= afi
->family
)
4627 list_for_each_entry_rcu(table
, &afi
->tables
, list
) {
4628 list_for_each_entry_rcu(obj
, &table
->objects
, list
) {
4629 if (!nft_is_active(net
, obj
))
4634 memset(&cb
->args
[1], 0,
4635 sizeof(cb
->args
) - sizeof(cb
->args
[0]));
4636 if (filter
&& filter
->table
[0] &&
4637 strcmp(filter
->table
, table
->name
))
4640 filter
->type
!= NFT_OBJECT_UNSPEC
&&
4641 obj
->ops
->type
->type
!= filter
->type
)
4644 if (nf_tables_fill_obj_info(skb
, net
, NETLINK_CB(cb
->skb
).portid
,
4647 NLM_F_MULTI
| NLM_F_APPEND
,
4648 afi
->family
, table
, obj
, reset
) < 0)
4651 nl_dump_check_consistent(cb
, nlmsg_hdr(skb
));
4664 static int nf_tables_dump_obj_done(struct netlink_callback
*cb
)
4666 struct nft_obj_filter
*filter
= cb
->data
;
4668 kfree(filter
->table
);
4674 static struct nft_obj_filter
*
4675 nft_obj_filter_alloc(const struct nlattr
* const nla
[])
4677 struct nft_obj_filter
*filter
;
4679 filter
= kzalloc(sizeof(*filter
), GFP_KERNEL
);
4681 return ERR_PTR(-ENOMEM
);
4683 if (nla
[NFTA_OBJ_TABLE
]) {
4684 filter
->table
= nla_strdup(nla
[NFTA_OBJ_TABLE
], GFP_KERNEL
);
4685 if (!filter
->table
) {
4687 return ERR_PTR(-ENOMEM
);
4690 if (nla
[NFTA_OBJ_TYPE
])
4691 filter
->type
= ntohl(nla_get_be32(nla
[NFTA_OBJ_TYPE
]));
4696 static int nf_tables_getobj(struct net
*net
, struct sock
*nlsk
,
4697 struct sk_buff
*skb
, const struct nlmsghdr
*nlh
,
4698 const struct nlattr
* const nla
[],
4699 struct netlink_ext_ack
*extack
)
4701 const struct nfgenmsg
*nfmsg
= nlmsg_data(nlh
);
4702 u8 genmask
= nft_genmask_cur(net
);
4703 int family
= nfmsg
->nfgen_family
;
4704 const struct nft_af_info
*afi
;
4705 const struct nft_table
*table
;
4706 struct nft_object
*obj
;
4707 struct sk_buff
*skb2
;
4712 if (nlh
->nlmsg_flags
& NLM_F_DUMP
) {
4713 struct netlink_dump_control c
= {
4714 .dump
= nf_tables_dump_obj
,
4715 .done
= nf_tables_dump_obj_done
,
4718 if (nla
[NFTA_OBJ_TABLE
] ||
4719 nla
[NFTA_OBJ_TYPE
]) {
4720 struct nft_obj_filter
*filter
;
4722 filter
= nft_obj_filter_alloc(nla
);
4728 return netlink_dump_start(nlsk
, skb
, nlh
, &c
);
4731 if (!nla
[NFTA_OBJ_NAME
] ||
4732 !nla
[NFTA_OBJ_TYPE
])
4735 afi
= nf_tables_afinfo_lookup(net
, family
, false);
4737 return PTR_ERR(afi
);
4739 table
= nf_tables_table_lookup(afi
, nla
[NFTA_OBJ_TABLE
], genmask
);
4741 return PTR_ERR(table
);
4743 objtype
= ntohl(nla_get_be32(nla
[NFTA_OBJ_TYPE
]));
4744 obj
= nf_tables_obj_lookup(table
, nla
[NFTA_OBJ_NAME
], objtype
, genmask
);
4746 return PTR_ERR(obj
);
4748 skb2
= alloc_skb(NLMSG_GOODSIZE
, GFP_KERNEL
);
4752 if (NFNL_MSG_TYPE(nlh
->nlmsg_type
) == NFT_MSG_GETOBJ_RESET
)
4755 err
= nf_tables_fill_obj_info(skb2
, net
, NETLINK_CB(skb
).portid
,
4756 nlh
->nlmsg_seq
, NFT_MSG_NEWOBJ
, 0,
4757 family
, table
, obj
, reset
);
4761 return nlmsg_unicast(nlsk
, skb2
, NETLINK_CB(skb
).portid
);
4767 static void nft_obj_destroy(struct nft_object
*obj
)
4769 if (obj
->ops
->destroy
)
4770 obj
->ops
->destroy(obj
);
4772 module_put(obj
->ops
->type
->owner
);
4777 static int nf_tables_delobj(struct net
*net
, struct sock
*nlsk
,
4778 struct sk_buff
*skb
, const struct nlmsghdr
*nlh
,
4779 const struct nlattr
* const nla
[],
4780 struct netlink_ext_ack
*extack
)
4782 const struct nfgenmsg
*nfmsg
= nlmsg_data(nlh
);
4783 u8 genmask
= nft_genmask_next(net
);
4784 int family
= nfmsg
->nfgen_family
;
4785 struct nft_af_info
*afi
;
4786 struct nft_table
*table
;
4787 struct nft_object
*obj
;
4791 if (!nla
[NFTA_OBJ_TYPE
] ||
4792 !nla
[NFTA_OBJ_NAME
])
4795 afi
= nf_tables_afinfo_lookup(net
, family
, true);
4797 return PTR_ERR(afi
);
4799 table
= nf_tables_table_lookup(afi
, nla
[NFTA_OBJ_TABLE
], genmask
);
4801 return PTR_ERR(table
);
4803 objtype
= ntohl(nla_get_be32(nla
[NFTA_OBJ_TYPE
]));
4804 obj
= nf_tables_obj_lookup(table
, nla
[NFTA_OBJ_NAME
], objtype
, genmask
);
4806 return PTR_ERR(obj
);
4810 nft_ctx_init(&ctx
, net
, skb
, nlh
, afi
, table
, NULL
, nla
);
4812 return nft_delobj(&ctx
, obj
);
4815 void nft_obj_notify(struct net
*net
, struct nft_table
*table
,
4816 struct nft_object
*obj
, u32 portid
, u32 seq
, int event
,
4817 int family
, int report
, gfp_t gfp
)
4819 struct sk_buff
*skb
;
4823 !nfnetlink_has_listeners(net
, NFNLGRP_NFTABLES
))
4826 skb
= nlmsg_new(NLMSG_GOODSIZE
, gfp
);
4830 err
= nf_tables_fill_obj_info(skb
, net
, portid
, seq
, event
, 0, family
,
4837 nfnetlink_send(skb
, net
, portid
, NFNLGRP_NFTABLES
, report
, gfp
);
4840 nfnetlink_set_err(net
, portid
, NFNLGRP_NFTABLES
, -ENOBUFS
);
4842 EXPORT_SYMBOL_GPL(nft_obj_notify
);
4844 static void nf_tables_obj_notify(const struct nft_ctx
*ctx
,
4845 struct nft_object
*obj
, int event
)
4847 nft_obj_notify(ctx
->net
, ctx
->table
, obj
, ctx
->portid
, ctx
->seq
, event
,
4848 ctx
->afi
->family
, ctx
->report
, GFP_KERNEL
);
4851 static int nf_tables_fill_gen_info(struct sk_buff
*skb
, struct net
*net
,
4852 u32 portid
, u32 seq
)
4854 struct nlmsghdr
*nlh
;
4855 struct nfgenmsg
*nfmsg
;
4856 char buf
[TASK_COMM_LEN
];
4857 int event
= nfnl_msg_type(NFNL_SUBSYS_NFTABLES
, NFT_MSG_NEWGEN
);
4859 nlh
= nlmsg_put(skb
, portid
, seq
, event
, sizeof(struct nfgenmsg
), 0);
4861 goto nla_put_failure
;
4863 nfmsg
= nlmsg_data(nlh
);
4864 nfmsg
->nfgen_family
= AF_UNSPEC
;
4865 nfmsg
->version
= NFNETLINK_V0
;
4866 nfmsg
->res_id
= htons(net
->nft
.base_seq
& 0xffff);
4868 if (nla_put_be32(skb
, NFTA_GEN_ID
, htonl(net
->nft
.base_seq
)) ||
4869 nla_put_be32(skb
, NFTA_GEN_PROC_PID
, htonl(task_pid_nr(current
))) ||
4870 nla_put_string(skb
, NFTA_GEN_PROC_NAME
, get_task_comm(buf
, current
)))
4871 goto nla_put_failure
;
4873 nlmsg_end(skb
, nlh
);
4877 nlmsg_trim(skb
, nlh
);
4881 static void nf_tables_gen_notify(struct net
*net
, struct sk_buff
*skb
,
4884 struct nlmsghdr
*nlh
= nlmsg_hdr(skb
);
4885 struct sk_buff
*skb2
;
4888 if (nlmsg_report(nlh
) &&
4889 !nfnetlink_has_listeners(net
, NFNLGRP_NFTABLES
))
4892 skb2
= nlmsg_new(NLMSG_GOODSIZE
, GFP_KERNEL
);
4896 err
= nf_tables_fill_gen_info(skb2
, net
, NETLINK_CB(skb
).portid
,
4903 nfnetlink_send(skb2
, net
, NETLINK_CB(skb
).portid
, NFNLGRP_NFTABLES
,
4904 nlmsg_report(nlh
), GFP_KERNEL
);
4907 nfnetlink_set_err(net
, NETLINK_CB(skb
).portid
, NFNLGRP_NFTABLES
,
4911 static int nf_tables_getgen(struct net
*net
, struct sock
*nlsk
,
4912 struct sk_buff
*skb
, const struct nlmsghdr
*nlh
,
4913 const struct nlattr
* const nla
[],
4914 struct netlink_ext_ack
*extack
)
4916 struct sk_buff
*skb2
;
4919 skb2
= alloc_skb(NLMSG_GOODSIZE
, GFP_KERNEL
);
4923 err
= nf_tables_fill_gen_info(skb2
, net
, NETLINK_CB(skb
).portid
,
4928 return nlmsg_unicast(nlsk
, skb2
, NETLINK_CB(skb
).portid
);
4934 static const struct nfnl_callback nf_tables_cb
[NFT_MSG_MAX
] = {
4935 [NFT_MSG_NEWTABLE
] = {
4936 .call_batch
= nf_tables_newtable
,
4937 .attr_count
= NFTA_TABLE_MAX
,
4938 .policy
= nft_table_policy
,
4940 [NFT_MSG_GETTABLE
] = {
4941 .call
= nf_tables_gettable
,
4942 .attr_count
= NFTA_TABLE_MAX
,
4943 .policy
= nft_table_policy
,
4945 [NFT_MSG_DELTABLE
] = {
4946 .call_batch
= nf_tables_deltable
,
4947 .attr_count
= NFTA_TABLE_MAX
,
4948 .policy
= nft_table_policy
,
4950 [NFT_MSG_NEWCHAIN
] = {
4951 .call_batch
= nf_tables_newchain
,
4952 .attr_count
= NFTA_CHAIN_MAX
,
4953 .policy
= nft_chain_policy
,
4955 [NFT_MSG_GETCHAIN
] = {
4956 .call
= nf_tables_getchain
,
4957 .attr_count
= NFTA_CHAIN_MAX
,
4958 .policy
= nft_chain_policy
,
4960 [NFT_MSG_DELCHAIN
] = {
4961 .call_batch
= nf_tables_delchain
,
4962 .attr_count
= NFTA_CHAIN_MAX
,
4963 .policy
= nft_chain_policy
,
4965 [NFT_MSG_NEWRULE
] = {
4966 .call_batch
= nf_tables_newrule
,
4967 .attr_count
= NFTA_RULE_MAX
,
4968 .policy
= nft_rule_policy
,
4970 [NFT_MSG_GETRULE
] = {
4971 .call
= nf_tables_getrule
,
4972 .attr_count
= NFTA_RULE_MAX
,
4973 .policy
= nft_rule_policy
,
4975 [NFT_MSG_DELRULE
] = {
4976 .call_batch
= nf_tables_delrule
,
4977 .attr_count
= NFTA_RULE_MAX
,
4978 .policy
= nft_rule_policy
,
4980 [NFT_MSG_NEWSET
] = {
4981 .call_batch
= nf_tables_newset
,
4982 .attr_count
= NFTA_SET_MAX
,
4983 .policy
= nft_set_policy
,
4985 [NFT_MSG_GETSET
] = {
4986 .call
= nf_tables_getset
,
4987 .attr_count
= NFTA_SET_MAX
,
4988 .policy
= nft_set_policy
,
4990 [NFT_MSG_DELSET
] = {
4991 .call_batch
= nf_tables_delset
,
4992 .attr_count
= NFTA_SET_MAX
,
4993 .policy
= nft_set_policy
,
4995 [NFT_MSG_NEWSETELEM
] = {
4996 .call_batch
= nf_tables_newsetelem
,
4997 .attr_count
= NFTA_SET_ELEM_LIST_MAX
,
4998 .policy
= nft_set_elem_list_policy
,
5000 [NFT_MSG_GETSETELEM
] = {
5001 .call
= nf_tables_getsetelem
,
5002 .attr_count
= NFTA_SET_ELEM_LIST_MAX
,
5003 .policy
= nft_set_elem_list_policy
,
5005 [NFT_MSG_DELSETELEM
] = {
5006 .call_batch
= nf_tables_delsetelem
,
5007 .attr_count
= NFTA_SET_ELEM_LIST_MAX
,
5008 .policy
= nft_set_elem_list_policy
,
5010 [NFT_MSG_GETGEN
] = {
5011 .call
= nf_tables_getgen
,
5013 [NFT_MSG_NEWOBJ
] = {
5014 .call_batch
= nf_tables_newobj
,
5015 .attr_count
= NFTA_OBJ_MAX
,
5016 .policy
= nft_obj_policy
,
5018 [NFT_MSG_GETOBJ
] = {
5019 .call
= nf_tables_getobj
,
5020 .attr_count
= NFTA_OBJ_MAX
,
5021 .policy
= nft_obj_policy
,
5023 [NFT_MSG_DELOBJ
] = {
5024 .call_batch
= nf_tables_delobj
,
5025 .attr_count
= NFTA_OBJ_MAX
,
5026 .policy
= nft_obj_policy
,
5028 [NFT_MSG_GETOBJ_RESET
] = {
5029 .call
= nf_tables_getobj
,
5030 .attr_count
= NFTA_OBJ_MAX
,
5031 .policy
= nft_obj_policy
,
5035 static void nft_chain_commit_update(struct nft_trans
*trans
)
5037 struct nft_base_chain
*basechain
;
5039 if (nft_trans_chain_name(trans
))
5040 strcpy(trans
->ctx
.chain
->name
, nft_trans_chain_name(trans
));
5042 if (!nft_is_base_chain(trans
->ctx
.chain
))
5045 basechain
= nft_base_chain(trans
->ctx
.chain
);
5046 nft_chain_stats_replace(basechain
, nft_trans_chain_stats(trans
));
5048 switch (nft_trans_chain_policy(trans
)) {
5051 basechain
->policy
= nft_trans_chain_policy(trans
);
5056 static void nf_tables_commit_release(struct nft_trans
*trans
)
5058 switch (trans
->msg_type
) {
5059 case NFT_MSG_DELTABLE
:
5060 nf_tables_table_destroy(&trans
->ctx
);
5062 case NFT_MSG_DELCHAIN
:
5063 nf_tables_chain_destroy(trans
->ctx
.chain
);
5065 case NFT_MSG_DELRULE
:
5066 nf_tables_rule_destroy(&trans
->ctx
, nft_trans_rule(trans
));
5068 case NFT_MSG_DELSET
:
5069 nft_set_destroy(nft_trans_set(trans
));
5071 case NFT_MSG_DELSETELEM
:
5072 nf_tables_set_elem_destroy(nft_trans_elem_set(trans
),
5073 nft_trans_elem(trans
).priv
);
5075 case NFT_MSG_DELOBJ
:
5076 nft_obj_destroy(nft_trans_obj(trans
));
5082 static int nf_tables_commit(struct net
*net
, struct sk_buff
*skb
)
5084 struct nft_trans
*trans
, *next
;
5085 struct nft_trans_elem
*te
;
5087 /* Bump generation counter, invalidate any dump in progress */
5088 while (++net
->nft
.base_seq
== 0);
5090 /* A new generation has just started */
5091 net
->nft
.gencursor
= nft_gencursor_next(net
);
5093 /* Make sure all packets have left the previous generation before
5094 * purging old rules.
5098 list_for_each_entry_safe(trans
, next
, &net
->nft
.commit_list
, list
) {
5099 switch (trans
->msg_type
) {
5100 case NFT_MSG_NEWTABLE
:
5101 if (nft_trans_table_update(trans
)) {
5102 if (!nft_trans_table_enable(trans
)) {
5103 nf_tables_table_disable(net
,
5106 trans
->ctx
.table
->flags
|= NFT_TABLE_F_DORMANT
;
5109 nft_clear(net
, trans
->ctx
.table
);
5111 nf_tables_table_notify(&trans
->ctx
, NFT_MSG_NEWTABLE
);
5112 nft_trans_destroy(trans
);
5114 case NFT_MSG_DELTABLE
:
5115 list_del_rcu(&trans
->ctx
.table
->list
);
5116 nf_tables_table_notify(&trans
->ctx
, NFT_MSG_DELTABLE
);
5118 case NFT_MSG_NEWCHAIN
:
5119 if (nft_trans_chain_update(trans
))
5120 nft_chain_commit_update(trans
);
5122 nft_clear(net
, trans
->ctx
.chain
);
5124 nf_tables_chain_notify(&trans
->ctx
, NFT_MSG_NEWCHAIN
);
5125 nft_trans_destroy(trans
);
5127 case NFT_MSG_DELCHAIN
:
5128 list_del_rcu(&trans
->ctx
.chain
->list
);
5129 nf_tables_chain_notify(&trans
->ctx
, NFT_MSG_DELCHAIN
);
5130 nf_tables_unregister_hooks(trans
->ctx
.net
,
5133 trans
->ctx
.afi
->nops
);
5135 case NFT_MSG_NEWRULE
:
5136 nft_clear(trans
->ctx
.net
, nft_trans_rule(trans
));
5137 nf_tables_rule_notify(&trans
->ctx
,
5138 nft_trans_rule(trans
),
5140 nft_trans_destroy(trans
);
5142 case NFT_MSG_DELRULE
:
5143 list_del_rcu(&nft_trans_rule(trans
)->list
);
5144 nf_tables_rule_notify(&trans
->ctx
,
5145 nft_trans_rule(trans
),
5148 case NFT_MSG_NEWSET
:
5149 nft_clear(net
, nft_trans_set(trans
));
5150 /* This avoids hitting -EBUSY when deleting the table
5151 * from the transaction.
5153 if (nft_trans_set(trans
)->flags
& NFT_SET_ANONYMOUS
&&
5154 !list_empty(&nft_trans_set(trans
)->bindings
))
5155 trans
->ctx
.table
->use
--;
5157 nf_tables_set_notify(&trans
->ctx
, nft_trans_set(trans
),
5158 NFT_MSG_NEWSET
, GFP_KERNEL
);
5159 nft_trans_destroy(trans
);
5161 case NFT_MSG_DELSET
:
5162 list_del_rcu(&nft_trans_set(trans
)->list
);
5163 nf_tables_set_notify(&trans
->ctx
, nft_trans_set(trans
),
5164 NFT_MSG_DELSET
, GFP_KERNEL
);
5166 case NFT_MSG_NEWSETELEM
:
5167 te
= (struct nft_trans_elem
*)trans
->data
;
5169 te
->set
->ops
->activate(net
, te
->set
, &te
->elem
);
5170 nf_tables_setelem_notify(&trans
->ctx
, te
->set
,
5172 NFT_MSG_NEWSETELEM
, 0);
5173 nft_trans_destroy(trans
);
5175 case NFT_MSG_DELSETELEM
:
5176 te
= (struct nft_trans_elem
*)trans
->data
;
5178 nf_tables_setelem_notify(&trans
->ctx
, te
->set
,
5180 NFT_MSG_DELSETELEM
, 0);
5181 te
->set
->ops
->remove(net
, te
->set
, &te
->elem
);
5182 atomic_dec(&te
->set
->nelems
);
5185 case NFT_MSG_NEWOBJ
:
5186 nft_clear(net
, nft_trans_obj(trans
));
5187 nf_tables_obj_notify(&trans
->ctx
, nft_trans_obj(trans
),
5189 nft_trans_destroy(trans
);
5191 case NFT_MSG_DELOBJ
:
5192 list_del_rcu(&nft_trans_obj(trans
)->list
);
5193 nf_tables_obj_notify(&trans
->ctx
, nft_trans_obj(trans
),
5201 list_for_each_entry_safe(trans
, next
, &net
->nft
.commit_list
, list
) {
5202 list_del(&trans
->list
);
5203 nf_tables_commit_release(trans
);
5206 nf_tables_gen_notify(net
, skb
, NFT_MSG_NEWGEN
);
5211 static void nf_tables_abort_release(struct nft_trans
*trans
)
5213 switch (trans
->msg_type
) {
5214 case NFT_MSG_NEWTABLE
:
5215 nf_tables_table_destroy(&trans
->ctx
);
5217 case NFT_MSG_NEWCHAIN
:
5218 nf_tables_chain_destroy(trans
->ctx
.chain
);
5220 case NFT_MSG_NEWRULE
:
5221 nf_tables_rule_destroy(&trans
->ctx
, nft_trans_rule(trans
));
5223 case NFT_MSG_NEWSET
:
5224 nft_set_destroy(nft_trans_set(trans
));
5226 case NFT_MSG_NEWSETELEM
:
5227 nft_set_elem_destroy(nft_trans_elem_set(trans
),
5228 nft_trans_elem(trans
).priv
, true);
5230 case NFT_MSG_NEWOBJ
:
5231 nft_obj_destroy(nft_trans_obj(trans
));
5237 static int nf_tables_abort(struct net
*net
, struct sk_buff
*skb
)
5239 struct nft_trans
*trans
, *next
;
5240 struct nft_trans_elem
*te
;
5242 list_for_each_entry_safe_reverse(trans
, next
, &net
->nft
.commit_list
,
5244 switch (trans
->msg_type
) {
5245 case NFT_MSG_NEWTABLE
:
5246 if (nft_trans_table_update(trans
)) {
5247 if (nft_trans_table_enable(trans
)) {
5248 nf_tables_table_disable(net
,
5251 trans
->ctx
.table
->flags
|= NFT_TABLE_F_DORMANT
;
5253 nft_trans_destroy(trans
);
5255 list_del_rcu(&trans
->ctx
.table
->list
);
5258 case NFT_MSG_DELTABLE
:
5259 nft_clear(trans
->ctx
.net
, trans
->ctx
.table
);
5260 nft_trans_destroy(trans
);
5262 case NFT_MSG_NEWCHAIN
:
5263 if (nft_trans_chain_update(trans
)) {
5264 free_percpu(nft_trans_chain_stats(trans
));
5266 nft_trans_destroy(trans
);
5268 trans
->ctx
.table
->use
--;
5269 list_del_rcu(&trans
->ctx
.chain
->list
);
5270 nf_tables_unregister_hooks(trans
->ctx
.net
,
5273 trans
->ctx
.afi
->nops
);
5276 case NFT_MSG_DELCHAIN
:
5277 trans
->ctx
.table
->use
++;
5278 nft_clear(trans
->ctx
.net
, trans
->ctx
.chain
);
5279 nft_trans_destroy(trans
);
5281 case NFT_MSG_NEWRULE
:
5282 trans
->ctx
.chain
->use
--;
5283 list_del_rcu(&nft_trans_rule(trans
)->list
);
5285 case NFT_MSG_DELRULE
:
5286 trans
->ctx
.chain
->use
++;
5287 nft_clear(trans
->ctx
.net
, nft_trans_rule(trans
));
5288 nft_trans_destroy(trans
);
5290 case NFT_MSG_NEWSET
:
5291 trans
->ctx
.table
->use
--;
5292 list_del_rcu(&nft_trans_set(trans
)->list
);
5294 case NFT_MSG_DELSET
:
5295 trans
->ctx
.table
->use
++;
5296 nft_clear(trans
->ctx
.net
, nft_trans_set(trans
));
5297 nft_trans_destroy(trans
);
5299 case NFT_MSG_NEWSETELEM
:
5300 te
= (struct nft_trans_elem
*)trans
->data
;
5302 te
->set
->ops
->remove(net
, te
->set
, &te
->elem
);
5303 atomic_dec(&te
->set
->nelems
);
5305 case NFT_MSG_DELSETELEM
:
5306 te
= (struct nft_trans_elem
*)trans
->data
;
5308 nft_set_elem_activate(net
, te
->set
, &te
->elem
);
5309 te
->set
->ops
->activate(net
, te
->set
, &te
->elem
);
5312 nft_trans_destroy(trans
);
5314 case NFT_MSG_NEWOBJ
:
5315 trans
->ctx
.table
->use
--;
5316 list_del_rcu(&nft_trans_obj(trans
)->list
);
5318 case NFT_MSG_DELOBJ
:
5319 trans
->ctx
.table
->use
++;
5320 nft_clear(trans
->ctx
.net
, nft_trans_obj(trans
));
5321 nft_trans_destroy(trans
);
5328 list_for_each_entry_safe_reverse(trans
, next
,
5329 &net
->nft
.commit_list
, list
) {
5330 list_del(&trans
->list
);
5331 nf_tables_abort_release(trans
);
5337 static bool nf_tables_valid_genid(struct net
*net
, u32 genid
)
5339 return net
->nft
.base_seq
== genid
;
5342 static const struct nfnetlink_subsystem nf_tables_subsys
= {
5343 .name
= "nf_tables",
5344 .subsys_id
= NFNL_SUBSYS_NFTABLES
,
5345 .cb_count
= NFT_MSG_MAX
,
5347 .commit
= nf_tables_commit
,
5348 .abort
= nf_tables_abort
,
5349 .valid_genid
= nf_tables_valid_genid
,
5352 int nft_chain_validate_dependency(const struct nft_chain
*chain
,
5353 enum nft_chain_type type
)
5355 const struct nft_base_chain
*basechain
;
5357 if (nft_is_base_chain(chain
)) {
5358 basechain
= nft_base_chain(chain
);
5359 if (basechain
->type
->type
!= type
)
5364 EXPORT_SYMBOL_GPL(nft_chain_validate_dependency
);
5366 int nft_chain_validate_hooks(const struct nft_chain
*chain
,
5367 unsigned int hook_flags
)
5369 struct nft_base_chain
*basechain
;
5371 if (nft_is_base_chain(chain
)) {
5372 basechain
= nft_base_chain(chain
);
5374 if ((1 << basechain
->ops
[0].hooknum
) & hook_flags
)
5382 EXPORT_SYMBOL_GPL(nft_chain_validate_hooks
);
/*
 * Loop detection - walk through the ruleset beginning at the destination chain
 * of a new jump until either the source chain is reached (loop) or all
 * reachable chains have been traversed.
 *
 * The loop check is performed whenever a new jump verdict is added to an
 * expression or verdict map or a verdict map is bound to a new chain.
 */

/* Declared ahead of its definition: the set-element walker calls it. */
static int nf_tables_check_loops(const struct nft_ctx *ctx,
				 const struct nft_chain *chain);
5396 static int nf_tables_loop_check_setelem(const struct nft_ctx
*ctx
,
5397 struct nft_set
*set
,
5398 const struct nft_set_iter
*iter
,
5399 struct nft_set_elem
*elem
)
5401 const struct nft_set_ext
*ext
= nft_set_elem_ext(set
, elem
->priv
);
5402 const struct nft_data
*data
;
5404 if (nft_set_ext_exists(ext
, NFT_SET_EXT_FLAGS
) &&
5405 *nft_set_ext_flags(ext
) & NFT_SET_ELEM_INTERVAL_END
)
5408 data
= nft_set_ext_data(ext
);
5409 switch (data
->verdict
.code
) {
5412 return nf_tables_check_loops(ctx
, data
->verdict
.chain
);
5418 static int nf_tables_check_loops(const struct nft_ctx
*ctx
,
5419 const struct nft_chain
*chain
)
5421 const struct nft_rule
*rule
;
5422 const struct nft_expr
*expr
, *last
;
5423 struct nft_set
*set
;
5424 struct nft_set_binding
*binding
;
5425 struct nft_set_iter iter
;
5427 if (ctx
->chain
== chain
)
5430 list_for_each_entry(rule
, &chain
->rules
, list
) {
5431 nft_rule_for_each_expr(expr
, last
, rule
) {
5432 const struct nft_data
*data
= NULL
;
5435 if (!expr
->ops
->validate
)
5438 err
= expr
->ops
->validate(ctx
, expr
, &data
);
5445 switch (data
->verdict
.code
) {
5448 err
= nf_tables_check_loops(ctx
,
5449 data
->verdict
.chain
);
5458 list_for_each_entry(set
, &ctx
->table
->sets
, list
) {
5459 if (!nft_is_active_next(ctx
->net
, set
))
5461 if (!(set
->flags
& NFT_SET_MAP
) ||
5462 set
->dtype
!= NFT_DATA_VERDICT
)
5465 list_for_each_entry(binding
, &set
->bindings
, list
) {
5466 if (!(binding
->flags
& NFT_SET_MAP
) ||
5467 binding
->chain
!= chain
)
5470 iter
.genmask
= nft_genmask_next(ctx
->net
);
5474 iter
.fn
= nf_tables_loop_check_setelem
;
5476 set
->ops
->walk(ctx
, set
, &iter
);
5486 * nft_parse_u32_check - fetch u32 attribute and check for maximum value
5488 * @attr: netlink attribute to fetch value from
5489 * @max: maximum value to be stored in dest
5490 * @dest: pointer to the variable
5492 * Parse, check and store a given u32 netlink attribute into variable.
5493 * This function returns -ERANGE if the value goes over maximum value.
5494 * Otherwise a 0 is returned and the attribute value is stored in the
5495 * destination variable.
5497 int nft_parse_u32_check(const struct nlattr
*attr
, int max
, u32
*dest
)
5501 val
= ntohl(nla_get_be32(attr
));
5508 EXPORT_SYMBOL_GPL(nft_parse_u32_check
);
5511 * nft_parse_register - parse a register value from a netlink attribute
5513 * @attr: netlink attribute
5515 * Parse and translate a register value from a netlink attribute.
5516 * Registers used to be 128 bit wide, these register numbers will be
5517 * mapped to the corresponding 32 bit register numbers.
5519 unsigned int nft_parse_register(const struct nlattr
*attr
)
5523 reg
= ntohl(nla_get_be32(attr
));
5525 case NFT_REG_VERDICT
...NFT_REG_4
:
5526 return reg
* NFT_REG_SIZE
/ NFT_REG32_SIZE
;
5528 return reg
+ NFT_REG_SIZE
/ NFT_REG32_SIZE
- NFT_REG32_00
;
5531 EXPORT_SYMBOL_GPL(nft_parse_register
);
5534 * nft_dump_register - dump a register value to a netlink attribute
5536 * @skb: socket buffer
5537 * @attr: attribute number
5538 * @reg: register number
5540 * Construct a netlink attribute containing the register number. For
5541 * compatibility reasons, register numbers being a multiple of 4 are
5542 * translated to the corresponding 128 bit register numbers.
5544 int nft_dump_register(struct sk_buff
*skb
, unsigned int attr
, unsigned int reg
)
5546 if (reg
% (NFT_REG_SIZE
/ NFT_REG32_SIZE
) == 0)
5547 reg
= reg
/ (NFT_REG_SIZE
/ NFT_REG32_SIZE
);
5549 reg
= reg
- NFT_REG_SIZE
/ NFT_REG32_SIZE
+ NFT_REG32_00
;
5551 return nla_put_be32(skb
, attr
, htonl(reg
));
5553 EXPORT_SYMBOL_GPL(nft_dump_register
);
5556 * nft_validate_register_load - validate a load from a register
5558 * @reg: the register number
5559 * @len: the length of the data
5561 * Validate that the input register is one of the general purpose
5562 * registers and that the length of the load is within the bounds.
5564 int nft_validate_register_load(enum nft_registers reg
, unsigned int len
)
5566 if (reg
< NFT_REG_1
* NFT_REG_SIZE
/ NFT_REG32_SIZE
)
5570 if (reg
* NFT_REG32_SIZE
+ len
> FIELD_SIZEOF(struct nft_regs
, data
))
5575 EXPORT_SYMBOL_GPL(nft_validate_register_load
);
5578 * nft_validate_register_store - validate an expressions' register store
5580 * @ctx: context of the expression performing the load
5581 * @reg: the destination register number
5582 * @data: the data to load
5583 * @type: the data type
5584 * @len: the length of the data
5586 * Validate that a data load uses the appropriate data type for
5587 * the destination register and the length is within the bounds.
5588 * A value of NULL for the data means that its runtime gathered
5591 int nft_validate_register_store(const struct nft_ctx
*ctx
,
5592 enum nft_registers reg
,
5593 const struct nft_data
*data
,
5594 enum nft_data_types type
, unsigned int len
)
5599 case NFT_REG_VERDICT
:
5600 if (type
!= NFT_DATA_VERDICT
)
5604 (data
->verdict
.code
== NFT_GOTO
||
5605 data
->verdict
.code
== NFT_JUMP
)) {
5606 err
= nf_tables_check_loops(ctx
, data
->verdict
.chain
);
5610 if (ctx
->chain
->level
+ 1 >
5611 data
->verdict
.chain
->level
) {
5612 if (ctx
->chain
->level
+ 1 == NFT_JUMP_STACK_SIZE
)
5614 data
->verdict
.chain
->level
= ctx
->chain
->level
+ 1;
5620 if (reg
< NFT_REG_1
* NFT_REG_SIZE
/ NFT_REG32_SIZE
)
5624 if (reg
* NFT_REG32_SIZE
+ len
>
5625 FIELD_SIZEOF(struct nft_regs
, data
))
5628 if (data
!= NULL
&& type
!= NFT_DATA_VALUE
)
5633 EXPORT_SYMBOL_GPL(nft_validate_register_store
);
5635 static const struct nla_policy nft_verdict_policy
[NFTA_VERDICT_MAX
+ 1] = {
5636 [NFTA_VERDICT_CODE
] = { .type
= NLA_U32
},
5637 [NFTA_VERDICT_CHAIN
] = { .type
= NLA_STRING
,
5638 .len
= NFT_CHAIN_MAXNAMELEN
- 1 },
5641 static int nft_verdict_init(const struct nft_ctx
*ctx
, struct nft_data
*data
,
5642 struct nft_data_desc
*desc
, const struct nlattr
*nla
)
5644 u8 genmask
= nft_genmask_next(ctx
->net
);
5645 struct nlattr
*tb
[NFTA_VERDICT_MAX
+ 1];
5646 struct nft_chain
*chain
;
5649 err
= nla_parse_nested(tb
, NFTA_VERDICT_MAX
, nla
, nft_verdict_policy
,
5654 if (!tb
[NFTA_VERDICT_CODE
])
5656 data
->verdict
.code
= ntohl(nla_get_be32(tb
[NFTA_VERDICT_CODE
]));
5658 switch (data
->verdict
.code
) {
5660 switch (data
->verdict
.code
& NF_VERDICT_MASK
) {
5675 if (!tb
[NFTA_VERDICT_CHAIN
])
5677 chain
= nf_tables_chain_lookup(ctx
->table
,
5678 tb
[NFTA_VERDICT_CHAIN
], genmask
);
5680 return PTR_ERR(chain
);
5681 if (nft_is_base_chain(chain
))
5685 data
->verdict
.chain
= chain
;
5689 desc
->len
= sizeof(data
->verdict
);
5690 desc
->type
= NFT_DATA_VERDICT
;
5694 static void nft_verdict_uninit(const struct nft_data
*data
)
5696 switch (data
->verdict
.code
) {
5699 data
->verdict
.chain
->use
--;
5704 int nft_verdict_dump(struct sk_buff
*skb
, int type
, const struct nft_verdict
*v
)
5706 struct nlattr
*nest
;
5708 nest
= nla_nest_start(skb
, type
);
5710 goto nla_put_failure
;
5712 if (nla_put_be32(skb
, NFTA_VERDICT_CODE
, htonl(v
->code
)))
5713 goto nla_put_failure
;
5718 if (nla_put_string(skb
, NFTA_VERDICT_CHAIN
,
5720 goto nla_put_failure
;
5722 nla_nest_end(skb
, nest
);
5729 static int nft_value_init(const struct nft_ctx
*ctx
,
5730 struct nft_data
*data
, unsigned int size
,
5731 struct nft_data_desc
*desc
, const struct nlattr
*nla
)
5741 nla_memcpy(data
->data
, nla
, len
);
5742 desc
->type
= NFT_DATA_VALUE
;
5747 static int nft_value_dump(struct sk_buff
*skb
, const struct nft_data
*data
,
5750 return nla_put(skb
, NFTA_DATA_VALUE
, len
, data
->data
);
5753 static const struct nla_policy nft_data_policy
[NFTA_DATA_MAX
+ 1] = {
5754 [NFTA_DATA_VALUE
] = { .type
= NLA_BINARY
},
5755 [NFTA_DATA_VERDICT
] = { .type
= NLA_NESTED
},
/**
 *	nft_data_init - parse nf_tables data netlink attributes
 *
 *	@ctx: context of the expression using the data
 *	@data: destination struct nft_data
 *	@size: maximum data length
 *	@desc: data description
 *	@nla: netlink attribute containing data
 *
 *	Parse the netlink data attributes and initialize a struct nft_data.
 *	The type and length of data are returned in the data description.
 *
 *	The caller can indicate that it only wants to accept data of type
 *	NFT_DATA_VALUE by passing NULL for the ctx argument.
 */
5773 int nft_data_init(const struct nft_ctx
*ctx
,
5774 struct nft_data
*data
, unsigned int size
,
5775 struct nft_data_desc
*desc
, const struct nlattr
*nla
)
5777 struct nlattr
*tb
[NFTA_DATA_MAX
+ 1];
/* Split the nested attribute into tb[] according to nft_data_policy. */
5780 err
= nla_parse_nested(tb
, NFTA_DATA_MAX
, nla
, nft_data_policy
, NULL
);
/* A plain value is tested first, so it wins if both attributes are present. */
5784 if (tb
[NFTA_DATA_VALUE
])
5785 return nft_value_init(ctx
, data
, size
, desc
,
5786 tb
[NFTA_DATA_VALUE
]);
/* Verdicts are only parsed when the caller supplied a context. */
5787 if (tb
[NFTA_DATA_VERDICT
] && ctx
!= NULL
)
5788 return nft_verdict_init(ctx
, data
, desc
, tb
[NFTA_DATA_VERDICT
]);
5791 EXPORT_SYMBOL_GPL(nft_data_init
);
/**
 *	nft_data_release - release an nft_data item
 *
 *	@data: struct nft_data to release
 *	@type: type of data
 *
 *	Release an nft_data item. NFT_DATA_VALUE types can be silently discarded,
 *	all others need to be released by calling this function.
 */
5802 void nft_data_release(const struct nft_data
*data
, enum nft_data_types type
)
/* Types ordered below NFT_DATA_VERDICT are handled by this early test. */
5804 if (type
< NFT_DATA_VERDICT
)
/* Verdicts are handed to nft_verdict_uninit(). */
5807 case NFT_DATA_VERDICT
:
5808 return nft_verdict_uninit(data
);
5813 EXPORT_SYMBOL_GPL(nft_data_release
);
/*
 * nft_data_dump - serialise an nft_data item into a netlink message.
 *
 * @skb:  message buffer being filled
 * @attr: attribute type of the enclosing nest
 * @data: item to dump
 * @type: selects the encoder: NFT_DATA_VALUE uses nft_value_dump(),
 *        NFT_DATA_VERDICT uses nft_verdict_dump() on data->verdict
 * @len:  number of value bytes, forwarded to nft_value_dump()
 *
 * The payload is wrapped in a nest opened with nla_nest_start() and closed
 * with nla_nest_end().
 *
 * NOTE(review): handling of a failed nest start, of unknown types and the
 * final return value are not visible in this copy - confirm.
 */
5815 int nft_data_dump(struct sk_buff
*skb
, int attr
, const struct nft_data
*data
,
5816 enum nft_data_types type
, unsigned int len
)
5818 struct nlattr
*nest
;
5821 nest
= nla_nest_start(skb
, attr
);
5826 case NFT_DATA_VALUE
:
5827 err
= nft_value_dump(skb
, data
, len
);
5829 case NFT_DATA_VERDICT
:
5830 err
= nft_verdict_dump(skb
, NFTA_DATA_VERDICT
, &data
->verdict
);
5837 nla_nest_end(skb
, nest
);
5840 EXPORT_SYMBOL_GPL(nft_data_dump
);
/*
 * nf_tables_init_net - set up the nf_tables state of a network namespace.
 *
 * Initialises the af_info and commit_list list heads in net->nft and sets
 * net->nft.base_seq to 1. Installed as the .init hook of nf_tables_net_ops.
 */
5842 static int __net_init
nf_tables_init_net(struct net
*net
)
5844 INIT_LIST_HEAD(&net
->nft
.af_info
);
5845 INIT_LIST_HEAD(&net
->nft
.commit_list
);
5846 net
->nft
.base_seq
= 1;
/*
 * nf_tables_exit_net - namespace teardown hook (.exit of nf_tables_net_ops).
 *
 * Frees nothing itself; it only warns (once) if the af_info list or the
 * commit list of the namespace is still populated at this point.
 */
5850 static void __net_exit
nf_tables_exit_net(struct net
*net
)
5852 WARN_ON_ONCE(!list_empty(&net
->nft
.af_info
));
5853 WARN_ON_ONCE(!list_empty(&net
->nft
.commit_list
));
/*
 * __nft_release_basechain - tear down a base chain and all of its rules.
 *
 * @ctx: context; ctx->chain is the chain to release and must be a base
 *       chain (enforced with BUG_ON), ctx->net its namespace
 *
 * Order of operations: unregister the chain hooks, unlink and destroy each
 * rule, unlink the chain from its list, destroy the chain.
 *
 * NOTE(review): statements between the visible ones (for example use-counter
 * updates) and the return value are not visible in this copy - confirm.
 */
5856 int __nft_release_basechain(struct nft_ctx
*ctx
)
5858 struct nft_rule
*rule
, *nr
;
5860 BUG_ON(!nft_is_base_chain(ctx
->chain
));
5862 nf_tables_unregister_hooks(ctx
->net
, ctx
->chain
->table
, ctx
->chain
,
/* The _safe iterator is required because each rule is unlinked while walking. */
5864 list_for_each_entry_safe(rule
, nr
, &ctx
->chain
->rules
, list
) {
5865 list_del(&rule
->list
);
5867 nf_tables_rule_destroy(ctx
, rule
);
5869 list_del(&ctx
->chain
->list
);
5871 nf_tables_chain_destroy(ctx
->chain
);
5875 EXPORT_SYMBOL_GPL(__nft_release_basechain
);
/*
 * __nft_release_afinfo - destroy every table registered for an address
 * family, together with everything the tables contain.
 *
 * @net: network namespace the family belongs to
 * @afi: address family whose afi->tables list is emptied
 *
 * Per table the order is: unregister the hooks of all chains, destroy all
 * rules of all chains, destroy the sets, destroy the objects, destroy the
 * chains, and finally unlink and destroy the table itself.
 *
 * NOTE(review): the initialiser of ctx and any per-iteration ctx or counter
 * updates are not visible in this copy - confirm against the full source.
 */
5877 /* Called by nft_unregister_afinfo() from __net_exit path, nfnl_lock is held. */
5878 static void __nft_release_afinfo(struct net
*net
, struct nft_af_info
*afi
)
5880 struct nft_table
*table
, *nt
;
5881 struct nft_chain
*chain
, *nc
;
5882 struct nft_object
*obj
, *ne
;
5883 struct nft_rule
*rule
, *nr
;
5884 struct nft_set
*set
, *ns
;
5885 struct nft_ctx ctx
= {
5890 list_for_each_entry_safe(table
, nt
, &afi
->tables
, list
) {
/* First pass over the chains: only detach them from their hooks. */
5891 list_for_each_entry(chain
, &table
->chains
, list
)
5892 nf_tables_unregister_hooks(net
, table
, chain
,
5894 /* No packets are walking on these chains anymore. */
/* Second pass: drop the rules; the chains themselves stay linked for now. */
5896 list_for_each_entry(chain
, &table
->chains
, list
) {
5898 list_for_each_entry_safe(rule
, nr
, &chain
->rules
, list
) {
5899 list_del(&rule
->list
);
5901 nf_tables_rule_destroy(&ctx
, rule
);
5904 list_for_each_entry_safe(set
, ns
, &table
->sets
, list
) {
5905 list_del(&set
->list
);
5907 nft_set_destroy(set
);
5909 list_for_each_entry_safe(obj
, ne
, &table
->objects
, list
) {
5910 list_del(&obj
->list
);
5912 nft_obj_destroy(obj
);
/* Chains go last among the table contents, after rules, sets and objects. */
5914 list_for_each_entry_safe(chain
, nc
, &table
->chains
, list
) {
5915 list_del(&chain
->list
);
5917 nf_tables_chain_destroy(chain
);
5919 list_del(&table
->list
);
5920 nf_tables_table_destroy(&ctx
);
/*
 * Per-network-namespace callbacks of nf_tables; registered from
 * nf_tables_module_init() and unregistered from nf_tables_module_exit().
 */
5924 static struct pernet_operations nf_tables_net_ops
= {
5925 .init
= nf_tables_init_net
,
5926 .exit
= nf_tables_exit_net
,
5929 static int __init
nf_tables_module_init(void)
5933 info
= kmalloc(sizeof(struct nft_expr_info
) * NFT_RULE_MAXEXPRS
,
5940 err
= nf_tables_core_module_init();
5944 err
= nfnetlink_subsys_register(&nf_tables_subsys
);
5948 pr_info("nf_tables: (c) 2007-2009 Patrick McHardy <kaber@trash.net>\n");
5949 return register_pernet_subsys(&nf_tables_net_ops
);
5951 nf_tables_core_module_exit();
/*
 * nf_tables_module_exit - module exit point.
 *
 * Unregisters the per-namespace operations, then the nfnetlink subsystem,
 * then shuts down the nf_tables core.
 *
 * NOTE(review): further cleanup statements between and after the visible
 * calls may exist in the full source - confirm.
 */
5958 static void __exit
nf_tables_module_exit(void)
5960 unregister_pernet_subsys(&nf_tables_net_ops
);
5961 nfnetlink_subsys_unregister(&nf_tables_subsys
);
5963 nf_tables_core_module_exit();
/* Module entry/exit registration, licence, author and nfnetlink subsystem alias. */
5967 module_init(nf_tables_module_init
);
5968 module_exit(nf_tables_module_exit
);
5970 MODULE_LICENSE("GPL");
5971 MODULE_AUTHOR("Patrick McHardy <kaber@trash.net>");
5972 MODULE_ALIAS_NFNL_SUBSYS(NFNL_SUBSYS_NFTABLES
);