]> git.proxmox.com Git - mirror_ubuntu-artful-kernel.git/blob - net/netfilter/nf_tables_api.c
netfilter: nf_tables: rename deactivate_one() to flush()
[mirror_ubuntu-artful-kernel.git] / net / netfilter / nf_tables_api.c
1 /*
2 * Copyright (c) 2007-2009 Patrick McHardy <kaber@trash.net>
3 *
4 * This program is free software; you can redistribute it and/or modify
5 * it under the terms of the GNU General Public License version 2 as
6 * published by the Free Software Foundation.
7 *
8 * Development of this code funded by Astaro AG (http://www.astaro.com/)
9 */
10
11 #include <linux/module.h>
12 #include <linux/init.h>
13 #include <linux/list.h>
14 #include <linux/skbuff.h>
15 #include <linux/netlink.h>
16 #include <linux/netfilter.h>
17 #include <linux/netfilter/nfnetlink.h>
18 #include <linux/netfilter/nf_tables.h>
19 #include <net/netfilter/nf_tables_core.h>
20 #include <net/netfilter/nf_tables.h>
21 #include <net/net_namespace.h>
22 #include <net/sock.h>
23
/*
 * File-local list heads, both defined empty here.
 * NOTE(review): presumably the registries of expression types and stateful
 * object types; the code that populates them is outside this excerpt.
 */
static LIST_HEAD(nf_tables_objects);
static LIST_HEAD(nf_tables_expressions);
26
27 /**
28 * nft_register_afinfo - register nf_tables address family info
29 *
30 * @afi: address family info to register
31 *
32 * Register the address family for use with nf_tables. Returns zero on
33 * success or a negative errno code otherwise.
34 */
35 int nft_register_afinfo(struct net *net, struct nft_af_info *afi)
36 {
37 INIT_LIST_HEAD(&afi->tables);
38 nfnl_lock(NFNL_SUBSYS_NFTABLES);
39 list_add_tail_rcu(&afi->list, &net->nft.af_info);
40 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
41 return 0;
42 }
43 EXPORT_SYMBOL_GPL(nft_register_afinfo);
44
45 static void __nft_release_afinfo(struct net *net, struct nft_af_info *afi);
46
47 /**
48 * nft_unregister_afinfo - unregister nf_tables address family info
49 *
50 * @afi: address family info to unregister
51 *
52 * Unregister the address family for use with nf_tables.
53 */
54 void nft_unregister_afinfo(struct net *net, struct nft_af_info *afi)
55 {
56 nfnl_lock(NFNL_SUBSYS_NFTABLES);
57 __nft_release_afinfo(net, afi);
58 list_del_rcu(&afi->list);
59 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
60 }
61 EXPORT_SYMBOL_GPL(nft_unregister_afinfo);
62
63 static struct nft_af_info *nft_afinfo_lookup(struct net *net, int family)
64 {
65 struct nft_af_info *afi;
66
67 list_for_each_entry(afi, &net->nft.af_info, list) {
68 if (afi->family == family)
69 return afi;
70 }
71 return NULL;
72 }
73
74 static struct nft_af_info *
75 nf_tables_afinfo_lookup(struct net *net, int family, bool autoload)
76 {
77 struct nft_af_info *afi;
78
79 afi = nft_afinfo_lookup(net, family);
80 if (afi != NULL)
81 return afi;
82 #ifdef CONFIG_MODULES
83 if (autoload) {
84 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
85 request_module("nft-afinfo-%u", family);
86 nfnl_lock(NFNL_SUBSYS_NFTABLES);
87 afi = nft_afinfo_lookup(net, family);
88 if (afi != NULL)
89 return ERR_PTR(-EAGAIN);
90 }
91 #endif
92 return ERR_PTR(-EAFNOSUPPORT);
93 }
94
95 static void nft_ctx_init(struct nft_ctx *ctx,
96 struct net *net,
97 const struct sk_buff *skb,
98 const struct nlmsghdr *nlh,
99 struct nft_af_info *afi,
100 struct nft_table *table,
101 struct nft_chain *chain,
102 const struct nlattr * const *nla)
103 {
104 ctx->net = net;
105 ctx->afi = afi;
106 ctx->table = table;
107 ctx->chain = chain;
108 ctx->nla = nla;
109 ctx->portid = NETLINK_CB(skb).portid;
110 ctx->report = nlmsg_report(nlh);
111 ctx->seq = nlh->nlmsg_seq;
112 }
113
114 static struct nft_trans *nft_trans_alloc_gfp(const struct nft_ctx *ctx,
115 int msg_type, u32 size, gfp_t gfp)
116 {
117 struct nft_trans *trans;
118
119 trans = kzalloc(sizeof(struct nft_trans) + size, gfp);
120 if (trans == NULL)
121 return NULL;
122
123 trans->msg_type = msg_type;
124 trans->ctx = *ctx;
125
126 return trans;
127 }
128
129 static struct nft_trans *nft_trans_alloc(const struct nft_ctx *ctx,
130 int msg_type, u32 size)
131 {
132 return nft_trans_alloc_gfp(ctx, msg_type, size, GFP_KERNEL);
133 }
134
135 static void nft_trans_destroy(struct nft_trans *trans)
136 {
137 list_del(&trans->list);
138 kfree(trans);
139 }
140
141 static int nf_tables_register_hooks(struct net *net,
142 const struct nft_table *table,
143 struct nft_chain *chain,
144 unsigned int hook_nops)
145 {
146 if (table->flags & NFT_TABLE_F_DORMANT ||
147 !(chain->flags & NFT_BASE_CHAIN))
148 return 0;
149
150 return nf_register_net_hooks(net, nft_base_chain(chain)->ops,
151 hook_nops);
152 }
153
154 static void nf_tables_unregister_hooks(struct net *net,
155 const struct nft_table *table,
156 struct nft_chain *chain,
157 unsigned int hook_nops)
158 {
159 if (table->flags & NFT_TABLE_F_DORMANT ||
160 !(chain->flags & NFT_BASE_CHAIN))
161 return;
162
163 nf_unregister_net_hooks(net, nft_base_chain(chain)->ops, hook_nops);
164 }
165
166 static int nft_trans_table_add(struct nft_ctx *ctx, int msg_type)
167 {
168 struct nft_trans *trans;
169
170 trans = nft_trans_alloc(ctx, msg_type, sizeof(struct nft_trans_table));
171 if (trans == NULL)
172 return -ENOMEM;
173
174 if (msg_type == NFT_MSG_NEWTABLE)
175 nft_activate_next(ctx->net, ctx->table);
176
177 list_add_tail(&trans->list, &ctx->net->nft.commit_list);
178 return 0;
179 }
180
181 static int nft_deltable(struct nft_ctx *ctx)
182 {
183 int err;
184
185 err = nft_trans_table_add(ctx, NFT_MSG_DELTABLE);
186 if (err < 0)
187 return err;
188
189 nft_deactivate_next(ctx->net, ctx->table);
190 return err;
191 }
192
193 static int nft_trans_chain_add(struct nft_ctx *ctx, int msg_type)
194 {
195 struct nft_trans *trans;
196
197 trans = nft_trans_alloc(ctx, msg_type, sizeof(struct nft_trans_chain));
198 if (trans == NULL)
199 return -ENOMEM;
200
201 if (msg_type == NFT_MSG_NEWCHAIN)
202 nft_activate_next(ctx->net, ctx->chain);
203
204 list_add_tail(&trans->list, &ctx->net->nft.commit_list);
205 return 0;
206 }
207
208 static int nft_delchain(struct nft_ctx *ctx)
209 {
210 int err;
211
212 err = nft_trans_chain_add(ctx, NFT_MSG_DELCHAIN);
213 if (err < 0)
214 return err;
215
216 ctx->table->use--;
217 nft_deactivate_next(ctx->net, ctx->chain);
218
219 return err;
220 }
221
222 static int
223 nf_tables_delrule_deactivate(struct nft_ctx *ctx, struct nft_rule *rule)
224 {
225 /* You cannot delete the same rule twice */
226 if (nft_is_active_next(ctx->net, rule)) {
227 nft_deactivate_next(ctx->net, rule);
228 ctx->chain->use--;
229 return 0;
230 }
231 return -ENOENT;
232 }
233
234 static struct nft_trans *nft_trans_rule_add(struct nft_ctx *ctx, int msg_type,
235 struct nft_rule *rule)
236 {
237 struct nft_trans *trans;
238
239 trans = nft_trans_alloc(ctx, msg_type, sizeof(struct nft_trans_rule));
240 if (trans == NULL)
241 return NULL;
242
243 nft_trans_rule(trans) = rule;
244 list_add_tail(&trans->list, &ctx->net->nft.commit_list);
245
246 return trans;
247 }
248
249 static int nft_delrule(struct nft_ctx *ctx, struct nft_rule *rule)
250 {
251 struct nft_trans *trans;
252 int err;
253
254 trans = nft_trans_rule_add(ctx, NFT_MSG_DELRULE, rule);
255 if (trans == NULL)
256 return -ENOMEM;
257
258 err = nf_tables_delrule_deactivate(ctx, rule);
259 if (err < 0) {
260 nft_trans_destroy(trans);
261 return err;
262 }
263
264 return 0;
265 }
266
267 static int nft_delrule_by_chain(struct nft_ctx *ctx)
268 {
269 struct nft_rule *rule;
270 int err;
271
272 list_for_each_entry(rule, &ctx->chain->rules, list) {
273 err = nft_delrule(ctx, rule);
274 if (err < 0)
275 return err;
276 }
277 return 0;
278 }
279
280 static int nft_trans_set_add(struct nft_ctx *ctx, int msg_type,
281 struct nft_set *set)
282 {
283 struct nft_trans *trans;
284
285 trans = nft_trans_alloc(ctx, msg_type, sizeof(struct nft_trans_set));
286 if (trans == NULL)
287 return -ENOMEM;
288
289 if (msg_type == NFT_MSG_NEWSET && ctx->nla[NFTA_SET_ID] != NULL) {
290 nft_trans_set_id(trans) =
291 ntohl(nla_get_be32(ctx->nla[NFTA_SET_ID]));
292 nft_activate_next(ctx->net, set);
293 }
294 nft_trans_set(trans) = set;
295 list_add_tail(&trans->list, &ctx->net->nft.commit_list);
296
297 return 0;
298 }
299
300 static int nft_delset(struct nft_ctx *ctx, struct nft_set *set)
301 {
302 int err;
303
304 err = nft_trans_set_add(ctx, NFT_MSG_DELSET, set);
305 if (err < 0)
306 return err;
307
308 nft_deactivate_next(ctx->net, set);
309 ctx->table->use--;
310
311 return err;
312 }
313
314 static int nft_trans_obj_add(struct nft_ctx *ctx, int msg_type,
315 struct nft_object *obj)
316 {
317 struct nft_trans *trans;
318
319 trans = nft_trans_alloc(ctx, msg_type, sizeof(struct nft_trans_obj));
320 if (trans == NULL)
321 return -ENOMEM;
322
323 if (msg_type == NFT_MSG_NEWOBJ)
324 nft_activate_next(ctx->net, obj);
325
326 nft_trans_obj(trans) = obj;
327 list_add_tail(&trans->list, &ctx->net->nft.commit_list);
328
329 return 0;
330 }
331
332 static int nft_delobj(struct nft_ctx *ctx, struct nft_object *obj)
333 {
334 int err;
335
336 err = nft_trans_obj_add(ctx, NFT_MSG_DELOBJ, obj);
337 if (err < 0)
338 return err;
339
340 nft_deactivate_next(ctx->net, obj);
341 ctx->table->use--;
342
343 return err;
344 }
345
346 /*
347 * Tables
348 */
349
350 static struct nft_table *nft_table_lookup(const struct nft_af_info *afi,
351 const struct nlattr *nla,
352 u8 genmask)
353 {
354 struct nft_table *table;
355
356 list_for_each_entry(table, &afi->tables, list) {
357 if (!nla_strcmp(nla, table->name) &&
358 nft_active_genmask(table, genmask))
359 return table;
360 }
361 return NULL;
362 }
363
364 static struct nft_table *nf_tables_table_lookup(const struct nft_af_info *afi,
365 const struct nlattr *nla,
366 u8 genmask)
367 {
368 struct nft_table *table;
369
370 if (nla == NULL)
371 return ERR_PTR(-EINVAL);
372
373 table = nft_table_lookup(afi, nla, genmask);
374 if (table != NULL)
375 return table;
376
377 return ERR_PTR(-ENOENT);
378 }
379
380 static inline u64 nf_tables_alloc_handle(struct nft_table *table)
381 {
382 return ++table->hgenerator;
383 }
384
385 static const struct nf_chain_type *chain_type[AF_MAX][NFT_CHAIN_T_MAX];
386
387 static const struct nf_chain_type *
388 __nf_tables_chain_type_lookup(int family, const struct nlattr *nla)
389 {
390 int i;
391
392 for (i = 0; i < NFT_CHAIN_T_MAX; i++) {
393 if (chain_type[family][i] != NULL &&
394 !nla_strcmp(nla, chain_type[family][i]->name))
395 return chain_type[family][i];
396 }
397 return NULL;
398 }
399
400 static const struct nf_chain_type *
401 nf_tables_chain_type_lookup(const struct nft_af_info *afi,
402 const struct nlattr *nla,
403 bool autoload)
404 {
405 const struct nf_chain_type *type;
406
407 type = __nf_tables_chain_type_lookup(afi->family, nla);
408 if (type != NULL)
409 return type;
410 #ifdef CONFIG_MODULES
411 if (autoload) {
412 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
413 request_module("nft-chain-%u-%.*s", afi->family,
414 nla_len(nla), (const char *)nla_data(nla));
415 nfnl_lock(NFNL_SUBSYS_NFTABLES);
416 type = __nf_tables_chain_type_lookup(afi->family, nla);
417 if (type != NULL)
418 return ERR_PTR(-EAGAIN);
419 }
420 #endif
421 return ERR_PTR(-ENOENT);
422 }
423
424 static const struct nla_policy nft_table_policy[NFTA_TABLE_MAX + 1] = {
425 [NFTA_TABLE_NAME] = { .type = NLA_STRING,
426 .len = NFT_TABLE_MAXNAMELEN - 1 },
427 [NFTA_TABLE_FLAGS] = { .type = NLA_U32 },
428 };
429
430 static int nf_tables_fill_table_info(struct sk_buff *skb, struct net *net,
431 u32 portid, u32 seq, int event, u32 flags,
432 int family, const struct nft_table *table)
433 {
434 struct nlmsghdr *nlh;
435 struct nfgenmsg *nfmsg;
436
437 event |= NFNL_SUBSYS_NFTABLES << 8;
438 nlh = nlmsg_put(skb, portid, seq, event, sizeof(struct nfgenmsg), flags);
439 if (nlh == NULL)
440 goto nla_put_failure;
441
442 nfmsg = nlmsg_data(nlh);
443 nfmsg->nfgen_family = family;
444 nfmsg->version = NFNETLINK_V0;
445 nfmsg->res_id = htons(net->nft.base_seq & 0xffff);
446
447 if (nla_put_string(skb, NFTA_TABLE_NAME, table->name) ||
448 nla_put_be32(skb, NFTA_TABLE_FLAGS, htonl(table->flags)) ||
449 nla_put_be32(skb, NFTA_TABLE_USE, htonl(table->use)))
450 goto nla_put_failure;
451
452 nlmsg_end(skb, nlh);
453 return 0;
454
455 nla_put_failure:
456 nlmsg_trim(skb, nlh);
457 return -1;
458 }
459
460 static int nf_tables_table_notify(const struct nft_ctx *ctx, int event)
461 {
462 struct sk_buff *skb;
463 int err;
464
465 if (!ctx->report &&
466 !nfnetlink_has_listeners(ctx->net, NFNLGRP_NFTABLES))
467 return 0;
468
469 err = -ENOBUFS;
470 skb = nlmsg_new(NLMSG_GOODSIZE, GFP_KERNEL);
471 if (skb == NULL)
472 goto err;
473
474 err = nf_tables_fill_table_info(skb, ctx->net, ctx->portid, ctx->seq,
475 event, 0, ctx->afi->family, ctx->table);
476 if (err < 0) {
477 kfree_skb(skb);
478 goto err;
479 }
480
481 err = nfnetlink_send(skb, ctx->net, ctx->portid, NFNLGRP_NFTABLES,
482 ctx->report, GFP_KERNEL);
483 err:
484 if (err < 0) {
485 nfnetlink_set_err(ctx->net, ctx->portid, NFNLGRP_NFTABLES,
486 err);
487 }
488 return err;
489 }
490
491 static int nf_tables_dump_tables(struct sk_buff *skb,
492 struct netlink_callback *cb)
493 {
494 const struct nfgenmsg *nfmsg = nlmsg_data(cb->nlh);
495 const struct nft_af_info *afi;
496 const struct nft_table *table;
497 unsigned int idx = 0, s_idx = cb->args[0];
498 struct net *net = sock_net(skb->sk);
499 int family = nfmsg->nfgen_family;
500
501 rcu_read_lock();
502 cb->seq = net->nft.base_seq;
503
504 list_for_each_entry_rcu(afi, &net->nft.af_info, list) {
505 if (family != NFPROTO_UNSPEC && family != afi->family)
506 continue;
507
508 list_for_each_entry_rcu(table, &afi->tables, list) {
509 if (idx < s_idx)
510 goto cont;
511 if (idx > s_idx)
512 memset(&cb->args[1], 0,
513 sizeof(cb->args) - sizeof(cb->args[0]));
514 if (!nft_is_active(net, table))
515 continue;
516 if (nf_tables_fill_table_info(skb, net,
517 NETLINK_CB(cb->skb).portid,
518 cb->nlh->nlmsg_seq,
519 NFT_MSG_NEWTABLE,
520 NLM_F_MULTI,
521 afi->family, table) < 0)
522 goto done;
523
524 nl_dump_check_consistent(cb, nlmsg_hdr(skb));
525 cont:
526 idx++;
527 }
528 }
529 done:
530 rcu_read_unlock();
531 cb->args[0] = idx;
532 return skb->len;
533 }
534
535 static int nf_tables_gettable(struct net *net, struct sock *nlsk,
536 struct sk_buff *skb, const struct nlmsghdr *nlh,
537 const struct nlattr * const nla[])
538 {
539 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
540 u8 genmask = nft_genmask_cur(net);
541 const struct nft_af_info *afi;
542 const struct nft_table *table;
543 struct sk_buff *skb2;
544 int family = nfmsg->nfgen_family;
545 int err;
546
547 if (nlh->nlmsg_flags & NLM_F_DUMP) {
548 struct netlink_dump_control c = {
549 .dump = nf_tables_dump_tables,
550 };
551 return netlink_dump_start(nlsk, skb, nlh, &c);
552 }
553
554 afi = nf_tables_afinfo_lookup(net, family, false);
555 if (IS_ERR(afi))
556 return PTR_ERR(afi);
557
558 table = nf_tables_table_lookup(afi, nla[NFTA_TABLE_NAME], genmask);
559 if (IS_ERR(table))
560 return PTR_ERR(table);
561
562 skb2 = alloc_skb(NLMSG_GOODSIZE, GFP_KERNEL);
563 if (!skb2)
564 return -ENOMEM;
565
566 err = nf_tables_fill_table_info(skb2, net, NETLINK_CB(skb).portid,
567 nlh->nlmsg_seq, NFT_MSG_NEWTABLE, 0,
568 family, table);
569 if (err < 0)
570 goto err;
571
572 return nlmsg_unicast(nlsk, skb2, NETLINK_CB(skb).portid);
573
574 err:
575 kfree_skb(skb2);
576 return err;
577 }
578
579 static void _nf_tables_table_disable(struct net *net,
580 const struct nft_af_info *afi,
581 struct nft_table *table,
582 u32 cnt)
583 {
584 struct nft_chain *chain;
585 u32 i = 0;
586
587 list_for_each_entry(chain, &table->chains, list) {
588 if (!nft_is_active_next(net, chain))
589 continue;
590 if (!(chain->flags & NFT_BASE_CHAIN))
591 continue;
592
593 if (cnt && i++ == cnt)
594 break;
595
596 nf_unregister_net_hooks(net, nft_base_chain(chain)->ops,
597 afi->nops);
598 }
599 }
600
601 static int nf_tables_table_enable(struct net *net,
602 const struct nft_af_info *afi,
603 struct nft_table *table)
604 {
605 struct nft_chain *chain;
606 int err, i = 0;
607
608 list_for_each_entry(chain, &table->chains, list) {
609 if (!nft_is_active_next(net, chain))
610 continue;
611 if (!(chain->flags & NFT_BASE_CHAIN))
612 continue;
613
614 err = nf_register_net_hooks(net, nft_base_chain(chain)->ops,
615 afi->nops);
616 if (err < 0)
617 goto err;
618
619 i++;
620 }
621 return 0;
622 err:
623 if (i)
624 _nf_tables_table_disable(net, afi, table, i);
625 return err;
626 }
627
628 static void nf_tables_table_disable(struct net *net,
629 const struct nft_af_info *afi,
630 struct nft_table *table)
631 {
632 _nf_tables_table_disable(net, afi, table, 0);
633 }
634
635 static int nf_tables_updtable(struct nft_ctx *ctx)
636 {
637 struct nft_trans *trans;
638 u32 flags;
639 int ret = 0;
640
641 if (!ctx->nla[NFTA_TABLE_FLAGS])
642 return 0;
643
644 flags = ntohl(nla_get_be32(ctx->nla[NFTA_TABLE_FLAGS]));
645 if (flags & ~NFT_TABLE_F_DORMANT)
646 return -EINVAL;
647
648 if (flags == ctx->table->flags)
649 return 0;
650
651 trans = nft_trans_alloc(ctx, NFT_MSG_NEWTABLE,
652 sizeof(struct nft_trans_table));
653 if (trans == NULL)
654 return -ENOMEM;
655
656 if ((flags & NFT_TABLE_F_DORMANT) &&
657 !(ctx->table->flags & NFT_TABLE_F_DORMANT)) {
658 nft_trans_table_enable(trans) = false;
659 } else if (!(flags & NFT_TABLE_F_DORMANT) &&
660 ctx->table->flags & NFT_TABLE_F_DORMANT) {
661 ret = nf_tables_table_enable(ctx->net, ctx->afi, ctx->table);
662 if (ret >= 0) {
663 ctx->table->flags &= ~NFT_TABLE_F_DORMANT;
664 nft_trans_table_enable(trans) = true;
665 }
666 }
667 if (ret < 0)
668 goto err;
669
670 nft_trans_table_update(trans) = true;
671 list_add_tail(&trans->list, &ctx->net->nft.commit_list);
672 return 0;
673 err:
674 nft_trans_destroy(trans);
675 return ret;
676 }
677
678 static int nf_tables_newtable(struct net *net, struct sock *nlsk,
679 struct sk_buff *skb, const struct nlmsghdr *nlh,
680 const struct nlattr * const nla[])
681 {
682 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
683 u8 genmask = nft_genmask_next(net);
684 const struct nlattr *name;
685 struct nft_af_info *afi;
686 struct nft_table *table;
687 int family = nfmsg->nfgen_family;
688 u32 flags = 0;
689 struct nft_ctx ctx;
690 int err;
691
692 afi = nf_tables_afinfo_lookup(net, family, true);
693 if (IS_ERR(afi))
694 return PTR_ERR(afi);
695
696 name = nla[NFTA_TABLE_NAME];
697 table = nf_tables_table_lookup(afi, name, genmask);
698 if (IS_ERR(table)) {
699 if (PTR_ERR(table) != -ENOENT)
700 return PTR_ERR(table);
701 } else {
702 if (nlh->nlmsg_flags & NLM_F_EXCL)
703 return -EEXIST;
704 if (nlh->nlmsg_flags & NLM_F_REPLACE)
705 return -EOPNOTSUPP;
706
707 nft_ctx_init(&ctx, net, skb, nlh, afi, table, NULL, nla);
708 return nf_tables_updtable(&ctx);
709 }
710
711 if (nla[NFTA_TABLE_FLAGS]) {
712 flags = ntohl(nla_get_be32(nla[NFTA_TABLE_FLAGS]));
713 if (flags & ~NFT_TABLE_F_DORMANT)
714 return -EINVAL;
715 }
716
717 err = -EAFNOSUPPORT;
718 if (!try_module_get(afi->owner))
719 goto err1;
720
721 err = -ENOMEM;
722 table = kzalloc(sizeof(*table), GFP_KERNEL);
723 if (table == NULL)
724 goto err2;
725
726 nla_strlcpy(table->name, name, NFT_TABLE_MAXNAMELEN);
727 INIT_LIST_HEAD(&table->chains);
728 INIT_LIST_HEAD(&table->sets);
729 INIT_LIST_HEAD(&table->objects);
730 table->flags = flags;
731
732 nft_ctx_init(&ctx, net, skb, nlh, afi, table, NULL, nla);
733 err = nft_trans_table_add(&ctx, NFT_MSG_NEWTABLE);
734 if (err < 0)
735 goto err3;
736
737 list_add_tail_rcu(&table->list, &afi->tables);
738 return 0;
739 err3:
740 kfree(table);
741 err2:
742 module_put(afi->owner);
743 err1:
744 return err;
745 }
746
747 static int nft_flush_table(struct nft_ctx *ctx)
748 {
749 int err;
750 struct nft_chain *chain, *nc;
751 struct nft_object *obj, *ne;
752 struct nft_set *set, *ns;
753
754 list_for_each_entry(chain, &ctx->table->chains, list) {
755 if (!nft_is_active_next(ctx->net, chain))
756 continue;
757
758 ctx->chain = chain;
759
760 err = nft_delrule_by_chain(ctx);
761 if (err < 0)
762 goto out;
763 }
764
765 list_for_each_entry_safe(set, ns, &ctx->table->sets, list) {
766 if (!nft_is_active_next(ctx->net, set))
767 continue;
768
769 if (set->flags & NFT_SET_ANONYMOUS &&
770 !list_empty(&set->bindings))
771 continue;
772
773 err = nft_delset(ctx, set);
774 if (err < 0)
775 goto out;
776 }
777
778 list_for_each_entry_safe(obj, ne, &ctx->table->objects, list) {
779 err = nft_delobj(ctx, obj);
780 if (err < 0)
781 goto out;
782 }
783
784 list_for_each_entry_safe(chain, nc, &ctx->table->chains, list) {
785 if (!nft_is_active_next(ctx->net, chain))
786 continue;
787
788 ctx->chain = chain;
789
790 err = nft_delchain(ctx);
791 if (err < 0)
792 goto out;
793 }
794
795 err = nft_deltable(ctx);
796 out:
797 return err;
798 }
799
800 static int nft_flush(struct nft_ctx *ctx, int family)
801 {
802 struct nft_af_info *afi;
803 struct nft_table *table, *nt;
804 const struct nlattr * const *nla = ctx->nla;
805 int err = 0;
806
807 list_for_each_entry(afi, &ctx->net->nft.af_info, list) {
808 if (family != AF_UNSPEC && afi->family != family)
809 continue;
810
811 ctx->afi = afi;
812 list_for_each_entry_safe(table, nt, &afi->tables, list) {
813 if (!nft_is_active_next(ctx->net, table))
814 continue;
815
816 if (nla[NFTA_TABLE_NAME] &&
817 nla_strcmp(nla[NFTA_TABLE_NAME], table->name) != 0)
818 continue;
819
820 ctx->table = table;
821
822 err = nft_flush_table(ctx);
823 if (err < 0)
824 goto out;
825 }
826 }
827 out:
828 return err;
829 }
830
831 static int nf_tables_deltable(struct net *net, struct sock *nlsk,
832 struct sk_buff *skb, const struct nlmsghdr *nlh,
833 const struct nlattr * const nla[])
834 {
835 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
836 u8 genmask = nft_genmask_next(net);
837 struct nft_af_info *afi;
838 struct nft_table *table;
839 int family = nfmsg->nfgen_family;
840 struct nft_ctx ctx;
841
842 nft_ctx_init(&ctx, net, skb, nlh, NULL, NULL, NULL, nla);
843 if (family == AF_UNSPEC || nla[NFTA_TABLE_NAME] == NULL)
844 return nft_flush(&ctx, family);
845
846 afi = nf_tables_afinfo_lookup(net, family, false);
847 if (IS_ERR(afi))
848 return PTR_ERR(afi);
849
850 table = nf_tables_table_lookup(afi, nla[NFTA_TABLE_NAME], genmask);
851 if (IS_ERR(table))
852 return PTR_ERR(table);
853
854 ctx.afi = afi;
855 ctx.table = table;
856
857 return nft_flush_table(&ctx);
858 }
859
860 static void nf_tables_table_destroy(struct nft_ctx *ctx)
861 {
862 BUG_ON(ctx->table->use > 0);
863
864 kfree(ctx->table);
865 module_put(ctx->afi->owner);
866 }
867
868 int nft_register_chain_type(const struct nf_chain_type *ctype)
869 {
870 int err = 0;
871
872 nfnl_lock(NFNL_SUBSYS_NFTABLES);
873 if (chain_type[ctype->family][ctype->type] != NULL) {
874 err = -EBUSY;
875 goto out;
876 }
877 chain_type[ctype->family][ctype->type] = ctype;
878 out:
879 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
880 return err;
881 }
882 EXPORT_SYMBOL_GPL(nft_register_chain_type);
883
884 void nft_unregister_chain_type(const struct nf_chain_type *ctype)
885 {
886 nfnl_lock(NFNL_SUBSYS_NFTABLES);
887 chain_type[ctype->family][ctype->type] = NULL;
888 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
889 }
890 EXPORT_SYMBOL_GPL(nft_unregister_chain_type);
891
892 /*
893 * Chains
894 */
895
896 static struct nft_chain *
897 nf_tables_chain_lookup_byhandle(const struct nft_table *table, u64 handle,
898 u8 genmask)
899 {
900 struct nft_chain *chain;
901
902 list_for_each_entry(chain, &table->chains, list) {
903 if (chain->handle == handle &&
904 nft_active_genmask(chain, genmask))
905 return chain;
906 }
907
908 return ERR_PTR(-ENOENT);
909 }
910
911 static struct nft_chain *nf_tables_chain_lookup(const struct nft_table *table,
912 const struct nlattr *nla,
913 u8 genmask)
914 {
915 struct nft_chain *chain;
916
917 if (nla == NULL)
918 return ERR_PTR(-EINVAL);
919
920 list_for_each_entry(chain, &table->chains, list) {
921 if (!nla_strcmp(nla, chain->name) &&
922 nft_active_genmask(chain, genmask))
923 return chain;
924 }
925
926 return ERR_PTR(-ENOENT);
927 }
928
929 static const struct nla_policy nft_chain_policy[NFTA_CHAIN_MAX + 1] = {
930 [NFTA_CHAIN_TABLE] = { .type = NLA_STRING,
931 .len = NFT_TABLE_MAXNAMELEN - 1 },
932 [NFTA_CHAIN_HANDLE] = { .type = NLA_U64 },
933 [NFTA_CHAIN_NAME] = { .type = NLA_STRING,
934 .len = NFT_CHAIN_MAXNAMELEN - 1 },
935 [NFTA_CHAIN_HOOK] = { .type = NLA_NESTED },
936 [NFTA_CHAIN_POLICY] = { .type = NLA_U32 },
937 [NFTA_CHAIN_TYPE] = { .type = NLA_STRING },
938 [NFTA_CHAIN_COUNTERS] = { .type = NLA_NESTED },
939 };
940
941 static const struct nla_policy nft_hook_policy[NFTA_HOOK_MAX + 1] = {
942 [NFTA_HOOK_HOOKNUM] = { .type = NLA_U32 },
943 [NFTA_HOOK_PRIORITY] = { .type = NLA_U32 },
944 [NFTA_HOOK_DEV] = { .type = NLA_STRING,
945 .len = IFNAMSIZ - 1 },
946 };
947
948 static int nft_dump_stats(struct sk_buff *skb, struct nft_stats __percpu *stats)
949 {
950 struct nft_stats *cpu_stats, total;
951 struct nlattr *nest;
952 unsigned int seq;
953 u64 pkts, bytes;
954 int cpu;
955
956 memset(&total, 0, sizeof(total));
957 for_each_possible_cpu(cpu) {
958 cpu_stats = per_cpu_ptr(stats, cpu);
959 do {
960 seq = u64_stats_fetch_begin_irq(&cpu_stats->syncp);
961 pkts = cpu_stats->pkts;
962 bytes = cpu_stats->bytes;
963 } while (u64_stats_fetch_retry_irq(&cpu_stats->syncp, seq));
964 total.pkts += pkts;
965 total.bytes += bytes;
966 }
967 nest = nla_nest_start(skb, NFTA_CHAIN_COUNTERS);
968 if (nest == NULL)
969 goto nla_put_failure;
970
971 if (nla_put_be64(skb, NFTA_COUNTER_PACKETS, cpu_to_be64(total.pkts),
972 NFTA_COUNTER_PAD) ||
973 nla_put_be64(skb, NFTA_COUNTER_BYTES, cpu_to_be64(total.bytes),
974 NFTA_COUNTER_PAD))
975 goto nla_put_failure;
976
977 nla_nest_end(skb, nest);
978 return 0;
979
980 nla_put_failure:
981 return -ENOSPC;
982 }
983
984 static int nf_tables_fill_chain_info(struct sk_buff *skb, struct net *net,
985 u32 portid, u32 seq, int event, u32 flags,
986 int family, const struct nft_table *table,
987 const struct nft_chain *chain)
988 {
989 struct nlmsghdr *nlh;
990 struct nfgenmsg *nfmsg;
991
992 event |= NFNL_SUBSYS_NFTABLES << 8;
993 nlh = nlmsg_put(skb, portid, seq, event, sizeof(struct nfgenmsg), flags);
994 if (nlh == NULL)
995 goto nla_put_failure;
996
997 nfmsg = nlmsg_data(nlh);
998 nfmsg->nfgen_family = family;
999 nfmsg->version = NFNETLINK_V0;
1000 nfmsg->res_id = htons(net->nft.base_seq & 0xffff);
1001
1002 if (nla_put_string(skb, NFTA_CHAIN_TABLE, table->name))
1003 goto nla_put_failure;
1004 if (nla_put_be64(skb, NFTA_CHAIN_HANDLE, cpu_to_be64(chain->handle),
1005 NFTA_CHAIN_PAD))
1006 goto nla_put_failure;
1007 if (nla_put_string(skb, NFTA_CHAIN_NAME, chain->name))
1008 goto nla_put_failure;
1009
1010 if (chain->flags & NFT_BASE_CHAIN) {
1011 const struct nft_base_chain *basechain = nft_base_chain(chain);
1012 const struct nf_hook_ops *ops = &basechain->ops[0];
1013 struct nlattr *nest;
1014
1015 nest = nla_nest_start(skb, NFTA_CHAIN_HOOK);
1016 if (nest == NULL)
1017 goto nla_put_failure;
1018 if (nla_put_be32(skb, NFTA_HOOK_HOOKNUM, htonl(ops->hooknum)))
1019 goto nla_put_failure;
1020 if (nla_put_be32(skb, NFTA_HOOK_PRIORITY, htonl(ops->priority)))
1021 goto nla_put_failure;
1022 if (basechain->dev_name[0] &&
1023 nla_put_string(skb, NFTA_HOOK_DEV, basechain->dev_name))
1024 goto nla_put_failure;
1025 nla_nest_end(skb, nest);
1026
1027 if (nla_put_be32(skb, NFTA_CHAIN_POLICY,
1028 htonl(basechain->policy)))
1029 goto nla_put_failure;
1030
1031 if (nla_put_string(skb, NFTA_CHAIN_TYPE, basechain->type->name))
1032 goto nla_put_failure;
1033
1034 if (nft_dump_stats(skb, nft_base_chain(chain)->stats))
1035 goto nla_put_failure;
1036 }
1037
1038 if (nla_put_be32(skb, NFTA_CHAIN_USE, htonl(chain->use)))
1039 goto nla_put_failure;
1040
1041 nlmsg_end(skb, nlh);
1042 return 0;
1043
1044 nla_put_failure:
1045 nlmsg_trim(skb, nlh);
1046 return -1;
1047 }
1048
1049 static int nf_tables_chain_notify(const struct nft_ctx *ctx, int event)
1050 {
1051 struct sk_buff *skb;
1052 int err;
1053
1054 if (!ctx->report &&
1055 !nfnetlink_has_listeners(ctx->net, NFNLGRP_NFTABLES))
1056 return 0;
1057
1058 err = -ENOBUFS;
1059 skb = nlmsg_new(NLMSG_GOODSIZE, GFP_KERNEL);
1060 if (skb == NULL)
1061 goto err;
1062
1063 err = nf_tables_fill_chain_info(skb, ctx->net, ctx->portid, ctx->seq,
1064 event, 0, ctx->afi->family, ctx->table,
1065 ctx->chain);
1066 if (err < 0) {
1067 kfree_skb(skb);
1068 goto err;
1069 }
1070
1071 err = nfnetlink_send(skb, ctx->net, ctx->portid, NFNLGRP_NFTABLES,
1072 ctx->report, GFP_KERNEL);
1073 err:
1074 if (err < 0) {
1075 nfnetlink_set_err(ctx->net, ctx->portid, NFNLGRP_NFTABLES,
1076 err);
1077 }
1078 return err;
1079 }
1080
1081 static int nf_tables_dump_chains(struct sk_buff *skb,
1082 struct netlink_callback *cb)
1083 {
1084 const struct nfgenmsg *nfmsg = nlmsg_data(cb->nlh);
1085 const struct nft_af_info *afi;
1086 const struct nft_table *table;
1087 const struct nft_chain *chain;
1088 unsigned int idx = 0, s_idx = cb->args[0];
1089 struct net *net = sock_net(skb->sk);
1090 int family = nfmsg->nfgen_family;
1091
1092 rcu_read_lock();
1093 cb->seq = net->nft.base_seq;
1094
1095 list_for_each_entry_rcu(afi, &net->nft.af_info, list) {
1096 if (family != NFPROTO_UNSPEC && family != afi->family)
1097 continue;
1098
1099 list_for_each_entry_rcu(table, &afi->tables, list) {
1100 list_for_each_entry_rcu(chain, &table->chains, list) {
1101 if (idx < s_idx)
1102 goto cont;
1103 if (idx > s_idx)
1104 memset(&cb->args[1], 0,
1105 sizeof(cb->args) - sizeof(cb->args[0]));
1106 if (!nft_is_active(net, chain))
1107 continue;
1108 if (nf_tables_fill_chain_info(skb, net,
1109 NETLINK_CB(cb->skb).portid,
1110 cb->nlh->nlmsg_seq,
1111 NFT_MSG_NEWCHAIN,
1112 NLM_F_MULTI,
1113 afi->family, table, chain) < 0)
1114 goto done;
1115
1116 nl_dump_check_consistent(cb, nlmsg_hdr(skb));
1117 cont:
1118 idx++;
1119 }
1120 }
1121 }
1122 done:
1123 rcu_read_unlock();
1124 cb->args[0] = idx;
1125 return skb->len;
1126 }
1127
1128 static int nf_tables_getchain(struct net *net, struct sock *nlsk,
1129 struct sk_buff *skb, const struct nlmsghdr *nlh,
1130 const struct nlattr * const nla[])
1131 {
1132 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
1133 u8 genmask = nft_genmask_cur(net);
1134 const struct nft_af_info *afi;
1135 const struct nft_table *table;
1136 const struct nft_chain *chain;
1137 struct sk_buff *skb2;
1138 int family = nfmsg->nfgen_family;
1139 int err;
1140
1141 if (nlh->nlmsg_flags & NLM_F_DUMP) {
1142 struct netlink_dump_control c = {
1143 .dump = nf_tables_dump_chains,
1144 };
1145 return netlink_dump_start(nlsk, skb, nlh, &c);
1146 }
1147
1148 afi = nf_tables_afinfo_lookup(net, family, false);
1149 if (IS_ERR(afi))
1150 return PTR_ERR(afi);
1151
1152 table = nf_tables_table_lookup(afi, nla[NFTA_CHAIN_TABLE], genmask);
1153 if (IS_ERR(table))
1154 return PTR_ERR(table);
1155
1156 chain = nf_tables_chain_lookup(table, nla[NFTA_CHAIN_NAME], genmask);
1157 if (IS_ERR(chain))
1158 return PTR_ERR(chain);
1159
1160 skb2 = alloc_skb(NLMSG_GOODSIZE, GFP_KERNEL);
1161 if (!skb2)
1162 return -ENOMEM;
1163
1164 err = nf_tables_fill_chain_info(skb2, net, NETLINK_CB(skb).portid,
1165 nlh->nlmsg_seq, NFT_MSG_NEWCHAIN, 0,
1166 family, table, chain);
1167 if (err < 0)
1168 goto err;
1169
1170 return nlmsg_unicast(nlsk, skb2, NETLINK_CB(skb).portid);
1171
1172 err:
1173 kfree_skb(skb2);
1174 return err;
1175 }
1176
1177 static const struct nla_policy nft_counter_policy[NFTA_COUNTER_MAX + 1] = {
1178 [NFTA_COUNTER_PACKETS] = { .type = NLA_U64 },
1179 [NFTA_COUNTER_BYTES] = { .type = NLA_U64 },
1180 };
1181
1182 static struct nft_stats __percpu *nft_stats_alloc(const struct nlattr *attr)
1183 {
1184 struct nlattr *tb[NFTA_COUNTER_MAX+1];
1185 struct nft_stats __percpu *newstats;
1186 struct nft_stats *stats;
1187 int err;
1188
1189 err = nla_parse_nested(tb, NFTA_COUNTER_MAX, attr, nft_counter_policy);
1190 if (err < 0)
1191 return ERR_PTR(err);
1192
1193 if (!tb[NFTA_COUNTER_BYTES] || !tb[NFTA_COUNTER_PACKETS])
1194 return ERR_PTR(-EINVAL);
1195
1196 newstats = netdev_alloc_pcpu_stats(struct nft_stats);
1197 if (newstats == NULL)
1198 return ERR_PTR(-ENOMEM);
1199
1200 /* Restore old counters on this cpu, no problem. Per-cpu statistics
1201 * are not exposed to userspace.
1202 */
1203 preempt_disable();
1204 stats = this_cpu_ptr(newstats);
1205 stats->bytes = be64_to_cpu(nla_get_be64(tb[NFTA_COUNTER_BYTES]));
1206 stats->pkts = be64_to_cpu(nla_get_be64(tb[NFTA_COUNTER_PACKETS]));
1207 preempt_enable();
1208
1209 return newstats;
1210 }
1211
1212 static void nft_chain_stats_replace(struct nft_base_chain *chain,
1213 struct nft_stats __percpu *newstats)
1214 {
1215 if (newstats == NULL)
1216 return;
1217
1218 if (chain->stats) {
1219 struct nft_stats __percpu *oldstats =
1220 nft_dereference(chain->stats);
1221
1222 rcu_assign_pointer(chain->stats, newstats);
1223 synchronize_rcu();
1224 free_percpu(oldstats);
1225 } else
1226 rcu_assign_pointer(chain->stats, newstats);
1227 }
1228
1229 static void nf_tables_chain_destroy(struct nft_chain *chain)
1230 {
1231 BUG_ON(chain->use > 0);
1232
1233 if (chain->flags & NFT_BASE_CHAIN) {
1234 struct nft_base_chain *basechain = nft_base_chain(chain);
1235
1236 module_put(basechain->type->owner);
1237 free_percpu(basechain->stats);
1238 if (basechain->ops[0].dev != NULL)
1239 dev_put(basechain->ops[0].dev);
1240 kfree(basechain);
1241 } else {
1242 kfree(chain);
1243 }
1244 }
1245
1246 struct nft_chain_hook {
1247 u32 num;
1248 u32 priority;
1249 const struct nf_chain_type *type;
1250 struct net_device *dev;
1251 };
1252
1253 static int nft_chain_parse_hook(struct net *net,
1254 const struct nlattr * const nla[],
1255 struct nft_af_info *afi,
1256 struct nft_chain_hook *hook, bool create)
1257 {
1258 struct nlattr *ha[NFTA_HOOK_MAX + 1];
1259 const struct nf_chain_type *type;
1260 struct net_device *dev;
1261 int err;
1262
1263 err = nla_parse_nested(ha, NFTA_HOOK_MAX, nla[NFTA_CHAIN_HOOK],
1264 nft_hook_policy);
1265 if (err < 0)
1266 return err;
1267
1268 if (ha[NFTA_HOOK_HOOKNUM] == NULL ||
1269 ha[NFTA_HOOK_PRIORITY] == NULL)
1270 return -EINVAL;
1271
1272 hook->num = ntohl(nla_get_be32(ha[NFTA_HOOK_HOOKNUM]));
1273 if (hook->num >= afi->nhooks)
1274 return -EINVAL;
1275
1276 hook->priority = ntohl(nla_get_be32(ha[NFTA_HOOK_PRIORITY]));
1277
1278 type = chain_type[afi->family][NFT_CHAIN_T_DEFAULT];
1279 if (nla[NFTA_CHAIN_TYPE]) {
1280 type = nf_tables_chain_type_lookup(afi, nla[NFTA_CHAIN_TYPE],
1281 create);
1282 if (IS_ERR(type))
1283 return PTR_ERR(type);
1284 }
1285 if (!(type->hook_mask & (1 << hook->num)))
1286 return -EOPNOTSUPP;
1287 if (!try_module_get(type->owner))
1288 return -ENOENT;
1289
1290 hook->type = type;
1291
1292 hook->dev = NULL;
1293 if (afi->flags & NFT_AF_NEEDS_DEV) {
1294 char ifname[IFNAMSIZ];
1295
1296 if (!ha[NFTA_HOOK_DEV]) {
1297 module_put(type->owner);
1298 return -EOPNOTSUPP;
1299 }
1300
1301 nla_strlcpy(ifname, ha[NFTA_HOOK_DEV], IFNAMSIZ);
1302 dev = dev_get_by_name(net, ifname);
1303 if (!dev) {
1304 module_put(type->owner);
1305 return -ENOENT;
1306 }
1307 hook->dev = dev;
1308 } else if (ha[NFTA_HOOK_DEV]) {
1309 module_put(type->owner);
1310 return -EOPNOTSUPP;
1311 }
1312
1313 return 0;
1314 }
1315
1316 static void nft_chain_release_hook(struct nft_chain_hook *hook)
1317 {
1318 module_put(hook->type->owner);
1319 if (hook->dev != NULL)
1320 dev_put(hook->dev);
1321 }
1322
1323 static int nf_tables_newchain(struct net *net, struct sock *nlsk,
1324 struct sk_buff *skb, const struct nlmsghdr *nlh,
1325 const struct nlattr * const nla[])
1326 {
1327 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
1328 const struct nlattr * uninitialized_var(name);
1329 struct nft_af_info *afi;
1330 struct nft_table *table;
1331 struct nft_chain *chain;
1332 struct nft_base_chain *basechain = NULL;
1333 u8 genmask = nft_genmask_next(net);
1334 int family = nfmsg->nfgen_family;
1335 u8 policy = NF_ACCEPT;
1336 u64 handle = 0;
1337 unsigned int i;
1338 struct nft_stats __percpu *stats;
1339 int err;
1340 bool create;
1341 struct nft_ctx ctx;
1342
1343 create = nlh->nlmsg_flags & NLM_F_CREATE ? true : false;
1344
1345 afi = nf_tables_afinfo_lookup(net, family, true);
1346 if (IS_ERR(afi))
1347 return PTR_ERR(afi);
1348
1349 table = nf_tables_table_lookup(afi, nla[NFTA_CHAIN_TABLE], genmask);
1350 if (IS_ERR(table))
1351 return PTR_ERR(table);
1352
1353 chain = NULL;
1354 name = nla[NFTA_CHAIN_NAME];
1355
1356 if (nla[NFTA_CHAIN_HANDLE]) {
1357 handle = be64_to_cpu(nla_get_be64(nla[NFTA_CHAIN_HANDLE]));
1358 chain = nf_tables_chain_lookup_byhandle(table, handle, genmask);
1359 if (IS_ERR(chain))
1360 return PTR_ERR(chain);
1361 } else {
1362 chain = nf_tables_chain_lookup(table, name, genmask);
1363 if (IS_ERR(chain)) {
1364 if (PTR_ERR(chain) != -ENOENT)
1365 return PTR_ERR(chain);
1366 chain = NULL;
1367 }
1368 }
1369
1370 if (nla[NFTA_CHAIN_POLICY]) {
1371 if ((chain != NULL &&
1372 !(chain->flags & NFT_BASE_CHAIN)))
1373 return -EOPNOTSUPP;
1374
1375 if (chain == NULL &&
1376 nla[NFTA_CHAIN_HOOK] == NULL)
1377 return -EOPNOTSUPP;
1378
1379 policy = ntohl(nla_get_be32(nla[NFTA_CHAIN_POLICY]));
1380 switch (policy) {
1381 case NF_DROP:
1382 case NF_ACCEPT:
1383 break;
1384 default:
1385 return -EINVAL;
1386 }
1387 }
1388
1389 if (chain != NULL) {
1390 struct nft_stats *stats = NULL;
1391 struct nft_trans *trans;
1392
1393 if (nlh->nlmsg_flags & NLM_F_EXCL)
1394 return -EEXIST;
1395 if (nlh->nlmsg_flags & NLM_F_REPLACE)
1396 return -EOPNOTSUPP;
1397
1398 if (nla[NFTA_CHAIN_HOOK]) {
1399 struct nft_base_chain *basechain;
1400 struct nft_chain_hook hook;
1401 struct nf_hook_ops *ops;
1402
1403 if (!(chain->flags & NFT_BASE_CHAIN))
1404 return -EBUSY;
1405
1406 err = nft_chain_parse_hook(net, nla, afi, &hook,
1407 create);
1408 if (err < 0)
1409 return err;
1410
1411 basechain = nft_base_chain(chain);
1412 if (basechain->type != hook.type) {
1413 nft_chain_release_hook(&hook);
1414 return -EBUSY;
1415 }
1416
1417 for (i = 0; i < afi->nops; i++) {
1418 ops = &basechain->ops[i];
1419 if (ops->hooknum != hook.num ||
1420 ops->priority != hook.priority ||
1421 ops->dev != hook.dev) {
1422 nft_chain_release_hook(&hook);
1423 return -EBUSY;
1424 }
1425 }
1426 nft_chain_release_hook(&hook);
1427 }
1428
1429 if (nla[NFTA_CHAIN_HANDLE] && name) {
1430 struct nft_chain *chain2;
1431
1432 chain2 = nf_tables_chain_lookup(table,
1433 nla[NFTA_CHAIN_NAME],
1434 genmask);
1435 if (IS_ERR(chain2))
1436 return PTR_ERR(chain2);
1437 }
1438
1439 if (nla[NFTA_CHAIN_COUNTERS]) {
1440 if (!(chain->flags & NFT_BASE_CHAIN))
1441 return -EOPNOTSUPP;
1442
1443 stats = nft_stats_alloc(nla[NFTA_CHAIN_COUNTERS]);
1444 if (IS_ERR(stats))
1445 return PTR_ERR(stats);
1446 }
1447
1448 nft_ctx_init(&ctx, net, skb, nlh, afi, table, chain, nla);
1449 trans = nft_trans_alloc(&ctx, NFT_MSG_NEWCHAIN,
1450 sizeof(struct nft_trans_chain));
1451 if (trans == NULL) {
1452 free_percpu(stats);
1453 return -ENOMEM;
1454 }
1455
1456 nft_trans_chain_stats(trans) = stats;
1457 nft_trans_chain_update(trans) = true;
1458
1459 if (nla[NFTA_CHAIN_POLICY])
1460 nft_trans_chain_policy(trans) = policy;
1461 else
1462 nft_trans_chain_policy(trans) = -1;
1463
1464 if (nla[NFTA_CHAIN_HANDLE] && name) {
1465 nla_strlcpy(nft_trans_chain_name(trans), name,
1466 NFT_CHAIN_MAXNAMELEN);
1467 }
1468 list_add_tail(&trans->list, &net->nft.commit_list);
1469 return 0;
1470 }
1471
1472 if (table->use == UINT_MAX)
1473 return -EOVERFLOW;
1474
1475 if (nla[NFTA_CHAIN_HOOK]) {
1476 struct nft_chain_hook hook;
1477 struct nf_hook_ops *ops;
1478 nf_hookfn *hookfn;
1479
1480 err = nft_chain_parse_hook(net, nla, afi, &hook, create);
1481 if (err < 0)
1482 return err;
1483
1484 basechain = kzalloc(sizeof(*basechain), GFP_KERNEL);
1485 if (basechain == NULL) {
1486 nft_chain_release_hook(&hook);
1487 return -ENOMEM;
1488 }
1489
1490 if (hook.dev != NULL)
1491 strncpy(basechain->dev_name, hook.dev->name, IFNAMSIZ);
1492
1493 if (nla[NFTA_CHAIN_COUNTERS]) {
1494 stats = nft_stats_alloc(nla[NFTA_CHAIN_COUNTERS]);
1495 if (IS_ERR(stats)) {
1496 nft_chain_release_hook(&hook);
1497 kfree(basechain);
1498 return PTR_ERR(stats);
1499 }
1500 basechain->stats = stats;
1501 } else {
1502 stats = netdev_alloc_pcpu_stats(struct nft_stats);
1503 if (stats == NULL) {
1504 nft_chain_release_hook(&hook);
1505 kfree(basechain);
1506 return -ENOMEM;
1507 }
1508 rcu_assign_pointer(basechain->stats, stats);
1509 }
1510
1511 hookfn = hook.type->hooks[hook.num];
1512 basechain->type = hook.type;
1513 chain = &basechain->chain;
1514
1515 for (i = 0; i < afi->nops; i++) {
1516 ops = &basechain->ops[i];
1517 ops->pf = family;
1518 ops->hooknum = hook.num;
1519 ops->priority = hook.priority;
1520 ops->priv = chain;
1521 ops->hook = afi->hooks[ops->hooknum];
1522 ops->dev = hook.dev;
1523 if (hookfn)
1524 ops->hook = hookfn;
1525 if (afi->hook_ops_init)
1526 afi->hook_ops_init(ops, i);
1527 }
1528
1529 chain->flags |= NFT_BASE_CHAIN;
1530 basechain->policy = policy;
1531 } else {
1532 chain = kzalloc(sizeof(*chain), GFP_KERNEL);
1533 if (chain == NULL)
1534 return -ENOMEM;
1535 }
1536
1537 INIT_LIST_HEAD(&chain->rules);
1538 chain->handle = nf_tables_alloc_handle(table);
1539 chain->table = table;
1540 nla_strlcpy(chain->name, name, NFT_CHAIN_MAXNAMELEN);
1541
1542 err = nf_tables_register_hooks(net, table, chain, afi->nops);
1543 if (err < 0)
1544 goto err1;
1545
1546 nft_ctx_init(&ctx, net, skb, nlh, afi, table, chain, nla);
1547 err = nft_trans_chain_add(&ctx, NFT_MSG_NEWCHAIN);
1548 if (err < 0)
1549 goto err2;
1550
1551 table->use++;
1552 list_add_tail_rcu(&chain->list, &table->chains);
1553 return 0;
1554 err2:
1555 nf_tables_unregister_hooks(net, table, chain, afi->nops);
1556 err1:
1557 nf_tables_chain_destroy(chain);
1558 return err;
1559 }
1560
1561 static int nf_tables_delchain(struct net *net, struct sock *nlsk,
1562 struct sk_buff *skb, const struct nlmsghdr *nlh,
1563 const struct nlattr * const nla[])
1564 {
1565 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
1566 u8 genmask = nft_genmask_next(net);
1567 struct nft_af_info *afi;
1568 struct nft_table *table;
1569 struct nft_chain *chain;
1570 int family = nfmsg->nfgen_family;
1571 struct nft_ctx ctx;
1572
1573 afi = nf_tables_afinfo_lookup(net, family, false);
1574 if (IS_ERR(afi))
1575 return PTR_ERR(afi);
1576
1577 table = nf_tables_table_lookup(afi, nla[NFTA_CHAIN_TABLE], genmask);
1578 if (IS_ERR(table))
1579 return PTR_ERR(table);
1580
1581 chain = nf_tables_chain_lookup(table, nla[NFTA_CHAIN_NAME], genmask);
1582 if (IS_ERR(chain))
1583 return PTR_ERR(chain);
1584 if (chain->use > 0)
1585 return -EBUSY;
1586
1587 nft_ctx_init(&ctx, net, skb, nlh, afi, table, chain, nla);
1588
1589 return nft_delchain(&ctx);
1590 }
1591
1592 /*
1593 * Expressions
1594 */
1595
1596 /**
1597 * nft_register_expr - register nf_tables expr type
1598 * @ops: expr type
1599 *
1600 * Registers the expr type for use with nf_tables. Returns zero on
1601 * success or a negative errno code otherwise.
1602 */
1603 int nft_register_expr(struct nft_expr_type *type)
1604 {
1605 nfnl_lock(NFNL_SUBSYS_NFTABLES);
1606 if (type->family == NFPROTO_UNSPEC)
1607 list_add_tail_rcu(&type->list, &nf_tables_expressions);
1608 else
1609 list_add_rcu(&type->list, &nf_tables_expressions);
1610 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
1611 return 0;
1612 }
1613 EXPORT_SYMBOL_GPL(nft_register_expr);
1614
1615 /**
1616 * nft_unregister_expr - unregister nf_tables expr type
1617 * @ops: expr type
1618 *
1619 * Unregisters the expr typefor use with nf_tables.
1620 */
1621 void nft_unregister_expr(struct nft_expr_type *type)
1622 {
1623 nfnl_lock(NFNL_SUBSYS_NFTABLES);
1624 list_del_rcu(&type->list);
1625 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
1626 }
1627 EXPORT_SYMBOL_GPL(nft_unregister_expr);
1628
1629 static const struct nft_expr_type *__nft_expr_type_get(u8 family,
1630 struct nlattr *nla)
1631 {
1632 const struct nft_expr_type *type;
1633
1634 list_for_each_entry(type, &nf_tables_expressions, list) {
1635 if (!nla_strcmp(nla, type->name) &&
1636 (!type->family || type->family == family))
1637 return type;
1638 }
1639 return NULL;
1640 }
1641
1642 static const struct nft_expr_type *nft_expr_type_get(u8 family,
1643 struct nlattr *nla)
1644 {
1645 const struct nft_expr_type *type;
1646
1647 if (nla == NULL)
1648 return ERR_PTR(-EINVAL);
1649
1650 type = __nft_expr_type_get(family, nla);
1651 if (type != NULL && try_module_get(type->owner))
1652 return type;
1653
1654 #ifdef CONFIG_MODULES
1655 if (type == NULL) {
1656 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
1657 request_module("nft-expr-%u-%.*s", family,
1658 nla_len(nla), (char *)nla_data(nla));
1659 nfnl_lock(NFNL_SUBSYS_NFTABLES);
1660 if (__nft_expr_type_get(family, nla))
1661 return ERR_PTR(-EAGAIN);
1662
1663 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
1664 request_module("nft-expr-%.*s",
1665 nla_len(nla), (char *)nla_data(nla));
1666 nfnl_lock(NFNL_SUBSYS_NFTABLES);
1667 if (__nft_expr_type_get(family, nla))
1668 return ERR_PTR(-EAGAIN);
1669 }
1670 #endif
1671 return ERR_PTR(-ENOENT);
1672 }
1673
1674 static const struct nla_policy nft_expr_policy[NFTA_EXPR_MAX + 1] = {
1675 [NFTA_EXPR_NAME] = { .type = NLA_STRING },
1676 [NFTA_EXPR_DATA] = { .type = NLA_NESTED },
1677 };
1678
1679 static int nf_tables_fill_expr_info(struct sk_buff *skb,
1680 const struct nft_expr *expr)
1681 {
1682 if (nla_put_string(skb, NFTA_EXPR_NAME, expr->ops->type->name))
1683 goto nla_put_failure;
1684
1685 if (expr->ops->dump) {
1686 struct nlattr *data = nla_nest_start(skb, NFTA_EXPR_DATA);
1687 if (data == NULL)
1688 goto nla_put_failure;
1689 if (expr->ops->dump(skb, expr) < 0)
1690 goto nla_put_failure;
1691 nla_nest_end(skb, data);
1692 }
1693
1694 return skb->len;
1695
1696 nla_put_failure:
1697 return -1;
1698 };
1699
1700 int nft_expr_dump(struct sk_buff *skb, unsigned int attr,
1701 const struct nft_expr *expr)
1702 {
1703 struct nlattr *nest;
1704
1705 nest = nla_nest_start(skb, attr);
1706 if (!nest)
1707 goto nla_put_failure;
1708 if (nf_tables_fill_expr_info(skb, expr) < 0)
1709 goto nla_put_failure;
1710 nla_nest_end(skb, nest);
1711 return 0;
1712
1713 nla_put_failure:
1714 return -1;
1715 }
1716
1717 struct nft_expr_info {
1718 const struct nft_expr_ops *ops;
1719 struct nlattr *tb[NFT_EXPR_MAXATTR + 1];
1720 };
1721
1722 static int nf_tables_expr_parse(const struct nft_ctx *ctx,
1723 const struct nlattr *nla,
1724 struct nft_expr_info *info)
1725 {
1726 const struct nft_expr_type *type;
1727 const struct nft_expr_ops *ops;
1728 struct nlattr *tb[NFTA_EXPR_MAX + 1];
1729 int err;
1730
1731 err = nla_parse_nested(tb, NFTA_EXPR_MAX, nla, nft_expr_policy);
1732 if (err < 0)
1733 return err;
1734
1735 type = nft_expr_type_get(ctx->afi->family, tb[NFTA_EXPR_NAME]);
1736 if (IS_ERR(type))
1737 return PTR_ERR(type);
1738
1739 if (tb[NFTA_EXPR_DATA]) {
1740 err = nla_parse_nested(info->tb, type->maxattr,
1741 tb[NFTA_EXPR_DATA], type->policy);
1742 if (err < 0)
1743 goto err1;
1744 } else
1745 memset(info->tb, 0, sizeof(info->tb[0]) * (type->maxattr + 1));
1746
1747 if (type->select_ops != NULL) {
1748 ops = type->select_ops(ctx,
1749 (const struct nlattr * const *)info->tb);
1750 if (IS_ERR(ops)) {
1751 err = PTR_ERR(ops);
1752 goto err1;
1753 }
1754 } else
1755 ops = type->ops;
1756
1757 info->ops = ops;
1758 return 0;
1759
1760 err1:
1761 module_put(type->owner);
1762 return err;
1763 }
1764
1765 static int nf_tables_newexpr(const struct nft_ctx *ctx,
1766 const struct nft_expr_info *info,
1767 struct nft_expr *expr)
1768 {
1769 const struct nft_expr_ops *ops = info->ops;
1770 int err;
1771
1772 expr->ops = ops;
1773 if (ops->init) {
1774 err = ops->init(ctx, expr, (const struct nlattr **)info->tb);
1775 if (err < 0)
1776 goto err1;
1777 }
1778
1779 return 0;
1780
1781 err1:
1782 expr->ops = NULL;
1783 return err;
1784 }
1785
1786 static void nf_tables_expr_destroy(const struct nft_ctx *ctx,
1787 struct nft_expr *expr)
1788 {
1789 if (expr->ops->destroy)
1790 expr->ops->destroy(ctx, expr);
1791 module_put(expr->ops->type->owner);
1792 }
1793
1794 struct nft_expr *nft_expr_init(const struct nft_ctx *ctx,
1795 const struct nlattr *nla)
1796 {
1797 struct nft_expr_info info;
1798 struct nft_expr *expr;
1799 int err;
1800
1801 err = nf_tables_expr_parse(ctx, nla, &info);
1802 if (err < 0)
1803 goto err1;
1804
1805 err = -ENOMEM;
1806 expr = kzalloc(info.ops->size, GFP_KERNEL);
1807 if (expr == NULL)
1808 goto err2;
1809
1810 err = nf_tables_newexpr(ctx, &info, expr);
1811 if (err < 0)
1812 goto err3;
1813
1814 return expr;
1815 err3:
1816 kfree(expr);
1817 err2:
1818 module_put(info.ops->type->owner);
1819 err1:
1820 return ERR_PTR(err);
1821 }
1822
/*
 * Destroy an expression: run the per-expression teardown, then free the
 * expression memory with kfree().
 */
void nft_expr_destroy(const struct nft_ctx *ctx, struct nft_expr *expr)
{
	nf_tables_expr_destroy(ctx, expr);

	kfree(expr);
}
1828
1829 /*
1830 * Rules
1831 */
1832
1833 static struct nft_rule *__nf_tables_rule_lookup(const struct nft_chain *chain,
1834 u64 handle)
1835 {
1836 struct nft_rule *rule;
1837
1838 // FIXME: this sucks
1839 list_for_each_entry(rule, &chain->rules, list) {
1840 if (handle == rule->handle)
1841 return rule;
1842 }
1843
1844 return ERR_PTR(-ENOENT);
1845 }
1846
1847 static struct nft_rule *nf_tables_rule_lookup(const struct nft_chain *chain,
1848 const struct nlattr *nla)
1849 {
1850 if (nla == NULL)
1851 return ERR_PTR(-EINVAL);
1852
1853 return __nf_tables_rule_lookup(chain, be64_to_cpu(nla_get_be64(nla)));
1854 }
1855
1856 static const struct nla_policy nft_rule_policy[NFTA_RULE_MAX + 1] = {
1857 [NFTA_RULE_TABLE] = { .type = NLA_STRING,
1858 .len = NFT_TABLE_MAXNAMELEN - 1 },
1859 [NFTA_RULE_CHAIN] = { .type = NLA_STRING,
1860 .len = NFT_CHAIN_MAXNAMELEN - 1 },
1861 [NFTA_RULE_HANDLE] = { .type = NLA_U64 },
1862 [NFTA_RULE_EXPRESSIONS] = { .type = NLA_NESTED },
1863 [NFTA_RULE_COMPAT] = { .type = NLA_NESTED },
1864 [NFTA_RULE_POSITION] = { .type = NLA_U64 },
1865 [NFTA_RULE_USERDATA] = { .type = NLA_BINARY,
1866 .len = NFT_USERDATA_MAXLEN },
1867 };
1868
1869 static int nf_tables_fill_rule_info(struct sk_buff *skb, struct net *net,
1870 u32 portid, u32 seq, int event,
1871 u32 flags, int family,
1872 const struct nft_table *table,
1873 const struct nft_chain *chain,
1874 const struct nft_rule *rule)
1875 {
1876 struct nlmsghdr *nlh;
1877 struct nfgenmsg *nfmsg;
1878 const struct nft_expr *expr, *next;
1879 struct nlattr *list;
1880 const struct nft_rule *prule;
1881 int type = event | NFNL_SUBSYS_NFTABLES << 8;
1882
1883 nlh = nlmsg_put(skb, portid, seq, type, sizeof(struct nfgenmsg),
1884 flags);
1885 if (nlh == NULL)
1886 goto nla_put_failure;
1887
1888 nfmsg = nlmsg_data(nlh);
1889 nfmsg->nfgen_family = family;
1890 nfmsg->version = NFNETLINK_V0;
1891 nfmsg->res_id = htons(net->nft.base_seq & 0xffff);
1892
1893 if (nla_put_string(skb, NFTA_RULE_TABLE, table->name))
1894 goto nla_put_failure;
1895 if (nla_put_string(skb, NFTA_RULE_CHAIN, chain->name))
1896 goto nla_put_failure;
1897 if (nla_put_be64(skb, NFTA_RULE_HANDLE, cpu_to_be64(rule->handle),
1898 NFTA_RULE_PAD))
1899 goto nla_put_failure;
1900
1901 if ((event != NFT_MSG_DELRULE) && (rule->list.prev != &chain->rules)) {
1902 prule = list_entry(rule->list.prev, struct nft_rule, list);
1903 if (nla_put_be64(skb, NFTA_RULE_POSITION,
1904 cpu_to_be64(prule->handle),
1905 NFTA_RULE_PAD))
1906 goto nla_put_failure;
1907 }
1908
1909 list = nla_nest_start(skb, NFTA_RULE_EXPRESSIONS);
1910 if (list == NULL)
1911 goto nla_put_failure;
1912 nft_rule_for_each_expr(expr, next, rule) {
1913 if (nft_expr_dump(skb, NFTA_LIST_ELEM, expr) < 0)
1914 goto nla_put_failure;
1915 }
1916 nla_nest_end(skb, list);
1917
1918 if (rule->udata) {
1919 struct nft_userdata *udata = nft_userdata(rule);
1920 if (nla_put(skb, NFTA_RULE_USERDATA, udata->len + 1,
1921 udata->data) < 0)
1922 goto nla_put_failure;
1923 }
1924
1925 nlmsg_end(skb, nlh);
1926 return 0;
1927
1928 nla_put_failure:
1929 nlmsg_trim(skb, nlh);
1930 return -1;
1931 }
1932
1933 static int nf_tables_rule_notify(const struct nft_ctx *ctx,
1934 const struct nft_rule *rule,
1935 int event)
1936 {
1937 struct sk_buff *skb;
1938 int err;
1939
1940 if (!ctx->report &&
1941 !nfnetlink_has_listeners(ctx->net, NFNLGRP_NFTABLES))
1942 return 0;
1943
1944 err = -ENOBUFS;
1945 skb = nlmsg_new(NLMSG_GOODSIZE, GFP_KERNEL);
1946 if (skb == NULL)
1947 goto err;
1948
1949 err = nf_tables_fill_rule_info(skb, ctx->net, ctx->portid, ctx->seq,
1950 event, 0, ctx->afi->family, ctx->table,
1951 ctx->chain, rule);
1952 if (err < 0) {
1953 kfree_skb(skb);
1954 goto err;
1955 }
1956
1957 err = nfnetlink_send(skb, ctx->net, ctx->portid, NFNLGRP_NFTABLES,
1958 ctx->report, GFP_KERNEL);
1959 err:
1960 if (err < 0) {
1961 nfnetlink_set_err(ctx->net, ctx->portid, NFNLGRP_NFTABLES,
1962 err);
1963 }
1964 return err;
1965 }
1966
1967 struct nft_rule_dump_ctx {
1968 char table[NFT_TABLE_MAXNAMELEN];
1969 char chain[NFT_CHAIN_MAXNAMELEN];
1970 };
1971
1972 static int nf_tables_dump_rules(struct sk_buff *skb,
1973 struct netlink_callback *cb)
1974 {
1975 const struct nfgenmsg *nfmsg = nlmsg_data(cb->nlh);
1976 const struct nft_rule_dump_ctx *ctx = cb->data;
1977 const struct nft_af_info *afi;
1978 const struct nft_table *table;
1979 const struct nft_chain *chain;
1980 const struct nft_rule *rule;
1981 unsigned int idx = 0, s_idx = cb->args[0];
1982 struct net *net = sock_net(skb->sk);
1983 int family = nfmsg->nfgen_family;
1984
1985 rcu_read_lock();
1986 cb->seq = net->nft.base_seq;
1987
1988 list_for_each_entry_rcu(afi, &net->nft.af_info, list) {
1989 if (family != NFPROTO_UNSPEC && family != afi->family)
1990 continue;
1991
1992 list_for_each_entry_rcu(table, &afi->tables, list) {
1993 if (ctx && ctx->table[0] &&
1994 strcmp(ctx->table, table->name) != 0)
1995 continue;
1996
1997 list_for_each_entry_rcu(chain, &table->chains, list) {
1998 if (ctx && ctx->chain[0] &&
1999 strcmp(ctx->chain, chain->name) != 0)
2000 continue;
2001
2002 list_for_each_entry_rcu(rule, &chain->rules, list) {
2003 if (!nft_is_active(net, rule))
2004 goto cont;
2005 if (idx < s_idx)
2006 goto cont;
2007 if (idx > s_idx)
2008 memset(&cb->args[1], 0,
2009 sizeof(cb->args) - sizeof(cb->args[0]));
2010 if (nf_tables_fill_rule_info(skb, net, NETLINK_CB(cb->skb).portid,
2011 cb->nlh->nlmsg_seq,
2012 NFT_MSG_NEWRULE,
2013 NLM_F_MULTI | NLM_F_APPEND,
2014 afi->family, table, chain, rule) < 0)
2015 goto done;
2016
2017 nl_dump_check_consistent(cb, nlmsg_hdr(skb));
2018 cont:
2019 idx++;
2020 }
2021 }
2022 }
2023 }
2024 done:
2025 rcu_read_unlock();
2026
2027 cb->args[0] = idx;
2028 return skb->len;
2029 }
2030
2031 static int nf_tables_dump_rules_done(struct netlink_callback *cb)
2032 {
2033 kfree(cb->data);
2034 return 0;
2035 }
2036
2037 static int nf_tables_getrule(struct net *net, struct sock *nlsk,
2038 struct sk_buff *skb, const struct nlmsghdr *nlh,
2039 const struct nlattr * const nla[])
2040 {
2041 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
2042 u8 genmask = nft_genmask_cur(net);
2043 const struct nft_af_info *afi;
2044 const struct nft_table *table;
2045 const struct nft_chain *chain;
2046 const struct nft_rule *rule;
2047 struct sk_buff *skb2;
2048 int family = nfmsg->nfgen_family;
2049 int err;
2050
2051 if (nlh->nlmsg_flags & NLM_F_DUMP) {
2052 struct netlink_dump_control c = {
2053 .dump = nf_tables_dump_rules,
2054 .done = nf_tables_dump_rules_done,
2055 };
2056
2057 if (nla[NFTA_RULE_TABLE] || nla[NFTA_RULE_CHAIN]) {
2058 struct nft_rule_dump_ctx *ctx;
2059
2060 ctx = kzalloc(sizeof(*ctx), GFP_KERNEL);
2061 if (!ctx)
2062 return -ENOMEM;
2063
2064 if (nla[NFTA_RULE_TABLE])
2065 nla_strlcpy(ctx->table, nla[NFTA_RULE_TABLE],
2066 sizeof(ctx->table));
2067 if (nla[NFTA_RULE_CHAIN])
2068 nla_strlcpy(ctx->chain, nla[NFTA_RULE_CHAIN],
2069 sizeof(ctx->chain));
2070 c.data = ctx;
2071 }
2072
2073 return netlink_dump_start(nlsk, skb, nlh, &c);
2074 }
2075
2076 afi = nf_tables_afinfo_lookup(net, family, false);
2077 if (IS_ERR(afi))
2078 return PTR_ERR(afi);
2079
2080 table = nf_tables_table_lookup(afi, nla[NFTA_RULE_TABLE], genmask);
2081 if (IS_ERR(table))
2082 return PTR_ERR(table);
2083
2084 chain = nf_tables_chain_lookup(table, nla[NFTA_RULE_CHAIN], genmask);
2085 if (IS_ERR(chain))
2086 return PTR_ERR(chain);
2087
2088 rule = nf_tables_rule_lookup(chain, nla[NFTA_RULE_HANDLE]);
2089 if (IS_ERR(rule))
2090 return PTR_ERR(rule);
2091
2092 skb2 = alloc_skb(NLMSG_GOODSIZE, GFP_KERNEL);
2093 if (!skb2)
2094 return -ENOMEM;
2095
2096 err = nf_tables_fill_rule_info(skb2, net, NETLINK_CB(skb).portid,
2097 nlh->nlmsg_seq, NFT_MSG_NEWRULE, 0,
2098 family, table, chain, rule);
2099 if (err < 0)
2100 goto err;
2101
2102 return nlmsg_unicast(nlsk, skb2, NETLINK_CB(skb).portid);
2103
2104 err:
2105 kfree_skb(skb2);
2106 return err;
2107 }
2108
2109 static void nf_tables_rule_destroy(const struct nft_ctx *ctx,
2110 struct nft_rule *rule)
2111 {
2112 struct nft_expr *expr;
2113
2114 /*
2115 * Careful: some expressions might not be initialized in case this
2116 * is called on error from nf_tables_newrule().
2117 */
2118 expr = nft_expr_first(rule);
2119 while (expr != nft_expr_last(rule) && expr->ops) {
2120 nf_tables_expr_destroy(ctx, expr);
2121 expr = nft_expr_next(expr);
2122 }
2123 kfree(rule);
2124 }
2125
/* Maximum number of expressions nf_tables_newrule() accepts in one rule. */
#define NFT_RULE_MAXEXPRS	128

/*
 * Scratch array used by nf_tables_newrule() to hold the parsed expressions
 * of the rule being built, indexed by expression position.
 * NOTE(review): allocated outside this part of the file - presumably with
 * NFT_RULE_MAXEXPRS entries; confirm.
 */
static struct nft_expr_info *info;
2129
2130 static int nf_tables_newrule(struct net *net, struct sock *nlsk,
2131 struct sk_buff *skb, const struct nlmsghdr *nlh,
2132 const struct nlattr * const nla[])
2133 {
2134 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
2135 u8 genmask = nft_genmask_next(net);
2136 struct nft_af_info *afi;
2137 struct nft_table *table;
2138 struct nft_chain *chain;
2139 struct nft_rule *rule, *old_rule = NULL;
2140 struct nft_userdata *udata;
2141 struct nft_trans *trans = NULL;
2142 struct nft_expr *expr;
2143 struct nft_ctx ctx;
2144 struct nlattr *tmp;
2145 unsigned int size, i, n, ulen = 0, usize = 0;
2146 int err, rem;
2147 bool create;
2148 u64 handle, pos_handle;
2149
2150 create = nlh->nlmsg_flags & NLM_F_CREATE ? true : false;
2151
2152 afi = nf_tables_afinfo_lookup(net, nfmsg->nfgen_family, create);
2153 if (IS_ERR(afi))
2154 return PTR_ERR(afi);
2155
2156 table = nf_tables_table_lookup(afi, nla[NFTA_RULE_TABLE], genmask);
2157 if (IS_ERR(table))
2158 return PTR_ERR(table);
2159
2160 chain = nf_tables_chain_lookup(table, nla[NFTA_RULE_CHAIN], genmask);
2161 if (IS_ERR(chain))
2162 return PTR_ERR(chain);
2163
2164 if (nla[NFTA_RULE_HANDLE]) {
2165 handle = be64_to_cpu(nla_get_be64(nla[NFTA_RULE_HANDLE]));
2166 rule = __nf_tables_rule_lookup(chain, handle);
2167 if (IS_ERR(rule))
2168 return PTR_ERR(rule);
2169
2170 if (nlh->nlmsg_flags & NLM_F_EXCL)
2171 return -EEXIST;
2172 if (nlh->nlmsg_flags & NLM_F_REPLACE)
2173 old_rule = rule;
2174 else
2175 return -EOPNOTSUPP;
2176 } else {
2177 if (!create || nlh->nlmsg_flags & NLM_F_REPLACE)
2178 return -EINVAL;
2179 handle = nf_tables_alloc_handle(table);
2180
2181 if (chain->use == UINT_MAX)
2182 return -EOVERFLOW;
2183 }
2184
2185 if (nla[NFTA_RULE_POSITION]) {
2186 if (!(nlh->nlmsg_flags & NLM_F_CREATE))
2187 return -EOPNOTSUPP;
2188
2189 pos_handle = be64_to_cpu(nla_get_be64(nla[NFTA_RULE_POSITION]));
2190 old_rule = __nf_tables_rule_lookup(chain, pos_handle);
2191 if (IS_ERR(old_rule))
2192 return PTR_ERR(old_rule);
2193 }
2194
2195 nft_ctx_init(&ctx, net, skb, nlh, afi, table, chain, nla);
2196
2197 n = 0;
2198 size = 0;
2199 if (nla[NFTA_RULE_EXPRESSIONS]) {
2200 nla_for_each_nested(tmp, nla[NFTA_RULE_EXPRESSIONS], rem) {
2201 err = -EINVAL;
2202 if (nla_type(tmp) != NFTA_LIST_ELEM)
2203 goto err1;
2204 if (n == NFT_RULE_MAXEXPRS)
2205 goto err1;
2206 err = nf_tables_expr_parse(&ctx, tmp, &info[n]);
2207 if (err < 0)
2208 goto err1;
2209 size += info[n].ops->size;
2210 n++;
2211 }
2212 }
2213 /* Check for overflow of dlen field */
2214 err = -EFBIG;
2215 if (size >= 1 << 12)
2216 goto err1;
2217
2218 if (nla[NFTA_RULE_USERDATA]) {
2219 ulen = nla_len(nla[NFTA_RULE_USERDATA]);
2220 if (ulen > 0)
2221 usize = sizeof(struct nft_userdata) + ulen;
2222 }
2223
2224 err = -ENOMEM;
2225 rule = kzalloc(sizeof(*rule) + size + usize, GFP_KERNEL);
2226 if (rule == NULL)
2227 goto err1;
2228
2229 nft_activate_next(net, rule);
2230
2231 rule->handle = handle;
2232 rule->dlen = size;
2233 rule->udata = ulen ? 1 : 0;
2234
2235 if (ulen) {
2236 udata = nft_userdata(rule);
2237 udata->len = ulen - 1;
2238 nla_memcpy(udata->data, nla[NFTA_RULE_USERDATA], ulen);
2239 }
2240
2241 expr = nft_expr_first(rule);
2242 for (i = 0; i < n; i++) {
2243 err = nf_tables_newexpr(&ctx, &info[i], expr);
2244 if (err < 0)
2245 goto err2;
2246 info[i].ops = NULL;
2247 expr = nft_expr_next(expr);
2248 }
2249
2250 if (nlh->nlmsg_flags & NLM_F_REPLACE) {
2251 if (nft_is_active_next(net, old_rule)) {
2252 trans = nft_trans_rule_add(&ctx, NFT_MSG_DELRULE,
2253 old_rule);
2254 if (trans == NULL) {
2255 err = -ENOMEM;
2256 goto err2;
2257 }
2258 nft_deactivate_next(net, old_rule);
2259 chain->use--;
2260 list_add_tail_rcu(&rule->list, &old_rule->list);
2261 } else {
2262 err = -ENOENT;
2263 goto err2;
2264 }
2265 } else if (nlh->nlmsg_flags & NLM_F_APPEND)
2266 if (old_rule)
2267 list_add_rcu(&rule->list, &old_rule->list);
2268 else
2269 list_add_tail_rcu(&rule->list, &chain->rules);
2270 else {
2271 if (old_rule)
2272 list_add_tail_rcu(&rule->list, &old_rule->list);
2273 else
2274 list_add_rcu(&rule->list, &chain->rules);
2275 }
2276
2277 if (nft_trans_rule_add(&ctx, NFT_MSG_NEWRULE, rule) == NULL) {
2278 err = -ENOMEM;
2279 goto err3;
2280 }
2281 chain->use++;
2282 return 0;
2283
2284 err3:
2285 list_del_rcu(&rule->list);
2286 err2:
2287 nf_tables_rule_destroy(&ctx, rule);
2288 err1:
2289 for (i = 0; i < n; i++) {
2290 if (info[i].ops != NULL)
2291 module_put(info[i].ops->type->owner);
2292 }
2293 return err;
2294 }
2295
2296 static int nf_tables_delrule(struct net *net, struct sock *nlsk,
2297 struct sk_buff *skb, const struct nlmsghdr *nlh,
2298 const struct nlattr * const nla[])
2299 {
2300 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
2301 u8 genmask = nft_genmask_next(net);
2302 struct nft_af_info *afi;
2303 struct nft_table *table;
2304 struct nft_chain *chain = NULL;
2305 struct nft_rule *rule;
2306 int family = nfmsg->nfgen_family, err = 0;
2307 struct nft_ctx ctx;
2308
2309 afi = nf_tables_afinfo_lookup(net, family, false);
2310 if (IS_ERR(afi))
2311 return PTR_ERR(afi);
2312
2313 table = nf_tables_table_lookup(afi, nla[NFTA_RULE_TABLE], genmask);
2314 if (IS_ERR(table))
2315 return PTR_ERR(table);
2316
2317 if (nla[NFTA_RULE_CHAIN]) {
2318 chain = nf_tables_chain_lookup(table, nla[NFTA_RULE_CHAIN],
2319 genmask);
2320 if (IS_ERR(chain))
2321 return PTR_ERR(chain);
2322 }
2323
2324 nft_ctx_init(&ctx, net, skb, nlh, afi, table, chain, nla);
2325
2326 if (chain) {
2327 if (nla[NFTA_RULE_HANDLE]) {
2328 rule = nf_tables_rule_lookup(chain,
2329 nla[NFTA_RULE_HANDLE]);
2330 if (IS_ERR(rule))
2331 return PTR_ERR(rule);
2332
2333 err = nft_delrule(&ctx, rule);
2334 } else {
2335 err = nft_delrule_by_chain(&ctx);
2336 }
2337 } else {
2338 list_for_each_entry(chain, &table->chains, list) {
2339 if (!nft_is_active_next(net, chain))
2340 continue;
2341
2342 ctx.chain = chain;
2343 err = nft_delrule_by_chain(&ctx);
2344 if (err < 0)
2345 break;
2346 }
2347 }
2348
2349 return err;
2350 }
2351
2352 /*
2353 * Sets
2354 */
2355
2356 static LIST_HEAD(nf_tables_set_ops);
2357
2358 int nft_register_set(struct nft_set_ops *ops)
2359 {
2360 nfnl_lock(NFNL_SUBSYS_NFTABLES);
2361 list_add_tail_rcu(&ops->list, &nf_tables_set_ops);
2362 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
2363 return 0;
2364 }
2365 EXPORT_SYMBOL_GPL(nft_register_set);
2366
2367 void nft_unregister_set(struct nft_set_ops *ops)
2368 {
2369 nfnl_lock(NFNL_SUBSYS_NFTABLES);
2370 list_del_rcu(&ops->list);
2371 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
2372 }
2373 EXPORT_SYMBOL_GPL(nft_unregister_set);
2374
2375 /*
2376 * Select a set implementation based on the data characteristics and the
2377 * given policy. The total memory use might not be known if no size is
2378 * given, in that case the amount of memory per element is used.
2379 */
2380 static const struct nft_set_ops *
2381 nft_select_set_ops(const struct nlattr * const nla[],
2382 const struct nft_set_desc *desc,
2383 enum nft_set_policies policy)
2384 {
2385 const struct nft_set_ops *ops, *bops;
2386 struct nft_set_estimate est, best;
2387 u32 features;
2388
2389 #ifdef CONFIG_MODULES
2390 if (list_empty(&nf_tables_set_ops)) {
2391 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
2392 request_module("nft-set");
2393 nfnl_lock(NFNL_SUBSYS_NFTABLES);
2394 if (!list_empty(&nf_tables_set_ops))
2395 return ERR_PTR(-EAGAIN);
2396 }
2397 #endif
2398 features = 0;
2399 if (nla[NFTA_SET_FLAGS] != NULL) {
2400 features = ntohl(nla_get_be32(nla[NFTA_SET_FLAGS]));
2401 features &= NFT_SET_INTERVAL | NFT_SET_MAP | NFT_SET_TIMEOUT;
2402 }
2403
2404 bops = NULL;
2405 best.size = ~0;
2406 best.class = ~0;
2407
2408 list_for_each_entry(ops, &nf_tables_set_ops, list) {
2409 if ((ops->features & features) != features)
2410 continue;
2411 if (!ops->estimate(desc, features, &est))
2412 continue;
2413
2414 switch (policy) {
2415 case NFT_SET_POL_PERFORMANCE:
2416 if (est.class < best.class)
2417 break;
2418 if (est.class == best.class && est.size < best.size)
2419 break;
2420 continue;
2421 case NFT_SET_POL_MEMORY:
2422 if (est.size < best.size)
2423 break;
2424 if (est.size == best.size && est.class < best.class)
2425 break;
2426 continue;
2427 default:
2428 break;
2429 }
2430
2431 if (!try_module_get(ops->owner))
2432 continue;
2433 if (bops != NULL)
2434 module_put(bops->owner);
2435
2436 bops = ops;
2437 best = est;
2438 }
2439
2440 if (bops != NULL)
2441 return bops;
2442
2443 return ERR_PTR(-EOPNOTSUPP);
2444 }
2445
2446 static const struct nla_policy nft_set_policy[NFTA_SET_MAX + 1] = {
2447 [NFTA_SET_TABLE] = { .type = NLA_STRING,
2448 .len = NFT_TABLE_MAXNAMELEN - 1 },
2449 [NFTA_SET_NAME] = { .type = NLA_STRING,
2450 .len = NFT_SET_MAXNAMELEN - 1 },
2451 [NFTA_SET_FLAGS] = { .type = NLA_U32 },
2452 [NFTA_SET_KEY_TYPE] = { .type = NLA_U32 },
2453 [NFTA_SET_KEY_LEN] = { .type = NLA_U32 },
2454 [NFTA_SET_DATA_TYPE] = { .type = NLA_U32 },
2455 [NFTA_SET_DATA_LEN] = { .type = NLA_U32 },
2456 [NFTA_SET_POLICY] = { .type = NLA_U32 },
2457 [NFTA_SET_DESC] = { .type = NLA_NESTED },
2458 [NFTA_SET_ID] = { .type = NLA_U32 },
2459 [NFTA_SET_TIMEOUT] = { .type = NLA_U64 },
2460 [NFTA_SET_GC_INTERVAL] = { .type = NLA_U32 },
2461 [NFTA_SET_USERDATA] = { .type = NLA_BINARY,
2462 .len = NFT_USERDATA_MAXLEN },
2463 [NFTA_SET_OBJ_TYPE] = { .type = NLA_U32 },
2464 };
2465
2466 static const struct nla_policy nft_set_desc_policy[NFTA_SET_DESC_MAX + 1] = {
2467 [NFTA_SET_DESC_SIZE] = { .type = NLA_U32 },
2468 };
2469
2470 static int nft_ctx_init_from_setattr(struct nft_ctx *ctx, struct net *net,
2471 const struct sk_buff *skb,
2472 const struct nlmsghdr *nlh,
2473 const struct nlattr * const nla[],
2474 u8 genmask)
2475 {
2476 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
2477 struct nft_af_info *afi = NULL;
2478 struct nft_table *table = NULL;
2479
2480 if (nfmsg->nfgen_family != NFPROTO_UNSPEC) {
2481 afi = nf_tables_afinfo_lookup(net, nfmsg->nfgen_family, false);
2482 if (IS_ERR(afi))
2483 return PTR_ERR(afi);
2484 }
2485
2486 if (nla[NFTA_SET_TABLE] != NULL) {
2487 if (afi == NULL)
2488 return -EAFNOSUPPORT;
2489
2490 table = nf_tables_table_lookup(afi, nla[NFTA_SET_TABLE],
2491 genmask);
2492 if (IS_ERR(table))
2493 return PTR_ERR(table);
2494 }
2495
2496 nft_ctx_init(ctx, net, skb, nlh, afi, table, NULL, nla);
2497 return 0;
2498 }
2499
2500 struct nft_set *nf_tables_set_lookup(const struct nft_table *table,
2501 const struct nlattr *nla, u8 genmask)
2502 {
2503 struct nft_set *set;
2504
2505 if (nla == NULL)
2506 return ERR_PTR(-EINVAL);
2507
2508 list_for_each_entry(set, &table->sets, list) {
2509 if (!nla_strcmp(nla, set->name) &&
2510 nft_active_genmask(set, genmask))
2511 return set;
2512 }
2513 return ERR_PTR(-ENOENT);
2514 }
2515 EXPORT_SYMBOL_GPL(nf_tables_set_lookup);
2516
2517 struct nft_set *nf_tables_set_lookup_byid(const struct net *net,
2518 const struct nlattr *nla,
2519 u8 genmask)
2520 {
2521 struct nft_trans *trans;
2522 u32 id = ntohl(nla_get_be32(nla));
2523
2524 list_for_each_entry(trans, &net->nft.commit_list, list) {
2525 struct nft_set *set = nft_trans_set(trans);
2526
2527 if (trans->msg_type == NFT_MSG_NEWSET &&
2528 id == nft_trans_set_id(trans) &&
2529 nft_active_genmask(set, genmask))
2530 return set;
2531 }
2532 return ERR_PTR(-ENOENT);
2533 }
2534 EXPORT_SYMBOL_GPL(nf_tables_set_lookup_byid);
2535
2536 static int nf_tables_set_alloc_name(struct nft_ctx *ctx, struct nft_set *set,
2537 const char *name)
2538 {
2539 const struct nft_set *i;
2540 const char *p;
2541 unsigned long *inuse;
2542 unsigned int n = 0, min = 0;
2543
2544 p = strnchr(name, NFT_SET_MAXNAMELEN, '%');
2545 if (p != NULL) {
2546 if (p[1] != 'd' || strchr(p + 2, '%'))
2547 return -EINVAL;
2548
2549 inuse = (unsigned long *)get_zeroed_page(GFP_KERNEL);
2550 if (inuse == NULL)
2551 return -ENOMEM;
2552 cont:
2553 list_for_each_entry(i, &ctx->table->sets, list) {
2554 int tmp;
2555
2556 if (!nft_is_active_next(ctx->net, set))
2557 continue;
2558 if (!sscanf(i->name, name, &tmp))
2559 continue;
2560 if (tmp < min || tmp >= min + BITS_PER_BYTE * PAGE_SIZE)
2561 continue;
2562
2563 set_bit(tmp - min, inuse);
2564 }
2565
2566 n = find_first_zero_bit(inuse, BITS_PER_BYTE * PAGE_SIZE);
2567 if (n >= BITS_PER_BYTE * PAGE_SIZE) {
2568 min += BITS_PER_BYTE * PAGE_SIZE;
2569 memset(inuse, 0, PAGE_SIZE);
2570 goto cont;
2571 }
2572 free_page((unsigned long)inuse);
2573 }
2574
2575 snprintf(set->name, sizeof(set->name), name, min + n);
2576 list_for_each_entry(i, &ctx->table->sets, list) {
2577 if (!nft_is_active_next(ctx->net, i))
2578 continue;
2579 if (!strcmp(set->name, i->name))
2580 return -ENFILE;
2581 }
2582 return 0;
2583 }
2584
2585 static int nf_tables_fill_set(struct sk_buff *skb, const struct nft_ctx *ctx,
2586 const struct nft_set *set, u16 event, u16 flags)
2587 {
2588 struct nfgenmsg *nfmsg;
2589 struct nlmsghdr *nlh;
2590 struct nlattr *desc;
2591 u32 portid = ctx->portid;
2592 u32 seq = ctx->seq;
2593
2594 event |= NFNL_SUBSYS_NFTABLES << 8;
2595 nlh = nlmsg_put(skb, portid, seq, event, sizeof(struct nfgenmsg),
2596 flags);
2597 if (nlh == NULL)
2598 goto nla_put_failure;
2599
2600 nfmsg = nlmsg_data(nlh);
2601 nfmsg->nfgen_family = ctx->afi->family;
2602 nfmsg->version = NFNETLINK_V0;
2603 nfmsg->res_id = htons(ctx->net->nft.base_seq & 0xffff);
2604
2605 if (nla_put_string(skb, NFTA_SET_TABLE, ctx->table->name))
2606 goto nla_put_failure;
2607 if (nla_put_string(skb, NFTA_SET_NAME, set->name))
2608 goto nla_put_failure;
2609 if (set->flags != 0)
2610 if (nla_put_be32(skb, NFTA_SET_FLAGS, htonl(set->flags)))
2611 goto nla_put_failure;
2612
2613 if (nla_put_be32(skb, NFTA_SET_KEY_TYPE, htonl(set->ktype)))
2614 goto nla_put_failure;
2615 if (nla_put_be32(skb, NFTA_SET_KEY_LEN, htonl(set->klen)))
2616 goto nla_put_failure;
2617 if (set->flags & NFT_SET_MAP) {
2618 if (nla_put_be32(skb, NFTA_SET_DATA_TYPE, htonl(set->dtype)))
2619 goto nla_put_failure;
2620 if (nla_put_be32(skb, NFTA_SET_DATA_LEN, htonl(set->dlen)))
2621 goto nla_put_failure;
2622 }
2623 if (set->flags & NFT_SET_OBJECT &&
2624 nla_put_be32(skb, NFTA_SET_OBJ_TYPE, htonl(set->objtype)))
2625 goto nla_put_failure;
2626
2627 if (set->timeout &&
2628 nla_put_be64(skb, NFTA_SET_TIMEOUT,
2629 cpu_to_be64(jiffies_to_msecs(set->timeout)),
2630 NFTA_SET_PAD))
2631 goto nla_put_failure;
2632 if (set->gc_int &&
2633 nla_put_be32(skb, NFTA_SET_GC_INTERVAL, htonl(set->gc_int)))
2634 goto nla_put_failure;
2635
2636 if (set->policy != NFT_SET_POL_PERFORMANCE) {
2637 if (nla_put_be32(skb, NFTA_SET_POLICY, htonl(set->policy)))
2638 goto nla_put_failure;
2639 }
2640
2641 if (nla_put(skb, NFTA_SET_USERDATA, set->udlen, set->udata))
2642 goto nla_put_failure;
2643
2644 desc = nla_nest_start(skb, NFTA_SET_DESC);
2645 if (desc == NULL)
2646 goto nla_put_failure;
2647 if (set->size &&
2648 nla_put_be32(skb, NFTA_SET_DESC_SIZE, htonl(set->size)))
2649 goto nla_put_failure;
2650 nla_nest_end(skb, desc);
2651
2652 nlmsg_end(skb, nlh);
2653 return 0;
2654
2655 nla_put_failure:
2656 nlmsg_trim(skb, nlh);
2657 return -1;
2658 }
2659
2660 static int nf_tables_set_notify(const struct nft_ctx *ctx,
2661 const struct nft_set *set,
2662 int event, gfp_t gfp_flags)
2663 {
2664 struct sk_buff *skb;
2665 u32 portid = ctx->portid;
2666 int err;
2667
2668 if (!ctx->report &&
2669 !nfnetlink_has_listeners(ctx->net, NFNLGRP_NFTABLES))
2670 return 0;
2671
2672 err = -ENOBUFS;
2673 skb = nlmsg_new(NLMSG_GOODSIZE, gfp_flags);
2674 if (skb == NULL)
2675 goto err;
2676
2677 err = nf_tables_fill_set(skb, ctx, set, event, 0);
2678 if (err < 0) {
2679 kfree_skb(skb);
2680 goto err;
2681 }
2682
2683 err = nfnetlink_send(skb, ctx->net, portid, NFNLGRP_NFTABLES,
2684 ctx->report, gfp_flags);
2685 err:
2686 if (err < 0)
2687 nfnetlink_set_err(ctx->net, portid, NFNLGRP_NFTABLES, err);
2688 return err;
2689 }
2690
/*
 * Netlink dump callback that emits one NFT_MSG_NEWSET message per set.
 *
 * cb->data points to a struct nft_ctx; when its ->afi or ->table is
 * non-NULL, the dump is restricted to that family or table. The resume
 * state between invocations lives in cb->args[]:
 *
 *   args[0] - index of the set to continue from within the resumed table
 *   args[1] - non-zero once every set has been dumped
 *   args[2] - table in which the previous invocation ran out of room
 *   args[3] - address family in which the previous invocation ran out of room
 *
 * Always returns skb->len.
 */
2691 static int nf_tables_dump_sets(struct sk_buff *skb, struct netlink_callback *cb)
2692 {
2693 const struct nft_set *set;
2694 unsigned int idx, s_idx = cb->args[0];
2695 struct nft_af_info *afi;
2696 struct nft_table *table, *cur_table = (struct nft_table *)cb->args[2];
2697 struct net *net = sock_net(skb->sk);
2698 int cur_family = cb->args[3];
2699 struct nft_ctx *ctx = cb->data, ctx_set;
2700
/* A previous invocation already walked everything. */
2701 if (cb->args[1])
2702 return skb->len;
2703
2704 rcu_read_lock();
2705 cb->seq = net->nft.base_seq;
2706
2707 list_for_each_entry_rcu(afi, &net->nft.af_info, list) {
2708 if (ctx->afi && ctx->afi != afi)
2709 continue;
2710
/* When resuming, skip families until the saved one is reached. */
2711 if (cur_family) {
2712 if (afi->family != cur_family)
2713 continue;
2714
2715 cur_family = 0;
2716 }
2717 list_for_each_entry_rcu(table, &afi->tables, list) {
2718 if (ctx->table && ctx->table != table)
2719 continue;
2720
/* When resuming, skip tables until the saved one is reached. */
2721 if (cur_table) {
2722 if (cur_table != table)
2723 continue;
2724
2725 cur_table = NULL;
2726 }
2727 idx = 0;
2728 list_for_each_entry_rcu(set, &table->sets, list) {
/* Sets below the saved index were dumped by an earlier invocation. */
2729 if (idx < s_idx)
2730 goto cont;
2731 if (!nft_is_active(net, set))
2732 goto cont;
2733
/* Fill with a copy of the context that names this table and family. */
2734 ctx_set = *ctx;
2735 ctx_set.table = table;
2736 ctx_set.afi = afi;
2737 if (nf_tables_fill_set(skb, &ctx_set, set,
2738 NFT_MSG_NEWSET,
2739 NLM_F_MULTI) < 0) {
/* Filling failed: record where to pick up on the next invocation. */
2740 cb->args[0] = idx;
2741 cb->args[2] = (unsigned long) table;
2742 cb->args[3] = afi->family;
2743 goto done;
2744 }
2745 nl_dump_check_consistent(cb, nlmsg_hdr(skb));
2746 cont:
2747 idx++;
2748 }
/* The saved index only applies to the first table visited. */
2749 if (s_idx)
2750 s_idx = 0;
2751 }
2752 }
/* All families and tables were walked; mark the dump as complete. */
2753 cb->args[1] = 1;
2754 done:
2755 rcu_read_unlock();
2756 return skb->len;
2757 }
2758
2759 static int nf_tables_dump_sets_done(struct netlink_callback *cb)
2760 {
2761 kfree(cb->data);
2762 return 0;
2763 }
2764
2765 static int nf_tables_getset(struct net *net, struct sock *nlsk,
2766 struct sk_buff *skb, const struct nlmsghdr *nlh,
2767 const struct nlattr * const nla[])
2768 {
2769 u8 genmask = nft_genmask_cur(net);
2770 const struct nft_set *set;
2771 struct nft_ctx ctx;
2772 struct sk_buff *skb2;
2773 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
2774 int err;
2775
2776 /* Verify existence before starting dump */
2777 err = nft_ctx_init_from_setattr(&ctx, net, skb, nlh, nla, genmask);
2778 if (err < 0)
2779 return err;
2780
2781 if (nlh->nlmsg_flags & NLM_F_DUMP) {
2782 struct netlink_dump_control c = {
2783 .dump = nf_tables_dump_sets,
2784 .done = nf_tables_dump_sets_done,
2785 };
2786 struct nft_ctx *ctx_dump;
2787
2788 ctx_dump = kmalloc(sizeof(*ctx_dump), GFP_KERNEL);
2789 if (ctx_dump == NULL)
2790 return -ENOMEM;
2791
2792 *ctx_dump = ctx;
2793 c.data = ctx_dump;
2794
2795 return netlink_dump_start(nlsk, skb, nlh, &c);
2796 }
2797
2798 /* Only accept unspec with dump */
2799 if (nfmsg->nfgen_family == NFPROTO_UNSPEC)
2800 return -EAFNOSUPPORT;
2801 if (!nla[NFTA_SET_TABLE])
2802 return -EINVAL;
2803
2804 set = nf_tables_set_lookup(ctx.table, nla[NFTA_SET_NAME], genmask);
2805 if (IS_ERR(set))
2806 return PTR_ERR(set);
2807
2808 skb2 = alloc_skb(NLMSG_GOODSIZE, GFP_KERNEL);
2809 if (skb2 == NULL)
2810 return -ENOMEM;
2811
2812 err = nf_tables_fill_set(skb2, &ctx, set, NFT_MSG_NEWSET, 0);
2813 if (err < 0)
2814 goto err;
2815
2816 return nlmsg_unicast(nlsk, skb2, NETLINK_CB(skb).portid);
2817
2818 err:
2819 kfree_skb(skb2);
2820 return err;
2821 }
2822
2823 static int nf_tables_set_desc_parse(const struct nft_ctx *ctx,
2824 struct nft_set_desc *desc,
2825 const struct nlattr *nla)
2826 {
2827 struct nlattr *da[NFTA_SET_DESC_MAX + 1];
2828 int err;
2829
2830 err = nla_parse_nested(da, NFTA_SET_DESC_MAX, nla, nft_set_desc_policy);
2831 if (err < 0)
2832 return err;
2833
2834 if (da[NFTA_SET_DESC_SIZE] != NULL)
2835 desc->size = ntohl(nla_get_be32(da[NFTA_SET_DESC_SIZE]));
2836
2837 return 0;
2838 }
2839
/*
 * Handle a request to create a set.
 *
 * NFTA_SET_TABLE, NFTA_SET_NAME, NFTA_SET_KEY_LEN and NFTA_SET_ID are
 * mandatory. All attributes are validated first; then the family and table
 * are looked up in the next generation. If a set with the requested name
 * already exists, 0 is returned unless NLM_F_EXCL (-EEXIST) or
 * NLM_F_REPLACE (-EOPNOTSUPP) is set. If it does not exist, NLM_F_CREATE is
 * required (-ENOENT otherwise); a set implementation is selected, the set
 * is allocated and initialized, a NFT_MSG_NEWSET transaction is queued and
 * the set is linked into the table.
 *
 * Returns 0 on success or a negative errno code.
 */
2840 static int nf_tables_newset(struct net *net, struct sock *nlsk,
2841 struct sk_buff *skb, const struct nlmsghdr *nlh,
2842 const struct nlattr * const nla[])
2843 {
2844 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
2845 u8 genmask = nft_genmask_next(net);
2846 const struct nft_set_ops *ops;
2847 struct nft_af_info *afi;
2848 struct nft_table *table;
2849 struct nft_set *set;
2850 struct nft_ctx ctx;
2851 char name[NFT_SET_MAXNAMELEN];
2852 unsigned int size;
2853 bool create;
2854 u64 timeout;
2855 u32 ktype, dtype, flags, policy, gc_int, objtype;
2856 struct nft_set_desc desc;
2857 unsigned char *udata;
2858 u16 udlen;
2859 int err;
2860
2861 if (nla[NFTA_SET_TABLE] == NULL ||
2862 nla[NFTA_SET_NAME] == NULL ||
2863 nla[NFTA_SET_KEY_LEN] == NULL ||
2864 nla[NFTA_SET_ID] == NULL)
2865 return -EINVAL;
2866
2867 memset(&desc, 0, sizeof(desc));
2868
/* Key type defaults to NFT_DATA_VALUE; fully reserved types are rejected. */
2869 ktype = NFT_DATA_VALUE;
2870 if (nla[NFTA_SET_KEY_TYPE] != NULL) {
2871 ktype = ntohl(nla_get_be32(nla[NFTA_SET_KEY_TYPE]));
2872 if ((ktype & NFT_DATA_RESERVED_MASK) == NFT_DATA_RESERVED_MASK)
2873 return -EINVAL;
2874 }
2875
2876 desc.klen = ntohl(nla_get_be32(nla[NFTA_SET_KEY_LEN]));
2877 if (desc.klen == 0 || desc.klen > NFT_DATA_VALUE_MAXLEN)
2878 return -EINVAL;
2879
2880 flags = 0;
2881 if (nla[NFTA_SET_FLAGS] != NULL) {
2882 flags = ntohl(nla_get_be32(nla[NFTA_SET_FLAGS]));
2883 if (flags & ~(NFT_SET_ANONYMOUS | NFT_SET_CONSTANT |
2884 NFT_SET_INTERVAL | NFT_SET_TIMEOUT |
2885 NFT_SET_MAP | NFT_SET_EVAL |
2886 NFT_SET_OBJECT))
2887 return -EINVAL;
/*
 * NOTE(review): as written, this only rejects the case where MAP, EVAL and
 * OBJECT are all set together; any two of them still pass. Confirm whether
 * that matches the intent stated in the comment below.
 */
2888 /* Only one of these operations is supported */
2889 if ((flags & (NFT_SET_MAP | NFT_SET_EVAL | NFT_SET_OBJECT)) ==
2890 (NFT_SET_MAP | NFT_SET_EVAL | NFT_SET_OBJECT))
2891 return -EOPNOTSUPP;
2892 }
2893
/*
 * A data type is only valid for maps and mandatory for them. Verdict data
 * has a fixed length; any other data type needs NFTA_SET_DATA_LEN.
 */
2894 dtype = 0;
2895 if (nla[NFTA_SET_DATA_TYPE] != NULL) {
2896 if (!(flags & NFT_SET_MAP))
2897 return -EINVAL;
2898
2899 dtype = ntohl(nla_get_be32(nla[NFTA_SET_DATA_TYPE]));
2900 if ((dtype & NFT_DATA_RESERVED_MASK) == NFT_DATA_RESERVED_MASK &&
2901 dtype != NFT_DATA_VERDICT)
2902 return -EINVAL;
2903
2904 if (dtype != NFT_DATA_VERDICT) {
2905 if (nla[NFTA_SET_DATA_LEN] == NULL)
2906 return -EINVAL;
2907 desc.dlen = ntohl(nla_get_be32(nla[NFTA_SET_DATA_LEN]));
2908 if (desc.dlen == 0 || desc.dlen > NFT_DATA_VALUE_MAXLEN)
2909 return -EINVAL;
2910 } else
2911 desc.dlen = sizeof(struct nft_verdict);
2912 } else if (flags & NFT_SET_MAP)
2913 return -EINVAL;
2914
/* Likewise, an object type is only valid for, and required by, object sets. */
2915 if (nla[NFTA_SET_OBJ_TYPE] != NULL) {
2916 if (!(flags & NFT_SET_OBJECT))
2917 return -EINVAL;
2918
2919 objtype = ntohl(nla_get_be32(nla[NFTA_SET_OBJ_TYPE]));
2920 if (objtype == NFT_OBJECT_UNSPEC ||
2921 objtype > NFT_OBJECT_MAX)
2922 return -EINVAL;
2923 } else if (flags & NFT_SET_OBJECT)
2924 return -EINVAL;
2925 else
2926 objtype = NFT_OBJECT_UNSPEC;
2927
/* Timeout and GC interval both require NFT_SET_TIMEOUT. */
2928 timeout = 0;
2929 if (nla[NFTA_SET_TIMEOUT] != NULL) {
2930 if (!(flags & NFT_SET_TIMEOUT))
2931 return -EINVAL;
/* The attribute is in milliseconds; it is stored in jiffies. */
2932 timeout = msecs_to_jiffies(be64_to_cpu(nla_get_be64(
2933 nla[NFTA_SET_TIMEOUT])));
2934 }
2935 gc_int = 0;
2936 if (nla[NFTA_SET_GC_INTERVAL] != NULL) {
2937 if (!(flags & NFT_SET_TIMEOUT))
2938 return -EINVAL;
2939 gc_int = ntohl(nla_get_be32(nla[NFTA_SET_GC_INTERVAL]));
2940 }
2941
2942 policy = NFT_SET_POL_PERFORMANCE;
2943 if (nla[NFTA_SET_POLICY] != NULL)
2944 policy = ntohl(nla_get_be32(nla[NFTA_SET_POLICY]));
2945
/*
 * ctx has not been initialized yet at this point (nft_ctx_init() is called
 * further down); nf_tables_set_desc_parse() does not read it.
 */
2946 if (nla[NFTA_SET_DESC] != NULL) {
2947 err = nf_tables_set_desc_parse(&ctx, &desc, nla[NFTA_SET_DESC]);
2948 if (err < 0)
2949 return err;
2950 }
2951
2952 create = nlh->nlmsg_flags & NLM_F_CREATE ? true : false;
2953
2954 afi = nf_tables_afinfo_lookup(net, nfmsg->nfgen_family, create);
2955 if (IS_ERR(afi))
2956 return PTR_ERR(afi);
2957
2958 table = nf_tables_table_lookup(afi, nla[NFTA_SET_TABLE], genmask);
2959 if (IS_ERR(table))
2960 return PTR_ERR(table);
2961
2962 nft_ctx_init(&ctx, net, skb, nlh, afi, table, NULL, nla);
2963
/* An existing set is never modified: report it according to the flags. */
2964 set = nf_tables_set_lookup(table, nla[NFTA_SET_NAME], genmask);
2965 if (IS_ERR(set)) {
2966 if (PTR_ERR(set) != -ENOENT)
2967 return PTR_ERR(set);
2968 } else {
2969 if (nlh->nlmsg_flags & NLM_F_EXCL)
2970 return -EEXIST;
2971 if (nlh->nlmsg_flags & NLM_F_REPLACE)
2972 return -EOPNOTSUPP;
2973 return 0;
2974 }
2975
2976 if (!(nlh->nlmsg_flags & NLM_F_CREATE))
2977 return -ENOENT;
2978
/* On success ops carries a module reference, dropped at err1 on failure. */
2979 ops = nft_select_set_ops(nla, &desc, policy);
2980 if (IS_ERR(ops))
2981 return PTR_ERR(ops);
2982
2983 udlen = 0;
2984 if (nla[NFTA_SET_USERDATA])
2985 udlen = nla_len(nla[NFTA_SET_USERDATA]);
2986
2987 size = 0;
2988 if (ops->privsize != NULL)
2989 size = ops->privsize(nla);
2990
/*
 * One allocation holds the set, the implementation's private area (size
 * bytes) and the user data (udlen bytes), in that order.
 */
2991 err = -ENOMEM;
2992 set = kzalloc(sizeof(*set) + size + udlen, GFP_KERNEL);
2993 if (set == NULL)
2994 goto err1;
2995
2996 nla_strlcpy(name, nla[NFTA_SET_NAME], sizeof(set->name));
2997 err = nf_tables_set_alloc_name(&ctx, set, name);
2998 if (err < 0)
2999 goto err2;
3000
3001 udata = NULL;
3002 if (udlen) {
/* User data is stored right behind the private area. */
3003 udata = set->data + size;
3004 nla_memcpy(udata, nla[NFTA_SET_USERDATA], udlen);
3005 }
3006
3007 INIT_LIST_HEAD(&set->bindings);
3008 set->ops = ops;
3009 set->ktype = ktype;
3010 set->klen = desc.klen;
3011 set->dtype = dtype;
3012 set->objtype = objtype;
3013 set->dlen = desc.dlen;
3014 set->flags = flags;
3015 set->size = desc.size;
3016 set->policy = policy;
3017 set->udlen = udlen;
3018 set->udata = udata;
3019 set->timeout = timeout;
3020 set->gc_int = gc_int;
3021
3022 err = ops->init(set, &desc, nla);
3023 if (err < 0)
3024 goto err2;
3025
3026 err = nft_trans_set_add(&ctx, NFT_MSG_NEWSET, set);
3027 if (err < 0)
3028 goto err3;
3029
3030 list_add_tail_rcu(&set->list, &table->sets);
3031 table->use++;
3032 return 0;
3033
/* Unwind in reverse order of setup: backend state, memory, module ref. */
3034 err3:
3035 ops->destroy(set);
3036 err2:
3037 kfree(set);
3038 err1:
3039 module_put(ops->owner);
3040 return err;
3041 }
3042
3043 static void nft_set_destroy(struct nft_set *set)
3044 {
3045 set->ops->destroy(set);
3046 module_put(set->ops->owner);
3047 kfree(set);
3048 }
3049
3050 static void nf_tables_set_destroy(const struct nft_ctx *ctx, struct nft_set *set)
3051 {
3052 list_del_rcu(&set->list);
3053 nf_tables_set_notify(ctx, set, NFT_MSG_DELSET, GFP_ATOMIC);
3054 nft_set_destroy(set);
3055 }
3056
3057 static int nf_tables_delset(struct net *net, struct sock *nlsk,
3058 struct sk_buff *skb, const struct nlmsghdr *nlh,
3059 const struct nlattr * const nla[])
3060 {
3061 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
3062 u8 genmask = nft_genmask_next(net);
3063 struct nft_set *set;
3064 struct nft_ctx ctx;
3065 int err;
3066
3067 if (nfmsg->nfgen_family == NFPROTO_UNSPEC)
3068 return -EAFNOSUPPORT;
3069 if (nla[NFTA_SET_TABLE] == NULL)
3070 return -EINVAL;
3071
3072 err = nft_ctx_init_from_setattr(&ctx, net, skb, nlh, nla, genmask);
3073 if (err < 0)
3074 return err;
3075
3076 set = nf_tables_set_lookup(ctx.table, nla[NFTA_SET_NAME], genmask);
3077 if (IS_ERR(set))
3078 return PTR_ERR(set);
3079 if (!list_empty(&set->bindings))
3080 return -EBUSY;
3081
3082 return nft_delset(&ctx, set);
3083 }
3084
3085 static int nf_tables_bind_check_setelem(const struct nft_ctx *ctx,
3086 struct nft_set *set,
3087 const struct nft_set_iter *iter,
3088 struct nft_set_elem *elem)
3089 {
3090 const struct nft_set_ext *ext = nft_set_elem_ext(set, elem->priv);
3091 enum nft_registers dreg;
3092
3093 dreg = nft_type_to_reg(set->dtype);
3094 return nft_validate_register_store(ctx, dreg, nft_set_ext_data(ext),
3095 set->dtype == NFT_DATA_VERDICT ?
3096 NFT_DATA_VERDICT : NFT_DATA_VALUE,
3097 set->dlen);
3098 }
3099
3100 int nf_tables_bind_set(const struct nft_ctx *ctx, struct nft_set *set,
3101 struct nft_set_binding *binding)
3102 {
3103 struct nft_set_binding *i;
3104 struct nft_set_iter iter;
3105
3106 if (!list_empty(&set->bindings) && set->flags & NFT_SET_ANONYMOUS)
3107 return -EBUSY;
3108
3109 if (binding->flags & NFT_SET_MAP) {
3110 /* If the set is already bound to the same chain all
3111 * jumps are already validated for that chain.
3112 */
3113 list_for_each_entry(i, &set->bindings, list) {
3114 if (i->flags & NFT_SET_MAP &&
3115 i->chain == binding->chain)
3116 goto bind;
3117 }
3118
3119 iter.genmask = nft_genmask_next(ctx->net);
3120 iter.skip = 0;
3121 iter.count = 0;
3122 iter.err = 0;
3123 iter.fn = nf_tables_bind_check_setelem;
3124
3125 set->ops->walk(ctx, set, &iter);
3126 if (iter.err < 0)
3127 return iter.err;
3128 }
3129 bind:
3130 binding->chain = ctx->chain;
3131 list_add_tail_rcu(&binding->list, &set->bindings);
3132 return 0;
3133 }
3134 EXPORT_SYMBOL_GPL(nf_tables_bind_set);
3135
3136 void nf_tables_unbind_set(const struct nft_ctx *ctx, struct nft_set *set,
3137 struct nft_set_binding *binding)
3138 {
3139 list_del_rcu(&binding->list);
3140
3141 if (list_empty(&set->bindings) && set->flags & NFT_SET_ANONYMOUS &&
3142 nft_is_active(ctx->net, set))
3143 nf_tables_set_destroy(ctx, set);
3144 }
3145 EXPORT_SYMBOL_GPL(nf_tables_unbind_set);
3146
3147 const struct nft_set_ext_type nft_set_ext_types[] = {
3148 [NFT_SET_EXT_KEY] = {
3149 .align = __alignof__(u32),
3150 },
3151 [NFT_SET_EXT_DATA] = {
3152 .align = __alignof__(u32),
3153 },
3154 [NFT_SET_EXT_EXPR] = {
3155 .align = __alignof__(struct nft_expr),
3156 },
3157 [NFT_SET_EXT_OBJREF] = {
3158 .len = sizeof(struct nft_object *),
3159 .align = __alignof__(struct nft_object *),
3160 },
3161 [NFT_SET_EXT_FLAGS] = {
3162 .len = sizeof(u8),
3163 .align = __alignof__(u8),
3164 },
3165 [NFT_SET_EXT_TIMEOUT] = {
3166 .len = sizeof(u64),
3167 .align = __alignof__(u64),
3168 },
3169 [NFT_SET_EXT_EXPIRATION] = {
3170 .len = sizeof(unsigned long),
3171 .align = __alignof__(unsigned long),
3172 },
3173 [NFT_SET_EXT_USERDATA] = {
3174 .len = sizeof(struct nft_userdata),
3175 .align = __alignof__(struct nft_userdata),
3176 },
3177 };
3178 EXPORT_SYMBOL_GPL(nft_set_ext_types);
3179
3180 /*
3181 * Set elements
3182 */
3183
3184 static const struct nla_policy nft_set_elem_policy[NFTA_SET_ELEM_MAX + 1] = {
3185 [NFTA_SET_ELEM_KEY] = { .type = NLA_NESTED },
3186 [NFTA_SET_ELEM_DATA] = { .type = NLA_NESTED },
3187 [NFTA_SET_ELEM_FLAGS] = { .type = NLA_U32 },
3188 [NFTA_SET_ELEM_TIMEOUT] = { .type = NLA_U64 },
3189 [NFTA_SET_ELEM_USERDATA] = { .type = NLA_BINARY,
3190 .len = NFT_USERDATA_MAXLEN },
3191 };
3192
3193 static const struct nla_policy nft_set_elem_list_policy[NFTA_SET_ELEM_LIST_MAX + 1] = {
3194 [NFTA_SET_ELEM_LIST_TABLE] = { .type = NLA_STRING,
3195 .len = NFT_TABLE_MAXNAMELEN - 1 },
3196 [NFTA_SET_ELEM_LIST_SET] = { .type = NLA_STRING,
3197 .len = NFT_SET_MAXNAMELEN - 1 },
3198 [NFTA_SET_ELEM_LIST_ELEMENTS] = { .type = NLA_NESTED },
3199 [NFTA_SET_ELEM_LIST_SET_ID] = { .type = NLA_U32 },
3200 };
3201
3202 static int nft_ctx_init_from_elemattr(struct nft_ctx *ctx, struct net *net,
3203 const struct sk_buff *skb,
3204 const struct nlmsghdr *nlh,
3205 const struct nlattr * const nla[],
3206 u8 genmask)
3207 {
3208 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
3209 struct nft_af_info *afi;
3210 struct nft_table *table;
3211
3212 afi = nf_tables_afinfo_lookup(net, nfmsg->nfgen_family, false);
3213 if (IS_ERR(afi))
3214 return PTR_ERR(afi);
3215
3216 table = nf_tables_table_lookup(afi, nla[NFTA_SET_ELEM_LIST_TABLE],
3217 genmask);
3218 if (IS_ERR(table))
3219 return PTR_ERR(table);
3220
3221 nft_ctx_init(ctx, net, skb, nlh, afi, table, NULL, nla);
3222 return 0;
3223 }
3224
/*
 * Append one set element to @skb as a nested NFTA_LIST_ELEM attribute.
 *
 * The key is always emitted; data, expression, object reference, flags,
 * timeout, expiration and user data are emitted only if the corresponding
 * extension exists on the element.
 *
 * Returns 0 on success. On failure everything added by this call is
 * trimmed from @skb again and -EMSGSIZE is returned.
 */
3225 static int nf_tables_fill_setelem(struct sk_buff *skb,
3226 const struct nft_set *set,
3227 const struct nft_set_elem *elem)
3228 {
3229 const struct nft_set_ext *ext = nft_set_elem_ext(set, elem->priv);
/* Remember the current tail so a partial element can be trimmed on error. */
3230 unsigned char *b = skb_tail_pointer(skb);
3231 struct nlattr *nest;
3232
3233 nest = nla_nest_start(skb, NFTA_LIST_ELEM);
3234 if (nest == NULL)
3235 goto nla_put_failure;
3236
3237 if (nft_data_dump(skb, NFTA_SET_ELEM_KEY, nft_set_ext_key(ext),
3238 NFT_DATA_VALUE, set->klen) < 0)
3239 goto nla_put_failure;
3240
/* Data is dumped as a verdict or as a plain value, depending on the set. */
3241 if (nft_set_ext_exists(ext, NFT_SET_EXT_DATA) &&
3242 nft_data_dump(skb, NFTA_SET_ELEM_DATA, nft_set_ext_data(ext),
3243 set->dtype == NFT_DATA_VERDICT ? NFT_DATA_VERDICT : NFT_DATA_VALUE,
3244 set->dlen) < 0)
3245 goto nla_put_failure;
3246
3247 if (nft_set_ext_exists(ext, NFT_SET_EXT_EXPR) &&
3248 nft_expr_dump(skb, NFTA_SET_ELEM_EXPR, nft_set_ext_expr(ext)) < 0)
3249 goto nla_put_failure;
3250
/* Object references are reported by object name. */
3251 if (nft_set_ext_exists(ext, NFT_SET_EXT_OBJREF) &&
3252 nla_put_string(skb, NFTA_SET_ELEM_OBJREF,
3253 (*nft_set_ext_obj(ext))->name) < 0)
3254 goto nla_put_failure;
3255
3256 if (nft_set_ext_exists(ext, NFT_SET_EXT_FLAGS) &&
3257 nla_put_be32(skb, NFTA_SET_ELEM_FLAGS,
3258 htonl(*nft_set_ext_flags(ext))))
3259 goto nla_put_failure;
3260
/* The stored timeout is converted from jiffies to milliseconds. */
3261 if (nft_set_ext_exists(ext, NFT_SET_EXT_TIMEOUT) &&
3262 nla_put_be64(skb, NFTA_SET_ELEM_TIMEOUT,
3263 cpu_to_be64(jiffies_to_msecs(
3264 *nft_set_ext_timeout(ext))),
3265 NFTA_SET_ELEM_PAD))
3266 goto nla_put_failure;
3267
3268 if (nft_set_ext_exists(ext, NFT_SET_EXT_EXPIRATION)) {
3269 unsigned long expires, now = jiffies;
3270
/*
 * Report the time remaining until expiration, in milliseconds; an element
 * whose expiration time has already passed is reported with 0.
 */
3271 expires = *nft_set_ext_expiration(ext);
3272 if (time_before(now, expires))
3273 expires -= now;
3274 else
3275 expires = 0;
3276
3277 if (nla_put_be64(skb, NFTA_SET_ELEM_EXPIRATION,
3278 cpu_to_be64(jiffies_to_msecs(expires)),
3279 NFTA_SET_ELEM_PAD))
3280 goto nla_put_failure;
3281 }
3282
3283 if (nft_set_ext_exists(ext, NFT_SET_EXT_USERDATA)) {
3284 struct nft_userdata *udata;
3285
3286 udata = nft_set_ext_userdata(ext);
/* NOTE(review): presumably udata->len holds the length minus one - confirm. */
3287 if (nla_put(skb, NFTA_SET_ELEM_USERDATA,
3288 udata->len + 1, udata->data))
3289 goto nla_put_failure;
3290 }
3291
3292 nla_nest_end(skb, nest);
3293 return 0;
3294
3295 nla_put_failure:
3296 nlmsg_trim(skb, b);
3297 return -EMSGSIZE;
3298 }
3299
/*
 * Arguments for dumping the elements of a set. The iterator is embedded so
 * that the walk callback, which only receives a pointer to it, can get back
 * to this structure with container_of().
 */
3300 struct nft_set_dump_args {
/* netlink dump callback state of the dump in progress */
3301 const struct netlink_callback *cb;
/* iterator handed to the set implementation's ->walk() */
3302 struct nft_set_iter iter;
/* message buffer the elements are written to */
3303 struct sk_buff *skb;
3304 };
3305
3306 static int nf_tables_dump_setelem(const struct nft_ctx *ctx,
3307 struct nft_set *set,
3308 const struct nft_set_iter *iter,
3309 struct nft_set_elem *elem)
3310 {
3311 struct nft_set_dump_args *args;
3312
3313 args = container_of(iter, struct nft_set_dump_args, iter);
3314 return nf_tables_fill_setelem(args->skb, set, elem);
3315 }
3316
/*
 * Netlink dump callback that emits the elements of one set.
 *
 * The original request (cb->nlh) is parsed again on every invocation to
 * find the table and set. Each invocation writes one NFT_MSG_NEWSETELEM
 * message containing the table name, the set name and a nested list of
 * elements. cb->args[0] holds the number of elements already handled by
 * previous invocations and is passed to the walk as the skip count.
 *
 * Returns skb->len while progress is being made, 0 when the walk did not
 * advance past the elements already handled, or a negative errno code.
 */
3317 static int nf_tables_dump_set(struct sk_buff *skb, struct netlink_callback *cb)
3318 {
3319 struct net *net = sock_net(skb->sk);
3320 u8 genmask = nft_genmask_cur(net);
3321 struct nft_set *set;
3322 struct nft_set_dump_args args;
3323 struct nft_ctx ctx;
3324 struct nlattr *nla[NFTA_SET_ELEM_LIST_MAX + 1];
3325 struct nfgenmsg *nfmsg;
3326 struct nlmsghdr *nlh;
3327 struct nlattr *nest;
3328 u32 portid, seq;
3329 int event, err;
3330
3331 err = nlmsg_parse(cb->nlh, sizeof(struct nfgenmsg), nla,
3332 NFTA_SET_ELEM_LIST_MAX, nft_set_elem_list_policy);
3333 if (err < 0)
3334 return err;
3335
3336 err = nft_ctx_init_from_elemattr(&ctx, net, cb->skb, cb->nlh,
3337 (void *)nla, genmask);
3338 if (err < 0)
3339 return err;
3340
3341 set = nf_tables_set_lookup(ctx.table, nla[NFTA_SET_ELEM_LIST_SET],
3342 genmask);
3343 if (IS_ERR(set))
3344 return PTR_ERR(set);
3345
3346 event = NFT_MSG_NEWSETELEM;
3347 event |= NFNL_SUBSYS_NFTABLES << 8;
3348 portid = NETLINK_CB(cb->skb).portid;
3349 seq = cb->nlh->nlmsg_seq;
3350
3351 nlh = nlmsg_put(skb, portid, seq, event, sizeof(struct nfgenmsg),
3352 NLM_F_MULTI);
3353 if (nlh == NULL)
3354 goto nla_put_failure;
3355
3356 nfmsg = nlmsg_data(nlh);
3357 nfmsg->nfgen_family = ctx.afi->family;
3358 nfmsg->version = NFNETLINK_V0;
3359 nfmsg->res_id = htons(ctx.net->nft.base_seq & 0xffff);
3360
3361 if (nla_put_string(skb, NFTA_SET_ELEM_LIST_TABLE, ctx.table->name))
3362 goto nla_put_failure;
3363 if (nla_put_string(skb, NFTA_SET_ELEM_LIST_SET, set->name))
3364 goto nla_put_failure;
3365
3366 nest = nla_nest_start(skb, NFTA_SET_ELEM_LIST_ELEMENTS);
3367 if (nest == NULL)
3368 goto nla_put_failure;
3369
/* Walk the set, skipping the elements handled by earlier invocations. */
3370 args.cb = cb;
3371 args.skb = skb;
3372 args.iter.genmask = nft_genmask_cur(ctx.net);
3373 args.iter.skip = cb->args[0];
3374 args.iter.count = 0;
3375 args.iter.err = 0;
3376 args.iter.fn = nf_tables_dump_setelem;
3377 set->ops->walk(&ctx, set, &args.iter);
3378
3379 nla_nest_end(skb, nest);
3380 nlmsg_end(skb, nlh);
3381
/*
 * -EMSGSIZE from the element callback is not treated as an error here: the
 * message built so far is kept and the count is saved for the next call.
 */
3382 if (args.iter.err && args.iter.err != -EMSGSIZE)
3383 return args.iter.err;
/* The walk did not get past the already handled elements. */
3384 if (args.iter.count == cb->args[0])
3385 return 0;
3386
3387 cb->args[0] = args.iter.count;
3388 return skb->len;
3389
3390 nla_put_failure:
3391 return -ENOSPC;
3392 }
3393
3394 static int nf_tables_getsetelem(struct net *net, struct sock *nlsk,
3395 struct sk_buff *skb, const struct nlmsghdr *nlh,
3396 const struct nlattr * const nla[])
3397 {
3398 u8 genmask = nft_genmask_cur(net);
3399 const struct nft_set *set;
3400 struct nft_ctx ctx;
3401 int err;
3402
3403 err = nft_ctx_init_from_elemattr(&ctx, net, skb, nlh, nla, genmask);
3404 if (err < 0)
3405 return err;
3406
3407 set = nf_tables_set_lookup(ctx.table, nla[NFTA_SET_ELEM_LIST_SET],
3408 genmask);
3409 if (IS_ERR(set))
3410 return PTR_ERR(set);
3411
3412 if (nlh->nlmsg_flags & NLM_F_DUMP) {
3413 struct netlink_dump_control c = {
3414 .dump = nf_tables_dump_set,
3415 };
3416 return netlink_dump_start(nlsk, skb, nlh, &c);
3417 }
3418 return -EOPNOTSUPP;
3419 }
3420
3421 static int nf_tables_fill_setelem_info(struct sk_buff *skb,
3422 const struct nft_ctx *ctx, u32 seq,
3423 u32 portid, int event, u16 flags,
3424 const struct nft_set *set,
3425 const struct nft_set_elem *elem)
3426 {
3427 struct nfgenmsg *nfmsg;
3428 struct nlmsghdr *nlh;
3429 struct nlattr *nest;
3430 int err;
3431
3432 event |= NFNL_SUBSYS_NFTABLES << 8;
3433 nlh = nlmsg_put(skb, portid, seq, event, sizeof(struct nfgenmsg),
3434 flags);
3435 if (nlh == NULL)
3436 goto nla_put_failure;
3437
3438 nfmsg = nlmsg_data(nlh);
3439 nfmsg->nfgen_family = ctx->afi->family;
3440 nfmsg->version = NFNETLINK_V0;
3441 nfmsg->res_id = htons(ctx->net->nft.base_seq & 0xffff);
3442
3443 if (nla_put_string(skb, NFTA_SET_TABLE, ctx->table->name))
3444 goto nla_put_failure;
3445 if (nla_put_string(skb, NFTA_SET_NAME, set->name))
3446 goto nla_put_failure;
3447
3448 nest = nla_nest_start(skb, NFTA_SET_ELEM_LIST_ELEMENTS);
3449 if (nest == NULL)
3450 goto nla_put_failure;
3451
3452 err = nf_tables_fill_setelem(skb, set, elem);
3453 if (err < 0)
3454 goto nla_put_failure;
3455
3456 nla_nest_end(skb, nest);
3457
3458 nlmsg_end(skb, nlh);
3459 return 0;
3460
3461 nla_put_failure:
3462 nlmsg_trim(skb, nlh);
3463 return -1;
3464 }
3465
3466 static int nf_tables_setelem_notify(const struct nft_ctx *ctx,
3467 const struct nft_set *set,
3468 const struct nft_set_elem *elem,
3469 int event, u16 flags)
3470 {
3471 struct net *net = ctx->net;
3472 u32 portid = ctx->portid;
3473 struct sk_buff *skb;
3474 int err;
3475
3476 if (!ctx->report && !nfnetlink_has_listeners(net, NFNLGRP_NFTABLES))
3477 return 0;
3478
3479 err = -ENOBUFS;
3480 skb = nlmsg_new(NLMSG_GOODSIZE, GFP_KERNEL);
3481 if (skb == NULL)
3482 goto err;
3483
3484 err = nf_tables_fill_setelem_info(skb, ctx, 0, portid, event, flags,
3485 set, elem);
3486 if (err < 0) {
3487 kfree_skb(skb);
3488 goto err;
3489 }
3490
3491 err = nfnetlink_send(skb, net, portid, NFNLGRP_NFTABLES, ctx->report,
3492 GFP_KERNEL);
3493 err:
3494 if (err < 0)
3495 nfnetlink_set_err(net, portid, NFNLGRP_NFTABLES, err);
3496 return err;
3497 }
3498
3499 static struct nft_trans *nft_trans_elem_alloc(struct nft_ctx *ctx,
3500 int msg_type,
3501 struct nft_set *set)
3502 {
3503 struct nft_trans *trans;
3504
3505 trans = nft_trans_alloc(ctx, msg_type, sizeof(struct nft_trans_elem));
3506 if (trans == NULL)
3507 return NULL;
3508
3509 nft_trans_elem_set(trans) = set;
3510 return trans;
3511 }
3512
3513 void *nft_set_elem_init(const struct nft_set *set,
3514 const struct nft_set_ext_tmpl *tmpl,
3515 const u32 *key, const u32 *data,
3516 u64 timeout, gfp_t gfp)
3517 {
3518 struct nft_set_ext *ext;
3519 void *elem;
3520
3521 elem = kzalloc(set->ops->elemsize + tmpl->len, gfp);
3522 if (elem == NULL)
3523 return NULL;
3524
3525 ext = nft_set_elem_ext(set, elem);
3526 nft_set_ext_init(ext, tmpl);
3527
3528 memcpy(nft_set_ext_key(ext), key, set->klen);
3529 if (nft_set_ext_exists(ext, NFT_SET_EXT_DATA))
3530 memcpy(nft_set_ext_data(ext), data, set->dlen);
3531 if (nft_set_ext_exists(ext, NFT_SET_EXT_EXPIRATION))
3532 *nft_set_ext_expiration(ext) =
3533 jiffies + timeout;
3534 if (nft_set_ext_exists(ext, NFT_SET_EXT_TIMEOUT))
3535 *nft_set_ext_timeout(ext) = timeout;
3536
3537 return elem;
3538 }
3539
3540 void nft_set_elem_destroy(const struct nft_set *set, void *elem,
3541 bool destroy_expr)
3542 {
3543 struct nft_set_ext *ext = nft_set_elem_ext(set, elem);
3544
3545 nft_data_uninit(nft_set_ext_key(ext), NFT_DATA_VALUE);
3546 if (nft_set_ext_exists(ext, NFT_SET_EXT_DATA))
3547 nft_data_uninit(nft_set_ext_data(ext), set->dtype);
3548 if (destroy_expr && nft_set_ext_exists(ext, NFT_SET_EXT_EXPR))
3549 nf_tables_expr_destroy(NULL, nft_set_ext_expr(ext));
3550 if (nft_set_ext_exists(ext, NFT_SET_EXT_OBJREF))
3551 (*nft_set_ext_obj(ext))->use--;
3552 kfree(elem);
3553 }
3554 EXPORT_SYMBOL_GPL(nft_set_elem_destroy);
3555
3556 static int nft_setelem_parse_flags(const struct nft_set *set,
3557 const struct nlattr *attr, u32 *flags)
3558 {
3559 if (attr == NULL)
3560 return 0;
3561
3562 *flags = ntohl(nla_get_be32(attr));
3563 if (*flags & ~NFT_SET_ELEM_INTERVAL_END)
3564 return -EINVAL;
3565 if (!(set->flags & NFT_SET_INTERVAL) &&
3566 *flags & NFT_SET_ELEM_INTERVAL_END)
3567 return -EINVAL;
3568
3569 return 0;
3570 }
3571
3572 static int nft_add_set_elem(struct nft_ctx *ctx, struct nft_set *set,
3573 const struct nlattr *attr, u32 nlmsg_flags)
3574 {
3575 struct nlattr *nla[NFTA_SET_ELEM_MAX + 1];
3576 u8 genmask = nft_genmask_next(ctx->net);
3577 struct nft_data_desc d1, d2;
3578 struct nft_set_ext_tmpl tmpl;
3579 struct nft_set_ext *ext, *ext2;
3580 struct nft_set_elem elem;
3581 struct nft_set_binding *binding;
3582 struct nft_object *obj = NULL;
3583 struct nft_userdata *udata;
3584 struct nft_data data;
3585 enum nft_registers dreg;
3586 struct nft_trans *trans;
3587 u32 flags = 0;
3588 u64 timeout;
3589 u8 ulen;
3590 int err;
3591
3592 err = nla_parse_nested(nla, NFTA_SET_ELEM_MAX, attr,
3593 nft_set_elem_policy);
3594 if (err < 0)
3595 return err;
3596
3597 if (nla[NFTA_SET_ELEM_KEY] == NULL)
3598 return -EINVAL;
3599
3600 nft_set_ext_prepare(&tmpl);
3601
3602 err = nft_setelem_parse_flags(set, nla[NFTA_SET_ELEM_FLAGS], &flags);
3603 if (err < 0)
3604 return err;
3605 if (flags != 0)
3606 nft_set_ext_add(&tmpl, NFT_SET_EXT_FLAGS);
3607
3608 if (set->flags & NFT_SET_MAP) {
3609 if (nla[NFTA_SET_ELEM_DATA] == NULL &&
3610 !(flags & NFT_SET_ELEM_INTERVAL_END))
3611 return -EINVAL;
3612 if (nla[NFTA_SET_ELEM_DATA] != NULL &&
3613 flags & NFT_SET_ELEM_INTERVAL_END)
3614 return -EINVAL;
3615 } else {
3616 if (nla[NFTA_SET_ELEM_DATA] != NULL)
3617 return -EINVAL;
3618 }
3619
3620 timeout = 0;
3621 if (nla[NFTA_SET_ELEM_TIMEOUT] != NULL) {
3622 if (!(set->flags & NFT_SET_TIMEOUT))
3623 return -EINVAL;
3624 timeout = msecs_to_jiffies(be64_to_cpu(nla_get_be64(
3625 nla[NFTA_SET_ELEM_TIMEOUT])));
3626 } else if (set->flags & NFT_SET_TIMEOUT) {
3627 timeout = set->timeout;
3628 }
3629
3630 err = nft_data_init(ctx, &elem.key.val, sizeof(elem.key), &d1,
3631 nla[NFTA_SET_ELEM_KEY]);
3632 if (err < 0)
3633 goto err1;
3634 err = -EINVAL;
3635 if (d1.type != NFT_DATA_VALUE || d1.len != set->klen)
3636 goto err2;
3637
3638 nft_set_ext_add_length(&tmpl, NFT_SET_EXT_KEY, d1.len);
3639 if (timeout > 0) {
3640 nft_set_ext_add(&tmpl, NFT_SET_EXT_EXPIRATION);
3641 if (timeout != set->timeout)
3642 nft_set_ext_add(&tmpl, NFT_SET_EXT_TIMEOUT);
3643 }
3644
3645 if (nla[NFTA_SET_ELEM_OBJREF] != NULL) {
3646 if (!(set->flags & NFT_SET_OBJECT)) {
3647 err = -EINVAL;
3648 goto err2;
3649 }
3650 obj = nf_tables_obj_lookup(ctx->table, nla[NFTA_SET_ELEM_OBJREF],
3651 set->objtype, genmask);
3652 if (IS_ERR(obj)) {
3653 err = PTR_ERR(obj);
3654 goto err2;
3655 }
3656 nft_set_ext_add(&tmpl, NFT_SET_EXT_OBJREF);
3657 }
3658
3659 if (nla[NFTA_SET_ELEM_DATA] != NULL) {
3660 err = nft_data_init(ctx, &data, sizeof(data), &d2,
3661 nla[NFTA_SET_ELEM_DATA]);
3662 if (err < 0)
3663 goto err2;
3664
3665 err = -EINVAL;
3666 if (set->dtype != NFT_DATA_VERDICT && d2.len != set->dlen)
3667 goto err3;
3668
3669 dreg = nft_type_to_reg(set->dtype);
3670 list_for_each_entry(binding, &set->bindings, list) {
3671 struct nft_ctx bind_ctx = {
3672 .net = ctx->net,
3673 .afi = ctx->afi,
3674 .table = ctx->table,
3675 .chain = (struct nft_chain *)binding->chain,
3676 };
3677
3678 if (!(binding->flags & NFT_SET_MAP))
3679 continue;
3680
3681 err = nft_validate_register_store(&bind_ctx, dreg,
3682 &data,
3683 d2.type, d2.len);
3684 if (err < 0)
3685 goto err3;
3686 }
3687
3688 nft_set_ext_add_length(&tmpl, NFT_SET_EXT_DATA, d2.len);
3689 }
3690
3691 /* The full maximum length of userdata can exceed the maximum
3692 * offset value (U8_MAX) for following extensions, therefor it
3693 * must be the last extension added.
3694 */
3695 ulen = 0;
3696 if (nla[NFTA_SET_ELEM_USERDATA] != NULL) {
3697 ulen = nla_len(nla[NFTA_SET_ELEM_USERDATA]);
3698 if (ulen > 0)
3699 nft_set_ext_add_length(&tmpl, NFT_SET_EXT_USERDATA,
3700 ulen);
3701 }
3702
3703 err = -ENOMEM;
3704 elem.priv = nft_set_elem_init(set, &tmpl, elem.key.val.data, data.data,
3705 timeout, GFP_KERNEL);
3706 if (elem.priv == NULL)
3707 goto err3;
3708
3709 ext = nft_set_elem_ext(set, elem.priv);
3710 if (flags)
3711 *nft_set_ext_flags(ext) = flags;
3712 if (ulen > 0) {
3713 udata = nft_set_ext_userdata(ext);
3714 udata->len = ulen - 1;
3715 nla_memcpy(&udata->data, nla[NFTA_SET_ELEM_USERDATA], ulen);
3716 }
3717 if (obj) {
3718 *nft_set_ext_obj(ext) = obj;
3719 obj->use++;
3720 }
3721
3722 trans = nft_trans_elem_alloc(ctx, NFT_MSG_NEWSETELEM, set);
3723 if (trans == NULL)
3724 goto err4;
3725
3726 ext->genmask = nft_genmask_cur(ctx->net) | NFT_SET_ELEM_BUSY_MASK;
3727 err = set->ops->insert(ctx->net, set, &elem, &ext2);
3728 if (err) {
3729 if (err == -EEXIST) {
3730 if ((nft_set_ext_exists(ext, NFT_SET_EXT_DATA) &&
3731 nft_set_ext_exists(ext2, NFT_SET_EXT_DATA) &&
3732 memcmp(nft_set_ext_data(ext),
3733 nft_set_ext_data(ext2), set->dlen) != 0) ||
3734 (nft_set_ext_exists(ext, NFT_SET_EXT_OBJREF) &&
3735 nft_set_ext_exists(ext2, NFT_SET_EXT_OBJREF) &&
3736 *nft_set_ext_obj(ext) != *nft_set_ext_obj(ext2)))
3737 err = -EBUSY;
3738 else if (!(nlmsg_flags & NLM_F_EXCL))
3739 err = 0;
3740 }
3741 goto err5;
3742 }
3743
3744 if (set->size &&
3745 !atomic_add_unless(&set->nelems, 1, set->size + set->ndeact)) {
3746 err = -ENFILE;
3747 goto err6;
3748 }
3749
3750 nft_trans_elem(trans) = elem;
3751 list_add_tail(&trans->list, &ctx->net->nft.commit_list);
3752 return 0;
3753
3754 err6:
3755 set->ops->remove(ctx->net, set, &elem);
3756 err5:
3757 kfree(trans);
3758 err4:
3759 kfree(elem.priv);
3760 err3:
3761 if (nla[NFTA_SET_ELEM_DATA] != NULL)
3762 nft_data_uninit(&data, d2.type);
3763 err2:
3764 nft_data_uninit(&elem.key.val, d1.type);
3765 err1:
3766 return err;
3767 }
3768
3769 static int nf_tables_newsetelem(struct net *net, struct sock *nlsk,
3770 struct sk_buff *skb, const struct nlmsghdr *nlh,
3771 const struct nlattr * const nla[])
3772 {
3773 u8 genmask = nft_genmask_next(net);
3774 const struct nlattr *attr;
3775 struct nft_set *set;
3776 struct nft_ctx ctx;
3777 int rem, err = 0;
3778
3779 if (nla[NFTA_SET_ELEM_LIST_ELEMENTS] == NULL)
3780 return -EINVAL;
3781
3782 err = nft_ctx_init_from_elemattr(&ctx, net, skb, nlh, nla, genmask);
3783 if (err < 0)
3784 return err;
3785
3786 set = nf_tables_set_lookup(ctx.table, nla[NFTA_SET_ELEM_LIST_SET],
3787 genmask);
3788 if (IS_ERR(set)) {
3789 if (nla[NFTA_SET_ELEM_LIST_SET_ID]) {
3790 set = nf_tables_set_lookup_byid(net,
3791 nla[NFTA_SET_ELEM_LIST_SET_ID],
3792 genmask);
3793 }
3794 if (IS_ERR(set))
3795 return PTR_ERR(set);
3796 }
3797
3798 if (!list_empty(&set->bindings) && set->flags & NFT_SET_CONSTANT)
3799 return -EBUSY;
3800
3801 nla_for_each_nested(attr, nla[NFTA_SET_ELEM_LIST_ELEMENTS], rem) {
3802 err = nft_add_set_elem(&ctx, set, attr, nlh->nlmsg_flags);
3803 if (err < 0)
3804 break;
3805 }
3806 return err;
3807 }
3808
3809 static int nft_del_setelem(struct nft_ctx *ctx, struct nft_set *set,
3810 const struct nlattr *attr)
3811 {
3812 struct nlattr *nla[NFTA_SET_ELEM_MAX + 1];
3813 struct nft_set_ext_tmpl tmpl;
3814 struct nft_data_desc desc;
3815 struct nft_set_elem elem;
3816 struct nft_set_ext *ext;
3817 struct nft_trans *trans;
3818 u32 flags = 0;
3819 void *priv;
3820 int err;
3821
3822 err = nla_parse_nested(nla, NFTA_SET_ELEM_MAX, attr,
3823 nft_set_elem_policy);
3824 if (err < 0)
3825 goto err1;
3826
3827 err = -EINVAL;
3828 if (nla[NFTA_SET_ELEM_KEY] == NULL)
3829 goto err1;
3830
3831 nft_set_ext_prepare(&tmpl);
3832
3833 err = nft_setelem_parse_flags(set, nla[NFTA_SET_ELEM_FLAGS], &flags);
3834 if (err < 0)
3835 return err;
3836 if (flags != 0)
3837 nft_set_ext_add(&tmpl, NFT_SET_EXT_FLAGS);
3838
3839 err = nft_data_init(ctx, &elem.key.val, sizeof(elem.key), &desc,
3840 nla[NFTA_SET_ELEM_KEY]);
3841 if (err < 0)
3842 goto err1;
3843
3844 err = -EINVAL;
3845 if (desc.type != NFT_DATA_VALUE || desc.len != set->klen)
3846 goto err2;
3847
3848 nft_set_ext_add_length(&tmpl, NFT_SET_EXT_KEY, desc.len);
3849
3850 err = -ENOMEM;
3851 elem.priv = nft_set_elem_init(set, &tmpl, elem.key.val.data, NULL, 0,
3852 GFP_KERNEL);
3853 if (elem.priv == NULL)
3854 goto err2;
3855
3856 ext = nft_set_elem_ext(set, elem.priv);
3857 if (flags)
3858 *nft_set_ext_flags(ext) = flags;
3859
3860 trans = nft_trans_elem_alloc(ctx, NFT_MSG_DELSETELEM, set);
3861 if (trans == NULL) {
3862 err = -ENOMEM;
3863 goto err3;
3864 }
3865
3866 priv = set->ops->deactivate(ctx->net, set, &elem);
3867 if (priv == NULL) {
3868 err = -ENOENT;
3869 goto err4;
3870 }
3871 kfree(elem.priv);
3872 elem.priv = priv;
3873
3874 nft_trans_elem(trans) = elem;
3875 list_add_tail(&trans->list, &ctx->net->nft.commit_list);
3876 return 0;
3877
3878 err4:
3879 kfree(trans);
3880 err3:
3881 kfree(elem.priv);
3882 err2:
3883 nft_data_uninit(&elem.key.val, desc.type);
3884 err1:
3885 return err;
3886 }
3887
3888 static int nft_flush_set(const struct nft_ctx *ctx,
3889 struct nft_set *set,
3890 const struct nft_set_iter *iter,
3891 struct nft_set_elem *elem)
3892 {
3893 struct nft_trans *trans;
3894 int err;
3895
3896 trans = nft_trans_alloc_gfp(ctx, NFT_MSG_DELSETELEM,
3897 sizeof(struct nft_trans_elem), GFP_ATOMIC);
3898 if (!trans)
3899 return -ENOMEM;
3900
3901 if (!set->ops->flush(ctx->net, set, elem->priv)) {
3902 err = -ENOENT;
3903 goto err1;
3904 }
3905 set->ndeact++;
3906
3907 nft_trans_elem_set(trans) = set;
3908 nft_trans_elem(trans) = *elem;
3909 list_add_tail(&trans->list, &ctx->net->nft.commit_list);
3910
3911 return 0;
3912 err1:
3913 kfree(trans);
3914 return err;
3915 }
3916
3917 static int nf_tables_delsetelem(struct net *net, struct sock *nlsk,
3918 struct sk_buff *skb, const struct nlmsghdr *nlh,
3919 const struct nlattr * const nla[])
3920 {
3921 u8 genmask = nft_genmask_next(net);
3922 const struct nlattr *attr;
3923 struct nft_set *set;
3924 struct nft_ctx ctx;
3925 int rem, err = 0;
3926
3927 err = nft_ctx_init_from_elemattr(&ctx, net, skb, nlh, nla, genmask);
3928 if (err < 0)
3929 return err;
3930
3931 set = nf_tables_set_lookup(ctx.table, nla[NFTA_SET_ELEM_LIST_SET],
3932 genmask);
3933 if (IS_ERR(set))
3934 return PTR_ERR(set);
3935 if (!list_empty(&set->bindings) && set->flags & NFT_SET_CONSTANT)
3936 return -EBUSY;
3937
3938 if (nla[NFTA_SET_ELEM_LIST_ELEMENTS] == NULL) {
3939 struct nft_set_iter iter = {
3940 .genmask = genmask,
3941 .fn = nft_flush_set,
3942 };
3943 set->ops->walk(&ctx, set, &iter);
3944
3945 return iter.err;
3946 }
3947
3948 nla_for_each_nested(attr, nla[NFTA_SET_ELEM_LIST_ELEMENTS], rem) {
3949 err = nft_del_setelem(&ctx, set, attr);
3950 if (err < 0)
3951 break;
3952
3953 set->ndeact++;
3954 }
3955 return err;
3956 }
3957
3958 void nft_set_gc_batch_release(struct rcu_head *rcu)
3959 {
3960 struct nft_set_gc_batch *gcb;
3961 unsigned int i;
3962
3963 gcb = container_of(rcu, struct nft_set_gc_batch, head.rcu);
3964 for (i = 0; i < gcb->head.cnt; i++)
3965 nft_set_elem_destroy(gcb->head.set, gcb->elems[i], true);
3966 kfree(gcb);
3967 }
3968 EXPORT_SYMBOL_GPL(nft_set_gc_batch_release);
3969
3970 struct nft_set_gc_batch *nft_set_gc_batch_alloc(const struct nft_set *set,
3971 gfp_t gfp)
3972 {
3973 struct nft_set_gc_batch *gcb;
3974
3975 gcb = kzalloc(sizeof(*gcb), gfp);
3976 if (gcb == NULL)
3977 return gcb;
3978 gcb->head.set = set;
3979 return gcb;
3980 }
3981 EXPORT_SYMBOL_GPL(nft_set_gc_batch_alloc);
3982
3983 /*
3984 * Stateful objects
3985 */
3986
3987 /**
3988 * nft_register_obj- register nf_tables stateful object type
3989 * @obj: object type
3990 *
3991 * Registers the object type for use with nf_tables. Returns zero on
3992 * success or a negative errno code otherwise.
3993 */
3994 int nft_register_obj(struct nft_object_type *obj_type)
3995 {
3996 if (obj_type->type == NFT_OBJECT_UNSPEC)
3997 return -EINVAL;
3998
3999 nfnl_lock(NFNL_SUBSYS_NFTABLES);
4000 list_add_rcu(&obj_type->list, &nf_tables_objects);
4001 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
4002 return 0;
4003 }
4004 EXPORT_SYMBOL_GPL(nft_register_obj);
4005
4006 /**
4007 * nft_unregister_obj - unregister nf_tables object type
4008 * @obj: object type
4009 *
4010 * Unregisters the object type for use with nf_tables.
4011 */
4012 void nft_unregister_obj(struct nft_object_type *obj_type)
4013 {
4014 nfnl_lock(NFNL_SUBSYS_NFTABLES);
4015 list_del_rcu(&obj_type->list);
4016 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
4017 }
4018 EXPORT_SYMBOL_GPL(nft_unregister_obj);
4019
4020 struct nft_object *nf_tables_obj_lookup(const struct nft_table *table,
4021 const struct nlattr *nla,
4022 u32 objtype, u8 genmask)
4023 {
4024 struct nft_object *obj;
4025
4026 list_for_each_entry(obj, &table->objects, list) {
4027 if (!nla_strcmp(nla, obj->name) &&
4028 objtype == obj->type->type &&
4029 nft_active_genmask(obj, genmask))
4030 return obj;
4031 }
4032 return ERR_PTR(-ENOENT);
4033 }
4034 EXPORT_SYMBOL_GPL(nf_tables_obj_lookup);
4035
4036 static const struct nla_policy nft_obj_policy[NFTA_OBJ_MAX + 1] = {
4037 [NFTA_OBJ_TABLE] = { .type = NLA_STRING,
4038 .len = NFT_TABLE_MAXNAMELEN - 1 },
4039 [NFTA_OBJ_NAME] = { .type = NLA_STRING,
4040 .len = NFT_OBJ_MAXNAMELEN - 1 },
4041 [NFTA_OBJ_TYPE] = { .type = NLA_U32 },
4042 [NFTA_OBJ_DATA] = { .type = NLA_NESTED },
4043 };
4044
4045 static struct nft_object *nft_obj_init(const struct nft_object_type *type,
4046 const struct nlattr *attr)
4047 {
4048 struct nlattr *tb[type->maxattr + 1];
4049 struct nft_object *obj;
4050 int err;
4051
4052 if (attr) {
4053 err = nla_parse_nested(tb, type->maxattr, attr, type->policy);
4054 if (err < 0)
4055 goto err1;
4056 } else {
4057 memset(tb, 0, sizeof(tb[0]) * (type->maxattr + 1));
4058 }
4059
4060 err = -ENOMEM;
4061 obj = kzalloc(sizeof(struct nft_object) + type->size, GFP_KERNEL);
4062 if (obj == NULL)
4063 goto err1;
4064
4065 err = type->init((const struct nlattr * const *)tb, obj);
4066 if (err < 0)
4067 goto err2;
4068
4069 obj->type = type;
4070 return obj;
4071 err2:
4072 kfree(obj);
4073 err1:
4074 return ERR_PTR(err);
4075 }
4076
4077 static int nft_object_dump(struct sk_buff *skb, unsigned int attr,
4078 struct nft_object *obj, bool reset)
4079 {
4080 struct nlattr *nest;
4081
4082 nest = nla_nest_start(skb, attr);
4083 if (!nest)
4084 goto nla_put_failure;
4085 if (obj->type->dump(skb, obj, reset) < 0)
4086 goto nla_put_failure;
4087 nla_nest_end(skb, nest);
4088 return 0;
4089
4090 nla_put_failure:
4091 return -1;
4092 }
4093
4094 static const struct nft_object_type *__nft_obj_type_get(u32 objtype)
4095 {
4096 const struct nft_object_type *type;
4097
4098 list_for_each_entry(type, &nf_tables_objects, list) {
4099 if (objtype == type->type)
4100 return type;
4101 }
4102 return NULL;
4103 }
4104
4105 static const struct nft_object_type *nft_obj_type_get(u32 objtype)
4106 {
4107 const struct nft_object_type *type;
4108
4109 type = __nft_obj_type_get(objtype);
4110 if (type != NULL && try_module_get(type->owner))
4111 return type;
4112
4113 #ifdef CONFIG_MODULES
4114 if (type == NULL) {
4115 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
4116 request_module("nft-obj-%u", objtype);
4117 nfnl_lock(NFNL_SUBSYS_NFTABLES);
4118 if (__nft_obj_type_get(objtype))
4119 return ERR_PTR(-EAGAIN);
4120 }
4121 #endif
4122 return ERR_PTR(-ENOENT);
4123 }
4124
4125 static int nf_tables_newobj(struct net *net, struct sock *nlsk,
4126 struct sk_buff *skb, const struct nlmsghdr *nlh,
4127 const struct nlattr * const nla[])
4128 {
4129 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
4130 const struct nft_object_type *type;
4131 u8 genmask = nft_genmask_next(net);
4132 int family = nfmsg->nfgen_family;
4133 struct nft_af_info *afi;
4134 struct nft_table *table;
4135 struct nft_object *obj;
4136 struct nft_ctx ctx;
4137 u32 objtype;
4138 int err;
4139
4140 if (!nla[NFTA_OBJ_TYPE] ||
4141 !nla[NFTA_OBJ_NAME] ||
4142 !nla[NFTA_OBJ_DATA])
4143 return -EINVAL;
4144
4145 afi = nf_tables_afinfo_lookup(net, family, true);
4146 if (IS_ERR(afi))
4147 return PTR_ERR(afi);
4148
4149 table = nf_tables_table_lookup(afi, nla[NFTA_OBJ_TABLE], genmask);
4150 if (IS_ERR(table))
4151 return PTR_ERR(table);
4152
4153 objtype = ntohl(nla_get_be32(nla[NFTA_OBJ_TYPE]));
4154 obj = nf_tables_obj_lookup(table, nla[NFTA_OBJ_NAME], objtype, genmask);
4155 if (IS_ERR(obj)) {
4156 err = PTR_ERR(obj);
4157 if (err != -ENOENT)
4158 return err;
4159
4160 } else {
4161 if (nlh->nlmsg_flags & NLM_F_EXCL)
4162 return -EEXIST;
4163
4164 return 0;
4165 }
4166
4167 nft_ctx_init(&ctx, net, skb, nlh, afi, table, NULL, nla);
4168
4169 type = nft_obj_type_get(objtype);
4170 if (IS_ERR(type))
4171 return PTR_ERR(type);
4172
4173 obj = nft_obj_init(type, nla[NFTA_OBJ_DATA]);
4174 if (IS_ERR(obj)) {
4175 err = PTR_ERR(obj);
4176 goto err1;
4177 }
4178 obj->table = table;
4179 nla_strlcpy(obj->name, nla[NFTA_OBJ_NAME], NFT_OBJ_MAXNAMELEN);
4180
4181 err = nft_trans_obj_add(&ctx, NFT_MSG_NEWOBJ, obj);
4182 if (err < 0)
4183 goto err2;
4184
4185 list_add_tail_rcu(&obj->list, &table->objects);
4186 table->use++;
4187 return 0;
4188 err2:
4189 if (obj->type->destroy)
4190 obj->type->destroy(obj);
4191 kfree(obj);
4192 err1:
4193 module_put(type->owner);
4194 return err;
4195 }
4196
4197 static int nf_tables_fill_obj_info(struct sk_buff *skb, struct net *net,
4198 u32 portid, u32 seq, int event, u32 flags,
4199 int family, const struct nft_table *table,
4200 struct nft_object *obj, bool reset)
4201 {
4202 struct nfgenmsg *nfmsg;
4203 struct nlmsghdr *nlh;
4204
4205 event |= NFNL_SUBSYS_NFTABLES << 8;
4206 nlh = nlmsg_put(skb, portid, seq, event, sizeof(struct nfgenmsg), flags);
4207 if (nlh == NULL)
4208 goto nla_put_failure;
4209
4210 nfmsg = nlmsg_data(nlh);
4211 nfmsg->nfgen_family = family;
4212 nfmsg->version = NFNETLINK_V0;
4213 nfmsg->res_id = htons(net->nft.base_seq & 0xffff);
4214
4215 if (nla_put_string(skb, NFTA_OBJ_TABLE, table->name) ||
4216 nla_put_string(skb, NFTA_OBJ_NAME, obj->name) ||
4217 nla_put_be32(skb, NFTA_OBJ_TYPE, htonl(obj->type->type)) ||
4218 nla_put_be32(skb, NFTA_OBJ_USE, htonl(obj->use)) ||
4219 nft_object_dump(skb, NFTA_OBJ_DATA, obj, reset))
4220 goto nla_put_failure;
4221
4222 nlmsg_end(skb, nlh);
4223 return 0;
4224
4225 nla_put_failure:
4226 nlmsg_trim(skb, nlh);
4227 return -1;
4228 }
4229
4230 struct nft_obj_filter {
4231 char table[NFT_OBJ_MAXNAMELEN];
4232 u32 type;
4233 };
4234
4235 static int nf_tables_dump_obj(struct sk_buff *skb, struct netlink_callback *cb)
4236 {
4237 const struct nfgenmsg *nfmsg = nlmsg_data(cb->nlh);
4238 const struct nft_af_info *afi;
4239 const struct nft_table *table;
4240 unsigned int idx = 0, s_idx = cb->args[0];
4241 struct nft_obj_filter *filter = cb->data;
4242 struct net *net = sock_net(skb->sk);
4243 int family = nfmsg->nfgen_family;
4244 struct nft_object *obj;
4245 bool reset = false;
4246
4247 if (NFNL_MSG_TYPE(cb->nlh->nlmsg_type) == NFT_MSG_GETOBJ_RESET)
4248 reset = true;
4249
4250 rcu_read_lock();
4251 cb->seq = net->nft.base_seq;
4252
4253 list_for_each_entry_rcu(afi, &net->nft.af_info, list) {
4254 if (family != NFPROTO_UNSPEC && family != afi->family)
4255 continue;
4256
4257 list_for_each_entry_rcu(table, &afi->tables, list) {
4258 list_for_each_entry_rcu(obj, &table->objects, list) {
4259 if (!nft_is_active(net, obj))
4260 goto cont;
4261 if (idx < s_idx)
4262 goto cont;
4263 if (idx > s_idx)
4264 memset(&cb->args[1], 0,
4265 sizeof(cb->args) - sizeof(cb->args[0]));
4266 if (filter && filter->table[0] &&
4267 strcmp(filter->table, table->name))
4268 goto cont;
4269 if (filter &&
4270 filter->type != NFT_OBJECT_UNSPEC &&
4271 obj->type->type != filter->type)
4272 goto cont;
4273
4274 if (nf_tables_fill_obj_info(skb, net, NETLINK_CB(cb->skb).portid,
4275 cb->nlh->nlmsg_seq,
4276 NFT_MSG_NEWOBJ,
4277 NLM_F_MULTI | NLM_F_APPEND,
4278 afi->family, table, obj, reset) < 0)
4279 goto done;
4280
4281 nl_dump_check_consistent(cb, nlmsg_hdr(skb));
4282 cont:
4283 idx++;
4284 }
4285 }
4286 }
4287 done:
4288 rcu_read_unlock();
4289
4290 cb->args[0] = idx;
4291 return skb->len;
4292 }
4293
4294 static int nf_tables_dump_obj_done(struct netlink_callback *cb)
4295 {
4296 kfree(cb->data);
4297
4298 return 0;
4299 }
4300
4301 static struct nft_obj_filter *
4302 nft_obj_filter_alloc(const struct nlattr * const nla[])
4303 {
4304 struct nft_obj_filter *filter;
4305
4306 filter = kzalloc(sizeof(*filter), GFP_KERNEL);
4307 if (!filter)
4308 return ERR_PTR(-ENOMEM);
4309
4310 if (nla[NFTA_OBJ_TABLE])
4311 nla_strlcpy(filter->table, nla[NFTA_OBJ_TABLE],
4312 NFT_TABLE_MAXNAMELEN);
4313 if (nla[NFTA_OBJ_TYPE])
4314 filter->type = ntohl(nla_get_be32(nla[NFTA_OBJ_TYPE]));
4315
4316 return filter;
4317 }
4318
4319 static int nf_tables_getobj(struct net *net, struct sock *nlsk,
4320 struct sk_buff *skb, const struct nlmsghdr *nlh,
4321 const struct nlattr * const nla[])
4322 {
4323 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
4324 u8 genmask = nft_genmask_cur(net);
4325 int family = nfmsg->nfgen_family;
4326 const struct nft_af_info *afi;
4327 const struct nft_table *table;
4328 struct nft_object *obj;
4329 struct sk_buff *skb2;
4330 bool reset = false;
4331 u32 objtype;
4332 int err;
4333
4334 if (nlh->nlmsg_flags & NLM_F_DUMP) {
4335 struct netlink_dump_control c = {
4336 .dump = nf_tables_dump_obj,
4337 .done = nf_tables_dump_obj_done,
4338 };
4339
4340 if (nla[NFTA_OBJ_TABLE] ||
4341 nla[NFTA_OBJ_TYPE]) {
4342 struct nft_obj_filter *filter;
4343
4344 filter = nft_obj_filter_alloc(nla);
4345 if (IS_ERR(filter))
4346 return -ENOMEM;
4347
4348 c.data = filter;
4349 }
4350 return netlink_dump_start(nlsk, skb, nlh, &c);
4351 }
4352
4353 if (!nla[NFTA_OBJ_NAME] ||
4354 !nla[NFTA_OBJ_TYPE])
4355 return -EINVAL;
4356
4357 afi = nf_tables_afinfo_lookup(net, family, false);
4358 if (IS_ERR(afi))
4359 return PTR_ERR(afi);
4360
4361 table = nf_tables_table_lookup(afi, nla[NFTA_OBJ_TABLE], genmask);
4362 if (IS_ERR(table))
4363 return PTR_ERR(table);
4364
4365 objtype = ntohl(nla_get_be32(nla[NFTA_OBJ_TYPE]));
4366 obj = nf_tables_obj_lookup(table, nla[NFTA_OBJ_NAME], objtype, genmask);
4367 if (IS_ERR(obj))
4368 return PTR_ERR(obj);
4369
4370 skb2 = alloc_skb(NLMSG_GOODSIZE, GFP_KERNEL);
4371 if (!skb2)
4372 return -ENOMEM;
4373
4374 if (NFNL_MSG_TYPE(nlh->nlmsg_type) == NFT_MSG_GETOBJ_RESET)
4375 reset = true;
4376
4377 err = nf_tables_fill_obj_info(skb2, net, NETLINK_CB(skb).portid,
4378 nlh->nlmsg_seq, NFT_MSG_NEWOBJ, 0,
4379 family, table, obj, reset);
4380 if (err < 0)
4381 goto err;
4382
4383 return nlmsg_unicast(nlsk, skb2, NETLINK_CB(skb).portid);
4384 err:
4385 kfree_skb(skb2);
4386 return err;
4387
4388 return 0;
4389 }
4390
4391 static void nft_obj_destroy(struct nft_object *obj)
4392 {
4393 if (obj->type->destroy)
4394 obj->type->destroy(obj);
4395
4396 module_put(obj->type->owner);
4397 kfree(obj);
4398 }
4399
4400 static int nf_tables_delobj(struct net *net, struct sock *nlsk,
4401 struct sk_buff *skb, const struct nlmsghdr *nlh,
4402 const struct nlattr * const nla[])
4403 {
4404 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
4405 u8 genmask = nft_genmask_next(net);
4406 int family = nfmsg->nfgen_family;
4407 struct nft_af_info *afi;
4408 struct nft_table *table;
4409 struct nft_object *obj;
4410 struct nft_ctx ctx;
4411 u32 objtype;
4412
4413 if (!nla[NFTA_OBJ_TYPE] ||
4414 !nla[NFTA_OBJ_NAME])
4415 return -EINVAL;
4416
4417 afi = nf_tables_afinfo_lookup(net, family, true);
4418 if (IS_ERR(afi))
4419 return PTR_ERR(afi);
4420
4421 table = nf_tables_table_lookup(afi, nla[NFTA_OBJ_TABLE], genmask);
4422 if (IS_ERR(table))
4423 return PTR_ERR(table);
4424
4425 objtype = ntohl(nla_get_be32(nla[NFTA_OBJ_TYPE]));
4426 obj = nf_tables_obj_lookup(table, nla[NFTA_OBJ_NAME], objtype, genmask);
4427 if (IS_ERR(obj))
4428 return PTR_ERR(obj);
4429 if (obj->use > 0)
4430 return -EBUSY;
4431
4432 nft_ctx_init(&ctx, net, skb, nlh, afi, table, NULL, nla);
4433
4434 return nft_delobj(&ctx, obj);
4435 }
4436
4437 int nft_obj_notify(struct net *net, struct nft_table *table,
4438 struct nft_object *obj, u32 portid, u32 seq, int event,
4439 int family, int report, gfp_t gfp)
4440 {
4441 struct sk_buff *skb;
4442 int err;
4443
4444 if (!report &&
4445 !nfnetlink_has_listeners(net, NFNLGRP_NFTABLES))
4446 return 0;
4447
4448 err = -ENOBUFS;
4449 skb = nlmsg_new(NLMSG_GOODSIZE, gfp);
4450 if (skb == NULL)
4451 goto err;
4452
4453 err = nf_tables_fill_obj_info(skb, net, portid, seq, event, 0, family,
4454 table, obj, false);
4455 if (err < 0) {
4456 kfree_skb(skb);
4457 goto err;
4458 }
4459
4460 err = nfnetlink_send(skb, net, portid, NFNLGRP_NFTABLES, report, gfp);
4461 err:
4462 if (err < 0) {
4463 nfnetlink_set_err(net, portid, NFNLGRP_NFTABLES, err);
4464 }
4465 return err;
4466 }
4467 EXPORT_SYMBOL_GPL(nft_obj_notify);
4468
4469 static int nf_tables_obj_notify(const struct nft_ctx *ctx,
4470 struct nft_object *obj, int event)
4471 {
4472 return nft_obj_notify(ctx->net, ctx->table, obj, ctx->portid,
4473 ctx->seq, event, ctx->afi->family, ctx->report,
4474 GFP_KERNEL);
4475 }
4476
4477 static int nf_tables_fill_gen_info(struct sk_buff *skb, struct net *net,
4478 u32 portid, u32 seq)
4479 {
4480 struct nlmsghdr *nlh;
4481 struct nfgenmsg *nfmsg;
4482 int event = (NFNL_SUBSYS_NFTABLES << 8) | NFT_MSG_NEWGEN;
4483
4484 nlh = nlmsg_put(skb, portid, seq, event, sizeof(struct nfgenmsg), 0);
4485 if (nlh == NULL)
4486 goto nla_put_failure;
4487
4488 nfmsg = nlmsg_data(nlh);
4489 nfmsg->nfgen_family = AF_UNSPEC;
4490 nfmsg->version = NFNETLINK_V0;
4491 nfmsg->res_id = htons(net->nft.base_seq & 0xffff);
4492
4493 if (nla_put_be32(skb, NFTA_GEN_ID, htonl(net->nft.base_seq)))
4494 goto nla_put_failure;
4495
4496 nlmsg_end(skb, nlh);
4497 return 0;
4498
4499 nla_put_failure:
4500 nlmsg_trim(skb, nlh);
4501 return -EMSGSIZE;
4502 }
4503
4504 static int nf_tables_gen_notify(struct net *net, struct sk_buff *skb, int event)
4505 {
4506 struct nlmsghdr *nlh = nlmsg_hdr(skb);
4507 struct sk_buff *skb2;
4508 int err;
4509
4510 if (nlmsg_report(nlh) &&
4511 !nfnetlink_has_listeners(net, NFNLGRP_NFTABLES))
4512 return 0;
4513
4514 err = -ENOBUFS;
4515 skb2 = nlmsg_new(NLMSG_GOODSIZE, GFP_KERNEL);
4516 if (skb2 == NULL)
4517 goto err;
4518
4519 err = nf_tables_fill_gen_info(skb2, net, NETLINK_CB(skb).portid,
4520 nlh->nlmsg_seq);
4521 if (err < 0) {
4522 kfree_skb(skb2);
4523 goto err;
4524 }
4525
4526 err = nfnetlink_send(skb2, net, NETLINK_CB(skb).portid,
4527 NFNLGRP_NFTABLES, nlmsg_report(nlh), GFP_KERNEL);
4528 err:
4529 if (err < 0) {
4530 nfnetlink_set_err(net, NETLINK_CB(skb).portid, NFNLGRP_NFTABLES,
4531 err);
4532 }
4533 return err;
4534 }
4535
4536 static int nf_tables_getgen(struct net *net, struct sock *nlsk,
4537 struct sk_buff *skb, const struct nlmsghdr *nlh,
4538 const struct nlattr * const nla[])
4539 {
4540 struct sk_buff *skb2;
4541 int err;
4542
4543 skb2 = alloc_skb(NLMSG_GOODSIZE, GFP_KERNEL);
4544 if (skb2 == NULL)
4545 return -ENOMEM;
4546
4547 err = nf_tables_fill_gen_info(skb2, net, NETLINK_CB(skb).portid,
4548 nlh->nlmsg_seq);
4549 if (err < 0)
4550 goto err;
4551
4552 return nlmsg_unicast(nlsk, skb2, NETLINK_CB(skb).portid);
4553 err:
4554 kfree_skb(skb2);
4555 return err;
4556 }
4557
4558 static const struct nfnl_callback nf_tables_cb[NFT_MSG_MAX] = {
4559 [NFT_MSG_NEWTABLE] = {
4560 .call_batch = nf_tables_newtable,
4561 .attr_count = NFTA_TABLE_MAX,
4562 .policy = nft_table_policy,
4563 },
4564 [NFT_MSG_GETTABLE] = {
4565 .call = nf_tables_gettable,
4566 .attr_count = NFTA_TABLE_MAX,
4567 .policy = nft_table_policy,
4568 },
4569 [NFT_MSG_DELTABLE] = {
4570 .call_batch = nf_tables_deltable,
4571 .attr_count = NFTA_TABLE_MAX,
4572 .policy = nft_table_policy,
4573 },
4574 [NFT_MSG_NEWCHAIN] = {
4575 .call_batch = nf_tables_newchain,
4576 .attr_count = NFTA_CHAIN_MAX,
4577 .policy = nft_chain_policy,
4578 },
4579 [NFT_MSG_GETCHAIN] = {
4580 .call = nf_tables_getchain,
4581 .attr_count = NFTA_CHAIN_MAX,
4582 .policy = nft_chain_policy,
4583 },
4584 [NFT_MSG_DELCHAIN] = {
4585 .call_batch = nf_tables_delchain,
4586 .attr_count = NFTA_CHAIN_MAX,
4587 .policy = nft_chain_policy,
4588 },
4589 [NFT_MSG_NEWRULE] = {
4590 .call_batch = nf_tables_newrule,
4591 .attr_count = NFTA_RULE_MAX,
4592 .policy = nft_rule_policy,
4593 },
4594 [NFT_MSG_GETRULE] = {
4595 .call = nf_tables_getrule,
4596 .attr_count = NFTA_RULE_MAX,
4597 .policy = nft_rule_policy,
4598 },
4599 [NFT_MSG_DELRULE] = {
4600 .call_batch = nf_tables_delrule,
4601 .attr_count = NFTA_RULE_MAX,
4602 .policy = nft_rule_policy,
4603 },
4604 [NFT_MSG_NEWSET] = {
4605 .call_batch = nf_tables_newset,
4606 .attr_count = NFTA_SET_MAX,
4607 .policy = nft_set_policy,
4608 },
4609 [NFT_MSG_GETSET] = {
4610 .call = nf_tables_getset,
4611 .attr_count = NFTA_SET_MAX,
4612 .policy = nft_set_policy,
4613 },
4614 [NFT_MSG_DELSET] = {
4615 .call_batch = nf_tables_delset,
4616 .attr_count = NFTA_SET_MAX,
4617 .policy = nft_set_policy,
4618 },
4619 [NFT_MSG_NEWSETELEM] = {
4620 .call_batch = nf_tables_newsetelem,
4621 .attr_count = NFTA_SET_ELEM_LIST_MAX,
4622 .policy = nft_set_elem_list_policy,
4623 },
4624 [NFT_MSG_GETSETELEM] = {
4625 .call = nf_tables_getsetelem,
4626 .attr_count = NFTA_SET_ELEM_LIST_MAX,
4627 .policy = nft_set_elem_list_policy,
4628 },
4629 [NFT_MSG_DELSETELEM] = {
4630 .call_batch = nf_tables_delsetelem,
4631 .attr_count = NFTA_SET_ELEM_LIST_MAX,
4632 .policy = nft_set_elem_list_policy,
4633 },
4634 [NFT_MSG_GETGEN] = {
4635 .call = nf_tables_getgen,
4636 },
4637 [NFT_MSG_NEWOBJ] = {
4638 .call_batch = nf_tables_newobj,
4639 .attr_count = NFTA_OBJ_MAX,
4640 .policy = nft_obj_policy,
4641 },
4642 [NFT_MSG_GETOBJ] = {
4643 .call = nf_tables_getobj,
4644 .attr_count = NFTA_OBJ_MAX,
4645 .policy = nft_obj_policy,
4646 },
4647 [NFT_MSG_DELOBJ] = {
4648 .call_batch = nf_tables_delobj,
4649 .attr_count = NFTA_OBJ_MAX,
4650 .policy = nft_obj_policy,
4651 },
4652 [NFT_MSG_GETOBJ_RESET] = {
4653 .call = nf_tables_getobj,
4654 .attr_count = NFTA_OBJ_MAX,
4655 .policy = nft_obj_policy,
4656 },
4657 };
4658
4659 static void nft_chain_commit_update(struct nft_trans *trans)
4660 {
4661 struct nft_base_chain *basechain;
4662
4663 if (nft_trans_chain_name(trans)[0])
4664 strcpy(trans->ctx.chain->name, nft_trans_chain_name(trans));
4665
4666 if (!(trans->ctx.chain->flags & NFT_BASE_CHAIN))
4667 return;
4668
4669 basechain = nft_base_chain(trans->ctx.chain);
4670 nft_chain_stats_replace(basechain, nft_trans_chain_stats(trans));
4671
4672 switch (nft_trans_chain_policy(trans)) {
4673 case NF_DROP:
4674 case NF_ACCEPT:
4675 basechain->policy = nft_trans_chain_policy(trans);
4676 break;
4677 }
4678 }
4679
4680 static void nf_tables_commit_release(struct nft_trans *trans)
4681 {
4682 switch (trans->msg_type) {
4683 case NFT_MSG_DELTABLE:
4684 nf_tables_table_destroy(&trans->ctx);
4685 break;
4686 case NFT_MSG_DELCHAIN:
4687 nf_tables_chain_destroy(trans->ctx.chain);
4688 break;
4689 case NFT_MSG_DELRULE:
4690 nf_tables_rule_destroy(&trans->ctx, nft_trans_rule(trans));
4691 break;
4692 case NFT_MSG_DELSET:
4693 nft_set_destroy(nft_trans_set(trans));
4694 break;
4695 case NFT_MSG_DELSETELEM:
4696 nft_set_elem_destroy(nft_trans_elem_set(trans),
4697 nft_trans_elem(trans).priv, true);
4698 break;
4699 case NFT_MSG_DELOBJ:
4700 nft_obj_destroy(nft_trans_obj(trans));
4701 break;
4702 }
4703 kfree(trans);
4704 }
4705
4706 static int nf_tables_commit(struct net *net, struct sk_buff *skb)
4707 {
4708 struct nft_trans *trans, *next;
4709 struct nft_trans_elem *te;
4710
4711 /* Bump generation counter, invalidate any dump in progress */
4712 while (++net->nft.base_seq == 0);
4713
4714 /* A new generation has just started */
4715 net->nft.gencursor = nft_gencursor_next(net);
4716
4717 /* Make sure all packets have left the previous generation before
4718 * purging old rules.
4719 */
4720 synchronize_rcu();
4721
4722 list_for_each_entry_safe(trans, next, &net->nft.commit_list, list) {
4723 switch (trans->msg_type) {
4724 case NFT_MSG_NEWTABLE:
4725 if (nft_trans_table_update(trans)) {
4726 if (!nft_trans_table_enable(trans)) {
4727 nf_tables_table_disable(net,
4728 trans->ctx.afi,
4729 trans->ctx.table);
4730 trans->ctx.table->flags |= NFT_TABLE_F_DORMANT;
4731 }
4732 } else {
4733 nft_clear(net, trans->ctx.table);
4734 }
4735 nf_tables_table_notify(&trans->ctx, NFT_MSG_NEWTABLE);
4736 nft_trans_destroy(trans);
4737 break;
4738 case NFT_MSG_DELTABLE:
4739 list_del_rcu(&trans->ctx.table->list);
4740 nf_tables_table_notify(&trans->ctx, NFT_MSG_DELTABLE);
4741 break;
4742 case NFT_MSG_NEWCHAIN:
4743 if (nft_trans_chain_update(trans))
4744 nft_chain_commit_update(trans);
4745 else
4746 nft_clear(net, trans->ctx.chain);
4747
4748 nf_tables_chain_notify(&trans->ctx, NFT_MSG_NEWCHAIN);
4749 nft_trans_destroy(trans);
4750 break;
4751 case NFT_MSG_DELCHAIN:
4752 list_del_rcu(&trans->ctx.chain->list);
4753 nf_tables_chain_notify(&trans->ctx, NFT_MSG_DELCHAIN);
4754 nf_tables_unregister_hooks(trans->ctx.net,
4755 trans->ctx.table,
4756 trans->ctx.chain,
4757 trans->ctx.afi->nops);
4758 break;
4759 case NFT_MSG_NEWRULE:
4760 nft_clear(trans->ctx.net, nft_trans_rule(trans));
4761 nf_tables_rule_notify(&trans->ctx,
4762 nft_trans_rule(trans),
4763 NFT_MSG_NEWRULE);
4764 nft_trans_destroy(trans);
4765 break;
4766 case NFT_MSG_DELRULE:
4767 list_del_rcu(&nft_trans_rule(trans)->list);
4768 nf_tables_rule_notify(&trans->ctx,
4769 nft_trans_rule(trans),
4770 NFT_MSG_DELRULE);
4771 break;
4772 case NFT_MSG_NEWSET:
4773 nft_clear(net, nft_trans_set(trans));
4774 /* This avoids hitting -EBUSY when deleting the table
4775 * from the transaction.
4776 */
4777 if (nft_trans_set(trans)->flags & NFT_SET_ANONYMOUS &&
4778 !list_empty(&nft_trans_set(trans)->bindings))
4779 trans->ctx.table->use--;
4780
4781 nf_tables_set_notify(&trans->ctx, nft_trans_set(trans),
4782 NFT_MSG_NEWSET, GFP_KERNEL);
4783 nft_trans_destroy(trans);
4784 break;
4785 case NFT_MSG_DELSET:
4786 list_del_rcu(&nft_trans_set(trans)->list);
4787 nf_tables_set_notify(&trans->ctx, nft_trans_set(trans),
4788 NFT_MSG_DELSET, GFP_KERNEL);
4789 break;
4790 case NFT_MSG_NEWSETELEM:
4791 te = (struct nft_trans_elem *)trans->data;
4792
4793 te->set->ops->activate(net, te->set, &te->elem);
4794 nf_tables_setelem_notify(&trans->ctx, te->set,
4795 &te->elem,
4796 NFT_MSG_NEWSETELEM, 0);
4797 nft_trans_destroy(trans);
4798 break;
4799 case NFT_MSG_DELSETELEM:
4800 te = (struct nft_trans_elem *)trans->data;
4801
4802 nf_tables_setelem_notify(&trans->ctx, te->set,
4803 &te->elem,
4804 NFT_MSG_DELSETELEM, 0);
4805 te->set->ops->remove(net, te->set, &te->elem);
4806 atomic_dec(&te->set->nelems);
4807 te->set->ndeact--;
4808 break;
4809 case NFT_MSG_NEWOBJ:
4810 nft_clear(net, nft_trans_obj(trans));
4811 nf_tables_obj_notify(&trans->ctx, nft_trans_obj(trans),
4812 NFT_MSG_NEWOBJ);
4813 nft_trans_destroy(trans);
4814 break;
4815 case NFT_MSG_DELOBJ:
4816 list_del_rcu(&nft_trans_obj(trans)->list);
4817 nf_tables_obj_notify(&trans->ctx, nft_trans_obj(trans),
4818 NFT_MSG_DELOBJ);
4819 break;
4820 }
4821 }
4822
4823 synchronize_rcu();
4824
4825 list_for_each_entry_safe(trans, next, &net->nft.commit_list, list) {
4826 list_del(&trans->list);
4827 nf_tables_commit_release(trans);
4828 }
4829
4830 nf_tables_gen_notify(net, skb, NFT_MSG_NEWGEN);
4831
4832 return 0;
4833 }
4834
4835 static void nf_tables_abort_release(struct nft_trans *trans)
4836 {
4837 switch (trans->msg_type) {
4838 case NFT_MSG_NEWTABLE:
4839 nf_tables_table_destroy(&trans->ctx);
4840 break;
4841 case NFT_MSG_NEWCHAIN:
4842 nf_tables_chain_destroy(trans->ctx.chain);
4843 break;
4844 case NFT_MSG_NEWRULE:
4845 nf_tables_rule_destroy(&trans->ctx, nft_trans_rule(trans));
4846 break;
4847 case NFT_MSG_NEWSET:
4848 nft_set_destroy(nft_trans_set(trans));
4849 break;
4850 case NFT_MSG_NEWSETELEM:
4851 nft_set_elem_destroy(nft_trans_elem_set(trans),
4852 nft_trans_elem(trans).priv, true);
4853 break;
4854 case NFT_MSG_NEWOBJ:
4855 nft_obj_destroy(nft_trans_obj(trans));
4856 break;
4857 }
4858 kfree(trans);
4859 }
4860
4861 static int nf_tables_abort(struct net *net, struct sk_buff *skb)
4862 {
4863 struct nft_trans *trans, *next;
4864 struct nft_trans_elem *te;
4865
4866 list_for_each_entry_safe_reverse(trans, next, &net->nft.commit_list,
4867 list) {
4868 switch (trans->msg_type) {
4869 case NFT_MSG_NEWTABLE:
4870 if (nft_trans_table_update(trans)) {
4871 if (nft_trans_table_enable(trans)) {
4872 nf_tables_table_disable(net,
4873 trans->ctx.afi,
4874 trans->ctx.table);
4875 trans->ctx.table->flags |= NFT_TABLE_F_DORMANT;
4876 }
4877 nft_trans_destroy(trans);
4878 } else {
4879 list_del_rcu(&trans->ctx.table->list);
4880 }
4881 break;
4882 case NFT_MSG_DELTABLE:
4883 nft_clear(trans->ctx.net, trans->ctx.table);
4884 nft_trans_destroy(trans);
4885 break;
4886 case NFT_MSG_NEWCHAIN:
4887 if (nft_trans_chain_update(trans)) {
4888 free_percpu(nft_trans_chain_stats(trans));
4889
4890 nft_trans_destroy(trans);
4891 } else {
4892 trans->ctx.table->use--;
4893 list_del_rcu(&trans->ctx.chain->list);
4894 nf_tables_unregister_hooks(trans->ctx.net,
4895 trans->ctx.table,
4896 trans->ctx.chain,
4897 trans->ctx.afi->nops);
4898 }
4899 break;
4900 case NFT_MSG_DELCHAIN:
4901 trans->ctx.table->use++;
4902 nft_clear(trans->ctx.net, trans->ctx.chain);
4903 nft_trans_destroy(trans);
4904 break;
4905 case NFT_MSG_NEWRULE:
4906 trans->ctx.chain->use--;
4907 list_del_rcu(&nft_trans_rule(trans)->list);
4908 break;
4909 case NFT_MSG_DELRULE:
4910 trans->ctx.chain->use++;
4911 nft_clear(trans->ctx.net, nft_trans_rule(trans));
4912 nft_trans_destroy(trans);
4913 break;
4914 case NFT_MSG_NEWSET:
4915 trans->ctx.table->use--;
4916 list_del_rcu(&nft_trans_set(trans)->list);
4917 break;
4918 case NFT_MSG_DELSET:
4919 trans->ctx.table->use++;
4920 nft_clear(trans->ctx.net, nft_trans_set(trans));
4921 nft_trans_destroy(trans);
4922 break;
4923 case NFT_MSG_NEWSETELEM:
4924 te = (struct nft_trans_elem *)trans->data;
4925
4926 te->set->ops->remove(net, te->set, &te->elem);
4927 atomic_dec(&te->set->nelems);
4928 break;
4929 case NFT_MSG_DELSETELEM:
4930 te = (struct nft_trans_elem *)trans->data;
4931
4932 te->set->ops->activate(net, te->set, &te->elem);
4933 te->set->ndeact--;
4934
4935 nft_trans_destroy(trans);
4936 break;
4937 case NFT_MSG_NEWOBJ:
4938 trans->ctx.table->use--;
4939 list_del_rcu(&nft_trans_obj(trans)->list);
4940 break;
4941 case NFT_MSG_DELOBJ:
4942 trans->ctx.table->use++;
4943 nft_clear(trans->ctx.net, nft_trans_obj(trans));
4944 nft_trans_destroy(trans);
4945 break;
4946 }
4947 }
4948
4949 synchronize_rcu();
4950
4951 list_for_each_entry_safe_reverse(trans, next,
4952 &net->nft.commit_list, list) {
4953 list_del(&trans->list);
4954 nf_tables_abort_release(trans);
4955 }
4956
4957 return 0;
4958 }
4959
4960 static const struct nfnetlink_subsystem nf_tables_subsys = {
4961 .name = "nf_tables",
4962 .subsys_id = NFNL_SUBSYS_NFTABLES,
4963 .cb_count = NFT_MSG_MAX,
4964 .cb = nf_tables_cb,
4965 .commit = nf_tables_commit,
4966 .abort = nf_tables_abort,
4967 };
4968
4969 int nft_chain_validate_dependency(const struct nft_chain *chain,
4970 enum nft_chain_type type)
4971 {
4972 const struct nft_base_chain *basechain;
4973
4974 if (chain->flags & NFT_BASE_CHAIN) {
4975 basechain = nft_base_chain(chain);
4976 if (basechain->type->type != type)
4977 return -EOPNOTSUPP;
4978 }
4979 return 0;
4980 }
4981 EXPORT_SYMBOL_GPL(nft_chain_validate_dependency);
4982
4983 int nft_chain_validate_hooks(const struct nft_chain *chain,
4984 unsigned int hook_flags)
4985 {
4986 struct nft_base_chain *basechain;
4987
4988 if (chain->flags & NFT_BASE_CHAIN) {
4989 basechain = nft_base_chain(chain);
4990
4991 if ((1 << basechain->ops[0].hooknum) & hook_flags)
4992 return 0;
4993
4994 return -EOPNOTSUPP;
4995 }
4996
4997 return 0;
4998 }
4999 EXPORT_SYMBOL_GPL(nft_chain_validate_hooks);
5000
5001 /*
5002 * Loop detection - walk through the ruleset beginning at the destination chain
5003 * of a new jump until either the source chain is reached (loop) or all
5004 * reachable chains have been traversed.
5005 *
5006 * The loop check is performed whenever a new jump verdict is added to an
5007 * expression or verdict map or a verdict map is bound to a new chain.
5008 */
5009
5010 static int nf_tables_check_loops(const struct nft_ctx *ctx,
5011 const struct nft_chain *chain);
5012
5013 static int nf_tables_loop_check_setelem(const struct nft_ctx *ctx,
5014 struct nft_set *set,
5015 const struct nft_set_iter *iter,
5016 struct nft_set_elem *elem)
5017 {
5018 const struct nft_set_ext *ext = nft_set_elem_ext(set, elem->priv);
5019 const struct nft_data *data;
5020
5021 if (nft_set_ext_exists(ext, NFT_SET_EXT_FLAGS) &&
5022 *nft_set_ext_flags(ext) & NFT_SET_ELEM_INTERVAL_END)
5023 return 0;
5024
5025 data = nft_set_ext_data(ext);
5026 switch (data->verdict.code) {
5027 case NFT_JUMP:
5028 case NFT_GOTO:
5029 return nf_tables_check_loops(ctx, data->verdict.chain);
5030 default:
5031 return 0;
5032 }
5033 }
5034
5035 static int nf_tables_check_loops(const struct nft_ctx *ctx,
5036 const struct nft_chain *chain)
5037 {
5038 const struct nft_rule *rule;
5039 const struct nft_expr *expr, *last;
5040 struct nft_set *set;
5041 struct nft_set_binding *binding;
5042 struct nft_set_iter iter;
5043
5044 if (ctx->chain == chain)
5045 return -ELOOP;
5046
5047 list_for_each_entry(rule, &chain->rules, list) {
5048 nft_rule_for_each_expr(expr, last, rule) {
5049 const struct nft_data *data = NULL;
5050 int err;
5051
5052 if (!expr->ops->validate)
5053 continue;
5054
5055 err = expr->ops->validate(ctx, expr, &data);
5056 if (err < 0)
5057 return err;
5058
5059 if (data == NULL)
5060 continue;
5061
5062 switch (data->verdict.code) {
5063 case NFT_JUMP:
5064 case NFT_GOTO:
5065 err = nf_tables_check_loops(ctx,
5066 data->verdict.chain);
5067 if (err < 0)
5068 return err;
5069 default:
5070 break;
5071 }
5072 }
5073 }
5074
5075 list_for_each_entry(set, &ctx->table->sets, list) {
5076 if (!nft_is_active_next(ctx->net, set))
5077 continue;
5078 if (!(set->flags & NFT_SET_MAP) ||
5079 set->dtype != NFT_DATA_VERDICT)
5080 continue;
5081
5082 list_for_each_entry(binding, &set->bindings, list) {
5083 if (!(binding->flags & NFT_SET_MAP) ||
5084 binding->chain != chain)
5085 continue;
5086
5087 iter.genmask = nft_genmask_next(ctx->net);
5088 iter.skip = 0;
5089 iter.count = 0;
5090 iter.err = 0;
5091 iter.fn = nf_tables_loop_check_setelem;
5092
5093 set->ops->walk(ctx, set, &iter);
5094 if (iter.err < 0)
5095 return iter.err;
5096 }
5097 }
5098
5099 return 0;
5100 }
5101
5102 /**
5103 * nft_parse_u32_check - fetch u32 attribute and check for maximum value
5104 *
5105 * @attr: netlink attribute to fetch value from
5106 * @max: maximum value to be stored in dest
5107 * @dest: pointer to the variable
5108 *
5109 * Parse, check and store a given u32 netlink attribute into variable.
5110 * This function returns -ERANGE if the value goes over maximum value.
5111 * Otherwise a 0 is returned and the attribute value is stored in the
5112 * destination variable.
5113 */
5114 int nft_parse_u32_check(const struct nlattr *attr, int max, u32 *dest)
5115 {
5116 u32 val;
5117
5118 val = ntohl(nla_get_be32(attr));
5119 if (val > max)
5120 return -ERANGE;
5121
5122 *dest = val;
5123 return 0;
5124 }
5125 EXPORT_SYMBOL_GPL(nft_parse_u32_check);
5126
5127 /**
5128 * nft_parse_register - parse a register value from a netlink attribute
5129 *
5130 * @attr: netlink attribute
5131 *
5132 * Parse and translate a register value from a netlink attribute.
5133 * Registers used to be 128 bit wide, these register numbers will be
5134 * mapped to the corresponding 32 bit register numbers.
5135 */
5136 unsigned int nft_parse_register(const struct nlattr *attr)
5137 {
5138 unsigned int reg;
5139
5140 reg = ntohl(nla_get_be32(attr));
5141 switch (reg) {
5142 case NFT_REG_VERDICT...NFT_REG_4:
5143 return reg * NFT_REG_SIZE / NFT_REG32_SIZE;
5144 default:
5145 return reg + NFT_REG_SIZE / NFT_REG32_SIZE - NFT_REG32_00;
5146 }
5147 }
5148 EXPORT_SYMBOL_GPL(nft_parse_register);
5149
5150 /**
5151 * nft_dump_register - dump a register value to a netlink attribute
5152 *
5153 * @skb: socket buffer
5154 * @attr: attribute number
5155 * @reg: register number
5156 *
5157 * Construct a netlink attribute containing the register number. For
5158 * compatibility reasons, register numbers being a multiple of 4 are
5159 * translated to the corresponding 128 bit register numbers.
5160 */
5161 int nft_dump_register(struct sk_buff *skb, unsigned int attr, unsigned int reg)
5162 {
5163 if (reg % (NFT_REG_SIZE / NFT_REG32_SIZE) == 0)
5164 reg = reg / (NFT_REG_SIZE / NFT_REG32_SIZE);
5165 else
5166 reg = reg - NFT_REG_SIZE / NFT_REG32_SIZE + NFT_REG32_00;
5167
5168 return nla_put_be32(skb, attr, htonl(reg));
5169 }
5170 EXPORT_SYMBOL_GPL(nft_dump_register);
5171
5172 /**
5173 * nft_validate_register_load - validate a load from a register
5174 *
5175 * @reg: the register number
5176 * @len: the length of the data
5177 *
5178 * Validate that the input register is one of the general purpose
5179 * registers and that the length of the load is within the bounds.
5180 */
5181 int nft_validate_register_load(enum nft_registers reg, unsigned int len)
5182 {
5183 if (reg < NFT_REG_1 * NFT_REG_SIZE / NFT_REG32_SIZE)
5184 return -EINVAL;
5185 if (len == 0)
5186 return -EINVAL;
5187 if (reg * NFT_REG32_SIZE + len > FIELD_SIZEOF(struct nft_regs, data))
5188 return -ERANGE;
5189
5190 return 0;
5191 }
5192 EXPORT_SYMBOL_GPL(nft_validate_register_load);
5193
5194 /**
5195 * nft_validate_register_store - validate an expressions' register store
5196 *
5197 * @ctx: context of the expression performing the load
5198 * @reg: the destination register number
5199 * @data: the data to load
5200 * @type: the data type
5201 * @len: the length of the data
5202 *
5203 * Validate that a data load uses the appropriate data type for
5204 * the destination register and the length is within the bounds.
5205 * A value of NULL for the data means that its runtime gathered
5206 * data.
5207 */
5208 int nft_validate_register_store(const struct nft_ctx *ctx,
5209 enum nft_registers reg,
5210 const struct nft_data *data,
5211 enum nft_data_types type, unsigned int len)
5212 {
5213 int err;
5214
5215 switch (reg) {
5216 case NFT_REG_VERDICT:
5217 if (type != NFT_DATA_VERDICT)
5218 return -EINVAL;
5219
5220 if (data != NULL &&
5221 (data->verdict.code == NFT_GOTO ||
5222 data->verdict.code == NFT_JUMP)) {
5223 err = nf_tables_check_loops(ctx, data->verdict.chain);
5224 if (err < 0)
5225 return err;
5226
5227 if (ctx->chain->level + 1 >
5228 data->verdict.chain->level) {
5229 if (ctx->chain->level + 1 == NFT_JUMP_STACK_SIZE)
5230 return -EMLINK;
5231 data->verdict.chain->level = ctx->chain->level + 1;
5232 }
5233 }
5234
5235 return 0;
5236 default:
5237 if (reg < NFT_REG_1 * NFT_REG_SIZE / NFT_REG32_SIZE)
5238 return -EINVAL;
5239 if (len == 0)
5240 return -EINVAL;
5241 if (reg * NFT_REG32_SIZE + len >
5242 FIELD_SIZEOF(struct nft_regs, data))
5243 return -ERANGE;
5244
5245 if (data != NULL && type != NFT_DATA_VALUE)
5246 return -EINVAL;
5247 return 0;
5248 }
5249 }
5250 EXPORT_SYMBOL_GPL(nft_validate_register_store);
5251
5252 static const struct nla_policy nft_verdict_policy[NFTA_VERDICT_MAX + 1] = {
5253 [NFTA_VERDICT_CODE] = { .type = NLA_U32 },
5254 [NFTA_VERDICT_CHAIN] = { .type = NLA_STRING,
5255 .len = NFT_CHAIN_MAXNAMELEN - 1 },
5256 };
5257
5258 static int nft_verdict_init(const struct nft_ctx *ctx, struct nft_data *data,
5259 struct nft_data_desc *desc, const struct nlattr *nla)
5260 {
5261 u8 genmask = nft_genmask_next(ctx->net);
5262 struct nlattr *tb[NFTA_VERDICT_MAX + 1];
5263 struct nft_chain *chain;
5264 int err;
5265
5266 err = nla_parse_nested(tb, NFTA_VERDICT_MAX, nla, nft_verdict_policy);
5267 if (err < 0)
5268 return err;
5269
5270 if (!tb[NFTA_VERDICT_CODE])
5271 return -EINVAL;
5272 data->verdict.code = ntohl(nla_get_be32(tb[NFTA_VERDICT_CODE]));
5273
5274 switch (data->verdict.code) {
5275 default:
5276 switch (data->verdict.code & NF_VERDICT_MASK) {
5277 case NF_ACCEPT:
5278 case NF_DROP:
5279 case NF_QUEUE:
5280 break;
5281 default:
5282 return -EINVAL;
5283 }
5284 /* fall through */
5285 case NFT_CONTINUE:
5286 case NFT_BREAK:
5287 case NFT_RETURN:
5288 break;
5289 case NFT_JUMP:
5290 case NFT_GOTO:
5291 if (!tb[NFTA_VERDICT_CHAIN])
5292 return -EINVAL;
5293 chain = nf_tables_chain_lookup(ctx->table,
5294 tb[NFTA_VERDICT_CHAIN], genmask);
5295 if (IS_ERR(chain))
5296 return PTR_ERR(chain);
5297 if (chain->flags & NFT_BASE_CHAIN)
5298 return -EOPNOTSUPP;
5299
5300 chain->use++;
5301 data->verdict.chain = chain;
5302 break;
5303 }
5304
5305 desc->len = sizeof(data->verdict);
5306 desc->type = NFT_DATA_VERDICT;
5307 return 0;
5308 }
5309
5310 static void nft_verdict_uninit(const struct nft_data *data)
5311 {
5312 switch (data->verdict.code) {
5313 case NFT_JUMP:
5314 case NFT_GOTO:
5315 data->verdict.chain->use--;
5316 break;
5317 }
5318 }
5319
5320 int nft_verdict_dump(struct sk_buff *skb, int type, const struct nft_verdict *v)
5321 {
5322 struct nlattr *nest;
5323
5324 nest = nla_nest_start(skb, type);
5325 if (!nest)
5326 goto nla_put_failure;
5327
5328 if (nla_put_be32(skb, NFTA_VERDICT_CODE, htonl(v->code)))
5329 goto nla_put_failure;
5330
5331 switch (v->code) {
5332 case NFT_JUMP:
5333 case NFT_GOTO:
5334 if (nla_put_string(skb, NFTA_VERDICT_CHAIN,
5335 v->chain->name))
5336 goto nla_put_failure;
5337 }
5338 nla_nest_end(skb, nest);
5339 return 0;
5340
5341 nla_put_failure:
5342 return -1;
5343 }
5344
5345 static int nft_value_init(const struct nft_ctx *ctx,
5346 struct nft_data *data, unsigned int size,
5347 struct nft_data_desc *desc, const struct nlattr *nla)
5348 {
5349 unsigned int len;
5350
5351 len = nla_len(nla);
5352 if (len == 0)
5353 return -EINVAL;
5354 if (len > size)
5355 return -EOVERFLOW;
5356
5357 nla_memcpy(data->data, nla, len);
5358 desc->type = NFT_DATA_VALUE;
5359 desc->len = len;
5360 return 0;
5361 }
5362
5363 static int nft_value_dump(struct sk_buff *skb, const struct nft_data *data,
5364 unsigned int len)
5365 {
5366 return nla_put(skb, NFTA_DATA_VALUE, len, data->data);
5367 }
5368
5369 static const struct nla_policy nft_data_policy[NFTA_DATA_MAX + 1] = {
5370 [NFTA_DATA_VALUE] = { .type = NLA_BINARY },
5371 [NFTA_DATA_VERDICT] = { .type = NLA_NESTED },
5372 };
5373
5374 /**
5375 * nft_data_init - parse nf_tables data netlink attributes
5376 *
5377 * @ctx: context of the expression using the data
5378 * @data: destination struct nft_data
5379 * @size: maximum data length
5380 * @desc: data description
5381 * @nla: netlink attribute containing data
5382 *
5383 * Parse the netlink data attributes and initialize a struct nft_data.
5384 * The type and length of data are returned in the data description.
5385 *
5386 * The caller can indicate that it only wants to accept data of type
5387 * NFT_DATA_VALUE by passing NULL for the ctx argument.
5388 */
5389 int nft_data_init(const struct nft_ctx *ctx,
5390 struct nft_data *data, unsigned int size,
5391 struct nft_data_desc *desc, const struct nlattr *nla)
5392 {
5393 struct nlattr *tb[NFTA_DATA_MAX + 1];
5394 int err;
5395
5396 err = nla_parse_nested(tb, NFTA_DATA_MAX, nla, nft_data_policy);
5397 if (err < 0)
5398 return err;
5399
5400 if (tb[NFTA_DATA_VALUE])
5401 return nft_value_init(ctx, data, size, desc,
5402 tb[NFTA_DATA_VALUE]);
5403 if (tb[NFTA_DATA_VERDICT] && ctx != NULL)
5404 return nft_verdict_init(ctx, data, desc, tb[NFTA_DATA_VERDICT]);
5405 return -EINVAL;
5406 }
5407 EXPORT_SYMBOL_GPL(nft_data_init);
5408
5409 /**
5410 * nft_data_uninit - release a nft_data item
5411 *
5412 * @data: struct nft_data to release
5413 * @type: type of data
5414 *
5415 * Release a nft_data item. NFT_DATA_VALUE types can be silently discarded,
5416 * all others need to be released by calling this function.
5417 */
5418 void nft_data_uninit(const struct nft_data *data, enum nft_data_types type)
5419 {
5420 if (type < NFT_DATA_VERDICT)
5421 return;
5422 switch (type) {
5423 case NFT_DATA_VERDICT:
5424 return nft_verdict_uninit(data);
5425 default:
5426 WARN_ON(1);
5427 }
5428 }
5429 EXPORT_SYMBOL_GPL(nft_data_uninit);
5430
5431 int nft_data_dump(struct sk_buff *skb, int attr, const struct nft_data *data,
5432 enum nft_data_types type, unsigned int len)
5433 {
5434 struct nlattr *nest;
5435 int err;
5436
5437 nest = nla_nest_start(skb, attr);
5438 if (nest == NULL)
5439 return -1;
5440
5441 switch (type) {
5442 case NFT_DATA_VALUE:
5443 err = nft_value_dump(skb, data, len);
5444 break;
5445 case NFT_DATA_VERDICT:
5446 err = nft_verdict_dump(skb, NFTA_DATA_VERDICT, &data->verdict);
5447 break;
5448 default:
5449 err = -EINVAL;
5450 WARN_ON(1);
5451 }
5452
5453 nla_nest_end(skb, nest);
5454 return err;
5455 }
5456 EXPORT_SYMBOL_GPL(nft_data_dump);
5457
5458 static int __net_init nf_tables_init_net(struct net *net)
5459 {
5460 INIT_LIST_HEAD(&net->nft.af_info);
5461 INIT_LIST_HEAD(&net->nft.commit_list);
5462 net->nft.base_seq = 1;
5463 return 0;
5464 }
5465
5466 int __nft_release_basechain(struct nft_ctx *ctx)
5467 {
5468 struct nft_rule *rule, *nr;
5469
5470 BUG_ON(!(ctx->chain->flags & NFT_BASE_CHAIN));
5471
5472 nf_tables_unregister_hooks(ctx->net, ctx->chain->table, ctx->chain,
5473 ctx->afi->nops);
5474 list_for_each_entry_safe(rule, nr, &ctx->chain->rules, list) {
5475 list_del(&rule->list);
5476 ctx->chain->use--;
5477 nf_tables_rule_destroy(ctx, rule);
5478 }
5479 list_del(&ctx->chain->list);
5480 ctx->table->use--;
5481 nf_tables_chain_destroy(ctx->chain);
5482
5483 return 0;
5484 }
5485 EXPORT_SYMBOL_GPL(__nft_release_basechain);
5486
5487 /* Called by nft_unregister_afinfo() from __net_exit path, nfnl_lock is held. */
5488 static void __nft_release_afinfo(struct net *net, struct nft_af_info *afi)
5489 {
5490 struct nft_table *table, *nt;
5491 struct nft_chain *chain, *nc;
5492 struct nft_object *obj, *ne;
5493 struct nft_rule *rule, *nr;
5494 struct nft_set *set, *ns;
5495 struct nft_ctx ctx = {
5496 .net = net,
5497 .afi = afi,
5498 };
5499
5500 list_for_each_entry_safe(table, nt, &afi->tables, list) {
5501 list_for_each_entry(chain, &table->chains, list)
5502 nf_tables_unregister_hooks(net, table, chain,
5503 afi->nops);
5504 /* No packets are walking on these chains anymore. */
5505 ctx.table = table;
5506 list_for_each_entry(chain, &table->chains, list) {
5507 ctx.chain = chain;
5508 list_for_each_entry_safe(rule, nr, &chain->rules, list) {
5509 list_del(&rule->list);
5510 chain->use--;
5511 nf_tables_rule_destroy(&ctx, rule);
5512 }
5513 }
5514 list_for_each_entry_safe(set, ns, &table->sets, list) {
5515 list_del(&set->list);
5516 table->use--;
5517 nft_set_destroy(set);
5518 }
5519 list_for_each_entry_safe(obj, ne, &table->objects, list) {
5520 list_del(&obj->list);
5521 table->use--;
5522 nft_obj_destroy(obj);
5523 }
5524 list_for_each_entry_safe(chain, nc, &table->chains, list) {
5525 list_del(&chain->list);
5526 table->use--;
5527 nf_tables_chain_destroy(chain);
5528 }
5529 list_del(&table->list);
5530 nf_tables_table_destroy(&ctx);
5531 }
5532 }
5533
5534 static struct pernet_operations nf_tables_net_ops = {
5535 .init = nf_tables_init_net,
5536 };
5537
5538 static int __init nf_tables_module_init(void)
5539 {
5540 int err;
5541
5542 info = kmalloc(sizeof(struct nft_expr_info) * NFT_RULE_MAXEXPRS,
5543 GFP_KERNEL);
5544 if (info == NULL) {
5545 err = -ENOMEM;
5546 goto err1;
5547 }
5548
5549 err = nf_tables_core_module_init();
5550 if (err < 0)
5551 goto err2;
5552
5553 err = nfnetlink_subsys_register(&nf_tables_subsys);
5554 if (err < 0)
5555 goto err3;
5556
5557 pr_info("nf_tables: (c) 2007-2009 Patrick McHardy <kaber@trash.net>\n");
5558 return register_pernet_subsys(&nf_tables_net_ops);
5559 err3:
5560 nf_tables_core_module_exit();
5561 err2:
5562 kfree(info);
5563 err1:
5564 return err;
5565 }
5566
5567 static void __exit nf_tables_module_exit(void)
5568 {
5569 unregister_pernet_subsys(&nf_tables_net_ops);
5570 nfnetlink_subsys_unregister(&nf_tables_subsys);
5571 rcu_barrier();
5572 nf_tables_core_module_exit();
5573 kfree(info);
5574 }
5575
5576 module_init(nf_tables_module_init);
5577 module_exit(nf_tables_module_exit);
5578
5579 MODULE_LICENSE("GPL");
5580 MODULE_AUTHOR("Patrick McHardy <kaber@trash.net>");
5581 MODULE_ALIAS_NFNL_SUBSYS(NFNL_SUBSYS_NFTABLES);