]> git.proxmox.com Git - mirror_ubuntu-artful-kernel.git/blob - net/netfilter/nf_tables_api.c
7d6a626b08f17d04c5192f25b58c078d84fe8a3b
[mirror_ubuntu-artful-kernel.git] / net / netfilter / nf_tables_api.c
1 /*
2 * Copyright (c) 2007-2009 Patrick McHardy <kaber@trash.net>
3 *
4 * This program is free software; you can redistribute it and/or modify
5 * it under the terms of the GNU General Public License version 2 as
6 * published by the Free Software Foundation.
7 *
8 * Development of this code funded by Astaro AG (http://www.astaro.com/)
9 */
10
11 #include <linux/module.h>
12 #include <linux/init.h>
13 #include <linux/list.h>
14 #include <linux/skbuff.h>
15 #include <linux/netlink.h>
16 #include <linux/netfilter.h>
17 #include <linux/netfilter/nfnetlink.h>
18 #include <linux/netfilter/nf_tables.h>
19 #include <net/netfilter/nf_tables_core.h>
20 #include <net/netfilter/nf_tables.h>
21 #include <net/net_namespace.h>
22 #include <net/sock.h>
23
24 static LIST_HEAD(nf_tables_expressions);
25
26 /**
27 * nft_register_afinfo - register nf_tables address family info
28 *
29 * @afi: address family info to register
30 *
31 * Register the address family for use with nf_tables. Returns zero on
32 * success or a negative errno code otherwise.
33 */
34 int nft_register_afinfo(struct net *net, struct nft_af_info *afi)
35 {
36 INIT_LIST_HEAD(&afi->tables);
37 nfnl_lock(NFNL_SUBSYS_NFTABLES);
38 list_add_tail_rcu(&afi->list, &net->nft.af_info);
39 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
40 return 0;
41 }
42 EXPORT_SYMBOL_GPL(nft_register_afinfo);
43
44 static void __nft_release_afinfo(struct net *net, struct nft_af_info *afi);
45
46 /**
47 * nft_unregister_afinfo - unregister nf_tables address family info
48 *
49 * @afi: address family info to unregister
50 *
51 * Unregister the address family for use with nf_tables.
52 */
53 void nft_unregister_afinfo(struct net *net, struct nft_af_info *afi)
54 {
55 nfnl_lock(NFNL_SUBSYS_NFTABLES);
56 __nft_release_afinfo(net, afi);
57 list_del_rcu(&afi->list);
58 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
59 }
60 EXPORT_SYMBOL_GPL(nft_unregister_afinfo);
61
62 static struct nft_af_info *nft_afinfo_lookup(struct net *net, int family)
63 {
64 struct nft_af_info *afi;
65
66 list_for_each_entry(afi, &net->nft.af_info, list) {
67 if (afi->family == family)
68 return afi;
69 }
70 return NULL;
71 }
72
73 static struct nft_af_info *
74 nf_tables_afinfo_lookup(struct net *net, int family, bool autoload)
75 {
76 struct nft_af_info *afi;
77
78 afi = nft_afinfo_lookup(net, family);
79 if (afi != NULL)
80 return afi;
81 #ifdef CONFIG_MODULES
82 if (autoload) {
83 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
84 request_module("nft-afinfo-%u", family);
85 nfnl_lock(NFNL_SUBSYS_NFTABLES);
86 afi = nft_afinfo_lookup(net, family);
87 if (afi != NULL)
88 return ERR_PTR(-EAGAIN);
89 }
90 #endif
91 return ERR_PTR(-EAFNOSUPPORT);
92 }
93
94 static void nft_ctx_init(struct nft_ctx *ctx,
95 struct net *net,
96 const struct sk_buff *skb,
97 const struct nlmsghdr *nlh,
98 struct nft_af_info *afi,
99 struct nft_table *table,
100 struct nft_chain *chain,
101 const struct nlattr * const *nla)
102 {
103 ctx->net = net;
104 ctx->afi = afi;
105 ctx->table = table;
106 ctx->chain = chain;
107 ctx->nla = nla;
108 ctx->portid = NETLINK_CB(skb).portid;
109 ctx->report = nlmsg_report(nlh);
110 ctx->seq = nlh->nlmsg_seq;
111 }
112
113 static struct nft_trans *nft_trans_alloc(struct nft_ctx *ctx, int msg_type,
114 u32 size)
115 {
116 struct nft_trans *trans;
117
118 trans = kzalloc(sizeof(struct nft_trans) + size, GFP_KERNEL);
119 if (trans == NULL)
120 return NULL;
121
122 trans->msg_type = msg_type;
123 trans->ctx = *ctx;
124
125 return trans;
126 }
127
128 static void nft_trans_destroy(struct nft_trans *trans)
129 {
130 list_del(&trans->list);
131 kfree(trans);
132 }
133
134 static int nf_tables_register_hooks(struct net *net,
135 const struct nft_table *table,
136 struct nft_chain *chain,
137 unsigned int hook_nops)
138 {
139 if (table->flags & NFT_TABLE_F_DORMANT ||
140 !(chain->flags & NFT_BASE_CHAIN))
141 return 0;
142
143 return nf_register_net_hooks(net, nft_base_chain(chain)->ops,
144 hook_nops);
145 }
146
147 static void nf_tables_unregister_hooks(struct net *net,
148 const struct nft_table *table,
149 struct nft_chain *chain,
150 unsigned int hook_nops)
151 {
152 if (table->flags & NFT_TABLE_F_DORMANT ||
153 !(chain->flags & NFT_BASE_CHAIN))
154 return;
155
156 nf_unregister_net_hooks(net, nft_base_chain(chain)->ops, hook_nops);
157 }
158
159 static int nft_trans_table_add(struct nft_ctx *ctx, int msg_type)
160 {
161 struct nft_trans *trans;
162
163 trans = nft_trans_alloc(ctx, msg_type, sizeof(struct nft_trans_table));
164 if (trans == NULL)
165 return -ENOMEM;
166
167 if (msg_type == NFT_MSG_NEWTABLE)
168 nft_activate_next(ctx->net, ctx->table);
169
170 list_add_tail(&trans->list, &ctx->net->nft.commit_list);
171 return 0;
172 }
173
174 static int nft_deltable(struct nft_ctx *ctx)
175 {
176 int err;
177
178 err = nft_trans_table_add(ctx, NFT_MSG_DELTABLE);
179 if (err < 0)
180 return err;
181
182 nft_deactivate_next(ctx->net, ctx->table);
183 return err;
184 }
185
186 static int nft_trans_chain_add(struct nft_ctx *ctx, int msg_type)
187 {
188 struct nft_trans *trans;
189
190 trans = nft_trans_alloc(ctx, msg_type, sizeof(struct nft_trans_chain));
191 if (trans == NULL)
192 return -ENOMEM;
193
194 if (msg_type == NFT_MSG_NEWCHAIN)
195 nft_activate_next(ctx->net, ctx->chain);
196
197 list_add_tail(&trans->list, &ctx->net->nft.commit_list);
198 return 0;
199 }
200
201 static int nft_delchain(struct nft_ctx *ctx)
202 {
203 int err;
204
205 err = nft_trans_chain_add(ctx, NFT_MSG_DELCHAIN);
206 if (err < 0)
207 return err;
208
209 ctx->table->use--;
210 nft_deactivate_next(ctx->net, ctx->chain);
211
212 return err;
213 }
214
215 static int
216 nf_tables_delrule_deactivate(struct nft_ctx *ctx, struct nft_rule *rule)
217 {
218 /* You cannot delete the same rule twice */
219 if (nft_is_active_next(ctx->net, rule)) {
220 nft_deactivate_next(ctx->net, rule);
221 ctx->chain->use--;
222 return 0;
223 }
224 return -ENOENT;
225 }
226
227 static struct nft_trans *nft_trans_rule_add(struct nft_ctx *ctx, int msg_type,
228 struct nft_rule *rule)
229 {
230 struct nft_trans *trans;
231
232 trans = nft_trans_alloc(ctx, msg_type, sizeof(struct nft_trans_rule));
233 if (trans == NULL)
234 return NULL;
235
236 nft_trans_rule(trans) = rule;
237 list_add_tail(&trans->list, &ctx->net->nft.commit_list);
238
239 return trans;
240 }
241
242 static int nft_delrule(struct nft_ctx *ctx, struct nft_rule *rule)
243 {
244 struct nft_trans *trans;
245 int err;
246
247 trans = nft_trans_rule_add(ctx, NFT_MSG_DELRULE, rule);
248 if (trans == NULL)
249 return -ENOMEM;
250
251 err = nf_tables_delrule_deactivate(ctx, rule);
252 if (err < 0) {
253 nft_trans_destroy(trans);
254 return err;
255 }
256
257 return 0;
258 }
259
260 static int nft_delrule_by_chain(struct nft_ctx *ctx)
261 {
262 struct nft_rule *rule;
263 int err;
264
265 list_for_each_entry(rule, &ctx->chain->rules, list) {
266 err = nft_delrule(ctx, rule);
267 if (err < 0)
268 return err;
269 }
270 return 0;
271 }
272
273 static int nft_trans_set_add(struct nft_ctx *ctx, int msg_type,
274 struct nft_set *set)
275 {
276 struct nft_trans *trans;
277
278 trans = nft_trans_alloc(ctx, msg_type, sizeof(struct nft_trans_set));
279 if (trans == NULL)
280 return -ENOMEM;
281
282 if (msg_type == NFT_MSG_NEWSET && ctx->nla[NFTA_SET_ID] != NULL) {
283 nft_trans_set_id(trans) =
284 ntohl(nla_get_be32(ctx->nla[NFTA_SET_ID]));
285 nft_activate_next(ctx->net, set);
286 }
287 nft_trans_set(trans) = set;
288 list_add_tail(&trans->list, &ctx->net->nft.commit_list);
289
290 return 0;
291 }
292
293 static int nft_delset(struct nft_ctx *ctx, struct nft_set *set)
294 {
295 int err;
296
297 err = nft_trans_set_add(ctx, NFT_MSG_DELSET, set);
298 if (err < 0)
299 return err;
300
301 nft_deactivate_next(ctx->net, set);
302 ctx->table->use--;
303
304 return err;
305 }
306
307 /*
308 * Tables
309 */
310
311 static struct nft_table *nft_table_lookup(const struct nft_af_info *afi,
312 const struct nlattr *nla,
313 u8 genmask)
314 {
315 struct nft_table *table;
316
317 list_for_each_entry(table, &afi->tables, list) {
318 if (!nla_strcmp(nla, table->name) &&
319 nft_active_genmask(table, genmask))
320 return table;
321 }
322 return NULL;
323 }
324
325 static struct nft_table *nf_tables_table_lookup(const struct nft_af_info *afi,
326 const struct nlattr *nla,
327 u8 genmask)
328 {
329 struct nft_table *table;
330
331 if (nla == NULL)
332 return ERR_PTR(-EINVAL);
333
334 table = nft_table_lookup(afi, nla, genmask);
335 if (table != NULL)
336 return table;
337
338 return ERR_PTR(-ENOENT);
339 }
340
341 static inline u64 nf_tables_alloc_handle(struct nft_table *table)
342 {
343 return ++table->hgenerator;
344 }
345
346 static const struct nf_chain_type *chain_type[AF_MAX][NFT_CHAIN_T_MAX];
347
348 static const struct nf_chain_type *
349 __nf_tables_chain_type_lookup(int family, const struct nlattr *nla)
350 {
351 int i;
352
353 for (i = 0; i < NFT_CHAIN_T_MAX; i++) {
354 if (chain_type[family][i] != NULL &&
355 !nla_strcmp(nla, chain_type[family][i]->name))
356 return chain_type[family][i];
357 }
358 return NULL;
359 }
360
361 static const struct nf_chain_type *
362 nf_tables_chain_type_lookup(const struct nft_af_info *afi,
363 const struct nlattr *nla,
364 bool autoload)
365 {
366 const struct nf_chain_type *type;
367
368 type = __nf_tables_chain_type_lookup(afi->family, nla);
369 if (type != NULL)
370 return type;
371 #ifdef CONFIG_MODULES
372 if (autoload) {
373 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
374 request_module("nft-chain-%u-%.*s", afi->family,
375 nla_len(nla), (const char *)nla_data(nla));
376 nfnl_lock(NFNL_SUBSYS_NFTABLES);
377 type = __nf_tables_chain_type_lookup(afi->family, nla);
378 if (type != NULL)
379 return ERR_PTR(-EAGAIN);
380 }
381 #endif
382 return ERR_PTR(-ENOENT);
383 }
384
385 static const struct nla_policy nft_table_policy[NFTA_TABLE_MAX + 1] = {
386 [NFTA_TABLE_NAME] = { .type = NLA_STRING,
387 .len = NFT_TABLE_MAXNAMELEN - 1 },
388 [NFTA_TABLE_FLAGS] = { .type = NLA_U32 },
389 };
390
391 static int nf_tables_fill_table_info(struct sk_buff *skb, struct net *net,
392 u32 portid, u32 seq, int event, u32 flags,
393 int family, const struct nft_table *table)
394 {
395 struct nlmsghdr *nlh;
396 struct nfgenmsg *nfmsg;
397
398 event |= NFNL_SUBSYS_NFTABLES << 8;
399 nlh = nlmsg_put(skb, portid, seq, event, sizeof(struct nfgenmsg), flags);
400 if (nlh == NULL)
401 goto nla_put_failure;
402
403 nfmsg = nlmsg_data(nlh);
404 nfmsg->nfgen_family = family;
405 nfmsg->version = NFNETLINK_V0;
406 nfmsg->res_id = htons(net->nft.base_seq & 0xffff);
407
408 if (nla_put_string(skb, NFTA_TABLE_NAME, table->name) ||
409 nla_put_be32(skb, NFTA_TABLE_FLAGS, htonl(table->flags)) ||
410 nla_put_be32(skb, NFTA_TABLE_USE, htonl(table->use)))
411 goto nla_put_failure;
412
413 nlmsg_end(skb, nlh);
414 return 0;
415
416 nla_put_failure:
417 nlmsg_trim(skb, nlh);
418 return -1;
419 }
420
421 static int nf_tables_table_notify(const struct nft_ctx *ctx, int event)
422 {
423 struct sk_buff *skb;
424 int err;
425
426 if (!ctx->report &&
427 !nfnetlink_has_listeners(ctx->net, NFNLGRP_NFTABLES))
428 return 0;
429
430 err = -ENOBUFS;
431 skb = nlmsg_new(NLMSG_GOODSIZE, GFP_KERNEL);
432 if (skb == NULL)
433 goto err;
434
435 err = nf_tables_fill_table_info(skb, ctx->net, ctx->portid, ctx->seq,
436 event, 0, ctx->afi->family, ctx->table);
437 if (err < 0) {
438 kfree_skb(skb);
439 goto err;
440 }
441
442 err = nfnetlink_send(skb, ctx->net, ctx->portid, NFNLGRP_NFTABLES,
443 ctx->report, GFP_KERNEL);
444 err:
445 if (err < 0) {
446 nfnetlink_set_err(ctx->net, ctx->portid, NFNLGRP_NFTABLES,
447 err);
448 }
449 return err;
450 }
451
452 static int nf_tables_dump_tables(struct sk_buff *skb,
453 struct netlink_callback *cb)
454 {
455 const struct nfgenmsg *nfmsg = nlmsg_data(cb->nlh);
456 const struct nft_af_info *afi;
457 const struct nft_table *table;
458 unsigned int idx = 0, s_idx = cb->args[0];
459 struct net *net = sock_net(skb->sk);
460 int family = nfmsg->nfgen_family;
461
462 rcu_read_lock();
463 cb->seq = net->nft.base_seq;
464
465 list_for_each_entry_rcu(afi, &net->nft.af_info, list) {
466 if (family != NFPROTO_UNSPEC && family != afi->family)
467 continue;
468
469 list_for_each_entry_rcu(table, &afi->tables, list) {
470 if (idx < s_idx)
471 goto cont;
472 if (idx > s_idx)
473 memset(&cb->args[1], 0,
474 sizeof(cb->args) - sizeof(cb->args[0]));
475 if (!nft_is_active(net, table))
476 continue;
477 if (nf_tables_fill_table_info(skb, net,
478 NETLINK_CB(cb->skb).portid,
479 cb->nlh->nlmsg_seq,
480 NFT_MSG_NEWTABLE,
481 NLM_F_MULTI,
482 afi->family, table) < 0)
483 goto done;
484
485 nl_dump_check_consistent(cb, nlmsg_hdr(skb));
486 cont:
487 idx++;
488 }
489 }
490 done:
491 rcu_read_unlock();
492 cb->args[0] = idx;
493 return skb->len;
494 }
495
496 static int nf_tables_gettable(struct net *net, struct sock *nlsk,
497 struct sk_buff *skb, const struct nlmsghdr *nlh,
498 const struct nlattr * const nla[])
499 {
500 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
501 u8 genmask = nft_genmask_cur(net);
502 const struct nft_af_info *afi;
503 const struct nft_table *table;
504 struct sk_buff *skb2;
505 int family = nfmsg->nfgen_family;
506 int err;
507
508 if (nlh->nlmsg_flags & NLM_F_DUMP) {
509 struct netlink_dump_control c = {
510 .dump = nf_tables_dump_tables,
511 };
512 return netlink_dump_start(nlsk, skb, nlh, &c);
513 }
514
515 afi = nf_tables_afinfo_lookup(net, family, false);
516 if (IS_ERR(afi))
517 return PTR_ERR(afi);
518
519 table = nf_tables_table_lookup(afi, nla[NFTA_TABLE_NAME], genmask);
520 if (IS_ERR(table))
521 return PTR_ERR(table);
522
523 skb2 = alloc_skb(NLMSG_GOODSIZE, GFP_KERNEL);
524 if (!skb2)
525 return -ENOMEM;
526
527 err = nf_tables_fill_table_info(skb2, net, NETLINK_CB(skb).portid,
528 nlh->nlmsg_seq, NFT_MSG_NEWTABLE, 0,
529 family, table);
530 if (err < 0)
531 goto err;
532
533 return nlmsg_unicast(nlsk, skb2, NETLINK_CB(skb).portid);
534
535 err:
536 kfree_skb(skb2);
537 return err;
538 }
539
540 static int nf_tables_table_enable(struct net *net,
541 const struct nft_af_info *afi,
542 struct nft_table *table)
543 {
544 struct nft_chain *chain;
545 int err, i = 0;
546
547 list_for_each_entry(chain, &table->chains, list) {
548 if (!nft_is_active_next(net, chain))
549 continue;
550 if (!(chain->flags & NFT_BASE_CHAIN))
551 continue;
552
553 err = nf_register_net_hooks(net, nft_base_chain(chain)->ops,
554 afi->nops);
555 if (err < 0)
556 goto err;
557
558 i++;
559 }
560 return 0;
561 err:
562 list_for_each_entry(chain, &table->chains, list) {
563 if (!nft_is_active_next(net, chain))
564 continue;
565 if (!(chain->flags & NFT_BASE_CHAIN))
566 continue;
567
568 if (i-- <= 0)
569 break;
570
571 nf_unregister_net_hooks(net, nft_base_chain(chain)->ops,
572 afi->nops);
573 }
574 return err;
575 }
576
577 static void nf_tables_table_disable(struct net *net,
578 const struct nft_af_info *afi,
579 struct nft_table *table)
580 {
581 struct nft_chain *chain;
582
583 list_for_each_entry(chain, &table->chains, list) {
584 if (!nft_is_active_next(net, chain))
585 continue;
586 if (!(chain->flags & NFT_BASE_CHAIN))
587 continue;
588
589 nf_unregister_net_hooks(net, nft_base_chain(chain)->ops,
590 afi->nops);
591 }
592 }
593
594 static int nf_tables_updtable(struct nft_ctx *ctx)
595 {
596 struct nft_trans *trans;
597 u32 flags;
598 int ret = 0;
599
600 if (!ctx->nla[NFTA_TABLE_FLAGS])
601 return 0;
602
603 flags = ntohl(nla_get_be32(ctx->nla[NFTA_TABLE_FLAGS]));
604 if (flags & ~NFT_TABLE_F_DORMANT)
605 return -EINVAL;
606
607 if (flags == ctx->table->flags)
608 return 0;
609
610 trans = nft_trans_alloc(ctx, NFT_MSG_NEWTABLE,
611 sizeof(struct nft_trans_table));
612 if (trans == NULL)
613 return -ENOMEM;
614
615 if ((flags & NFT_TABLE_F_DORMANT) &&
616 !(ctx->table->flags & NFT_TABLE_F_DORMANT)) {
617 nft_trans_table_enable(trans) = false;
618 } else if (!(flags & NFT_TABLE_F_DORMANT) &&
619 ctx->table->flags & NFT_TABLE_F_DORMANT) {
620 ret = nf_tables_table_enable(ctx->net, ctx->afi, ctx->table);
621 if (ret >= 0) {
622 ctx->table->flags &= ~NFT_TABLE_F_DORMANT;
623 nft_trans_table_enable(trans) = true;
624 }
625 }
626 if (ret < 0)
627 goto err;
628
629 nft_trans_table_update(trans) = true;
630 list_add_tail(&trans->list, &ctx->net->nft.commit_list);
631 return 0;
632 err:
633 nft_trans_destroy(trans);
634 return ret;
635 }
636
637 static int nf_tables_newtable(struct net *net, struct sock *nlsk,
638 struct sk_buff *skb, const struct nlmsghdr *nlh,
639 const struct nlattr * const nla[])
640 {
641 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
642 u8 genmask = nft_genmask_next(net);
643 const struct nlattr *name;
644 struct nft_af_info *afi;
645 struct nft_table *table;
646 int family = nfmsg->nfgen_family;
647 u32 flags = 0;
648 struct nft_ctx ctx;
649 int err;
650
651 afi = nf_tables_afinfo_lookup(net, family, true);
652 if (IS_ERR(afi))
653 return PTR_ERR(afi);
654
655 name = nla[NFTA_TABLE_NAME];
656 table = nf_tables_table_lookup(afi, name, genmask);
657 if (IS_ERR(table)) {
658 if (PTR_ERR(table) != -ENOENT)
659 return PTR_ERR(table);
660 table = NULL;
661 }
662
663 if (table != NULL) {
664 if (nlh->nlmsg_flags & NLM_F_EXCL)
665 return -EEXIST;
666 if (nlh->nlmsg_flags & NLM_F_REPLACE)
667 return -EOPNOTSUPP;
668
669 nft_ctx_init(&ctx, net, skb, nlh, afi, table, NULL, nla);
670 return nf_tables_updtable(&ctx);
671 }
672
673 if (nla[NFTA_TABLE_FLAGS]) {
674 flags = ntohl(nla_get_be32(nla[NFTA_TABLE_FLAGS]));
675 if (flags & ~NFT_TABLE_F_DORMANT)
676 return -EINVAL;
677 }
678
679 err = -EAFNOSUPPORT;
680 if (!try_module_get(afi->owner))
681 goto err1;
682
683 err = -ENOMEM;
684 table = kzalloc(sizeof(*table), GFP_KERNEL);
685 if (table == NULL)
686 goto err2;
687
688 nla_strlcpy(table->name, name, NFT_TABLE_MAXNAMELEN);
689 INIT_LIST_HEAD(&table->chains);
690 INIT_LIST_HEAD(&table->sets);
691 table->flags = flags;
692
693 nft_ctx_init(&ctx, net, skb, nlh, afi, table, NULL, nla);
694 err = nft_trans_table_add(&ctx, NFT_MSG_NEWTABLE);
695 if (err < 0)
696 goto err3;
697
698 list_add_tail_rcu(&table->list, &afi->tables);
699 return 0;
700 err3:
701 kfree(table);
702 err2:
703 module_put(afi->owner);
704 err1:
705 return err;
706 }
707
708 static int nft_flush_table(struct nft_ctx *ctx)
709 {
710 int err;
711 struct nft_chain *chain, *nc;
712 struct nft_set *set, *ns;
713
714 list_for_each_entry(chain, &ctx->table->chains, list) {
715 if (!nft_is_active_next(ctx->net, chain))
716 continue;
717
718 ctx->chain = chain;
719
720 err = nft_delrule_by_chain(ctx);
721 if (err < 0)
722 goto out;
723 }
724
725 list_for_each_entry_safe(set, ns, &ctx->table->sets, list) {
726 if (!nft_is_active_next(ctx->net, set))
727 continue;
728
729 if (set->flags & NFT_SET_ANONYMOUS &&
730 !list_empty(&set->bindings))
731 continue;
732
733 err = nft_delset(ctx, set);
734 if (err < 0)
735 goto out;
736 }
737
738 list_for_each_entry_safe(chain, nc, &ctx->table->chains, list) {
739 if (!nft_is_active_next(ctx->net, chain))
740 continue;
741
742 ctx->chain = chain;
743
744 err = nft_delchain(ctx);
745 if (err < 0)
746 goto out;
747 }
748
749 err = nft_deltable(ctx);
750 out:
751 return err;
752 }
753
754 static int nft_flush(struct nft_ctx *ctx, int family)
755 {
756 struct nft_af_info *afi;
757 struct nft_table *table, *nt;
758 const struct nlattr * const *nla = ctx->nla;
759 int err = 0;
760
761 list_for_each_entry(afi, &ctx->net->nft.af_info, list) {
762 if (family != AF_UNSPEC && afi->family != family)
763 continue;
764
765 ctx->afi = afi;
766 list_for_each_entry_safe(table, nt, &afi->tables, list) {
767 if (!nft_is_active_next(ctx->net, table))
768 continue;
769
770 if (nla[NFTA_TABLE_NAME] &&
771 nla_strcmp(nla[NFTA_TABLE_NAME], table->name) != 0)
772 continue;
773
774 ctx->table = table;
775
776 err = nft_flush_table(ctx);
777 if (err < 0)
778 goto out;
779 }
780 }
781 out:
782 return err;
783 }
784
785 static int nf_tables_deltable(struct net *net, struct sock *nlsk,
786 struct sk_buff *skb, const struct nlmsghdr *nlh,
787 const struct nlattr * const nla[])
788 {
789 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
790 u8 genmask = nft_genmask_next(net);
791 struct nft_af_info *afi;
792 struct nft_table *table;
793 int family = nfmsg->nfgen_family;
794 struct nft_ctx ctx;
795
796 nft_ctx_init(&ctx, net, skb, nlh, NULL, NULL, NULL, nla);
797 if (family == AF_UNSPEC || nla[NFTA_TABLE_NAME] == NULL)
798 return nft_flush(&ctx, family);
799
800 afi = nf_tables_afinfo_lookup(net, family, false);
801 if (IS_ERR(afi))
802 return PTR_ERR(afi);
803
804 table = nf_tables_table_lookup(afi, nla[NFTA_TABLE_NAME], genmask);
805 if (IS_ERR(table))
806 return PTR_ERR(table);
807
808 ctx.afi = afi;
809 ctx.table = table;
810
811 return nft_flush_table(&ctx);
812 }
813
814 static void nf_tables_table_destroy(struct nft_ctx *ctx)
815 {
816 BUG_ON(ctx->table->use > 0);
817
818 kfree(ctx->table);
819 module_put(ctx->afi->owner);
820 }
821
822 int nft_register_chain_type(const struct nf_chain_type *ctype)
823 {
824 int err = 0;
825
826 nfnl_lock(NFNL_SUBSYS_NFTABLES);
827 if (chain_type[ctype->family][ctype->type] != NULL) {
828 err = -EBUSY;
829 goto out;
830 }
831 chain_type[ctype->family][ctype->type] = ctype;
832 out:
833 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
834 return err;
835 }
836 EXPORT_SYMBOL_GPL(nft_register_chain_type);
837
838 void nft_unregister_chain_type(const struct nf_chain_type *ctype)
839 {
840 nfnl_lock(NFNL_SUBSYS_NFTABLES);
841 chain_type[ctype->family][ctype->type] = NULL;
842 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
843 }
844 EXPORT_SYMBOL_GPL(nft_unregister_chain_type);
845
846 /*
847 * Chains
848 */
849
850 static struct nft_chain *
851 nf_tables_chain_lookup_byhandle(const struct nft_table *table, u64 handle,
852 u8 genmask)
853 {
854 struct nft_chain *chain;
855
856 list_for_each_entry(chain, &table->chains, list) {
857 if (chain->handle == handle &&
858 nft_active_genmask(chain, genmask))
859 return chain;
860 }
861
862 return ERR_PTR(-ENOENT);
863 }
864
865 static struct nft_chain *nf_tables_chain_lookup(const struct nft_table *table,
866 const struct nlattr *nla,
867 u8 genmask)
868 {
869 struct nft_chain *chain;
870
871 if (nla == NULL)
872 return ERR_PTR(-EINVAL);
873
874 list_for_each_entry(chain, &table->chains, list) {
875 if (!nla_strcmp(nla, chain->name) &&
876 nft_active_genmask(chain, genmask))
877 return chain;
878 }
879
880 return ERR_PTR(-ENOENT);
881 }
882
883 static const struct nla_policy nft_chain_policy[NFTA_CHAIN_MAX + 1] = {
884 [NFTA_CHAIN_TABLE] = { .type = NLA_STRING },
885 [NFTA_CHAIN_HANDLE] = { .type = NLA_U64 },
886 [NFTA_CHAIN_NAME] = { .type = NLA_STRING,
887 .len = NFT_CHAIN_MAXNAMELEN - 1 },
888 [NFTA_CHAIN_HOOK] = { .type = NLA_NESTED },
889 [NFTA_CHAIN_POLICY] = { .type = NLA_U32 },
890 [NFTA_CHAIN_TYPE] = { .type = NLA_STRING },
891 [NFTA_CHAIN_COUNTERS] = { .type = NLA_NESTED },
892 };
893
894 static const struct nla_policy nft_hook_policy[NFTA_HOOK_MAX + 1] = {
895 [NFTA_HOOK_HOOKNUM] = { .type = NLA_U32 },
896 [NFTA_HOOK_PRIORITY] = { .type = NLA_U32 },
897 [NFTA_HOOK_DEV] = { .type = NLA_STRING,
898 .len = IFNAMSIZ - 1 },
899 };
900
901 static int nft_dump_stats(struct sk_buff *skb, struct nft_stats __percpu *stats)
902 {
903 struct nft_stats *cpu_stats, total;
904 struct nlattr *nest;
905 unsigned int seq;
906 u64 pkts, bytes;
907 int cpu;
908
909 memset(&total, 0, sizeof(total));
910 for_each_possible_cpu(cpu) {
911 cpu_stats = per_cpu_ptr(stats, cpu);
912 do {
913 seq = u64_stats_fetch_begin_irq(&cpu_stats->syncp);
914 pkts = cpu_stats->pkts;
915 bytes = cpu_stats->bytes;
916 } while (u64_stats_fetch_retry_irq(&cpu_stats->syncp, seq));
917 total.pkts += pkts;
918 total.bytes += bytes;
919 }
920 nest = nla_nest_start(skb, NFTA_CHAIN_COUNTERS);
921 if (nest == NULL)
922 goto nla_put_failure;
923
924 if (nla_put_be64(skb, NFTA_COUNTER_PACKETS, cpu_to_be64(total.pkts),
925 NFTA_COUNTER_PAD) ||
926 nla_put_be64(skb, NFTA_COUNTER_BYTES, cpu_to_be64(total.bytes),
927 NFTA_COUNTER_PAD))
928 goto nla_put_failure;
929
930 nla_nest_end(skb, nest);
931 return 0;
932
933 nla_put_failure:
934 return -ENOSPC;
935 }
936
937 static int nf_tables_fill_chain_info(struct sk_buff *skb, struct net *net,
938 u32 portid, u32 seq, int event, u32 flags,
939 int family, const struct nft_table *table,
940 const struct nft_chain *chain)
941 {
942 struct nlmsghdr *nlh;
943 struct nfgenmsg *nfmsg;
944
945 event |= NFNL_SUBSYS_NFTABLES << 8;
946 nlh = nlmsg_put(skb, portid, seq, event, sizeof(struct nfgenmsg), flags);
947 if (nlh == NULL)
948 goto nla_put_failure;
949
950 nfmsg = nlmsg_data(nlh);
951 nfmsg->nfgen_family = family;
952 nfmsg->version = NFNETLINK_V0;
953 nfmsg->res_id = htons(net->nft.base_seq & 0xffff);
954
955 if (nla_put_string(skb, NFTA_CHAIN_TABLE, table->name))
956 goto nla_put_failure;
957 if (nla_put_be64(skb, NFTA_CHAIN_HANDLE, cpu_to_be64(chain->handle),
958 NFTA_CHAIN_PAD))
959 goto nla_put_failure;
960 if (nla_put_string(skb, NFTA_CHAIN_NAME, chain->name))
961 goto nla_put_failure;
962
963 if (chain->flags & NFT_BASE_CHAIN) {
964 const struct nft_base_chain *basechain = nft_base_chain(chain);
965 const struct nf_hook_ops *ops = &basechain->ops[0];
966 struct nlattr *nest;
967
968 nest = nla_nest_start(skb, NFTA_CHAIN_HOOK);
969 if (nest == NULL)
970 goto nla_put_failure;
971 if (nla_put_be32(skb, NFTA_HOOK_HOOKNUM, htonl(ops->hooknum)))
972 goto nla_put_failure;
973 if (nla_put_be32(skb, NFTA_HOOK_PRIORITY, htonl(ops->priority)))
974 goto nla_put_failure;
975 if (basechain->dev_name[0] &&
976 nla_put_string(skb, NFTA_HOOK_DEV, basechain->dev_name))
977 goto nla_put_failure;
978 nla_nest_end(skb, nest);
979
980 if (nla_put_be32(skb, NFTA_CHAIN_POLICY,
981 htonl(basechain->policy)))
982 goto nla_put_failure;
983
984 if (nla_put_string(skb, NFTA_CHAIN_TYPE, basechain->type->name))
985 goto nla_put_failure;
986
987 if (nft_dump_stats(skb, nft_base_chain(chain)->stats))
988 goto nla_put_failure;
989 }
990
991 if (nla_put_be32(skb, NFTA_CHAIN_USE, htonl(chain->use)))
992 goto nla_put_failure;
993
994 nlmsg_end(skb, nlh);
995 return 0;
996
997 nla_put_failure:
998 nlmsg_trim(skb, nlh);
999 return -1;
1000 }
1001
1002 static int nf_tables_chain_notify(const struct nft_ctx *ctx, int event)
1003 {
1004 struct sk_buff *skb;
1005 int err;
1006
1007 if (!ctx->report &&
1008 !nfnetlink_has_listeners(ctx->net, NFNLGRP_NFTABLES))
1009 return 0;
1010
1011 err = -ENOBUFS;
1012 skb = nlmsg_new(NLMSG_GOODSIZE, GFP_KERNEL);
1013 if (skb == NULL)
1014 goto err;
1015
1016 err = nf_tables_fill_chain_info(skb, ctx->net, ctx->portid, ctx->seq,
1017 event, 0, ctx->afi->family, ctx->table,
1018 ctx->chain);
1019 if (err < 0) {
1020 kfree_skb(skb);
1021 goto err;
1022 }
1023
1024 err = nfnetlink_send(skb, ctx->net, ctx->portid, NFNLGRP_NFTABLES,
1025 ctx->report, GFP_KERNEL);
1026 err:
1027 if (err < 0) {
1028 nfnetlink_set_err(ctx->net, ctx->portid, NFNLGRP_NFTABLES,
1029 err);
1030 }
1031 return err;
1032 }
1033
1034 static int nf_tables_dump_chains(struct sk_buff *skb,
1035 struct netlink_callback *cb)
1036 {
1037 const struct nfgenmsg *nfmsg = nlmsg_data(cb->nlh);
1038 const struct nft_af_info *afi;
1039 const struct nft_table *table;
1040 const struct nft_chain *chain;
1041 unsigned int idx = 0, s_idx = cb->args[0];
1042 struct net *net = sock_net(skb->sk);
1043 int family = nfmsg->nfgen_family;
1044
1045 rcu_read_lock();
1046 cb->seq = net->nft.base_seq;
1047
1048 list_for_each_entry_rcu(afi, &net->nft.af_info, list) {
1049 if (family != NFPROTO_UNSPEC && family != afi->family)
1050 continue;
1051
1052 list_for_each_entry_rcu(table, &afi->tables, list) {
1053 list_for_each_entry_rcu(chain, &table->chains, list) {
1054 if (idx < s_idx)
1055 goto cont;
1056 if (idx > s_idx)
1057 memset(&cb->args[1], 0,
1058 sizeof(cb->args) - sizeof(cb->args[0]));
1059 if (!nft_is_active(net, chain))
1060 continue;
1061 if (nf_tables_fill_chain_info(skb, net,
1062 NETLINK_CB(cb->skb).portid,
1063 cb->nlh->nlmsg_seq,
1064 NFT_MSG_NEWCHAIN,
1065 NLM_F_MULTI,
1066 afi->family, table, chain) < 0)
1067 goto done;
1068
1069 nl_dump_check_consistent(cb, nlmsg_hdr(skb));
1070 cont:
1071 idx++;
1072 }
1073 }
1074 }
1075 done:
1076 rcu_read_unlock();
1077 cb->args[0] = idx;
1078 return skb->len;
1079 }
1080
1081 static int nf_tables_getchain(struct net *net, struct sock *nlsk,
1082 struct sk_buff *skb, const struct nlmsghdr *nlh,
1083 const struct nlattr * const nla[])
1084 {
1085 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
1086 u8 genmask = nft_genmask_cur(net);
1087 const struct nft_af_info *afi;
1088 const struct nft_table *table;
1089 const struct nft_chain *chain;
1090 struct sk_buff *skb2;
1091 int family = nfmsg->nfgen_family;
1092 int err;
1093
1094 if (nlh->nlmsg_flags & NLM_F_DUMP) {
1095 struct netlink_dump_control c = {
1096 .dump = nf_tables_dump_chains,
1097 };
1098 return netlink_dump_start(nlsk, skb, nlh, &c);
1099 }
1100
1101 afi = nf_tables_afinfo_lookup(net, family, false);
1102 if (IS_ERR(afi))
1103 return PTR_ERR(afi);
1104
1105 table = nf_tables_table_lookup(afi, nla[NFTA_CHAIN_TABLE], genmask);
1106 if (IS_ERR(table))
1107 return PTR_ERR(table);
1108
1109 chain = nf_tables_chain_lookup(table, nla[NFTA_CHAIN_NAME], genmask);
1110 if (IS_ERR(chain))
1111 return PTR_ERR(chain);
1112
1113 skb2 = alloc_skb(NLMSG_GOODSIZE, GFP_KERNEL);
1114 if (!skb2)
1115 return -ENOMEM;
1116
1117 err = nf_tables_fill_chain_info(skb2, net, NETLINK_CB(skb).portid,
1118 nlh->nlmsg_seq, NFT_MSG_NEWCHAIN, 0,
1119 family, table, chain);
1120 if (err < 0)
1121 goto err;
1122
1123 return nlmsg_unicast(nlsk, skb2, NETLINK_CB(skb).portid);
1124
1125 err:
1126 kfree_skb(skb2);
1127 return err;
1128 }
1129
1130 static const struct nla_policy nft_counter_policy[NFTA_COUNTER_MAX + 1] = {
1131 [NFTA_COUNTER_PACKETS] = { .type = NLA_U64 },
1132 [NFTA_COUNTER_BYTES] = { .type = NLA_U64 },
1133 };
1134
1135 static struct nft_stats __percpu *nft_stats_alloc(const struct nlattr *attr)
1136 {
1137 struct nlattr *tb[NFTA_COUNTER_MAX+1];
1138 struct nft_stats __percpu *newstats;
1139 struct nft_stats *stats;
1140 int err;
1141
1142 err = nla_parse_nested(tb, NFTA_COUNTER_MAX, attr, nft_counter_policy);
1143 if (err < 0)
1144 return ERR_PTR(err);
1145
1146 if (!tb[NFTA_COUNTER_BYTES] || !tb[NFTA_COUNTER_PACKETS])
1147 return ERR_PTR(-EINVAL);
1148
1149 newstats = netdev_alloc_pcpu_stats(struct nft_stats);
1150 if (newstats == NULL)
1151 return ERR_PTR(-ENOMEM);
1152
1153 /* Restore old counters on this cpu, no problem. Per-cpu statistics
1154 * are not exposed to userspace.
1155 */
1156 preempt_disable();
1157 stats = this_cpu_ptr(newstats);
1158 stats->bytes = be64_to_cpu(nla_get_be64(tb[NFTA_COUNTER_BYTES]));
1159 stats->pkts = be64_to_cpu(nla_get_be64(tb[NFTA_COUNTER_PACKETS]));
1160 preempt_enable();
1161
1162 return newstats;
1163 }
1164
1165 static void nft_chain_stats_replace(struct nft_base_chain *chain,
1166 struct nft_stats __percpu *newstats)
1167 {
1168 if (newstats == NULL)
1169 return;
1170
1171 if (chain->stats) {
1172 struct nft_stats __percpu *oldstats =
1173 nft_dereference(chain->stats);
1174
1175 rcu_assign_pointer(chain->stats, newstats);
1176 synchronize_rcu();
1177 free_percpu(oldstats);
1178 } else
1179 rcu_assign_pointer(chain->stats, newstats);
1180 }
1181
1182 static void nf_tables_chain_destroy(struct nft_chain *chain)
1183 {
1184 BUG_ON(chain->use > 0);
1185
1186 if (chain->flags & NFT_BASE_CHAIN) {
1187 struct nft_base_chain *basechain = nft_base_chain(chain);
1188
1189 module_put(basechain->type->owner);
1190 free_percpu(basechain->stats);
1191 if (basechain->ops[0].dev != NULL)
1192 dev_put(basechain->ops[0].dev);
1193 kfree(basechain);
1194 } else {
1195 kfree(chain);
1196 }
1197 }
1198
1199 struct nft_chain_hook {
1200 u32 num;
1201 u32 priority;
1202 const struct nf_chain_type *type;
1203 struct net_device *dev;
1204 };
1205
1206 static int nft_chain_parse_hook(struct net *net,
1207 const struct nlattr * const nla[],
1208 struct nft_af_info *afi,
1209 struct nft_chain_hook *hook, bool create)
1210 {
1211 struct nlattr *ha[NFTA_HOOK_MAX + 1];
1212 const struct nf_chain_type *type;
1213 struct net_device *dev;
1214 int err;
1215
1216 err = nla_parse_nested(ha, NFTA_HOOK_MAX, nla[NFTA_CHAIN_HOOK],
1217 nft_hook_policy);
1218 if (err < 0)
1219 return err;
1220
1221 if (ha[NFTA_HOOK_HOOKNUM] == NULL ||
1222 ha[NFTA_HOOK_PRIORITY] == NULL)
1223 return -EINVAL;
1224
1225 hook->num = ntohl(nla_get_be32(ha[NFTA_HOOK_HOOKNUM]));
1226 if (hook->num >= afi->nhooks)
1227 return -EINVAL;
1228
1229 hook->priority = ntohl(nla_get_be32(ha[NFTA_HOOK_PRIORITY]));
1230
1231 type = chain_type[afi->family][NFT_CHAIN_T_DEFAULT];
1232 if (nla[NFTA_CHAIN_TYPE]) {
1233 type = nf_tables_chain_type_lookup(afi, nla[NFTA_CHAIN_TYPE],
1234 create);
1235 if (IS_ERR(type))
1236 return PTR_ERR(type);
1237 }
1238 if (!(type->hook_mask & (1 << hook->num)))
1239 return -EOPNOTSUPP;
1240 if (!try_module_get(type->owner))
1241 return -ENOENT;
1242
1243 hook->type = type;
1244
1245 hook->dev = NULL;
1246 if (afi->flags & NFT_AF_NEEDS_DEV) {
1247 char ifname[IFNAMSIZ];
1248
1249 if (!ha[NFTA_HOOK_DEV]) {
1250 module_put(type->owner);
1251 return -EOPNOTSUPP;
1252 }
1253
1254 nla_strlcpy(ifname, ha[NFTA_HOOK_DEV], IFNAMSIZ);
1255 dev = dev_get_by_name(net, ifname);
1256 if (!dev) {
1257 module_put(type->owner);
1258 return -ENOENT;
1259 }
1260 hook->dev = dev;
1261 } else if (ha[NFTA_HOOK_DEV]) {
1262 module_put(type->owner);
1263 return -EOPNOTSUPP;
1264 }
1265
1266 return 0;
1267 }
1268
1269 static void nft_chain_release_hook(struct nft_chain_hook *hook)
1270 {
1271 module_put(hook->type->owner);
1272 if (hook->dev != NULL)
1273 dev_put(hook->dev);
1274 }
1275
1276 static int nf_tables_newchain(struct net *net, struct sock *nlsk,
1277 struct sk_buff *skb, const struct nlmsghdr *nlh,
1278 const struct nlattr * const nla[])
1279 {
1280 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
1281 const struct nlattr * uninitialized_var(name);
1282 struct nft_af_info *afi;
1283 struct nft_table *table;
1284 struct nft_chain *chain;
1285 struct nft_base_chain *basechain = NULL;
1286 u8 genmask = nft_genmask_next(net);
1287 int family = nfmsg->nfgen_family;
1288 u8 policy = NF_ACCEPT;
1289 u64 handle = 0;
1290 unsigned int i;
1291 struct nft_stats __percpu *stats;
1292 int err;
1293 bool create;
1294 struct nft_ctx ctx;
1295
1296 create = nlh->nlmsg_flags & NLM_F_CREATE ? true : false;
1297
1298 afi = nf_tables_afinfo_lookup(net, family, true);
1299 if (IS_ERR(afi))
1300 return PTR_ERR(afi);
1301
1302 table = nf_tables_table_lookup(afi, nla[NFTA_CHAIN_TABLE], genmask);
1303 if (IS_ERR(table))
1304 return PTR_ERR(table);
1305
1306 chain = NULL;
1307 name = nla[NFTA_CHAIN_NAME];
1308
1309 if (nla[NFTA_CHAIN_HANDLE]) {
1310 handle = be64_to_cpu(nla_get_be64(nla[NFTA_CHAIN_HANDLE]));
1311 chain = nf_tables_chain_lookup_byhandle(table, handle, genmask);
1312 if (IS_ERR(chain))
1313 return PTR_ERR(chain);
1314 } else {
1315 chain = nf_tables_chain_lookup(table, name, genmask);
1316 if (IS_ERR(chain)) {
1317 if (PTR_ERR(chain) != -ENOENT)
1318 return PTR_ERR(chain);
1319 chain = NULL;
1320 }
1321 }
1322
1323 if (nla[NFTA_CHAIN_POLICY]) {
1324 if ((chain != NULL &&
1325 !(chain->flags & NFT_BASE_CHAIN)))
1326 return -EOPNOTSUPP;
1327
1328 if (chain == NULL &&
1329 nla[NFTA_CHAIN_HOOK] == NULL)
1330 return -EOPNOTSUPP;
1331
1332 policy = ntohl(nla_get_be32(nla[NFTA_CHAIN_POLICY]));
1333 switch (policy) {
1334 case NF_DROP:
1335 case NF_ACCEPT:
1336 break;
1337 default:
1338 return -EINVAL;
1339 }
1340 }
1341
1342 if (chain != NULL) {
1343 struct nft_stats *stats = NULL;
1344 struct nft_trans *trans;
1345
1346 if (nlh->nlmsg_flags & NLM_F_EXCL)
1347 return -EEXIST;
1348 if (nlh->nlmsg_flags & NLM_F_REPLACE)
1349 return -EOPNOTSUPP;
1350
1351 if (nla[NFTA_CHAIN_HOOK]) {
1352 struct nft_base_chain *basechain;
1353 struct nft_chain_hook hook;
1354 struct nf_hook_ops *ops;
1355
1356 if (!(chain->flags & NFT_BASE_CHAIN))
1357 return -EBUSY;
1358
1359 err = nft_chain_parse_hook(net, nla, afi, &hook,
1360 create);
1361 if (err < 0)
1362 return err;
1363
1364 basechain = nft_base_chain(chain);
1365 if (basechain->type != hook.type) {
1366 nft_chain_release_hook(&hook);
1367 return -EBUSY;
1368 }
1369
1370 for (i = 0; i < afi->nops; i++) {
1371 ops = &basechain->ops[i];
1372 if (ops->hooknum != hook.num ||
1373 ops->priority != hook.priority ||
1374 ops->dev != hook.dev) {
1375 nft_chain_release_hook(&hook);
1376 return -EBUSY;
1377 }
1378 }
1379 nft_chain_release_hook(&hook);
1380 }
1381
1382 if (nla[NFTA_CHAIN_HANDLE] && name) {
1383 struct nft_chain *chain2;
1384
1385 chain2 = nf_tables_chain_lookup(table,
1386 nla[NFTA_CHAIN_NAME],
1387 genmask);
1388 if (IS_ERR(chain2))
1389 return PTR_ERR(chain2);
1390 }
1391
1392 if (nla[NFTA_CHAIN_COUNTERS]) {
1393 if (!(chain->flags & NFT_BASE_CHAIN))
1394 return -EOPNOTSUPP;
1395
1396 stats = nft_stats_alloc(nla[NFTA_CHAIN_COUNTERS]);
1397 if (IS_ERR(stats))
1398 return PTR_ERR(stats);
1399 }
1400
1401 nft_ctx_init(&ctx, net, skb, nlh, afi, table, chain, nla);
1402 trans = nft_trans_alloc(&ctx, NFT_MSG_NEWCHAIN,
1403 sizeof(struct nft_trans_chain));
1404 if (trans == NULL) {
1405 free_percpu(stats);
1406 return -ENOMEM;
1407 }
1408
1409 nft_trans_chain_stats(trans) = stats;
1410 nft_trans_chain_update(trans) = true;
1411
1412 if (nla[NFTA_CHAIN_POLICY])
1413 nft_trans_chain_policy(trans) = policy;
1414 else
1415 nft_trans_chain_policy(trans) = -1;
1416
1417 if (nla[NFTA_CHAIN_HANDLE] && name) {
1418 nla_strlcpy(nft_trans_chain_name(trans), name,
1419 NFT_CHAIN_MAXNAMELEN);
1420 }
1421 list_add_tail(&trans->list, &net->nft.commit_list);
1422 return 0;
1423 }
1424
1425 if (table->use == UINT_MAX)
1426 return -EOVERFLOW;
1427
1428 if (nla[NFTA_CHAIN_HOOK]) {
1429 struct nft_chain_hook hook;
1430 struct nf_hook_ops *ops;
1431 nf_hookfn *hookfn;
1432
1433 err = nft_chain_parse_hook(net, nla, afi, &hook, create);
1434 if (err < 0)
1435 return err;
1436
1437 basechain = kzalloc(sizeof(*basechain), GFP_KERNEL);
1438 if (basechain == NULL) {
1439 nft_chain_release_hook(&hook);
1440 return -ENOMEM;
1441 }
1442
1443 if (hook.dev != NULL)
1444 strncpy(basechain->dev_name, hook.dev->name, IFNAMSIZ);
1445
1446 if (nla[NFTA_CHAIN_COUNTERS]) {
1447 stats = nft_stats_alloc(nla[NFTA_CHAIN_COUNTERS]);
1448 if (IS_ERR(stats)) {
1449 nft_chain_release_hook(&hook);
1450 kfree(basechain);
1451 return PTR_ERR(stats);
1452 }
1453 basechain->stats = stats;
1454 } else {
1455 stats = netdev_alloc_pcpu_stats(struct nft_stats);
1456 if (stats == NULL) {
1457 nft_chain_release_hook(&hook);
1458 kfree(basechain);
1459 return -ENOMEM;
1460 }
1461 rcu_assign_pointer(basechain->stats, stats);
1462 }
1463
1464 hookfn = hook.type->hooks[hook.num];
1465 basechain->type = hook.type;
1466 chain = &basechain->chain;
1467
1468 for (i = 0; i < afi->nops; i++) {
1469 ops = &basechain->ops[i];
1470 ops->pf = family;
1471 ops->hooknum = hook.num;
1472 ops->priority = hook.priority;
1473 ops->priv = chain;
1474 ops->hook = afi->hooks[ops->hooknum];
1475 ops->dev = hook.dev;
1476 if (hookfn)
1477 ops->hook = hookfn;
1478 if (afi->hook_ops_init)
1479 afi->hook_ops_init(ops, i);
1480 }
1481
1482 chain->flags |= NFT_BASE_CHAIN;
1483 basechain->policy = policy;
1484 } else {
1485 chain = kzalloc(sizeof(*chain), GFP_KERNEL);
1486 if (chain == NULL)
1487 return -ENOMEM;
1488 }
1489
1490 INIT_LIST_HEAD(&chain->rules);
1491 chain->handle = nf_tables_alloc_handle(table);
1492 chain->table = table;
1493 nla_strlcpy(chain->name, name, NFT_CHAIN_MAXNAMELEN);
1494
1495 err = nf_tables_register_hooks(net, table, chain, afi->nops);
1496 if (err < 0)
1497 goto err1;
1498
1499 nft_ctx_init(&ctx, net, skb, nlh, afi, table, chain, nla);
1500 err = nft_trans_chain_add(&ctx, NFT_MSG_NEWCHAIN);
1501 if (err < 0)
1502 goto err2;
1503
1504 table->use++;
1505 list_add_tail_rcu(&chain->list, &table->chains);
1506 return 0;
1507 err2:
1508 nf_tables_unregister_hooks(net, table, chain, afi->nops);
1509 err1:
1510 nf_tables_chain_destroy(chain);
1511 return err;
1512 }
1513
1514 static int nf_tables_delchain(struct net *net, struct sock *nlsk,
1515 struct sk_buff *skb, const struct nlmsghdr *nlh,
1516 const struct nlattr * const nla[])
1517 {
1518 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
1519 u8 genmask = nft_genmask_next(net);
1520 struct nft_af_info *afi;
1521 struct nft_table *table;
1522 struct nft_chain *chain;
1523 int family = nfmsg->nfgen_family;
1524 struct nft_ctx ctx;
1525
1526 afi = nf_tables_afinfo_lookup(net, family, false);
1527 if (IS_ERR(afi))
1528 return PTR_ERR(afi);
1529
1530 table = nf_tables_table_lookup(afi, nla[NFTA_CHAIN_TABLE], genmask);
1531 if (IS_ERR(table))
1532 return PTR_ERR(table);
1533
1534 chain = nf_tables_chain_lookup(table, nla[NFTA_CHAIN_NAME], genmask);
1535 if (IS_ERR(chain))
1536 return PTR_ERR(chain);
1537 if (chain->use > 0)
1538 return -EBUSY;
1539
1540 nft_ctx_init(&ctx, net, skb, nlh, afi, table, chain, nla);
1541
1542 return nft_delchain(&ctx);
1543 }
1544
1545 /*
1546 * Expressions
1547 */
1548
1549 /**
1550 * nft_register_expr - register nf_tables expr type
1551 * @ops: expr type
1552 *
1553 * Registers the expr type for use with nf_tables. Returns zero on
1554 * success or a negative errno code otherwise.
1555 */
1556 int nft_register_expr(struct nft_expr_type *type)
1557 {
1558 nfnl_lock(NFNL_SUBSYS_NFTABLES);
1559 if (type->family == NFPROTO_UNSPEC)
1560 list_add_tail_rcu(&type->list, &nf_tables_expressions);
1561 else
1562 list_add_rcu(&type->list, &nf_tables_expressions);
1563 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
1564 return 0;
1565 }
1566 EXPORT_SYMBOL_GPL(nft_register_expr);
1567
1568 /**
1569 * nft_unregister_expr - unregister nf_tables expr type
1570 * @ops: expr type
1571 *
1572 * Unregisters the expr typefor use with nf_tables.
1573 */
1574 void nft_unregister_expr(struct nft_expr_type *type)
1575 {
1576 nfnl_lock(NFNL_SUBSYS_NFTABLES);
1577 list_del_rcu(&type->list);
1578 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
1579 }
1580 EXPORT_SYMBOL_GPL(nft_unregister_expr);
1581
1582 static const struct nft_expr_type *__nft_expr_type_get(u8 family,
1583 struct nlattr *nla)
1584 {
1585 const struct nft_expr_type *type;
1586
1587 list_for_each_entry(type, &nf_tables_expressions, list) {
1588 if (!nla_strcmp(nla, type->name) &&
1589 (!type->family || type->family == family))
1590 return type;
1591 }
1592 return NULL;
1593 }
1594
1595 static const struct nft_expr_type *nft_expr_type_get(u8 family,
1596 struct nlattr *nla)
1597 {
1598 const struct nft_expr_type *type;
1599
1600 if (nla == NULL)
1601 return ERR_PTR(-EINVAL);
1602
1603 type = __nft_expr_type_get(family, nla);
1604 if (type != NULL && try_module_get(type->owner))
1605 return type;
1606
1607 #ifdef CONFIG_MODULES
1608 if (type == NULL) {
1609 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
1610 request_module("nft-expr-%u-%.*s", family,
1611 nla_len(nla), (char *)nla_data(nla));
1612 nfnl_lock(NFNL_SUBSYS_NFTABLES);
1613 if (__nft_expr_type_get(family, nla))
1614 return ERR_PTR(-EAGAIN);
1615
1616 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
1617 request_module("nft-expr-%.*s",
1618 nla_len(nla), (char *)nla_data(nla));
1619 nfnl_lock(NFNL_SUBSYS_NFTABLES);
1620 if (__nft_expr_type_get(family, nla))
1621 return ERR_PTR(-EAGAIN);
1622 }
1623 #endif
1624 return ERR_PTR(-ENOENT);
1625 }
1626
1627 static const struct nla_policy nft_expr_policy[NFTA_EXPR_MAX + 1] = {
1628 [NFTA_EXPR_NAME] = { .type = NLA_STRING },
1629 [NFTA_EXPR_DATA] = { .type = NLA_NESTED },
1630 };
1631
1632 static int nf_tables_fill_expr_info(struct sk_buff *skb,
1633 const struct nft_expr *expr)
1634 {
1635 if (nla_put_string(skb, NFTA_EXPR_NAME, expr->ops->type->name))
1636 goto nla_put_failure;
1637
1638 if (expr->ops->dump) {
1639 struct nlattr *data = nla_nest_start(skb, NFTA_EXPR_DATA);
1640 if (data == NULL)
1641 goto nla_put_failure;
1642 if (expr->ops->dump(skb, expr) < 0)
1643 goto nla_put_failure;
1644 nla_nest_end(skb, data);
1645 }
1646
1647 return skb->len;
1648
1649 nla_put_failure:
1650 return -1;
1651 };
1652
/*
 * Dump @expr into @skb as a nested attribute of type @attr.
 *
 * Returns 0 on success, -1 if the nest could not be opened or the
 * expression could not be written.
 */
int nft_expr_dump(struct sk_buff *skb, unsigned int attr,
		  const struct nft_expr *expr)
{
	struct nlattr *nest = nla_nest_start(skb, attr);

	if (!nest || nf_tables_fill_expr_info(skb, expr) < 0)
		return -1;

	nla_nest_end(skb, nest);
	return 0;
}
1669
1670 struct nft_expr_info {
1671 const struct nft_expr_ops *ops;
1672 struct nlattr *tb[NFT_EXPR_MAXATTR + 1];
1673 };
1674
1675 static int nf_tables_expr_parse(const struct nft_ctx *ctx,
1676 const struct nlattr *nla,
1677 struct nft_expr_info *info)
1678 {
1679 const struct nft_expr_type *type;
1680 const struct nft_expr_ops *ops;
1681 struct nlattr *tb[NFTA_EXPR_MAX + 1];
1682 int err;
1683
1684 err = nla_parse_nested(tb, NFTA_EXPR_MAX, nla, nft_expr_policy);
1685 if (err < 0)
1686 return err;
1687
1688 type = nft_expr_type_get(ctx->afi->family, tb[NFTA_EXPR_NAME]);
1689 if (IS_ERR(type))
1690 return PTR_ERR(type);
1691
1692 if (tb[NFTA_EXPR_DATA]) {
1693 err = nla_parse_nested(info->tb, type->maxattr,
1694 tb[NFTA_EXPR_DATA], type->policy);
1695 if (err < 0)
1696 goto err1;
1697 } else
1698 memset(info->tb, 0, sizeof(info->tb[0]) * (type->maxattr + 1));
1699
1700 if (type->select_ops != NULL) {
1701 ops = type->select_ops(ctx,
1702 (const struct nlattr * const *)info->tb);
1703 if (IS_ERR(ops)) {
1704 err = PTR_ERR(ops);
1705 goto err1;
1706 }
1707 } else
1708 ops = type->ops;
1709
1710 info->ops = ops;
1711 return 0;
1712
1713 err1:
1714 module_put(type->owner);
1715 return err;
1716 }
1717
1718 static int nf_tables_newexpr(const struct nft_ctx *ctx,
1719 const struct nft_expr_info *info,
1720 struct nft_expr *expr)
1721 {
1722 const struct nft_expr_ops *ops = info->ops;
1723 int err;
1724
1725 expr->ops = ops;
1726 if (ops->init) {
1727 err = ops->init(ctx, expr, (const struct nlattr **)info->tb);
1728 if (err < 0)
1729 goto err1;
1730 }
1731
1732 return 0;
1733
1734 err1:
1735 expr->ops = NULL;
1736 return err;
1737 }
1738
1739 static void nf_tables_expr_destroy(const struct nft_ctx *ctx,
1740 struct nft_expr *expr)
1741 {
1742 if (expr->ops->destroy)
1743 expr->ops->destroy(ctx, expr);
1744 module_put(expr->ops->type->owner);
1745 }
1746
1747 struct nft_expr *nft_expr_init(const struct nft_ctx *ctx,
1748 const struct nlattr *nla)
1749 {
1750 struct nft_expr_info info;
1751 struct nft_expr *expr;
1752 int err;
1753
1754 err = nf_tables_expr_parse(ctx, nla, &info);
1755 if (err < 0)
1756 goto err1;
1757
1758 err = -ENOMEM;
1759 expr = kzalloc(info.ops->size, GFP_KERNEL);
1760 if (expr == NULL)
1761 goto err2;
1762
1763 err = nf_tables_newexpr(ctx, &info, expr);
1764 if (err < 0)
1765 goto err3;
1766
1767 return expr;
1768 err3:
1769 kfree(expr);
1770 err2:
1771 module_put(info.ops->type->owner);
1772 err1:
1773 return ERR_PTR(err);
1774 }
1775
/*
 * Destroy an expression and free its memory: the tear-down is done by
 * nf_tables_expr_destroy(), then the allocation is released with kfree().
 */
void nft_expr_destroy(const struct nft_ctx *ctx, struct nft_expr *expr)
{
	nf_tables_expr_destroy(ctx, expr);

	kfree(expr);
}
1781
1782 /*
1783 * Rules
1784 */
1785
1786 static struct nft_rule *__nf_tables_rule_lookup(const struct nft_chain *chain,
1787 u64 handle)
1788 {
1789 struct nft_rule *rule;
1790
1791 // FIXME: this sucks
1792 list_for_each_entry(rule, &chain->rules, list) {
1793 if (handle == rule->handle)
1794 return rule;
1795 }
1796
1797 return ERR_PTR(-ENOENT);
1798 }
1799
1800 static struct nft_rule *nf_tables_rule_lookup(const struct nft_chain *chain,
1801 const struct nlattr *nla)
1802 {
1803 if (nla == NULL)
1804 return ERR_PTR(-EINVAL);
1805
1806 return __nf_tables_rule_lookup(chain, be64_to_cpu(nla_get_be64(nla)));
1807 }
1808
1809 static const struct nla_policy nft_rule_policy[NFTA_RULE_MAX + 1] = {
1810 [NFTA_RULE_TABLE] = { .type = NLA_STRING },
1811 [NFTA_RULE_CHAIN] = { .type = NLA_STRING,
1812 .len = NFT_CHAIN_MAXNAMELEN - 1 },
1813 [NFTA_RULE_HANDLE] = { .type = NLA_U64 },
1814 [NFTA_RULE_EXPRESSIONS] = { .type = NLA_NESTED },
1815 [NFTA_RULE_COMPAT] = { .type = NLA_NESTED },
1816 [NFTA_RULE_POSITION] = { .type = NLA_U64 },
1817 [NFTA_RULE_USERDATA] = { .type = NLA_BINARY,
1818 .len = NFT_USERDATA_MAXLEN },
1819 };
1820
1821 static int nf_tables_fill_rule_info(struct sk_buff *skb, struct net *net,
1822 u32 portid, u32 seq, int event,
1823 u32 flags, int family,
1824 const struct nft_table *table,
1825 const struct nft_chain *chain,
1826 const struct nft_rule *rule)
1827 {
1828 struct nlmsghdr *nlh;
1829 struct nfgenmsg *nfmsg;
1830 const struct nft_expr *expr, *next;
1831 struct nlattr *list;
1832 const struct nft_rule *prule;
1833 int type = event | NFNL_SUBSYS_NFTABLES << 8;
1834
1835 nlh = nlmsg_put(skb, portid, seq, type, sizeof(struct nfgenmsg),
1836 flags);
1837 if (nlh == NULL)
1838 goto nla_put_failure;
1839
1840 nfmsg = nlmsg_data(nlh);
1841 nfmsg->nfgen_family = family;
1842 nfmsg->version = NFNETLINK_V0;
1843 nfmsg->res_id = htons(net->nft.base_seq & 0xffff);
1844
1845 if (nla_put_string(skb, NFTA_RULE_TABLE, table->name))
1846 goto nla_put_failure;
1847 if (nla_put_string(skb, NFTA_RULE_CHAIN, chain->name))
1848 goto nla_put_failure;
1849 if (nla_put_be64(skb, NFTA_RULE_HANDLE, cpu_to_be64(rule->handle),
1850 NFTA_RULE_PAD))
1851 goto nla_put_failure;
1852
1853 if ((event != NFT_MSG_DELRULE) && (rule->list.prev != &chain->rules)) {
1854 prule = list_entry(rule->list.prev, struct nft_rule, list);
1855 if (nla_put_be64(skb, NFTA_RULE_POSITION,
1856 cpu_to_be64(prule->handle),
1857 NFTA_RULE_PAD))
1858 goto nla_put_failure;
1859 }
1860
1861 list = nla_nest_start(skb, NFTA_RULE_EXPRESSIONS);
1862 if (list == NULL)
1863 goto nla_put_failure;
1864 nft_rule_for_each_expr(expr, next, rule) {
1865 if (nft_expr_dump(skb, NFTA_LIST_ELEM, expr) < 0)
1866 goto nla_put_failure;
1867 }
1868 nla_nest_end(skb, list);
1869
1870 if (rule->udata) {
1871 struct nft_userdata *udata = nft_userdata(rule);
1872 if (nla_put(skb, NFTA_RULE_USERDATA, udata->len + 1,
1873 udata->data) < 0)
1874 goto nla_put_failure;
1875 }
1876
1877 nlmsg_end(skb, nlh);
1878 return 0;
1879
1880 nla_put_failure:
1881 nlmsg_trim(skb, nlh);
1882 return -1;
1883 }
1884
1885 static int nf_tables_rule_notify(const struct nft_ctx *ctx,
1886 const struct nft_rule *rule,
1887 int event)
1888 {
1889 struct sk_buff *skb;
1890 int err;
1891
1892 if (!ctx->report &&
1893 !nfnetlink_has_listeners(ctx->net, NFNLGRP_NFTABLES))
1894 return 0;
1895
1896 err = -ENOBUFS;
1897 skb = nlmsg_new(NLMSG_GOODSIZE, GFP_KERNEL);
1898 if (skb == NULL)
1899 goto err;
1900
1901 err = nf_tables_fill_rule_info(skb, ctx->net, ctx->portid, ctx->seq,
1902 event, 0, ctx->afi->family, ctx->table,
1903 ctx->chain, rule);
1904 if (err < 0) {
1905 kfree_skb(skb);
1906 goto err;
1907 }
1908
1909 err = nfnetlink_send(skb, ctx->net, ctx->portid, NFNLGRP_NFTABLES,
1910 ctx->report, GFP_KERNEL);
1911 err:
1912 if (err < 0) {
1913 nfnetlink_set_err(ctx->net, ctx->portid, NFNLGRP_NFTABLES,
1914 err);
1915 }
1916 return err;
1917 }
1918
1919 struct nft_rule_dump_ctx {
1920 char table[NFT_TABLE_MAXNAMELEN];
1921 char chain[NFT_CHAIN_MAXNAMELEN];
1922 };
1923
1924 static int nf_tables_dump_rules(struct sk_buff *skb,
1925 struct netlink_callback *cb)
1926 {
1927 const struct nfgenmsg *nfmsg = nlmsg_data(cb->nlh);
1928 const struct nft_rule_dump_ctx *ctx = cb->data;
1929 const struct nft_af_info *afi;
1930 const struct nft_table *table;
1931 const struct nft_chain *chain;
1932 const struct nft_rule *rule;
1933 unsigned int idx = 0, s_idx = cb->args[0];
1934 struct net *net = sock_net(skb->sk);
1935 int family = nfmsg->nfgen_family;
1936
1937 rcu_read_lock();
1938 cb->seq = net->nft.base_seq;
1939
1940 list_for_each_entry_rcu(afi, &net->nft.af_info, list) {
1941 if (family != NFPROTO_UNSPEC && family != afi->family)
1942 continue;
1943
1944 list_for_each_entry_rcu(table, &afi->tables, list) {
1945 if (ctx && ctx->table[0] &&
1946 strcmp(ctx->table, table->name) != 0)
1947 continue;
1948
1949 list_for_each_entry_rcu(chain, &table->chains, list) {
1950 if (ctx && ctx->chain[0] &&
1951 strcmp(ctx->chain, chain->name) != 0)
1952 continue;
1953
1954 list_for_each_entry_rcu(rule, &chain->rules, list) {
1955 if (!nft_is_active(net, rule))
1956 goto cont;
1957 if (idx < s_idx)
1958 goto cont;
1959 if (idx > s_idx)
1960 memset(&cb->args[1], 0,
1961 sizeof(cb->args) - sizeof(cb->args[0]));
1962 if (nf_tables_fill_rule_info(skb, net, NETLINK_CB(cb->skb).portid,
1963 cb->nlh->nlmsg_seq,
1964 NFT_MSG_NEWRULE,
1965 NLM_F_MULTI | NLM_F_APPEND,
1966 afi->family, table, chain, rule) < 0)
1967 goto done;
1968
1969 nl_dump_check_consistent(cb, nlmsg_hdr(skb));
1970 cont:
1971 idx++;
1972 }
1973 }
1974 }
1975 }
1976 done:
1977 rcu_read_unlock();
1978
1979 cb->args[0] = idx;
1980 return skb->len;
1981 }
1982
1983 static int nf_tables_dump_rules_done(struct netlink_callback *cb)
1984 {
1985 kfree(cb->data);
1986 return 0;
1987 }
1988
1989 static int nf_tables_getrule(struct net *net, struct sock *nlsk,
1990 struct sk_buff *skb, const struct nlmsghdr *nlh,
1991 const struct nlattr * const nla[])
1992 {
1993 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
1994 u8 genmask = nft_genmask_cur(net);
1995 const struct nft_af_info *afi;
1996 const struct nft_table *table;
1997 const struct nft_chain *chain;
1998 const struct nft_rule *rule;
1999 struct sk_buff *skb2;
2000 int family = nfmsg->nfgen_family;
2001 int err;
2002
2003 if (nlh->nlmsg_flags & NLM_F_DUMP) {
2004 struct netlink_dump_control c = {
2005 .dump = nf_tables_dump_rules,
2006 .done = nf_tables_dump_rules_done,
2007 };
2008
2009 if (nla[NFTA_RULE_TABLE] || nla[NFTA_RULE_CHAIN]) {
2010 struct nft_rule_dump_ctx *ctx;
2011
2012 ctx = kzalloc(sizeof(*ctx), GFP_KERNEL);
2013 if (!ctx)
2014 return -ENOMEM;
2015
2016 if (nla[NFTA_RULE_TABLE])
2017 nla_strlcpy(ctx->table, nla[NFTA_RULE_TABLE],
2018 sizeof(ctx->table));
2019 if (nla[NFTA_RULE_CHAIN])
2020 nla_strlcpy(ctx->chain, nla[NFTA_RULE_CHAIN],
2021 sizeof(ctx->chain));
2022 c.data = ctx;
2023 }
2024
2025 return netlink_dump_start(nlsk, skb, nlh, &c);
2026 }
2027
2028 afi = nf_tables_afinfo_lookup(net, family, false);
2029 if (IS_ERR(afi))
2030 return PTR_ERR(afi);
2031
2032 table = nf_tables_table_lookup(afi, nla[NFTA_RULE_TABLE], genmask);
2033 if (IS_ERR(table))
2034 return PTR_ERR(table);
2035
2036 chain = nf_tables_chain_lookup(table, nla[NFTA_RULE_CHAIN], genmask);
2037 if (IS_ERR(chain))
2038 return PTR_ERR(chain);
2039
2040 rule = nf_tables_rule_lookup(chain, nla[NFTA_RULE_HANDLE]);
2041 if (IS_ERR(rule))
2042 return PTR_ERR(rule);
2043
2044 skb2 = alloc_skb(NLMSG_GOODSIZE, GFP_KERNEL);
2045 if (!skb2)
2046 return -ENOMEM;
2047
2048 err = nf_tables_fill_rule_info(skb2, net, NETLINK_CB(skb).portid,
2049 nlh->nlmsg_seq, NFT_MSG_NEWRULE, 0,
2050 family, table, chain, rule);
2051 if (err < 0)
2052 goto err;
2053
2054 return nlmsg_unicast(nlsk, skb2, NETLINK_CB(skb).portid);
2055
2056 err:
2057 kfree_skb(skb2);
2058 return err;
2059 }
2060
2061 static void nf_tables_rule_destroy(const struct nft_ctx *ctx,
2062 struct nft_rule *rule)
2063 {
2064 struct nft_expr *expr;
2065
2066 /*
2067 * Careful: some expressions might not be initialized in case this
2068 * is called on error from nf_tables_newrule().
2069 */
2070 expr = nft_expr_first(rule);
2071 while (expr->ops && expr != nft_expr_last(rule)) {
2072 nf_tables_expr_destroy(ctx, expr);
2073 expr = nft_expr_next(expr);
2074 }
2075 kfree(rule);
2076 }
2077
/* Upper bound on the number of expressions accepted in a single rule. */
#define NFT_RULE_MAXEXPRS 128

/* Scratch array used by nf_tables_newrule() while parsing a rule's
 * expressions; indexed by expression position, at most NFT_RULE_MAXEXPRS
 * entries are used. NOTE(review): allocated outside this part of the
 * file - confirm its size matches NFT_RULE_MAXEXPRS.
 */
static struct nft_expr_info *info;
2081
2082 static int nf_tables_newrule(struct net *net, struct sock *nlsk,
2083 struct sk_buff *skb, const struct nlmsghdr *nlh,
2084 const struct nlattr * const nla[])
2085 {
2086 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
2087 u8 genmask = nft_genmask_next(net);
2088 struct nft_af_info *afi;
2089 struct nft_table *table;
2090 struct nft_chain *chain;
2091 struct nft_rule *rule, *old_rule = NULL;
2092 struct nft_userdata *udata;
2093 struct nft_trans *trans = NULL;
2094 struct nft_expr *expr;
2095 struct nft_ctx ctx;
2096 struct nlattr *tmp;
2097 unsigned int size, i, n, ulen = 0, usize = 0;
2098 int err, rem;
2099 bool create;
2100 u64 handle, pos_handle;
2101
2102 create = nlh->nlmsg_flags & NLM_F_CREATE ? true : false;
2103
2104 afi = nf_tables_afinfo_lookup(net, nfmsg->nfgen_family, create);
2105 if (IS_ERR(afi))
2106 return PTR_ERR(afi);
2107
2108 table = nf_tables_table_lookup(afi, nla[NFTA_RULE_TABLE], genmask);
2109 if (IS_ERR(table))
2110 return PTR_ERR(table);
2111
2112 chain = nf_tables_chain_lookup(table, nla[NFTA_RULE_CHAIN], genmask);
2113 if (IS_ERR(chain))
2114 return PTR_ERR(chain);
2115
2116 if (nla[NFTA_RULE_HANDLE]) {
2117 handle = be64_to_cpu(nla_get_be64(nla[NFTA_RULE_HANDLE]));
2118 rule = __nf_tables_rule_lookup(chain, handle);
2119 if (IS_ERR(rule))
2120 return PTR_ERR(rule);
2121
2122 if (nlh->nlmsg_flags & NLM_F_EXCL)
2123 return -EEXIST;
2124 if (nlh->nlmsg_flags & NLM_F_REPLACE)
2125 old_rule = rule;
2126 else
2127 return -EOPNOTSUPP;
2128 } else {
2129 if (!create || nlh->nlmsg_flags & NLM_F_REPLACE)
2130 return -EINVAL;
2131 handle = nf_tables_alloc_handle(table);
2132
2133 if (chain->use == UINT_MAX)
2134 return -EOVERFLOW;
2135 }
2136
2137 if (nla[NFTA_RULE_POSITION]) {
2138 if (!(nlh->nlmsg_flags & NLM_F_CREATE))
2139 return -EOPNOTSUPP;
2140
2141 pos_handle = be64_to_cpu(nla_get_be64(nla[NFTA_RULE_POSITION]));
2142 old_rule = __nf_tables_rule_lookup(chain, pos_handle);
2143 if (IS_ERR(old_rule))
2144 return PTR_ERR(old_rule);
2145 }
2146
2147 nft_ctx_init(&ctx, net, skb, nlh, afi, table, chain, nla);
2148
2149 n = 0;
2150 size = 0;
2151 if (nla[NFTA_RULE_EXPRESSIONS]) {
2152 nla_for_each_nested(tmp, nla[NFTA_RULE_EXPRESSIONS], rem) {
2153 err = -EINVAL;
2154 if (nla_type(tmp) != NFTA_LIST_ELEM)
2155 goto err1;
2156 if (n == NFT_RULE_MAXEXPRS)
2157 goto err1;
2158 err = nf_tables_expr_parse(&ctx, tmp, &info[n]);
2159 if (err < 0)
2160 goto err1;
2161 size += info[n].ops->size;
2162 n++;
2163 }
2164 }
2165 /* Check for overflow of dlen field */
2166 err = -EFBIG;
2167 if (size >= 1 << 12)
2168 goto err1;
2169
2170 if (nla[NFTA_RULE_USERDATA]) {
2171 ulen = nla_len(nla[NFTA_RULE_USERDATA]);
2172 if (ulen > 0)
2173 usize = sizeof(struct nft_userdata) + ulen;
2174 }
2175
2176 err = -ENOMEM;
2177 rule = kzalloc(sizeof(*rule) + size + usize, GFP_KERNEL);
2178 if (rule == NULL)
2179 goto err1;
2180
2181 nft_activate_next(net, rule);
2182
2183 rule->handle = handle;
2184 rule->dlen = size;
2185 rule->udata = ulen ? 1 : 0;
2186
2187 if (ulen) {
2188 udata = nft_userdata(rule);
2189 udata->len = ulen - 1;
2190 nla_memcpy(udata->data, nla[NFTA_RULE_USERDATA], ulen);
2191 }
2192
2193 expr = nft_expr_first(rule);
2194 for (i = 0; i < n; i++) {
2195 err = nf_tables_newexpr(&ctx, &info[i], expr);
2196 if (err < 0)
2197 goto err2;
2198 info[i].ops = NULL;
2199 expr = nft_expr_next(expr);
2200 }
2201
2202 if (nlh->nlmsg_flags & NLM_F_REPLACE) {
2203 if (nft_is_active_next(net, old_rule)) {
2204 trans = nft_trans_rule_add(&ctx, NFT_MSG_DELRULE,
2205 old_rule);
2206 if (trans == NULL) {
2207 err = -ENOMEM;
2208 goto err2;
2209 }
2210 nft_deactivate_next(net, old_rule);
2211 chain->use--;
2212 list_add_tail_rcu(&rule->list, &old_rule->list);
2213 } else {
2214 err = -ENOENT;
2215 goto err2;
2216 }
2217 } else if (nlh->nlmsg_flags & NLM_F_APPEND)
2218 if (old_rule)
2219 list_add_rcu(&rule->list, &old_rule->list);
2220 else
2221 list_add_tail_rcu(&rule->list, &chain->rules);
2222 else {
2223 if (old_rule)
2224 list_add_tail_rcu(&rule->list, &old_rule->list);
2225 else
2226 list_add_rcu(&rule->list, &chain->rules);
2227 }
2228
2229 if (nft_trans_rule_add(&ctx, NFT_MSG_NEWRULE, rule) == NULL) {
2230 err = -ENOMEM;
2231 goto err3;
2232 }
2233 chain->use++;
2234 return 0;
2235
2236 err3:
2237 list_del_rcu(&rule->list);
2238 err2:
2239 nf_tables_rule_destroy(&ctx, rule);
2240 err1:
2241 for (i = 0; i < n; i++) {
2242 if (info[i].ops != NULL)
2243 module_put(info[i].ops->type->owner);
2244 }
2245 return err;
2246 }
2247
2248 static int nf_tables_delrule(struct net *net, struct sock *nlsk,
2249 struct sk_buff *skb, const struct nlmsghdr *nlh,
2250 const struct nlattr * const nla[])
2251 {
2252 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
2253 u8 genmask = nft_genmask_next(net);
2254 struct nft_af_info *afi;
2255 struct nft_table *table;
2256 struct nft_chain *chain = NULL;
2257 struct nft_rule *rule;
2258 int family = nfmsg->nfgen_family, err = 0;
2259 struct nft_ctx ctx;
2260
2261 afi = nf_tables_afinfo_lookup(net, family, false);
2262 if (IS_ERR(afi))
2263 return PTR_ERR(afi);
2264
2265 table = nf_tables_table_lookup(afi, nla[NFTA_RULE_TABLE], genmask);
2266 if (IS_ERR(table))
2267 return PTR_ERR(table);
2268
2269 if (nla[NFTA_RULE_CHAIN]) {
2270 chain = nf_tables_chain_lookup(table, nla[NFTA_RULE_CHAIN],
2271 genmask);
2272 if (IS_ERR(chain))
2273 return PTR_ERR(chain);
2274 }
2275
2276 nft_ctx_init(&ctx, net, skb, nlh, afi, table, chain, nla);
2277
2278 if (chain) {
2279 if (nla[NFTA_RULE_HANDLE]) {
2280 rule = nf_tables_rule_lookup(chain,
2281 nla[NFTA_RULE_HANDLE]);
2282 if (IS_ERR(rule))
2283 return PTR_ERR(rule);
2284
2285 err = nft_delrule(&ctx, rule);
2286 } else {
2287 err = nft_delrule_by_chain(&ctx);
2288 }
2289 } else {
2290 list_for_each_entry(chain, &table->chains, list) {
2291 if (!nft_is_active_next(net, chain))
2292 continue;
2293
2294 ctx.chain = chain;
2295 err = nft_delrule_by_chain(&ctx);
2296 if (err < 0)
2297 break;
2298 }
2299 }
2300
2301 return err;
2302 }
2303
2304 /*
2305 * Sets
2306 */
2307
2308 static LIST_HEAD(nf_tables_set_ops);
2309
2310 int nft_register_set(struct nft_set_ops *ops)
2311 {
2312 nfnl_lock(NFNL_SUBSYS_NFTABLES);
2313 list_add_tail_rcu(&ops->list, &nf_tables_set_ops);
2314 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
2315 return 0;
2316 }
2317 EXPORT_SYMBOL_GPL(nft_register_set);
2318
2319 void nft_unregister_set(struct nft_set_ops *ops)
2320 {
2321 nfnl_lock(NFNL_SUBSYS_NFTABLES);
2322 list_del_rcu(&ops->list);
2323 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
2324 }
2325 EXPORT_SYMBOL_GPL(nft_unregister_set);
2326
2327 /*
2328 * Select a set implementation based on the data characteristics and the
2329 * given policy. The total memory use might not be known if no size is
2330 * given, in that case the amount of memory per element is used.
2331 */
2332 static const struct nft_set_ops *
2333 nft_select_set_ops(const struct nlattr * const nla[],
2334 const struct nft_set_desc *desc,
2335 enum nft_set_policies policy)
2336 {
2337 const struct nft_set_ops *ops, *bops;
2338 struct nft_set_estimate est, best;
2339 u32 features;
2340
2341 #ifdef CONFIG_MODULES
2342 if (list_empty(&nf_tables_set_ops)) {
2343 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
2344 request_module("nft-set");
2345 nfnl_lock(NFNL_SUBSYS_NFTABLES);
2346 if (!list_empty(&nf_tables_set_ops))
2347 return ERR_PTR(-EAGAIN);
2348 }
2349 #endif
2350 features = 0;
2351 if (nla[NFTA_SET_FLAGS] != NULL) {
2352 features = ntohl(nla_get_be32(nla[NFTA_SET_FLAGS]));
2353 features &= NFT_SET_INTERVAL | NFT_SET_MAP | NFT_SET_TIMEOUT;
2354 }
2355
2356 bops = NULL;
2357 best.size = ~0;
2358 best.class = ~0;
2359
2360 list_for_each_entry(ops, &nf_tables_set_ops, list) {
2361 if ((ops->features & features) != features)
2362 continue;
2363 if (!ops->estimate(desc, features, &est))
2364 continue;
2365
2366 switch (policy) {
2367 case NFT_SET_POL_PERFORMANCE:
2368 if (est.class < best.class)
2369 break;
2370 if (est.class == best.class && est.size < best.size)
2371 break;
2372 continue;
2373 case NFT_SET_POL_MEMORY:
2374 if (est.size < best.size)
2375 break;
2376 if (est.size == best.size && est.class < best.class)
2377 break;
2378 continue;
2379 default:
2380 break;
2381 }
2382
2383 if (!try_module_get(ops->owner))
2384 continue;
2385 if (bops != NULL)
2386 module_put(bops->owner);
2387
2388 bops = ops;
2389 best = est;
2390 }
2391
2392 if (bops != NULL)
2393 return bops;
2394
2395 return ERR_PTR(-EOPNOTSUPP);
2396 }
2397
/*
 * Netlink attribute policy for the NFTA_SET_* attributes.  The set name is
 * limited to NFT_SET_MAXNAMELEN - 1 bytes and the user data blob to
 * NFT_USERDATA_MAXLEN bytes.
 */
2398 static const struct nla_policy nft_set_policy[NFTA_SET_MAX + 1] = {
2399 [NFTA_SET_TABLE] = { .type = NLA_STRING },
2400 [NFTA_SET_NAME] = { .type = NLA_STRING,
2401 .len = NFT_SET_MAXNAMELEN - 1 },
2402 [NFTA_SET_FLAGS] = { .type = NLA_U32 },
2403 [NFTA_SET_KEY_TYPE] = { .type = NLA_U32 },
2404 [NFTA_SET_KEY_LEN] = { .type = NLA_U32 },
2405 [NFTA_SET_DATA_TYPE] = { .type = NLA_U32 },
2406 [NFTA_SET_DATA_LEN] = { .type = NLA_U32 },
2407 [NFTA_SET_POLICY] = { .type = NLA_U32 },
2408 [NFTA_SET_DESC] = { .type = NLA_NESTED },
2409 [NFTA_SET_ID] = { .type = NLA_U32 },
2410 [NFTA_SET_TIMEOUT] = { .type = NLA_U64 },
2411 [NFTA_SET_GC_INTERVAL] = { .type = NLA_U32 },
2412 [NFTA_SET_USERDATA] = { .type = NLA_BINARY,
2413 .len = NFT_USERDATA_MAXLEN },
2414 };
2415
/* Netlink attribute policy for the attributes nested in NFTA_SET_DESC. */
2416 static const struct nla_policy nft_set_desc_policy[NFTA_SET_DESC_MAX + 1] = {
2417 [NFTA_SET_DESC_SIZE] = { .type = NLA_U32 },
2418 };
2419
2420 static int nft_ctx_init_from_setattr(struct nft_ctx *ctx, struct net *net,
2421 const struct sk_buff *skb,
2422 const struct nlmsghdr *nlh,
2423 const struct nlattr * const nla[],
2424 u8 genmask)
2425 {
2426 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
2427 struct nft_af_info *afi = NULL;
2428 struct nft_table *table = NULL;
2429
2430 if (nfmsg->nfgen_family != NFPROTO_UNSPEC) {
2431 afi = nf_tables_afinfo_lookup(net, nfmsg->nfgen_family, false);
2432 if (IS_ERR(afi))
2433 return PTR_ERR(afi);
2434 }
2435
2436 if (nla[NFTA_SET_TABLE] != NULL) {
2437 if (afi == NULL)
2438 return -EAFNOSUPPORT;
2439
2440 table = nf_tables_table_lookup(afi, nla[NFTA_SET_TABLE],
2441 genmask);
2442 if (IS_ERR(table))
2443 return PTR_ERR(table);
2444 }
2445
2446 nft_ctx_init(ctx, net, skb, nlh, afi, table, NULL, nla);
2447 return 0;
2448 }
2449
2450 struct nft_set *nf_tables_set_lookup(const struct nft_table *table,
2451 const struct nlattr *nla, u8 genmask)
2452 {
2453 struct nft_set *set;
2454
2455 if (nla == NULL)
2456 return ERR_PTR(-EINVAL);
2457
2458 list_for_each_entry(set, &table->sets, list) {
2459 if (!nla_strcmp(nla, set->name) &&
2460 nft_active_genmask(set, genmask))
2461 return set;
2462 }
2463 return ERR_PTR(-ENOENT);
2464 }
2465
2466 struct nft_set *nf_tables_set_lookup_byid(const struct net *net,
2467 const struct nlattr *nla,
2468 u8 genmask)
2469 {
2470 struct nft_trans *trans;
2471 u32 id = ntohl(nla_get_be32(nla));
2472
2473 list_for_each_entry(trans, &net->nft.commit_list, list) {
2474 struct nft_set *set = nft_trans_set(trans);
2475
2476 if (trans->msg_type == NFT_MSG_NEWSET &&
2477 id == nft_trans_set_id(trans) &&
2478 nft_active_genmask(set, genmask))
2479 return set;
2480 }
2481 return ERR_PTR(-ENOENT);
2482 }
2483
2484 static int nf_tables_set_alloc_name(struct nft_ctx *ctx, struct nft_set *set,
2485 const char *name)
2486 {
2487 const struct nft_set *i;
2488 const char *p;
2489 unsigned long *inuse;
2490 unsigned int n = 0, min = 0;
2491
2492 p = strnchr(name, NFT_SET_MAXNAMELEN, '%');
2493 if (p != NULL) {
2494 if (p[1] != 'd' || strchr(p + 2, '%'))
2495 return -EINVAL;
2496
2497 inuse = (unsigned long *)get_zeroed_page(GFP_KERNEL);
2498 if (inuse == NULL)
2499 return -ENOMEM;
2500 cont:
2501 list_for_each_entry(i, &ctx->table->sets, list) {
2502 int tmp;
2503
2504 if (!nft_is_active_next(ctx->net, set))
2505 continue;
2506 if (!sscanf(i->name, name, &tmp))
2507 continue;
2508 if (tmp < min || tmp >= min + BITS_PER_BYTE * PAGE_SIZE)
2509 continue;
2510
2511 set_bit(tmp - min, inuse);
2512 }
2513
2514 n = find_first_zero_bit(inuse, BITS_PER_BYTE * PAGE_SIZE);
2515 if (n >= BITS_PER_BYTE * PAGE_SIZE) {
2516 min += BITS_PER_BYTE * PAGE_SIZE;
2517 memset(inuse, 0, PAGE_SIZE);
2518 goto cont;
2519 }
2520 free_page((unsigned long)inuse);
2521 }
2522
2523 snprintf(set->name, sizeof(set->name), name, min + n);
2524 list_for_each_entry(i, &ctx->table->sets, list) {
2525 if (!nft_is_active_next(ctx->net, i))
2526 continue;
2527 if (!strcmp(set->name, i->name))
2528 return -ENFILE;
2529 }
2530 return 0;
2531 }
2532
2533 static int nf_tables_fill_set(struct sk_buff *skb, const struct nft_ctx *ctx,
2534 const struct nft_set *set, u16 event, u16 flags)
2535 {
2536 struct nfgenmsg *nfmsg;
2537 struct nlmsghdr *nlh;
2538 struct nlattr *desc;
2539 u32 portid = ctx->portid;
2540 u32 seq = ctx->seq;
2541
2542 event |= NFNL_SUBSYS_NFTABLES << 8;
2543 nlh = nlmsg_put(skb, portid, seq, event, sizeof(struct nfgenmsg),
2544 flags);
2545 if (nlh == NULL)
2546 goto nla_put_failure;
2547
2548 nfmsg = nlmsg_data(nlh);
2549 nfmsg->nfgen_family = ctx->afi->family;
2550 nfmsg->version = NFNETLINK_V0;
2551 nfmsg->res_id = htons(ctx->net->nft.base_seq & 0xffff);
2552
2553 if (nla_put_string(skb, NFTA_SET_TABLE, ctx->table->name))
2554 goto nla_put_failure;
2555 if (nla_put_string(skb, NFTA_SET_NAME, set->name))
2556 goto nla_put_failure;
2557 if (set->flags != 0)
2558 if (nla_put_be32(skb, NFTA_SET_FLAGS, htonl(set->flags)))
2559 goto nla_put_failure;
2560
2561 if (nla_put_be32(skb, NFTA_SET_KEY_TYPE, htonl(set->ktype)))
2562 goto nla_put_failure;
2563 if (nla_put_be32(skb, NFTA_SET_KEY_LEN, htonl(set->klen)))
2564 goto nla_put_failure;
2565 if (set->flags & NFT_SET_MAP) {
2566 if (nla_put_be32(skb, NFTA_SET_DATA_TYPE, htonl(set->dtype)))
2567 goto nla_put_failure;
2568 if (nla_put_be32(skb, NFTA_SET_DATA_LEN, htonl(set->dlen)))
2569 goto nla_put_failure;
2570 }
2571
2572 if (set->timeout &&
2573 nla_put_be64(skb, NFTA_SET_TIMEOUT, cpu_to_be64(set->timeout),
2574 NFTA_SET_PAD))
2575 goto nla_put_failure;
2576 if (set->gc_int &&
2577 nla_put_be32(skb, NFTA_SET_GC_INTERVAL, htonl(set->gc_int)))
2578 goto nla_put_failure;
2579
2580 if (set->policy != NFT_SET_POL_PERFORMANCE) {
2581 if (nla_put_be32(skb, NFTA_SET_POLICY, htonl(set->policy)))
2582 goto nla_put_failure;
2583 }
2584
2585 if (nla_put(skb, NFTA_SET_USERDATA, set->udlen, set->udata))
2586 goto nla_put_failure;
2587
2588 desc = nla_nest_start(skb, NFTA_SET_DESC);
2589 if (desc == NULL)
2590 goto nla_put_failure;
2591 if (set->size &&
2592 nla_put_be32(skb, NFTA_SET_DESC_SIZE, htonl(set->size)))
2593 goto nla_put_failure;
2594 nla_nest_end(skb, desc);
2595
2596 nlmsg_end(skb, nlh);
2597 return 0;
2598
2599 nla_put_failure:
2600 nlmsg_trim(skb, nlh);
2601 return -1;
2602 }
2603
2604 static int nf_tables_set_notify(const struct nft_ctx *ctx,
2605 const struct nft_set *set,
2606 int event, gfp_t gfp_flags)
2607 {
2608 struct sk_buff *skb;
2609 u32 portid = ctx->portid;
2610 int err;
2611
2612 if (!ctx->report &&
2613 !nfnetlink_has_listeners(ctx->net, NFNLGRP_NFTABLES))
2614 return 0;
2615
2616 err = -ENOBUFS;
2617 skb = nlmsg_new(NLMSG_GOODSIZE, gfp_flags);
2618 if (skb == NULL)
2619 goto err;
2620
2621 err = nf_tables_fill_set(skb, ctx, set, event, 0);
2622 if (err < 0) {
2623 kfree_skb(skb);
2624 goto err;
2625 }
2626
2627 err = nfnetlink_send(skb, ctx->net, portid, NFNLGRP_NFTABLES,
2628 ctx->report, gfp_flags);
2629 err:
2630 if (err < 0)
2631 nfnetlink_set_err(ctx->net, portid, NFNLGRP_NFTABLES, err);
2632 return err;
2633 }
2634
/*
 * Netlink dump callback emitting one NFT_MSG_NEWSET message per active set.
 *
 * cb->data holds an nft_ctx that optionally restricts the dump to one
 * address family and/or one table.  Resume state is kept in cb->args:
 *
 *   args[0]  index of the set at which filling @skb failed
 *   args[1]  non-zero once the whole dump has completed
 *   args[2]  table that was being dumped when @skb filled up
 *   args[3]  address family that was being dumped when @skb filled up
 *
 * Returns skb->len in all cases.
 */
2635 static int nf_tables_dump_sets(struct sk_buff *skb, struct netlink_callback *cb)
2636 {
2637 const struct nft_set *set;
2638 unsigned int idx, s_idx = cb->args[0];
2639 struct nft_af_info *afi;
2640 struct nft_table *table, *cur_table = (struct nft_table *)cb->args[2];
2641 struct net *net = sock_net(skb->sk);
2642 int cur_family = cb->args[3];
2643 struct nft_ctx *ctx = cb->data, ctx_set;
2644
/* A previous invocation already finished the dump. */
2645 if (cb->args[1])
2646 return skb->len;
2647
2648 rcu_read_lock();
2649 cb->seq = net->nft.base_seq;
2650
2651 list_for_each_entry_rcu(afi, &net->nft.af_info, list) {
2652 if (ctx->afi && ctx->afi != afi)
2653 continue;
2654
/* When resuming, skip families until the saved one is reached. */
2655 if (cur_family) {
2656 if (afi->family != cur_family)
2657 continue;
2658
2659 cur_family = 0;
2660 }
2661 list_for_each_entry_rcu(table, &afi->tables, list) {
2662 if (ctx->table && ctx->table != table)
2663 continue;
2664
/* When resuming, skip tables until the saved one is reached. */
2665 if (cur_table) {
2666 if (cur_table != table)
2667 continue;
2668
2669 cur_table = NULL;
2670 }
2671 idx = 0;
2672 list_for_each_entry_rcu(set, &table->sets, list) {
2673 if (idx < s_idx)
2674 goto cont;
2675 if (!nft_is_active(net, set))
2676 goto cont;
2677
/* Fill with a copy of the context pointing at this table/family. */
2678 ctx_set = *ctx;
2679 ctx_set.table = table;
2680 ctx_set.afi = afi;
2681 if (nf_tables_fill_set(skb, &ctx_set, set,
2682 NFT_MSG_NEWSET,
2683 NLM_F_MULTI) < 0) {
/* Remember where to resume on the next invocation. */
2684 cb->args[0] = idx;
2685 cb->args[2] = (unsigned long) table;
2686 cb->args[3] = afi->family;
2687 goto done;
2688 }
2689 nl_dump_check_consistent(cb, nlmsg_hdr(skb));
2690 cont:
2691 idx++;
2692 }
/* The saved start index only applies to the first table visited. */
2693 if (s_idx)
2694 s_idx = 0;
2695 }
2696 }
2697 cb->args[1] = 1;
2698 done:
2699 rcu_read_unlock();
2700 return skb->len;
2701 }
2702
/*
 * Dump completion callback: frees the context copy stored in cb->data
 * (allocated by nf_tables_getset() when the dump was started).
 */
2703 static int nf_tables_dump_sets_done(struct netlink_callback *cb)
2704 {
2705 kfree(cb->data);
2706 return 0;
2707 }
2708
2709 static int nf_tables_getset(struct net *net, struct sock *nlsk,
2710 struct sk_buff *skb, const struct nlmsghdr *nlh,
2711 const struct nlattr * const nla[])
2712 {
2713 u8 genmask = nft_genmask_cur(net);
2714 const struct nft_set *set;
2715 struct nft_ctx ctx;
2716 struct sk_buff *skb2;
2717 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
2718 int err;
2719
2720 /* Verify existence before starting dump */
2721 err = nft_ctx_init_from_setattr(&ctx, net, skb, nlh, nla, genmask);
2722 if (err < 0)
2723 return err;
2724
2725 if (nlh->nlmsg_flags & NLM_F_DUMP) {
2726 struct netlink_dump_control c = {
2727 .dump = nf_tables_dump_sets,
2728 .done = nf_tables_dump_sets_done,
2729 };
2730 struct nft_ctx *ctx_dump;
2731
2732 ctx_dump = kmalloc(sizeof(*ctx_dump), GFP_KERNEL);
2733 if (ctx_dump == NULL)
2734 return -ENOMEM;
2735
2736 *ctx_dump = ctx;
2737 c.data = ctx_dump;
2738
2739 return netlink_dump_start(nlsk, skb, nlh, &c);
2740 }
2741
2742 /* Only accept unspec with dump */
2743 if (nfmsg->nfgen_family == NFPROTO_UNSPEC)
2744 return -EAFNOSUPPORT;
2745 if (!nla[NFTA_SET_TABLE])
2746 return -EINVAL;
2747
2748 set = nf_tables_set_lookup(ctx.table, nla[NFTA_SET_NAME], genmask);
2749 if (IS_ERR(set))
2750 return PTR_ERR(set);
2751
2752 skb2 = alloc_skb(NLMSG_GOODSIZE, GFP_KERNEL);
2753 if (skb2 == NULL)
2754 return -ENOMEM;
2755
2756 err = nf_tables_fill_set(skb2, &ctx, set, NFT_MSG_NEWSET, 0);
2757 if (err < 0)
2758 goto err;
2759
2760 return nlmsg_unicast(nlsk, skb2, NETLINK_CB(skb).portid);
2761
2762 err:
2763 kfree_skb(skb2);
2764 return err;
2765 }
2766
2767 static int nf_tables_set_desc_parse(const struct nft_ctx *ctx,
2768 struct nft_set_desc *desc,
2769 const struct nlattr *nla)
2770 {
2771 struct nlattr *da[NFTA_SET_DESC_MAX + 1];
2772 int err;
2773
2774 err = nla_parse_nested(da, NFTA_SET_DESC_MAX, nla, nft_set_desc_policy);
2775 if (err < 0)
2776 return err;
2777
2778 if (da[NFTA_SET_DESC_SIZE] != NULL)
2779 desc->size = ntohl(nla_get_be32(da[NFTA_SET_DESC_SIZE]));
2780
2781 return 0;
2782 }
2783
/*
 * Handler for NFT_MSG_NEWSET: validate the request, pick a set backend,
 * allocate and initialise the set and queue it on the transaction list.
 *
 * Table, name, key length and set id attributes are mandatory.  If a set of
 * that name already exists the request succeeds without changes unless
 * NLM_F_EXCL (-EEXIST) or NLM_F_REPLACE (-EOPNOTSUPP) is given.  Creating a
 * set requires NLM_F_CREATE.
 *
 * Returns 0 on success or a negative errno.
 */
2784 static int nf_tables_newset(struct net *net, struct sock *nlsk,
2785 struct sk_buff *skb, const struct nlmsghdr *nlh,
2786 const struct nlattr * const nla[])
2787 {
2788 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
2789 u8 genmask = nft_genmask_next(net);
2790 const struct nft_set_ops *ops;
2791 struct nft_af_info *afi;
2792 struct nft_table *table;
2793 struct nft_set *set;
2794 struct nft_ctx ctx;
2795 char name[NFT_SET_MAXNAMELEN];
2796 unsigned int size;
2797 bool create;
2798 u64 timeout;
2799 u32 ktype, dtype, flags, policy, gc_int;
2800 struct nft_set_desc desc;
2801 unsigned char *udata;
2802 u16 udlen;
2803 int err;
2804
2805 if (nla[NFTA_SET_TABLE] == NULL ||
2806 nla[NFTA_SET_NAME] == NULL ||
2807 nla[NFTA_SET_KEY_LEN] == NULL ||
2808 nla[NFTA_SET_ID] == NULL)
2809 return -EINVAL;
2810
2811 memset(&desc, 0, sizeof(desc));
2812
/* Key type defaults to a plain value; reserved types are rejected. */
2813 ktype = NFT_DATA_VALUE;
2814 if (nla[NFTA_SET_KEY_TYPE] != NULL) {
2815 ktype = ntohl(nla_get_be32(nla[NFTA_SET_KEY_TYPE]));
2816 if ((ktype & NFT_DATA_RESERVED_MASK) == NFT_DATA_RESERVED_MASK)
2817 return -EINVAL;
2818 }
2819
2820 desc.klen = ntohl(nla_get_be32(nla[NFTA_SET_KEY_LEN]));
2821 if (desc.klen == 0 || desc.klen > NFT_DATA_VALUE_MAXLEN)
2822 return -EINVAL;
2823
2824 flags = 0;
2825 if (nla[NFTA_SET_FLAGS] != NULL) {
2826 flags = ntohl(nla_get_be32(nla[NFTA_SET_FLAGS]));
2827 if (flags & ~(NFT_SET_ANONYMOUS | NFT_SET_CONSTANT |
2828 NFT_SET_INTERVAL | NFT_SET_TIMEOUT |
2829 NFT_SET_MAP | NFT_SET_EVAL))
2830 return -EINVAL;
2831 /* Only one of both operations is supported */
2832 if ((flags & (NFT_SET_MAP | NFT_SET_EVAL)) ==
2833 (NFT_SET_MAP | NFT_SET_EVAL))
2834 return -EOPNOTSUPP;
2835 }
2836
/*
 * A data type is only valid for maps, and a map must specify one.
 * Verdict data has a fixed length; any other type needs an explicit,
 * bounded NFTA_SET_DATA_LEN.
 */
2837 dtype = 0;
2838 if (nla[NFTA_SET_DATA_TYPE] != NULL) {
2839 if (!(flags & NFT_SET_MAP))
2840 return -EINVAL;
2841
2842 dtype = ntohl(nla_get_be32(nla[NFTA_SET_DATA_TYPE]));
2843 if ((dtype & NFT_DATA_RESERVED_MASK) == NFT_DATA_RESERVED_MASK &&
2844 dtype != NFT_DATA_VERDICT)
2845 return -EINVAL;
2846
2847 if (dtype != NFT_DATA_VERDICT) {
2848 if (nla[NFTA_SET_DATA_LEN] == NULL)
2849 return -EINVAL;
2850 desc.dlen = ntohl(nla_get_be32(nla[NFTA_SET_DATA_LEN]));
2851 if (desc.dlen == 0 || desc.dlen > NFT_DATA_VALUE_MAXLEN)
2852 return -EINVAL;
2853 } else
2854 desc.dlen = sizeof(struct nft_verdict);
2855 } else if (flags & NFT_SET_MAP)
2856 return -EINVAL;
2857
/* Timeout and GC interval are only accepted for NFT_SET_TIMEOUT sets. */
2858 timeout = 0;
2859 if (nla[NFTA_SET_TIMEOUT] != NULL) {
2860 if (!(flags & NFT_SET_TIMEOUT))
2861 return -EINVAL;
2862 timeout = be64_to_cpu(nla_get_be64(nla[NFTA_SET_TIMEOUT]));
2863 }
2864 gc_int = 0;
2865 if (nla[NFTA_SET_GC_INTERVAL] != NULL) {
2866 if (!(flags & NFT_SET_TIMEOUT))
2867 return -EINVAL;
2868 gc_int = ntohl(nla_get_be32(nla[NFTA_SET_GC_INTERVAL]));
2869 }
2870
2871 policy = NFT_SET_POL_PERFORMANCE;
2872 if (nla[NFTA_SET_POLICY] != NULL)
2873 policy = ntohl(nla_get_be32(nla[NFTA_SET_POLICY]));
2874
/*
 * NOTE(review): ctx has not been initialised yet at this point;
 * nf_tables_set_desc_parse() does not read it.
 */
2875 if (nla[NFTA_SET_DESC] != NULL) {
2876 err = nf_tables_set_desc_parse(&ctx, &desc, nla[NFTA_SET_DESC]);
2877 if (err < 0)
2878 return err;
2879 }
2880
2881 create = nlh->nlmsg_flags & NLM_F_CREATE ? true : false;
2882
2883 afi = nf_tables_afinfo_lookup(net, nfmsg->nfgen_family, create);
2884 if (IS_ERR(afi))
2885 return PTR_ERR(afi);
2886
2887 table = nf_tables_table_lookup(afi, nla[NFTA_SET_TABLE], genmask);
2888 if (IS_ERR(table))
2889 return PTR_ERR(table);
2890
2891 nft_ctx_init(&ctx, net, skb, nlh, afi, table, NULL, nla);
2892
/* -ENOENT simply means the set has to be created. */
2893 set = nf_tables_set_lookup(table, nla[NFTA_SET_NAME], genmask);
2894 if (IS_ERR(set)) {
2895 if (PTR_ERR(set) != -ENOENT)
2896 return PTR_ERR(set);
2897 set = NULL;
2898 }
2899
2900 if (set != NULL) {
2901 if (nlh->nlmsg_flags & NLM_F_EXCL)
2902 return -EEXIST;
2903 if (nlh->nlmsg_flags & NLM_F_REPLACE)
2904 return -EOPNOTSUPP;
2905 return 0;
2906 }
2907
2908 if (!(nlh->nlmsg_flags & NLM_F_CREATE))
2909 return -ENOENT;
2910
/* On success a module reference is held on ops; err1 drops it. */
2911 ops = nft_select_set_ops(nla, &desc, policy);
2912 if (IS_ERR(ops))
2913 return PTR_ERR(ops);
2914
2915 udlen = 0;
2916 if (nla[NFTA_SET_USERDATA])
2917 udlen = nla_len(nla[NFTA_SET_USERDATA]);
2918
2919 size = 0;
2920 if (ops->privsize != NULL)
2921 size = ops->privsize(nla);
2922
/* One allocation: set header, backend private area, then user data. */
2923 err = -ENOMEM;
2924 set = kzalloc(sizeof(*set) + size + udlen, GFP_KERNEL);
2925 if (set == NULL)
2926 goto err1;
2927
2928 nla_strlcpy(name, nla[NFTA_SET_NAME], sizeof(set->name));
2929 err = nf_tables_set_alloc_name(&ctx, set, name);
2930 if (err < 0)
2931 goto err2;
2932
/* User data is stored right behind the backend's private area. */
2933 udata = NULL;
2934 if (udlen) {
2935 udata = set->data + size;
2936 nla_memcpy(udata, nla[NFTA_SET_USERDATA], udlen);
2937 }
2938
2939 INIT_LIST_HEAD(&set->bindings);
2940 set->ops = ops;
2941 set->ktype = ktype;
2942 set->klen = desc.klen;
2943 set->dtype = dtype;
2944 set->dlen = desc.dlen;
2945 set->flags = flags;
2946 set->size = desc.size;
2947 set->policy = policy;
2948 set->udlen = udlen;
2949 set->udata = udata;
2950 set->timeout = timeout;
2951 set->gc_int = gc_int;
2952
2953 err = ops->init(set, &desc, nla);
2954 if (err < 0)
2955 goto err2;
2956
2957 err = nft_trans_set_add(&ctx, NFT_MSG_NEWSET, set);
2958 if (err < 0)
2959 goto err3;
2960
2961 list_add_tail_rcu(&set->list, &table->sets);
2962 table->use++;
2963 return 0;
2964
/* Unwind in reverse order of setup. */
2965 err3:
2966 ops->destroy(set);
2967 err2:
2968 kfree(set);
2969 err1:
2970 module_put(ops->owner);
2971 return err;
2972 }
2973
/*
 * Release a set: let the backend tear down its state, drop the module
 * reference on the backend and free the set memory.
 */
2974 static void nft_set_destroy(struct nft_set *set)
2975 {
2976 set->ops->destroy(set);
2977 module_put(set->ops->owner);
2978 kfree(set);
2979 }
2980
/*
 * Unlink @set from its list, emit an NFT_MSG_DELSET notification (allocated
 * with GFP_ATOMIC) and release the set.
 */
2981 static void nf_tables_set_destroy(const struct nft_ctx *ctx, struct nft_set *set)
2982 {
2983 list_del_rcu(&set->list);
2984 nf_tables_set_notify(ctx, set, NFT_MSG_DELSET, GFP_ATOMIC);
2985 nft_set_destroy(set);
2986 }
2987
2988 static int nf_tables_delset(struct net *net, struct sock *nlsk,
2989 struct sk_buff *skb, const struct nlmsghdr *nlh,
2990 const struct nlattr * const nla[])
2991 {
2992 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
2993 u8 genmask = nft_genmask_next(net);
2994 struct nft_set *set;
2995 struct nft_ctx ctx;
2996 int err;
2997
2998 if (nfmsg->nfgen_family == NFPROTO_UNSPEC)
2999 return -EAFNOSUPPORT;
3000 if (nla[NFTA_SET_TABLE] == NULL)
3001 return -EINVAL;
3002
3003 err = nft_ctx_init_from_setattr(&ctx, net, skb, nlh, nla, genmask);
3004 if (err < 0)
3005 return err;
3006
3007 set = nf_tables_set_lookup(ctx.table, nla[NFTA_SET_NAME], genmask);
3008 if (IS_ERR(set))
3009 return PTR_ERR(set);
3010 if (!list_empty(&set->bindings))
3011 return -EBUSY;
3012
3013 return nft_delset(&ctx, set);
3014 }
3015
3016 static int nf_tables_bind_check_setelem(const struct nft_ctx *ctx,
3017 const struct nft_set *set,
3018 const struct nft_set_iter *iter,
3019 const struct nft_set_elem *elem)
3020 {
3021 const struct nft_set_ext *ext = nft_set_elem_ext(set, elem->priv);
3022 enum nft_registers dreg;
3023
3024 dreg = nft_type_to_reg(set->dtype);
3025 return nft_validate_register_store(ctx, dreg, nft_set_ext_data(ext),
3026 set->dtype == NFT_DATA_VERDICT ?
3027 NFT_DATA_VERDICT : NFT_DATA_VALUE,
3028 set->dlen);
3029 }
3030
3031 int nf_tables_bind_set(const struct nft_ctx *ctx, struct nft_set *set,
3032 struct nft_set_binding *binding)
3033 {
3034 struct nft_set_binding *i;
3035 struct nft_set_iter iter;
3036
3037 if (!list_empty(&set->bindings) && set->flags & NFT_SET_ANONYMOUS)
3038 return -EBUSY;
3039
3040 if (binding->flags & NFT_SET_MAP) {
3041 /* If the set is already bound to the same chain all
3042 * jumps are already validated for that chain.
3043 */
3044 list_for_each_entry(i, &set->bindings, list) {
3045 if (i->flags & NFT_SET_MAP &&
3046 i->chain == binding->chain)
3047 goto bind;
3048 }
3049
3050 iter.genmask = nft_genmask_next(ctx->net);
3051 iter.skip = 0;
3052 iter.count = 0;
3053 iter.err = 0;
3054 iter.fn = nf_tables_bind_check_setelem;
3055
3056 set->ops->walk(ctx, set, &iter);
3057 if (iter.err < 0)
3058 return iter.err;
3059 }
3060 bind:
3061 binding->chain = ctx->chain;
3062 list_add_tail_rcu(&binding->list, &set->bindings);
3063 return 0;
3064 }
3065
3066 void nf_tables_unbind_set(const struct nft_ctx *ctx, struct nft_set *set,
3067 struct nft_set_binding *binding)
3068 {
3069 list_del_rcu(&binding->list);
3070
3071 if (list_empty(&set->bindings) && set->flags & NFT_SET_ANONYMOUS &&
3072 nft_is_active(ctx->net, set))
3073 nf_tables_set_destroy(ctx, set);
3074 }
3075
/*
 * Per-extension layout information for set elements, indexed by
 * NFT_SET_EXT_*.  Entries without an explicit .len (key, data, expr) are
 * zero-initialised there; nft_add_set_elem() sizes the key and data
 * extensions via nft_set_ext_add_length().
 */
3076 const struct nft_set_ext_type nft_set_ext_types[] = {
3077 [NFT_SET_EXT_KEY] = {
3078 .align = __alignof__(u32),
3079 },
3080 [NFT_SET_EXT_DATA] = {
3081 .align = __alignof__(u32),
3082 },
3083 [NFT_SET_EXT_EXPR] = {
3084 .align = __alignof__(struct nft_expr),
3085 },
3086 [NFT_SET_EXT_FLAGS] = {
3087 .len = sizeof(u8),
3088 .align = __alignof__(u8),
3089 },
3090 [NFT_SET_EXT_TIMEOUT] = {
3091 .len = sizeof(u64),
3092 .align = __alignof__(u64),
3093 },
3094 [NFT_SET_EXT_EXPIRATION] = {
3095 .len = sizeof(unsigned long),
3096 .align = __alignof__(unsigned long),
3097 },
3098 [NFT_SET_EXT_USERDATA] = {
3099 .len = sizeof(struct nft_userdata),
3100 .align = __alignof__(struct nft_userdata),
3101 },
3102 };
3103 EXPORT_SYMBOL_GPL(nft_set_ext_types);
3104
3105 /*
3106 * Set elements
3107 */
3108
/*
 * Netlink attribute policy for a single set element (NFTA_SET_ELEM_*).
 * The user data blob is limited to NFT_USERDATA_MAXLEN bytes.
 */
3109 static const struct nla_policy nft_set_elem_policy[NFTA_SET_ELEM_MAX + 1] = {
3110 [NFTA_SET_ELEM_KEY] = { .type = NLA_NESTED },
3111 [NFTA_SET_ELEM_DATA] = { .type = NLA_NESTED },
3112 [NFTA_SET_ELEM_FLAGS] = { .type = NLA_U32 },
3113 [NFTA_SET_ELEM_TIMEOUT] = { .type = NLA_U64 },
3114 [NFTA_SET_ELEM_USERDATA] = { .type = NLA_BINARY,
3115 .len = NFT_USERDATA_MAXLEN },
3116 };
3117
/* Netlink attribute policy for set element list messages (NFTA_SET_ELEM_LIST_*). */
3118 static const struct nla_policy nft_set_elem_list_policy[NFTA_SET_ELEM_LIST_MAX + 1] = {
3119 [NFTA_SET_ELEM_LIST_TABLE] = { .type = NLA_STRING },
3120 [NFTA_SET_ELEM_LIST_SET] = { .type = NLA_STRING },
3121 [NFTA_SET_ELEM_LIST_ELEMENTS] = { .type = NLA_NESTED },
3122 [NFTA_SET_ELEM_LIST_SET_ID] = { .type = NLA_U32 },
3123 };
3124
3125 static int nft_ctx_init_from_elemattr(struct nft_ctx *ctx, struct net *net,
3126 const struct sk_buff *skb,
3127 const struct nlmsghdr *nlh,
3128 const struct nlattr * const nla[],
3129 u8 genmask)
3130 {
3131 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
3132 struct nft_af_info *afi;
3133 struct nft_table *table;
3134
3135 afi = nf_tables_afinfo_lookup(net, nfmsg->nfgen_family, false);
3136 if (IS_ERR(afi))
3137 return PTR_ERR(afi);
3138
3139 table = nf_tables_table_lookup(afi, nla[NFTA_SET_ELEM_LIST_TABLE],
3140 genmask);
3141 if (IS_ERR(table))
3142 return PTR_ERR(table);
3143
3144 nft_ctx_init(ctx, net, skb, nlh, afi, table, NULL, nla);
3145 return 0;
3146 }
3147
3148 static int nf_tables_fill_setelem(struct sk_buff *skb,
3149 const struct nft_set *set,
3150 const struct nft_set_elem *elem)
3151 {
3152 const struct nft_set_ext *ext = nft_set_elem_ext(set, elem->priv);
3153 unsigned char *b = skb_tail_pointer(skb);
3154 struct nlattr *nest;
3155
3156 nest = nla_nest_start(skb, NFTA_LIST_ELEM);
3157 if (nest == NULL)
3158 goto nla_put_failure;
3159
3160 if (nft_data_dump(skb, NFTA_SET_ELEM_KEY, nft_set_ext_key(ext),
3161 NFT_DATA_VALUE, set->klen) < 0)
3162 goto nla_put_failure;
3163
3164 if (nft_set_ext_exists(ext, NFT_SET_EXT_DATA) &&
3165 nft_data_dump(skb, NFTA_SET_ELEM_DATA, nft_set_ext_data(ext),
3166 set->dtype == NFT_DATA_VERDICT ? NFT_DATA_VERDICT : NFT_DATA_VALUE,
3167 set->dlen) < 0)
3168 goto nla_put_failure;
3169
3170 if (nft_set_ext_exists(ext, NFT_SET_EXT_EXPR) &&
3171 nft_expr_dump(skb, NFTA_SET_ELEM_EXPR, nft_set_ext_expr(ext)) < 0)
3172 goto nla_put_failure;
3173
3174 if (nft_set_ext_exists(ext, NFT_SET_EXT_FLAGS) &&
3175 nla_put_be32(skb, NFTA_SET_ELEM_FLAGS,
3176 htonl(*nft_set_ext_flags(ext))))
3177 goto nla_put_failure;
3178
3179 if (nft_set_ext_exists(ext, NFT_SET_EXT_TIMEOUT) &&
3180 nla_put_be64(skb, NFTA_SET_ELEM_TIMEOUT,
3181 cpu_to_be64(*nft_set_ext_timeout(ext)),
3182 NFTA_SET_ELEM_PAD))
3183 goto nla_put_failure;
3184
3185 if (nft_set_ext_exists(ext, NFT_SET_EXT_EXPIRATION)) {
3186 unsigned long expires, now = jiffies;
3187
3188 expires = *nft_set_ext_expiration(ext);
3189 if (time_before(now, expires))
3190 expires -= now;
3191 else
3192 expires = 0;
3193
3194 if (nla_put_be64(skb, NFTA_SET_ELEM_EXPIRATION,
3195 cpu_to_be64(jiffies_to_msecs(expires)),
3196 NFTA_SET_ELEM_PAD))
3197 goto nla_put_failure;
3198 }
3199
3200 if (nft_set_ext_exists(ext, NFT_SET_EXT_USERDATA)) {
3201 struct nft_userdata *udata;
3202
3203 udata = nft_set_ext_userdata(ext);
3204 if (nla_put(skb, NFTA_SET_ELEM_USERDATA,
3205 udata->len + 1, udata->data))
3206 goto nla_put_failure;
3207 }
3208
3209 nla_nest_end(skb, nest);
3210 return 0;
3211
3212 nla_put_failure:
3213 nlmsg_trim(skb, b);
3214 return -EMSGSIZE;
3215 }
3216
/*
 * State for dumping the elements of a set.  The iterator is embedded so
 * that the walk callback can recover this structure from the iterator
 * pointer via container_of().
 */
3217 struct nft_set_dump_args {
3218 const struct netlink_callback *cb;
3219 struct nft_set_iter iter;
3220 struct sk_buff *skb;
3221 };
3222
3223 static int nf_tables_dump_setelem(const struct nft_ctx *ctx,
3224 const struct nft_set *set,
3225 const struct nft_set_iter *iter,
3226 const struct nft_set_elem *elem)
3227 {
3228 struct nft_set_dump_args *args;
3229
3230 args = container_of(iter, struct nft_set_dump_args, iter);
3231 return nf_tables_fill_setelem(args->skb, set, elem);
3232 }
3233
3234 static int nf_tables_dump_set(struct sk_buff *skb, struct netlink_callback *cb)
3235 {
3236 struct net *net = sock_net(skb->sk);
3237 u8 genmask = nft_genmask_cur(net);
3238 const struct nft_set *set;
3239 struct nft_set_dump_args args;
3240 struct nft_ctx ctx;
3241 struct nlattr *nla[NFTA_SET_ELEM_LIST_MAX + 1];
3242 struct nfgenmsg *nfmsg;
3243 struct nlmsghdr *nlh;
3244 struct nlattr *nest;
3245 u32 portid, seq;
3246 int event, err;
3247
3248 err = nlmsg_parse(cb->nlh, sizeof(struct nfgenmsg), nla,
3249 NFTA_SET_ELEM_LIST_MAX, nft_set_elem_list_policy);
3250 if (err < 0)
3251 return err;
3252
3253 err = nft_ctx_init_from_elemattr(&ctx, net, cb->skb, cb->nlh,
3254 (void *)nla, genmask);
3255 if (err < 0)
3256 return err;
3257
3258 set = nf_tables_set_lookup(ctx.table, nla[NFTA_SET_ELEM_LIST_SET],
3259 genmask);
3260 if (IS_ERR(set))
3261 return PTR_ERR(set);
3262
3263 event = NFT_MSG_NEWSETELEM;
3264 event |= NFNL_SUBSYS_NFTABLES << 8;
3265 portid = NETLINK_CB(cb->skb).portid;
3266 seq = cb->nlh->nlmsg_seq;
3267
3268 nlh = nlmsg_put(skb, portid, seq, event, sizeof(struct nfgenmsg),
3269 NLM_F_MULTI);
3270 if (nlh == NULL)
3271 goto nla_put_failure;
3272
3273 nfmsg = nlmsg_data(nlh);
3274 nfmsg->nfgen_family = ctx.afi->family;
3275 nfmsg->version = NFNETLINK_V0;
3276 nfmsg->res_id = htons(ctx.net->nft.base_seq & 0xffff);
3277
3278 if (nla_put_string(skb, NFTA_SET_ELEM_LIST_TABLE, ctx.table->name))
3279 goto nla_put_failure;
3280 if (nla_put_string(skb, NFTA_SET_ELEM_LIST_SET, set->name))
3281 goto nla_put_failure;
3282
3283 nest = nla_nest_start(skb, NFTA_SET_ELEM_LIST_ELEMENTS);
3284 if (nest == NULL)
3285 goto nla_put_failure;
3286
3287 args.cb = cb;
3288 args.skb = skb;
3289 args.iter.genmask = nft_genmask_cur(ctx.net);
3290 args.iter.skip = cb->args[0];
3291 args.iter.count = 0;
3292 args.iter.err = 0;
3293 args.iter.fn = nf_tables_dump_setelem;
3294 set->ops->walk(&ctx, set, &args.iter);
3295
3296 nla_nest_end(skb, nest);
3297 nlmsg_end(skb, nlh);
3298
3299 if (args.iter.err && args.iter.err != -EMSGSIZE)
3300 return args.iter.err;
3301 if (args.iter.count == cb->args[0])
3302 return 0;
3303
3304 cb->args[0] = args.iter.count;
3305 return skb->len;
3306
3307 nla_put_failure:
3308 return -ENOSPC;
3309 }
3310
3311 static int nf_tables_getsetelem(struct net *net, struct sock *nlsk,
3312 struct sk_buff *skb, const struct nlmsghdr *nlh,
3313 const struct nlattr * const nla[])
3314 {
3315 u8 genmask = nft_genmask_cur(net);
3316 const struct nft_set *set;
3317 struct nft_ctx ctx;
3318 int err;
3319
3320 err = nft_ctx_init_from_elemattr(&ctx, net, skb, nlh, nla, genmask);
3321 if (err < 0)
3322 return err;
3323
3324 set = nf_tables_set_lookup(ctx.table, nla[NFTA_SET_ELEM_LIST_SET],
3325 genmask);
3326 if (IS_ERR(set))
3327 return PTR_ERR(set);
3328
3329 if (nlh->nlmsg_flags & NLM_F_DUMP) {
3330 struct netlink_dump_control c = {
3331 .dump = nf_tables_dump_set,
3332 };
3333 return netlink_dump_start(nlsk, skb, nlh, &c);
3334 }
3335 return -EOPNOTSUPP;
3336 }
3337
3338 static int nf_tables_fill_setelem_info(struct sk_buff *skb,
3339 const struct nft_ctx *ctx, u32 seq,
3340 u32 portid, int event, u16 flags,
3341 const struct nft_set *set,
3342 const struct nft_set_elem *elem)
3343 {
3344 struct nfgenmsg *nfmsg;
3345 struct nlmsghdr *nlh;
3346 struct nlattr *nest;
3347 int err;
3348
3349 event |= NFNL_SUBSYS_NFTABLES << 8;
3350 nlh = nlmsg_put(skb, portid, seq, event, sizeof(struct nfgenmsg),
3351 flags);
3352 if (nlh == NULL)
3353 goto nla_put_failure;
3354
3355 nfmsg = nlmsg_data(nlh);
3356 nfmsg->nfgen_family = ctx->afi->family;
3357 nfmsg->version = NFNETLINK_V0;
3358 nfmsg->res_id = htons(ctx->net->nft.base_seq & 0xffff);
3359
3360 if (nla_put_string(skb, NFTA_SET_TABLE, ctx->table->name))
3361 goto nla_put_failure;
3362 if (nla_put_string(skb, NFTA_SET_NAME, set->name))
3363 goto nla_put_failure;
3364
3365 nest = nla_nest_start(skb, NFTA_SET_ELEM_LIST_ELEMENTS);
3366 if (nest == NULL)
3367 goto nla_put_failure;
3368
3369 err = nf_tables_fill_setelem(skb, set, elem);
3370 if (err < 0)
3371 goto nla_put_failure;
3372
3373 nla_nest_end(skb, nest);
3374
3375 nlmsg_end(skb, nlh);
3376 return 0;
3377
3378 nla_put_failure:
3379 nlmsg_trim(skb, nlh);
3380 return -1;
3381 }
3382
3383 static int nf_tables_setelem_notify(const struct nft_ctx *ctx,
3384 const struct nft_set *set,
3385 const struct nft_set_elem *elem,
3386 int event, u16 flags)
3387 {
3388 struct net *net = ctx->net;
3389 u32 portid = ctx->portid;
3390 struct sk_buff *skb;
3391 int err;
3392
3393 if (!ctx->report && !nfnetlink_has_listeners(net, NFNLGRP_NFTABLES))
3394 return 0;
3395
3396 err = -ENOBUFS;
3397 skb = nlmsg_new(NLMSG_GOODSIZE, GFP_KERNEL);
3398 if (skb == NULL)
3399 goto err;
3400
3401 err = nf_tables_fill_setelem_info(skb, ctx, 0, portid, event, flags,
3402 set, elem);
3403 if (err < 0) {
3404 kfree_skb(skb);
3405 goto err;
3406 }
3407
3408 err = nfnetlink_send(skb, net, portid, NFNLGRP_NFTABLES, ctx->report,
3409 GFP_KERNEL);
3410 err:
3411 if (err < 0)
3412 nfnetlink_set_err(net, portid, NFNLGRP_NFTABLES, err);
3413 return err;
3414 }
3415
3416 static struct nft_trans *nft_trans_elem_alloc(struct nft_ctx *ctx,
3417 int msg_type,
3418 struct nft_set *set)
3419 {
3420 struct nft_trans *trans;
3421
3422 trans = nft_trans_alloc(ctx, msg_type, sizeof(struct nft_trans_elem));
3423 if (trans == NULL)
3424 return NULL;
3425
3426 nft_trans_elem_set(trans) = set;
3427 return trans;
3428 }
3429
3430 void *nft_set_elem_init(const struct nft_set *set,
3431 const struct nft_set_ext_tmpl *tmpl,
3432 const u32 *key, const u32 *data,
3433 u64 timeout, gfp_t gfp)
3434 {
3435 struct nft_set_ext *ext;
3436 void *elem;
3437
3438 elem = kzalloc(set->ops->elemsize + tmpl->len, gfp);
3439 if (elem == NULL)
3440 return NULL;
3441
3442 ext = nft_set_elem_ext(set, elem);
3443 nft_set_ext_init(ext, tmpl);
3444
3445 memcpy(nft_set_ext_key(ext), key, set->klen);
3446 if (nft_set_ext_exists(ext, NFT_SET_EXT_DATA))
3447 memcpy(nft_set_ext_data(ext), data, set->dlen);
3448 if (nft_set_ext_exists(ext, NFT_SET_EXT_EXPIRATION))
3449 *nft_set_ext_expiration(ext) =
3450 jiffies + msecs_to_jiffies(timeout);
3451 if (nft_set_ext_exists(ext, NFT_SET_EXT_TIMEOUT))
3452 *nft_set_ext_timeout(ext) = timeout;
3453
3454 return elem;
3455 }
3456
3457 void nft_set_elem_destroy(const struct nft_set *set, void *elem,
3458 bool destroy_expr)
3459 {
3460 struct nft_set_ext *ext = nft_set_elem_ext(set, elem);
3461
3462 nft_data_uninit(nft_set_ext_key(ext), NFT_DATA_VALUE);
3463 if (nft_set_ext_exists(ext, NFT_SET_EXT_DATA))
3464 nft_data_uninit(nft_set_ext_data(ext), set->dtype);
3465 if (destroy_expr && nft_set_ext_exists(ext, NFT_SET_EXT_EXPR))
3466 nf_tables_expr_destroy(NULL, nft_set_ext_expr(ext));
3467
3468 kfree(elem);
3469 }
3470 EXPORT_SYMBOL_GPL(nft_set_elem_destroy);
3471
3472 static int nft_setelem_parse_flags(const struct nft_set *set,
3473 const struct nlattr *attr, u32 *flags)
3474 {
3475 if (attr == NULL)
3476 return 0;
3477
3478 *flags = ntohl(nla_get_be32(attr));
3479 if (*flags & ~NFT_SET_ELEM_INTERVAL_END)
3480 return -EINVAL;
3481 if (!(set->flags & NFT_SET_INTERVAL) &&
3482 *flags & NFT_SET_ELEM_INTERVAL_END)
3483 return -EINVAL;
3484
3485 return 0;
3486 }
3487
3488 static int nft_add_set_elem(struct nft_ctx *ctx, struct nft_set *set,
3489 const struct nlattr *attr, u32 nlmsg_flags)
3490 {
3491 struct nlattr *nla[NFTA_SET_ELEM_MAX + 1];
3492 struct nft_data_desc d1, d2;
3493 struct nft_set_ext_tmpl tmpl;
3494 struct nft_set_ext *ext, *ext2;
3495 struct nft_set_elem elem;
3496 struct nft_set_binding *binding;
3497 struct nft_userdata *udata;
3498 struct nft_data data;
3499 enum nft_registers dreg;
3500 struct nft_trans *trans;
3501 u32 flags = 0;
3502 u64 timeout;
3503 u8 ulen;
3504 int err;
3505
3506 err = nla_parse_nested(nla, NFTA_SET_ELEM_MAX, attr,
3507 nft_set_elem_policy);
3508 if (err < 0)
3509 return err;
3510
3511 if (nla[NFTA_SET_ELEM_KEY] == NULL)
3512 return -EINVAL;
3513
3514 nft_set_ext_prepare(&tmpl);
3515
3516 err = nft_setelem_parse_flags(set, nla[NFTA_SET_ELEM_FLAGS], &flags);
3517 if (err < 0)
3518 return err;
3519 if (flags != 0)
3520 nft_set_ext_add(&tmpl, NFT_SET_EXT_FLAGS);
3521
3522 if (set->flags & NFT_SET_MAP) {
3523 if (nla[NFTA_SET_ELEM_DATA] == NULL &&
3524 !(flags & NFT_SET_ELEM_INTERVAL_END))
3525 return -EINVAL;
3526 if (nla[NFTA_SET_ELEM_DATA] != NULL &&
3527 flags & NFT_SET_ELEM_INTERVAL_END)
3528 return -EINVAL;
3529 } else {
3530 if (nla[NFTA_SET_ELEM_DATA] != NULL)
3531 return -EINVAL;
3532 }
3533
3534 timeout = 0;
3535 if (nla[NFTA_SET_ELEM_TIMEOUT] != NULL) {
3536 if (!(set->flags & NFT_SET_TIMEOUT))
3537 return -EINVAL;
3538 timeout = be64_to_cpu(nla_get_be64(nla[NFTA_SET_ELEM_TIMEOUT]));
3539 } else if (set->flags & NFT_SET_TIMEOUT) {
3540 timeout = set->timeout;
3541 }
3542
3543 err = nft_data_init(ctx, &elem.key.val, sizeof(elem.key), &d1,
3544 nla[NFTA_SET_ELEM_KEY]);
3545 if (err < 0)
3546 goto err1;
3547 err = -EINVAL;
3548 if (d1.type != NFT_DATA_VALUE || d1.len != set->klen)
3549 goto err2;
3550
3551 nft_set_ext_add_length(&tmpl, NFT_SET_EXT_KEY, d1.len);
3552 if (timeout > 0) {
3553 nft_set_ext_add(&tmpl, NFT_SET_EXT_EXPIRATION);
3554 if (timeout != set->timeout)
3555 nft_set_ext_add(&tmpl, NFT_SET_EXT_TIMEOUT);
3556 }
3557
3558 if (nla[NFTA_SET_ELEM_DATA] != NULL) {
3559 err = nft_data_init(ctx, &data, sizeof(data), &d2,
3560 nla[NFTA_SET_ELEM_DATA]);
3561 if (err < 0)
3562 goto err2;
3563
3564 err = -EINVAL;
3565 if (set->dtype != NFT_DATA_VERDICT && d2.len != set->dlen)
3566 goto err3;
3567
3568 dreg = nft_type_to_reg(set->dtype);
3569 list_for_each_entry(binding, &set->bindings, list) {
3570 struct nft_ctx bind_ctx = {
3571 .afi = ctx->afi,
3572 .table = ctx->table,
3573 .chain = (struct nft_chain *)binding->chain,
3574 };
3575
3576 if (!(binding->flags & NFT_SET_MAP))
3577 continue;
3578
3579 err = nft_validate_register_store(&bind_ctx, dreg,
3580 &data,
3581 d2.type, d2.len);
3582 if (err < 0)
3583 goto err3;
3584 }
3585
3586 nft_set_ext_add_length(&tmpl, NFT_SET_EXT_DATA, d2.len);
3587 }
3588
3589 /* The full maximum length of userdata can exceed the maximum
3590 * offset value (U8_MAX) for following extensions, therefor it
3591 * must be the last extension added.
3592 */
3593 ulen = 0;
3594 if (nla[NFTA_SET_ELEM_USERDATA] != NULL) {
3595 ulen = nla_len(nla[NFTA_SET_ELEM_USERDATA]);
3596 if (ulen > 0)
3597 nft_set_ext_add_length(&tmpl, NFT_SET_EXT_USERDATA,
3598 ulen);
3599 }
3600
3601 err = -ENOMEM;
3602 elem.priv = nft_set_elem_init(set, &tmpl, elem.key.val.data, data.data,
3603 timeout, GFP_KERNEL);
3604 if (elem.priv == NULL)
3605 goto err3;
3606
3607 ext = nft_set_elem_ext(set, elem.priv);
3608 if (flags)
3609 *nft_set_ext_flags(ext) = flags;
3610 if (ulen > 0) {
3611 udata = nft_set_ext_userdata(ext);
3612 udata->len = ulen - 1;
3613 nla_memcpy(&udata->data, nla[NFTA_SET_ELEM_USERDATA], ulen);
3614 }
3615
3616 trans = nft_trans_elem_alloc(ctx, NFT_MSG_NEWSETELEM, set);
3617 if (trans == NULL)
3618 goto err4;
3619
3620 ext->genmask = nft_genmask_cur(ctx->net) | NFT_SET_ELEM_BUSY_MASK;
3621 err = set->ops->insert(ctx->net, set, &elem, &ext2);
3622 if (err) {
3623 if (err == -EEXIST) {
3624 if (nft_set_ext_exists(ext, NFT_SET_EXT_DATA) &&
3625 nft_set_ext_exists(ext2, NFT_SET_EXT_DATA) &&
3626 memcmp(nft_set_ext_data(ext),
3627 nft_set_ext_data(ext2), set->dlen) != 0)
3628 err = -EBUSY;
3629 else if (!(nlmsg_flags & NLM_F_EXCL))
3630 err = 0;
3631 }
3632 goto err5;
3633 }
3634
3635 nft_trans_elem(trans) = elem;
3636 list_add_tail(&trans->list, &ctx->net->nft.commit_list);
3637 return 0;
3638
3639 err5:
3640 kfree(trans);
3641 err4:
3642 kfree(elem.priv);
3643 err3:
3644 if (nla[NFTA_SET_ELEM_DATA] != NULL)
3645 nft_data_uninit(&data, d2.type);
3646 err2:
3647 nft_data_uninit(&elem.key.val, d1.type);
3648 err1:
3649 return err;
3650 }
3651
3652 static int nf_tables_newsetelem(struct net *net, struct sock *nlsk,
3653 struct sk_buff *skb, const struct nlmsghdr *nlh,
3654 const struct nlattr * const nla[])
3655 {
3656 u8 genmask = nft_genmask_next(net);
3657 const struct nlattr *attr;
3658 struct nft_set *set;
3659 struct nft_ctx ctx;
3660 int rem, err = 0;
3661
3662 if (nla[NFTA_SET_ELEM_LIST_ELEMENTS] == NULL)
3663 return -EINVAL;
3664
3665 err = nft_ctx_init_from_elemattr(&ctx, net, skb, nlh, nla, genmask);
3666 if (err < 0)
3667 return err;
3668
3669 set = nf_tables_set_lookup(ctx.table, nla[NFTA_SET_ELEM_LIST_SET],
3670 genmask);
3671 if (IS_ERR(set)) {
3672 if (nla[NFTA_SET_ELEM_LIST_SET_ID]) {
3673 set = nf_tables_set_lookup_byid(net,
3674 nla[NFTA_SET_ELEM_LIST_SET_ID],
3675 genmask);
3676 }
3677 if (IS_ERR(set))
3678 return PTR_ERR(set);
3679 }
3680
3681 if (!list_empty(&set->bindings) && set->flags & NFT_SET_CONSTANT)
3682 return -EBUSY;
3683
3684 nla_for_each_nested(attr, nla[NFTA_SET_ELEM_LIST_ELEMENTS], rem) {
3685 if (set->size &&
3686 !atomic_add_unless(&set->nelems, 1, set->size + set->ndeact))
3687 return -ENFILE;
3688
3689 err = nft_add_set_elem(&ctx, set, attr, nlh->nlmsg_flags);
3690 if (err < 0) {
3691 atomic_dec(&set->nelems);
3692 break;
3693 }
3694 }
3695 return err;
3696 }
3697
3698 static int nft_del_setelem(struct nft_ctx *ctx, struct nft_set *set,
3699 const struct nlattr *attr)
3700 {
3701 struct nlattr *nla[NFTA_SET_ELEM_MAX + 1];
3702 struct nft_set_ext_tmpl tmpl;
3703 struct nft_data_desc desc;
3704 struct nft_set_elem elem;
3705 struct nft_set_ext *ext;
3706 struct nft_trans *trans;
3707 u32 flags = 0;
3708 void *priv;
3709 int err;
3710
3711 err = nla_parse_nested(nla, NFTA_SET_ELEM_MAX, attr,
3712 nft_set_elem_policy);
3713 if (err < 0)
3714 goto err1;
3715
3716 err = -EINVAL;
3717 if (nla[NFTA_SET_ELEM_KEY] == NULL)
3718 goto err1;
3719
3720 nft_set_ext_prepare(&tmpl);
3721
3722 err = nft_setelem_parse_flags(set, nla[NFTA_SET_ELEM_FLAGS], &flags);
3723 if (err < 0)
3724 return err;
3725 if (flags != 0)
3726 nft_set_ext_add(&tmpl, NFT_SET_EXT_FLAGS);
3727
3728 err = nft_data_init(ctx, &elem.key.val, sizeof(elem.key), &desc,
3729 nla[NFTA_SET_ELEM_KEY]);
3730 if (err < 0)
3731 goto err1;
3732
3733 err = -EINVAL;
3734 if (desc.type != NFT_DATA_VALUE || desc.len != set->klen)
3735 goto err2;
3736
3737 nft_set_ext_add_length(&tmpl, NFT_SET_EXT_KEY, desc.len);
3738
3739 err = -ENOMEM;
3740 elem.priv = nft_set_elem_init(set, &tmpl, elem.key.val.data, NULL, 0,
3741 GFP_KERNEL);
3742 if (elem.priv == NULL)
3743 goto err2;
3744
3745 ext = nft_set_elem_ext(set, elem.priv);
3746 if (flags)
3747 *nft_set_ext_flags(ext) = flags;
3748
3749 trans = nft_trans_elem_alloc(ctx, NFT_MSG_DELSETELEM, set);
3750 if (trans == NULL) {
3751 err = -ENOMEM;
3752 goto err3;
3753 }
3754
3755 priv = set->ops->deactivate(ctx->net, set, &elem);
3756 if (priv == NULL) {
3757 err = -ENOENT;
3758 goto err4;
3759 }
3760 kfree(elem.priv);
3761 elem.priv = priv;
3762
3763 nft_trans_elem(trans) = elem;
3764 list_add_tail(&trans->list, &ctx->net->nft.commit_list);
3765 return 0;
3766
3767 err4:
3768 kfree(trans);
3769 err3:
3770 kfree(elem.priv);
3771 err2:
3772 nft_data_uninit(&elem.key.val, desc.type);
3773 err1:
3774 return err;
3775 }
3776
3777 static int nf_tables_delsetelem(struct net *net, struct sock *nlsk,
3778 struct sk_buff *skb, const struct nlmsghdr *nlh,
3779 const struct nlattr * const nla[])
3780 {
3781 u8 genmask = nft_genmask_next(net);
3782 const struct nlattr *attr;
3783 struct nft_set *set;
3784 struct nft_ctx ctx;
3785 int rem, err = 0;
3786
3787 if (nla[NFTA_SET_ELEM_LIST_ELEMENTS] == NULL)
3788 return -EINVAL;
3789
3790 err = nft_ctx_init_from_elemattr(&ctx, net, skb, nlh, nla, genmask);
3791 if (err < 0)
3792 return err;
3793
3794 set = nf_tables_set_lookup(ctx.table, nla[NFTA_SET_ELEM_LIST_SET],
3795 genmask);
3796 if (IS_ERR(set))
3797 return PTR_ERR(set);
3798 if (!list_empty(&set->bindings) && set->flags & NFT_SET_CONSTANT)
3799 return -EBUSY;
3800
3801 nla_for_each_nested(attr, nla[NFTA_SET_ELEM_LIST_ELEMENTS], rem) {
3802 err = nft_del_setelem(&ctx, set, attr);
3803 if (err < 0)
3804 break;
3805
3806 set->ndeact++;
3807 }
3808 return err;
3809 }
3810
3811 void nft_set_gc_batch_release(struct rcu_head *rcu)
3812 {
3813 struct nft_set_gc_batch *gcb;
3814 unsigned int i;
3815
3816 gcb = container_of(rcu, struct nft_set_gc_batch, head.rcu);
3817 for (i = 0; i < gcb->head.cnt; i++)
3818 nft_set_elem_destroy(gcb->head.set, gcb->elems[i], true);
3819 kfree(gcb);
3820 }
3821 EXPORT_SYMBOL_GPL(nft_set_gc_batch_release);
3822
3823 struct nft_set_gc_batch *nft_set_gc_batch_alloc(const struct nft_set *set,
3824 gfp_t gfp)
3825 {
3826 struct nft_set_gc_batch *gcb;
3827
3828 gcb = kzalloc(sizeof(*gcb), gfp);
3829 if (gcb == NULL)
3830 return gcb;
3831 gcb->head.set = set;
3832 return gcb;
3833 }
3834 EXPORT_SYMBOL_GPL(nft_set_gc_batch_alloc);
3835
3836 static int nf_tables_fill_gen_info(struct sk_buff *skb, struct net *net,
3837 u32 portid, u32 seq)
3838 {
3839 struct nlmsghdr *nlh;
3840 struct nfgenmsg *nfmsg;
3841 int event = (NFNL_SUBSYS_NFTABLES << 8) | NFT_MSG_NEWGEN;
3842
3843 nlh = nlmsg_put(skb, portid, seq, event, sizeof(struct nfgenmsg), 0);
3844 if (nlh == NULL)
3845 goto nla_put_failure;
3846
3847 nfmsg = nlmsg_data(nlh);
3848 nfmsg->nfgen_family = AF_UNSPEC;
3849 nfmsg->version = NFNETLINK_V0;
3850 nfmsg->res_id = htons(net->nft.base_seq & 0xffff);
3851
3852 if (nla_put_be32(skb, NFTA_GEN_ID, htonl(net->nft.base_seq)))
3853 goto nla_put_failure;
3854
3855 nlmsg_end(skb, nlh);
3856 return 0;
3857
3858 nla_put_failure:
3859 nlmsg_trim(skb, nlh);
3860 return -EMSGSIZE;
3861 }
3862
3863 static int nf_tables_gen_notify(struct net *net, struct sk_buff *skb, int event)
3864 {
3865 struct nlmsghdr *nlh = nlmsg_hdr(skb);
3866 struct sk_buff *skb2;
3867 int err;
3868
3869 if (nlmsg_report(nlh) &&
3870 !nfnetlink_has_listeners(net, NFNLGRP_NFTABLES))
3871 return 0;
3872
3873 err = -ENOBUFS;
3874 skb2 = nlmsg_new(NLMSG_GOODSIZE, GFP_KERNEL);
3875 if (skb2 == NULL)
3876 goto err;
3877
3878 err = nf_tables_fill_gen_info(skb2, net, NETLINK_CB(skb).portid,
3879 nlh->nlmsg_seq);
3880 if (err < 0) {
3881 kfree_skb(skb2);
3882 goto err;
3883 }
3884
3885 err = nfnetlink_send(skb2, net, NETLINK_CB(skb).portid,
3886 NFNLGRP_NFTABLES, nlmsg_report(nlh), GFP_KERNEL);
3887 err:
3888 if (err < 0) {
3889 nfnetlink_set_err(net, NETLINK_CB(skb).portid, NFNLGRP_NFTABLES,
3890 err);
3891 }
3892 return err;
3893 }
3894
3895 static int nf_tables_getgen(struct net *net, struct sock *nlsk,
3896 struct sk_buff *skb, const struct nlmsghdr *nlh,
3897 const struct nlattr * const nla[])
3898 {
3899 struct sk_buff *skb2;
3900 int err;
3901
3902 skb2 = alloc_skb(NLMSG_GOODSIZE, GFP_KERNEL);
3903 if (skb2 == NULL)
3904 return -ENOMEM;
3905
3906 err = nf_tables_fill_gen_info(skb2, net, NETLINK_CB(skb).portid,
3907 nlh->nlmsg_seq);
3908 if (err < 0)
3909 goto err;
3910
3911 return nlmsg_unicast(nlsk, skb2, NETLINK_CB(skb).portid);
3912 err:
3913 kfree_skb(skb2);
3914 return err;
3915 }
3916
3917 static const struct nfnl_callback nf_tables_cb[NFT_MSG_MAX] = {
3918 [NFT_MSG_NEWTABLE] = {
3919 .call_batch = nf_tables_newtable,
3920 .attr_count = NFTA_TABLE_MAX,
3921 .policy = nft_table_policy,
3922 },
3923 [NFT_MSG_GETTABLE] = {
3924 .call = nf_tables_gettable,
3925 .attr_count = NFTA_TABLE_MAX,
3926 .policy = nft_table_policy,
3927 },
3928 [NFT_MSG_DELTABLE] = {
3929 .call_batch = nf_tables_deltable,
3930 .attr_count = NFTA_TABLE_MAX,
3931 .policy = nft_table_policy,
3932 },
3933 [NFT_MSG_NEWCHAIN] = {
3934 .call_batch = nf_tables_newchain,
3935 .attr_count = NFTA_CHAIN_MAX,
3936 .policy = nft_chain_policy,
3937 },
3938 [NFT_MSG_GETCHAIN] = {
3939 .call = nf_tables_getchain,
3940 .attr_count = NFTA_CHAIN_MAX,
3941 .policy = nft_chain_policy,
3942 },
3943 [NFT_MSG_DELCHAIN] = {
3944 .call_batch = nf_tables_delchain,
3945 .attr_count = NFTA_CHAIN_MAX,
3946 .policy = nft_chain_policy,
3947 },
3948 [NFT_MSG_NEWRULE] = {
3949 .call_batch = nf_tables_newrule,
3950 .attr_count = NFTA_RULE_MAX,
3951 .policy = nft_rule_policy,
3952 },
3953 [NFT_MSG_GETRULE] = {
3954 .call = nf_tables_getrule,
3955 .attr_count = NFTA_RULE_MAX,
3956 .policy = nft_rule_policy,
3957 },
3958 [NFT_MSG_DELRULE] = {
3959 .call_batch = nf_tables_delrule,
3960 .attr_count = NFTA_RULE_MAX,
3961 .policy = nft_rule_policy,
3962 },
3963 [NFT_MSG_NEWSET] = {
3964 .call_batch = nf_tables_newset,
3965 .attr_count = NFTA_SET_MAX,
3966 .policy = nft_set_policy,
3967 },
3968 [NFT_MSG_GETSET] = {
3969 .call = nf_tables_getset,
3970 .attr_count = NFTA_SET_MAX,
3971 .policy = nft_set_policy,
3972 },
3973 [NFT_MSG_DELSET] = {
3974 .call_batch = nf_tables_delset,
3975 .attr_count = NFTA_SET_MAX,
3976 .policy = nft_set_policy,
3977 },
3978 [NFT_MSG_NEWSETELEM] = {
3979 .call_batch = nf_tables_newsetelem,
3980 .attr_count = NFTA_SET_ELEM_LIST_MAX,
3981 .policy = nft_set_elem_list_policy,
3982 },
3983 [NFT_MSG_GETSETELEM] = {
3984 .call = nf_tables_getsetelem,
3985 .attr_count = NFTA_SET_ELEM_LIST_MAX,
3986 .policy = nft_set_elem_list_policy,
3987 },
3988 [NFT_MSG_DELSETELEM] = {
3989 .call_batch = nf_tables_delsetelem,
3990 .attr_count = NFTA_SET_ELEM_LIST_MAX,
3991 .policy = nft_set_elem_list_policy,
3992 },
3993 [NFT_MSG_GETGEN] = {
3994 .call = nf_tables_getgen,
3995 },
3996 };
3997
3998 static void nft_chain_commit_update(struct nft_trans *trans)
3999 {
4000 struct nft_base_chain *basechain;
4001
4002 if (nft_trans_chain_name(trans)[0])
4003 strcpy(trans->ctx.chain->name, nft_trans_chain_name(trans));
4004
4005 if (!(trans->ctx.chain->flags & NFT_BASE_CHAIN))
4006 return;
4007
4008 basechain = nft_base_chain(trans->ctx.chain);
4009 nft_chain_stats_replace(basechain, nft_trans_chain_stats(trans));
4010
4011 switch (nft_trans_chain_policy(trans)) {
4012 case NF_DROP:
4013 case NF_ACCEPT:
4014 basechain->policy = nft_trans_chain_policy(trans);
4015 break;
4016 }
4017 }
4018
4019 static void nf_tables_commit_release(struct nft_trans *trans)
4020 {
4021 switch (trans->msg_type) {
4022 case NFT_MSG_DELTABLE:
4023 nf_tables_table_destroy(&trans->ctx);
4024 break;
4025 case NFT_MSG_DELCHAIN:
4026 nf_tables_chain_destroy(trans->ctx.chain);
4027 break;
4028 case NFT_MSG_DELRULE:
4029 nf_tables_rule_destroy(&trans->ctx, nft_trans_rule(trans));
4030 break;
4031 case NFT_MSG_DELSET:
4032 nft_set_destroy(nft_trans_set(trans));
4033 break;
4034 case NFT_MSG_DELSETELEM:
4035 nft_set_elem_destroy(nft_trans_elem_set(trans),
4036 nft_trans_elem(trans).priv, true);
4037 break;
4038 }
4039 kfree(trans);
4040 }
4041
4042 static int nf_tables_commit(struct net *net, struct sk_buff *skb)
4043 {
4044 struct nft_trans *trans, *next;
4045 struct nft_trans_elem *te;
4046
4047 /* Bump generation counter, invalidate any dump in progress */
4048 while (++net->nft.base_seq == 0);
4049
4050 /* A new generation has just started */
4051 net->nft.gencursor = nft_gencursor_next(net);
4052
4053 /* Make sure all packets have left the previous generation before
4054 * purging old rules.
4055 */
4056 synchronize_rcu();
4057
4058 list_for_each_entry_safe(trans, next, &net->nft.commit_list, list) {
4059 switch (trans->msg_type) {
4060 case NFT_MSG_NEWTABLE:
4061 if (nft_trans_table_update(trans)) {
4062 if (!nft_trans_table_enable(trans)) {
4063 nf_tables_table_disable(net,
4064 trans->ctx.afi,
4065 trans->ctx.table);
4066 trans->ctx.table->flags |= NFT_TABLE_F_DORMANT;
4067 }
4068 } else {
4069 nft_clear(net, trans->ctx.table);
4070 }
4071 nf_tables_table_notify(&trans->ctx, NFT_MSG_NEWTABLE);
4072 nft_trans_destroy(trans);
4073 break;
4074 case NFT_MSG_DELTABLE:
4075 list_del_rcu(&trans->ctx.table->list);
4076 nf_tables_table_notify(&trans->ctx, NFT_MSG_DELTABLE);
4077 break;
4078 case NFT_MSG_NEWCHAIN:
4079 if (nft_trans_chain_update(trans))
4080 nft_chain_commit_update(trans);
4081 else
4082 nft_clear(net, trans->ctx.chain);
4083
4084 nf_tables_chain_notify(&trans->ctx, NFT_MSG_NEWCHAIN);
4085 nft_trans_destroy(trans);
4086 break;
4087 case NFT_MSG_DELCHAIN:
4088 list_del_rcu(&trans->ctx.chain->list);
4089 nf_tables_chain_notify(&trans->ctx, NFT_MSG_DELCHAIN);
4090 nf_tables_unregister_hooks(trans->ctx.net,
4091 trans->ctx.table,
4092 trans->ctx.chain,
4093 trans->ctx.afi->nops);
4094 break;
4095 case NFT_MSG_NEWRULE:
4096 nft_clear(trans->ctx.net, nft_trans_rule(trans));
4097 nf_tables_rule_notify(&trans->ctx,
4098 nft_trans_rule(trans),
4099 NFT_MSG_NEWRULE);
4100 nft_trans_destroy(trans);
4101 break;
4102 case NFT_MSG_DELRULE:
4103 list_del_rcu(&nft_trans_rule(trans)->list);
4104 nf_tables_rule_notify(&trans->ctx,
4105 nft_trans_rule(trans),
4106 NFT_MSG_DELRULE);
4107 break;
4108 case NFT_MSG_NEWSET:
4109 nft_clear(net, nft_trans_set(trans));
4110 /* This avoids hitting -EBUSY when deleting the table
4111 * from the transaction.
4112 */
4113 if (nft_trans_set(trans)->flags & NFT_SET_ANONYMOUS &&
4114 !list_empty(&nft_trans_set(trans)->bindings))
4115 trans->ctx.table->use--;
4116
4117 nf_tables_set_notify(&trans->ctx, nft_trans_set(trans),
4118 NFT_MSG_NEWSET, GFP_KERNEL);
4119 nft_trans_destroy(trans);
4120 break;
4121 case NFT_MSG_DELSET:
4122 list_del_rcu(&nft_trans_set(trans)->list);
4123 nf_tables_set_notify(&trans->ctx, nft_trans_set(trans),
4124 NFT_MSG_DELSET, GFP_KERNEL);
4125 break;
4126 case NFT_MSG_NEWSETELEM:
4127 te = (struct nft_trans_elem *)trans->data;
4128
4129 te->set->ops->activate(net, te->set, &te->elem);
4130 nf_tables_setelem_notify(&trans->ctx, te->set,
4131 &te->elem,
4132 NFT_MSG_NEWSETELEM, 0);
4133 nft_trans_destroy(trans);
4134 break;
4135 case NFT_MSG_DELSETELEM:
4136 te = (struct nft_trans_elem *)trans->data;
4137
4138 nf_tables_setelem_notify(&trans->ctx, te->set,
4139 &te->elem,
4140 NFT_MSG_DELSETELEM, 0);
4141 te->set->ops->remove(te->set, &te->elem);
4142 atomic_dec(&te->set->nelems);
4143 te->set->ndeact--;
4144 break;
4145 }
4146 }
4147
4148 synchronize_rcu();
4149
4150 list_for_each_entry_safe(trans, next, &net->nft.commit_list, list) {
4151 list_del(&trans->list);
4152 nf_tables_commit_release(trans);
4153 }
4154
4155 nf_tables_gen_notify(net, skb, NFT_MSG_NEWGEN);
4156
4157 return 0;
4158 }
4159
4160 static void nf_tables_abort_release(struct nft_trans *trans)
4161 {
4162 switch (trans->msg_type) {
4163 case NFT_MSG_NEWTABLE:
4164 nf_tables_table_destroy(&trans->ctx);
4165 break;
4166 case NFT_MSG_NEWCHAIN:
4167 nf_tables_chain_destroy(trans->ctx.chain);
4168 break;
4169 case NFT_MSG_NEWRULE:
4170 nf_tables_rule_destroy(&trans->ctx, nft_trans_rule(trans));
4171 break;
4172 case NFT_MSG_NEWSET:
4173 nft_set_destroy(nft_trans_set(trans));
4174 break;
4175 case NFT_MSG_NEWSETELEM:
4176 nft_set_elem_destroy(nft_trans_elem_set(trans),
4177 nft_trans_elem(trans).priv, true);
4178 break;
4179 }
4180 kfree(trans);
4181 }
4182
4183 static int nf_tables_abort(struct net *net, struct sk_buff *skb)
4184 {
4185 struct nft_trans *trans, *next;
4186 struct nft_trans_elem *te;
4187
4188 list_for_each_entry_safe_reverse(trans, next, &net->nft.commit_list,
4189 list) {
4190 switch (trans->msg_type) {
4191 case NFT_MSG_NEWTABLE:
4192 if (nft_trans_table_update(trans)) {
4193 if (nft_trans_table_enable(trans)) {
4194 nf_tables_table_disable(net,
4195 trans->ctx.afi,
4196 trans->ctx.table);
4197 trans->ctx.table->flags |= NFT_TABLE_F_DORMANT;
4198 }
4199 nft_trans_destroy(trans);
4200 } else {
4201 list_del_rcu(&trans->ctx.table->list);
4202 }
4203 break;
4204 case NFT_MSG_DELTABLE:
4205 nft_clear(trans->ctx.net, trans->ctx.table);
4206 nft_trans_destroy(trans);
4207 break;
4208 case NFT_MSG_NEWCHAIN:
4209 if (nft_trans_chain_update(trans)) {
4210 free_percpu(nft_trans_chain_stats(trans));
4211
4212 nft_trans_destroy(trans);
4213 } else {
4214 trans->ctx.table->use--;
4215 list_del_rcu(&trans->ctx.chain->list);
4216 nf_tables_unregister_hooks(trans->ctx.net,
4217 trans->ctx.table,
4218 trans->ctx.chain,
4219 trans->ctx.afi->nops);
4220 }
4221 break;
4222 case NFT_MSG_DELCHAIN:
4223 trans->ctx.table->use++;
4224 nft_clear(trans->ctx.net, trans->ctx.chain);
4225 nft_trans_destroy(trans);
4226 break;
4227 case NFT_MSG_NEWRULE:
4228 trans->ctx.chain->use--;
4229 list_del_rcu(&nft_trans_rule(trans)->list);
4230 break;
4231 case NFT_MSG_DELRULE:
4232 trans->ctx.chain->use++;
4233 nft_clear(trans->ctx.net, nft_trans_rule(trans));
4234 nft_trans_destroy(trans);
4235 break;
4236 case NFT_MSG_NEWSET:
4237 trans->ctx.table->use--;
4238 list_del_rcu(&nft_trans_set(trans)->list);
4239 break;
4240 case NFT_MSG_DELSET:
4241 trans->ctx.table->use++;
4242 nft_clear(trans->ctx.net, nft_trans_set(trans));
4243 nft_trans_destroy(trans);
4244 break;
4245 case NFT_MSG_NEWSETELEM:
4246 te = (struct nft_trans_elem *)trans->data;
4247
4248 te->set->ops->remove(te->set, &te->elem);
4249 atomic_dec(&te->set->nelems);
4250 break;
4251 case NFT_MSG_DELSETELEM:
4252 te = (struct nft_trans_elem *)trans->data;
4253
4254 te->set->ops->activate(net, te->set, &te->elem);
4255 te->set->ndeact--;
4256
4257 nft_trans_destroy(trans);
4258 break;
4259 }
4260 }
4261
4262 synchronize_rcu();
4263
4264 list_for_each_entry_safe_reverse(trans, next,
4265 &net->nft.commit_list, list) {
4266 list_del(&trans->list);
4267 nf_tables_abort_release(trans);
4268 }
4269
4270 return 0;
4271 }
4272
4273 static const struct nfnetlink_subsystem nf_tables_subsys = {
4274 .name = "nf_tables",
4275 .subsys_id = NFNL_SUBSYS_NFTABLES,
4276 .cb_count = NFT_MSG_MAX,
4277 .cb = nf_tables_cb,
4278 .commit = nf_tables_commit,
4279 .abort = nf_tables_abort,
4280 };
4281
4282 int nft_chain_validate_dependency(const struct nft_chain *chain,
4283 enum nft_chain_type type)
4284 {
4285 const struct nft_base_chain *basechain;
4286
4287 if (chain->flags & NFT_BASE_CHAIN) {
4288 basechain = nft_base_chain(chain);
4289 if (basechain->type->type != type)
4290 return -EOPNOTSUPP;
4291 }
4292 return 0;
4293 }
4294 EXPORT_SYMBOL_GPL(nft_chain_validate_dependency);
4295
4296 int nft_chain_validate_hooks(const struct nft_chain *chain,
4297 unsigned int hook_flags)
4298 {
4299 struct nft_base_chain *basechain;
4300
4301 if (chain->flags & NFT_BASE_CHAIN) {
4302 basechain = nft_base_chain(chain);
4303
4304 if ((1 << basechain->ops[0].hooknum) & hook_flags)
4305 return 0;
4306
4307 return -EOPNOTSUPP;
4308 }
4309
4310 return 0;
4311 }
4312 EXPORT_SYMBOL_GPL(nft_chain_validate_hooks);
4313
4314 /*
4315 * Loop detection - walk through the ruleset beginning at the destination chain
4316 * of a new jump until either the source chain is reached (loop) or all
4317 * reachable chains have been traversed.
4318 *
4319 * The loop check is performed whenever a new jump verdict is added to an
4320 * expression or verdict map or a verdict map is bound to a new chain.
4321 */
4322
4323 static int nf_tables_check_loops(const struct nft_ctx *ctx,
4324 const struct nft_chain *chain);
4325
4326 static int nf_tables_loop_check_setelem(const struct nft_ctx *ctx,
4327 const struct nft_set *set,
4328 const struct nft_set_iter *iter,
4329 const struct nft_set_elem *elem)
4330 {
4331 const struct nft_set_ext *ext = nft_set_elem_ext(set, elem->priv);
4332 const struct nft_data *data;
4333
4334 if (nft_set_ext_exists(ext, NFT_SET_EXT_FLAGS) &&
4335 *nft_set_ext_flags(ext) & NFT_SET_ELEM_INTERVAL_END)
4336 return 0;
4337
4338 data = nft_set_ext_data(ext);
4339 switch (data->verdict.code) {
4340 case NFT_JUMP:
4341 case NFT_GOTO:
4342 return nf_tables_check_loops(ctx, data->verdict.chain);
4343 default:
4344 return 0;
4345 }
4346 }
4347
4348 static int nf_tables_check_loops(const struct nft_ctx *ctx,
4349 const struct nft_chain *chain)
4350 {
4351 const struct nft_rule *rule;
4352 const struct nft_expr *expr, *last;
4353 const struct nft_set *set;
4354 struct nft_set_binding *binding;
4355 struct nft_set_iter iter;
4356
4357 if (ctx->chain == chain)
4358 return -ELOOP;
4359
4360 list_for_each_entry(rule, &chain->rules, list) {
4361 nft_rule_for_each_expr(expr, last, rule) {
4362 const struct nft_data *data = NULL;
4363 int err;
4364
4365 if (!expr->ops->validate)
4366 continue;
4367
4368 err = expr->ops->validate(ctx, expr, &data);
4369 if (err < 0)
4370 return err;
4371
4372 if (data == NULL)
4373 continue;
4374
4375 switch (data->verdict.code) {
4376 case NFT_JUMP:
4377 case NFT_GOTO:
4378 err = nf_tables_check_loops(ctx,
4379 data->verdict.chain);
4380 if (err < 0)
4381 return err;
4382 default:
4383 break;
4384 }
4385 }
4386 }
4387
4388 list_for_each_entry(set, &ctx->table->sets, list) {
4389 if (!nft_is_active_next(ctx->net, set))
4390 continue;
4391 if (!(set->flags & NFT_SET_MAP) ||
4392 set->dtype != NFT_DATA_VERDICT)
4393 continue;
4394
4395 list_for_each_entry(binding, &set->bindings, list) {
4396 if (!(binding->flags & NFT_SET_MAP) ||
4397 binding->chain != chain)
4398 continue;
4399
4400 iter.genmask = nft_genmask_next(ctx->net);
4401 iter.skip = 0;
4402 iter.count = 0;
4403 iter.err = 0;
4404 iter.fn = nf_tables_loop_check_setelem;
4405
4406 set->ops->walk(ctx, set, &iter);
4407 if (iter.err < 0)
4408 return iter.err;
4409 }
4410 }
4411
4412 return 0;
4413 }
4414
4415 /**
4416 * nft_parse_u32_check - fetch u32 attribute and check for maximum value
4417 *
4418 * @attr: netlink attribute to fetch value from
4419 * @max: maximum value to be stored in dest
4420 * @dest: pointer to the variable
4421 *
4422 * Parse, check and store a given u32 netlink attribute into variable.
4423 * This function returns -ERANGE if the value goes over maximum value.
4424 * Otherwise a 0 is returned and the attribute value is stored in the
4425 * destination variable.
4426 */
4427 int nft_parse_u32_check(const struct nlattr *attr, int max, u32 *dest)
4428 {
4429 u32 val;
4430
4431 val = ntohl(nla_get_be32(attr));
4432 if (val > max)
4433 return -ERANGE;
4434
4435 *dest = val;
4436 return 0;
4437 }
4438 EXPORT_SYMBOL_GPL(nft_parse_u32_check);
4439
4440 /**
4441 * nft_parse_register - parse a register value from a netlink attribute
4442 *
4443 * @attr: netlink attribute
4444 *
4445 * Parse and translate a register value from a netlink attribute.
4446 * Registers used to be 128 bit wide, these register numbers will be
4447 * mapped to the corresponding 32 bit register numbers.
4448 */
4449 unsigned int nft_parse_register(const struct nlattr *attr)
4450 {
4451 unsigned int reg;
4452
4453 reg = ntohl(nla_get_be32(attr));
4454 switch (reg) {
4455 case NFT_REG_VERDICT...NFT_REG_4:
4456 return reg * NFT_REG_SIZE / NFT_REG32_SIZE;
4457 default:
4458 return reg + NFT_REG_SIZE / NFT_REG32_SIZE - NFT_REG32_00;
4459 }
4460 }
4461 EXPORT_SYMBOL_GPL(nft_parse_register);
4462
4463 /**
4464 * nft_dump_register - dump a register value to a netlink attribute
4465 *
4466 * @skb: socket buffer
4467 * @attr: attribute number
4468 * @reg: register number
4469 *
4470 * Construct a netlink attribute containing the register number. For
4471 * compatibility reasons, register numbers being a multiple of 4 are
4472 * translated to the corresponding 128 bit register numbers.
4473 */
4474 int nft_dump_register(struct sk_buff *skb, unsigned int attr, unsigned int reg)
4475 {
4476 if (reg % (NFT_REG_SIZE / NFT_REG32_SIZE) == 0)
4477 reg = reg / (NFT_REG_SIZE / NFT_REG32_SIZE);
4478 else
4479 reg = reg - NFT_REG_SIZE / NFT_REG32_SIZE + NFT_REG32_00;
4480
4481 return nla_put_be32(skb, attr, htonl(reg));
4482 }
4483 EXPORT_SYMBOL_GPL(nft_dump_register);
4484
4485 /**
4486 * nft_validate_register_load - validate a load from a register
4487 *
4488 * @reg: the register number
4489 * @len: the length of the data
4490 *
4491 * Validate that the input register is one of the general purpose
4492 * registers and that the length of the load is within the bounds.
4493 */
4494 int nft_validate_register_load(enum nft_registers reg, unsigned int len)
4495 {
4496 if (reg < NFT_REG_1 * NFT_REG_SIZE / NFT_REG32_SIZE)
4497 return -EINVAL;
4498 if (len == 0)
4499 return -EINVAL;
4500 if (reg * NFT_REG32_SIZE + len > FIELD_SIZEOF(struct nft_regs, data))
4501 return -ERANGE;
4502
4503 return 0;
4504 }
4505 EXPORT_SYMBOL_GPL(nft_validate_register_load);
4506
4507 /**
4508 * nft_validate_register_store - validate an expressions' register store
4509 *
4510 * @ctx: context of the expression performing the load
4511 * @reg: the destination register number
4512 * @data: the data to load
4513 * @type: the data type
4514 * @len: the length of the data
4515 *
4516 * Validate that a data load uses the appropriate data type for
4517 * the destination register and the length is within the bounds.
4518 * A value of NULL for the data means that its runtime gathered
4519 * data.
4520 */
4521 int nft_validate_register_store(const struct nft_ctx *ctx,
4522 enum nft_registers reg,
4523 const struct nft_data *data,
4524 enum nft_data_types type, unsigned int len)
4525 {
4526 int err;
4527
4528 switch (reg) {
4529 case NFT_REG_VERDICT:
4530 if (type != NFT_DATA_VERDICT)
4531 return -EINVAL;
4532
4533 if (data != NULL &&
4534 (data->verdict.code == NFT_GOTO ||
4535 data->verdict.code == NFT_JUMP)) {
4536 err = nf_tables_check_loops(ctx, data->verdict.chain);
4537 if (err < 0)
4538 return err;
4539
4540 if (ctx->chain->level + 1 >
4541 data->verdict.chain->level) {
4542 if (ctx->chain->level + 1 == NFT_JUMP_STACK_SIZE)
4543 return -EMLINK;
4544 data->verdict.chain->level = ctx->chain->level + 1;
4545 }
4546 }
4547
4548 return 0;
4549 default:
4550 if (reg < NFT_REG_1 * NFT_REG_SIZE / NFT_REG32_SIZE)
4551 return -EINVAL;
4552 if (len == 0)
4553 return -EINVAL;
4554 if (reg * NFT_REG32_SIZE + len >
4555 FIELD_SIZEOF(struct nft_regs, data))
4556 return -ERANGE;
4557
4558 if (data != NULL && type != NFT_DATA_VALUE)
4559 return -EINVAL;
4560 return 0;
4561 }
4562 }
4563 EXPORT_SYMBOL_GPL(nft_validate_register_store);
4564
4565 static const struct nla_policy nft_verdict_policy[NFTA_VERDICT_MAX + 1] = {
4566 [NFTA_VERDICT_CODE] = { .type = NLA_U32 },
4567 [NFTA_VERDICT_CHAIN] = { .type = NLA_STRING,
4568 .len = NFT_CHAIN_MAXNAMELEN - 1 },
4569 };
4570
4571 static int nft_verdict_init(const struct nft_ctx *ctx, struct nft_data *data,
4572 struct nft_data_desc *desc, const struct nlattr *nla)
4573 {
4574 u8 genmask = nft_genmask_next(ctx->net);
4575 struct nlattr *tb[NFTA_VERDICT_MAX + 1];
4576 struct nft_chain *chain;
4577 int err;
4578
4579 err = nla_parse_nested(tb, NFTA_VERDICT_MAX, nla, nft_verdict_policy);
4580 if (err < 0)
4581 return err;
4582
4583 if (!tb[NFTA_VERDICT_CODE])
4584 return -EINVAL;
4585 data->verdict.code = ntohl(nla_get_be32(tb[NFTA_VERDICT_CODE]));
4586
4587 switch (data->verdict.code) {
4588 default:
4589 switch (data->verdict.code & NF_VERDICT_MASK) {
4590 case NF_ACCEPT:
4591 case NF_DROP:
4592 case NF_QUEUE:
4593 break;
4594 default:
4595 return -EINVAL;
4596 }
4597 /* fall through */
4598 case NFT_CONTINUE:
4599 case NFT_BREAK:
4600 case NFT_RETURN:
4601 break;
4602 case NFT_JUMP:
4603 case NFT_GOTO:
4604 if (!tb[NFTA_VERDICT_CHAIN])
4605 return -EINVAL;
4606 chain = nf_tables_chain_lookup(ctx->table,
4607 tb[NFTA_VERDICT_CHAIN], genmask);
4608 if (IS_ERR(chain))
4609 return PTR_ERR(chain);
4610 if (chain->flags & NFT_BASE_CHAIN)
4611 return -EOPNOTSUPP;
4612
4613 chain->use++;
4614 data->verdict.chain = chain;
4615 break;
4616 }
4617
4618 desc->len = sizeof(data->verdict);
4619 desc->type = NFT_DATA_VERDICT;
4620 return 0;
4621 }
4622
4623 static void nft_verdict_uninit(const struct nft_data *data)
4624 {
4625 switch (data->verdict.code) {
4626 case NFT_JUMP:
4627 case NFT_GOTO:
4628 data->verdict.chain->use--;
4629 break;
4630 }
4631 }
4632
4633 int nft_verdict_dump(struct sk_buff *skb, int type, const struct nft_verdict *v)
4634 {
4635 struct nlattr *nest;
4636
4637 nest = nla_nest_start(skb, type);
4638 if (!nest)
4639 goto nla_put_failure;
4640
4641 if (nla_put_be32(skb, NFTA_VERDICT_CODE, htonl(v->code)))
4642 goto nla_put_failure;
4643
4644 switch (v->code) {
4645 case NFT_JUMP:
4646 case NFT_GOTO:
4647 if (nla_put_string(skb, NFTA_VERDICT_CHAIN,
4648 v->chain->name))
4649 goto nla_put_failure;
4650 }
4651 nla_nest_end(skb, nest);
4652 return 0;
4653
4654 nla_put_failure:
4655 return -1;
4656 }
4657
4658 static int nft_value_init(const struct nft_ctx *ctx,
4659 struct nft_data *data, unsigned int size,
4660 struct nft_data_desc *desc, const struct nlattr *nla)
4661 {
4662 unsigned int len;
4663
4664 len = nla_len(nla);
4665 if (len == 0)
4666 return -EINVAL;
4667 if (len > size)
4668 return -EOVERFLOW;
4669
4670 nla_memcpy(data->data, nla, len);
4671 desc->type = NFT_DATA_VALUE;
4672 desc->len = len;
4673 return 0;
4674 }
4675
4676 static int nft_value_dump(struct sk_buff *skb, const struct nft_data *data,
4677 unsigned int len)
4678 {
4679 return nla_put(skb, NFTA_DATA_VALUE, len, data->data);
4680 }
4681
4682 static const struct nla_policy nft_data_policy[NFTA_DATA_MAX + 1] = {
4683 [NFTA_DATA_VALUE] = { .type = NLA_BINARY },
4684 [NFTA_DATA_VERDICT] = { .type = NLA_NESTED },
4685 };
4686
4687 /**
4688 * nft_data_init - parse nf_tables data netlink attributes
4689 *
4690 * @ctx: context of the expression using the data
4691 * @data: destination struct nft_data
4692 * @size: maximum data length
4693 * @desc: data description
4694 * @nla: netlink attribute containing data
4695 *
4696 * Parse the netlink data attributes and initialize a struct nft_data.
4697 * The type and length of data are returned in the data description.
4698 *
4699 * The caller can indicate that it only wants to accept data of type
4700 * NFT_DATA_VALUE by passing NULL for the ctx argument.
4701 */
4702 int nft_data_init(const struct nft_ctx *ctx,
4703 struct nft_data *data, unsigned int size,
4704 struct nft_data_desc *desc, const struct nlattr *nla)
4705 {
4706 struct nlattr *tb[NFTA_DATA_MAX + 1];
4707 int err;
4708
4709 err = nla_parse_nested(tb, NFTA_DATA_MAX, nla, nft_data_policy);
4710 if (err < 0)
4711 return err;
4712
4713 if (tb[NFTA_DATA_VALUE])
4714 return nft_value_init(ctx, data, size, desc,
4715 tb[NFTA_DATA_VALUE]);
4716 if (tb[NFTA_DATA_VERDICT] && ctx != NULL)
4717 return nft_verdict_init(ctx, data, desc, tb[NFTA_DATA_VERDICT]);
4718 return -EINVAL;
4719 }
4720 EXPORT_SYMBOL_GPL(nft_data_init);
4721
4722 /**
4723 * nft_data_uninit - release a nft_data item
4724 *
4725 * @data: struct nft_data to release
4726 * @type: type of data
4727 *
4728 * Release a nft_data item. NFT_DATA_VALUE types can be silently discarded,
4729 * all others need to be released by calling this function.
4730 */
4731 void nft_data_uninit(const struct nft_data *data, enum nft_data_types type)
4732 {
4733 if (type < NFT_DATA_VERDICT)
4734 return;
4735 switch (type) {
4736 case NFT_DATA_VERDICT:
4737 return nft_verdict_uninit(data);
4738 default:
4739 WARN_ON(1);
4740 }
4741 }
4742 EXPORT_SYMBOL_GPL(nft_data_uninit);
4743
4744 int nft_data_dump(struct sk_buff *skb, int attr, const struct nft_data *data,
4745 enum nft_data_types type, unsigned int len)
4746 {
4747 struct nlattr *nest;
4748 int err;
4749
4750 nest = nla_nest_start(skb, attr);
4751 if (nest == NULL)
4752 return -1;
4753
4754 switch (type) {
4755 case NFT_DATA_VALUE:
4756 err = nft_value_dump(skb, data, len);
4757 break;
4758 case NFT_DATA_VERDICT:
4759 err = nft_verdict_dump(skb, NFTA_DATA_VERDICT, &data->verdict);
4760 break;
4761 default:
4762 err = -EINVAL;
4763 WARN_ON(1);
4764 }
4765
4766 nla_nest_end(skb, nest);
4767 return err;
4768 }
4769 EXPORT_SYMBOL_GPL(nft_data_dump);
4770
4771 static int __net_init nf_tables_init_net(struct net *net)
4772 {
4773 INIT_LIST_HEAD(&net->nft.af_info);
4774 INIT_LIST_HEAD(&net->nft.commit_list);
4775 net->nft.base_seq = 1;
4776 return 0;
4777 }
4778
4779 int __nft_release_basechain(struct nft_ctx *ctx)
4780 {
4781 struct nft_rule *rule, *nr;
4782
4783 BUG_ON(!(ctx->chain->flags & NFT_BASE_CHAIN));
4784
4785 nf_tables_unregister_hooks(ctx->net, ctx->chain->table, ctx->chain,
4786 ctx->afi->nops);
4787 list_for_each_entry_safe(rule, nr, &ctx->chain->rules, list) {
4788 list_del(&rule->list);
4789 ctx->chain->use--;
4790 nf_tables_rule_destroy(ctx, rule);
4791 }
4792 list_del(&ctx->chain->list);
4793 ctx->table->use--;
4794 nf_tables_chain_destroy(ctx->chain);
4795
4796 return 0;
4797 }
4798 EXPORT_SYMBOL_GPL(__nft_release_basechain);
4799
4800 /* Called by nft_unregister_afinfo() from __net_exit path, nfnl_lock is held. */
4801 static void __nft_release_afinfo(struct net *net, struct nft_af_info *afi)
4802 {
4803 struct nft_table *table, *nt;
4804 struct nft_chain *chain, *nc;
4805 struct nft_rule *rule, *nr;
4806 struct nft_set *set, *ns;
4807 struct nft_ctx ctx = {
4808 .net = net,
4809 .afi = afi,
4810 };
4811
4812 list_for_each_entry_safe(table, nt, &afi->tables, list) {
4813 list_for_each_entry(chain, &table->chains, list)
4814 nf_tables_unregister_hooks(net, table, chain,
4815 afi->nops);
4816 /* No packets are walking on these chains anymore. */
4817 ctx.table = table;
4818 list_for_each_entry(chain, &table->chains, list) {
4819 ctx.chain = chain;
4820 list_for_each_entry_safe(rule, nr, &chain->rules, list) {
4821 list_del(&rule->list);
4822 chain->use--;
4823 nf_tables_rule_destroy(&ctx, rule);
4824 }
4825 }
4826 list_for_each_entry_safe(set, ns, &table->sets, list) {
4827 list_del(&set->list);
4828 table->use--;
4829 nft_set_destroy(set);
4830 }
4831 list_for_each_entry_safe(chain, nc, &table->chains, list) {
4832 list_del(&chain->list);
4833 table->use--;
4834 nf_tables_chain_destroy(chain);
4835 }
4836 list_del(&table->list);
4837 nf_tables_table_destroy(&ctx);
4838 }
4839 }
4840
4841 static struct pernet_operations nf_tables_net_ops = {
4842 .init = nf_tables_init_net,
4843 };
4844
4845 static int __init nf_tables_module_init(void)
4846 {
4847 int err;
4848
4849 info = kmalloc(sizeof(struct nft_expr_info) * NFT_RULE_MAXEXPRS,
4850 GFP_KERNEL);
4851 if (info == NULL) {
4852 err = -ENOMEM;
4853 goto err1;
4854 }
4855
4856 err = nf_tables_core_module_init();
4857 if (err < 0)
4858 goto err2;
4859
4860 err = nfnetlink_subsys_register(&nf_tables_subsys);
4861 if (err < 0)
4862 goto err3;
4863
4864 pr_info("nf_tables: (c) 2007-2009 Patrick McHardy <kaber@trash.net>\n");
4865 return register_pernet_subsys(&nf_tables_net_ops);
4866 err3:
4867 nf_tables_core_module_exit();
4868 err2:
4869 kfree(info);
4870 err1:
4871 return err;
4872 }
4873
4874 static void __exit nf_tables_module_exit(void)
4875 {
4876 unregister_pernet_subsys(&nf_tables_net_ops);
4877 nfnetlink_subsys_unregister(&nf_tables_subsys);
4878 rcu_barrier();
4879 nf_tables_core_module_exit();
4880 kfree(info);
4881 }
4882
4883 module_init(nf_tables_module_init);
4884 module_exit(nf_tables_module_exit);
4885
4886 MODULE_LICENSE("GPL");
4887 MODULE_AUTHOR("Patrick McHardy <kaber@trash.net>");
4888 MODULE_ALIAS_NFNL_SUBSYS(NFNL_SUBSYS_NFTABLES);