]> git.proxmox.com Git - mirror_ubuntu-jammy-kernel.git/blame - net/netfilter/nf_tables_api.c
netfilter: x_tables: check name length in find_match/target, too
[mirror_ubuntu-jammy-kernel.git] / net / netfilter / nf_tables_api.c
CommitLineData
96518518 1/*
20a69341 2 * Copyright (c) 2007-2009 Patrick McHardy <kaber@trash.net>
96518518
PM
3 *
4 * This program is free software; you can redistribute it and/or modify
5 * it under the terms of the GNU General Public License version 2 as
6 * published by the Free Software Foundation.
7 *
8 * Development of this code funded by Astaro AG (http://www.astaro.com/)
9 */
10
11#include <linux/module.h>
12#include <linux/init.h>
13#include <linux/list.h>
14#include <linux/skbuff.h>
15#include <linux/netlink.h>
1ff75a3e 16#include <linux/vmalloc.h>
96518518
PM
17#include <linux/netfilter.h>
18#include <linux/netfilter/nfnetlink.h>
19#include <linux/netfilter/nf_tables.h>
3b49e2e9 20#include <net/netfilter/nf_flow_table.h>
96518518
PM
21#include <net/netfilter/nf_tables_core.h>
22#include <net/netfilter/nf_tables.h>
99633ab2 23#include <net/net_namespace.h>
96518518
PM
24#include <net/sock.h>
25
96518518 26static LIST_HEAD(nf_tables_expressions);
e5009240 27static LIST_HEAD(nf_tables_objects);
3b49e2e9 28static LIST_HEAD(nf_tables_flowtables);
3ecbfd65 29static u64 table_handle;
96518518 30
7c95f6d8 31static void nft_ctx_init(struct nft_ctx *ctx,
633c9a84 32 struct net *net,
7c95f6d8
PNA
33 const struct sk_buff *skb,
34 const struct nlmsghdr *nlh,
36596dad 35 u8 family,
7c95f6d8
PNA
36 struct nft_table *table,
37 struct nft_chain *chain,
38 const struct nlattr * const *nla)
39{
633c9a84 40 ctx->net = net;
36596dad 41 ctx->family = family;
128ad332
PNA
42 ctx->table = table;
43 ctx->chain = chain;
44 ctx->nla = nla;
45 ctx->portid = NETLINK_CB(skb).portid;
46 ctx->report = nlmsg_report(nlh);
47 ctx->seq = nlh->nlmsg_seq;
7c95f6d8
PNA
48}
49
8411b644
PNA
50static struct nft_trans *nft_trans_alloc_gfp(const struct nft_ctx *ctx,
51 int msg_type, u32 size, gfp_t gfp)
1081d11b
PNA
52{
53 struct nft_trans *trans;
54
8411b644 55 trans = kzalloc(sizeof(struct nft_trans) + size, gfp);
1081d11b
PNA
56 if (trans == NULL)
57 return NULL;
58
b380e5c7 59 trans->msg_type = msg_type;
1081d11b
PNA
60 trans->ctx = *ctx;
61
62 return trans;
63}
64
8411b644
PNA
65static struct nft_trans *nft_trans_alloc(const struct nft_ctx *ctx,
66 int msg_type, u32 size)
67{
68 return nft_trans_alloc_gfp(ctx, msg_type, size, GFP_KERNEL);
69}
70
1081d11b
PNA
71static void nft_trans_destroy(struct nft_trans *trans)
72{
73 list_del(&trans->list);
74 kfree(trans);
75}
76
ae6153b5
FW
77/* removal requests are queued in the commit_list, but not acted upon
78 * until after all new rules are in place.
79 *
80 * Therefore, nf_register_net_hook(net, &nat_hook) runs before pending
81 * nf_unregister_net_hook().
82 *
83 * nf_register_net_hook thus fails if a nat hook is already in place
84 * even if the conflicting hook is about to be removed.
85 *
86 * If collision is detected, search commit_log for DELCHAIN matching
87 * the new nat hooknum; if we find one collision is temporary:
88 *
89 * Either transaction is aborted (new/colliding hook is removed), or
90 * transaction is committed (old hook is removed).
91 */
92static bool nf_tables_allow_nat_conflict(const struct net *net,
93 const struct nf_hook_ops *ops)
94{
95 const struct nft_trans *trans;
96 bool ret = false;
97
98 if (!ops->nat_hook)
99 return false;
100
101 list_for_each_entry(trans, &net->nft.commit_list, list) {
102 const struct nf_hook_ops *pending_ops;
103 const struct nft_chain *pending;
104
105 if (trans->msg_type != NFT_MSG_NEWCHAIN &&
106 trans->msg_type != NFT_MSG_DELCHAIN)
107 continue;
108
109 pending = trans->ctx.chain;
110 if (!nft_is_base_chain(pending))
111 continue;
112
113 pending_ops = &nft_base_chain(pending)->ops;
114 if (pending_ops->nat_hook &&
115 pending_ops->pf == ops->pf &&
116 pending_ops->hooknum == ops->hooknum) {
117 /* other hook registration already pending? */
118 if (trans->msg_type == NFT_MSG_NEWCHAIN)
119 return false;
120
121 ret = true;
122 }
123 }
124
125 return ret;
126}
127
c974a3a3
PNA
128static int nf_tables_register_hook(struct net *net,
129 const struct nft_table *table,
130 struct nft_chain *chain)
d8ee8f7c 131{
ae6153b5
FW
132 struct nf_hook_ops *ops;
133 int ret;
134
d8ee8f7c 135 if (table->flags & NFT_TABLE_F_DORMANT ||
f323d954 136 !nft_is_base_chain(chain))
d8ee8f7c
PNA
137 return 0;
138
ae6153b5
FW
139 ops = &nft_base_chain(chain)->ops;
140 ret = nf_register_net_hook(net, ops);
141 if (ret == -EBUSY && nf_tables_allow_nat_conflict(net, ops)) {
142 ops->nat_hook = false;
143 ret = nf_register_net_hook(net, ops);
144 ops->nat_hook = true;
145 }
146
147 return ret;
d8ee8f7c
PNA
148}
149
c974a3a3
PNA
150static void nf_tables_unregister_hook(struct net *net,
151 const struct nft_table *table,
152 struct nft_chain *chain)
c5598794 153{
d8ee8f7c 154 if (table->flags & NFT_TABLE_F_DORMANT ||
f323d954 155 !nft_is_base_chain(chain))
d8ee8f7c
PNA
156 return;
157
c974a3a3 158 nf_unregister_net_hook(net, &nft_base_chain(chain)->ops);
c5598794
AB
159}
160
ee01d542
AB
161static int nft_trans_table_add(struct nft_ctx *ctx, int msg_type)
162{
163 struct nft_trans *trans;
164
165 trans = nft_trans_alloc(ctx, msg_type, sizeof(struct nft_trans_table));
166 if (trans == NULL)
167 return -ENOMEM;
168
169 if (msg_type == NFT_MSG_NEWTABLE)
f2a6d766 170 nft_activate_next(ctx->net, ctx->table);
ee01d542
AB
171
172 list_add_tail(&trans->list, &ctx->net->nft.commit_list);
173 return 0;
174}
175
176static int nft_deltable(struct nft_ctx *ctx)
177{
178 int err;
179
180 err = nft_trans_table_add(ctx, NFT_MSG_DELTABLE);
181 if (err < 0)
182 return err;
183
f2a6d766 184 nft_deactivate_next(ctx->net, ctx->table);
ee01d542
AB
185 return err;
186}
187
188static int nft_trans_chain_add(struct nft_ctx *ctx, int msg_type)
189{
190 struct nft_trans *trans;
191
192 trans = nft_trans_alloc(ctx, msg_type, sizeof(struct nft_trans_chain));
193 if (trans == NULL)
194 return -ENOMEM;
195
196 if (msg_type == NFT_MSG_NEWCHAIN)
664b0f8c 197 nft_activate_next(ctx->net, ctx->chain);
ee01d542
AB
198
199 list_add_tail(&trans->list, &ctx->net->nft.commit_list);
200 return 0;
201}
202
203static int nft_delchain(struct nft_ctx *ctx)
204{
205 int err;
206
207 err = nft_trans_chain_add(ctx, NFT_MSG_DELCHAIN);
208 if (err < 0)
209 return err;
210
211 ctx->table->use--;
664b0f8c 212 nft_deactivate_next(ctx->net, ctx->chain);
ee01d542
AB
213
214 return err;
215}
216
ee01d542
AB
217static int
218nf_tables_delrule_deactivate(struct nft_ctx *ctx, struct nft_rule *rule)
219{
220 /* You cannot delete the same rule twice */
889f7ee7
PNA
221 if (nft_is_active_next(ctx->net, rule)) {
222 nft_deactivate_next(ctx->net, rule);
ee01d542
AB
223 ctx->chain->use--;
224 return 0;
225 }
226 return -ENOENT;
227}
228
229static struct nft_trans *nft_trans_rule_add(struct nft_ctx *ctx, int msg_type,
230 struct nft_rule *rule)
231{
232 struct nft_trans *trans;
233
234 trans = nft_trans_alloc(ctx, msg_type, sizeof(struct nft_trans_rule));
235 if (trans == NULL)
236 return NULL;
237
1a94e38d
PNA
238 if (msg_type == NFT_MSG_NEWRULE && ctx->nla[NFTA_RULE_ID] != NULL) {
239 nft_trans_rule_id(trans) =
240 ntohl(nla_get_be32(ctx->nla[NFTA_RULE_ID]));
241 }
ee01d542
AB
242 nft_trans_rule(trans) = rule;
243 list_add_tail(&trans->list, &ctx->net->nft.commit_list);
244
245 return trans;
246}
247
248static int nft_delrule(struct nft_ctx *ctx, struct nft_rule *rule)
249{
250 struct nft_trans *trans;
251 int err;
252
253 trans = nft_trans_rule_add(ctx, NFT_MSG_DELRULE, rule);
254 if (trans == NULL)
255 return -ENOMEM;
256
257 err = nf_tables_delrule_deactivate(ctx, rule);
258 if (err < 0) {
259 nft_trans_destroy(trans);
260 return err;
261 }
262
263 return 0;
264}
265
266static int nft_delrule_by_chain(struct nft_ctx *ctx)
267{
268 struct nft_rule *rule;
269 int err;
270
271 list_for_each_entry(rule, &ctx->chain->rules, list) {
272 err = nft_delrule(ctx, rule);
273 if (err < 0)
274 return err;
275 }
276 return 0;
277}
278
ee01d542
AB
279static int nft_trans_set_add(struct nft_ctx *ctx, int msg_type,
280 struct nft_set *set)
281{
282 struct nft_trans *trans;
283
284 trans = nft_trans_alloc(ctx, msg_type, sizeof(struct nft_trans_set));
285 if (trans == NULL)
286 return -ENOMEM;
287
288 if (msg_type == NFT_MSG_NEWSET && ctx->nla[NFTA_SET_ID] != NULL) {
289 nft_trans_set_id(trans) =
290 ntohl(nla_get_be32(ctx->nla[NFTA_SET_ID]));
37a9cc52 291 nft_activate_next(ctx->net, set);
ee01d542
AB
292 }
293 nft_trans_set(trans) = set;
294 list_add_tail(&trans->list, &ctx->net->nft.commit_list);
295
296 return 0;
297}
298
299static int nft_delset(struct nft_ctx *ctx, struct nft_set *set)
300{
301 int err;
302
303 err = nft_trans_set_add(ctx, NFT_MSG_DELSET, set);
304 if (err < 0)
305 return err;
306
37a9cc52 307 nft_deactivate_next(ctx->net, set);
ee01d542
AB
308 ctx->table->use--;
309
310 return err;
311}
312
e5009240
PNA
313static int nft_trans_obj_add(struct nft_ctx *ctx, int msg_type,
314 struct nft_object *obj)
315{
316 struct nft_trans *trans;
317
318 trans = nft_trans_alloc(ctx, msg_type, sizeof(struct nft_trans_obj));
319 if (trans == NULL)
320 return -ENOMEM;
321
322 if (msg_type == NFT_MSG_NEWOBJ)
323 nft_activate_next(ctx->net, obj);
324
325 nft_trans_obj(trans) = obj;
326 list_add_tail(&trans->list, &ctx->net->nft.commit_list);
327
328 return 0;
329}
330
331static int nft_delobj(struct nft_ctx *ctx, struct nft_object *obj)
332{
333 int err;
334
335 err = nft_trans_obj_add(ctx, NFT_MSG_DELOBJ, obj);
336 if (err < 0)
337 return err;
338
339 nft_deactivate_next(ctx->net, obj);
340 ctx->table->use--;
341
342 return err;
343}
344
3b49e2e9
PNA
345static int nft_trans_flowtable_add(struct nft_ctx *ctx, int msg_type,
346 struct nft_flowtable *flowtable)
347{
348 struct nft_trans *trans;
349
350 trans = nft_trans_alloc(ctx, msg_type,
351 sizeof(struct nft_trans_flowtable));
352 if (trans == NULL)
353 return -ENOMEM;
354
355 if (msg_type == NFT_MSG_NEWFLOWTABLE)
356 nft_activate_next(ctx->net, flowtable);
357
358 nft_trans_flowtable(trans) = flowtable;
359 list_add_tail(&trans->list, &ctx->net->nft.commit_list);
360
361 return 0;
362}
363
364static int nft_delflowtable(struct nft_ctx *ctx,
365 struct nft_flowtable *flowtable)
366{
367 int err;
368
369 err = nft_trans_flowtable_add(ctx, NFT_MSG_DELFLOWTABLE, flowtable);
370 if (err < 0)
371 return err;
372
373 nft_deactivate_next(ctx->net, flowtable);
374 ctx->table->use--;
375
376 return err;
377}
378
96518518
PM
379/*
380 * Tables
381 */
382
36596dad 383static struct nft_table *nft_table_lookup(const struct net *net,
f2a6d766 384 const struct nlattr *nla,
36596dad 385 u8 family, u8 genmask)
96518518
PM
386{
387 struct nft_table *table;
388
36596dad 389 list_for_each_entry(table, &net->nft.tables, list) {
f2a6d766 390 if (!nla_strcmp(nla, table->name) &&
98319cb9 391 table->family == family &&
f2a6d766 392 nft_active_genmask(table, genmask))
96518518
PM
393 return table;
394 }
395 return NULL;
396}
397
3ecbfd65
HS
398static struct nft_table *nft_table_lookup_byhandle(const struct net *net,
399 const struct nlattr *nla,
400 u8 genmask)
401{
402 struct nft_table *table;
403
404 list_for_each_entry(table, &net->nft.tables, list) {
405 if (be64_to_cpu(nla_get_be64(nla)) == table->handle &&
406 nft_active_genmask(table, genmask))
407 return table;
408 }
409 return NULL;
410}
411
36596dad 412static struct nft_table *nf_tables_table_lookup(const struct net *net,
f2a6d766 413 const struct nlattr *nla,
36596dad 414 u8 family, u8 genmask)
96518518
PM
415{
416 struct nft_table *table;
417
418 if (nla == NULL)
419 return ERR_PTR(-EINVAL);
420
36596dad 421 table = nft_table_lookup(net, nla, family, genmask);
96518518
PM
422 if (table != NULL)
423 return table;
424
96518518
PM
425 return ERR_PTR(-ENOENT);
426}
427
3ecbfd65
HS
428static struct nft_table *nf_tables_table_lookup_byhandle(const struct net *net,
429 const struct nlattr *nla,
430 u8 genmask)
431{
432 struct nft_table *table;
433
434 if (nla == NULL)
435 return ERR_PTR(-EINVAL);
436
437 table = nft_table_lookup_byhandle(net, nla, genmask);
438 if (table != NULL)
439 return table;
440
441 return ERR_PTR(-ENOENT);
442}
443
96518518
PM
444static inline u64 nf_tables_alloc_handle(struct nft_table *table)
445{
446 return ++table->hgenerator;
447}
448
32537e91 449static const struct nft_chain_type *chain_type[NFPROTO_NUMPROTO][NFT_CHAIN_T_MAX];
9370761c 450
32537e91 451static const struct nft_chain_type *
1ea26cca 452__nf_tables_chain_type_lookup(const struct nlattr *nla, u8 family)
9370761c
PNA
453{
454 int i;
455
baae3e62 456 for (i = 0; i < NFT_CHAIN_T_MAX; i++) {
9370761c
PNA
457 if (chain_type[family][i] != NULL &&
458 !nla_strcmp(nla, chain_type[family][i]->name))
baae3e62 459 return chain_type[family][i];
9370761c 460 }
baae3e62 461 return NULL;
9370761c
PNA
462}
463
32537e91 464static const struct nft_chain_type *
1ea26cca 465nf_tables_chain_type_lookup(const struct nlattr *nla, u8 family, bool autoload)
9370761c 466{
32537e91 467 const struct nft_chain_type *type;
9370761c 468
1ea26cca 469 type = __nf_tables_chain_type_lookup(nla, family);
93b0806f
PM
470 if (type != NULL)
471 return type;
9370761c 472#ifdef CONFIG_MODULES
93b0806f 473 if (autoload) {
9370761c 474 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
1ea26cca 475 request_module("nft-chain-%u-%.*s", family,
2fec6bb6 476 nla_len(nla), (const char *)nla_data(nla));
9370761c 477 nfnl_lock(NFNL_SUBSYS_NFTABLES);
1ea26cca 478 type = __nf_tables_chain_type_lookup(nla, family);
93b0806f
PM
479 if (type != NULL)
480 return ERR_PTR(-EAGAIN);
9370761c
PNA
481 }
482#endif
93b0806f 483 return ERR_PTR(-ENOENT);
9370761c
PNA
484}
485
96518518 486static const struct nla_policy nft_table_policy[NFTA_TABLE_MAX + 1] = {
1cae565e
PNA
487 [NFTA_TABLE_NAME] = { .type = NLA_STRING,
488 .len = NFT_TABLE_MAXNAMELEN - 1 },
9ddf6323 489 [NFTA_TABLE_FLAGS] = { .type = NLA_U32 },
3ecbfd65 490 [NFTA_TABLE_HANDLE] = { .type = NLA_U64 },
96518518
PM
491};
492
84d7fce6
PNA
493static int nf_tables_fill_table_info(struct sk_buff *skb, struct net *net,
494 u32 portid, u32 seq, int event, u32 flags,
495 int family, const struct nft_table *table)
96518518
PM
496{
497 struct nlmsghdr *nlh;
498 struct nfgenmsg *nfmsg;
499
dedb67c4 500 event = nfnl_msg_type(NFNL_SUBSYS_NFTABLES, event);
96518518
PM
501 nlh = nlmsg_put(skb, portid, seq, event, sizeof(struct nfgenmsg), flags);
502 if (nlh == NULL)
503 goto nla_put_failure;
504
505 nfmsg = nlmsg_data(nlh);
506 nfmsg->nfgen_family = family;
507 nfmsg->version = NFNETLINK_V0;
84d7fce6 508 nfmsg->res_id = htons(net->nft.base_seq & 0xffff);
96518518 509
9ddf6323 510 if (nla_put_string(skb, NFTA_TABLE_NAME, table->name) ||
d8bcc768 511 nla_put_be32(skb, NFTA_TABLE_FLAGS, htonl(table->flags)) ||
3ecbfd65
HS
512 nla_put_be32(skb, NFTA_TABLE_USE, htonl(table->use)) ||
513 nla_put_be64(skb, NFTA_TABLE_HANDLE, cpu_to_be64(table->handle),
514 NFTA_TABLE_PAD))
96518518
PM
515 goto nla_put_failure;
516
053c095a
JB
517 nlmsg_end(skb, nlh);
518 return 0;
96518518
PM
519
520nla_put_failure:
521 nlmsg_trim(skb, nlh);
522 return -1;
523}
524
25e94a99 525static void nf_tables_table_notify(const struct nft_ctx *ctx, int event)
96518518
PM
526{
527 struct sk_buff *skb;
96518518
PM
528 int err;
529
128ad332
PNA
530 if (!ctx->report &&
531 !nfnetlink_has_listeners(ctx->net, NFNLGRP_NFTABLES))
25e94a99 532 return;
96518518 533
96518518
PM
534 skb = nlmsg_new(NLMSG_GOODSIZE, GFP_KERNEL);
535 if (skb == NULL)
536 goto err;
537
84d7fce6 538 err = nf_tables_fill_table_info(skb, ctx->net, ctx->portid, ctx->seq,
36596dad 539 event, 0, ctx->family, ctx->table);
96518518
PM
540 if (err < 0) {
541 kfree_skb(skb);
542 goto err;
543 }
544
25e94a99
PNA
545 nfnetlink_send(skb, ctx->net, ctx->portid, NFNLGRP_NFTABLES,
546 ctx->report, GFP_KERNEL);
547 return;
96518518 548err:
25e94a99 549 nfnetlink_set_err(ctx->net, ctx->portid, NFNLGRP_NFTABLES, -ENOBUFS);
96518518
PM
550}
551
552static int nf_tables_dump_tables(struct sk_buff *skb,
553 struct netlink_callback *cb)
554{
555 const struct nfgenmsg *nfmsg = nlmsg_data(cb->nlh);
96518518
PM
556 const struct nft_table *table;
557 unsigned int idx = 0, s_idx = cb->args[0];
99633ab2 558 struct net *net = sock_net(skb->sk);
96518518
PM
559 int family = nfmsg->nfgen_family;
560
e688a7f8 561 rcu_read_lock();
38e029f1
PNA
562 cb->seq = net->nft.base_seq;
563
36596dad 564 list_for_each_entry_rcu(table, &net->nft.tables, list) {
98319cb9 565 if (family != NFPROTO_UNSPEC && family != table->family)
96518518
PM
566 continue;
567
36596dad
PNA
568 if (idx < s_idx)
569 goto cont;
570 if (idx > s_idx)
571 memset(&cb->args[1], 0,
572 sizeof(cb->args) - sizeof(cb->args[0]));
573 if (!nft_is_active(net, table))
574 continue;
575 if (nf_tables_fill_table_info(skb, net,
576 NETLINK_CB(cb->skb).portid,
577 cb->nlh->nlmsg_seq,
578 NFT_MSG_NEWTABLE, NLM_F_MULTI,
98319cb9 579 table->family, table) < 0)
36596dad
PNA
580 goto done;
581
582 nl_dump_check_consistent(cb, nlmsg_hdr(skb));
96518518 583cont:
36596dad 584 idx++;
96518518
PM
585 }
586done:
e688a7f8 587 rcu_read_unlock();
96518518
PM
588 cb->args[0] = idx;
589 return skb->len;
590}
591
7b8002a1
PNA
592static int nf_tables_gettable(struct net *net, struct sock *nlsk,
593 struct sk_buff *skb, const struct nlmsghdr *nlh,
04ba724b
PNA
594 const struct nlattr * const nla[],
595 struct netlink_ext_ack *extack)
96518518
PM
596{
597 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
f2a6d766 598 u8 genmask = nft_genmask_cur(net);
96518518
PM
599 const struct nft_table *table;
600 struct sk_buff *skb2;
601 int family = nfmsg->nfgen_family;
602 int err;
603
604 if (nlh->nlmsg_flags & NLM_F_DUMP) {
605 struct netlink_dump_control c = {
606 .dump = nf_tables_dump_tables,
607 };
608 return netlink_dump_start(nlsk, skb, nlh, &c);
609 }
610
98319cb9 611 table = nf_tables_table_lookup(net, nla[NFTA_TABLE_NAME], family,
36596dad 612 genmask);
96518518
PM
613 if (IS_ERR(table))
614 return PTR_ERR(table);
615
616 skb2 = alloc_skb(NLMSG_GOODSIZE, GFP_KERNEL);
617 if (!skb2)
618 return -ENOMEM;
619
84d7fce6 620 err = nf_tables_fill_table_info(skb2, net, NETLINK_CB(skb).portid,
96518518
PM
621 nlh->nlmsg_seq, NFT_MSG_NEWTABLE, 0,
622 family, table);
623 if (err < 0)
624 goto err;
625
626 return nlmsg_unicast(nlsk, skb2, NETLINK_CB(skb).portid);
627
628err:
629 kfree_skb(skb2);
630 return err;
631}
632
c9c17211 633static void nft_table_disable(struct net *net, struct nft_table *table, u32 cnt)
10435c11
F
634{
635 struct nft_chain *chain;
636 u32 i = 0;
637
638 list_for_each_entry(chain, &table->chains, list) {
639 if (!nft_is_active_next(net, chain))
640 continue;
f323d954 641 if (!nft_is_base_chain(chain))
10435c11
F
642 continue;
643
644 if (cnt && i++ == cnt)
645 break;
646
c974a3a3 647 nf_unregister_net_hook(net, &nft_base_chain(chain)->ops);
10435c11
F
648 }
649}
650
c9c17211 651static int nf_tables_table_enable(struct net *net, struct nft_table *table)
9ddf6323
PNA
652{
653 struct nft_chain *chain;
654 int err, i = 0;
655
656 list_for_each_entry(chain, &table->chains, list) {
664b0f8c
PNA
657 if (!nft_is_active_next(net, chain))
658 continue;
f323d954 659 if (!nft_is_base_chain(chain))
d2012975
PNA
660 continue;
661
c974a3a3 662 err = nf_register_net_hook(net, &nft_base_chain(chain)->ops);
9ddf6323
PNA
663 if (err < 0)
664 goto err;
665
666 i++;
667 }
668 return 0;
669err:
10435c11 670 if (i)
c9c17211 671 nft_table_disable(net, table, i);
9ddf6323
PNA
672 return err;
673}
674
c9c17211 675static void nf_tables_table_disable(struct net *net, struct nft_table *table)
9ddf6323 676{
c9c17211 677 nft_table_disable(net, table, 0);
9ddf6323
PNA
678}
679
e1aaca93 680static int nf_tables_updtable(struct nft_ctx *ctx)
9ddf6323 681{
55dd6f93 682 struct nft_trans *trans;
e1aaca93 683 u32 flags;
55dd6f93 684 int ret = 0;
9ddf6323 685
e1aaca93
PNA
686 if (!ctx->nla[NFTA_TABLE_FLAGS])
687 return 0;
9ddf6323 688
e1aaca93
PNA
689 flags = ntohl(nla_get_be32(ctx->nla[NFTA_TABLE_FLAGS]));
690 if (flags & ~NFT_TABLE_F_DORMANT)
691 return -EINVAL;
692
63283dd2
PNA
693 if (flags == ctx->table->flags)
694 return 0;
695
55dd6f93
PNA
696 trans = nft_trans_alloc(ctx, NFT_MSG_NEWTABLE,
697 sizeof(struct nft_trans_table));
698 if (trans == NULL)
699 return -ENOMEM;
9ddf6323 700
e1aaca93
PNA
701 if ((flags & NFT_TABLE_F_DORMANT) &&
702 !(ctx->table->flags & NFT_TABLE_F_DORMANT)) {
55dd6f93 703 nft_trans_table_enable(trans) = false;
e1aaca93
PNA
704 } else if (!(flags & NFT_TABLE_F_DORMANT) &&
705 ctx->table->flags & NFT_TABLE_F_DORMANT) {
c9c17211 706 ret = nf_tables_table_enable(ctx->net, ctx->table);
55dd6f93 707 if (ret >= 0) {
e1aaca93 708 ctx->table->flags &= ~NFT_TABLE_F_DORMANT;
55dd6f93 709 nft_trans_table_enable(trans) = true;
9ddf6323 710 }
9ddf6323 711 }
e1aaca93
PNA
712 if (ret < 0)
713 goto err;
9ddf6323 714
55dd6f93
PNA
715 nft_trans_table_update(trans) = true;
716 list_add_tail(&trans->list, &ctx->net->nft.commit_list);
717 return 0;
9ddf6323 718err:
55dd6f93 719 nft_trans_destroy(trans);
9ddf6323
PNA
720 return ret;
721}
722
633c9a84
PNA
723static int nf_tables_newtable(struct net *net, struct sock *nlsk,
724 struct sk_buff *skb, const struct nlmsghdr *nlh,
04ba724b
PNA
725 const struct nlattr * const nla[],
726 struct netlink_ext_ack *extack)
96518518
PM
727{
728 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
f2a6d766 729 u8 genmask = nft_genmask_next(net);
96518518 730 const struct nlattr *name;
96518518
PM
731 struct nft_table *table;
732 int family = nfmsg->nfgen_family;
c5c1f975 733 u32 flags = 0;
e1aaca93 734 struct nft_ctx ctx;
55dd6f93 735 int err;
96518518 736
96518518 737 name = nla[NFTA_TABLE_NAME];
98319cb9 738 table = nf_tables_table_lookup(net, name, family, genmask);
96518518
PM
739 if (IS_ERR(table)) {
740 if (PTR_ERR(table) != -ENOENT)
741 return PTR_ERR(table);
1a28ad74 742 } else {
96518518
PM
743 if (nlh->nlmsg_flags & NLM_F_EXCL)
744 return -EEXIST;
745 if (nlh->nlmsg_flags & NLM_F_REPLACE)
746 return -EOPNOTSUPP;
e1aaca93 747
98319cb9 748 nft_ctx_init(&ctx, net, skb, nlh, family, table, NULL, nla);
e1aaca93 749 return nf_tables_updtable(&ctx);
96518518
PM
750 }
751
c5c1f975
PM
752 if (nla[NFTA_TABLE_FLAGS]) {
753 flags = ntohl(nla_get_be32(nla[NFTA_TABLE_FLAGS]));
754 if (flags & ~NFT_TABLE_F_DORMANT)
755 return -EINVAL;
756 }
757
ffdb210e 758 err = -ENOMEM;
1cae565e 759 table = kzalloc(sizeof(*table), GFP_KERNEL);
ffdb210e 760 if (table == NULL)
98319cb9 761 goto err_kzalloc;
96518518 762
e46abbcc
PS
763 table->name = nla_strdup(name, GFP_KERNEL);
764 if (table->name == NULL)
98319cb9 765 goto err_strdup;
e46abbcc 766
96518518 767 INIT_LIST_HEAD(&table->chains);
20a69341 768 INIT_LIST_HEAD(&table->sets);
e5009240 769 INIT_LIST_HEAD(&table->objects);
3b49e2e9 770 INIT_LIST_HEAD(&table->flowtables);
98319cb9 771 table->family = family;
c5c1f975 772 table->flags = flags;
3ecbfd65 773 table->handle = ++table_handle;
9ddf6323 774
98319cb9 775 nft_ctx_init(&ctx, net, skb, nlh, family, table, NULL, nla);
55dd6f93 776 err = nft_trans_table_add(&ctx, NFT_MSG_NEWTABLE);
ffdb210e 777 if (err < 0)
98319cb9 778 goto err_trans;
ffdb210e 779
36596dad 780 list_add_tail_rcu(&table->list, &net->nft.tables);
96518518 781 return 0;
98319cb9 782err_trans:
e46abbcc 783 kfree(table->name);
98319cb9 784err_strdup:
ffdb210e 785 kfree(table);
98319cb9 786err_kzalloc:
ffdb210e 787 return err;
96518518
PM
788}
789
b9ac12ef
AB
790static int nft_flush_table(struct nft_ctx *ctx)
791{
3b49e2e9 792 struct nft_flowtable *flowtable, *nft;
b9ac12ef 793 struct nft_chain *chain, *nc;
e5009240 794 struct nft_object *obj, *ne;
b9ac12ef 795 struct nft_set *set, *ns;
3b49e2e9 796 int err;
b9ac12ef 797
a2f18db0 798 list_for_each_entry(chain, &ctx->table->chains, list) {
664b0f8c
PNA
799 if (!nft_is_active_next(ctx->net, chain))
800 continue;
801
b9ac12ef
AB
802 ctx->chain = chain;
803
804 err = nft_delrule_by_chain(ctx);
805 if (err < 0)
806 goto out;
b9ac12ef
AB
807 }
808
809 list_for_each_entry_safe(set, ns, &ctx->table->sets, list) {
37a9cc52
PNA
810 if (!nft_is_active_next(ctx->net, set))
811 continue;
812
408070d6 813 if (nft_set_is_anonymous(set) &&
b9ac12ef
AB
814 !list_empty(&set->bindings))
815 continue;
816
817 err = nft_delset(ctx, set);
818 if (err < 0)
819 goto out;
820 }
821
3b49e2e9
PNA
822 list_for_each_entry_safe(flowtable, nft, &ctx->table->flowtables, list) {
823 err = nft_delflowtable(ctx, flowtable);
824 if (err < 0)
825 goto out;
826 }
827
e5009240
PNA
828 list_for_each_entry_safe(obj, ne, &ctx->table->objects, list) {
829 err = nft_delobj(ctx, obj);
830 if (err < 0)
831 goto out;
832 }
833
a2f18db0 834 list_for_each_entry_safe(chain, nc, &ctx->table->chains, list) {
664b0f8c
PNA
835 if (!nft_is_active_next(ctx->net, chain))
836 continue;
837
a2f18db0
PNA
838 ctx->chain = chain;
839
840 err = nft_delchain(ctx);
841 if (err < 0)
842 goto out;
843 }
844
b9ac12ef
AB
845 err = nft_deltable(ctx);
846out:
847 return err;
848}
849
850static int nft_flush(struct nft_ctx *ctx, int family)
851{
b9ac12ef
AB
852 struct nft_table *table, *nt;
853 const struct nlattr * const *nla = ctx->nla;
854 int err = 0;
855
36596dad 856 list_for_each_entry_safe(table, nt, &ctx->net->nft.tables, list) {
98319cb9 857 if (family != AF_UNSPEC && table->family != family)
b9ac12ef
AB
858 continue;
859
98319cb9 860 ctx->family = table->family;
f2a6d766 861
36596dad
PNA
862 if (!nft_is_active_next(ctx->net, table))
863 continue;
b9ac12ef 864
36596dad
PNA
865 if (nla[NFTA_TABLE_NAME] &&
866 nla_strcmp(nla[NFTA_TABLE_NAME], table->name) != 0)
867 continue;
b9ac12ef 868
36596dad
PNA
869 ctx->table = table;
870
871 err = nft_flush_table(ctx);
872 if (err < 0)
873 goto out;
b9ac12ef
AB
874 }
875out:
876 return err;
877}
878
633c9a84
PNA
879static int nf_tables_deltable(struct net *net, struct sock *nlsk,
880 struct sk_buff *skb, const struct nlmsghdr *nlh,
04ba724b
PNA
881 const struct nlattr * const nla[],
882 struct netlink_ext_ack *extack)
96518518
PM
883{
884 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
f2a6d766 885 u8 genmask = nft_genmask_next(net);
96518518 886 struct nft_table *table;
ee01d542 887 int family = nfmsg->nfgen_family;
55dd6f93 888 struct nft_ctx ctx;
96518518 889
36596dad 890 nft_ctx_init(&ctx, net, skb, nlh, 0, NULL, NULL, nla);
3ecbfd65
HS
891 if (family == AF_UNSPEC ||
892 (!nla[NFTA_TABLE_NAME] && !nla[NFTA_TABLE_HANDLE]))
b9ac12ef
AB
893 return nft_flush(&ctx, family);
894
3ecbfd65
HS
895 if (nla[NFTA_TABLE_HANDLE])
896 table = nf_tables_table_lookup_byhandle(net,
897 nla[NFTA_TABLE_HANDLE],
898 genmask);
899 else
900 table = nf_tables_table_lookup(net, nla[NFTA_TABLE_NAME],
901 family, genmask);
902
96518518
PM
903 if (IS_ERR(table))
904 return PTR_ERR(table);
96518518 905
a8278400
PNA
906 if (nlh->nlmsg_flags & NLM_F_NONREC &&
907 table->use > 0)
908 return -EBUSY;
909
98319cb9 910 ctx.family = family;
b9ac12ef 911 ctx.table = table;
55dd6f93 912
b9ac12ef 913 return nft_flush_table(&ctx);
96518518
PM
914}
915
55dd6f93
PNA
916static void nf_tables_table_destroy(struct nft_ctx *ctx)
917{
4fefee57
PNA
918 BUG_ON(ctx->table->use > 0);
919
e46abbcc 920 kfree(ctx->table->name);
55dd6f93 921 kfree(ctx->table);
55dd6f93
PNA
922}
923
cc07eeb0 924void nft_register_chain_type(const struct nft_chain_type *ctype)
96518518 925{
d8297d4f 926 if (WARN_ON(ctype->family >= NFPROTO_NUMPROTO))
cc07eeb0 927 return;
d8297d4f 928
96518518 929 nfnl_lock(NFNL_SUBSYS_NFTABLES);
cc07eeb0
PNA
930 if (WARN_ON(chain_type[ctype->family][ctype->type] != NULL)) {
931 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
932 return;
96518518 933 }
9370761c 934 chain_type[ctype->family][ctype->type] = ctype;
96518518 935 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
96518518 936}
9370761c 937EXPORT_SYMBOL_GPL(nft_register_chain_type);
96518518 938
32537e91 939void nft_unregister_chain_type(const struct nft_chain_type *ctype)
96518518 940{
96518518 941 nfnl_lock(NFNL_SUBSYS_NFTABLES);
9370761c 942 chain_type[ctype->family][ctype->type] = NULL;
96518518
PM
943 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
944}
9370761c 945EXPORT_SYMBOL_GPL(nft_unregister_chain_type);
96518518
PM
946
947/*
948 * Chains
949 */
950
951static struct nft_chain *
664b0f8c
PNA
952nf_tables_chain_lookup_byhandle(const struct nft_table *table, u64 handle,
953 u8 genmask)
96518518
PM
954{
955 struct nft_chain *chain;
956
957 list_for_each_entry(chain, &table->chains, list) {
664b0f8c
PNA
958 if (chain->handle == handle &&
959 nft_active_genmask(chain, genmask))
96518518
PM
960 return chain;
961 }
962
963 return ERR_PTR(-ENOENT);
964}
965
966static struct nft_chain *nf_tables_chain_lookup(const struct nft_table *table,
664b0f8c
PNA
967 const struct nlattr *nla,
968 u8 genmask)
96518518
PM
969{
970 struct nft_chain *chain;
971
972 if (nla == NULL)
973 return ERR_PTR(-EINVAL);
974
975 list_for_each_entry(chain, &table->chains, list) {
664b0f8c
PNA
976 if (!nla_strcmp(nla, chain->name) &&
977 nft_active_genmask(chain, genmask))
96518518
PM
978 return chain;
979 }
980
981 return ERR_PTR(-ENOENT);
982}
983
984static const struct nla_policy nft_chain_policy[NFTA_CHAIN_MAX + 1] = {
b2fbd044
LZ
985 [NFTA_CHAIN_TABLE] = { .type = NLA_STRING,
986 .len = NFT_TABLE_MAXNAMELEN - 1 },
96518518
PM
987 [NFTA_CHAIN_HANDLE] = { .type = NLA_U64 },
988 [NFTA_CHAIN_NAME] = { .type = NLA_STRING,
989 .len = NFT_CHAIN_MAXNAMELEN - 1 },
990 [NFTA_CHAIN_HOOK] = { .type = NLA_NESTED },
0ca743a5 991 [NFTA_CHAIN_POLICY] = { .type = NLA_U32 },
4c1f7818 992 [NFTA_CHAIN_TYPE] = { .type = NLA_STRING },
0ca743a5 993 [NFTA_CHAIN_COUNTERS] = { .type = NLA_NESTED },
96518518
PM
994};
995
996static const struct nla_policy nft_hook_policy[NFTA_HOOK_MAX + 1] = {
997 [NFTA_HOOK_HOOKNUM] = { .type = NLA_U32 },
998 [NFTA_HOOK_PRIORITY] = { .type = NLA_U32 },
2cbce139
PNA
999 [NFTA_HOOK_DEV] = { .type = NLA_STRING,
1000 .len = IFNAMSIZ - 1 },
96518518
PM
1001};
1002
0ca743a5
PNA
1003static int nft_dump_stats(struct sk_buff *skb, struct nft_stats __percpu *stats)
1004{
1005 struct nft_stats *cpu_stats, total;
1006 struct nlattr *nest;
ce355e20
ED
1007 unsigned int seq;
1008 u64 pkts, bytes;
0ca743a5
PNA
1009 int cpu;
1010
1011 memset(&total, 0, sizeof(total));
1012 for_each_possible_cpu(cpu) {
1013 cpu_stats = per_cpu_ptr(stats, cpu);
ce355e20
ED
1014 do {
1015 seq = u64_stats_fetch_begin_irq(&cpu_stats->syncp);
1016 pkts = cpu_stats->pkts;
1017 bytes = cpu_stats->bytes;
1018 } while (u64_stats_fetch_retry_irq(&cpu_stats->syncp, seq));
1019 total.pkts += pkts;
1020 total.bytes += bytes;
0ca743a5
PNA
1021 }
1022 nest = nla_nest_start(skb, NFTA_CHAIN_COUNTERS);
1023 if (nest == NULL)
1024 goto nla_put_failure;
1025
b46f6ded
ND
1026 if (nla_put_be64(skb, NFTA_COUNTER_PACKETS, cpu_to_be64(total.pkts),
1027 NFTA_COUNTER_PAD) ||
1028 nla_put_be64(skb, NFTA_COUNTER_BYTES, cpu_to_be64(total.bytes),
1029 NFTA_COUNTER_PAD))
0ca743a5
PNA
1030 goto nla_put_failure;
1031
1032 nla_nest_end(skb, nest);
1033 return 0;
1034
1035nla_put_failure:
1036 return -ENOSPC;
1037}
1038
84d7fce6
PNA
1039static int nf_tables_fill_chain_info(struct sk_buff *skb, struct net *net,
1040 u32 portid, u32 seq, int event, u32 flags,
1041 int family, const struct nft_table *table,
96518518
PM
1042 const struct nft_chain *chain)
1043{
1044 struct nlmsghdr *nlh;
1045 struct nfgenmsg *nfmsg;
1046
dedb67c4 1047 event = nfnl_msg_type(NFNL_SUBSYS_NFTABLES, event);
96518518
PM
1048 nlh = nlmsg_put(skb, portid, seq, event, sizeof(struct nfgenmsg), flags);
1049 if (nlh == NULL)
1050 goto nla_put_failure;
1051
1052 nfmsg = nlmsg_data(nlh);
1053 nfmsg->nfgen_family = family;
1054 nfmsg->version = NFNETLINK_V0;
84d7fce6 1055 nfmsg->res_id = htons(net->nft.base_seq & 0xffff);
96518518
PM
1056
1057 if (nla_put_string(skb, NFTA_CHAIN_TABLE, table->name))
1058 goto nla_put_failure;
b46f6ded
ND
1059 if (nla_put_be64(skb, NFTA_CHAIN_HANDLE, cpu_to_be64(chain->handle),
1060 NFTA_CHAIN_PAD))
96518518
PM
1061 goto nla_put_failure;
1062 if (nla_put_string(skb, NFTA_CHAIN_NAME, chain->name))
1063 goto nla_put_failure;
1064
f323d954 1065 if (nft_is_base_chain(chain)) {
0ca743a5 1066 const struct nft_base_chain *basechain = nft_base_chain(chain);
c974a3a3 1067 const struct nf_hook_ops *ops = &basechain->ops;
0ca743a5
PNA
1068 struct nlattr *nest;
1069
1070 nest = nla_nest_start(skb, NFTA_CHAIN_HOOK);
96518518
PM
1071 if (nest == NULL)
1072 goto nla_put_failure;
1073 if (nla_put_be32(skb, NFTA_HOOK_HOOKNUM, htonl(ops->hooknum)))
1074 goto nla_put_failure;
1075 if (nla_put_be32(skb, NFTA_HOOK_PRIORITY, htonl(ops->priority)))
1076 goto nla_put_failure;
2cbce139
PNA
1077 if (basechain->dev_name[0] &&
1078 nla_put_string(skb, NFTA_HOOK_DEV, basechain->dev_name))
1079 goto nla_put_failure;
96518518 1080 nla_nest_end(skb, nest);
9370761c 1081
0ca743a5
PNA
1082 if (nla_put_be32(skb, NFTA_CHAIN_POLICY,
1083 htonl(basechain->policy)))
1084 goto nla_put_failure;
1085
baae3e62
PM
1086 if (nla_put_string(skb, NFTA_CHAIN_TYPE, basechain->type->name))
1087 goto nla_put_failure;
0ca743a5 1088
5f9bfe0e 1089 if (basechain->stats && nft_dump_stats(skb, basechain->stats))
0ca743a5 1090 goto nla_put_failure;
96518518
PM
1091 }
1092
0ca743a5
PNA
1093 if (nla_put_be32(skb, NFTA_CHAIN_USE, htonl(chain->use)))
1094 goto nla_put_failure;
1095
053c095a
JB
1096 nlmsg_end(skb, nlh);
1097 return 0;
96518518
PM
1098
1099nla_put_failure:
1100 nlmsg_trim(skb, nlh);
1101 return -1;
1102}
1103
25e94a99 1104static void nf_tables_chain_notify(const struct nft_ctx *ctx, int event)
96518518
PM
1105{
1106 struct sk_buff *skb;
96518518
PM
1107 int err;
1108
128ad332
PNA
1109 if (!ctx->report &&
1110 !nfnetlink_has_listeners(ctx->net, NFNLGRP_NFTABLES))
25e94a99 1111 return;
96518518 1112
96518518
PM
1113 skb = nlmsg_new(NLMSG_GOODSIZE, GFP_KERNEL);
1114 if (skb == NULL)
1115 goto err;
1116
84d7fce6 1117 err = nf_tables_fill_chain_info(skb, ctx->net, ctx->portid, ctx->seq,
36596dad 1118 event, 0, ctx->family, ctx->table,
35151d84 1119 ctx->chain);
96518518
PM
1120 if (err < 0) {
1121 kfree_skb(skb);
1122 goto err;
1123 }
1124
25e94a99
PNA
1125 nfnetlink_send(skb, ctx->net, ctx->portid, NFNLGRP_NFTABLES,
1126 ctx->report, GFP_KERNEL);
1127 return;
96518518 1128err:
25e94a99 1129 nfnetlink_set_err(ctx->net, ctx->portid, NFNLGRP_NFTABLES, -ENOBUFS);
96518518
PM
1130}
1131
1132static int nf_tables_dump_chains(struct sk_buff *skb,
1133 struct netlink_callback *cb)
1134{
1135 const struct nfgenmsg *nfmsg = nlmsg_data(cb->nlh);
96518518
PM
1136 const struct nft_table *table;
1137 const struct nft_chain *chain;
1138 unsigned int idx = 0, s_idx = cb->args[0];
99633ab2 1139 struct net *net = sock_net(skb->sk);
96518518
PM
1140 int family = nfmsg->nfgen_family;
1141
e688a7f8 1142 rcu_read_lock();
38e029f1
PNA
1143 cb->seq = net->nft.base_seq;
1144
36596dad 1145 list_for_each_entry_rcu(table, &net->nft.tables, list) {
98319cb9 1146 if (family != NFPROTO_UNSPEC && family != table->family)
96518518
PM
1147 continue;
1148
36596dad
PNA
1149 list_for_each_entry_rcu(chain, &table->chains, list) {
1150 if (idx < s_idx)
1151 goto cont;
1152 if (idx > s_idx)
1153 memset(&cb->args[1], 0,
1154 sizeof(cb->args) - sizeof(cb->args[0]));
1155 if (!nft_is_active(net, chain))
1156 continue;
1157 if (nf_tables_fill_chain_info(skb, net,
1158 NETLINK_CB(cb->skb).portid,
1159 cb->nlh->nlmsg_seq,
1160 NFT_MSG_NEWCHAIN,
1161 NLM_F_MULTI,
98319cb9 1162 table->family, table,
36596dad
PNA
1163 chain) < 0)
1164 goto done;
38e029f1 1165
36596dad 1166 nl_dump_check_consistent(cb, nlmsg_hdr(skb));
96518518 1167cont:
36596dad 1168 idx++;
96518518
PM
1169 }
1170 }
1171done:
e688a7f8 1172 rcu_read_unlock();
96518518
PM
1173 cb->args[0] = idx;
1174 return skb->len;
1175}
1176
7b8002a1
PNA
1177static int nf_tables_getchain(struct net *net, struct sock *nlsk,
1178 struct sk_buff *skb, const struct nlmsghdr *nlh,
04ba724b
PNA
1179 const struct nlattr * const nla[],
1180 struct netlink_ext_ack *extack)
96518518
PM
1181{
1182 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
f2a6d766 1183 u8 genmask = nft_genmask_cur(net);
96518518
PM
1184 const struct nft_table *table;
1185 const struct nft_chain *chain;
1186 struct sk_buff *skb2;
1187 int family = nfmsg->nfgen_family;
1188 int err;
1189
1190 if (nlh->nlmsg_flags & NLM_F_DUMP) {
1191 struct netlink_dump_control c = {
1192 .dump = nf_tables_dump_chains,
1193 };
1194 return netlink_dump_start(nlsk, skb, nlh, &c);
1195 }
1196
98319cb9 1197 table = nf_tables_table_lookup(net, nla[NFTA_CHAIN_TABLE], family,
36596dad 1198 genmask);
96518518
PM
1199 if (IS_ERR(table))
1200 return PTR_ERR(table);
1201
664b0f8c 1202 chain = nf_tables_chain_lookup(table, nla[NFTA_CHAIN_NAME], genmask);
96518518
PM
1203 if (IS_ERR(chain))
1204 return PTR_ERR(chain);
1205
1206 skb2 = alloc_skb(NLMSG_GOODSIZE, GFP_KERNEL);
1207 if (!skb2)
1208 return -ENOMEM;
1209
84d7fce6 1210 err = nf_tables_fill_chain_info(skb2, net, NETLINK_CB(skb).portid,
96518518
PM
1211 nlh->nlmsg_seq, NFT_MSG_NEWCHAIN, 0,
1212 family, table, chain);
1213 if (err < 0)
1214 goto err;
1215
1216 return nlmsg_unicast(nlsk, skb2, NETLINK_CB(skb).portid);
1217
1218err:
1219 kfree_skb(skb2);
1220 return err;
1221}
1222
0ca743a5
PNA
1223static const struct nla_policy nft_counter_policy[NFTA_COUNTER_MAX + 1] = {
1224 [NFTA_COUNTER_PACKETS] = { .type = NLA_U64 },
1225 [NFTA_COUNTER_BYTES] = { .type = NLA_U64 },
1226};
1227
ff3cd7b3 1228static struct nft_stats __percpu *nft_stats_alloc(const struct nlattr *attr)
0ca743a5
PNA
1229{
1230 struct nlattr *tb[NFTA_COUNTER_MAX+1];
1231 struct nft_stats __percpu *newstats;
1232 struct nft_stats *stats;
1233 int err;
1234
fceb6435
JB
1235 err = nla_parse_nested(tb, NFTA_COUNTER_MAX, attr, nft_counter_policy,
1236 NULL);
0ca743a5 1237 if (err < 0)
ff3cd7b3 1238 return ERR_PTR(err);
0ca743a5
PNA
1239
1240 if (!tb[NFTA_COUNTER_BYTES] || !tb[NFTA_COUNTER_PACKETS])
ff3cd7b3 1241 return ERR_PTR(-EINVAL);
0ca743a5 1242
ce355e20 1243 newstats = netdev_alloc_pcpu_stats(struct nft_stats);
0ca743a5 1244 if (newstats == NULL)
ff3cd7b3 1245 return ERR_PTR(-ENOMEM);
0ca743a5
PNA
1246
1247 /* Restore old counters on this cpu, no problem. Per-cpu statistics
1248 * are not exposed to userspace.
1249 */
e8781f70 1250 preempt_disable();
0ca743a5
PNA
1251 stats = this_cpu_ptr(newstats);
1252 stats->bytes = be64_to_cpu(nla_get_be64(tb[NFTA_COUNTER_BYTES]));
1253 stats->pkts = be64_to_cpu(nla_get_be64(tb[NFTA_COUNTER_PACKETS]));
e8781f70 1254 preempt_enable();
0ca743a5 1255
ff3cd7b3
PNA
1256 return newstats;
1257}
1258
1259static void nft_chain_stats_replace(struct nft_base_chain *chain,
1260 struct nft_stats __percpu *newstats)
1261{
0befd061
PNA
1262 struct nft_stats __percpu *oldstats;
1263
b88825de
PNA
1264 if (newstats == NULL)
1265 return;
1266
0ca743a5 1267 if (chain->stats) {
0befd061 1268 oldstats = nfnl_dereference(chain->stats, NFNL_SUBSYS_NFTABLES);
0ca743a5
PNA
1269 rcu_assign_pointer(chain->stats, newstats);
1270 synchronize_rcu();
1271 free_percpu(oldstats);
1272 } else
1273 rcu_assign_pointer(chain->stats, newstats);
0ca743a5
PNA
1274}
1275
43a605f2 1276static void nf_tables_chain_destroy(struct nft_ctx *ctx)
91c7b38d 1277{
43a605f2
PNA
1278 struct nft_chain *chain = ctx->chain;
1279
91c7b38d
PNA
1280 BUG_ON(chain->use > 0);
1281
f323d954 1282 if (nft_is_base_chain(chain)) {
2cbce139
PNA
1283 struct nft_base_chain *basechain = nft_base_chain(chain);
1284
43a605f2
PNA
1285 if (basechain->type->free)
1286 basechain->type->free(ctx);
2cbce139
PNA
1287 module_put(basechain->type->owner);
1288 free_percpu(basechain->stats);
9f08ea84
PNA
1289 if (basechain->stats)
1290 static_branch_dec(&nft_counters_enabled);
b7263e07 1291 kfree(chain->name);
2cbce139 1292 kfree(basechain);
91c7b38d 1293 } else {
b7263e07 1294 kfree(chain->name);
91c7b38d
PNA
1295 kfree(chain);
1296 }
1297}
1298
508f8ccd
PNA
1299struct nft_chain_hook {
1300 u32 num;
84ba7dd7 1301 s32 priority;
32537e91 1302 const struct nft_chain_type *type;
508f8ccd
PNA
1303 struct net_device *dev;
1304};
1305
1306static int nft_chain_parse_hook(struct net *net,
1307 const struct nlattr * const nla[],
36596dad
PNA
1308 struct nft_chain_hook *hook, u8 family,
1309 bool create)
508f8ccd
PNA
1310{
1311 struct nlattr *ha[NFTA_HOOK_MAX + 1];
32537e91 1312 const struct nft_chain_type *type;
508f8ccd
PNA
1313 struct net_device *dev;
1314 int err;
1315
1316 err = nla_parse_nested(ha, NFTA_HOOK_MAX, nla[NFTA_CHAIN_HOOK],
fceb6435 1317 nft_hook_policy, NULL);
508f8ccd
PNA
1318 if (err < 0)
1319 return err;
1320
1321 if (ha[NFTA_HOOK_HOOKNUM] == NULL ||
1322 ha[NFTA_HOOK_PRIORITY] == NULL)
1323 return -EINVAL;
1324
1325 hook->num = ntohl(nla_get_be32(ha[NFTA_HOOK_HOOKNUM]));
508f8ccd
PNA
1326 hook->priority = ntohl(nla_get_be32(ha[NFTA_HOOK_PRIORITY]));
1327
36596dad 1328 type = chain_type[family][NFT_CHAIN_T_DEFAULT];
508f8ccd 1329 if (nla[NFTA_CHAIN_TYPE]) {
1ea26cca 1330 type = nf_tables_chain_type_lookup(nla[NFTA_CHAIN_TYPE],
36596dad 1331 family, create);
508f8ccd
PNA
1332 if (IS_ERR(type))
1333 return PTR_ERR(type);
1334 }
1335 if (!(type->hook_mask & (1 << hook->num)))
1336 return -EOPNOTSUPP;
84ba7dd7
FW
1337
1338 if (type->type == NFT_CHAIN_T_NAT &&
1339 hook->priority <= NF_IP_PRI_CONNTRACK)
1340 return -EOPNOTSUPP;
1341
508f8ccd
PNA
1342 if (!try_module_get(type->owner))
1343 return -ENOENT;
1344
1345 hook->type = type;
1346
1347 hook->dev = NULL;
36596dad 1348 if (family == NFPROTO_NETDEV) {
508f8ccd
PNA
1349 char ifname[IFNAMSIZ];
1350
1351 if (!ha[NFTA_HOOK_DEV]) {
1352 module_put(type->owner);
1353 return -EOPNOTSUPP;
1354 }
1355
1356 nla_strlcpy(ifname, ha[NFTA_HOOK_DEV], IFNAMSIZ);
90d2723c 1357 dev = __dev_get_by_name(net, ifname);
508f8ccd
PNA
1358 if (!dev) {
1359 module_put(type->owner);
1360 return -ENOENT;
1361 }
1362 hook->dev = dev;
1363 } else if (ha[NFTA_HOOK_DEV]) {
1364 module_put(type->owner);
1365 return -EOPNOTSUPP;
1366 }
1367
1368 return 0;
1369}
1370
1371static void nft_chain_release_hook(struct nft_chain_hook *hook)
1372{
1373 module_put(hook->type->owner);
508f8ccd
PNA
1374}
1375
4035285f
PNA
1376static int nf_tables_addchain(struct nft_ctx *ctx, u8 family, u8 genmask,
1377 u8 policy, bool create)
1378{
1379 const struct nlattr * const *nla = ctx->nla;
1380 struct nft_table *table = ctx->table;
4035285f
PNA
1381 struct nft_base_chain *basechain;
1382 struct nft_stats __percpu *stats;
1383 struct net *net = ctx->net;
1384 struct nft_chain *chain;
4035285f
PNA
1385 int err;
1386
1387 if (table->use == UINT_MAX)
1388 return -EOVERFLOW;
1389
1390 if (nla[NFTA_CHAIN_HOOK]) {
1391 struct nft_chain_hook hook;
1392 struct nf_hook_ops *ops;
4035285f 1393
36596dad 1394 err = nft_chain_parse_hook(net, nla, &hook, family, create);
4035285f
PNA
1395 if (err < 0)
1396 return err;
1397
1398 basechain = kzalloc(sizeof(*basechain), GFP_KERNEL);
1399 if (basechain == NULL) {
1400 nft_chain_release_hook(&hook);
1401 return -ENOMEM;
1402 }
1403
1404 if (hook.dev != NULL)
1405 strncpy(basechain->dev_name, hook.dev->name, IFNAMSIZ);
1406
1407 if (nla[NFTA_CHAIN_COUNTERS]) {
1408 stats = nft_stats_alloc(nla[NFTA_CHAIN_COUNTERS]);
1409 if (IS_ERR(stats)) {
1410 nft_chain_release_hook(&hook);
1411 kfree(basechain);
1412 return PTR_ERR(stats);
1413 }
1414 basechain->stats = stats;
1415 static_branch_inc(&nft_counters_enabled);
1416 }
1417
4035285f 1418 basechain->type = hook.type;
43a605f2
PNA
1419 if (basechain->type->init)
1420 basechain->type->init(ctx);
1421
4035285f
PNA
1422 chain = &basechain->chain;
1423
c974a3a3
PNA
1424 ops = &basechain->ops;
1425 ops->pf = family;
1426 ops->hooknum = hook.num;
1427 ops->priority = hook.priority;
1428 ops->priv = chain;
c2f9eafe 1429 ops->hook = hook.type->hooks[ops->hooknum];
c974a3a3 1430 ops->dev = hook.dev;
c974a3a3
PNA
1431
1432 if (basechain->type->type == NFT_CHAIN_T_NAT)
1433 ops->nat_hook = true;
4035285f
PNA
1434
1435 chain->flags |= NFT_BASE_CHAIN;
1436 basechain->policy = policy;
1437 } else {
1438 chain = kzalloc(sizeof(*chain), GFP_KERNEL);
1439 if (chain == NULL)
1440 return -ENOMEM;
1441 }
43a605f2
PNA
1442 ctx->chain = chain;
1443
4035285f
PNA
1444 INIT_LIST_HEAD(&chain->rules);
1445 chain->handle = nf_tables_alloc_handle(table);
1446 chain->table = table;
1447 chain->name = nla_strdup(nla[NFTA_CHAIN_NAME], GFP_KERNEL);
1448 if (!chain->name) {
1449 err = -ENOMEM;
1450 goto err1;
1451 }
1452
c974a3a3 1453 err = nf_tables_register_hook(net, table, chain);
4035285f
PNA
1454 if (err < 0)
1455 goto err1;
1456
4035285f
PNA
1457 err = nft_trans_chain_add(ctx, NFT_MSG_NEWCHAIN);
1458 if (err < 0)
1459 goto err2;
1460
1461 table->use++;
1462 list_add_tail_rcu(&chain->list, &table->chains);
1463
1464 return 0;
1465err2:
c974a3a3 1466 nf_tables_unregister_hook(net, table, chain);
4035285f 1467err1:
43a605f2 1468 nf_tables_chain_destroy(ctx);
4035285f
PNA
1469
1470 return err;
1471}
1472
2c4a488a
PNA
1473static int nf_tables_updchain(struct nft_ctx *ctx, u8 genmask, u8 policy,
1474 bool create)
1475{
1476 const struct nlattr * const *nla = ctx->nla;
1477 struct nft_table *table = ctx->table;
1478 struct nft_chain *chain = ctx->chain;
2c4a488a
PNA
1479 struct nft_base_chain *basechain;
1480 struct nft_stats *stats = NULL;
1481 struct nft_chain_hook hook;
1482 const struct nlattr *name;
1483 struct nf_hook_ops *ops;
1484 struct nft_trans *trans;
c974a3a3 1485 int err;
2c4a488a
PNA
1486
1487 if (nla[NFTA_CHAIN_HOOK]) {
1488 if (!nft_is_base_chain(chain))
1489 return -EBUSY;
1490
36596dad 1491 err = nft_chain_parse_hook(ctx->net, nla, &hook, ctx->family,
2c4a488a
PNA
1492 create);
1493 if (err < 0)
1494 return err;
1495
1496 basechain = nft_base_chain(chain);
1497 if (basechain->type != hook.type) {
1498 nft_chain_release_hook(&hook);
1499 return -EBUSY;
1500 }
1501
c974a3a3
PNA
1502 ops = &basechain->ops;
1503 if (ops->hooknum != hook.num ||
1504 ops->priority != hook.priority ||
1505 ops->dev != hook.dev) {
1506 nft_chain_release_hook(&hook);
1507 return -EBUSY;
2c4a488a
PNA
1508 }
1509 nft_chain_release_hook(&hook);
1510 }
1511
1512 if (nla[NFTA_CHAIN_HANDLE] &&
1513 nla[NFTA_CHAIN_NAME]) {
1514 struct nft_chain *chain2;
1515
1516 chain2 = nf_tables_chain_lookup(table, nla[NFTA_CHAIN_NAME],
1517 genmask);
0d18779b
JC
1518 if (!IS_ERR(chain2))
1519 return -EEXIST;
2c4a488a
PNA
1520 }
1521
1522 if (nla[NFTA_CHAIN_COUNTERS]) {
1523 if (!nft_is_base_chain(chain))
1524 return -EOPNOTSUPP;
1525
1526 stats = nft_stats_alloc(nla[NFTA_CHAIN_COUNTERS]);
1527 if (IS_ERR(stats))
1528 return PTR_ERR(stats);
1529 }
1530
1531 trans = nft_trans_alloc(ctx, NFT_MSG_NEWCHAIN,
1532 sizeof(struct nft_trans_chain));
1533 if (trans == NULL) {
1534 free_percpu(stats);
1535 return -ENOMEM;
1536 }
1537
1538 nft_trans_chain_stats(trans) = stats;
1539 nft_trans_chain_update(trans) = true;
1540
1541 if (nla[NFTA_CHAIN_POLICY])
1542 nft_trans_chain_policy(trans) = policy;
1543 else
1544 nft_trans_chain_policy(trans) = -1;
1545
1546 name = nla[NFTA_CHAIN_NAME];
1547 if (nla[NFTA_CHAIN_HANDLE] && name) {
1548 nft_trans_chain_name(trans) =
1549 nla_strdup(name, GFP_KERNEL);
1550 if (!nft_trans_chain_name(trans)) {
1551 kfree(trans);
1552 free_percpu(stats);
1553 return -ENOMEM;
1554 }
1555 }
1556 list_add_tail(&trans->list, &ctx->net->nft.commit_list);
1557
1558 return 0;
1559}
1560
633c9a84
PNA
1561static int nf_tables_newchain(struct net *net, struct sock *nlsk,
1562 struct sk_buff *skb, const struct nlmsghdr *nlh,
04ba724b
PNA
1563 const struct nlattr * const nla[],
1564 struct netlink_ext_ack *extack)
96518518
PM
1565{
1566 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
1567 const struct nlattr * uninitialized_var(name);
4035285f
PNA
1568 u8 genmask = nft_genmask_next(net);
1569 int family = nfmsg->nfgen_family;
96518518
PM
1570 struct nft_table *table;
1571 struct nft_chain *chain;
57de2a0c 1572 u8 policy = NF_ACCEPT;
4035285f 1573 struct nft_ctx ctx;
96518518 1574 u64 handle = 0;
96518518
PM
1575 bool create;
1576
1577 create = nlh->nlmsg_flags & NLM_F_CREATE ? true : false;
1578
98319cb9 1579 table = nf_tables_table_lookup(net, nla[NFTA_CHAIN_TABLE], family,
36596dad 1580 genmask);
96518518
PM
1581 if (IS_ERR(table))
1582 return PTR_ERR(table);
1583
96518518
PM
1584 chain = NULL;
1585 name = nla[NFTA_CHAIN_NAME];
1586
1587 if (nla[NFTA_CHAIN_HANDLE]) {
1588 handle = be64_to_cpu(nla_get_be64(nla[NFTA_CHAIN_HANDLE]));
664b0f8c 1589 chain = nf_tables_chain_lookup_byhandle(table, handle, genmask);
96518518
PM
1590 if (IS_ERR(chain))
1591 return PTR_ERR(chain);
1592 } else {
664b0f8c 1593 chain = nf_tables_chain_lookup(table, name, genmask);
96518518
PM
1594 if (IS_ERR(chain)) {
1595 if (PTR_ERR(chain) != -ENOENT)
1596 return PTR_ERR(chain);
1597 chain = NULL;
1598 }
1599 }
1600
57de2a0c 1601 if (nla[NFTA_CHAIN_POLICY]) {
f323d954
PNA
1602 if (chain != NULL &&
1603 !nft_is_base_chain(chain))
d6b6cb1d
PNA
1604 return -EOPNOTSUPP;
1605
1606 if (chain == NULL &&
57de2a0c
PM
1607 nla[NFTA_CHAIN_HOOK] == NULL)
1608 return -EOPNOTSUPP;
1609
8f46df18 1610 policy = ntohl(nla_get_be32(nla[NFTA_CHAIN_POLICY]));
57de2a0c
PM
1611 switch (policy) {
1612 case NF_DROP:
1613 case NF_ACCEPT:
1614 break;
1615 default:
1616 return -EINVAL;
1617 }
1618 }
1619
98319cb9 1620 nft_ctx_init(&ctx, net, skb, nlh, family, table, chain, nla);
4035285f 1621
96518518
PM
1622 if (chain != NULL) {
1623 if (nlh->nlmsg_flags & NLM_F_EXCL)
1624 return -EEXIST;
1625 if (nlh->nlmsg_flags & NLM_F_REPLACE)
1626 return -EOPNOTSUPP;
1627
2c4a488a 1628 return nf_tables_updchain(&ctx, genmask, policy, create);
96518518
PM
1629 }
1630
4035285f 1631 return nf_tables_addchain(&ctx, family, genmask, policy, create);
96518518
PM
1632}
1633
633c9a84
PNA
1634static int nf_tables_delchain(struct net *net, struct sock *nlsk,
1635 struct sk_buff *skb, const struct nlmsghdr *nlh,
04ba724b
PNA
1636 const struct nlattr * const nla[],
1637 struct netlink_ext_ack *extack)
96518518
PM
1638{
1639 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
f2a6d766 1640 u8 genmask = nft_genmask_next(net);
96518518
PM
1641 struct nft_table *table;
1642 struct nft_chain *chain;
9dee1474 1643 struct nft_rule *rule;
96518518 1644 int family = nfmsg->nfgen_family;
91c7b38d 1645 struct nft_ctx ctx;
3ecbfd65 1646 u64 handle;
9dee1474
PNA
1647 u32 use;
1648 int err;
96518518 1649
98319cb9 1650 table = nf_tables_table_lookup(net, nla[NFTA_CHAIN_TABLE], family,
36596dad 1651 genmask);
96518518
PM
1652 if (IS_ERR(table))
1653 return PTR_ERR(table);
1654
3ecbfd65
HS
1655 if (nla[NFTA_CHAIN_HANDLE]) {
1656 handle = be64_to_cpu(nla_get_be64(nla[NFTA_CHAIN_HANDLE]));
1657 chain = nf_tables_chain_lookup_byhandle(table, handle, genmask);
1658 } else {
1659 chain = nf_tables_chain_lookup(table, nla[NFTA_CHAIN_NAME], genmask);
1660 }
96518518
PM
1661 if (IS_ERR(chain))
1662 return PTR_ERR(chain);
9dee1474
PNA
1663
1664 if (nlh->nlmsg_flags & NLM_F_NONREC &&
1665 chain->use > 0)
96518518
PM
1666 return -EBUSY;
1667
98319cb9 1668 nft_ctx_init(&ctx, net, skb, nlh, family, table, chain, nla);
0165d932 1669
9dee1474
PNA
1670 use = chain->use;
1671 list_for_each_entry(rule, &chain->rules, list) {
1672 if (!nft_is_active_next(net, rule))
1673 continue;
1674 use--;
1675
1676 err = nft_delrule(&ctx, rule);
1677 if (err < 0)
1678 return err;
1679 }
1680
1681 /* There are rules and elements that are still holding references to us,
1682 * we cannot do a recursive removal in this case.
1683 */
1684 if (use > 0)
1685 return -EBUSY;
1686
ee01d542 1687 return nft_delchain(&ctx);
96518518
PM
1688}
1689
96518518
PM
1690/*
1691 * Expressions
1692 */
1693
1694/**
ef1f7df9
PM
1695 * nft_register_expr - register nf_tables expr type
1696 * @ops: expr type
96518518 1697 *
ef1f7df9 1698 * Registers the expr type for use with nf_tables. Returns zero on
96518518
PM
1699 * success or a negative errno code otherwise.
1700 */
ef1f7df9 1701int nft_register_expr(struct nft_expr_type *type)
96518518
PM
1702{
1703 nfnl_lock(NFNL_SUBSYS_NFTABLES);
758dbcec 1704 if (type->family == NFPROTO_UNSPEC)
e688a7f8 1705 list_add_tail_rcu(&type->list, &nf_tables_expressions);
758dbcec 1706 else
e688a7f8 1707 list_add_rcu(&type->list, &nf_tables_expressions);
96518518
PM
1708 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
1709 return 0;
1710}
1711EXPORT_SYMBOL_GPL(nft_register_expr);
1712
1713/**
ef1f7df9
PM
1714 * nft_unregister_expr - unregister nf_tables expr type
1715 * @ops: expr type
96518518 1716 *
ef1f7df9 1717 * Unregisters the expr typefor use with nf_tables.
96518518 1718 */
ef1f7df9 1719void nft_unregister_expr(struct nft_expr_type *type)
96518518
PM
1720{
1721 nfnl_lock(NFNL_SUBSYS_NFTABLES);
e688a7f8 1722 list_del_rcu(&type->list);
96518518
PM
1723 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
1724}
1725EXPORT_SYMBOL_GPL(nft_unregister_expr);
1726
64d46806
PM
1727static const struct nft_expr_type *__nft_expr_type_get(u8 family,
1728 struct nlattr *nla)
96518518 1729{
ef1f7df9 1730 const struct nft_expr_type *type;
96518518 1731
ef1f7df9 1732 list_for_each_entry(type, &nf_tables_expressions, list) {
64d46806
PM
1733 if (!nla_strcmp(nla, type->name) &&
1734 (!type->family || type->family == family))
ef1f7df9 1735 return type;
96518518
PM
1736 }
1737 return NULL;
1738}
1739
64d46806
PM
1740static const struct nft_expr_type *nft_expr_type_get(u8 family,
1741 struct nlattr *nla)
96518518 1742{
ef1f7df9 1743 const struct nft_expr_type *type;
96518518
PM
1744
1745 if (nla == NULL)
1746 return ERR_PTR(-EINVAL);
1747
64d46806 1748 type = __nft_expr_type_get(family, nla);
ef1f7df9
PM
1749 if (type != NULL && try_module_get(type->owner))
1750 return type;
96518518
PM
1751
1752#ifdef CONFIG_MODULES
ef1f7df9 1753 if (type == NULL) {
64d46806
PM
1754 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
1755 request_module("nft-expr-%u-%.*s", family,
1756 nla_len(nla), (char *)nla_data(nla));
1757 nfnl_lock(NFNL_SUBSYS_NFTABLES);
1758 if (__nft_expr_type_get(family, nla))
1759 return ERR_PTR(-EAGAIN);
1760
96518518
PM
1761 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
1762 request_module("nft-expr-%.*s",
1763 nla_len(nla), (char *)nla_data(nla));
1764 nfnl_lock(NFNL_SUBSYS_NFTABLES);
64d46806 1765 if (__nft_expr_type_get(family, nla))
96518518
PM
1766 return ERR_PTR(-EAGAIN);
1767 }
1768#endif
1769 return ERR_PTR(-ENOENT);
1770}
1771
1772static const struct nla_policy nft_expr_policy[NFTA_EXPR_MAX + 1] = {
1773 [NFTA_EXPR_NAME] = { .type = NLA_STRING },
1774 [NFTA_EXPR_DATA] = { .type = NLA_NESTED },
1775};
1776
1777static int nf_tables_fill_expr_info(struct sk_buff *skb,
1778 const struct nft_expr *expr)
1779{
ef1f7df9 1780 if (nla_put_string(skb, NFTA_EXPR_NAME, expr->ops->type->name))
96518518
PM
1781 goto nla_put_failure;
1782
1783 if (expr->ops->dump) {
1784 struct nlattr *data = nla_nest_start(skb, NFTA_EXPR_DATA);
1785 if (data == NULL)
1786 goto nla_put_failure;
1787 if (expr->ops->dump(skb, expr) < 0)
1788 goto nla_put_failure;
1789 nla_nest_end(skb, data);
1790 }
1791
1792 return skb->len;
1793
1794nla_put_failure:
1795 return -1;
1796};
1797
0b2d8a7b
PM
1798int nft_expr_dump(struct sk_buff *skb, unsigned int attr,
1799 const struct nft_expr *expr)
1800{
1801 struct nlattr *nest;
1802
1803 nest = nla_nest_start(skb, attr);
1804 if (!nest)
1805 goto nla_put_failure;
1806 if (nf_tables_fill_expr_info(skb, expr) < 0)
1807 goto nla_put_failure;
1808 nla_nest_end(skb, nest);
1809 return 0;
1810
1811nla_put_failure:
1812 return -1;
1813}
1814
96518518
PM
1815struct nft_expr_info {
1816 const struct nft_expr_ops *ops;
ef1f7df9 1817 struct nlattr *tb[NFT_EXPR_MAXATTR + 1];
96518518
PM
1818};
1819
0ca743a5
PNA
1820static int nf_tables_expr_parse(const struct nft_ctx *ctx,
1821 const struct nlattr *nla,
96518518
PM
1822 struct nft_expr_info *info)
1823{
ef1f7df9 1824 const struct nft_expr_type *type;
96518518 1825 const struct nft_expr_ops *ops;
ef1f7df9 1826 struct nlattr *tb[NFTA_EXPR_MAX + 1];
96518518
PM
1827 int err;
1828
fceb6435 1829 err = nla_parse_nested(tb, NFTA_EXPR_MAX, nla, nft_expr_policy, NULL);
96518518
PM
1830 if (err < 0)
1831 return err;
1832
36596dad 1833 type = nft_expr_type_get(ctx->family, tb[NFTA_EXPR_NAME]);
ef1f7df9
PM
1834 if (IS_ERR(type))
1835 return PTR_ERR(type);
1836
1837 if (tb[NFTA_EXPR_DATA]) {
1838 err = nla_parse_nested(info->tb, type->maxattr,
fceb6435 1839 tb[NFTA_EXPR_DATA], type->policy, NULL);
ef1f7df9
PM
1840 if (err < 0)
1841 goto err1;
1842 } else
1843 memset(info->tb, 0, sizeof(info->tb[0]) * (type->maxattr + 1));
1844
1845 if (type->select_ops != NULL) {
0ca743a5
PNA
1846 ops = type->select_ops(ctx,
1847 (const struct nlattr * const *)info->tb);
ef1f7df9
PM
1848 if (IS_ERR(ops)) {
1849 err = PTR_ERR(ops);
1850 goto err1;
1851 }
1852 } else
1853 ops = type->ops;
1854
96518518
PM
1855 info->ops = ops;
1856 return 0;
ef1f7df9
PM
1857
1858err1:
1859 module_put(type->owner);
1860 return err;
96518518
PM
1861}
1862
1863static int nf_tables_newexpr(const struct nft_ctx *ctx,
ef1f7df9 1864 const struct nft_expr_info *info,
96518518
PM
1865 struct nft_expr *expr)
1866{
1867 const struct nft_expr_ops *ops = info->ops;
1868 int err;
1869
1870 expr->ops = ops;
1871 if (ops->init) {
ef1f7df9 1872 err = ops->init(ctx, expr, (const struct nlattr **)info->tb);
96518518
PM
1873 if (err < 0)
1874 goto err1;
1875 }
1876
c56e3956
LZ
1877 if (ops->validate) {
1878 const struct nft_data *data = NULL;
1879
1880 err = ops->validate(ctx, expr, &data);
1881 if (err < 0)
1882 goto err2;
1883 }
1884
96518518
PM
1885 return 0;
1886
c56e3956
LZ
1887err2:
1888 if (ops->destroy)
1889 ops->destroy(ctx, expr);
96518518
PM
1890err1:
1891 expr->ops = NULL;
1892 return err;
1893}
1894
62472bce
PM
1895static void nf_tables_expr_destroy(const struct nft_ctx *ctx,
1896 struct nft_expr *expr)
96518518
PM
1897{
1898 if (expr->ops->destroy)
62472bce 1899 expr->ops->destroy(ctx, expr);
ef1f7df9 1900 module_put(expr->ops->type->owner);
96518518
PM
1901}
1902
0b2d8a7b
PM
1903struct nft_expr *nft_expr_init(const struct nft_ctx *ctx,
1904 const struct nlattr *nla)
1905{
1906 struct nft_expr_info info;
1907 struct nft_expr *expr;
1908 int err;
1909
1910 err = nf_tables_expr_parse(ctx, nla, &info);
1911 if (err < 0)
1912 goto err1;
1913
1914 err = -ENOMEM;
1915 expr = kzalloc(info.ops->size, GFP_KERNEL);
1916 if (expr == NULL)
1917 goto err2;
1918
1919 err = nf_tables_newexpr(ctx, &info, expr);
1920 if (err < 0)
6cafaf47 1921 goto err3;
0b2d8a7b
PM
1922
1923 return expr;
6cafaf47
LZ
1924err3:
1925 kfree(expr);
0b2d8a7b
PM
1926err2:
1927 module_put(info.ops->type->owner);
1928err1:
1929 return ERR_PTR(err);
1930}
1931
1932void nft_expr_destroy(const struct nft_ctx *ctx, struct nft_expr *expr)
1933{
1934 nf_tables_expr_destroy(ctx, expr);
1935 kfree(expr);
1936}
1937
96518518
PM
1938/*
1939 * Rules
1940 */
1941
1942static struct nft_rule *__nf_tables_rule_lookup(const struct nft_chain *chain,
1943 u64 handle)
1944{
1945 struct nft_rule *rule;
1946
1947 // FIXME: this sucks
1948 list_for_each_entry(rule, &chain->rules, list) {
1949 if (handle == rule->handle)
1950 return rule;
1951 }
1952
1953 return ERR_PTR(-ENOENT);
1954}
1955
1956static struct nft_rule *nf_tables_rule_lookup(const struct nft_chain *chain,
1957 const struct nlattr *nla)
1958{
1959 if (nla == NULL)
1960 return ERR_PTR(-EINVAL);
1961
1962 return __nf_tables_rule_lookup(chain, be64_to_cpu(nla_get_be64(nla)));
1963}
1964
1965static const struct nla_policy nft_rule_policy[NFTA_RULE_MAX + 1] = {
b2fbd044
LZ
1966 [NFTA_RULE_TABLE] = { .type = NLA_STRING,
1967 .len = NFT_TABLE_MAXNAMELEN - 1 },
96518518
PM
1968 [NFTA_RULE_CHAIN] = { .type = NLA_STRING,
1969 .len = NFT_CHAIN_MAXNAMELEN - 1 },
1970 [NFTA_RULE_HANDLE] = { .type = NLA_U64 },
1971 [NFTA_RULE_EXPRESSIONS] = { .type = NLA_NESTED },
0ca743a5 1972 [NFTA_RULE_COMPAT] = { .type = NLA_NESTED },
5e948466 1973 [NFTA_RULE_POSITION] = { .type = NLA_U64 },
0768b3b3
PNA
1974 [NFTA_RULE_USERDATA] = { .type = NLA_BINARY,
1975 .len = NFT_USERDATA_MAXLEN },
467697d2 1976 [NFTA_RULE_ID] = { .type = NLA_U32 },
96518518
PM
1977};
1978
84d7fce6
PNA
1979static int nf_tables_fill_rule_info(struct sk_buff *skb, struct net *net,
1980 u32 portid, u32 seq, int event,
1981 u32 flags, int family,
96518518
PM
1982 const struct nft_table *table,
1983 const struct nft_chain *chain,
1984 const struct nft_rule *rule)
1985{
1986 struct nlmsghdr *nlh;
1987 struct nfgenmsg *nfmsg;
1988 const struct nft_expr *expr, *next;
1989 struct nlattr *list;
5e948466 1990 const struct nft_rule *prule;
dedb67c4 1991 u16 type = nfnl_msg_type(NFNL_SUBSYS_NFTABLES, event);
96518518 1992
dedb67c4 1993 nlh = nlmsg_put(skb, portid, seq, type, sizeof(struct nfgenmsg), flags);
96518518
PM
1994 if (nlh == NULL)
1995 goto nla_put_failure;
1996
1997 nfmsg = nlmsg_data(nlh);
1998 nfmsg->nfgen_family = family;
1999 nfmsg->version = NFNETLINK_V0;
84d7fce6 2000 nfmsg->res_id = htons(net->nft.base_seq & 0xffff);
96518518
PM
2001
2002 if (nla_put_string(skb, NFTA_RULE_TABLE, table->name))
2003 goto nla_put_failure;
2004 if (nla_put_string(skb, NFTA_RULE_CHAIN, chain->name))
2005 goto nla_put_failure;
b46f6ded
ND
2006 if (nla_put_be64(skb, NFTA_RULE_HANDLE, cpu_to_be64(rule->handle),
2007 NFTA_RULE_PAD))
96518518
PM
2008 goto nla_put_failure;
2009
5e948466 2010 if ((event != NFT_MSG_DELRULE) && (rule->list.prev != &chain->rules)) {
cbbb40e2 2011 prule = list_prev_entry(rule, list);
5e948466 2012 if (nla_put_be64(skb, NFTA_RULE_POSITION,
b46f6ded
ND
2013 cpu_to_be64(prule->handle),
2014 NFTA_RULE_PAD))
5e948466
EL
2015 goto nla_put_failure;
2016 }
2017
96518518
PM
2018 list = nla_nest_start(skb, NFTA_RULE_EXPRESSIONS);
2019 if (list == NULL)
2020 goto nla_put_failure;
2021 nft_rule_for_each_expr(expr, next, rule) {
0b2d8a7b 2022 if (nft_expr_dump(skb, NFTA_LIST_ELEM, expr) < 0)
96518518 2023 goto nla_put_failure;
96518518
PM
2024 }
2025 nla_nest_end(skb, list);
2026
86f1ec32
PM
2027 if (rule->udata) {
2028 struct nft_userdata *udata = nft_userdata(rule);
2029 if (nla_put(skb, NFTA_RULE_USERDATA, udata->len + 1,
2030 udata->data) < 0)
2031 goto nla_put_failure;
2032 }
0768b3b3 2033
053c095a
JB
2034 nlmsg_end(skb, nlh);
2035 return 0;
96518518
PM
2036
2037nla_put_failure:
2038 nlmsg_trim(skb, nlh);
2039 return -1;
2040}
2041
25e94a99
PNA
2042static void nf_tables_rule_notify(const struct nft_ctx *ctx,
2043 const struct nft_rule *rule, int event)
96518518
PM
2044{
2045 struct sk_buff *skb;
96518518
PM
2046 int err;
2047
128ad332
PNA
2048 if (!ctx->report &&
2049 !nfnetlink_has_listeners(ctx->net, NFNLGRP_NFTABLES))
25e94a99 2050 return;
96518518 2051
96518518
PM
2052 skb = nlmsg_new(NLMSG_GOODSIZE, GFP_KERNEL);
2053 if (skb == NULL)
2054 goto err;
2055
84d7fce6 2056 err = nf_tables_fill_rule_info(skb, ctx->net, ctx->portid, ctx->seq,
36596dad 2057 event, 0, ctx->family, ctx->table,
35151d84 2058 ctx->chain, rule);
96518518
PM
2059 if (err < 0) {
2060 kfree_skb(skb);
2061 goto err;
2062 }
2063
25e94a99
PNA
2064 nfnetlink_send(skb, ctx->net, ctx->portid, NFNLGRP_NFTABLES,
2065 ctx->report, GFP_KERNEL);
2066 return;
96518518 2067err:
25e94a99 2068 nfnetlink_set_err(ctx->net, ctx->portid, NFNLGRP_NFTABLES, -ENOBUFS);
96518518
PM
2069}
2070
6e1f760e 2071struct nft_rule_dump_ctx {
e46abbcc 2072 char *table;
b7263e07 2073 char *chain;
6e1f760e
PNA
2074};
2075
96518518
PM
2076static int nf_tables_dump_rules(struct sk_buff *skb,
2077 struct netlink_callback *cb)
2078{
2079 const struct nfgenmsg *nfmsg = nlmsg_data(cb->nlh);
6e1f760e 2080 const struct nft_rule_dump_ctx *ctx = cb->data;
96518518
PM
2081 const struct nft_table *table;
2082 const struct nft_chain *chain;
2083 const struct nft_rule *rule;
2084 unsigned int idx = 0, s_idx = cb->args[0];
99633ab2 2085 struct net *net = sock_net(skb->sk);
96518518
PM
2086 int family = nfmsg->nfgen_family;
2087
e688a7f8 2088 rcu_read_lock();
38e029f1
PNA
2089 cb->seq = net->nft.base_seq;
2090
36596dad 2091 list_for_each_entry_rcu(table, &net->nft.tables, list) {
98319cb9 2092 if (family != NFPROTO_UNSPEC && family != table->family)
36596dad
PNA
2093 continue;
2094
2095 if (ctx && ctx->table && strcmp(ctx->table, table->name) != 0)
96518518
PM
2096 continue;
2097
36596dad
PNA
2098 list_for_each_entry_rcu(chain, &table->chains, list) {
2099 if (ctx && ctx->chain &&
2100 strcmp(ctx->chain, chain->name) != 0)
6e1f760e
PNA
2101 continue;
2102
36596dad
PNA
2103 list_for_each_entry_rcu(rule, &chain->rules, list) {
2104 if (!nft_is_active(net, rule))
2105 goto cont;
2106 if (idx < s_idx)
2107 goto cont;
2108 if (idx > s_idx)
2109 memset(&cb->args[1], 0,
2110 sizeof(cb->args) - sizeof(cb->args[0]));
2111 if (nf_tables_fill_rule_info(skb, net, NETLINK_CB(cb->skb).portid,
2112 cb->nlh->nlmsg_seq,
2113 NFT_MSG_NEWRULE,
2114 NLM_F_MULTI | NLM_F_APPEND,
98319cb9 2115 table->family,
36596dad
PNA
2116 table, chain, rule) < 0)
2117 goto done;
2118
2119 nl_dump_check_consistent(cb, nlmsg_hdr(skb));
96518518 2120cont:
36596dad 2121 idx++;
96518518
PM
2122 }
2123 }
2124 }
2125done:
e688a7f8
PNA
2126 rcu_read_unlock();
2127
96518518
PM
2128 cb->args[0] = idx;
2129 return skb->len;
2130}
2131
6e1f760e
PNA
2132static int nf_tables_dump_rules_done(struct netlink_callback *cb)
2133{
e46abbcc
PS
2134 struct nft_rule_dump_ctx *ctx = cb->data;
2135
2136 if (ctx) {
2137 kfree(ctx->table);
b7263e07 2138 kfree(ctx->chain);
e46abbcc
PS
2139 kfree(ctx);
2140 }
6e1f760e
PNA
2141 return 0;
2142}
2143
7b8002a1
PNA
2144static int nf_tables_getrule(struct net *net, struct sock *nlsk,
2145 struct sk_buff *skb, const struct nlmsghdr *nlh,
04ba724b
PNA
2146 const struct nlattr * const nla[],
2147 struct netlink_ext_ack *extack)
96518518
PM
2148{
2149 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
f2a6d766 2150 u8 genmask = nft_genmask_cur(net);
96518518
PM
2151 const struct nft_table *table;
2152 const struct nft_chain *chain;
2153 const struct nft_rule *rule;
2154 struct sk_buff *skb2;
2155 int family = nfmsg->nfgen_family;
2156 int err;
2157
2158 if (nlh->nlmsg_flags & NLM_F_DUMP) {
2159 struct netlink_dump_control c = {
2160 .dump = nf_tables_dump_rules,
6e1f760e 2161 .done = nf_tables_dump_rules_done,
96518518 2162 };
6e1f760e
PNA
2163
2164 if (nla[NFTA_RULE_TABLE] || nla[NFTA_RULE_CHAIN]) {
2165 struct nft_rule_dump_ctx *ctx;
2166
2167 ctx = kzalloc(sizeof(*ctx), GFP_KERNEL);
2168 if (!ctx)
2169 return -ENOMEM;
2170
e46abbcc
PS
2171 if (nla[NFTA_RULE_TABLE]) {
2172 ctx->table = nla_strdup(nla[NFTA_RULE_TABLE],
2173 GFP_KERNEL);
2174 if (!ctx->table) {
2175 kfree(ctx);
2176 return -ENOMEM;
2177 }
2178 }
b7263e07
PS
2179 if (nla[NFTA_RULE_CHAIN]) {
2180 ctx->chain = nla_strdup(nla[NFTA_RULE_CHAIN],
2181 GFP_KERNEL);
2182 if (!ctx->chain) {
2183 kfree(ctx->table);
2184 kfree(ctx);
2185 return -ENOMEM;
2186 }
2187 }
6e1f760e
PNA
2188 c.data = ctx;
2189 }
2190
96518518
PM
2191 return netlink_dump_start(nlsk, skb, nlh, &c);
2192 }
2193
98319cb9 2194 table = nf_tables_table_lookup(net, nla[NFTA_RULE_TABLE], family,
36596dad 2195 genmask);
96518518
PM
2196 if (IS_ERR(table))
2197 return PTR_ERR(table);
2198
664b0f8c 2199 chain = nf_tables_chain_lookup(table, nla[NFTA_RULE_CHAIN], genmask);
96518518
PM
2200 if (IS_ERR(chain))
2201 return PTR_ERR(chain);
2202
2203 rule = nf_tables_rule_lookup(chain, nla[NFTA_RULE_HANDLE]);
2204 if (IS_ERR(rule))
2205 return PTR_ERR(rule);
2206
2207 skb2 = alloc_skb(NLMSG_GOODSIZE, GFP_KERNEL);
2208 if (!skb2)
2209 return -ENOMEM;
2210
84d7fce6 2211 err = nf_tables_fill_rule_info(skb2, net, NETLINK_CB(skb).portid,
96518518
PM
2212 nlh->nlmsg_seq, NFT_MSG_NEWRULE, 0,
2213 family, table, chain, rule);
2214 if (err < 0)
2215 goto err;
2216
2217 return nlmsg_unicast(nlsk, skb2, NETLINK_CB(skb).portid);
2218
2219err:
2220 kfree_skb(skb2);
2221 return err;
2222}
2223
62472bce
PM
2224static void nf_tables_rule_destroy(const struct nft_ctx *ctx,
2225 struct nft_rule *rule)
96518518 2226{
96518518
PM
2227 struct nft_expr *expr;
2228
2229 /*
2230 * Careful: some expressions might not be initialized in case this
2231 * is called on error from nf_tables_newrule().
2232 */
2233 expr = nft_expr_first(rule);
3e38df13 2234 while (expr != nft_expr_last(rule) && expr->ops) {
62472bce 2235 nf_tables_expr_destroy(ctx, expr);
96518518
PM
2236 expr = nft_expr_next(expr);
2237 }
2238 kfree(rule);
2239}
2240
1081d11b
PNA
2241#define NFT_RULE_MAXEXPRS 128
2242
2243static struct nft_expr_info *info;
2244
633c9a84
PNA
2245static int nf_tables_newrule(struct net *net, struct sock *nlsk,
2246 struct sk_buff *skb, const struct nlmsghdr *nlh,
04ba724b
PNA
2247 const struct nlattr * const nla[],
2248 struct netlink_ext_ack *extack)
96518518
PM
2249{
2250 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
f2a6d766 2251 u8 genmask = nft_genmask_next(net);
98319cb9 2252 int family = nfmsg->nfgen_family;
96518518
PM
2253 struct nft_table *table;
2254 struct nft_chain *chain;
2255 struct nft_rule *rule, *old_rule = NULL;
86f1ec32 2256 struct nft_userdata *udata;
1081d11b 2257 struct nft_trans *trans = NULL;
96518518
PM
2258 struct nft_expr *expr;
2259 struct nft_ctx ctx;
2260 struct nlattr *tmp;
86f1ec32 2261 unsigned int size, i, n, ulen = 0, usize = 0;
96518518
PM
2262 int err, rem;
2263 bool create;
5e948466 2264 u64 handle, pos_handle;
96518518
PM
2265
2266 create = nlh->nlmsg_flags & NLM_F_CREATE ? true : false;
2267
98319cb9 2268 table = nf_tables_table_lookup(net, nla[NFTA_RULE_TABLE], family,
36596dad 2269 genmask);
96518518
PM
2270 if (IS_ERR(table))
2271 return PTR_ERR(table);
2272
664b0f8c 2273 chain = nf_tables_chain_lookup(table, nla[NFTA_RULE_CHAIN], genmask);
96518518
PM
2274 if (IS_ERR(chain))
2275 return PTR_ERR(chain);
2276
2277 if (nla[NFTA_RULE_HANDLE]) {
2278 handle = be64_to_cpu(nla_get_be64(nla[NFTA_RULE_HANDLE]));
2279 rule = __nf_tables_rule_lookup(chain, handle);
2280 if (IS_ERR(rule))
2281 return PTR_ERR(rule);
2282
2283 if (nlh->nlmsg_flags & NLM_F_EXCL)
2284 return -EEXIST;
2285 if (nlh->nlmsg_flags & NLM_F_REPLACE)
2286 old_rule = rule;
2287 else
2288 return -EOPNOTSUPP;
2289 } else {
2290 if (!create || nlh->nlmsg_flags & NLM_F_REPLACE)
2291 return -EINVAL;
2292 handle = nf_tables_alloc_handle(table);
a0a7379e
PNA
2293
2294 if (chain->use == UINT_MAX)
2295 return -EOVERFLOW;
96518518
PM
2296 }
2297
5e948466
EL
2298 if (nla[NFTA_RULE_POSITION]) {
2299 if (!(nlh->nlmsg_flags & NLM_F_CREATE))
2300 return -EOPNOTSUPP;
2301
2302 pos_handle = be64_to_cpu(nla_get_be64(nla[NFTA_RULE_POSITION]));
2303 old_rule = __nf_tables_rule_lookup(chain, pos_handle);
2304 if (IS_ERR(old_rule))
2305 return PTR_ERR(old_rule);
2306 }
2307
98319cb9 2308 nft_ctx_init(&ctx, net, skb, nlh, family, table, chain, nla);
0ca743a5 2309
96518518
PM
2310 n = 0;
2311 size = 0;
2312 if (nla[NFTA_RULE_EXPRESSIONS]) {
2313 nla_for_each_nested(tmp, nla[NFTA_RULE_EXPRESSIONS], rem) {
2314 err = -EINVAL;
2315 if (nla_type(tmp) != NFTA_LIST_ELEM)
2316 goto err1;
2317 if (n == NFT_RULE_MAXEXPRS)
2318 goto err1;
0ca743a5 2319 err = nf_tables_expr_parse(&ctx, tmp, &info[n]);
96518518
PM
2320 if (err < 0)
2321 goto err1;
2322 size += info[n].ops->size;
2323 n++;
2324 }
2325 }
9889840f
PM
2326 /* Check for overflow of dlen field */
2327 err = -EFBIG;
2328 if (size >= 1 << 12)
2329 goto err1;
96518518 2330
86f1ec32 2331 if (nla[NFTA_RULE_USERDATA]) {
0768b3b3 2332 ulen = nla_len(nla[NFTA_RULE_USERDATA]);
86f1ec32
PM
2333 if (ulen > 0)
2334 usize = sizeof(struct nft_userdata) + ulen;
2335 }
0768b3b3 2336
96518518 2337 err = -ENOMEM;
86f1ec32 2338 rule = kzalloc(sizeof(*rule) + size + usize, GFP_KERNEL);
96518518
PM
2339 if (rule == NULL)
2340 goto err1;
2341
889f7ee7 2342 nft_activate_next(net, rule);
0628b123 2343
96518518
PM
2344 rule->handle = handle;
2345 rule->dlen = size;
86f1ec32 2346 rule->udata = ulen ? 1 : 0;
0768b3b3 2347
86f1ec32
PM
2348 if (ulen) {
2349 udata = nft_userdata(rule);
2350 udata->len = ulen - 1;
2351 nla_memcpy(udata->data, nla[NFTA_RULE_USERDATA], ulen);
2352 }
96518518 2353
96518518
PM
2354 expr = nft_expr_first(rule);
2355 for (i = 0; i < n; i++) {
2356 err = nf_tables_newexpr(&ctx, &info[i], expr);
2357 if (err < 0)
2358 goto err2;
ef1f7df9 2359 info[i].ops = NULL;
96518518
PM
2360 expr = nft_expr_next(expr);
2361 }
2362
96518518 2363 if (nlh->nlmsg_flags & NLM_F_REPLACE) {
569ccae6 2364 if (!nft_is_active_next(net, old_rule)) {
0628b123
PNA
2365 err = -ENOENT;
2366 goto err2;
2367 }
569ccae6
FW
2368 trans = nft_trans_rule_add(&ctx, NFT_MSG_DELRULE,
2369 old_rule);
2370 if (trans == NULL) {
2371 err = -ENOMEM;
2372 goto err2;
2373 }
2374 nft_deactivate_next(net, old_rule);
2375 chain->use--;
96518518 2376
569ccae6
FW
2377 if (nft_trans_rule_add(&ctx, NFT_MSG_NEWRULE, rule) == NULL) {
2378 err = -ENOMEM;
2379 goto err2;
2380 }
2381
2382 list_add_tail_rcu(&rule->list, &old_rule->list);
2383 } else {
2384 if (nft_trans_rule_add(&ctx, NFT_MSG_NEWRULE, rule) == NULL) {
2385 err = -ENOMEM;
2386 goto err2;
2387 }
2388
2389 if (nlh->nlmsg_flags & NLM_F_APPEND) {
2390 if (old_rule)
2391 list_add_rcu(&rule->list, &old_rule->list);
2392 else
2393 list_add_tail_rcu(&rule->list, &chain->rules);
2394 } else {
2395 if (old_rule)
2396 list_add_tail_rcu(&rule->list, &old_rule->list);
2397 else
2398 list_add_rcu(&rule->list, &chain->rules);
2399 }
0628b123 2400 }
4fefee57 2401 chain->use++;
96518518
PM
2402 return 0;
2403
2404err2:
62472bce 2405 nf_tables_rule_destroy(&ctx, rule);
96518518
PM
2406err1:
2407 for (i = 0; i < n; i++) {
2408 if (info[i].ops != NULL)
ef1f7df9 2409 module_put(info[i].ops->type->owner);
96518518
PM
2410 }
2411 return err;
2412}
2413
1a94e38d
PNA
2414static struct nft_rule *nft_rule_lookup_byid(const struct net *net,
2415 const struct nlattr *nla)
2416{
2417 u32 id = ntohl(nla_get_be32(nla));
2418 struct nft_trans *trans;
2419
2420 list_for_each_entry(trans, &net->nft.commit_list, list) {
2421 struct nft_rule *rule = nft_trans_rule(trans);
2422
2423 if (trans->msg_type == NFT_MSG_NEWRULE &&
2424 id == nft_trans_rule_id(trans))
2425 return rule;
2426 }
2427 return ERR_PTR(-ENOENT);
2428}
2429
633c9a84
PNA
2430static int nf_tables_delrule(struct net *net, struct sock *nlsk,
2431 struct sk_buff *skb, const struct nlmsghdr *nlh,
04ba724b
PNA
2432 const struct nlattr * const nla[],
2433 struct netlink_ext_ack *extack)
96518518
PM
2434{
2435 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
f2a6d766 2436 u8 genmask = nft_genmask_next(net);
7c95f6d8 2437 struct nft_table *table;
cf9dc09d
PNA
2438 struct nft_chain *chain = NULL;
2439 struct nft_rule *rule;
0628b123
PNA
2440 int family = nfmsg->nfgen_family, err = 0;
2441 struct nft_ctx ctx;
96518518 2442
98319cb9 2443 table = nf_tables_table_lookup(net, nla[NFTA_RULE_TABLE], family,
36596dad 2444 genmask);
96518518
PM
2445 if (IS_ERR(table))
2446 return PTR_ERR(table);
2447
cf9dc09d 2448 if (nla[NFTA_RULE_CHAIN]) {
664b0f8c
PNA
2449 chain = nf_tables_chain_lookup(table, nla[NFTA_RULE_CHAIN],
2450 genmask);
cf9dc09d
PNA
2451 if (IS_ERR(chain))
2452 return PTR_ERR(chain);
2453 }
96518518 2454
98319cb9 2455 nft_ctx_init(&ctx, net, skb, nlh, family, table, chain, nla);
0628b123 2456
cf9dc09d
PNA
2457 if (chain) {
2458 if (nla[NFTA_RULE_HANDLE]) {
2459 rule = nf_tables_rule_lookup(chain,
2460 nla[NFTA_RULE_HANDLE]);
2461 if (IS_ERR(rule))
2462 return PTR_ERR(rule);
96518518 2463
1a94e38d
PNA
2464 err = nft_delrule(&ctx, rule);
2465 } else if (nla[NFTA_RULE_ID]) {
2466 rule = nft_rule_lookup_byid(net, nla[NFTA_RULE_ID]);
2467 if (IS_ERR(rule))
2468 return PTR_ERR(rule);
2469
5e266fe7 2470 err = nft_delrule(&ctx, rule);
cf9dc09d 2471 } else {
ce24b721 2472 err = nft_delrule_by_chain(&ctx);
cf9dc09d
PNA
2473 }
2474 } else {
2475 list_for_each_entry(chain, &table->chains, list) {
664b0f8c
PNA
2476 if (!nft_is_active_next(net, chain))
2477 continue;
2478
cf9dc09d 2479 ctx.chain = chain;
ce24b721 2480 err = nft_delrule_by_chain(&ctx);
0628b123
PNA
2481 if (err < 0)
2482 break;
2483 }
2484 }
2485
2486 return err;
2487}
2488
20a69341
PM
2489/*
2490 * Sets
2491 */
2492
2b664957 2493static LIST_HEAD(nf_tables_set_types);
20a69341 2494
2b664957 2495int nft_register_set(struct nft_set_type *type)
20a69341
PM
2496{
2497 nfnl_lock(NFNL_SUBSYS_NFTABLES);
2b664957 2498 list_add_tail_rcu(&type->list, &nf_tables_set_types);
20a69341
PM
2499 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
2500 return 0;
2501}
2502EXPORT_SYMBOL_GPL(nft_register_set);
2503
2b664957 2504void nft_unregister_set(struct nft_set_type *type)
20a69341
PM
2505{
2506 nfnl_lock(NFNL_SUBSYS_NFTABLES);
2b664957 2507 list_del_rcu(&type->list);
20a69341
PM
2508 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
2509}
2510EXPORT_SYMBOL_GPL(nft_unregister_set);
2511
2b664957
PNA
2512#define NFT_SET_FEATURES (NFT_SET_INTERVAL | NFT_SET_MAP | \
2513 NFT_SET_TIMEOUT | NFT_SET_OBJECT)
2514
2515static bool nft_set_ops_candidate(const struct nft_set_ops *ops, u32 flags)
2516{
4f2921ca
FW
2517 if ((flags & NFT_SET_EVAL) && !ops->update)
2518 return false;
2519
2b664957
PNA
2520 return (flags & ops->features) == (flags & NFT_SET_FEATURES);
2521}
2522
c50b960c
PM
2523/*
2524 * Select a set implementation based on the data characteristics and the
2525 * given policy. The total memory use might not be known if no size is
2526 * given, in that case the amount of memory per element is used.
2527 */
2528static const struct nft_set_ops *
2b664957
PNA
2529nft_select_set_ops(const struct nft_ctx *ctx,
2530 const struct nlattr * const nla[],
c50b960c
PM
2531 const struct nft_set_desc *desc,
2532 enum nft_set_policies policy)
20a69341 2533{
c50b960c
PM
2534 const struct nft_set_ops *ops, *bops;
2535 struct nft_set_estimate est, best;
2b664957
PNA
2536 const struct nft_set_type *type;
2537 u32 flags = 0;
20a69341
PM
2538
2539#ifdef CONFIG_MODULES
2b664957 2540 if (list_empty(&nf_tables_set_types)) {
20a69341
PM
2541 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
2542 request_module("nft-set");
2543 nfnl_lock(NFNL_SUBSYS_NFTABLES);
2b664957 2544 if (!list_empty(&nf_tables_set_types))
20a69341
PM
2545 return ERR_PTR(-EAGAIN);
2546 }
2547#endif
2b664957
PNA
2548 if (nla[NFTA_SET_FLAGS] != NULL)
2549 flags = ntohl(nla_get_be32(nla[NFTA_SET_FLAGS]));
20a69341 2550
55af753c
PNA
2551 bops = NULL;
2552 best.size = ~0;
2553 best.lookup = ~0;
0b5a7874 2554 best.space = ~0;
c50b960c 2555
2b664957
PNA
2556 list_for_each_entry(type, &nf_tables_set_types, list) {
2557 if (!type->select_ops)
2558 ops = type->ops;
2559 else
2560 ops = type->select_ops(ctx, desc, flags);
2561 if (!ops)
2562 continue;
2563
2564 if (!nft_set_ops_candidate(ops, flags))
20a69341 2565 continue;
2b664957 2566 if (!ops->estimate(desc, flags, &est))
c50b960c
PM
2567 continue;
2568
2569 switch (policy) {
2570 case NFT_SET_POL_PERFORMANCE:
55af753c 2571 if (est.lookup < best.lookup)
c50b960c 2572 break;
644e334e
PNA
2573 if (est.lookup == best.lookup &&
2574 est.space < best.space)
2575 break;
c50b960c
PM
2576 continue;
2577 case NFT_SET_POL_MEMORY:
0b5a7874
PNA
2578 if (!desc->size) {
2579 if (est.space < best.space)
2580 break;
2581 if (est.space == best.space &&
2582 est.lookup < best.lookup)
2583 break;
4f2921ca 2584 } else if (est.size < best.size || !bops) {
c50b960c 2585 break;
0b5a7874 2586 }
c50b960c
PM
2587 continue;
2588 default:
2589 break;
2590 }
2591
2b664957 2592 if (!try_module_get(type->owner))
20a69341 2593 continue;
c50b960c 2594 if (bops != NULL)
2b664957 2595 module_put(bops->type->owner);
c50b960c
PM
2596
2597 bops = ops;
2598 best = est;
20a69341
PM
2599 }
2600
c50b960c
PM
2601 if (bops != NULL)
2602 return bops;
2603
20a69341
PM
2604 return ERR_PTR(-EOPNOTSUPP);
2605}
2606
2607static const struct nla_policy nft_set_policy[NFTA_SET_MAX + 1] = {
b2fbd044
LZ
2608 [NFTA_SET_TABLE] = { .type = NLA_STRING,
2609 .len = NFT_TABLE_MAXNAMELEN - 1 },
a9bdd836 2610 [NFTA_SET_NAME] = { .type = NLA_STRING,
cb39ad8b 2611 .len = NFT_SET_MAXNAMELEN - 1 },
20a69341
PM
2612 [NFTA_SET_FLAGS] = { .type = NLA_U32 },
2613 [NFTA_SET_KEY_TYPE] = { .type = NLA_U32 },
2614 [NFTA_SET_KEY_LEN] = { .type = NLA_U32 },
2615 [NFTA_SET_DATA_TYPE] = { .type = NLA_U32 },
2616 [NFTA_SET_DATA_LEN] = { .type = NLA_U32 },
c50b960c
PM
2617 [NFTA_SET_POLICY] = { .type = NLA_U32 },
2618 [NFTA_SET_DESC] = { .type = NLA_NESTED },
958bee14 2619 [NFTA_SET_ID] = { .type = NLA_U32 },
761da293
PM
2620 [NFTA_SET_TIMEOUT] = { .type = NLA_U64 },
2621 [NFTA_SET_GC_INTERVAL] = { .type = NLA_U32 },
e6d8ecac
CFG
2622 [NFTA_SET_USERDATA] = { .type = NLA_BINARY,
2623 .len = NFT_USERDATA_MAXLEN },
8aeff920 2624 [NFTA_SET_OBJ_TYPE] = { .type = NLA_U32 },
3ecbfd65 2625 [NFTA_SET_HANDLE] = { .type = NLA_U64 },
c50b960c
PM
2626};
2627
2628static const struct nla_policy nft_set_desc_policy[NFTA_SET_DESC_MAX + 1] = {
2629 [NFTA_SET_DESC_SIZE] = { .type = NLA_U32 },
20a69341
PM
2630};
2631
633c9a84 2632static int nft_ctx_init_from_setattr(struct nft_ctx *ctx, struct net *net,
20a69341
PM
2633 const struct sk_buff *skb,
2634 const struct nlmsghdr *nlh,
f2a6d766
PNA
2635 const struct nlattr * const nla[],
2636 u8 genmask)
20a69341
PM
2637{
2638 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
98319cb9 2639 int family = nfmsg->nfgen_family;
7c95f6d8 2640 struct nft_table *table = NULL;
20a69341 2641
20a69341 2642 if (nla[NFTA_SET_TABLE] != NULL) {
36596dad 2643 table = nf_tables_table_lookup(net, nla[NFTA_SET_TABLE],
98319cb9 2644 family, genmask);
20a69341
PM
2645 if (IS_ERR(table))
2646 return PTR_ERR(table);
2647 }
2648
98319cb9 2649 nft_ctx_init(ctx, net, skb, nlh, family, table, NULL, nla);
20a69341
PM
2650 return 0;
2651}
2652
c7a72e3f
PNA
2653static struct nft_set *nf_tables_set_lookup(const struct nft_table *table,
2654 const struct nlattr *nla, u8 genmask)
20a69341
PM
2655{
2656 struct nft_set *set;
2657
2658 if (nla == NULL)
2659 return ERR_PTR(-EINVAL);
2660
2661 list_for_each_entry(set, &table->sets, list) {
37a9cc52
PNA
2662 if (!nla_strcmp(nla, set->name) &&
2663 nft_active_genmask(set, genmask))
20a69341
PM
2664 return set;
2665 }
2666 return ERR_PTR(-ENOENT);
2667}
2668
3ecbfd65
HS
2669static struct nft_set *nf_tables_set_lookup_byhandle(const struct nft_table *table,
2670 const struct nlattr *nla, u8 genmask)
2671{
2672 struct nft_set *set;
2673
2674 if (nla == NULL)
2675 return ERR_PTR(-EINVAL);
2676
2677 list_for_each_entry(set, &table->sets, list) {
2678 if (be64_to_cpu(nla_get_be64(nla)) == set->handle &&
2679 nft_active_genmask(set, genmask))
2680 return set;
2681 }
2682 return ERR_PTR(-ENOENT);
2683}
2684
c7a72e3f
PNA
2685static struct nft_set *nf_tables_set_lookup_byid(const struct net *net,
2686 const struct nlattr *nla,
2687 u8 genmask)
958bee14
PNA
2688{
2689 struct nft_trans *trans;
2690 u32 id = ntohl(nla_get_be32(nla));
2691
2692 list_for_each_entry(trans, &net->nft.commit_list, list) {
37a9cc52
PNA
2693 struct nft_set *set = nft_trans_set(trans);
2694
958bee14 2695 if (trans->msg_type == NFT_MSG_NEWSET &&
37a9cc52
PNA
2696 id == nft_trans_set_id(trans) &&
2697 nft_active_genmask(set, genmask))
2698 return set;
958bee14
PNA
2699 }
2700 return ERR_PTR(-ENOENT);
2701}
c7a72e3f 2702
10659cba
PNA
2703struct nft_set *nft_set_lookup_global(const struct net *net,
2704 const struct nft_table *table,
2705 const struct nlattr *nla_set_name,
2706 const struct nlattr *nla_set_id,
2707 u8 genmask)
c7a72e3f
PNA
2708{
2709 struct nft_set *set;
2710
2711 set = nf_tables_set_lookup(table, nla_set_name, genmask);
2712 if (IS_ERR(set)) {
2713 if (!nla_set_id)
2714 return set;
2715
2716 set = nf_tables_set_lookup_byid(net, nla_set_id, genmask);
2717 }
2718 return set;
2719}
10659cba 2720EXPORT_SYMBOL_GPL(nft_set_lookup_global);
958bee14 2721
20a69341
PM
2722static int nf_tables_set_alloc_name(struct nft_ctx *ctx, struct nft_set *set,
2723 const char *name)
2724{
2725 const struct nft_set *i;
2726 const char *p;
2727 unsigned long *inuse;
60eb1894 2728 unsigned int n = 0, min = 0;
20a69341 2729
38745490 2730 p = strchr(name, '%');
20a69341
PM
2731 if (p != NULL) {
2732 if (p[1] != 'd' || strchr(p + 2, '%'))
2733 return -EINVAL;
2734
2735 inuse = (unsigned long *)get_zeroed_page(GFP_KERNEL);
2736 if (inuse == NULL)
2737 return -ENOMEM;
60eb1894 2738cont:
20a69341 2739 list_for_each_entry(i, &ctx->table->sets, list) {
14662917
DB
2740 int tmp;
2741
37a9cc52
PNA
2742 if (!nft_is_active_next(ctx->net, set))
2743 continue;
14662917 2744 if (!sscanf(i->name, name, &tmp))
20a69341 2745 continue;
60eb1894 2746 if (tmp < min || tmp >= min + BITS_PER_BYTE * PAGE_SIZE)
20a69341 2747 continue;
14662917 2748
60eb1894 2749 set_bit(tmp - min, inuse);
20a69341
PM
2750 }
2751
53b70287 2752 n = find_first_zero_bit(inuse, BITS_PER_BYTE * PAGE_SIZE);
60eb1894
PM
2753 if (n >= BITS_PER_BYTE * PAGE_SIZE) {
2754 min += BITS_PER_BYTE * PAGE_SIZE;
2755 memset(inuse, 0, PAGE_SIZE);
2756 goto cont;
2757 }
20a69341
PM
2758 free_page((unsigned long)inuse);
2759 }
2760
38745490
PS
2761 set->name = kasprintf(GFP_KERNEL, name, min + n);
2762 if (!set->name)
2763 return -ENOMEM;
2764
20a69341 2765 list_for_each_entry(i, &ctx->table->sets, list) {
37a9cc52
PNA
2766 if (!nft_is_active_next(ctx->net, i))
2767 continue;
e63aaaa6
AY
2768 if (!strcmp(set->name, i->name)) {
2769 kfree(set->name);
20a69341 2770 return -ENFILE;
e63aaaa6 2771 }
20a69341
PM
2772 }
2773 return 0;
2774}
2775
2776static int nf_tables_fill_set(struct sk_buff *skb, const struct nft_ctx *ctx,
2777 const struct nft_set *set, u16 event, u16 flags)
2778{
2779 struct nfgenmsg *nfmsg;
2780 struct nlmsghdr *nlh;
c50b960c 2781 struct nlattr *desc;
128ad332
PNA
2782 u32 portid = ctx->portid;
2783 u32 seq = ctx->seq;
20a69341 2784
dedb67c4 2785 event = nfnl_msg_type(NFNL_SUBSYS_NFTABLES, event);
20a69341
PM
2786 nlh = nlmsg_put(skb, portid, seq, event, sizeof(struct nfgenmsg),
2787 flags);
2788 if (nlh == NULL)
2789 goto nla_put_failure;
2790
2791 nfmsg = nlmsg_data(nlh);
36596dad 2792 nfmsg->nfgen_family = ctx->family;
20a69341 2793 nfmsg->version = NFNETLINK_V0;
84d7fce6 2794 nfmsg->res_id = htons(ctx->net->nft.base_seq & 0xffff);
20a69341
PM
2795
2796 if (nla_put_string(skb, NFTA_SET_TABLE, ctx->table->name))
2797 goto nla_put_failure;
2798 if (nla_put_string(skb, NFTA_SET_NAME, set->name))
2799 goto nla_put_failure;
3ecbfd65
HS
2800 if (nla_put_be64(skb, NFTA_SET_HANDLE, cpu_to_be64(set->handle),
2801 NFTA_SET_PAD))
2802 goto nla_put_failure;
20a69341
PM
2803 if (set->flags != 0)
2804 if (nla_put_be32(skb, NFTA_SET_FLAGS, htonl(set->flags)))
2805 goto nla_put_failure;
2806
2807 if (nla_put_be32(skb, NFTA_SET_KEY_TYPE, htonl(set->ktype)))
2808 goto nla_put_failure;
2809 if (nla_put_be32(skb, NFTA_SET_KEY_LEN, htonl(set->klen)))
2810 goto nla_put_failure;
2811 if (set->flags & NFT_SET_MAP) {
2812 if (nla_put_be32(skb, NFTA_SET_DATA_TYPE, htonl(set->dtype)))
2813 goto nla_put_failure;
2814 if (nla_put_be32(skb, NFTA_SET_DATA_LEN, htonl(set->dlen)))
2815 goto nla_put_failure;
2816 }
8aeff920
PNA
2817 if (set->flags & NFT_SET_OBJECT &&
2818 nla_put_be32(skb, NFTA_SET_OBJ_TYPE, htonl(set->objtype)))
2819 goto nla_put_failure;
20a69341 2820
761da293 2821 if (set->timeout &&
d3e2a111
AP
2822 nla_put_be64(skb, NFTA_SET_TIMEOUT,
2823 cpu_to_be64(jiffies_to_msecs(set->timeout)),
b46f6ded 2824 NFTA_SET_PAD))
761da293
PM
2825 goto nla_put_failure;
2826 if (set->gc_int &&
2827 nla_put_be32(skb, NFTA_SET_GC_INTERVAL, htonl(set->gc_int)))
2828 goto nla_put_failure;
2829
9363dc4b
AB
2830 if (set->policy != NFT_SET_POL_PERFORMANCE) {
2831 if (nla_put_be32(skb, NFTA_SET_POLICY, htonl(set->policy)))
2832 goto nla_put_failure;
2833 }
2834
e6d8ecac
CFG
2835 if (nla_put(skb, NFTA_SET_USERDATA, set->udlen, set->udata))
2836 goto nla_put_failure;
2837
c50b960c
PM
2838 desc = nla_nest_start(skb, NFTA_SET_DESC);
2839 if (desc == NULL)
2840 goto nla_put_failure;
2841 if (set->size &&
2842 nla_put_be32(skb, NFTA_SET_DESC_SIZE, htonl(set->size)))
2843 goto nla_put_failure;
2844 nla_nest_end(skb, desc);
2845
053c095a
JB
2846 nlmsg_end(skb, nlh);
2847 return 0;
20a69341
PM
2848
2849nla_put_failure:
2850 nlmsg_trim(skb, nlh);
2851 return -1;
2852}
2853
25e94a99
PNA
2854static void nf_tables_set_notify(const struct nft_ctx *ctx,
2855 const struct nft_set *set, int event,
2856 gfp_t gfp_flags)
20a69341
PM
2857{
2858 struct sk_buff *skb;
128ad332 2859 u32 portid = ctx->portid;
20a69341
PM
2860 int err;
2861
128ad332
PNA
2862 if (!ctx->report &&
2863 !nfnetlink_has_listeners(ctx->net, NFNLGRP_NFTABLES))
25e94a99 2864 return;
20a69341 2865
31f8441c 2866 skb = nlmsg_new(NLMSG_GOODSIZE, gfp_flags);
20a69341
PM
2867 if (skb == NULL)
2868 goto err;
2869
2870 err = nf_tables_fill_set(skb, ctx, set, event, 0);
2871 if (err < 0) {
2872 kfree_skb(skb);
2873 goto err;
2874 }
2875
25e94a99
PNA
2876 nfnetlink_send(skb, ctx->net, portid, NFNLGRP_NFTABLES, ctx->report,
2877 gfp_flags);
2878 return;
20a69341 2879err:
25e94a99 2880 nfnetlink_set_err(ctx->net, portid, NFNLGRP_NFTABLES, -ENOBUFS);
20a69341
PM
2881}
2882
5b96af77 2883static int nf_tables_dump_sets(struct sk_buff *skb, struct netlink_callback *cb)
c9c8e485
PNA
2884{
2885 const struct nft_set *set;
2886 unsigned int idx, s_idx = cb->args[0];
c9c8e485
PNA
2887 struct nft_table *table, *cur_table = (struct nft_table *)cb->args[2];
2888 struct net *net = sock_net(skb->sk);
5b96af77 2889 struct nft_ctx *ctx = cb->data, ctx_set;
c9c8e485
PNA
2890
2891 if (cb->args[1])
2892 return skb->len;
2893
e688a7f8 2894 rcu_read_lock();
38e029f1
PNA
2895 cb->seq = net->nft.base_seq;
2896
36596dad
PNA
2897 list_for_each_entry_rcu(table, &net->nft.tables, list) {
2898 if (ctx->family != NFPROTO_UNSPEC &&
98319cb9 2899 ctx->family != table->family)
36596dad
PNA
2900 continue;
2901
2902 if (ctx->table && ctx->table != table)
5b96af77
PNA
2903 continue;
2904
36596dad
PNA
2905 if (cur_table) {
2906 if (cur_table != table)
c9c8e485
PNA
2907 continue;
2908
36596dad 2909 cur_table = NULL;
c9c8e485 2910 }
36596dad
PNA
2911 idx = 0;
2912 list_for_each_entry_rcu(set, &table->sets, list) {
2913 if (idx < s_idx)
2914 goto cont;
2915 if (!nft_is_active(net, set))
2916 goto cont;
5b96af77 2917
36596dad
PNA
2918 ctx_set = *ctx;
2919 ctx_set.table = table;
98319cb9 2920 ctx_set.family = table->family;
c9c8e485 2921
36596dad
PNA
2922 if (nf_tables_fill_set(skb, &ctx_set, set,
2923 NFT_MSG_NEWSET,
2924 NLM_F_MULTI) < 0) {
2925 cb->args[0] = idx;
2926 cb->args[2] = (unsigned long) table;
2927 goto done;
c9c8e485 2928 }
36596dad 2929 nl_dump_check_consistent(cb, nlmsg_hdr(skb));
c9c8e485 2930cont:
36596dad 2931 idx++;
c9c8e485 2932 }
36596dad
PNA
2933 if (s_idx)
2934 s_idx = 0;
c9c8e485
PNA
2935 }
2936 cb->args[1] = 1;
2937done:
e688a7f8 2938 rcu_read_unlock();
c9c8e485
PNA
2939 return skb->len;
2940}
2941
5b96af77 2942static int nf_tables_dump_sets_done(struct netlink_callback *cb)
20a69341 2943{
5b96af77
PNA
2944 kfree(cb->data);
2945 return 0;
20a69341
PM
2946}
2947
7b8002a1
PNA
2948static int nf_tables_getset(struct net *net, struct sock *nlsk,
2949 struct sk_buff *skb, const struct nlmsghdr *nlh,
04ba724b
PNA
2950 const struct nlattr * const nla[],
2951 struct netlink_ext_ack *extack)
20a69341 2952{
f2a6d766 2953 u8 genmask = nft_genmask_cur(net);
20a69341
PM
2954 const struct nft_set *set;
2955 struct nft_ctx ctx;
2956 struct sk_buff *skb2;
c9c8e485 2957 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
20a69341
PM
2958 int err;
2959
01cfa0a4 2960 /* Verify existence before starting dump */
f2a6d766 2961 err = nft_ctx_init_from_setattr(&ctx, net, skb, nlh, nla, genmask);
20a69341
PM
2962 if (err < 0)
2963 return err;
2964
2965 if (nlh->nlmsg_flags & NLM_F_DUMP) {
2966 struct netlink_dump_control c = {
2967 .dump = nf_tables_dump_sets,
5b96af77 2968 .done = nf_tables_dump_sets_done,
20a69341 2969 };
5b96af77
PNA
2970 struct nft_ctx *ctx_dump;
2971
2972 ctx_dump = kmalloc(sizeof(*ctx_dump), GFP_KERNEL);
2973 if (ctx_dump == NULL)
2974 return -ENOMEM;
2975
2976 *ctx_dump = ctx;
2977 c.data = ctx_dump;
2978
20a69341
PM
2979 return netlink_dump_start(nlsk, skb, nlh, &c);
2980 }
2981
c9c8e485
PNA
2982 /* Only accept unspec with dump */
2983 if (nfmsg->nfgen_family == NFPROTO_UNSPEC)
2984 return -EAFNOSUPPORT;
eaa2bcd6
PT
2985 if (!nla[NFTA_SET_TABLE])
2986 return -EINVAL;
c9c8e485 2987
37a9cc52 2988 set = nf_tables_set_lookup(ctx.table, nla[NFTA_SET_NAME], genmask);
20a69341
PM
2989 if (IS_ERR(set))
2990 return PTR_ERR(set);
2991
2992 skb2 = alloc_skb(NLMSG_GOODSIZE, GFP_KERNEL);
2993 if (skb2 == NULL)
2994 return -ENOMEM;
2995
2996 err = nf_tables_fill_set(skb2, &ctx, set, NFT_MSG_NEWSET, 0);
2997 if (err < 0)
2998 goto err;
2999
3000 return nlmsg_unicast(nlsk, skb2, NETLINK_CB(skb).portid);
3001
3002err:
3003 kfree_skb(skb2);
3004 return err;
3005}
3006
c50b960c
PM
3007static int nf_tables_set_desc_parse(const struct nft_ctx *ctx,
3008 struct nft_set_desc *desc,
3009 const struct nlattr *nla)
3010{
3011 struct nlattr *da[NFTA_SET_DESC_MAX + 1];
3012 int err;
3013
fceb6435
JB
3014 err = nla_parse_nested(da, NFTA_SET_DESC_MAX, nla,
3015 nft_set_desc_policy, NULL);
c50b960c
PM
3016 if (err < 0)
3017 return err;
3018
3019 if (da[NFTA_SET_DESC_SIZE] != NULL)
3020 desc->size = ntohl(nla_get_be32(da[NFTA_SET_DESC_SIZE]));
3021
3022 return 0;
3023}
3024
633c9a84
PNA
3025static int nf_tables_newset(struct net *net, struct sock *nlsk,
3026 struct sk_buff *skb, const struct nlmsghdr *nlh,
04ba724b
PNA
3027 const struct nlattr * const nla[],
3028 struct netlink_ext_ack *extack)
20a69341
PM
3029{
3030 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
f2a6d766 3031 u8 genmask = nft_genmask_next(net);
98319cb9 3032 int family = nfmsg->nfgen_family;
20a69341 3033 const struct nft_set_ops *ops;
20a69341
PM
3034 struct nft_table *table;
3035 struct nft_set *set;
3036 struct nft_ctx ctx;
38745490 3037 char *name;
20a69341
PM
3038 unsigned int size;
3039 bool create;
761da293 3040 u64 timeout;
8aeff920 3041 u32 ktype, dtype, flags, policy, gc_int, objtype;
c50b960c 3042 struct nft_set_desc desc;
e6d8ecac
CFG
3043 unsigned char *udata;
3044 u16 udlen;
20a69341
PM
3045 int err;
3046
3047 if (nla[NFTA_SET_TABLE] == NULL ||
3048 nla[NFTA_SET_NAME] == NULL ||
958bee14
PNA
3049 nla[NFTA_SET_KEY_LEN] == NULL ||
3050 nla[NFTA_SET_ID] == NULL)
20a69341
PM
3051 return -EINVAL;
3052
c50b960c
PM
3053 memset(&desc, 0, sizeof(desc));
3054
20a69341
PM
3055 ktype = NFT_DATA_VALUE;
3056 if (nla[NFTA_SET_KEY_TYPE] != NULL) {
3057 ktype = ntohl(nla_get_be32(nla[NFTA_SET_KEY_TYPE]));
3058 if ((ktype & NFT_DATA_RESERVED_MASK) == NFT_DATA_RESERVED_MASK)
3059 return -EINVAL;
3060 }
3061
c50b960c 3062 desc.klen = ntohl(nla_get_be32(nla[NFTA_SET_KEY_LEN]));
7d740264 3063 if (desc.klen == 0 || desc.klen > NFT_DATA_VALUE_MAXLEN)
20a69341
PM
3064 return -EINVAL;
3065
3066 flags = 0;
3067 if (nla[NFTA_SET_FLAGS] != NULL) {
3068 flags = ntohl(nla_get_be32(nla[NFTA_SET_FLAGS]));
3069 if (flags & ~(NFT_SET_ANONYMOUS | NFT_SET_CONSTANT |
7c6c6e95 3070 NFT_SET_INTERVAL | NFT_SET_TIMEOUT |
8aeff920
PNA
3071 NFT_SET_MAP | NFT_SET_EVAL |
3072 NFT_SET_OBJECT))
20a69341 3073 return -EINVAL;
8aeff920
PNA
3074 /* Only one of these operations is supported */
3075 if ((flags & (NFT_SET_MAP | NFT_SET_EVAL | NFT_SET_OBJECT)) ==
3076 (NFT_SET_MAP | NFT_SET_EVAL | NFT_SET_OBJECT))
7c6c6e95 3077 return -EOPNOTSUPP;
20a69341
PM
3078 }
3079
3080 dtype = 0;
20a69341
PM
3081 if (nla[NFTA_SET_DATA_TYPE] != NULL) {
3082 if (!(flags & NFT_SET_MAP))
3083 return -EINVAL;
3084
3085 dtype = ntohl(nla_get_be32(nla[NFTA_SET_DATA_TYPE]));
3086 if ((dtype & NFT_DATA_RESERVED_MASK) == NFT_DATA_RESERVED_MASK &&
3087 dtype != NFT_DATA_VERDICT)
3088 return -EINVAL;
3089
3090 if (dtype != NFT_DATA_VERDICT) {
3091 if (nla[NFTA_SET_DATA_LEN] == NULL)
3092 return -EINVAL;
c50b960c 3093 desc.dlen = ntohl(nla_get_be32(nla[NFTA_SET_DATA_LEN]));
7d740264 3094 if (desc.dlen == 0 || desc.dlen > NFT_DATA_VALUE_MAXLEN)
20a69341
PM
3095 return -EINVAL;
3096 } else
7d740264 3097 desc.dlen = sizeof(struct nft_verdict);
20a69341
PM
3098 } else if (flags & NFT_SET_MAP)
3099 return -EINVAL;
3100
8aeff920
PNA
3101 if (nla[NFTA_SET_OBJ_TYPE] != NULL) {
3102 if (!(flags & NFT_SET_OBJECT))
3103 return -EINVAL;
3104
3105 objtype = ntohl(nla_get_be32(nla[NFTA_SET_OBJ_TYPE]));
3106 if (objtype == NFT_OBJECT_UNSPEC ||
3107 objtype > NFT_OBJECT_MAX)
3108 return -EINVAL;
3109 } else if (flags & NFT_SET_OBJECT)
3110 return -EINVAL;
3111 else
3112 objtype = NFT_OBJECT_UNSPEC;
3113
761da293
PM
3114 timeout = 0;
3115 if (nla[NFTA_SET_TIMEOUT] != NULL) {
3116 if (!(flags & NFT_SET_TIMEOUT))
3117 return -EINVAL;
d3e2a111
AP
3118 timeout = msecs_to_jiffies(be64_to_cpu(nla_get_be64(
3119 nla[NFTA_SET_TIMEOUT])));
761da293
PM
3120 }
3121 gc_int = 0;
3122 if (nla[NFTA_SET_GC_INTERVAL] != NULL) {
3123 if (!(flags & NFT_SET_TIMEOUT))
3124 return -EINVAL;
3125 gc_int = ntohl(nla_get_be32(nla[NFTA_SET_GC_INTERVAL]));
3126 }
3127
c50b960c
PM
3128 policy = NFT_SET_POL_PERFORMANCE;
3129 if (nla[NFTA_SET_POLICY] != NULL)
3130 policy = ntohl(nla_get_be32(nla[NFTA_SET_POLICY]));
3131
3132 if (nla[NFTA_SET_DESC] != NULL) {
3133 err = nf_tables_set_desc_parse(&ctx, &desc, nla[NFTA_SET_DESC]);
3134 if (err < 0)
3135 return err;
3136 }
3137
20a69341
PM
3138 create = nlh->nlmsg_flags & NLM_F_CREATE ? true : false;
3139
98319cb9 3140 table = nf_tables_table_lookup(net, nla[NFTA_SET_TABLE], family,
36596dad 3141 genmask);
20a69341
PM
3142 if (IS_ERR(table))
3143 return PTR_ERR(table);
3144
98319cb9 3145 nft_ctx_init(&ctx, net, skb, nlh, family, table, NULL, nla);
20a69341 3146
37a9cc52 3147 set = nf_tables_set_lookup(table, nla[NFTA_SET_NAME], genmask);
20a69341
PM
3148 if (IS_ERR(set)) {
3149 if (PTR_ERR(set) != -ENOENT)
3150 return PTR_ERR(set);
1a28ad74 3151 } else {
20a69341
PM
3152 if (nlh->nlmsg_flags & NLM_F_EXCL)
3153 return -EEXIST;
3154 if (nlh->nlmsg_flags & NLM_F_REPLACE)
3155 return -EOPNOTSUPP;
3156 return 0;
3157 }
3158
3159 if (!(nlh->nlmsg_flags & NLM_F_CREATE))
3160 return -ENOENT;
3161
2b664957 3162 ops = nft_select_set_ops(&ctx, nla, &desc, policy);
20a69341
PM
3163 if (IS_ERR(ops))
3164 return PTR_ERR(ops);
3165
e6d8ecac
CFG
3166 udlen = 0;
3167 if (nla[NFTA_SET_USERDATA])
3168 udlen = nla_len(nla[NFTA_SET_USERDATA]);
3169
20a69341
PM
3170 size = 0;
3171 if (ops->privsize != NULL)
347b408d 3172 size = ops->privsize(nla, &desc);
20a69341 3173
1ff75a3e
PNA
3174 set = kvzalloc(sizeof(*set) + size + udlen, GFP_KERNEL);
3175 if (!set) {
3176 err = -ENOMEM;
20a69341 3177 goto err1;
1ff75a3e 3178 }
20a69341 3179
38745490
PS
3180 name = nla_strdup(nla[NFTA_SET_NAME], GFP_KERNEL);
3181 if (!name) {
3182 err = -ENOMEM;
3183 goto err2;
3184 }
3185
20a69341 3186 err = nf_tables_set_alloc_name(&ctx, set, name);
38745490 3187 kfree(name);
20a69341
PM
3188 if (err < 0)
3189 goto err2;
3190
e6d8ecac
CFG
3191 udata = NULL;
3192 if (udlen) {
3193 udata = set->data + size;
3194 nla_memcpy(udata, nla[NFTA_SET_USERDATA], udlen);
3195 }
3196
20a69341
PM
3197 INIT_LIST_HEAD(&set->bindings);
3198 set->ops = ops;
3199 set->ktype = ktype;
c50b960c 3200 set->klen = desc.klen;
20a69341 3201 set->dtype = dtype;
8aeff920 3202 set->objtype = objtype;
c50b960c 3203 set->dlen = desc.dlen;
20a69341 3204 set->flags = flags;
c50b960c 3205 set->size = desc.size;
9363dc4b 3206 set->policy = policy;
e6d8ecac
CFG
3207 set->udlen = udlen;
3208 set->udata = udata;
761da293
PM
3209 set->timeout = timeout;
3210 set->gc_int = gc_int;
3ecbfd65 3211 set->handle = nf_tables_alloc_handle(table);
20a69341 3212
c50b960c 3213 err = ops->init(set, &desc, nla);
20a69341 3214 if (err < 0)
2f6adf48 3215 goto err3;
20a69341 3216
958bee14 3217 err = nft_trans_set_add(&ctx, NFT_MSG_NEWSET, set);
20a69341 3218 if (err < 0)
2f6adf48 3219 goto err4;
20a69341 3220
e688a7f8 3221 list_add_tail_rcu(&set->list, &table->sets);
4fefee57 3222 table->use++;
20a69341
PM
3223 return 0;
3224
2f6adf48 3225err4:
c17c3cdf 3226 ops->destroy(set);
2f6adf48
FW
3227err3:
3228 kfree(set->name);
20a69341 3229err2:
1ff75a3e 3230 kvfree(set);
20a69341 3231err1:
2b664957 3232 module_put(ops->type->owner);
20a69341
PM
3233 return err;
3234}
3235
958bee14 3236static void nft_set_destroy(struct nft_set *set)
20a69341 3237{
20a69341 3238 set->ops->destroy(set);
2b664957 3239 module_put(set->ops->type->owner);
38745490 3240 kfree(set->name);
1ff75a3e 3241 kvfree(set);
20a69341
PM
3242}
3243
958bee14
PNA
3244static void nf_tables_set_destroy(const struct nft_ctx *ctx, struct nft_set *set)
3245{
e688a7f8 3246 list_del_rcu(&set->list);
31f8441c 3247 nf_tables_set_notify(ctx, set, NFT_MSG_DELSET, GFP_ATOMIC);
958bee14
PNA
3248 nft_set_destroy(set);
3249}
3250
633c9a84
PNA
3251static int nf_tables_delset(struct net *net, struct sock *nlsk,
3252 struct sk_buff *skb, const struct nlmsghdr *nlh,
04ba724b
PNA
3253 const struct nlattr * const nla[],
3254 struct netlink_ext_ack *extack)
20a69341 3255{
c9c8e485 3256 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
f2a6d766 3257 u8 genmask = nft_genmask_next(net);
20a69341
PM
3258 struct nft_set *set;
3259 struct nft_ctx ctx;
3260 int err;
3261
ec2c9935
PM
3262 if (nfmsg->nfgen_family == NFPROTO_UNSPEC)
3263 return -EAFNOSUPPORT;
20a69341
PM
3264 if (nla[NFTA_SET_TABLE] == NULL)
3265 return -EINVAL;
3266
f2a6d766 3267 err = nft_ctx_init_from_setattr(&ctx, net, skb, nlh, nla, genmask);
20a69341
PM
3268 if (err < 0)
3269 return err;
3270
3ecbfd65
HS
3271 if (nla[NFTA_SET_HANDLE])
3272 set = nf_tables_set_lookup_byhandle(ctx.table, nla[NFTA_SET_HANDLE], genmask);
3273 else
3274 set = nf_tables_set_lookup(ctx.table, nla[NFTA_SET_NAME], genmask);
20a69341
PM
3275 if (IS_ERR(set))
3276 return PTR_ERR(set);
a8278400
PNA
3277
3278 if (!list_empty(&set->bindings) ||
3279 (nlh->nlmsg_flags & NLM_F_NONREC && atomic_read(&set->nelems) > 0))
20a69341
PM
3280 return -EBUSY;
3281
ee01d542 3282 return nft_delset(&ctx, set);
20a69341
PM
3283}
3284
3285static int nf_tables_bind_check_setelem(const struct nft_ctx *ctx,
de70185d 3286 struct nft_set *set,
20a69341 3287 const struct nft_set_iter *iter,
de70185d 3288 struct nft_set_elem *elem)
20a69341 3289{
fe2811eb 3290 const struct nft_set_ext *ext = nft_set_elem_ext(set, elem->priv);
20a69341
PM
3291 enum nft_registers dreg;
3292
3293 dreg = nft_type_to_reg(set->dtype);
1ec10212
PM
3294 return nft_validate_register_store(ctx, dreg, nft_set_ext_data(ext),
3295 set->dtype == NFT_DATA_VERDICT ?
3296 NFT_DATA_VERDICT : NFT_DATA_VALUE,
3297 set->dlen);
20a69341
PM
3298}
3299
3300int nf_tables_bind_set(const struct nft_ctx *ctx, struct nft_set *set,
3301 struct nft_set_binding *binding)
3302{
3303 struct nft_set_binding *i;
3304 struct nft_set_iter iter;
3305
408070d6 3306 if (!list_empty(&set->bindings) && nft_set_is_anonymous(set))
20a69341
PM
3307 return -EBUSY;
3308
11113e19 3309 if (binding->flags & NFT_SET_MAP) {
20a69341
PM
3310 /* If the set is already bound to the same chain all
3311 * jumps are already validated for that chain.
3312 */
3313 list_for_each_entry(i, &set->bindings, list) {
a4684402 3314 if (i->flags & NFT_SET_MAP &&
11113e19 3315 i->chain == binding->chain)
20a69341
PM
3316 goto bind;
3317 }
3318
8588ac09 3319 iter.genmask = nft_genmask_next(ctx->net);
20a69341
PM
3320 iter.skip = 0;
3321 iter.count = 0;
3322 iter.err = 0;
3323 iter.fn = nf_tables_bind_check_setelem;
3324
3325 set->ops->walk(ctx, set, &iter);
a02f4248 3326 if (iter.err < 0)
20a69341 3327 return iter.err;
20a69341
PM
3328 }
3329bind:
3330 binding->chain = ctx->chain;
e688a7f8 3331 list_add_tail_rcu(&binding->list, &set->bindings);
20a69341
PM
3332 return 0;
3333}
63aea290 3334EXPORT_SYMBOL_GPL(nf_tables_bind_set);
20a69341
PM
3335
3336void nf_tables_unbind_set(const struct nft_ctx *ctx, struct nft_set *set,
3337 struct nft_set_binding *binding)
3338{
e688a7f8 3339 list_del_rcu(&binding->list);
20a69341 3340
408070d6 3341 if (list_empty(&set->bindings) && nft_set_is_anonymous(set) &&
37a9cc52 3342 nft_is_active(ctx->net, set))
20a69341
PM
3343 nf_tables_set_destroy(ctx, set);
3344}
63aea290 3345EXPORT_SYMBOL_GPL(nf_tables_unbind_set);
20a69341 3346
3ac4c07a
PM
3347const struct nft_set_ext_type nft_set_ext_types[] = {
3348 [NFT_SET_EXT_KEY] = {
7d740264 3349 .align = __alignof__(u32),
3ac4c07a
PM
3350 },
3351 [NFT_SET_EXT_DATA] = {
7d740264 3352 .align = __alignof__(u32),
3ac4c07a 3353 },
f25ad2e9
PM
3354 [NFT_SET_EXT_EXPR] = {
3355 .align = __alignof__(struct nft_expr),
3356 },
8aeff920
PNA
3357 [NFT_SET_EXT_OBJREF] = {
3358 .len = sizeof(struct nft_object *),
3359 .align = __alignof__(struct nft_object *),
3360 },
3ac4c07a
PM
3361 [NFT_SET_EXT_FLAGS] = {
3362 .len = sizeof(u8),
3363 .align = __alignof__(u8),
3364 },
c3e1b005
PM
3365 [NFT_SET_EXT_TIMEOUT] = {
3366 .len = sizeof(u64),
3367 .align = __alignof__(u64),
3368 },
3369 [NFT_SET_EXT_EXPIRATION] = {
3370 .len = sizeof(unsigned long),
3371 .align = __alignof__(unsigned long),
3372 },
68e942e8
PM
3373 [NFT_SET_EXT_USERDATA] = {
3374 .len = sizeof(struct nft_userdata),
3375 .align = __alignof__(struct nft_userdata),
3376 },
3ac4c07a
PM
3377};
3378EXPORT_SYMBOL_GPL(nft_set_ext_types);
3379
20a69341
PM
3380/*
3381 * Set elements
3382 */
3383
3384static const struct nla_policy nft_set_elem_policy[NFTA_SET_ELEM_MAX + 1] = {
3385 [NFTA_SET_ELEM_KEY] = { .type = NLA_NESTED },
3386 [NFTA_SET_ELEM_DATA] = { .type = NLA_NESTED },
3387 [NFTA_SET_ELEM_FLAGS] = { .type = NLA_U32 },
c3e1b005 3388 [NFTA_SET_ELEM_TIMEOUT] = { .type = NLA_U64 },
68e942e8
PM
3389 [NFTA_SET_ELEM_USERDATA] = { .type = NLA_BINARY,
3390 .len = NFT_USERDATA_MAXLEN },
467697d2
FW
3391 [NFTA_SET_ELEM_EXPR] = { .type = NLA_NESTED },
3392 [NFTA_SET_ELEM_OBJREF] = { .type = NLA_STRING },
20a69341
PM
3393};
3394
3395static const struct nla_policy nft_set_elem_list_policy[NFTA_SET_ELEM_LIST_MAX + 1] = {
b2fbd044
LZ
3396 [NFTA_SET_ELEM_LIST_TABLE] = { .type = NLA_STRING,
3397 .len = NFT_TABLE_MAXNAMELEN - 1 },
3398 [NFTA_SET_ELEM_LIST_SET] = { .type = NLA_STRING,
3399 .len = NFT_SET_MAXNAMELEN - 1 },
20a69341 3400 [NFTA_SET_ELEM_LIST_ELEMENTS] = { .type = NLA_NESTED },
958bee14 3401 [NFTA_SET_ELEM_LIST_SET_ID] = { .type = NLA_U32 },
20a69341
PM
3402};
3403
633c9a84 3404static int nft_ctx_init_from_elemattr(struct nft_ctx *ctx, struct net *net,
20a69341
PM
3405 const struct sk_buff *skb,
3406 const struct nlmsghdr *nlh,
f2a6d766
PNA
3407 const struct nlattr * const nla[],
3408 u8 genmask)
20a69341
PM
3409{
3410 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
98319cb9 3411 int family = nfmsg->nfgen_family;
7c95f6d8 3412 struct nft_table *table;
20a69341 3413
36596dad 3414 table = nf_tables_table_lookup(net, nla[NFTA_SET_ELEM_LIST_TABLE],
98319cb9 3415 family, genmask);
20a69341
PM
3416 if (IS_ERR(table))
3417 return PTR_ERR(table);
3418
98319cb9 3419 nft_ctx_init(ctx, net, skb, nlh, family, table, NULL, nla);
20a69341
PM
3420 return 0;
3421}
3422
3423static int nf_tables_fill_setelem(struct sk_buff *skb,
3424 const struct nft_set *set,
3425 const struct nft_set_elem *elem)
3426{
fe2811eb 3427 const struct nft_set_ext *ext = nft_set_elem_ext(set, elem->priv);
20a69341
PM
3428 unsigned char *b = skb_tail_pointer(skb);
3429 struct nlattr *nest;
3430
3431 nest = nla_nest_start(skb, NFTA_LIST_ELEM);
3432 if (nest == NULL)
3433 goto nla_put_failure;
3434
fe2811eb
PM
3435 if (nft_data_dump(skb, NFTA_SET_ELEM_KEY, nft_set_ext_key(ext),
3436 NFT_DATA_VALUE, set->klen) < 0)
20a69341
PM
3437 goto nla_put_failure;
3438
fe2811eb
PM
3439 if (nft_set_ext_exists(ext, NFT_SET_EXT_DATA) &&
3440 nft_data_dump(skb, NFTA_SET_ELEM_DATA, nft_set_ext_data(ext),
20a69341
PM
3441 set->dtype == NFT_DATA_VERDICT ? NFT_DATA_VERDICT : NFT_DATA_VALUE,
3442 set->dlen) < 0)
3443 goto nla_put_failure;
3444
f25ad2e9
PM
3445 if (nft_set_ext_exists(ext, NFT_SET_EXT_EXPR) &&
3446 nft_expr_dump(skb, NFTA_SET_ELEM_EXPR, nft_set_ext_expr(ext)) < 0)
3447 goto nla_put_failure;
3448
8aeff920
PNA
3449 if (nft_set_ext_exists(ext, NFT_SET_EXT_OBJREF) &&
3450 nla_put_string(skb, NFTA_SET_ELEM_OBJREF,
3451 (*nft_set_ext_obj(ext))->name) < 0)
3452 goto nla_put_failure;
3453
fe2811eb
PM
3454 if (nft_set_ext_exists(ext, NFT_SET_EXT_FLAGS) &&
3455 nla_put_be32(skb, NFTA_SET_ELEM_FLAGS,
3456 htonl(*nft_set_ext_flags(ext))))
3457 goto nla_put_failure;
20a69341 3458
c3e1b005
PM
3459 if (nft_set_ext_exists(ext, NFT_SET_EXT_TIMEOUT) &&
3460 nla_put_be64(skb, NFTA_SET_ELEM_TIMEOUT,
d3e2a111
AP
3461 cpu_to_be64(jiffies_to_msecs(
3462 *nft_set_ext_timeout(ext))),
b46f6ded 3463 NFTA_SET_ELEM_PAD))
c3e1b005
PM
3464 goto nla_put_failure;
3465
3466 if (nft_set_ext_exists(ext, NFT_SET_EXT_EXPIRATION)) {
3467 unsigned long expires, now = jiffies;
3468
3469 expires = *nft_set_ext_expiration(ext);
3470 if (time_before(now, expires))
3471 expires -= now;
3472 else
3473 expires = 0;
3474
3475 if (nla_put_be64(skb, NFTA_SET_ELEM_EXPIRATION,
b46f6ded
ND
3476 cpu_to_be64(jiffies_to_msecs(expires)),
3477 NFTA_SET_ELEM_PAD))
c3e1b005
PM
3478 goto nla_put_failure;
3479 }
3480
68e942e8
PM
3481 if (nft_set_ext_exists(ext, NFT_SET_EXT_USERDATA)) {
3482 struct nft_userdata *udata;
3483
3484 udata = nft_set_ext_userdata(ext);
3485 if (nla_put(skb, NFTA_SET_ELEM_USERDATA,
3486 udata->len + 1, udata->data))
3487 goto nla_put_failure;
3488 }
3489
20a69341
PM
3490 nla_nest_end(skb, nest);
3491 return 0;
3492
3493nla_put_failure:
3494 nlmsg_trim(skb, b);
3495 return -EMSGSIZE;
3496}
3497
3498struct nft_set_dump_args {
3499 const struct netlink_callback *cb;
3500 struct nft_set_iter iter;
3501 struct sk_buff *skb;
3502};
3503
3504static int nf_tables_dump_setelem(const struct nft_ctx *ctx,
de70185d 3505 struct nft_set *set,
20a69341 3506 const struct nft_set_iter *iter,
de70185d 3507 struct nft_set_elem *elem)
20a69341
PM
3508{
3509 struct nft_set_dump_args *args;
3510
3511 args = container_of(iter, struct nft_set_dump_args, iter);
3512 return nf_tables_fill_setelem(args->skb, set, elem);
3513}
3514
fa803605
LZ
3515struct nft_set_dump_ctx {
3516 const struct nft_set *set;
3517 struct nft_ctx ctx;
3518};
3519
20a69341
PM
3520static int nf_tables_dump_set(struct sk_buff *skb, struct netlink_callback *cb)
3521{
fa803605 3522 struct nft_set_dump_ctx *dump_ctx = cb->data;
633c9a84 3523 struct net *net = sock_net(skb->sk);
fa803605 3524 struct nft_table *table;
de70185d 3525 struct nft_set *set;
20a69341 3526 struct nft_set_dump_args args;
fa803605 3527 bool set_found = false;
20a69341
PM
3528 struct nfgenmsg *nfmsg;
3529 struct nlmsghdr *nlh;
3530 struct nlattr *nest;
3531 u32 portid, seq;
fa803605 3532 int event;
20a69341 3533
fa803605 3534 rcu_read_lock();
36596dad
PNA
3535 list_for_each_entry_rcu(table, &net->nft.tables, list) {
3536 if (dump_ctx->ctx.family != NFPROTO_UNSPEC &&
98319cb9 3537 dump_ctx->ctx.family != table->family)
fa803605 3538 continue;
20a69341 3539
36596dad
PNA
3540 if (table != dump_ctx->ctx.table)
3541 continue;
20a69341 3542
36596dad
PNA
3543 list_for_each_entry_rcu(set, &table->sets, list) {
3544 if (set == dump_ctx->set) {
3545 set_found = true;
3546 break;
fa803605 3547 }
fa803605
LZ
3548 }
3549 break;
3550 }
3551
3552 if (!set_found) {
3553 rcu_read_unlock();
3554 return -ENOENT;
3555 }
20a69341 3556
dedb67c4 3557 event = nfnl_msg_type(NFNL_SUBSYS_NFTABLES, NFT_MSG_NEWSETELEM);
20a69341
PM
3558 portid = NETLINK_CB(cb->skb).portid;
3559 seq = cb->nlh->nlmsg_seq;
3560
3561 nlh = nlmsg_put(skb, portid, seq, event, sizeof(struct nfgenmsg),
3562 NLM_F_MULTI);
3563 if (nlh == NULL)
3564 goto nla_put_failure;
3565
3566 nfmsg = nlmsg_data(nlh);
98319cb9 3567 nfmsg->nfgen_family = table->family;
20a69341 3568 nfmsg->version = NFNETLINK_V0;
fa803605 3569 nfmsg->res_id = htons(net->nft.base_seq & 0xffff);
20a69341 3570
fa803605 3571 if (nla_put_string(skb, NFTA_SET_ELEM_LIST_TABLE, table->name))
20a69341
PM
3572 goto nla_put_failure;
3573 if (nla_put_string(skb, NFTA_SET_ELEM_LIST_SET, set->name))
3574 goto nla_put_failure;
3575
3576 nest = nla_nest_start(skb, NFTA_SET_ELEM_LIST_ELEMENTS);
3577 if (nest == NULL)
3578 goto nla_put_failure;
3579
8588ac09
PNA
3580 args.cb = cb;
3581 args.skb = skb;
fa803605 3582 args.iter.genmask = nft_genmask_cur(net);
8588ac09
PNA
3583 args.iter.skip = cb->args[0];
3584 args.iter.count = 0;
3585 args.iter.err = 0;
3586 args.iter.fn = nf_tables_dump_setelem;
fa803605
LZ
3587 set->ops->walk(&dump_ctx->ctx, set, &args.iter);
3588 rcu_read_unlock();
20a69341
PM
3589
3590 nla_nest_end(skb, nest);
3591 nlmsg_end(skb, nlh);
3592
3593 if (args.iter.err && args.iter.err != -EMSGSIZE)
3594 return args.iter.err;
3595 if (args.iter.count == cb->args[0])
3596 return 0;
3597
3598 cb->args[0] = args.iter.count;
3599 return skb->len;
3600
3601nla_put_failure:
fa803605 3602 rcu_read_unlock();
20a69341
PM
3603 return -ENOSPC;
3604}
3605
fa803605
LZ
3606static int nf_tables_dump_set_done(struct netlink_callback *cb)
3607{
3608 kfree(cb->data);
3609 return 0;
3610}
3611
d60ce62f
AB
3612static int nf_tables_fill_setelem_info(struct sk_buff *skb,
3613 const struct nft_ctx *ctx, u32 seq,
3614 u32 portid, int event, u16 flags,
3615 const struct nft_set *set,
3616 const struct nft_set_elem *elem)
3617{
3618 struct nfgenmsg *nfmsg;
3619 struct nlmsghdr *nlh;
3620 struct nlattr *nest;
3621 int err;
3622
dedb67c4 3623 event = nfnl_msg_type(NFNL_SUBSYS_NFTABLES, event);
d60ce62f
AB
3624 nlh = nlmsg_put(skb, portid, seq, event, sizeof(struct nfgenmsg),
3625 flags);
3626 if (nlh == NULL)
3627 goto nla_put_failure;
3628
3629 nfmsg = nlmsg_data(nlh);
36596dad 3630 nfmsg->nfgen_family = ctx->family;
d60ce62f 3631 nfmsg->version = NFNETLINK_V0;
84d7fce6 3632 nfmsg->res_id = htons(ctx->net->nft.base_seq & 0xffff);
d60ce62f
AB
3633
3634 if (nla_put_string(skb, NFTA_SET_TABLE, ctx->table->name))
3635 goto nla_put_failure;
3636 if (nla_put_string(skb, NFTA_SET_NAME, set->name))
3637 goto nla_put_failure;
3638
3639 nest = nla_nest_start(skb, NFTA_SET_ELEM_LIST_ELEMENTS);
3640 if (nest == NULL)
3641 goto nla_put_failure;
3642
3643 err = nf_tables_fill_setelem(skb, set, elem);
3644 if (err < 0)
3645 goto nla_put_failure;
3646
3647 nla_nest_end(skb, nest);
3648
053c095a
JB
3649 nlmsg_end(skb, nlh);
3650 return 0;
d60ce62f
AB
3651
3652nla_put_failure:
3653 nlmsg_trim(skb, nlh);
3654 return -1;
3655}
3656
ba0e4d99
PNA
3657static int nft_setelem_parse_flags(const struct nft_set *set,
3658 const struct nlattr *attr, u32 *flags)
3659{
3660 if (attr == NULL)
3661 return 0;
3662
3663 *flags = ntohl(nla_get_be32(attr));
3664 if (*flags & ~NFT_SET_ELEM_INTERVAL_END)
3665 return -EINVAL;
3666 if (!(set->flags & NFT_SET_INTERVAL) &&
3667 *flags & NFT_SET_ELEM_INTERVAL_END)
3668 return -EINVAL;
3669
3670 return 0;
3671}
3672
3673static int nft_get_set_elem(struct nft_ctx *ctx, struct nft_set *set,
3674 const struct nlattr *attr)
3675{
3676 struct nlattr *nla[NFTA_SET_ELEM_MAX + 1];
3677 const struct nft_set_ext *ext;
3678 struct nft_data_desc desc;
3679 struct nft_set_elem elem;
3680 struct sk_buff *skb;
3681 uint32_t flags = 0;
3682 void *priv;
3683 int err;
3684
3685 err = nla_parse_nested(nla, NFTA_SET_ELEM_MAX, attr,
3686 nft_set_elem_policy, NULL);
3687 if (err < 0)
3688 return err;
3689
3690 if (!nla[NFTA_SET_ELEM_KEY])
3691 return -EINVAL;
3692
3693 err = nft_setelem_parse_flags(set, nla[NFTA_SET_ELEM_FLAGS], &flags);
3694 if (err < 0)
3695 return err;
3696
3697 err = nft_data_init(ctx, &elem.key.val, sizeof(elem.key), &desc,
3698 nla[NFTA_SET_ELEM_KEY]);
3699 if (err < 0)
3700 return err;
3701
3702 err = -EINVAL;
3703 if (desc.type != NFT_DATA_VALUE || desc.len != set->klen)
3704 return err;
3705
3706 priv = set->ops->get(ctx->net, set, &elem, flags);
3707 if (IS_ERR(priv))
3708 return PTR_ERR(priv);
3709
3710 elem.priv = priv;
3711 ext = nft_set_elem_ext(set, &elem);
3712
3713 err = -ENOMEM;
3714 skb = nlmsg_new(NLMSG_GOODSIZE, GFP_KERNEL);
3715 if (skb == NULL)
3716 goto err1;
3717
3718 err = nf_tables_fill_setelem_info(skb, ctx, ctx->seq, ctx->portid,
3719 NFT_MSG_NEWSETELEM, 0, set, &elem);
3720 if (err < 0)
3721 goto err2;
3722
3723 err = nfnetlink_unicast(skb, ctx->net, ctx->portid, MSG_DONTWAIT);
3724 /* This avoids a loop in nfnetlink. */
3725 if (err < 0)
3726 goto err1;
3727
3728 return 0;
3729err2:
3730 kfree_skb(skb);
3731err1:
3732 /* this avoids a loop in nfnetlink. */
3733 return err == -EAGAIN ? -ENOBUFS : err;
3734}
3735
3736static int nf_tables_getsetelem(struct net *net, struct sock *nlsk,
3737 struct sk_buff *skb, const struct nlmsghdr *nlh,
3738 const struct nlattr * const nla[],
3739 struct netlink_ext_ack *extack)
3740{
3741 u8 genmask = nft_genmask_cur(net);
3742 struct nft_set *set;
3743 struct nlattr *attr;
3744 struct nft_ctx ctx;
3745 int rem, err = 0;
3746
3747 err = nft_ctx_init_from_elemattr(&ctx, net, skb, nlh, nla, genmask);
3748 if (err < 0)
3749 return err;
3750
3751 set = nf_tables_set_lookup(ctx.table, nla[NFTA_SET_ELEM_LIST_SET],
3752 genmask);
3753 if (IS_ERR(set))
3754 return PTR_ERR(set);
3755
3756 if (nlh->nlmsg_flags & NLM_F_DUMP) {
3757 struct netlink_dump_control c = {
3758 .dump = nf_tables_dump_set,
3759 .done = nf_tables_dump_set_done,
3760 };
3761 struct nft_set_dump_ctx *dump_ctx;
3762
3763 dump_ctx = kmalloc(sizeof(*dump_ctx), GFP_KERNEL);
3764 if (!dump_ctx)
3765 return -ENOMEM;
3766
3767 dump_ctx->set = set;
3768 dump_ctx->ctx = ctx;
3769
3770 c.data = dump_ctx;
3771 return netlink_dump_start(nlsk, skb, nlh, &c);
3772 }
3773
3774 if (!nla[NFTA_SET_ELEM_LIST_ELEMENTS])
3775 return -EINVAL;
3776
3777 nla_for_each_nested(attr, nla[NFTA_SET_ELEM_LIST_ELEMENTS], rem) {
3778 err = nft_get_set_elem(&ctx, set, attr);
3779 if (err < 0)
3780 break;
3781 }
3782
3783 return err;
3784}
3785
25e94a99
PNA
3786static void nf_tables_setelem_notify(const struct nft_ctx *ctx,
3787 const struct nft_set *set,
3788 const struct nft_set_elem *elem,
3789 int event, u16 flags)
d60ce62f 3790{
128ad332
PNA
3791 struct net *net = ctx->net;
3792 u32 portid = ctx->portid;
d60ce62f
AB
3793 struct sk_buff *skb;
3794 int err;
3795
128ad332 3796 if (!ctx->report && !nfnetlink_has_listeners(net, NFNLGRP_NFTABLES))
25e94a99 3797 return;
d60ce62f 3798
d60ce62f
AB
3799 skb = nlmsg_new(NLMSG_GOODSIZE, GFP_KERNEL);
3800 if (skb == NULL)
3801 goto err;
3802
3803 err = nf_tables_fill_setelem_info(skb, ctx, 0, portid, event, flags,
3804 set, elem);
3805 if (err < 0) {
3806 kfree_skb(skb);
3807 goto err;
3808 }
3809
25e94a99
PNA
3810 nfnetlink_send(skb, net, portid, NFNLGRP_NFTABLES, ctx->report,
3811 GFP_KERNEL);
3812 return;
d60ce62f 3813err:
25e94a99 3814 nfnetlink_set_err(net, portid, NFNLGRP_NFTABLES, -ENOBUFS);
d60ce62f
AB
3815}
3816
60319eb1
PNA
3817static struct nft_trans *nft_trans_elem_alloc(struct nft_ctx *ctx,
3818 int msg_type,
3819 struct nft_set *set)
3820{
3821 struct nft_trans *trans;
3822
3823 trans = nft_trans_alloc(ctx, msg_type, sizeof(struct nft_trans_elem));
3824 if (trans == NULL)
3825 return NULL;
3826
3827 nft_trans_elem_set(trans) = set;
3828 return trans;
3829}
3830
22fe54d5
PM
3831void *nft_set_elem_init(const struct nft_set *set,
3832 const struct nft_set_ext_tmpl *tmpl,
49499c3e 3833 const u32 *key, const u32 *data,
22fe54d5 3834 u64 timeout, gfp_t gfp)
fe2811eb
PM
3835{
3836 struct nft_set_ext *ext;
3837 void *elem;
3838
3839 elem = kzalloc(set->ops->elemsize + tmpl->len, gfp);
3840 if (elem == NULL)
3841 return NULL;
3842
3843 ext = nft_set_elem_ext(set, elem);
3844 nft_set_ext_init(ext, tmpl);
3845
3846 memcpy(nft_set_ext_key(ext), key, set->klen);
3847 if (nft_set_ext_exists(ext, NFT_SET_EXT_DATA))
3848 memcpy(nft_set_ext_data(ext), data, set->dlen);
c3e1b005
PM
3849 if (nft_set_ext_exists(ext, NFT_SET_EXT_EXPIRATION))
3850 *nft_set_ext_expiration(ext) =
d3e2a111 3851 jiffies + timeout;
c3e1b005
PM
3852 if (nft_set_ext_exists(ext, NFT_SET_EXT_TIMEOUT))
3853 *nft_set_ext_timeout(ext) = timeout;
fe2811eb
PM
3854
3855 return elem;
3856}
3857
61f9e292
LZ
3858void nft_set_elem_destroy(const struct nft_set *set, void *elem,
3859 bool destroy_expr)
61edafbb
PM
3860{
3861 struct nft_set_ext *ext = nft_set_elem_ext(set, elem);
3862
59105446 3863 nft_data_release(nft_set_ext_key(ext), NFT_DATA_VALUE);
61edafbb 3864 if (nft_set_ext_exists(ext, NFT_SET_EXT_DATA))
59105446 3865 nft_data_release(nft_set_ext_data(ext), set->dtype);
61f9e292 3866 if (destroy_expr && nft_set_ext_exists(ext, NFT_SET_EXT_EXPR))
f25ad2e9 3867 nf_tables_expr_destroy(NULL, nft_set_ext_expr(ext));
8aeff920
PNA
3868 if (nft_set_ext_exists(ext, NFT_SET_EXT_OBJREF))
3869 (*nft_set_ext_obj(ext))->use--;
61edafbb
PM
3870 kfree(elem);
3871}
3872EXPORT_SYMBOL_GPL(nft_set_elem_destroy);
3873
59105446
PNA
3874/* Only called from commit path, nft_set_elem_deactivate() already deals with
3875 * the refcounting from the preparation phase.
3876 */
3877static void nf_tables_set_elem_destroy(const struct nft_set *set, void *elem)
3878{
3879 struct nft_set_ext *ext = nft_set_elem_ext(set, elem);
3880
3881 if (nft_set_ext_exists(ext, NFT_SET_EXT_EXPR))
3882 nf_tables_expr_destroy(NULL, nft_set_ext_expr(ext));
3883 kfree(elem);
3884}
3885
60319eb1 3886static int nft_add_set_elem(struct nft_ctx *ctx, struct nft_set *set,
c016c7e4 3887 const struct nlattr *attr, u32 nlmsg_flags)
20a69341
PM
3888{
3889 struct nlattr *nla[NFTA_SET_ELEM_MAX + 1];
8aeff920 3890 u8 genmask = nft_genmask_next(ctx->net);
20a69341 3891 struct nft_data_desc d1, d2;
fe2811eb 3892 struct nft_set_ext_tmpl tmpl;
c016c7e4 3893 struct nft_set_ext *ext, *ext2;
20a69341
PM
3894 struct nft_set_elem elem;
3895 struct nft_set_binding *binding;
8aeff920 3896 struct nft_object *obj = NULL;
68e942e8 3897 struct nft_userdata *udata;
fe2811eb 3898 struct nft_data data;
20a69341 3899 enum nft_registers dreg;
60319eb1 3900 struct nft_trans *trans;
0e9091d6 3901 u32 flags = 0;
c3e1b005 3902 u64 timeout;
68e942e8 3903 u8 ulen;
20a69341
PM
3904 int err;
3905
3906 err = nla_parse_nested(nla, NFTA_SET_ELEM_MAX, attr,
fceb6435 3907 nft_set_elem_policy, NULL);
20a69341
PM
3908 if (err < 0)
3909 return err;
3910
3911 if (nla[NFTA_SET_ELEM_KEY] == NULL)
3912 return -EINVAL;
3913
fe2811eb
PM
3914 nft_set_ext_prepare(&tmpl);
3915
0e9091d6
PNA
3916 err = nft_setelem_parse_flags(set, nla[NFTA_SET_ELEM_FLAGS], &flags);
3917 if (err < 0)
3918 return err;
3919 if (flags != 0)
3920 nft_set_ext_add(&tmpl, NFT_SET_EXT_FLAGS);
20a69341
PM
3921
3922 if (set->flags & NFT_SET_MAP) {
3923 if (nla[NFTA_SET_ELEM_DATA] == NULL &&
fe2811eb 3924 !(flags & NFT_SET_ELEM_INTERVAL_END))
20a69341 3925 return -EINVAL;
bd7fc645 3926 if (nla[NFTA_SET_ELEM_DATA] != NULL &&
fe2811eb 3927 flags & NFT_SET_ELEM_INTERVAL_END)
bd7fc645 3928 return -EINVAL;
20a69341
PM
3929 } else {
3930 if (nla[NFTA_SET_ELEM_DATA] != NULL)
3931 return -EINVAL;
3932 }
3933
c3e1b005
PM
3934 timeout = 0;
3935 if (nla[NFTA_SET_ELEM_TIMEOUT] != NULL) {
3936 if (!(set->flags & NFT_SET_TIMEOUT))
3937 return -EINVAL;
d3e2a111
AP
3938 timeout = msecs_to_jiffies(be64_to_cpu(nla_get_be64(
3939 nla[NFTA_SET_ELEM_TIMEOUT])));
c3e1b005
PM
3940 } else if (set->flags & NFT_SET_TIMEOUT) {
3941 timeout = set->timeout;
3942 }
3943
7d740264 3944 err = nft_data_init(ctx, &elem.key.val, sizeof(elem.key), &d1,
d0a11fc3 3945 nla[NFTA_SET_ELEM_KEY]);
20a69341
PM
3946 if (err < 0)
3947 goto err1;
3948 err = -EINVAL;
3949 if (d1.type != NFT_DATA_VALUE || d1.len != set->klen)
3950 goto err2;
3951
7d740264 3952 nft_set_ext_add_length(&tmpl, NFT_SET_EXT_KEY, d1.len);
c3e1b005
PM
3953 if (timeout > 0) {
3954 nft_set_ext_add(&tmpl, NFT_SET_EXT_EXPIRATION);
3955 if (timeout != set->timeout)
3956 nft_set_ext_add(&tmpl, NFT_SET_EXT_TIMEOUT);
3957 }
fe2811eb 3958
8aeff920
PNA
3959 if (nla[NFTA_SET_ELEM_OBJREF] != NULL) {
3960 if (!(set->flags & NFT_SET_OBJECT)) {
3961 err = -EINVAL;
3962 goto err2;
3963 }
3964 obj = nf_tables_obj_lookup(ctx->table, nla[NFTA_SET_ELEM_OBJREF],
3965 set->objtype, genmask);
3966 if (IS_ERR(obj)) {
3967 err = PTR_ERR(obj);
3968 goto err2;
3969 }
3970 nft_set_ext_add(&tmpl, NFT_SET_EXT_OBJREF);
3971 }
3972
20a69341 3973 if (nla[NFTA_SET_ELEM_DATA] != NULL) {
d0a11fc3
PM
3974 err = nft_data_init(ctx, &data, sizeof(data), &d2,
3975 nla[NFTA_SET_ELEM_DATA]);
20a69341
PM
3976 if (err < 0)
3977 goto err2;
3978
3979 err = -EINVAL;
3980 if (set->dtype != NFT_DATA_VERDICT && d2.len != set->dlen)
3981 goto err3;
3982
3983 dreg = nft_type_to_reg(set->dtype);
3984 list_for_each_entry(binding, &set->bindings, list) {
3985 struct nft_ctx bind_ctx = {
58c78e10 3986 .net = ctx->net,
36596dad 3987 .family = ctx->family,
20a69341 3988 .table = ctx->table,
7c95f6d8 3989 .chain = (struct nft_chain *)binding->chain,
20a69341
PM
3990 };
3991
11113e19
PM
3992 if (!(binding->flags & NFT_SET_MAP))
3993 continue;
3994
1ec10212
PM
3995 err = nft_validate_register_store(&bind_ctx, dreg,
3996 &data,
3997 d2.type, d2.len);
20a69341
PM
3998 if (err < 0)
3999 goto err3;
4000 }
fe2811eb 4001
7d740264 4002 nft_set_ext_add_length(&tmpl, NFT_SET_EXT_DATA, d2.len);
20a69341
PM
4003 }
4004
68e942e8
PM
4005 /* The full maximum length of userdata can exceed the maximum
4006 * offset value (U8_MAX) for following extensions, therefor it
4007 * must be the last extension added.
4008 */
4009 ulen = 0;
4010 if (nla[NFTA_SET_ELEM_USERDATA] != NULL) {
4011 ulen = nla_len(nla[NFTA_SET_ELEM_USERDATA]);
4012 if (ulen > 0)
4013 nft_set_ext_add_length(&tmpl, NFT_SET_EXT_USERDATA,
4014 ulen);
4015 }
4016
fe2811eb 4017 err = -ENOMEM;
7d740264 4018 elem.priv = nft_set_elem_init(set, &tmpl, elem.key.val.data, data.data,
c3e1b005 4019 timeout, GFP_KERNEL);
fe2811eb
PM
4020 if (elem.priv == NULL)
4021 goto err3;
4022
4023 ext = nft_set_elem_ext(set, elem.priv);
4024 if (flags)
4025 *nft_set_ext_flags(ext) = flags;
68e942e8
PM
4026 if (ulen > 0) {
4027 udata = nft_set_ext_userdata(ext);
4028 udata->len = ulen - 1;
4029 nla_memcpy(&udata->data, nla[NFTA_SET_ELEM_USERDATA], ulen);
4030 }
8aeff920
PNA
4031 if (obj) {
4032 *nft_set_ext_obj(ext) = obj;
4033 obj->use++;
4034 }
fe2811eb 4035
60319eb1
PNA
4036 trans = nft_trans_elem_alloc(ctx, NFT_MSG_NEWSETELEM, set);
4037 if (trans == NULL)
fe2811eb 4038 goto err4;
60319eb1 4039
69086658 4040 ext->genmask = nft_genmask_cur(ctx->net) | NFT_SET_ELEM_BUSY_MASK;
c016c7e4
PNA
4041 err = set->ops->insert(ctx->net, set, &elem, &ext2);
4042 if (err) {
4043 if (err == -EEXIST) {
9744a6fc
PNA
4044 if (nft_set_ext_exists(ext, NFT_SET_EXT_DATA) ^
4045 nft_set_ext_exists(ext2, NFT_SET_EXT_DATA) ||
4046 nft_set_ext_exists(ext, NFT_SET_EXT_OBJREF) ^
4047 nft_set_ext_exists(ext2, NFT_SET_EXT_OBJREF))
4048 return -EBUSY;
8aeff920
PNA
4049 if ((nft_set_ext_exists(ext, NFT_SET_EXT_DATA) &&
4050 nft_set_ext_exists(ext2, NFT_SET_EXT_DATA) &&
4051 memcmp(nft_set_ext_data(ext),
4052 nft_set_ext_data(ext2), set->dlen) != 0) ||
4053 (nft_set_ext_exists(ext, NFT_SET_EXT_OBJREF) &&
4054 nft_set_ext_exists(ext2, NFT_SET_EXT_OBJREF) &&
4055 *nft_set_ext_obj(ext) != *nft_set_ext_obj(ext2)))
c016c7e4
PNA
4056 err = -EBUSY;
4057 else if (!(nlmsg_flags & NLM_F_EXCL))
4058 err = 0;
4059 }
fe2811eb 4060 goto err5;
c016c7e4 4061 }
20a69341 4062
35d0ac90
PNA
4063 if (set->size &&
4064 !atomic_add_unless(&set->nelems, 1, set->size + set->ndeact)) {
4065 err = -ENFILE;
4066 goto err6;
4067 }
4068
60319eb1 4069 nft_trans_elem(trans) = elem;
46bbafce 4070 list_add_tail(&trans->list, &ctx->net->nft.commit_list);
20a69341
PM
4071 return 0;
4072
35d0ac90 4073err6:
5cb82a38 4074 set->ops->remove(ctx->net, set, &elem);
fe2811eb 4075err5:
60319eb1 4076 kfree(trans);
fe2811eb
PM
4077err4:
4078 kfree(elem.priv);
20a69341
PM
4079err3:
4080 if (nla[NFTA_SET_ELEM_DATA] != NULL)
59105446 4081 nft_data_release(&data, d2.type);
20a69341 4082err2:
59105446 4083 nft_data_release(&elem.key.val, d1.type);
20a69341
PM
4084err1:
4085 return err;
4086}
4087
633c9a84
PNA
4088static int nf_tables_newsetelem(struct net *net, struct sock *nlsk,
4089 struct sk_buff *skb, const struct nlmsghdr *nlh,
04ba724b
PNA
4090 const struct nlattr * const nla[],
4091 struct netlink_ext_ack *extack)
20a69341 4092{
f2a6d766 4093 u8 genmask = nft_genmask_next(net);
20a69341
PM
4094 const struct nlattr *attr;
4095 struct nft_set *set;
4096 struct nft_ctx ctx;
60319eb1 4097 int rem, err = 0;
20a69341 4098
7d5570ca
PNA
4099 if (nla[NFTA_SET_ELEM_LIST_ELEMENTS] == NULL)
4100 return -EINVAL;
4101
f2a6d766 4102 err = nft_ctx_init_from_elemattr(&ctx, net, skb, nlh, nla, genmask);
20a69341
PM
4103 if (err < 0)
4104 return err;
4105
a3073c17
PNA
4106 set = nft_set_lookup_global(net, ctx.table, nla[NFTA_SET_ELEM_LIST_SET],
4107 nla[NFTA_SET_ELEM_LIST_SET_ID], genmask);
4108 if (IS_ERR(set))
4109 return PTR_ERR(set);
958bee14 4110
20a69341
PM
4111 if (!list_empty(&set->bindings) && set->flags & NFT_SET_CONSTANT)
4112 return -EBUSY;
4113
4114 nla_for_each_nested(attr, nla[NFTA_SET_ELEM_LIST_ELEMENTS], rem) {
c016c7e4 4115 err = nft_add_set_elem(&ctx, set, attr, nlh->nlmsg_flags);
35d0ac90 4116 if (err < 0)
60319eb1 4117 break;
20a69341 4118 }
60319eb1 4119 return err;
20a69341
PM
4120}
4121
59105446
PNA
4122/**
4123 * nft_data_hold - hold a nft_data item
4124 *
4125 * @data: struct nft_data to release
4126 * @type: type of data
4127 *
4128 * Hold a nft_data item. NFT_DATA_VALUE types can be silently discarded,
4129 * NFT_DATA_VERDICT bumps the reference to chains in case of NFT_JUMP and
4130 * NFT_GOTO verdicts. This function must be called on active data objects
4131 * from the second phase of the commit protocol.
4132 */
4133static void nft_data_hold(const struct nft_data *data, enum nft_data_types type)
4134{
4135 if (type == NFT_DATA_VERDICT) {
4136 switch (data->verdict.code) {
4137 case NFT_JUMP:
4138 case NFT_GOTO:
4139 data->verdict.chain->use++;
4140 break;
4141 }
4142 }
4143}
4144
4145static void nft_set_elem_activate(const struct net *net,
4146 const struct nft_set *set,
4147 struct nft_set_elem *elem)
4148{
4149 const struct nft_set_ext *ext = nft_set_elem_ext(set, elem->priv);
4150
4151 if (nft_set_ext_exists(ext, NFT_SET_EXT_DATA))
4152 nft_data_hold(nft_set_ext_data(ext), set->dtype);
4153 if (nft_set_ext_exists(ext, NFT_SET_EXT_OBJREF))
4154 (*nft_set_ext_obj(ext))->use++;
4155}
4156
4157static void nft_set_elem_deactivate(const struct net *net,
4158 const struct nft_set *set,
4159 struct nft_set_elem *elem)
4160{
4161 const struct nft_set_ext *ext = nft_set_elem_ext(set, elem->priv);
4162
4163 if (nft_set_ext_exists(ext, NFT_SET_EXT_DATA))
4164 nft_data_release(nft_set_ext_data(ext), set->dtype);
4165 if (nft_set_ext_exists(ext, NFT_SET_EXT_OBJREF))
4166 (*nft_set_ext_obj(ext))->use--;
4167}
4168
60319eb1 4169static int nft_del_setelem(struct nft_ctx *ctx, struct nft_set *set,
20a69341
PM
4170 const struct nlattr *attr)
4171{
4172 struct nlattr *nla[NFTA_SET_ELEM_MAX + 1];
3971ca14 4173 struct nft_set_ext_tmpl tmpl;
20a69341
PM
4174 struct nft_data_desc desc;
4175 struct nft_set_elem elem;
3971ca14 4176 struct nft_set_ext *ext;
60319eb1 4177 struct nft_trans *trans;
3971ca14
PNA
4178 u32 flags = 0;
4179 void *priv;
20a69341
PM
4180 int err;
4181
4182 err = nla_parse_nested(nla, NFTA_SET_ELEM_MAX, attr,
fceb6435 4183 nft_set_elem_policy, NULL);
20a69341
PM
4184 if (err < 0)
4185 goto err1;
4186
4187 err = -EINVAL;
4188 if (nla[NFTA_SET_ELEM_KEY] == NULL)
4189 goto err1;
4190
3971ca14
PNA
4191 nft_set_ext_prepare(&tmpl);
4192
4193 err = nft_setelem_parse_flags(set, nla[NFTA_SET_ELEM_FLAGS], &flags);
4194 if (err < 0)
4195 return err;
4196 if (flags != 0)
4197 nft_set_ext_add(&tmpl, NFT_SET_EXT_FLAGS);
4198
7d740264 4199 err = nft_data_init(ctx, &elem.key.val, sizeof(elem.key), &desc,
d0a11fc3 4200 nla[NFTA_SET_ELEM_KEY]);
20a69341
PM
4201 if (err < 0)
4202 goto err1;
4203
4204 err = -EINVAL;
4205 if (desc.type != NFT_DATA_VALUE || desc.len != set->klen)
4206 goto err2;
4207
3971ca14
PNA
4208 nft_set_ext_add_length(&tmpl, NFT_SET_EXT_KEY, desc.len);
4209
4210 err = -ENOMEM;
4211 elem.priv = nft_set_elem_init(set, &tmpl, elem.key.val.data, NULL, 0,
4212 GFP_KERNEL);
4213 if (elem.priv == NULL)
4214 goto err2;
4215
4216 ext = nft_set_elem_ext(set, elem.priv);
4217 if (flags)
4218 *nft_set_ext_flags(ext) = flags;
4219
60319eb1 4220 trans = nft_trans_elem_alloc(ctx, NFT_MSG_DELSETELEM, set);
609ccf08
JL
4221 if (trans == NULL) {
4222 err = -ENOMEM;
3971ca14 4223 goto err3;
609ccf08 4224 }
20a69341 4225
42a55769 4226 priv = set->ops->deactivate(ctx->net, set, &elem);
3971ca14 4227 if (priv == NULL) {
cc02e457 4228 err = -ENOENT;
3971ca14 4229 goto err4;
cc02e457 4230 }
3971ca14
PNA
4231 kfree(elem.priv);
4232 elem.priv = priv;
cc02e457 4233
59105446
PNA
4234 nft_set_elem_deactivate(ctx->net, set, &elem);
4235
60319eb1 4236 nft_trans_elem(trans) = elem;
46bbafce 4237 list_add_tail(&trans->list, &ctx->net->nft.commit_list);
0dc13625 4238 return 0;
cc02e457 4239
3971ca14 4240err4:
cc02e457 4241 kfree(trans);
3971ca14
PNA
4242err3:
4243 kfree(elem.priv);
20a69341 4244err2:
59105446 4245 nft_data_release(&elem.key.val, desc.type);
20a69341
PM
4246err1:
4247 return err;
4248}
4249
8411b644 4250static int nft_flush_set(const struct nft_ctx *ctx,
de70185d 4251 struct nft_set *set,
8411b644 4252 const struct nft_set_iter *iter,
de70185d 4253 struct nft_set_elem *elem)
8411b644
PNA
4254{
4255 struct nft_trans *trans;
4256 int err;
4257
4258 trans = nft_trans_alloc_gfp(ctx, NFT_MSG_DELSETELEM,
4259 sizeof(struct nft_trans_elem), GFP_ATOMIC);
4260 if (!trans)
4261 return -ENOMEM;
4262
1ba1c414 4263 if (!set->ops->flush(ctx->net, set, elem->priv)) {
8411b644
PNA
4264 err = -ENOENT;
4265 goto err1;
4266 }
b2c11e4b 4267 set->ndeact++;
8411b644 4268
de70185d
PNA
4269 nft_trans_elem_set(trans) = set;
4270 nft_trans_elem(trans) = *elem;
8411b644
PNA
4271 list_add_tail(&trans->list, &ctx->net->nft.commit_list);
4272
4273 return 0;
4274err1:
4275 kfree(trans);
4276 return err;
4277}
4278
633c9a84
PNA
4279static int nf_tables_delsetelem(struct net *net, struct sock *nlsk,
4280 struct sk_buff *skb, const struct nlmsghdr *nlh,
04ba724b
PNA
4281 const struct nlattr * const nla[],
4282 struct netlink_ext_ack *extack)
20a69341 4283{
f2a6d766 4284 u8 genmask = nft_genmask_next(net);
20a69341
PM
4285 const struct nlattr *attr;
4286 struct nft_set *set;
4287 struct nft_ctx ctx;
60319eb1 4288 int rem, err = 0;
20a69341 4289
f2a6d766 4290 err = nft_ctx_init_from_elemattr(&ctx, net, skb, nlh, nla, genmask);
20a69341
PM
4291 if (err < 0)
4292 return err;
4293
37a9cc52
PNA
4294 set = nf_tables_set_lookup(ctx.table, nla[NFTA_SET_ELEM_LIST_SET],
4295 genmask);
20a69341
PM
4296 if (IS_ERR(set))
4297 return PTR_ERR(set);
4298 if (!list_empty(&set->bindings) && set->flags & NFT_SET_CONSTANT)
4299 return -EBUSY;
4300
8411b644 4301 if (nla[NFTA_SET_ELEM_LIST_ELEMENTS] == NULL) {
baa2d42c
PNA
4302 struct nft_set_iter iter = {
4303 .genmask = genmask,
4304 .fn = nft_flush_set,
8411b644 4305 };
baa2d42c 4306 set->ops->walk(&ctx, set, &iter);
8411b644 4307
baa2d42c 4308 return iter.err;
8411b644
PNA
4309 }
4310
20a69341
PM
4311 nla_for_each_nested(attr, nla[NFTA_SET_ELEM_LIST_ELEMENTS], rem) {
4312 err = nft_del_setelem(&ctx, set, attr);
4313 if (err < 0)
60319eb1 4314 break;
4fefee57 4315
3dd0673a 4316 set->ndeact++;
20a69341 4317 }
60319eb1 4318 return err;
20a69341
PM
4319}
4320
cfed7e1b
PM
4321void nft_set_gc_batch_release(struct rcu_head *rcu)
4322{
4323 struct nft_set_gc_batch *gcb;
4324 unsigned int i;
4325
4326 gcb = container_of(rcu, struct nft_set_gc_batch, head.rcu);
4327 for (i = 0; i < gcb->head.cnt; i++)
61f9e292 4328 nft_set_elem_destroy(gcb->head.set, gcb->elems[i], true);
cfed7e1b
PM
4329 kfree(gcb);
4330}
4331EXPORT_SYMBOL_GPL(nft_set_gc_batch_release);
4332
4333struct nft_set_gc_batch *nft_set_gc_batch_alloc(const struct nft_set *set,
4334 gfp_t gfp)
4335{
4336 struct nft_set_gc_batch *gcb;
4337
4338 gcb = kzalloc(sizeof(*gcb), gfp);
4339 if (gcb == NULL)
4340 return gcb;
4341 gcb->head.set = set;
4342 return gcb;
4343}
4344EXPORT_SYMBOL_GPL(nft_set_gc_batch_alloc);
4345
e5009240
PNA
4346/*
4347 * Stateful objects
4348 */
4349
4350/**
4351 * nft_register_obj- register nf_tables stateful object type
4352 * @obj: object type
4353 *
4354 * Registers the object type for use with nf_tables. Returns zero on
4355 * success or a negative errno code otherwise.
4356 */
4357int nft_register_obj(struct nft_object_type *obj_type)
4358{
4359 if (obj_type->type == NFT_OBJECT_UNSPEC)
4360 return -EINVAL;
4361
4362 nfnl_lock(NFNL_SUBSYS_NFTABLES);
4363 list_add_rcu(&obj_type->list, &nf_tables_objects);
4364 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
4365 return 0;
4366}
4367EXPORT_SYMBOL_GPL(nft_register_obj);
4368
4369/**
4370 * nft_unregister_obj - unregister nf_tables object type
4371 * @obj: object type
4372 *
4373 * Unregisters the object type for use with nf_tables.
4374 */
4375void nft_unregister_obj(struct nft_object_type *obj_type)
4376{
4377 nfnl_lock(NFNL_SUBSYS_NFTABLES);
4378 list_del_rcu(&obj_type->list);
4379 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
4380}
4381EXPORT_SYMBOL_GPL(nft_unregister_obj);
4382
4383struct nft_object *nf_tables_obj_lookup(const struct nft_table *table,
4384 const struct nlattr *nla,
4385 u32 objtype, u8 genmask)
4386{
4387 struct nft_object *obj;
4388
4389 list_for_each_entry(obj, &table->objects, list) {
4390 if (!nla_strcmp(nla, obj->name) &&
dfc46034 4391 objtype == obj->ops->type->type &&
e5009240
PNA
4392 nft_active_genmask(obj, genmask))
4393 return obj;
4394 }
4395 return ERR_PTR(-ENOENT);
4396}
4397EXPORT_SYMBOL_GPL(nf_tables_obj_lookup);
4398
ae0662f8 4399static struct nft_object *nf_tables_obj_lookup_byhandle(const struct nft_table *table,
4400 const struct nlattr *nla,
4401 u32 objtype, u8 genmask)
3ecbfd65
HS
4402{
4403 struct nft_object *obj;
4404
4405 list_for_each_entry(obj, &table->objects, list) {
4406 if (be64_to_cpu(nla_get_be64(nla)) == obj->handle &&
4407 objtype == obj->ops->type->type &&
4408 nft_active_genmask(obj, genmask))
4409 return obj;
4410 }
4411 return ERR_PTR(-ENOENT);
4412}
4413
e5009240 4414static const struct nla_policy nft_obj_policy[NFTA_OBJ_MAX + 1] = {
b2fbd044
LZ
4415 [NFTA_OBJ_TABLE] = { .type = NLA_STRING,
4416 .len = NFT_TABLE_MAXNAMELEN - 1 },
4417 [NFTA_OBJ_NAME] = { .type = NLA_STRING,
4418 .len = NFT_OBJ_MAXNAMELEN - 1 },
e5009240
PNA
4419 [NFTA_OBJ_TYPE] = { .type = NLA_U32 },
4420 [NFTA_OBJ_DATA] = { .type = NLA_NESTED },
3ecbfd65 4421 [NFTA_OBJ_HANDLE] = { .type = NLA_U64},
e5009240
PNA
4422};
4423
84fba055
FW
4424static struct nft_object *nft_obj_init(const struct nft_ctx *ctx,
4425 const struct nft_object_type *type,
e5009240
PNA
4426 const struct nlattr *attr)
4427{
5b4c6e38 4428 struct nlattr **tb;
dfc46034 4429 const struct nft_object_ops *ops;
e5009240 4430 struct nft_object *obj;
5b4c6e38
GS
4431 int err = -ENOMEM;
4432
4433 tb = kmalloc_array(type->maxattr + 1, sizeof(*tb), GFP_KERNEL);
4434 if (!tb)
4435 goto err1;
e5009240
PNA
4436
4437 if (attr) {
fceb6435
JB
4438 err = nla_parse_nested(tb, type->maxattr, attr, type->policy,
4439 NULL);
e5009240 4440 if (err < 0)
5b4c6e38 4441 goto err2;
e5009240
PNA
4442 } else {
4443 memset(tb, 0, sizeof(tb[0]) * (type->maxattr + 1));
4444 }
4445
dfc46034
PBG
4446 if (type->select_ops) {
4447 ops = type->select_ops(ctx, (const struct nlattr * const *)tb);
4448 if (IS_ERR(ops)) {
4449 err = PTR_ERR(ops);
5b4c6e38 4450 goto err2;
dfc46034
PBG
4451 }
4452 } else {
4453 ops = type->ops;
4454 }
4455
e5009240 4456 err = -ENOMEM;
dfc46034 4457 obj = kzalloc(sizeof(*obj) + ops->size, GFP_KERNEL);
5b4c6e38
GS
4458 if (!obj)
4459 goto err2;
e5009240 4460
dfc46034 4461 err = ops->init(ctx, (const struct nlattr * const *)tb, obj);
e5009240 4462 if (err < 0)
5b4c6e38 4463 goto err3;
e5009240 4464
dfc46034
PBG
4465 obj->ops = ops;
4466
5b4c6e38 4467 kfree(tb);
e5009240 4468 return obj;
5b4c6e38 4469err3:
e5009240 4470 kfree(obj);
5b4c6e38
GS
4471err2:
4472 kfree(tb);
e5009240
PNA
4473err1:
4474 return ERR_PTR(err);
4475}
4476
4477static int nft_object_dump(struct sk_buff *skb, unsigned int attr,
43da04a5 4478 struct nft_object *obj, bool reset)
e5009240
PNA
4479{
4480 struct nlattr *nest;
4481
4482 nest = nla_nest_start(skb, attr);
4483 if (!nest)
4484 goto nla_put_failure;
dfc46034 4485 if (obj->ops->dump(skb, obj, reset) < 0)
e5009240
PNA
4486 goto nla_put_failure;
4487 nla_nest_end(skb, nest);
4488 return 0;
4489
4490nla_put_failure:
4491 return -1;
4492}
4493
4494static const struct nft_object_type *__nft_obj_type_get(u32 objtype)
4495{
4496 const struct nft_object_type *type;
4497
4498 list_for_each_entry(type, &nf_tables_objects, list) {
4499 if (objtype == type->type)
4500 return type;
4501 }
4502 return NULL;
4503}
4504
4505static const struct nft_object_type *nft_obj_type_get(u32 objtype)
4506{
4507 const struct nft_object_type *type;
4508
4509 type = __nft_obj_type_get(objtype);
4510 if (type != NULL && try_module_get(type->owner))
4511 return type;
4512
4513#ifdef CONFIG_MODULES
4514 if (type == NULL) {
4515 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
4516 request_module("nft-obj-%u", objtype);
4517 nfnl_lock(NFNL_SUBSYS_NFTABLES);
4518 if (__nft_obj_type_get(objtype))
4519 return ERR_PTR(-EAGAIN);
4520 }
4521#endif
4522 return ERR_PTR(-ENOENT);
4523}
4524
4525static int nf_tables_newobj(struct net *net, struct sock *nlsk,
4526 struct sk_buff *skb, const struct nlmsghdr *nlh,
04ba724b
PNA
4527 const struct nlattr * const nla[],
4528 struct netlink_ext_ack *extack)
e5009240
PNA
4529{
4530 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
4531 const struct nft_object_type *type;
4532 u8 genmask = nft_genmask_next(net);
4533 int family = nfmsg->nfgen_family;
e5009240
PNA
4534 struct nft_table *table;
4535 struct nft_object *obj;
4536 struct nft_ctx ctx;
4537 u32 objtype;
4538 int err;
4539
4540 if (!nla[NFTA_OBJ_TYPE] ||
4541 !nla[NFTA_OBJ_NAME] ||
4542 !nla[NFTA_OBJ_DATA])
4543 return -EINVAL;
4544
98319cb9 4545 table = nf_tables_table_lookup(net, nla[NFTA_OBJ_TABLE], family,
36596dad 4546 genmask);
e5009240
PNA
4547 if (IS_ERR(table))
4548 return PTR_ERR(table);
4549
4550 objtype = ntohl(nla_get_be32(nla[NFTA_OBJ_TYPE]));
4551 obj = nf_tables_obj_lookup(table, nla[NFTA_OBJ_NAME], objtype, genmask);
4552 if (IS_ERR(obj)) {
4553 err = PTR_ERR(obj);
4554 if (err != -ENOENT)
4555 return err;
4556
1a28ad74 4557 } else {
e5009240
PNA
4558 if (nlh->nlmsg_flags & NLM_F_EXCL)
4559 return -EEXIST;
4560
4561 return 0;
4562 }
4563
98319cb9 4564 nft_ctx_init(&ctx, net, skb, nlh, family, table, NULL, nla);
e5009240
PNA
4565
4566 type = nft_obj_type_get(objtype);
4567 if (IS_ERR(type))
4568 return PTR_ERR(type);
4569
84fba055 4570 obj = nft_obj_init(&ctx, type, nla[NFTA_OBJ_DATA]);
e5009240
PNA
4571 if (IS_ERR(obj)) {
4572 err = PTR_ERR(obj);
4573 goto err1;
4574 }
18965317 4575 obj->table = table;
3ecbfd65
HS
4576 obj->handle = nf_tables_alloc_handle(table);
4577
61509575
PS
4578 obj->name = nla_strdup(nla[NFTA_OBJ_NAME], GFP_KERNEL);
4579 if (!obj->name) {
4580 err = -ENOMEM;
4581 goto err2;
4582 }
e5009240
PNA
4583
4584 err = nft_trans_obj_add(&ctx, NFT_MSG_NEWOBJ, obj);
4585 if (err < 0)
61509575 4586 goto err3;
e5009240
PNA
4587
4588 list_add_tail_rcu(&obj->list, &table->objects);
4589 table->use++;
4590 return 0;
61509575
PS
4591err3:
4592 kfree(obj->name);
e5009240 4593err2:
dfc46034
PBG
4594 if (obj->ops->destroy)
4595 obj->ops->destroy(obj);
e5009240
PNA
4596 kfree(obj);
4597err1:
4598 module_put(type->owner);
4599 return err;
4600}
4601
4602static int nf_tables_fill_obj_info(struct sk_buff *skb, struct net *net,
4603 u32 portid, u32 seq, int event, u32 flags,
4604 int family, const struct nft_table *table,
43da04a5 4605 struct nft_object *obj, bool reset)
e5009240
PNA
4606{
4607 struct nfgenmsg *nfmsg;
4608 struct nlmsghdr *nlh;
4609
dedb67c4 4610 event = nfnl_msg_type(NFNL_SUBSYS_NFTABLES, event);
e5009240
PNA
4611 nlh = nlmsg_put(skb, portid, seq, event, sizeof(struct nfgenmsg), flags);
4612 if (nlh == NULL)
4613 goto nla_put_failure;
4614
4615 nfmsg = nlmsg_data(nlh);
4616 nfmsg->nfgen_family = family;
4617 nfmsg->version = NFNETLINK_V0;
4618 nfmsg->res_id = htons(net->nft.base_seq & 0xffff);
4619
4620 if (nla_put_string(skb, NFTA_OBJ_TABLE, table->name) ||
4621 nla_put_string(skb, NFTA_OBJ_NAME, obj->name) ||
dfc46034 4622 nla_put_be32(skb, NFTA_OBJ_TYPE, htonl(obj->ops->type->type)) ||
e5009240 4623 nla_put_be32(skb, NFTA_OBJ_USE, htonl(obj->use)) ||
3ecbfd65
HS
4624 nft_object_dump(skb, NFTA_OBJ_DATA, obj, reset) ||
4625 nla_put_be64(skb, NFTA_OBJ_HANDLE, cpu_to_be64(obj->handle),
4626 NFTA_OBJ_PAD))
e5009240
PNA
4627 goto nla_put_failure;
4628
4629 nlmsg_end(skb, nlh);
4630 return 0;
4631
4632nla_put_failure:
4633 nlmsg_trim(skb, nlh);
4634 return -1;
4635}
4636
a9fea2a3 4637struct nft_obj_filter {
e46abbcc 4638 char *table;
a9fea2a3
PNA
4639 u32 type;
4640};
4641
e5009240
PNA
4642static int nf_tables_dump_obj(struct sk_buff *skb, struct netlink_callback *cb)
4643{
4644 const struct nfgenmsg *nfmsg = nlmsg_data(cb->nlh);
e5009240 4645 const struct nft_table *table;
e5009240 4646 unsigned int idx = 0, s_idx = cb->args[0];
a9fea2a3 4647 struct nft_obj_filter *filter = cb->data;
e5009240
PNA
4648 struct net *net = sock_net(skb->sk);
4649 int family = nfmsg->nfgen_family;
43da04a5
PNA
4650 struct nft_object *obj;
4651 bool reset = false;
4652
4653 if (NFNL_MSG_TYPE(cb->nlh->nlmsg_type) == NFT_MSG_GETOBJ_RESET)
4654 reset = true;
e5009240
PNA
4655
4656 rcu_read_lock();
4657 cb->seq = net->nft.base_seq;
4658
36596dad 4659 list_for_each_entry_rcu(table, &net->nft.tables, list) {
98319cb9 4660 if (family != NFPROTO_UNSPEC && family != table->family)
e5009240
PNA
4661 continue;
4662
36596dad
PNA
4663 list_for_each_entry_rcu(obj, &table->objects, list) {
4664 if (!nft_is_active(net, obj))
4665 goto cont;
4666 if (idx < s_idx)
4667 goto cont;
4668 if (idx > s_idx)
4669 memset(&cb->args[1], 0,
4670 sizeof(cb->args) - sizeof(cb->args[0]));
4671 if (filter && filter->table[0] &&
4672 strcmp(filter->table, table->name))
4673 goto cont;
4674 if (filter &&
4675 filter->type != NFT_OBJECT_UNSPEC &&
4676 obj->ops->type->type != filter->type)
4677 goto cont;
a9fea2a3 4678
36596dad
PNA
4679 if (nf_tables_fill_obj_info(skb, net, NETLINK_CB(cb->skb).portid,
4680 cb->nlh->nlmsg_seq,
4681 NFT_MSG_NEWOBJ,
4682 NLM_F_MULTI | NLM_F_APPEND,
98319cb9 4683 table->family, table,
36596dad
PNA
4684 obj, reset) < 0)
4685 goto done;
e5009240 4686
36596dad 4687 nl_dump_check_consistent(cb, nlmsg_hdr(skb));
e5009240 4688cont:
36596dad 4689 idx++;
e5009240
PNA
4690 }
4691 }
4692done:
4693 rcu_read_unlock();
4694
4695 cb->args[0] = idx;
4696 return skb->len;
4697}
4698
a9fea2a3
PNA
4699static int nf_tables_dump_obj_done(struct netlink_callback *cb)
4700{
e46abbcc
PS
4701 struct nft_obj_filter *filter = cb->data;
4702
8bea728d
HL
4703 if (filter) {
4704 kfree(filter->table);
4705 kfree(filter);
4706 }
a9fea2a3
PNA
4707
4708 return 0;
4709}
4710
4711static struct nft_obj_filter *
4712nft_obj_filter_alloc(const struct nlattr * const nla[])
4713{
4714 struct nft_obj_filter *filter;
4715
4716 filter = kzalloc(sizeof(*filter), GFP_KERNEL);
4717 if (!filter)
4718 return ERR_PTR(-ENOMEM);
4719
e46abbcc
PS
4720 if (nla[NFTA_OBJ_TABLE]) {
4721 filter->table = nla_strdup(nla[NFTA_OBJ_TABLE], GFP_KERNEL);
4722 if (!filter->table) {
4723 kfree(filter);
4724 return ERR_PTR(-ENOMEM);
4725 }
4726 }
a9fea2a3
PNA
4727 if (nla[NFTA_OBJ_TYPE])
4728 filter->type = ntohl(nla_get_be32(nla[NFTA_OBJ_TYPE]));
4729
4730 return filter;
4731}
4732
e5009240
PNA
4733static int nf_tables_getobj(struct net *net, struct sock *nlsk,
4734 struct sk_buff *skb, const struct nlmsghdr *nlh,
04ba724b
PNA
4735 const struct nlattr * const nla[],
4736 struct netlink_ext_ack *extack)
e5009240
PNA
4737{
4738 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
4739 u8 genmask = nft_genmask_cur(net);
4740 int family = nfmsg->nfgen_family;
e5009240
PNA
4741 const struct nft_table *table;
4742 struct nft_object *obj;
4743 struct sk_buff *skb2;
43da04a5 4744 bool reset = false;
e5009240
PNA
4745 u32 objtype;
4746 int err;
4747
4748 if (nlh->nlmsg_flags & NLM_F_DUMP) {
4749 struct netlink_dump_control c = {
4750 .dump = nf_tables_dump_obj,
a9fea2a3 4751 .done = nf_tables_dump_obj_done,
e5009240 4752 };
a9fea2a3
PNA
4753
4754 if (nla[NFTA_OBJ_TABLE] ||
4755 nla[NFTA_OBJ_TYPE]) {
4756 struct nft_obj_filter *filter;
4757
4758 filter = nft_obj_filter_alloc(nla);
4759 if (IS_ERR(filter))
4760 return -ENOMEM;
4761
4762 c.data = filter;
4763 }
e5009240
PNA
4764 return netlink_dump_start(nlsk, skb, nlh, &c);
4765 }
4766
4767 if (!nla[NFTA_OBJ_NAME] ||
4768 !nla[NFTA_OBJ_TYPE])
4769 return -EINVAL;
4770
98319cb9 4771 table = nf_tables_table_lookup(net, nla[NFTA_OBJ_TABLE], family,
36596dad 4772 genmask);
e5009240
PNA
4773 if (IS_ERR(table))
4774 return PTR_ERR(table);
4775
4776 objtype = ntohl(nla_get_be32(nla[NFTA_OBJ_TYPE]));
4777 obj = nf_tables_obj_lookup(table, nla[NFTA_OBJ_NAME], objtype, genmask);
4778 if (IS_ERR(obj))
4779 return PTR_ERR(obj);
4780
4781 skb2 = alloc_skb(NLMSG_GOODSIZE, GFP_KERNEL);
4782 if (!skb2)
4783 return -ENOMEM;
4784
43da04a5
PNA
4785 if (NFNL_MSG_TYPE(nlh->nlmsg_type) == NFT_MSG_GETOBJ_RESET)
4786 reset = true;
4787
e5009240
PNA
4788 err = nf_tables_fill_obj_info(skb2, net, NETLINK_CB(skb).portid,
4789 nlh->nlmsg_seq, NFT_MSG_NEWOBJ, 0,
43da04a5 4790 family, table, obj, reset);
e5009240
PNA
4791 if (err < 0)
4792 goto err;
4793
4794 return nlmsg_unicast(nlsk, skb2, NETLINK_CB(skb).portid);
4795err:
4796 kfree_skb(skb2);
4797 return err;
e5009240
PNA
4798}
4799
4800static void nft_obj_destroy(struct nft_object *obj)
4801{
dfc46034
PBG
4802 if (obj->ops->destroy)
4803 obj->ops->destroy(obj);
e5009240 4804
dfc46034 4805 module_put(obj->ops->type->owner);
61509575 4806 kfree(obj->name);
e5009240
PNA
4807 kfree(obj);
4808}
4809
4810static int nf_tables_delobj(struct net *net, struct sock *nlsk,
04ba724b
PNA
4811 struct sk_buff *skb, const struct nlmsghdr *nlh,
4812 const struct nlattr * const nla[],
4813 struct netlink_ext_ack *extack)
e5009240
PNA
4814{
4815 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
4816 u8 genmask = nft_genmask_next(net);
4817 int family = nfmsg->nfgen_family;
e5009240
PNA
4818 struct nft_table *table;
4819 struct nft_object *obj;
4820 struct nft_ctx ctx;
4821 u32 objtype;
4822
4823 if (!nla[NFTA_OBJ_TYPE] ||
3ecbfd65 4824 (!nla[NFTA_OBJ_NAME] && !nla[NFTA_OBJ_HANDLE]))
e5009240
PNA
4825 return -EINVAL;
4826
98319cb9 4827 table = nf_tables_table_lookup(net, nla[NFTA_OBJ_TABLE], family,
36596dad 4828 genmask);
e5009240
PNA
4829 if (IS_ERR(table))
4830 return PTR_ERR(table);
4831
4832 objtype = ntohl(nla_get_be32(nla[NFTA_OBJ_TYPE]));
3ecbfd65
HS
4833 if (nla[NFTA_OBJ_HANDLE])
4834 obj = nf_tables_obj_lookup_byhandle(table, nla[NFTA_OBJ_HANDLE],
4835 objtype, genmask);
4836 else
4837 obj = nf_tables_obj_lookup(table, nla[NFTA_OBJ_NAME],
4838 objtype, genmask);
e5009240
PNA
4839 if (IS_ERR(obj))
4840 return PTR_ERR(obj);
4841 if (obj->use > 0)
4842 return -EBUSY;
4843
98319cb9 4844 nft_ctx_init(&ctx, net, skb, nlh, family, table, NULL, nla);
e5009240
PNA
4845
4846 return nft_delobj(&ctx, obj);
4847}
4848
25e94a99
PNA
4849void nft_obj_notify(struct net *net, struct nft_table *table,
4850 struct nft_object *obj, u32 portid, u32 seq, int event,
4851 int family, int report, gfp_t gfp)
e5009240
PNA
4852{
4853 struct sk_buff *skb;
4854 int err;
4855
2599e989
PNA
4856 if (!report &&
4857 !nfnetlink_has_listeners(net, NFNLGRP_NFTABLES))
25e94a99 4858 return;
e5009240 4859
2599e989 4860 skb = nlmsg_new(NLMSG_GOODSIZE, gfp);
e5009240
PNA
4861 if (skb == NULL)
4862 goto err;
4863
2599e989
PNA
4864 err = nf_tables_fill_obj_info(skb, net, portid, seq, event, 0, family,
4865 table, obj, false);
e5009240
PNA
4866 if (err < 0) {
4867 kfree_skb(skb);
4868 goto err;
4869 }
4870
25e94a99
PNA
4871 nfnetlink_send(skb, net, portid, NFNLGRP_NFTABLES, report, gfp);
4872 return;
e5009240 4873err:
25e94a99 4874 nfnetlink_set_err(net, portid, NFNLGRP_NFTABLES, -ENOBUFS);
e5009240 4875}
2599e989
PNA
4876EXPORT_SYMBOL_GPL(nft_obj_notify);
4877
25e94a99
PNA
4878static void nf_tables_obj_notify(const struct nft_ctx *ctx,
4879 struct nft_object *obj, int event)
2599e989 4880{
25e94a99 4881 nft_obj_notify(ctx->net, ctx->table, obj, ctx->portid, ctx->seq, event,
36596dad 4882 ctx->family, ctx->report, GFP_KERNEL);
2599e989 4883}
e5009240 4884
3b49e2e9
PNA
4885/*
4886 * Flow tables
4887 */
4888void nft_register_flowtable_type(struct nf_flowtable_type *type)
4889{
4890 nfnl_lock(NFNL_SUBSYS_NFTABLES);
4891 list_add_tail_rcu(&type->list, &nf_tables_flowtables);
4892 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
4893}
4894EXPORT_SYMBOL_GPL(nft_register_flowtable_type);
4895
4896void nft_unregister_flowtable_type(struct nf_flowtable_type *type)
4897{
4898 nfnl_lock(NFNL_SUBSYS_NFTABLES);
4899 list_del_rcu(&type->list);
4900 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
4901}
4902EXPORT_SYMBOL_GPL(nft_unregister_flowtable_type);
4903
4904static const struct nla_policy nft_flowtable_policy[NFTA_FLOWTABLE_MAX + 1] = {
4905 [NFTA_FLOWTABLE_TABLE] = { .type = NLA_STRING,
4906 .len = NFT_NAME_MAXLEN - 1 },
4907 [NFTA_FLOWTABLE_NAME] = { .type = NLA_STRING,
4908 .len = NFT_NAME_MAXLEN - 1 },
4909 [NFTA_FLOWTABLE_HOOK] = { .type = NLA_NESTED },
3ecbfd65 4910 [NFTA_FLOWTABLE_HANDLE] = { .type = NLA_U64 },
3b49e2e9
PNA
4911};
4912
4913struct nft_flowtable *nf_tables_flowtable_lookup(const struct nft_table *table,
4914 const struct nlattr *nla,
4915 u8 genmask)
4916{
4917 struct nft_flowtable *flowtable;
4918
4919 list_for_each_entry(flowtable, &table->flowtables, list) {
4920 if (!nla_strcmp(nla, flowtable->name) &&
4921 nft_active_genmask(flowtable, genmask))
4922 return flowtable;
4923 }
4924 return ERR_PTR(-ENOENT);
4925}
4926EXPORT_SYMBOL_GPL(nf_tables_flowtable_lookup);
4927
ae0662f8 4928static struct nft_flowtable *
3ecbfd65
HS
4929nf_tables_flowtable_lookup_byhandle(const struct nft_table *table,
4930 const struct nlattr *nla, u8 genmask)
4931{
4932 struct nft_flowtable *flowtable;
4933
4934 list_for_each_entry(flowtable, &table->flowtables, list) {
4935 if (be64_to_cpu(nla_get_be64(nla)) == flowtable->handle &&
4936 nft_active_genmask(flowtable, genmask))
4937 return flowtable;
4938 }
4939 return ERR_PTR(-ENOENT);
4940}
4941
3b49e2e9
PNA
4942static int nf_tables_parse_devices(const struct nft_ctx *ctx,
4943 const struct nlattr *attr,
4944 struct net_device *dev_array[], int *len)
4945{
4946 const struct nlattr *tmp;
4947 struct net_device *dev;
4948 char ifname[IFNAMSIZ];
4949 int rem, n = 0, err;
4950
4951 nla_for_each_nested(tmp, attr, rem) {
4952 if (nla_type(tmp) != NFTA_DEVICE_NAME) {
4953 err = -EINVAL;
4954 goto err1;
4955 }
4956
4957 nla_strlcpy(ifname, tmp, IFNAMSIZ);
90d2723c 4958 dev = __dev_get_by_name(ctx->net, ifname);
3b49e2e9
PNA
4959 if (!dev) {
4960 err = -ENOENT;
4961 goto err1;
4962 }
4963
4964 dev_array[n++] = dev;
4965 if (n == NFT_FLOWTABLE_DEVICE_MAX) {
4966 err = -EFBIG;
4967 goto err1;
4968 }
4969 }
4970 if (!len)
4971 return -EINVAL;
4972
4973 err = 0;
4974err1:
4975 *len = n;
4976 return err;
4977}
4978
4979static const struct nla_policy nft_flowtable_hook_policy[NFTA_FLOWTABLE_HOOK_MAX + 1] = {
4980 [NFTA_FLOWTABLE_HOOK_NUM] = { .type = NLA_U32 },
4981 [NFTA_FLOWTABLE_HOOK_PRIORITY] = { .type = NLA_U32 },
4982 [NFTA_FLOWTABLE_HOOK_DEVS] = { .type = NLA_NESTED },
4983};
4984
4985static int nf_tables_flowtable_parse_hook(const struct nft_ctx *ctx,
4986 const struct nlattr *attr,
4987 struct nft_flowtable *flowtable)
4988{
4989 struct net_device *dev_array[NFT_FLOWTABLE_DEVICE_MAX];
4990 struct nlattr *tb[NFTA_FLOWTABLE_HOOK_MAX + 1];
4991 struct nf_hook_ops *ops;
4992 int hooknum, priority;
4993 int err, n = 0, i;
4994
4995 err = nla_parse_nested(tb, NFTA_FLOWTABLE_HOOK_MAX, attr,
4996 nft_flowtable_hook_policy, NULL);
4997 if (err < 0)
4998 return err;
4999
5000 if (!tb[NFTA_FLOWTABLE_HOOK_NUM] ||
5001 !tb[NFTA_FLOWTABLE_HOOK_PRIORITY] ||
5002 !tb[NFTA_FLOWTABLE_HOOK_DEVS])
5003 return -EINVAL;
5004
5005 hooknum = ntohl(nla_get_be32(tb[NFTA_FLOWTABLE_HOOK_NUM]));
fe19c04c 5006 if (hooknum != NF_NETDEV_INGRESS)
3b49e2e9
PNA
5007 return -EINVAL;
5008
5009 priority = ntohl(nla_get_be32(tb[NFTA_FLOWTABLE_HOOK_PRIORITY]));
5010
5011 err = nf_tables_parse_devices(ctx, tb[NFTA_FLOWTABLE_HOOK_DEVS],
5012 dev_array, &n);
5013 if (err < 0)
d92191aa 5014 return err;
3b49e2e9
PNA
5015
5016 ops = kzalloc(sizeof(struct nf_hook_ops) * n, GFP_KERNEL);
90d2723c
PNA
5017 if (!ops)
5018 return -ENOMEM;
3b49e2e9 5019
0e839dfa
PNA
5020 flowtable->hooknum = hooknum;
5021 flowtable->priority = priority;
3b49e2e9
PNA
5022 flowtable->ops = ops;
5023 flowtable->ops_len = n;
5024
5025 for (i = 0; i < n; i++) {
5026 flowtable->ops[i].pf = NFPROTO_NETDEV;
5027 flowtable->ops[i].hooknum = hooknum;
5028 flowtable->ops[i].priority = priority;
5029 flowtable->ops[i].priv = &flowtable->data.rhashtable;
5030 flowtable->ops[i].hook = flowtable->data.type->hook;
5031 flowtable->ops[i].dev = dev_array[i];
d92191aa
PNA
5032 flowtable->dev_name[i] = kstrdup(dev_array[i]->name,
5033 GFP_KERNEL);
3b49e2e9
PNA
5034 }
5035
3b49e2e9
PNA
5036 return err;
5037}
5038
98319cb9 5039static const struct nf_flowtable_type *__nft_flowtable_type_get(u8 family)
3b49e2e9
PNA
5040{
5041 const struct nf_flowtable_type *type;
5042
5043 list_for_each_entry(type, &nf_tables_flowtables, list) {
98319cb9 5044 if (family == type->family)
3b49e2e9
PNA
5045 return type;
5046 }
5047 return NULL;
5048}
5049
98319cb9 5050static const struct nf_flowtable_type *nft_flowtable_type_get(u8 family)
3b49e2e9
PNA
5051{
5052 const struct nf_flowtable_type *type;
5053
98319cb9 5054 type = __nft_flowtable_type_get(family);
3b49e2e9
PNA
5055 if (type != NULL && try_module_get(type->owner))
5056 return type;
5057
5058#ifdef CONFIG_MODULES
5059 if (type == NULL) {
5060 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
98319cb9 5061 request_module("nf-flowtable-%u", family);
3b49e2e9 5062 nfnl_lock(NFNL_SUBSYS_NFTABLES);
98319cb9 5063 if (__nft_flowtable_type_get(family))
3b49e2e9
PNA
5064 return ERR_PTR(-EAGAIN);
5065 }
5066#endif
5067 return ERR_PTR(-ENOENT);
5068}
5069
5070void nft_flow_table_iterate(struct net *net,
5071 void (*iter)(struct nf_flowtable *flowtable, void *data),
5072 void *data)
5073{
5074 struct nft_flowtable *flowtable;
3b49e2e9
PNA
5075 const struct nft_table *table;
5076
c7f0030b
PNA
5077 nfnl_lock(NFNL_SUBSYS_NFTABLES);
5078 list_for_each_entry(table, &net->nft.tables, list) {
5079 list_for_each_entry(flowtable, &table->flowtables, list) {
dd4cbef7 5080 iter(&flowtable->data, data);
3b49e2e9
PNA
5081 }
5082 }
c7f0030b 5083 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
3b49e2e9
PNA
5084}
5085EXPORT_SYMBOL_GPL(nft_flow_table_iterate);
5086
5087static void nft_unregister_flowtable_net_hooks(struct net *net,
5088 struct nft_flowtable *flowtable)
5089{
5090 int i;
5091
5092 for (i = 0; i < flowtable->ops_len; i++) {
5093 if (!flowtable->ops[i].dev)
5094 continue;
5095
5096 nf_unregister_net_hook(net, &flowtable->ops[i]);
5097 }
5098}
5099
5100static int nf_tables_newflowtable(struct net *net, struct sock *nlsk,
5101 struct sk_buff *skb,
5102 const struct nlmsghdr *nlh,
5103 const struct nlattr * const nla[],
5104 struct netlink_ext_ack *extack)
5105{
5106 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
5107 const struct nf_flowtable_type *type;
32fc7187 5108 struct nft_flowtable *flowtable, *ft;
3b49e2e9
PNA
5109 u8 genmask = nft_genmask_next(net);
5110 int family = nfmsg->nfgen_family;
3b49e2e9
PNA
5111 struct nft_table *table;
5112 struct nft_ctx ctx;
5113 int err, i, k;
5114
5115 if (!nla[NFTA_FLOWTABLE_TABLE] ||
5116 !nla[NFTA_FLOWTABLE_NAME] ||
5117 !nla[NFTA_FLOWTABLE_HOOK])
5118 return -EINVAL;
5119
36596dad 5120 table = nf_tables_table_lookup(net, nla[NFTA_FLOWTABLE_TABLE],
98319cb9 5121 family, genmask);
3b49e2e9
PNA
5122 if (IS_ERR(table))
5123 return PTR_ERR(table);
5124
5125 flowtable = nf_tables_flowtable_lookup(table, nla[NFTA_FLOWTABLE_NAME],
5126 genmask);
5127 if (IS_ERR(flowtable)) {
5128 err = PTR_ERR(flowtable);
5129 if (err != -ENOENT)
5130 return err;
5131 } else {
5132 if (nlh->nlmsg_flags & NLM_F_EXCL)
5133 return -EEXIST;
5134
5135 return 0;
5136 }
5137
98319cb9 5138 nft_ctx_init(&ctx, net, skb, nlh, family, table, NULL, nla);
3b49e2e9
PNA
5139
5140 flowtable = kzalloc(sizeof(*flowtable), GFP_KERNEL);
5141 if (!flowtable)
5142 return -ENOMEM;
5143
5144 flowtable->table = table;
3ecbfd65
HS
5145 flowtable->handle = nf_tables_alloc_handle(table);
5146
3b49e2e9
PNA
5147 flowtable->name = nla_strdup(nla[NFTA_FLOWTABLE_NAME], GFP_KERNEL);
5148 if (!flowtable->name) {
5149 err = -ENOMEM;
5150 goto err1;
5151 }
5152
98319cb9 5153 type = nft_flowtable_type_get(family);
3b49e2e9
PNA
5154 if (IS_ERR(type)) {
5155 err = PTR_ERR(type);
5156 goto err2;
5157 }
5158
5159 flowtable->data.type = type;
5160 err = rhashtable_init(&flowtable->data.rhashtable, type->params);
5161 if (err < 0)
5162 goto err3;
5163
5164 err = nf_tables_flowtable_parse_hook(&ctx, nla[NFTA_FLOWTABLE_HOOK],
5165 flowtable);
5166 if (err < 0)
5167 goto err3;
5168
5169 for (i = 0; i < flowtable->ops_len; i++) {
32fc7187
PNA
5170 if (!flowtable->ops[i].dev)
5171 continue;
5172
5173 list_for_each_entry(ft, &table->flowtables, list) {
5174 for (k = 0; k < ft->ops_len; k++) {
5175 if (!ft->ops[k].dev)
5176 continue;
5177
5178 if (flowtable->ops[i].dev == ft->ops[k].dev &&
5179 flowtable->ops[i].pf == ft->ops[k].pf) {
5180 err = -EBUSY;
5181 goto err4;
5182 }
5183 }
5184 }
5185
3b49e2e9
PNA
5186 err = nf_register_net_hook(net, &flowtable->ops[i]);
5187 if (err < 0)
5188 goto err4;
5189 }
5190
5191 err = nft_trans_flowtable_add(&ctx, NFT_MSG_NEWFLOWTABLE, flowtable);
5192 if (err < 0)
5193 goto err5;
5194
5195 INIT_DEFERRABLE_WORK(&flowtable->data.gc_work, type->gc);
5196 queue_delayed_work(system_power_efficient_wq,
5197 &flowtable->data.gc_work, HZ);
5198
5199 list_add_tail_rcu(&flowtable->list, &table->flowtables);
5200 table->use++;
5201
5202 return 0;
5203err5:
5204 i = flowtable->ops_len;
5205err4:
d92191aa
PNA
5206 for (k = i - 1; k >= 0; k--) {
5207 kfree(flowtable->dev_name[k]);
0e0d5002 5208 nf_unregister_net_hook(net, &flowtable->ops[k]);
d92191aa 5209 }
3b49e2e9
PNA
5210
5211 kfree(flowtable->ops);
5212err3:
5213 module_put(type->owner);
5214err2:
5215 kfree(flowtable->name);
5216err1:
5217 kfree(flowtable);
5218 return err;
5219}
5220
5221static int nf_tables_delflowtable(struct net *net, struct sock *nlsk,
5222 struct sk_buff *skb,
5223 const struct nlmsghdr *nlh,
5224 const struct nlattr * const nla[],
5225 struct netlink_ext_ack *extack)
5226{
5227 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
5228 u8 genmask = nft_genmask_next(net);
5229 int family = nfmsg->nfgen_family;
5230 struct nft_flowtable *flowtable;
3b49e2e9
PNA
5231 struct nft_table *table;
5232 struct nft_ctx ctx;
5233
e603ea4b
PNA
5234 if (!nla[NFTA_FLOWTABLE_TABLE] ||
5235 (!nla[NFTA_FLOWTABLE_NAME] &&
5236 !nla[NFTA_FLOWTABLE_HANDLE]))
5237 return -EINVAL;
5238
36596dad 5239 table = nf_tables_table_lookup(net, nla[NFTA_FLOWTABLE_TABLE],
98319cb9 5240 family, genmask);
3b49e2e9
PNA
5241 if (IS_ERR(table))
5242 return PTR_ERR(table);
5243
3ecbfd65
HS
5244 if (nla[NFTA_FLOWTABLE_HANDLE])
5245 flowtable = nf_tables_flowtable_lookup_byhandle(table,
5246 nla[NFTA_FLOWTABLE_HANDLE],
5247 genmask);
5248 else
5249 flowtable = nf_tables_flowtable_lookup(table,
5250 nla[NFTA_FLOWTABLE_NAME],
5251 genmask);
3b49e2e9
PNA
5252 if (IS_ERR(flowtable))
5253 return PTR_ERR(flowtable);
5254 if (flowtable->use > 0)
5255 return -EBUSY;
5256
98319cb9 5257 nft_ctx_init(&ctx, net, skb, nlh, family, table, NULL, nla);
3b49e2e9
PNA
5258
5259 return nft_delflowtable(&ctx, flowtable);
5260}
5261
5262static int nf_tables_fill_flowtable_info(struct sk_buff *skb, struct net *net,
5263 u32 portid, u32 seq, int event,
5264 u32 flags, int family,
5265 struct nft_flowtable *flowtable)
5266{
5267 struct nlattr *nest, *nest_devs;
5268 struct nfgenmsg *nfmsg;
5269 struct nlmsghdr *nlh;
5270 int i;
5271
5272 event = nfnl_msg_type(NFNL_SUBSYS_NFTABLES, event);
5273 nlh = nlmsg_put(skb, portid, seq, event, sizeof(struct nfgenmsg), flags);
5274 if (nlh == NULL)
5275 goto nla_put_failure;
5276
5277 nfmsg = nlmsg_data(nlh);
5278 nfmsg->nfgen_family = family;
5279 nfmsg->version = NFNETLINK_V0;
5280 nfmsg->res_id = htons(net->nft.base_seq & 0xffff);
5281
5282 if (nla_put_string(skb, NFTA_FLOWTABLE_TABLE, flowtable->table->name) ||
5283 nla_put_string(skb, NFTA_FLOWTABLE_NAME, flowtable->name) ||
3ecbfd65
HS
5284 nla_put_be32(skb, NFTA_FLOWTABLE_USE, htonl(flowtable->use)) ||
5285 nla_put_be64(skb, NFTA_FLOWTABLE_HANDLE, cpu_to_be64(flowtable->handle),
5286 NFTA_FLOWTABLE_PAD))
3b49e2e9
PNA
5287 goto nla_put_failure;
5288
5289 nest = nla_nest_start(skb, NFTA_FLOWTABLE_HOOK);
5290 if (nla_put_be32(skb, NFTA_FLOWTABLE_HOOK_NUM, htonl(flowtable->hooknum)) ||
5291 nla_put_be32(skb, NFTA_FLOWTABLE_HOOK_PRIORITY, htonl(flowtable->priority)))
5292 goto nla_put_failure;
5293
5294 nest_devs = nla_nest_start(skb, NFTA_FLOWTABLE_HOOK_DEVS);
5295 if (!nest_devs)
5296 goto nla_put_failure;
5297
5298 for (i = 0; i < flowtable->ops_len; i++) {
d92191aa 5299 if (flowtable->dev_name[i][0] &&
3b49e2e9 5300 nla_put_string(skb, NFTA_DEVICE_NAME,
d92191aa 5301 flowtable->dev_name[i]))
3b49e2e9
PNA
5302 goto nla_put_failure;
5303 }
5304 nla_nest_end(skb, nest_devs);
5305 nla_nest_end(skb, nest);
5306
5307 nlmsg_end(skb, nlh);
5308 return 0;
5309
5310nla_put_failure:
5311 nlmsg_trim(skb, nlh);
5312 return -1;
5313}
5314
5315struct nft_flowtable_filter {
5316 char *table;
5317};
5318
5319static int nf_tables_dump_flowtable(struct sk_buff *skb,
5320 struct netlink_callback *cb)
5321{
5322 const struct nfgenmsg *nfmsg = nlmsg_data(cb->nlh);
5323 struct nft_flowtable_filter *filter = cb->data;
5324 unsigned int idx = 0, s_idx = cb->args[0];
5325 struct net *net = sock_net(skb->sk);
5326 int family = nfmsg->nfgen_family;
5327 struct nft_flowtable *flowtable;
3b49e2e9
PNA
5328 const struct nft_table *table;
5329
5330 rcu_read_lock();
5331 cb->seq = net->nft.base_seq;
5332
36596dad 5333 list_for_each_entry_rcu(table, &net->nft.tables, list) {
98319cb9 5334 if (family != NFPROTO_UNSPEC && family != table->family)
3b49e2e9
PNA
5335 continue;
5336
36596dad
PNA
5337 list_for_each_entry_rcu(flowtable, &table->flowtables, list) {
5338 if (!nft_is_active(net, flowtable))
5339 goto cont;
5340 if (idx < s_idx)
5341 goto cont;
5342 if (idx > s_idx)
5343 memset(&cb->args[1], 0,
5344 sizeof(cb->args) - sizeof(cb->args[0]));
5345 if (filter && filter->table[0] &&
5346 strcmp(filter->table, table->name))
5347 goto cont;
3b49e2e9 5348
36596dad
PNA
5349 if (nf_tables_fill_flowtable_info(skb, net, NETLINK_CB(cb->skb).portid,
5350 cb->nlh->nlmsg_seq,
5351 NFT_MSG_NEWFLOWTABLE,
5352 NLM_F_MULTI | NLM_F_APPEND,
98319cb9 5353 table->family, flowtable) < 0)
36596dad 5354 goto done;
3b49e2e9 5355
36596dad 5356 nl_dump_check_consistent(cb, nlmsg_hdr(skb));
3b49e2e9 5357cont:
36596dad 5358 idx++;
3b49e2e9
PNA
5359 }
5360 }
5361done:
5362 rcu_read_unlock();
5363
5364 cb->args[0] = idx;
5365 return skb->len;
5366}
5367
5368static int nf_tables_dump_flowtable_done(struct netlink_callback *cb)
5369{
5370 struct nft_flowtable_filter *filter = cb->data;
5371
5372 if (!filter)
5373 return 0;
5374
5375 kfree(filter->table);
5376 kfree(filter);
5377
5378 return 0;
5379}
5380
5381static struct nft_flowtable_filter *
5382nft_flowtable_filter_alloc(const struct nlattr * const nla[])
5383{
5384 struct nft_flowtable_filter *filter;
5385
5386 filter = kzalloc(sizeof(*filter), GFP_KERNEL);
5387 if (!filter)
5388 return ERR_PTR(-ENOMEM);
5389
5390 if (nla[NFTA_FLOWTABLE_TABLE]) {
5391 filter->table = nla_strdup(nla[NFTA_FLOWTABLE_TABLE],
5392 GFP_KERNEL);
5393 if (!filter->table) {
5394 kfree(filter);
5395 return ERR_PTR(-ENOMEM);
5396 }
5397 }
5398 return filter;
5399}
5400
5401static int nf_tables_getflowtable(struct net *net, struct sock *nlsk,
5402 struct sk_buff *skb,
5403 const struct nlmsghdr *nlh,
5404 const struct nlattr * const nla[],
5405 struct netlink_ext_ack *extack)
5406{
5407 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
5408 u8 genmask = nft_genmask_cur(net);
5409 int family = nfmsg->nfgen_family;
5410 struct nft_flowtable *flowtable;
3b49e2e9
PNA
5411 const struct nft_table *table;
5412 struct sk_buff *skb2;
5413 int err;
5414
5415 if (nlh->nlmsg_flags & NLM_F_DUMP) {
5416 struct netlink_dump_control c = {
5417 .dump = nf_tables_dump_flowtable,
5418 .done = nf_tables_dump_flowtable_done,
5419 };
5420
5421 if (nla[NFTA_FLOWTABLE_TABLE]) {
5422 struct nft_flowtable_filter *filter;
5423
5424 filter = nft_flowtable_filter_alloc(nla);
5425 if (IS_ERR(filter))
5426 return -ENOMEM;
5427
5428 c.data = filter;
5429 }
5430 return netlink_dump_start(nlsk, skb, nlh, &c);
5431 }
5432
5433 if (!nla[NFTA_FLOWTABLE_NAME])
5434 return -EINVAL;
5435
36596dad 5436 table = nf_tables_table_lookup(net, nla[NFTA_FLOWTABLE_TABLE],
98319cb9 5437 family, genmask);
3b49e2e9
PNA
5438 if (IS_ERR(table))
5439 return PTR_ERR(table);
5440
5441 flowtable = nf_tables_flowtable_lookup(table, nla[NFTA_FLOWTABLE_NAME],
5442 genmask);
03a0120f 5443 if (IS_ERR(flowtable))
3b49e2e9
PNA
5444 return PTR_ERR(flowtable);
5445
5446 skb2 = alloc_skb(NLMSG_GOODSIZE, GFP_KERNEL);
5447 if (!skb2)
5448 return -ENOMEM;
5449
5450 err = nf_tables_fill_flowtable_info(skb2, net, NETLINK_CB(skb).portid,
5451 nlh->nlmsg_seq,
5452 NFT_MSG_NEWFLOWTABLE, 0, family,
5453 flowtable);
5454 if (err < 0)
5455 goto err;
5456
5457 return nlmsg_unicast(nlsk, skb2, NETLINK_CB(skb).portid);
5458err:
5459 kfree_skb(skb2);
5460 return err;
5461}
5462
5463static void nf_tables_flowtable_notify(struct nft_ctx *ctx,
5464 struct nft_flowtable *flowtable,
5465 int event)
5466{
5467 struct sk_buff *skb;
5468 int err;
5469
5470 if (ctx->report &&
5471 !nfnetlink_has_listeners(ctx->net, NFNLGRP_NFTABLES))
5472 return;
5473
5474 skb = nlmsg_new(NLMSG_GOODSIZE, GFP_KERNEL);
5475 if (skb == NULL)
5476 goto err;
5477
5478 err = nf_tables_fill_flowtable_info(skb, ctx->net, ctx->portid,
5479 ctx->seq, event, 0,
36596dad 5480 ctx->family, flowtable);
3b49e2e9
PNA
5481 if (err < 0) {
5482 kfree_skb(skb);
5483 goto err;
5484 }
5485
5486 nfnetlink_send(skb, ctx->net, ctx->portid, NFNLGRP_NFTABLES,
5487 ctx->report, GFP_KERNEL);
5488 return;
5489err:
5490 nfnetlink_set_err(ctx->net, ctx->portid, NFNLGRP_NFTABLES, -ENOBUFS);
5491}
5492
3b49e2e9
PNA
5493static void nf_tables_flowtable_destroy(struct nft_flowtable *flowtable)
5494{
5495 cancel_delayed_work_sync(&flowtable->data.gc_work);
c04a3f73 5496 kfree(flowtable->ops);
3b49e2e9 5497 kfree(flowtable->name);
b408c5b0
PNA
5498 flowtable->data.type->free(&flowtable->data);
5499 rhashtable_destroy(&flowtable->data.rhashtable);
3b49e2e9
PNA
5500 module_put(flowtable->data.type->owner);
5501}
5502
84d7fce6
PNA
5503static int nf_tables_fill_gen_info(struct sk_buff *skb, struct net *net,
5504 u32 portid, u32 seq)
5505{
5506 struct nlmsghdr *nlh;
5507 struct nfgenmsg *nfmsg;
784b4e61 5508 char buf[TASK_COMM_LEN];
dedb67c4 5509 int event = nfnl_msg_type(NFNL_SUBSYS_NFTABLES, NFT_MSG_NEWGEN);
84d7fce6
PNA
5510
5511 nlh = nlmsg_put(skb, portid, seq, event, sizeof(struct nfgenmsg), 0);
5512 if (nlh == NULL)
5513 goto nla_put_failure;
5514
5515 nfmsg = nlmsg_data(nlh);
5516 nfmsg->nfgen_family = AF_UNSPEC;
5517 nfmsg->version = NFNETLINK_V0;
5518 nfmsg->res_id = htons(net->nft.base_seq & 0xffff);
5519
784b4e61
PS
5520 if (nla_put_be32(skb, NFTA_GEN_ID, htonl(net->nft.base_seq)) ||
5521 nla_put_be32(skb, NFTA_GEN_PROC_PID, htonl(task_pid_nr(current))) ||
5522 nla_put_string(skb, NFTA_GEN_PROC_NAME, get_task_comm(buf, current)))
84d7fce6
PNA
5523 goto nla_put_failure;
5524
053c095a
JB
5525 nlmsg_end(skb, nlh);
5526 return 0;
84d7fce6
PNA
5527
5528nla_put_failure:
5529 nlmsg_trim(skb, nlh);
5530 return -EMSGSIZE;
5531}
5532
3b49e2e9
PNA
5533static void nft_flowtable_event(unsigned long event, struct net_device *dev,
5534 struct nft_flowtable *flowtable)
5535{
5536 int i;
5537
5538 for (i = 0; i < flowtable->ops_len; i++) {
5539 if (flowtable->ops[i].dev != dev)
5540 continue;
5541
5542 nf_unregister_net_hook(dev_net(dev), &flowtable->ops[i]);
d92191aa 5543 flowtable->dev_name[i][0] = '\0';
3b49e2e9
PNA
5544 flowtable->ops[i].dev = NULL;
5545 break;
5546 }
5547}
5548
5549static int nf_tables_flowtable_event(struct notifier_block *this,
5550 unsigned long event, void *ptr)
5551{
5552 struct net_device *dev = netdev_notifier_info_to_dev(ptr);
5553 struct nft_flowtable *flowtable;
5554 struct nft_table *table;
3b49e2e9
PNA
5555
5556 if (event != NETDEV_UNREGISTER)
5557 return 0;
5558
5559 nfnl_lock(NFNL_SUBSYS_NFTABLES);
36596dad
PNA
5560 list_for_each_entry(table, &dev_net(dev)->nft.tables, list) {
5561 list_for_each_entry(flowtable, &table->flowtables, list) {
5562 nft_flowtable_event(event, dev, flowtable);
3b49e2e9
PNA
5563 }
5564 }
5565 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
5566
5567 return NOTIFY_DONE;
5568}
5569
5570static struct notifier_block nf_tables_flowtable_notifier = {
5571 .notifier_call = nf_tables_flowtable_event,
5572};
5573
25e94a99
PNA
5574static void nf_tables_gen_notify(struct net *net, struct sk_buff *skb,
5575 int event)
84d7fce6
PNA
5576{
5577 struct nlmsghdr *nlh = nlmsg_hdr(skb);
5578 struct sk_buff *skb2;
5579 int err;
5580
5581 if (nlmsg_report(nlh) &&
5582 !nfnetlink_has_listeners(net, NFNLGRP_NFTABLES))
25e94a99 5583 return;
84d7fce6 5584
84d7fce6
PNA
5585 skb2 = nlmsg_new(NLMSG_GOODSIZE, GFP_KERNEL);
5586 if (skb2 == NULL)
5587 goto err;
5588
5589 err = nf_tables_fill_gen_info(skb2, net, NETLINK_CB(skb).portid,
5590 nlh->nlmsg_seq);
5591 if (err < 0) {
5592 kfree_skb(skb2);
5593 goto err;
5594 }
5595
25e94a99
PNA
5596 nfnetlink_send(skb2, net, NETLINK_CB(skb).portid, NFNLGRP_NFTABLES,
5597 nlmsg_report(nlh), GFP_KERNEL);
5598 return;
84d7fce6 5599err:
25e94a99
PNA
5600 nfnetlink_set_err(net, NETLINK_CB(skb).portid, NFNLGRP_NFTABLES,
5601 -ENOBUFS);
84d7fce6
PNA
5602}
5603
7b8002a1
PNA
5604static int nf_tables_getgen(struct net *net, struct sock *nlsk,
5605 struct sk_buff *skb, const struct nlmsghdr *nlh,
04ba724b
PNA
5606 const struct nlattr * const nla[],
5607 struct netlink_ext_ack *extack)
84d7fce6 5608{
84d7fce6
PNA
5609 struct sk_buff *skb2;
5610 int err;
5611
5612 skb2 = alloc_skb(NLMSG_GOODSIZE, GFP_KERNEL);
5613 if (skb2 == NULL)
5614 return -ENOMEM;
5615
5616 err = nf_tables_fill_gen_info(skb2, net, NETLINK_CB(skb).portid,
5617 nlh->nlmsg_seq);
5618 if (err < 0)
5619 goto err;
5620
5621 return nlmsg_unicast(nlsk, skb2, NETLINK_CB(skb).portid);
5622err:
5623 kfree_skb(skb2);
5624 return err;
5625}
5626
96518518
PM
5627static const struct nfnl_callback nf_tables_cb[NFT_MSG_MAX] = {
5628 [NFT_MSG_NEWTABLE] = {
55dd6f93 5629 .call_batch = nf_tables_newtable,
96518518
PM
5630 .attr_count = NFTA_TABLE_MAX,
5631 .policy = nft_table_policy,
5632 },
5633 [NFT_MSG_GETTABLE] = {
5634 .call = nf_tables_gettable,
5635 .attr_count = NFTA_TABLE_MAX,
5636 .policy = nft_table_policy,
5637 },
5638 [NFT_MSG_DELTABLE] = {
55dd6f93 5639 .call_batch = nf_tables_deltable,
96518518
PM
5640 .attr_count = NFTA_TABLE_MAX,
5641 .policy = nft_table_policy,
5642 },
5643 [NFT_MSG_NEWCHAIN] = {
91c7b38d 5644 .call_batch = nf_tables_newchain,
96518518
PM
5645 .attr_count = NFTA_CHAIN_MAX,
5646 .policy = nft_chain_policy,
5647 },
5648 [NFT_MSG_GETCHAIN] = {
5649 .call = nf_tables_getchain,
5650 .attr_count = NFTA_CHAIN_MAX,
5651 .policy = nft_chain_policy,
5652 },
5653 [NFT_MSG_DELCHAIN] = {
91c7b38d 5654 .call_batch = nf_tables_delchain,
96518518
PM
5655 .attr_count = NFTA_CHAIN_MAX,
5656 .policy = nft_chain_policy,
5657 },
5658 [NFT_MSG_NEWRULE] = {
0628b123 5659 .call_batch = nf_tables_newrule,
96518518
PM
5660 .attr_count = NFTA_RULE_MAX,
5661 .policy = nft_rule_policy,
5662 },
5663 [NFT_MSG_GETRULE] = {
5664 .call = nf_tables_getrule,
5665 .attr_count = NFTA_RULE_MAX,
5666 .policy = nft_rule_policy,
5667 },
5668 [NFT_MSG_DELRULE] = {
0628b123 5669 .call_batch = nf_tables_delrule,
96518518
PM
5670 .attr_count = NFTA_RULE_MAX,
5671 .policy = nft_rule_policy,
5672 },
20a69341 5673 [NFT_MSG_NEWSET] = {
958bee14 5674 .call_batch = nf_tables_newset,
20a69341
PM
5675 .attr_count = NFTA_SET_MAX,
5676 .policy = nft_set_policy,
5677 },
5678 [NFT_MSG_GETSET] = {
5679 .call = nf_tables_getset,
5680 .attr_count = NFTA_SET_MAX,
5681 .policy = nft_set_policy,
5682 },
5683 [NFT_MSG_DELSET] = {
958bee14 5684 .call_batch = nf_tables_delset,
20a69341
PM
5685 .attr_count = NFTA_SET_MAX,
5686 .policy = nft_set_policy,
5687 },
5688 [NFT_MSG_NEWSETELEM] = {
958bee14 5689 .call_batch = nf_tables_newsetelem,
20a69341
PM
5690 .attr_count = NFTA_SET_ELEM_LIST_MAX,
5691 .policy = nft_set_elem_list_policy,
5692 },
5693 [NFT_MSG_GETSETELEM] = {
5694 .call = nf_tables_getsetelem,
5695 .attr_count = NFTA_SET_ELEM_LIST_MAX,
5696 .policy = nft_set_elem_list_policy,
5697 },
5698 [NFT_MSG_DELSETELEM] = {
958bee14 5699 .call_batch = nf_tables_delsetelem,
20a69341
PM
5700 .attr_count = NFTA_SET_ELEM_LIST_MAX,
5701 .policy = nft_set_elem_list_policy,
5702 },
84d7fce6
PNA
5703 [NFT_MSG_GETGEN] = {
5704 .call = nf_tables_getgen,
5705 },
e5009240
PNA
5706 [NFT_MSG_NEWOBJ] = {
5707 .call_batch = nf_tables_newobj,
5708 .attr_count = NFTA_OBJ_MAX,
5709 .policy = nft_obj_policy,
5710 },
5711 [NFT_MSG_GETOBJ] = {
5712 .call = nf_tables_getobj,
5713 .attr_count = NFTA_OBJ_MAX,
5714 .policy = nft_obj_policy,
5715 },
5716 [NFT_MSG_DELOBJ] = {
5717 .call_batch = nf_tables_delobj,
5718 .attr_count = NFTA_OBJ_MAX,
5719 .policy = nft_obj_policy,
5720 },
43da04a5
PNA
5721 [NFT_MSG_GETOBJ_RESET] = {
5722 .call = nf_tables_getobj,
5723 .attr_count = NFTA_OBJ_MAX,
5724 .policy = nft_obj_policy,
5725 },
3b49e2e9
PNA
5726 [NFT_MSG_NEWFLOWTABLE] = {
5727 .call_batch = nf_tables_newflowtable,
5728 .attr_count = NFTA_FLOWTABLE_MAX,
5729 .policy = nft_flowtable_policy,
5730 },
5731 [NFT_MSG_GETFLOWTABLE] = {
5732 .call = nf_tables_getflowtable,
5733 .attr_count = NFTA_FLOWTABLE_MAX,
5734 .policy = nft_flowtable_policy,
5735 },
5736 [NFT_MSG_DELFLOWTABLE] = {
5737 .call_batch = nf_tables_delflowtable,
5738 .attr_count = NFTA_FLOWTABLE_MAX,
5739 .policy = nft_flowtable_policy,
5740 },
96518518
PM
5741};
5742
91c7b38d
PNA
5743static void nft_chain_commit_update(struct nft_trans *trans)
5744{
5745 struct nft_base_chain *basechain;
5746
b7263e07 5747 if (nft_trans_chain_name(trans))
d71efb59 5748 swap(trans->ctx.chain->name, nft_trans_chain_name(trans));
91c7b38d 5749
f323d954 5750 if (!nft_is_base_chain(trans->ctx.chain))
91c7b38d
PNA
5751 return;
5752
5753 basechain = nft_base_chain(trans->ctx.chain);
5754 nft_chain_stats_replace(basechain, nft_trans_chain_stats(trans));
5755
5756 switch (nft_trans_chain_policy(trans)) {
5757 case NF_DROP:
5758 case NF_ACCEPT:
5759 basechain->policy = nft_trans_chain_policy(trans);
5760 break;
5761 }
5762}
5763
b326dd37 5764static void nf_tables_commit_release(struct nft_trans *trans)
c7c32e72 5765{
c7c32e72
PNA
5766 switch (trans->msg_type) {
5767 case NFT_MSG_DELTABLE:
5768 nf_tables_table_destroy(&trans->ctx);
5769 break;
5770 case NFT_MSG_DELCHAIN:
43a605f2 5771 nf_tables_chain_destroy(&trans->ctx);
c7c32e72
PNA
5772 break;
5773 case NFT_MSG_DELRULE:
5774 nf_tables_rule_destroy(&trans->ctx, nft_trans_rule(trans));
5775 break;
5776 case NFT_MSG_DELSET:
5777 nft_set_destroy(nft_trans_set(trans));
5778 break;
61edafbb 5779 case NFT_MSG_DELSETELEM:
59105446
PNA
5780 nf_tables_set_elem_destroy(nft_trans_elem_set(trans),
5781 nft_trans_elem(trans).priv);
61edafbb 5782 break;
e5009240
PNA
5783 case NFT_MSG_DELOBJ:
5784 nft_obj_destroy(nft_trans_obj(trans));
5785 break;
3b49e2e9
PNA
5786 case NFT_MSG_DELFLOWTABLE:
5787 nf_tables_flowtable_destroy(nft_trans_flowtable(trans));
5788 break;
c7c32e72
PNA
5789 }
5790 kfree(trans);
5791}
5792
5913beaf 5793static int nf_tables_commit(struct net *net, struct sk_buff *skb)
37082f93 5794{
37082f93 5795 struct nft_trans *trans, *next;
a3716e70 5796 struct nft_trans_elem *te;
37082f93
PNA
5797
5798 /* Bump generation counter, invalidate any dump in progress */
38e029f1 5799 while (++net->nft.base_seq == 0);
37082f93
PNA
5800
5801 /* A new generation has just started */
ea4bd995 5802 net->nft.gencursor = nft_gencursor_next(net);
37082f93
PNA
5803
5804 /* Make sure all packets have left the previous generation before
5805 * purging old rules.
5806 */
5807 synchronize_rcu();
5808
5809 list_for_each_entry_safe(trans, next, &net->nft.commit_list, list) {
b380e5c7 5810 switch (trans->msg_type) {
55dd6f93
PNA
5811 case NFT_MSG_NEWTABLE:
5812 if (nft_trans_table_update(trans)) {
5813 if (!nft_trans_table_enable(trans)) {
664b0f8c 5814 nf_tables_table_disable(net,
55dd6f93
PNA
5815 trans->ctx.table);
5816 trans->ctx.table->flags |= NFT_TABLE_F_DORMANT;
5817 }
5818 } else {
f2a6d766 5819 nft_clear(net, trans->ctx.table);
55dd6f93 5820 }
35151d84 5821 nf_tables_table_notify(&trans->ctx, NFT_MSG_NEWTABLE);
55dd6f93
PNA
5822 nft_trans_destroy(trans);
5823 break;
5824 case NFT_MSG_DELTABLE:
f2a6d766 5825 list_del_rcu(&trans->ctx.table->list);
35151d84 5826 nf_tables_table_notify(&trans->ctx, NFT_MSG_DELTABLE);
55dd6f93 5827 break;
91c7b38d
PNA
5828 case NFT_MSG_NEWCHAIN:
5829 if (nft_trans_chain_update(trans))
5830 nft_chain_commit_update(trans);
4fefee57 5831 else
664b0f8c 5832 nft_clear(net, trans->ctx.chain);
4fefee57 5833
35151d84 5834 nf_tables_chain_notify(&trans->ctx, NFT_MSG_NEWCHAIN);
91c7b38d
PNA
5835 nft_trans_destroy(trans);
5836 break;
5837 case NFT_MSG_DELCHAIN:
664b0f8c 5838 list_del_rcu(&trans->ctx.chain->list);
35151d84 5839 nf_tables_chain_notify(&trans->ctx, NFT_MSG_DELCHAIN);
c974a3a3
PNA
5840 nf_tables_unregister_hook(trans->ctx.net,
5841 trans->ctx.table,
5842 trans->ctx.chain);
91c7b38d 5843 break;
b380e5c7 5844 case NFT_MSG_NEWRULE:
889f7ee7 5845 nft_clear(trans->ctx.net, nft_trans_rule(trans));
35151d84 5846 nf_tables_rule_notify(&trans->ctx,
37082f93 5847 nft_trans_rule(trans),
35151d84 5848 NFT_MSG_NEWRULE);
37082f93 5849 nft_trans_destroy(trans);
b380e5c7
PNA
5850 break;
5851 case NFT_MSG_DELRULE:
5852 list_del_rcu(&nft_trans_rule(trans)->list);
35151d84
PNA
5853 nf_tables_rule_notify(&trans->ctx,
5854 nft_trans_rule(trans),
5855 NFT_MSG_DELRULE);
b380e5c7 5856 break;
958bee14 5857 case NFT_MSG_NEWSET:
37a9cc52 5858 nft_clear(net, nft_trans_set(trans));
4fefee57
PNA
5859 /* This avoids hitting -EBUSY when deleting the table
5860 * from the transaction.
5861 */
408070d6 5862 if (nft_set_is_anonymous(nft_trans_set(trans)) &&
4fefee57
PNA
5863 !list_empty(&nft_trans_set(trans)->bindings))
5864 trans->ctx.table->use--;
5865
958bee14 5866 nf_tables_set_notify(&trans->ctx, nft_trans_set(trans),
31f8441c 5867 NFT_MSG_NEWSET, GFP_KERNEL);
958bee14
PNA
5868 nft_trans_destroy(trans);
5869 break;
5870 case NFT_MSG_DELSET:
37a9cc52 5871 list_del_rcu(&nft_trans_set(trans)->list);
958bee14 5872 nf_tables_set_notify(&trans->ctx, nft_trans_set(trans),
31f8441c 5873 NFT_MSG_DELSET, GFP_KERNEL);
958bee14 5874 break;
60319eb1 5875 case NFT_MSG_NEWSETELEM:
cc02e457
PM
5876 te = (struct nft_trans_elem *)trans->data;
5877
42a55769 5878 te->set->ops->activate(net, te->set, &te->elem);
cc02e457
PM
5879 nf_tables_setelem_notify(&trans->ctx, te->set,
5880 &te->elem,
60319eb1
PNA
5881 NFT_MSG_NEWSETELEM, 0);
5882 nft_trans_destroy(trans);
5883 break;
5884 case NFT_MSG_DELSETELEM:
a3716e70 5885 te = (struct nft_trans_elem *)trans->data;
fe2811eb 5886
a3716e70
PNA
5887 nf_tables_setelem_notify(&trans->ctx, te->set,
5888 &te->elem,
60319eb1 5889 NFT_MSG_DELSETELEM, 0);
5cb82a38 5890 te->set->ops->remove(net, te->set, &te->elem);
3dd0673a
PM
5891 atomic_dec(&te->set->nelems);
5892 te->set->ndeact--;
60319eb1 5893 break;
e5009240
PNA
5894 case NFT_MSG_NEWOBJ:
5895 nft_clear(net, nft_trans_obj(trans));
5896 nf_tables_obj_notify(&trans->ctx, nft_trans_obj(trans),
5897 NFT_MSG_NEWOBJ);
5898 nft_trans_destroy(trans);
5899 break;
5900 case NFT_MSG_DELOBJ:
5901 list_del_rcu(&nft_trans_obj(trans)->list);
5902 nf_tables_obj_notify(&trans->ctx, nft_trans_obj(trans),
5903 NFT_MSG_DELOBJ);
5904 break;
3b49e2e9
PNA
5905 case NFT_MSG_NEWFLOWTABLE:
5906 nft_clear(net, nft_trans_flowtable(trans));
5907 nf_tables_flowtable_notify(&trans->ctx,
5908 nft_trans_flowtable(trans),
5909 NFT_MSG_NEWFLOWTABLE);
5910 nft_trans_destroy(trans);
5911 break;
5912 case NFT_MSG_DELFLOWTABLE:
5913 list_del_rcu(&nft_trans_flowtable(trans)->list);
5914 nf_tables_flowtable_notify(&trans->ctx,
5915 nft_trans_flowtable(trans),
5916 NFT_MSG_DELFLOWTABLE);
5917 nft_unregister_flowtable_net_hooks(net,
5918 nft_trans_flowtable(trans));
5919 break;
37082f93 5920 }
37082f93
PNA
5921 }
5922
b326dd37
PNA
5923 synchronize_rcu();
5924
37082f93 5925 list_for_each_entry_safe(trans, next, &net->nft.commit_list, list) {
c7c32e72 5926 list_del(&trans->list);
b326dd37 5927 nf_tables_commit_release(trans);
37082f93 5928 }
84d7fce6
PNA
5929
5930 nf_tables_gen_notify(net, skb, NFT_MSG_NEWGEN);
37082f93
PNA
5931
5932 return 0;
5933}
5934
b326dd37 5935static void nf_tables_abort_release(struct nft_trans *trans)
c7c32e72 5936{
c7c32e72
PNA
5937 switch (trans->msg_type) {
5938 case NFT_MSG_NEWTABLE:
5939 nf_tables_table_destroy(&trans->ctx);
5940 break;
5941 case NFT_MSG_NEWCHAIN:
43a605f2 5942 nf_tables_chain_destroy(&trans->ctx);
c7c32e72
PNA
5943 break;
5944 case NFT_MSG_NEWRULE:
5945 nf_tables_rule_destroy(&trans->ctx, nft_trans_rule(trans));
5946 break;
5947 case NFT_MSG_NEWSET:
5948 nft_set_destroy(nft_trans_set(trans));
5949 break;
61edafbb
PM
5950 case NFT_MSG_NEWSETELEM:
5951 nft_set_elem_destroy(nft_trans_elem_set(trans),
61f9e292 5952 nft_trans_elem(trans).priv, true);
61edafbb 5953 break;
e5009240
PNA
5954 case NFT_MSG_NEWOBJ:
5955 nft_obj_destroy(nft_trans_obj(trans));
5956 break;
3b49e2e9
PNA
5957 case NFT_MSG_NEWFLOWTABLE:
5958 nf_tables_flowtable_destroy(nft_trans_flowtable(trans));
5959 break;
c7c32e72
PNA
5960 }
5961 kfree(trans);
5962}
5963
5913beaf 5964static int nf_tables_abort(struct net *net, struct sk_buff *skb)
37082f93 5965{
37082f93 5966 struct nft_trans *trans, *next;
02263db0 5967 struct nft_trans_elem *te;
37082f93 5968
a907e36d
XL
5969 list_for_each_entry_safe_reverse(trans, next, &net->nft.commit_list,
5970 list) {
b380e5c7 5971 switch (trans->msg_type) {
55dd6f93
PNA
5972 case NFT_MSG_NEWTABLE:
5973 if (nft_trans_table_update(trans)) {
5974 if (nft_trans_table_enable(trans)) {
664b0f8c 5975 nf_tables_table_disable(net,
55dd6f93
PNA
5976 trans->ctx.table);
5977 trans->ctx.table->flags |= NFT_TABLE_F_DORMANT;
5978 }
5979 nft_trans_destroy(trans);
5980 } else {
e688a7f8 5981 list_del_rcu(&trans->ctx.table->list);
55dd6f93
PNA
5982 }
5983 break;
5984 case NFT_MSG_DELTABLE:
f2a6d766 5985 nft_clear(trans->ctx.net, trans->ctx.table);
55dd6f93
PNA
5986 nft_trans_destroy(trans);
5987 break;
91c7b38d
PNA
5988 case NFT_MSG_NEWCHAIN:
5989 if (nft_trans_chain_update(trans)) {
982f4051 5990 free_percpu(nft_trans_chain_stats(trans));
91c7b38d
PNA
5991
5992 nft_trans_destroy(trans);
5993 } else {
4fefee57 5994 trans->ctx.table->use--;
e688a7f8 5995 list_del_rcu(&trans->ctx.chain->list);
c974a3a3
PNA
5996 nf_tables_unregister_hook(trans->ctx.net,
5997 trans->ctx.table,
5998 trans->ctx.chain);
91c7b38d
PNA
5999 }
6000 break;
6001 case NFT_MSG_DELCHAIN:
4fefee57 6002 trans->ctx.table->use++;
664b0f8c 6003 nft_clear(trans->ctx.net, trans->ctx.chain);
91c7b38d
PNA
6004 nft_trans_destroy(trans);
6005 break;
b380e5c7 6006 case NFT_MSG_NEWRULE:
4fefee57 6007 trans->ctx.chain->use--;
b380e5c7
PNA
6008 list_del_rcu(&nft_trans_rule(trans)->list);
6009 break;
6010 case NFT_MSG_DELRULE:
4fefee57 6011 trans->ctx.chain->use++;
889f7ee7 6012 nft_clear(trans->ctx.net, nft_trans_rule(trans));
37082f93 6013 nft_trans_destroy(trans);
b380e5c7 6014 break;
958bee14 6015 case NFT_MSG_NEWSET:
4fefee57 6016 trans->ctx.table->use--;
e688a7f8 6017 list_del_rcu(&nft_trans_set(trans)->list);
958bee14
PNA
6018 break;
6019 case NFT_MSG_DELSET:
4fefee57 6020 trans->ctx.table->use++;
37a9cc52 6021 nft_clear(trans->ctx.net, nft_trans_set(trans));
958bee14
PNA
6022 nft_trans_destroy(trans);
6023 break;
60319eb1 6024 case NFT_MSG_NEWSETELEM:
02263db0 6025 te = (struct nft_trans_elem *)trans->data;
fe2811eb 6026
5cb82a38 6027 te->set->ops->remove(net, te->set, &te->elem);
3dd0673a 6028 atomic_dec(&te->set->nelems);
60319eb1
PNA
6029 break;
6030 case NFT_MSG_DELSETELEM:
cc02e457
PM
6031 te = (struct nft_trans_elem *)trans->data;
6032
59105446 6033 nft_set_elem_activate(net, te->set, &te->elem);
42a55769 6034 te->set->ops->activate(net, te->set, &te->elem);
3dd0673a 6035 te->set->ndeact--;
cc02e457 6036
e5009240
PNA
6037 nft_trans_destroy(trans);
6038 break;
6039 case NFT_MSG_NEWOBJ:
6040 trans->ctx.table->use--;
6041 list_del_rcu(&nft_trans_obj(trans)->list);
6042 break;
6043 case NFT_MSG_DELOBJ:
6044 trans->ctx.table->use++;
6045 nft_clear(trans->ctx.net, nft_trans_obj(trans));
60319eb1
PNA
6046 nft_trans_destroy(trans);
6047 break;
3b49e2e9
PNA
6048 case NFT_MSG_NEWFLOWTABLE:
6049 trans->ctx.table->use--;
6050 list_del_rcu(&nft_trans_flowtable(trans)->list);
6051 nft_unregister_flowtable_net_hooks(net,
6052 nft_trans_flowtable(trans));
6053 break;
6054 case NFT_MSG_DELFLOWTABLE:
6055 trans->ctx.table->use++;
6056 nft_clear(trans->ctx.net, nft_trans_flowtable(trans));
6057 nft_trans_destroy(trans);
6058 break;
37082f93 6059 }
37082f93
PNA
6060 }
6061
b326dd37
PNA
6062 synchronize_rcu();
6063
a1cee076
PNA
6064 list_for_each_entry_safe_reverse(trans, next,
6065 &net->nft.commit_list, list) {
c7c32e72 6066 list_del(&trans->list);
b326dd37 6067 nf_tables_abort_release(trans);
37082f93
PNA
6068 }
6069
6070 return 0;
6071}
6072
74e8bcd2
PNA
6073static bool nf_tables_valid_genid(struct net *net, u32 genid)
6074{
6075 return net->nft.base_seq == genid;
6076}
6077
96518518
PM
6078static const struct nfnetlink_subsystem nf_tables_subsys = {
6079 .name = "nf_tables",
6080 .subsys_id = NFNL_SUBSYS_NFTABLES,
6081 .cb_count = NFT_MSG_MAX,
6082 .cb = nf_tables_cb,
0628b123
PNA
6083 .commit = nf_tables_commit,
6084 .abort = nf_tables_abort,
74e8bcd2 6085 .valid_genid = nf_tables_valid_genid,
96518518
PM
6086};
6087
7210e4e3 6088int nft_chain_validate_dependency(const struct nft_chain *chain,
32537e91 6089 enum nft_chain_types type)
7210e4e3
PNA
6090{
6091 const struct nft_base_chain *basechain;
6092
f323d954 6093 if (nft_is_base_chain(chain)) {
7210e4e3
PNA
6094 basechain = nft_base_chain(chain);
6095 if (basechain->type->type != type)
6096 return -EOPNOTSUPP;
6097 }
6098 return 0;
6099}
6100EXPORT_SYMBOL_GPL(nft_chain_validate_dependency);
6101
75e8d06d
PNA
6102int nft_chain_validate_hooks(const struct nft_chain *chain,
6103 unsigned int hook_flags)
6104{
6105 struct nft_base_chain *basechain;
6106
f323d954 6107 if (nft_is_base_chain(chain)) {
75e8d06d
PNA
6108 basechain = nft_base_chain(chain);
6109
c974a3a3 6110 if ((1 << basechain->ops.hooknum) & hook_flags)
75e8d06d
PNA
6111 return 0;
6112
6113 return -EOPNOTSUPP;
6114 }
6115
6116 return 0;
6117}
6118EXPORT_SYMBOL_GPL(nft_chain_validate_hooks);
6119
20a69341
PM
6120/*
6121 * Loop detection - walk through the ruleset beginning at the destination chain
6122 * of a new jump until either the source chain is reached (loop) or all
6123 * reachable chains have been traversed.
6124 *
6125 * The loop check is performed whenever a new jump verdict is added to an
6126 * expression or verdict map or a verdict map is bound to a new chain.
6127 */
6128
6129static int nf_tables_check_loops(const struct nft_ctx *ctx,
6130 const struct nft_chain *chain);
6131
6132static int nf_tables_loop_check_setelem(const struct nft_ctx *ctx,
de70185d 6133 struct nft_set *set,
20a69341 6134 const struct nft_set_iter *iter,
de70185d 6135 struct nft_set_elem *elem)
20a69341 6136{
fe2811eb
PM
6137 const struct nft_set_ext *ext = nft_set_elem_ext(set, elem->priv);
6138 const struct nft_data *data;
6139
6140 if (nft_set_ext_exists(ext, NFT_SET_EXT_FLAGS) &&
6141 *nft_set_ext_flags(ext) & NFT_SET_ELEM_INTERVAL_END)
62f9c8b4
PNA
6142 return 0;
6143
fe2811eb 6144 data = nft_set_ext_data(ext);
1ca2e170 6145 switch (data->verdict.code) {
20a69341
PM
6146 case NFT_JUMP:
6147 case NFT_GOTO:
1ca2e170 6148 return nf_tables_check_loops(ctx, data->verdict.chain);
20a69341
PM
6149 default:
6150 return 0;
6151 }
6152}
6153
6154static int nf_tables_check_loops(const struct nft_ctx *ctx,
6155 const struct nft_chain *chain)
6156{
6157 const struct nft_rule *rule;
6158 const struct nft_expr *expr, *last;
de70185d 6159 struct nft_set *set;
20a69341
PM
6160 struct nft_set_binding *binding;
6161 struct nft_set_iter iter;
20a69341
PM
6162
6163 if (ctx->chain == chain)
6164 return -ELOOP;
6165
6166 list_for_each_entry(rule, &chain->rules, list) {
6167 nft_rule_for_each_expr(expr, last, rule) {
0ca743a5
PNA
6168 const struct nft_data *data = NULL;
6169 int err;
6170
6171 if (!expr->ops->validate)
20a69341
PM
6172 continue;
6173
0ca743a5
PNA
6174 err = expr->ops->validate(ctx, expr, &data);
6175 if (err < 0)
6176 return err;
6177
20a69341 6178 if (data == NULL)
0ca743a5 6179 continue;
20a69341 6180
1ca2e170 6181 switch (data->verdict.code) {
20a69341
PM
6182 case NFT_JUMP:
6183 case NFT_GOTO:
1ca2e170
PM
6184 err = nf_tables_check_loops(ctx,
6185 data->verdict.chain);
20a69341
PM
6186 if (err < 0)
6187 return err;
6188 default:
6189 break;
6190 }
6191 }
6192 }
6193
6194 list_for_each_entry(set, &ctx->table->sets, list) {
37a9cc52
PNA
6195 if (!nft_is_active_next(ctx->net, set))
6196 continue;
20a69341
PM
6197 if (!(set->flags & NFT_SET_MAP) ||
6198 set->dtype != NFT_DATA_VERDICT)
6199 continue;
6200
6201 list_for_each_entry(binding, &set->bindings, list) {
11113e19
PM
6202 if (!(binding->flags & NFT_SET_MAP) ||
6203 binding->chain != chain)
20a69341
PM
6204 continue;
6205
8588ac09 6206 iter.genmask = nft_genmask_next(ctx->net);
20a69341
PM
6207 iter.skip = 0;
6208 iter.count = 0;
6209 iter.err = 0;
6210 iter.fn = nf_tables_loop_check_setelem;
6211
6212 set->ops->walk(ctx, set, &iter);
6213 if (iter.err < 0)
6214 return iter.err;
6215 }
6216 }
6217
6218 return 0;
6219}
6220
36b701fa
LGL
6221/**
6222 * nft_parse_u32_check - fetch u32 attribute and check for maximum value
6223 *
6224 * @attr: netlink attribute to fetch value from
6225 * @max: maximum value to be stored in dest
6226 * @dest: pointer to the variable
6227 *
6228 * Parse, check and store a given u32 netlink attribute into variable.
6229 * This function returns -ERANGE if the value goes over maximum value.
6230 * Otherwise a 0 is returned and the attribute value is stored in the
6231 * destination variable.
6232 */
f1d505bb 6233int nft_parse_u32_check(const struct nlattr *attr, int max, u32 *dest)
36b701fa 6234{
09525a09 6235 u32 val;
36b701fa
LGL
6236
6237 val = ntohl(nla_get_be32(attr));
6238 if (val > max)
6239 return -ERANGE;
6240
6241 *dest = val;
6242 return 0;
6243}
6244EXPORT_SYMBOL_GPL(nft_parse_u32_check);
6245
49499c3e
PM
6246/**
6247 * nft_parse_register - parse a register value from a netlink attribute
6248 *
6249 * @attr: netlink attribute
6250 *
6251 * Parse and translate a register value from a netlink attribute.
6252 * Registers used to be 128 bit wide, these register numbers will be
6253 * mapped to the corresponding 32 bit register numbers.
6254 */
b1c96ed3
PM
6255unsigned int nft_parse_register(const struct nlattr *attr)
6256{
49499c3e
PM
6257 unsigned int reg;
6258
6259 reg = ntohl(nla_get_be32(attr));
6260 switch (reg) {
6261 case NFT_REG_VERDICT...NFT_REG_4:
6262 return reg * NFT_REG_SIZE / NFT_REG32_SIZE;
6263 default:
6264 return reg + NFT_REG_SIZE / NFT_REG32_SIZE - NFT_REG32_00;
6265 }
b1c96ed3
PM
6266}
6267EXPORT_SYMBOL_GPL(nft_parse_register);
6268
49499c3e
PM
6269/**
6270 * nft_dump_register - dump a register value to a netlink attribute
6271 *
6272 * @skb: socket buffer
6273 * @attr: attribute number
6274 * @reg: register number
6275 *
6276 * Construct a netlink attribute containing the register number. For
6277 * compatibility reasons, register numbers being a multiple of 4 are
6278 * translated to the corresponding 128 bit register numbers.
6279 */
b1c96ed3
PM
6280int nft_dump_register(struct sk_buff *skb, unsigned int attr, unsigned int reg)
6281{
49499c3e
PM
6282 if (reg % (NFT_REG_SIZE / NFT_REG32_SIZE) == 0)
6283 reg = reg / (NFT_REG_SIZE / NFT_REG32_SIZE);
6284 else
6285 reg = reg - NFT_REG_SIZE / NFT_REG32_SIZE + NFT_REG32_00;
6286
b1c96ed3
PM
6287 return nla_put_be32(skb, attr, htonl(reg));
6288}
6289EXPORT_SYMBOL_GPL(nft_dump_register);
6290
96518518 6291/**
d07db988 6292 * nft_validate_register_load - validate a load from a register
96518518
PM
6293 *
6294 * @reg: the register number
d07db988 6295 * @len: the length of the data
96518518
PM
6296 *
6297 * Validate that the input register is one of the general purpose
d07db988 6298 * registers and that the length of the load is within the bounds.
96518518 6299 */
d07db988 6300int nft_validate_register_load(enum nft_registers reg, unsigned int len)
96518518 6301{
49499c3e 6302 if (reg < NFT_REG_1 * NFT_REG_SIZE / NFT_REG32_SIZE)
96518518 6303 return -EINVAL;
d07db988
PM
6304 if (len == 0)
6305 return -EINVAL;
49499c3e 6306 if (reg * NFT_REG32_SIZE + len > FIELD_SIZEOF(struct nft_regs, data))
d07db988 6307 return -ERANGE;
49499c3e 6308
96518518
PM
6309 return 0;
6310}
d07db988 6311EXPORT_SYMBOL_GPL(nft_validate_register_load);
96518518 6312
96518518 6313/**
1ec10212 6314 * nft_validate_register_store - validate an expressions' register store
96518518
PM
6315 *
6316 * @ctx: context of the expression performing the load
6317 * @reg: the destination register number
6318 * @data: the data to load
6319 * @type: the data type
45d9bcda 6320 * @len: the length of the data
96518518
PM
6321 *
6322 * Validate that a data load uses the appropriate data type for
45d9bcda
PM
6323 * the destination register and the length is within the bounds.
6324 * A value of NULL for the data means that its runtime gathered
58f40ab6 6325 * data.
96518518 6326 */
1ec10212
PM
6327int nft_validate_register_store(const struct nft_ctx *ctx,
6328 enum nft_registers reg,
6329 const struct nft_data *data,
6330 enum nft_data_types type, unsigned int len)
96518518 6331{
20a69341
PM
6332 int err;
6333
96518518
PM
6334 switch (reg) {
6335 case NFT_REG_VERDICT:
58f40ab6 6336 if (type != NFT_DATA_VERDICT)
96518518 6337 return -EINVAL;
20a69341 6338
58f40ab6 6339 if (data != NULL &&
1ca2e170
PM
6340 (data->verdict.code == NFT_GOTO ||
6341 data->verdict.code == NFT_JUMP)) {
6342 err = nf_tables_check_loops(ctx, data->verdict.chain);
20a69341
PM
6343 if (err < 0)
6344 return err;
6345
1ca2e170
PM
6346 if (ctx->chain->level + 1 >
6347 data->verdict.chain->level) {
20a69341
PM
6348 if (ctx->chain->level + 1 == NFT_JUMP_STACK_SIZE)
6349 return -EMLINK;
1ca2e170 6350 data->verdict.chain->level = ctx->chain->level + 1;
20a69341
PM
6351 }
6352 }
6353
96518518
PM
6354 return 0;
6355 default:
49499c3e 6356 if (reg < NFT_REG_1 * NFT_REG_SIZE / NFT_REG32_SIZE)
27e6d201 6357 return -EINVAL;
45d9bcda
PM
6358 if (len == 0)
6359 return -EINVAL;
49499c3e
PM
6360 if (reg * NFT_REG32_SIZE + len >
6361 FIELD_SIZEOF(struct nft_regs, data))
45d9bcda 6362 return -ERANGE;
27e6d201 6363
96518518
PM
6364 if (data != NULL && type != NFT_DATA_VALUE)
6365 return -EINVAL;
6366 return 0;
6367 }
6368}
1ec10212 6369EXPORT_SYMBOL_GPL(nft_validate_register_store);
96518518
PM
6370
6371static const struct nla_policy nft_verdict_policy[NFTA_VERDICT_MAX + 1] = {
6372 [NFTA_VERDICT_CODE] = { .type = NLA_U32 },
6373 [NFTA_VERDICT_CHAIN] = { .type = NLA_STRING,
6374 .len = NFT_CHAIN_MAXNAMELEN - 1 },
6375};
6376
6377static int nft_verdict_init(const struct nft_ctx *ctx, struct nft_data *data,
6378 struct nft_data_desc *desc, const struct nlattr *nla)
6379{
664b0f8c 6380 u8 genmask = nft_genmask_next(ctx->net);
96518518
PM
6381 struct nlattr *tb[NFTA_VERDICT_MAX + 1];
6382 struct nft_chain *chain;
6383 int err;
6384
fceb6435
JB
6385 err = nla_parse_nested(tb, NFTA_VERDICT_MAX, nla, nft_verdict_policy,
6386 NULL);
96518518
PM
6387 if (err < 0)
6388 return err;
6389
6390 if (!tb[NFTA_VERDICT_CODE])
6391 return -EINVAL;
1ca2e170 6392 data->verdict.code = ntohl(nla_get_be32(tb[NFTA_VERDICT_CODE]));
96518518 6393
1ca2e170 6394 switch (data->verdict.code) {
e0abdadc 6395 default:
1ca2e170 6396 switch (data->verdict.code & NF_VERDICT_MASK) {
e0abdadc
PM
6397 case NF_ACCEPT:
6398 case NF_DROP:
6399 case NF_QUEUE:
6400 break;
6401 default:
6402 return -EINVAL;
6403 }
6404 /* fall through */
96518518
PM
6405 case NFT_CONTINUE:
6406 case NFT_BREAK:
6407 case NFT_RETURN:
96518518
PM
6408 break;
6409 case NFT_JUMP:
6410 case NFT_GOTO:
6411 if (!tb[NFTA_VERDICT_CHAIN])
6412 return -EINVAL;
6413 chain = nf_tables_chain_lookup(ctx->table,
664b0f8c 6414 tb[NFTA_VERDICT_CHAIN], genmask);
96518518
PM
6415 if (IS_ERR(chain))
6416 return PTR_ERR(chain);
f323d954 6417 if (nft_is_base_chain(chain))
96518518
PM
6418 return -EOPNOTSUPP;
6419
96518518 6420 chain->use++;
1ca2e170 6421 data->verdict.chain = chain;
96518518 6422 break;
96518518
PM
6423 }
6424
4c4ed074 6425 desc->len = sizeof(data->verdict);
96518518
PM
6426 desc->type = NFT_DATA_VERDICT;
6427 return 0;
6428}
6429
6430static void nft_verdict_uninit(const struct nft_data *data)
6431{
1ca2e170 6432 switch (data->verdict.code) {
96518518
PM
6433 case NFT_JUMP:
6434 case NFT_GOTO:
1ca2e170 6435 data->verdict.chain->use--;
96518518
PM
6436 break;
6437 }
6438}
6439
33d5a7b1 6440int nft_verdict_dump(struct sk_buff *skb, int type, const struct nft_verdict *v)
96518518
PM
6441{
6442 struct nlattr *nest;
6443
33d5a7b1 6444 nest = nla_nest_start(skb, type);
96518518
PM
6445 if (!nest)
6446 goto nla_put_failure;
6447
33d5a7b1 6448 if (nla_put_be32(skb, NFTA_VERDICT_CODE, htonl(v->code)))
96518518
PM
6449 goto nla_put_failure;
6450
33d5a7b1 6451 switch (v->code) {
96518518
PM
6452 case NFT_JUMP:
6453 case NFT_GOTO:
1ca2e170 6454 if (nla_put_string(skb, NFTA_VERDICT_CHAIN,
33d5a7b1 6455 v->chain->name))
96518518
PM
6456 goto nla_put_failure;
6457 }
6458 nla_nest_end(skb, nest);
6459 return 0;
6460
6461nla_put_failure:
6462 return -1;
6463}
6464
d0a11fc3
PM
6465static int nft_value_init(const struct nft_ctx *ctx,
6466 struct nft_data *data, unsigned int size,
96518518
PM
6467 struct nft_data_desc *desc, const struct nlattr *nla)
6468{
6469 unsigned int len;
6470
6471 len = nla_len(nla);
6472 if (len == 0)
6473 return -EINVAL;
d0a11fc3 6474 if (len > size)
96518518
PM
6475 return -EOVERFLOW;
6476
d0a11fc3 6477 nla_memcpy(data->data, nla, len);
96518518
PM
6478 desc->type = NFT_DATA_VALUE;
6479 desc->len = len;
6480 return 0;
6481}
6482
6483static int nft_value_dump(struct sk_buff *skb, const struct nft_data *data,
6484 unsigned int len)
6485{
6486 return nla_put(skb, NFTA_DATA_VALUE, len, data->data);
6487}
6488
6489static const struct nla_policy nft_data_policy[NFTA_DATA_MAX + 1] = {
d0a11fc3 6490 [NFTA_DATA_VALUE] = { .type = NLA_BINARY },
96518518
PM
6491 [NFTA_DATA_VERDICT] = { .type = NLA_NESTED },
6492};
6493
6494/**
6495 * nft_data_init - parse nf_tables data netlink attributes
6496 *
6497 * @ctx: context of the expression using the data
6498 * @data: destination struct nft_data
d0a11fc3 6499 * @size: maximum data length
96518518
PM
6500 * @desc: data description
6501 * @nla: netlink attribute containing data
6502 *
6503 * Parse the netlink data attributes and initialize a struct nft_data.
6504 * The type and length of data are returned in the data description.
6505 *
6506 * The caller can indicate that it only wants to accept data of type
6507 * NFT_DATA_VALUE by passing NULL for the ctx argument.
6508 */
d0a11fc3
PM
6509int nft_data_init(const struct nft_ctx *ctx,
6510 struct nft_data *data, unsigned int size,
96518518
PM
6511 struct nft_data_desc *desc, const struct nlattr *nla)
6512{
6513 struct nlattr *tb[NFTA_DATA_MAX + 1];
6514 int err;
6515
fceb6435 6516 err = nla_parse_nested(tb, NFTA_DATA_MAX, nla, nft_data_policy, NULL);
96518518
PM
6517 if (err < 0)
6518 return err;
6519
6520 if (tb[NFTA_DATA_VALUE])
d0a11fc3
PM
6521 return nft_value_init(ctx, data, size, desc,
6522 tb[NFTA_DATA_VALUE]);
96518518
PM
6523 if (tb[NFTA_DATA_VERDICT] && ctx != NULL)
6524 return nft_verdict_init(ctx, data, desc, tb[NFTA_DATA_VERDICT]);
6525 return -EINVAL;
6526}
6527EXPORT_SYMBOL_GPL(nft_data_init);
6528
6529/**
59105446 6530 * nft_data_release - release a nft_data item
96518518
PM
6531 *
6532 * @data: struct nft_data to release
6533 * @type: type of data
6534 *
6535 * Release a nft_data item. NFT_DATA_VALUE types can be silently discarded,
6536 * all others need to be released by calling this function.
6537 */
59105446 6538void nft_data_release(const struct nft_data *data, enum nft_data_types type)
96518518 6539{
960bd2c2 6540 if (type < NFT_DATA_VERDICT)
96518518 6541 return;
960bd2c2 6542 switch (type) {
96518518
PM
6543 case NFT_DATA_VERDICT:
6544 return nft_verdict_uninit(data);
6545 default:
6546 WARN_ON(1);
6547 }
6548}
59105446 6549EXPORT_SYMBOL_GPL(nft_data_release);
96518518
PM
6550
6551int nft_data_dump(struct sk_buff *skb, int attr, const struct nft_data *data,
6552 enum nft_data_types type, unsigned int len)
6553{
6554 struct nlattr *nest;
6555 int err;
6556
6557 nest = nla_nest_start(skb, attr);
6558 if (nest == NULL)
6559 return -1;
6560
6561 switch (type) {
6562 case NFT_DATA_VALUE:
6563 err = nft_value_dump(skb, data, len);
6564 break;
6565 case NFT_DATA_VERDICT:
33d5a7b1 6566 err = nft_verdict_dump(skb, NFTA_DATA_VERDICT, &data->verdict);
96518518
PM
6567 break;
6568 default:
6569 err = -EINVAL;
6570 WARN_ON(1);
6571 }
6572
6573 nla_nest_end(skb, nest);
6574 return err;
6575}
6576EXPORT_SYMBOL_GPL(nft_data_dump);
6577
5ebe0b0e
PNA
6578int __nft_release_basechain(struct nft_ctx *ctx)
6579{
6580 struct nft_rule *rule, *nr;
6581
f323d954 6582 BUG_ON(!nft_is_base_chain(ctx->chain));
5ebe0b0e 6583
c974a3a3 6584 nf_tables_unregister_hook(ctx->net, ctx->chain->table, ctx->chain);
5ebe0b0e
PNA
6585 list_for_each_entry_safe(rule, nr, &ctx->chain->rules, list) {
6586 list_del(&rule->list);
6587 ctx->chain->use--;
6588 nf_tables_rule_destroy(ctx, rule);
6589 }
6590 list_del(&ctx->chain->list);
6591 ctx->table->use--;
43a605f2 6592 nf_tables_chain_destroy(ctx);
5ebe0b0e
PNA
6593
6594 return 0;
6595}
6596EXPORT_SYMBOL_GPL(__nft_release_basechain);
6597
98319cb9 6598static void __nft_release_tables(struct net *net)
df05ef87 6599{
3b49e2e9 6600 struct nft_flowtable *flowtable, *nf;
df05ef87
PNA
6601 struct nft_table *table, *nt;
6602 struct nft_chain *chain, *nc;
e5009240 6603 struct nft_object *obj, *ne;
df05ef87
PNA
6604 struct nft_rule *rule, *nr;
6605 struct nft_set *set, *ns;
6606 struct nft_ctx ctx = {
6607 .net = net,
43a605f2 6608 .family = NFPROTO_NETDEV,
df05ef87
PNA
6609 };
6610
36596dad 6611 list_for_each_entry_safe(table, nt, &net->nft.tables, list) {
98319cb9 6612 ctx.family = table->family;
dd4cbef7 6613
df05ef87 6614 list_for_each_entry(chain, &table->chains, list)
c974a3a3 6615 nf_tables_unregister_hook(net, table, chain);
3b49e2e9
PNA
6616 list_for_each_entry(flowtable, &table->flowtables, list)
6617 nf_unregister_net_hooks(net, flowtable->ops,
6618 flowtable->ops_len);
df05ef87
PNA
6619 /* No packets are walking on these chains anymore. */
6620 ctx.table = table;
6621 list_for_each_entry(chain, &table->chains, list) {
6622 ctx.chain = chain;
6623 list_for_each_entry_safe(rule, nr, &chain->rules, list) {
6624 list_del(&rule->list);
6625 chain->use--;
6626 nf_tables_rule_destroy(&ctx, rule);
6627 }
6628 }
3b49e2e9
PNA
6629 list_for_each_entry_safe(flowtable, nf, &table->flowtables, list) {
6630 list_del(&flowtable->list);
6631 table->use--;
6632 nf_tables_flowtable_destroy(flowtable);
6633 }
df05ef87
PNA
6634 list_for_each_entry_safe(set, ns, &table->sets, list) {
6635 list_del(&set->list);
6636 table->use--;
6637 nft_set_destroy(set);
6638 }
e5009240
PNA
6639 list_for_each_entry_safe(obj, ne, &table->objects, list) {
6640 list_del(&obj->list);
6641 table->use--;
6642 nft_obj_destroy(obj);
6643 }
df05ef87 6644 list_for_each_entry_safe(chain, nc, &table->chains, list) {
43a605f2 6645 ctx.chain = chain;
df05ef87
PNA
6646 list_del(&chain->list);
6647 table->use--;
43a605f2 6648 nf_tables_chain_destroy(&ctx);
df05ef87
PNA
6649 }
6650 list_del(&table->list);
6651 nf_tables_table_destroy(&ctx);
6652 }
6653}
6654
dd4cbef7
PNA
6655static int __net_init nf_tables_init_net(struct net *net)
6656{
6657 INIT_LIST_HEAD(&net->nft.tables);
6658 INIT_LIST_HEAD(&net->nft.commit_list);
6659 net->nft.base_seq = 1;
6660 return 0;
6661}
6662
6663static void __net_exit nf_tables_exit_net(struct net *net)
6664{
98319cb9 6665 __nft_release_tables(net);
dd4cbef7
PNA
6666 WARN_ON_ONCE(!list_empty(&net->nft.tables));
6667 WARN_ON_ONCE(!list_empty(&net->nft.commit_list));
6668}
6669
99633ab2
PNA
6670static struct pernet_operations nf_tables_net_ops = {
6671 .init = nf_tables_init_net,
613d0776 6672 .exit = nf_tables_exit_net,
99633ab2
PNA
6673};
6674
96518518
PM
6675static int __init nf_tables_module_init(void)
6676{
6677 int err;
6678
02c7b25e
PNA
6679 nft_chain_filter_init();
6680
96518518
PM
6681 info = kmalloc(sizeof(struct nft_expr_info) * NFT_RULE_MAXEXPRS,
6682 GFP_KERNEL);
6683 if (info == NULL) {
6684 err = -ENOMEM;
6685 goto err1;
6686 }
6687
6688 err = nf_tables_core_module_init();
6689 if (err < 0)
6690 goto err2;
6691
6692 err = nfnetlink_subsys_register(&nf_tables_subsys);
6693 if (err < 0)
6694 goto err3;
6695
3b49e2e9
PNA
6696 register_netdevice_notifier(&nf_tables_flowtable_notifier);
6697
99633ab2 6698 return register_pernet_subsys(&nf_tables_net_ops);
96518518
PM
6699err3:
6700 nf_tables_core_module_exit();
6701err2:
6702 kfree(info);
6703err1:
6704 return err;
6705}
6706
6707static void __exit nf_tables_module_exit(void)
6708{
99633ab2 6709 unregister_pernet_subsys(&nf_tables_net_ops);
96518518 6710 nfnetlink_subsys_unregister(&nf_tables_subsys);
3b49e2e9 6711 unregister_netdevice_notifier(&nf_tables_flowtable_notifier);
1b1bc49c 6712 rcu_barrier();
96518518
PM
6713 nf_tables_core_module_exit();
6714 kfree(info);
02c7b25e 6715 nft_chain_filter_fini();
96518518
PM
6716}
6717
6718module_init(nf_tables_module_init);
6719module_exit(nf_tables_module_exit);
6720
6721MODULE_LICENSE("GPL");
6722MODULE_AUTHOR("Patrick McHardy <kaber@trash.net>");
6723MODULE_ALIAS_NFNL_SUBSYS(NFNL_SUBSYS_NFTABLES);