1 // SPDX-License-Identifier: GPL-2.0-only
2 /*
3 * Copyright (c) 2007-2009 Patrick McHardy <kaber@trash.net>
4 *
5 * Development of this code funded by Astaro AG (http://www.astaro.com/)
6 */
7
8 #include <linux/module.h>
9 #include <linux/init.h>
10 #include <linux/list.h>
11 #include <linux/skbuff.h>
12 #include <linux/netlink.h>
13 #include <linux/vmalloc.h>
14 #include <linux/rhashtable.h>
15 #include <linux/audit.h>
16 #include <linux/netfilter.h>
17 #include <linux/netfilter/nfnetlink.h>
18 #include <linux/netfilter/nf_tables.h>
19 #include <net/netfilter/nf_flow_table.h>
20 #include <net/netfilter/nf_tables_core.h>
21 #include <net/netfilter/nf_tables.h>
22 #include <net/netfilter/nf_tables_offload.h>
23 #include <net/net_namespace.h>
24 #include <net/sock.h>
25
/*
 * MODULE_NAME_LEN minus the size (terminating NUL included) of the string
 * "nft-expr-255-".
 * NOTE(review): presumably the room left for the variable part of an
 * autoloaded module name; the use site is not in this part of the file.
 */
#define NFT_MODULE_AUTOLOAD_LIMIT (MODULE_NAME_LEN - sizeof("nft-expr-255-"))
/* NOTE(review): presumably a length limit for anonymous set names; confirm at the use site. */
#define NFT_SET_MAX_ANONLEN 16

/*
 * limit compaction to avoid huge kmalloc/krealloc sizes.
 *
 * Number of struct nft_trans_one_elem entries that fit into 2048 bytes
 * once the struct nft_trans_elem header is accounted for; checked by
 * nft_trans_collapse_set_elem_allowed().
 */
#define NFT_MAX_SET_NELEMS ((2048 - sizeof(struct nft_trans_elem)) / sizeof(struct nft_trans_one_elem))
31
/* NOTE(review): presumably the pernet id behind nft_pernet(); its registration is not visible here. */
unsigned int nf_tables_net_id __read_mostly;

/*
 * File-scope lists and spinlocks.  Their users lie outside this part of
 * the file.
 * NOTE(review): the names suggest registries of expression/object/
 * flowtable types plus a GC work list - confirm at the use sites.
 */
static LIST_HEAD(nf_tables_expressions);
static LIST_HEAD(nf_tables_objects);
static LIST_HEAD(nf_tables_flowtables);
static LIST_HEAD(nf_tables_gc_list);
static DEFINE_SPINLOCK(nf_tables_destroy_list_lock);
static DEFINE_SPINLOCK(nf_tables_gc_list_lock);
40
/*
 * Values held in nft_table::validate_state; the permitted transitions are
 * implemented by nft_validate_state_update().
 */
enum {
	NFT_VALIDATE_SKIP	= 0,
	NFT_VALIDATE_NEED,
	NFT_VALIDATE_DO,
};
46
/* Hash list table whose nodes are struct nft_object (see nft_objname_ht_params). */
static struct rhltable nft_objname_ht;

/* Hash/compare callbacks for the chain table; defined later in the file. */
static u32 nft_chain_hash(const void *data, u32 len, u32 seed);
static u32 nft_chain_hash_obj(const void *data, u32 len, u32 seed);
static int nft_chain_hash_cmp(struct rhashtable_compare_arg *, const void *);

/* Hash/compare callbacks for the object table; defined later in the file. */
static u32 nft_objname_hash(const void *data, u32 len, u32 seed);
static u32 nft_objname_hash_obj(const void *data, u32 len, u32 seed);
static int nft_objname_hash_cmp(struct rhashtable_compare_arg *, const void *);

/*
 * rhashtable parameters for struct nft_chain: entries are linked through
 * ->rhlhead and keyed on ->name, using the custom callbacks above.
 */
static const struct rhashtable_params nft_chain_ht_params = {
	.head_offset		= offsetof(struct nft_chain, rhlhead),
	.key_offset		= offsetof(struct nft_chain, name),
	.hashfn			= nft_chain_hash,
	.obj_hashfn		= nft_chain_hash_obj,
	.obj_cmpfn		= nft_chain_hash_cmp,
	.automatic_shrinking	= true,
};

/*
 * rhashtable parameters for struct nft_object: entries are linked through
 * ->rhlhead and keyed on ->key, using the custom callbacks above.
 */
static const struct rhashtable_params nft_objname_ht_params = {
	.head_offset		= offsetof(struct nft_object, rhlhead),
	.key_offset		= offsetof(struct nft_object, key),
	.hashfn			= nft_objname_hash,
	.obj_hashfn		= nft_objname_hash_obj,
	.obj_cmpfn		= nft_objname_hash_cmp,
	.automatic_shrinking	= true,
};
74
/*
 * One audit record under construction.
 * NOTE(review): field meanings are inferred from their names (table the
 * record is about, number of entries, audit op code, list linkage); the
 * code that fills this in is outside the visible part of the file.
 */
struct nft_audit_data {
	struct nft_table *table;
	int entries;
	int op;
	struct list_head list;
};
81
/*
 * Translation table from an nf_tables netlink message type to an audit
 * operation code.  All GET requests except the two *_RESET variants, and
 * NFT_MSG_TRACE, translate to AUDIT_NFT_OP_INVALID.
 */
static const u8 nft2audit_op[NFT_MSG_MAX] = { // enum nf_tables_msg_types
	[NFT_MSG_NEWTABLE]	= AUDIT_NFT_OP_TABLE_REGISTER,
	[NFT_MSG_GETTABLE]	= AUDIT_NFT_OP_INVALID,
	[NFT_MSG_DELTABLE]	= AUDIT_NFT_OP_TABLE_UNREGISTER,
	[NFT_MSG_NEWCHAIN]	= AUDIT_NFT_OP_CHAIN_REGISTER,
	[NFT_MSG_GETCHAIN]	= AUDIT_NFT_OP_INVALID,
	[NFT_MSG_DELCHAIN]	= AUDIT_NFT_OP_CHAIN_UNREGISTER,
	[NFT_MSG_NEWRULE]	= AUDIT_NFT_OP_RULE_REGISTER,
	[NFT_MSG_GETRULE]	= AUDIT_NFT_OP_INVALID,
	[NFT_MSG_DELRULE]	= AUDIT_NFT_OP_RULE_UNREGISTER,
	[NFT_MSG_NEWSET]	= AUDIT_NFT_OP_SET_REGISTER,
	[NFT_MSG_GETSET]	= AUDIT_NFT_OP_INVALID,
	[NFT_MSG_DELSET]	= AUDIT_NFT_OP_SET_UNREGISTER,
	[NFT_MSG_NEWSETELEM]	= AUDIT_NFT_OP_SETELEM_REGISTER,
	[NFT_MSG_GETSETELEM]	= AUDIT_NFT_OP_INVALID,
	[NFT_MSG_DELSETELEM]	= AUDIT_NFT_OP_SETELEM_UNREGISTER,
	[NFT_MSG_NEWGEN]	= AUDIT_NFT_OP_GEN_REGISTER,
	[NFT_MSG_GETGEN]	= AUDIT_NFT_OP_INVALID,
	[NFT_MSG_TRACE]		= AUDIT_NFT_OP_INVALID,
	[NFT_MSG_NEWOBJ]	= AUDIT_NFT_OP_OBJ_REGISTER,
	[NFT_MSG_GETOBJ]	= AUDIT_NFT_OP_INVALID,
	[NFT_MSG_DELOBJ]	= AUDIT_NFT_OP_OBJ_UNREGISTER,
	[NFT_MSG_GETOBJ_RESET]	= AUDIT_NFT_OP_OBJ_RESET,
	[NFT_MSG_NEWFLOWTABLE]	= AUDIT_NFT_OP_FLOWTABLE_REGISTER,
	[NFT_MSG_GETFLOWTABLE]	= AUDIT_NFT_OP_INVALID,
	[NFT_MSG_DELFLOWTABLE]	= AUDIT_NFT_OP_FLOWTABLE_UNREGISTER,
	[NFT_MSG_GETSETELEM_RESET] = AUDIT_NFT_OP_SETELEM_RESET,
};
110
/*
 * Switch @table to @new_validate_state.
 *
 * A table that is already in NFT_VALIDATE_DO is never moved back to
 * NFT_VALIDATE_NEED; every other request is stored as given.  Asking for
 * NFT_VALIDATE_DO while the table is in NFT_VALIDATE_SKIP warns once but
 * the new state is still stored.
 */
static void nft_validate_state_update(struct nft_table *table, u8 new_validate_state)
{
	const u8 cur_state = table->validate_state;

	if (cur_state == NFT_VALIDATE_DO &&
	    new_validate_state == NFT_VALIDATE_NEED)
		return;

	if (cur_state == NFT_VALIDATE_SKIP)
		WARN_ON_ONCE(new_validate_state == NFT_VALIDATE_DO);

	table->validate_state = new_validate_state;
}
/* Work handlers defined later in the file. */
static void nf_tables_trans_destroy_work(struct work_struct *w);

static void nft_trans_gc_work(struct work_struct *work);
/* Work item that runs nft_trans_gc_work(). */
static DECLARE_WORK(trans_gc_work, nft_trans_gc_work);
130
/*
 * Fill in @ctx for the netlink request described by @skb / @nlh.
 *
 * @net, @family, @table, @chain and @nla are stored as passed.  The
 * sender port id comes from the skb's netlink control block; report flag,
 * message flags and sequence number come from the netlink header.  The
 * nesting level starts at 0 and the reg_inited bitmap is cleared.
 */
static void nft_ctx_init(struct nft_ctx *ctx,
			 struct net *net,
			 const struct sk_buff *skb,
			 const struct nlmsghdr *nlh,
			 u8 family,
			 struct nft_table *table,
			 struct nft_chain *chain,
			 const struct nlattr * const *nla)
{
	/* Clear all NFT_REG32_NUM bits of the reg_inited bitmap. */
	bitmap_zero(ctx->reg_inited, NFT_REG32_NUM);

	/* Objects the request operates on. */
	ctx->net	= net;
	ctx->family	= family;
	ctx->table	= table;
	ctx->chain	= chain;
	ctx->nla	= nla;
	ctx->level	= 0;

	/* Properties of the netlink message itself. */
	ctx->portid	= NETLINK_CB(skb).portid;
	ctx->seq	= nlh->nlmsg_seq;
	ctx->flags	= nlh->nlmsg_flags;
	ctx->report	= nlmsg_report(nlh);
}
153
/*
 * Allocate a zeroed transaction object of @size bytes with allocation
 * flags @gfp and initialise the common struct nft_trans header.
 *
 * @size covers the whole object; the callers in this file pass the sizeof
 * of the specific nft_trans_* structure.  net, table, seq, flags and
 * report are copied from @ctx.  The list head is initialised but the
 * transaction is not queued anywhere.
 *
 * Returns the new transaction, or NULL if the allocation failed.
 */
static struct nft_trans *nft_trans_alloc_gfp(const struct nft_ctx *ctx,
					     int msg_type, u32 size, gfp_t gfp)
{
	struct nft_trans *new_trans = kzalloc(size, gfp);

	if (!new_trans)
		return NULL;

	new_trans->msg_type = msg_type;
	INIT_LIST_HEAD(&new_trans->list);

	/* Snapshot of the request context. */
	new_trans->net		= ctx->net;
	new_trans->table	= ctx->table;
	new_trans->seq		= ctx->seq;
	new_trans->flags	= ctx->flags;
	new_trans->report	= ctx->report;

	return new_trans;
}
174
/*
 * GFP_KERNEL flavour of nft_trans_alloc_gfp(): same arguments, same
 * return value (NULL on allocation failure).
 */
static struct nft_trans *nft_trans_alloc(const struct nft_ctx *ctx,
					 int msg_type, u32 size)
{
	return nft_trans_alloc_gfp(ctx, msg_type, size, GFP_KERNEL);
}
180
nft_trans_get_binding(struct nft_trans * trans)181 static struct nft_trans_binding *nft_trans_get_binding(struct nft_trans *trans)
182 {
183 switch (trans->msg_type) {
184 case NFT_MSG_NEWCHAIN:
185 case NFT_MSG_NEWSET:
186 return container_of(trans, struct nft_trans_binding, nft_trans);
187 }
188
189 return NULL;
190 }
191
nft_trans_list_del(struct nft_trans * trans)192 static void nft_trans_list_del(struct nft_trans *trans)
193 {
194 struct nft_trans_binding *trans_binding;
195
196 list_del(&trans->list);
197
198 trans_binding = nft_trans_get_binding(trans);
199 if (trans_binding)
200 list_del(&trans_binding->binding_list);
201 }
202
/*
 * Unlink @trans (see nft_trans_list_del()) and free it.  Only the
 * transaction object itself is freed here.
 */
static void nft_trans_destroy(struct nft_trans *trans)
{
	nft_trans_list_del(trans);
	kfree(trans);
}
208
/*
 * Record @bind as the "bound" state on every pending transaction that
 * refers to the anonymous set @set.
 *
 * The commit list of @ctx->net is walked from newest to oldest; NEWSET
 * transactions for @set and NEWSETELEM transactions targeting @set are
 * updated.  Nothing is done for sets that are not anonymous.
 */
static void __nft_set_trans_bind(const struct nft_ctx *ctx, struct nft_set *set,
				 bool bind)
{
	struct nftables_pernet *nft_net;
	struct nft_trans *cur;

	if (!nft_set_is_anonymous(set))
		return;

	nft_net = nft_pernet(ctx->net);
	list_for_each_entry_reverse(cur, &nft_net->commit_list, list) {
		if (cur->msg_type == NFT_MSG_NEWSET) {
			if (nft_trans_set(cur) == set)
				nft_trans_set_bound(cur) = bind;
		} else if (cur->msg_type == NFT_MSG_NEWSETELEM) {
			if (nft_trans_elem_set(cur) == set)
				nft_trans_elem_set_bound(cur) = bind;
		}
	}
}
233
nft_set_trans_bind(const struct nft_ctx * ctx,struct nft_set * set)234 static void nft_set_trans_bind(const struct nft_ctx *ctx, struct nft_set *set)
235 {
236 return __nft_set_trans_bind(ctx, set, true);
237 }
238
nft_set_trans_unbind(const struct nft_ctx * ctx,struct nft_set * set)239 static void nft_set_trans_unbind(const struct nft_ctx *ctx, struct nft_set *set)
240 {
241 return __nft_set_trans_bind(ctx, set, false);
242 }
243
/*
 * Record @bind as the "bound" state on every pending transaction that
 * refers to the binding chain @chain.
 *
 * The commit list of @ctx->net is walked from newest to oldest; NEWCHAIN
 * transactions for @chain and NEWRULE transactions whose chain is @chain
 * are updated.  Nothing is done unless nft_chain_binding(@chain) holds.
 */
static void __nft_chain_trans_bind(const struct nft_ctx *ctx,
				   struct nft_chain *chain, bool bind)
{
	struct nftables_pernet *nft_net;
	struct nft_trans *cur;

	if (!nft_chain_binding(chain))
		return;

	nft_net = nft_pernet(ctx->net);
	list_for_each_entry_reverse(cur, &nft_net->commit_list, list) {
		if (cur->msg_type == NFT_MSG_NEWCHAIN) {
			if (nft_trans_chain(cur) == chain)
				nft_trans_chain_bound(cur) = bind;
		} else if (cur->msg_type == NFT_MSG_NEWRULE) {
			if (nft_trans_rule_chain(cur) == chain)
				nft_trans_rule_bound(cur) = bind;
		}
	}
}
268
/*
 * Mark the pending NEWCHAIN/NEWRULE transactions of the binding chain
 * @chain as bound (see __nft_chain_trans_bind()).
 */
static void nft_chain_trans_bind(const struct nft_ctx *ctx,
				 struct nft_chain *chain)
{
	__nft_chain_trans_bind(ctx, chain, true);
}
274
nf_tables_bind_chain(const struct nft_ctx * ctx,struct nft_chain * chain)275 int nf_tables_bind_chain(const struct nft_ctx *ctx, struct nft_chain *chain)
276 {
277 if (!nft_chain_binding(chain))
278 return 0;
279
280 if (nft_chain_binding(ctx->chain))
281 return -EOPNOTSUPP;
282
283 if (chain->bound)
284 return -EBUSY;
285
286 if (!nft_use_inc(&chain->use))
287 return -EMFILE;
288
289 chain->bound = true;
290 nft_chain_trans_bind(ctx, chain);
291
292 return 0;
293 }
294
/*
 * Mark the pending NEWCHAIN/NEWRULE transactions of the binding chain
 * @chain as not bound.  Only the transactions are updated; chain->bound
 * and chain->use are not touched here.
 */
void nf_tables_unbind_chain(const struct nft_ctx *ctx, struct nft_chain *chain)
{
	__nft_chain_trans_bind(ctx, chain, false);
}
299
nft_netdev_register_hooks(struct net * net,struct list_head * hook_list)300 static int nft_netdev_register_hooks(struct net *net,
301 struct list_head *hook_list)
302 {
303 struct nf_hook_ops *ops;
304 struct nft_hook *hook;
305 int err, j;
306
307 j = 0;
308 list_for_each_entry(hook, hook_list, list) {
309 list_for_each_entry(ops, &hook->ops_list, list) {
310 err = nf_register_net_hook(net, ops);
311 if (err < 0)
312 goto err_register;
313
314 j++;
315 }
316 }
317 return 0;
318
319 err_register:
320 list_for_each_entry(hook, hook_list, list) {
321 list_for_each_entry(ops, &hook->ops_list, list) {
322 if (j-- <= 0)
323 break;
324
325 nf_unregister_net_hook(net, ops);
326 }
327 }
328 return err;
329 }
330
nft_netdev_hook_free_ops(struct nft_hook * hook)331 static void nft_netdev_hook_free_ops(struct nft_hook *hook)
332 {
333 struct nf_hook_ops *ops, *next;
334
335 list_for_each_entry_safe(ops, next, &hook->ops_list, list) {
336 list_del(&ops->list);
337 kfree(ops);
338 }
339 }
340
/* Free all ops attached to @hook, then @hook itself. */
static void nft_netdev_hook_free(struct nft_hook *hook)
{
	nft_netdev_hook_free_ops(hook);
	kfree(hook);
}
346
/*
 * RCU callback: recover the nft_hook that embeds @rcu and free it with
 * nft_netdev_hook_free().
 */
static void __nft_netdev_hook_free_rcu(struct rcu_head *rcu)
{
	struct nft_hook *hook = container_of(rcu, struct nft_hook, rcu);

	nft_netdev_hook_free(hook);
}
353
/* Defer freeing of @hook (and its ops) through call_rcu(). */
static void nft_netdev_hook_free_rcu(struct nft_hook *hook)
{
	call_rcu(&hook->rcu, __nft_netdev_hook_free_rcu);
}
358
/*
 * Unregister every nf_hook_ops of every hook on @hook_list from @net.
 *
 * With @release_netdev set, each hook is additionally unlinked from
 * @hook_list and handed to nft_netdev_hook_free_rcu().
 */
static void nft_netdev_unregister_hooks(struct net *net,
					struct list_head *hook_list,
					bool release_netdev)
{
	struct nft_hook *hook, *tmp;
	struct nf_hook_ops *ops;

	/* _safe variant: the current hook may be unlinked below. */
	list_for_each_entry_safe(hook, tmp, hook_list, list) {
		list_for_each_entry(ops, &hook->ops_list, list)
			nf_unregister_net_hook(net, ops);

		if (!release_netdev)
			continue;

		list_del(&hook->list);
		nft_netdev_hook_free_rcu(hook);
	}
}
375
nf_tables_register_hook(struct net * net,const struct nft_table * table,struct nft_chain * chain)376 static int nf_tables_register_hook(struct net *net,
377 const struct nft_table *table,
378 struct nft_chain *chain)
379 {
380 struct nft_base_chain *basechain;
381 const struct nf_hook_ops *ops;
382
383 if (table->flags & NFT_TABLE_F_DORMANT ||
384 !nft_is_base_chain(chain))
385 return 0;
386
387 basechain = nft_base_chain(chain);
388 ops = &basechain->ops;
389
390 if (basechain->type->ops_register)
391 return basechain->type->ops_register(net, ops);
392
393 if (nft_base_chain_netdev(table->family, basechain->ops.hooknum))
394 return nft_netdev_register_hooks(net, &basechain->hook_list);
395
396 return nf_register_net_hook(net, &basechain->ops);
397 }
398
/*
 * Unregister the netfilter hook(s) of @chain from @net.
 *
 * Nothing is done when @table carries NFT_TABLE_F_DORMANT or @chain is not
 * a base chain.  Otherwise, in order of preference: the chain type's own
 * ops_unregister() callback, the per-device hook list when
 * nft_base_chain_netdev() says so, or the single basechain->ops.
 *
 * @release_netdev is only forwarded to nft_netdev_unregister_hooks(),
 * where it requests that the hooks are also unlinked and freed.
 */
static void __nf_tables_unregister_hook(struct net *net,
					const struct nft_table *table,
					struct nft_chain *chain,
					bool release_netdev)
{
	struct nft_base_chain *basechain;
	const struct nf_hook_ops *ops;

	if (table->flags & NFT_TABLE_F_DORMANT ||
	    !nft_is_base_chain(chain))
		return;
	basechain = nft_base_chain(chain);
	ops = &basechain->ops;

	if (basechain->type->ops_unregister) {
		/* Call, then return: no expression on a void return. */
		basechain->type->ops_unregister(net, ops);
		return;
	}

	if (nft_base_chain_netdev(table->family, basechain->ops.hooknum))
		nft_netdev_unregister_hooks(net, &basechain->hook_list,
					    release_netdev);
	else
		nf_unregister_net_hook(net, &basechain->ops);
}
422
nf_tables_unregister_hook(struct net * net,const struct nft_table * table,struct nft_chain * chain)423 static void nf_tables_unregister_hook(struct net *net,
424 const struct nft_table *table,
425 struct nft_chain *chain)
426 {
427 return __nf_tables_unregister_hook(net, table, chain, false);
428 }
429
nft_trans_collapse_set_elem_allowed(const struct nft_trans_elem * a,const struct nft_trans_elem * b)430 static bool nft_trans_collapse_set_elem_allowed(const struct nft_trans_elem *a, const struct nft_trans_elem *b)
431 {
432 /* NB: the ->bound equality check is defensive, at this time we only merge
433 * a new nft_trans_elem transaction request with the transaction tail
434 * element, but a->bound != b->bound would imply a NEWRULE transaction
435 * is queued in-between.
436 *
437 * The set check is mandatory, the NFT_MAX_SET_NELEMS check prevents
438 * huge krealloc() requests.
439 */
440 return a->set == b->set && a->bound == b->bound && a->nelems < NFT_MAX_SET_NELEMS;
441 }
442
/*
 * Try to merge the single element carried by @trans into @tail.
 *
 * @tail is grown by one slot with krealloc() (flags @gfp) and
 * @trans->elems[0] is copied into the new slot.  Because krealloc() may
 * move the object, @tail is taken off the commit list first and the
 * (possibly relocated) object is appended to the list tail again
 * afterwards; the only caller in this file passes the last commit list
 * entry as @tail.
 *
 * Returns true if the element was merged; @trans itself is left untouched
 * and remains owned by the caller.  Returns false if merging is not
 * allowed, the element count would overflow or the reallocation failed; in
 * that case @tail is still valid and queued at the tail of the commit
 * list.
 */
static bool nft_trans_collapse_set_elem(struct nftables_pernet *nft_net,
					struct nft_trans_elem *tail,
					struct nft_trans_elem *trans,
					gfp_t gfp)
{
	unsigned int nelems, old_nelems = tail->nelems;
	struct nft_trans_elem *new_trans;

	if (!nft_trans_collapse_set_elem_allowed(tail, trans))
		return false;

	/* "cannot happen", at this time userspace element add
	 * requests always allocate a new transaction element.
	 *
	 * This serves as a reminder to adjust the list_add_tail
	 * logic below in case this ever changes.
	 */
	if (WARN_ON_ONCE(trans->nelems != 1))
		return false;

	if (check_add_overflow(old_nelems, trans->nelems, &nelems))
		return false;

	/* krealloc might free tail which invalidates list pointers */
	list_del_init(&tail->nft_trans.list);

	new_trans = krealloc(tail, struct_size(tail, elems, nelems), gfp);
	if (!new_trans) {
		/* @tail was not freed: put it back where it was. */
		list_add_tail(&tail->nft_trans.list, &nft_net->commit_list);
		return false;
	}

	/*
	 * new_trans->nft_trans.list contains garbage, but
	 * list_add_tail() doesn't care.
	 */
	new_trans->nelems = nelems;
	new_trans->elems[old_nelems] = trans->elems[0];
	list_add_tail(&new_trans->nft_trans.list, &nft_net->commit_list);

	return true;
}
485
nft_trans_try_collapse(struct nftables_pernet * nft_net,struct nft_trans * trans,gfp_t gfp)486 static bool nft_trans_try_collapse(struct nftables_pernet *nft_net,
487 struct nft_trans *trans, gfp_t gfp)
488 {
489 struct nft_trans *tail;
490
491 if (list_empty(&nft_net->commit_list))
492 return false;
493
494 tail = list_last_entry(&nft_net->commit_list, struct nft_trans, list);
495
496 if (tail->msg_type != trans->msg_type)
497 return false;
498
499 switch (trans->msg_type) {
500 case NFT_MSG_NEWSETELEM:
501 case NFT_MSG_DELSETELEM:
502 return nft_trans_collapse_set_elem(nft_net,
503 nft_trans_container_elem(tail),
504 nft_trans_container_elem(trans), gfp);
505 }
506
507 return false;
508 }
509
nft_trans_commit_list_add_tail(struct net * net,struct nft_trans * trans)510 static void nft_trans_commit_list_add_tail(struct net *net, struct nft_trans *trans)
511 {
512 struct nftables_pernet *nft_net = nft_pernet(net);
513 struct nft_trans_binding *binding;
514 struct nft_trans_set *trans_set;
515
516 list_add_tail(&trans->list, &nft_net->commit_list);
517
518 binding = nft_trans_get_binding(trans);
519 if (!binding)
520 return;
521
522 switch (trans->msg_type) {
523 case NFT_MSG_NEWSET:
524 trans_set = nft_trans_container_set(trans);
525
526 if (!nft_trans_set_update(trans) &&
527 nft_set_is_anonymous(nft_trans_set(trans)))
528 list_add_tail(&binding->binding_list, &nft_net->binding_list);
529
530 list_add_tail(&trans_set->list_trans_newset, &nft_net->commit_set_list);
531 break;
532 case NFT_MSG_NEWCHAIN:
533 if (!nft_trans_chain_update(trans) &&
534 nft_chain_binding(nft_trans_chain(trans)))
535 list_add_tail(&binding->binding_list, &nft_net->binding_list);
536 break;
537 }
538 }
539
/*
 * Queue the set element transaction @trans on the commit list of @net.
 *
 * If @trans can be folded into the current tail of the commit list, its
 * element is taken over by the tail and @trans is freed; otherwise @trans
 * is appended as a new entry.  @gfp is used for the reallocation done
 * while folding.  Warns once if @trans is neither NEWSETELEM nor
 * DELSETELEM.
 */
static void nft_trans_commit_list_add_elem(struct net *net, struct nft_trans *trans,
					   gfp_t gfp)
{
	struct nftables_pernet *nft_net = nft_pernet(net);

	WARN_ON_ONCE(trans->msg_type != NFT_MSG_NEWSETELEM &&
		     trans->msg_type != NFT_MSG_DELSETELEM);

	might_alloc(gfp);

	if (!nft_trans_try_collapse(nft_net, trans, gfp)) {
		nft_trans_commit_list_add_tail(net, trans);
		return;
	}

	/* Merged into the tail entry: the standalone object is obsolete. */
	kfree(trans);
}
557
nft_trans_table_add(struct nft_ctx * ctx,int msg_type)558 static int nft_trans_table_add(struct nft_ctx *ctx, int msg_type)
559 {
560 struct nft_trans *trans;
561
562 trans = nft_trans_alloc(ctx, msg_type, sizeof(struct nft_trans_table));
563 if (trans == NULL)
564 return -ENOMEM;
565
566 if (msg_type == NFT_MSG_NEWTABLE)
567 nft_activate_next(ctx->net, ctx->table);
568
569 nft_trans_commit_list_add_tail(ctx->net, trans);
570 return 0;
571 }
572
nft_deltable(struct nft_ctx * ctx)573 static int nft_deltable(struct nft_ctx *ctx)
574 {
575 int err;
576
577 err = nft_trans_table_add(ctx, NFT_MSG_DELTABLE);
578 if (err < 0)
579 return err;
580
581 nft_deactivate_next(ctx->net, ctx->table);
582 return err;
583 }
584
585 static struct nft_trans *
nft_trans_alloc_chain(const struct nft_ctx * ctx,int msg_type)586 nft_trans_alloc_chain(const struct nft_ctx *ctx, int msg_type)
587 {
588 struct nft_trans_chain *trans_chain;
589 struct nft_trans *trans;
590
591 trans = nft_trans_alloc(ctx, msg_type, sizeof(struct nft_trans_chain));
592 if (!trans)
593 return NULL;
594
595 trans_chain = nft_trans_container_chain(trans);
596 INIT_LIST_HEAD(&trans_chain->nft_trans_binding.binding_list);
597 trans_chain->chain = ctx->chain;
598
599 return trans;
600 }
601
nft_trans_chain_add(struct nft_ctx * ctx,int msg_type)602 static struct nft_trans *nft_trans_chain_add(struct nft_ctx *ctx, int msg_type)
603 {
604 struct nft_trans *trans;
605
606 trans = nft_trans_alloc_chain(ctx, msg_type);
607 if (trans == NULL)
608 return ERR_PTR(-ENOMEM);
609
610 if (msg_type == NFT_MSG_NEWCHAIN) {
611 nft_activate_next(ctx->net, ctx->chain);
612
613 if (ctx->nla[NFTA_CHAIN_ID]) {
614 nft_trans_chain_id(trans) =
615 ntohl(nla_get_be32(ctx->nla[NFTA_CHAIN_ID]));
616 }
617 }
618 nft_trans_commit_list_add_tail(ctx->net, trans);
619
620 return trans;
621 }
622
nft_delchain(struct nft_ctx * ctx)623 static int nft_delchain(struct nft_ctx *ctx)
624 {
625 struct nft_trans *trans;
626
627 trans = nft_trans_chain_add(ctx, NFT_MSG_DELCHAIN);
628 if (IS_ERR(trans))
629 return PTR_ERR(trans);
630
631 nft_use_dec(&ctx->table->use);
632 nft_deactivate_next(ctx->net, ctx->chain);
633
634 return 0;
635 }
636
nft_rule_expr_activate(const struct nft_ctx * ctx,struct nft_rule * rule)637 void nft_rule_expr_activate(const struct nft_ctx *ctx, struct nft_rule *rule)
638 {
639 struct nft_expr *expr;
640
641 expr = nft_expr_first(rule);
642 while (nft_expr_more(rule, expr)) {
643 if (expr->ops->activate)
644 expr->ops->activate(ctx, expr);
645
646 expr = nft_expr_next(expr);
647 }
648 }
649
nft_rule_expr_deactivate(const struct nft_ctx * ctx,struct nft_rule * rule,enum nft_trans_phase phase)650 void nft_rule_expr_deactivate(const struct nft_ctx *ctx, struct nft_rule *rule,
651 enum nft_trans_phase phase)
652 {
653 struct nft_expr *expr;
654
655 expr = nft_expr_first(rule);
656 while (nft_expr_more(rule, expr)) {
657 if (expr->ops->deactivate)
658 expr->ops->deactivate(ctx, expr, phase);
659
660 expr = nft_expr_next(expr);
661 }
662 }
663
664 static int
nf_tables_delrule_deactivate(struct nft_ctx * ctx,struct nft_rule * rule)665 nf_tables_delrule_deactivate(struct nft_ctx *ctx, struct nft_rule *rule)
666 {
667 /* You cannot delete the same rule twice */
668 if (nft_is_active_next(ctx->net, rule)) {
669 nft_deactivate_next(ctx->net, rule);
670 nft_use_dec(&ctx->chain->use);
671 return 0;
672 }
673 return -ENOENT;
674 }
675
nft_trans_rule_add(struct nft_ctx * ctx,int msg_type,struct nft_rule * rule)676 static struct nft_trans *nft_trans_rule_add(struct nft_ctx *ctx, int msg_type,
677 struct nft_rule *rule)
678 {
679 struct nft_trans *trans;
680
681 trans = nft_trans_alloc(ctx, msg_type, sizeof(struct nft_trans_rule));
682 if (trans == NULL)
683 return NULL;
684
685 if (msg_type == NFT_MSG_NEWRULE && ctx->nla[NFTA_RULE_ID] != NULL) {
686 nft_trans_rule_id(trans) =
687 ntohl(nla_get_be32(ctx->nla[NFTA_RULE_ID]));
688 }
689 nft_trans_rule(trans) = rule;
690 nft_trans_rule_chain(trans) = ctx->chain;
691 nft_trans_commit_list_add_tail(ctx->net, trans);
692
693 return trans;
694 }
695
nft_delrule(struct nft_ctx * ctx,struct nft_rule * rule)696 static int nft_delrule(struct nft_ctx *ctx, struct nft_rule *rule)
697 {
698 struct nft_flow_rule *flow;
699 struct nft_trans *trans;
700 int err;
701
702 trans = nft_trans_rule_add(ctx, NFT_MSG_DELRULE, rule);
703 if (trans == NULL)
704 return -ENOMEM;
705
706 if (ctx->chain->flags & NFT_CHAIN_HW_OFFLOAD) {
707 flow = nft_flow_rule_create(ctx->net, rule);
708 if (IS_ERR(flow)) {
709 nft_trans_destroy(trans);
710 return PTR_ERR(flow);
711 }
712
713 nft_trans_flow_rule(trans) = flow;
714 }
715
716 err = nf_tables_delrule_deactivate(ctx, rule);
717 if (err < 0) {
718 nft_trans_destroy(trans);
719 return err;
720 }
721 nft_rule_expr_deactivate(ctx, rule, NFT_TRANS_PREPARE);
722
723 return 0;
724 }
725
nft_delrule_by_chain(struct nft_ctx * ctx)726 static int nft_delrule_by_chain(struct nft_ctx *ctx)
727 {
728 struct nft_rule *rule;
729 int err;
730
731 list_for_each_entry(rule, &ctx->chain->rules, list) {
732 if (!nft_is_active_next(ctx->net, rule))
733 continue;
734
735 err = nft_delrule(ctx, rule);
736 if (err < 0)
737 return err;
738 }
739 return 0;
740 }
741
__nft_trans_set_add(const struct nft_ctx * ctx,int msg_type,struct nft_set * set,const struct nft_set_desc * desc)742 static int __nft_trans_set_add(const struct nft_ctx *ctx, int msg_type,
743 struct nft_set *set,
744 const struct nft_set_desc *desc)
745 {
746 struct nft_trans_set *trans_set;
747 struct nft_trans *trans;
748
749 trans = nft_trans_alloc(ctx, msg_type, sizeof(struct nft_trans_set));
750 if (trans == NULL)
751 return -ENOMEM;
752
753 trans_set = nft_trans_container_set(trans);
754 INIT_LIST_HEAD(&trans_set->nft_trans_binding.binding_list);
755 INIT_LIST_HEAD(&trans_set->list_trans_newset);
756
757 if (msg_type == NFT_MSG_NEWSET && ctx->nla[NFTA_SET_ID] && !desc) {
758 nft_trans_set_id(trans) =
759 ntohl(nla_get_be32(ctx->nla[NFTA_SET_ID]));
760 nft_activate_next(ctx->net, set);
761 }
762 nft_trans_set(trans) = set;
763 if (desc) {
764 nft_trans_set_update(trans) = true;
765 nft_trans_set_gc_int(trans) = desc->gc_int;
766 nft_trans_set_timeout(trans) = desc->timeout;
767 nft_trans_set_size(trans) = desc->size;
768 }
769 nft_trans_commit_list_add_tail(ctx->net, trans);
770
771 return 0;
772 }
773
/*
 * Queue a set transaction that is not an update (no set descriptor).
 * Returns 0 on success or -ENOMEM.
 */
static int nft_trans_set_add(const struct nft_ctx *ctx, int msg_type,
			     struct nft_set *set)
{
	return __nft_trans_set_add(ctx, msg_type, set, NULL);
}
779
nft_mapelem_deactivate(const struct nft_ctx * ctx,struct nft_set * set,const struct nft_set_iter * iter,struct nft_elem_priv * elem_priv)780 static int nft_mapelem_deactivate(const struct nft_ctx *ctx,
781 struct nft_set *set,
782 const struct nft_set_iter *iter,
783 struct nft_elem_priv *elem_priv)
784 {
785 struct nft_set_ext *ext = nft_set_elem_ext(set, elem_priv);
786
787 if (!nft_set_elem_active(ext, iter->genmask))
788 return 0;
789
790 nft_set_elem_change_active(ctx->net, set, ext);
791 nft_setelem_data_deactivate(ctx->net, set, elem_priv);
792
793 return 0;
794 }
795
/* Entry of a set's catchall_list, wrapping one element. */
struct nft_set_elem_catchall {
	struct list_head	list;	/* linkage in nft_set::catchall_list */
	struct rcu_head		rcu;	/* NOTE(review): presumably for deferred freeing; not used in the visible code */
	struct nft_elem_priv	*elem;	/* the wrapped element */
};
801
nft_map_catchall_deactivate(const struct nft_ctx * ctx,struct nft_set * set)802 static void nft_map_catchall_deactivate(const struct nft_ctx *ctx,
803 struct nft_set *set)
804 {
805 u8 genmask = nft_genmask_next(ctx->net);
806 struct nft_set_elem_catchall *catchall;
807 struct nft_set_ext *ext;
808
809 list_for_each_entry(catchall, &set->catchall_list, list) {
810 ext = nft_set_elem_ext(set, catchall->elem);
811 if (!nft_set_elem_active(ext, genmask))
812 continue;
813
814 nft_set_elem_change_active(ctx->net, set, ext);
815 nft_setelem_data_deactivate(ctx->net, set, catchall->elem);
816 break;
817 }
818 }
819
nft_map_deactivate(const struct nft_ctx * ctx,struct nft_set * set)820 static void nft_map_deactivate(const struct nft_ctx *ctx, struct nft_set *set)
821 {
822 struct nft_set_iter iter = {
823 .genmask = nft_genmask_next(ctx->net),
824 .type = NFT_ITER_UPDATE,
825 .fn = nft_mapelem_deactivate,
826 };
827
828 set->ops->walk(ctx, set, &iter);
829 WARN_ON_ONCE(iter.err);
830
831 nft_map_catchall_deactivate(ctx, set);
832 }
833
nft_delset(const struct nft_ctx * ctx,struct nft_set * set)834 static int nft_delset(const struct nft_ctx *ctx, struct nft_set *set)
835 {
836 int err;
837
838 err = nft_trans_set_add(ctx, NFT_MSG_DELSET, set);
839 if (err < 0)
840 return err;
841
842 if (set->flags & (NFT_SET_MAP | NFT_SET_OBJECT))
843 nft_map_deactivate(ctx, set);
844
845 nft_deactivate_next(ctx->net, set);
846 nft_use_dec(&ctx->table->use);
847
848 return err;
849 }
850
nft_trans_obj_add(struct nft_ctx * ctx,int msg_type,struct nft_object * obj)851 static int nft_trans_obj_add(struct nft_ctx *ctx, int msg_type,
852 struct nft_object *obj)
853 {
854 struct nft_trans *trans;
855
856 trans = nft_trans_alloc(ctx, msg_type, sizeof(struct nft_trans_obj));
857 if (trans == NULL)
858 return -ENOMEM;
859
860 if (msg_type == NFT_MSG_NEWOBJ)
861 nft_activate_next(ctx->net, obj);
862
863 nft_trans_obj(trans) = obj;
864 nft_trans_commit_list_add_tail(ctx->net, trans);
865
866 return 0;
867 }
868
nft_delobj(struct nft_ctx * ctx,struct nft_object * obj)869 static int nft_delobj(struct nft_ctx *ctx, struct nft_object *obj)
870 {
871 int err;
872
873 err = nft_trans_obj_add(ctx, NFT_MSG_DELOBJ, obj);
874 if (err < 0)
875 return err;
876
877 nft_deactivate_next(ctx->net, obj);
878 nft_use_dec(&ctx->table->use);
879
880 return err;
881 }
882
883 static struct nft_trans *
nft_trans_flowtable_add(struct nft_ctx * ctx,int msg_type,struct nft_flowtable * flowtable)884 nft_trans_flowtable_add(struct nft_ctx *ctx, int msg_type,
885 struct nft_flowtable *flowtable)
886 {
887 struct nft_trans *trans;
888
889 trans = nft_trans_alloc(ctx, msg_type,
890 sizeof(struct nft_trans_flowtable));
891 if (trans == NULL)
892 return ERR_PTR(-ENOMEM);
893
894 if (msg_type == NFT_MSG_NEWFLOWTABLE)
895 nft_activate_next(ctx->net, flowtable);
896
897 INIT_LIST_HEAD(&nft_trans_flowtable_hooks(trans));
898 nft_trans_flowtable(trans) = flowtable;
899 nft_trans_commit_list_add_tail(ctx->net, trans);
900
901 return trans;
902 }
903
nft_delflowtable(struct nft_ctx * ctx,struct nft_flowtable * flowtable)904 static int nft_delflowtable(struct nft_ctx *ctx,
905 struct nft_flowtable *flowtable)
906 {
907 struct nft_trans *trans;
908
909 trans = nft_trans_flowtable_add(ctx, NFT_MSG_DELFLOWTABLE, flowtable);
910 if (IS_ERR(trans))
911 return PTR_ERR(trans);
912
913 nft_deactivate_next(ctx->net, flowtable);
914 nft_use_dec(&ctx->table->use);
915
916 return 0;
917 }
918
/*
 * Cancel tracking of the registers in front of @dreg that belong to the
 * same tracked entry: with n = track->regs[dreg].num_reg, registers
 * @dreg - n through @dreg - 1 are cancelled.  @dreg itself is not touched.
 */
static void __nft_reg_track_clobber(struct nft_regs_track *track, u8 dreg)
{
	int back = track->regs[dreg].num_reg;

	while (back > 0) {
		__nft_reg_track_cancel(track, dreg - back);
		back--;
	}
}
926
/*
 * Record @expr as the selector of register @dreg, clear any tracked
 * bitwise expression and store @num_reg for that register.
 */
static void __nft_reg_track_update(struct nft_regs_track *track,
				   const struct nft_expr *expr,
				   u8 dreg, u8 num_reg)
{
	track->regs[dreg].selector = expr;
	track->regs[dreg].bitwise = NULL;
	track->regs[dreg].num_reg = num_reg;
}
935
/*
 * Track @expr as the selector of the registers covering @len bytes
 * starting at @dreg.
 *
 * Registers in front of @dreg that belong to the entry @dreg was part of
 * are cancelled first.  Each covered register then stores its offset from
 * the first register as num_reg (0 for @dreg, 1 for the next, ...).
 */
void nft_reg_track_update(struct nft_regs_track *track,
			  const struct nft_expr *expr, u8 dreg, u8 len)
{
	unsigned int regcount = DIV_ROUND_UP(len, NFT_REG32_SIZE);
	int i;

	__nft_reg_track_clobber(track, dreg);

	for (i = 0; i < regcount; i++)
		__nft_reg_track_update(track, expr, dreg + i, i);
}
EXPORT_SYMBOL_GPL(nft_reg_track_update);
949
/*
 * Cancel tracking of the registers covering @len bytes starting at @dreg,
 * after cancelling the registers in front of @dreg that belong to the
 * entry @dreg was part of.
 */
void nft_reg_track_cancel(struct nft_regs_track *track, u8 dreg, u8 len)
{
	unsigned int regcount = DIV_ROUND_UP(len, NFT_REG32_SIZE);
	int i;

	__nft_reg_track_clobber(track, dreg);

	for (i = 0; i < regcount; i++)
		__nft_reg_track_cancel(track, dreg + i);
}
EXPORT_SYMBOL_GPL(nft_reg_track_cancel);
962
/* Reset the tracking state of the single register @dreg. */
void __nft_reg_track_cancel(struct nft_regs_track *track, u8 dreg)
{
	track->regs[dreg].selector = NULL;
	track->regs[dreg].bitwise = NULL;
	track->regs[dreg].num_reg = 0;
}
EXPORT_SYMBOL_GPL(__nft_reg_track_cancel);
970
971 /*
972 * Tables
973 */
974
/*
 * Find the table in @net whose name matches @nla, whose family is @family
 * and which is active in @genmask.
 *
 * The table list is walked with the RCU list iterator; holding the pernet
 * commit_mutex satisfies its lockdep condition.
 *
 * Returns the table, or ERR_PTR():
 *   -EINVAL  @nla is NULL
 *   -EPERM   the matching table has an owner, @nlpid is non-zero and is
 *            not the table's nlpid
 *   -ENOENT  no table matched
 */
static struct nft_table *nft_table_lookup(const struct net *net,
					  const struct nlattr *nla,
					  u8 family, u8 genmask, u32 nlpid)
{
	struct nftables_pernet *nft_net;
	struct nft_table *table;

	if (!nla)
		return ERR_PTR(-EINVAL);

	nft_net = nft_pernet(net);
	list_for_each_entry_rcu(table, &nft_net->tables, list,
				lockdep_is_held(&nft_net->commit_mutex)) {
		if (nla_strcmp(nla, table->name) != 0)
			continue;
		if (table->family != family)
			continue;
		if (!nft_active_genmask(table, genmask))
			continue;

		/* First match decides: either usable or owned by someone else. */
		if (nft_table_has_owner(table) &&
		    nlpid && table->nlpid != nlpid)
			return ERR_PTR(-EPERM);

		return table;
	}

	return ERR_PTR(-ENOENT);
}
1001
/*
 * Find the table in @net whose handle equals the big-endian 64-bit value
 * carried by @nla, whose family is @family and which is active in
 * @genmask.
 *
 * @nla is dereferenced without a NULL check.  The table list is walked
 * with the plain (non-RCU) iterator.
 *
 * Returns the table, or ERR_PTR():
 *   -EPERM   the matching table has an owner, @nlpid is non-zero and is
 *            not the table's nlpid
 *   -ENOENT  no table matched
 */
static struct nft_table *nft_table_lookup_byhandle(const struct net *net,
						   const struct nlattr *nla,
						   int family, u8 genmask, u32 nlpid)
{
	struct nftables_pernet *nft_net = nft_pernet(net);
	struct nft_table *table;

	list_for_each_entry(table, &nft_net->tables, list) {
		if (be64_to_cpu(nla_get_be64(nla)) != table->handle)
			continue;
		if (table->family != family)
			continue;
		if (!nft_active_genmask(table, genmask))
			continue;

		/* First match decides: either usable or owned by someone else. */
		if (nft_table_has_owner(table) &&
		    nlpid && table->nlpid != nlpid)
			return ERR_PTR(-EPERM);

		return table;
	}

	return ERR_PTR(-ENOENT);
}
1024
nf_tables_alloc_handle(struct nft_table * table)1025 static inline u64 nf_tables_alloc_handle(struct nft_table *table)
1026 {
1027 return ++table->hgenerator;
1028 }
1029
/* Registered chain types, indexed by protocol family, then by chain type. */
static const struct nft_chain_type *chain_type[NFPROTO_NUMPROTO][NFT_CHAIN_T_MAX];
1031
1032 static const struct nft_chain_type *
__nft_chain_type_get(u8 family,enum nft_chain_types type)1033 __nft_chain_type_get(u8 family, enum nft_chain_types type)
1034 {
1035 if (family >= NFPROTO_NUMPROTO ||
1036 type >= NFT_CHAIN_T_MAX)
1037 return NULL;
1038
1039 return chain_type[family][type];
1040 }
1041
1042 static const struct nft_chain_type *
__nf_tables_chain_type_lookup(const struct nlattr * nla,u8 family)1043 __nf_tables_chain_type_lookup(const struct nlattr *nla, u8 family)
1044 {
1045 const struct nft_chain_type *type;
1046 int i;
1047
1048 for (i = 0; i < NFT_CHAIN_T_MAX; i++) {
1049 type = __nft_chain_type_get(family, i);
1050 if (!type)
1051 continue;
1052 if (!nla_strcmp(nla, type->name))
1053 return type;
1054 }
1055 return NULL;
1056 }
1057
/* One module autoload request, queued on the per-netns module_list. */
struct nft_module_request {
	struct list_head	list;	/* entry in nftables_pernet->module_list */
	char			module[MODULE_NAME_LEN];	/* formatted module name */
	bool			done;	/* false when queued; nft_request_module() returns 0 once true */
};
1063
#ifdef CONFIG_MODULES
/**
 * nft_request_module - queue a module autoload request for this netns
 * @net: network namespace whose module_list receives the request
 * @fmt: printf-style format producing the module name
 *
 * Returns 0 when the formatted name does not fit in MODULE_NAME_LEN or
 * when a request for that name is already marked done, -EAGAIN when a
 * request for that name is pending or has just been queued, and -ENOMEM
 * when the request cannot be allocated.
 */
__printf(2, 3) int nft_request_module(struct net *net, const char *fmt,
				      ...)
{
	char module_name[MODULE_NAME_LEN];
	struct nftables_pernet *nft_net;
	struct nft_module_request *req;
	va_list ap;
	int n;

	va_start(ap, fmt);
	n = vsnprintf(module_name, sizeof(module_name), fmt, ap);
	va_end(ap);

	/* A name that would have been truncated is never queued. */
	if (n >= MODULE_NAME_LEN)
		return 0;

	nft_net = nft_pernet(net);
	list_for_each_entry(req, &nft_net->module_list, list) {
		if (strcmp(req->module, module_name) != 0)
			continue;

		/* A request to load this module already exists. */
		return req->done ? 0 : -EAGAIN;
	}

	req = kmalloc(sizeof(*req), GFP_KERNEL);
	if (!req)
		return -ENOMEM;

	req->done = false;
	strscpy(req->module, module_name, sizeof(req->module));
	list_add_tail(&req->list, &nft_net->module_list);

	return -EAGAIN;
}
EXPORT_SYMBOL_GPL(nft_request_module);
#endif
1103
/*
 * With CONFIG_PROVE_LOCKING and lock debugging active, warn once if the
 * nftables nfnetlink subsystem mutex is held.  Does nothing otherwise.
 */
static void lockdep_nfnl_nft_mutex_not_held(void)
{
#ifdef CONFIG_PROVE_LOCKING
	WARN_ON_ONCE(debug_locks &&
		     lockdep_nfnl_is_held(NFNL_SUBSYS_NFTABLES));
#endif
}
1111
1112 static const struct nft_chain_type *
nf_tables_chain_type_lookup(struct net * net,const struct nlattr * nla,u8 family,bool autoload)1113 nf_tables_chain_type_lookup(struct net *net, const struct nlattr *nla,
1114 u8 family, bool autoload)
1115 {
1116 const struct nft_chain_type *type;
1117
1118 type = __nf_tables_chain_type_lookup(nla, family);
1119 if (type != NULL)
1120 return type;
1121
1122 lockdep_nfnl_nft_mutex_not_held();
1123 #ifdef CONFIG_MODULES
1124 if (autoload) {
1125 if (nft_request_module(net, "nft-chain-%u-%.*s", family,
1126 nla_len(nla),
1127 (const char *)nla_data(nla)) == -EAGAIN)
1128 return ERR_PTR(-EAGAIN);
1129 }
1130 #endif
1131 return ERR_PTR(-ENOENT);
1132 }
1133
nft_base_seq(const struct net * net)1134 static __be16 nft_base_seq(const struct net *net)
1135 {
1136 struct nftables_pernet *nft_net = nft_pernet(net);
1137
1138 return htons(nft_net->base_seq & 0xffff);
1139 }
1140
/*
 * Netlink attribute policy for NFTA_TABLE_* attributes: expected type of
 * each attribute and, for the string/binary ones, the maximum length.
 */
static const struct nla_policy nft_table_policy[NFTA_TABLE_MAX + 1] = {
	[NFTA_TABLE_NAME]	= { .type = NLA_STRING,
				    .len = NFT_TABLE_MAXNAMELEN - 1 },
	[NFTA_TABLE_FLAGS]	= { .type = NLA_U32 },
	[NFTA_TABLE_HANDLE]	= { .type = NLA_U64 },
	[NFTA_TABLE_USERDATA]	= { .type = NLA_BINARY,
				    .len = NFT_USERDATA_MAXLEN }
};
1149
/*
 * Append one table message for @event to @skb.
 *
 * Name, use count and handle are always emitted.  For NFT_MSG_DELTABLE and
 * NFT_MSG_DESTROYTABLE the message ends there; for any other event the
 * flags (masked with NFT_TABLE_F_MASK), the owner port id (owned tables
 * only) and the user data (if present) follow.
 *
 * Returns 0 on success.  On failure the partial message is trimmed from
 * @skb and -1 is returned.
 */
static int nf_tables_fill_table_info(struct sk_buff *skb, struct net *net,
				     u32 portid, u32 seq, int event, u32 flags,
				     int family, const struct nft_table *table)
{
	struct nlmsghdr *nlh;

	nlh = nfnl_msg_put(skb, portid, seq,
			   nfnl_msg_type(NFNL_SUBSYS_NFTABLES, event),
			   flags, family, NFNETLINK_V0, nft_base_seq(net));
	if (!nlh)
		goto nla_put_failure;

	if (nla_put_string(skb, NFTA_TABLE_NAME, table->name))
		goto nla_put_failure;
	if (nla_put_be32(skb, NFTA_TABLE_USE, htonl(table->use)))
		goto nla_put_failure;
	if (nla_put_be64(skb, NFTA_TABLE_HANDLE, cpu_to_be64(table->handle),
			 NFTA_TABLE_PAD))
		goto nla_put_failure;

	/* Deletion events carry only the identifying attributes above. */
	if (event != NFT_MSG_DELTABLE && event != NFT_MSG_DESTROYTABLE) {
		if (nla_put_be32(skb, NFTA_TABLE_FLAGS,
				 htonl(table->flags & NFT_TABLE_F_MASK)))
			goto nla_put_failure;

		if (nft_table_has_owner(table) &&
		    nla_put_be32(skb, NFTA_TABLE_OWNER, htonl(table->nlpid)))
			goto nla_put_failure;

		if (table->udata &&
		    nla_put(skb, NFTA_TABLE_USERDATA, table->udlen,
			    table->udata))
			goto nla_put_failure;
	}

	nlmsg_end(skb, nlh);
	return 0;

nla_put_failure:
	nlmsg_trim(skb, nlh);
	return -1;
}
1194
/* Per-notification state kept in the control buffer (cb) of a queued skb. */
struct nftnl_skb_parms {
	bool report;	/* value of the 'report' argument given to nft_notify_enqueue() */
};
/* Access the nftnl_skb_parms overlaid on skb->cb. */
#define NFT_CB(skb)	(*(struct nftnl_skb_parms*)&((skb)->cb))
1199
/* Record @report in the skb control buffer and append @skb to @notify_list. */
static void nft_notify_enqueue(struct sk_buff *skb, bool report,
			       struct list_head *notify_list)
{
	struct nftnl_skb_parms *parms = &NFT_CB(skb);

	parms->report = report;
	list_add_tail(&skb->list, notify_list);
}
1206
nf_tables_table_notify(const struct nft_ctx * ctx,int event)1207 static void nf_tables_table_notify(const struct nft_ctx *ctx, int event)
1208 {
1209 struct nftables_pernet *nft_net;
1210 struct sk_buff *skb;
1211 u16 flags = 0;
1212 int err;
1213
1214 if (!ctx->report &&
1215 !nfnetlink_has_listeners(ctx->net, NFNLGRP_NFTABLES))
1216 return;
1217
1218 skb = nlmsg_new(NLMSG_GOODSIZE, GFP_KERNEL);
1219 if (skb == NULL)
1220 goto err;
1221
1222 if (ctx->flags & (NLM_F_CREATE | NLM_F_EXCL))
1223 flags |= ctx->flags & (NLM_F_CREATE | NLM_F_EXCL);
1224
1225 err = nf_tables_fill_table_info(skb, ctx->net, ctx->portid, ctx->seq,
1226 event, flags, ctx->family, ctx->table);
1227 if (err < 0) {
1228 kfree_skb(skb);
1229 goto err;
1230 }
1231
1232 nft_net = nft_pernet(ctx->net);
1233 nft_notify_enqueue(skb, ctx->report, &nft_net->notify_list);
1234 return;
1235 err:
1236 nfnetlink_set_err(ctx->net, ctx->portid, NFNLGRP_NFTABLES, -ENOBUFS);
1237 }
1238
/*
 * Netlink dump callback: emit one NFT_MSG_NEWTABLE message per active
 * table, restricted to the family in the request header unless that is
 * NFPROTO_UNSPEC.
 *
 * cb->args[0] holds the index of the next table to emit and is updated
 * before returning so that a later call resumes from there.
 * Returns skb->len.
 */
static int nf_tables_dump_tables(struct sk_buff *skb,
				 struct netlink_callback *cb)
{
	const struct nfgenmsg *nfmsg = nlmsg_data(cb->nlh);
	struct nftables_pernet *nft_net;
	const struct nft_table *table;
	unsigned int idx = 0, s_idx = cb->args[0];
	struct net *net = sock_net(skb->sk);
	int family = nfmsg->nfgen_family;

	rcu_read_lock();
	nft_net = nft_pernet(net);
	/* presumably consumed by nl_dump_check_consistent() below */
	cb->seq = READ_ONCE(nft_net->base_seq);

	list_for_each_entry_rcu(table, &nft_net->tables, list) {
		/* Tables of other families are not counted in idx. */
		if (family != NFPROTO_UNSPEC && family != table->family)
			continue;

		/* Already emitted by an earlier call: count it and move on. */
		if (idx < s_idx)
			goto cont;
		/* Past the resume point: clear all cb->args[] slots after [0]. */
		if (idx > s_idx)
			memset(&cb->args[1], 0,
			       sizeof(cb->args) - sizeof(cb->args[0]));
		/* 'continue' bypasses the idx++ at 'cont'. */
		if (!nft_is_active(net, table))
			continue;
		/* Fill failed: stop, leaving idx at this table. */
		if (nf_tables_fill_table_info(skb, net,
					      NETLINK_CB(cb->skb).portid,
					      cb->nlh->nlmsg_seq,
					      NFT_MSG_NEWTABLE, NLM_F_MULTI,
					      table->family, table) < 0)
			goto done;

		nl_dump_check_consistent(cb, nlmsg_hdr(skb));
cont:
		idx++;
	}
done:
	rcu_read_unlock();
	cb->args[0] = idx;
	return skb->len;
}
1280
nft_netlink_dump_start_rcu(struct sock * nlsk,struct sk_buff * skb,const struct nlmsghdr * nlh,struct netlink_dump_control * c)1281 static int nft_netlink_dump_start_rcu(struct sock *nlsk, struct sk_buff *skb,
1282 const struct nlmsghdr *nlh,
1283 struct netlink_dump_control *c)
1284 {
1285 int err;
1286
1287 if (!try_module_get(THIS_MODULE))
1288 return -EINVAL;
1289
1290 rcu_read_unlock();
1291 err = netlink_dump_start(nlsk, skb, nlh, c);
1292 rcu_read_lock();
1293 module_put(THIS_MODULE);
1294
1295 return err;
1296 }
1297
1298 /* called with rcu_read_lock held */
nf_tables_gettable(struct sk_buff * skb,const struct nfnl_info * info,const struct nlattr * const nla[])1299 static int nf_tables_gettable(struct sk_buff *skb, const struct nfnl_info *info,
1300 const struct nlattr * const nla[])
1301 {
1302 struct netlink_ext_ack *extack = info->extack;
1303 u8 genmask = nft_genmask_cur(info->net);
1304 u8 family = info->nfmsg->nfgen_family;
1305 const struct nft_table *table;
1306 struct net *net = info->net;
1307 struct sk_buff *skb2;
1308 int err;
1309
1310 if (info->nlh->nlmsg_flags & NLM_F_DUMP) {
1311 struct netlink_dump_control c = {
1312 .dump = nf_tables_dump_tables,
1313 .module = THIS_MODULE,
1314 };
1315
1316 return nft_netlink_dump_start_rcu(info->sk, skb, info->nlh, &c);
1317 }
1318
1319 table = nft_table_lookup(net, nla[NFTA_TABLE_NAME], family, genmask, 0);
1320 if (IS_ERR(table)) {
1321 NL_SET_BAD_ATTR(extack, nla[NFTA_TABLE_NAME]);
1322 return PTR_ERR(table);
1323 }
1324
1325 skb2 = alloc_skb(NLMSG_GOODSIZE, GFP_ATOMIC);
1326 if (!skb2)
1327 return -ENOMEM;
1328
1329 err = nf_tables_fill_table_info(skb2, net, NETLINK_CB(skb).portid,
1330 info->nlh->nlmsg_seq, NFT_MSG_NEWTABLE,
1331 0, family, table);
1332 if (err < 0)
1333 goto err_fill_table_info;
1334
1335 return nfnetlink_unicast(skb2, net, NETLINK_CB(skb).portid);
1336
1337 err_fill_table_info:
1338 kfree_skb(skb2);
1339 return err;
1340 }
1341
/*
 * Unregister the hooks of the base chains of @table that are active in
 * the next generation.  A non-zero @cnt limits the work to the first @cnt
 * such chains; zero means no limit.
 */
static void nft_table_disable(struct net *net, struct nft_table *table, u32 cnt)
{
	struct nft_chain *chain;
	u32 handled = 0;

	list_for_each_entry(chain, &table->chains, list) {
		if (!nft_is_active_next(net, chain) ||
		    !nft_is_base_chain(chain))
			continue;

		if (cnt) {
			if (handled == cnt)
				break;
			handled++;
		}

		nf_tables_unregister_hook(net, table, chain);
	}
}
1359
nf_tables_table_enable(struct net * net,struct nft_table * table)1360 static int nf_tables_table_enable(struct net *net, struct nft_table *table)
1361 {
1362 struct nft_chain *chain;
1363 int err, i = 0;
1364
1365 list_for_each_entry(chain, &table->chains, list) {
1366 if (!nft_is_active_next(net, chain))
1367 continue;
1368 if (!nft_is_base_chain(chain))
1369 continue;
1370
1371 err = nf_tables_register_hook(net, table, chain);
1372 if (err < 0)
1373 goto err_register_hooks;
1374
1375 i++;
1376 }
1377 return 0;
1378
1379 err_register_hooks:
1380 if (i)
1381 nft_table_disable(net, table, i);
1382 return err;
1383 }
1384
/*
 * Unregister the hooks of all next-generation-active base chains of
 * @table (no count limit) and leave the table flagged dormant.
 */
static void nf_tables_table_disable(struct net *net, struct nft_table *table)
{
	/*
	 * NOTE(review): the dormant flag is cleared for the duration of the
	 * call, presumably because the unregister path skips dormant tables
	 * -- confirm against nf_tables_unregister_hook().
	 */
	table->flags &= ~NFT_TABLE_F_DORMANT;
	nft_table_disable(net, table, 0);
	table->flags |= NFT_TABLE_F_DORMANT;
}
1391
/*
 * Internal table flags, placed in the bits starting at NFT_TABLE_F_MASK + 1
 * (assumes NFT_TABLE_F_MASK is a run of low bits -- TODO confirm).
 * nf_tables_updtable() sets them to record what a pending update changed:
 *   WAS_DORMANT - the update cleared NFT_TABLE_F_DORMANT
 *   WAS_AWAKEN  - the update set NFT_TABLE_F_DORMANT
 *   WAS_ORPHAN  - the update assigned an owner to the table
 * __NFT_TABLE_F_UPDATE is the union of the three.
 */
#define __NFT_TABLE_F_INTERNAL		(NFT_TABLE_F_MASK + 1)
#define __NFT_TABLE_F_WAS_DORMANT	(__NFT_TABLE_F_INTERNAL << 0)
#define __NFT_TABLE_F_WAS_AWAKEN	(__NFT_TABLE_F_INTERNAL << 1)
#define __NFT_TABLE_F_WAS_ORPHAN	(__NFT_TABLE_F_INTERNAL << 2)
#define __NFT_TABLE_F_UPDATE		(__NFT_TABLE_F_WAS_DORMANT | \
					 __NFT_TABLE_F_WAS_AWAKEN | \
					 __NFT_TABLE_F_WAS_ORPHAN)
1399
nft_table_pending_update(const struct nft_ctx * ctx)1400 static bool nft_table_pending_update(const struct nft_ctx *ctx)
1401 {
1402 struct nftables_pernet *nft_net = nft_pernet(ctx->net);
1403 struct nft_trans *trans;
1404
1405 if (ctx->table->flags & __NFT_TABLE_F_UPDATE)
1406 return true;
1407
1408 list_for_each_entry(trans, &nft_net->commit_list, list) {
1409 if (trans->table == ctx->table &&
1410 ((trans->msg_type == NFT_MSG_NEWCHAIN &&
1411 nft_trans_chain_update(trans)) ||
1412 (trans->msg_type == NFT_MSG_DELCHAIN &&
1413 nft_is_base_chain(nft_trans_chain(trans)))))
1414 return true;
1415 }
1416
1417 return false;
1418 }
1419
/*
 * Apply a flags update to an existing table (ctx->table) and queue the
 * corresponding NFT_MSG_NEWTABLE transaction.
 *
 * Returns 0 on success or when there is nothing to change, -EOPNOTSUPP
 * for unsupported flags or flag transitions, -EINVAL when another update
 * affecting the table is already pending, -ENOMEM when the transaction
 * cannot be allocated, or the error from enabling the table's hooks.
 */
static int nf_tables_updtable(struct nft_ctx *ctx)
{
	struct nft_trans *trans;
	u32 flags;
	int ret;

	/* No flags attribute: nothing to update. */
	if (!ctx->nla[NFTA_TABLE_FLAGS])
		return 0;

	flags = ntohl(nla_get_be32(ctx->nla[NFTA_TABLE_FLAGS]));
	if (flags & ~NFT_TABLE_F_MASK)
		return -EOPNOTSUPP;

	/* Requested flags equal the current ones. */
	if (flags == (ctx->table->flags & NFT_TABLE_F_MASK))
		return 0;

	/*
	 * Ownership cannot be dropped from an owned table, and can only be
	 * requested for a table that nft_table_is_orphan() accepts.
	 */
	if ((nft_table_has_owner(ctx->table) &&
	     !(flags & NFT_TABLE_F_OWNER)) ||
	    (flags & NFT_TABLE_F_OWNER &&
	     !nft_table_is_orphan(ctx->table)))
		return -EOPNOTSUPP;

	/* The persist flag cannot be toggled by an update. */
	if ((flags ^ ctx->table->flags) & NFT_TABLE_F_PERSIST)
		return -EOPNOTSUPP;

	/* No dormant off/on/off/on games in single transaction */
	if (nft_table_pending_update(ctx))
		return -EINVAL;

	trans = nft_trans_alloc(ctx, NFT_MSG_NEWTABLE,
				sizeof(struct nft_trans_table));
	if (trans == NULL)
		return -ENOMEM;

	if ((flags & NFT_TABLE_F_DORMANT) &&
	    !(ctx->table->flags & NFT_TABLE_F_DORMANT)) {
		/* active -> dormant: only flags change here, no hook is touched */
		ctx->table->flags |= NFT_TABLE_F_DORMANT;
		if (!(ctx->table->flags & __NFT_TABLE_F_UPDATE))
			ctx->table->flags |= __NFT_TABLE_F_WAS_AWAKEN;
	} else if (!(flags & NFT_TABLE_F_DORMANT) &&
		   ctx->table->flags & NFT_TABLE_F_DORMANT) {
		/* dormant -> active: hooks are registered right away */
		ctx->table->flags &= ~NFT_TABLE_F_DORMANT;
		if (!(ctx->table->flags & __NFT_TABLE_F_UPDATE)) {
			ret = nf_tables_table_enable(ctx->net, ctx->table);
			if (ret < 0)
				goto err_register_hooks;

			ctx->table->flags |= __NFT_TABLE_F_WAS_DORMANT;
		}
	}

	/* Take ownership on behalf of the requesting netlink port. */
	if ((flags & NFT_TABLE_F_OWNER) &&
	    !nft_table_has_owner(ctx->table)) {
		ctx->table->nlpid = ctx->portid;
		ctx->table->flags |= NFT_TABLE_F_OWNER |
				     __NFT_TABLE_F_WAS_ORPHAN;
	}

	nft_trans_table_update(trans) = true;
	nft_trans_commit_list_add_tail(ctx->net, trans);

	return 0;

err_register_hooks:
	/* Enabling failed: restore the dormant flag and drop the transaction. */
	ctx->table->flags |= NFT_TABLE_F_DORMANT;
	nft_trans_destroy(trans);
	return ret;
}
1488
/* Hash a NUL-terminated chain name; @len is ignored. */
static u32 nft_chain_hash(const void *data, u32 len, u32 seed)
{
	const char *chain_name = data;
	size_t name_len = strlen(chain_name);

	return jhash(chain_name, name_len, seed);
}
1495
/* Hash a struct nft_chain by its name, exactly as nft_chain_hash() would. */
static u32 nft_chain_hash_obj(const void *data, u32 len, u32 seed)
{
	return nft_chain_hash(((const struct nft_chain *)data)->name, 0, seed);
}
1502
nft_chain_hash_cmp(struct rhashtable_compare_arg * arg,const void * ptr)1503 static int nft_chain_hash_cmp(struct rhashtable_compare_arg *arg,
1504 const void *ptr)
1505 {
1506 const struct nft_chain *chain = ptr;
1507 const char *name = arg->key;
1508
1509 return strcmp(chain->name, name);
1510 }
1511
/*
 * Hash an object key: the table pointer is folded into the seed and the
 * NUL-terminated object name is hashed with the result.  @len is ignored.
 */
static u32 nft_objname_hash(const void *data, u32 len, u32 seed)
{
	const struct nft_object_hash_key *key = data;
	u32 mixed_seed = seed ^ hash_ptr(key->table, 32);

	return jhash(key->name, strlen(key->name), mixed_seed);
}
1520
/* Hash a struct nft_object by its embedded key. */
static u32 nft_objname_hash_obj(const void *data, u32 len, u32 seed)
{
	return nft_objname_hash(&((const struct nft_object *)data)->key, 0,
				seed);
}
1527
nft_objname_hash_cmp(struct rhashtable_compare_arg * arg,const void * ptr)1528 static int nft_objname_hash_cmp(struct rhashtable_compare_arg *arg,
1529 const void *ptr)
1530 {
1531 const struct nft_object_hash_key *k = arg->key;
1532 const struct nft_object *obj = ptr;
1533
1534 if (obj->key.table != k->table)
1535 return -1;
1536
1537 return strcmp(obj->key.name, k->name);
1538 }
1539
nft_supported_family(u8 family)1540 static bool nft_supported_family(u8 family)
1541 {
1542 return false
1543 #ifdef CONFIG_NF_TABLES_INET
1544 || family == NFPROTO_INET
1545 #endif
1546 #ifdef CONFIG_NF_TABLES_IPV4
1547 || family == NFPROTO_IPV4
1548 #endif
1549 #ifdef CONFIG_NF_TABLES_ARP
1550 || family == NFPROTO_ARP
1551 #endif
1552 #ifdef CONFIG_NF_TABLES_NETDEV
1553 || family == NFPROTO_NETDEV
1554 #endif
1555 #if IS_ENABLED(CONFIG_NF_TABLES_BRIDGE)
1556 || family == NFPROTO_BRIDGE
1557 #endif
1558 #ifdef CONFIG_NF_TABLES_IPV6
1559 || family == NFPROTO_IPV6
1560 #endif
1561 ;
1562 }
1563
/*
 * Handle a NEWTABLE request: update the table if it already exists in the
 * next generation, otherwise allocate a new one and queue its creation.
 *
 * Returns 0 on success, -EOPNOTSUPP for an unsupported family, unknown
 * flags or NLM_F_REPLACE on an existing table, -EEXIST when NLM_F_EXCL is
 * set and the table exists, -ENOMEM on allocation failure, or the error
 * from the lookup, update, hash table init or transaction add.
 */
static int nf_tables_newtable(struct sk_buff *skb, const struct nfnl_info *info,
			      const struct nlattr * const nla[])
{
	struct nftables_pernet *nft_net = nft_pernet(info->net);
	struct netlink_ext_ack *extack = info->extack;
	u8 genmask = nft_genmask_next(info->net);
	u8 family = info->nfmsg->nfgen_family;
	struct net *net = info->net;
	const struct nlattr *attr;
	struct nft_table *table;
	struct nft_ctx ctx;
	u32 flags = 0;
	int err;

	if (!nft_supported_family(family))
		return -EOPNOTSUPP;

	lockdep_assert_held(&nft_net->commit_mutex);
	attr = nla[NFTA_TABLE_NAME];
	table = nft_table_lookup(net, attr, family, genmask,
				 NETLINK_CB(skb).portid);
	if (IS_ERR(table)) {
		/* -ENOENT means "create it"; any other error is final. */
		if (PTR_ERR(table) != -ENOENT)
			return PTR_ERR(table);
	} else {
		/* Table exists: this request is an update. */
		if (info->nlh->nlmsg_flags & NLM_F_EXCL) {
			NL_SET_BAD_ATTR(extack, attr);
			return -EEXIST;
		}
		if (info->nlh->nlmsg_flags & NLM_F_REPLACE)
			return -EOPNOTSUPP;

		nft_ctx_init(&ctx, net, skb, info->nlh, family, table, NULL, nla);

		return nf_tables_updtable(&ctx);
	}

	if (nla[NFTA_TABLE_FLAGS]) {
		flags = ntohl(nla_get_be32(nla[NFTA_TABLE_FLAGS]));
		if (flags & ~NFT_TABLE_F_MASK)
			return -EOPNOTSUPP;
	}

	/* Default error for the allocation failures below. */
	err = -ENOMEM;
	table = kzalloc(sizeof(*table), GFP_KERNEL_ACCOUNT);
	if (table == NULL)
		goto err_kzalloc;

	table->validate_state = nft_net->validate_state;
	table->name = nla_strdup(attr, GFP_KERNEL_ACCOUNT);
	if (table->name == NULL)
		goto err_strdup;

	if (nla[NFTA_TABLE_USERDATA]) {
		table->udata = nla_memdup(nla[NFTA_TABLE_USERDATA], GFP_KERNEL_ACCOUNT);
		if (table->udata == NULL)
			goto err_table_udata;

		table->udlen = nla_len(nla[NFTA_TABLE_USERDATA]);
	}

	err = rhltable_init(&table->chains_ht, &nft_chain_ht_params);
	if (err)
		goto err_chain_ht;

	INIT_LIST_HEAD(&table->chains);
	INIT_LIST_HEAD(&table->sets);
	INIT_LIST_HEAD(&table->objects);
	INIT_LIST_HEAD(&table->flowtables);
	table->family = family;
	table->flags = flags;
	table->handle = ++nft_net->table_handle;
	/* An owned table is bound to the requesting netlink port. */
	if (table->flags & NFT_TABLE_F_OWNER)
		table->nlpid = NETLINK_CB(skb).portid;

	nft_ctx_init(&ctx, net, skb, info->nlh, family, table, NULL, nla);
	err = nft_trans_table_add(&ctx, NFT_MSG_NEWTABLE);
	if (err < 0)
		goto err_trans;

	/* Publish the table only after the transaction was queued. */
	list_add_tail_rcu(&table->list, &nft_net->tables);
	return 0;
	/* Unwind in reverse order of setup. */
err_trans:
	rhltable_destroy(&table->chains_ht);
err_chain_ht:
	kfree(table->udata);
err_table_udata:
	kfree(table->name);
err_strdup:
	kfree(table);
err_kzalloc:
	return err;
}
1657
/*
 * Queue the deletion of everything in ctx->table and then of the table
 * itself.  Only entities active in the next generation are considered.
 * The order is: rules of each chain, sets, flowtables, objects, chains,
 * table.  Bound chains (nft_chain_binding()) and anonymous sets are
 * skipped.
 *
 * Returns the first negative error encountered, otherwise the result of
 * nft_deltable().  ctx->chain is left pointing at the last chain handled.
 */
static int nft_flush_table(struct nft_ctx *ctx)
{
	struct nft_flowtable *flowtable, *nft;
	struct nft_chain *chain, *nc;
	struct nft_object *obj, *ne;
	struct nft_set *set, *ns;
	int err;

	/* Pass 1: delete the rules of every regular chain. */
	list_for_each_entry(chain, &ctx->table->chains, list) {
		if (!nft_is_active_next(ctx->net, chain))
			continue;

		if (nft_chain_binding(chain))
			continue;

		ctx->chain = chain;

		err = nft_delrule_by_chain(ctx);
		if (err < 0)
			goto out;
	}

	list_for_each_entry_safe(set, ns, &ctx->table->sets, list) {
		if (!nft_is_active_next(ctx->net, set))
			continue;

		if (nft_set_is_anonymous(set))
			continue;

		err = nft_delset(ctx, set);
		if (err < 0)
			goto out;
	}

	list_for_each_entry_safe(flowtable, nft, &ctx->table->flowtables, list) {
		if (!nft_is_active_next(ctx->net, flowtable))
			continue;

		err = nft_delflowtable(ctx, flowtable);
		if (err < 0)
			goto out;
	}

	list_for_each_entry_safe(obj, ne, &ctx->table->objects, list) {
		if (!nft_is_active_next(ctx->net, obj))
			continue;

		err = nft_delobj(ctx, obj);
		if (err < 0)
			goto out;
	}

	/* Pass 2: delete the chains themselves. */
	list_for_each_entry_safe(chain, nc, &ctx->table->chains, list) {
		if (!nft_is_active_next(ctx->net, chain))
			continue;

		if (nft_chain_binding(chain))
			continue;

		ctx->chain = chain;

		err = nft_delchain(ctx);
		if (err < 0)
			goto out;
	}

	err = nft_deltable(ctx);
out:
	return err;
}
1728
nft_flush(struct nft_ctx * ctx,int family)1729 static int nft_flush(struct nft_ctx *ctx, int family)
1730 {
1731 struct nftables_pernet *nft_net = nft_pernet(ctx->net);
1732 const struct nlattr * const *nla = ctx->nla;
1733 struct nft_table *table, *nt;
1734 int err = 0;
1735
1736 list_for_each_entry_safe(table, nt, &nft_net->tables, list) {
1737 if (family != AF_UNSPEC && table->family != family)
1738 continue;
1739
1740 ctx->family = table->family;
1741
1742 if (!nft_is_active_next(ctx->net, table))
1743 continue;
1744
1745 if (nft_table_has_owner(table) && table->nlpid != ctx->portid)
1746 continue;
1747
1748 if (nla[NFTA_TABLE_NAME] &&
1749 nla_strcmp(nla[NFTA_TABLE_NAME], table->name) != 0)
1750 continue;
1751
1752 ctx->table = table;
1753
1754 err = nft_flush_table(ctx);
1755 if (err < 0)
1756 goto out;
1757 }
1758 out:
1759 return err;
1760 }
1761
nf_tables_deltable(struct sk_buff * skb,const struct nfnl_info * info,const struct nlattr * const nla[])1762 static int nf_tables_deltable(struct sk_buff *skb, const struct nfnl_info *info,
1763 const struct nlattr * const nla[])
1764 {
1765 struct netlink_ext_ack *extack = info->extack;
1766 u8 genmask = nft_genmask_next(info->net);
1767 u8 family = info->nfmsg->nfgen_family;
1768 struct net *net = info->net;
1769 const struct nlattr *attr;
1770 struct nft_table *table;
1771 struct nft_ctx ctx;
1772
1773 nft_ctx_init(&ctx, net, skb, info->nlh, 0, NULL, NULL, nla);
1774 if (family == AF_UNSPEC ||
1775 (!nla[NFTA_TABLE_NAME] && !nla[NFTA_TABLE_HANDLE]))
1776 return nft_flush(&ctx, family);
1777
1778 if (nla[NFTA_TABLE_HANDLE]) {
1779 attr = nla[NFTA_TABLE_HANDLE];
1780 table = nft_table_lookup_byhandle(net, attr, family, genmask,
1781 NETLINK_CB(skb).portid);
1782 } else {
1783 attr = nla[NFTA_TABLE_NAME];
1784 table = nft_table_lookup(net, attr, family, genmask,
1785 NETLINK_CB(skb).portid);
1786 }
1787
1788 if (IS_ERR(table)) {
1789 if (PTR_ERR(table) == -ENOENT &&
1790 NFNL_MSG_TYPE(info->nlh->nlmsg_type) == NFT_MSG_DESTROYTABLE)
1791 return 0;
1792
1793 NL_SET_BAD_ATTR(extack, attr);
1794 return PTR_ERR(table);
1795 }
1796
1797 if (info->nlh->nlmsg_flags & NLM_F_NONREC &&
1798 table->use > 0)
1799 return -EBUSY;
1800
1801 ctx.family = family;
1802 ctx.table = table;
1803
1804 return nft_flush_table(&ctx);
1805 }
1806
nf_tables_table_destroy(struct nft_table * table)1807 static void nf_tables_table_destroy(struct nft_table *table)
1808 {
1809 if (WARN_ON(table->use > 0))
1810 return;
1811
1812 rhltable_destroy(&table->chains_ht);
1813 kfree(table->name);
1814 kfree(table->udata);
1815 kfree(table);
1816 }
1817
nft_register_chain_type(const struct nft_chain_type * ctype)1818 void nft_register_chain_type(const struct nft_chain_type *ctype)
1819 {
1820 nfnl_lock(NFNL_SUBSYS_NFTABLES);
1821 if (WARN_ON(__nft_chain_type_get(ctype->family, ctype->type))) {
1822 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
1823 return;
1824 }
1825 chain_type[ctype->family][ctype->type] = ctype;
1826 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
1827 }
1828 EXPORT_SYMBOL_GPL(nft_register_chain_type);
1829
nft_unregister_chain_type(const struct nft_chain_type * ctype)1830 void nft_unregister_chain_type(const struct nft_chain_type *ctype)
1831 {
1832 nfnl_lock(NFNL_SUBSYS_NFTABLES);
1833 chain_type[ctype->family][ctype->type] = NULL;
1834 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
1835 }
1836 EXPORT_SYMBOL_GPL(nft_unregister_chain_type);
1837
1838 /*
1839 * Chains
1840 */
1841
1842 static struct nft_chain *
nft_chain_lookup_byhandle(const struct nft_table * table,u64 handle,u8 genmask)1843 nft_chain_lookup_byhandle(const struct nft_table *table, u64 handle, u8 genmask)
1844 {
1845 struct nft_chain *chain;
1846
1847 list_for_each_entry(chain, &table->chains, list) {
1848 if (chain->handle == handle &&
1849 nft_active_genmask(chain, genmask))
1850 return chain;
1851 }
1852
1853 return ERR_PTR(-ENOENT);
1854 }
1855
lockdep_commit_lock_is_held(const struct net * net)1856 static bool lockdep_commit_lock_is_held(const struct net *net)
1857 {
1858 #ifdef CONFIG_PROVE_LOCKING
1859 struct nftables_pernet *nft_net = nft_pernet(net);
1860
1861 return lockdep_is_held(&nft_net->commit_mutex);
1862 #else
1863 return true;
1864 #endif
1865 }
1866
/*
 * Look up a chain by name in the table's chain hash table.
 *
 * Returns the first chain with that name which is active in @genmask,
 * ERR_PTR(-EINVAL) when @nla is NULL, or ERR_PTR(-ENOENT) when no such
 * chain exists.
 */
static struct nft_chain *nft_chain_lookup(struct net *net,
					  struct nft_table *table,
					  const struct nlattr *nla, u8 genmask)
{
	char search[NFT_CHAIN_MAXNAMELEN + 1];
	struct rhlist_head *tmp, *list;
	struct nft_chain *chain;

	if (nla == NULL)
		return ERR_PTR(-EINVAL);

	/* Copy the attribute into a NUL-terminated key for the hash lookup. */
	nla_strscpy(search, nla, sizeof(search));

	/* Warn unless the RCU read lock or the commit mutex is held. */
	WARN_ON(!rcu_read_lock_held() &&
		!lockdep_commit_lock_is_held(net));

	chain = ERR_PTR(-ENOENT);
	rcu_read_lock();
	list = rhltable_lookup(&table->chains_ht, search, nft_chain_ht_params);
	if (!list)
		goto out_unlock;

	/* Several chains may share a name; pick the one active in genmask. */
	rhl_for_each_entry_rcu(chain, tmp, list, rhlhead) {
		if (nft_active_genmask(chain, genmask))
			goto out_unlock;
	}
	/* Loop ran to completion: 'chain' no longer holds a valid result. */
	chain = ERR_PTR(-ENOENT);
out_unlock:
	rcu_read_unlock();
	return chain;
}
1898
/*
 * Netlink attribute policy for NFTA_CHAIN_* attributes: expected type of
 * each attribute and, for the string/binary ones, the maximum length.
 */
static const struct nla_policy nft_chain_policy[NFTA_CHAIN_MAX + 1] = {
	[NFTA_CHAIN_TABLE]	= { .type = NLA_STRING,
				    .len = NFT_TABLE_MAXNAMELEN - 1 },
	[NFTA_CHAIN_HANDLE]	= { .type = NLA_U64 },
	[NFTA_CHAIN_NAME]	= { .type = NLA_STRING,
				    .len = NFT_CHAIN_MAXNAMELEN - 1 },
	[NFTA_CHAIN_HOOK]	= { .type = NLA_NESTED },
	[NFTA_CHAIN_POLICY]	= { .type = NLA_U32 },
	/* The type name is also used to build a module name for autoload. */
	[NFTA_CHAIN_TYPE]	= { .type = NLA_STRING,
				    .len = NFT_MODULE_AUTOLOAD_LIMIT },
	[NFTA_CHAIN_COUNTERS]	= { .type = NLA_NESTED },
	[NFTA_CHAIN_FLAGS]	= { .type = NLA_U32 },
	[NFTA_CHAIN_ID]		= { .type = NLA_U32 },
	[NFTA_CHAIN_USERDATA]	= { .type = NLA_BINARY,
				    .len = NFT_USERDATA_MAXLEN },
};
1915
/* Netlink attribute policy for the NFTA_HOOK_* attributes. */
static const struct nla_policy nft_hook_policy[NFTA_HOOK_MAX + 1] = {
	[NFTA_HOOK_HOOKNUM]	= { .type = NLA_U32 },
	[NFTA_HOOK_PRIORITY]	= { .type = NLA_U32 },
	[NFTA_HOOK_DEV]		= { .type = NLA_STRING,
				    .len = IFNAMSIZ - 1 },
};
1922
/*
 * Sum the per-CPU packet and byte counters in @stats over all possible
 * CPUs and emit them to @skb as a nested NFTA_CHAIN_COUNTERS attribute.
 *
 * Returns 0 on success or when @stats is NULL (nothing is emitted then),
 * and -ENOSPC when an attribute does not fit.
 */
static int nft_dump_stats(struct sk_buff *skb, struct nft_stats __percpu *stats)
{
	u64 sum_pkts = 0, sum_bytes = 0;
	struct nft_stats *cpu_stats;
	struct nlattr *nest;
	unsigned int seq;
	u64 pkts, bytes;
	int cpu;

	if (!stats)
		return 0;

	for_each_possible_cpu(cpu) {
		cpu_stats = per_cpu_ptr(stats, cpu);
		/* Re-read until the snapshot of both counters is consistent. */
		do {
			seq = u64_stats_fetch_begin(&cpu_stats->syncp);
			pkts = cpu_stats->pkts;
			bytes = cpu_stats->bytes;
		} while (u64_stats_fetch_retry(&cpu_stats->syncp, seq));
		sum_pkts += pkts;
		sum_bytes += bytes;
	}

	nest = nla_nest_start_noflag(skb, NFTA_CHAIN_COUNTERS);
	if (!nest)
		return -ENOSPC;

	if (nla_put_be64(skb, NFTA_COUNTER_PACKETS, cpu_to_be64(sum_pkts),
			 NFTA_COUNTER_PAD))
		return -ENOSPC;
	if (nla_put_be64(skb, NFTA_COUNTER_BYTES, cpu_to_be64(sum_bytes),
			 NFTA_COUNTER_PAD))
		return -ENOSPC;

	nla_nest_end(skb, nest);
	return 0;
}
1961
hook_is_prefix(struct nft_hook * hook)1962 static bool hook_is_prefix(struct nft_hook *hook)
1963 {
1964 return strlen(hook->ifname) >= hook->ifnamelen;
1965 }
1966
nft_nla_put_hook_dev(struct sk_buff * skb,struct nft_hook * hook)1967 static int nft_nla_put_hook_dev(struct sk_buff *skb, struct nft_hook *hook)
1968 {
1969 int attr = hook_is_prefix(hook) ? NFTA_DEVICE_PREFIX : NFTA_DEVICE_NAME;
1970
1971 return nla_put_string(skb, attr, hook->ifname);
1972 }
1973
/*
 * Emit the nested NFTA_CHAIN_HOOK attribute of a base chain: hook number,
 * priority and, for netdev base chains, the list of devices.
 *
 * @hook_list selects the hooks to dump; when NULL the base chain's own
 * hook_list is used.  Returns 0 on success, -1 when an attribute does not
 * fit.
 */
static int nft_dump_basechain_hook(struct sk_buff *skb,
				   const struct net *net, int family,
				   const struct nft_base_chain *basechain,
				   const struct list_head *hook_list)
{
	const struct nf_hook_ops *ops = &basechain->ops;
	struct nft_hook *hook, *first = NULL;
	struct nlattr *nest, *nest_devs;
	int n = 0;

	nest = nla_nest_start_noflag(skb, NFTA_CHAIN_HOOK);
	if (nest == NULL)
		goto nla_put_failure;
	if (nla_put_be32(skb, NFTA_HOOK_HOOKNUM, htonl(ops->hooknum)))
		goto nla_put_failure;
	if (nla_put_be32(skb, NFTA_HOOK_PRIORITY, htonl(ops->priority)))
		goto nla_put_failure;

	if (nft_base_chain_netdev(family, ops->hooknum)) {
		nest_devs = nla_nest_start_noflag(skb, NFTA_HOOK_DEVS);
		if (!nest_devs)
			goto nla_put_failure;

		if (!hook_list)
			hook_list = &basechain->hook_list;

		list_for_each_entry_rcu(hook, hook_list, list,
					lockdep_commit_lock_is_held(net)) {
			/* Remember the first hook for the single-device case. */
			if (!first)
				first = hook;

			if (nft_nla_put_hook_dev(skb, hook))
				goto nla_put_failure;
			n++;
		}
		nla_nest_end(skb, nest_devs);

		/*
		 * Exactly one non-prefix device: additionally emit it as
		 * NFTA_HOOK_DEV.
		 */
		if (n == 1 &&
		    !hook_is_prefix(first) &&
		    nla_put_string(skb, NFTA_HOOK_DEV, first->ifname))
			goto nla_put_failure;
	}
	nla_nest_end(skb, nest);

	return 0;
nla_put_failure:
	return -1;
}
2022
/*
 * Append one chain message for @event to @skb.
 *
 * Table name, chain name and handle are always emitted.  A delete/destroy
 * event without a @hook_list ends there.  Otherwise base chains add their
 * hook description, policy, type name and counters, and every chain adds
 * its flags (when non-zero), use count and user data (when present).
 *
 * Returns 0 on success.  On failure the partial message is trimmed from
 * @skb and -1 is returned.
 */
static int nf_tables_fill_chain_info(struct sk_buff *skb, struct net *net,
				     u32 portid, u32 seq, int event, u32 flags,
				     int family, const struct nft_table *table,
				     const struct nft_chain *chain,
				     const struct list_head *hook_list)
{
	struct nlmsghdr *nlh;

	nlh = nfnl_msg_put(skb, portid, seq,
			   nfnl_msg_type(NFNL_SUBSYS_NFTABLES, event),
			   flags, family, NFNETLINK_V0, nft_base_seq(net));
	if (!nlh)
		goto nla_put_failure;

	if (nla_put_string(skb, NFTA_CHAIN_TABLE, table->name) ||
	    nla_put_string(skb, NFTA_CHAIN_NAME, chain->name) ||
	    nla_put_be64(skb, NFTA_CHAIN_HANDLE, cpu_to_be64(chain->handle),
			 NFTA_CHAIN_PAD))
		goto nla_put_failure;

	/* Deleting the whole chain: the identifying attributes suffice. */
	if (!hook_list &&
	    (event == NFT_MSG_DELCHAIN ||
	     event == NFT_MSG_DESTROYCHAIN)) {
		nlmsg_end(skb, nlh);
		return 0;
	}

	if (nft_is_base_chain(chain)) {
		const struct nft_base_chain *basechain = nft_base_chain(chain);
		struct nft_stats __percpu *stats;

		if (nft_dump_basechain_hook(skb, net, family, basechain, hook_list))
			goto nla_put_failure;

		if (nla_put_be32(skb, NFTA_CHAIN_POLICY,
				 htonl(basechain->policy)))
			goto nla_put_failure;

		if (nla_put_string(skb, NFTA_CHAIN_TYPE, basechain->type->name))
			goto nla_put_failure;

		/* Stats pointer is read under RCU or the commit mutex. */
		stats = rcu_dereference_check(basechain->stats,
					      lockdep_commit_lock_is_held(net));
		if (nft_dump_stats(skb, stats))
			goto nla_put_failure;
	}

	if (chain->flags &&
	    nla_put_be32(skb, NFTA_CHAIN_FLAGS, htonl(chain->flags)))
		goto nla_put_failure;

	if (nla_put_be32(skb, NFTA_CHAIN_USE, htonl(chain->use)))
		goto nla_put_failure;

	if (chain->udata &&
	    nla_put(skb, NFTA_CHAIN_USERDATA, chain->udlen, chain->udata))
		goto nla_put_failure;

	nlmsg_end(skb, nlh);
	return 0;

nla_put_failure:
	nlmsg_trim(skb, nlh);
	return -1;
}
2088
nf_tables_chain_notify(const struct nft_ctx * ctx,int event,const struct list_head * hook_list)2089 static void nf_tables_chain_notify(const struct nft_ctx *ctx, int event,
2090 const struct list_head *hook_list)
2091 {
2092 struct nftables_pernet *nft_net;
2093 struct sk_buff *skb;
2094 u16 flags = 0;
2095 int err;
2096
2097 if (!ctx->report &&
2098 !nfnetlink_has_listeners(ctx->net, NFNLGRP_NFTABLES))
2099 return;
2100
2101 skb = nlmsg_new(NLMSG_GOODSIZE, GFP_KERNEL);
2102 if (skb == NULL)
2103 goto err;
2104
2105 if (ctx->flags & (NLM_F_CREATE | NLM_F_EXCL))
2106 flags |= ctx->flags & (NLM_F_CREATE | NLM_F_EXCL);
2107
2108 err = nf_tables_fill_chain_info(skb, ctx->net, ctx->portid, ctx->seq,
2109 event, flags, ctx->family, ctx->table,
2110 ctx->chain, hook_list);
2111 if (err < 0) {
2112 kfree_skb(skb);
2113 goto err;
2114 }
2115
2116 nft_net = nft_pernet(ctx->net);
2117 nft_notify_enqueue(skb, ctx->report, &nft_net->notify_list);
2118 return;
2119 err:
2120 nfnetlink_set_err(ctx->net, ctx->portid, NFNLGRP_NFTABLES, -ENOBUFS);
2121 }
2122
/*
 * Netlink dump callback: emit one NFT_MSG_NEWCHAIN message per chain.
 *
 * Walks all tables of the netns (restricted to the family from the request
 * header unless it is NFPROTO_UNSPEC) and all chains of each table under
 * rcu_read_lock().  cb->args[0] is the chain index to resume from and is
 * written back before returning.
 *
 * Returns skb->len.
 */
static int nf_tables_dump_chains(struct sk_buff *skb,
				 struct netlink_callback *cb)
{
	const struct nfgenmsg *nfmsg = nlmsg_data(cb->nlh);
	unsigned int idx = 0, s_idx = cb->args[0];
	struct net *net = sock_net(skb->sk);
	int family = nfmsg->nfgen_family;
	struct nftables_pernet *nft_net;
	const struct nft_table *table;
	const struct nft_chain *chain;

	rcu_read_lock();
	nft_net = nft_pernet(net);
	/* snapshot used by nl_dump_check_consistent() below */
	cb->seq = READ_ONCE(nft_net->base_seq);

	list_for_each_entry_rcu(table, &nft_net->tables, list) {
		if (family != NFPROTO_UNSPEC && family != table->family)
			continue;

		list_for_each_entry_rcu(chain, &table->chains, list) {
			/* entries before the resume index are only counted */
			if (idx < s_idx)
				goto cont;
			/* past the resume point: clear the remaining cb->args slots */
			if (idx > s_idx)
				memset(&cb->args[1], 0,
				       sizeof(cb->args) - sizeof(cb->args[0]));
			/* NOTE: this `continue` bypasses the idx++ at `cont:`,
			 * so chains skipped here are not counted in idx.
			 */
			if (!nft_is_active(net, chain))
				continue;
			/* On failure idx is left pointing at this chain, so
			 * the next invocation resumes with it.
			 */
			if (nf_tables_fill_chain_info(skb, net,
						      NETLINK_CB(cb->skb).portid,
						      cb->nlh->nlmsg_seq,
						      NFT_MSG_NEWCHAIN,
						      NLM_F_MULTI,
						      table->family, table,
						      chain, NULL) < 0)
				goto done;

			nl_dump_check_consistent(cb, nlmsg_hdr(skb));
cont:
			idx++;
		}
	}
done:
	rcu_read_unlock();
	cb->args[0] = idx;
	return skb->len;
}
2169
2170 /* called with rcu_read_lock held */
nf_tables_getchain(struct sk_buff * skb,const struct nfnl_info * info,const struct nlattr * const nla[])2171 static int nf_tables_getchain(struct sk_buff *skb, const struct nfnl_info *info,
2172 const struct nlattr * const nla[])
2173 {
2174 struct netlink_ext_ack *extack = info->extack;
2175 u8 genmask = nft_genmask_cur(info->net);
2176 u8 family = info->nfmsg->nfgen_family;
2177 const struct nft_chain *chain;
2178 struct net *net = info->net;
2179 struct nft_table *table;
2180 struct sk_buff *skb2;
2181 int err;
2182
2183 if (info->nlh->nlmsg_flags & NLM_F_DUMP) {
2184 struct netlink_dump_control c = {
2185 .dump = nf_tables_dump_chains,
2186 .module = THIS_MODULE,
2187 };
2188
2189 return nft_netlink_dump_start_rcu(info->sk, skb, info->nlh, &c);
2190 }
2191
2192 table = nft_table_lookup(net, nla[NFTA_CHAIN_TABLE], family, genmask, 0);
2193 if (IS_ERR(table)) {
2194 NL_SET_BAD_ATTR(extack, nla[NFTA_CHAIN_TABLE]);
2195 return PTR_ERR(table);
2196 }
2197
2198 chain = nft_chain_lookup(net, table, nla[NFTA_CHAIN_NAME], genmask);
2199 if (IS_ERR(chain)) {
2200 NL_SET_BAD_ATTR(extack, nla[NFTA_CHAIN_NAME]);
2201 return PTR_ERR(chain);
2202 }
2203
2204 skb2 = alloc_skb(NLMSG_GOODSIZE, GFP_ATOMIC);
2205 if (!skb2)
2206 return -ENOMEM;
2207
2208 err = nf_tables_fill_chain_info(skb2, net, NETLINK_CB(skb).portid,
2209 info->nlh->nlmsg_seq, NFT_MSG_NEWCHAIN,
2210 0, family, table, chain, NULL);
2211 if (err < 0)
2212 goto err_fill_chain_info;
2213
2214 return nfnetlink_unicast(skb2, net, NETLINK_CB(skb).portid);
2215
2216 err_fill_chain_info:
2217 kfree_skb(skb2);
2218 return err;
2219 }
2220
/* Netlink policy for the nested counter attributes parsed by
 * nft_stats_alloc(): both values are 64-bit.
 */
static const struct nla_policy nft_counter_policy[NFTA_COUNTER_MAX + 1] = {
	[NFTA_COUNTER_PACKETS]	= { .type = NLA_U64 },
	[NFTA_COUNTER_BYTES]	= { .type = NLA_U64 },
};
2225
nft_stats_alloc(const struct nlattr * attr)2226 static struct nft_stats __percpu *nft_stats_alloc(const struct nlattr *attr)
2227 {
2228 struct nlattr *tb[NFTA_COUNTER_MAX+1];
2229 struct nft_stats __percpu *newstats;
2230 struct nft_stats *stats;
2231 int err;
2232
2233 err = nla_parse_nested_deprecated(tb, NFTA_COUNTER_MAX, attr,
2234 nft_counter_policy, NULL);
2235 if (err < 0)
2236 return ERR_PTR_PCPU(err);
2237
2238 if (!tb[NFTA_COUNTER_BYTES] || !tb[NFTA_COUNTER_PACKETS])
2239 return ERR_PTR_PCPU(-EINVAL);
2240
2241 newstats = netdev_alloc_pcpu_stats(struct nft_stats);
2242 if (newstats == NULL)
2243 return ERR_PTR_PCPU(-ENOMEM);
2244
2245 /* Restore old counters on this cpu, no problem. Per-cpu statistics
2246 * are not exposed to userspace.
2247 */
2248 preempt_disable();
2249 stats = this_cpu_ptr(newstats);
2250 stats->bytes = be64_to_cpu(nla_get_be64(tb[NFTA_COUNTER_BYTES]));
2251 stats->pkts = be64_to_cpu(nla_get_be64(tb[NFTA_COUNTER_PACKETS]));
2252 preempt_enable();
2253
2254 return newstats;
2255 }
2256
nft_chain_stats_replace(struct nft_trans_chain * trans)2257 static void nft_chain_stats_replace(struct nft_trans_chain *trans)
2258 {
2259 const struct nft_trans *t = &trans->nft_trans_binding.nft_trans;
2260 struct nft_base_chain *chain = nft_base_chain(trans->chain);
2261
2262 if (!trans->stats)
2263 return;
2264
2265 trans->stats =
2266 rcu_replace_pointer(chain->stats, trans->stats,
2267 lockdep_commit_lock_is_held(t->net));
2268
2269 if (!trans->stats)
2270 static_branch_inc(&nft_counters_enabled);
2271 }
2272
nf_tables_chain_free_chain_rules(struct nft_chain * chain)2273 static void nf_tables_chain_free_chain_rules(struct nft_chain *chain)
2274 {
2275 struct nft_rule_blob *g0 = rcu_dereference_raw(chain->blob_gen_0);
2276 struct nft_rule_blob *g1 = rcu_dereference_raw(chain->blob_gen_1);
2277
2278 if (g0 != g1)
2279 kvfree(g1);
2280 kvfree(g0);
2281
2282 /* should be NULL either via abort or via successful commit */
2283 WARN_ON_ONCE(chain->blob_next);
2284 kvfree(chain->blob_next);
2285 }
2286
nf_tables_chain_destroy(struct nft_chain * chain)2287 void nf_tables_chain_destroy(struct nft_chain *chain)
2288 {
2289 const struct nft_table *table = chain->table;
2290 struct nft_hook *hook, *next;
2291
2292 if (WARN_ON(chain->use > 0))
2293 return;
2294
2295 /* no concurrent access possible anymore */
2296 nf_tables_chain_free_chain_rules(chain);
2297
2298 if (nft_is_base_chain(chain)) {
2299 struct nft_base_chain *basechain = nft_base_chain(chain);
2300
2301 if (nft_base_chain_netdev(table->family, basechain->ops.hooknum)) {
2302 list_for_each_entry_safe(hook, next,
2303 &basechain->hook_list, list) {
2304 list_del_rcu(&hook->list);
2305 nft_netdev_hook_free_rcu(hook);
2306 }
2307 }
2308 module_put(basechain->type->owner);
2309 if (rcu_access_pointer(basechain->stats)) {
2310 static_branch_dec(&nft_counters_enabled);
2311 free_percpu(rcu_dereference_raw(basechain->stats));
2312 }
2313 kfree(chain->name);
2314 kfree(chain->udata);
2315 kfree(basechain);
2316 } else {
2317 kfree(chain->name);
2318 kfree(chain->udata);
2319 kfree(chain);
2320 }
2321 }
2322
/*
 * Allocate a netdev hook for the interface name (or name prefix) in @attr.
 *
 * The name is copied into hook->ifname.  For every device in @net whose
 * name matches the first hook->ifnamelen bytes, a zeroed nf_hook_ops bound
 * to that device is appended to hook->ops_list.
 *
 * Returns the hook, or an ERR_PTR() (-ENOMEM or the nla_strscpy() error).
 */
static struct nft_hook *nft_netdev_hook_alloc(struct net *net,
					      const struct nlattr *attr,
					      bool prefix)
{
	struct net_device *netdev;
	struct nf_hook_ops *ops;
	struct nft_hook *hook;
	int ret;

	hook = kzalloc(sizeof(*hook), GFP_KERNEL_ACCOUNT);
	if (!hook)
		return ERR_PTR(-ENOMEM);

	INIT_LIST_HEAD(&hook->ops_list);

	ret = nla_strscpy(hook->ifname, attr, IFNAMSIZ);
	if (ret < 0)
		goto err_free;

	/* include the terminating NUL-char when comparing non-prefixes */
	hook->ifnamelen = strlen(hook->ifname) + !prefix;

	/* nf_tables_netdev_event() is called under rtnl_mutex, this is
	 * indirectly serializing all the other holders of the commit_mutex with
	 * the rtnl_mutex.
	 */
	for_each_netdev(net, netdev) {
		if (strncmp(netdev->name, hook->ifname, hook->ifnamelen) != 0)
			continue;

		ops = kzalloc(sizeof(*ops), GFP_KERNEL_ACCOUNT);
		if (!ops) {
			ret = -ENOMEM;
			goto err_free;
		}

		ops->dev = netdev;
		list_add_tail(&ops->list, &hook->ops_list);
	}

	return hook;

err_free:
	nft_netdev_hook_free(hook);
	return ERR_PTR(ret);
}
2367
nft_hook_list_find(struct list_head * hook_list,const struct nft_hook * this)2368 static struct nft_hook *nft_hook_list_find(struct list_head *hook_list,
2369 const struct nft_hook *this)
2370 {
2371 struct nft_hook *hook;
2372
2373 list_for_each_entry(hook, hook_list, list) {
2374 if (!strncmp(hook->ifname, this->ifname,
2375 min(hook->ifnamelen, this->ifnamelen)))
2376 return hook;
2377 }
2378
2379 return NULL;
2380 }
2381
nf_tables_parse_netdev_hooks(struct net * net,const struct nlattr * attr,struct list_head * hook_list,struct netlink_ext_ack * extack)2382 static int nf_tables_parse_netdev_hooks(struct net *net,
2383 const struct nlattr *attr,
2384 struct list_head *hook_list,
2385 struct netlink_ext_ack *extack)
2386 {
2387 struct nft_hook *hook, *next;
2388 const struct nlattr *tmp;
2389 int rem, n = 0, err;
2390 bool prefix;
2391
2392 nla_for_each_nested(tmp, attr, rem) {
2393 switch (nla_type(tmp)) {
2394 case NFTA_DEVICE_NAME:
2395 prefix = false;
2396 break;
2397 case NFTA_DEVICE_PREFIX:
2398 prefix = true;
2399 break;
2400 default:
2401 err = -EINVAL;
2402 goto err_hook;
2403 }
2404
2405 hook = nft_netdev_hook_alloc(net, tmp, prefix);
2406 if (IS_ERR(hook)) {
2407 NL_SET_BAD_ATTR(extack, tmp);
2408 err = PTR_ERR(hook);
2409 goto err_hook;
2410 }
2411 if (nft_hook_list_find(hook_list, hook)) {
2412 NL_SET_BAD_ATTR(extack, tmp);
2413 nft_netdev_hook_free(hook);
2414 err = -EEXIST;
2415 goto err_hook;
2416 }
2417 list_add_tail(&hook->list, hook_list);
2418 n++;
2419
2420 if (n == NFT_NETDEVICE_MAX) {
2421 err = -EFBIG;
2422 goto err_hook;
2423 }
2424 }
2425
2426 return 0;
2427
2428 err_hook:
2429 list_for_each_entry_safe(hook, next, hook_list, list) {
2430 list_del(&hook->list);
2431 nft_netdev_hook_free(hook);
2432 }
2433 return err;
2434 }
2435
/* Parsed form of NFTA_CHAIN_HOOK, filled in by nft_chain_parse_hook(). */
struct nft_chain_hook {
	u32				num;		/* from NFTA_HOOK_HOOKNUM */
	s32				priority;	/* from NFTA_HOOK_PRIORITY */
	/* chain type; nft_chain_parse_hook() takes a reference on its
	 * owner module, nft_chain_release_hook() drops it
	 */
	const struct nft_chain_type	*type;
	struct list_head		list;		/* struct nft_hook entries (netdev hooks) */
};
2442
/*
 * Collect the device hooks of a netdev base chain into @hook_list.
 *
 * A single NFTA_HOOK_DEV takes precedence over the NFTA_HOOK_DEVS list.
 * With NFT_CHAIN_HW_OFFLOAD set in @flags, an empty resulting list is
 * rejected with -EINVAL.
 *
 * Returns 0 on success or a negative errno.
 */
static int nft_chain_parse_netdev(struct net *net, struct nlattr *tb[],
				  struct list_head *hook_list,
				  struct netlink_ext_ack *extack, u32 flags)
{
	struct nft_hook *hook;
	int err;

	if (tb[NFTA_HOOK_DEV]) {
		hook = nft_netdev_hook_alloc(net, tb[NFTA_HOOK_DEV], false);
		if (IS_ERR(hook)) {
			NL_SET_BAD_ATTR(extack, tb[NFTA_HOOK_DEV]);
			return PTR_ERR(hook);
		}

		list_add_tail(&hook->list, hook_list);
	} else if (tb[NFTA_HOOK_DEVS]) {
		err = nf_tables_parse_netdev_hooks(net, tb[NFTA_HOOK_DEVS],
						   hook_list, extack);
		if (err < 0)
			return err;
	}

	if ((flags & NFT_CHAIN_HW_OFFLOAD) && list_empty(hook_list))
		return -EINVAL;

	return 0;
}
2472
/*
 * Parse NFTA_CHAIN_HOOK into @hook.
 *
 * @basechain is NULL when a new base chain is being created; in that case
 * hook number and priority are mandatory and the chain type is either the
 * family default or the one named by NFTA_CHAIN_TYPE.  When @basechain is
 * set, any hook number / priority supplied must equal the ones the chain
 * already uses, and the type defaults to the chain's current type.
 *
 * On success a reference on the chain type's owner module is held and, for
 * netdev hooks, @hook->list contains the parsed device hooks; callers
 * release both with nft_chain_release_hook().
 *
 * Must be called with the commit mutex held.  Returns 0 or a negative errno.
 */
static int nft_chain_parse_hook(struct net *net,
				struct nft_base_chain *basechain,
				const struct nlattr * const nla[],
				struct nft_chain_hook *hook, u8 family,
				u32 flags, struct netlink_ext_ack *extack)
{
	struct nftables_pernet *nft_net = nft_pernet(net);
	struct nlattr *ha[NFTA_HOOK_MAX + 1];
	const struct nft_chain_type *type;
	int err;

	lockdep_assert_held(&nft_net->commit_mutex);
	lockdep_nfnl_nft_mutex_not_held();

	err = nla_parse_nested_deprecated(ha, NFTA_HOOK_MAX,
					  nla[NFTA_CHAIN_HOOK],
					  nft_hook_policy, NULL);
	if (err < 0)
		return err;

	if (!basechain) {
		/* new base chain: hook number and priority are required */
		if (!ha[NFTA_HOOK_HOOKNUM] ||
		    !ha[NFTA_HOOK_PRIORITY]) {
			NL_SET_BAD_ATTR(extack, nla[NFTA_CHAIN_NAME]);
			return -ENOENT;
		}

		hook->num = ntohl(nla_get_be32(ha[NFTA_HOOK_HOOKNUM]));
		hook->priority = ntohl(nla_get_be32(ha[NFTA_HOOK_PRIORITY]));

		type = __nft_chain_type_get(family, NFT_CHAIN_T_DEFAULT);
		if (!type)
			return -EOPNOTSUPP;

		/* an explicit type overrides the family default */
		if (nla[NFTA_CHAIN_TYPE]) {
			type = nf_tables_chain_type_lookup(net, nla[NFTA_CHAIN_TYPE],
							   family, true);
			if (IS_ERR(type)) {
				NL_SET_BAD_ATTR(extack, nla[NFTA_CHAIN_TYPE]);
				return PTR_ERR(type);
			}
		}
		/* range check first so the shift below stays in bounds */
		if (hook->num >= NFT_MAX_HOOKS || !(type->hook_mask & (1 << hook->num)))
			return -EOPNOTSUPP;

		if (type->type == NFT_CHAIN_T_NAT &&
		    hook->priority <= NF_IP_PRI_CONNTRACK)
			return -EOPNOTSUPP;
	} else {
		/* existing base chain: supplied values must match the chain.
		 * Fields whose attribute is absent keep whatever value the
		 * caller initialised @hook with.
		 */
		if (ha[NFTA_HOOK_HOOKNUM]) {
			hook->num = ntohl(nla_get_be32(ha[NFTA_HOOK_HOOKNUM]));
			if (hook->num != basechain->ops.hooknum)
				return -EOPNOTSUPP;
		}
		if (ha[NFTA_HOOK_PRIORITY]) {
			hook->priority = ntohl(nla_get_be32(ha[NFTA_HOOK_PRIORITY]));
			if (hook->priority != basechain->ops.priority)
				return -EOPNOTSUPP;
		}

		if (nla[NFTA_CHAIN_TYPE]) {
			type = __nf_tables_chain_type_lookup(nla[NFTA_CHAIN_TYPE],
							     family);
			if (!type) {
				NL_SET_BAD_ATTR(extack, nla[NFTA_CHAIN_TYPE]);
				return -ENOENT;
			}
		} else {
			type = basechain->type;
		}
	}

	/* pin the chain type module; dropped again on every error below */
	if (!try_module_get(type->owner)) {
		if (nla[NFTA_CHAIN_TYPE])
			NL_SET_BAD_ATTR(extack, nla[NFTA_CHAIN_TYPE]);
		return -ENOENT;
	}

	hook->type = type;

	INIT_LIST_HEAD(&hook->list);
	if (nft_base_chain_netdev(family, hook->num)) {
		err = nft_chain_parse_netdev(net, ha, &hook->list, extack, flags);
		if (err < 0) {
			module_put(type->owner);
			return err;
		}
	} else if (ha[NFTA_HOOK_DEV] || ha[NFTA_HOOK_DEVS]) {
		/* device attributes are only valid for netdev hooks */
		module_put(type->owner);
		return -EOPNOTSUPP;
	}

	return 0;
}
2567
nft_chain_release_hook(struct nft_chain_hook * hook)2568 static void nft_chain_release_hook(struct nft_chain_hook *hook)
2569 {
2570 struct nft_hook *h, *next;
2571
2572 list_for_each_entry_safe(h, next, &hook->list, list) {
2573 list_del(&h->list);
2574 nft_netdev_hook_free(h);
2575 }
2576 module_put(hook->type->owner);
2577 }
2578
nft_last_rule(const struct nft_chain * chain,const void * ptr)2579 static void nft_last_rule(const struct nft_chain *chain, const void *ptr)
2580 {
2581 struct nft_rule_dp_last *lrule;
2582
2583 BUILD_BUG_ON(offsetof(struct nft_rule_dp_last, end) != 0);
2584
2585 lrule = (struct nft_rule_dp_last *)ptr;
2586 lrule->end.is_last = 1;
2587 lrule->chain = chain;
2588 /* blob size does not include the trailer rule */
2589 }
2590
nf_tables_chain_alloc_rules(const struct nft_chain * chain,unsigned int size)2591 static struct nft_rule_blob *nf_tables_chain_alloc_rules(const struct nft_chain *chain,
2592 unsigned int size)
2593 {
2594 struct nft_rule_blob *blob;
2595
2596 if (size > INT_MAX)
2597 return NULL;
2598
2599 size += sizeof(struct nft_rule_blob) + sizeof(struct nft_rule_dp_last);
2600
2601 blob = kvmalloc(size, GFP_KERNEL_ACCOUNT);
2602 if (!blob)
2603 return NULL;
2604
2605 blob->size = 0;
2606 nft_last_rule(chain, blob->data);
2607
2608 return blob;
2609 }
2610
/*
 * Fill one nf_hook_ops from the parsed chain hook: protocol family, hook
 * number and priority, the chain type's handler for that hook number, and
 * @chain as the private data passed to the handler.
 */
static void nft_basechain_hook_init(struct nf_hook_ops *ops, u8 family,
				    const struct nft_chain_hook *hook,
				    struct nft_chain *chain)
{
	ops->hook_ops_type	= NF_HOOK_OP_NF_TABLES;
	ops->pf			= family;
	ops->hooknum		= hook->num;
	ops->priority		= hook->priority;
	ops->hook		= hook->type->hooks[hook->num];
	ops->priv		= chain;
}
2622
/*
 * Initialise a freshly allocated base chain from the parsed @hook.
 *
 * For netdev hooks the device hooks move from @hook->list to the chain's
 * hook_list and each of their ops is initialised.  The chain's own ops are
 * always initialised, the policy defaults to NF_ACCEPT, and
 * NFT_CHAIN_BASE | @flags is or-ed into the chain flags.
 *
 * Returns 0, or -EOPNOTSUPP when hardware offload was requested but
 * nft_chain_offload_support() rejects the chain; the device hooks are then
 * handed back to @hook->list for the caller to release.
 */
static int nft_basechain_init(struct nft_base_chain *basechain, u8 family,
			      struct nft_chain_hook *hook, u32 flags)
{
	struct nft_chain *chain = &basechain->chain;
	struct nf_hook_ops *dev_ops;
	struct nft_hook *dev_hook;

	basechain->type = hook->type;
	INIT_LIST_HEAD(&basechain->hook_list);

	if (nft_base_chain_netdev(family, hook->num)) {
		list_splice_init(&hook->list, &basechain->hook_list);
		list_for_each_entry(dev_hook, &basechain->hook_list, list) {
			list_for_each_entry(dev_ops, &dev_hook->ops_list, list)
				nft_basechain_hook_init(dev_ops, family, hook, chain);
		}
	}
	nft_basechain_hook_init(&basechain->ops, family, hook, chain);

	basechain->policy = NF_ACCEPT;
	chain->flags |= NFT_CHAIN_BASE | flags;

	if (!(chain->flags & NFT_CHAIN_HW_OFFLOAD) ||
	    nft_chain_offload_support(basechain)) {
		flow_block_init(&basechain->flow_block);
		return 0;
	}

	/* give the hooks back so the caller's release path frees them */
	list_splice_init(&basechain->hook_list, &hook->list);
	return -EOPNOTSUPP;
}
2655
nft_chain_add(struct nft_table * table,struct nft_chain * chain)2656 int nft_chain_add(struct nft_table *table, struct nft_chain *chain)
2657 {
2658 int err;
2659
2660 err = rhltable_insert_key(&table->chains_ht, chain->name,
2661 &chain->rhlhead, nft_chain_ht_params);
2662 if (err)
2663 return err;
2664
2665 list_add_tail_rcu(&chain->list, &table->chains);
2666
2667 return 0;
2668 }
2669
/* Counter used by nf_tables_addchain() to generate "__chain%llu" names for
 * chains created without NFTA_CHAIN_NAME.
 */
static u64 chain_id;
2671
/*
 * Create a new chain in ctx->table and queue its NFT_MSG_NEWCHAIN
 * transaction.
 *
 * With NFTA_CHAIN_HOOK a base chain is created: the hook is parsed,
 * optional counters are allocated and the base chain is initialised.
 * Without it a regular chain is created (NFT_CHAIN_BASE and
 * NFT_CHAIN_HW_OFFLOAD are then rejected).  The chain gets a handle, a
 * name (from NFTA_CHAIN_NAME, or generated for NFT_CHAIN_BINDING chains),
 * optional user data and an empty rule blob shared by both generations.
 * Finally it is added to the table and its hooks are registered.
 *
 * ctx->chain is set to the new chain.  Returns 0 or a negative errno; on
 * error everything allocated here is released again.
 */
static int nf_tables_addchain(struct nft_ctx *ctx, u8 family, u8 policy,
			      u32 flags, struct netlink_ext_ack *extack)
{
	const struct nlattr * const *nla = ctx->nla;
	struct nft_table *table = ctx->table;
	struct nft_base_chain *basechain;
	struct net *net = ctx->net;
	char name[NFT_NAME_MAXLEN];
	struct nft_rule_blob *blob;
	struct nft_trans *trans;
	struct nft_chain *chain;
	int err;

	if (nla[NFTA_CHAIN_HOOK]) {
		struct nft_stats __percpu *stats = NULL;
		struct nft_chain_hook hook = {};

		if (table->flags & __NFT_TABLE_F_UPDATE)
			return -EINVAL;

		if (flags & NFT_CHAIN_BINDING)
			return -EOPNOTSUPP;

		err = nft_chain_parse_hook(net, NULL, nla, &hook, family, flags,
					   extack);
		if (err < 0)
			return err;

		basechain = kzalloc(sizeof(*basechain), GFP_KERNEL_ACCOUNT);
		if (basechain == NULL) {
			nft_chain_release_hook(&hook);
			return -ENOMEM;
		}
		chain = &basechain->chain;

		if (nla[NFTA_CHAIN_COUNTERS]) {
			stats = nft_stats_alloc(nla[NFTA_CHAIN_COUNTERS]);
			if (IS_ERR_PCPU(stats)) {
				nft_chain_release_hook(&hook);
				kfree(basechain);
				return PTR_ERR_PCPU(stats);
			}
			rcu_assign_pointer(basechain->stats, stats);
		}

		err = nft_basechain_init(basechain, family, &hook, flags);
		if (err < 0) {
			nft_chain_release_hook(&hook);
			kfree(basechain);
			free_percpu(stats);
			return err;
		}
		/* From here on nf_tables_chain_destroy() owns the counters and
		 * decrements nft_counters_enabled when it frees them.
		 */
		if (stats)
			static_branch_inc(&nft_counters_enabled);
	} else {
		if (flags & NFT_CHAIN_BASE)
			return -EINVAL;
		if (flags & NFT_CHAIN_HW_OFFLOAD)
			return -EOPNOTSUPP;

		chain = kzalloc(sizeof(*chain), GFP_KERNEL_ACCOUNT);
		if (chain == NULL)
			return -ENOMEM;

		chain->flags = flags;
	}
	ctx->chain = chain;

	INIT_LIST_HEAD(&chain->rules);
	chain->handle = nf_tables_alloc_handle(table);
	chain->table = table;

	if (nla[NFTA_CHAIN_NAME]) {
		chain->name = nla_strdup(nla[NFTA_CHAIN_NAME], GFP_KERNEL_ACCOUNT);
	} else {
		/* only binding chains may be created without a name */
		if (!(flags & NFT_CHAIN_BINDING)) {
			err = -EINVAL;
			goto err_destroy_chain;
		}

		snprintf(name, sizeof(name), "__chain%llu", ++chain_id);
		chain->name = kstrdup(name, GFP_KERNEL_ACCOUNT);
	}

	if (!chain->name) {
		err = -ENOMEM;
		goto err_destroy_chain;
	}

	if (nla[NFTA_CHAIN_USERDATA]) {
		chain->udata = nla_memdup(nla[NFTA_CHAIN_USERDATA], GFP_KERNEL_ACCOUNT);
		if (chain->udata == NULL) {
			err = -ENOMEM;
			goto err_destroy_chain;
		}
		chain->udlen = nla_len(nla[NFTA_CHAIN_USERDATA]);
	}

	/* empty rule blob, shared by both generations */
	blob = nf_tables_chain_alloc_rules(chain, 0);
	if (!blob) {
		err = -ENOMEM;
		goto err_destroy_chain;
	}

	RCU_INIT_POINTER(chain->blob_gen_0, blob);
	RCU_INIT_POINTER(chain->blob_gen_1, blob);

	if (!nft_use_inc(&table->use)) {
		err = -EMFILE;
		goto err_destroy_chain;
	}

	trans = nft_trans_chain_add(ctx, NFT_MSG_NEWCHAIN);
	if (IS_ERR(trans)) {
		err = PTR_ERR(trans);
		goto err_trans;
	}

	nft_trans_chain_policy(trans) = NFT_CHAIN_POLICY_UNSET;
	if (nft_is_base_chain(chain))
		nft_trans_chain_policy(trans) = policy;

	err = nft_chain_add(table, chain);
	if (err < 0)
		goto err_chain_add;

	/* This must be LAST to ensure no packets are walking over this chain. */
	err = nf_tables_register_hook(net, table, chain);
	if (err < 0)
		goto err_register_hook;

	return 0;

err_register_hook:
	nft_chain_del(chain);
	/* nft_chain_add() published the chain on table->chains with
	 * list_add_tail_rcu(), and nf_tables_dump_chains() walks that list
	 * under rcu_read_lock() only.  Wait for a grace period so no reader
	 * still holds a pointer to the chain when it is freed below.
	 */
	synchronize_rcu();
err_chain_add:
	nft_trans_destroy(trans);
err_trans:
	nft_use_dec_restore(&table->use);
err_destroy_chain:
	nf_tables_chain_destroy(chain);

	return err;
}
2816
/*
 * Update an existing chain (ctx->chain) and queue the change as an
 * NFT_MSG_NEWCHAIN transaction flagged as an update.
 *
 * Handles, as far as the attributes are present: additional netdev hooks
 * (NFTA_CHAIN_HOOK), a new name (NFTA_CHAIN_HANDLE together with
 * NFTA_CHAIN_NAME), new counters (NFTA_CHAIN_COUNTERS) and a new policy
 * (NFTA_CHAIN_POLICY).  @flags must equal the chain's current flags.
 * @attr is the attribute reported through extack on hook-related errors.
 *
 * Returns 0 or a negative errno.
 */
static int nf_tables_updchain(struct nft_ctx *ctx, u8 genmask, u8 policy,
			      u32 flags, const struct nlattr *attr,
			      struct netlink_ext_ack *extack)
{
	const struct nlattr * const *nla = ctx->nla;
	struct nft_base_chain *basechain = NULL;
	struct nft_table *table = ctx->table;
	struct nft_chain *chain = ctx->chain;
	struct nft_chain_hook hook = {};
	struct nft_stats __percpu *stats = NULL;
	struct nftables_pernet *nft_net;
	struct nft_hook *h, *next;
	struct nf_hook_ops *ops;
	struct nft_trans *trans;
	bool unregister = false;
	int err;

	/* chain flags cannot be changed by an update */
	if (chain->flags ^ flags)
		return -EOPNOTSUPP;

	INIT_LIST_HEAD(&hook.list);

	if (nla[NFTA_CHAIN_HOOK]) {
		if (!nft_is_base_chain(chain)) {
			NL_SET_BAD_ATTR(extack, attr);
			return -EEXIST;
		}

		basechain = nft_base_chain(chain);
		err = nft_chain_parse_hook(ctx->net, basechain, nla, &hook,
					   ctx->family, flags, extack);
		if (err < 0)
			return err;

		/* the chain type cannot be changed */
		if (basechain->type != hook.type) {
			nft_chain_release_hook(&hook);
			NL_SET_BAD_ATTR(extack, attr);
			return -EEXIST;
		}

		if (nft_base_chain_netdev(ctx->family, basechain->ops.hooknum)) {
			list_for_each_entry_safe(h, next, &hook.list, list) {
				/* new device ops inherit the chain's hook settings */
				list_for_each_entry(ops, &h->ops_list, list) {
					ops->pf		= basechain->ops.pf;
					ops->hooknum	= basechain->ops.hooknum;
					ops->priority	= basechain->ops.priority;
					ops->priv	= basechain->ops.priv;
					ops->hook	= basechain->ops.hook;
				}

				/* already attached to this chain: drop the duplicate */
				if (nft_hook_list_find(&basechain->hook_list, h)) {
					list_del(&h->list);
					nft_netdev_hook_free(h);
					continue;
				}

				/* reject a hook that a pending chain update on
				 * this table already carries
				 */
				nft_net = nft_pernet(ctx->net);
				list_for_each_entry(trans, &nft_net->commit_list, list) {
					if (trans->msg_type != NFT_MSG_NEWCHAIN ||
					    trans->table != ctx->table ||
					    !nft_trans_chain_update(trans))
						continue;

					if (nft_hook_list_find(&nft_trans_chain_hooks(trans), h)) {
						nft_chain_release_hook(&hook);
						return -EEXIST;
					}
				}
			}
		} else {
			/* non-netdev hooks: number and priority must be unchanged */
			ops = &basechain->ops;
			if (ops->hooknum != hook.num ||
			    ops->priority != hook.priority) {
				nft_chain_release_hook(&hook);
				NL_SET_BAD_ATTR(extack, attr);
				return -EEXIST;
			}
		}
	}

	/* handle + name given: the new name must not already be taken */
	if (nla[NFTA_CHAIN_HANDLE] &&
	    nla[NFTA_CHAIN_NAME]) {
		struct nft_chain *chain2;

		chain2 = nft_chain_lookup(ctx->net, table,
					  nla[NFTA_CHAIN_NAME], genmask);
		if (!IS_ERR(chain2)) {
			NL_SET_BAD_ATTR(extack, nla[NFTA_CHAIN_NAME]);
			err = -EEXIST;
			goto err_hooks;
		}
	}

	/* no new hooks while __NFT_TABLE_F_UPDATE is set on the table */
	if (table->flags & __NFT_TABLE_F_UPDATE &&
	    !list_empty(&hook.list)) {
		NL_SET_BAD_ATTR(extack, attr);
		err = -EOPNOTSUPP;
		goto err_hooks;
	}

	/* register the new netdev hooks right away unless the table is
	 * dormant; `unregister` makes the error path undo this
	 */
	if (!(table->flags & NFT_TABLE_F_DORMANT) &&
	    nft_is_base_chain(chain) &&
	    !list_empty(&hook.list)) {
		basechain = nft_base_chain(chain);
		ops = &basechain->ops;

		if (nft_base_chain_netdev(table->family, basechain->ops.hooknum)) {
			err = nft_netdev_register_hooks(ctx->net, &hook.list);
			if (err < 0)
				goto err_hooks;

			unregister = true;
		}
	}

	if (nla[NFTA_CHAIN_COUNTERS]) {
		if (!nft_is_base_chain(chain)) {
			err = -EOPNOTSUPP;
			goto err_hooks;
		}

		stats = nft_stats_alloc(nla[NFTA_CHAIN_COUNTERS]);
		if (IS_ERR_PCPU(stats)) {
			err = PTR_ERR_PCPU(stats);
			goto err_hooks;
		}
	}

	err = -ENOMEM;
	trans = nft_trans_alloc_chain(ctx, NFT_MSG_NEWCHAIN);
	if (trans == NULL)
		goto err_trans;

	nft_trans_chain_stats(trans) = stats;
	nft_trans_chain_update(trans) = true;

	if (nla[NFTA_CHAIN_POLICY])
		nft_trans_chain_policy(trans) = policy;
	else
		nft_trans_chain_policy(trans) = -1;

	if (nla[NFTA_CHAIN_HANDLE] &&
	    nla[NFTA_CHAIN_NAME]) {
		struct nftables_pernet *nft_net = nft_pernet(ctx->net);
		struct nft_trans *tmp;
		char *name;

		err = -ENOMEM;
		name = nla_strdup(nla[NFTA_CHAIN_NAME], GFP_KERNEL_ACCOUNT);
		if (!name)
			goto err_trans;

		/* the same new name must not be claimed by another pending
		 * chain update on this table
		 */
		err = -EEXIST;
		list_for_each_entry(tmp, &nft_net->commit_list, list) {
			if (tmp->msg_type == NFT_MSG_NEWCHAIN &&
			    tmp->table == table &&
			    nft_trans_chain_update(tmp) &&
			    nft_trans_chain_name(tmp) &&
			    strcmp(name, nft_trans_chain_name(tmp)) == 0) {
				NL_SET_BAD_ATTR(extack, nla[NFTA_CHAIN_NAME]);
				kfree(name);
				goto err_trans;
			}
		}

		nft_trans_chain_name(trans) = name;
	}

	/* the transaction takes over the new hooks */
	nft_trans_basechain(trans) = basechain;
	INIT_LIST_HEAD(&nft_trans_chain_hooks(trans));
	list_splice(&hook.list, &nft_trans_chain_hooks(trans));
	/* drop the module reference taken by nft_chain_parse_hook() */
	if (nla[NFTA_CHAIN_HOOK])
		module_put(hook.type->owner);

	nft_trans_commit_list_add_tail(ctx->net, trans);

	return 0;

err_trans:
	/* trans may be NULL here (allocation failure); kfree() accepts that */
	free_percpu(stats);
	kfree(trans);
err_hooks:
	if (nla[NFTA_CHAIN_HOOK]) {
		list_for_each_entry_safe(h, next, &hook.list, list) {
			if (unregister) {
				list_for_each_entry(ops, &h->ops_list, list)
					nf_unregister_net_hook(ctx->net, ops);
			}
			list_del(&h->list);
			nft_netdev_hook_free_rcu(h);
		}
		module_put(hook.type->owner);
	}

	return err;
}
3013
/*
 * Look up a chain created earlier in the pending commit list by the
 * transaction-local id carried in @nla.
 *
 * Only NFT_MSG_NEWCHAIN transactions whose chain belongs to @table and is
 * active in @genmask are considered.  Returns the chain or
 * ERR_PTR(-ENOENT).
 */
static struct nft_chain *nft_chain_lookup_byid(const struct net *net,
					       const struct nft_table *table,
					       const struct nlattr *nla, u8 genmask)
{
	struct nftables_pernet *nft_net = nft_pernet(net);
	u32 id = ntohl(nla_get_be32(nla));
	struct nft_trans *trans;

	list_for_each_entry(trans, &nft_net->commit_list, list) {
		struct nft_chain *candidate;

		if (trans->msg_type != NFT_MSG_NEWCHAIN)
			continue;

		candidate = nft_trans_chain(trans);
		if (candidate->table != table)
			continue;
		if (id != nft_trans_chain_id(trans))
			continue;
		if (nft_active_genmask(candidate, genmask))
			return candidate;
	}

	return ERR_PTR(-ENOENT);
}
3031
/*
 * NFT_MSG_NEWCHAIN handler: create a chain or update an existing one.
 *
 * The target chain is identified by NFTA_CHAIN_HANDLE (must exist) or by
 * NFTA_CHAIN_NAME (may not exist yet); a request carrying neither is only
 * accepted when NFTA_CHAIN_ID is present.  Policy and flags are validated,
 * then the request is dispatched to nf_tables_updchain() when the chain
 * exists and to nf_tables_addchain() otherwise.
 *
 * Must be called with the commit mutex held.  Returns 0 or a negative errno.
 */
static int nf_tables_newchain(struct sk_buff *skb, const struct nfnl_info *info,
			      const struct nlattr * const nla[])
{
	struct nftables_pernet *nft_net = nft_pernet(info->net);
	struct netlink_ext_ack *extack = info->extack;
	u8 genmask = nft_genmask_next(info->net);
	u8 family = info->nfmsg->nfgen_family;
	struct nft_chain *chain = NULL;
	struct net *net = info->net;
	const struct nlattr *attr;
	struct nft_table *table;
	u8 policy = NF_ACCEPT;
	struct nft_ctx ctx;
	u64 handle = 0;
	u32 flags = 0;

	lockdep_assert_held(&nft_net->commit_mutex);

	table = nft_table_lookup(net, nla[NFTA_CHAIN_TABLE], family, genmask,
				 NETLINK_CB(skb).portid);
	if (IS_ERR(table)) {
		NL_SET_BAD_ATTR(extack, nla[NFTA_CHAIN_TABLE]);
		return PTR_ERR(table);
	}

	chain = NULL;
	/* attribute reported through extack; switched to the handle below
	 * when the chain is looked up by handle
	 */
	attr = nla[NFTA_CHAIN_NAME];

	if (nla[NFTA_CHAIN_HANDLE]) {
		handle = be64_to_cpu(nla_get_be64(nla[NFTA_CHAIN_HANDLE]));
		chain = nft_chain_lookup_byhandle(table, handle, genmask);
		if (IS_ERR(chain)) {
			NL_SET_BAD_ATTR(extack, nla[NFTA_CHAIN_HANDLE]);
			return PTR_ERR(chain);
		}
		attr = nla[NFTA_CHAIN_HANDLE];
	} else if (nla[NFTA_CHAIN_NAME]) {
		chain = nft_chain_lookup(net, table, attr, genmask);
		if (IS_ERR(chain)) {
			/* -ENOENT just means the chain has to be created */
			if (PTR_ERR(chain) != -ENOENT) {
				NL_SET_BAD_ATTR(extack, attr);
				return PTR_ERR(chain);
			}
			chain = NULL;
		}
	} else if (!nla[NFTA_CHAIN_ID]) {
		return -EINVAL;
	}

	if (nla[NFTA_CHAIN_POLICY]) {
		/* a policy is only accepted for base chains: an existing
		 * chain must be one, a new chain must come with a hook
		 */
		if (chain != NULL &&
		    !nft_is_base_chain(chain)) {
			NL_SET_BAD_ATTR(extack, nla[NFTA_CHAIN_POLICY]);
			return -EOPNOTSUPP;
		}

		if (chain == NULL &&
		    nla[NFTA_CHAIN_HOOK] == NULL) {
			NL_SET_BAD_ATTR(extack, nla[NFTA_CHAIN_POLICY]);
			return -EOPNOTSUPP;
		}

		policy = ntohl(nla_get_be32(nla[NFTA_CHAIN_POLICY]));
		switch (policy) {
		case NF_DROP:
		case NF_ACCEPT:
			break;
		default:
			return -EINVAL;
		}
	}

	/* flags default to those of the existing chain, if any */
	if (nla[NFTA_CHAIN_FLAGS])
		flags = ntohl(nla_get_be32(nla[NFTA_CHAIN_FLAGS]));
	else if (chain)
		flags = chain->flags;

	if (flags & ~NFT_CHAIN_FLAGS)
		return -EOPNOTSUPP;

	nft_ctx_init(&ctx, net, skb, info->nlh, family, table, chain, nla);

	if (chain != NULL) {
		/* binding chains cannot be updated */
		if (chain->flags & NFT_CHAIN_BINDING)
			return -EINVAL;

		if (info->nlh->nlmsg_flags & NLM_F_EXCL) {
			NL_SET_BAD_ATTR(extack, attr);
			return -EEXIST;
		}
		if (info->nlh->nlmsg_flags & NLM_F_REPLACE)
			return -EOPNOTSUPP;

		/* carry over NFT_CHAIN_BASE so the flags comparison in
		 * nf_tables_updchain() does not trip on it
		 */
		flags |= chain->flags & NFT_CHAIN_BASE;
		return nf_tables_updchain(&ctx, genmask, policy, flags, attr,
					  extack);
	}

	return nf_tables_addchain(&ctx, family, policy, flags, extack);
}
3132
nft_delchain_hook(struct nft_ctx * ctx,struct nft_base_chain * basechain,struct netlink_ext_ack * extack)3133 static int nft_delchain_hook(struct nft_ctx *ctx,
3134 struct nft_base_chain *basechain,
3135 struct netlink_ext_ack *extack)
3136 {
3137 const struct nft_chain *chain = &basechain->chain;
3138 const struct nlattr * const *nla = ctx->nla;
3139 struct nft_chain_hook chain_hook = {};
3140 struct nft_hook *this, *hook;
3141 LIST_HEAD(chain_del_list);
3142 struct nft_trans *trans;
3143 int err;
3144
3145 if (ctx->table->flags & __NFT_TABLE_F_UPDATE)
3146 return -EOPNOTSUPP;
3147
3148 err = nft_chain_parse_hook(ctx->net, basechain, nla, &chain_hook,
3149 ctx->family, chain->flags, extack);
3150 if (err < 0)
3151 return err;
3152
3153 list_for_each_entry(this, &chain_hook.list, list) {
3154 hook = nft_hook_list_find(&basechain->hook_list, this);
3155 if (!hook) {
3156 err = -ENOENT;
3157 goto err_chain_del_hook;
3158 }
3159 list_move(&hook->list, &chain_del_list);
3160 }
3161
3162 trans = nft_trans_alloc_chain(ctx, NFT_MSG_DELCHAIN);
3163 if (!trans) {
3164 err = -ENOMEM;
3165 goto err_chain_del_hook;
3166 }
3167
3168 nft_trans_basechain(trans) = basechain;
3169 nft_trans_chain_update(trans) = true;
3170 INIT_LIST_HEAD(&nft_trans_chain_hooks(trans));
3171 list_splice(&chain_del_list, &nft_trans_chain_hooks(trans));
3172 nft_chain_release_hook(&chain_hook);
3173
3174 nft_trans_commit_list_add_tail(ctx->net, trans);
3175
3176 return 0;
3177
3178 err_chain_del_hook:
3179 list_splice(&chain_del_list, &basechain->hook_list);
3180 nft_chain_release_hook(&chain_hook);
3181
3182 return err;
3183 }
3184
nf_tables_delchain(struct sk_buff * skb,const struct nfnl_info * info,const struct nlattr * const nla[])3185 static int nf_tables_delchain(struct sk_buff *skb, const struct nfnl_info *info,
3186 const struct nlattr * const nla[])
3187 {
3188 struct netlink_ext_ack *extack = info->extack;
3189 u8 genmask = nft_genmask_next(info->net);
3190 u8 family = info->nfmsg->nfgen_family;
3191 struct net *net = info->net;
3192 const struct nlattr *attr;
3193 struct nft_table *table;
3194 struct nft_chain *chain;
3195 struct nft_rule *rule;
3196 struct nft_ctx ctx;
3197 u64 handle;
3198 u32 use;
3199 int err;
3200
3201 table = nft_table_lookup(net, nla[NFTA_CHAIN_TABLE], family, genmask,
3202 NETLINK_CB(skb).portid);
3203 if (IS_ERR(table)) {
3204 NL_SET_BAD_ATTR(extack, nla[NFTA_CHAIN_TABLE]);
3205 return PTR_ERR(table);
3206 }
3207
3208 if (nla[NFTA_CHAIN_HANDLE]) {
3209 attr = nla[NFTA_CHAIN_HANDLE];
3210 handle = be64_to_cpu(nla_get_be64(attr));
3211 chain = nft_chain_lookup_byhandle(table, handle, genmask);
3212 } else {
3213 attr = nla[NFTA_CHAIN_NAME];
3214 chain = nft_chain_lookup(net, table, attr, genmask);
3215 }
3216 if (IS_ERR(chain)) {
3217 if (PTR_ERR(chain) == -ENOENT &&
3218 NFNL_MSG_TYPE(info->nlh->nlmsg_type) == NFT_MSG_DESTROYCHAIN)
3219 return 0;
3220
3221 NL_SET_BAD_ATTR(extack, attr);
3222 return PTR_ERR(chain);
3223 }
3224
3225 if (nft_chain_binding(chain))
3226 return -EOPNOTSUPP;
3227
3228 nft_ctx_init(&ctx, net, skb, info->nlh, family, table, chain, nla);
3229
3230 if (nla[NFTA_CHAIN_HOOK]) {
3231 if (NFNL_MSG_TYPE(info->nlh->nlmsg_type) == NFT_MSG_DESTROYCHAIN ||
3232 chain->flags & NFT_CHAIN_HW_OFFLOAD)
3233 return -EOPNOTSUPP;
3234
3235 if (nft_is_base_chain(chain)) {
3236 struct nft_base_chain *basechain = nft_base_chain(chain);
3237
3238 if (nft_base_chain_netdev(table->family, basechain->ops.hooknum))
3239 return nft_delchain_hook(&ctx, basechain, extack);
3240 }
3241 }
3242
3243 if (info->nlh->nlmsg_flags & NLM_F_NONREC &&
3244 chain->use > 0)
3245 return -EBUSY;
3246
3247 use = chain->use;
3248 list_for_each_entry(rule, &chain->rules, list) {
3249 if (!nft_is_active_next(net, rule))
3250 continue;
3251 use--;
3252
3253 err = nft_delrule(&ctx, rule);
3254 if (err < 0)
3255 return err;
3256 }
3257
3258 /* There are rules and elements that are still holding references to us,
3259 * we cannot do a recursive removal in this case.
3260 */
3261 if (use > 0) {
3262 NL_SET_BAD_ATTR(extack, attr);
3263 return -EBUSY;
3264 }
3265
3266 return nft_delchain(&ctx);
3267 }
3268
3269 /*
3270 * Expressions
3271 */
3272
3273 /**
3274 * nft_register_expr - register nf_tables expr type
3275 * @type: expr type
3276 *
3277 * Registers the expr type for use with nf_tables. Returns zero on
3278 * success or a negative errno code otherwise.
3279 */
nft_register_expr(struct nft_expr_type * type)3280 int nft_register_expr(struct nft_expr_type *type)
3281 {
3282 if (WARN_ON_ONCE(type->maxattr > NFT_EXPR_MAXATTR))
3283 return -ENOMEM;
3284
3285 nfnl_lock(NFNL_SUBSYS_NFTABLES);
3286 if (type->family == NFPROTO_UNSPEC)
3287 list_add_tail_rcu(&type->list, &nf_tables_expressions);
3288 else
3289 list_add_rcu(&type->list, &nf_tables_expressions);
3290 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
3291 return 0;
3292 }
3293 EXPORT_SYMBOL_GPL(nft_register_expr);
3294
/**
 *	nft_unregister_expr - unregister nf_tables expr type
 *	@type: expr type
 *
 *	Removes the expr type from the list of expression types known to
 *	nf_tables.
 */
void nft_unregister_expr(struct nft_expr_type *type)
{
	/* Unlink under the nftables nfnetlink subsystem lock. */
	nfnl_lock(NFNL_SUBSYS_NFTABLES);
	list_del_rcu(&type->list);
	nfnl_unlock(NFNL_SUBSYS_NFTABLES);
}
EXPORT_SYMBOL_GPL(nft_unregister_expr);
3308
/*
 * Find the registered expression type whose name matches @nla.
 *
 * A type registered for exactly @family is preferred; a type with family 0
 * is only taken while no other candidate has been found yet. The whole list
 * is walked, so the last family-specific match wins. Returns NULL when no
 * type matches. Walks the list with list_for_each_entry_rcu().
 */
static const struct nft_expr_type *__nft_expr_type_get(u8 family,
						       struct nlattr *nla)
{
	const struct nft_expr_type *cur, *best = NULL;

	list_for_each_entry_rcu(cur, &nf_tables_expressions, list) {
		if (nla_strcmp(nla, cur->name))
			continue;

		if ((!cur->family && !best) || cur->family == family)
			best = cur;
	}

	return best;
}
3324
#ifdef CONFIG_MODULES
/*
 * Ask for the family-specific module "nft-expr-<family>-<name>" to be
 * loaded. Only -EAGAIN from nft_request_module() is propagated; every other
 * outcome is reported as 0.
 */
static int nft_expr_type_request_module(struct net *net, u8 family,
					struct nlattr *nla)
{
	int rc;

	rc = nft_request_module(net, "nft-expr-%u-%.*s", family,
				nla_len(nla), (char *)nla_data(nla));

	return rc == -EAGAIN ? -EAGAIN : 0;
}
#endif
3336
/*
 * Look up an expression type by name and take a reference on its module.
 *
 * Returns the type on success. Otherwise returns ERR_PTR(-EINVAL) if @nla
 * is NULL, ERR_PTR(-EAGAIN) if a module request reported -EAGAIN, or
 * ERR_PTR(-ENOENT). Module loading is only attempted when no type was found
 * at all, not when the type exists but its module reference could not be
 * taken.
 */
static const struct nft_expr_type *nft_expr_type_get(struct net *net,
						     u8 family,
						     struct nlattr *nla)
{
	const struct nft_expr_type *type;
	bool pinned;

	if (!nla)
		return ERR_PTR(-EINVAL);

	rcu_read_lock();
	type = __nft_expr_type_get(family, nla);
	pinned = type && try_module_get(type->owner);
	rcu_read_unlock();

	if (pinned)
		return type;

	lockdep_nfnl_nft_mutex_not_held();
#ifdef CONFIG_MODULES
	if (!type) {
		/* Family-specific module first, then the generic one. */
		if (nft_expr_type_request_module(net, family, nla) == -EAGAIN)
			return ERR_PTR(-EAGAIN);

		if (nft_request_module(net, "nft-expr-%.*s",
				       nla_len(nla),
				       (char *)nla_data(nla)) == -EAGAIN)
			return ERR_PTR(-EAGAIN);
	}
#endif
	return ERR_PTR(-ENOENT);
}
3368
/*
 * Netlink policy for a single expression container: a name string limited
 * to NFT_MODULE_AUTOLOAD_LIMIT bytes and a nested attribute holding the
 * expression-specific data.
 */
static const struct nla_policy nft_expr_policy[NFTA_EXPR_MAX + 1] = {
	[NFTA_EXPR_NAME]	= { .type = NLA_STRING,
				    .len = NFT_MODULE_AUTOLOAD_LIMIT },
	[NFTA_EXPR_DATA]	= { .type = NLA_NESTED },
};
3374
/*
 * Emit the netlink description of one expression into @skb.
 *
 * Writes NFTA_EXPR_NAME and, if the expression provides a ->dump callback,
 * a nested NFTA_EXPR_DATA attribute filled by that callback (@reset is
 * passed through to it). Returns skb->len on success, -1 if the name or the
 * nest could not be added or the callback failed.
 */
static int nf_tables_fill_expr_info(struct sk_buff *skb,
				    const struct nft_expr *expr, bool reset)
{
	if (nla_put_string(skb, NFTA_EXPR_NAME, expr->ops->type->name))
		goto nla_put_failure;

	if (expr->ops->dump) {
		struct nlattr *data = nla_nest_start_noflag(skb,
							    NFTA_EXPR_DATA);
		if (data == NULL)
			goto nla_put_failure;
		if (expr->ops->dump(skb, expr, reset) < 0)
			goto nla_put_failure;
		nla_nest_end(skb, data);
	}

	return skb->len;

nla_put_failure:
	return -1;
}
3396
/*
 * Dump @expr into @skb wrapped in a nested attribute of type @attr.
 *
 * Returns 0 on success, -1 if the nest cannot be opened or the expression
 * cannot be serialized. @reset is forwarded to nf_tables_fill_expr_info().
 */
int nft_expr_dump(struct sk_buff *skb, unsigned int attr,
		  const struct nft_expr *expr, bool reset)
{
	struct nlattr *wrapper = nla_nest_start_noflag(skb, attr);

	if (!wrapper)
		return -1;

	if (nf_tables_fill_expr_info(skb, expr, reset) < 0)
		return -1;

	nla_nest_end(skb, wrapper);

	return 0;
}
3413
/* Result of parsing one expression from netlink. */
struct nft_expr_info {
	/* operations chosen for the expression */
	const struct nft_expr_ops	*ops;
	/* netlink attribute the expression was parsed from */
	const struct nlattr		*attr;
	/* parsed expression-specific attributes */
	struct nlattr			*tb[NFT_EXPR_MAXATTR + 1];
};
3419
nf_tables_expr_parse(const struct nft_ctx * ctx,const struct nlattr * nla,struct nft_expr_info * info)3420 static int nf_tables_expr_parse(const struct nft_ctx *ctx,
3421 const struct nlattr *nla,
3422 struct nft_expr_info *info)
3423 {
3424 const struct nft_expr_type *type;
3425 const struct nft_expr_ops *ops;
3426 struct nlattr *tb[NFTA_EXPR_MAX + 1];
3427 int err;
3428
3429 err = nla_parse_nested_deprecated(tb, NFTA_EXPR_MAX, nla,
3430 nft_expr_policy, NULL);
3431 if (err < 0)
3432 return err;
3433
3434 type = nft_expr_type_get(ctx->net, ctx->family, tb[NFTA_EXPR_NAME]);
3435 if (IS_ERR(type))
3436 return PTR_ERR(type);
3437
3438 if (tb[NFTA_EXPR_DATA]) {
3439 err = nla_parse_nested_deprecated(info->tb, type->maxattr,
3440 tb[NFTA_EXPR_DATA],
3441 type->policy, NULL);
3442 if (err < 0)
3443 goto err1;
3444 } else
3445 memset(info->tb, 0, sizeof(info->tb[0]) * (type->maxattr + 1));
3446
3447 if (type->select_ops != NULL) {
3448 ops = type->select_ops(ctx,
3449 (const struct nlattr * const *)info->tb);
3450 if (IS_ERR(ops)) {
3451 err = PTR_ERR(ops);
3452 #ifdef CONFIG_MODULES
3453 if (err == -EAGAIN)
3454 if (nft_expr_type_request_module(ctx->net,
3455 ctx->family,
3456 tb[NFTA_EXPR_NAME]) != -EAGAIN)
3457 err = -ENOENT;
3458 #endif
3459 goto err1;
3460 }
3461 } else
3462 ops = type->ops;
3463
3464 info->attr = nla;
3465 info->ops = ops;
3466
3467 return 0;
3468
3469 err1:
3470 module_put(type->owner);
3471 return err;
3472 }
3473
nft_expr_inner_parse(const struct nft_ctx * ctx,const struct nlattr * nla,struct nft_expr_info * info)3474 int nft_expr_inner_parse(const struct nft_ctx *ctx, const struct nlattr *nla,
3475 struct nft_expr_info *info)
3476 {
3477 struct nlattr *tb[NFTA_EXPR_MAX + 1];
3478 const struct nft_expr_type *type;
3479 int err;
3480
3481 err = nla_parse_nested_deprecated(tb, NFTA_EXPR_MAX, nla,
3482 nft_expr_policy, NULL);
3483 if (err < 0)
3484 return err;
3485
3486 if (!tb[NFTA_EXPR_DATA] || !tb[NFTA_EXPR_NAME])
3487 return -EINVAL;
3488
3489 rcu_read_lock();
3490
3491 type = __nft_expr_type_get(ctx->family, tb[NFTA_EXPR_NAME]);
3492 if (!type) {
3493 err = -ENOENT;
3494 goto out_unlock;
3495 }
3496
3497 if (!type->inner_ops) {
3498 err = -EOPNOTSUPP;
3499 goto out_unlock;
3500 }
3501
3502 err = nla_parse_nested_deprecated(info->tb, type->maxattr,
3503 tb[NFTA_EXPR_DATA],
3504 type->policy, NULL);
3505 if (err < 0)
3506 goto out_unlock;
3507
3508 info->attr = nla;
3509 info->ops = type->inner_ops;
3510
3511 /* No module reference will be taken on type->owner.
3512 * Presence of type->inner_ops implies that the expression
3513 * is builtin, so it cannot go away.
3514 */
3515 rcu_read_unlock();
3516 return 0;
3517
3518 out_unlock:
3519 rcu_read_unlock();
3520 return err;
3521 }
3522
nf_tables_newexpr(const struct nft_ctx * ctx,const struct nft_expr_info * expr_info,struct nft_expr * expr)3523 static int nf_tables_newexpr(const struct nft_ctx *ctx,
3524 const struct nft_expr_info *expr_info,
3525 struct nft_expr *expr)
3526 {
3527 const struct nft_expr_ops *ops = expr_info->ops;
3528 int err;
3529
3530 expr->ops = ops;
3531 if (ops->init) {
3532 err = ops->init(ctx, expr, (const struct nlattr **)expr_info->tb);
3533 if (err < 0)
3534 goto err1;
3535 }
3536
3537 return 0;
3538 err1:
3539 expr->ops = NULL;
3540 return err;
3541 }
3542
nf_tables_expr_destroy(const struct nft_ctx * ctx,struct nft_expr * expr)3543 static void nf_tables_expr_destroy(const struct nft_ctx *ctx,
3544 struct nft_expr *expr)
3545 {
3546 const struct nft_expr_type *type = expr->ops->type;
3547
3548 if (expr->ops->destroy)
3549 expr->ops->destroy(ctx, expr);
3550 module_put(type->owner);
3551 }
3552
nft_expr_init(const struct nft_ctx * ctx,const struct nlattr * nla)3553 static struct nft_expr *nft_expr_init(const struct nft_ctx *ctx,
3554 const struct nlattr *nla)
3555 {
3556 struct nft_expr_info expr_info;
3557 struct nft_expr *expr;
3558 struct module *owner;
3559 int err;
3560
3561 err = nf_tables_expr_parse(ctx, nla, &expr_info);
3562 if (err < 0)
3563 goto err_expr_parse;
3564
3565 err = -EOPNOTSUPP;
3566 if (!(expr_info.ops->type->flags & NFT_EXPR_STATEFUL))
3567 goto err_expr_stateful;
3568
3569 err = -ENOMEM;
3570 expr = kzalloc(expr_info.ops->size, GFP_KERNEL_ACCOUNT);
3571 if (expr == NULL)
3572 goto err_expr_stateful;
3573
3574 err = nf_tables_newexpr(ctx, &expr_info, expr);
3575 if (err < 0)
3576 goto err_expr_new;
3577
3578 return expr;
3579 err_expr_new:
3580 kfree(expr);
3581 err_expr_stateful:
3582 owner = expr_info.ops->type->owner;
3583 if (expr_info.ops->type->release_ops)
3584 expr_info.ops->type->release_ops(expr_info.ops);
3585
3586 module_put(owner);
3587 err_expr_parse:
3588 return ERR_PTR(err);
3589 }
3590
/*
 * Clone expression @src into the caller-provided @dst.
 *
 * Requires the source ops to implement ->clone; otherwise warns once and
 * returns -EINVAL. dst->ops is set before the callback runs and is left set
 * if the callback fails. On success an extra module reference is taken on
 * the expression type's owner and 0 is returned.
 */
int nft_expr_clone(struct nft_expr *dst, struct nft_expr *src, gfp_t gfp)
{
	int err;

	if (WARN_ON_ONCE(!src->ops->clone))
		return -EINVAL;

	dst->ops = src->ops;
	err = src->ops->clone(dst, src, gfp);
	if (err < 0)
		return err;

	/* The clone keeps the type's module pinned on its own. */
	__module_get(src->ops->type->owner);

	return 0;
}
3607
/*
 * Tear down an expression via nf_tables_expr_destroy() and free its memory
 * with kfree().
 */
void nft_expr_destroy(const struct nft_ctx *ctx, struct nft_expr *expr)
{
	nf_tables_expr_destroy(ctx, expr);
	kfree(expr);
}
3613
3614 /*
3615 * Rules
3616 */
3617
/*
 * Find the rule with the given handle in @chain.
 *
 * Returns the rule or ERR_PTR(-ENOENT). The list is walked with
 * list_for_each_entry_rcu(), with holding the commit lock as the alternative
 * lockdep condition.
 */
static struct nft_rule *__nft_rule_lookup(const struct net *net,
					  const struct nft_chain *chain,
					  u64 handle)
{
	struct nft_rule *cur;

	// FIXME: linear scan over every rule of the chain
	list_for_each_entry_rcu(cur, &chain->rules, list,
				lockdep_commit_lock_is_held(net)) {
		if (cur->handle != handle)
			continue;

		return cur;
	}

	return ERR_PTR(-ENOENT);
}
3633
nft_rule_lookup(const struct net * net,const struct nft_chain * chain,const struct nlattr * nla)3634 static struct nft_rule *nft_rule_lookup(const struct net *net,
3635 const struct nft_chain *chain,
3636 const struct nlattr *nla)
3637 {
3638 if (nla == NULL)
3639 return ERR_PTR(-EINVAL);
3640
3641 return __nft_rule_lookup(net, chain, be64_to_cpu(nla_get_be64(nla)));
3642 }
3643
/*
 * Netlink attribute policy for rule messages. Table and chain names are
 * strings bounded by their respective MAXNAMELEN - 1, user data is a binary
 * blob of at most NFT_USERDATA_MAXLEN bytes, and the expression list is a
 * nested array validated against nft_expr_policy.
 */
static const struct nla_policy nft_rule_policy[NFTA_RULE_MAX + 1] = {
	[NFTA_RULE_TABLE]	= { .type = NLA_STRING,
				    .len = NFT_TABLE_MAXNAMELEN - 1 },
	[NFTA_RULE_CHAIN]	= { .type = NLA_STRING,
				    .len = NFT_CHAIN_MAXNAMELEN - 1 },
	[NFTA_RULE_HANDLE]	= { .type = NLA_U64 },
	[NFTA_RULE_EXPRESSIONS]	= NLA_POLICY_NESTED_ARRAY(nft_expr_policy),
	[NFTA_RULE_COMPAT]	= { .type = NLA_NESTED },
	[NFTA_RULE_POSITION]	= { .type = NLA_U64 },
	[NFTA_RULE_USERDATA]	= { .type = NLA_BINARY,
				    .len = NFT_USERDATA_MAXLEN },
	[NFTA_RULE_ID]		= { .type = NLA_U32 },
	[NFTA_RULE_POSITION_ID]	= { .type = NLA_U32 },
	[NFTA_RULE_CHAIN_ID]	= { .type = NLA_U32 },
};
3659
/*
 * Build one rule message in @skb.
 *
 * Emits table name, chain name and rule handle, optionally
 * NFTA_RULE_POSITION (only when @handle is non-zero and @event is not
 * NFT_MSG_DELRULE), the nested list of expressions and, if present, the
 * rule's user data. For chains flagged NFT_CHAIN_HW_OFFLOAD,
 * nft_flow_rule_stats() is called before the expressions are dumped.
 *
 * Returns 0 on success; on failure the partial message is trimmed from
 * @skb and -1 is returned.
 */
static int nf_tables_fill_rule_info(struct sk_buff *skb, struct net *net,
				    u32 portid, u32 seq, int event,
				    u32 flags, int family,
				    const struct nft_table *table,
				    const struct nft_chain *chain,
				    const struct nft_rule *rule, u64 handle,
				    bool reset)
{
	u16 type = nfnl_msg_type(NFNL_SUBSYS_NFTABLES, event);
	const struct nft_expr *expr, *next;
	struct nlattr *exprs;
	struct nlmsghdr *nlh;

	nlh = nfnl_msg_put(skb, portid, seq, type, flags, family, NFNETLINK_V0,
			   nft_base_seq(net));
	if (!nlh)
		goto nla_put_failure;

	if (nla_put_string(skb, NFTA_RULE_TABLE, table->name) ||
	    nla_put_string(skb, NFTA_RULE_CHAIN, chain->name) ||
	    nla_put_be64(skb, NFTA_RULE_HANDLE, cpu_to_be64(rule->handle),
			 NFTA_RULE_PAD))
		goto nla_put_failure;

	if (event != NFT_MSG_DELRULE && handle &&
	    nla_put_be64(skb, NFTA_RULE_POSITION, cpu_to_be64(handle),
			 NFTA_RULE_PAD))
		goto nla_put_failure;

	if (chain->flags & NFT_CHAIN_HW_OFFLOAD)
		nft_flow_rule_stats(chain, rule);

	exprs = nla_nest_start_noflag(skb, NFTA_RULE_EXPRESSIONS);
	if (!exprs)
		goto nla_put_failure;

	nft_rule_for_each_expr(expr, next, rule) {
		if (nft_expr_dump(skb, NFTA_LIST_ELEM, expr, reset) < 0)
			goto nla_put_failure;
	}
	nla_nest_end(skb, exprs);

	if (rule->udata) {
		struct nft_userdata *ud = nft_userdata(rule);

		/* The payload length written is the stored len plus one. */
		if (nla_put(skb, NFTA_RULE_USERDATA, ud->len + 1,
			    ud->data) < 0)
			goto nla_put_failure;
	}

	nlmsg_end(skb, nlh);
	return 0;

nla_put_failure:
	nlmsg_trim(skb, nlh);
	return -1;
}
3718
nf_tables_rule_notify(const struct nft_ctx * ctx,const struct nft_rule * rule,int event)3719 static void nf_tables_rule_notify(const struct nft_ctx *ctx,
3720 const struct nft_rule *rule, int event)
3721 {
3722 struct nftables_pernet *nft_net = nft_pernet(ctx->net);
3723 const struct nft_rule *prule;
3724 struct sk_buff *skb;
3725 u64 handle = 0;
3726 u16 flags = 0;
3727 int err;
3728
3729 if (!ctx->report &&
3730 !nfnetlink_has_listeners(ctx->net, NFNLGRP_NFTABLES))
3731 return;
3732
3733 skb = nlmsg_new(NLMSG_GOODSIZE, GFP_KERNEL);
3734 if (skb == NULL)
3735 goto err;
3736
3737 if (event == NFT_MSG_NEWRULE &&
3738 !list_is_first(&rule->list, &ctx->chain->rules) &&
3739 !list_is_last(&rule->list, &ctx->chain->rules)) {
3740 prule = list_prev_entry(rule, list);
3741 handle = prule->handle;
3742 }
3743 if (ctx->flags & (NLM_F_APPEND | NLM_F_REPLACE))
3744 flags |= NLM_F_APPEND;
3745 if (ctx->flags & (NLM_F_CREATE | NLM_F_EXCL))
3746 flags |= ctx->flags & (NLM_F_CREATE | NLM_F_EXCL);
3747
3748 err = nf_tables_fill_rule_info(skb, ctx->net, ctx->portid, ctx->seq,
3749 event, flags, ctx->family, ctx->table,
3750 ctx->chain, rule, handle, false);
3751 if (err < 0) {
3752 kfree_skb(skb);
3753 goto err;
3754 }
3755
3756 nft_notify_enqueue(skb, ctx->report, &nft_net->notify_list);
3757 return;
3758 err:
3759 nfnetlink_set_err(ctx->net, ctx->portid, NFNLGRP_NFTABLES, -ENOBUFS);
3760 }
3761
audit_log_rule_reset(const struct nft_table * table,unsigned int base_seq,unsigned int nentries)3762 static void audit_log_rule_reset(const struct nft_table *table,
3763 unsigned int base_seq,
3764 unsigned int nentries)
3765 {
3766 char *buf = kasprintf(GFP_ATOMIC, "%s:%u",
3767 table->name, base_seq);
3768
3769 audit_log_nfcfg(buf, table->family, nentries,
3770 AUDIT_NFT_OP_RULE_RESET, GFP_ATOMIC);
3771 kfree(buf);
3772 }
3773
/* Per-dump state for rule dumps, stored in netlink_callback->ctx. */
struct nft_rule_dump_ctx {
	/* entries with an index below this value are skipped */
	unsigned int s_idx;
	/* optional table name filter, duplicated from the request */
	char *table;
	/* optional chain name filter, duplicated from the request */
	char *chain;
	/* forwarded as the reset flag when rules are dumped */
	bool reset;
};
3780
__nf_tables_dump_rules(struct sk_buff * skb,unsigned int * idx,struct netlink_callback * cb,const struct nft_table * table,const struct nft_chain * chain)3781 static int __nf_tables_dump_rules(struct sk_buff *skb,
3782 unsigned int *idx,
3783 struct netlink_callback *cb,
3784 const struct nft_table *table,
3785 const struct nft_chain *chain)
3786 {
3787 struct nft_rule_dump_ctx *ctx = (void *)cb->ctx;
3788 struct net *net = sock_net(skb->sk);
3789 const struct nft_rule *rule, *prule;
3790 unsigned int entries = 0;
3791 int ret = 0;
3792 u64 handle;
3793
3794 prule = NULL;
3795 list_for_each_entry_rcu(rule, &chain->rules, list) {
3796 if (!nft_is_active(net, rule))
3797 goto cont_skip;
3798 if (*idx < ctx->s_idx)
3799 goto cont;
3800 if (prule)
3801 handle = prule->handle;
3802 else
3803 handle = 0;
3804
3805 if (nf_tables_fill_rule_info(skb, net, NETLINK_CB(cb->skb).portid,
3806 cb->nlh->nlmsg_seq,
3807 NFT_MSG_NEWRULE,
3808 NLM_F_MULTI | NLM_F_APPEND,
3809 table->family,
3810 table, chain, rule, handle, ctx->reset) < 0) {
3811 ret = 1;
3812 break;
3813 }
3814 entries++;
3815 nl_dump_check_consistent(cb, nlmsg_hdr(skb));
3816 cont:
3817 prule = rule;
3818 cont_skip:
3819 (*idx)++;
3820 }
3821
3822 if (ctx->reset && entries)
3823 audit_log_rule_reset(table, cb->seq, entries);
3824
3825 return ret;
3826 }
3827
/*
 * Netlink dump callback for rules.
 *
 * Walks all tables of the namespace under rcu_read_lock(), optionally
 * filtered by family and by the table/chain names stored in the dump
 * context. When both a table and a chain name are given, only the first
 * active chain with that name is dumped. The running index is saved in
 * ctx->s_idx before returning; the return value is always skb->len.
 */
static int nf_tables_dump_rules(struct sk_buff *skb,
				struct netlink_callback *cb)
{
	const struct nfgenmsg *nfmsg = nlmsg_data(cb->nlh);
	struct nft_rule_dump_ctx *ctx = (void *)cb->ctx;
	struct nft_table *table;
	const struct nft_chain *chain;
	unsigned int idx = 0;
	struct net *net = sock_net(skb->sk);
	int family = nfmsg->nfgen_family;
	struct nftables_pernet *nft_net;

	rcu_read_lock();
	nft_net = nft_pernet(net);
	/* Snapshot of the base sequence, used by the dump consistency check. */
	cb->seq = READ_ONCE(nft_net->base_seq);

	list_for_each_entry_rcu(table, &nft_net->tables, list) {
		if (family != NFPROTO_UNSPEC && family != table->family)
			continue;

		if (ctx->table && strcmp(ctx->table, table->name) != 0)
			continue;

		if (ctx->table && ctx->chain) {
			struct rhlist_head *list, *tmp;

			/* Single-chain dump: look the chain up by name. */
			list = rhltable_lookup(&table->chains_ht, ctx->chain,
					       nft_chain_ht_params);
			if (!list)
				goto done;

			rhl_for_each_entry_rcu(chain, tmp, list, rhlhead) {
				if (!nft_is_active(net, chain))
					continue;
				/* Return value is not checked here: the dump
				 * ends after this chain either way.
				 */
				__nf_tables_dump_rules(skb, &idx,
						       cb, table, chain);
				break;
			}
			goto done;
		}

		list_for_each_entry_rcu(chain, &table->chains, list) {
			/* Non-zero means a rule did not fit into skb. */
			if (__nf_tables_dump_rules(skb, &idx,
						   cb, table, chain))
				goto done;
		}

		/* A table filter matched; stop after that table. */
		if (ctx->table)
			break;
	}
done:
	rcu_read_unlock();

	/* Remember the index reached for the next invocation. */
	ctx->s_idx = idx;
	return skb->len;
}
3884
/*
 * Dump callback for the dump-and-reset variant: runs nf_tables_dump_rules()
 * with the per-netns commit_mutex held and returns its result.
 */
static int nf_tables_dumpreset_rules(struct sk_buff *skb,
				     struct netlink_callback *cb)
{
	struct nftables_pernet *nft_net = nft_pernet(sock_net(skb->sk));
	int ret;

	/* The mutex is held to prevent two concurrent dump-and-reset calls
	 * from underrunning counters and quotas. The commit_mutex is used for
	 * lack of a better lock; this is not the transaction path.
	 */
	mutex_lock(&nft_net->commit_mutex);
	ret = nf_tables_dump_rules(skb, cb);
	mutex_unlock(&nft_net->commit_mutex);

	return ret;
}
3901
nf_tables_dump_rules_start(struct netlink_callback * cb)3902 static int nf_tables_dump_rules_start(struct netlink_callback *cb)
3903 {
3904 struct nft_rule_dump_ctx *ctx = (void *)cb->ctx;
3905 const struct nlattr * const *nla = cb->data;
3906
3907 BUILD_BUG_ON(sizeof(*ctx) > sizeof(cb->ctx));
3908
3909 if (nla[NFTA_RULE_TABLE]) {
3910 ctx->table = nla_strdup(nla[NFTA_RULE_TABLE], GFP_ATOMIC);
3911 if (!ctx->table)
3912 return -ENOMEM;
3913 }
3914 if (nla[NFTA_RULE_CHAIN]) {
3915 ctx->chain = nla_strdup(nla[NFTA_RULE_CHAIN], GFP_ATOMIC);
3916 if (!ctx->chain) {
3917 kfree(ctx->table);
3918 return -ENOMEM;
3919 }
3920 }
3921 return 0;
3922 }
3923
/*
 * Dump start callback for the dump-and-reset variant: marks the dump
 * context as a reset dump, then performs the regular start handling.
 */
static int nf_tables_dumpreset_rules_start(struct netlink_callback *cb)
{
	struct nft_rule_dump_ctx *ctx = (void *)cb->ctx;

	ctx->reset = true;

	return nf_tables_dump_rules_start(cb);
}
3932
/*
 * Dump done callback: frees the table and chain name filters held in the
 * dump context. Always returns 0.
 */
static int nf_tables_dump_rules_done(struct netlink_callback *cb)
{
	struct nft_rule_dump_ctx *ctx = (void *)cb->ctx;

	kfree(ctx->table);
	kfree(ctx->chain);
	return 0;
}
3941
3942 /* Caller must hold rcu read lock or transaction mutex */
3943 static struct sk_buff *
nf_tables_getrule_single(u32 portid,const struct nfnl_info * info,const struct nlattr * const nla[],bool reset)3944 nf_tables_getrule_single(u32 portid, const struct nfnl_info *info,
3945 const struct nlattr * const nla[], bool reset)
3946 {
3947 struct netlink_ext_ack *extack = info->extack;
3948 u8 genmask = nft_genmask_cur(info->net);
3949 u8 family = info->nfmsg->nfgen_family;
3950 const struct nft_chain *chain;
3951 const struct nft_rule *rule;
3952 struct net *net = info->net;
3953 struct nft_table *table;
3954 struct sk_buff *skb2;
3955 int err;
3956
3957 table = nft_table_lookup(net, nla[NFTA_RULE_TABLE], family, genmask, 0);
3958 if (IS_ERR(table)) {
3959 NL_SET_BAD_ATTR(extack, nla[NFTA_RULE_TABLE]);
3960 return ERR_CAST(table);
3961 }
3962
3963 chain = nft_chain_lookup(net, table, nla[NFTA_RULE_CHAIN], genmask);
3964 if (IS_ERR(chain)) {
3965 NL_SET_BAD_ATTR(extack, nla[NFTA_RULE_CHAIN]);
3966 return ERR_CAST(chain);
3967 }
3968
3969 rule = nft_rule_lookup(net, chain, nla[NFTA_RULE_HANDLE]);
3970 if (IS_ERR(rule)) {
3971 NL_SET_BAD_ATTR(extack, nla[NFTA_RULE_HANDLE]);
3972 return ERR_CAST(rule);
3973 }
3974
3975 skb2 = alloc_skb(NLMSG_GOODSIZE, GFP_ATOMIC);
3976 if (!skb2)
3977 return ERR_PTR(-ENOMEM);
3978
3979 err = nf_tables_fill_rule_info(skb2, net, portid,
3980 info->nlh->nlmsg_seq, NFT_MSG_NEWRULE, 0,
3981 family, table, chain, rule, 0, reset);
3982 if (err < 0) {
3983 kfree_skb(skb2);
3984 return ERR_PTR(err);
3985 }
3986
3987 return skb2;
3988 }
3989
nf_tables_getrule(struct sk_buff * skb,const struct nfnl_info * info,const struct nlattr * const nla[])3990 static int nf_tables_getrule(struct sk_buff *skb, const struct nfnl_info *info,
3991 const struct nlattr * const nla[])
3992 {
3993 u32 portid = NETLINK_CB(skb).portid;
3994 struct net *net = info->net;
3995 struct sk_buff *skb2;
3996
3997 if (info->nlh->nlmsg_flags & NLM_F_DUMP) {
3998 struct netlink_dump_control c = {
3999 .start= nf_tables_dump_rules_start,
4000 .dump = nf_tables_dump_rules,
4001 .done = nf_tables_dump_rules_done,
4002 .module = THIS_MODULE,
4003 .data = (void *)nla,
4004 };
4005
4006 return nft_netlink_dump_start_rcu(info->sk, skb, info->nlh, &c);
4007 }
4008
4009 skb2 = nf_tables_getrule_single(portid, info, nla, false);
4010 if (IS_ERR(skb2))
4011 return PTR_ERR(skb2);
4012
4013 return nfnetlink_unicast(skb2, net, portid);
4014 }
4015
/*
 * Netlink handler for fetching rules with reset.
 *
 * With NLM_F_DUMP a dump-and-reset dump is started. Otherwise a single rule
 * is fetched with the reset flag set while holding commit_mutex, an
 * AUDIT_NFT_OP_RULE_RESET record for one entry is logged, and the reply is
 * unicast to the requester. Returns -EINVAL if no reference on this module
 * can be taken.
 */
static int nf_tables_getrule_reset(struct sk_buff *skb,
				   const struct nfnl_info *info,
				   const struct nlattr * const nla[])
{
	struct nftables_pernet *nft_net = nft_pernet(info->net);
	u32 portid = NETLINK_CB(skb).portid;
	struct net *net = info->net;
	struct sk_buff *skb2;
	char *buf;

	if (info->nlh->nlmsg_flags & NLM_F_DUMP) {
		struct netlink_dump_control c = {
			.start= nf_tables_dumpreset_rules_start,
			.dump = nf_tables_dumpreset_rules,
			.done = nf_tables_dump_rules_done,
			.module = THIS_MODULE,
			.data = (void *)nla,
		};

		return nft_netlink_dump_start_rcu(info->sk, skb, info->nlh, &c);
	}

	/* The RCU read-side section is left before commit_mutex is taken and
	 * re-entered afterwards; a module reference is held across that
	 * window. NOTE(review): presumably the caller invoked this handler
	 * under rcu_read_lock() - confirm against the callback table.
	 */
	if (!try_module_get(THIS_MODULE))
		return -EINVAL;
	rcu_read_unlock();
	mutex_lock(&nft_net->commit_mutex);
	skb2 = nf_tables_getrule_single(portid, info, nla, true);
	mutex_unlock(&nft_net->commit_mutex);
	rcu_read_lock();
	module_put(THIS_MODULE);

	if (IS_ERR(skb2))
		return PTR_ERR(skb2);

	/* Audit record name is "<table attribute>:<base_seq>"; the result of
	 * the atomic allocation is not checked before use.
	 */
	buf = kasprintf(GFP_ATOMIC, "%.*s:%u",
			nla_len(nla[NFTA_RULE_TABLE]),
			(char *)nla_data(nla[NFTA_RULE_TABLE]),
			nft_net->base_seq);
	audit_log_nfcfg(buf, info->nfmsg->nfgen_family, 1,
			AUDIT_NFT_OP_RULE_RESET, GFP_ATOMIC);
	kfree(buf);

	return nfnetlink_unicast(skb2, net, portid);
}
4060
/*
 * Destroy every expression of @rule and free the rule itself.
 */
void nf_tables_rule_destroy(const struct nft_ctx *ctx, struct nft_rule *rule)
{
	struct nft_expr *expr, *next;

	/*
	 * Careful: some expressions might not be initialized in case this
	 * is called on error from nf_tables_newrule().
	 */
	for (expr = nft_expr_first(rule); nft_expr_more(rule, expr);
	     expr = next) {
		/* Compute the successor before the expression is torn down. */
		next = nft_expr_next(expr);
		nf_tables_expr_destroy(ctx, expr);
	}

	kfree(rule);
}
4077
/*
 * Deactivate the rule's expressions in the NFT_TRANS_RELEASE phase and then
 * destroy the rule. Warns once if the commit lock is not held.
 *
 * Can only be used if rule is no longer visible to dumps.
 */
static void nf_tables_rule_release(const struct nft_ctx *ctx, struct nft_rule *rule)
{
	WARN_ON_ONCE(!lockdep_commit_lock_is_held(ctx->net));

	nft_rule_expr_deactivate(ctx, rule, NFT_TRANS_RELEASE);
	nf_tables_rule_destroy(ctx, rule);
}
4086
4087 /** nft_chain_validate - loop detection and hook validation
4088 *
4089 * @ctx: context containing call depth and base chain
4090 * @chain: chain to validate
4091 *
4092 * Walk through the rules of the given chain and chase all jumps/gotos
4093 * and set lookups until either the jump limit is hit or all reachable
4094 * chains have been validated.
4095 */
nft_chain_validate(const struct nft_ctx * ctx,const struct nft_chain * chain)4096 int nft_chain_validate(const struct nft_ctx *ctx, const struct nft_chain *chain)
4097 {
4098 struct nft_expr *expr, *last;
4099 struct nft_rule *rule;
4100 int err;
4101
4102 if (ctx->level == NFT_JUMP_STACK_SIZE)
4103 return -EMLINK;
4104
4105 list_for_each_entry(rule, &chain->rules, list) {
4106 if (fatal_signal_pending(current))
4107 return -EINTR;
4108
4109 if (!nft_is_active_next(ctx->net, rule))
4110 continue;
4111
4112 nft_rule_for_each_expr(expr, last, rule) {
4113 if (!expr->ops->validate)
4114 continue;
4115
4116 /* This may call nft_chain_validate() recursively,
4117 * callers that do so must increment ctx->level.
4118 */
4119 err = expr->ops->validate(ctx, expr);
4120 if (err < 0)
4121 return err;
4122 }
4123 }
4124
4125 return 0;
4126 }
4127 EXPORT_SYMBOL_GPL(nft_chain_validate);
4128
nft_table_validate(struct net * net,const struct nft_table * table)4129 static int nft_table_validate(struct net *net, const struct nft_table *table)
4130 {
4131 struct nft_chain *chain;
4132 struct nft_ctx ctx = {
4133 .net = net,
4134 .family = table->family,
4135 };
4136 int err;
4137
4138 list_for_each_entry(chain, &table->chains, list) {
4139 if (!nft_is_base_chain(chain))
4140 continue;
4141
4142 ctx.chain = chain;
4143 err = nft_chain_validate(&ctx, chain);
4144 if (err < 0)
4145 return err;
4146
4147 cond_resched();
4148 }
4149
4150 return 0;
4151 }
4152
nft_setelem_validate(const struct nft_ctx * ctx,struct nft_set * set,const struct nft_set_iter * iter,struct nft_elem_priv * elem_priv)4153 int nft_setelem_validate(const struct nft_ctx *ctx, struct nft_set *set,
4154 const struct nft_set_iter *iter,
4155 struct nft_elem_priv *elem_priv)
4156 {
4157 const struct nft_set_ext *ext = nft_set_elem_ext(set, elem_priv);
4158 struct nft_ctx *pctx = (struct nft_ctx *)ctx;
4159 const struct nft_data *data;
4160 int err;
4161
4162 if (!nft_set_elem_active(ext, iter->genmask))
4163 return 0;
4164
4165 if (nft_set_ext_exists(ext, NFT_SET_EXT_FLAGS) &&
4166 *nft_set_ext_flags(ext) & NFT_SET_ELEM_INTERVAL_END)
4167 return 0;
4168
4169 data = nft_set_ext_data(ext);
4170 switch (data->verdict.code) {
4171 case NFT_JUMP:
4172 case NFT_GOTO:
4173 pctx->level++;
4174 err = nft_chain_validate(ctx, data->verdict.chain);
4175 if (err < 0)
4176 return err;
4177 pctx->level--;
4178 break;
4179 default:
4180 break;
4181 }
4182
4183 return 0;
4184 }
4185
nft_set_catchall_validate(const struct nft_ctx * ctx,struct nft_set * set)4186 int nft_set_catchall_validate(const struct nft_ctx *ctx, struct nft_set *set)
4187 {
4188 struct nft_set_iter dummy_iter = {
4189 .genmask = nft_genmask_next(ctx->net),
4190 };
4191 struct nft_set_elem_catchall *catchall;
4192
4193 struct nft_set_ext *ext;
4194 int ret = 0;
4195
4196 list_for_each_entry_rcu(catchall, &set->catchall_list, list,
4197 lockdep_commit_lock_is_held(ctx->net)) {
4198 ext = nft_set_elem_ext(set, catchall->elem);
4199 if (!nft_set_elem_active(ext, dummy_iter.genmask))
4200 continue;
4201
4202 ret = nft_setelem_validate(ctx, set, &dummy_iter, catchall->elem);
4203 if (ret < 0)
4204 return ret;
4205 }
4206
4207 return ret;
4208 }
4209
/* Forward declaration: nf_tables_newrule() resolves NFTA_RULE_POSITION_ID
 * through this helper, which is defined further down in the file.
 */
static struct nft_rule *nft_rule_lookup_byid(const struct net *net,
					     const struct nft_chain *chain,
					     const struct nlattr *nla);

/* Maximum number of expressions accepted in one rule; also the number of
 * entries in the temporary expr_info array of nf_tables_newrule().
 */
#define NFT_RULE_MAXEXPRS 128
4215
/*
 * Netlink handler that adds a new rule to a chain, or replaces an existing
 * one, and records the change as a transaction.
 *
 * Flag handling as implemented below:
 *  - with NFTA_RULE_HANDLE: NLM_F_EXCL yields -EEXIST, NLM_F_REPLACE
 *    replaces the rule with that handle, anything else is -EOPNOTSUPP;
 *  - without NFTA_RULE_HANDLE: NLM_F_CREATE is required and NLM_F_REPLACE is
 *    rejected (-EINVAL); NFTA_RULE_POSITION / NFTA_RULE_POSITION_ID may
 *    name an existing rule to insert next to.
 *
 * The commit mutex must be held (asserted).  Returns 0 on success, the
 * result of nft_table_validate() when the table is in NFT_VALIDATE_DO
 * state, or a negative errno.
 */
static int nf_tables_newrule(struct sk_buff *skb, const struct nfnl_info *info,
			     const struct nlattr * const nla[])
{
	struct nftables_pernet *nft_net = nft_pernet(info->net);
	struct netlink_ext_ack *extack = info->extack;
	unsigned int size, i, n, ulen = 0, usize = 0;
	u8 genmask = nft_genmask_next(info->net);
	struct nft_rule *rule, *old_rule = NULL;
	struct nft_expr_info *expr_info = NULL;
	u8 family = info->nfmsg->nfgen_family;
	struct nft_flow_rule *flow = NULL;
	struct net *net = info->net;
	struct nft_userdata *udata;
	struct nft_table *table;
	struct nft_chain *chain;
	struct nft_trans *trans;
	u64 handle, pos_handle;
	struct nft_expr *expr;
	struct nft_ctx ctx;
	struct nlattr *tmp;
	int err, rem;

	lockdep_assert_held(&nft_net->commit_mutex);

	table = nft_table_lookup(net, nla[NFTA_RULE_TABLE], family, genmask,
				 NETLINK_CB(skb).portid);
	if (IS_ERR(table)) {
		NL_SET_BAD_ATTR(extack, nla[NFTA_RULE_TABLE]);
		return PTR_ERR(table);
	}

	/* The chain is given either by name or by transaction-local id. */
	if (nla[NFTA_RULE_CHAIN]) {
		chain = nft_chain_lookup(net, table, nla[NFTA_RULE_CHAIN],
					 genmask);
		if (IS_ERR(chain)) {
			NL_SET_BAD_ATTR(extack, nla[NFTA_RULE_CHAIN]);
			return PTR_ERR(chain);
		}

	} else if (nla[NFTA_RULE_CHAIN_ID]) {
		chain = nft_chain_lookup_byid(net, table, nla[NFTA_RULE_CHAIN_ID],
					      genmask);
		if (IS_ERR(chain)) {
			NL_SET_BAD_ATTR(extack, nla[NFTA_RULE_CHAIN_ID]);
			return PTR_ERR(chain);
		}
	} else {
		return -EINVAL;
	}

	if (nft_chain_is_bound(chain))
		return -EOPNOTSUPP;

	if (nla[NFTA_RULE_HANDLE]) {
		handle = be64_to_cpu(nla_get_be64(nla[NFTA_RULE_HANDLE]));
		rule = __nft_rule_lookup(net, chain, handle);
		if (IS_ERR(rule)) {
			NL_SET_BAD_ATTR(extack, nla[NFTA_RULE_HANDLE]);
			return PTR_ERR(rule);
		}

		if (info->nlh->nlmsg_flags & NLM_F_EXCL) {
			NL_SET_BAD_ATTR(extack, nla[NFTA_RULE_HANDLE]);
			return -EEXIST;
		}
		if (info->nlh->nlmsg_flags & NLM_F_REPLACE)
			old_rule = rule;
		else
			return -EOPNOTSUPP;
	} else {
		if (!(info->nlh->nlmsg_flags & NLM_F_CREATE) ||
		    info->nlh->nlmsg_flags & NLM_F_REPLACE)
			return -EINVAL;
		handle = nf_tables_alloc_handle(table);

		/* Optional anchor rule: old_rule stays NULL when no position
		 * attribute is present.
		 */
		if (nla[NFTA_RULE_POSITION]) {
			pos_handle = be64_to_cpu(nla_get_be64(nla[NFTA_RULE_POSITION]));
			old_rule = __nft_rule_lookup(net, chain, pos_handle);
			if (IS_ERR(old_rule)) {
				NL_SET_BAD_ATTR(extack, nla[NFTA_RULE_POSITION]);
				return PTR_ERR(old_rule);
			}
		} else if (nla[NFTA_RULE_POSITION_ID]) {
			old_rule = nft_rule_lookup_byid(net, chain, nla[NFTA_RULE_POSITION_ID]);
			if (IS_ERR(old_rule)) {
				NL_SET_BAD_ATTR(extack, nla[NFTA_RULE_POSITION_ID]);
				return PTR_ERR(old_rule);
			}
		}
	}

	nft_ctx_init(&ctx, net, skb, info->nlh, family, table, chain, nla);

	/* First pass: parse every expression attribute into expr_info[] and
	 * add up the space the expressions need inside the rule.
	 */
	n = 0;
	size = 0;
	if (nla[NFTA_RULE_EXPRESSIONS]) {
		expr_info = kvmalloc_array(NFT_RULE_MAXEXPRS,
					   sizeof(struct nft_expr_info),
					   GFP_KERNEL);
		if (!expr_info)
			return -ENOMEM;

		nla_for_each_nested(tmp, nla[NFTA_RULE_EXPRESSIONS], rem) {
			err = -EINVAL;
			if (nla_type(tmp) != NFTA_LIST_ELEM)
				goto err_release_expr;
			if (n == NFT_RULE_MAXEXPRS)
				goto err_release_expr;
			err = nf_tables_expr_parse(&ctx, tmp, &expr_info[n]);
			if (err < 0) {
				NL_SET_BAD_ATTR(extack, tmp);
				goto err_release_expr;
			}
			size += expr_info[n].ops->size;
			n++;
		}
	}
	/* Check for overflow of dlen field */
	err = -EFBIG;
	if (size >= 1 << 12)
		goto err_release_expr;

	if (nla[NFTA_RULE_USERDATA]) {
		ulen = nla_len(nla[NFTA_RULE_USERDATA]);
		if (ulen > 0)
			usize = sizeof(struct nft_userdata) + ulen;
	}

	/* Rule header, expression area and optional userdata share a single
	 * allocation.
	 */
	err = -ENOMEM;
	rule = kzalloc(sizeof(*rule) + size + usize, GFP_KERNEL_ACCOUNT);
	if (rule == NULL)
		goto err_release_expr;

	nft_activate_next(net, rule);

	rule->handle = handle;
	rule->dlen = size;
	rule->udata = ulen ? 1 : 0;

	if (ulen) {
		udata = nft_userdata(rule);
		/* The stored length is one less than the real length.
		 * NOTE(review): presumably so the maximum size fits the len
		 * field - confirm against struct nft_userdata.
		 */
		udata->len = ulen - 1;
		nla_memcpy(udata->data, nla[NFTA_RULE_USERDATA], ulen);
	}

	/* Second pass: instantiate the parsed expressions inside the rule. */
	expr = nft_expr_first(rule);
	for (i = 0; i < n; i++) {
		err = nf_tables_newexpr(&ctx, &expr_info[i], expr);
		if (err < 0) {
			NL_SET_BAD_ATTR(extack, expr_info[i].attr);
			goto err_release_rule;
		}

		if (expr_info[i].ops->validate)
			nft_validate_state_update(table, NFT_VALIDATE_NEED);

		/* Clearing ops makes the err_release_expr loop skip this
		 * entry from now on.
		 */
		expr_info[i].ops = NULL;
		expr = nft_expr_next(expr);
	}

	if (chain->flags & NFT_CHAIN_HW_OFFLOAD) {
		flow = nft_flow_rule_create(net, rule);
		if (IS_ERR(flow)) {
			err = PTR_ERR(flow);
			goto err_release_rule;
		}
	}

	if (!nft_use_inc(&chain->use)) {
		err = -EMFILE;
		goto err_release_rule;
	}

	if (info->nlh->nlmsg_flags & NLM_F_REPLACE) {
		if (nft_chain_binding(chain)) {
			err = -EOPNOTSUPP;
			goto err_destroy_flow_rule;
		}

		err = nft_delrule(&ctx, old_rule);
		if (err < 0)
			goto err_destroy_flow_rule;

		trans = nft_trans_rule_add(&ctx, NFT_MSG_NEWRULE, rule);
		if (trans == NULL) {
			err = -ENOMEM;
			goto err_destroy_flow_rule;
		}
		/* The replacement is linked directly in front of the rule it
		 * replaces.
		 */
		list_add_tail_rcu(&rule->list, &old_rule->list);
	} else {
		trans = nft_trans_rule_add(&ctx, NFT_MSG_NEWRULE, rule);
		if (!trans) {
			err = -ENOMEM;
			goto err_destroy_flow_rule;
		}

		/* NLM_F_APPEND: after the anchor rule, or at the chain tail.
		 * Otherwise: before the anchor rule, or at the chain head.
		 */
		if (info->nlh->nlmsg_flags & NLM_F_APPEND) {
			if (old_rule)
				list_add_rcu(&rule->list, &old_rule->list);
			else
				list_add_tail_rcu(&rule->list, &chain->rules);
		} else {
			if (old_rule)
				list_add_tail_rcu(&rule->list, &old_rule->list);
			else
				list_add_rcu(&rule->list, &chain->rules);
		}
	}
	kvfree(expr_info);

	if (flow)
		nft_trans_flow_rule(trans) = flow;

	if (table->validate_state == NFT_VALIDATE_DO)
		return nft_table_validate(net, table);

	return 0;

	/* Unwind in reverse order of acquisition; each label falls through
	 * into the next one.
	 */
err_destroy_flow_rule:
	nft_use_dec_restore(&chain->use);
	if (flow)
		nft_flow_rule_destroy(flow);
err_release_rule:
	nft_rule_expr_deactivate(&ctx, rule, NFT_TRANS_PREPARE_ERROR);
	nf_tables_rule_destroy(&ctx, rule);
err_release_expr:
	/* Only entries that were parsed but not yet instantiated still have
	 * ops set; drop their module reference and ops.
	 */
	for (i = 0; i < n; i++) {
		if (expr_info[i].ops) {
			module_put(expr_info[i].ops->type->owner);
			if (expr_info[i].ops->type->release_ops)
				expr_info[i].ops->type->release_ops(expr_info[i].ops);
		}
	}
	kvfree(expr_info);

	return err;
}
4453
nft_rule_lookup_byid(const struct net * net,const struct nft_chain * chain,const struct nlattr * nla)4454 static struct nft_rule *nft_rule_lookup_byid(const struct net *net,
4455 const struct nft_chain *chain,
4456 const struct nlattr *nla)
4457 {
4458 struct nftables_pernet *nft_net = nft_pernet(net);
4459 u32 id = ntohl(nla_get_be32(nla));
4460 struct nft_trans *trans;
4461
4462 list_for_each_entry(trans, &nft_net->commit_list, list) {
4463 if (trans->msg_type == NFT_MSG_NEWRULE &&
4464 nft_trans_rule_chain(trans) == chain &&
4465 id == nft_trans_rule_id(trans))
4466 return nft_trans_rule(trans);
4467 }
4468 return ERR_PTR(-ENOENT);
4469 }
4470
nf_tables_delrule(struct sk_buff * skb,const struct nfnl_info * info,const struct nlattr * const nla[])4471 static int nf_tables_delrule(struct sk_buff *skb, const struct nfnl_info *info,
4472 const struct nlattr * const nla[])
4473 {
4474 struct netlink_ext_ack *extack = info->extack;
4475 u8 genmask = nft_genmask_next(info->net);
4476 u8 family = info->nfmsg->nfgen_family;
4477 struct nft_chain *chain = NULL;
4478 struct net *net = info->net;
4479 struct nft_table *table;
4480 struct nft_rule *rule;
4481 struct nft_ctx ctx;
4482 int err = 0;
4483
4484 table = nft_table_lookup(net, nla[NFTA_RULE_TABLE], family, genmask,
4485 NETLINK_CB(skb).portid);
4486 if (IS_ERR(table)) {
4487 NL_SET_BAD_ATTR(extack, nla[NFTA_RULE_TABLE]);
4488 return PTR_ERR(table);
4489 }
4490
4491 if (nla[NFTA_RULE_CHAIN]) {
4492 chain = nft_chain_lookup(net, table, nla[NFTA_RULE_CHAIN],
4493 genmask);
4494 if (IS_ERR(chain)) {
4495 if (PTR_ERR(chain) == -ENOENT &&
4496 NFNL_MSG_TYPE(info->nlh->nlmsg_type) == NFT_MSG_DESTROYRULE)
4497 return 0;
4498
4499 NL_SET_BAD_ATTR(extack, nla[NFTA_RULE_CHAIN]);
4500 return PTR_ERR(chain);
4501 }
4502 if (nft_chain_binding(chain))
4503 return -EOPNOTSUPP;
4504 }
4505
4506 nft_ctx_init(&ctx, net, skb, info->nlh, family, table, chain, nla);
4507
4508 if (chain) {
4509 if (nla[NFTA_RULE_HANDLE]) {
4510 rule = nft_rule_lookup(info->net, chain, nla[NFTA_RULE_HANDLE]);
4511 if (IS_ERR(rule)) {
4512 if (PTR_ERR(rule) == -ENOENT &&
4513 NFNL_MSG_TYPE(info->nlh->nlmsg_type) == NFT_MSG_DESTROYRULE)
4514 return 0;
4515
4516 NL_SET_BAD_ATTR(extack, nla[NFTA_RULE_HANDLE]);
4517 return PTR_ERR(rule);
4518 }
4519
4520 err = nft_delrule(&ctx, rule);
4521 } else if (nla[NFTA_RULE_ID]) {
4522 rule = nft_rule_lookup_byid(net, chain, nla[NFTA_RULE_ID]);
4523 if (IS_ERR(rule)) {
4524 NL_SET_BAD_ATTR(extack, nla[NFTA_RULE_ID]);
4525 return PTR_ERR(rule);
4526 }
4527
4528 err = nft_delrule(&ctx, rule);
4529 } else {
4530 err = nft_delrule_by_chain(&ctx);
4531 }
4532 } else {
4533 list_for_each_entry(chain, &table->chains, list) {
4534 if (!nft_is_active_next(net, chain))
4535 continue;
4536 if (nft_chain_binding(chain))
4537 continue;
4538
4539 ctx.chain = chain;
4540 err = nft_delrule_by_chain(&ctx);
4541 if (err < 0)
4542 break;
4543 }
4544 }
4545
4546 return err;
4547 }
4548
4549 /*
4550 * Sets
4551 */
/* Set backends considered by nft_select_set_ops(), which walks this array
 * in order.  For the PERFORMANCE and MEMORY policies a candidate only
 * replaces the current best on a strictly better estimate, so on a tie the
 * earlier entry is kept.
 */
static const struct nft_set_type *nft_set_types[] = {
	&nft_set_hash_fast_type,
	&nft_set_hash_type,
	&nft_set_rhash_type,
	&nft_set_bitmap_type,
	&nft_set_rbtree_type,
	/* AVX2 variant is only built in on x86-64 non-UML configurations */
#if defined(CONFIG_X86_64) && !defined(CONFIG_UML)
	&nft_set_pipapo_avx2_type,
#endif
	&nft_set_pipapo_type,
};
4563
/* Set flags treated as backend features by nft_set_ops_candidate(): a
 * backend is only a candidate if it offers every one of these that the
 * requested flags contain.
 */
#define NFT_SET_FEATURES	(NFT_SET_INTERVAL | NFT_SET_MAP | \
				 NFT_SET_TIMEOUT | NFT_SET_OBJECT | \
				 NFT_SET_EVAL)
4567
nft_set_ops_candidate(const struct nft_set_type * type,u32 flags)4568 static bool nft_set_ops_candidate(const struct nft_set_type *type, u32 flags)
4569 {
4570 return (flags & type->features) == (flags & NFT_SET_FEATURES);
4571 }
4572
4573 /*
4574 * Select a set implementation based on the data characteristics and the
4575 * given policy. The total memory use might not be known if no size is
4576 * given, in that case the amount of memory per element is used.
4577 */
4578 static const struct nft_set_ops *
nft_select_set_ops(const struct nft_ctx * ctx,u32 flags,const struct nft_set_desc * desc)4579 nft_select_set_ops(const struct nft_ctx *ctx, u32 flags,
4580 const struct nft_set_desc *desc)
4581 {
4582 struct nftables_pernet *nft_net = nft_pernet(ctx->net);
4583 const struct nft_set_ops *ops, *bops;
4584 struct nft_set_estimate est, best;
4585 const struct nft_set_type *type;
4586 int i;
4587
4588 lockdep_assert_held(&nft_net->commit_mutex);
4589 lockdep_nfnl_nft_mutex_not_held();
4590
4591 bops = NULL;
4592 best.size = ~0;
4593 best.lookup = ~0;
4594 best.space = ~0;
4595
4596 for (i = 0; i < ARRAY_SIZE(nft_set_types); i++) {
4597 type = nft_set_types[i];
4598 ops = &type->ops;
4599
4600 if (!nft_set_ops_candidate(type, flags))
4601 continue;
4602 if (!ops->estimate(desc, flags, &est))
4603 continue;
4604
4605 switch (desc->policy) {
4606 case NFT_SET_POL_PERFORMANCE:
4607 if (est.lookup < best.lookup)
4608 break;
4609 if (est.lookup == best.lookup &&
4610 est.space < best.space)
4611 break;
4612 continue;
4613 case NFT_SET_POL_MEMORY:
4614 if (!desc->size) {
4615 if (est.space < best.space)
4616 break;
4617 if (est.space == best.space &&
4618 est.lookup < best.lookup)
4619 break;
4620 } else if (est.size < best.size || !bops) {
4621 break;
4622 }
4623 continue;
4624 default:
4625 break;
4626 }
4627
4628 bops = ops;
4629 best = est;
4630 }
4631
4632 if (bops != NULL)
4633 return bops;
4634
4635 return ERR_PTR(-EOPNOTSUPP);
4636 }
4637
/* Netlink attribute policy for the NFTA_SET_* attributes. */
static const struct nla_policy nft_set_policy[NFTA_SET_MAX + 1] = {
	[NFTA_SET_TABLE]		= { .type = NLA_STRING,
					    .len = NFT_TABLE_MAXNAMELEN - 1 },
	[NFTA_SET_NAME]			= { .type = NLA_STRING,
					    .len = NFT_SET_MAXNAMELEN - 1 },
	[NFTA_SET_FLAGS]		= { .type = NLA_U32 },
	[NFTA_SET_KEY_TYPE]		= { .type = NLA_U32 },
	[NFTA_SET_KEY_LEN]		= { .type = NLA_U32 },
	[NFTA_SET_DATA_TYPE]		= { .type = NLA_U32 },
	[NFTA_SET_DATA_LEN]		= { .type = NLA_U32 },
	[NFTA_SET_POLICY]		= { .type = NLA_U32 },
	[NFTA_SET_DESC]			= { .type = NLA_NESTED },
	[NFTA_SET_ID]			= { .type = NLA_U32 },
	[NFTA_SET_TIMEOUT]		= { .type = NLA_U64 },
	[NFTA_SET_GC_INTERVAL]		= { .type = NLA_U32 },
	[NFTA_SET_USERDATA]		= { .type = NLA_BINARY,
					    .len  = NFT_USERDATA_MAXLEN },
	[NFTA_SET_OBJ_TYPE]		= { .type = NLA_U32 },
	[NFTA_SET_HANDLE]		= { .type = NLA_U64 },
	[NFTA_SET_EXPR]			= { .type = NLA_NESTED },
	[NFTA_SET_EXPRESSIONS]		= NLA_POLICY_NESTED_ARRAY(nft_expr_policy),
	/* Written by nf_tables_fill_set_info() when dumping a set; rejected
	 * when received from userspace.
	 */
	[NFTA_SET_TYPE]			= { .type = NLA_REJECT },
	[NFTA_SET_COUNT]		= { .type = NLA_REJECT },
};
4662
/* Policy for one NFTA_LIST_ELEM inside NFTA_SET_DESC_CONCAT: the length of
 * a single concatenated key field.
 */
static const struct nla_policy nft_concat_policy[NFTA_SET_FIELD_MAX + 1] = {
	[NFTA_SET_FIELD_LEN]	= { .type = NLA_U32 },
};
4666
/* Policy for the nested NFTA_SET_DESC attribute: optional size and an
 * optional array of concatenation field descriptions.
 */
static const struct nla_policy nft_set_desc_policy[NFTA_SET_DESC_MAX + 1] = {
	[NFTA_SET_DESC_SIZE]		= { .type = NLA_U32 },
	[NFTA_SET_DESC_CONCAT]		= NLA_POLICY_NESTED_ARRAY(nft_concat_policy),
};
4671
/*
 * Look up a set in @table by the name carried in @nla.
 *
 * Only sets active in @genmask match.  Returns the set, ERR_PTR(-EINVAL)
 * when @nla is NULL, or ERR_PTR(-ENOENT) when nothing matches.
 */
static struct nft_set *nft_set_lookup(const struct net *net,
				      const struct nft_table *table,
				      const struct nlattr *nla, u8 genmask)
{
	struct nft_set *set;

	if (!nla)
		return ERR_PTR(-EINVAL);

	list_for_each_entry_rcu(set, &table->sets, list,
				lockdep_commit_lock_is_held(net)) {
		if (nla_strcmp(nla, set->name) != 0)
			continue;
		if (!nft_active_genmask(set, genmask))
			continue;

		return set;
	}

	return ERR_PTR(-ENOENT);
}
4689
/*
 * Look up a set in @table by the 64-bit handle carried in @nla.
 *
 * Only sets active in @genmask match.  Returns the set or
 * ERR_PTR(-ENOENT).  @nla must not be NULL.
 */
static struct nft_set *nft_set_lookup_byhandle(const struct nft_table *table,
					       const struct nlattr *nla,
					       u8 genmask)
{
	/* decode the attribute once instead of on every list entry */
	const u64 handle = be64_to_cpu(nla_get_be64(nla));
	struct nft_set *set;

	list_for_each_entry(set, &table->sets, list) {
		if (set->handle == handle &&
		    nft_active_genmask(set, genmask))
			return set;
	}
	return ERR_PTR(-ENOENT);
}
4703
/*
 * Look up a set created earlier in the pending transaction by its
 * transaction id.
 *
 * Scans the per-netns list of new-set transactions for an entry with the id
 * from @nla whose set belongs to @table and is active in @genmask.
 * Returns the set or ERR_PTR(-ENOENT).
 */
static struct nft_set *nft_set_lookup_byid(const struct net *net,
					   const struct nft_table *table,
					   const struct nlattr *nla, u8 genmask)
{
	struct nftables_pernet *nft_net = nft_pernet(net);
	u32 id = ntohl(nla_get_be32(nla));
	struct nft_trans_set *trans;
	struct nft_set *set;

	/* its likely the id we need is at the tail, not at start */
	list_for_each_entry_reverse(trans, &nft_net->commit_set_list, list_trans_newset) {
		set = trans->set;

		if (trans->set_id != id)
			continue;
		if (set->table != table)
			continue;
		if (!nft_active_genmask(set, genmask))
			continue;

		return set;
	}

	return ERR_PTR(-ENOENT);
}
4723
/*
 * Look up a set by name and, if that fails and @nla_set_id is given, by
 * transaction id.
 *
 * Returns the set, or the ERR_PTR() of whichever lookup ran last.
 */
struct nft_set *nft_set_lookup_global(const struct net *net,
				      const struct nft_table *table,
				      const struct nlattr *nla_set_name,
				      const struct nlattr *nla_set_id,
				      u8 genmask)
{
	struct nft_set *set;

	set = nft_set_lookup(net, table, nla_set_name, genmask);
	if (!IS_ERR(set) || !nla_set_id)
		return set;

	return nft_set_lookup_byid(net, table, nla_set_id, genmask);
}
4741 EXPORT_SYMBOL_GPL(nft_set_lookup_global);
4742
/*
 * Assign set->name from the template @name.
 *
 * @name may contain a single "%d"; in that case the lowest number not yet
 * used by a set of the table (active in the next generation) whose name
 * matches the template is substituted.  A '%' followed by anything other
 * than 'd', a second '%', or a template of NFT_SET_MAX_ANONLEN characters
 * or more is rejected with -EINVAL.
 *
 * Returns 0 on success, -ENOMEM on allocation failure, or -ENFILE when the
 * resulting name is already taken by an active set.
 */
static int nf_tables_set_alloc_name(struct nft_ctx *ctx, struct nft_set *set,
				    const char *name)
{
	const struct nft_set *i;
	const char *p;
	unsigned long *inuse;
	unsigned int n = 0, min = 0;

	p = strchr(name, '%');
	if (p != NULL) {
		if (p[1] != 'd' || strchr(p + 2, '%'))
			return -EINVAL;

		if (strnlen(name, NFT_SET_MAX_ANONLEN) >= NFT_SET_MAX_ANONLEN)
			return -EINVAL;

		/* One zeroed page serves as a bitmap covering the numbers
		 * [min, min + BITS_PER_BYTE * PAGE_SIZE).
		 */
		inuse = (unsigned long *)get_zeroed_page(GFP_KERNEL);
		if (inuse == NULL)
			return -ENOMEM;
cont:
		list_for_each_entry(i, &ctx->table->sets, list) {
			int tmp;

			if (!nft_is_active_next(ctx->net, i))
				continue;
			/* the template doubles as the sscanf() format */
			if (!sscanf(i->name, name, &tmp))
				continue;
			/* ignore numbers outside the current window */
			if (tmp < min || tmp >= min + BITS_PER_BYTE * PAGE_SIZE)
				continue;

			set_bit(tmp - min, inuse);
		}

		n = find_first_zero_bit(inuse, BITS_PER_BYTE * PAGE_SIZE);
		if (n >= BITS_PER_BYTE * PAGE_SIZE) {
			/* window is full: clear the bitmap and rescan the
			 * next range of numbers
			 */
			min += BITS_PER_BYTE * PAGE_SIZE;
			memset(inuse, 0, PAGE_SIZE);
			goto cont;
		}
		free_page((unsigned long)inuse);
	}

	/* Without a "%d" in the template, min + n is 0 and goes unused. */
	set->name = kasprintf(GFP_KERNEL_ACCOUNT, name, min + n);
	if (!set->name)
		return -ENOMEM;

	/* Final uniqueness check against the active sets of the table. */
	list_for_each_entry(i, &ctx->table->sets, list) {
		if (!nft_is_active_next(ctx->net, i))
			continue;
		if (!strcmp(set->name, i->name)) {
			kfree(set->name);
			set->name = NULL;
			return -ENFILE;
		}
	}
	return 0;
}
4800
/*
 * Convert the big-endian 64-bit millisecond value in @nla to jiffies.
 *
 * Values that would overflow when scaled to nanoseconds are rejected with
 * -ERANGE.  A non-zero input never converts to 0: it is rounded up to one
 * jiffy.  Returns 0 and stores the result in @result on success.
 */
int nf_msecs_to_jiffies64(const struct nlattr *nla, u64 *result)
{
	u64 msecs = be64_to_cpu(nla_get_be64(nla));
	u64 limit = div_u64((u64)(~((u64)0)), NSEC_PER_MSEC);
	u64 nsecs, ticks;

	if (msecs >= limit)
		return -ERANGE;

	nsecs = msecs * NSEC_PER_MSEC;
	ticks = nsecs_to_jiffies64(nsecs);
	if (!ticks)
		ticks = !!nsecs;

	*result = ticks;
	return 0;
}
4814
nf_jiffies64_to_msecs(u64 input)4815 __be64 nf_jiffies64_to_msecs(u64 input)
4816 {
4817 return cpu_to_be64(jiffies64_to_msecs(input));
4818 }
4819
nf_tables_fill_set_concat(struct sk_buff * skb,const struct nft_set * set)4820 static int nf_tables_fill_set_concat(struct sk_buff *skb,
4821 const struct nft_set *set)
4822 {
4823 struct nlattr *concat, *field;
4824 int i;
4825
4826 concat = nla_nest_start_noflag(skb, NFTA_SET_DESC_CONCAT);
4827 if (!concat)
4828 return -ENOMEM;
4829
4830 for (i = 0; i < set->field_count; i++) {
4831 field = nla_nest_start_noflag(skb, NFTA_LIST_ELEM);
4832 if (!field)
4833 return -ENOMEM;
4834
4835 if (nla_put_be32(skb, NFTA_SET_FIELD_LEN,
4836 htonl(set->field_len[i])))
4837 return -ENOMEM;
4838
4839 nla_nest_end(skb, field);
4840 }
4841
4842 nla_nest_end(skb, concat);
4843
4844 return 0;
4845 }
4846
/* Pass @size through the backend's usize() hook if it has one; otherwise
 * return it unchanged.
 */
static u32 nft_set_userspace_size(const struct nft_set_ops *ops, u32 size)
{
	return ops->usize ? ops->usize(size) : size;
}
4854
4855 static noinline_for_stack int
nf_tables_fill_set_info(struct sk_buff * skb,const struct nft_set * set)4856 nf_tables_fill_set_info(struct sk_buff *skb, const struct nft_set *set)
4857 {
4858 unsigned int nelems;
4859 char str[40];
4860 int ret;
4861
4862 ret = snprintf(str, sizeof(str), "%ps", set->ops);
4863
4864 /* Not expected to happen and harmless: NFTA_SET_TYPE is dumped
4865 * to userspace purely for informational/debug purposes.
4866 */
4867 DEBUG_NET_WARN_ON_ONCE(ret >= sizeof(str));
4868
4869 if (nla_put_string(skb, NFTA_SET_TYPE, str))
4870 return -EMSGSIZE;
4871
4872 nelems = nft_set_userspace_size(set->ops, atomic_read(&set->nelems));
4873 return nla_put_be32(skb, NFTA_SET_COUNT, htonl(nelems));
4874 }
4875
/*
 * Build one netlink message describing @set into @skb.
 *
 * @event selects the message type.  For NFT_MSG_DELSET and
 * NFT_MSG_DESTROYSET only the table name, set name and handle are
 * emitted; otherwise the full description follows (flags, key/data
 * types and lengths, object type, timeout, gc interval, policy, userdata,
 * the NFTA_SET_DESC nest, type/count info and stateful expressions).
 *
 * Returns 0 on success.  On any failure the partially written message is
 * trimmed from @skb and -1 is returned.
 */
static int nf_tables_fill_set(struct sk_buff *skb, const struct nft_ctx *ctx,
			      const struct nft_set *set, u16 event, u16 flags)
{
	/* snapshot fields that are read with READ_ONCE() */
	u64 timeout = READ_ONCE(set->timeout);
	u32 gc_int = READ_ONCE(set->gc_int);
	u32 portid = ctx->portid;
	struct nlmsghdr *nlh;
	struct nlattr *nest;
	u32 seq = ctx->seq;
	int i;

	nlh = nfnl_msg_put(skb, portid, seq,
			   nfnl_msg_type(NFNL_SUBSYS_NFTABLES, event),
			   flags, ctx->family, NFNETLINK_V0,
			   nft_base_seq(ctx->net));
	if (!nlh)
		goto nla_put_failure;

	if (nla_put_string(skb, NFTA_SET_TABLE, ctx->table->name))
		goto nla_put_failure;
	if (nla_put_string(skb, NFTA_SET_NAME, set->name))
		goto nla_put_failure;
	if (nla_put_be64(skb, NFTA_SET_HANDLE, cpu_to_be64(set->handle),
			 NFTA_SET_PAD))
		goto nla_put_failure;

	/* Deletion events only identify the set. */
	if (event == NFT_MSG_DELSET ||
	    event == NFT_MSG_DESTROYSET) {
		nlmsg_end(skb, nlh);
		return 0;
	}

	if (set->flags != 0)
		if (nla_put_be32(skb, NFTA_SET_FLAGS, htonl(set->flags)))
			goto nla_put_failure;

	if (nla_put_be32(skb, NFTA_SET_KEY_TYPE, htonl(set->ktype)))
		goto nla_put_failure;
	if (nla_put_be32(skb, NFTA_SET_KEY_LEN, htonl(set->klen)))
		goto nla_put_failure;
	if (set->flags & NFT_SET_MAP) {
		if (nla_put_be32(skb, NFTA_SET_DATA_TYPE, htonl(set->dtype)))
			goto nla_put_failure;
		if (nla_put_be32(skb, NFTA_SET_DATA_LEN, htonl(set->dlen)))
			goto nla_put_failure;
	}
	if (set->flags & NFT_SET_OBJECT &&
	    nla_put_be32(skb, NFTA_SET_OBJ_TYPE, htonl(set->objtype)))
		goto nla_put_failure;

	if (timeout &&
	    nla_put_be64(skb, NFTA_SET_TIMEOUT,
			 nf_jiffies64_to_msecs(timeout),
			 NFTA_SET_PAD))
		goto nla_put_failure;
	if (gc_int &&
	    nla_put_be32(skb, NFTA_SET_GC_INTERVAL, htonl(gc_int)))
		goto nla_put_failure;

	/* NFT_SET_POL_PERFORMANCE is not dumped explicitly. */
	if (set->policy != NFT_SET_POL_PERFORMANCE) {
		if (nla_put_be32(skb, NFTA_SET_POLICY, htonl(set->policy)))
			goto nla_put_failure;
	}

	if (set->udata &&
	    nla_put(skb, NFTA_SET_USERDATA, set->udlen, set->udata))
		goto nla_put_failure;

	nest = nla_nest_start_noflag(skb, NFTA_SET_DESC);
	if (!nest)
		goto nla_put_failure;
	if (set->size &&
	    nla_put_be32(skb, NFTA_SET_DESC_SIZE,
			 htonl(nft_set_userspace_size(set->ops, set->size))))
		goto nla_put_failure;

	/* The concat description is only emitted for multi-field keys. */
	if (set->field_count > 1 &&
	    nf_tables_fill_set_concat(skb, set))
		goto nla_put_failure;

	nla_nest_end(skb, nest);

	if (nf_tables_fill_set_info(skb, set))
		goto nla_put_failure;

	/* A single expression uses NFTA_SET_EXPR, several use the
	 * NFTA_SET_EXPRESSIONS list.
	 */
	if (set->num_exprs == 1) {
		nest = nla_nest_start_noflag(skb, NFTA_SET_EXPR);
		/* Do not hand a NULL nest to nla_nest_end() below; check it
		 * the same way as every other nest in this function.
		 */
		if (!nest)
			goto nla_put_failure;
		if (nf_tables_fill_expr_info(skb, set->exprs[0], false) < 0)
			goto nla_put_failure;

		nla_nest_end(skb, nest);
	} else if (set->num_exprs > 1) {
		nest = nla_nest_start_noflag(skb, NFTA_SET_EXPRESSIONS);
		if (nest == NULL)
			goto nla_put_failure;

		for (i = 0; i < set->num_exprs; i++) {
			if (nft_expr_dump(skb, NFTA_LIST_ELEM,
					  set->exprs[i], false) < 0)
				goto nla_put_failure;
		}
		nla_nest_end(skb, nest);
	}

	nlmsg_end(skb, nlh);
	return 0;

nla_put_failure:
	nlmsg_trim(skb, nlh);
	return -1;
}
4987
/*
 * Queue a notification about @set for @event.
 *
 * Does nothing when the request did not ask for a report and nobody
 * listens on NFNLGRP_NFTABLES.  If the message cannot be allocated or
 * filled, -ENOBUFS is signalled through nfnetlink_set_err() instead.
 */
static void nf_tables_set_notify(const struct nft_ctx *ctx,
				 const struct nft_set *set, int event,
				 gfp_t gfp_flags)
{
	struct nftables_pernet *nft_net = nft_pernet(ctx->net);
	/* only NLM_F_CREATE and NLM_F_EXCL are carried over */
	u16 flags = ctx->flags & (NLM_F_CREATE | NLM_F_EXCL);
	u32 portid = ctx->portid;
	struct sk_buff *skb;

	if (!ctx->report &&
	    !nfnetlink_has_listeners(ctx->net, NFNLGRP_NFTABLES))
		return;

	skb = nlmsg_new(NLMSG_GOODSIZE, gfp_flags);
	if (skb != NULL) {
		if (nf_tables_fill_set(skb, ctx, set, event, flags) >= 0) {
			nft_notify_enqueue(skb, ctx->report,
					   &nft_net->notify_list);
			return;
		}
		kfree_skb(skb);
	}

	nfnetlink_set_err(ctx->net, portid, NFNLGRP_NFTABLES, -ENOBUFS);
}
5020
/*
 * Netlink dump callback: emit one NFT_MSG_NEWSET message per active set.
 *
 * cb->data holds a struct nft_ctx whose family/table fields act as filters
 * (NFPROTO_UNSPEC / NULL table mean "any").  Resume state is kept in
 * cb->args:
 *   args[0] - index of the set within the table at which to resume
 *   args[1] - non-zero once the dump is complete
 *   args[2] - table that was being dumped when the skb filled up
 *
 * Returns skb->len, as is usual for dump callbacks.
 */
static int nf_tables_dump_sets(struct sk_buff *skb, struct netlink_callback *cb)
{
	const struct nft_set *set;
	unsigned int idx, s_idx = cb->args[0];
	/* the saved table pointer is only compared, never dereferenced */
	struct nft_table *table, *cur_table = (struct nft_table *)cb->args[2];
	struct net *net = sock_net(skb->sk);
	struct nft_ctx *ctx = cb->data, ctx_set;
	struct nftables_pernet *nft_net;

	if (cb->args[1])
		return skb->len;

	rcu_read_lock();
	nft_net = nft_pernet(net);
	cb->seq = READ_ONCE(nft_net->base_seq);

	list_for_each_entry_rcu(table, &nft_net->tables, list) {
		if (ctx->family != NFPROTO_UNSPEC &&
		    ctx->family != table->family)
			continue;

		if (ctx->table && ctx->table != table)
			continue;

		/* When resuming, skip ahead to the table we stopped in. */
		if (cur_table) {
			if (cur_table != table)
				continue;

			cur_table = NULL;
		}
		idx = 0;
		list_for_each_entry_rcu(set, &table->sets, list) {
			if (idx < s_idx)
				goto cont;
			if (!nft_is_active(net, set))
				goto cont;

			/* per-set copy of the context carrying the table and
			 * family actually being dumped
			 */
			ctx_set = *ctx;
			ctx_set.table = table;
			ctx_set.family = table->family;

			if (nf_tables_fill_set(skb, &ctx_set, set,
					       NFT_MSG_NEWSET,
					       NLM_F_MULTI) < 0) {
				/* skb is full: remember where to resume */
				cb->args[0] = idx;
				cb->args[2] = (unsigned long) table;
				goto done;
			}
			nl_dump_check_consistent(cb, nlmsg_hdr(skb));
cont:
			idx++;
		}
		/* the start index only applies to the resumed table */
		if (s_idx)
			s_idx = 0;
	}
	cb->args[1] = 1;
done:
	rcu_read_unlock();
	return skb->len;
}
5081
nf_tables_dump_sets_start(struct netlink_callback * cb)5082 static int nf_tables_dump_sets_start(struct netlink_callback *cb)
5083 {
5084 struct nft_ctx *ctx_dump = NULL;
5085
5086 ctx_dump = kmemdup(cb->data, sizeof(*ctx_dump), GFP_ATOMIC);
5087 if (ctx_dump == NULL)
5088 return -ENOMEM;
5089
5090 cb->data = ctx_dump;
5091 return 0;
5092 }
5093
nf_tables_dump_sets_done(struct netlink_callback * cb)5094 static int nf_tables_dump_sets_done(struct netlink_callback *cb)
5095 {
5096 kfree(cb->data);
5097 return 0;
5098 }
5099
5100 /* called with rcu_read_lock held */
nf_tables_getset(struct sk_buff * skb,const struct nfnl_info * info,const struct nlattr * const nla[])5101 static int nf_tables_getset(struct sk_buff *skb, const struct nfnl_info *info,
5102 const struct nlattr * const nla[])
5103 {
5104 struct netlink_ext_ack *extack = info->extack;
5105 u8 genmask = nft_genmask_cur(info->net);
5106 u8 family = info->nfmsg->nfgen_family;
5107 struct nft_table *table = NULL;
5108 struct net *net = info->net;
5109 const struct nft_set *set;
5110 struct sk_buff *skb2;
5111 struct nft_ctx ctx;
5112 int err;
5113
5114 if (nla[NFTA_SET_TABLE]) {
5115 table = nft_table_lookup(net, nla[NFTA_SET_TABLE], family,
5116 genmask, 0);
5117 if (IS_ERR(table)) {
5118 NL_SET_BAD_ATTR(extack, nla[NFTA_SET_TABLE]);
5119 return PTR_ERR(table);
5120 }
5121 }
5122
5123 nft_ctx_init(&ctx, net, skb, info->nlh, family, table, NULL, nla);
5124
5125 if (info->nlh->nlmsg_flags & NLM_F_DUMP) {
5126 struct netlink_dump_control c = {
5127 .start = nf_tables_dump_sets_start,
5128 .dump = nf_tables_dump_sets,
5129 .done = nf_tables_dump_sets_done,
5130 .data = &ctx,
5131 .module = THIS_MODULE,
5132 };
5133
5134 return nft_netlink_dump_start_rcu(info->sk, skb, info->nlh, &c);
5135 }
5136
5137 /* Only accept unspec with dump */
5138 if (info->nfmsg->nfgen_family == NFPROTO_UNSPEC)
5139 return -EAFNOSUPPORT;
5140 if (!nla[NFTA_SET_TABLE])
5141 return -EINVAL;
5142
5143 set = nft_set_lookup(net, table, nla[NFTA_SET_NAME], genmask);
5144 if (IS_ERR(set)) {
5145 NL_SET_BAD_ATTR(extack, nla[NFTA_SET_NAME]);
5146 return PTR_ERR(set);
5147 }
5148
5149 skb2 = alloc_skb(NLMSG_GOODSIZE, GFP_ATOMIC);
5150 if (skb2 == NULL)
5151 return -ENOMEM;
5152
5153 err = nf_tables_fill_set(skb2, &ctx, set, NFT_MSG_NEWSET, 0);
5154 if (err < 0)
5155 goto err_fill_set_info;
5156
5157 return nfnetlink_unicast(skb2, net, NETLINK_CB(skb).portid);
5158
5159 err_fill_set_info:
5160 kfree_skb(skb2);
5161 return err;
5162 }
5163
nft_set_desc_concat_parse(const struct nlattr * attr,struct nft_set_desc * desc)5164 static int nft_set_desc_concat_parse(const struct nlattr *attr,
5165 struct nft_set_desc *desc)
5166 {
5167 struct nlattr *tb[NFTA_SET_FIELD_MAX + 1];
5168 u32 len;
5169 int err;
5170
5171 if (desc->field_count >= ARRAY_SIZE(desc->field_len))
5172 return -E2BIG;
5173
5174 err = nla_parse_nested_deprecated(tb, NFTA_SET_FIELD_MAX, attr,
5175 nft_concat_policy, NULL);
5176 if (err < 0)
5177 return err;
5178
5179 if (!tb[NFTA_SET_FIELD_LEN])
5180 return -EINVAL;
5181
5182 len = ntohl(nla_get_be32(tb[NFTA_SET_FIELD_LEN]));
5183 if (!len || len > U8_MAX)
5184 return -EINVAL;
5185
5186 desc->field_len[desc->field_count++] = len;
5187
5188 return 0;
5189 }
5190
nft_set_desc_concat(struct nft_set_desc * desc,const struct nlattr * nla)5191 static int nft_set_desc_concat(struct nft_set_desc *desc,
5192 const struct nlattr *nla)
5193 {
5194 u32 len = 0, num_regs;
5195 struct nlattr *attr;
5196 int rem, err, i;
5197
5198 nla_for_each_nested(attr, nla, rem) {
5199 if (nla_type(attr) != NFTA_LIST_ELEM)
5200 return -EINVAL;
5201
5202 err = nft_set_desc_concat_parse(attr, desc);
5203 if (err < 0)
5204 return err;
5205 }
5206
5207 for (i = 0; i < desc->field_count; i++)
5208 len += round_up(desc->field_len[i], sizeof(u32));
5209
5210 if (len != desc->klen)
5211 return -EINVAL;
5212
5213 num_regs = DIV_ROUND_UP(desc->klen, sizeof(u32));
5214 if (num_regs > NFT_REG32_COUNT)
5215 return -E2BIG;
5216
5217 return 0;
5218 }
5219
nf_tables_set_desc_parse(struct nft_set_desc * desc,const struct nlattr * nla)5220 static int nf_tables_set_desc_parse(struct nft_set_desc *desc,
5221 const struct nlattr *nla)
5222 {
5223 struct nlattr *da[NFTA_SET_DESC_MAX + 1];
5224 int err;
5225
5226 err = nla_parse_nested_deprecated(da, NFTA_SET_DESC_MAX, nla,
5227 nft_set_desc_policy, NULL);
5228 if (err < 0)
5229 return err;
5230
5231 if (da[NFTA_SET_DESC_SIZE] != NULL)
5232 desc->size = ntohl(nla_get_be32(da[NFTA_SET_DESC_SIZE]));
5233 if (da[NFTA_SET_DESC_CONCAT])
5234 err = nft_set_desc_concat(desc, da[NFTA_SET_DESC_CONCAT]);
5235
5236 return err;
5237 }
5238
/*
 * Allocate the stateful expressions attached to a set.
 *
 * Either a single NFTA_SET_EXPR or a list in NFTA_SET_EXPRESSIONS is
 * accepted; the list form requires NFT_SET_EXPR in @flags and holds at most
 * NFT_SET_EXPR_MAX entries.  Expressions are stored in @exprs and counted
 * in *@num_exprs.
 *
 * Returns 0 on success.  On error every expression counted in *@num_exprs
 * is destroyed and a negative errno is returned.
 */
static int nft_set_expr_alloc(struct nft_ctx *ctx, struct nft_set *set,
			      const struct nlattr * const *nla,
			      struct nft_expr **exprs, int *num_exprs,
			      u32 flags)
{
	struct nft_expr *expr;
	struct nlattr *tmp;
	int err, left, i;

	if (nla[NFTA_SET_EXPR]) {
		expr = nft_set_elem_expr_alloc(ctx, set, nla[NFTA_SET_EXPR]);
		if (IS_ERR(expr)) {
			err = PTR_ERR(expr);
			goto err_set_expr_alloc;
		}
		exprs[0] = expr;
		(*num_exprs)++;

		return 0;
	}

	if (!nla[NFTA_SET_EXPRESSIONS])
		return 0;

	if (!(flags & NFT_SET_EXPR)) {
		err = -EINVAL;
		goto err_set_expr_alloc;
	}

	i = 0;
	nla_for_each_nested(tmp, nla[NFTA_SET_EXPRESSIONS], left) {
		if (i == NFT_SET_EXPR_MAX) {
			err = -E2BIG;
			goto err_set_expr_alloc;
		}
		if (nla_type(tmp) != NFTA_LIST_ELEM) {
			err = -EINVAL;
			goto err_set_expr_alloc;
		}

		expr = nft_set_elem_expr_alloc(ctx, set, tmp);
		if (IS_ERR(expr)) {
			err = PTR_ERR(expr);
			goto err_set_expr_alloc;
		}

		exprs[i] = expr;
		i++;
		(*num_exprs)++;
	}

	return 0;

err_set_expr_alloc:
	for (i = 0; i < *num_exprs; i++)
		nft_expr_destroy(ctx, exprs[i]);

	return err;
}
5291
nft_set_is_same(const struct nft_set * set,const struct nft_set_desc * desc,struct nft_expr * exprs[],u32 num_exprs,u32 flags)5292 static bool nft_set_is_same(const struct nft_set *set,
5293 const struct nft_set_desc *desc,
5294 struct nft_expr *exprs[], u32 num_exprs, u32 flags)
5295 {
5296 int i;
5297
5298 if (set->ktype != desc->ktype ||
5299 set->dtype != desc->dtype ||
5300 set->flags != flags ||
5301 set->klen != desc->klen ||
5302 set->dlen != desc->dlen ||
5303 set->field_count != desc->field_count ||
5304 set->num_exprs != num_exprs)
5305 return false;
5306
5307 for (i = 0; i < desc->field_count; i++) {
5308 if (set->field_len[i] != desc->field_len[i])
5309 return false;
5310 }
5311
5312 for (i = 0; i < num_exprs; i++) {
5313 if (set->exprs[i]->ops != exprs[i]->ops)
5314 return false;
5315 }
5316
5317 return true;
5318 }
5319
nft_set_kernel_size(const struct nft_set_ops * ops,const struct nft_set_desc * desc)5320 static u32 nft_set_kernel_size(const struct nft_set_ops *ops,
5321 const struct nft_set_desc *desc)
5322 {
5323 if (ops->ksize)
5324 return ops->ksize(desc->size);
5325
5326 return desc->size;
5327 }
5328
/*
 * Handle a "new set" netlink request.
 *
 * The function first validates the request attributes into a local
 * struct nft_set_desc, then looks up the table and the set name:
 *
 *  - if the set already exists, the request is only accepted when it
 *    describes the same set (see nft_set_is_same()), in which case a
 *    transaction is queued through __nft_trans_set_add();
 *  - otherwise, with NLM_F_CREATE, a new set is allocated, initialised
 *    through the selected backend ops, queued as a transaction and linked
 *    into table->sets.
 *
 * Returns 0 on success or a negative errno.
 */
static int nf_tables_newset(struct sk_buff *skb, const struct nfnl_info *info,
			    const struct nlattr * const nla[])
{
	struct netlink_ext_ack *extack = info->extack;
	u8 genmask = nft_genmask_next(info->net);
	u8 family = info->nfmsg->nfgen_family;
	const struct nft_set_ops *ops;
	struct net *net = info->net;
	struct nft_set_desc desc;
	struct nft_table *table;
	unsigned char *udata;
	struct nft_set *set;
	struct nft_ctx ctx;
	size_t alloc_size;
	int num_exprs = 0;
	char *name;
	int err, i;
	u16 udlen;
	u32 flags;
	u64 size;

	/* Table, name, key length and set ID are mandatory. */
	if (nla[NFTA_SET_TABLE] == NULL ||
	    nla[NFTA_SET_NAME] == NULL ||
	    nla[NFTA_SET_KEY_LEN] == NULL ||
	    nla[NFTA_SET_ID] == NULL)
		return -EINVAL;

	memset(&desc, 0, sizeof(desc));

	/* Key type defaults to NFT_DATA_VALUE; reserved types are refused. */
	desc.ktype = NFT_DATA_VALUE;
	if (nla[NFTA_SET_KEY_TYPE] != NULL) {
		desc.ktype = ntohl(nla_get_be32(nla[NFTA_SET_KEY_TYPE]));
		if ((desc.ktype & NFT_DATA_RESERVED_MASK) == NFT_DATA_RESERVED_MASK)
			return -EINVAL;
	}

	desc.klen = ntohl(nla_get_be32(nla[NFTA_SET_KEY_LEN]));
	if (desc.klen == 0 || desc.klen > NFT_DATA_VALUE_MAXLEN)
		return -EINVAL;

	flags = 0;
	if (nla[NFTA_SET_FLAGS] != NULL) {
		flags = ntohl(nla_get_be32(nla[NFTA_SET_FLAGS]));
		/* Unknown flag bits are not supported. */
		if (flags & ~(NFT_SET_ANONYMOUS | NFT_SET_CONSTANT |
			      NFT_SET_INTERVAL | NFT_SET_TIMEOUT |
			      NFT_SET_MAP | NFT_SET_EVAL |
			      NFT_SET_OBJECT | NFT_SET_CONCAT | NFT_SET_EXPR))
			return -EOPNOTSUPP;
		/* Only one of these operations is supported */
		if ((flags & (NFT_SET_MAP | NFT_SET_OBJECT)) ==
			     (NFT_SET_MAP | NFT_SET_OBJECT))
			return -EOPNOTSUPP;
		if ((flags & (NFT_SET_EVAL | NFT_SET_OBJECT)) ==
			     (NFT_SET_EVAL | NFT_SET_OBJECT))
			return -EOPNOTSUPP;
		/* Anonymous + timeout is refused unless NFT_SET_EVAL is set too. */
		if ((flags & (NFT_SET_ANONYMOUS | NFT_SET_TIMEOUT | NFT_SET_EVAL)) ==
			     (NFT_SET_ANONYMOUS | NFT_SET_TIMEOUT))
			return -EOPNOTSUPP;
		if ((flags & (NFT_SET_CONSTANT | NFT_SET_TIMEOUT)) ==
			     (NFT_SET_CONSTANT | NFT_SET_TIMEOUT))
			return -EOPNOTSUPP;
	}

	/* A data type is required for, and only allowed with, NFT_SET_MAP. */
	desc.dtype = 0;
	if (nla[NFTA_SET_DATA_TYPE] != NULL) {
		if (!(flags & NFT_SET_MAP))
			return -EINVAL;

		desc.dtype = ntohl(nla_get_be32(nla[NFTA_SET_DATA_TYPE]));
		if ((desc.dtype & NFT_DATA_RESERVED_MASK) == NFT_DATA_RESERVED_MASK &&
		    desc.dtype != NFT_DATA_VERDICT)
			return -EINVAL;

		/* Verdict maps have a fixed data length; others must supply one. */
		if (desc.dtype != NFT_DATA_VERDICT) {
			if (nla[NFTA_SET_DATA_LEN] == NULL)
				return -EINVAL;
			desc.dlen = ntohl(nla_get_be32(nla[NFTA_SET_DATA_LEN]));
			if (desc.dlen == 0 || desc.dlen > NFT_DATA_VALUE_MAXLEN)
				return -EINVAL;
		} else
			desc.dlen = sizeof(struct nft_verdict);
	} else if (flags & NFT_SET_MAP)
		return -EINVAL;

	/* An object type is required for, and only allowed with, NFT_SET_OBJECT. */
	if (nla[NFTA_SET_OBJ_TYPE] != NULL) {
		if (!(flags & NFT_SET_OBJECT))
			return -EINVAL;

		desc.objtype = ntohl(nla_get_be32(nla[NFTA_SET_OBJ_TYPE]));
		if (desc.objtype == NFT_OBJECT_UNSPEC ||
		    desc.objtype > NFT_OBJECT_MAX)
			return -EOPNOTSUPP;
	} else if (flags & NFT_SET_OBJECT)
		return -EINVAL;
	else
		desc.objtype = NFT_OBJECT_UNSPEC;

	/* Timeout and GC interval need NFT_SET_TIMEOUT and a named set. */
	desc.timeout = 0;
	if (nla[NFTA_SET_TIMEOUT] != NULL) {
		if (!(flags & NFT_SET_TIMEOUT))
			return -EINVAL;

		if (flags & NFT_SET_ANONYMOUS)
			return -EOPNOTSUPP;

		err = nf_msecs_to_jiffies64(nla[NFTA_SET_TIMEOUT], &desc.timeout);
		if (err)
			return err;
	}
	desc.gc_int = 0;
	if (nla[NFTA_SET_GC_INTERVAL] != NULL) {
		if (!(flags & NFT_SET_TIMEOUT))
			return -EINVAL;

		if (flags & NFT_SET_ANONYMOUS)
			return -EOPNOTSUPP;

		desc.gc_int = ntohl(nla_get_be32(nla[NFTA_SET_GC_INTERVAL]));
	}

	desc.policy = NFT_SET_POL_PERFORMANCE;
	if (nla[NFTA_SET_POLICY] != NULL) {
		desc.policy = ntohl(nla_get_be32(nla[NFTA_SET_POLICY]));
		switch (desc.policy) {
		case NFT_SET_POL_PERFORMANCE:
		case NFT_SET_POL_MEMORY:
			break;
		default:
			return -EOPNOTSUPP;
		}
	}

	/*
	 * NFT_SET_CONCAT must be set if and only if the description carries
	 * more than one field.
	 */
	if (nla[NFTA_SET_DESC] != NULL) {
		err = nf_tables_set_desc_parse(&desc, nla[NFTA_SET_DESC]);
		if (err < 0)
			return err;

		if (desc.field_count > 1) {
			if (!(flags & NFT_SET_CONCAT))
				return -EINVAL;
		} else if (flags & NFT_SET_CONCAT) {
			return -EINVAL;
		}
	} else if (flags & NFT_SET_CONCAT) {
		return -EINVAL;
	}

	if (nla[NFTA_SET_EXPR] || nla[NFTA_SET_EXPRESSIONS])
		desc.expr = true;

	table = nft_table_lookup(net, nla[NFTA_SET_TABLE], family, genmask,
				 NETLINK_CB(skb).portid);
	if (IS_ERR(table)) {
		NL_SET_BAD_ATTR(extack, nla[NFTA_SET_TABLE]);
		return PTR_ERR(table);
	}

	nft_ctx_init(&ctx, net, skb, info->nlh, family, table, NULL, nla);

	set = nft_set_lookup(net, table, nla[NFTA_SET_NAME], genmask);
	if (IS_ERR(set)) {
		/* -ENOENT means "create it below"; anything else is fatal. */
		if (PTR_ERR(set) != -ENOENT) {
			NL_SET_BAD_ATTR(extack, nla[NFTA_SET_NAME]);
			return PTR_ERR(set);
		}
	} else {
		/* The set already exists: check the request against it. */
		struct nft_expr *exprs[NFT_SET_EXPR_MAX] = {};

		if (info->nlh->nlmsg_flags & NLM_F_EXCL) {
			NL_SET_BAD_ATTR(extack, nla[NFTA_SET_NAME]);
			return -EEXIST;
		}
		if (info->nlh->nlmsg_flags & NLM_F_REPLACE)
			return -EOPNOTSUPP;

		if (nft_set_is_anonymous(set))
			return -EOPNOTSUPP;

		/* Temporary expressions, used only for the comparison below. */
		err = nft_set_expr_alloc(&ctx, set, nla, exprs, &num_exprs, flags);
		if (err < 0)
			return err;

		if (desc.size)
			desc.size = nft_set_kernel_size(set->ops, &desc);

		err = 0;
		if (!nft_set_is_same(set, &desc, exprs, num_exprs, flags)) {
			NL_SET_BAD_ATTR(extack, nla[NFTA_SET_NAME]);
			err = -EEXIST;
		}

		for (i = 0; i < num_exprs; i++)
			nft_expr_destroy(&ctx, exprs[i]);

		if (err < 0)
			return err;

		return __nft_trans_set_add(&ctx, NFT_MSG_NEWSET, set, &desc);
	}

	if (!(info->nlh->nlmsg_flags & NLM_F_CREATE))
		return -ENOENT;

	ops = nft_select_set_ops(&ctx, flags, &desc);
	if (IS_ERR(ops))
		return PTR_ERR(ops);

	if (desc.size)
		desc.size = nft_set_kernel_size(ops, &desc);

	udlen = 0;
	if (nla[NFTA_SET_USERDATA])
		udlen = nla_len(nla[NFTA_SET_USERDATA]);

	/*
	 * The allocation holds the set header, the backend private area and
	 * the user data. Reject sizes that wrapped or exceed INT_MAX.
	 */
	size = 0;
	if (ops->privsize != NULL)
		size = ops->privsize(nla, &desc);
	alloc_size = sizeof(*set) + size + udlen;
	if (alloc_size < size || alloc_size > INT_MAX)
		return -ENOMEM;

	/* Table use count is taken here and dropped again at err_alloc. */
	if (!nft_use_inc(&table->use))
		return -EMFILE;

	set = kvzalloc(alloc_size, GFP_KERNEL_ACCOUNT);
	if (!set) {
		err = -ENOMEM;
		goto err_alloc;
	}

	name = nla_strdup(nla[NFTA_SET_NAME], GFP_KERNEL_ACCOUNT);
	if (!name) {
		err = -ENOMEM;
		goto err_set_name;
	}

	/* The temporary copy is freed whether or not naming succeeded. */
	err = nf_tables_set_alloc_name(&ctx, set, name);
	kfree(name);
	if (err < 0)
		goto err_set_name;

	/* User data lives right after the backend private area. */
	udata = NULL;
	if (udlen) {
		udata = set->data + size;
		nla_memcpy(udata, nla[NFTA_SET_USERDATA], udlen);
	}

	INIT_LIST_HEAD(&set->bindings);
	INIT_LIST_HEAD(&set->catchall_list);
	refcount_set(&set->refs, 1);
	set->table = table;
	write_pnet(&set->net, net);
	set->ops = ops;
	set->ktype = desc.ktype;
	set->klen = desc.klen;
	set->dtype = desc.dtype;
	set->objtype = desc.objtype;
	set->dlen = desc.dlen;
	set->flags = flags;
	set->size = desc.size;
	set->policy = desc.policy;
	set->udlen = udlen;
	set->udata = udata;
	set->timeout = desc.timeout;
	set->gc_int = desc.gc_int;

	set->field_count = desc.field_count;
	for (i = 0; i < desc.field_count; i++)
		set->field_len[i] = desc.field_len[i];

	err = ops->init(set, &desc, nla);
	if (err < 0)
		goto err_set_init;

	/*
	 * On failure nft_set_expr_alloc() has already destroyed its own
	 * expressions, hence the jump past err_set_expr_alloc.
	 */
	err = nft_set_expr_alloc(&ctx, set, nla, set->exprs, &num_exprs, flags);
	if (err < 0)
		goto err_set_destroy;

	set->num_exprs = num_exprs;
	set->handle = nf_tables_alloc_handle(table);
	INIT_LIST_HEAD(&set->pending_update);

	err = nft_trans_set_add(&ctx, NFT_MSG_NEWSET, set);
	if (err < 0)
		goto err_set_expr_alloc;

	list_add_tail_rcu(&set->list, &table->sets);

	return 0;

	/* Unwind in reverse order of construction. */
err_set_expr_alloc:
	for (i = 0; i < set->num_exprs; i++)
		nft_expr_destroy(&ctx, set->exprs[i]);
err_set_destroy:
	ops->destroy(&ctx, set);
err_set_init:
	kfree(set->name);
err_set_name:
	kvfree(set);
err_alloc:
	nft_use_dec_restore(&table->use);

	return err;
}
5633
nft_set_catchall_destroy(const struct nft_ctx * ctx,struct nft_set * set)5634 static void nft_set_catchall_destroy(const struct nft_ctx *ctx,
5635 struct nft_set *set)
5636 {
5637 struct nft_set_elem_catchall *next, *catchall;
5638
5639 list_for_each_entry_safe(catchall, next, &set->catchall_list, list) {
5640 list_del_rcu(&catchall->list);
5641 nf_tables_set_elem_destroy(ctx, set, catchall->elem);
5642 kfree_rcu(catchall, rcu);
5643 }
5644 }
5645
nft_set_put(struct nft_set * set)5646 static void nft_set_put(struct nft_set *set)
5647 {
5648 if (refcount_dec_and_test(&set->refs)) {
5649 kfree(set->name);
5650 kvfree(set);
5651 }
5652 }
5653
nft_set_destroy(const struct nft_ctx * ctx,struct nft_set * set)5654 static void nft_set_destroy(const struct nft_ctx *ctx, struct nft_set *set)
5655 {
5656 int i;
5657
5658 if (WARN_ON(set->use > 0))
5659 return;
5660
5661 for (i = 0; i < set->num_exprs; i++)
5662 nft_expr_destroy(ctx, set->exprs[i]);
5663
5664 set->ops->destroy(ctx, set);
5665 nft_set_catchall_destroy(ctx, set);
5666 nft_set_put(set);
5667 }
5668
nf_tables_delset(struct sk_buff * skb,const struct nfnl_info * info,const struct nlattr * const nla[])5669 static int nf_tables_delset(struct sk_buff *skb, const struct nfnl_info *info,
5670 const struct nlattr * const nla[])
5671 {
5672 struct netlink_ext_ack *extack = info->extack;
5673 u8 genmask = nft_genmask_next(info->net);
5674 u8 family = info->nfmsg->nfgen_family;
5675 struct net *net = info->net;
5676 const struct nlattr *attr;
5677 struct nft_table *table;
5678 struct nft_set *set;
5679 struct nft_ctx ctx;
5680
5681 if (info->nfmsg->nfgen_family == NFPROTO_UNSPEC)
5682 return -EAFNOSUPPORT;
5683
5684 table = nft_table_lookup(net, nla[NFTA_SET_TABLE], family,
5685 genmask, NETLINK_CB(skb).portid);
5686 if (IS_ERR(table)) {
5687 NL_SET_BAD_ATTR(extack, nla[NFTA_SET_TABLE]);
5688 return PTR_ERR(table);
5689 }
5690
5691 if (nla[NFTA_SET_HANDLE]) {
5692 attr = nla[NFTA_SET_HANDLE];
5693 set = nft_set_lookup_byhandle(table, attr, genmask);
5694 } else {
5695 attr = nla[NFTA_SET_NAME];
5696 set = nft_set_lookup(net, table, attr, genmask);
5697 }
5698
5699 if (IS_ERR(set)) {
5700 if (PTR_ERR(set) == -ENOENT &&
5701 NFNL_MSG_TYPE(info->nlh->nlmsg_type) == NFT_MSG_DESTROYSET)
5702 return 0;
5703
5704 NL_SET_BAD_ATTR(extack, attr);
5705 return PTR_ERR(set);
5706 }
5707 if (set->use ||
5708 (info->nlh->nlmsg_flags & NLM_F_NONREC &&
5709 atomic_read(&set->nelems) > 0)) {
5710 NL_SET_BAD_ATTR(extack, attr);
5711 return -EBUSY;
5712 }
5713
5714 nft_ctx_init(&ctx, net, skb, info->nlh, family, table, NULL, nla);
5715
5716 return nft_delset(&ctx, set);
5717 }
5718
5719 static int nft_validate_register_store(const struct nft_ctx *ctx,
5720 enum nft_registers reg,
5721 const struct nft_data *data,
5722 enum nft_data_types type,
5723 unsigned int len);
5724
nft_setelem_data_validate(const struct nft_ctx * ctx,struct nft_set * set,struct nft_elem_priv * elem_priv)5725 static int nft_setelem_data_validate(const struct nft_ctx *ctx,
5726 struct nft_set *set,
5727 struct nft_elem_priv *elem_priv)
5728 {
5729 const struct nft_set_ext *ext = nft_set_elem_ext(set, elem_priv);
5730 enum nft_registers dreg;
5731
5732 dreg = nft_type_to_reg(set->dtype);
5733 return nft_validate_register_store(ctx, dreg, nft_set_ext_data(ext),
5734 set->dtype == NFT_DATA_VERDICT ?
5735 NFT_DATA_VERDICT : NFT_DATA_VALUE,
5736 set->dlen);
5737 }
5738
nf_tables_bind_check_setelem(const struct nft_ctx * ctx,struct nft_set * set,const struct nft_set_iter * iter,struct nft_elem_priv * elem_priv)5739 static int nf_tables_bind_check_setelem(const struct nft_ctx *ctx,
5740 struct nft_set *set,
5741 const struct nft_set_iter *iter,
5742 struct nft_elem_priv *elem_priv)
5743 {
5744 const struct nft_set_ext *ext = nft_set_elem_ext(set, elem_priv);
5745
5746 if (!nft_set_elem_active(ext, iter->genmask))
5747 return 0;
5748
5749 return nft_setelem_data_validate(ctx, set, elem_priv);
5750 }
5751
nft_set_catchall_bind_check(const struct nft_ctx * ctx,struct nft_set * set)5752 static int nft_set_catchall_bind_check(const struct nft_ctx *ctx,
5753 struct nft_set *set)
5754 {
5755 u8 genmask = nft_genmask_next(ctx->net);
5756 struct nft_set_elem_catchall *catchall;
5757 struct nft_set_ext *ext;
5758 int ret = 0;
5759
5760 list_for_each_entry_rcu(catchall, &set->catchall_list, list,
5761 lockdep_commit_lock_is_held(ctx->net)) {
5762 ext = nft_set_elem_ext(set, catchall->elem);
5763 if (!nft_set_elem_active(ext, genmask))
5764 continue;
5765
5766 ret = nft_setelem_data_validate(ctx, set, catchall->elem);
5767 if (ret < 0)
5768 break;
5769 }
5770
5771 return ret;
5772 }
5773
nf_tables_bind_set(const struct nft_ctx * ctx,struct nft_set * set,struct nft_set_binding * binding)5774 int nf_tables_bind_set(const struct nft_ctx *ctx, struct nft_set *set,
5775 struct nft_set_binding *binding)
5776 {
5777 struct nft_set_binding *i;
5778 struct nft_set_iter iter;
5779
5780 if (!list_empty(&set->bindings) && nft_set_is_anonymous(set))
5781 return -EBUSY;
5782
5783 if (binding->flags & NFT_SET_MAP) {
5784 /* If the set is already bound to the same chain all
5785 * jumps are already validated for that chain.
5786 */
5787 list_for_each_entry(i, &set->bindings, list) {
5788 if (i->flags & NFT_SET_MAP &&
5789 i->chain == binding->chain)
5790 goto bind;
5791 }
5792
5793 iter.genmask = nft_genmask_next(ctx->net);
5794 iter.type = NFT_ITER_UPDATE;
5795 iter.skip = 0;
5796 iter.count = 0;
5797 iter.err = 0;
5798 iter.fn = nf_tables_bind_check_setelem;
5799
5800 set->ops->walk(ctx, set, &iter);
5801 if (!iter.err)
5802 iter.err = nft_set_catchall_bind_check(ctx, set);
5803
5804 if (iter.err < 0)
5805 return iter.err;
5806 }
5807 bind:
5808 if (!nft_use_inc(&set->use))
5809 return -EMFILE;
5810
5811 binding->chain = ctx->chain;
5812 list_add_tail_rcu(&binding->list, &set->bindings);
5813 nft_set_trans_bind(ctx, set);
5814
5815 return 0;
5816 }
5817 EXPORT_SYMBOL_GPL(nf_tables_bind_set);
5818
/*
 * Remove @binding from its set. If that leaves an anonymous set without
 * any binding, the set is unlinked from its list, marked dead and, when
 * @event is true, a NFT_MSG_DELSET notification is sent.
 */
static void nf_tables_unbind_set(const struct nft_ctx *ctx, struct nft_set *set,
				 struct nft_set_binding *binding, bool event)
{
	list_del_rcu(&binding->list);

	if (!list_empty(&set->bindings) || !nft_set_is_anonymous(set))
		return;

	list_del_rcu(&set->list);
	set->dead = 1;

	if (!event)
		return;

	nf_tables_set_notify(ctx, set, NFT_MSG_DELSET, GFP_KERNEL);
}
5832
5833 static void nft_setelem_data_activate(const struct net *net,
5834 const struct nft_set *set,
5835 struct nft_elem_priv *elem_priv);
5836
nft_mapelem_activate(const struct nft_ctx * ctx,struct nft_set * set,const struct nft_set_iter * iter,struct nft_elem_priv * elem_priv)5837 static int nft_mapelem_activate(const struct nft_ctx *ctx,
5838 struct nft_set *set,
5839 const struct nft_set_iter *iter,
5840 struct nft_elem_priv *elem_priv)
5841 {
5842 struct nft_set_ext *ext = nft_set_elem_ext(set, elem_priv);
5843
5844 /* called from abort path, reverse check to undo changes. */
5845 if (nft_set_elem_active(ext, iter->genmask))
5846 return 0;
5847
5848 nft_clear(ctx->net, ext);
5849 nft_setelem_data_activate(ctx->net, set, elem_priv);
5850
5851 return 0;
5852 }
5853
nft_map_catchall_activate(const struct nft_ctx * ctx,struct nft_set * set)5854 static void nft_map_catchall_activate(const struct nft_ctx *ctx,
5855 struct nft_set *set)
5856 {
5857 u8 genmask = nft_genmask_next(ctx->net);
5858 struct nft_set_elem_catchall *catchall;
5859 struct nft_set_ext *ext;
5860
5861 list_for_each_entry(catchall, &set->catchall_list, list) {
5862 ext = nft_set_elem_ext(set, catchall->elem);
5863 if (!nft_set_elem_active(ext, genmask))
5864 continue;
5865
5866 nft_clear(ctx->net, ext);
5867 nft_setelem_data_activate(ctx->net, set, catchall->elem);
5868 break;
5869 }
5870 }
5871
nft_map_activate(const struct nft_ctx * ctx,struct nft_set * set)5872 static void nft_map_activate(const struct nft_ctx *ctx, struct nft_set *set)
5873 {
5874 struct nft_set_iter iter = {
5875 .genmask = nft_genmask_next(ctx->net),
5876 .type = NFT_ITER_UPDATE,
5877 .fn = nft_mapelem_activate,
5878 };
5879
5880 set->ops->walk(ctx, set, &iter);
5881 WARN_ON_ONCE(iter.err);
5882
5883 nft_map_catchall_activate(ctx, set);
5884 }
5885
nf_tables_activate_set(const struct nft_ctx * ctx,struct nft_set * set)5886 void nf_tables_activate_set(const struct nft_ctx *ctx, struct nft_set *set)
5887 {
5888 if (nft_set_is_anonymous(set)) {
5889 if (set->flags & (NFT_SET_MAP | NFT_SET_OBJECT))
5890 nft_map_activate(ctx, set);
5891
5892 nft_clear(ctx->net, set);
5893 }
5894
5895 nft_use_inc_restore(&set->use);
5896 }
5897 EXPORT_SYMBOL_GPL(nf_tables_activate_set);
5898
/*
 * Undo or finalise a set binding according to the transaction @phase.
 *
 * Every explicitly listed phase drops one use count on @set. What else
 * happens depends on the phase:
 *
 *  - NFT_TRANS_PREPARE_ERROR: the transaction bind is undone; an anonymous
 *    set is deactivated for the next generation, any other set only has
 *    @binding unlinked.
 *  - NFT_TRANS_PREPARE: an anonymous set is deactivated for the next
 *    generation (its map elements first, if it is a map or object map).
 *    The binding stays linked.
 *  - NFT_TRANS_ABORT / NFT_TRANS_RELEASE: map elements of an anonymous
 *    map are deactivated, then the binding is removed as in the default
 *    case.
 *  - any other phase: the binding is removed through
 *    nf_tables_unbind_set(), with a notification only for
 *    NFT_TRANS_COMMIT. No use count is dropped on this path.
 *
 * The caller is expected to hold the commit lock (checked with a one-time
 * warning).
 */
void nf_tables_deactivate_set(const struct nft_ctx *ctx, struct nft_set *set,
			      struct nft_set_binding *binding,
			      enum nft_trans_phase phase)
{
	WARN_ON_ONCE(!lockdep_commit_lock_is_held(ctx->net));

	switch (phase) {
	case NFT_TRANS_PREPARE_ERROR:
		nft_set_trans_unbind(ctx, set);
		if (nft_set_is_anonymous(set))
			nft_deactivate_next(ctx->net, set);
		else
			list_del_rcu(&binding->list);

		nft_use_dec(&set->use);
		break;
	case NFT_TRANS_PREPARE:
		if (nft_set_is_anonymous(set)) {
			if (set->flags & (NFT_SET_MAP | NFT_SET_OBJECT))
				nft_map_deactivate(ctx, set);

			nft_deactivate_next(ctx->net, set);
		}
		nft_use_dec(&set->use);
		/* Leaves the function without touching the binding list. */
		return;
	case NFT_TRANS_ABORT:
	case NFT_TRANS_RELEASE:
		if (nft_set_is_anonymous(set) &&
		    set->flags & (NFT_SET_MAP | NFT_SET_OBJECT))
			nft_map_deactivate(ctx, set);

		nft_use_dec(&set->use);
		fallthrough;
	default:
		/* The event flag is only true when phase is NFT_TRANS_COMMIT. */
		nf_tables_unbind_set(ctx, set, binding,
				     phase == NFT_TRANS_COMMIT);
	}
}
EXPORT_SYMBOL_GPL(nf_tables_deactivate_set);
5938
nf_tables_destroy_set(const struct nft_ctx * ctx,struct nft_set * set)5939 void nf_tables_destroy_set(const struct nft_ctx *ctx, struct nft_set *set)
5940 {
5941 if (list_empty(&set->bindings) && nft_set_is_anonymous(set))
5942 nft_set_destroy(ctx, set);
5943 }
5944 EXPORT_SYMBOL_GPL(nf_tables_destroy_set);
5945
/*
 * Per-extension layout description, indexed by NFT_SET_EXT_*.
 *
 * Each entry gives the required alignment of the extension and, for the
 * extensions listed with one, a fixed length. Entries without .len leave
 * it zero-initialised; presumably their length is supplied when the
 * element is laid out (key, data, expressions) - confirm against the
 * users of this table.
 */
const struct nft_set_ext_type nft_set_ext_types[] = {
	[NFT_SET_EXT_KEY]		= {
		.align	= __alignof__(u32),
	},
	[NFT_SET_EXT_DATA]		= {
		.align	= __alignof__(u32),
	},
	[NFT_SET_EXT_EXPRESSIONS]	= {
		.align	= __alignof__(struct nft_set_elem_expr),
	},
	/* Stores a pointer to the referenced object, not the object. */
	[NFT_SET_EXT_OBJREF]		= {
		.len	= sizeof(struct nft_object *),
		.align	= __alignof__(struct nft_object *),
	},
	[NFT_SET_EXT_FLAGS]		= {
		.len	= sizeof(u8),
		.align	= __alignof__(u8),
	},
	[NFT_SET_EXT_TIMEOUT]		= {
		.len	= sizeof(struct nft_timeout),
		.align	= __alignof__(struct nft_timeout),
	},
	/* .len covers struct nft_userdata as declared. */
	[NFT_SET_EXT_USERDATA]		= {
		.len	= sizeof(struct nft_userdata),
		.align	= __alignof__(struct nft_userdata),
	},
	[NFT_SET_EXT_KEY_END]		= {
		.align	= __alignof__(u32),
	},
};
5976
5977 /*
5978 * Set elements
5979 */
5980
/*
 * Netlink validation policy for the attributes of a single set element
 * (NFTA_SET_ELEM_*). User data is bounded by NFT_USERDATA_MAXLEN and the
 * object reference name by NFT_OBJ_MAXNAMELEN - 1; the expression list is
 * a nested array validated against nft_expr_policy.
 */
static const struct nla_policy nft_set_elem_policy[NFTA_SET_ELEM_MAX + 1] = {
	[NFTA_SET_ELEM_KEY]		= { .type = NLA_NESTED },
	[NFTA_SET_ELEM_DATA]		= { .type = NLA_NESTED },
	[NFTA_SET_ELEM_FLAGS]		= { .type = NLA_U32 },
	[NFTA_SET_ELEM_TIMEOUT]		= { .type = NLA_U64 },
	[NFTA_SET_ELEM_EXPIRATION]	= { .type = NLA_U64 },
	[NFTA_SET_ELEM_USERDATA]	= { .type = NLA_BINARY,
					    .len = NFT_USERDATA_MAXLEN },
	[NFTA_SET_ELEM_EXPR]		= { .type = NLA_NESTED },
	[NFTA_SET_ELEM_OBJREF]		= { .type = NLA_STRING,
					    .len = NFT_OBJ_MAXNAMELEN - 1 },
	[NFTA_SET_ELEM_KEY_END]		= { .type = NLA_NESTED },
	[NFTA_SET_ELEM_EXPRESSIONS]	= NLA_POLICY_NESTED_ARRAY(nft_expr_policy),
};
5995
/*
 * Netlink validation policy for a set element list message
 * (NFTA_SET_ELEM_LIST_*): table and set names as bounded strings, the
 * elements as a nested array validated against nft_set_elem_policy, and
 * a 32-bit set ID.
 */
static const struct nla_policy nft_set_elem_list_policy[NFTA_SET_ELEM_LIST_MAX + 1] = {
	[NFTA_SET_ELEM_LIST_TABLE]	= { .type = NLA_STRING,
					    .len = NFT_TABLE_MAXNAMELEN - 1 },
	[NFTA_SET_ELEM_LIST_SET]	= { .type = NLA_STRING,
					    .len = NFT_SET_MAXNAMELEN - 1 },
	[NFTA_SET_ELEM_LIST_ELEMENTS]	= NLA_POLICY_NESTED_ARRAY(nft_set_elem_policy),
	[NFTA_SET_ELEM_LIST_SET_ID]	= { .type = NLA_U32 },
};
6004
/*
 * Dump the expressions attached to a set element into @skb.
 *
 * A single expression is emitted as NFTA_SET_ELEM_EXPR. Several
 * expressions are emitted as NFTA_LIST_ELEM entries nested inside
 * NFTA_SET_ELEM_EXPRESSIONS. Nothing is emitted when there are none.
 *
 * Returns 0 on success and -1 if the message could not be extended.
 */
static int nft_set_elem_expr_dump(struct sk_buff *skb,
				  const struct nft_set *set,
				  const struct nft_set_ext *ext,
				  bool reset)
{
	struct nft_set_elem_expr *elem_expr = nft_set_ext_expr(ext);
	u32 offset, count = 0;
	struct nft_expr *expr;
	struct nlattr *nest;

	/* First pass: count the expressions. */
	nft_setelem_expr_foreach(expr, elem_expr, offset)
		count++;

	if (count == 0)
		return 0;

	if (count == 1) {
		expr = nft_setelem_expr_at(elem_expr, 0);
		if (nft_expr_dump(skb, NFTA_SET_ELEM_EXPR, expr, reset) < 0)
			return -1;

		return 0;
	}

	nest = nla_nest_start_noflag(skb, NFTA_SET_ELEM_EXPRESSIONS);
	if (!nest)
		return -1;

	nft_setelem_expr_foreach(expr, elem_expr, offset) {
		expr = nft_setelem_expr_at(elem_expr, offset);
		if (nft_expr_dump(skb, NFTA_LIST_ELEM, expr, reset) < 0)
			return -1;
	}
	nla_nest_end(skb, nest);

	return 0;
}
6042
/*
 * Append one set element to @skb as a nested NFTA_LIST_ELEM attribute.
 *
 * Each extension present on the element (key, key end, data, expressions,
 * object reference, flags, timeout/expiration, user data) is emitted as
 * the matching NFTA_SET_ELEM_* attribute. The element timeout is only
 * emitted when it differs from the set's timeout; the remaining time is
 * emitted whenever the element timeout is non-zero.
 *
 * Returns 0 on success. On failure the message is trimmed back to where
 * it was on entry and -EMSGSIZE is returned.
 */
static int nf_tables_fill_setelem(struct sk_buff *skb,
				  const struct nft_set *set,
				  const struct nft_elem_priv *elem_priv,
				  bool reset)
{
	const struct nft_set_ext *ext = nft_set_elem_ext(set, elem_priv);
	unsigned char *start = skb_tail_pointer(skb);
	struct nlattr *elem;

	elem = nla_nest_start_noflag(skb, NFTA_LIST_ELEM);
	if (!elem)
		goto nla_put_failure;

	if (nft_set_ext_exists(ext, NFT_SET_EXT_KEY)) {
		if (nft_data_dump(skb, NFTA_SET_ELEM_KEY,
				  nft_set_ext_key(ext),
				  NFT_DATA_VALUE, set->klen) < 0)
			goto nla_put_failure;
	}

	if (nft_set_ext_exists(ext, NFT_SET_EXT_KEY_END)) {
		if (nft_data_dump(skb, NFTA_SET_ELEM_KEY_END,
				  nft_set_ext_key_end(ext),
				  NFT_DATA_VALUE, set->klen) < 0)
			goto nla_put_failure;
	}

	if (nft_set_ext_exists(ext, NFT_SET_EXT_DATA)) {
		if (nft_data_dump(skb, NFTA_SET_ELEM_DATA,
				  nft_set_ext_data(ext),
				  nft_set_datatype(set), set->dlen) < 0)
			goto nla_put_failure;
	}

	if (nft_set_ext_exists(ext, NFT_SET_EXT_EXPRESSIONS)) {
		if (nft_set_elem_expr_dump(skb, set, ext, reset))
			goto nla_put_failure;
	}

	if (nft_set_ext_exists(ext, NFT_SET_EXT_OBJREF)) {
		if (nla_put_string(skb, NFTA_SET_ELEM_OBJREF,
				   (*nft_set_ext_obj(ext))->key.name) < 0)
			goto nla_put_failure;
	}

	if (nft_set_ext_exists(ext, NFT_SET_EXT_FLAGS)) {
		if (nla_put_be32(skb, NFTA_SET_ELEM_FLAGS,
				 htonl(*nft_set_ext_flags(ext))))
			goto nla_put_failure;
	}

	if (nft_set_ext_exists(ext, NFT_SET_EXT_TIMEOUT)) {
		u64 timeout = READ_ONCE(nft_set_ext_timeout(ext)->timeout);
		u64 set_timeout = READ_ONCE(set->timeout);

		/* Only report a timeout that differs from the set's one. */
		if (timeout != set_timeout &&
		    nla_put_be64(skb, NFTA_SET_ELEM_TIMEOUT,
				 nf_jiffies64_to_msecs(timeout),
				 NFTA_SET_ELEM_PAD))
			goto nla_put_failure;

		if (timeout > 0) {
			u64 now = get_jiffies_64();
			u64 left = READ_ONCE(nft_set_ext_timeout(ext)->expiration);

			/* Remaining time, clamped to zero once elapsed. */
			left = time_before64(now, left) ? left - now : 0;

			if (nla_put_be64(skb, NFTA_SET_ELEM_EXPIRATION,
					 nf_jiffies64_to_msecs(left),
					 NFTA_SET_ELEM_PAD))
				goto nla_put_failure;
		}
	}

	if (nft_set_ext_exists(ext, NFT_SET_EXT_USERDATA)) {
		struct nft_userdata *udata = nft_set_ext_userdata(ext);

		if (nla_put(skb, NFTA_SET_ELEM_USERDATA,
			    udata->len + 1, udata->data))
			goto nla_put_failure;
	}

	nla_nest_end(skb, elem);

	return 0;

nla_put_failure:
	nlmsg_trim(skb, start);

	return -EMSGSIZE;
}
6129
/*
 * State handed to the set walk while dumping elements. The walk callback
 * only receives the embedded @iter and recovers the enclosing structure
 * with container_of().
 */
struct nft_set_dump_args {
	const struct netlink_callback	*cb;	/* netlink dump callback state */
	struct nft_set_iter		iter;	/* iterator passed to ->walk() */
	struct sk_buff			*skb;	/* message being filled */
	bool				reset;	/* passed on to nf_tables_fill_setelem() */
};
6136
nf_tables_dump_setelem(const struct nft_ctx * ctx,struct nft_set * set,const struct nft_set_iter * iter,struct nft_elem_priv * elem_priv)6137 static int nf_tables_dump_setelem(const struct nft_ctx *ctx,
6138 struct nft_set *set,
6139 const struct nft_set_iter *iter,
6140 struct nft_elem_priv *elem_priv)
6141 {
6142 const struct nft_set_ext *ext = nft_set_elem_ext(set, elem_priv);
6143 struct nft_set_dump_args *args;
6144
6145 if (!nft_set_elem_active(ext, iter->genmask))
6146 return 0;
6147
6148 if (nft_set_elem_expired(ext) || nft_set_elem_is_dead(ext))
6149 return 0;
6150
6151 args = container_of(iter, struct nft_set_dump_args, iter);
6152 return nf_tables_fill_setelem(args->skb, set, elem_priv, args->reset);
6153 }
6154
audit_log_nft_set_reset(const struct nft_table * table,unsigned int base_seq,unsigned int nentries)6155 static void audit_log_nft_set_reset(const struct nft_table *table,
6156 unsigned int base_seq,
6157 unsigned int nentries)
6158 {
6159 char *buf = kasprintf(GFP_ATOMIC, "%s:%u", table->name, base_seq);
6160
6161 audit_log_nfcfg(buf, table->family, nentries,
6162 AUDIT_NFT_OP_SETELEM_RESET, GFP_ATOMIC);
6163 kfree(buf);
6164 }
6165
/*
 * Per-dump context stored in cb->data for set element dumps; a private
 * copy is made when the dump starts and freed when it is done.
 */
struct nft_set_dump_ctx {
	const struct nft_set	*set;	/* set whose elements are dumped */
	struct nft_ctx		ctx;	/* supplies family and table for the dump */
	bool			reset;	/* forwarded to the element fill routine */
};
6171
/*
 * Dump the catch-all element of @set, if any.
 *
 * The first catch-all entry that is active in the current generation and
 * not expired is emitted; when @reset is set and the element was emitted
 * successfully, an audit record for one entry is logged.
 *
 * Returns 0 if nothing was dumped, otherwise the result of
 * nf_tables_fill_setelem().
 */
static int nft_set_catchall_dump(struct net *net, struct sk_buff *skb,
				 const struct nft_set *set, bool reset,
				 unsigned int base_seq)
{
	struct nft_set_elem_catchall *entry;
	u8 genmask = nft_genmask_cur(net);
	struct nft_set_ext *ext;
	int ret = 0;

	list_for_each_entry_rcu(entry, &set->catchall_list, list) {
		ext = nft_set_elem_ext(set, entry->elem);
		if (nft_set_elem_active(ext, genmask) &&
		    !nft_set_elem_expired(ext)) {
			ret = nf_tables_fill_setelem(skb, set, entry->elem,
						     reset);
			if (reset && !ret)
				audit_log_nft_set_reset(set->table, base_seq, 1);
			break;
		}
	}

	return ret;
}
6195
/*
 * Netlink dump callback producing one NFT_MSG_NEWSETELEM message with
 * elements of the set recorded in the dump context.
 *
 * The table and set from the dump context are looked up again under RCU
 * on every invocation; -ENOENT is returned if they can no longer be found
 * in the per-netns lists. cb->args[0] carries the walk's element count
 * between invocations: it is used as the iterator's skip value and updated
 * from the iterator's count.
 *
 * Returns skb->len when elements were added and the dump should be called
 * again, 0 when the count did not advance, -ENOSPC if the message header
 * or leading attributes did not fit, or the walk error (other than
 * -EMSGSIZE).
 */
static int nf_tables_dump_set(struct sk_buff *skb, struct netlink_callback *cb)
{
	struct nft_set_dump_ctx *dump_ctx = cb->data;
	struct net *net = sock_net(skb->sk);
	struct nftables_pernet *nft_net;
	struct nft_table *table;
	struct nft_set *set;
	struct nft_set_dump_args args;
	bool set_found = false;
	struct nlmsghdr *nlh;
	struct nlattr *nest;
	u32 portid, seq;
	int event;

	rcu_read_lock();
	nft_net = nft_pernet(net);
	cb->seq = READ_ONCE(nft_net->base_seq);

	/* Re-validate that the table and set pointers are still listed. */
	list_for_each_entry_rcu(table, &nft_net->tables, list) {
		if (dump_ctx->ctx.family != NFPROTO_UNSPEC &&
		    dump_ctx->ctx.family != table->family)
			continue;

		if (table != dump_ctx->ctx.table)
			continue;

		list_for_each_entry_rcu(set, &table->sets, list) {
			if (set == dump_ctx->set) {
				set_found = true;
				break;
			}
		}
		break;
	}

	/* From here on @table and @set are only used when set_found is true. */
	if (!set_found) {
		rcu_read_unlock();
		return -ENOENT;
	}

	event  = nfnl_msg_type(NFNL_SUBSYS_NFTABLES, NFT_MSG_NEWSETELEM);
	portid = NETLINK_CB(cb->skb).portid;
	seq    = cb->nlh->nlmsg_seq;

	nlh = nfnl_msg_put(skb, portid, seq, event, NLM_F_MULTI,
			   table->family, NFNETLINK_V0, nft_base_seq(net));
	if (!nlh)
		goto nla_put_failure;

	if (nla_put_string(skb, NFTA_SET_ELEM_LIST_TABLE, table->name))
		goto nla_put_failure;
	if (nla_put_string(skb, NFTA_SET_ELEM_LIST_SET, set->name))
		goto nla_put_failure;

	nest = nla_nest_start_noflag(skb, NFTA_SET_ELEM_LIST_ELEMENTS);
	if (nest == NULL)
		goto nla_put_failure;

	/* Resume the walk after the elements counted by the previous pass. */
	args.cb			= cb;
	args.skb		= skb;
	args.reset		= dump_ctx->reset;
	args.iter.genmask	= nft_genmask_cur(net);
	args.iter.type		= NFT_ITER_READ;
	args.iter.skip		= cb->args[0];
	args.iter.count		= 0;
	args.iter.err		= 0;
	args.iter.fn		= nf_tables_dump_setelem;
	set->ops->walk(&dump_ctx->ctx, set, &args.iter);

	/*
	 * The catch-all element is only dumped when the walk finished
	 * without error and without advancing the count.
	 */
	if (!args.iter.err && args.iter.count == cb->args[0])
		args.iter.err = nft_set_catchall_dump(net, skb, set,
						      dump_ctx->reset, cb->seq);
	nla_nest_end(skb, nest);
	nlmsg_end(skb, nlh);

	rcu_read_unlock();

	/* -EMSGSIZE is not reported as an error; see the returns below. */
	if (args.iter.err && args.iter.err != -EMSGSIZE)
		return args.iter.err;
	if (args.iter.count == cb->args[0])
		return 0;

	cb->args[0] = args.iter.count;
	return skb->len;

nla_put_failure:
	rcu_read_unlock();
	return -ENOSPC;
}
6285
nf_tables_dumpreset_set(struct sk_buff * skb,struct netlink_callback * cb)6286 static int nf_tables_dumpreset_set(struct sk_buff *skb,
6287 struct netlink_callback *cb)
6288 {
6289 struct nftables_pernet *nft_net = nft_pernet(sock_net(skb->sk));
6290 struct nft_set_dump_ctx *dump_ctx = cb->data;
6291 int ret, skip = cb->args[0];
6292
6293 mutex_lock(&nft_net->commit_mutex);
6294
6295 ret = nf_tables_dump_set(skb, cb);
6296
6297 if (cb->args[0] > skip)
6298 audit_log_nft_set_reset(dump_ctx->ctx.table, cb->seq,
6299 cb->args[0] - skip);
6300
6301 mutex_unlock(&nft_net->commit_mutex);
6302
6303 return ret;
6304 }
6305
nf_tables_dump_set_start(struct netlink_callback * cb)6306 static int nf_tables_dump_set_start(struct netlink_callback *cb)
6307 {
6308 struct nft_set_dump_ctx *dump_ctx = cb->data;
6309
6310 cb->data = kmemdup(dump_ctx, sizeof(*dump_ctx), GFP_ATOMIC);
6311
6312 return cb->data ? 0 : -ENOMEM;
6313 }
6314
nf_tables_dump_set_done(struct netlink_callback * cb)6315 static int nf_tables_dump_set_done(struct netlink_callback *cb)
6316 {
6317 kfree(cb->data);
6318 return 0;
6319 }
6320
/*
 * Build one complete set element message in @skb.
 *
 * The message consists of the nfnetlink header for @event, the table and
 * set names, and a NFTA_SET_ELEM_LIST_ELEMENTS nest holding the single
 * element @elem_priv. @reset is passed through to nf_tables_fill_setelem().
 *
 * The table/set name attributes use the NFTA_SET_ELEM_LIST_* identifiers so
 * that the whole message is described by a single attribute namespace, the
 * same one the dump path uses for these messages.
 * NOTE(review): relies on NFTA_SET_ELEM_LIST_TABLE/_SET having the same
 * numeric values as NFTA_SET_TABLE/_NAME, so the wire format is unchanged -
 * confirm against the uapi header.
 *
 * Returns 0 on success. On any failure the partially built message is
 * trimmed from @skb and -1 is returned.
 */
static int nf_tables_fill_setelem_info(struct sk_buff *skb,
				       const struct nft_ctx *ctx, u32 seq,
				       u32 portid, int event, u16 flags,
				       const struct nft_set *set,
				       const struct nft_elem_priv *elem_priv,
				       bool reset)
{
	struct nlmsghdr *nlh;
	struct nlattr *nest;
	int err;

	event = nfnl_msg_type(NFNL_SUBSYS_NFTABLES, event);
	nlh = nfnl_msg_put(skb, portid, seq, event, flags, ctx->family,
			   NFNETLINK_V0, nft_base_seq(ctx->net));
	if (!nlh)
		goto nla_put_failure;

	if (nla_put_string(skb, NFTA_SET_ELEM_LIST_TABLE, ctx->table->name))
		goto nla_put_failure;
	if (nla_put_string(skb, NFTA_SET_ELEM_LIST_SET, set->name))
		goto nla_put_failure;

	nest = nla_nest_start_noflag(skb, NFTA_SET_ELEM_LIST_ELEMENTS);
	if (!nest)
		goto nla_put_failure;

	err = nf_tables_fill_setelem(skb, set, elem_priv, reset);
	if (err < 0)
		goto nla_put_failure;

	nla_nest_end(skb, nest);

	nlmsg_end(skb, nlh);
	return 0;

nla_put_failure:
	/* Reached with nlh == NULL when the header itself did not fit. */
	nlmsg_trim(skb, nlh);
	return -1;
}
6360
/*
 * Decode and validate the element flags attribute.
 *
 * A missing attribute leaves *flags untouched and succeeds. Otherwise the
 * decoded value is stored in *flags (also when validation fails) and:
 *   -EOPNOTSUPP  bits other than INTERVAL_END / CATCHALL are set
 *   -EINVAL      INTERVAL_END is requested on a set without NFT_SET_INTERVAL
 *   -EINVAL      INTERVAL_END and CATCHALL are both set
 */
static int nft_setelem_parse_flags(const struct nft_set *set,
				   const struct nlattr *attr, u32 *flags)
{
	const u32 supported = NFT_SET_ELEM_INTERVAL_END |
			      NFT_SET_ELEM_CATCHALL;
	u32 val;

	if (!attr)
		return 0;

	val = ntohl(nla_get_be32(attr));
	*flags = val;

	if (val & ~supported)
		return -EOPNOTSUPP;

	if ((val & NFT_SET_ELEM_INTERVAL_END) &&
	    !(set->flags & NFT_SET_INTERVAL))
		return -EINVAL;

	if ((val & supported) == supported)
		return -EINVAL;

	return 0;
}
6379
nft_setelem_parse_key(struct nft_ctx * ctx,const struct nft_set * set,struct nft_data * key,struct nlattr * attr)6380 static int nft_setelem_parse_key(struct nft_ctx *ctx, const struct nft_set *set,
6381 struct nft_data *key, struct nlattr *attr)
6382 {
6383 struct nft_data_desc desc = {
6384 .type = NFT_DATA_VALUE,
6385 .size = NFT_DATA_VALUE_MAXLEN,
6386 .len = set->klen,
6387 };
6388
6389 return nft_data_init(ctx, key, &desc, attr);
6390 }
6391
nft_setelem_parse_data(struct nft_ctx * ctx,struct nft_set * set,struct nft_data_desc * desc,struct nft_data * data,struct nlattr * attr)6392 static int nft_setelem_parse_data(struct nft_ctx *ctx, struct nft_set *set,
6393 struct nft_data_desc *desc,
6394 struct nft_data *data,
6395 struct nlattr *attr)
6396 {
6397 u32 dtype;
6398
6399 if (set->dtype == NFT_DATA_VERDICT)
6400 dtype = NFT_DATA_VERDICT;
6401 else
6402 dtype = NFT_DATA_VALUE;
6403
6404 desc->type = dtype;
6405 desc->size = NFT_DATA_VALUE_MAXLEN;
6406 desc->len = set->dlen;
6407 desc->flags = NFT_DATA_DESC_SETELEM;
6408
6409 return nft_data_init(ctx, data, desc, attr);
6410 }
6411
nft_setelem_catchall_get(const struct net * net,const struct nft_set * set)6412 static void *nft_setelem_catchall_get(const struct net *net,
6413 const struct nft_set *set)
6414 {
6415 struct nft_set_elem_catchall *catchall;
6416 u8 genmask = nft_genmask_cur(net);
6417 struct nft_set_ext *ext;
6418 void *priv = NULL;
6419
6420 list_for_each_entry_rcu(catchall, &set->catchall_list, list) {
6421 ext = nft_set_elem_ext(set, catchall->elem);
6422 if (!nft_set_elem_active(ext, genmask) ||
6423 nft_set_elem_expired(ext))
6424 continue;
6425
6426 priv = catchall->elem;
6427 break;
6428 }
6429
6430 return priv;
6431 }
6432
/*
 * Resolve the element requested in @elem and store it in elem->priv.
 *
 * With NFT_SET_ELEM_CATCHALL in @flags the catch-all list is searched,
 * otherwise the lookup is delegated to the set backend's ->get().
 *
 * Returns 0 on success, -ENOENT if no catch-all element is available, or
 * the error encoded in the pointer returned by ->get().
 */
static int nft_setelem_get(struct nft_ctx *ctx, const struct nft_set *set,
			   struct nft_set_elem *elem, u32 flags)
{
	void *found;

	if (flags & NFT_SET_ELEM_CATCHALL) {
		found = nft_setelem_catchall_get(ctx->net, set);
		if (!found)
			return -ENOENT;
	} else {
		found = set->ops->get(ctx->net, set, elem, flags);
		if (IS_ERR(found))
			return PTR_ERR(found);
	}

	elem->priv = found;
	return 0;
}
6451
/*
 * Look up the single element described by the nested attribute @attr in
 * @set and unicast it to the requester as an NFT_MSG_NEWSETELEM message.
 * @reset is handed through to the message fill routine.
 *
 * Returns a negative value when parsing, lookup, allocation or message
 * construction fails; otherwise the result of nfnetlink_unicast().
 */
static int nft_get_set_elem(struct nft_ctx *ctx, const struct nft_set *set,
			    const struct nlattr *attr, bool reset)
{
	struct nlattr *tb[NFTA_SET_ELEM_MAX + 1];
	struct nft_set_elem elem;
	struct sk_buff *reply;
	uint32_t flags = 0;
	int ret;

	ret = nla_parse_nested_deprecated(tb, NFTA_SET_ELEM_MAX, attr,
					  nft_set_elem_policy, NULL);
	if (ret < 0)
		return ret;

	ret = nft_setelem_parse_flags(set, tb[NFTA_SET_ELEM_FLAGS], &flags);
	if (ret < 0)
		return ret;

	/* A key is mandatory unless the catch-all element is requested. */
	if (!(flags & NFT_SET_ELEM_CATCHALL) && !tb[NFTA_SET_ELEM_KEY])
		return -EINVAL;

	if (tb[NFTA_SET_ELEM_KEY]) {
		ret = nft_setelem_parse_key(ctx, set, &elem.key.val,
					    tb[NFTA_SET_ELEM_KEY]);
		if (ret < 0)
			return ret;
	}

	if (tb[NFTA_SET_ELEM_KEY_END]) {
		ret = nft_setelem_parse_key(ctx, set, &elem.key_end.val,
					    tb[NFTA_SET_ELEM_KEY_END]);
		if (ret < 0)
			return ret;
	}

	ret = nft_setelem_get(ctx, set, &elem, flags);
	if (ret < 0)
		return ret;

	reply = nlmsg_new(NLMSG_GOODSIZE, GFP_ATOMIC);
	if (!reply)
		return -ENOMEM;

	ret = nf_tables_fill_setelem_info(reply, ctx, ctx->seq, ctx->portid,
					  NFT_MSG_NEWSETELEM, 0, set,
					  elem.priv, reset);
	if (ret < 0) {
		kfree_skb(reply);
		return ret;
	}

	return nfnetlink_unicast(reply, ctx->net, ctx->portid);
}
6508
/*
 * Initialise @dump_ctx for a set element get/dump request.
 *
 * Resolves the table and the set named by the request attributes in the
 * current generation, initialises the embedded nft_ctx and records the set
 * and the @reset flag.
 *
 * Returns 0 on success. If the table or set lookup fails, the offending
 * attribute is reported through extack and the lookup error is returned.
 */
static int nft_set_dump_ctx_init(struct nft_set_dump_ctx *dump_ctx,
				 const struct sk_buff *skb,
				 const struct nfnl_info *info,
				 const struct nlattr * const nla[],
				 bool reset)
{
	struct netlink_ext_ack *extack = info->extack;
	struct net *net = info->net;
	u8 family = info->nfmsg->nfgen_family;
	u8 genmask = nft_genmask_cur(net);
	struct nft_table *tbl;
	struct nft_set *set;

	tbl = nft_table_lookup(net, nla[NFTA_SET_ELEM_LIST_TABLE], family,
			       genmask, 0);
	if (IS_ERR(tbl)) {
		NL_SET_BAD_ATTR(extack, nla[NFTA_SET_ELEM_LIST_TABLE]);
		return PTR_ERR(tbl);
	}

	set = nft_set_lookup(net, tbl, nla[NFTA_SET_ELEM_LIST_SET], genmask);
	if (IS_ERR(set)) {
		NL_SET_BAD_ATTR(extack, nla[NFTA_SET_ELEM_LIST_SET]);
		return PTR_ERR(set);
	}

	nft_ctx_init(&dump_ctx->ctx, net, skb, info->nlh, family, tbl, NULL,
		     nla);
	dump_ctx->reset = reset;
	dump_ctx->set = set;

	return 0;
}
6541
6542 /* called with rcu_read_lock held */
nf_tables_getsetelem(struct sk_buff * skb,const struct nfnl_info * info,const struct nlattr * const nla[])6543 static int nf_tables_getsetelem(struct sk_buff *skb,
6544 const struct nfnl_info *info,
6545 const struct nlattr * const nla[])
6546 {
6547 struct netlink_ext_ack *extack = info->extack;
6548 struct nft_set_dump_ctx dump_ctx;
6549 struct nlattr *attr;
6550 int rem, err = 0;
6551
6552 if (info->nlh->nlmsg_flags & NLM_F_DUMP) {
6553 struct netlink_dump_control c = {
6554 .start = nf_tables_dump_set_start,
6555 .dump = nf_tables_dump_set,
6556 .done = nf_tables_dump_set_done,
6557 .module = THIS_MODULE,
6558 };
6559
6560 err = nft_set_dump_ctx_init(&dump_ctx, skb, info, nla, false);
6561 if (err)
6562 return err;
6563
6564 c.data = &dump_ctx;
6565 return nft_netlink_dump_start_rcu(info->sk, skb, info->nlh, &c);
6566 }
6567
6568 if (!nla[NFTA_SET_ELEM_LIST_ELEMENTS])
6569 return -EINVAL;
6570
6571 err = nft_set_dump_ctx_init(&dump_ctx, skb, info, nla, false);
6572 if (err)
6573 return err;
6574
6575 nla_for_each_nested(attr, nla[NFTA_SET_ELEM_LIST_ELEMENTS], rem) {
6576 err = nft_get_set_elem(&dump_ctx.ctx, dump_ctx.set, attr, false);
6577 if (err < 0) {
6578 NL_SET_BAD_ATTR(extack, attr);
6579 break;
6580 }
6581 }
6582
6583 return err;
6584 }
6585
nf_tables_getsetelem_reset(struct sk_buff * skb,const struct nfnl_info * info,const struct nlattr * const nla[])6586 static int nf_tables_getsetelem_reset(struct sk_buff *skb,
6587 const struct nfnl_info *info,
6588 const struct nlattr * const nla[])
6589 {
6590 struct nftables_pernet *nft_net = nft_pernet(info->net);
6591 struct netlink_ext_ack *extack = info->extack;
6592 struct nft_set_dump_ctx dump_ctx;
6593 int rem, err = 0, nelems = 0;
6594 struct nlattr *attr;
6595
6596 if (info->nlh->nlmsg_flags & NLM_F_DUMP) {
6597 struct netlink_dump_control c = {
6598 .start = nf_tables_dump_set_start,
6599 .dump = nf_tables_dumpreset_set,
6600 .done = nf_tables_dump_set_done,
6601 .module = THIS_MODULE,
6602 };
6603
6604 err = nft_set_dump_ctx_init(&dump_ctx, skb, info, nla, true);
6605 if (err)
6606 return err;
6607
6608 c.data = &dump_ctx;
6609 return nft_netlink_dump_start_rcu(info->sk, skb, info->nlh, &c);
6610 }
6611
6612 if (!nla[NFTA_SET_ELEM_LIST_ELEMENTS])
6613 return -EINVAL;
6614
6615 if (!try_module_get(THIS_MODULE))
6616 return -EINVAL;
6617 rcu_read_unlock();
6618 mutex_lock(&nft_net->commit_mutex);
6619 rcu_read_lock();
6620
6621 err = nft_set_dump_ctx_init(&dump_ctx, skb, info, nla, true);
6622 if (err)
6623 goto out_unlock;
6624
6625 nla_for_each_nested(attr, nla[NFTA_SET_ELEM_LIST_ELEMENTS], rem) {
6626 err = nft_get_set_elem(&dump_ctx.ctx, dump_ctx.set, attr, true);
6627 if (err < 0) {
6628 NL_SET_BAD_ATTR(extack, attr);
6629 break;
6630 }
6631 nelems++;
6632 }
6633 audit_log_nft_set_reset(dump_ctx.ctx.table, nft_net->base_seq, nelems);
6634
6635 out_unlock:
6636 rcu_read_unlock();
6637 mutex_unlock(&nft_net->commit_mutex);
6638 rcu_read_lock();
6639 module_put(THIS_MODULE);
6640
6641 return err;
6642 }
6643
nf_tables_setelem_notify(const struct nft_ctx * ctx,const struct nft_set * set,const struct nft_elem_priv * elem_priv,int event)6644 static void nf_tables_setelem_notify(const struct nft_ctx *ctx,
6645 const struct nft_set *set,
6646 const struct nft_elem_priv *elem_priv,
6647 int event)
6648 {
6649 struct nftables_pernet *nft_net;
6650 struct net *net = ctx->net;
6651 u32 portid = ctx->portid;
6652 struct sk_buff *skb;
6653 u16 flags = 0;
6654 int err;
6655
6656 if (!ctx->report && !nfnetlink_has_listeners(net, NFNLGRP_NFTABLES))
6657 return;
6658
6659 skb = nlmsg_new(NLMSG_GOODSIZE, GFP_KERNEL);
6660 if (skb == NULL)
6661 goto err;
6662
6663 if (ctx->flags & (NLM_F_CREATE | NLM_F_EXCL))
6664 flags |= ctx->flags & (NLM_F_CREATE | NLM_F_EXCL);
6665
6666 err = nf_tables_fill_setelem_info(skb, ctx, 0, portid, event, flags,
6667 set, elem_priv, false);
6668 if (err < 0) {
6669 kfree_skb(skb);
6670 goto err;
6671 }
6672
6673 nft_net = nft_pernet(net);
6674 nft_notify_enqueue(skb, ctx->report, &nft_net->notify_list);
6675 return;
6676 err:
6677 nfnetlink_set_err(net, portid, NFNLGRP_NFTABLES, -ENOBUFS);
6678 }
6679
nft_trans_elem_alloc(const struct nft_ctx * ctx,int msg_type,struct nft_set * set)6680 static struct nft_trans *nft_trans_elem_alloc(const struct nft_ctx *ctx,
6681 int msg_type,
6682 struct nft_set *set)
6683 {
6684 struct nft_trans_elem *te;
6685 struct nft_trans *trans;
6686
6687 trans = nft_trans_alloc(ctx, msg_type, struct_size(te, elems, 1));
6688 if (trans == NULL)
6689 return NULL;
6690
6691 te = nft_trans_container_elem(trans);
6692 te->nelems = 1;
6693 te->set = set;
6694
6695 return trans;
6696 }
6697
nft_set_elem_expr_alloc(const struct nft_ctx * ctx,const struct nft_set * set,const struct nlattr * attr)6698 struct nft_expr *nft_set_elem_expr_alloc(const struct nft_ctx *ctx,
6699 const struct nft_set *set,
6700 const struct nlattr *attr)
6701 {
6702 struct nft_expr *expr;
6703 int err;
6704
6705 expr = nft_expr_init(ctx, attr);
6706 if (IS_ERR(expr))
6707 return expr;
6708
6709 err = -EOPNOTSUPP;
6710 if (expr->ops->type->flags & NFT_EXPR_GC) {
6711 if (set->flags & NFT_SET_TIMEOUT)
6712 goto err_set_elem_expr;
6713 if (!set->ops->gc_init)
6714 goto err_set_elem_expr;
6715 set->ops->gc_init(set);
6716 }
6717
6718 return expr;
6719
6720 err_set_elem_expr:
6721 nft_expr_destroy(ctx, expr);
6722 return ERR_PTR(err);
6723 }
6724
/*
 * Check that @len bytes plus the fixed length of extension type @id fit
 * into the space the template reserved for that extension, and that the
 * total does not exceed U8_MAX.
 *
 * Returns 0 if it fits, -1 otherwise.
 */
static int nft_set_ext_check(const struct nft_set_ext_tmpl *tmpl, u8 id, u32 len)
{
	u32 needed = len + nft_set_ext_types[id].len;

	if (needed > U8_MAX || needed > tmpl->ext_len[id])
		return -1;

	return 0;
}
6734
/*
 * Copy @len bytes from @from to @to after verifying with
 * nft_set_ext_check() that the template has room for them in extension
 * @id.
 *
 * Returns 0 on success, -1 (without copying) if the check fails.
 */
static int nft_set_ext_memcpy(const struct nft_set_ext_tmpl *tmpl, u8 id,
			      void *to, const void *from, u32 len)
{
	int rc = nft_set_ext_check(tmpl, id, len);

	if (rc < 0)
		return -1;

	memcpy(to, from, len);
	return 0;
}
6745
/*
 * Allocate and initialise a new set element.
 *
 * The element is zero-allocated with the backend's element size plus the
 * template length, and its extension area is set up from @tmpl. Key, end
 * key and data are copied in when the corresponding extension exists. If
 * the timeout extension exists, the timeout is stored and the expiration
 * is set to the current jiffies plus @expiration, with @timeout used in
 * place of a zero @expiration.
 *
 * Returns the element, ERR_PTR(-ENOMEM) if allocation fails, or
 * ERR_PTR(-EINVAL) if one of the copies does not fit the template.
 */
struct nft_elem_priv *nft_set_elem_init(const struct nft_set *set,
					const struct nft_set_ext_tmpl *tmpl,
					const u32 *key, const u32 *key_end,
					const u32 *data,
					u64 timeout, u64 expiration, gfp_t gfp)
{
	struct nft_set_ext *ext;
	void *elem;

	elem = kzalloc(set->ops->elemsize + tmpl->len, gfp);
	if (!elem)
		return ERR_PTR(-ENOMEM);

	ext = nft_set_elem_ext(set, elem);
	nft_set_ext_init(ext, tmpl);

	/* Copies are attempted in order; the first failure aborts. */
	if ((nft_set_ext_exists(ext, NFT_SET_EXT_KEY) &&
	     nft_set_ext_memcpy(tmpl, NFT_SET_EXT_KEY,
				nft_set_ext_key(ext), key, set->klen) < 0) ||
	    (nft_set_ext_exists(ext, NFT_SET_EXT_KEY_END) &&
	     nft_set_ext_memcpy(tmpl, NFT_SET_EXT_KEY_END,
				nft_set_ext_key_end(ext), key_end,
				set->klen) < 0) ||
	    (nft_set_ext_exists(ext, NFT_SET_EXT_DATA) &&
	     nft_set_ext_memcpy(tmpl, NFT_SET_EXT_DATA,
				nft_set_ext_data(ext), data, set->dlen) < 0)) {
		kfree(elem);
		return ERR_PTR(-EINVAL);
	}

	if (nft_set_ext_exists(ext, NFT_SET_EXT_TIMEOUT)) {
		nft_set_ext_timeout(ext)->timeout = timeout;

		if (!expiration)
			expiration = timeout;

		nft_set_ext_timeout(ext)->expiration =
			get_jiffies_64() + expiration;
	}

	return elem;
}
6793
__nft_set_elem_expr_destroy(const struct nft_ctx * ctx,struct nft_expr * expr)6794 static void __nft_set_elem_expr_destroy(const struct nft_ctx *ctx,
6795 struct nft_expr *expr)
6796 {
6797 if (expr->ops->destroy_clone) {
6798 expr->ops->destroy_clone(ctx, expr);
6799 module_put(expr->ops->type->owner);
6800 } else {
6801 nf_tables_expr_destroy(ctx, expr);
6802 }
6803 }
6804
nft_set_elem_expr_destroy(const struct nft_ctx * ctx,struct nft_set_elem_expr * elem_expr)6805 static void nft_set_elem_expr_destroy(const struct nft_ctx *ctx,
6806 struct nft_set_elem_expr *elem_expr)
6807 {
6808 struct nft_expr *expr;
6809 u32 size;
6810
6811 nft_setelem_expr_foreach(expr, elem_expr, size)
6812 __nft_set_elem_expr_destroy(ctx, expr);
6813 }
6814
6815 /* Drop references and destroy. Called from gc, dynset and abort path. */
__nft_set_elem_destroy(const struct nft_ctx * ctx,const struct nft_set * set,const struct nft_elem_priv * elem_priv,bool destroy_expr)6816 static void __nft_set_elem_destroy(const struct nft_ctx *ctx,
6817 const struct nft_set *set,
6818 const struct nft_elem_priv *elem_priv,
6819 bool destroy_expr)
6820 {
6821 struct nft_set_ext *ext = nft_set_elem_ext(set, elem_priv);
6822
6823 nft_data_release(nft_set_ext_key(ext), NFT_DATA_VALUE);
6824 if (nft_set_ext_exists(ext, NFT_SET_EXT_DATA))
6825 nft_data_release(nft_set_ext_data(ext), set->dtype);
6826 if (destroy_expr && nft_set_ext_exists(ext, NFT_SET_EXT_EXPRESSIONS))
6827 nft_set_elem_expr_destroy(ctx, nft_set_ext_expr(ext));
6828 if (nft_set_ext_exists(ext, NFT_SET_EXT_OBJREF))
6829 nft_use_dec(&(*nft_set_ext_obj(ext))->use);
6830
6831 kfree(elem_priv);
6832 }
6833
6834 /* Drop references and destroy. Called from gc and dynset. */
nft_set_elem_destroy(const struct nft_set * set,const struct nft_elem_priv * elem_priv,bool destroy_expr)6835 void nft_set_elem_destroy(const struct nft_set *set,
6836 const struct nft_elem_priv *elem_priv,
6837 bool destroy_expr)
6838 {
6839 struct nft_ctx ctx = {
6840 .net = read_pnet(&set->net),
6841 .family = set->table->family,
6842 };
6843
6844 __nft_set_elem_destroy(&ctx, set, elem_priv, destroy_expr);
6845 }
6846 EXPORT_SYMBOL_GPL(nft_set_elem_destroy);
6847
6848 /* Drop references and destroy. Called from abort path. */
nft_trans_set_elem_destroy(const struct nft_ctx * ctx,struct nft_trans_elem * te)6849 static void nft_trans_set_elem_destroy(const struct nft_ctx *ctx, struct nft_trans_elem *te)
6850 {
6851 int i;
6852
6853 for (i = 0; i < te->nelems; i++) {
6854 /* skip update request, see nft_trans_elems_new_abort() */
6855 if (!te->elems[i].priv)
6856 continue;
6857
6858 __nft_set_elem_destroy(ctx, te->set, te->elems[i].priv, true);
6859 }
6860 }
6861
6862 /* Destroy element. References have been already dropped in the preparation
6863 * path via nft_setelem_data_deactivate().
6864 */
nf_tables_set_elem_destroy(const struct nft_ctx * ctx,const struct nft_set * set,const struct nft_elem_priv * elem_priv)6865 void nf_tables_set_elem_destroy(const struct nft_ctx *ctx,
6866 const struct nft_set *set,
6867 const struct nft_elem_priv *elem_priv)
6868 {
6869 struct nft_set_ext *ext = nft_set_elem_ext(set, elem_priv);
6870
6871 if (nft_set_ext_exists(ext, NFT_SET_EXT_EXPRESSIONS))
6872 nft_set_elem_expr_destroy(ctx, nft_set_ext_expr(ext));
6873
6874 kfree(elem_priv);
6875 }
6876
nft_trans_elems_destroy(const struct nft_ctx * ctx,const struct nft_trans_elem * te)6877 static void nft_trans_elems_destroy(const struct nft_ctx *ctx,
6878 const struct nft_trans_elem *te)
6879 {
6880 int i;
6881
6882 for (i = 0; i < te->nelems; i++)
6883 nf_tables_set_elem_destroy(ctx, te->set, te->elems[i].priv);
6884 }
6885
nft_set_elem_expr_clone(const struct nft_ctx * ctx,struct nft_set * set,struct nft_expr * expr_array[])6886 int nft_set_elem_expr_clone(const struct nft_ctx *ctx, struct nft_set *set,
6887 struct nft_expr *expr_array[])
6888 {
6889 struct nft_expr *expr;
6890 int err, i, k;
6891
6892 for (i = 0; i < set->num_exprs; i++) {
6893 expr = kzalloc(set->exprs[i]->ops->size, GFP_KERNEL_ACCOUNT);
6894 if (!expr)
6895 goto err_expr;
6896
6897 err = nft_expr_clone(expr, set->exprs[i], GFP_KERNEL_ACCOUNT);
6898 if (err < 0) {
6899 kfree(expr);
6900 goto err_expr;
6901 }
6902 expr_array[i] = expr;
6903 }
6904
6905 return 0;
6906
6907 err_expr:
6908 for (k = i - 1; k >= 0; k--)
6909 nft_expr_destroy(ctx, expr_array[k]);
6910
6911 return -ENOMEM;
6912 }
6913
/*
 * Move the expressions in @expr_array into the expression extension of a
 * set element.
 *
 * After checking that the combined size fits the template, each expression
 * is cloned into the next free position of the extension; the source
 * expression is then destroyed and its array slot cleared.
 *
 * Returns 0 on success (or when @num_exprs is zero), -EINVAL if the
 * expressions do not fit, or -ENOMEM if a clone fails. In the latter case
 * the failing and all remaining source expressions are destroyed and their
 * slots cleared.
 */
static int nft_set_elem_expr_setup(struct nft_ctx *ctx,
				   const struct nft_set_ext_tmpl *tmpl,
				   const struct nft_set_ext *ext,
				   struct nft_expr *expr_array[],
				   u32 num_exprs)
{
	struct nft_set_elem_expr *area = nft_set_ext_expr(ext);
	u32 total = sizeof(struct nft_set_elem_expr);
	struct nft_expr *slot;
	int i;

	if (!num_exprs)
		return 0;

	for (i = 0; i < num_exprs; i++)
		total += expr_array[i]->ops->size;

	if (nft_set_ext_check(tmpl, NFT_SET_EXT_EXPRESSIONS, total) < 0)
		return -EINVAL;

	for (i = 0; i < num_exprs; i++) {
		slot = nft_setelem_expr_at(area, area->size);
		if (nft_expr_clone(slot, expr_array[i],
				   GFP_KERNEL_ACCOUNT) < 0)
			goto err_release_rest;

		area->size += expr_array[i]->ops->size;
		nft_expr_destroy(ctx, expr_array[i]);
		expr_array[i] = NULL;
	}

	return 0;

err_release_rest:
	while (i < num_exprs) {
		nft_expr_destroy(ctx, expr_array[i]);
		expr_array[i] = NULL;
		i++;
	}

	return -ENOMEM;
}
6955
nft_set_catchall_lookup(const struct net * net,const struct nft_set * set)6956 struct nft_set_ext *nft_set_catchall_lookup(const struct net *net,
6957 const struct nft_set *set)
6958 {
6959 struct nft_set_elem_catchall *catchall;
6960 u8 genmask = nft_genmask_cur(net);
6961 struct nft_set_ext *ext;
6962
6963 list_for_each_entry_rcu(catchall, &set->catchall_list, list) {
6964 ext = nft_set_elem_ext(set, catchall->elem);
6965 if (nft_set_elem_active(ext, genmask) &&
6966 !nft_set_elem_expired(ext) &&
6967 !nft_set_elem_is_dead(ext))
6968 return ext;
6969 }
6970
6971 return NULL;
6972 }
6973 EXPORT_SYMBOL_GPL(nft_set_catchall_lookup);
6974
nft_setelem_catchall_insert(const struct net * net,struct nft_set * set,const struct nft_set_elem * elem,struct nft_elem_priv ** priv)6975 static int nft_setelem_catchall_insert(const struct net *net,
6976 struct nft_set *set,
6977 const struct nft_set_elem *elem,
6978 struct nft_elem_priv **priv)
6979 {
6980 struct nft_set_elem_catchall *catchall;
6981 u8 genmask = nft_genmask_next(net);
6982 struct nft_set_ext *ext;
6983
6984 list_for_each_entry(catchall, &set->catchall_list, list) {
6985 ext = nft_set_elem_ext(set, catchall->elem);
6986 if (nft_set_elem_active(ext, genmask)) {
6987 *priv = catchall->elem;
6988 return -EEXIST;
6989 }
6990 }
6991
6992 catchall = kmalloc(sizeof(*catchall), GFP_KERNEL_ACCOUNT);
6993 if (!catchall)
6994 return -ENOMEM;
6995
6996 catchall->elem = elem->priv;
6997 list_add_tail_rcu(&catchall->list, &set->catchall_list);
6998
6999 return 0;
7000 }
7001
nft_setelem_insert(const struct net * net,struct nft_set * set,const struct nft_set_elem * elem,struct nft_elem_priv ** elem_priv,unsigned int flags)7002 static int nft_setelem_insert(const struct net *net,
7003 struct nft_set *set,
7004 const struct nft_set_elem *elem,
7005 struct nft_elem_priv **elem_priv,
7006 unsigned int flags)
7007 {
7008 int ret;
7009
7010 if (flags & NFT_SET_ELEM_CATCHALL)
7011 ret = nft_setelem_catchall_insert(net, set, elem, elem_priv);
7012 else
7013 ret = set->ops->insert(net, set, elem, elem_priv);
7014
7015 return ret;
7016 }
7017
nft_setelem_is_catchall(const struct nft_set * set,const struct nft_elem_priv * elem_priv)7018 static bool nft_setelem_is_catchall(const struct nft_set *set,
7019 const struct nft_elem_priv *elem_priv)
7020 {
7021 struct nft_set_ext *ext = nft_set_elem_ext(set, elem_priv);
7022
7023 if (nft_set_ext_exists(ext, NFT_SET_EXT_FLAGS) &&
7024 *nft_set_ext_flags(ext) & NFT_SET_ELEM_CATCHALL)
7025 return true;
7026
7027 return false;
7028 }
7029
nft_setelem_activate(struct net * net,struct nft_set * set,struct nft_elem_priv * elem_priv)7030 static void nft_setelem_activate(struct net *net, struct nft_set *set,
7031 struct nft_elem_priv *elem_priv)
7032 {
7033 struct nft_set_ext *ext = nft_set_elem_ext(set, elem_priv);
7034
7035 if (nft_setelem_is_catchall(set, elem_priv)) {
7036 nft_clear(net, ext);
7037 } else {
7038 set->ops->activate(net, set, elem_priv);
7039 }
7040 }
7041
nft_trans_elem_update(const struct nft_set * set,const struct nft_trans_one_elem * elem)7042 static void nft_trans_elem_update(const struct nft_set *set,
7043 const struct nft_trans_one_elem *elem)
7044 {
7045 const struct nft_set_ext *ext = nft_set_elem_ext(set, elem->priv);
7046 const struct nft_elem_update *update = elem->update;
7047
7048 if (update->flags & NFT_TRANS_UPD_TIMEOUT)
7049 WRITE_ONCE(nft_set_ext_timeout(ext)->timeout, update->timeout);
7050
7051 if (update->flags & NFT_TRANS_UPD_EXPIRATION)
7052 WRITE_ONCE(nft_set_ext_timeout(ext)->expiration, get_jiffies_64() + update->expiration);
7053 }
7054
nft_trans_elems_add(const struct nft_ctx * ctx,struct nft_trans_elem * te)7055 static void nft_trans_elems_add(const struct nft_ctx *ctx,
7056 struct nft_trans_elem *te)
7057 {
7058 int i;
7059
7060 for (i = 0; i < te->nelems; i++) {
7061 struct nft_trans_one_elem *elem = &te->elems[i];
7062
7063 if (elem->update)
7064 nft_trans_elem_update(te->set, elem);
7065 else
7066 nft_setelem_activate(ctx->net, te->set, elem->priv);
7067
7068 nf_tables_setelem_notify(ctx, te->set, elem->priv,
7069 NFT_MSG_NEWSETELEM);
7070 kfree(elem->update);
7071 }
7072 }
7073
nft_setelem_catchall_deactivate(const struct net * net,struct nft_set * set,struct nft_set_elem * elem)7074 static int nft_setelem_catchall_deactivate(const struct net *net,
7075 struct nft_set *set,
7076 struct nft_set_elem *elem)
7077 {
7078 struct nft_set_elem_catchall *catchall;
7079 struct nft_set_ext *ext;
7080
7081 list_for_each_entry(catchall, &set->catchall_list, list) {
7082 ext = nft_set_elem_ext(set, catchall->elem);
7083 if (!nft_is_active_next(net, ext))
7084 continue;
7085
7086 kfree(elem->priv);
7087 elem->priv = catchall->elem;
7088 nft_set_elem_change_active(net, set, ext);
7089 return 0;
7090 }
7091
7092 return -ENOENT;
7093 }
7094
__nft_setelem_deactivate(const struct net * net,struct nft_set * set,struct nft_set_elem * elem)7095 static int __nft_setelem_deactivate(const struct net *net,
7096 struct nft_set *set,
7097 struct nft_set_elem *elem)
7098 {
7099 void *priv;
7100
7101 priv = set->ops->deactivate(net, set, elem);
7102 if (!priv)
7103 return -ENOENT;
7104
7105 kfree(elem->priv);
7106 elem->priv = priv;
7107 set->ndeact++;
7108
7109 return 0;
7110 }
7111
/*
 * Deactivate an element, choosing the catch-all or the regular path based
 * on NFT_SET_ELEM_CATCHALL in @flags. Returns the result of the selected
 * routine.
 */
static int nft_setelem_deactivate(const struct net *net,
				  struct nft_set *set,
				  struct nft_set_elem *elem, u32 flags)
{
	if (flags & NFT_SET_ELEM_CATCHALL)
		return nft_setelem_catchall_deactivate(net, set, elem);

	return __nft_setelem_deactivate(net, set, elem);
}
7125
nft_setelem_catchall_destroy(struct nft_set_elem_catchall * catchall)7126 static void nft_setelem_catchall_destroy(struct nft_set_elem_catchall *catchall)
7127 {
7128 list_del_rcu(&catchall->list);
7129 kfree_rcu(catchall, rcu);
7130 }
7131
nft_setelem_catchall_remove(const struct net * net,const struct nft_set * set,struct nft_elem_priv * elem_priv)7132 static void nft_setelem_catchall_remove(const struct net *net,
7133 const struct nft_set *set,
7134 struct nft_elem_priv *elem_priv)
7135 {
7136 struct nft_set_elem_catchall *catchall, *next;
7137
7138 list_for_each_entry_safe(catchall, next, &set->catchall_list, list) {
7139 if (catchall->elem == elem_priv) {
7140 nft_setelem_catchall_destroy(catchall);
7141 break;
7142 }
7143 }
7144 }
7145
nft_setelem_remove(const struct net * net,const struct nft_set * set,struct nft_elem_priv * elem_priv)7146 static void nft_setelem_remove(const struct net *net,
7147 const struct nft_set *set,
7148 struct nft_elem_priv *elem_priv)
7149 {
7150 if (nft_setelem_is_catchall(set, elem_priv))
7151 nft_setelem_catchall_remove(net, set, elem_priv);
7152 else
7153 set->ops->remove(net, set, elem_priv);
7154 }
7155
nft_trans_elems_remove(const struct nft_ctx * ctx,const struct nft_trans_elem * te)7156 static void nft_trans_elems_remove(const struct nft_ctx *ctx,
7157 const struct nft_trans_elem *te)
7158 {
7159 int i;
7160
7161 for (i = 0; i < te->nelems; i++) {
7162 WARN_ON_ONCE(te->elems[i].update);
7163
7164 nf_tables_setelem_notify(ctx, te->set,
7165 te->elems[i].priv,
7166 te->nft_trans.msg_type);
7167
7168 nft_setelem_remove(ctx->net, te->set, te->elems[i].priv);
7169 if (!nft_setelem_is_catchall(te->set, te->elems[i].priv)) {
7170 atomic_dec(&te->set->nelems);
7171 te->set->ndeact--;
7172 }
7173 }
7174 }
7175
nft_setelem_valid_key_end(const struct nft_set * set,struct nlattr ** nla,u32 flags)7176 static bool nft_setelem_valid_key_end(const struct nft_set *set,
7177 struct nlattr **nla, u32 flags)
7178 {
7179 if ((set->flags & (NFT_SET_CONCAT | NFT_SET_INTERVAL)) ==
7180 (NFT_SET_CONCAT | NFT_SET_INTERVAL)) {
7181 if (flags & NFT_SET_ELEM_INTERVAL_END)
7182 return false;
7183
7184 if (nla[NFTA_SET_ELEM_KEY_END] &&
7185 flags & NFT_SET_ELEM_CATCHALL)
7186 return false;
7187 } else {
7188 if (nla[NFTA_SET_ELEM_KEY_END])
7189 return false;
7190 }
7191
7192 return true;
7193 }
7194
nft_set_maxsize(const struct nft_set * set)7195 static u32 nft_set_maxsize(const struct nft_set *set)
7196 {
7197 u32 maxsize, delta;
7198
7199 if (!set->size)
7200 return UINT_MAX;
7201
7202 if (set->ops->adjust_maxsize)
7203 delta = set->ops->adjust_maxsize(set);
7204 else
7205 delta = 0;
7206
7207 if (check_add_overflow(set->size, set->ndeact, &maxsize))
7208 return UINT_MAX;
7209
7210 if (check_add_overflow(maxsize, delta, &maxsize))
7211 return UINT_MAX;
7212
7213 return maxsize;
7214 }
7215
/*
 * Parse one set element description from @attr and insert the resulting
 * element into @set, queueing a NFT_MSG_NEWSETELEM transaction for it.
 *
 * @ctx:         transaction context (netns, family, table)
 * @set:         set receiving the element
 * @attr:        nested attribute parsed against nft_set_elem_policy
 * @nlmsg_flags: netlink message flags; NLM_F_EXCL turns "identical element
 *               already exists" into an -EEXIST error
 *
 * Returns 0 on success (including the case where an identical element already
 * exists and NLM_F_EXCL is not set), or a negative errno.
 *
 * Resources are acquired in a fixed order and released in reverse order by
 * the label ladder at the bottom; every "goto err_*" relies on that order.
 */
static int nft_add_set_elem(struct nft_ctx *ctx, struct nft_set *set,
			    const struct nlattr *attr, u32 nlmsg_flags)
{
	struct nft_expr *expr_array[NFT_SET_EXPR_MAX] = {};
	struct nlattr *nla[NFTA_SET_ELEM_MAX + 1];
	u8 genmask = nft_genmask_next(ctx->net);
	u32 flags = 0, size = 0, num_exprs = 0;
	struct nft_set_ext_tmpl tmpl;
	struct nft_set_ext *ext, *ext2;
	struct nft_set_elem elem;
	struct nft_set_binding *binding;
	struct nft_elem_priv *elem_priv;
	struct nft_object *obj = NULL;
	struct nft_userdata *udata;
	struct nft_data_desc desc;
	enum nft_registers dreg;
	struct nft_trans *trans;
	u64 expiration;
	u64 timeout;
	int err, i;
	u8 ulen;

	err = nla_parse_nested_deprecated(nla, NFTA_SET_ELEM_MAX, attr,
					  nft_set_elem_policy, NULL);
	if (err < 0)
		return err;

	nft_set_ext_prepare(&tmpl);

	err = nft_setelem_parse_flags(set, nla[NFTA_SET_ELEM_FLAGS], &flags);
	if (err < 0)
		return err;

	/* A catchall element must not carry a key; any other element must. */
	if (((flags & NFT_SET_ELEM_CATCHALL) && nla[NFTA_SET_ELEM_KEY]) ||
	    (!(flags & NFT_SET_ELEM_CATCHALL) && !nla[NFTA_SET_ELEM_KEY]))
		return -EINVAL;

	if (flags != 0) {
		err = nft_set_ext_add(&tmpl, NFT_SET_EXT_FLAGS);
		if (err < 0)
			return err;
	}

	/* Maps require data (except on interval end markers); plain sets
	 * must not carry any.
	 */
	if (set->flags & NFT_SET_MAP) {
		if (nla[NFTA_SET_ELEM_DATA] == NULL &&
		    !(flags & NFT_SET_ELEM_INTERVAL_END))
			return -EINVAL;
	} else {
		if (nla[NFTA_SET_ELEM_DATA] != NULL)
			return -EINVAL;
	}

	/* Same rule for object references on object maps. */
	if (set->flags & NFT_SET_OBJECT) {
		if (!nla[NFTA_SET_ELEM_OBJREF] &&
		    !(flags & NFT_SET_ELEM_INTERVAL_END))
			return -EINVAL;
	} else {
		if (nla[NFTA_SET_ELEM_OBJREF])
			return -EINVAL;
	}

	if (!nft_setelem_valid_key_end(set, nla, flags))
		return -EINVAL;

	/* An interval end marker carries nothing but its key and flags. */
	if ((flags & NFT_SET_ELEM_INTERVAL_END) &&
	     (nla[NFTA_SET_ELEM_DATA] ||
	      nla[NFTA_SET_ELEM_OBJREF] ||
	      nla[NFTA_SET_ELEM_TIMEOUT] ||
	      nla[NFTA_SET_ELEM_EXPIRATION] ||
	      nla[NFTA_SET_ELEM_USERDATA] ||
	      nla[NFTA_SET_ELEM_EXPR] ||
	      nla[NFTA_SET_ELEM_KEY_END] ||
	      nla[NFTA_SET_ELEM_EXPRESSIONS]))
		return -EINVAL;

	/* Explicit per-element timeout, else inherit the set's default
	 * (interval end markers never get one).
	 */
	timeout = 0;
	if (nla[NFTA_SET_ELEM_TIMEOUT] != NULL) {
		if (!(set->flags & NFT_SET_TIMEOUT))
			return -EINVAL;
		err = nf_msecs_to_jiffies64(nla[NFTA_SET_ELEM_TIMEOUT],
					    &timeout);
		if (err)
			return err;
	} else if (set->flags & NFT_SET_TIMEOUT &&
		   !(flags & NFT_SET_ELEM_INTERVAL_END)) {
		timeout = set->timeout;
	}

	/* An expiration needs a non-zero timeout and may not exceed it. */
	expiration = 0;
	if (nla[NFTA_SET_ELEM_EXPIRATION] != NULL) {
		if (!(set->flags & NFT_SET_TIMEOUT))
			return -EINVAL;
		if (timeout == 0)
			return -EOPNOTSUPP;

		err = nf_msecs_to_jiffies64(nla[NFTA_SET_ELEM_EXPIRATION],
					    &expiration);
		if (err)
			return err;

		if (expiration > timeout)
			return -ERANGE;
	}

	/* Collect the element's expressions into expr_array[]: either a
	 * single NFTA_SET_ELEM_EXPR, a list in NFTA_SET_ELEM_EXPRESSIONS, or
	 * clones of the set's own expressions. When the set declares
	 * expressions, the element's must match them in count and ops.
	 */
	if (nla[NFTA_SET_ELEM_EXPR]) {
		struct nft_expr *expr;

		if (set->num_exprs && set->num_exprs != 1)
			return -EOPNOTSUPP;

		expr = nft_set_elem_expr_alloc(ctx, set,
					       nla[NFTA_SET_ELEM_EXPR]);
		if (IS_ERR(expr))
			return PTR_ERR(expr);

		expr_array[0] = expr;
		num_exprs = 1;

		if (set->num_exprs && set->exprs[0]->ops != expr->ops) {
			err = -EOPNOTSUPP;
			goto err_set_elem_expr;
		}
	} else if (nla[NFTA_SET_ELEM_EXPRESSIONS]) {
		struct nft_expr *expr;
		struct nlattr *tmp;
		int left;

		i = 0;
		nla_for_each_nested(tmp, nla[NFTA_SET_ELEM_EXPRESSIONS], left) {
			if (i == NFT_SET_EXPR_MAX ||
			    (set->num_exprs && set->num_exprs == i)) {
				err = -E2BIG;
				goto err_set_elem_expr;
			}
			if (nla_type(tmp) != NFTA_LIST_ELEM) {
				err = -EINVAL;
				goto err_set_elem_expr;
			}
			expr = nft_set_elem_expr_alloc(ctx, set, tmp);
			if (IS_ERR(expr)) {
				err = PTR_ERR(expr);
				goto err_set_elem_expr;
			}
			/* Record before the ops check so the unwind path
			 * destroys this expression too.
			 */
			expr_array[i] = expr;
			num_exprs++;

			if (set->num_exprs && expr->ops != set->exprs[i]->ops) {
				err = -EOPNOTSUPP;
				goto err_set_elem_expr;
			}
			i++;
		}
		if (set->num_exprs && set->num_exprs != i) {
			err = -EOPNOTSUPP;
			goto err_set_elem_expr;
		}
	} else if (set->num_exprs > 0 &&
		   !(flags & NFT_SET_ELEM_INTERVAL_END)) {
		err = nft_set_elem_expr_clone(ctx, set, expr_array);
		if (err < 0)
			goto err_set_elem_expr_clone;

		num_exprs = set->num_exprs;
	}

	if (nla[NFTA_SET_ELEM_KEY]) {
		err = nft_setelem_parse_key(ctx, set, &elem.key.val,
					    nla[NFTA_SET_ELEM_KEY]);
		if (err < 0)
			goto err_set_elem_expr;

		err = nft_set_ext_add_length(&tmpl, NFT_SET_EXT_KEY, set->klen);
		if (err < 0)
			goto err_parse_key;
	}

	if (nla[NFTA_SET_ELEM_KEY_END]) {
		err = nft_setelem_parse_key(ctx, set, &elem.key_end.val,
					    nla[NFTA_SET_ELEM_KEY_END]);
		if (err < 0)
			goto err_parse_key;

		err = nft_set_ext_add_length(&tmpl, NFT_SET_EXT_KEY_END, set->klen);
		if (err < 0)
			goto err_parse_key_end;
	}

	if (set->flags & NFT_SET_TIMEOUT) {
		err = nft_set_ext_add(&tmpl, NFT_SET_EXT_TIMEOUT);
		if (err < 0)
			goto err_parse_key_end;
	}

	if (num_exprs) {
		/* Reserve room for the header plus every expression. */
		for (i = 0; i < num_exprs; i++)
			size += expr_array[i]->ops->size;

		err = nft_set_ext_add_length(&tmpl, NFT_SET_EXT_EXPRESSIONS,
					     sizeof(struct nft_set_elem_expr) + size);
		if (err < 0)
			goto err_parse_key_end;
	}

	if (nla[NFTA_SET_ELEM_OBJREF] != NULL) {
		obj = nft_obj_lookup(ctx->net, ctx->table,
				     nla[NFTA_SET_ELEM_OBJREF],
				     set->objtype, genmask);
		if (IS_ERR(obj)) {
			err = PTR_ERR(obj);
			/* No reference taken: keep the unwind path from
			 * dropping one.
			 */
			obj = NULL;
			goto err_parse_key_end;
		}

		if (!nft_use_inc(&obj->use)) {
			err = -EMFILE;
			/* Use counter was not bumped, nothing to undo. */
			obj = NULL;
			goto err_parse_key_end;
		}

		err = nft_set_ext_add(&tmpl, NFT_SET_EXT_OBJREF);
		if (err < 0)
			goto err_parse_key_end;
	}

	if (nla[NFTA_SET_ELEM_DATA] != NULL) {
		err = nft_setelem_parse_data(ctx, set, &desc, &elem.data.val,
					     nla[NFTA_SET_ELEM_DATA]);
		if (err < 0)
			goto err_parse_key_end;

		/* Validate the new data against every map binding of this
		 * set, using the binding's chain as context.
		 */
		dreg = nft_type_to_reg(set->dtype);
		list_for_each_entry(binding, &set->bindings, list) {
			struct nft_ctx bind_ctx = {
				.net	= ctx->net,
				.family	= ctx->family,
				.table	= ctx->table,
				.chain	= (struct nft_chain *)binding->chain,
			};

			if (!(binding->flags & NFT_SET_MAP))
				continue;

			err = nft_validate_register_store(&bind_ctx, dreg,
							  &elem.data.val,
							  desc.type, desc.len);
			if (err < 0)
				goto err_parse_data;

			/* A jump/goto verdict flags the table as needing
			 * validation.
			 */
			if (desc.type == NFT_DATA_VERDICT &&
			    (elem.data.val.verdict.code == NFT_GOTO ||
			     elem.data.val.verdict.code == NFT_JUMP))
				nft_validate_state_update(ctx->table,
							  NFT_VALIDATE_NEED);
		}

		err = nft_set_ext_add_length(&tmpl, NFT_SET_EXT_DATA, desc.len);
		if (err < 0)
			goto err_parse_data;
	}

	/* The full maximum length of userdata can exceed the maximum
	 * offset value (U8_MAX) for following extensions, therefore it
	 * must be the last extension added.
	 *
	 * NOTE(review): ulen is a u8, so an attribute length above U8_MAX
	 * would be truncated by the assignment below - confirm the policy
	 * bound makes that acceptable.
	 */
	ulen = 0;
	if (nla[NFTA_SET_ELEM_USERDATA] != NULL) {
		ulen = nla_len(nla[NFTA_SET_ELEM_USERDATA]);
		if (ulen > 0) {
			err = nft_set_ext_add_length(&tmpl, NFT_SET_EXT_USERDATA,
						     ulen);
			if (err < 0)
				goto err_parse_data;
		}
	}

	elem.priv = nft_set_elem_init(set, &tmpl, elem.key.val.data,
				      elem.key_end.val.data, elem.data.val.data,
				      timeout, expiration, GFP_KERNEL_ACCOUNT);
	if (IS_ERR(elem.priv)) {
		err = PTR_ERR(elem.priv);
		goto err_parse_data;
	}

	ext = nft_set_elem_ext(set, elem.priv);
	if (flags)
		*nft_set_ext_flags(ext) = flags;

	if (obj)
		*nft_set_ext_obj(ext) = obj;

	if (ulen > 0) {
		if (nft_set_ext_check(&tmpl, NFT_SET_EXT_USERDATA, ulen) < 0) {
			err = -EINVAL;
			goto err_elem_free;
		}
		udata = nft_set_ext_userdata(ext);
		/* The stored length field holds "length minus one". */
		udata->len = ulen - 1;
		nla_memcpy(&udata->data, nla[NFTA_SET_ELEM_USERDATA], ulen);
	}
	err = nft_set_elem_expr_setup(ctx, &tmpl, ext, expr_array, num_exprs);
	if (err < 0)
		goto err_elem_free;

	trans = nft_trans_elem_alloc(ctx, NFT_MSG_NEWSETELEM, set);
	if (trans == NULL) {
		err = -ENOMEM;
		goto err_elem_free;
	}

	ext->genmask = nft_genmask_cur(ctx->net);

	err = nft_setelem_insert(ctx->net, set, &elem, &elem_priv, flags);
	if (err) {
		if (err == -EEXIST) {
			/* elem_priv is the element already in the set. */
			ext2 = nft_set_elem_ext(set, elem_priv);
			/* Clash if only one of the two has data/objref ... */
			if (nft_set_ext_exists(ext, NFT_SET_EXT_DATA) ^
			    nft_set_ext_exists(ext2, NFT_SET_EXT_DATA) ||
			    nft_set_ext_exists(ext, NFT_SET_EXT_OBJREF) ^
			    nft_set_ext_exists(ext2, NFT_SET_EXT_OBJREF))
				goto err_element_clash;
			/* ... or if both have it but the contents differ. */
			if ((nft_set_ext_exists(ext, NFT_SET_EXT_DATA) &&
			     nft_set_ext_exists(ext2, NFT_SET_EXT_DATA) &&
			     memcmp(nft_set_ext_data(ext),
				    nft_set_ext_data(ext2), set->dlen) != 0) ||
			    (nft_set_ext_exists(ext, NFT_SET_EXT_OBJREF) &&
			     nft_set_ext_exists(ext2, NFT_SET_EXT_OBJREF) &&
			     *nft_set_ext_obj(ext) != *nft_set_ext_obj(ext2)))
				goto err_element_clash;
			else if (!(nlmsg_flags & NLM_F_EXCL)) {
				/* Identical element and no NLM_F_EXCL: not
				 * an error, possibly a timeout update.
				 */
				err = 0;
				if (nft_set_ext_exists(ext2, NFT_SET_EXT_TIMEOUT)) {
					struct nft_elem_update update = { };

					if (timeout != nft_set_ext_timeout(ext2)->timeout) {
						update.timeout = timeout;
						if (expiration == 0)
							expiration = timeout;

						update.flags |= NFT_TRANS_UPD_TIMEOUT;
					}
					if (expiration) {
						update.expiration = expiration;
						update.flags |= NFT_TRANS_UPD_EXPIRATION;
					}

					if (update.flags) {
						struct nft_trans_one_elem *ue;

						ue = &nft_trans_container_elem(trans)->elems[0];

						ue->update = kmemdup(&update, sizeof(update), GFP_KERNEL);
						if (!ue->update) {
							err = -ENOMEM;
							goto err_element_clash;
						}

						/* The transaction refers to
						 * the existing element and is
						 * kept; only the freshly
						 * built element is released
						 * below (err is 0 here).
						 */
						ue->priv = elem_priv;
						nft_trans_commit_list_add_elem(ctx->net, trans, GFP_KERNEL);
						goto err_elem_free;
					}
				}
			}
		} else if (err == -ENOTEMPTY) {
			/* ENOTEMPTY reports overlapping between this element
			 * and an existing one.
			 */
			err = -EEXIST;
		}
		goto err_element_clash;
	}

	/* Catchall elements do not count against the set size limit. */
	if (!(flags & NFT_SET_ELEM_CATCHALL)) {
		unsigned int max = nft_set_maxsize(set);

		if (!atomic_add_unless(&set->nelems, 1, max)) {
			err = -ENFILE;
			goto err_set_full;
		}
	}

	nft_trans_container_elem(trans)->elems[0].priv = elem.priv;
	nft_trans_commit_list_add_elem(ctx->net, trans, GFP_KERNEL);
	return 0;

	/* Unwind ladder: each label undoes one acquisition step and falls
	 * through to the labels for the steps taken before it.
	 */
err_set_full:
	nft_setelem_remove(ctx->net, set, elem.priv);
err_element_clash:
	kfree(trans);
err_elem_free:
	nf_tables_set_elem_destroy(ctx, set, elem.priv);
err_parse_data:
	if (nla[NFTA_SET_ELEM_DATA] != NULL)
		nft_data_release(&elem.data.val, desc.type);
err_parse_key_end:
	if (obj)
		nft_use_dec_restore(&obj->use);

	nft_data_release(&elem.key_end.val, NFT_DATA_VALUE);
err_parse_key:
	nft_data_release(&elem.key.val, NFT_DATA_VALUE);
err_set_elem_expr:
	for (i = 0; i < num_exprs && expr_array[i]; i++)
		nft_expr_destroy(ctx, expr_array[i]);
err_set_elem_expr_clone:
	return err;
}
7622
nf_tables_newsetelem(struct sk_buff * skb,const struct nfnl_info * info,const struct nlattr * const nla[])7623 static int nf_tables_newsetelem(struct sk_buff *skb,
7624 const struct nfnl_info *info,
7625 const struct nlattr * const nla[])
7626 {
7627 struct netlink_ext_ack *extack = info->extack;
7628 u8 genmask = nft_genmask_next(info->net);
7629 u8 family = info->nfmsg->nfgen_family;
7630 struct net *net = info->net;
7631 const struct nlattr *attr;
7632 struct nft_table *table;
7633 struct nft_set *set;
7634 struct nft_ctx ctx;
7635 int rem, err;
7636
7637 if (nla[NFTA_SET_ELEM_LIST_ELEMENTS] == NULL)
7638 return -EINVAL;
7639
7640 table = nft_table_lookup(net, nla[NFTA_SET_ELEM_LIST_TABLE], family,
7641 genmask, NETLINK_CB(skb).portid);
7642 if (IS_ERR(table)) {
7643 NL_SET_BAD_ATTR(extack, nla[NFTA_SET_ELEM_LIST_TABLE]);
7644 return PTR_ERR(table);
7645 }
7646
7647 set = nft_set_lookup_global(net, table, nla[NFTA_SET_ELEM_LIST_SET],
7648 nla[NFTA_SET_ELEM_LIST_SET_ID], genmask);
7649 if (IS_ERR(set)) {
7650 NL_SET_BAD_ATTR(extack, nla[NFTA_SET_ELEM_LIST_SET]);
7651 return PTR_ERR(set);
7652 }
7653
7654 if (!list_empty(&set->bindings) &&
7655 (set->flags & (NFT_SET_CONSTANT | NFT_SET_ANONYMOUS)))
7656 return -EBUSY;
7657
7658 nft_ctx_init(&ctx, net, skb, info->nlh, family, table, NULL, nla);
7659
7660 nla_for_each_nested(attr, nla[NFTA_SET_ELEM_LIST_ELEMENTS], rem) {
7661 err = nft_add_set_elem(&ctx, set, attr, info->nlh->nlmsg_flags);
7662 if (err < 0) {
7663 NL_SET_BAD_ATTR(extack, attr);
7664 return err;
7665 }
7666 }
7667
7668 if (table->validate_state == NFT_VALIDATE_DO)
7669 return nft_table_validate(net, table);
7670
7671 return 0;
7672 }
7673
7674 /**
7675 * nft_data_hold - hold a nft_data item
7676 *
7677 * @data: struct nft_data to release
7678 * @type: type of data
7679 *
7680 * Hold a nft_data item. NFT_DATA_VALUE types can be silently discarded,
7681 * NFT_DATA_VERDICT bumps the reference to chains in case of NFT_JUMP and
7682 * NFT_GOTO verdicts. This function must be called on active data objects
7683 * from the second phase of the commit protocol.
7684 */
nft_data_hold(const struct nft_data * data,enum nft_data_types type)7685 void nft_data_hold(const struct nft_data *data, enum nft_data_types type)
7686 {
7687 struct nft_chain *chain;
7688
7689 if (type == NFT_DATA_VERDICT) {
7690 switch (data->verdict.code) {
7691 case NFT_JUMP:
7692 case NFT_GOTO:
7693 chain = data->verdict.chain;
7694 nft_use_inc_restore(&chain->use);
7695 break;
7696 }
7697 }
7698 }
7699
nft_setelem_active_next(const struct net * net,const struct nft_set * set,struct nft_elem_priv * elem_priv)7700 static int nft_setelem_active_next(const struct net *net,
7701 const struct nft_set *set,
7702 struct nft_elem_priv *elem_priv)
7703 {
7704 const struct nft_set_ext *ext = nft_set_elem_ext(set, elem_priv);
7705 u8 genmask = nft_genmask_next(net);
7706
7707 return nft_set_elem_active(ext, genmask);
7708 }
7709
nft_setelem_data_activate(const struct net * net,const struct nft_set * set,struct nft_elem_priv * elem_priv)7710 static void nft_setelem_data_activate(const struct net *net,
7711 const struct nft_set *set,
7712 struct nft_elem_priv *elem_priv)
7713 {
7714 const struct nft_set_ext *ext = nft_set_elem_ext(set, elem_priv);
7715
7716 if (nft_set_ext_exists(ext, NFT_SET_EXT_DATA))
7717 nft_data_hold(nft_set_ext_data(ext), set->dtype);
7718 if (nft_set_ext_exists(ext, NFT_SET_EXT_OBJREF))
7719 nft_use_inc_restore(&(*nft_set_ext_obj(ext))->use);
7720 }
7721
nft_setelem_data_deactivate(const struct net * net,const struct nft_set * set,struct nft_elem_priv * elem_priv)7722 void nft_setelem_data_deactivate(const struct net *net,
7723 const struct nft_set *set,
7724 struct nft_elem_priv *elem_priv)
7725 {
7726 const struct nft_set_ext *ext = nft_set_elem_ext(set, elem_priv);
7727
7728 if (nft_set_ext_exists(ext, NFT_SET_EXT_DATA))
7729 nft_data_release(nft_set_ext_data(ext), set->dtype);
7730 if (nft_set_ext_exists(ext, NFT_SET_EXT_OBJREF))
7731 nft_use_dec(&(*nft_set_ext_obj(ext))->use);
7732 }
7733
7734 /* similar to nft_trans_elems_remove, but called from abort path to undo newsetelem.
7735 * No notifications and no ndeact changes.
7736 *
7737 * Returns true if set had been added to (i.e., elements need to be removed again).
7738 */
nft_trans_elems_new_abort(const struct nft_ctx * ctx,struct nft_trans_elem * te)7739 static bool nft_trans_elems_new_abort(const struct nft_ctx *ctx,
7740 struct nft_trans_elem *te)
7741 {
7742 bool removed = false;
7743 int i;
7744
7745 for (i = 0; i < te->nelems; i++) {
7746 if (te->elems[i].update) {
7747 kfree(te->elems[i].update);
7748 te->elems[i].update = NULL;
7749 /* Update request, so do not release this element */
7750 te->elems[i].priv = NULL;
7751 continue;
7752 }
7753
7754 if (!te->set->ops->abort || nft_setelem_is_catchall(te->set, te->elems[i].priv))
7755 nft_setelem_remove(ctx->net, te->set, te->elems[i].priv);
7756
7757 if (!nft_setelem_is_catchall(te->set, te->elems[i].priv))
7758 atomic_dec(&te->set->nelems);
7759
7760 removed = true;
7761 }
7762
7763 return removed;
7764 }
7765
7766 /* Called from abort path to undo DELSETELEM/DESTROYSETELEM. */
nft_trans_elems_destroy_abort(const struct nft_ctx * ctx,const struct nft_trans_elem * te)7767 static void nft_trans_elems_destroy_abort(const struct nft_ctx *ctx,
7768 const struct nft_trans_elem *te)
7769 {
7770 int i;
7771
7772 for (i = 0; i < te->nelems; i++) {
7773 if (!nft_setelem_active_next(ctx->net, te->set, te->elems[i].priv)) {
7774 nft_setelem_data_activate(ctx->net, te->set, te->elems[i].priv);
7775 nft_setelem_activate(ctx->net, te->set, te->elems[i].priv);
7776 }
7777
7778 if (!nft_setelem_is_catchall(te->set, te->elems[i].priv))
7779 te->set->ndeact--;
7780 }
7781 }
7782
nft_del_setelem(struct nft_ctx * ctx,struct nft_set * set,const struct nlattr * attr)7783 static int nft_del_setelem(struct nft_ctx *ctx, struct nft_set *set,
7784 const struct nlattr *attr)
7785 {
7786 struct nlattr *nla[NFTA_SET_ELEM_MAX + 1];
7787 struct nft_set_ext_tmpl tmpl;
7788 struct nft_set_elem elem;
7789 struct nft_set_ext *ext;
7790 struct nft_trans *trans;
7791 u32 flags = 0;
7792 int err;
7793
7794 err = nla_parse_nested_deprecated(nla, NFTA_SET_ELEM_MAX, attr,
7795 nft_set_elem_policy, NULL);
7796 if (err < 0)
7797 return err;
7798
7799 err = nft_setelem_parse_flags(set, nla[NFTA_SET_ELEM_FLAGS], &flags);
7800 if (err < 0)
7801 return err;
7802
7803 if (!nla[NFTA_SET_ELEM_KEY] && !(flags & NFT_SET_ELEM_CATCHALL))
7804 return -EINVAL;
7805
7806 if (!nft_setelem_valid_key_end(set, nla, flags))
7807 return -EINVAL;
7808
7809 nft_set_ext_prepare(&tmpl);
7810
7811 if (flags != 0) {
7812 err = nft_set_ext_add(&tmpl, NFT_SET_EXT_FLAGS);
7813 if (err < 0)
7814 return err;
7815 }
7816
7817 if (nla[NFTA_SET_ELEM_KEY]) {
7818 err = nft_setelem_parse_key(ctx, set, &elem.key.val,
7819 nla[NFTA_SET_ELEM_KEY]);
7820 if (err < 0)
7821 return err;
7822
7823 err = nft_set_ext_add_length(&tmpl, NFT_SET_EXT_KEY, set->klen);
7824 if (err < 0)
7825 goto fail_elem;
7826 }
7827
7828 if (nla[NFTA_SET_ELEM_KEY_END]) {
7829 err = nft_setelem_parse_key(ctx, set, &elem.key_end.val,
7830 nla[NFTA_SET_ELEM_KEY_END]);
7831 if (err < 0)
7832 goto fail_elem;
7833
7834 err = nft_set_ext_add_length(&tmpl, NFT_SET_EXT_KEY_END, set->klen);
7835 if (err < 0)
7836 goto fail_elem_key_end;
7837 }
7838
7839 err = -ENOMEM;
7840 elem.priv = nft_set_elem_init(set, &tmpl, elem.key.val.data,
7841 elem.key_end.val.data, NULL, 0, 0,
7842 GFP_KERNEL_ACCOUNT);
7843 if (IS_ERR(elem.priv)) {
7844 err = PTR_ERR(elem.priv);
7845 goto fail_elem_key_end;
7846 }
7847
7848 ext = nft_set_elem_ext(set, elem.priv);
7849 if (flags)
7850 *nft_set_ext_flags(ext) = flags;
7851
7852 trans = nft_trans_elem_alloc(ctx, NFT_MSG_DELSETELEM, set);
7853 if (trans == NULL)
7854 goto fail_trans;
7855
7856 err = nft_setelem_deactivate(ctx->net, set, &elem, flags);
7857 if (err < 0)
7858 goto fail_ops;
7859
7860 nft_setelem_data_deactivate(ctx->net, set, elem.priv);
7861
7862 nft_trans_container_elem(trans)->elems[0].priv = elem.priv;
7863 nft_trans_commit_list_add_elem(ctx->net, trans, GFP_KERNEL);
7864 return 0;
7865
7866 fail_ops:
7867 kfree(trans);
7868 fail_trans:
7869 kfree(elem.priv);
7870 fail_elem_key_end:
7871 nft_data_release(&elem.key_end.val, NFT_DATA_VALUE);
7872 fail_elem:
7873 nft_data_release(&elem.key.val, NFT_DATA_VALUE);
7874 return err;
7875 }
7876
nft_setelem_flush(const struct nft_ctx * ctx,struct nft_set * set,const struct nft_set_iter * iter,struct nft_elem_priv * elem_priv)7877 static int nft_setelem_flush(const struct nft_ctx *ctx,
7878 struct nft_set *set,
7879 const struct nft_set_iter *iter,
7880 struct nft_elem_priv *elem_priv)
7881 {
7882 const struct nft_set_ext *ext = nft_set_elem_ext(set, elem_priv);
7883 struct nft_trans *trans;
7884
7885 if (!nft_set_elem_active(ext, iter->genmask))
7886 return 0;
7887
7888 trans = nft_trans_alloc_gfp(ctx, NFT_MSG_DELSETELEM,
7889 struct_size_t(struct nft_trans_elem, elems, 1),
7890 GFP_ATOMIC);
7891 if (!trans)
7892 return -ENOMEM;
7893
7894 set->ops->flush(ctx->net, set, elem_priv);
7895 set->ndeact++;
7896
7897 nft_setelem_data_deactivate(ctx->net, set, elem_priv);
7898 nft_trans_elem_set(trans) = set;
7899 nft_trans_container_elem(trans)->nelems = 1;
7900 nft_trans_container_elem(trans)->elems[0].priv = elem_priv;
7901 nft_trans_commit_list_add_elem(ctx->net, trans, GFP_ATOMIC);
7902
7903 return 0;
7904 }
7905
__nft_set_catchall_flush(const struct nft_ctx * ctx,struct nft_set * set,struct nft_elem_priv * elem_priv)7906 static int __nft_set_catchall_flush(const struct nft_ctx *ctx,
7907 struct nft_set *set,
7908 struct nft_elem_priv *elem_priv)
7909 {
7910 struct nft_trans *trans;
7911
7912 trans = nft_trans_elem_alloc(ctx, NFT_MSG_DELSETELEM, set);
7913 if (!trans)
7914 return -ENOMEM;
7915
7916 nft_setelem_data_deactivate(ctx->net, set, elem_priv);
7917 nft_trans_container_elem(trans)->elems[0].priv = elem_priv;
7918 nft_trans_commit_list_add_elem(ctx->net, trans, GFP_KERNEL);
7919
7920 return 0;
7921 }
7922
nft_set_catchall_flush(const struct nft_ctx * ctx,struct nft_set * set)7923 static int nft_set_catchall_flush(const struct nft_ctx *ctx,
7924 struct nft_set *set)
7925 {
7926 u8 genmask = nft_genmask_next(ctx->net);
7927 struct nft_set_elem_catchall *catchall;
7928 struct nft_set_ext *ext;
7929 int ret = 0;
7930
7931 list_for_each_entry_rcu(catchall, &set->catchall_list, list,
7932 lockdep_commit_lock_is_held(ctx->net)) {
7933 ext = nft_set_elem_ext(set, catchall->elem);
7934 if (!nft_set_elem_active(ext, genmask))
7935 continue;
7936
7937 ret = __nft_set_catchall_flush(ctx, set, catchall->elem);
7938 if (ret < 0)
7939 break;
7940 nft_set_elem_change_active(ctx->net, set, ext);
7941 }
7942
7943 return ret;
7944 }
7945
/*
 * Flush a whole set: walk the backend with nft_setelem_flush() for elements
 * active in @genmask, then, if the walk reported no error, flush the
 * catchall elements as well. Returns 0 or the first error encountered.
 */
static int nft_set_flush(struct nft_ctx *ctx, struct nft_set *set, u8 genmask)
{
	struct nft_set_iter walker = {
		.genmask	= genmask,
		.type		= NFT_ITER_UPDATE,
		.fn		= nft_setelem_flush,
	};

	set->ops->walk(ctx, set, &walker);
	if (walker.err)
		return walker.err;

	walker.err = nft_set_catchall_flush(ctx, set);

	return walker.err;
}
7960
nf_tables_delsetelem(struct sk_buff * skb,const struct nfnl_info * info,const struct nlattr * const nla[])7961 static int nf_tables_delsetelem(struct sk_buff *skb,
7962 const struct nfnl_info *info,
7963 const struct nlattr * const nla[])
7964 {
7965 struct netlink_ext_ack *extack = info->extack;
7966 u8 genmask = nft_genmask_next(info->net);
7967 u8 family = info->nfmsg->nfgen_family;
7968 struct net *net = info->net;
7969 const struct nlattr *attr;
7970 struct nft_table *table;
7971 struct nft_set *set;
7972 struct nft_ctx ctx;
7973 int rem, err = 0;
7974
7975 table = nft_table_lookup(net, nla[NFTA_SET_ELEM_LIST_TABLE], family,
7976 genmask, NETLINK_CB(skb).portid);
7977 if (IS_ERR(table)) {
7978 NL_SET_BAD_ATTR(extack, nla[NFTA_SET_ELEM_LIST_TABLE]);
7979 return PTR_ERR(table);
7980 }
7981
7982 set = nft_set_lookup(net, table, nla[NFTA_SET_ELEM_LIST_SET], genmask);
7983 if (IS_ERR(set)) {
7984 NL_SET_BAD_ATTR(extack, nla[NFTA_SET_ELEM_LIST_SET]);
7985 return PTR_ERR(set);
7986 }
7987
7988 if (nft_set_is_anonymous(set))
7989 return -EOPNOTSUPP;
7990
7991 if (!list_empty(&set->bindings) && (set->flags & NFT_SET_CONSTANT))
7992 return -EBUSY;
7993
7994 nft_ctx_init(&ctx, net, skb, info->nlh, family, table, NULL, nla);
7995
7996 if (!nla[NFTA_SET_ELEM_LIST_ELEMENTS])
7997 return nft_set_flush(&ctx, set, genmask);
7998
7999 nla_for_each_nested(attr, nla[NFTA_SET_ELEM_LIST_ELEMENTS], rem) {
8000 err = nft_del_setelem(&ctx, set, attr);
8001 if (err == -ENOENT &&
8002 NFNL_MSG_TYPE(info->nlh->nlmsg_type) == NFT_MSG_DESTROYSETELEM)
8003 continue;
8004
8005 if (err < 0) {
8006 NL_SET_BAD_ATTR(extack, attr);
8007 return err;
8008 }
8009 }
8010
8011 return 0;
8012 }
8013
8014 /*
8015 * Stateful objects
8016 */
8017
8018 /**
8019 * nft_register_obj- register nf_tables stateful object type
8020 * @obj_type: object type
8021 *
8022 * Registers the object type for use with nf_tables. Returns zero on
8023 * success or a negative errno code otherwise.
8024 */
nft_register_obj(struct nft_object_type * obj_type)8025 int nft_register_obj(struct nft_object_type *obj_type)
8026 {
8027 if (obj_type->type == NFT_OBJECT_UNSPEC)
8028 return -EINVAL;
8029
8030 nfnl_lock(NFNL_SUBSYS_NFTABLES);
8031 list_add_rcu(&obj_type->list, &nf_tables_objects);
8032 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
8033 return 0;
8034 }
8035 EXPORT_SYMBOL_GPL(nft_register_obj);
8036
8037 /**
8038 * nft_unregister_obj - unregister nf_tables object type
8039 * @obj_type: object type
8040 *
8041 * Unregisters the object type for use with nf_tables.
8042 */
nft_unregister_obj(struct nft_object_type * obj_type)8043 void nft_unregister_obj(struct nft_object_type *obj_type)
8044 {
8045 nfnl_lock(NFNL_SUBSYS_NFTABLES);
8046 list_del_rcu(&obj_type->list);
8047 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
8048 }
8049 EXPORT_SYMBOL_GPL(nft_unregister_obj);
8050
/*
 * Look up a stateful object by name in @table.
 *
 * The name is copied out of @nla and used, together with @table, as the key
 * into the object name hash table. Among the entries sharing that key, the
 * first one whose type equals @objtype and which is active in @genmask is
 * returned. Warns once if neither the RCU read lock nor the commit lock is
 * held.
 *
 * Returns the object, or ERR_PTR(-ENOENT) if none matches.
 */
struct nft_object *nft_obj_lookup(const struct net *net,
				  const struct nft_table *table,
				  const struct nlattr *nla, u32 objtype,
				  u8 genmask)
{
	struct nft_object *found = ERR_PTR(-ENOENT);
	struct nft_object_hash_key key = { .table = table };
	char name[NFT_OBJ_MAXNAMELEN];
	struct rhlist_head *pos, *bucket;
	struct nft_object *obj;

	nla_strscpy(name, nla, sizeof(name));
	key.name = name;

	WARN_ON_ONCE(!rcu_read_lock_held() &&
		     !lockdep_commit_lock_is_held(net));

	rcu_read_lock();
	bucket = rhltable_lookup(&nft_objname_ht, &key, nft_objname_ht_params);
	if (bucket) {
		rhl_for_each_entry_rcu(obj, pos, bucket, rhlhead) {
			if (objtype != obj->ops->type->type)
				continue;
			if (!nft_active_genmask(obj, genmask))
				continue;

			found = obj;
			break;
		}
	}
	rcu_read_unlock();

	return found;
}
EXPORT_SYMBOL_GPL(nft_obj_lookup);
8084
/*
 * Look up a stateful object in @table by the 64-bit big-endian handle carried
 * in @nla. The object must also be of type @objtype and active in @genmask.
 *
 * Returns the object, or ERR_PTR(-ENOENT) if none matches.
 */
static struct nft_object *nft_obj_lookup_byhandle(const struct nft_table *table,
						  const struct nlattr *nla,
						  u32 objtype, u8 genmask)
{
	struct nft_object *candidate;

	list_for_each_entry(candidate, &table->objects, list) {
		if (be64_to_cpu(nla_get_be64(nla)) != candidate->handle)
			continue;
		if (objtype != candidate->ops->type->type)
			continue;
		if (!nft_active_genmask(candidate, genmask))
			continue;

		return candidate;
	}

	return ERR_PTR(-ENOENT);
}
8099
/*
 * Netlink attribute policy for stateful object messages (NFTA_OBJ_*).
 * The two name attributes are limited to their maximum name length minus
 * one; userdata is limited to NFT_USERDATA_MAXLEN bytes.
 */
static const struct nla_policy nft_obj_policy[NFTA_OBJ_MAX + 1] = {
	[NFTA_OBJ_TABLE]	= { .type = NLA_STRING,
				    .len = NFT_TABLE_MAXNAMELEN - 1 },
	[NFTA_OBJ_NAME]		= { .type = NLA_STRING,
				    .len = NFT_OBJ_MAXNAMELEN - 1 },
	[NFTA_OBJ_TYPE]		= { .type = NLA_U32 },
	[NFTA_OBJ_DATA]		= { .type = NLA_NESTED },
	[NFTA_OBJ_HANDLE]	= { .type = NLA_U64},
	[NFTA_OBJ_USERDATA]	= { .type = NLA_BINARY,
				    .len = NFT_USERDATA_MAXLEN },
};
8111
nft_obj_init(const struct nft_ctx * ctx,const struct nft_object_type * type,const struct nlattr * attr)8112 static struct nft_object *nft_obj_init(const struct nft_ctx *ctx,
8113 const struct nft_object_type *type,
8114 const struct nlattr *attr)
8115 {
8116 struct nlattr **tb;
8117 const struct nft_object_ops *ops;
8118 struct nft_object *obj;
8119 int err = -ENOMEM;
8120
8121 tb = kmalloc_array(type->maxattr + 1, sizeof(*tb), GFP_KERNEL);
8122 if (!tb)
8123 goto err1;
8124
8125 if (attr) {
8126 err = nla_parse_nested_deprecated(tb, type->maxattr, attr,
8127 type->policy, NULL);
8128 if (err < 0)
8129 goto err2;
8130 } else {
8131 memset(tb, 0, sizeof(tb[0]) * (type->maxattr + 1));
8132 }
8133
8134 if (type->select_ops) {
8135 ops = type->select_ops(ctx, (const struct nlattr * const *)tb);
8136 if (IS_ERR(ops)) {
8137 err = PTR_ERR(ops);
8138 goto err2;
8139 }
8140 } else {
8141 ops = type->ops;
8142 }
8143
8144 err = -ENOMEM;
8145 obj = kzalloc(sizeof(*obj) + ops->size, GFP_KERNEL_ACCOUNT);
8146 if (!obj)
8147 goto err2;
8148
8149 err = ops->init(ctx, (const struct nlattr * const *)tb, obj);
8150 if (err < 0)
8151 goto err3;
8152
8153 obj->ops = ops;
8154
8155 kfree(tb);
8156 return obj;
8157 err3:
8158 kfree(obj);
8159 err2:
8160 kfree(tb);
8161 err1:
8162 return ERR_PTR(err);
8163 }
8164
/*
 * Dump @obj into @skb inside a nested attribute of type @attr, using the
 * object's ->dump() callback. Returns 0 on success, -1 if the nest could not
 * be started or the callback failed.
 */
static int nft_object_dump(struct sk_buff *skb, unsigned int attr,
			   struct nft_object *obj, bool reset)
{
	struct nlattr *nest = nla_nest_start_noflag(skb, attr);

	if (nest == NULL)
		return -1;

	if (obj->ops->dump(skb, obj, reset) < 0)
		return -1;

	nla_nest_end(skb, nest);
	return 0;
}
8181
/*
 * Find a registered object type matching @objtype. A type registered for
 * NFPROTO_UNSPEC matches any @family; otherwise the family must be equal.
 * Returns the type or NULL.
 */
static const struct nft_object_type *__nft_obj_type_get(u32 objtype, u8 family)
{
	const struct nft_object_type *candidate;

	list_for_each_entry_rcu(candidate, &nf_tables_objects, list) {
		bool family_ok = candidate->family == NFPROTO_UNSPEC ||
				 candidate->family == family;

		if (family_ok && candidate->type == objtype)
			return candidate;
	}

	return NULL;
}
8196
8197 static const struct nft_object_type *
nft_obj_type_get(struct net * net,u32 objtype,u8 family)8198 nft_obj_type_get(struct net *net, u32 objtype, u8 family)
8199 {
8200 const struct nft_object_type *type;
8201
8202 rcu_read_lock();
8203 type = __nft_obj_type_get(objtype, family);
8204 if (type != NULL && try_module_get(type->owner)) {
8205 rcu_read_unlock();
8206 return type;
8207 }
8208 rcu_read_unlock();
8209
8210 lockdep_nfnl_nft_mutex_not_held();
8211 #ifdef CONFIG_MODULES
8212 if (type == NULL) {
8213 if (nft_request_module(net, "nft-obj-%u", objtype) == -EAGAIN)
8214 return ERR_PTR(-EAGAIN);
8215 }
8216 #endif
8217 return ERR_PTR(-ENOENT);
8218 }
8219
nf_tables_updobj(const struct nft_ctx * ctx,const struct nft_object_type * type,const struct nlattr * attr,struct nft_object * obj)8220 static int nf_tables_updobj(const struct nft_ctx *ctx,
8221 const struct nft_object_type *type,
8222 const struct nlattr *attr,
8223 struct nft_object *obj)
8224 {
8225 struct nft_object *newobj;
8226 struct nft_trans *trans;
8227 int err = -ENOMEM;
8228
8229 /* caller must have obtained type->owner reference. */
8230 trans = nft_trans_alloc(ctx, NFT_MSG_NEWOBJ,
8231 sizeof(struct nft_trans_obj));
8232 if (!trans)
8233 goto err_trans;
8234
8235 newobj = nft_obj_init(ctx, type, attr);
8236 if (IS_ERR(newobj)) {
8237 err = PTR_ERR(newobj);
8238 goto err_free_trans;
8239 }
8240
8241 nft_trans_obj(trans) = obj;
8242 nft_trans_obj_update(trans) = true;
8243 nft_trans_obj_newobj(trans) = newobj;
8244 nft_trans_commit_list_add_tail(ctx->net, trans);
8245
8246 return 0;
8247
8248 err_free_trans:
8249 kfree(trans);
8250 err_trans:
8251 module_put(type->owner);
8252 return err;
8253 }
8254
nf_tables_newobj(struct sk_buff * skb,const struct nfnl_info * info,const struct nlattr * const nla[])8255 static int nf_tables_newobj(struct sk_buff *skb, const struct nfnl_info *info,
8256 const struct nlattr * const nla[])
8257 {
8258 struct netlink_ext_ack *extack = info->extack;
8259 u8 genmask = nft_genmask_next(info->net);
8260 u8 family = info->nfmsg->nfgen_family;
8261 const struct nft_object_type *type;
8262 struct net *net = info->net;
8263 struct nft_table *table;
8264 struct nft_object *obj;
8265 struct nft_ctx ctx;
8266 u32 objtype;
8267 int err;
8268
8269 if (!nla[NFTA_OBJ_TYPE] ||
8270 !nla[NFTA_OBJ_NAME] ||
8271 !nla[NFTA_OBJ_DATA])
8272 return -EINVAL;
8273
8274 table = nft_table_lookup(net, nla[NFTA_OBJ_TABLE], family, genmask,
8275 NETLINK_CB(skb).portid);
8276 if (IS_ERR(table)) {
8277 NL_SET_BAD_ATTR(extack, nla[NFTA_OBJ_TABLE]);
8278 return PTR_ERR(table);
8279 }
8280
8281 objtype = ntohl(nla_get_be32(nla[NFTA_OBJ_TYPE]));
8282 obj = nft_obj_lookup(net, table, nla[NFTA_OBJ_NAME], objtype, genmask);
8283 if (IS_ERR(obj)) {
8284 err = PTR_ERR(obj);
8285 if (err != -ENOENT) {
8286 NL_SET_BAD_ATTR(extack, nla[NFTA_OBJ_NAME]);
8287 return err;
8288 }
8289 } else {
8290 if (info->nlh->nlmsg_flags & NLM_F_EXCL) {
8291 NL_SET_BAD_ATTR(extack, nla[NFTA_OBJ_NAME]);
8292 return -EEXIST;
8293 }
8294 if (info->nlh->nlmsg_flags & NLM_F_REPLACE)
8295 return -EOPNOTSUPP;
8296
8297 if (!obj->ops->update)
8298 return 0;
8299
8300 type = nft_obj_type_get(net, objtype, family);
8301 if (WARN_ON_ONCE(IS_ERR(type)))
8302 return PTR_ERR(type);
8303
8304 nft_ctx_init(&ctx, net, skb, info->nlh, family, table, NULL, nla);
8305
8306 /* type->owner reference is put when transaction object is released. */
8307 return nf_tables_updobj(&ctx, type, nla[NFTA_OBJ_DATA], obj);
8308 }
8309
8310 nft_ctx_init(&ctx, net, skb, info->nlh, family, table, NULL, nla);
8311
8312 if (!nft_use_inc(&table->use))
8313 return -EMFILE;
8314
8315 type = nft_obj_type_get(net, objtype, family);
8316 if (IS_ERR(type)) {
8317 err = PTR_ERR(type);
8318 goto err_type;
8319 }
8320
8321 obj = nft_obj_init(&ctx, type, nla[NFTA_OBJ_DATA]);
8322 if (IS_ERR(obj)) {
8323 err = PTR_ERR(obj);
8324 goto err_init;
8325 }
8326 obj->key.table = table;
8327 obj->handle = nf_tables_alloc_handle(table);
8328
8329 obj->key.name = nla_strdup(nla[NFTA_OBJ_NAME], GFP_KERNEL_ACCOUNT);
8330 if (!obj->key.name) {
8331 err = -ENOMEM;
8332 goto err_strdup;
8333 }
8334
8335 if (nla[NFTA_OBJ_USERDATA]) {
8336 obj->udata = nla_memdup(nla[NFTA_OBJ_USERDATA], GFP_KERNEL_ACCOUNT);
8337 if (obj->udata == NULL)
8338 goto err_userdata;
8339
8340 obj->udlen = nla_len(nla[NFTA_OBJ_USERDATA]);
8341 }
8342
8343 err = nft_trans_obj_add(&ctx, NFT_MSG_NEWOBJ, obj);
8344 if (err < 0)
8345 goto err_trans;
8346
8347 err = rhltable_insert(&nft_objname_ht, &obj->rhlhead,
8348 nft_objname_ht_params);
8349 if (err < 0)
8350 goto err_obj_ht;
8351
8352 list_add_tail_rcu(&obj->list, &table->objects);
8353
8354 return 0;
8355 err_obj_ht:
8356 /* queued in transaction log */
8357 INIT_LIST_HEAD(&obj->list);
8358 return err;
8359 err_trans:
8360 kfree(obj->udata);
8361 err_userdata:
8362 kfree(obj->key.name);
8363 err_strdup:
8364 if (obj->ops->destroy)
8365 obj->ops->destroy(&ctx, obj);
8366 kfree(obj);
8367 err_init:
8368 module_put(type->owner);
8369 err_type:
8370 nft_use_dec_restore(&table->use);
8371
8372 return err;
8373 }
8374
/*
 * Serialise one stateful object into @skb as a netlink message of type
 * @event.
 *
 * Delete/destroy events only carry the identifying attributes (table, name,
 * type, handle); every other event additionally carries the use counter, the
 * object data (dumped with @reset forwarded to nft_object_dump()) and the
 * optional userdata blob.
 *
 * Returns 0 on success, -1 if the message could not be built; in that case
 * the partially written message is trimmed from @skb.
 */
static int nf_tables_fill_obj_info(struct sk_buff *skb, struct net *net,
				   u32 portid, u32 seq, int event, u32 flags,
				   int family, const struct nft_table *table,
				   struct nft_object *obj, bool reset)
{
	const bool deleting = event == NFT_MSG_DELOBJ ||
			      event == NFT_MSG_DESTROYOBJ;
	struct nlmsghdr *hdr;

	hdr = nfnl_msg_put(skb, portid, seq,
			   nfnl_msg_type(NFNL_SUBSYS_NFTABLES, event),
			   flags, family, NFNETLINK_V0, nft_base_seq(net));
	if (!hdr)
		goto cancel;

	/* Identifying attributes, present in every message. */
	if (nla_put_string(skb, NFTA_OBJ_TABLE, table->name))
		goto cancel;
	if (nla_put_string(skb, NFTA_OBJ_NAME, obj->key.name))
		goto cancel;
	if (nla_put_be32(skb, NFTA_OBJ_TYPE, htonl(obj->ops->type->type)))
		goto cancel;
	if (nla_put_be64(skb, NFTA_OBJ_HANDLE, cpu_to_be64(obj->handle),
			 NFTA_OBJ_PAD))
		goto cancel;

	if (!deleting) {
		if (nla_put_be32(skb, NFTA_OBJ_USE, htonl(obj->use)))
			goto cancel;
		if (nft_object_dump(skb, NFTA_OBJ_DATA, obj, reset))
			goto cancel;
		if (obj->udata &&
		    nla_put(skb, NFTA_OBJ_USERDATA, obj->udlen, obj->udata))
			goto cancel;
	}

	nlmsg_end(skb, hdr);
	return 0;

cancel:
	nlmsg_trim(skb, hdr);
	return -1;
}
8416
audit_log_obj_reset(const struct nft_table * table,unsigned int base_seq,unsigned int nentries)8417 static void audit_log_obj_reset(const struct nft_table *table,
8418 unsigned int base_seq, unsigned int nentries)
8419 {
8420 char *buf = kasprintf(GFP_ATOMIC, "%s:%u", table->name, base_seq);
8421
8422 audit_log_nfcfg(buf, table->family, nentries,
8423 AUDIT_NFT_OP_OBJ_RESET, GFP_ATOMIC);
8424 kfree(buf);
8425 }
8426
/* Per-dump state for object dumps; stored in place inside cb->ctx. */
struct nft_obj_dump_ctx {
	/* Running object index at which the next dump call resumes. */
	unsigned int	s_idx;
	/* Optional table name filter (heap copy, freed by the done callback). */
	char		*table;
	/* Object type filter; NFT_OBJECT_UNSPEC matches every type. */
	u32		type;
	/* Forwarded to nf_tables_fill_obj_info(); also enables reset audit logging. */
	bool		reset;
};
8433
nf_tables_dump_obj(struct sk_buff * skb,struct netlink_callback * cb)8434 static int nf_tables_dump_obj(struct sk_buff *skb, struct netlink_callback *cb)
8435 {
8436 const struct nfgenmsg *nfmsg = nlmsg_data(cb->nlh);
8437 struct nft_obj_dump_ctx *ctx = (void *)cb->ctx;
8438 struct net *net = sock_net(skb->sk);
8439 int family = nfmsg->nfgen_family;
8440 struct nftables_pernet *nft_net;
8441 const struct nft_table *table;
8442 unsigned int entries = 0;
8443 struct nft_object *obj;
8444 unsigned int idx = 0;
8445 int rc = 0;
8446
8447 rcu_read_lock();
8448 nft_net = nft_pernet(net);
8449 cb->seq = READ_ONCE(nft_net->base_seq);
8450
8451 list_for_each_entry_rcu(table, &nft_net->tables, list) {
8452 if (family != NFPROTO_UNSPEC && family != table->family)
8453 continue;
8454
8455 entries = 0;
8456 list_for_each_entry_rcu(obj, &table->objects, list) {
8457 if (!nft_is_active(net, obj))
8458 goto cont;
8459 if (idx < ctx->s_idx)
8460 goto cont;
8461 if (ctx->table && strcmp(ctx->table, table->name))
8462 goto cont;
8463 if (ctx->type != NFT_OBJECT_UNSPEC &&
8464 obj->ops->type->type != ctx->type)
8465 goto cont;
8466
8467 rc = nf_tables_fill_obj_info(skb, net,
8468 NETLINK_CB(cb->skb).portid,
8469 cb->nlh->nlmsg_seq,
8470 NFT_MSG_NEWOBJ,
8471 NLM_F_MULTI | NLM_F_APPEND,
8472 table->family, table,
8473 obj, ctx->reset);
8474 if (rc < 0)
8475 break;
8476
8477 entries++;
8478 nl_dump_check_consistent(cb, nlmsg_hdr(skb));
8479 cont:
8480 idx++;
8481 }
8482 if (ctx->reset && entries)
8483 audit_log_obj_reset(table, nft_net->base_seq, entries);
8484 if (rc < 0)
8485 break;
8486 }
8487 rcu_read_unlock();
8488
8489 ctx->s_idx = idx;
8490 return skb->len;
8491 }
8492
nf_tables_dumpreset_obj(struct sk_buff * skb,struct netlink_callback * cb)8493 static int nf_tables_dumpreset_obj(struct sk_buff *skb,
8494 struct netlink_callback *cb)
8495 {
8496 struct nftables_pernet *nft_net = nft_pernet(sock_net(skb->sk));
8497 int ret;
8498
8499 mutex_lock(&nft_net->commit_mutex);
8500 ret = nf_tables_dump_obj(skb, cb);
8501 mutex_unlock(&nft_net->commit_mutex);
8502
8503 return ret;
8504 }
8505
nf_tables_dump_obj_start(struct netlink_callback * cb)8506 static int nf_tables_dump_obj_start(struct netlink_callback *cb)
8507 {
8508 struct nft_obj_dump_ctx *ctx = (void *)cb->ctx;
8509 const struct nlattr * const *nla = cb->data;
8510
8511 BUILD_BUG_ON(sizeof(*ctx) > sizeof(cb->ctx));
8512
8513 if (nla[NFTA_OBJ_TABLE]) {
8514 ctx->table = nla_strdup(nla[NFTA_OBJ_TABLE], GFP_ATOMIC);
8515 if (!ctx->table)
8516 return -ENOMEM;
8517 }
8518
8519 if (nla[NFTA_OBJ_TYPE])
8520 ctx->type = ntohl(nla_get_be32(nla[NFTA_OBJ_TYPE]));
8521
8522 return 0;
8523 }
8524
nf_tables_dumpreset_obj_start(struct netlink_callback * cb)8525 static int nf_tables_dumpreset_obj_start(struct netlink_callback *cb)
8526 {
8527 struct nft_obj_dump_ctx *ctx = (void *)cb->ctx;
8528
8529 ctx->reset = true;
8530
8531 return nf_tables_dump_obj_start(cb);
8532 }
8533
nf_tables_dump_obj_done(struct netlink_callback * cb)8534 static int nf_tables_dump_obj_done(struct netlink_callback *cb)
8535 {
8536 struct nft_obj_dump_ctx *ctx = (void *)cb->ctx;
8537
8538 kfree(ctx->table);
8539
8540 return 0;
8541 }
8542
8543 /* Caller must hold rcu read lock or transaction mutex */
8544 static struct sk_buff *
nf_tables_getobj_single(u32 portid,const struct nfnl_info * info,const struct nlattr * const nla[],bool reset)8545 nf_tables_getobj_single(u32 portid, const struct nfnl_info *info,
8546 const struct nlattr * const nla[], bool reset)
8547 {
8548 struct netlink_ext_ack *extack = info->extack;
8549 u8 genmask = nft_genmask_cur(info->net);
8550 u8 family = info->nfmsg->nfgen_family;
8551 const struct nft_table *table;
8552 struct net *net = info->net;
8553 struct nft_object *obj;
8554 struct sk_buff *skb2;
8555 u32 objtype;
8556 int err;
8557
8558 if (!nla[NFTA_OBJ_NAME] ||
8559 !nla[NFTA_OBJ_TYPE])
8560 return ERR_PTR(-EINVAL);
8561
8562 table = nft_table_lookup(net, nla[NFTA_OBJ_TABLE], family, genmask, 0);
8563 if (IS_ERR(table)) {
8564 NL_SET_BAD_ATTR(extack, nla[NFTA_OBJ_TABLE]);
8565 return ERR_CAST(table);
8566 }
8567
8568 objtype = ntohl(nla_get_be32(nla[NFTA_OBJ_TYPE]));
8569 obj = nft_obj_lookup(net, table, nla[NFTA_OBJ_NAME], objtype, genmask);
8570 if (IS_ERR(obj)) {
8571 NL_SET_BAD_ATTR(extack, nla[NFTA_OBJ_NAME]);
8572 return ERR_CAST(obj);
8573 }
8574
8575 skb2 = alloc_skb(NLMSG_GOODSIZE, GFP_ATOMIC);
8576 if (!skb2)
8577 return ERR_PTR(-ENOMEM);
8578
8579 err = nf_tables_fill_obj_info(skb2, net, portid,
8580 info->nlh->nlmsg_seq, NFT_MSG_NEWOBJ, 0,
8581 family, table, obj, reset);
8582 if (err < 0) {
8583 kfree_skb(skb2);
8584 return ERR_PTR(err);
8585 }
8586
8587 return skb2;
8588 }
8589
nf_tables_getobj(struct sk_buff * skb,const struct nfnl_info * info,const struct nlattr * const nla[])8590 static int nf_tables_getobj(struct sk_buff *skb, const struct nfnl_info *info,
8591 const struct nlattr * const nla[])
8592 {
8593 u32 portid = NETLINK_CB(skb).portid;
8594 struct sk_buff *skb2;
8595
8596 if (info->nlh->nlmsg_flags & NLM_F_DUMP) {
8597 struct netlink_dump_control c = {
8598 .start = nf_tables_dump_obj_start,
8599 .dump = nf_tables_dump_obj,
8600 .done = nf_tables_dump_obj_done,
8601 .module = THIS_MODULE,
8602 .data = (void *)nla,
8603 };
8604
8605 return nft_netlink_dump_start_rcu(info->sk, skb, info->nlh, &c);
8606 }
8607
8608 skb2 = nf_tables_getobj_single(portid, info, nla, false);
8609 if (IS_ERR(skb2))
8610 return PTR_ERR(skb2);
8611
8612 return nfnetlink_unicast(skb2, info->net, portid);
8613 }
8614
/*
 * Netlink handler for the get-and-reset variant of the object get request.
 *
 * With NLM_F_DUMP a dump is started using the reset start/dump callbacks.
 * Otherwise a single object is fetched with reset == true while holding the
 * commit mutex, an AUDIT_NFT_OP_OBJ_RESET record is logged for one entry and
 * the reply is unicast to the requesting port.
 *
 * Returns 0 or a negative errno.
 */
static int nf_tables_getobj_reset(struct sk_buff *skb,
				  const struct nfnl_info *info,
				  const struct nlattr * const nla[])
{
	struct nftables_pernet *nft_net = nft_pernet(info->net);
	u32 portid = NETLINK_CB(skb).portid;
	struct net *net = info->net;
	struct sk_buff *skb2;
	char *buf;

	if (info->nlh->nlmsg_flags & NLM_F_DUMP) {
		struct netlink_dump_control c = {
			.start = nf_tables_dumpreset_obj_start,
			.dump = nf_tables_dumpreset_obj,
			.done = nf_tables_dump_obj_done,
			.module = THIS_MODULE,
			.data = (void *)nla,
		};

		return nft_netlink_dump_start_rcu(info->sk, skb, info->nlh, &c);
	}

	/*
	 * The RCU read-side section is left before taking the commit mutex
	 * and re-entered afterwards; a module reference is held across that
	 * window.
	 * NOTE(review): this implies the handler is entered with
	 * rcu_read_lock() held - confirm against the callback registration.
	 */
	if (!try_module_get(THIS_MODULE))
		return -EINVAL;
	rcu_read_unlock();
	mutex_lock(&nft_net->commit_mutex);
	skb2 = nf_tables_getobj_single(portid, info, nla, true);
	mutex_unlock(&nft_net->commit_mutex);
	rcu_read_lock();
	module_put(THIS_MODULE);

	if (IS_ERR(skb2))
		return PTR_ERR(skb2);

	/* Audit record name is "<table name from the request>:<base_seq>". */
	buf = kasprintf(GFP_ATOMIC, "%.*s:%u",
			nla_len(nla[NFTA_OBJ_TABLE]),
			(char *)nla_data(nla[NFTA_OBJ_TABLE]),
			nft_net->base_seq);
	audit_log_nfcfg(buf, info->nfmsg->nfgen_family, 1,
			AUDIT_NFT_OP_OBJ_RESET, GFP_ATOMIC);
	kfree(buf);

	return nfnetlink_unicast(skb2, net, portid);
}
8659
nft_obj_destroy(const struct nft_ctx * ctx,struct nft_object * obj)8660 static void nft_obj_destroy(const struct nft_ctx *ctx, struct nft_object *obj)
8661 {
8662 if (obj->ops->destroy)
8663 obj->ops->destroy(ctx, obj);
8664
8665 module_put(obj->ops->type->owner);
8666 kfree(obj->key.name);
8667 kfree(obj->udata);
8668 kfree(obj);
8669 }
8670
nf_tables_delobj(struct sk_buff * skb,const struct nfnl_info * info,const struct nlattr * const nla[])8671 static int nf_tables_delobj(struct sk_buff *skb, const struct nfnl_info *info,
8672 const struct nlattr * const nla[])
8673 {
8674 struct netlink_ext_ack *extack = info->extack;
8675 u8 genmask = nft_genmask_next(info->net);
8676 u8 family = info->nfmsg->nfgen_family;
8677 struct net *net = info->net;
8678 const struct nlattr *attr;
8679 struct nft_table *table;
8680 struct nft_object *obj;
8681 struct nft_ctx ctx;
8682 u32 objtype;
8683
8684 if (!nla[NFTA_OBJ_TYPE] ||
8685 (!nla[NFTA_OBJ_NAME] && !nla[NFTA_OBJ_HANDLE]))
8686 return -EINVAL;
8687
8688 table = nft_table_lookup(net, nla[NFTA_OBJ_TABLE], family, genmask,
8689 NETLINK_CB(skb).portid);
8690 if (IS_ERR(table)) {
8691 NL_SET_BAD_ATTR(extack, nla[NFTA_OBJ_TABLE]);
8692 return PTR_ERR(table);
8693 }
8694
8695 objtype = ntohl(nla_get_be32(nla[NFTA_OBJ_TYPE]));
8696 if (nla[NFTA_OBJ_HANDLE]) {
8697 attr = nla[NFTA_OBJ_HANDLE];
8698 obj = nft_obj_lookup_byhandle(table, attr, objtype, genmask);
8699 } else {
8700 attr = nla[NFTA_OBJ_NAME];
8701 obj = nft_obj_lookup(net, table, attr, objtype, genmask);
8702 }
8703
8704 if (IS_ERR(obj)) {
8705 if (PTR_ERR(obj) == -ENOENT &&
8706 NFNL_MSG_TYPE(info->nlh->nlmsg_type) == NFT_MSG_DESTROYOBJ)
8707 return 0;
8708
8709 NL_SET_BAD_ATTR(extack, attr);
8710 return PTR_ERR(obj);
8711 }
8712 if (obj->use > 0) {
8713 NL_SET_BAD_ATTR(extack, attr);
8714 return -EBUSY;
8715 }
8716
8717 nft_ctx_init(&ctx, net, skb, info->nlh, family, table, NULL, nla);
8718
8719 return nft_delobj(&ctx, obj);
8720 }
8721
8722 static void
__nft_obj_notify(struct net * net,const struct nft_table * table,struct nft_object * obj,u32 portid,u32 seq,int event,u16 flags,int family,int report,gfp_t gfp)8723 __nft_obj_notify(struct net *net, const struct nft_table *table,
8724 struct nft_object *obj, u32 portid, u32 seq, int event,
8725 u16 flags, int family, int report, gfp_t gfp)
8726 {
8727 struct nftables_pernet *nft_net = nft_pernet(net);
8728 struct sk_buff *skb;
8729 int err;
8730
8731 if (!report &&
8732 !nfnetlink_has_listeners(net, NFNLGRP_NFTABLES))
8733 return;
8734
8735 skb = nlmsg_new(NLMSG_GOODSIZE, gfp);
8736 if (skb == NULL)
8737 goto err;
8738
8739 err = nf_tables_fill_obj_info(skb, net, portid, seq, event,
8740 flags & (NLM_F_CREATE | NLM_F_EXCL),
8741 family, table, obj, false);
8742 if (err < 0) {
8743 kfree_skb(skb);
8744 goto err;
8745 }
8746
8747 nft_notify_enqueue(skb, report, &nft_net->notify_list);
8748 return;
8749 err:
8750 nfnetlink_set_err(net, portid, NFNLGRP_NFTABLES, -ENOBUFS);
8751 }
8752
/*
 * Exported object notification helper: log an audit record for the object
 * (register for NFT_MSG_NEWOBJ, unregister for any other event), then send
 * the netlink notification.
 *
 * The audit record name is "<table name>:<base_seq>" and the object handle
 * is passed as the entry count argument.
 */
void nft_obj_notify(struct net *net, const struct nft_table *table,
		    struct nft_object *obj, u32 portid, u32 seq, int event,
		    u16 flags, int family, int report, gfp_t gfp)
{
	struct nftables_pernet *nft_net = nft_pernet(net);
	enum audit_nfcfgop op;
	char *name;

	name = kasprintf(gfp, "%s:%u", table->name, nft_net->base_seq);

	if (event == NFT_MSG_NEWOBJ)
		op = AUDIT_NFT_OP_OBJ_REGISTER;
	else
		op = AUDIT_NFT_OP_OBJ_UNREGISTER;

	audit_log_nfcfg(name, family, obj->handle, op, gfp);
	kfree(name);

	__nft_obj_notify(net, table, obj, portid, seq, event,
			 flags, family, report, gfp);
}
EXPORT_SYMBOL_GPL(nft_obj_notify);
8774
nf_tables_obj_notify(const struct nft_ctx * ctx,struct nft_object * obj,int event)8775 static void nf_tables_obj_notify(const struct nft_ctx *ctx,
8776 struct nft_object *obj, int event)
8777 {
8778 __nft_obj_notify(ctx->net, ctx->table, obj, ctx->portid,
8779 ctx->seq, event, ctx->flags, ctx->family,
8780 ctx->report, GFP_KERNEL);
8781 }
8782
8783 /*
8784 * Flow tables
8785 */
nft_register_flowtable_type(struct nf_flowtable_type * type)8786 void nft_register_flowtable_type(struct nf_flowtable_type *type)
8787 {
8788 nfnl_lock(NFNL_SUBSYS_NFTABLES);
8789 list_add_tail_rcu(&type->list, &nf_tables_flowtables);
8790 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
8791 }
8792 EXPORT_SYMBOL_GPL(nft_register_flowtable_type);
8793
nft_unregister_flowtable_type(struct nf_flowtable_type * type)8794 void nft_unregister_flowtable_type(struct nf_flowtable_type *type)
8795 {
8796 nfnl_lock(NFNL_SUBSYS_NFTABLES);
8797 list_del_rcu(&type->list);
8798 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
8799 }
8800 EXPORT_SYMBOL_GPL(nft_unregister_flowtable_type);
8801
/*
 * Netlink attribute policy for the top-level NFTA_FLOWTABLE_* attributes.
 * Table and flowtable names are strings of at most NFT_NAME_MAXLEN - 1
 * bytes; the hook description is a nested attribute.
 */
static const struct nla_policy nft_flowtable_policy[NFTA_FLOWTABLE_MAX + 1] = {
	[NFTA_FLOWTABLE_TABLE]		= { .type = NLA_STRING,
					    .len = NFT_NAME_MAXLEN - 1 },
	[NFTA_FLOWTABLE_NAME]		= { .type = NLA_STRING,
					    .len = NFT_NAME_MAXLEN - 1 },
	[NFTA_FLOWTABLE_HOOK]		= { .type = NLA_NESTED },
	[NFTA_FLOWTABLE_HANDLE]		= { .type = NLA_U64 },
	[NFTA_FLOWTABLE_FLAGS]		= { .type = NLA_U32 },
};
8811
/*
 * Find the flowtable of @table whose name equals the string attribute @nla
 * and which is active in generation @genmask.
 *
 * The list walk is annotated as valid either under RCU or with the commit
 * lock of @net held. Returns the flowtable or ERR_PTR(-ENOENT).
 */
struct nft_flowtable *nft_flowtable_lookup(const struct net *net,
					   const struct nft_table *table,
					   const struct nlattr *nla, u8 genmask)
{
	struct nft_flowtable *ft;

	list_for_each_entry_rcu(ft, &table->flowtables, list,
				lockdep_commit_lock_is_held(net)) {
		if (nla_strcmp(nla, ft->name))
			continue;
		if (nft_active_genmask(ft, genmask))
			return ft;
	}

	return ERR_PTR(-ENOENT);
}
EXPORT_SYMBOL_GPL(nft_flowtable_lookup);
8827
nf_tables_deactivate_flowtable(const struct nft_ctx * ctx,struct nft_flowtable * flowtable,enum nft_trans_phase phase)8828 void nf_tables_deactivate_flowtable(const struct nft_ctx *ctx,
8829 struct nft_flowtable *flowtable,
8830 enum nft_trans_phase phase)
8831 {
8832 switch (phase) {
8833 case NFT_TRANS_PREPARE_ERROR:
8834 case NFT_TRANS_PREPARE:
8835 case NFT_TRANS_ABORT:
8836 case NFT_TRANS_RELEASE:
8837 nft_use_dec(&flowtable->use);
8838 fallthrough;
8839 default:
8840 return;
8841 }
8842 }
8843 EXPORT_SYMBOL_GPL(nf_tables_deactivate_flowtable);
8844
8845 static struct nft_flowtable *
nft_flowtable_lookup_byhandle(const struct nft_table * table,const struct nlattr * nla,u8 genmask)8846 nft_flowtable_lookup_byhandle(const struct nft_table *table,
8847 const struct nlattr *nla, u8 genmask)
8848 {
8849 struct nft_flowtable *flowtable;
8850
8851 list_for_each_entry(flowtable, &table->flowtables, list) {
8852 if (be64_to_cpu(nla_get_be64(nla)) == flowtable->handle &&
8853 nft_active_genmask(flowtable, genmask))
8854 return flowtable;
8855 }
8856 return ERR_PTR(-ENOENT);
8857 }
8858
/* Result of parsing the nested NFTA_FLOWTABLE_HOOK attribute. */
struct nft_flowtable_hook {
	/* Hook number the flowtable attaches to. */
	u32			num;
	/* Hook priority. */
	int			priority;
	/* List of struct nft_hook entries parsed from the device list. */
	struct list_head	list;
};
8864
/* Netlink attribute policy for the attributes nested in NFTA_FLOWTABLE_HOOK. */
static const struct nla_policy nft_flowtable_hook_policy[NFTA_FLOWTABLE_HOOK_MAX + 1] = {
	[NFTA_FLOWTABLE_HOOK_NUM]	= { .type = NLA_U32 },
	[NFTA_FLOWTABLE_HOOK_PRIORITY]	= { .type = NLA_U32 },
	[NFTA_FLOWTABLE_HOOK_DEVS]	= { .type = NLA_NESTED },
};
8870
/*
 * Parse the nested NFTA_FLOWTABLE_HOOK attribute into @flowtable_hook.
 *
 * @add == true (new flowtable): hook number and priority are mandatory
 * (-ENOENT otherwise) and the hook number must be NF_NETDEV_INGRESS
 * (-EOPNOTSUPP otherwise).
 *
 * @add == false (existing flowtable): hook number and priority are optional
 * but, when given, must match the flowtable's current values (-EOPNOTSUPP
 * otherwise); the result always carries the flowtable's current values.
 *
 * Devices listed in NFTA_FLOWTABLE_HOOK_DEVS are parsed into
 * flowtable_hook->list, and every hook ops of every parsed hook is set up
 * to point at this flowtable.
 *
 * Returns the last parser status (0 on success) or a negative errno.
 */
static int nft_flowtable_parse_hook(const struct nft_ctx *ctx,
				    const struct nlattr * const nla[],
				    struct nft_flowtable_hook *flowtable_hook,
				    struct nft_flowtable *flowtable,
				    struct netlink_ext_ack *extack, bool add)
{
	struct nlattr *tb[NFTA_FLOWTABLE_HOOK_MAX + 1];
	const struct nlattr *num_attr, *prio_attr;
	struct nf_hook_ops *ops;
	struct nft_hook *hook;
	int hooknum, priority;
	int err;

	INIT_LIST_HEAD(&flowtable_hook->list);

	err = nla_parse_nested_deprecated(tb, NFTA_FLOWTABLE_HOOK_MAX,
					  nla[NFTA_FLOWTABLE_HOOK],
					  nft_flowtable_hook_policy, NULL);
	if (err < 0)
		return err;

	num_attr = tb[NFTA_FLOWTABLE_HOOK_NUM];
	prio_attr = tb[NFTA_FLOWTABLE_HOOK_PRIORITY];

	if (!add) {
		/* Update/delete: the hook location may not change. */
		if (num_attr) {
			hooknum = ntohl(nla_get_be32(num_attr));
			if (hooknum != flowtable->hooknum)
				return -EOPNOTSUPP;
		}

		if (prio_attr) {
			priority = ntohl(nla_get_be32(prio_attr));
			if (priority != flowtable->data.priority)
				return -EOPNOTSUPP;
		}

		flowtable_hook->priority = flowtable->data.priority;
		flowtable_hook->num = flowtable->hooknum;
	} else {
		if (!num_attr || !prio_attr) {
			NL_SET_BAD_ATTR(extack, nla[NFTA_FLOWTABLE_NAME]);
			return -ENOENT;
		}

		hooknum = ntohl(nla_get_be32(num_attr));
		if (hooknum != NF_NETDEV_INGRESS)
			return -EOPNOTSUPP;

		priority = ntohl(nla_get_be32(prio_attr));

		flowtable_hook->priority = priority;
		flowtable_hook->num = hooknum;
	}

	if (tb[NFTA_FLOWTABLE_HOOK_DEVS]) {
		err = nf_tables_parse_netdev_hooks(ctx->net,
						   tb[NFTA_FLOWTABLE_HOOK_DEVS],
						   &flowtable_hook->list,
						   extack);
		if (err < 0)
			return err;
	}

	/* Bind every parsed hook ops to this flowtable. */
	list_for_each_entry(hook, &flowtable_hook->list, list) {
		list_for_each_entry(ops, &hook->ops_list, list) {
			ops->hook_ops_type = NF_HOOK_OP_NFT_FT;
			ops->hook = flowtable->data.type->hook;
			ops->priv = &flowtable->data;
			ops->priority = flowtable_hook->priority;
			ops->hooknum = flowtable_hook->num;
			ops->pf = NFPROTO_NETDEV;
		}
	}

	return err;
}
8945
8946 /* call under rcu_read_lock */
__nft_flowtable_type_get(u8 family)8947 static const struct nf_flowtable_type *__nft_flowtable_type_get(u8 family)
8948 {
8949 const struct nf_flowtable_type *type;
8950
8951 list_for_each_entry_rcu(type, &nf_tables_flowtables, list) {
8952 if (family == type->family)
8953 return type;
8954 }
8955 return NULL;
8956 }
8957
8958 static const struct nf_flowtable_type *
nft_flowtable_type_get(struct net * net,u8 family)8959 nft_flowtable_type_get(struct net *net, u8 family)
8960 {
8961 const struct nf_flowtable_type *type;
8962
8963 rcu_read_lock();
8964 type = __nft_flowtable_type_get(family);
8965 if (type != NULL && try_module_get(type->owner)) {
8966 rcu_read_unlock();
8967 return type;
8968 }
8969 rcu_read_unlock();
8970
8971 lockdep_nfnl_nft_mutex_not_held();
8972 #ifdef CONFIG_MODULES
8973 if (type == NULL) {
8974 if (nft_request_module(net, "nf-flowtable-%u", family) == -EAGAIN)
8975 return ERR_PTR(-EAGAIN);
8976 }
8977 #endif
8978 return ERR_PTR(-ENOENT);
8979 }
8980
8981 /* Only called from error and netdev event paths. */
nft_unregister_flowtable_ops(struct net * net,struct nft_flowtable * flowtable,struct nf_hook_ops * ops)8982 static void nft_unregister_flowtable_ops(struct net *net,
8983 struct nft_flowtable *flowtable,
8984 struct nf_hook_ops *ops)
8985 {
8986 nf_unregister_net_hook(net, ops);
8987 flowtable->data.type->setup(&flowtable->data, ops->dev,
8988 FLOW_BLOCK_UNBIND);
8989 }
8990
/*
 * Unregister every hook ops of every hook on @hook_list. When
 * @release_netdev is true each hook is additionally unlinked from the list
 * and handed to nft_netdev_hook_free_rcu().
 */
static void __nft_unregister_flowtable_net_hooks(struct net *net,
						 struct nft_flowtable *flowtable,
						 struct list_head *hook_list,
						 bool release_netdev)
{
	struct nft_hook *cur, *tmp;
	struct nf_hook_ops *ops;

	list_for_each_entry_safe(cur, tmp, hook_list, list) {
		list_for_each_entry(ops, &cur->ops_list, list)
			nft_unregister_flowtable_ops(net, flowtable, ops);

		if (!release_netdev)
			continue;

		list_del(&cur->list);
		nft_netdev_hook_free_rcu(cur);
	}
}
9008
nft_unregister_flowtable_net_hooks(struct net * net,struct nft_flowtable * flowtable,struct list_head * hook_list)9009 static void nft_unregister_flowtable_net_hooks(struct net *net,
9010 struct nft_flowtable *flowtable,
9011 struct list_head *hook_list)
9012 {
9013 __nft_unregister_flowtable_net_hooks(net, flowtable, hook_list, false);
9014 }
9015
nft_register_flowtable_ops(struct net * net,struct nft_flowtable * flowtable,struct nf_hook_ops * ops)9016 static int nft_register_flowtable_ops(struct net *net,
9017 struct nft_flowtable *flowtable,
9018 struct nf_hook_ops *ops)
9019 {
9020 int err;
9021
9022 err = flowtable->data.type->setup(&flowtable->data,
9023 ops->dev, FLOW_BLOCK_BIND);
9024 if (err < 0)
9025 return err;
9026
9027 err = nf_register_net_hook(net, ops);
9028 if (!err)
9029 return 0;
9030
9031 flowtable->data.type->setup(&flowtable->data,
9032 ops->dev, FLOW_BLOCK_UNBIND);
9033 return err;
9034 }
9035
/*
 * Register every hook ops of every hook on @hook_list for @flowtable.
 *
 * Before a hook is registered, it is checked against the hook lists of all
 * flowtables of @table that are active in the next generation; a match
 * yields -EEXIST.
 *
 * On any failure the ops registered so far are unregistered again and ALL
 * hooks on @hook_list are unlinked and freed, so the list is empty when an
 * error is returned.
 *
 * Returns 0 on success or a negative errno.
 */
static int nft_register_flowtable_net_hooks(struct net *net,
					    struct nft_table *table,
					    struct list_head *hook_list,
					    struct nft_flowtable *flowtable)
{
	struct nft_hook *hook, *next;
	struct nft_flowtable *ft;
	struct nf_hook_ops *ops;
	int err, i = 0;	/* i counts the ops successfully registered so far */

	list_for_each_entry(hook, hook_list, list) {
		list_for_each_entry(ft, &table->flowtables, list) {
			if (!nft_is_active_next(net, ft))
				continue;

			if (nft_hook_list_find(&ft->hook_list, hook)) {
				err = -EEXIST;
				goto err_unregister_net_hooks;
			}
		}

		list_for_each_entry(ops, &hook->ops_list, list) {
			err = nft_register_flowtable_ops(net, flowtable, ops);
			if (err < 0)
				goto err_unregister_net_hooks;

			i++;
		}
	}

	return 0;

err_unregister_net_hooks:
	list_for_each_entry_safe(hook, next, hook_list, list) {
		list_for_each_entry(ops, &hook->ops_list, list) {
			/* Only the first i ops (in list order) were registered. */
			if (i-- <= 0)
				break;

			nft_unregister_flowtable_ops(net, flowtable, ops);
		}
		list_del_rcu(&hook->list);
		nft_netdev_hook_free_rcu(hook);
	}

	return err;
}
9082
nft_hooks_destroy(struct list_head * hook_list)9083 static void nft_hooks_destroy(struct list_head *hook_list)
9084 {
9085 struct nft_hook *hook, *next;
9086
9087 list_for_each_entry_safe(hook, next, hook_list, list) {
9088 list_del_rcu(&hook->list);
9089 nft_netdev_hook_free_rcu(hook);
9090 }
9091 }
9092
/*
 * Update an existing flowtable: add the hooks (devices) listed in the
 * request that the flowtable does not have yet.
 *
 * Steps:
 *   1. Parse the hook attribute in "update" mode (hook number and priority
 *      must match the existing flowtable).
 *   2. Drop requested hooks the flowtable already owns; fail with -EEXIST
 *      if a remaining hook is already queued by a pending flowtable update
 *      transaction for the same table.
 *   3. Validate NFTA_FLOWTABLE_FLAGS: unknown bits and any change of the
 *      hardware offload flag are rejected with -EOPNOTSUPP.
 *   4. Register the new hooks and queue an NFT_MSG_NEWFLOWTABLE update
 *      transaction that owns them.
 *
 * Returns 0 on success or a negative errno; on error every hook still on
 * the parsed list is freed.
 */
static int nft_flowtable_update(struct nft_ctx *ctx, const struct nlmsghdr *nlh,
				struct nft_flowtable *flowtable,
				struct netlink_ext_ack *extack)
{
	const struct nlattr * const *nla = ctx->nla;
	struct nft_flowtable_hook flowtable_hook;
	struct nftables_pernet *nft_net;
	struct nft_hook *hook, *next;
	struct nf_hook_ops *ops;
	struct nft_trans *trans;
	bool unregister = false;
	u32 flags;
	int err;

	err = nft_flowtable_parse_hook(ctx, nla, &flowtable_hook, flowtable,
				       extack, false);
	if (err < 0)
		return err;

	list_for_each_entry_safe(hook, next, &flowtable_hook.list, list) {
		/* Already attached to this flowtable: nothing to add. */
		if (nft_hook_list_find(&flowtable->hook_list, hook)) {
			list_del(&hook->list);
			nft_netdev_hook_free(hook);
			continue;
		}

		/* Reject hooks already queued by a pending update in this batch. */
		nft_net = nft_pernet(ctx->net);
		list_for_each_entry(trans, &nft_net->commit_list, list) {
			if (trans->msg_type != NFT_MSG_NEWFLOWTABLE ||
			    trans->table != ctx->table ||
			    !nft_trans_flowtable_update(trans))
				continue;

			if (nft_hook_list_find(&nft_trans_flowtable_hooks(trans), hook)) {
				err = -EEXIST;
				goto err_flowtable_update_hook;
			}
		}
	}

	if (nla[NFTA_FLOWTABLE_FLAGS]) {
		flags = ntohl(nla_get_be32(nla[NFTA_FLOWTABLE_FLAGS]));
		if (flags & ~NFT_FLOWTABLE_MASK) {
			err = -EOPNOTSUPP;
			goto err_flowtable_update_hook;
		}
		/* The hardware offload flag cannot be toggled by an update. */
		if ((flowtable->data.flags & NFT_FLOWTABLE_HW_OFFLOAD) ^
		    (flags & NFT_FLOWTABLE_HW_OFFLOAD)) {
			err = -EOPNOTSUPP;
			goto err_flowtable_update_hook;
		}
	} else {
		flags = flowtable->data.flags;
	}

	/* On failure this call has already unregistered and freed the hooks. */
	err = nft_register_flowtable_net_hooks(ctx->net, ctx->table,
					       &flowtable_hook.list, flowtable);
	if (err < 0)
		goto err_flowtable_update_hook;

	trans = nft_trans_alloc(ctx, NFT_MSG_NEWFLOWTABLE,
				sizeof(struct nft_trans_flowtable));
	if (!trans) {
		/* Hooks are registered at this point and must be undone. */
		unregister = true;
		err = -ENOMEM;
		goto err_flowtable_update_hook;
	}

	nft_trans_flowtable_flags(trans) = flags;
	nft_trans_flowtable(trans) = flowtable;
	nft_trans_flowtable_update(trans) = true;
	INIT_LIST_HEAD(&nft_trans_flowtable_hooks(trans));
	list_splice(&flowtable_hook.list, &nft_trans_flowtable_hooks(trans));

	nft_trans_commit_list_add_tail(ctx->net, trans);

	return 0;

err_flowtable_update_hook:
	list_for_each_entry_safe(hook, next, &flowtable_hook.list, list) {
		if (unregister) {
			list_for_each_entry(ops, &hook->ops_list, list)
				nft_unregister_flowtable_ops(ctx->net,
							     flowtable, ops);
		}
		list_del_rcu(&hook->list);
		nft_netdev_hook_free_rcu(hook);
	}

	return err;

}
9185
/*
 * Netlink handler that creates a new flowtable, or updates an existing one.
 *
 * NFTA_FLOWTABLE_TABLE, NFTA_FLOWTABLE_NAME and NFTA_FLOWTABLE_HOOK are
 * mandatory. If a flowtable with that name already exists, the request is
 * rejected with -EEXIST when NLM_F_EXCL is set and otherwise handled by
 * nft_flowtable_update().
 *
 * For a new flowtable, the table use counter is taken first; the object is
 * then allocated, its type resolved and initialised, the hooks parsed, the
 * transaction queued, and only then are the hooks registered. The labels at
 * the end undo these steps in reverse order.
 *
 * Returns 0 on success or a negative errno.
 */
static int nf_tables_newflowtable(struct sk_buff *skb,
				  const struct nfnl_info *info,
				  const struct nlattr * const nla[])
{
	struct netlink_ext_ack *extack = info->extack;
	struct nft_flowtable_hook flowtable_hook;
	u8 genmask = nft_genmask_next(info->net);
	u8 family = info->nfmsg->nfgen_family;
	const struct nf_flowtable_type *type;
	struct nft_flowtable *flowtable;
	struct net *net = info->net;
	struct nft_table *table;
	struct nft_trans *trans;
	struct nft_ctx ctx;
	int err;

	if (!nla[NFTA_FLOWTABLE_TABLE] ||
	    !nla[NFTA_FLOWTABLE_NAME] ||
	    !nla[NFTA_FLOWTABLE_HOOK])
		return -EINVAL;

	table = nft_table_lookup(net, nla[NFTA_FLOWTABLE_TABLE], family,
				 genmask, NETLINK_CB(skb).portid);
	if (IS_ERR(table)) {
		NL_SET_BAD_ATTR(extack, nla[NFTA_FLOWTABLE_TABLE]);
		return PTR_ERR(table);
	}

	flowtable = nft_flowtable_lookup(net, table, nla[NFTA_FLOWTABLE_NAME],
					 genmask);
	if (IS_ERR(flowtable)) {
		/* Only "not found" continues to the creation path. */
		err = PTR_ERR(flowtable);
		if (err != -ENOENT) {
			NL_SET_BAD_ATTR(extack, nla[NFTA_FLOWTABLE_NAME]);
			return err;
		}
	} else {
		if (info->nlh->nlmsg_flags & NLM_F_EXCL) {
			NL_SET_BAD_ATTR(extack, nla[NFTA_FLOWTABLE_NAME]);
			return -EEXIST;
		}

		nft_ctx_init(&ctx, net, skb, info->nlh, family, table, NULL, nla);

		return nft_flowtable_update(&ctx, info->nlh, flowtable, extack);
	}

	nft_ctx_init(&ctx, net, skb, info->nlh, family, table, NULL, nla);

	if (!nft_use_inc(&table->use))
		return -EMFILE;

	flowtable = kzalloc(sizeof(*flowtable), GFP_KERNEL_ACCOUNT);
	if (!flowtable) {
		err = -ENOMEM;
		goto flowtable_alloc;
	}

	flowtable->table = table;
	flowtable->handle = nf_tables_alloc_handle(table);
	INIT_LIST_HEAD(&flowtable->hook_list);

	flowtable->name = nla_strdup(nla[NFTA_FLOWTABLE_NAME], GFP_KERNEL_ACCOUNT);
	if (!flowtable->name) {
		err = -ENOMEM;
		goto err1;
	}

	/* On success this holds a reference on the type's owning module. */
	type = nft_flowtable_type_get(net, family);
	if (IS_ERR(type)) {
		err = PTR_ERR(type);
		goto err2;
	}

	if (nla[NFTA_FLOWTABLE_FLAGS]) {
		flowtable->data.flags =
			ntohl(nla_get_be32(nla[NFTA_FLOWTABLE_FLAGS]));
		if (flowtable->data.flags & ~NFT_FLOWTABLE_MASK) {
			err = -EOPNOTSUPP;
			goto err3;
		}
	}

	write_pnet(&flowtable->data.net, net);
	flowtable->data.type = type;
	err = type->init(&flowtable->data);
	if (err < 0)
		goto err3;

	err = nft_flowtable_parse_hook(&ctx, nla, &flowtable_hook, flowtable,
				       extack, true);
	if (err < 0)
		goto err_flowtable_parse_hooks;

	list_splice(&flowtable_hook.list, &flowtable->hook_list);
	flowtable->data.priority = flowtable_hook.priority;
	flowtable->hooknum = flowtable_hook.num;

	trans = nft_trans_flowtable_add(&ctx, NFT_MSG_NEWFLOWTABLE, flowtable);
	if (IS_ERR(trans)) {
		err = PTR_ERR(trans);
		goto err_flowtable_trans;
	}

	/* This must be LAST to ensure no packets are walking over this flowtable. */
	err = nft_register_flowtable_net_hooks(ctx.net, table,
					       &flowtable->hook_list,
					       flowtable);
	if (err < 0)
		goto err_flowtable_hooks;

	list_add_tail_rcu(&flowtable->list, &table->flowtables);

	return 0;

err_flowtable_hooks:
	nft_trans_destroy(trans);
err_flowtable_trans:
	nft_hooks_destroy(&flowtable->hook_list);
err_flowtable_parse_hooks:
	flowtable->data.type->free(&flowtable->data);
err3:
	module_put(type->owner);
err2:
	kfree(flowtable->name);
err1:
	kfree(flowtable);
flowtable_alloc:
	nft_use_dec_restore(&table->use);

	return err;
}
9318
nft_flowtable_hook_release(struct nft_flowtable_hook * flowtable_hook)9319 static void nft_flowtable_hook_release(struct nft_flowtable_hook *flowtable_hook)
9320 {
9321 struct nft_hook *this, *next;
9322
9323 list_for_each_entry_safe(this, next, &flowtable_hook->list, list) {
9324 list_del(&this->list);
9325 nft_netdev_hook_free(this);
9326 }
9327 }
9328
nft_delflowtable_hook(struct nft_ctx * ctx,struct nft_flowtable * flowtable,struct netlink_ext_ack * extack)9329 static int nft_delflowtable_hook(struct nft_ctx *ctx,
9330 struct nft_flowtable *flowtable,
9331 struct netlink_ext_ack *extack)
9332 {
9333 const struct nlattr * const *nla = ctx->nla;
9334 struct nft_flowtable_hook flowtable_hook;
9335 LIST_HEAD(flowtable_del_list);
9336 struct nft_hook *this, *hook;
9337 struct nft_trans *trans;
9338 int err;
9339
9340 err = nft_flowtable_parse_hook(ctx, nla, &flowtable_hook, flowtable,
9341 extack, false);
9342 if (err < 0)
9343 return err;
9344
9345 list_for_each_entry(this, &flowtable_hook.list, list) {
9346 hook = nft_hook_list_find(&flowtable->hook_list, this);
9347 if (!hook) {
9348 err = -ENOENT;
9349 goto err_flowtable_del_hook;
9350 }
9351 list_move(&hook->list, &flowtable_del_list);
9352 }
9353
9354 trans = nft_trans_alloc(ctx, NFT_MSG_DELFLOWTABLE,
9355 sizeof(struct nft_trans_flowtable));
9356 if (!trans) {
9357 err = -ENOMEM;
9358 goto err_flowtable_del_hook;
9359 }
9360
9361 nft_trans_flowtable(trans) = flowtable;
9362 nft_trans_flowtable_update(trans) = true;
9363 INIT_LIST_HEAD(&nft_trans_flowtable_hooks(trans));
9364 list_splice(&flowtable_del_list, &nft_trans_flowtable_hooks(trans));
9365 nft_flowtable_hook_release(&flowtable_hook);
9366
9367 nft_trans_commit_list_add_tail(ctx->net, trans);
9368
9369 return 0;
9370
9371 err_flowtable_del_hook:
9372 list_splice(&flowtable_del_list, &flowtable->hook_list);
9373 nft_flowtable_hook_release(&flowtable_hook);
9374
9375 return err;
9376 }
9377
nf_tables_delflowtable(struct sk_buff * skb,const struct nfnl_info * info,const struct nlattr * const nla[])9378 static int nf_tables_delflowtable(struct sk_buff *skb,
9379 const struct nfnl_info *info,
9380 const struct nlattr * const nla[])
9381 {
9382 struct netlink_ext_ack *extack = info->extack;
9383 u8 genmask = nft_genmask_next(info->net);
9384 u8 family = info->nfmsg->nfgen_family;
9385 struct nft_flowtable *flowtable;
9386 struct net *net = info->net;
9387 const struct nlattr *attr;
9388 struct nft_table *table;
9389 struct nft_ctx ctx;
9390
9391 if (!nla[NFTA_FLOWTABLE_TABLE] ||
9392 (!nla[NFTA_FLOWTABLE_NAME] &&
9393 !nla[NFTA_FLOWTABLE_HANDLE]))
9394 return -EINVAL;
9395
9396 table = nft_table_lookup(net, nla[NFTA_FLOWTABLE_TABLE], family,
9397 genmask, NETLINK_CB(skb).portid);
9398 if (IS_ERR(table)) {
9399 NL_SET_BAD_ATTR(extack, nla[NFTA_FLOWTABLE_TABLE]);
9400 return PTR_ERR(table);
9401 }
9402
9403 if (nla[NFTA_FLOWTABLE_HANDLE]) {
9404 attr = nla[NFTA_FLOWTABLE_HANDLE];
9405 flowtable = nft_flowtable_lookup_byhandle(table, attr, genmask);
9406 } else {
9407 attr = nla[NFTA_FLOWTABLE_NAME];
9408 flowtable = nft_flowtable_lookup(net, table, attr, genmask);
9409 }
9410
9411 if (IS_ERR(flowtable)) {
9412 if (PTR_ERR(flowtable) == -ENOENT &&
9413 NFNL_MSG_TYPE(info->nlh->nlmsg_type) == NFT_MSG_DESTROYFLOWTABLE)
9414 return 0;
9415
9416 NL_SET_BAD_ATTR(extack, attr);
9417 return PTR_ERR(flowtable);
9418 }
9419
9420 nft_ctx_init(&ctx, net, skb, info->nlh, family, table, NULL, nla);
9421
9422 if (nla[NFTA_FLOWTABLE_HOOK])
9423 return nft_delflowtable_hook(&ctx, flowtable, extack);
9424
9425 if (flowtable->use > 0) {
9426 NL_SET_BAD_ATTR(extack, attr);
9427 return -EBUSY;
9428 }
9429
9430 return nft_delflowtable(&ctx, flowtable);
9431 }
9432
/*
 * Build one flowtable netlink message in @skb.
 *
 * The message always carries the table name, the flowtable name and the
 * handle.  For NFT_MSG_DELFLOWTABLE / NFT_MSG_DESTROYFLOWTABLE events without
 * an explicit @hook_list nothing else is emitted.  In every other case the
 * use counter, the flags and a nested NFTA_FLOWTABLE_HOOK attribute (hook
 * number, priority and the device list) follow.  Devices are taken from
 * @hook_list, or from flowtable->hook_list when @hook_list is NULL.
 *
 * Returns 0 on success.  If the header or any attribute cannot be added, the
 * partially built message is trimmed from @skb and -EMSGSIZE is returned.
 * This matches nf_tables_fill_gen_info() and gives callers that forward the
 * value to userspace a meaningful errno; a bare -1 would read as -EPERM.
 */
static int nf_tables_fill_flowtable_info(struct sk_buff *skb, struct net *net,
					 u32 portid, u32 seq, int event,
					 u32 flags, int family,
					 struct nft_flowtable *flowtable,
					 struct list_head *hook_list)
{
	struct nlattr *nest, *nest_devs;
	struct nft_hook *hook;
	struct nlmsghdr *nlh;

	nlh = nfnl_msg_put(skb, portid, seq,
			   nfnl_msg_type(NFNL_SUBSYS_NFTABLES, event),
			   flags, family, NFNETLINK_V0, nft_base_seq(net));
	if (!nlh)
		goto nla_put_failure;

	if (nla_put_string(skb, NFTA_FLOWTABLE_TABLE, flowtable->table->name) ||
	    nla_put_string(skb, NFTA_FLOWTABLE_NAME, flowtable->name) ||
	    nla_put_be64(skb, NFTA_FLOWTABLE_HANDLE, cpu_to_be64(flowtable->handle),
			 NFTA_FLOWTABLE_PAD))
		goto nla_put_failure;

	/* whole-flowtable delete/destroy events stop after the identifiers */
	if (!hook_list &&
	    (event == NFT_MSG_DELFLOWTABLE ||
	     event == NFT_MSG_DESTROYFLOWTABLE)) {
		nlmsg_end(skb, nlh);
		return 0;
	}

	if (nla_put_be32(skb, NFTA_FLOWTABLE_USE, htonl(flowtable->use)) ||
	    nla_put_be32(skb, NFTA_FLOWTABLE_FLAGS, htonl(flowtable->data.flags)))
		goto nla_put_failure;

	nest = nla_nest_start_noflag(skb, NFTA_FLOWTABLE_HOOK);
	if (!nest)
		goto nla_put_failure;
	if (nla_put_be32(skb, NFTA_FLOWTABLE_HOOK_NUM, htonl(flowtable->hooknum)) ||
	    nla_put_be32(skb, NFTA_FLOWTABLE_HOOK_PRIORITY, htonl(flowtable->data.priority)))
		goto nla_put_failure;

	nest_devs = nla_nest_start_noflag(skb, NFTA_FLOWTABLE_HOOK_DEVS);
	if (!nest_devs)
		goto nla_put_failure;

	/* no explicit list given: report all hooks of the flowtable */
	if (!hook_list)
		hook_list = &flowtable->hook_list;

	list_for_each_entry_rcu(hook, hook_list, list,
				lockdep_commit_lock_is_held(net)) {
		if (nft_nla_put_hook_dev(skb, hook))
			goto nla_put_failure;
	}
	nla_nest_end(skb, nest_devs);
	nla_nest_end(skb, nest);

	nlmsg_end(skb, nlh);
	return 0;

nla_put_failure:
	nlmsg_trim(skb, nlh);
	return -EMSGSIZE;
}
9495
/*
 * Optional filter for flowtable dumps.  nf_tables_dump_flowtable_start()
 * allocates it and stores it in cb->data; nf_tables_dump_flowtable_done()
 * frees it.
 */
struct nft_flowtable_filter {
	char		*table;	/* table name; only flowtables of this table are dumped */
};
9499
nf_tables_dump_flowtable(struct sk_buff * skb,struct netlink_callback * cb)9500 static int nf_tables_dump_flowtable(struct sk_buff *skb,
9501 struct netlink_callback *cb)
9502 {
9503 const struct nfgenmsg *nfmsg = nlmsg_data(cb->nlh);
9504 struct nft_flowtable_filter *filter = cb->data;
9505 unsigned int idx = 0, s_idx = cb->args[0];
9506 struct net *net = sock_net(skb->sk);
9507 int family = nfmsg->nfgen_family;
9508 struct nft_flowtable *flowtable;
9509 struct nftables_pernet *nft_net;
9510 const struct nft_table *table;
9511
9512 rcu_read_lock();
9513 nft_net = nft_pernet(net);
9514 cb->seq = READ_ONCE(nft_net->base_seq);
9515
9516 list_for_each_entry_rcu(table, &nft_net->tables, list) {
9517 if (family != NFPROTO_UNSPEC && family != table->family)
9518 continue;
9519
9520 list_for_each_entry_rcu(flowtable, &table->flowtables, list) {
9521 if (!nft_is_active(net, flowtable))
9522 goto cont;
9523 if (idx < s_idx)
9524 goto cont;
9525 if (idx > s_idx)
9526 memset(&cb->args[1], 0,
9527 sizeof(cb->args) - sizeof(cb->args[0]));
9528 if (filter && filter->table &&
9529 strcmp(filter->table, table->name))
9530 goto cont;
9531
9532 if (nf_tables_fill_flowtable_info(skb, net, NETLINK_CB(cb->skb).portid,
9533 cb->nlh->nlmsg_seq,
9534 NFT_MSG_NEWFLOWTABLE,
9535 NLM_F_MULTI | NLM_F_APPEND,
9536 table->family,
9537 flowtable, NULL) < 0)
9538 goto done;
9539
9540 nl_dump_check_consistent(cb, nlmsg_hdr(skb));
9541 cont:
9542 idx++;
9543 }
9544 }
9545 done:
9546 rcu_read_unlock();
9547
9548 cb->args[0] = idx;
9549 return skb->len;
9550 }
9551
nf_tables_dump_flowtable_start(struct netlink_callback * cb)9552 static int nf_tables_dump_flowtable_start(struct netlink_callback *cb)
9553 {
9554 const struct nlattr * const *nla = cb->data;
9555 struct nft_flowtable_filter *filter = NULL;
9556
9557 if (nla[NFTA_FLOWTABLE_TABLE]) {
9558 filter = kzalloc(sizeof(*filter), GFP_ATOMIC);
9559 if (!filter)
9560 return -ENOMEM;
9561
9562 filter->table = nla_strdup(nla[NFTA_FLOWTABLE_TABLE],
9563 GFP_ATOMIC);
9564 if (!filter->table) {
9565 kfree(filter);
9566 return -ENOMEM;
9567 }
9568 }
9569
9570 cb->data = filter;
9571 return 0;
9572 }
9573
nf_tables_dump_flowtable_done(struct netlink_callback * cb)9574 static int nf_tables_dump_flowtable_done(struct netlink_callback *cb)
9575 {
9576 struct nft_flowtable_filter *filter = cb->data;
9577
9578 if (!filter)
9579 return 0;
9580
9581 kfree(filter->table);
9582 kfree(filter);
9583
9584 return 0;
9585 }
9586
9587 /* called with rcu_read_lock held */
nf_tables_getflowtable(struct sk_buff * skb,const struct nfnl_info * info,const struct nlattr * const nla[])9588 static int nf_tables_getflowtable(struct sk_buff *skb,
9589 const struct nfnl_info *info,
9590 const struct nlattr * const nla[])
9591 {
9592 struct netlink_ext_ack *extack = info->extack;
9593 u8 genmask = nft_genmask_cur(info->net);
9594 u8 family = info->nfmsg->nfgen_family;
9595 struct nft_flowtable *flowtable;
9596 const struct nft_table *table;
9597 struct net *net = info->net;
9598 struct sk_buff *skb2;
9599 int err;
9600
9601 if (info->nlh->nlmsg_flags & NLM_F_DUMP) {
9602 struct netlink_dump_control c = {
9603 .start = nf_tables_dump_flowtable_start,
9604 .dump = nf_tables_dump_flowtable,
9605 .done = nf_tables_dump_flowtable_done,
9606 .module = THIS_MODULE,
9607 .data = (void *)nla,
9608 };
9609
9610 return nft_netlink_dump_start_rcu(info->sk, skb, info->nlh, &c);
9611 }
9612
9613 if (!nla[NFTA_FLOWTABLE_NAME])
9614 return -EINVAL;
9615
9616 table = nft_table_lookup(net, nla[NFTA_FLOWTABLE_TABLE], family,
9617 genmask, 0);
9618 if (IS_ERR(table)) {
9619 NL_SET_BAD_ATTR(extack, nla[NFTA_FLOWTABLE_TABLE]);
9620 return PTR_ERR(table);
9621 }
9622
9623 flowtable = nft_flowtable_lookup(net, table, nla[NFTA_FLOWTABLE_NAME],
9624 genmask);
9625 if (IS_ERR(flowtable)) {
9626 NL_SET_BAD_ATTR(extack, nla[NFTA_FLOWTABLE_NAME]);
9627 return PTR_ERR(flowtable);
9628 }
9629
9630 skb2 = alloc_skb(NLMSG_GOODSIZE, GFP_ATOMIC);
9631 if (!skb2)
9632 return -ENOMEM;
9633
9634 err = nf_tables_fill_flowtable_info(skb2, net, NETLINK_CB(skb).portid,
9635 info->nlh->nlmsg_seq,
9636 NFT_MSG_NEWFLOWTABLE, 0, family,
9637 flowtable, NULL);
9638 if (err < 0)
9639 goto err_fill_flowtable_info;
9640
9641 return nfnetlink_unicast(skb2, net, NETLINK_CB(skb).portid);
9642
9643 err_fill_flowtable_info:
9644 kfree_skb(skb2);
9645 return err;
9646 }
9647
nf_tables_flowtable_notify(struct nft_ctx * ctx,struct nft_flowtable * flowtable,struct list_head * hook_list,int event)9648 static void nf_tables_flowtable_notify(struct nft_ctx *ctx,
9649 struct nft_flowtable *flowtable,
9650 struct list_head *hook_list, int event)
9651 {
9652 struct nftables_pernet *nft_net = nft_pernet(ctx->net);
9653 struct sk_buff *skb;
9654 u16 flags = 0;
9655 int err;
9656
9657 if (!ctx->report &&
9658 !nfnetlink_has_listeners(ctx->net, NFNLGRP_NFTABLES))
9659 return;
9660
9661 skb = nlmsg_new(NLMSG_GOODSIZE, GFP_KERNEL);
9662 if (skb == NULL)
9663 goto err;
9664
9665 if (ctx->flags & (NLM_F_CREATE | NLM_F_EXCL))
9666 flags |= ctx->flags & (NLM_F_CREATE | NLM_F_EXCL);
9667
9668 err = nf_tables_fill_flowtable_info(skb, ctx->net, ctx->portid,
9669 ctx->seq, event, flags,
9670 ctx->family, flowtable, hook_list);
9671 if (err < 0) {
9672 kfree_skb(skb);
9673 goto err;
9674 }
9675
9676 nft_notify_enqueue(skb, ctx->report, &nft_net->notify_list);
9677 return;
9678 err:
9679 nfnetlink_set_err(ctx->net, ctx->portid, NFNLGRP_NFTABLES, -ENOBUFS);
9680 }
9681
nf_tables_flowtable_destroy(struct nft_flowtable * flowtable)9682 static void nf_tables_flowtable_destroy(struct nft_flowtable *flowtable)
9683 {
9684 struct nft_hook *hook, *next;
9685
9686 flowtable->data.type->free(&flowtable->data);
9687 list_for_each_entry_safe(hook, next, &flowtable->hook_list, list) {
9688 list_del_rcu(&hook->list);
9689 nft_netdev_hook_free_rcu(hook);
9690 }
9691 kfree(flowtable->name);
9692 module_put(flowtable->data.type->owner);
9693 kfree(flowtable);
9694 }
9695
/*
 * Build an NFT_MSG_NEWGEN message in @skb carrying the generation id
 * (nft_net->base_seq) plus the pid and command name of the current task.
 *
 * Returns 0 on success; on failure the partial message is trimmed and
 * -EMSGSIZE is returned.
 */
static int nf_tables_fill_gen_info(struct sk_buff *skb, struct net *net,
				   u32 portid, u32 seq)
{
	struct nftables_pernet *nft_net = nft_pernet(net);
	int event = nfnl_msg_type(NFNL_SUBSYS_NFTABLES, NFT_MSG_NEWGEN);
	char comm[TASK_COMM_LEN];
	struct nlmsghdr *nlh;

	nlh = nfnl_msg_put(skb, portid, seq, event, 0, AF_UNSPEC,
			   NFNETLINK_V0, nft_base_seq(net));
	if (!nlh)
		goto nla_put_failure;

	if (nla_put_be32(skb, NFTA_GEN_ID, htonl(nft_net->base_seq)))
		goto nla_put_failure;

	if (nla_put_be32(skb, NFTA_GEN_PROC_PID, htonl(task_pid_nr(current))))
		goto nla_put_failure;

	if (nla_put_string(skb, NFTA_GEN_PROC_NAME,
			   get_task_comm(comm, current)))
		goto nla_put_failure;

	nlmsg_end(skb, nlh);
	return 0;

nla_put_failure:
	nlmsg_trim(skb, nlh);
	return -EMSGSIZE;
}
9721
nft_hook_find_ops(const struct nft_hook * hook,const struct net_device * dev)9722 struct nf_hook_ops *nft_hook_find_ops(const struct nft_hook *hook,
9723 const struct net_device *dev)
9724 {
9725 struct nf_hook_ops *ops;
9726
9727 list_for_each_entry(ops, &hook->ops_list, list) {
9728 if (ops->dev == dev)
9729 return ops;
9730 }
9731 return NULL;
9732 }
9733 EXPORT_SYMBOL_GPL(nft_hook_find_ops);
9734
nft_hook_find_ops_rcu(const struct nft_hook * hook,const struct net_device * dev)9735 struct nf_hook_ops *nft_hook_find_ops_rcu(const struct nft_hook *hook,
9736 const struct net_device *dev)
9737 {
9738 struct nf_hook_ops *ops;
9739
9740 list_for_each_entry_rcu(ops, &hook->ops_list, list) {
9741 if (ops->dev == dev)
9742 return ops;
9743 }
9744 return NULL;
9745 }
9746 EXPORT_SYMBOL_GPL(nft_hook_find_ops_rcu);
9747
/*
 * Apply a netdevice @event for @dev to one @flowtable.
 *
 * The flowtable's hooks are scanned in order.  A hook for which the event is
 * a no-op is skipped with "continue"; the first hook that is actually acted
 * upon ends the scan (see the "break" after the switch).  Events other than
 * NETDEV_REGISTER / NETDEV_UNREGISTER match no case and therefore also end
 * the scan at the first hook without doing anything.
 *
 * @changename is true when the caller is processing a device rename; it
 * alters the skip conditions of both cases below.
 *
 * Returns 0 on success and 1 if allocating or registering the new hook ops
 * fails.
 */
static int nft_flowtable_event(unsigned long event, struct net_device *dev,
			       struct nft_flowtable *flowtable, bool changename)
{
	struct nf_hook_ops *ops;
	struct nft_hook *hook;
	bool match;

	list_for_each_entry(hook, &flowtable->hook_list, list) {
		/* ops: existing registration of @dev on this hook, if any */
		ops = nft_hook_find_ops(hook, dev);
		/* match: first hook->ifnamelen bytes of the names are equal */
		match = !strncmp(hook->ifname, dev->name, hook->ifnamelen);

		switch (event) {
		case NETDEV_UNREGISTER:
			/* NOP if not found or new name still matching */
			if (!ops || (changename && match))
				continue;

			/* flow_offload_netdev_event() cleans up entries for us. */
			nft_unregister_flowtable_ops(dev_net(dev),
						     flowtable, ops);
			list_del_rcu(&ops->list);
			kfree_rcu(ops, rcu);
			break;
		case NETDEV_REGISTER:
			/* NOP if not matching or already registered */
			if (!match || (changename && ops))
				continue;

			ops = kzalloc(sizeof(struct nf_hook_ops),
				      GFP_KERNEL_ACCOUNT);
			if (!ops)
				return 1;

			ops->pf		= NFPROTO_NETDEV;
			ops->hooknum	= flowtable->hooknum;
			ops->priority	= flowtable->data.priority;
			ops->priv	= &flowtable->data;
			ops->hook	= flowtable->data.type->hook;
			ops->hook_ops_type = NF_HOOK_OP_NFT_FT;
			ops->dev	= dev;
			if (nft_register_flowtable_ops(dev_net(dev),
						       flowtable, ops)) {
				/* never linked into ops_list, plain kfree suffices */
				kfree(ops);
				return 1;
			}
			list_add_tail_rcu(&ops->list, &hook->ops_list);
			break;
		}
		/* a hook was handled (or the event is not ours): stop scanning */
		break;
	}
	return 0;
}
9800
/*
 * Run nft_flowtable_event() for every flowtable of every table in the
 * network namespace of @dev.
 *
 * Returns 1 as soon as one flowtable reports failure, 0 otherwise.
 */
static int __nf_tables_flowtable_event(unsigned long event,
				       struct net_device *dev,
				       bool changename)
{
	struct nftables_pernet *nft_net = nft_pernet(dev_net(dev));
	struct nft_flowtable *ft;
	struct nft_table *tbl;

	list_for_each_entry(tbl, &nft_net->tables, list) {
		list_for_each_entry(ft, &tbl->flowtables, list) {
			if (!nft_flowtable_event(event, dev, ft, changename))
				continue;

			return 1;
		}
	}

	return 0;
}
9818
nf_tables_flowtable_event(struct notifier_block * this,unsigned long event,void * ptr)9819 static int nf_tables_flowtable_event(struct notifier_block *this,
9820 unsigned long event, void *ptr)
9821 {
9822 struct net_device *dev = netdev_notifier_info_to_dev(ptr);
9823 struct nftables_pernet *nft_net;
9824 int ret = NOTIFY_DONE;
9825 struct net *net;
9826
9827 if (event != NETDEV_REGISTER &&
9828 event != NETDEV_UNREGISTER &&
9829 event != NETDEV_CHANGENAME)
9830 return NOTIFY_DONE;
9831
9832 net = dev_net(dev);
9833 nft_net = nft_pernet(net);
9834 mutex_lock(&nft_net->commit_mutex);
9835
9836 if (event == NETDEV_CHANGENAME) {
9837 if (__nf_tables_flowtable_event(NETDEV_REGISTER, dev, true)) {
9838 ret = NOTIFY_BAD;
9839 goto out_unlock;
9840 }
9841 __nf_tables_flowtable_event(NETDEV_UNREGISTER, dev, true);
9842 } else if (__nf_tables_flowtable_event(event, dev, false)) {
9843 ret = NOTIFY_BAD;
9844 }
9845 out_unlock:
9846 mutex_unlock(&nft_net->commit_mutex);
9847 return ret;
9848 }
9849
/* Notifier block whose callback is nf_tables_flowtable_event(). */
static struct notifier_block nf_tables_flowtable_notifier = {
	.notifier_call	= nf_tables_flowtable_event,
};
9853
nf_tables_gen_notify(struct net * net,struct sk_buff * skb,int event)9854 static void nf_tables_gen_notify(struct net *net, struct sk_buff *skb,
9855 int event)
9856 {
9857 struct nlmsghdr *nlh = nlmsg_hdr(skb);
9858 struct sk_buff *skb2;
9859 int err;
9860
9861 if (!nlmsg_report(nlh) &&
9862 !nfnetlink_has_listeners(net, NFNLGRP_NFTABLES))
9863 return;
9864
9865 skb2 = nlmsg_new(NLMSG_GOODSIZE, GFP_KERNEL);
9866 if (skb2 == NULL)
9867 goto err;
9868
9869 err = nf_tables_fill_gen_info(skb2, net, NETLINK_CB(skb).portid,
9870 nlh->nlmsg_seq);
9871 if (err < 0) {
9872 kfree_skb(skb2);
9873 goto err;
9874 }
9875
9876 nfnetlink_send(skb2, net, NETLINK_CB(skb).portid, NFNLGRP_NFTABLES,
9877 nlmsg_report(nlh), GFP_KERNEL);
9878 return;
9879 err:
9880 nfnetlink_set_err(net, NETLINK_CB(skb).portid, NFNLGRP_NFTABLES,
9881 -ENOBUFS);
9882 }
9883
nf_tables_getgen(struct sk_buff * skb,const struct nfnl_info * info,const struct nlattr * const nla[])9884 static int nf_tables_getgen(struct sk_buff *skb, const struct nfnl_info *info,
9885 const struct nlattr * const nla[])
9886 {
9887 struct sk_buff *skb2;
9888 int err;
9889
9890 skb2 = alloc_skb(NLMSG_GOODSIZE, GFP_ATOMIC);
9891 if (skb2 == NULL)
9892 return -ENOMEM;
9893
9894 err = nf_tables_fill_gen_info(skb2, info->net, NETLINK_CB(skb).portid,
9895 info->nlh->nlmsg_seq);
9896 if (err < 0)
9897 goto err_fill_gen_info;
9898
9899 return nfnetlink_unicast(skb2, info->net, NETLINK_CB(skb).portid);
9900
9901 err_fill_gen_info:
9902 kfree_skb(skb2);
9903 return err;
9904 }
9905
/*
 * nfnetlink callback table, indexed by NFT_MSG_* message type.
 *
 * Every NEW/DEL/DESTROY message is registered as NFNL_CB_BATCH and every
 * GET (including the *_RESET variants) as NFNL_CB_RCU.  The DESTROY variant
 * of each object shares its handler with the corresponding DEL message.
 * Apart from NFT_MSG_GETGEN, each entry also names the attribute count and
 * the policy for its attributes.
 */
static const struct nfnl_callback nf_tables_cb[NFT_MSG_MAX] = {
	/* tables */
	[NFT_MSG_NEWTABLE] = {
		.call		= nf_tables_newtable,
		.type		= NFNL_CB_BATCH,
		.attr_count	= NFTA_TABLE_MAX,
		.policy		= nft_table_policy,
	},
	[NFT_MSG_GETTABLE] = {
		.call		= nf_tables_gettable,
		.type		= NFNL_CB_RCU,
		.attr_count	= NFTA_TABLE_MAX,
		.policy		= nft_table_policy,
	},
	[NFT_MSG_DELTABLE] = {
		.call		= nf_tables_deltable,
		.type		= NFNL_CB_BATCH,
		.attr_count	= NFTA_TABLE_MAX,
		.policy		= nft_table_policy,
	},
	[NFT_MSG_DESTROYTABLE] = {
		.call		= nf_tables_deltable,
		.type		= NFNL_CB_BATCH,
		.attr_count	= NFTA_TABLE_MAX,
		.policy		= nft_table_policy,
	},
	/* chains */
	[NFT_MSG_NEWCHAIN] = {
		.call		= nf_tables_newchain,
		.type		= NFNL_CB_BATCH,
		.attr_count	= NFTA_CHAIN_MAX,
		.policy		= nft_chain_policy,
	},
	[NFT_MSG_GETCHAIN] = {
		.call		= nf_tables_getchain,
		.type		= NFNL_CB_RCU,
		.attr_count	= NFTA_CHAIN_MAX,
		.policy		= nft_chain_policy,
	},
	[NFT_MSG_DELCHAIN] = {
		.call		= nf_tables_delchain,
		.type		= NFNL_CB_BATCH,
		.attr_count	= NFTA_CHAIN_MAX,
		.policy		= nft_chain_policy,
	},
	[NFT_MSG_DESTROYCHAIN] = {
		.call		= nf_tables_delchain,
		.type		= NFNL_CB_BATCH,
		.attr_count	= NFTA_CHAIN_MAX,
		.policy		= nft_chain_policy,
	},
	/* rules */
	[NFT_MSG_NEWRULE] = {
		.call		= nf_tables_newrule,
		.type		= NFNL_CB_BATCH,
		.attr_count	= NFTA_RULE_MAX,
		.policy		= nft_rule_policy,
	},
	[NFT_MSG_GETRULE] = {
		.call		= nf_tables_getrule,
		.type		= NFNL_CB_RCU,
		.attr_count	= NFTA_RULE_MAX,
		.policy		= nft_rule_policy,
	},
	[NFT_MSG_GETRULE_RESET] = {
		.call		= nf_tables_getrule_reset,
		.type		= NFNL_CB_RCU,
		.attr_count	= NFTA_RULE_MAX,
		.policy		= nft_rule_policy,
	},
	[NFT_MSG_DELRULE] = {
		.call		= nf_tables_delrule,
		.type		= NFNL_CB_BATCH,
		.attr_count	= NFTA_RULE_MAX,
		.policy		= nft_rule_policy,
	},
	[NFT_MSG_DESTROYRULE] = {
		.call		= nf_tables_delrule,
		.type		= NFNL_CB_BATCH,
		.attr_count	= NFTA_RULE_MAX,
		.policy		= nft_rule_policy,
	},
	/* sets */
	[NFT_MSG_NEWSET] = {
		.call		= nf_tables_newset,
		.type		= NFNL_CB_BATCH,
		.attr_count	= NFTA_SET_MAX,
		.policy		= nft_set_policy,
	},
	[NFT_MSG_GETSET] = {
		.call		= nf_tables_getset,
		.type		= NFNL_CB_RCU,
		.attr_count	= NFTA_SET_MAX,
		.policy		= nft_set_policy,
	},
	[NFT_MSG_DELSET] = {
		.call		= nf_tables_delset,
		.type		= NFNL_CB_BATCH,
		.attr_count	= NFTA_SET_MAX,
		.policy		= nft_set_policy,
	},
	[NFT_MSG_DESTROYSET] = {
		.call		= nf_tables_delset,
		.type		= NFNL_CB_BATCH,
		.attr_count	= NFTA_SET_MAX,
		.policy		= nft_set_policy,
	},
	/* set elements */
	[NFT_MSG_NEWSETELEM] = {
		.call		= nf_tables_newsetelem,
		.type		= NFNL_CB_BATCH,
		.attr_count	= NFTA_SET_ELEM_LIST_MAX,
		.policy		= nft_set_elem_list_policy,
	},
	[NFT_MSG_GETSETELEM] = {
		.call		= nf_tables_getsetelem,
		.type		= NFNL_CB_RCU,
		.attr_count	= NFTA_SET_ELEM_LIST_MAX,
		.policy		= nft_set_elem_list_policy,
	},
	[NFT_MSG_GETSETELEM_RESET] = {
		.call		= nf_tables_getsetelem_reset,
		.type		= NFNL_CB_RCU,
		.attr_count	= NFTA_SET_ELEM_LIST_MAX,
		.policy		= nft_set_elem_list_policy,
	},
	[NFT_MSG_DELSETELEM] = {
		.call		= nf_tables_delsetelem,
		.type		= NFNL_CB_BATCH,
		.attr_count	= NFTA_SET_ELEM_LIST_MAX,
		.policy		= nft_set_elem_list_policy,
	},
	[NFT_MSG_DESTROYSETELEM] = {
		.call		= nf_tables_delsetelem,
		.type		= NFNL_CB_BATCH,
		.attr_count	= NFTA_SET_ELEM_LIST_MAX,
		.policy		= nft_set_elem_list_policy,
	},
	/* generation; no attributes are declared for this message */
	[NFT_MSG_GETGEN] = {
		.call		= nf_tables_getgen,
		.type		= NFNL_CB_RCU,
	},
	/* stateful objects */
	[NFT_MSG_NEWOBJ] = {
		.call		= nf_tables_newobj,
		.type		= NFNL_CB_BATCH,
		.attr_count	= NFTA_OBJ_MAX,
		.policy		= nft_obj_policy,
	},
	[NFT_MSG_GETOBJ] = {
		.call		= nf_tables_getobj,
		.type		= NFNL_CB_RCU,
		.attr_count	= NFTA_OBJ_MAX,
		.policy		= nft_obj_policy,
	},
	[NFT_MSG_DELOBJ] = {
		.call		= nf_tables_delobj,
		.type		= NFNL_CB_BATCH,
		.attr_count	= NFTA_OBJ_MAX,
		.policy		= nft_obj_policy,
	},
	[NFT_MSG_DESTROYOBJ] = {
		.call		= nf_tables_delobj,
		.type		= NFNL_CB_BATCH,
		.attr_count	= NFTA_OBJ_MAX,
		.policy		= nft_obj_policy,
	},
	[NFT_MSG_GETOBJ_RESET] = {
		.call		= nf_tables_getobj_reset,
		.type		= NFNL_CB_RCU,
		.attr_count	= NFTA_OBJ_MAX,
		.policy		= nft_obj_policy,
	},
	/* flowtables */
	[NFT_MSG_NEWFLOWTABLE] = {
		.call		= nf_tables_newflowtable,
		.type		= NFNL_CB_BATCH,
		.attr_count	= NFTA_FLOWTABLE_MAX,
		.policy		= nft_flowtable_policy,
	},
	[NFT_MSG_GETFLOWTABLE] = {
		.call		= nf_tables_getflowtable,
		.type		= NFNL_CB_RCU,
		.attr_count	= NFTA_FLOWTABLE_MAX,
		.policy		= nft_flowtable_policy,
	},
	[NFT_MSG_DELFLOWTABLE] = {
		.call		= nf_tables_delflowtable,
		.type		= NFNL_CB_BATCH,
		.attr_count	= NFTA_FLOWTABLE_MAX,
		.policy		= nft_flowtable_policy,
	},
	[NFT_MSG_DESTROYFLOWTABLE] = {
		.call		= nf_tables_delflowtable,
		.type		= NFNL_CB_BATCH,
		.attr_count	= NFTA_FLOWTABLE_MAX,
		.policy		= nft_flowtable_policy,
	},
};
10098
nf_tables_validate(struct net * net)10099 static int nf_tables_validate(struct net *net)
10100 {
10101 struct nftables_pernet *nft_net = nft_pernet(net);
10102 struct nft_table *table;
10103
10104 list_for_each_entry(table, &nft_net->tables, list) {
10105 switch (table->validate_state) {
10106 case NFT_VALIDATE_SKIP:
10107 continue;
10108 case NFT_VALIDATE_NEED:
10109 nft_validate_state_update(table, NFT_VALIDATE_DO);
10110 fallthrough;
10111 case NFT_VALIDATE_DO:
10112 if (nft_table_validate(net, table) < 0)
10113 return -EAGAIN;
10114
10115 nft_validate_state_update(table, NFT_VALIDATE_SKIP);
10116 break;
10117 }
10118 }
10119
10120 return 0;
10121 }
10122
10123 /* a drop policy has to be deferred until all rules have been activated,
10124 * otherwise a large ruleset that contains a drop-policy base chain will
10125 * cause all packets to get dropped until the full transaction has been
10126 * processed.
10127 *
10128 * We defer the drop policy until the transaction has been finalized.
10129 */
nft_chain_commit_drop_policy(struct nft_trans_chain * trans)10130 static void nft_chain_commit_drop_policy(struct nft_trans_chain *trans)
10131 {
10132 struct nft_base_chain *basechain;
10133
10134 if (trans->policy != NF_DROP)
10135 return;
10136
10137 if (!nft_is_base_chain(trans->chain))
10138 return;
10139
10140 basechain = nft_base_chain(trans->chain);
10141 basechain->policy = NF_DROP;
10142 }
10143
nft_chain_commit_update(struct nft_trans_chain * trans)10144 static void nft_chain_commit_update(struct nft_trans_chain *trans)
10145 {
10146 struct nft_table *table = trans->nft_trans_binding.nft_trans.table;
10147 struct nft_base_chain *basechain;
10148
10149 if (trans->name) {
10150 rhltable_remove(&table->chains_ht,
10151 &trans->chain->rhlhead,
10152 nft_chain_ht_params);
10153 swap(trans->chain->name, trans->name);
10154 rhltable_insert_key(&table->chains_ht,
10155 trans->chain->name,
10156 &trans->chain->rhlhead,
10157 nft_chain_ht_params);
10158 }
10159
10160 if (!nft_is_base_chain(trans->chain))
10161 return;
10162
10163 nft_chain_stats_replace(trans);
10164
10165 basechain = nft_base_chain(trans->chain);
10166
10167 switch (trans->policy) {
10168 case NF_DROP:
10169 case NF_ACCEPT:
10170 basechain->policy = trans->policy;
10171 break;
10172 }
10173 }
10174
nft_obj_commit_update(const struct nft_ctx * ctx,struct nft_trans * trans)10175 static void nft_obj_commit_update(const struct nft_ctx *ctx,
10176 struct nft_trans *trans)
10177 {
10178 struct nft_object *newobj;
10179 struct nft_object *obj;
10180
10181 obj = nft_trans_obj(trans);
10182 newobj = nft_trans_obj_newobj(trans);
10183
10184 if (WARN_ON_ONCE(!obj->ops->update))
10185 return;
10186
10187 obj->ops->update(obj, newobj);
10188 nft_obj_destroy(ctx, newobj);
10189 }
10190
nft_commit_release(struct nft_trans * trans)10191 static void nft_commit_release(struct nft_trans *trans)
10192 {
10193 struct nft_ctx ctx = {
10194 .net = trans->net,
10195 };
10196
10197 nft_ctx_update(&ctx, trans);
10198
10199 switch (trans->msg_type) {
10200 case NFT_MSG_DELTABLE:
10201 case NFT_MSG_DESTROYTABLE:
10202 nf_tables_table_destroy(trans->table);
10203 break;
10204 case NFT_MSG_NEWCHAIN:
10205 free_percpu(nft_trans_chain_stats(trans));
10206 kfree(nft_trans_chain_name(trans));
10207 break;
10208 case NFT_MSG_DELCHAIN:
10209 case NFT_MSG_DESTROYCHAIN:
10210 if (nft_trans_chain_update(trans))
10211 nft_hooks_destroy(&nft_trans_chain_hooks(trans));
10212 else
10213 nf_tables_chain_destroy(nft_trans_chain(trans));
10214 break;
10215 case NFT_MSG_DELRULE:
10216 case NFT_MSG_DESTROYRULE:
10217 nf_tables_rule_destroy(&ctx, nft_trans_rule(trans));
10218 break;
10219 case NFT_MSG_DELSET:
10220 case NFT_MSG_DESTROYSET:
10221 nft_set_destroy(&ctx, nft_trans_set(trans));
10222 break;
10223 case NFT_MSG_DELSETELEM:
10224 case NFT_MSG_DESTROYSETELEM:
10225 nft_trans_elems_destroy(&ctx, nft_trans_container_elem(trans));
10226 break;
10227 case NFT_MSG_DELOBJ:
10228 case NFT_MSG_DESTROYOBJ:
10229 nft_obj_destroy(&ctx, nft_trans_obj(trans));
10230 break;
10231 case NFT_MSG_DELFLOWTABLE:
10232 case NFT_MSG_DESTROYFLOWTABLE:
10233 if (nft_trans_flowtable_update(trans))
10234 nft_hooks_destroy(&nft_trans_flowtable_hooks(trans));
10235 else
10236 nf_tables_flowtable_destroy(nft_trans_flowtable(trans));
10237 break;
10238 }
10239
10240 if (trans->put_net)
10241 put_net(trans->net);
10242
10243 kfree(trans);
10244 }
10245
nf_tables_trans_destroy_work(struct work_struct * w)10246 static void nf_tables_trans_destroy_work(struct work_struct *w)
10247 {
10248 struct nftables_pernet *nft_net = container_of(w, struct nftables_pernet, destroy_work);
10249 struct nft_trans *trans, *next;
10250 LIST_HEAD(head);
10251
10252 spin_lock(&nf_tables_destroy_list_lock);
10253 list_splice_init(&nft_net->destroy_list, &head);
10254 spin_unlock(&nf_tables_destroy_list_lock);
10255
10256 if (list_empty(&head))
10257 return;
10258
10259 synchronize_rcu();
10260
10261 list_for_each_entry_safe(trans, next, &head, list) {
10262 nft_trans_list_del(trans);
10263 nft_commit_release(trans);
10264 }
10265 }
10266
nf_tables_trans_destroy_flush_work(struct net * net)10267 void nf_tables_trans_destroy_flush_work(struct net *net)
10268 {
10269 struct nftables_pernet *nft_net = nft_pernet(net);
10270
10271 flush_work(&nft_net->destroy_work);
10272 }
10273 EXPORT_SYMBOL_GPL(nf_tables_trans_destroy_flush_work);
10274
/*
 * Reduction check used by nf_tables_commit_chain_prepare() while copying
 * expressions into a rule blob.  This implementation never reduces anything:
 * it ignores @track and @expr and always returns false.
 */
static bool nft_expr_reduce(struct nft_regs_track *track,
			    const struct nft_expr *expr)
{
	return false;
}
10280
/*
 * Build chain->blob_next, the rule blob for the next generation of @chain.
 *
 * Returns 0 on success, and also when there is nothing to do because
 * blob_next is already set or the chain is not active in the next generation.
 * Returns -ENOMEM if the accumulated rule size exceeds INT_MAX, if the blob
 * cannot be allocated, or if one of the WARN_ON_ONCE() consistency checks
 * trips.  In the latter case chain->blob_next stays allocated on return
 * (presumably released via nf_tables_commit_chain_prepare_cancel() - confirm
 * against the caller).
 */
static int nf_tables_commit_chain_prepare(struct net *net, struct nft_chain *chain)
{
	const struct nft_expr *expr, *last;
	struct nft_regs_track track = {};
	unsigned int size, data_size;
	void *data, *data_boundary;
	struct nft_rule_dp *prule;
	struct nft_rule *rule;

	/* already handled or inactive chain? */
	if (chain->blob_next || !nft_is_active_next(net, chain))
		return 0;

	/*
	 * Pass 1: size the blob.  Every rule active in the next generation
	 * needs one struct nft_rule_dp header plus rule->dlen bytes.
	 */
	data_size = 0;
	list_for_each_entry(rule, &chain->rules, list) {
		if (nft_is_active_next(net, rule)) {
			data_size += sizeof(*prule) + rule->dlen;
			if (data_size > INT_MAX)
				return -ENOMEM;
		}
	}

	chain->blob_next = nf_tables_chain_alloc_rules(chain, data_size);
	if (!chain->blob_next)
		return -ENOMEM;

	/* data is the write cursor, data_boundary the end of the sized area */
	data = (void *)chain->blob_next->data;
	data_boundary = data + data_size;
	size = 0;

	/* Pass 2: copy the expressions of each active rule behind its header */
	list_for_each_entry(rule, &chain->rules, list) {
		if (!nft_is_active_next(net, rule))
			continue;

		prule = (struct nft_rule_dp *)data;
		/* step over the header; expressions start at prule->data */
		data += offsetof(struct nft_rule_dp, data);
		if (WARN_ON_ONCE(data > data_boundary))
			return -ENOMEM;

		size = 0;
		track.last = nft_expr_last(rule);
		nft_rule_for_each_expr(expr, last, rule) {
			track.cur = expr;

			/* nft_expr_reduce() in this file always returns false */
			if (nft_expr_reduce(&track, expr)) {
				expr = track.cur;
				continue;
			}

			if (WARN_ON_ONCE(data + size + expr->ops->size > data_boundary))
				return -ENOMEM;

			memcpy(data + size, expr, expr->ops->size);
			size += expr->ops->size;
		}
		/*
		 * Expression bytes per rule must stay below 4096 (presumably
		 * the range of prule->dlen - confirm against struct nft_rule_dp).
		 */
		if (WARN_ON_ONCE(size >= 1 << 12))
			return -ENOMEM;

		prule->handle = rule->handle;
		prule->dlen = size;
		prule->is_last = 0;

		data += size;
		size = 0;
		/* account for this rule: header plus copied expressions */
		chain->blob_next->size += (unsigned long)(data - (void *)prule);
	}

	if (WARN_ON_ONCE(data > data_boundary))
		return -ENOMEM;

	/* data now points just past the last copied rule */
	prule = (struct nft_rule_dp *)data;
	nft_last_rule(chain, prule);

	return 0;
}
10356
nf_tables_commit_chain_prepare_cancel(struct net * net)10357 static void nf_tables_commit_chain_prepare_cancel(struct net *net)
10358 {
10359 struct nftables_pernet *nft_net = nft_pernet(net);
10360 struct nft_trans *trans, *next;
10361
10362 list_for_each_entry_safe(trans, next, &nft_net->commit_list, list) {
10363 if (trans->msg_type == NFT_MSG_NEWRULE ||
10364 trans->msg_type == NFT_MSG_DELRULE) {
10365 struct nft_chain *chain = nft_trans_rule_chain(trans);
10366
10367 kvfree(chain->blob_next);
10368 chain->blob_next = NULL;
10369 }
10370 }
10371 }
10372
__nf_tables_commit_chain_free_rules(struct rcu_head * h)10373 static void __nf_tables_commit_chain_free_rules(struct rcu_head *h)
10374 {
10375 struct nft_rule_dp_last *l = container_of(h, struct nft_rule_dp_last, h);
10376
10377 kvfree(l->blob);
10378 }
10379
nf_tables_commit_chain_free_rules_old(struct nft_rule_blob * blob)10380 static void nf_tables_commit_chain_free_rules_old(struct nft_rule_blob *blob)
10381 {
10382 struct nft_rule_dp_last *last;
10383
10384 /* last rule trailer is after end marker */
10385 last = (void *)blob + sizeof(*blob) + blob->size;
10386 last->blob = blob;
10387
10388 call_rcu(&last->h, __nf_tables_commit_chain_free_rules);
10389 }
10390
nf_tables_commit_chain(struct net * net,struct nft_chain * chain)10391 static void nf_tables_commit_chain(struct net *net, struct nft_chain *chain)
10392 {
10393 struct nft_rule_blob *g0, *g1;
10394 bool next_genbit;
10395
10396 next_genbit = nft_gencursor_next(net);
10397
10398 g0 = rcu_dereference_protected(chain->blob_gen_0,
10399 lockdep_commit_lock_is_held(net));
10400 g1 = rcu_dereference_protected(chain->blob_gen_1,
10401 lockdep_commit_lock_is_held(net));
10402
10403 /* No changes to this chain? */
10404 if (chain->blob_next == NULL) {
10405 /* chain had no change in last or next generation */
10406 if (g0 == g1)
10407 return;
10408 /*
10409 * chain had no change in this generation; make sure next
10410 * one uses same rules as current generation.
10411 */
10412 if (next_genbit) {
10413 rcu_assign_pointer(chain->blob_gen_1, g0);
10414 nf_tables_commit_chain_free_rules_old(g1);
10415 } else {
10416 rcu_assign_pointer(chain->blob_gen_0, g1);
10417 nf_tables_commit_chain_free_rules_old(g0);
10418 }
10419
10420 return;
10421 }
10422
10423 if (next_genbit)
10424 rcu_assign_pointer(chain->blob_gen_1, chain->blob_next);
10425 else
10426 rcu_assign_pointer(chain->blob_gen_0, chain->blob_next);
10427
10428 chain->blob_next = NULL;
10429
10430 if (g0 == g1)
10431 return;
10432
10433 if (next_genbit)
10434 nf_tables_commit_chain_free_rules_old(g1);
10435 else
10436 nf_tables_commit_chain_free_rules_old(g0);
10437 }
10438
nft_obj_del(struct nft_object * obj)10439 static void nft_obj_del(struct nft_object *obj)
10440 {
10441 rhltable_remove(&nft_objname_ht, &obj->rhlhead, nft_objname_ht_params);
10442 list_del_rcu(&obj->list);
10443 }
10444
nft_chain_del(struct nft_chain * chain)10445 void nft_chain_del(struct nft_chain *chain)
10446 {
10447 struct nft_table *table = chain->table;
10448
10449 WARN_ON_ONCE(rhltable_remove(&table->chains_ht, &chain->rhlhead,
10450 nft_chain_ht_params));
10451 list_del_rcu(&chain->list);
10452 }
10453
nft_trans_gc_setelem_remove(struct nft_ctx * ctx,struct nft_trans_gc * trans)10454 static void nft_trans_gc_setelem_remove(struct nft_ctx *ctx,
10455 struct nft_trans_gc *trans)
10456 {
10457 struct nft_elem_priv **priv = trans->priv;
10458 unsigned int i;
10459
10460 for (i = 0; i < trans->count; i++) {
10461 nft_setelem_data_deactivate(ctx->net, trans->set, priv[i]);
10462 nft_setelem_remove(ctx->net, trans->set, priv[i]);
10463 }
10464 }
10465
nft_trans_gc_destroy(struct nft_trans_gc * trans)10466 void nft_trans_gc_destroy(struct nft_trans_gc *trans)
10467 {
10468 nft_set_put(trans->set);
10469 put_net(trans->net);
10470 kfree(trans);
10471 }
10472
nft_trans_gc_trans_free(struct rcu_head * rcu)10473 static void nft_trans_gc_trans_free(struct rcu_head *rcu)
10474 {
10475 struct nft_elem_priv *elem_priv;
10476 struct nft_trans_gc *trans;
10477 struct nft_ctx ctx = {};
10478 unsigned int i;
10479
10480 trans = container_of(rcu, struct nft_trans_gc, rcu);
10481 ctx.net = read_pnet(&trans->set->net);
10482
10483 for (i = 0; i < trans->count; i++) {
10484 elem_priv = trans->priv[i];
10485 if (!nft_setelem_is_catchall(trans->set, elem_priv))
10486 atomic_dec(&trans->set->nelems);
10487
10488 nf_tables_set_elem_destroy(&ctx, trans->set, elem_priv);
10489 }
10490
10491 nft_trans_gc_destroy(trans);
10492 }
10493
nft_trans_gc_work_done(struct nft_trans_gc * trans)10494 static bool nft_trans_gc_work_done(struct nft_trans_gc *trans)
10495 {
10496 struct nftables_pernet *nft_net;
10497 struct nft_ctx ctx = {};
10498
10499 nft_net = nft_pernet(trans->net);
10500
10501 mutex_lock(&nft_net->commit_mutex);
10502
10503 /* Check for race with transaction, otherwise this batch refers to
10504 * stale objects that might not be there anymore. Skip transaction if
10505 * set has been destroyed from control plane transaction in case gc
10506 * worker loses race.
10507 */
10508 if (READ_ONCE(nft_net->gc_seq) != trans->seq || trans->set->dead) {
10509 mutex_unlock(&nft_net->commit_mutex);
10510 return false;
10511 }
10512
10513 ctx.net = trans->net;
10514 ctx.table = trans->set->table;
10515
10516 nft_trans_gc_setelem_remove(&ctx, trans);
10517 mutex_unlock(&nft_net->commit_mutex);
10518
10519 return true;
10520 }
10521
nft_trans_gc_work(struct work_struct * work)10522 static void nft_trans_gc_work(struct work_struct *work)
10523 {
10524 struct nft_trans_gc *trans, *next;
10525 LIST_HEAD(trans_gc_list);
10526
10527 spin_lock(&nf_tables_gc_list_lock);
10528 list_splice_init(&nf_tables_gc_list, &trans_gc_list);
10529 spin_unlock(&nf_tables_gc_list_lock);
10530
10531 list_for_each_entry_safe(trans, next, &trans_gc_list, list) {
10532 list_del(&trans->list);
10533 if (!nft_trans_gc_work_done(trans)) {
10534 nft_trans_gc_destroy(trans);
10535 continue;
10536 }
10537 call_rcu(&trans->rcu, nft_trans_gc_trans_free);
10538 }
10539 }
10540
/*
 * Allocate an empty GC batch for @set, tagged with sequence @gc_seq.
 *
 * The batch takes a reference on the set and on the set's netns. Returns
 * NULL if the allocation fails or if maybe_get_net() returns NULL.
 */
struct nft_trans_gc *nft_trans_gc_alloc(struct nft_set *set,
					unsigned int gc_seq, gfp_t gfp)
{
	struct net *net = read_pnet(&set->net);
	struct nft_trans_gc *gc;

	gc = kzalloc(sizeof(*gc), gfp);
	if (!gc)
		return NULL;

	gc->net = maybe_get_net(net);
	if (!gc->net)
		goto err_free;

	refcount_inc(&set->refs);
	gc->set = set;
	gc->seq = gc_seq;

	return gc;

err_free:
	kfree(gc);
	return NULL;
}
10563
nft_trans_gc_elem_add(struct nft_trans_gc * trans,void * priv)10564 void nft_trans_gc_elem_add(struct nft_trans_gc *trans, void *priv)
10565 {
10566 trans->priv[trans->count++] = priv;
10567 }
10568
nft_trans_gc_queue_work(struct nft_trans_gc * trans)10569 static void nft_trans_gc_queue_work(struct nft_trans_gc *trans)
10570 {
10571 spin_lock(&nf_tables_gc_list_lock);
10572 list_add_tail(&trans->list, &nf_tables_gc_list);
10573 spin_unlock(&nf_tables_gc_list_lock);
10574
10575 schedule_work(&trans_gc_work);
10576 }
10577
nft_trans_gc_space(struct nft_trans_gc * trans)10578 static int nft_trans_gc_space(struct nft_trans_gc *trans)
10579 {
10580 return NFT_TRANS_GC_BATCHCOUNT - trans->count;
10581 }
10582
/*
 * Make sure there is a batch with room for one more element.
 *
 * Returns @gc unchanged while it still has room. Otherwise @gc is queued
 * for the GC worker and a new batch for the same set is allocated and
 * returned (NULL if that allocation fails).
 */
struct nft_trans_gc *nft_trans_gc_queue_async(struct nft_trans_gc *gc,
					      unsigned int gc_seq, gfp_t gfp)
{
	/* fetch the set before @gc is handed over to the worker */
	struct nft_set *set = gc->set;

	if (nft_trans_gc_space(gc) != 0)
		return gc;

	nft_trans_gc_queue_work(gc);

	return nft_trans_gc_alloc(set, gc_seq, gfp);
}
10596
nft_trans_gc_queue_async_done(struct nft_trans_gc * trans)10597 void nft_trans_gc_queue_async_done(struct nft_trans_gc *trans)
10598 {
10599 if (trans->count == 0) {
10600 nft_trans_gc_destroy(trans);
10601 return;
10602 }
10603
10604 nft_trans_gc_queue_work(trans);
10605 }
10606
/*
 * Synchronous counterpart of nft_trans_gc_queue_async(); warns once and
 * returns NULL if the commit lock check fails.
 *
 * Returns @gc unchanged while it still has room. Otherwise @gc is handed
 * to call_rcu() for release and a new batch (sequence 0) for the same set
 * is allocated and returned (NULL if that allocation fails).
 */
struct nft_trans_gc *nft_trans_gc_queue_sync(struct nft_trans_gc *gc, gfp_t gfp)
{
	struct nft_set *set;

	if (WARN_ON_ONCE(!lockdep_commit_lock_is_held(gc->net)))
		return NULL;

	if (nft_trans_gc_space(gc) != 0)
		return gc;

	/* fetch the set before @gc is handed over to RCU */
	set = gc->set;
	call_rcu(&gc->rcu, nft_trans_gc_trans_free);

	return nft_trans_gc_alloc(set, 0, gfp);
}
10622
nft_trans_gc_queue_sync_done(struct nft_trans_gc * trans)10623 void nft_trans_gc_queue_sync_done(struct nft_trans_gc *trans)
10624 {
10625 WARN_ON_ONCE(!lockdep_commit_lock_is_held(trans->net));
10626
10627 if (trans->count == 0) {
10628 nft_trans_gc_destroy(trans);
10629 return;
10630 }
10631
10632 call_rcu(&trans->rcu, nft_trans_gc_trans_free);
10633 }
10634
nft_trans_gc_catchall_async(struct nft_trans_gc * gc,unsigned int gc_seq)10635 struct nft_trans_gc *nft_trans_gc_catchall_async(struct nft_trans_gc *gc,
10636 unsigned int gc_seq)
10637 {
10638 struct nft_set_elem_catchall *catchall;
10639 const struct nft_set *set = gc->set;
10640 struct nft_set_ext *ext;
10641
10642 list_for_each_entry_rcu(catchall, &set->catchall_list, list) {
10643 ext = nft_set_elem_ext(set, catchall->elem);
10644
10645 if (!nft_set_elem_expired(ext))
10646 continue;
10647 if (nft_set_elem_is_dead(ext))
10648 goto dead_elem;
10649
10650 nft_set_elem_dead(ext);
10651 dead_elem:
10652 gc = nft_trans_gc_queue_async(gc, gc_seq, GFP_ATOMIC);
10653 if (!gc)
10654 return NULL;
10655
10656 nft_trans_gc_elem_add(gc, catchall->elem);
10657 }
10658
10659 return gc;
10660 }
10661
nft_trans_gc_catchall_sync(struct nft_trans_gc * gc)10662 struct nft_trans_gc *nft_trans_gc_catchall_sync(struct nft_trans_gc *gc)
10663 {
10664 struct nft_set_elem_catchall *catchall, *next;
10665 u64 tstamp = nft_net_tstamp(gc->net);
10666 const struct nft_set *set = gc->set;
10667 struct nft_elem_priv *elem_priv;
10668 struct nft_set_ext *ext;
10669
10670 WARN_ON_ONCE(!lockdep_commit_lock_is_held(gc->net));
10671
10672 list_for_each_entry_safe(catchall, next, &set->catchall_list, list) {
10673 ext = nft_set_elem_ext(set, catchall->elem);
10674
10675 if (!__nft_set_elem_expired(ext, tstamp))
10676 continue;
10677
10678 gc = nft_trans_gc_queue_sync(gc, GFP_KERNEL);
10679 if (!gc)
10680 return NULL;
10681
10682 elem_priv = catchall->elem;
10683 nft_setelem_data_deactivate(gc->net, gc->set, elem_priv);
10684 nft_setelem_catchall_destroy(catchall);
10685 nft_trans_gc_elem_add(gc, elem_priv);
10686 }
10687
10688 return gc;
10689 }
10690
nf_tables_module_autoload_cleanup(struct net * net)10691 static void nf_tables_module_autoload_cleanup(struct net *net)
10692 {
10693 struct nftables_pernet *nft_net = nft_pernet(net);
10694 struct nft_module_request *req, *next;
10695
10696 WARN_ON_ONCE(!list_empty(&nft_net->commit_list));
10697 list_for_each_entry_safe(req, next, &nft_net->module_list, list) {
10698 WARN_ON_ONCE(!req->done);
10699 list_del(&req->list);
10700 kfree(req);
10701 }
10702 }
10703
nf_tables_commit_release(struct net * net)10704 static void nf_tables_commit_release(struct net *net)
10705 {
10706 struct nftables_pernet *nft_net = nft_pernet(net);
10707 struct nft_trans *trans;
10708
10709 /* all side effects have to be made visible.
10710 * For example, if a chain named 'foo' has been deleted, a
10711 * new transaction must not find it anymore.
10712 *
10713 * Memory reclaim happens asynchronously from work queue
10714 * to prevent expensive synchronize_rcu() in commit phase.
10715 */
10716 if (list_empty(&nft_net->commit_list)) {
10717 nf_tables_module_autoload_cleanup(net);
10718 mutex_unlock(&nft_net->commit_mutex);
10719 return;
10720 }
10721
10722 trans = list_last_entry(&nft_net->commit_list,
10723 struct nft_trans, list);
10724 get_net(trans->net);
10725 WARN_ON_ONCE(trans->put_net);
10726
10727 trans->put_net = true;
10728 spin_lock(&nf_tables_destroy_list_lock);
10729 list_splice_tail_init(&nft_net->commit_list, &nft_net->destroy_list);
10730 spin_unlock(&nf_tables_destroy_list_lock);
10731
10732 nf_tables_module_autoload_cleanup(net);
10733 schedule_work(&nft_net->destroy_work);
10734
10735 mutex_unlock(&nft_net->commit_mutex);
10736 }
10737
/*
 * Send the queued notification skbs of this commit to NFNLGRP_NFTABLES.
 *
 * Consecutive skbs are appended to one batch skb while the running length
 * budget (starting from NLMSG_GOODSIZE) stays positive and their report
 * flag matches the batch; otherwise the batch is sent and the current skb
 * starts a new one.
 */
static void nft_commit_notify(struct net *net, u32 portid)
{
	struct nftables_pernet *pernet = nft_pernet(net);
	struct sk_buff *batch = NULL, *cur, *tmp;
	unsigned char *tail;
	int room = 0;

	list_for_each_entry_safe(cur, tmp, &pernet->notify_list, list) {
		if (batch) {
			room -= cur->len;
			if (room > 0 &&
			    NFT_CB(cur).report == NFT_CB(batch).report) {
				/* fits: copy the payload and drop the source skb */
				tail = skb_put(batch, cur->len);
				memcpy(tail, cur->data, cur->len);
				list_del(&cur->list);
				kfree_skb(cur);
				continue;
			}

			/* does not fit or report flag differs: flush */
			nfnetlink_send(batch, net, portid, NFNLGRP_NFTABLES,
				       NFT_CB(batch).report, GFP_KERNEL);
		}

		/* current skb becomes the head of a new batch */
		batch = cur;
		room = NLMSG_GOODSIZE - cur->len;
		list_del(&cur->list);
	}

	if (batch) {
		nfnetlink_send(batch, net, portid, NFNLGRP_NFTABLES,
			       NFT_CB(batch).report, GFP_KERNEL);
	}

	WARN_ON_ONCE(!list_empty(&pernet->notify_list));
}
10773
nf_tables_commit_audit_alloc(struct list_head * adl,struct nft_table * table)10774 static int nf_tables_commit_audit_alloc(struct list_head *adl,
10775 struct nft_table *table)
10776 {
10777 struct nft_audit_data *adp;
10778
10779 list_for_each_entry(adp, adl, list) {
10780 if (adp->table == table)
10781 return 0;
10782 }
10783 adp = kzalloc(sizeof(*adp), GFP_KERNEL);
10784 if (!adp)
10785 return -ENOMEM;
10786 adp->table = table;
10787 list_add(&adp->list, adl);
10788 return 0;
10789 }
10790
nf_tables_commit_audit_free(struct list_head * adl)10791 static void nf_tables_commit_audit_free(struct list_head *adl)
10792 {
10793 struct nft_audit_data *adp, *adn;
10794
10795 list_for_each_entry_safe(adp, adn, adl, list) {
10796 list_del(&adp->list);
10797 kfree(adp);
10798 }
10799 }
10800
10801 /* nft audit emits the number of elements that get added/removed/updated,
10802 * so NEW/DELSETELEM needs to increment based on the total elem count.
10803 */
nf_tables_commit_audit_entrycount(const struct nft_trans * trans)10804 static unsigned int nf_tables_commit_audit_entrycount(const struct nft_trans *trans)
10805 {
10806 switch (trans->msg_type) {
10807 case NFT_MSG_NEWSETELEM:
10808 case NFT_MSG_DELSETELEM:
10809 return nft_trans_container_elem(trans)->nelems;
10810 }
10811
10812 return 1;
10813 }
10814
/*
 * Account @trans in the audit entry of its table: add its entry count and
 * record @op if no op is recorded yet or @op is numerically smaller than
 * the recorded one. Warns once and does nothing if the table has no entry
 * in @adl.
 */
static void nf_tables_commit_audit_collect(struct list_head *adl,
					   const struct nft_trans *trans, u32 op)
{
	const struct nft_table *table = trans->table;
	struct nft_audit_data *iter, *entry = NULL;

	list_for_each_entry(iter, adl, list) {
		if (iter->table == table) {
			entry = iter;
			break;
		}
	}

	if (!entry) {
		WARN_ONCE(1, "table=%s not expected in commit list", table->name);
		return;
	}

	entry->entries += nf_tables_commit_audit_entrycount(trans);
	if (!entry->op || entry->op > op)
		entry->op = op;
}
10832
10833 #define AUNFTABLENAMELEN (NFT_TABLE_MAXNAMELEN + 22)
10834
nf_tables_commit_audit_log(struct list_head * adl,u32 generation)10835 static void nf_tables_commit_audit_log(struct list_head *adl, u32 generation)
10836 {
10837 struct nft_audit_data *adp, *adn;
10838 char aubuf[AUNFTABLENAMELEN];
10839
10840 list_for_each_entry_safe(adp, adn, adl, list) {
10841 snprintf(aubuf, AUNFTABLENAMELEN, "%s:%u", adp->table->name,
10842 generation);
10843 audit_log_nfcfg(aubuf, adp->table->family, adp->entries,
10844 nft2audit_op[adp->op], GFP_KERNEL);
10845 list_del(&adp->list);
10846 kfree(adp);
10847 }
10848 }
10849
nft_set_commit_update(struct list_head * set_update_list)10850 static void nft_set_commit_update(struct list_head *set_update_list)
10851 {
10852 struct nft_set *set, *next;
10853
10854 list_for_each_entry_safe(set, next, set_update_list, pending_update) {
10855 list_del_init(&set->pending_update);
10856
10857 if (!set->ops->commit || set->dead)
10858 continue;
10859
10860 set->ops->commit(set);
10861 }
10862 }
10863
nft_gc_seq_begin(struct nftables_pernet * nft_net)10864 static unsigned int nft_gc_seq_begin(struct nftables_pernet *nft_net)
10865 {
10866 unsigned int gc_seq;
10867
10868 /* Bump gc counter, it becomes odd, this is the busy mark. */
10869 gc_seq = READ_ONCE(nft_net->gc_seq);
10870 WRITE_ONCE(nft_net->gc_seq, ++gc_seq);
10871
10872 return gc_seq;
10873 }
10874
nft_gc_seq_end(struct nftables_pernet * nft_net,unsigned int gc_seq)10875 static void nft_gc_seq_end(struct nftables_pernet *nft_net, unsigned int gc_seq)
10876 {
10877 WRITE_ONCE(nft_net->gc_seq, ++gc_seq);
10878 }
10879
/*
 * nf_tables_commit - apply all pending transactions of @net
 * @net: network namespace whose commit list is processed
 * @skb: netlink batch skb; provides the netlink header for the context and
 *	 the portid used for notifications
 *
 * Phases, in order:
 *   - reject anonymous sets / chain bindings that were never bound,
 *   - validate the ruleset and commit flow rule offload,
 *   - build the next-generation rule blob of every chain touched by a
 *     rule add/delete (and make sure each table has an audit entry),
 *   - publish the blobs, bump base_seq, mark GC busy and flip gencursor,
 *   - walk the commit list and make each transaction take effect,
 *   - run set ->commit() hooks, send notifications, emit audit records,
 *     and hand the remaining transactions to nf_tables_commit_release().
 *
 * Returns 0 on success; -EINVAL for an unbound anonymous set or chain
 * binding; -EAGAIN if validation fails; otherwise the error returned by
 * nft_flow_rule_offload_commit(), nf_tables_commit_audit_alloc() or
 * nf_tables_commit_chain_prepare().
 *
 * The commit mutex is released on the success paths (directly for an empty
 * commit list, via nf_tables_commit_release() otherwise). The error
 * returns do not release it here.
 * NOTE(review): presumably the caller's abort path unlocks it - confirm.
 */
static int nf_tables_commit(struct net *net, struct sk_buff *skb)
{
	struct nftables_pernet *nft_net = nft_pernet(net);
	const struct nlmsghdr *nlh = nlmsg_hdr(skb);
	struct nft_trans_binding *trans_binding;
	struct nft_trans *trans, *next;
	unsigned int base_seq, gc_seq;
	LIST_HEAD(set_update_list);
	struct nft_trans_elem *te;
	struct nft_chain *chain;
	struct nft_table *table;
	struct nft_ctx ctx;
	LIST_HEAD(adl);
	int err;

	/* Nothing to commit: just drop the mutex. */
	if (list_empty(&nft_net->commit_list)) {
		mutex_unlock(&nft_net->commit_mutex);
		return 0;
	}

	nft_ctx_init(&ctx, net, skb, nlh, NFPROTO_UNSPEC, NULL, NULL, NULL);

	/* Refuse to commit new anonymous sets or chain bindings that are
	 * still unbound at this point.
	 */
	list_for_each_entry(trans_binding, &nft_net->binding_list, binding_list) {
		trans = &trans_binding->nft_trans;
		switch (trans->msg_type) {
		case NFT_MSG_NEWSET:
			if (!nft_trans_set_update(trans) &&
			    nft_set_is_anonymous(nft_trans_set(trans)) &&
			    !nft_trans_set_bound(trans)) {
				pr_warn_once("nftables ruleset with unbound set\n");
				return -EINVAL;
			}
			break;
		case NFT_MSG_NEWCHAIN:
			if (!nft_trans_chain_update(trans) &&
			    nft_chain_binding(nft_trans_chain(trans)) &&
			    !nft_trans_chain_bound(trans)) {
				pr_warn_once("nftables ruleset with unbound chain\n");
				return -EINVAL;
			}
			break;
		default:
			WARN_ONCE(1, "Unhandled bind type %d", trans->msg_type);
			break;
		}
	}

	/* 0. Validate ruleset, otherwise roll back for error reporting. */
	if (nf_tables_validate(net) < 0) {
		nft_net->validate_state = NFT_VALIDATE_DO;
		return -EAGAIN;
	}

	err = nft_flow_rule_offload_commit(net);
	if (err < 0)
		return err;

	/* 1.  Allocate space for next generation rules_gen_X[] */
	list_for_each_entry_safe(trans, next, &nft_net->commit_list, list) {
		/* shadows the function-scope 'table' on purpose */
		struct nft_table *table = trans->table;
		int ret;

		/* one audit entry per table seen in this transaction */
		ret = nf_tables_commit_audit_alloc(&adl, table);
		if (ret) {
			nf_tables_commit_chain_prepare_cancel(net);
			nf_tables_commit_audit_free(&adl);
			return ret;
		}
		if (trans->msg_type == NFT_MSG_NEWRULE ||
		    trans->msg_type == NFT_MSG_DELRULE) {
			chain = nft_trans_rule_chain(trans);

			ret = nf_tables_commit_chain_prepare(net, chain);
			if (ret < 0) {
				/* free the blobs prepared so far */
				nf_tables_commit_chain_prepare_cancel(net);
				nf_tables_commit_audit_free(&adl);
				return ret;
			}
		}
	}

	/* step 2.  Make rules_gen_X visible to packet path */
	list_for_each_entry(table, &nft_net->tables, list) {
		list_for_each_entry(chain, &table->chains, list)
			nf_tables_commit_chain(net, chain);
	}

	/*
	 * Bump generation counter, invalidate any dump in progress.
	 * Cannot fail after this point.
	 */
	base_seq = READ_ONCE(nft_net->base_seq);
	/* skip 0 when the counter wraps around */
	while (++base_seq == 0)
		;

	WRITE_ONCE(nft_net->base_seq, base_seq);

	gc_seq = nft_gc_seq_begin(nft_net);

	/* step 3. Start new generation, rules_gen_X now in use. */
	net->nft.gencursor = nft_gencursor_next(net);

	/*
	 * Apply each transaction. Cases that call nft_trans_destroy() are
	 * finished with the transaction here; cases that do not leave it on
	 * the commit list, which nf_tables_commit_release() later splices
	 * onto the destroy list.
	 */
	list_for_each_entry_safe(trans, next, &nft_net->commit_list, list) {
		struct nft_table *table = trans->table;

		nft_ctx_update(&ctx, trans);

		nf_tables_commit_audit_collect(&adl, trans, trans->msg_type);
		switch (trans->msg_type) {
		case NFT_MSG_NEWTABLE:
			if (nft_trans_table_update(trans)) {
				/* update flag already cleared: nothing left to do */
				if (!(table->flags & __NFT_TABLE_F_UPDATE)) {
					nft_trans_destroy(trans);
					break;
				}
				if (table->flags & NFT_TABLE_F_DORMANT)
					nf_tables_table_disable(net, table);

				table->flags &= ~__NFT_TABLE_F_UPDATE;
			} else {
				nft_clear(net, table);
			}
			nf_tables_table_notify(&ctx, NFT_MSG_NEWTABLE);
			nft_trans_destroy(trans);
			break;
		case NFT_MSG_DELTABLE:
		case NFT_MSG_DESTROYTABLE:
			list_del_rcu(&table->list);
			nf_tables_table_notify(&ctx, trans->msg_type);
			break;
		case NFT_MSG_NEWCHAIN:
			if (nft_trans_chain_update(trans)) {
				nft_chain_commit_update(nft_trans_container_chain(trans));
				nf_tables_chain_notify(&ctx, NFT_MSG_NEWCHAIN,
						       &nft_trans_chain_hooks(trans));
				/* move the hooks of this update onto the basechain */
				list_splice(&nft_trans_chain_hooks(trans),
					    &nft_trans_basechain(trans)->hook_list);
				/* trans destroyed after rcu grace period */
			} else {
				nft_chain_commit_drop_policy(nft_trans_container_chain(trans));
				nft_clear(net, nft_trans_chain(trans));
				nf_tables_chain_notify(&ctx, NFT_MSG_NEWCHAIN, NULL);
				nft_trans_destroy(trans);
			}
			break;
		case NFT_MSG_DELCHAIN:
		case NFT_MSG_DESTROYCHAIN:
			if (nft_trans_chain_update(trans)) {
				/* only the hooks listed in the transaction go away */
				nf_tables_chain_notify(&ctx, NFT_MSG_DELCHAIN,
						       &nft_trans_chain_hooks(trans));
				if (!(table->flags & NFT_TABLE_F_DORMANT)) {
					nft_netdev_unregister_hooks(net,
								    &nft_trans_chain_hooks(trans),
								    true);
				}
			} else {
				nft_chain_del(nft_trans_chain(trans));
				nf_tables_chain_notify(&ctx, NFT_MSG_DELCHAIN,
						       NULL);
				nf_tables_unregister_hook(ctx.net, ctx.table,
							  nft_trans_chain(trans));
			}
			break;
		case NFT_MSG_NEWRULE:
			nft_clear(net, nft_trans_rule(trans));
			nf_tables_rule_notify(&ctx, nft_trans_rule(trans),
					      NFT_MSG_NEWRULE);
			if (nft_trans_rule_chain(trans)->flags & NFT_CHAIN_HW_OFFLOAD)
				nft_flow_rule_destroy(nft_trans_flow_rule(trans));

			nft_trans_destroy(trans);
			break;
		case NFT_MSG_DELRULE:
		case NFT_MSG_DESTROYRULE:
			list_del_rcu(&nft_trans_rule(trans)->list);
			nf_tables_rule_notify(&ctx, nft_trans_rule(trans),
					      trans->msg_type);
			nft_rule_expr_deactivate(&ctx, nft_trans_rule(trans),
						 NFT_TRANS_COMMIT);

			if (nft_trans_rule_chain(trans)->flags & NFT_CHAIN_HW_OFFLOAD)
				nft_flow_rule_destroy(nft_trans_flow_rule(trans));
			break;
		case NFT_MSG_NEWSET:
			list_del(&nft_trans_container_set(trans)->list_trans_newset);
			if (nft_trans_set_update(trans)) {
				struct nft_set *set = nft_trans_set(trans);

				WRITE_ONCE(set->timeout, nft_trans_set_timeout(trans));
				WRITE_ONCE(set->gc_int, nft_trans_set_gc_int(trans));

				/* a size of 0 in the transaction leaves set->size as is */
				if (nft_trans_set_size(trans))
					WRITE_ONCE(set->size, nft_trans_set_size(trans));
			} else {
				nft_clear(net, nft_trans_set(trans));
				/* This avoids hitting -EBUSY when deleting the table
				 * from the transaction.
				 */
				if (nft_set_is_anonymous(nft_trans_set(trans)) &&
				    !list_empty(&nft_trans_set(trans)->bindings))
					nft_use_dec(&table->use);
			}
			nf_tables_set_notify(&ctx, nft_trans_set(trans),
					     NFT_MSG_NEWSET, GFP_KERNEL);
			nft_trans_destroy(trans);
			break;
		case NFT_MSG_DELSET:
		case NFT_MSG_DESTROYSET:
			/* flag the set dead before unlinking it */
			nft_trans_set(trans)->dead = 1;
			list_del_rcu(&nft_trans_set(trans)->list);
			nf_tables_set_notify(&ctx, nft_trans_set(trans),
					     trans->msg_type, GFP_KERNEL);
			break;
		case NFT_MSG_NEWSETELEM:
			te = nft_trans_container_elem(trans);

			nft_trans_elems_add(&ctx, te);

			/* queue the set once for its ->commit() hook below */
			if (te->set->ops->commit &&
			    list_empty(&te->set->pending_update)) {
				list_add_tail(&te->set->pending_update,
					      &set_update_list);
			}
			nft_trans_destroy(trans);
			break;
		case NFT_MSG_DELSETELEM:
		case NFT_MSG_DESTROYSETELEM:
			te = nft_trans_container_elem(trans);

			nft_trans_elems_remove(&ctx, te);

			/* queue the set once for its ->commit() hook below */
			if (te->set->ops->commit &&
			    list_empty(&te->set->pending_update)) {
				list_add_tail(&te->set->pending_update,
					      &set_update_list);
			}
			break;
		case NFT_MSG_NEWOBJ:
			if (nft_trans_obj_update(trans)) {
				/* trans is not destroyed in the update case */
				nft_obj_commit_update(&ctx, trans);
				nf_tables_obj_notify(&ctx,
						     nft_trans_obj(trans),
						     NFT_MSG_NEWOBJ);
			} else {
				nft_clear(net, nft_trans_obj(trans));
				nf_tables_obj_notify(&ctx,
						     nft_trans_obj(trans),
						     NFT_MSG_NEWOBJ);
				nft_trans_destroy(trans);
			}
			break;
		case NFT_MSG_DELOBJ:
		case NFT_MSG_DESTROYOBJ:
			nft_obj_del(nft_trans_obj(trans));
			nf_tables_obj_notify(&ctx, nft_trans_obj(trans),
					     trans->msg_type);
			break;
		case NFT_MSG_NEWFLOWTABLE:
			if (nft_trans_flowtable_update(trans)) {
				nft_trans_flowtable(trans)->data.flags =
					nft_trans_flowtable_flags(trans);
				nf_tables_flowtable_notify(&ctx,
							   nft_trans_flowtable(trans),
							   &nft_trans_flowtable_hooks(trans),
							   NFT_MSG_NEWFLOWTABLE);
				/* move the hooks of this update onto the flowtable */
				list_splice(&nft_trans_flowtable_hooks(trans),
					    &nft_trans_flowtable(trans)->hook_list);
			} else {
				nft_clear(net, nft_trans_flowtable(trans));
				nf_tables_flowtable_notify(&ctx,
							   nft_trans_flowtable(trans),
							   NULL,
							   NFT_MSG_NEWFLOWTABLE);
			}
			nft_trans_destroy(trans);
			break;
		case NFT_MSG_DELFLOWTABLE:
		case NFT_MSG_DESTROYFLOWTABLE:
			if (nft_trans_flowtable_update(trans)) {
				/* only the hooks listed in the transaction go away */
				nf_tables_flowtable_notify(&ctx,
							   nft_trans_flowtable(trans),
							   &nft_trans_flowtable_hooks(trans),
							   trans->msg_type);
				nft_unregister_flowtable_net_hooks(net,
								   nft_trans_flowtable(trans),
								   &nft_trans_flowtable_hooks(trans));
			} else {
				list_del_rcu(&nft_trans_flowtable(trans)->list);
				nf_tables_flowtable_notify(&ctx,
							   nft_trans_flowtable(trans),
							   NULL,
							   trans->msg_type);
				nft_unregister_flowtable_net_hooks(net,
								   nft_trans_flowtable(trans),
								   &nft_trans_flowtable(trans)->hook_list);
			}
			break;
		}
	}

	/* run ->commit() once per set touched by element transactions */
	nft_set_commit_update(&set_update_list);

	nft_commit_notify(net, NETLINK_CB(skb).portid);
	nf_tables_gen_notify(net, skb, NFT_MSG_NEWGEN);
	nf_tables_commit_audit_log(&adl, nft_net->base_seq);

	nft_gc_seq_end(nft_net, gc_seq);
	nft_net->validate_state = NFT_VALIDATE_SKIP;
	/* releases the commit mutex */
	nf_tables_commit_release(net);

	return 0;
}
11192
nf_tables_module_autoload(struct net * net)11193 static void nf_tables_module_autoload(struct net *net)
11194 {
11195 struct nftables_pernet *nft_net = nft_pernet(net);
11196 struct nft_module_request *req, *next;
11197 LIST_HEAD(module_list);
11198
11199 list_splice_init(&nft_net->module_list, &module_list);
11200 mutex_unlock(&nft_net->commit_mutex);
11201 list_for_each_entry_safe(req, next, &module_list, list) {
11202 request_module("%s", req->module);
11203 req->done = true;
11204 }
11205 mutex_lock(&nft_net->commit_mutex);
11206 list_splice(&module_list, &nft_net->module_list);
11207 }
11208
nf_tables_abort_release(struct nft_trans * trans)11209 static void nf_tables_abort_release(struct nft_trans *trans)
11210 {
11211 struct nft_ctx ctx = { };
11212
11213 nft_ctx_update(&ctx, trans);
11214
11215 switch (trans->msg_type) {
11216 case NFT_MSG_NEWTABLE:
11217 nf_tables_table_destroy(trans->table);
11218 break;
11219 case NFT_MSG_NEWCHAIN:
11220 if (nft_trans_chain_update(trans))
11221 nft_hooks_destroy(&nft_trans_chain_hooks(trans));
11222 else
11223 nf_tables_chain_destroy(nft_trans_chain(trans));
11224 break;
11225 case NFT_MSG_NEWRULE:
11226 nf_tables_rule_destroy(&ctx, nft_trans_rule(trans));
11227 break;
11228 case NFT_MSG_NEWSET:
11229 nft_set_destroy(&ctx, nft_trans_set(trans));
11230 break;
11231 case NFT_MSG_NEWSETELEM:
11232 nft_trans_set_elem_destroy(&ctx, nft_trans_container_elem(trans));
11233 break;
11234 case NFT_MSG_NEWOBJ:
11235 nft_obj_destroy(&ctx, nft_trans_obj(trans));
11236 break;
11237 case NFT_MSG_NEWFLOWTABLE:
11238 if (nft_trans_flowtable_update(trans))
11239 nft_hooks_destroy(&nft_trans_flowtable_hooks(trans));
11240 else
11241 nf_tables_flowtable_destroy(nft_trans_flowtable(trans));
11242 break;
11243 }
11244 kfree(trans);
11245 }
11246
nft_set_abort_update(struct list_head * set_update_list)11247 static void nft_set_abort_update(struct list_head *set_update_list)
11248 {
11249 struct nft_set *set, *next;
11250
11251 list_for_each_entry_safe(set, next, set_update_list, pending_update) {
11252 list_del_init(&set->pending_update);
11253
11254 if (!set->ops->abort)
11255 continue;
11256
11257 set->ops->abort(set);
11258 }
11259 }
11260
__nf_tables_abort(struct net * net,enum nfnl_abort_action action)11261 static int __nf_tables_abort(struct net *net, enum nfnl_abort_action action)
11262 {
11263 struct nftables_pernet *nft_net = nft_pernet(net);
11264 struct nft_trans *trans, *next;
11265 LIST_HEAD(set_update_list);
11266 struct nft_trans_elem *te;
11267 struct nft_ctx ctx = {
11268 .net = net,
11269 };
11270 int err = 0;
11271
11272 if (action == NFNL_ABORT_VALIDATE &&
11273 nf_tables_validate(net) < 0)
11274 err = -EAGAIN;
11275
11276 list_for_each_entry_safe_reverse(trans, next, &nft_net->commit_list,
11277 list) {
11278 struct nft_table *table = trans->table;
11279
11280 nft_ctx_update(&ctx, trans);
11281
11282 switch (trans->msg_type) {
11283 case NFT_MSG_NEWTABLE:
11284 if (nft_trans_table_update(trans)) {
11285 if (!(table->flags & __NFT_TABLE_F_UPDATE)) {
11286 nft_trans_destroy(trans);
11287 break;
11288 }
11289 if (table->flags & __NFT_TABLE_F_WAS_DORMANT) {
11290 nf_tables_table_disable(net, table);
11291 table->flags |= NFT_TABLE_F_DORMANT;
11292 } else if (table->flags & __NFT_TABLE_F_WAS_AWAKEN) {
11293 table->flags &= ~NFT_TABLE_F_DORMANT;
11294 }
11295 if (table->flags & __NFT_TABLE_F_WAS_ORPHAN) {
11296 table->flags &= ~NFT_TABLE_F_OWNER;
11297 table->nlpid = 0;
11298 }
11299 table->flags &= ~__NFT_TABLE_F_UPDATE;
11300 nft_trans_destroy(trans);
11301 } else {
11302 list_del_rcu(&table->list);
11303 }
11304 break;
11305 case NFT_MSG_DELTABLE:
11306 case NFT_MSG_DESTROYTABLE:
11307 nft_clear(trans->net, table);
11308 nft_trans_destroy(trans);
11309 break;
11310 case NFT_MSG_NEWCHAIN:
11311 if (nft_trans_chain_update(trans)) {
11312 if (!(table->flags & NFT_TABLE_F_DORMANT)) {
11313 nft_netdev_unregister_hooks(net,
11314 &nft_trans_chain_hooks(trans),
11315 true);
11316 }
11317 free_percpu(nft_trans_chain_stats(trans));
11318 kfree(nft_trans_chain_name(trans));
11319 nft_trans_destroy(trans);
11320 } else {
11321 if (nft_trans_chain_bound(trans)) {
11322 nft_trans_destroy(trans);
11323 break;
11324 }
11325 nft_use_dec_restore(&table->use);
11326 nft_chain_del(nft_trans_chain(trans));
11327 nf_tables_unregister_hook(trans->net, table,
11328 nft_trans_chain(trans));
11329 }
11330 break;
11331 case NFT_MSG_DELCHAIN:
11332 case NFT_MSG_DESTROYCHAIN:
11333 if (nft_trans_chain_update(trans)) {
11334 list_splice(&nft_trans_chain_hooks(trans),
11335 &nft_trans_basechain(trans)->hook_list);
11336 } else {
11337 nft_use_inc_restore(&table->use);
11338 nft_clear(trans->net, nft_trans_chain(trans));
11339 }
11340 nft_trans_destroy(trans);
11341 break;
11342 case NFT_MSG_NEWRULE:
11343 if (nft_trans_rule_bound(trans)) {
11344 nft_trans_destroy(trans);
11345 break;
11346 }
11347 nft_use_dec_restore(&nft_trans_rule_chain(trans)->use);
11348 list_del_rcu(&nft_trans_rule(trans)->list);
11349 nft_rule_expr_deactivate(&ctx,
11350 nft_trans_rule(trans),
11351 NFT_TRANS_ABORT);
11352 if (nft_trans_rule_chain(trans)->flags & NFT_CHAIN_HW_OFFLOAD)
11353 nft_flow_rule_destroy(nft_trans_flow_rule(trans));
11354 break;
11355 case NFT_MSG_DELRULE:
11356 case NFT_MSG_DESTROYRULE:
11357 nft_use_inc_restore(&nft_trans_rule_chain(trans)->use);
11358 nft_clear(trans->net, nft_trans_rule(trans));
11359 nft_rule_expr_activate(&ctx, nft_trans_rule(trans));
11360 if (nft_trans_rule_chain(trans)->flags & NFT_CHAIN_HW_OFFLOAD)
11361 nft_flow_rule_destroy(nft_trans_flow_rule(trans));
11362
11363 nft_trans_destroy(trans);
11364 break;
11365 case NFT_MSG_NEWSET:
11366 list_del(&nft_trans_container_set(trans)->list_trans_newset);
11367 if (nft_trans_set_update(trans)) {
11368 nft_trans_destroy(trans);
11369 break;
11370 }
11371 nft_use_dec_restore(&table->use);
11372 if (nft_trans_set_bound(trans)) {
11373 nft_trans_destroy(trans);
11374 break;
11375 }
11376 nft_trans_set(trans)->dead = 1;
11377 list_del_rcu(&nft_trans_set(trans)->list);
11378 break;
11379 case NFT_MSG_DELSET:
11380 case NFT_MSG_DESTROYSET:
11381 nft_use_inc_restore(&table->use);
11382 nft_clear(trans->net, nft_trans_set(trans));
11383 if (nft_trans_set(trans)->flags & (NFT_SET_MAP | NFT_SET_OBJECT))
11384 nft_map_activate(&ctx, nft_trans_set(trans));
11385
11386 nft_trans_destroy(trans);
11387 break;
11388 case NFT_MSG_NEWSETELEM:
11389 if (nft_trans_elem_set_bound(trans)) {
11390 nft_trans_destroy(trans);
11391 break;
11392 }
11393 te = nft_trans_container_elem(trans);
11394 if (!nft_trans_elems_new_abort(&ctx, te)) {
11395 nft_trans_destroy(trans);
11396 break;
11397 }
11398
11399 if (te->set->ops->abort &&
11400 list_empty(&te->set->pending_update)) {
11401 list_add_tail(&te->set->pending_update,
11402 &set_update_list);
11403 }
11404 break;
11405 case NFT_MSG_DELSETELEM:
11406 case NFT_MSG_DESTROYSETELEM:
11407 te = nft_trans_container_elem(trans);
11408
11409 nft_trans_elems_destroy_abort(&ctx, te);
11410
11411 if (te->set->ops->abort &&
11412 list_empty(&te->set->pending_update)) {
11413 list_add_tail(&te->set->pending_update,
11414 &set_update_list);
11415 }
11416 nft_trans_destroy(trans);
11417 break;
11418 case NFT_MSG_NEWOBJ:
11419 if (nft_trans_obj_update(trans)) {
11420 nft_obj_destroy(&ctx, nft_trans_obj_newobj(trans));
11421 nft_trans_destroy(trans);
11422 } else {
11423 nft_use_dec_restore(&table->use);
11424 nft_obj_del(nft_trans_obj(trans));
11425 }
11426 break;
11427 case NFT_MSG_DELOBJ:
11428 case NFT_MSG_DESTROYOBJ:
11429 nft_use_inc_restore(&table->use);
11430 nft_clear(trans->net, nft_trans_obj(trans));
11431 nft_trans_destroy(trans);
11432 break;
11433 case NFT_MSG_NEWFLOWTABLE:
11434 if (nft_trans_flowtable_update(trans)) {
11435 nft_unregister_flowtable_net_hooks(net,
11436 nft_trans_flowtable(trans),
11437 &nft_trans_flowtable_hooks(trans));
11438 } else {
11439 nft_use_dec_restore(&table->use);
11440 list_del_rcu(&nft_trans_flowtable(trans)->list);
11441 nft_unregister_flowtable_net_hooks(net,
11442 nft_trans_flowtable(trans),
11443 &nft_trans_flowtable(trans)->hook_list);
11444 }
11445 break;
11446 case NFT_MSG_DELFLOWTABLE:
11447 case NFT_MSG_DESTROYFLOWTABLE:
11448 if (nft_trans_flowtable_update(trans)) {
11449 list_splice(&nft_trans_flowtable_hooks(trans),
11450 &nft_trans_flowtable(trans)->hook_list);
11451 } else {
11452 nft_use_inc_restore(&table->use);
11453 nft_clear(trans->net, nft_trans_flowtable(trans));
11454 }
11455 nft_trans_destroy(trans);
11456 break;
11457 }
11458 }
11459
11460 WARN_ON_ONCE(!list_empty(&nft_net->commit_set_list));
11461
11462 nft_set_abort_update(&set_update_list);
11463
11464 synchronize_rcu();
11465
11466 list_for_each_entry_safe_reverse(trans, next,
11467 &nft_net->commit_list, list) {
11468 nft_trans_list_del(trans);
11469 nf_tables_abort_release(trans);
11470 }
11471
11472 return err;
11473 }
11474
/*
 * Abort handler installed as the .abort callback of nf_tables_subsys.
 *
 * Runs __nf_tables_abort() between nft_gc_seq_begin() and nft_gc_seq_end(),
 * then calls nf_tables_module_autoload() when @action is NFNL_ABORT_AUTOLOAD
 * and nf_tables_module_autoload_cleanup() otherwise.  @skb is not used.
 *
 * The commit mutex is not taken in this function; it is only released here
 * (nf_tables_valid_genid() leaves it held when the generation id matches).
 *
 * Returns the result of __nf_tables_abort().
 */
static int nf_tables_abort(struct net *net, struct sk_buff *skb,
			   enum nfnl_abort_action action)
{
	struct nftables_pernet *nft_net = nft_pernet(net);
	unsigned int gc_seq;
	int ret;

	gc_seq = nft_gc_seq_begin(nft_net);
	ret = __nf_tables_abort(net, action);
	nft_gc_seq_end(nft_net, gc_seq);

	/* every transaction is expected to be gone after the abort */
	WARN_ON_ONCE(!list_empty(&nft_net->commit_list));

	/* module autoload needs to happen after GC sequence update because it
	 * temporarily releases and grabs mutex again.
	 */
	if (action == NFNL_ABORT_AUTOLOAD)
		nf_tables_module_autoload(net);
	else
		nf_tables_module_autoload_cleanup(net);

	mutex_unlock(&nft_net->commit_mutex);

	return ret;
}
11500
nf_tables_valid_genid(struct net * net,u32 genid)11501 static bool nf_tables_valid_genid(struct net *net, u32 genid)
11502 {
11503 struct nftables_pernet *nft_net = nft_pernet(net);
11504 bool genid_ok;
11505
11506 mutex_lock(&nft_net->commit_mutex);
11507 nft_net->tstamp = get_jiffies_64();
11508
11509 genid_ok = genid == 0 || nft_net->base_seq == genid;
11510 if (!genid_ok)
11511 mutex_unlock(&nft_net->commit_mutex);
11512
11513 /* else, commit mutex has to be released by commit or abort function */
11514 return genid_ok;
11515 }
11516
/*
 * nfnetlink subsystem descriptor for nf_tables.  It ties the message
 * callback table (nf_tables_cb, NFT_MSG_MAX entries) to the commit, abort
 * and generation-id validation handlers of this file.
 */
static const struct nfnetlink_subsystem nf_tables_subsys = {
	.name		= "nf_tables",
	.subsys_id	= NFNL_SUBSYS_NFTABLES,
	.cb_count	= NFT_MSG_MAX,
	.cb		= nf_tables_cb,
	.commit		= nf_tables_commit,
	.abort		= nf_tables_abort,
	.valid_genid	= nf_tables_valid_genid,
	.owner		= THIS_MODULE,
};
11527
nft_chain_validate_dependency(const struct nft_chain * chain,enum nft_chain_types type)11528 int nft_chain_validate_dependency(const struct nft_chain *chain,
11529 enum nft_chain_types type)
11530 {
11531 const struct nft_base_chain *basechain;
11532
11533 if (nft_is_base_chain(chain)) {
11534 basechain = nft_base_chain(chain);
11535 if (basechain->type->type != type)
11536 return -EOPNOTSUPP;
11537 }
11538 return 0;
11539 }
11540 EXPORT_SYMBOL_GPL(nft_chain_validate_dependency);
11541
nft_chain_validate_hooks(const struct nft_chain * chain,unsigned int hook_flags)11542 int nft_chain_validate_hooks(const struct nft_chain *chain,
11543 unsigned int hook_flags)
11544 {
11545 struct nft_base_chain *basechain;
11546
11547 if (nft_is_base_chain(chain)) {
11548 basechain = nft_base_chain(chain);
11549
11550 if ((1 << basechain->ops.hooknum) & hook_flags)
11551 return 0;
11552
11553 return -EOPNOTSUPP;
11554 }
11555
11556 return 0;
11557 }
11558 EXPORT_SYMBOL_GPL(nft_chain_validate_hooks);
11559
11560 /**
11561 * nft_parse_u32_check - fetch u32 attribute and check for maximum value
11562 *
11563 * @attr: netlink attribute to fetch value from
11564 * @max: maximum value to be stored in dest
11565 * @dest: pointer to the variable
11566 *
11567 * Parse, check and store a given u32 netlink attribute into variable.
11568 * This function returns -ERANGE if the value goes over maximum value.
11569 * Otherwise a 0 is returned and the attribute value is stored in the
11570 * destination variable.
11571 */
nft_parse_u32_check(const struct nlattr * attr,int max,u32 * dest)11572 int nft_parse_u32_check(const struct nlattr *attr, int max, u32 *dest)
11573 {
11574 u32 val;
11575
11576 val = ntohl(nla_get_be32(attr));
11577 if (val > max)
11578 return -ERANGE;
11579
11580 *dest = val;
11581 return 0;
11582 }
11583 EXPORT_SYMBOL_GPL(nft_parse_u32_check);
11584
/*
 * Translate the register number carried in @attr into an index expressed
 * in NFT_REG32_SIZE units and store it in @preg.
 *
 * Numbers in NFT_REG_VERDICT..NFT_REG_4 are scaled by
 * NFT_REG_SIZE / NFT_REG32_SIZE; numbers in NFT_REG32_00..NFT_REG32_15 are
 * rebased so that NFT_REG32_00 maps to NFT_REG_SIZE / NFT_REG32_SIZE.
 *
 * Returns 0 on success, -ERANGE for any other register number (in which
 * case @preg is not written).
 */
static int nft_parse_register(const struct nlattr *attr, u32 *preg)
{
	unsigned int nlreg = ntohl(nla_get_be32(attr));

	switch (nlreg) {
	case NFT_REG_VERDICT...NFT_REG_4:
		*preg = nlreg * NFT_REG_SIZE / NFT_REG32_SIZE;
		return 0;
	case NFT_REG32_00...NFT_REG32_15:
		*preg = nlreg + NFT_REG_SIZE / NFT_REG32_SIZE - NFT_REG32_00;
		return 0;
	default:
		return -ERANGE;
	}
}
11603
11604 /**
11605 * nft_dump_register - dump a register value to a netlink attribute
11606 *
11607 * @skb: socket buffer
11608 * @attr: attribute number
11609 * @reg: register number
11610 *
11611 * Construct a netlink attribute containing the register number. For
11612 * compatibility reasons, register numbers being a multiple of 4 are
11613 * translated to the corresponding 128 bit register numbers.
11614 */
nft_dump_register(struct sk_buff * skb,unsigned int attr,unsigned int reg)11615 int nft_dump_register(struct sk_buff *skb, unsigned int attr, unsigned int reg)
11616 {
11617 if (reg % (NFT_REG_SIZE / NFT_REG32_SIZE) == 0)
11618 reg = reg / (NFT_REG_SIZE / NFT_REG32_SIZE);
11619 else
11620 reg = reg - NFT_REG_SIZE / NFT_REG32_SIZE + NFT_REG32_00;
11621
11622 return nla_put_be32(skb, attr, htonl(reg));
11623 }
11624 EXPORT_SYMBOL_GPL(nft_dump_register);
11625
nft_validate_register_load(enum nft_registers reg,unsigned int len)11626 static int nft_validate_register_load(enum nft_registers reg, unsigned int len)
11627 {
11628 if (reg < NFT_REG_1 * NFT_REG_SIZE / NFT_REG32_SIZE)
11629 return -EINVAL;
11630 if (len == 0)
11631 return -EINVAL;
11632 if (reg * NFT_REG32_SIZE + len > sizeof_field(struct nft_regs, data))
11633 return -ERANGE;
11634
11635 return 0;
11636 }
11637
/**
 *	nft_parse_register_load - parse and validate a source register
 *
 *	@ctx: context; its reg_inited bitmap tracks registers that were stored to
 *	@attr: netlink attribute carrying the register number
 *	@sreg: receives the register index on success
 *	@len: number of bytes that will be loaded from the register
 *
 *	Returns 0 on success.  Errors from nft_parse_register() and
 *	nft_validate_register_load() are passed through, -EINVAL is returned
 *	if the end of the range exceeds NFT_REG32_NUM, and -ENODATA if any
 *	register in the range has not seen an earlier store.
 */
int nft_parse_register_load(const struct nft_ctx *ctx,
			    const struct nlattr *attr, u8 *sreg, u32 len)
{
	int err, invalid_reg;
	u32 reg, next_register;

	err = nft_parse_register(attr, &reg);
	if (err < 0)
		return err;

	err = nft_validate_register_load(reg, len);
	if (err < 0)
		return err;

	/* first register index past the range covered by this load */
	next_register = DIV_ROUND_UP(len, NFT_REG32_SIZE) + reg;

	/* Can't happen: nft_validate_register_load() should have failed */
	if (WARN_ON_ONCE(next_register > NFT_REG32_NUM))
		return -EINVAL;

	/* find first register that did not see an earlier store. */
	invalid_reg = find_next_zero_bit(ctx->reg_inited, NFT_REG32_NUM, reg);

	/* invalid register within the range that we're loading from? */
	if (invalid_reg < next_register)
		return -ENODATA;

	*sreg = reg;
	return 0;
}
EXPORT_SYMBOL_GPL(nft_parse_register_load);
11669
nft_saw_register_store(const struct nft_ctx * __ctx,int reg,unsigned int len)11670 static void nft_saw_register_store(const struct nft_ctx *__ctx,
11671 int reg, unsigned int len)
11672 {
11673 unsigned int registers = DIV_ROUND_UP(len, NFT_REG32_SIZE);
11674 struct nft_ctx *ctx = (struct nft_ctx *)__ctx;
11675
11676 if (WARN_ON_ONCE(len == 0 || reg < 0))
11677 return;
11678
11679 bitmap_set(ctx->reg_inited, reg, registers);
11680 }
11681
nft_validate_register_store(const struct nft_ctx * ctx,enum nft_registers reg,const struct nft_data * data,enum nft_data_types type,unsigned int len)11682 static int nft_validate_register_store(const struct nft_ctx *ctx,
11683 enum nft_registers reg,
11684 const struct nft_data *data,
11685 enum nft_data_types type,
11686 unsigned int len)
11687 {
11688 int err;
11689
11690 switch (reg) {
11691 case NFT_REG_VERDICT:
11692 if (type != NFT_DATA_VERDICT)
11693 return -EINVAL;
11694
11695 if (data != NULL &&
11696 (data->verdict.code == NFT_GOTO ||
11697 data->verdict.code == NFT_JUMP)) {
11698 err = nft_chain_validate(ctx, data->verdict.chain);
11699 if (err < 0)
11700 return err;
11701 }
11702
11703 break;
11704 default:
11705 if (type != NFT_DATA_VALUE)
11706 return -EINVAL;
11707
11708 if (reg < NFT_REG_1 * NFT_REG_SIZE / NFT_REG32_SIZE)
11709 return -EINVAL;
11710 if (len == 0)
11711 return -EINVAL;
11712 if (reg * NFT_REG32_SIZE + len >
11713 sizeof_field(struct nft_regs, data))
11714 return -ERANGE;
11715
11716 break;
11717 }
11718
11719 nft_saw_register_store(ctx, reg, len);
11720 return 0;
11721 }
11722
/**
 *	nft_parse_register_store - parse and validate a destination register
 *
 *	@ctx: context handed on to nft_validate_register_store()
 *	@attr: netlink attribute carrying the register number
 *	@dreg: receives the register index on success
 *	@data: data that will be stored, may be NULL
 *	@type: type of the data that will be stored
 *	@len: number of bytes that will be stored
 *
 *	Returns 0 on success; errors from nft_parse_register() and
 *	nft_validate_register_store() are passed through and @dreg is left
 *	untouched.
 */
int nft_parse_register_store(const struct nft_ctx *ctx,
			     const struct nlattr *attr, u8 *dreg,
			     const struct nft_data *data,
			     enum nft_data_types type, unsigned int len)
{
	int err;
	u32 reg;

	err = nft_parse_register(attr, &reg);
	if (err < 0)
		return err;

	err = nft_validate_register_store(ctx, reg, data, type, len);
	if (err < 0)
		return err;

	*dreg = reg;
	return 0;
}
EXPORT_SYMBOL_GPL(nft_parse_register_store);
11743
/*
 * Netlink policy for the attributes nested inside a verdict: a u32 verdict
 * code, a chain name limited to NFT_CHAIN_MAXNAMELEN - 1 bytes, and a u32
 * chain id.
 */
static const struct nla_policy nft_verdict_policy[NFTA_VERDICT_MAX + 1] = {
	[NFTA_VERDICT_CODE]	= { .type = NLA_U32 },
	[NFTA_VERDICT_CHAIN]	= { .type = NLA_STRING,
				    .len = NFT_CHAIN_MAXNAMELEN - 1 },
	[NFTA_VERDICT_CHAIN_ID]	= { .type = NLA_U32 },
};
11750
nft_verdict_init(const struct nft_ctx * ctx,struct nft_data * data,struct nft_data_desc * desc,const struct nlattr * nla)11751 static int nft_verdict_init(const struct nft_ctx *ctx, struct nft_data *data,
11752 struct nft_data_desc *desc, const struct nlattr *nla)
11753 {
11754 u8 genmask = nft_genmask_next(ctx->net);
11755 struct nlattr *tb[NFTA_VERDICT_MAX + 1];
11756 struct nft_chain *chain;
11757 int err;
11758
11759 err = nla_parse_nested_deprecated(tb, NFTA_VERDICT_MAX, nla,
11760 nft_verdict_policy, NULL);
11761 if (err < 0)
11762 return err;
11763
11764 if (!tb[NFTA_VERDICT_CODE])
11765 return -EINVAL;
11766
11767 /* zero padding hole for memcmp */
11768 memset(data, 0, sizeof(*data));
11769 data->verdict.code = ntohl(nla_get_be32(tb[NFTA_VERDICT_CODE]));
11770
11771 switch (data->verdict.code) {
11772 case NF_ACCEPT:
11773 case NF_DROP:
11774 case NF_QUEUE:
11775 break;
11776 case NFT_CONTINUE:
11777 case NFT_BREAK:
11778 case NFT_RETURN:
11779 break;
11780 case NFT_JUMP:
11781 case NFT_GOTO:
11782 if (tb[NFTA_VERDICT_CHAIN]) {
11783 chain = nft_chain_lookup(ctx->net, ctx->table,
11784 tb[NFTA_VERDICT_CHAIN],
11785 genmask);
11786 } else if (tb[NFTA_VERDICT_CHAIN_ID]) {
11787 chain = nft_chain_lookup_byid(ctx->net, ctx->table,
11788 tb[NFTA_VERDICT_CHAIN_ID],
11789 genmask);
11790 if (IS_ERR(chain))
11791 return PTR_ERR(chain);
11792 } else {
11793 return -EINVAL;
11794 }
11795
11796 if (IS_ERR(chain))
11797 return PTR_ERR(chain);
11798 if (nft_is_base_chain(chain))
11799 return -EOPNOTSUPP;
11800 if (nft_chain_is_bound(chain))
11801 return -EINVAL;
11802 if (desc->flags & NFT_DATA_DESC_SETELEM &&
11803 chain->flags & NFT_CHAIN_BINDING)
11804 return -EINVAL;
11805 if (!nft_use_inc(&chain->use))
11806 return -EMFILE;
11807
11808 data->verdict.chain = chain;
11809 break;
11810 default:
11811 return -EINVAL;
11812 }
11813
11814 desc->len = sizeof(data->verdict);
11815
11816 return 0;
11817 }
11818
nft_verdict_uninit(const struct nft_data * data)11819 static void nft_verdict_uninit(const struct nft_data *data)
11820 {
11821 struct nft_chain *chain;
11822
11823 switch (data->verdict.code) {
11824 case NFT_JUMP:
11825 case NFT_GOTO:
11826 chain = data->verdict.chain;
11827 nft_use_dec(&chain->use);
11828 break;
11829 }
11830 }
11831
nft_verdict_dump(struct sk_buff * skb,int type,const struct nft_verdict * v)11832 int nft_verdict_dump(struct sk_buff *skb, int type, const struct nft_verdict *v)
11833 {
11834 struct nlattr *nest;
11835
11836 nest = nla_nest_start_noflag(skb, type);
11837 if (!nest)
11838 goto nla_put_failure;
11839
11840 if (nla_put_be32(skb, NFTA_VERDICT_CODE, htonl(v->code)))
11841 goto nla_put_failure;
11842
11843 switch (v->code) {
11844 case NFT_JUMP:
11845 case NFT_GOTO:
11846 if (nla_put_string(skb, NFTA_VERDICT_CHAIN,
11847 v->chain->name))
11848 goto nla_put_failure;
11849 }
11850 nla_nest_end(skb, nest);
11851 return 0;
11852
11853 nla_put_failure:
11854 return -1;
11855 }
11856
nft_value_init(const struct nft_ctx * ctx,struct nft_data * data,struct nft_data_desc * desc,const struct nlattr * nla)11857 static int nft_value_init(const struct nft_ctx *ctx,
11858 struct nft_data *data, struct nft_data_desc *desc,
11859 const struct nlattr *nla)
11860 {
11861 unsigned int len;
11862
11863 len = nla_len(nla);
11864 if (len == 0)
11865 return -EINVAL;
11866 if (len > desc->size)
11867 return -EOVERFLOW;
11868 if (desc->len) {
11869 if (len != desc->len)
11870 return -EINVAL;
11871 } else {
11872 desc->len = len;
11873 }
11874
11875 nla_memcpy(data->data, nla, len);
11876
11877 return 0;
11878 }
11879
nft_value_dump(struct sk_buff * skb,const struct nft_data * data,unsigned int len)11880 static int nft_value_dump(struct sk_buff *skb, const struct nft_data *data,
11881 unsigned int len)
11882 {
11883 return nla_put(skb, NFTA_DATA_VALUE, len, data->data);
11884 }
11885
/*
 * Netlink policy for data attributes: a binary value or a nested verdict.
 */
static const struct nla_policy nft_data_policy[NFTA_DATA_MAX + 1] = {
	[NFTA_DATA_VALUE]	= { .type = NLA_BINARY },
	[NFTA_DATA_VERDICT]	= { .type = NLA_NESTED },
};
11890
11891 /**
11892 * nft_data_init - parse nf_tables data netlink attributes
11893 *
11894 * @ctx: context of the expression using the data
11895 * @data: destination struct nft_data
11896 * @desc: data description
11897 * @nla: netlink attribute containing data
11898 *
11899 * Parse the netlink data attributes and initialize a struct nft_data.
11900 * The type and length of data are returned in the data description.
11901 *
11902 * The caller can indicate that it only wants to accept data of type
11903 * NFT_DATA_VALUE by passing NULL for the ctx argument.
11904 */
nft_data_init(const struct nft_ctx * ctx,struct nft_data * data,struct nft_data_desc * desc,const struct nlattr * nla)11905 int nft_data_init(const struct nft_ctx *ctx, struct nft_data *data,
11906 struct nft_data_desc *desc, const struct nlattr *nla)
11907 {
11908 struct nlattr *tb[NFTA_DATA_MAX + 1];
11909 int err;
11910
11911 if (WARN_ON_ONCE(!desc->size))
11912 return -EINVAL;
11913
11914 err = nla_parse_nested_deprecated(tb, NFTA_DATA_MAX, nla,
11915 nft_data_policy, NULL);
11916 if (err < 0)
11917 return err;
11918
11919 if (tb[NFTA_DATA_VALUE]) {
11920 if (desc->type != NFT_DATA_VALUE)
11921 return -EINVAL;
11922
11923 err = nft_value_init(ctx, data, desc, tb[NFTA_DATA_VALUE]);
11924 } else if (tb[NFTA_DATA_VERDICT] && ctx != NULL) {
11925 if (desc->type != NFT_DATA_VERDICT)
11926 return -EINVAL;
11927
11928 err = nft_verdict_init(ctx, data, desc, tb[NFTA_DATA_VERDICT]);
11929 } else {
11930 err = -EINVAL;
11931 }
11932
11933 return err;
11934 }
11935 EXPORT_SYMBOL_GPL(nft_data_init);
11936
11937 /**
11938 * nft_data_release - release a nft_data item
11939 *
11940 * @data: struct nft_data to release
11941 * @type: type of data
11942 *
11943 * Release a nft_data item. NFT_DATA_VALUE types can be silently discarded,
11944 * all others need to be released by calling this function.
11945 */
nft_data_release(const struct nft_data * data,enum nft_data_types type)11946 void nft_data_release(const struct nft_data *data, enum nft_data_types type)
11947 {
11948 if (type < NFT_DATA_VERDICT)
11949 return;
11950 switch (type) {
11951 case NFT_DATA_VERDICT:
11952 return nft_verdict_uninit(data);
11953 default:
11954 WARN_ON(1);
11955 }
11956 }
11957 EXPORT_SYMBOL_GPL(nft_data_release);
11958
nft_data_dump(struct sk_buff * skb,int attr,const struct nft_data * data,enum nft_data_types type,unsigned int len)11959 int nft_data_dump(struct sk_buff *skb, int attr, const struct nft_data *data,
11960 enum nft_data_types type, unsigned int len)
11961 {
11962 struct nlattr *nest;
11963 int err;
11964
11965 nest = nla_nest_start_noflag(skb, attr);
11966 if (nest == NULL)
11967 return -1;
11968
11969 switch (type) {
11970 case NFT_DATA_VALUE:
11971 err = nft_value_dump(skb, data, len);
11972 break;
11973 case NFT_DATA_VERDICT:
11974 err = nft_verdict_dump(skb, NFTA_DATA_VERDICT, &data->verdict);
11975 break;
11976 default:
11977 err = -EINVAL;
11978 WARN_ON(1);
11979 }
11980
11981 nla_nest_end(skb, nest);
11982 return err;
11983 }
11984 EXPORT_SYMBOL_GPL(nft_data_dump);
11985
__nft_release_hook(struct net * net,struct nft_table * table)11986 static void __nft_release_hook(struct net *net, struct nft_table *table)
11987 {
11988 struct nft_flowtable *flowtable;
11989 struct nft_chain *chain;
11990
11991 list_for_each_entry(chain, &table->chains, list)
11992 __nf_tables_unregister_hook(net, table, chain, true);
11993 list_for_each_entry(flowtable, &table->flowtables, list)
11994 __nft_unregister_flowtable_net_hooks(net, flowtable,
11995 &flowtable->hook_list,
11996 true);
11997 }
11998
__nft_release_hooks(struct net * net)11999 static void __nft_release_hooks(struct net *net)
12000 {
12001 struct nftables_pernet *nft_net = nft_pernet(net);
12002 struct nft_table *table;
12003
12004 list_for_each_entry(table, &nft_net->tables, list) {
12005 if (nft_table_has_owner(table))
12006 continue;
12007
12008 __nft_release_hook(net, table);
12009 }
12010 }
12011
/*
 * Tear down @table and everything it contains.
 *
 * Order of teardown: rules of all non-binding chains, flowtables, sets,
 * objects, chains, and finally the table itself.  Each removed flowtable,
 * set, object and chain drops one use reference on the table; each removed
 * rule drops one on its chain.
 */
static void __nft_release_table(struct net *net, struct nft_table *table)
{
	struct nft_flowtable *flowtable, *nf;
	struct nft_chain *chain, *nc;
	struct nft_object *obj, *ne;
	struct nft_rule *rule, *nr;
	struct nft_set *set, *ns;
	struct nft_ctx ctx = {
		.net	= net,
		.family	= NFPROTO_NETDEV,
	};

	/* the family from the initializer above is replaced right away */
	ctx.family = table->family;
	ctx.table = table;
	list_for_each_entry(chain, &table->chains, list) {
		/* rules of binding chains are not released in this loop */
		if (nft_chain_binding(chain))
			continue;

		ctx.chain = chain;
		list_for_each_entry_safe(rule, nr, &chain->rules, list) {
			list_del(&rule->list);
			nft_use_dec(&chain->use);
			nf_tables_rule_release(&ctx, rule);
		}
	}
	list_for_each_entry_safe(flowtable, nf, &table->flowtables, list) {
		list_del(&flowtable->list);
		nft_use_dec(&table->use);
		nf_tables_flowtable_destroy(flowtable);
	}
	list_for_each_entry_safe(set, ns, &table->sets, list) {
		list_del(&set->list);
		nft_use_dec(&table->use);
		/* maps and object maps are deactivated before destruction */
		if (set->flags & (NFT_SET_MAP | NFT_SET_OBJECT))
			nft_map_deactivate(&ctx, set);

		nft_set_destroy(&ctx, set);
	}
	list_for_each_entry_safe(obj, ne, &table->objects, list) {
		nft_obj_del(obj);
		nft_use_dec(&table->use);
		nft_obj_destroy(&ctx, obj);
	}
	list_for_each_entry_safe(chain, nc, &table->chains, list) {
		nft_chain_del(chain);
		nft_use_dec(&table->use);
		nf_tables_chain_destroy(chain);
	}
	nf_tables_table_destroy(table);
}
12062
__nft_release_tables(struct net * net)12063 static void __nft_release_tables(struct net *net)
12064 {
12065 struct nftables_pernet *nft_net = nft_pernet(net);
12066 struct nft_table *table, *nt;
12067
12068 list_for_each_entry_safe(table, nt, &nft_net->tables, list) {
12069 if (nft_table_has_owner(table))
12070 continue;
12071
12072 list_del(&table->list);
12073
12074 __nft_release_table(net, table);
12075 }
12076 }
12077
/*
 * Netlink notifier callback.
 *
 * Only NETLINK_URELEASE events for NETLINK_NETFILTER are handled.  Under
 * the commit mutex, every table whose owner port id equals the released
 * port id is either kept with its owner flag cleared (NFT_TABLE_F_PERSIST)
 * or has its hooks unregistered and is unlinked and released.
 *
 * Tables to release are collected in batches of at most
 * ARRAY_SIZE(to_delete); after each batch synchronize_rcu() is called
 * before the tables are released, and the scan restarts if the batch was
 * full.
 *
 * Always returns NOTIFY_DONE.
 */
static int nft_rcv_nl_event(struct notifier_block *this, unsigned long event,
			    void *ptr)
{
	struct nft_table *table, *to_delete[8];
	struct nftables_pernet *nft_net;
	struct netlink_notify *n = ptr;
	struct net *net = n->net;
	unsigned int deleted;
	bool restart = false;
	unsigned int gc_seq;

	if (event != NETLINK_URELEASE || n->protocol != NETLINK_NETFILTER)
		return NOTIFY_DONE;

	nft_net = nft_pernet(net);
	deleted = 0;
	mutex_lock(&nft_net->commit_mutex);

	gc_seq = nft_gc_seq_begin(nft_net);

	nf_tables_trans_destroy_flush_work(net);
again:
	list_for_each_entry(table, &nft_net->tables, list) {
		if (nft_table_has_owner(table) &&
		    n->portid == table->nlpid) {
			/* persistent tables outlive their owner */
			if (table->flags & NFT_TABLE_F_PERSIST) {
				table->flags &= ~NFT_TABLE_F_OWNER;
				continue;
			}
			__nft_release_hook(net, table);
			list_del_rcu(&table->list);
			to_delete[deleted++] = table;
			/* batch is full: stop scanning and flush it first */
			if (deleted >= ARRAY_SIZE(to_delete))
				break;
		}
	}
	if (deleted) {
		/* a full batch means the list walk was cut short */
		restart = deleted >= ARRAY_SIZE(to_delete);
		synchronize_rcu();
		while (deleted)
			__nft_release_table(net, to_delete[--deleted]);

		if (restart)
			goto again;
	}
	nft_gc_seq_end(nft_net, gc_seq);

	mutex_unlock(&nft_net->commit_mutex);

	return NOTIFY_DONE;
}
12129
/* Notifier block that routes netlink events to nft_rcv_nl_event(). */
static struct notifier_block nft_nl_notifier = {
	.notifier_call	= nft_rcv_nl_event,
};
12133
/*
 * Per-netns init: set up the empty lists, the commit mutex, the sequence
 * counters, the validation state and the destroy work item of the
 * nftables_pernet area.  Always returns 0.
 */
static int __net_init nf_tables_init_net(struct net *net)
{
	struct nftables_pernet *nft_net = nft_pernet(net);

	INIT_LIST_HEAD(&nft_net->tables);
	INIT_LIST_HEAD(&nft_net->commit_list);
	INIT_LIST_HEAD(&nft_net->destroy_list);
	INIT_LIST_HEAD(&nft_net->commit_set_list);
	INIT_LIST_HEAD(&nft_net->binding_list);
	INIT_LIST_HEAD(&nft_net->module_list);
	INIT_LIST_HEAD(&nft_net->notify_list);
	mutex_init(&nft_net->commit_mutex);
	/* base_seq starts at 1; nf_tables_valid_genid() treats genid 0 as "any" */
	nft_net->base_seq = 1;
	nft_net->gc_seq = 0;
	nft_net->validate_state = NFT_VALIDATE_SKIP;
	INIT_WORK(&nft_net->destroy_work, nf_tables_trans_destroy_work);

	return 0;
}
12153
/*
 * Per-netns pre-exit: under the commit mutex, unregister the hooks of all
 * tables without an owner (see __nft_release_hooks()).
 */
static void __net_exit nf_tables_pre_exit_net(struct net *net)
{
	struct nftables_pernet *nft_net = nft_pernet(net);

	mutex_lock(&nft_net->commit_mutex);
	__nft_release_hooks(net);
	mutex_unlock(&nft_net->commit_mutex);
}
12162
/*
 * Per-netns exit: under the commit mutex and inside a GC sequence
 * begin/end pair, run the module autoload cleanup if the module list is
 * not empty, cancel the destroy work and release all tables without an
 * owner.  Warns once for each per-netns list that is unexpectedly
 * non-empty.
 */
static void __net_exit nf_tables_exit_net(struct net *net)
{
	struct nftables_pernet *nft_net = nft_pernet(net);
	unsigned int gc_seq;

	mutex_lock(&nft_net->commit_mutex);

	gc_seq = nft_gc_seq_begin(nft_net);

	/* no transaction is expected to be pending at this point */
	WARN_ON_ONCE(!list_empty(&nft_net->commit_list));
	WARN_ON_ONCE(!list_empty(&nft_net->commit_set_list));

	if (!list_empty(&nft_net->module_list))
		nf_tables_module_autoload_cleanup(net);

	cancel_work_sync(&nft_net->destroy_work);
	__nft_release_tables(net);

	nft_gc_seq_end(nft_net, gc_seq);

	mutex_unlock(&nft_net->commit_mutex);

	/* everything is expected to be gone after the release above */
	WARN_ON_ONCE(!list_empty(&nft_net->tables));
	WARN_ON_ONCE(!list_empty(&nft_net->module_list));
	WARN_ON_ONCE(!list_empty(&nft_net->notify_list));
	WARN_ON_ONCE(!list_empty(&nft_net->destroy_list));
}
12190
/*
 * Batched per-netns exit: flush trans_gc_work.  @net_exit_list is not used.
 */
static void nf_tables_exit_batch(struct list_head *net_exit_list)
{
	flush_work(&trans_gc_work);
}
12195
/*
 * Per-network-namespace operations for nf_tables.  The per-netns area has
 * the size of struct nftables_pernet and is identified by nf_tables_net_id.
 */
static struct pernet_operations nf_tables_net_ops = {
	.init		= nf_tables_init_net,
	.pre_exit	= nf_tables_pre_exit_net,
	.exit		= nf_tables_exit_net,
	.exit_batch	= nf_tables_exit_batch,
	.id		= &nf_tables_net_id,
	.size		= sizeof(struct nftables_pernet),
};
12204
/*
 * Module init.
 *
 * Checks at build time that the generic nft_trans is the first member of
 * every transaction type, then registers the components of the subsystem
 * one by one.  On failure, everything registered so far is undone in
 * reverse order through the error labels and the error is returned.
 */
static int __init nf_tables_module_init(void)
{
	int err;

	BUILD_BUG_ON(offsetof(struct nft_trans_table, nft_trans) != 0);
	BUILD_BUG_ON(offsetof(struct nft_trans_chain, nft_trans_binding.nft_trans) != 0);
	BUILD_BUG_ON(offsetof(struct nft_trans_rule, nft_trans) != 0);
	BUILD_BUG_ON(offsetof(struct nft_trans_set, nft_trans_binding.nft_trans) != 0);
	BUILD_BUG_ON(offsetof(struct nft_trans_elem, nft_trans) != 0);
	BUILD_BUG_ON(offsetof(struct nft_trans_obj, nft_trans) != 0);
	BUILD_BUG_ON(offsetof(struct nft_trans_flowtable, nft_trans) != 0);

	err = register_pernet_subsys(&nf_tables_net_ops);
	if (err < 0)
		return err;

	err = nft_chain_filter_init();
	if (err < 0)
		goto err_chain_filter;

	err = nf_tables_core_module_init();
	if (err < 0)
		goto err_core_module;

	err = register_netdevice_notifier(&nf_tables_flowtable_notifier);
	if (err < 0)
		goto err_netdev_notifier;

	err = rhltable_init(&nft_objname_ht, &nft_objname_ht_params);
	if (err < 0)
		goto err_rht_objname;

	err = nft_offload_init();
	if (err < 0)
		goto err_offload;

	err = netlink_register_notifier(&nft_nl_notifier);
	if (err < 0)
		goto err_netlink_notifier;

	/* must be last */
	err = nfnetlink_subsys_register(&nf_tables_subsys);
	if (err < 0)
		goto err_nfnl_subsys;

	nft_chain_route_init();

	return err;

	/* unwind: each label undoes the step before the one that failed */
err_nfnl_subsys:
	netlink_unregister_notifier(&nft_nl_notifier);
err_netlink_notifier:
	nft_offload_exit();
err_offload:
	rhltable_destroy(&nft_objname_ht);
err_rht_objname:
	unregister_netdevice_notifier(&nf_tables_flowtable_notifier);
err_netdev_notifier:
	nf_tables_core_module_exit();
err_core_module:
	nft_chain_filter_fini();
err_chain_filter:
	unregister_pernet_subsys(&nf_tables_net_ops);
	return err;
}
12270
/*
 * Module exit: unregister everything nf_tables_module_init() registered.
 * The nfnetlink subsystem is unregistered first.  The object name hash
 * table is destroyed only after the GC work has been cancelled and
 * rcu_barrier() has returned.
 */
static void __exit nf_tables_module_exit(void)
{
	nfnetlink_subsys_unregister(&nf_tables_subsys);
	netlink_unregister_notifier(&nft_nl_notifier);
	nft_offload_exit();
	unregister_netdevice_notifier(&nf_tables_flowtable_notifier);
	nft_chain_filter_fini();
	nft_chain_route_fini();
	unregister_pernet_subsys(&nf_tables_net_ops);
	cancel_work_sync(&trans_gc_work);
	rcu_barrier();
	rhltable_destroy(&nft_objname_ht);
	nf_tables_core_module_exit();
}
12285
/* Module entry and exit points. */
module_init(nf_tables_module_init);
module_exit(nf_tables_module_exit);

/* Module metadata and the alias for the nf_tables nfnetlink subsystem. */
MODULE_LICENSE("GPL");
MODULE_AUTHOR("Patrick McHardy <kaber@trash.net>");
MODULE_DESCRIPTION("Framework for packet filtering and classification");
MODULE_ALIAS_NFNL_SUBSYS(NFNL_SUBSYS_NFTABLES);
12293