1 // SPDX-License-Identifier: GPL-2.0-only
3 * Copyright (c) 2007-2009 Patrick McHardy <kaber@trash.net>
5 * Development of this code funded by Astaro AG (http://www.astaro.com/)
8 #include <linux/module.h>
9 #include <linux/init.h>
10 #include <linux/list.h>
11 #include <linux/skbuff.h>
12 #include <linux/netlink.h>
13 #include <linux/vmalloc.h>
14 #include <linux/rhashtable.h>
15 #include <linux/netfilter.h>
16 #include <linux/netfilter/nfnetlink.h>
17 #include <linux/netfilter/nf_tables.h>
18 #include <net/netfilter/nf_flow_table.h>
19 #include <net/netfilter/nf_tables_core.h>
20 #include <net/netfilter/nf_tables.h>
21 #include <net/netfilter/nf_tables_offload.h>
22 #include <net/net_namespace.h>
/* Longest type name accepted for module autoloading: what is left of
 * MODULE_NAME_LEN after the "nft-expr-255-" prefix (sizeof() also counts the
 * prefix's terminating NUL).
 */
25 #define NFT_MODULE_AUTOLOAD_LIMIT (MODULE_NAME_LEN - sizeof("nft-expr-255-"))
/* File-scope list heads. Judging by their names they hold registered
 * expression, object and flowtable types and a queue of items awaiting
 * destruction -- TODO confirm against their users.
 */
27 static LIST_HEAD(nf_tables_expressions);
28 static LIST_HEAD(nf_tables_objects);
29 static LIST_HEAD(nf_tables_flowtables);
30 static LIST_HEAD(nf_tables_destroy_list);
/* Presumably protects nf_tables_destroy_list -- verify at the lock sites. */
31 static DEFINE_SPINLOCK(nf_tables_destroy_list_lock);
/* Last table handle handed out; nf_tables_newtable() pre-increments it. */
32 static u64 table_handle;
/* Validation state with value 0, tested in nft_validate_state_update(). */
35 NFT_VALIDATE_SKIP = 0,
/* Object hash table; presumably initialised with nft_objname_ht_params. */
40 static struct rhltable nft_objname_ht;
/* Forward declarations of the hash/compare callbacks referenced by the
 * rhashtable parameter tables.
 */
42 static u32 nft_chain_hash(const void *data, u32 len, u32 seed);
43 static u32 nft_chain_hash_obj(const void *data, u32 len, u32 seed);
44 static int nft_chain_hash_cmp(struct rhashtable_compare_arg *, const void *);
46 static u32 nft_objname_hash(const void *data, u32 len, u32 seed);
47 static u32 nft_objname_hash_obj(const void *data, u32 len, u32 seed);
48 static int nft_objname_hash_cmp(struct rhashtable_compare_arg *, const void *);
/* rhashtable parameters for the per-table chain hash (table->chains_ht is
 * initialised with them in nf_tables_newtable()). Entries are struct
 * nft_chain linked through rhlhead; the key lives at the name member and is
 * hashed/compared by the nft_chain_hash*() callbacks. The table is allowed
 * to shrink automatically.
 */
50 static const struct rhashtable_params nft_chain_ht_params = {
51 .head_offset = offsetof(struct nft_chain, rhlhead),
52 .key_offset = offsetof(struct nft_chain, name),
53 .hashfn = nft_chain_hash,
54 .obj_hashfn = nft_chain_hash_obj,
55 .obj_cmpfn = nft_chain_hash_cmp,
56 .automatic_shrinking = true,
/* rhashtable parameters for hashing struct nft_object entries: linked
 * through rhlhead, keyed by the embedded key member, and hashed/compared by
 * the nft_objname_hash*() callbacks. Automatic shrinking is enabled.
 */
59 static const struct rhashtable_params nft_objname_ht_params = {
60 .head_offset = offsetof(struct nft_object, rhlhead),
61 .key_offset = offsetof(struct nft_object, key),
62 .hashfn = nft_objname_hash,
63 .obj_hashfn = nft_objname_hash_obj,
64 .obj_cmpfn = nft_objname_hash_cmp,
65 .automatic_shrinking = true,
/* Move the per-netns validation state to new_validate_state.
 *
 * The current state is inspected first: while in NFT_VALIDATE_SKIP a request
 * to jump straight to NFT_VALIDATE_DO triggers a one-time warning, and the
 * NFT_VALIDATE_NEED case treats a repeated NFT_VALIDATE_NEED request
 * specially before the new value is stored.
 */
68 static void nft_validate_state_update(struct net *net, u8 new_validate_state)
70 switch (net->nft.validate_state) {
71 case NFT_VALIDATE_SKIP:
72 WARN_ON_ONCE(new_validate_state == NFT_VALIDATE_DO);
74 case NFT_VALIDATE_NEED:
77 if (new_validate_state == NFT_VALIDATE_NEED)
81 net->nft.validate_state = new_validate_state;
/* Work item whose handler is nf_tables_trans_destroy_work(); the handler is
 * only declared at this point.
 */
83 static void nf_tables_trans_destroy_work(struct work_struct *w);
84 static DECLARE_WORK(trans_destroy_work, nf_tables_trans_destroy_work);
/* Initialise a transaction context from a netlink request.
 *
 * The sender's port id comes from the skb's netlink control block; the
 * report flag, message flags and sequence number come from the netlink
 * header. The table, chain and attribute array are supplied by the caller.
 */
86 static void nft_ctx_init(struct nft_ctx *ctx,
88 const struct sk_buff *skb,
89 const struct nlmsghdr *nlh,
91 struct nft_table *table,
92 struct nft_chain *chain,
93 const struct nlattr * const *nla)
101 ctx->portid = NETLINK_CB(skb).portid;
102 ctx->report = nlmsg_report(nlh);
103 ctx->flags = nlh->nlmsg_flags;
104 ctx->seq = nlh->nlmsg_seq;
/* Allocate a zeroed transaction record with the given allocation flags.
 *
 * @size is the number of extra bytes placed directly after struct nft_trans
 * for the message-type specific payload; @msg_type is stored in the record.
 */
107 static struct nft_trans *nft_trans_alloc_gfp(const struct nft_ctx *ctx,
108 int msg_type, u32 size, gfp_t gfp)
110 struct nft_trans *trans;
112 trans = kzalloc(sizeof(struct nft_trans) + size, gfp);
116 trans->msg_type = msg_type;
/* Shorthand for nft_trans_alloc_gfp() with GFP_KERNEL. */
122 static struct nft_trans *nft_trans_alloc(const struct nft_ctx *ctx,
123 int msg_type, u32 size)
125 return nft_trans_alloc_gfp(ctx, msg_type, size, GFP_KERNEL);
/* Take @trans off the list it is queued on (callers in this file use it to
 * back out a transaction that was already appended to the commit list).
 */
128 static void nft_trans_destroy(struct nft_trans *trans)
130 list_del(&trans->list);
/* Flag pending transactions that reference @set as bound.
 *
 * Anonymous-ness of the set is checked first. The commit list is then walked
 * from the newest entry backwards; a transaction whose set (or, for
 * NFT_MSG_NEWSETELEM, whose element set) is @set gets its "bound" marker set.
 */
134 static void nft_set_trans_bind(const struct nft_ctx *ctx, struct nft_set *set)
136 struct net *net = ctx->net;
137 struct nft_trans *trans;
139 if (!nft_set_is_anonymous(set))
142 list_for_each_entry_reverse(trans, &net->nft.commit_list, list) {
143 switch (trans->msg_type) {
145 if (nft_trans_set(trans) == set)
146 nft_trans_set_bound(trans) = true;
148 case NFT_MSG_NEWSETELEM:
149 if (nft_trans_elem_set(trans) == set)
150 nft_trans_elem_set_bound(trans) = true;
/* Register every hook on @hook_list with the netfilter core.
 *
 * The second walk over the list unregisters hooks again; presumably this is
 * the unwind path taken when one registration fails part-way through.
 */
156 static int nft_netdev_register_hooks(struct net *net,
157 struct list_head *hook_list)
159 struct nft_hook *hook;
163 list_for_each_entry(hook, hook_list, list) {
164 err = nf_register_net_hook(net, &hook->ops);
173 list_for_each_entry(hook, hook_list, list) {
177 nf_unregister_net_hook(net, &hook->ops);
/* Unregister every hook on @hook_list from the netfilter core. */
182 static void nft_netdev_unregister_hooks(struct net *net,
183 struct list_head *hook_list)
185 struct nft_hook *hook;
187 list_for_each_entry(hook, hook_list, list)
188 nf_unregister_net_hook(net, &hook->ops);
/* Register the hook(s) of a base chain.
 *
 * NFPROTO_NETDEV chains carry a list of hooks (basechain->hook_list) that
 * are all registered; any other family registers the single basechain->ops.
 * Returns the result of the underlying registration call.
 */
191 static int nft_register_basechain_hooks(struct net *net, int family,
192 struct nft_base_chain *basechain)
194 if (family == NFPROTO_NETDEV)
195 return nft_netdev_register_hooks(net, &basechain->hook_list);
197 return nf_register_net_hook(net, &basechain->ops);
/* Counterpart of nft_register_basechain_hooks(): NFPROTO_NETDEV chains drop
 * every hook on basechain->hook_list, other families drop basechain->ops.
 */
200 static void nft_unregister_basechain_hooks(struct net *net, int family,
201 struct nft_base_chain *basechain)
203 if (family == NFPROTO_NETDEV)
204 nft_netdev_unregister_hooks(net, &basechain->hook_list);
206 nf_unregister_net_hook(net, &basechain->ops);
/* Hook a chain into the packet path.
 *
 * Dormant tables and non-base chains are filtered out up front. A chain type
 * that supplies its own ops_register() callback handles registration itself;
 * otherwise the generic nft_register_basechain_hooks() path is used.
 */
209 static int nf_tables_register_hook(struct net *net,
210 const struct nft_table *table,
211 struct nft_chain *chain)
213 struct nft_base_chain *basechain;
214 const struct nf_hook_ops *ops;
216 if (table->flags & NFT_TABLE_F_DORMANT ||
217 !nft_is_base_chain(chain))
220 basechain = nft_base_chain(chain);
221 ops = &basechain->ops;
223 if (basechain->type->ops_register)
224 return basechain->type->ops_register(net, ops);
226 return nft_register_basechain_hooks(net, table->family, basechain);
/* Remove a chain's hook from the packet path.
 *
 * Mirrors nf_tables_register_hook(): dormant tables and non-base chains are
 * filtered out, a type-specific ops_unregister() callback takes precedence,
 * and nft_unregister_basechain_hooks() is the generic fallback.
 */
229 static void nf_tables_unregister_hook(struct net *net,
230 const struct nft_table *table,
231 struct nft_chain *chain)
233 struct nft_base_chain *basechain;
234 const struct nf_hook_ops *ops;
236 if (table->flags & NFT_TABLE_F_DORMANT ||
237 !nft_is_base_chain(chain))
239 basechain = nft_base_chain(chain);
240 ops = &basechain->ops;
242 if (basechain->type->ops_unregister)
243 return basechain->type->ops_unregister(net, ops);
245 nft_unregister_basechain_hooks(net, table->family, basechain);
/* Queue a table transaction of type @msg_type on the per-netns commit list.
 *
 * For NFT_MSG_NEWTABLE the table in @ctx is additionally passed to
 * nft_activate_next() before the transaction is appended.
 */
248 static int nft_trans_table_add(struct nft_ctx *ctx, int msg_type)
250 struct nft_trans *trans;
252 trans = nft_trans_alloc(ctx, msg_type, sizeof(struct nft_trans_table));
256 if (msg_type == NFT_MSG_NEWTABLE)
257 nft_activate_next(ctx->net, ctx->table);
259 list_add_tail(&trans->list, &ctx->net->nft.commit_list);
/* Schedule deletion of the table in @ctx: queue an NFT_MSG_DELTABLE
 * transaction, then call nft_deactivate_next() on the table.
 */
263 static int nft_deltable(struct nft_ctx *ctx)
267 err = nft_trans_table_add(ctx, NFT_MSG_DELTABLE);
271 nft_deactivate_next(ctx->net, ctx->table);
/* Queue a chain transaction of type @msg_type on the commit list.
 *
 * Failures are reported as ERR_PTR(-ENOMEM). For NFT_MSG_NEWCHAIN the chain
 * in @ctx is passed to nft_activate_next() before the transaction is queued.
 */
275 static struct nft_trans *nft_trans_chain_add(struct nft_ctx *ctx, int msg_type)
277 struct nft_trans *trans;
279 trans = nft_trans_alloc(ctx, msg_type, sizeof(struct nft_trans_chain));
281 return ERR_PTR(-ENOMEM);
283 if (msg_type == NFT_MSG_NEWCHAIN)
284 nft_activate_next(ctx->net, ctx->chain);
286 list_add_tail(&trans->list, &ctx->net->nft.commit_list);
/* Schedule deletion of the chain in @ctx: queue an NFT_MSG_DELCHAIN
 * transaction (propagating its error code on failure), then call
 * nft_deactivate_next() on the chain.
 */
290 static int nft_delchain(struct nft_ctx *ctx)
292 struct nft_trans *trans;
294 trans = nft_trans_chain_add(ctx, NFT_MSG_DELCHAIN);
296 return PTR_ERR(trans);
299 nft_deactivate_next(ctx->net, ctx->chain);
/* Invoke the optional ->activate() callback of each expression in @rule.
 *
 * The walk runs from the first expression up to (not including) the
 * end-of-rule marker and stops early at an expression without ops.
 */
304 static void nft_rule_expr_activate(const struct nft_ctx *ctx,
305 struct nft_rule *rule)
307 struct nft_expr *expr;
309 expr = nft_expr_first(rule);
310 while (expr != nft_expr_last(rule) && expr->ops) {
311 if (expr->ops->activate)
312 expr->ops->activate(ctx, expr);
314 expr = nft_expr_next(expr);
/* Invoke the optional ->deactivate() callback of each expression in @rule,
 * passing along the transaction @phase. Iteration follows the same rules as
 * nft_rule_expr_activate().
 */
318 static void nft_rule_expr_deactivate(const struct nft_ctx *ctx,
319 struct nft_rule *rule,
320 enum nft_trans_phase phase)
322 struct nft_expr *expr;
324 expr = nft_expr_first(rule);
325 while (expr != nft_expr_last(rule) && expr->ops) {
326 if (expr->ops->deactivate)
327 expr->ops->deactivate(ctx, expr, phase);
329 expr = nft_expr_next(expr);
334 nf_tables_delrule_deactivate(struct nft_ctx *ctx, struct nft_rule *rule)
/* Deactivate @rule for the next generation, but only while it is still
 * active there -- a rule already scheduled for removal is left untouched.
 */
336 /* You cannot delete the same rule twice */
337 if (nft_is_active_next(ctx->net, rule)) {
338 nft_deactivate_next(ctx->net, rule);
/* Queue a rule transaction of type @msg_type for @rule on the commit list.
 *
 * When a new rule carries an NFTA_RULE_ID attribute, the id (big endian on
 * the wire) is converted to host order and stored in the transaction.
 */
345 static struct nft_trans *nft_trans_rule_add(struct nft_ctx *ctx, int msg_type,
346 struct nft_rule *rule)
348 struct nft_trans *trans;
350 trans = nft_trans_alloc(ctx, msg_type, sizeof(struct nft_trans_rule));
354 if (msg_type == NFT_MSG_NEWRULE && ctx->nla[NFTA_RULE_ID] != NULL) {
355 nft_trans_rule_id(trans) =
356 ntohl(nla_get_be32(ctx->nla[NFTA_RULE_ID]));
358 nft_trans_rule(trans) = rule;
359 list_add_tail(&trans->list, &ctx->net->nft.commit_list);
/* Schedule deletion of @rule.
 *
 * Steps: queue an NFT_MSG_DELRULE transaction; for chains flagged
 * NFT_CHAIN_HW_OFFLOAD build a flow rule and attach it to the transaction;
 * deactivate the rule for the next generation; finally run the expressions'
 * deactivate callbacks in the NFT_TRANS_PREPARE phase. The queued
 * transaction is backed out with nft_trans_destroy() on the failure paths.
 */
364 static int nft_delrule(struct nft_ctx *ctx, struct nft_rule *rule)
366 struct nft_flow_rule *flow;
367 struct nft_trans *trans;
370 trans = nft_trans_rule_add(ctx, NFT_MSG_DELRULE, rule);
374 if (ctx->chain->flags & NFT_CHAIN_HW_OFFLOAD) {
375 flow = nft_flow_rule_create(ctx->net, rule);
377 nft_trans_destroy(trans);
378 return PTR_ERR(flow);
381 nft_trans_flow_rule(trans) = flow;
384 err = nf_tables_delrule_deactivate(ctx, rule);
386 nft_trans_destroy(trans);
389 nft_rule_expr_deactivate(ctx, rule, NFT_TRANS_PREPARE);
/* Schedule deletion of the rules in ctx->chain. Each rule's next-generation
 * activity is tested before nft_delrule() is applied to it.
 */
394 static int nft_delrule_by_chain(struct nft_ctx *ctx)
396 struct nft_rule *rule;
399 list_for_each_entry(rule, &ctx->chain->rules, list) {
400 if (!nft_is_active_next(ctx->net, rule))
403 err = nft_delrule(ctx, rule);
/* Queue a set transaction of type @msg_type on the commit list.
 *
 * For NFT_MSG_NEWSET with an NFTA_SET_ID attribute the id is stored in host
 * byte order and the set is passed to nft_activate_next().
 */
410 static int nft_trans_set_add(const struct nft_ctx *ctx, int msg_type,
413 struct nft_trans *trans;
415 trans = nft_trans_alloc(ctx, msg_type, sizeof(struct nft_trans_set));
419 if (msg_type == NFT_MSG_NEWSET && ctx->nla[NFTA_SET_ID] != NULL) {
420 nft_trans_set_id(trans) =
421 ntohl(nla_get_be32(ctx->nla[NFTA_SET_ID]));
422 nft_activate_next(ctx->net, set);
424 nft_trans_set(trans) = set;
425 list_add_tail(&trans->list, &ctx->net->nft.commit_list);
/* Schedule deletion of @set: queue an NFT_MSG_DELSET transaction, then call
 * nft_deactivate_next() on the set.
 */
430 static int nft_delset(const struct nft_ctx *ctx, struct nft_set *set)
434 err = nft_trans_set_add(ctx, NFT_MSG_DELSET, set);
438 nft_deactivate_next(ctx->net, set);
/* Queue an object transaction of type @msg_type for @obj on the commit
 * list; a new object (NFT_MSG_NEWOBJ) is passed to nft_activate_next() first.
 */
444 static int nft_trans_obj_add(struct nft_ctx *ctx, int msg_type,
445 struct nft_object *obj)
447 struct nft_trans *trans;
449 trans = nft_trans_alloc(ctx, msg_type, sizeof(struct nft_trans_obj));
453 if (msg_type == NFT_MSG_NEWOBJ)
454 nft_activate_next(ctx->net, obj);
456 nft_trans_obj(trans) = obj;
457 list_add_tail(&trans->list, &ctx->net->nft.commit_list);
/* Schedule deletion of @obj: queue an NFT_MSG_DELOBJ transaction, then call
 * nft_deactivate_next() on the object.
 */
462 static int nft_delobj(struct nft_ctx *ctx, struct nft_object *obj)
466 err = nft_trans_obj_add(ctx, NFT_MSG_DELOBJ, obj);
470 nft_deactivate_next(ctx->net, obj);
/* Queue a flowtable transaction of type @msg_type for @flowtable on the
 * commit list; a new flowtable (NFT_MSG_NEWFLOWTABLE) is passed to
 * nft_activate_next() first.
 */
476 static int nft_trans_flowtable_add(struct nft_ctx *ctx, int msg_type,
477 struct nft_flowtable *flowtable)
479 struct nft_trans *trans;
481 trans = nft_trans_alloc(ctx, msg_type,
482 sizeof(struct nft_trans_flowtable));
486 if (msg_type == NFT_MSG_NEWFLOWTABLE)
487 nft_activate_next(ctx->net, flowtable);
489 nft_trans_flowtable(trans) = flowtable;
490 list_add_tail(&trans->list, &ctx->net->nft.commit_list);
/* Schedule deletion of @flowtable: queue an NFT_MSG_DELFLOWTABLE
 * transaction, then call nft_deactivate_next() on the flowtable.
 */
495 static int nft_delflowtable(struct nft_ctx *ctx,
496 struct nft_flowtable *flowtable)
500 err = nft_trans_flowtable_add(ctx, NFT_MSG_DELFLOWTABLE, flowtable);
504 nft_deactivate_next(ctx->net, flowtable);
/* Look up a table by name.
 *
 * Walks the per-netns table list with the RCU iterator and matches on the
 * name attribute, the address family and activity in @genmask.
 *
 * Returns ERR_PTR(-ENOENT) when nothing matches; ERR_PTR(-EINVAL) is also a
 * possible result (presumably for a missing @nla -- TODO confirm).
 */
514 static struct nft_table *nft_table_lookup(const struct net *net,
515 const struct nlattr *nla,
516 u8 family, u8 genmask)
518 struct nft_table *table;
521 return ERR_PTR(-EINVAL);
523 list_for_each_entry_rcu(table, &net->nft.tables, list) {
524 if (!nla_strcmp(nla, table->name) &&
525 table->family == family &&
526 nft_active_genmask(table, genmask))
530 return ERR_PTR(-ENOENT);
/* Look up a table by its 64-bit handle (carried big endian in @nla) among
 * the tables active in @genmask. Returns ERR_PTR(-ENOENT) when no table
 * matches.
 *
 * NOTE(review): unlike nft_table_lookup() this uses the plain (non-RCU)
 * list iterator -- confirm every caller holds the commit mutex.
 */
533 static struct nft_table *nft_table_lookup_byhandle(const struct net *net,
534 const struct nlattr *nla,
537 struct nft_table *table;
539 list_for_each_entry(table, &net->nft.tables, list) {
540 if (be64_to_cpu(nla_get_be64(nla)) == table->handle &&
541 nft_active_genmask(table, genmask))
545 return ERR_PTR(-ENOENT);
/* Hand out the next handle within @table by pre-incrementing the table's
 * generator, so the first handle returned for a zeroed table is 1. The
 * helper itself takes no lock.
 */
548 static inline u64 nf_tables_alloc_handle(struct nft_table *table)
550 return ++table->hgenerator;
/* Registered chain types, indexed by [address family][chain type]; a NULL
 * slot means nothing is registered there.
 */
553 static const struct nft_chain_type *chain_type[NFPROTO_NUMPROTO][NFT_CHAIN_T_MAX];
/* Scan the registered chain types of @family and return the one whose name
 * equals the string in @nla.
 */
555 static const struct nft_chain_type *
556 __nf_tables_chain_type_lookup(const struct nlattr *nla, u8 family)
560 for (i = 0; i < NFT_CHAIN_T_MAX; i++) {
561 if (chain_type[family][i] != NULL &&
562 !nla_strcmp(nla, chain_type[family][i]->name))
563 return chain_type[family][i];
569 * Loading a module requires dropping mutex that guards the transaction.
570 * A different client might race to start a new transaction meanwhile. Zap the
571 * list of pending transactions and then restore it once the mutex is grabbed
572 * again. Users of this function return EAGAIN which implicitly triggers the
573 * transaction abort path to clean up the list of pending transactions.
575 #ifdef CONFIG_MODULES
/* Build a module name from @fmt and ask for it to be loaded.
 *
 * The pending transactions are parked on a local list, the commit mutex is
 * released around request_module(), and after re-locking the parked
 * transactions are spliced back. A warning fires if the commit list was
 * repopulated while the mutex was released. The formatted length is checked
 * against MODULE_NAME_LEN before the request is made.
 */
576 static void nft_request_module(struct net *net, const char *fmt, ...)
578 char module_name[MODULE_NAME_LEN];
579 LIST_HEAD(commit_list);
583 list_splice_init(&net->nft.commit_list, &commit_list);
586 ret = vsnprintf(module_name, MODULE_NAME_LEN, fmt, args);
588 if (ret >= MODULE_NAME_LEN)
591 mutex_unlock(&net->nft.commit_mutex);
592 request_module("%s", module_name);
593 mutex_lock(&net->nft.commit_mutex);
595 WARN_ON_ONCE(!list_empty(&net->nft.commit_list));
596 list_splice(&commit_list, &net->nft.commit_list);
/* Debug aid: with CONFIG_PROVE_LOCKING, warn once if the nfnetlink
 * nftables subsystem mutex is held by the caller.
 */
600 static void lockdep_nfnl_nft_mutex_not_held(void)
602 #ifdef CONFIG_PROVE_LOCKING
603 WARN_ON_ONCE(lockdep_nfnl_is_held(NFNL_SUBSYS_NFTABLES));
/* Resolve a chain type by name, optionally autoloading its module.
 *
 * A plain table lookup is tried first. With CONFIG_MODULES the
 * "nft-chain-<family>-<name>" module can be requested and the lookup is
 * repeated; -EAGAIN is among the results of that path so the caller can
 * restart the transaction. -ENOENT is returned when the type stays unknown.
 */
607 static const struct nft_chain_type *
608 nf_tables_chain_type_lookup(struct net *net, const struct nlattr *nla,
609 u8 family, bool autoload)
611 const struct nft_chain_type *type;
613 type = __nf_tables_chain_type_lookup(nla, family);
617 lockdep_nfnl_nft_mutex_not_held();
618 #ifdef CONFIG_MODULES
620 nft_request_module(net, "nft-chain-%u-%.*s", family,
621 nla_len(nla), (const char *)nla_data(nla));
622 type = __nf_tables_chain_type_lookup(nla, family);
624 return ERR_PTR(-EAGAIN);
627 return ERR_PTR(-ENOENT);
/* Netlink attribute policy for table messages: a bounded name string, a
 * 32-bit flags word and a 64-bit handle.
 */
630 static const struct nla_policy nft_table_policy[NFTA_TABLE_MAX + 1] = {
631 [NFTA_TABLE_NAME] = { .type = NLA_STRING,
632 .len = NFT_TABLE_MAXNAMELEN - 1 },
633 [NFTA_TABLE_FLAGS] = { .type = NLA_U32 },
634 [NFTA_TABLE_HANDLE] = { .type = NLA_U64 },
/* Serialise one table into @skb as an nfnetlink message.
 *
 * The message starts with an nfgenmsg header (family, NFNETLINK_V0, low 16
 * bits of the netns base sequence as res_id) followed by the table's name,
 * flags, use count and handle, all in network byte order. On an attribute
 * failure the partially built message is trimmed off again.
 */
637 static int nf_tables_fill_table_info(struct sk_buff *skb, struct net *net,
638 u32 portid, u32 seq, int event, u32 flags,
639 int family, const struct nft_table *table)
641 struct nlmsghdr *nlh;
642 struct nfgenmsg *nfmsg;
644 event = nfnl_msg_type(NFNL_SUBSYS_NFTABLES, event);
645 nlh = nlmsg_put(skb, portid, seq, event, sizeof(struct nfgenmsg), flags);
647 goto nla_put_failure;
649 nfmsg = nlmsg_data(nlh);
650 nfmsg->nfgen_family = family;
651 nfmsg->version = NFNETLINK_V0;
652 nfmsg->res_id = htons(net->nft.base_seq & 0xffff);
654 if (nla_put_string(skb, NFTA_TABLE_NAME, table->name) ||
655 nla_put_be32(skb, NFTA_TABLE_FLAGS, htonl(table->flags)) ||
656 nla_put_be32(skb, NFTA_TABLE_USE, htonl(table->use)) ||
657 nla_put_be64(skb, NFTA_TABLE_HANDLE, cpu_to_be64(table->handle),
659 goto nla_put_failure;
665 nlmsg_trim(skb, nlh);
/* Broadcast a table @event to NFNLGRP_NFTABLES listeners.
 *
 * A message is built with nf_tables_fill_table_info() and sent with
 * nfnetlink_send(); the listener check lets the function skip the work when
 * nobody is subscribed. On failure -ENOBUFS is flagged to the group via
 * nfnetlink_set_err().
 */
669 static void nf_tables_table_notify(const struct nft_ctx *ctx, int event)
675 !nfnetlink_has_listeners(ctx->net, NFNLGRP_NFTABLES))
678 skb = nlmsg_new(NLMSG_GOODSIZE, GFP_KERNEL);
682 err = nf_tables_fill_table_info(skb, ctx->net, ctx->portid, ctx->seq,
683 event, 0, ctx->family, ctx->table);
689 nfnetlink_send(skb, ctx->net, ctx->portid, NFNLGRP_NFTABLES,
690 ctx->report, GFP_KERNEL);
693 nfnetlink_set_err(ctx->net, ctx->portid, NFNLGRP_NFTABLES, -ENOBUFS);
/* Netlink dump callback that emits one NFT_MSG_NEWTABLE message per table.
 *
 * cb->args[0] holds the resume index from the previous invocation. Tables of
 * another family (unless NFPROTO_UNSPEC was requested) and tables that are
 * not currently active are filtered out. cb->seq is set to the netns base
 * sequence so nl_dump_check_consistent() can flag a dump that raced with a
 * ruleset change.
 */
696 static int nf_tables_dump_tables(struct sk_buff *skb,
697 struct netlink_callback *cb)
699 const struct nfgenmsg *nfmsg = nlmsg_data(cb->nlh);
700 const struct nft_table *table;
701 unsigned int idx = 0, s_idx = cb->args[0];
702 struct net *net = sock_net(skb->sk);
703 int family = nfmsg->nfgen_family;
706 cb->seq = net->nft.base_seq;
708 list_for_each_entry_rcu(table, &net->nft.tables, list) {
709 if (family != NFPROTO_UNSPEC && family != table->family)
/* Clear every callback argument after args[0]. */
715 memset(&cb->args[1], 0,
716 sizeof(cb->args) - sizeof(cb->args[0]));
717 if (!nft_is_active(net, table))
719 if (nf_tables_fill_table_info(skb, net,
720 NETLINK_CB(cb->skb).portid,
722 NFT_MSG_NEWTABLE, NLM_F_MULTI,
723 table->family, table) < 0)
726 nl_dump_check_consistent(cb, nlmsg_hdr(skb));
/* Start a netlink dump while pinning this module: a module reference is
 * taken before netlink_dump_start() and dropped again afterwards.
 */
736 static int nft_netlink_dump_start_rcu(struct sock *nlsk, struct sk_buff *skb,
737 const struct nlmsghdr *nlh,
738 struct netlink_dump_control *c)
742 if (!try_module_get(THIS_MODULE))
746 err = netlink_dump_start(nlsk, skb, nlh, c);
748 module_put(THIS_MODULE);
/* Handler for table "get" requests.
 *
 * With NLM_F_DUMP a dump using nf_tables_dump_tables() is started.
 * Otherwise the named table is looked up in the current generation; a lookup
 * error is returned with NFTA_TABLE_NAME reported as the offending
 * attribute. On success a reply is built in a freshly allocated skb (atomic
 * allocation) and unicast back to the requesting port.
 */
753 /* called with rcu_read_lock held */
754 static int nf_tables_gettable(struct net *net, struct sock *nlsk,
755 struct sk_buff *skb, const struct nlmsghdr *nlh,
756 const struct nlattr * const nla[],
757 struct netlink_ext_ack *extack)
759 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
760 u8 genmask = nft_genmask_cur(net);
761 const struct nft_table *table;
762 struct sk_buff *skb2;
763 int family = nfmsg->nfgen_family;
766 if (nlh->nlmsg_flags & NLM_F_DUMP) {
767 struct netlink_dump_control c = {
768 .dump = nf_tables_dump_tables,
769 .module = THIS_MODULE,
772 return nft_netlink_dump_start_rcu(nlsk, skb, nlh, &c);
775 table = nft_table_lookup(net, nla[NFTA_TABLE_NAME], family, genmask);
777 NL_SET_BAD_ATTR(extack, nla[NFTA_TABLE_NAME]);
778 return PTR_ERR(table);
781 skb2 = alloc_skb(NLMSG_GOODSIZE, GFP_ATOMIC);
785 err = nf_tables_fill_table_info(skb2, net, NETLINK_CB(skb).portid,
786 nlh->nlmsg_seq, NFT_MSG_NEWTABLE, 0,
791 return nlmsg_unicast(nlsk, skb2, NETLINK_CB(skb).portid);
/* Unregister the hooks of @table's base chains.
 *
 * Chains are tested for next-generation activity and for being base chains.
 * A non-zero @cnt limits how many base chains are processed, which
 * nf_tables_table_enable() uses to undo a partial enable; @cnt == 0 means
 * no limit.
 */
798 static void nft_table_disable(struct net *net, struct nft_table *table, u32 cnt)
800 struct nft_chain *chain;
803 list_for_each_entry(chain, &table->chains, list) {
804 if (!nft_is_active_next(net, chain))
806 if (!nft_is_base_chain(chain))
809 if (cnt && i++ == cnt)
812 nft_unregister_basechain_hooks(net, table->family,
813 nft_base_chain(chain));
/* Register the hooks of @table's base chains (chains are tested for
 * next-generation activity first). If a registration fails, the error path
 * calls nft_table_disable() with the count i to roll back the chains
 * handled so far.
 */
817 static int nf_tables_table_enable(struct net *net, struct nft_table *table)
819 struct nft_chain *chain;
822 list_for_each_entry(chain, &table->chains, list) {
823 if (!nft_is_active_next(net, chain))
825 if (!nft_is_base_chain(chain))
828 err = nft_register_basechain_hooks(net, table->family,
829 nft_base_chain(chain));
831 goto err_register_hooks;
839 nft_table_disable(net, table, i);
/* Unregister the hooks of all base chains of @table (no count limit). */
843 static void nf_tables_table_disable(struct net *net, struct nft_table *table)
845 nft_table_disable(net, table, 0);
/* Apply a flags update to an existing table.
 *
 * Only NFT_TABLE_F_DORMANT is an accepted flag; a request without
 * NFTA_TABLE_FLAGS or with unchanged flags is detected before any
 * transaction is allocated. Going dormant is merely recorded in the
 * transaction (enable = false). Waking up registers the hooks right away
 * via nf_tables_table_enable(), clears the dormant flag and records
 * enable = true. The transaction is marked as an update and queued;
 * nft_trans_destroy() backs it out on the failure path.
 */
848 static int nf_tables_updtable(struct nft_ctx *ctx)
850 struct nft_trans *trans;
854 if (!ctx->nla[NFTA_TABLE_FLAGS])
857 flags = ntohl(nla_get_be32(ctx->nla[NFTA_TABLE_FLAGS]));
858 if (flags & ~NFT_TABLE_F_DORMANT)
861 if (flags == ctx->table->flags)
864 trans = nft_trans_alloc(ctx, NFT_MSG_NEWTABLE,
865 sizeof(struct nft_trans_table));
869 if ((flags & NFT_TABLE_F_DORMANT) &&
870 !(ctx->table->flags & NFT_TABLE_F_DORMANT)) {
871 nft_trans_table_enable(trans) = false;
872 } else if (!(flags & NFT_TABLE_F_DORMANT) &&
873 ctx->table->flags & NFT_TABLE_F_DORMANT) {
874 ret = nf_tables_table_enable(ctx->net, ctx->table);
876 ctx->table->flags &= ~NFT_TABLE_F_DORMANT;
877 nft_trans_table_enable(trans) = true;
883 nft_trans_table_update(trans) = true;
884 list_add_tail(&trans->list, &ctx->net->nft.commit_list);
887 nft_trans_destroy(trans);
/* rhashtable key hash: jhash over a NUL-terminated chain name. The length
 * is taken from strlen(); @len is ignored.
 */
891 static u32 nft_chain_hash(const void *data, u32 len, u32 seed)
893 const char *name = data;
895 return jhash(name, strlen(name), seed);
/* rhashtable object hash: hash a chain by its name so that it lands in the
 * same bucket as a key lookup through nft_chain_hash().
 */
898 static u32 nft_chain_hash_obj(const void *data, u32 len, u32 seed)
900 const struct nft_chain *chain = data;
902 return nft_chain_hash(chain->name, 0, seed);
/* rhashtable compare callback: strcmp() of the chain's name against the
 * lookup key, so 0 means "match".
 */
905 static int nft_chain_hash_cmp(struct rhashtable_compare_arg *arg,
908 const struct nft_chain *chain = ptr;
909 const char *name = arg->key;
911 return strcmp(chain->name, name);
/* rhashtable key hash for objects: the owning table's pointer is mixed into
 * the seed, then the NUL-terminated object name is hashed with jhash.
 * @len is ignored.
 */
914 static u32 nft_objname_hash(const void *data, u32 len, u32 seed)
916 const struct nft_object_hash_key *k = data;
918 seed ^= hash_ptr(k->table, 32);
920 return jhash(k->name, strlen(k->name), seed);
/* rhashtable object hash: hash an object through its embedded key using
 * nft_objname_hash().
 */
923 static u32 nft_objname_hash_obj(const void *data, u32 len, u32 seed)
925 const struct nft_object *obj = data;
927 return nft_objname_hash(&obj->key, 0, seed);
/* rhashtable compare callback for objects: the owning table pointers are
 * compared first, then the names with strcmp() (0 means "match").
 */
930 static int nft_objname_hash_cmp(struct rhashtable_compare_arg *arg,
933 const struct nft_object_hash_key *k = arg->key;
934 const struct nft_object *obj = ptr;
936 if (obj->key.table != k->table)
939 return strcmp(obj->key.name, k->name);
/* Handler for table creation/update requests; runs under the commit mutex.
 *
 * The table is looked up by name in the next generation. Lookup errors other
 * than -ENOENT are returned as-is. For an existing table the NLM_F_EXCL and
 * NLM_F_REPLACE flags are examined, and the request can end up as a flags
 * update through nf_tables_updtable().
 *
 * Otherwise a new table is created: optional flags are validated (only
 * NFT_TABLE_F_DORMANT is accepted), the table and a copy of its name are
 * allocated, the chain hash table and the per-table lists are initialised,
 * a fresh global handle is assigned, an NFT_MSG_NEWTABLE transaction is
 * queued and the table is published on the netns table list.
 */
942 static int nf_tables_newtable(struct net *net, struct sock *nlsk,
943 struct sk_buff *skb, const struct nlmsghdr *nlh,
944 const struct nlattr * const nla[],
945 struct netlink_ext_ack *extack)
947 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
948 u8 genmask = nft_genmask_next(net);
949 int family = nfmsg->nfgen_family;
950 const struct nlattr *attr;
951 struct nft_table *table;
956 lockdep_assert_held(&net->nft.commit_mutex);
957 attr = nla[NFTA_TABLE_NAME];
958 table = nft_table_lookup(net, attr, family, genmask);
960 if (PTR_ERR(table) != -ENOENT)
961 return PTR_ERR(table);
963 if (nlh->nlmsg_flags & NLM_F_EXCL) {
964 NL_SET_BAD_ATTR(extack, attr);
967 if (nlh->nlmsg_flags & NLM_F_REPLACE)
970 nft_ctx_init(&ctx, net, skb, nlh, family, table, NULL, nla);
971 return nf_tables_updtable(&ctx);
974 if (nla[NFTA_TABLE_FLAGS]) {
975 flags = ntohl(nla_get_be32(nla[NFTA_TABLE_FLAGS]));
976 if (flags & ~NFT_TABLE_F_DORMANT)
981 table = kzalloc(sizeof(*table), GFP_KERNEL);
985 table->name = nla_strdup(attr, GFP_KERNEL);
986 if (table->name == NULL)
989 err = rhltable_init(&table->chains_ht, &nft_chain_ht_params);
993 INIT_LIST_HEAD(&table->chains);
994 INIT_LIST_HEAD(&table->sets);
995 INIT_LIST_HEAD(&table->objects);
996 INIT_LIST_HEAD(&table->flowtables);
997 table->family = family;
998 table->flags = flags;
999 table->handle = ++table_handle;
1001 nft_ctx_init(&ctx, net, skb, nlh, family, table, NULL, nla);
1002 err = nft_trans_table_add(&ctx, NFT_MSG_NEWTABLE);
/* Publish the table; the RCU list helper keeps concurrent readers safe. */
1006 list_add_tail_rcu(&table->list, &net->nft.tables);
/* Error unwinding: tear the chain hash table down again. */
1009 rhltable_destroy(&table->chains_ht);
/* Schedule removal of a table together with everything inside it.
 *
 * Order of operations: rules of every chain, then sets, flowtables, objects,
 * the chains themselves and finally the table. Each item is tested for
 * next-generation activity before it is handled. Anonymous sets that still
 * have bindings get special treatment in the set pass.
 */
1018 static int nft_flush_table(struct nft_ctx *ctx)
1020 struct nft_flowtable *flowtable, *nft;
1021 struct nft_chain *chain, *nc;
1022 struct nft_object *obj, *ne;
1023 struct nft_set *set, *ns;
1026 list_for_each_entry(chain, &ctx->table->chains, list) {
1027 if (!nft_is_active_next(ctx->net, chain))
1032 err = nft_delrule_by_chain(ctx);
1037 list_for_each_entry_safe(set, ns, &ctx->table->sets, list) {
1038 if (!nft_is_active_next(ctx->net, set))
1041 if (nft_set_is_anonymous(set) &&
1042 !list_empty(&set->bindings))
1045 err = nft_delset(ctx, set);
1050 list_for_each_entry_safe(flowtable, nft, &ctx->table->flowtables, list) {
1051 if (!nft_is_active_next(ctx->net, flowtable))
1054 err = nft_delflowtable(ctx, flowtable);
1059 list_for_each_entry_safe(obj, ne, &ctx->table->objects, list) {
1060 if (!nft_is_active_next(ctx->net, obj))
1063 err = nft_delobj(ctx, obj);
1068 list_for_each_entry_safe(chain, nc, &ctx->table->chains, list) {
1069 if (!nft_is_active_next(ctx->net, chain))
1074 err = nft_delchain(ctx);
1079 err = nft_deltable(ctx);
/* Flush every table that matches the request.
 *
 * @family narrows the walk to one address family unless it is AF_UNSPEC.
 * Tables are also tested for next-generation activity and, when the request
 * carries NFTA_TABLE_NAME, for a matching name. ctx->family is updated to
 * the family of the table being examined before nft_flush_table() runs.
 */
1084 static int nft_flush(struct nft_ctx *ctx, int family)
1086 struct nft_table *table, *nt;
1087 const struct nlattr * const *nla = ctx->nla;
1090 list_for_each_entry_safe(table, nt, &ctx->net->nft.tables, list) {
1091 if (family != AF_UNSPEC && table->family != family)
1094 ctx->family = table->family;
1096 if (!nft_is_active_next(ctx->net, table))
1099 if (nla[NFTA_TABLE_NAME] &&
1100 nla_strcmp(nla[NFTA_TABLE_NAME], table->name) != 0)
1105 err = nft_flush_table(ctx);
/* Handler for table deletion requests.
 *
 * Without a concrete target (family AF_UNSPEC, or neither a name nor a
 * handle attribute) the request is a bulk flush handled by nft_flush().
 * Otherwise the table is located by handle when NFTA_TABLE_HANDLE is
 * present, else by name; a failed lookup reports the attribute that was
 * used. NLM_F_NONREC is examined before the table is finally flushed and
 * scheduled for removal via nft_flush_table().
 */
1113 static int nf_tables_deltable(struct net *net, struct sock *nlsk,
1114 struct sk_buff *skb, const struct nlmsghdr *nlh,
1115 const struct nlattr * const nla[],
1116 struct netlink_ext_ack *extack)
1118 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
1119 u8 genmask = nft_genmask_next(net);
1120 int family = nfmsg->nfgen_family;
1121 const struct nlattr *attr;
1122 struct nft_table *table;
1125 nft_ctx_init(&ctx, net, skb, nlh, 0, NULL, NULL, nla);
1126 if (family == AF_UNSPEC ||
1127 (!nla[NFTA_TABLE_NAME] && !nla[NFTA_TABLE_HANDLE]))
1128 return nft_flush(&ctx, family);
1130 if (nla[NFTA_TABLE_HANDLE]) {
1131 attr = nla[NFTA_TABLE_HANDLE];
1132 table = nft_table_lookup_byhandle(net, attr, genmask);
1134 attr = nla[NFTA_TABLE_NAME];
1135 table = nft_table_lookup(net, attr, family, genmask);
1138 if (IS_ERR(table)) {
1139 NL_SET_BAD_ATTR(extack, attr);
1140 return PTR_ERR(table);
1143 if (nlh->nlmsg_flags & NLM_F_NONREC &&
1147 ctx.family = family;
1150 return nft_flush_table(&ctx);
/* Release the resources of the table in @ctx: its chain hash table and its
 * name string. A table that is still in use (use > 0) triggers a warning.
 */
1153 static void nf_tables_table_destroy(struct nft_ctx *ctx)
1155 if (WARN_ON(ctx->table->use > 0))
1158 rhltable_destroy(&ctx->table->chains_ht);
1159 kfree(ctx->table->name);
/* Register a chain type in the [family][type] table (exported, GPL only).
 *
 * An out-of-range family triggers a warning, as does a slot that is already
 * occupied; in the latter case the nfnetlink subsystem lock is released
 * again before bailing out. The table is updated under that lock.
 */
1163 void nft_register_chain_type(const struct nft_chain_type *ctype)
1165 if (WARN_ON(ctype->family >= NFPROTO_NUMPROTO))
1168 nfnl_lock(NFNL_SUBSYS_NFTABLES);
1169 if (WARN_ON(chain_type[ctype->family][ctype->type] != NULL)) {
1170 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
1173 chain_type[ctype->family][ctype->type] = ctype;
1174 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
1176 EXPORT_SYMBOL_GPL(nft_register_chain_type);
/* Clear the [family][type] slot of a chain type under the nfnetlink
 * subsystem lock (exported, GPL only).
 *
 * NOTE(review): unlike nft_register_chain_type() there is no bounds check
 * on ctype->family here.
 */
1178 void nft_unregister_chain_type(const struct nft_chain_type *ctype)
1180 nfnl_lock(NFNL_SUBSYS_NFTABLES);
1181 chain_type[ctype->family][ctype->type] = NULL;
1182 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
1184 EXPORT_SYMBOL_GPL(nft_unregister_chain_type);
/* Linear search of @table's chain list for a chain with the given @handle
 * that is active in @genmask. Returns ERR_PTR(-ENOENT) when none is found.
 */
1190 static struct nft_chain *
1191 nft_chain_lookup_byhandle(const struct nft_table *table, u64 handle, u8 genmask)
1193 struct nft_chain *chain;
1195 list_for_each_entry(chain, &table->chains, list) {
1196 if (chain->handle == handle &&
1197 nft_active_genmask(chain, genmask))
1201 return ERR_PTR(-ENOENT);
/* With CONFIG_PROVE_LOCKING, report whether lockdep sees the per-netns
 * commit mutex as held.
 */
1204 static bool lockdep_commit_lock_is_held(const struct net *net)
1206 #ifdef CONFIG_PROVE_LOCKING
1207 return lockdep_is_held(&net->nft.commit_mutex);
/* Look up a chain of @table by name through the table's chain hash.
 *
 * The name attribute is copied into a bounded local buffer that serves as
 * the hash key. A warning fires unless the caller is inside an RCU read
 * section or holds the commit mutex. Among the entries sharing the name,
 * activity in @genmask is what selects the result. ERR_PTR(-ENOENT) is the
 * "not found" result; ERR_PTR(-EINVAL) is also possible (presumably for a
 * missing @nla -- TODO confirm).
 */
1213 static struct nft_chain *nft_chain_lookup(struct net *net,
1214 struct nft_table *table,
1215 const struct nlattr *nla, u8 genmask)
1217 char search[NFT_CHAIN_MAXNAMELEN + 1];
1218 struct rhlist_head *tmp, *list;
1219 struct nft_chain *chain;
1222 return ERR_PTR(-EINVAL);
1224 nla_strlcpy(search, nla, sizeof(search));
1226 WARN_ON(!rcu_read_lock_held() &&
1227 !lockdep_commit_lock_is_held(net));
1229 chain = ERR_PTR(-ENOENT);
1231 list = rhltable_lookup(&table->chains_ht, search, nft_chain_ht_params);
1235 rhl_for_each_entry_rcu(chain, tmp, list, rhlhead) {
1236 if (nft_active_genmask(chain, genmask))
1239 chain = ERR_PTR(-ENOENT);
/* Netlink attribute policy for chain messages. String attributes are
 * length-bounded; the chain type name is limited to what can still be
 * turned into a module name (NFT_MODULE_AUTOLOAD_LIMIT).
 */
1245 static const struct nla_policy nft_chain_policy[NFTA_CHAIN_MAX + 1] = {
1246 [NFTA_CHAIN_TABLE] = { .type = NLA_STRING,
1247 .len = NFT_TABLE_MAXNAMELEN - 1 },
1248 [NFTA_CHAIN_HANDLE] = { .type = NLA_U64 },
1249 [NFTA_CHAIN_NAME] = { .type = NLA_STRING,
1250 .len = NFT_CHAIN_MAXNAMELEN - 1 },
1251 [NFTA_CHAIN_HOOK] = { .type = NLA_NESTED },
1252 [NFTA_CHAIN_POLICY] = { .type = NLA_U32 },
1253 [NFTA_CHAIN_TYPE] = { .type = NLA_STRING,
1254 .len = NFT_MODULE_AUTOLOAD_LIMIT },
1255 [NFTA_CHAIN_COUNTERS] = { .type = NLA_NESTED },
1256 [NFTA_CHAIN_FLAGS] = { .type = NLA_U32 },
/* Netlink attribute policy for the nested hook description: hook number,
 * priority and a device name of at most IFNAMSIZ - 1 characters.
 */
1259 static const struct nla_policy nft_hook_policy[NFTA_HOOK_MAX + 1] = {
1260 [NFTA_HOOK_HOOKNUM] = { .type = NLA_U32 },
1261 [NFTA_HOOK_PRIORITY] = { .type = NLA_U32 },
1262 [NFTA_HOOK_DEV] = { .type = NLA_STRING,
1263 .len = IFNAMSIZ - 1 },
/* Emit a chain's counters as a nested NFTA_CHAIN_COUNTERS attribute.
 *
 * The per-CPU counters are read for every possible CPU inside a u64_stats
 * fetch/retry loop, so a torn read is retried, and summed into a local
 * total. Packet and byte totals are written in big-endian form.
 */
1266 static int nft_dump_stats(struct sk_buff *skb, struct nft_stats __percpu *stats)
1268 struct nft_stats *cpu_stats, total;
1269 struct nlattr *nest;
1277 memset(&total, 0, sizeof(total));
1278 for_each_possible_cpu(cpu) {
1279 cpu_stats = per_cpu_ptr(stats, cpu);
1281 seq = u64_stats_fetch_begin_irq(&cpu_stats->syncp);
1282 pkts = cpu_stats->pkts;
1283 bytes = cpu_stats->bytes;
1284 } while (u64_stats_fetch_retry_irq(&cpu_stats->syncp, seq));
1286 total.bytes += bytes;
1288 nest = nla_nest_start_noflag(skb, NFTA_CHAIN_COUNTERS);
1290 goto nla_put_failure;
1292 if (nla_put_be64(skb, NFTA_COUNTER_PACKETS, cpu_to_be64(total.pkts),
1293 NFTA_COUNTER_PAD) ||
1294 nla_put_be64(skb, NFTA_COUNTER_BYTES, cpu_to_be64(total.bytes),
1296 goto nla_put_failure;
1298 nla_nest_end(skb, nest);
/* Emit a base chain's hook description as a nested NFTA_CHAIN_HOOK
 * attribute: hook number and priority for every family, plus -- for
 * NFPROTO_NETDEV -- a nested NFTA_HOOK_DEVS list naming the device of each
 * hook on the chain's hook list. A single NFTA_HOOK_DEV attribute carrying
 * the device name of the hook tracked in "first" can be emitted as well.
 */
1305 static int nft_dump_basechain_hook(struct sk_buff *skb, int family,
1306 const struct nft_base_chain *basechain)
1308 const struct nf_hook_ops *ops = &basechain->ops;
1309 struct nft_hook *hook, *first = NULL;
1310 struct nlattr *nest, *nest_devs;
1313 nest = nla_nest_start_noflag(skb, NFTA_CHAIN_HOOK);
1315 goto nla_put_failure;
1316 if (nla_put_be32(skb, NFTA_HOOK_HOOKNUM, htonl(ops->hooknum)))
1317 goto nla_put_failure;
1318 if (nla_put_be32(skb, NFTA_HOOK_PRIORITY, htonl(ops->priority)))
1319 goto nla_put_failure;
1321 if (family == NFPROTO_NETDEV) {
1322 nest_devs = nla_nest_start_noflag(skb, NFTA_HOOK_DEVS);
1323 list_for_each_entry(hook, &basechain->hook_list, list) {
1327 if (nla_put_string(skb, NFTA_DEVICE_NAME,
1328 hook->ops.dev->name))
1329 goto nla_put_failure;
1332 nla_nest_end(skb, nest_devs);
1335 nla_put_string(skb, NFTA_HOOK_DEV, first->ops.dev->name))
1336 goto nla_put_failure;
1338 nla_nest_end(skb, nest);
/* Serialise one chain into @skb as an nfnetlink message.
 *
 * After the nfgenmsg header come the owning table's name, the chain handle
 * and the chain name. Base chains additionally carry their hook
 * description, policy, type name and counters (the stats pointer is
 * dereferenced under RCU or the commit mutex). The use count is appended
 * and the message finalised; on an attribute failure the partial message
 * is trimmed off again.
 */
1345 static int nf_tables_fill_chain_info(struct sk_buff *skb, struct net *net,
1346 u32 portid, u32 seq, int event, u32 flags,
1347 int family, const struct nft_table *table,
1348 const struct nft_chain *chain)
1350 struct nlmsghdr *nlh;
1351 struct nfgenmsg *nfmsg;
1353 event = nfnl_msg_type(NFNL_SUBSYS_NFTABLES, event);
1354 nlh = nlmsg_put(skb, portid, seq, event, sizeof(struct nfgenmsg), flags);
1356 goto nla_put_failure;
1358 nfmsg = nlmsg_data(nlh);
1359 nfmsg->nfgen_family = family;
1360 nfmsg->version = NFNETLINK_V0;
1361 nfmsg->res_id = htons(net->nft.base_seq & 0xffff);
1363 if (nla_put_string(skb, NFTA_CHAIN_TABLE, table->name))
1364 goto nla_put_failure;
1365 if (nla_put_be64(skb, NFTA_CHAIN_HANDLE, cpu_to_be64(chain->handle),
1367 goto nla_put_failure;
1368 if (nla_put_string(skb, NFTA_CHAIN_NAME, chain->name))
1369 goto nla_put_failure;
1371 if (nft_is_base_chain(chain)) {
1372 const struct nft_base_chain *basechain = nft_base_chain(chain);
1373 struct nft_stats __percpu *stats;
1375 if (nft_dump_basechain_hook(skb, family, basechain))
1376 goto nla_put_failure;
1378 if (nla_put_be32(skb, NFTA_CHAIN_POLICY,
1379 htonl(basechain->policy)))
1380 goto nla_put_failure;
1382 if (nla_put_string(skb, NFTA_CHAIN_TYPE, basechain->type->name))
1383 goto nla_put_failure;
1385 stats = rcu_dereference_check(basechain->stats,
1386 lockdep_commit_lock_is_held(net));
1387 if (nft_dump_stats(skb, stats))
1388 goto nla_put_failure;
1391 if (nla_put_be32(skb, NFTA_CHAIN_USE, htonl(chain->use)))
1392 goto nla_put_failure;
1394 nlmsg_end(skb, nlh);
1398 nlmsg_trim(skb, nlh);
/* Broadcast a chain @event to NFNLGRP_NFTABLES listeners.
 *
 * A message is built with nf_tables_fill_chain_info() and sent with
 * nfnetlink_send(); the listener check lets the function skip the work when
 * nobody is subscribed. On failure -ENOBUFS is flagged to the group via
 * nfnetlink_set_err().
 */
1402 static void nf_tables_chain_notify(const struct nft_ctx *ctx, int event)
1404 struct sk_buff *skb;
1408 !nfnetlink_has_listeners(ctx->net, NFNLGRP_NFTABLES))
1411 skb = nlmsg_new(NLMSG_GOODSIZE, GFP_KERNEL);
1415 err = nf_tables_fill_chain_info(skb, ctx->net, ctx->portid, ctx->seq,
1416 event, 0, ctx->family, ctx->table,
1423 nfnetlink_send(skb, ctx->net, ctx->portid, NFNLGRP_NFTABLES,
1424 ctx->report, GFP_KERNEL);
1427 nfnetlink_set_err(ctx->net, ctx->portid, NFNLGRP_NFTABLES, -ENOBUFS);
/* Netlink dump callback that emits one message per chain, across all
 * tables of the requested family (or every family for NFPROTO_UNSPEC).
 *
 * cb->args[0] holds the resume index from the previous invocation. Chains
 * that are not currently active are filtered out. cb->seq is set to the
 * netns base sequence so nl_dump_check_consistent() can flag a dump that
 * raced with a ruleset change.
 */
1430 static int nf_tables_dump_chains(struct sk_buff *skb,
1431 struct netlink_callback *cb)
1433 const struct nfgenmsg *nfmsg = nlmsg_data(cb->nlh);
1434 const struct nft_table *table;
1435 const struct nft_chain *chain;
1436 unsigned int idx = 0, s_idx = cb->args[0];
1437 struct net *net = sock_net(skb->sk);
1438 int family = nfmsg->nfgen_family;
1441 cb->seq = net->nft.base_seq;
1443 list_for_each_entry_rcu(table, &net->nft.tables, list) {
1444 if (family != NFPROTO_UNSPEC && family != table->family)
1447 list_for_each_entry_rcu(chain, &table->chains, list) {
/* Clear every callback argument after args[0]. */
1451 memset(&cb->args[1], 0,
1452 sizeof(cb->args) - sizeof(cb->args[0]));
1453 if (!nft_is_active(net, chain))
1455 if (nf_tables_fill_chain_info(skb, net,
1456 NETLINK_CB(cb->skb).portid,
1460 table->family, table,
1464 nl_dump_check_consistent(cb, nlmsg_hdr(skb));
/* Handler for chain "get" requests.
 *
 * With NLM_F_DUMP a dump using nf_tables_dump_chains() is started.
 * Otherwise the table and then the chain are looked up in the current
 * generation; a failed lookup reports the corresponding attribute through
 * extack and returns the lookup's error. On success a reply is built in a
 * freshly allocated skb (atomic allocation) and unicast to the requester.
 */
1475 /* called with rcu_read_lock held */
1476 static int nf_tables_getchain(struct net *net, struct sock *nlsk,
1477 struct sk_buff *skb, const struct nlmsghdr *nlh,
1478 const struct nlattr * const nla[],
1479 struct netlink_ext_ack *extack)
1481 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
1482 u8 genmask = nft_genmask_cur(net);
1483 const struct nft_chain *chain;
1484 struct nft_table *table;
1485 struct sk_buff *skb2;
1486 int family = nfmsg->nfgen_family;
1489 if (nlh->nlmsg_flags & NLM_F_DUMP) {
1490 struct netlink_dump_control c = {
1491 .dump = nf_tables_dump_chains,
1492 .module = THIS_MODULE,
1495 return nft_netlink_dump_start_rcu(nlsk, skb, nlh, &c);
1498 table = nft_table_lookup(net, nla[NFTA_CHAIN_TABLE], family, genmask);
1499 if (IS_ERR(table)) {
1500 NL_SET_BAD_ATTR(extack, nla[NFTA_CHAIN_TABLE]);
1501 return PTR_ERR(table);
1504 chain = nft_chain_lookup(net, table, nla[NFTA_CHAIN_NAME], genmask);
1505 if (IS_ERR(chain)) {
1506 NL_SET_BAD_ATTR(extack, nla[NFTA_CHAIN_NAME]);
1507 return PTR_ERR(chain);
1510 skb2 = alloc_skb(NLMSG_GOODSIZE, GFP_ATOMIC);
1514 err = nf_tables_fill_chain_info(skb2, net, NETLINK_CB(skb).portid,
1515 nlh->nlmsg_seq, NFT_MSG_NEWCHAIN, 0,
1516 family, table, chain);
1520 return nlmsg_unicast(nlsk, skb2, NETLINK_CB(skb).portid);
/*
 * Netlink policy for the nested counter attributes: both the packet and the
 * byte counter are declared as NLA_U64. Used by nft_stats_alloc().
 */
1527 static const struct nla_policy nft_counter_policy[NFTA_COUNTER_MAX + 1] = {
1528 [NFTA_COUNTER_PACKETS] = { .type = NLA_U64 },
1529 [NFTA_COUNTER_BYTES] = { .type = NLA_U64 },
/*
 * nft_stats_alloc - allocate per-cpu chain counters from a netlink attribute.
 *
 * @attr is parsed as a nested attribute against nft_counter_policy; a parse
 * error is returned as ERR_PTR(err). Both NFTA_COUNTER_BYTES and
 * NFTA_COUNTER_PACKETS must be present, otherwise ERR_PTR(-EINVAL) is
 * returned, and a failed per-cpu allocation yields ERR_PTR(-ENOMEM).
 * The supplied byte and packet values are converted from big endian and
 * stored in the current CPU's slot of the new counters.
 */
1532 static struct nft_stats __percpu *nft_stats_alloc(const struct nlattr *attr)
1534 struct nlattr *tb[NFTA_COUNTER_MAX+1];
1535 struct nft_stats __percpu *newstats;
1536 struct nft_stats *stats;
1539 err = nla_parse_nested_deprecated(tb, NFTA_COUNTER_MAX, attr,
1540 nft_counter_policy, NULL);
1542 return ERR_PTR(err);
1544 if (!tb[NFTA_COUNTER_BYTES] || !tb[NFTA_COUNTER_PACKETS])
1545 return ERR_PTR(-EINVAL);
1547 newstats = netdev_alloc_pcpu_stats(struct nft_stats);
1548 if (newstats == NULL)
1549 return ERR_PTR(-ENOMEM);
1551 /* Restore old counters on this cpu, no problem. Per-cpu statistics
1552 * are not exposed to userspace.
1555 stats = this_cpu_ptr(newstats);
1556 stats->bytes = be64_to_cpu(nla_get_be64(tb[NFTA_COUNTER_BYTES]));
1557 stats->pkts = be64_to_cpu(nla_get_be64(tb[NFTA_COUNTER_PACKETS]));
/*
 * nft_chain_stats_replace - swap the counters carried by a chain transaction.
 *
 * Exchanges the base chain's stats pointer with the one stored in @trans
 * through rcu_replace_pointer(), so that afterwards the transaction holds the
 * chain's previous pointer. When that previous pointer is NULL the
 * nft_counters_enabled static branch is incremented.
 */
1563 static void nft_chain_stats_replace(struct nft_trans *trans)
1565 struct nft_base_chain *chain = nft_base_chain(trans->ctx.chain);
/* First check: does the transaction carry replacement stats at all? */
1567 if (!nft_trans_chain_stats(trans))
1570 nft_trans_chain_stats(trans) =
1571 rcu_replace_pointer(chain->stats, nft_trans_chain_stats(trans),
1572 lockdep_commit_lock_is_held(trans->ctx.net));
/* The transaction now holds the old pointer; NULL means the chain had no stats before. */
1574 if (!nft_trans_chain_stats(trans))
1575 static_branch_inc(&nft_counters_enabled);
/*
 * nf_tables_chain_free_chain_rules - release the rule arrays of a chain.
 *
 * Reads both rule generations (rules_gen_0 and rules_gen_1) with
 * rcu_dereference_raw(); how g0 and g1 are released is not visible in this
 * listing. chain->rules_next is expected to be NULL by now (a warning is
 * raised otherwise) and is passed to kvfree().
 */
1578 static void nf_tables_chain_free_chain_rules(struct nft_chain *chain)
1580 struct nft_rule **g0 = rcu_dereference_raw(chain->rules_gen_0);
1581 struct nft_rule **g1 = rcu_dereference_raw(chain->rules_gen_1);
1587 /* should be NULL either via abort or via successful commit */
1588 WARN_ON_ONCE(chain->rules_next);
1589 kvfree(chain->rules_next);
/*
 * nf_tables_chain_destroy - release ctx->chain and what is attached to it.
 *
 * Warns if the chain still has users (chain->use > 0), then releases the
 * rule arrays via nf_tables_chain_free_chain_rules(). For a base chain it
 * additionally releases the netdev hooks, the chain type module reference
 * and the per-cpu counters. The final release of the chain memory itself is
 * not visible in this listing.
 */
1592 static void nf_tables_chain_destroy(struct nft_ctx *ctx)
1594 struct nft_chain *chain = ctx->chain;
1595 struct nft_hook *hook, *next;
1597 if (WARN_ON(chain->use > 0))
1600 /* no concurrent access possible anymore */
1601 nf_tables_chain_free_chain_rules(chain);
1603 if (nft_is_base_chain(chain)) {
1604 struct nft_base_chain *basechain = nft_base_chain(chain);
/* NFPROTO_NETDEV only: unlink every hook and free it through kfree_rcu(). */
1606 if (ctx->family == NFPROTO_NETDEV) {
1607 list_for_each_entry_safe(hook, next,
1608 &basechain->hook_list, list) {
1609 list_del_rcu(&hook->list);
1610 kfree_rcu(hook, rcu);
/* Drop the module reference on the chain type's owner. */
1613 module_put(basechain->type->owner);
/* Counters attached: decrement the static branch and free the per-cpu stats. */
1614 if (rcu_access_pointer(basechain->stats)) {
1615 static_branch_dec(&nft_counters_enabled);
1616 free_percpu(rcu_dereference_raw(basechain->stats));
/*
 * nft_netdev_hook_alloc - allocate a hook for the device named in @attr.
 *
 * The interface name is copied out of @attr into a local IFNAMSIZ buffer and
 * resolved in @net with __dev_get_by_name(); the resulting device is stored
 * in hook->ops.dev. Failures are reported as ERR_PTR(err); the individual
 * error codes are not visible in this listing.
 */
1626 static struct nft_hook *nft_netdev_hook_alloc(struct net *net,
1627 const struct nlattr *attr)
1629 struct net_device *dev;
1630 char ifname[IFNAMSIZ];
1631 struct nft_hook *hook;
1634 hook = kmalloc(sizeof(struct nft_hook), GFP_KERNEL);
1637 goto err_hook_alloc;
1640 nla_strlcpy(ifname, attr, IFNAMSIZ);
1641 dev = __dev_get_by_name(net, ifname);
1646 hook->ops.dev = dev;
1653 return ERR_PTR(err);
/*
 * nft_hook_list_find - look for a hook bound to the same device as @this.
 *
 * Walks @hook_list and compares each entry's ops.dev with this->ops.dev.
 * The return statements are not visible in this listing.
 */
1656 static bool nft_hook_list_find(struct list_head *hook_list,
1657 const struct nft_hook *this)
1659 struct nft_hook *hook;
1661 list_for_each_entry(hook, hook_list, list) {
1662 if (this->ops.dev == hook->ops.dev)
/*
 * nf_tables_parse_netdev_hooks - build a hook list from nested device names.
 *
 * Iterates the attributes nested in @attr. Each one is type-checked against
 * NFTA_DEVICE_NAME, turned into a hook by nft_netdev_hook_alloc(), checked
 * against the hooks already on @hook_list with nft_hook_list_find() and
 * appended to the tail of @hook_list. The counter n is compared with
 * NFT_NETDEVICE_MAX.
 */
1669 static int nf_tables_parse_netdev_hooks(struct net *net,
1670 const struct nlattr *attr,
1671 struct list_head *hook_list)
1673 struct nft_hook *hook, *next;
1674 const struct nlattr *tmp;
1675 int rem, n = 0, err;
1677 nla_for_each_nested(tmp, attr, rem) {
1678 if (nla_type(tmp) != NFTA_DEVICE_NAME) {
1683 hook = nft_netdev_hook_alloc(net, tmp);
1685 err = PTR_ERR(hook);
/* Duplicate check: is the same device already on the list? */
1688 if (nft_hook_list_find(hook_list, hook)) {
1693 list_add_tail(&hook->list, hook_list);
1696 if (n == NFT_NETDEVICE_MAX) {
/* NOTE(review): presumably the error unwind - every hook is unlinked from the list again. */
1707 list_for_each_entry_safe(hook, next, hook_list, list) {
1708 list_del(&hook->list);
/*
 * Hook description filled in by nft_chain_parse_hook(). Only part of the
 * layout is visible in this listing: the chain type and the list head that
 * collects the struct nft_hook entries of a netdev chain.
 */
1714 struct nft_chain_hook {
1717 const struct nft_chain_type *type;
1718 struct list_head list;
/*
 * nft_chain_parse_netdev - collect the device hooks of a netdev chain.
 *
 * A single NFTA_HOOK_DEV attribute yields one hook, appended to @hook_list;
 * failure to allocate it is returned as PTR_ERR(hook). Otherwise, when
 * NFTA_HOOK_DEVS is present, it is handed to nf_tables_parse_netdev_hooks().
 */
1721 static int nft_chain_parse_netdev(struct net *net,
1722 struct nlattr *tb[],
1723 struct list_head *hook_list)
1725 struct nft_hook *hook;
1728 if (tb[NFTA_HOOK_DEV]) {
1729 hook = nft_netdev_hook_alloc(net, tb[NFTA_HOOK_DEV]);
1731 return PTR_ERR(hook);
1733 list_add_tail(&hook->list, hook_list);
1734 } else if (tb[NFTA_HOOK_DEVS]) {
1735 err = nf_tables_parse_netdev_hooks(net, tb[NFTA_HOOK_DEVS],
/*
 * nft_chain_parse_hook - parse NFTA_CHAIN_HOOK into a struct nft_chain_hook.
 *
 * Asserts that net->nft.commit_mutex is held. The nested hook attributes are
 * parsed against nft_hook_policy; NFTA_HOOK_HOOKNUM and NFTA_HOOK_PRIORITY
 * are both checked for presence and stored, converted from network byte
 * order, in hook->num and hook->priority. The chain type defaults to
 * chain_type[family][NFT_CHAIN_T_DEFAULT] and is replaced by a lookup when
 * NFTA_CHAIN_TYPE is supplied. A module reference on the type's owner is
 * taken with try_module_get() and dropped again on the failure branches
 * visible below.
 */
1746 static int nft_chain_parse_hook(struct net *net,
1747 const struct nlattr * const nla[],
1748 struct nft_chain_hook *hook, u8 family,
1751 struct nlattr *ha[NFTA_HOOK_MAX + 1];
1752 const struct nft_chain_type *type;
1755 lockdep_assert_held(&net->nft.commit_mutex);
1756 lockdep_nfnl_nft_mutex_not_held();
1758 err = nla_parse_nested_deprecated(ha, NFTA_HOOK_MAX,
1759 nla[NFTA_CHAIN_HOOK],
1760 nft_hook_policy, NULL);
1764 if (ha[NFTA_HOOK_HOOKNUM] == NULL ||
1765 ha[NFTA_HOOK_PRIORITY] == NULL)
1768 hook->num = ntohl(nla_get_be32(ha[NFTA_HOOK_HOOKNUM]));
1769 hook->priority = ntohl(nla_get_be32(ha[NFTA_HOOK_PRIORITY]));
1771 type = chain_type[family][NFT_CHAIN_T_DEFAULT];
1772 if (nla[NFTA_CHAIN_TYPE]) {
1773 type = nf_tables_chain_type_lookup(net, nla[NFTA_CHAIN_TYPE],
1776 return PTR_ERR(type);
/* The hook number is checked against NF_MAX_HOOKS and the type's hook_mask bit. */
1778 if (hook->num > NF_MAX_HOOKS || !(type->hook_mask & (1 << hook->num)))
/* NAT chain types are additionally tested for priority <= NF_IP_PRI_CONNTRACK. */
1781 if (type->type == NFT_CHAIN_T_NAT &&
1782 hook->priority <= NF_IP_PRI_CONNTRACK)
1785 if (!try_module_get(type->owner))
1790 INIT_LIST_HEAD(&hook->list);
/* Device attributes are parsed for NFPROTO_NETDEV only. */
1791 if (family == NFPROTO_NETDEV) {
1792 err = nft_chain_parse_netdev(net, ha, &hook->list);
1794 module_put(type->owner);
1797 } else if (ha[NFTA_HOOK_DEV] || ha[NFTA_HOOK_DEVS]) {
1798 module_put(type->owner);
/*
 * nft_chain_release_hook - release what a parsed chain hook holds.
 *
 * Iterates the hooks on hook->list (the loop body is not visible in this
 * listing) and drops the module reference on the chain type's owner.
 */
1805 static void nft_chain_release_hook(struct nft_chain_hook *hook)
1807 struct nft_hook *h, *next;
1809 list_for_each_entry_safe(h, next, &hook->list, list) {
1813 module_put(hook->type->owner);
/*
 * Bookkeeping structure whose size nf_tables_chain_alloc_rules() adds to
 * every rule array allocation. Only the start pointer is visible in this
 * listing.
 */
1816 struct nft_rules_old {
1818 struct nft_rule **start;
/*
 * nf_tables_chain_alloc_rules - allocate a rule pointer array for a chain.
 *
 * The allocation holds (alloc + 1) rule pointers, the extra slot being the
 * terminating NULL, plus sizeof(struct nft_rules_old). alloc is checked
 * against INT_MAX first and the multiplication is guarded against overflow.
 * Memory is obtained with kvmalloc(GFP_KERNEL).
 */
1821 static struct nft_rule **nf_tables_chain_alloc_rules(const struct nft_chain *chain,
1824 if (alloc > INT_MAX)
1827 alloc += 1; /* NULL, ends rules */
/* Overflow guard for the multiplication by the pointer size below. */
1828 if (sizeof(struct nft_rule *) > INT_MAX / alloc)
1831 alloc *= sizeof(struct nft_rule *);
1832 alloc += sizeof(struct nft_rules_old);
1834 return kvmalloc(alloc, GFP_KERNEL);
/*
 * nft_basechain_hook_init - fill in a netfilter hook ops entry.
 *
 * Copies the hook number and priority from @hook into @ops and selects the
 * hook function from hook->type->hooks[], indexed by that hook number.
 * Other assignments of the original function are not visible here.
 */
1837 static void nft_basechain_hook_init(struct nf_hook_ops *ops, u8 family,
1838 const struct nft_chain_hook *hook,
1839 struct nft_chain *chain)
1842 ops->hooknum = hook->num;
1843 ops->priority = hook->priority;
1845 ops->hook = hook->type->hooks[ops->hooknum];
/*
 * nft_basechain_init - initialise a base chain from a parsed hook.
 *
 * Records the chain type and, for NFPROTO_NETDEV, moves the parsed hooks
 * onto basechain->hook_list and initialises the ops of each one.
 * basechain->ops receives the hook number and priority and is set up via
 * nft_basechain_hook_init(). The chain is flagged NFT_BASE_CHAIN together
 * with @flags, the policy starts as NF_ACCEPT, and with NFT_CHAIN_HW_OFFLOAD
 * set a negative nft_chain_offload_priority() result is tested for.
 */
1848 static int nft_basechain_init(struct nft_base_chain *basechain, u8 family,
1849 struct nft_chain_hook *hook, u32 flags)
1851 struct nft_chain *chain;
1854 basechain->type = hook->type;
1855 INIT_LIST_HEAD(&basechain->hook_list);
1856 chain = &basechain->chain;
1858 if (family == NFPROTO_NETDEV) {
/* list_splice_init() leaves hook->list empty after the move. */
1859 list_splice_init(&hook->list, &basechain->hook_list);
1860 list_for_each_entry(h, &basechain->hook_list, list)
1861 nft_basechain_hook_init(&h->ops, family, hook, chain);
1863 basechain->ops.hooknum = hook->num;
1864 basechain->ops.priority = hook->priority;
1866 nft_basechain_hook_init(&basechain->ops, family, hook, chain);
1869 chain->flags |= NFT_BASE_CHAIN | flags;
1870 basechain->policy = NF_ACCEPT;
1871 if (chain->flags & NFT_CHAIN_HW_OFFLOAD &&
1872 nft_chain_offload_priority(basechain) < 0)
1875 flow_block_init(&basechain->flow_block);
/*
 * nf_tables_addchain - create a new chain in ctx->table.
 *
 * With NFTA_CHAIN_HOOK present a base chain is built: the hook is parsed,
 * a struct nft_base_chain is allocated, optional NFTA_CHAIN_COUNTERS are
 * turned into per-cpu stats and the base chain is initialised with
 * nft_basechain_init(). Otherwise a plain struct nft_chain is allocated.
 * The chain then gets its rule list, handle, table, name and an initial
 * rule array shared by both generations, has its hook registered, is
 * inserted into table->chains_ht, is recorded in an NFT_MSG_NEWCHAIN
 * transaction and is finally appended to table->chains.
 * The visible cleanup calls are nf_tables_unregister_hook() and
 * nf_tables_chain_destroy().
 */
1880 static int nf_tables_addchain(struct nft_ctx *ctx, u8 family, u8 genmask,
1881 u8 policy, u32 flags)
1883 const struct nlattr * const *nla = ctx->nla;
1884 struct nft_table *table = ctx->table;
1885 struct nft_base_chain *basechain;
1886 struct nft_stats __percpu *stats;
1887 struct net *net = ctx->net;
1888 struct nft_trans *trans;
1889 struct nft_chain *chain;
1890 struct nft_rule **rules;
/* Tests whether the table's use counter is already at UINT_MAX. */
1893 if (table->use == UINT_MAX)
1896 if (nla[NFTA_CHAIN_HOOK]) {
1897 struct nft_chain_hook hook;
1899 err = nft_chain_parse_hook(net, nla, &hook, family, true);
1903 basechain = kzalloc(sizeof(*basechain), GFP_KERNEL);
1904 if (basechain == NULL) {
1905 nft_chain_release_hook(&hook);
1908 chain = &basechain->chain;
1910 if (nla[NFTA_CHAIN_COUNTERS]) {
1911 stats = nft_stats_alloc(nla[NFTA_CHAIN_COUNTERS]);
1912 if (IS_ERR(stats)) {
1913 nft_chain_release_hook(&hook);
1915 return PTR_ERR(stats);
/* Publish the counters and account for them in the static branch. */
1917 rcu_assign_pointer(basechain->stats, stats);
1918 static_branch_inc(&nft_counters_enabled);
1921 err = nft_basechain_init(basechain, family, &hook, flags);
1923 nft_chain_release_hook(&hook);
1928 chain = kzalloc(sizeof(*chain), GFP_KERNEL);
1934 INIT_LIST_HEAD(&chain->rules);
1935 chain->handle = nf_tables_alloc_handle(table);
1936 chain->table = table;
1937 chain->name = nla_strdup(nla[NFTA_CHAIN_NAME], GFP_KERNEL);
/* Initial rule array, requested with a rule count of 0. */
1943 rules = nf_tables_chain_alloc_rules(chain, 0);
/* Both generations start out pointing at the same array. */
1950 rcu_assign_pointer(chain->rules_gen_0, rules);
1951 rcu_assign_pointer(chain->rules_gen_1, rules);
1953 err = nf_tables_register_hook(net, table, chain);
1957 err = rhltable_insert_key(&table->chains_ht, chain->name,
1958 &chain->rhlhead, nft_chain_ht_params);
1962 trans = nft_trans_chain_add(ctx, NFT_MSG_NEWCHAIN);
1963 if (IS_ERR(trans)) {
1964 err = PTR_ERR(trans);
/* Undo the hash table insertion when no transaction could be added. */
1965 rhltable_remove(&table->chains_ht, &chain->rhlhead,
1966 nft_chain_ht_params);
/* Only base chains record the requested policy in the transaction. */
1970 nft_trans_chain_policy(trans) = NFT_CHAIN_POLICY_UNSET;
1971 if (nft_is_base_chain(chain))
1972 nft_trans_chain_policy(trans) = policy;
1975 list_add_tail_rcu(&chain->list, &table->chains);
1979 nf_tables_unregister_hook(net, table, chain);
1981 nf_tables_chain_destroy(ctx);
/*
 * nft_hook_list_equal - compare two hook lists.
 *
 * Every hook of @hook_list2 is looked up in @hook_list1 with
 * nft_hook_list_find(), and @hook_list1 is walked as well; the bodies and
 * return statements are not visible in this listing.
 * NOTE(review): presumably the second walk counts entries so that the two
 * lists must also have the same length - confirm against the full source.
 */
1986 static bool nft_hook_list_equal(struct list_head *hook_list1,
1987 struct list_head *hook_list2)
1989 struct nft_hook *hook;
1993 list_for_each_entry(hook, hook_list2, list) {
1994 if (!nft_hook_list_find(hook_list1, hook))
1999 list_for_each_entry(hook, hook_list1, list)
/*
 * nf_tables_updchain - queue an update of the existing chain ctx->chain.
 *
 * A hook given with the request is only used for comparison: it must belong
 * to a base chain and is parsed, compared with the chain's type, hook list
 * (NFPROTO_NETDEV) or hooknum/priority, and then released again. When both
 * NFTA_CHAIN_HANDLE and NFTA_CHAIN_NAME are present the new name is looked
 * up in the table first and later compared with the names carried by
 * pending NFT_MSG_NEWCHAIN update transactions on the commit list.
 * NFTA_CHAIN_COUNTERS is tested against non-base chains. The update itself
 * is an NFT_MSG_NEWCHAIN transaction carrying the new stats, policy and
 * name, appended to net->nft.commit_list.
 */
2005 static int nf_tables_updchain(struct nft_ctx *ctx, u8 genmask, u8 policy,
2008 const struct nlattr * const *nla = ctx->nla;
2009 struct nft_table *table = ctx->table;
2010 struct nft_chain *chain = ctx->chain;
2011 struct nft_base_chain *basechain;
2012 struct nft_stats *stats = NULL;
2013 struct nft_chain_hook hook;
2014 struct nf_hook_ops *ops;
2015 struct nft_trans *trans;
/* Tests whether the requested flags differ from the chain's current flags. */
2018 if (chain->flags ^ flags)
2021 if (nla[NFTA_CHAIN_HOOK]) {
2022 if (!nft_is_base_chain(chain))
2025 err = nft_chain_parse_hook(ctx->net, nla, &hook, ctx->family,
2030 basechain = nft_base_chain(chain);
2031 if (basechain->type != hook.type) {
2032 nft_chain_release_hook(&hook);
2036 if (ctx->family == NFPROTO_NETDEV) {
2037 if (!nft_hook_list_equal(&basechain->hook_list,
2039 nft_chain_release_hook(&hook);
2043 ops = &basechain->ops;
2044 if (ops->hooknum != hook.num ||
2045 ops->priority != hook.priority) {
2046 nft_chain_release_hook(&hook);
/* The parsed hook was only needed for the comparisons above. */
2050 nft_chain_release_hook(&hook);
/* Handle plus name: look the new name up in the table first. */
2053 if (nla[NFTA_CHAIN_HANDLE] &&
2054 nla[NFTA_CHAIN_NAME]) {
2055 struct nft_chain *chain2;
2057 chain2 = nft_chain_lookup(ctx->net, table,
2058 nla[NFTA_CHAIN_NAME], genmask);
2059 if (!IS_ERR(chain2))
2063 if (nla[NFTA_CHAIN_COUNTERS]) {
2064 if (!nft_is_base_chain(chain))
2067 stats = nft_stats_alloc(nla[NFTA_CHAIN_COUNTERS]);
2069 return PTR_ERR(stats);
2073 trans = nft_trans_alloc(ctx, NFT_MSG_NEWCHAIN,
2074 sizeof(struct nft_trans_chain));
2078 nft_trans_chain_stats(trans) = stats;
2079 nft_trans_chain_update(trans) = true;
/* The policy is set to -1 on the branch without NFTA_CHAIN_POLICY. */
2081 if (nla[NFTA_CHAIN_POLICY])
2082 nft_trans_chain_policy(trans) = policy;
2084 nft_trans_chain_policy(trans) = -1;
2086 if (nla[NFTA_CHAIN_HANDLE] &&
2087 nla[NFTA_CHAIN_NAME]) {
2088 struct nft_trans *tmp;
2092 name = nla_strdup(nla[NFTA_CHAIN_NAME], GFP_KERNEL);
/* Compare the new name with names in pending chain updates for this table. */
2097 list_for_each_entry(tmp, &ctx->net->nft.commit_list, list) {
2098 if (tmp->msg_type == NFT_MSG_NEWCHAIN &&
2099 tmp->ctx.table == table &&
2100 nft_trans_chain_update(tmp) &&
2101 nft_trans_chain_name(tmp) &&
2102 strcmp(name, nft_trans_chain_name(tmp)) == 0) {
2108 nft_trans_chain_name(trans) = name;
2110 list_add_tail(&trans->list, &ctx->net->nft.commit_list);
/*
 * nf_tables_newchain - handle a NEWCHAIN request (create or update).
 *
 * Asserts that net->nft.commit_mutex is held and works on the next
 * generation (nft_genmask_next()). The table is looked up first. The chain
 * is located by NFTA_CHAIN_HANDLE when given, otherwise by name; a name
 * lookup error other than -ENOENT is returned to the caller.
 * NFTA_CHAIN_POLICY is tested against an existing non-base chain and
 * against a new chain without NFTA_CHAIN_HOOK. An existing chain is handed
 * to nf_tables_updchain(), otherwise nf_tables_addchain() creates one.
 */
2119 static int nf_tables_newchain(struct net *net, struct sock *nlsk,
2120 struct sk_buff *skb, const struct nlmsghdr *nlh,
2121 const struct nlattr * const nla[],
2122 struct netlink_ext_ack *extack)
2124 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
2125 u8 genmask = nft_genmask_next(net);
2126 int family = nfmsg->nfgen_family;
2127 const struct nlattr *attr;
2128 struct nft_table *table;
2129 struct nft_chain *chain;
2130 u8 policy = NF_ACCEPT;
2135 lockdep_assert_held(&net->nft.commit_mutex);
2137 table = nft_table_lookup(net, nla[NFTA_CHAIN_TABLE], family, genmask);
2138 if (IS_ERR(table)) {
2139 NL_SET_BAD_ATTR(extack, nla[NFTA_CHAIN_TABLE]);
2140 return PTR_ERR(table);
/* attr tracks which attribute identified the chain, for error reporting. */
2144 attr = nla[NFTA_CHAIN_NAME];
2146 if (nla[NFTA_CHAIN_HANDLE]) {
2147 handle = be64_to_cpu(nla_get_be64(nla[NFTA_CHAIN_HANDLE]));
2148 chain = nft_chain_lookup_byhandle(table, handle, genmask);
2149 if (IS_ERR(chain)) {
2150 NL_SET_BAD_ATTR(extack, nla[NFTA_CHAIN_HANDLE]);
2151 return PTR_ERR(chain);
2153 attr = nla[NFTA_CHAIN_HANDLE];
2155 chain = nft_chain_lookup(net, table, attr, genmask);
2156 if (IS_ERR(chain)) {
/* Errors other than -ENOENT are returned to the caller. */
2157 if (PTR_ERR(chain) != -ENOENT) {
2158 NL_SET_BAD_ATTR(extack, attr);
2159 return PTR_ERR(chain);
2165 if (nla[NFTA_CHAIN_POLICY]) {
2166 if (chain != NULL &&
2167 !nft_is_base_chain(chain)) {
2168 NL_SET_BAD_ATTR(extack, nla[NFTA_CHAIN_POLICY]);
2172 if (chain == NULL &&
2173 nla[NFTA_CHAIN_HOOK] == NULL) {
2174 NL_SET_BAD_ATTR(extack, nla[NFTA_CHAIN_POLICY]);
2178 policy = ntohl(nla_get_be32(nla[NFTA_CHAIN_POLICY]));
2188 if (nla[NFTA_CHAIN_FLAGS])
2189 flags = ntohl(nla_get_be32(nla[NFTA_CHAIN_FLAGS]));
2191 flags = chain->flags;
2193 nft_ctx_init(&ctx, net, skb, nlh, family, table, chain, nla);
2195 if (chain != NULL) {
2196 if (nlh->nlmsg_flags & NLM_F_EXCL) {
2197 NL_SET_BAD_ATTR(extack, attr);
2200 if (nlh->nlmsg_flags & NLM_F_REPLACE)
/* The NFT_BASE_CHAIN bit is carried over from the existing chain. */
2203 flags |= chain->flags & NFT_BASE_CHAIN;
2204 return nf_tables_updchain(&ctx, genmask, policy, flags);
2207 return nf_tables_addchain(&ctx, family, genmask, policy, flags);
/*
 * nf_tables_delchain - handle a DELCHAIN request.
 *
 * Looks up the table and then the chain - by NFTA_CHAIN_HANDLE when present,
 * otherwise by NFTA_CHAIN_NAME - in the next generation. A failed lookup
 * marks the attribute used in @extack and returns the PTR_ERR() of the
 * lookup. The chain's rules are walked and passed to nft_delrule() after an
 * nft_is_active_next() test, and the chain is finally removed through
 * nft_delchain().
 */
2210 static int nf_tables_delchain(struct net *net, struct sock *nlsk,
2211 struct sk_buff *skb, const struct nlmsghdr *nlh,
2212 const struct nlattr * const nla[],
2213 struct netlink_ext_ack *extack)
2215 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
2216 u8 genmask = nft_genmask_next(net);
2217 int family = nfmsg->nfgen_family;
2218 const struct nlattr *attr;
2219 struct nft_table *table;
2220 struct nft_chain *chain;
2221 struct nft_rule *rule;
2227 table = nft_table_lookup(net, nla[NFTA_CHAIN_TABLE], family, genmask);
2228 if (IS_ERR(table)) {
2229 NL_SET_BAD_ATTR(extack, nla[NFTA_CHAIN_TABLE]);
2230 return PTR_ERR(table);
/* attr records which attribute was used to find the chain. */
2233 if (nla[NFTA_CHAIN_HANDLE]) {
2234 attr = nla[NFTA_CHAIN_HANDLE];
2235 handle = be64_to_cpu(nla_get_be64(attr));
2236 chain = nft_chain_lookup_byhandle(table, handle, genmask);
2238 attr = nla[NFTA_CHAIN_NAME];
2239 chain = nft_chain_lookup(net, table, attr, genmask);
2241 if (IS_ERR(chain)) {
2242 NL_SET_BAD_ATTR(extack, attr);
2243 return PTR_ERR(chain);
2246 if (nlh->nlmsg_flags & NLM_F_NONREC &&
2250 nft_ctx_init(&ctx, net, skb, nlh, family, table, chain, nla);
2253 list_for_each_entry(rule, &chain->rules, list) {
2254 if (!nft_is_active_next(net, rule))
2258 err = nft_delrule(&ctx, rule);
2263 /* There are rules and elements that are still holding references to us,
2264 * we cannot do a recursive removal in this case.
2267 NL_SET_BAD_ATTR(extack, attr);
2271 return nft_delchain(&ctx);
/*
 * Registration runs under nfnl_lock(NFNL_SUBSYS_NFTABLES). Types with family
 * NFPROTO_UNSPEC go to the tail of nf_tables_expressions while
 * family-specific types go to the head, so a list walk meets the
 * family-specific entries first.
 */
2279 * nft_register_expr - register nf_tables expr type
2282 * Registers the expr type for use with nf_tables. Returns zero on
2283 * success or a negative errno code otherwise.
2285 int nft_register_expr(struct nft_expr_type *type)
2287 nfnl_lock(NFNL_SUBSYS_NFTABLES);
2288 if (type->family == NFPROTO_UNSPEC)
2289 list_add_tail_rcu(&type->list, &nf_tables_expressions);
2291 list_add_rcu(&type->list, &nf_tables_expressions);
2292 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
2295 EXPORT_SYMBOL_GPL(nft_register_expr);
2298 * nft_unregister_expr - unregister nf_tables expr type
2301 * Unregisters the expr type for use with nf_tables.
/*
 * Removes @type from the expression type list with list_del_rcu(), under
 * nfnl_lock(NFNL_SUBSYS_NFTABLES).
 */
2303 void nft_unregister_expr(struct nft_expr_type *type)
2305 nfnl_lock(NFNL_SUBSYS_NFTABLES);
2306 list_del_rcu(&type->list);
2307 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
2309 EXPORT_SYMBOL_GPL(nft_unregister_expr);
/*
 * __nft_expr_type_get - find a registered expression type by name.
 *
 * Walks nf_tables_expressions and compares each type's name with @nla via
 * nla_strcmp(). Among the name matches, a type without a family is only
 * considered while no candidate has been recorded yet, whereas a type whose
 * family equals @family is handled by the second branch. The statements
 * inside both branches and the return value are not visible in this listing.
 */
2311 static const struct nft_expr_type *__nft_expr_type_get(u8 family,
2314 const struct nft_expr_type *type, *candidate = NULL;
2316 list_for_each_entry(type, &nf_tables_expressions, list) {
2317 if (!nla_strcmp(nla, type->name)) {
2318 if (!type->family && !candidate)
2320 else if (type->family == family)
/*
 * nft_expr_type_request_module - request the module for an expression type.
 *
 * Only built with CONFIG_MODULES. Requests a module named
 * "nft-expr-<family>-<name>", the name being taken from @nla with its length
 * bounded by nla_len(), and then checks whether the type can be found with
 * __nft_expr_type_get(). The return statements are not visible in this
 * listing; nft_expr_type_get() tests the result against -EAGAIN.
 */
2327 #ifdef CONFIG_MODULES
2328 static int nft_expr_type_request_module(struct net *net, u8 family,
2331 nft_request_module(net, "nft-expr-%u-%.*s", family,
2332 nla_len(nla), (char *)nla_data(nla));
2333 if (__nft_expr_type_get(family, nla))
/*
 * nft_expr_type_get - look up an expression type and reference its module.
 *
 * The type is searched with __nft_expr_type_get() and a reference on its
 * owner is taken with try_module_get(). With CONFIG_MODULES, a miss triggers
 * a family-specific module request followed by a request for
 * "nft-expr-<name>"; if the type is available after either request,
 * ERR_PTR(-EAGAIN) is returned. ERR_PTR(-ENOENT) is the final fallback, and
 * ERR_PTR(-EINVAL) is returned from a check whose condition is not visible
 * in this listing.
 */
2340 static const struct nft_expr_type *nft_expr_type_get(struct net *net,
2344 const struct nft_expr_type *type;
2347 return ERR_PTR(-EINVAL);
2349 type = __nft_expr_type_get(family, nla);
2350 if (type != NULL && try_module_get(type->owner))
2353 lockdep_nfnl_nft_mutex_not_held();
2354 #ifdef CONFIG_MODULES
/* First attempt: the family-specific module. */
2356 if (nft_expr_type_request_module(net, family, nla) == -EAGAIN)
2357 return ERR_PTR(-EAGAIN);
/* Second attempt: the module name without the family. */
2359 nft_request_module(net, "nft-expr-%.*s",
2360 nla_len(nla), (char *)nla_data(nla));
2361 if (__nft_expr_type_get(family, nla))
2362 return ERR_PTR(-EAGAIN);
2365 return ERR_PTR(-ENOENT);
/*
 * Netlink policy for a single expression: a name string limited to
 * NFT_MODULE_AUTOLOAD_LIMIT bytes and a nested data attribute.
 */
2368 static const struct nla_policy nft_expr_policy[NFTA_EXPR_MAX + 1] = {
2369 [NFTA_EXPR_NAME] = { .type = NLA_STRING,
2370 .len = NFT_MODULE_AUTOLOAD_LIMIT },
2371 [NFTA_EXPR_DATA] = { .type = NLA_NESTED },
/*
 * nf_tables_fill_expr_info - write one expression into a netlink message.
 *
 * Emits the expression type name as NFTA_EXPR_NAME. If the expression ops
 * provide a dump callback, a nested attribute is opened, the callback is
 * invoked to fill it, and the nest is closed. Any failure jumps to
 * nla_put_failure.
 */
2374 static int nf_tables_fill_expr_info(struct sk_buff *skb,
2375 const struct nft_expr *expr)
2377 if (nla_put_string(skb, NFTA_EXPR_NAME, expr->ops->type->name))
2378 goto nla_put_failure;
2380 if (expr->ops->dump) {
2381 struct nlattr *data = nla_nest_start_noflag(skb,
2384 goto nla_put_failure;
2385 if (expr->ops->dump(skb, expr) < 0)
2386 goto nla_put_failure;
2387 nla_nest_end(skb, data);
/*
 * nft_expr_dump - dump an expression inside a nested attribute of type @attr.
 *
 * Opens the nest, lets nf_tables_fill_expr_info() write the expression and
 * closes the nest; any failure jumps to nla_put_failure.
 */
2396 int nft_expr_dump(struct sk_buff *skb, unsigned int attr,
2397 const struct nft_expr *expr)
2399 struct nlattr *nest;
2401 nest = nla_nest_start_noflag(skb, attr);
2403 goto nla_put_failure;
2404 if (nf_tables_fill_expr_info(skb, expr) < 0)
2405 goto nla_put_failure;
2406 nla_nest_end(skb, nest);
/*
 * Result of parsing one expression: the selected ops and the parsed
 * attribute table, which nf_tables_newexpr() passes on to ops->init().
 */
2413 struct nft_expr_info {
2414 const struct nft_expr_ops *ops;
2415 struct nlattr *tb[NFT_EXPR_MAXATTR + 1];
/*
 * nf_tables_expr_parse - parse one expression attribute into @info.
 *
 * The outer attribute is parsed against nft_expr_policy and the type is
 * resolved from NFTA_EXPR_NAME via nft_expr_type_get(). When NFTA_EXPR_DATA
 * is present it is parsed into info->tb with the type's own policy and
 * maxattr; the memset() below clears the first maxattr + 1 slots of
 * info->tb. Types with a select_ops callback choose their ops from the
 * parsed attributes. module_put() on the type owner is the cleanup visible
 * here.
 */
2418 static int nf_tables_expr_parse(const struct nft_ctx *ctx,
2419 const struct nlattr *nla,
2420 struct nft_expr_info *info)
2422 const struct nft_expr_type *type;
2423 const struct nft_expr_ops *ops;
2424 struct nlattr *tb[NFTA_EXPR_MAX + 1];
2427 err = nla_parse_nested_deprecated(tb, NFTA_EXPR_MAX, nla,
2428 nft_expr_policy, NULL);
2432 type = nft_expr_type_get(ctx->net, ctx->family, tb[NFTA_EXPR_NAME]);
2434 return PTR_ERR(type);
2436 if (tb[NFTA_EXPR_DATA]) {
2437 err = nla_parse_nested_deprecated(info->tb, type->maxattr,
2439 type->policy, NULL);
2443 memset(info->tb, 0, sizeof(info->tb[0]) * (type->maxattr + 1));
2445 if (type->select_ops != NULL) {
2446 ops = type->select_ops(ctx,
2447 (const struct nlattr * const *)info->tb);
2450 #ifdef CONFIG_MODULES
2452 nft_expr_type_request_module(ctx->net,
2454 tb[NFTA_EXPR_NAME]);
2465 module_put(type->owner);
/*
 * nf_tables_newexpr - initialise an expression from parsed information.
 *
 * Calls the init callback of info->ops with the parsed attribute table.
 * The remaining statements are not visible in this listing.
 */
2469 static int nf_tables_newexpr(const struct nft_ctx *ctx,
2470 const struct nft_expr_info *info,
2471 struct nft_expr *expr)
2473 const struct nft_expr_ops *ops = info->ops;
2478 err = ops->init(ctx, expr, (const struct nlattr **)info->tb);
/*
 * nf_tables_expr_destroy - tear down an expression.
 *
 * Invokes the optional destroy callback of the expression ops and drops the
 * module reference on the expression type's owner. The type pointer is read
 * before the destroy callback runs.
 */
2489 static void nf_tables_expr_destroy(const struct nft_ctx *ctx,
2490 struct nft_expr *expr)
2492 const struct nft_expr_type *type = expr->ops->type;
2494 if (expr->ops->destroy)
2495 expr->ops->destroy(ctx, expr);
2496 module_put(type->owner);
/*
 * nft_expr_init - parse, allocate and initialise a single expression.
 *
 * Parses @nla with nf_tables_expr_parse(), allocates info.ops->size zeroed
 * bytes for the expression and initialises it with nf_tables_newexpr().
 * The visible unwind code reads the type owner, calls the type's optional
 * release_ops callback and returns ERR_PTR(err).
 */
2499 struct nft_expr *nft_expr_init(const struct nft_ctx *ctx,
2500 const struct nlattr *nla)
2502 struct nft_expr_info info;
2503 struct nft_expr *expr;
2504 struct module *owner;
2507 err = nf_tables_expr_parse(ctx, nla, &info);
2512 expr = kzalloc(info.ops->size, GFP_KERNEL);
2516 err = nf_tables_newexpr(ctx, &info, expr);
/* The owner is read before release_ops() is called on info.ops. */
2524 owner = info.ops->type->owner;
2525 if (info.ops->type->release_ops)
2526 info.ops->type->release_ops(info.ops);
2530 return ERR_PTR(err);
/*
 * nft_expr_destroy - destroy an expression through nf_tables_expr_destroy().
 * Any further statements are not visible in this listing.
 */
2533 void nft_expr_destroy(const struct nft_ctx *ctx, struct nft_expr *expr)
2535 nf_tables_expr_destroy(ctx, expr);
/*
 * __nft_rule_lookup - find a rule of @chain by handle.
 *
 * Walks chain->rules with the RCU list iterator comparing each rule's handle
 * with the requested one, and returns ERR_PTR(-ENOENT) after the loop.
 */
2543 static struct nft_rule *__nft_rule_lookup(const struct nft_chain *chain,
2546 struct nft_rule *rule;
2548 // FIXME: this sucks
2549 list_for_each_entry_rcu(rule, &chain->rules, list) {
2550 if (handle == rule->handle)
2554 return ERR_PTR(-ENOENT);
/*
 * nft_rule_lookup - find a rule by the handle carried in @nla.
 *
 * The big-endian 64-bit handle is converted to CPU order and passed to
 * __nft_rule_lookup(). ERR_PTR(-EINVAL) is returned from a check whose
 * condition is not visible in this listing.
 */
2557 static struct nft_rule *nft_rule_lookup(const struct nft_chain *chain,
2558 const struct nlattr *nla)
2561 return ERR_PTR(-EINVAL);
2563 return __nft_rule_lookup(chain, be64_to_cpu(nla_get_be64(nla)));
/*
 * Netlink policy for rule messages. Table and chain names are strings
 * limited to NFT_TABLE_MAXNAMELEN - 1 and NFT_CHAIN_MAXNAMELEN - 1, and
 * userdata is a binary blob limited to NFT_USERDATA_MAXLEN. Handle and
 * position are u64, the two id attributes are u32, and the expression list
 * and compat attributes are nested.
 */
2566 static const struct nla_policy nft_rule_policy[NFTA_RULE_MAX + 1] = {
2567 [NFTA_RULE_TABLE] = { .type = NLA_STRING,
2568 .len = NFT_TABLE_MAXNAMELEN - 1 },
2569 [NFTA_RULE_CHAIN] = { .type = NLA_STRING,
2570 .len = NFT_CHAIN_MAXNAMELEN - 1 },
2571 [NFTA_RULE_HANDLE] = { .type = NLA_U64 },
2572 [NFTA_RULE_EXPRESSIONS] = { .type = NLA_NESTED },
2573 [NFTA_RULE_COMPAT] = { .type = NLA_NESTED },
2574 [NFTA_RULE_POSITION] = { .type = NLA_U64 },
2575 [NFTA_RULE_USERDATA] = { .type = NLA_BINARY,
2576 .len = NFT_USERDATA_MAXLEN },
2577 [NFTA_RULE_ID] = { .type = NLA_U32 },
2578 [NFTA_RULE_POSITION_ID] = { .type = NLA_U32 },
/*
 * nf_tables_fill_rule_info - build the netlink message describing a rule.
 *
 * Writes the nfgenmsg header (family, NFNETLINK_V0, low 16 bits of
 * net->nft.base_seq as res_id), then the table name, chain name and rule
 * handle. For events other than NFT_MSG_DELRULE, and only when @prule is
 * given, the handle of @prule is emitted as NFTA_RULE_POSITION. All
 * expressions of the rule are dumped as NFTA_LIST_ELEM entries nested in
 * NFTA_RULE_EXPRESSIONS, followed by the rule's userdata. On failure the
 * message is trimmed back to @nlh.
 */
2581 static int nf_tables_fill_rule_info(struct sk_buff *skb, struct net *net,
2582 u32 portid, u32 seq, int event,
2583 u32 flags, int family,
2584 const struct nft_table *table,
2585 const struct nft_chain *chain,
2586 const struct nft_rule *rule,
2587 const struct nft_rule *prule)
2589 struct nlmsghdr *nlh;
2590 struct nfgenmsg *nfmsg;
2591 const struct nft_expr *expr, *next;
2592 struct nlattr *list;
2593 u16 type = nfnl_msg_type(NFNL_SUBSYS_NFTABLES, event);
2595 nlh = nlmsg_put(skb, portid, seq, type, sizeof(struct nfgenmsg), flags);
2597 goto nla_put_failure;
2599 nfmsg = nlmsg_data(nlh);
2600 nfmsg->nfgen_family = family;
2601 nfmsg->version = NFNETLINK_V0;
2602 nfmsg->res_id = htons(net->nft.base_seq & 0xffff);
2604 if (nla_put_string(skb, NFTA_RULE_TABLE, table->name))
2605 goto nla_put_failure;
2606 if (nla_put_string(skb, NFTA_RULE_CHAIN, chain->name))
2607 goto nla_put_failure;
2608 if (nla_put_be64(skb, NFTA_RULE_HANDLE, cpu_to_be64(rule->handle),
2610 goto nla_put_failure;
/* The position (handle of the preceding rule) is never reported for deletions. */
2612 if (event != NFT_MSG_DELRULE && prule) {
2613 if (nla_put_be64(skb, NFTA_RULE_POSITION,
2614 cpu_to_be64(prule->handle),
2616 goto nla_put_failure;
2619 list = nla_nest_start_noflag(skb, NFTA_RULE_EXPRESSIONS);
2621 goto nla_put_failure;
2622 nft_rule_for_each_expr(expr, next, rule) {
2623 if (nft_expr_dump(skb, NFTA_LIST_ELEM, expr) < 0)
2624 goto nla_put_failure;
2626 nla_nest_end(skb, list);
/* The userdata attribute is emitted with length udata->len + 1. */
2629 struct nft_userdata *udata = nft_userdata(rule);
2630 if (nla_put(skb, NFTA_RULE_USERDATA, udata->len + 1,
2632 goto nla_put_failure;
2635 nlmsg_end(skb, nlh);
2639 nlmsg_trim(skb, nlh);
/*
 * nf_tables_rule_notify - send a rule event to netlink listeners.
 *
 * Allocates an skb, fills it with nf_tables_fill_rule_info() for @rule
 * (without a previous rule, so no position is reported) and passes it to
 * nfnetlink_send() for the NFNLGRP_NFTABLES group. nfnetlink_set_err() with
 * -ENOBUFS is the error report visible here.
 */
2643 static void nf_tables_rule_notify(const struct nft_ctx *ctx,
2644 const struct nft_rule *rule, int event)
2646 struct sk_buff *skb;
2650 !nfnetlink_has_listeners(ctx->net, NFNLGRP_NFTABLES))
2653 skb = nlmsg_new(NLMSG_GOODSIZE, GFP_KERNEL);
2657 err = nf_tables_fill_rule_info(skb, ctx->net, ctx->portid, ctx->seq,
2658 event, 0, ctx->family, ctx->table,
2659 ctx->chain, rule, NULL);
2665 nfnetlink_send(skb, ctx->net, ctx->portid, NFNLGRP_NFTABLES,
2666 ctx->report, GFP_KERNEL);
2669 nfnetlink_set_err(ctx->net, ctx->portid, NFNLGRP_NFTABLES, -ENOBUFS);
/*
 * Filter state for a rule dump. The members are not visible in this listing;
 * the dump code reads ctx->table and ctx->chain as strings.
 */
2672 struct nft_rule_dump_ctx {
/*
 * __nf_tables_dump_rules - dump the rules of one chain.
 *
 * Walks chain->rules with the RCU list iterator, tests each rule with
 * nft_is_active() and emits rules through nf_tables_fill_rule_info() with
 * NLM_F_MULTI | NLM_F_APPEND, passing along prule as the previous rule.
 * cb->args[0] is read as the resume index, and each emitted message is
 * checked with nl_dump_check_consistent().
 */
2677 static int __nf_tables_dump_rules(struct sk_buff *skb,
2679 struct netlink_callback *cb,
2680 const struct nft_table *table,
2681 const struct nft_chain *chain)
2683 struct net *net = sock_net(skb->sk);
2684 const struct nft_rule *rule, *prule;
2685 unsigned int s_idx = cb->args[0];
2688 list_for_each_entry_rcu(rule, &chain->rules, list) {
2689 if (!nft_is_active(net, rule))
/* Zero every cb->args[] slot after args[0]. */
2694 memset(&cb->args[1], 0,
2695 sizeof(cb->args) - sizeof(cb->args[0]));
2697 if (nf_tables_fill_rule_info(skb, net, NETLINK_CB(cb->skb).portid,
2700 NLM_F_MULTI | NLM_F_APPEND,
2702 table, chain, rule, prule) < 0)
2705 nl_dump_check_consistent(cb, nlmsg_hdr(skb));
/*
 * nf_tables_dump_rules - netlink dump callback for rules.
 *
 * Walks net->nft.tables filtering by family and, when the dump context
 * names a table, by table name. If the context names both table and chain,
 * the chain is resolved through the table's chains_ht hash table and only
 * active matches are dumped; otherwise every chain of the table is dumped
 * via __nf_tables_dump_rules(). cb->seq is loaded from net->nft.base_seq
 * before the walk.
 */
2714 static int nf_tables_dump_rules(struct sk_buff *skb,
2715 struct netlink_callback *cb)
2717 const struct nfgenmsg *nfmsg = nlmsg_data(cb->nlh);
2718 const struct nft_rule_dump_ctx *ctx = cb->data;
2719 struct nft_table *table;
2720 const struct nft_chain *chain;
2721 unsigned int idx = 0;
2722 struct net *net = sock_net(skb->sk);
2723 int family = nfmsg->nfgen_family;
2726 cb->seq = net->nft.base_seq;
2728 list_for_each_entry_rcu(table, &net->nft.tables, list) {
2729 if (family != NFPROTO_UNSPEC && family != table->family)
2732 if (ctx && ctx->table && strcmp(ctx->table, table->name) != 0)
/* Table and chain both given: resolve the chain through the hash table. */
2735 if (ctx && ctx->table && ctx->chain) {
2736 struct rhlist_head *list, *tmp;
2738 list = rhltable_lookup(&table->chains_ht, ctx->chain,
2739 nft_chain_ht_params);
2743 rhl_for_each_entry_rcu(chain, tmp, list, rhlhead) {
2744 if (!nft_is_active(net, chain))
2746 __nf_tables_dump_rules(skb, &idx,
2753 list_for_each_entry_rcu(chain, &table->chains, list) {
2754 if (__nf_tables_dump_rules(skb, &idx, cb, table, chain))
2758 if (ctx && ctx->table)
/*
 * nf_tables_dump_rules_start - prepare the filter context of a rule dump.
 *
 * On entry cb->data is read as the request's attribute array. When
 * NFTA_RULE_TABLE or NFTA_RULE_CHAIN is present a zeroed context is
 * allocated with GFP_ATOMIC and the given names are duplicated into
 * ctx->table and ctx->chain.
 * NOTE(review): presumably cb->data is then replaced by ctx, since the dump
 * and done callbacks read it as a struct nft_rule_dump_ctx - confirm against
 * the full source.
 */
2768 static int nf_tables_dump_rules_start(struct netlink_callback *cb)
2770 const struct nlattr * const *nla = cb->data;
2771 struct nft_rule_dump_ctx *ctx = NULL;
2773 if (nla[NFTA_RULE_TABLE] || nla[NFTA_RULE_CHAIN]) {
2774 ctx = kzalloc(sizeof(*ctx), GFP_ATOMIC);
2778 if (nla[NFTA_RULE_TABLE]) {
2779 ctx->table = nla_strdup(nla[NFTA_RULE_TABLE],
2786 if (nla[NFTA_RULE_CHAIN]) {
2787 ctx->chain = nla_strdup(nla[NFTA_RULE_CHAIN],
/*
 * nf_tables_dump_rules_done - completion callback of a rule dump.
 *
 * Reads the dump context from cb->data; what is done with it is not visible
 * in this listing.
 */
2801 static int nf_tables_dump_rules_done(struct netlink_callback *cb)
2803 struct nft_rule_dump_ctx *ctx = cb->data;
/*
 * nf_tables_getrule - handle a rule GET request.
 *
 * With NLM_F_DUMP set, a dump is started with the rule dump start, dump and
 * done callbacks, the attribute array being handed over as the dump data.
 * Otherwise the table, the chain and then the rule (by NFTA_RULE_HANDLE)
 * are looked up using the current generation mask, the reply is built in a
 * new skb as an NFT_MSG_NEWRULE message and unicast to the requesting
 * portid. A failed lookup marks the offending attribute in @extack and
 * returns the PTR_ERR() of the lookup.
 */
2813 /* called with rcu_read_lock held */
2814 static int nf_tables_getrule(struct net *net, struct sock *nlsk,
2815 struct sk_buff *skb, const struct nlmsghdr *nlh,
2816 const struct nlattr * const nla[],
2817 struct netlink_ext_ack *extack)
2819 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
2820 u8 genmask = nft_genmask_cur(net);
2821 const struct nft_chain *chain;
2822 const struct nft_rule *rule;
2823 struct nft_table *table;
2824 struct sk_buff *skb2;
2825 int family = nfmsg->nfgen_family;
2828 if (nlh->nlmsg_flags & NLM_F_DUMP) {
2829 struct netlink_dump_control c = {
2830 .start= nf_tables_dump_rules_start,
2831 .dump = nf_tables_dump_rules,
2832 .done = nf_tables_dump_rules_done,
2833 .module = THIS_MODULE,
2834 .data = (void *)nla,
2837 return nft_netlink_dump_start_rcu(nlsk, skb, nlh, &c);
2840 table = nft_table_lookup(net, nla[NFTA_RULE_TABLE], family, genmask);
2841 if (IS_ERR(table)) {
2842 NL_SET_BAD_ATTR(extack, nla[NFTA_RULE_TABLE]);
2843 return PTR_ERR(table);
2846 chain = nft_chain_lookup(net, table, nla[NFTA_RULE_CHAIN], genmask);
2847 if (IS_ERR(chain)) {
2848 NL_SET_BAD_ATTR(extack, nla[NFTA_RULE_CHAIN]);
2849 return PTR_ERR(chain);
2852 rule = nft_rule_lookup(chain, nla[NFTA_RULE_HANDLE]);
2854 NL_SET_BAD_ATTR(extack, nla[NFTA_RULE_HANDLE]);
2855 return PTR_ERR(rule);
/* Reply skb; allocated with GFP_ATOMIC. */
2858 skb2 = alloc_skb(NLMSG_GOODSIZE, GFP_ATOMIC);
2862 err = nf_tables_fill_rule_info(skb2, net, NETLINK_CB(skb).portid,
2863 nlh->nlmsg_seq, NFT_MSG_NEWRULE, 0,
2864 family, table, chain, rule, NULL);
2868 return nlmsg_unicast(nlsk, skb2, NETLINK_CB(skb).portid);
/*
 * nf_tables_rule_destroy - destroy the expressions of a rule.
 *
 * Starting at the first expression, each expression is destroyed with
 * nf_tables_expr_destroy() until the end of the rule is reached or an
 * expression without ops is found. The next pointer is computed before the
 * current expression is destroyed. Releasing the rule memory itself is not
 * visible in this listing.
 */
2875 static void nf_tables_rule_destroy(const struct nft_ctx *ctx,
2876 struct nft_rule *rule)
2878 struct nft_expr *expr, *next;
2881 * Careful: some expressions might not be initialized in case this
2882 * is called on error from nf_tables_newrule().
2884 expr = nft_expr_first(rule);
2885 while (expr != nft_expr_last(rule) && expr->ops) {
2886 next = nft_expr_next(expr);
2887 nf_tables_expr_destroy(ctx, expr);
/*
 * nf_tables_rule_release - deactivate and destroy a rule.
 *
 * Deactivates the rule's expressions in the NFT_TRANS_RELEASE phase and then
 * destroys the rule with nf_tables_rule_destroy().
 */
2893 static void nf_tables_rule_release(const struct nft_ctx *ctx,
2894 struct nft_rule *rule)
2896 nft_rule_expr_deactivate(ctx, rule, NFT_TRANS_RELEASE);
2897 nf_tables_rule_destroy(ctx, rule);
/*
 * nft_chain_validate - run the validate callbacks of a chain's expressions.
 *
 * ctx->level is compared with NFT_JUMP_STACK_SIZE first. Each rule of the
 * chain is tested with nft_is_active_next(), and for every expression whose
 * ops provide a validate callback that callback is invoked. Error handling
 * and return values are not visible in this listing.
 */
2900 int nft_chain_validate(const struct nft_ctx *ctx, const struct nft_chain *chain)
2902 struct nft_expr *expr, *last;
2903 const struct nft_data *data;
2904 struct nft_rule *rule;
/* Depth check against the jump stack size. */
2907 if (ctx->level == NFT_JUMP_STACK_SIZE)
2910 list_for_each_entry(rule, &chain->rules, list) {
2911 if (!nft_is_active_next(ctx->net, rule))
2914 nft_rule_for_each_expr(expr, last, rule) {
2915 if (!expr->ops->validate)
2918 err = expr->ops->validate(ctx, expr, &data);
2926 EXPORT_SYMBOL_GPL(nft_chain_validate);
/*
 * nft_table_validate - validate the chains of a table.
 *
 * Builds a local context for the table's family and walks table->chains,
 * calling nft_chain_validate() on chains.
 * NOTE(review): the nft_is_base_chain() test presumably skips non-base
 * chains, so validation starts from base chains only - confirm against the
 * full source.
 */
2928 static int nft_table_validate(struct net *net, const struct nft_table *table)
2930 struct nft_chain *chain;
2931 struct nft_ctx ctx = {
2933 .family = table->family,
2937 list_for_each_entry(chain, &table->chains, list) {
2938 if (!nft_is_base_chain(chain))
2942 err = nft_chain_validate(&ctx, chain);
2950 static struct nft_rule *nft_rule_lookup_byid(const struct net *net,
2951 const struct nlattr *nla);
/*
 * Upper bound on the number of expressions in one rule: nf_tables_newrule()
 * sizes its nft_expr_info array with it and compares the running expression
 * count against it.
 */
2953 #define NFT_RULE_MAXEXPRS 128
2955 static int nf_tables_newrule(struct net *net, struct sock *nlsk,
2956 struct sk_buff *skb, const struct nlmsghdr *nlh,
2957 const struct nlattr * const nla[],
2958 struct netlink_ext_ack *extack)
2960 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
2961 u8 genmask = nft_genmask_next(net);
2962 struct nft_expr_info *info = NULL;
2963 int family = nfmsg->nfgen_family;
2964 struct nft_flow_rule *flow;
2965 struct nft_table *table;
2966 struct nft_chain *chain;
2967 struct nft_rule *rule, *old_rule = NULL;
2968 struct nft_userdata *udata;
2969 struct nft_trans *trans = NULL;
2970 struct nft_expr *expr;
2973 unsigned int size, i, n, ulen = 0, usize = 0;
2975 u64 handle, pos_handle;
2977 lockdep_assert_held(&net->nft.commit_mutex);
2979 table = nft_table_lookup(net, nla[NFTA_RULE_TABLE], family, genmask);
2980 if (IS_ERR(table)) {
2981 NL_SET_BAD_ATTR(extack, nla[NFTA_RULE_TABLE]);
2982 return PTR_ERR(table);
2985 chain = nft_chain_lookup(net, table, nla[NFTA_RULE_CHAIN], genmask);
2986 if (IS_ERR(chain)) {
2987 NL_SET_BAD_ATTR(extack, nla[NFTA_RULE_CHAIN]);
2988 return PTR_ERR(chain);
2991 if (nla[NFTA_RULE_HANDLE]) {
2992 handle = be64_to_cpu(nla_get_be64(nla[NFTA_RULE_HANDLE]));
2993 rule = __nft_rule_lookup(chain, handle);
2995 NL_SET_BAD_ATTR(extack, nla[NFTA_RULE_HANDLE]);
2996 return PTR_ERR(rule);
2999 if (nlh->nlmsg_flags & NLM_F_EXCL) {
3000 NL_SET_BAD_ATTR(extack, nla[NFTA_RULE_HANDLE]);
3003 if (nlh->nlmsg_flags & NLM_F_REPLACE)
3008 if (!(nlh->nlmsg_flags & NLM_F_CREATE) ||
3009 nlh->nlmsg_flags & NLM_F_REPLACE)
3011 handle = nf_tables_alloc_handle(table);
3013 if (chain->use == UINT_MAX)
3016 if (nla[NFTA_RULE_POSITION]) {
3017 pos_handle = be64_to_cpu(nla_get_be64(nla[NFTA_RULE_POSITION]));
3018 old_rule = __nft_rule_lookup(chain, pos_handle);
3019 if (IS_ERR(old_rule)) {
3020 NL_SET_BAD_ATTR(extack, nla[NFTA_RULE_POSITION]);
3021 return PTR_ERR(old_rule);
3023 } else if (nla[NFTA_RULE_POSITION_ID]) {
3024 old_rule = nft_rule_lookup_byid(net, nla[NFTA_RULE_POSITION_ID]);
3025 if (IS_ERR(old_rule)) {
3026 NL_SET_BAD_ATTR(extack, nla[NFTA_RULE_POSITION_ID]);
3027 return PTR_ERR(old_rule);
3032 nft_ctx_init(&ctx, net, skb, nlh, family, table, chain, nla);
3036 if (nla[NFTA_RULE_EXPRESSIONS]) {
3037 info = kvmalloc_array(NFT_RULE_MAXEXPRS,
3038 sizeof(struct nft_expr_info),
3043 nla_for_each_nested(tmp, nla[NFTA_RULE_EXPRESSIONS], rem) {
3045 if (nla_type(tmp) != NFTA_LIST_ELEM)
3047 if (n == NFT_RULE_MAXEXPRS)
3049 err = nf_tables_expr_parse(&ctx, tmp, &info[n]);
3052 size += info[n].ops->size;
3056 /* Check for overflow of dlen field */
3058 if (size >= 1 << 12)
3061 if (nla[NFTA_RULE_USERDATA]) {
3062 ulen = nla_len(nla[NFTA_RULE_USERDATA]);
3064 usize = sizeof(struct nft_userdata) + ulen;
3068 rule = kzalloc(sizeof(*rule) + size + usize, GFP_KERNEL);
3072 nft_activate_next(net, rule);
3074 rule->handle = handle;
3076 rule->udata = ulen ? 1 : 0;
3079 udata = nft_userdata(rule);
3080 udata->len = ulen - 1;
3081 nla_memcpy(udata->data, nla[NFTA_RULE_USERDATA], ulen);
3084 expr = nft_expr_first(rule);
3085 for (i = 0; i < n; i++) {
3086 err = nf_tables_newexpr(&ctx, &info[i], expr);
3090 if (info[i].ops->validate)
3091 nft_validate_state_update(net, NFT_VALIDATE_NEED);
3094 expr = nft_expr_next(expr);
3097 if (nlh->nlmsg_flags & NLM_F_REPLACE) {
3098 trans = nft_trans_rule_add(&ctx, NFT_MSG_NEWRULE, rule);
3099 if (trans == NULL) {
3103 err = nft_delrule(&ctx, old_rule);
3105 nft_trans_destroy(trans);
3109 list_add_tail_rcu(&rule->list, &old_rule->list);
3111 trans = nft_trans_rule_add(&ctx, NFT_MSG_NEWRULE, rule);
3117 if (nlh->nlmsg_flags & NLM_F_APPEND) {
3119 list_add_rcu(&rule->list, &old_rule->list);
3121 list_add_tail_rcu(&rule->list, &chain->rules);
3124 list_add_tail_rcu(&rule->list, &old_rule->list);
3126 list_add_rcu(&rule->list, &chain->rules);
3132 if (net->nft.validate_state == NFT_VALIDATE_DO)
3133 return nft_table_validate(net, table);
3135 if (chain->flags & NFT_CHAIN_HW_OFFLOAD) {
3136 flow = nft_flow_rule_create(net, rule);
3138 return PTR_ERR(flow);
3140 nft_trans_flow_rule(trans) = flow;
3145 nf_tables_rule_release(&ctx, rule);
3147 for (i = 0; i < n; i++) {
3149 module_put(info[i].ops->type->owner);
3150 if (info[i].ops->type->release_ops)
3151 info[i].ops->type->release_ops(info[i].ops);
/*
 * Find a rule by transaction ID.
 *
 * Reads a big-endian u32 ID from @nla and walks net->nft.commit_list,
 * matching NFT_MSG_NEWRULE transactions whose rule ID equals it.
 * Falls back to ERR_PTR(-ENOENT) when the walk finds no match.
 *
 * NOTE(review): the visible match condition only tests the message type
 * and the ID; it is not restricted to a particular table or chain.
 */
3158 static struct nft_rule *nft_rule_lookup_byid(const struct net *net,
3159 const struct nlattr *nla)
3161 u32 id = ntohl(nla_get_be32(nla));
3162 struct nft_trans *trans;
3164 list_for_each_entry(trans, &net->nft.commit_list, list) {
3165 struct nft_rule *rule = nft_trans_rule(trans);
3167 if (trans->msg_type == NFT_MSG_NEWRULE &&
3168 id == nft_trans_rule_id(trans))
3171 return ERR_PTR(-ENOENT);
/*
 * Netlink handler that deletes rules.
 *
 * The table named by NFTA_RULE_TABLE is always looked up; the chain is
 * looked up only when NFTA_RULE_CHAIN is present. A single rule can be
 * selected by NFTA_RULE_HANDLE or by NFTA_RULE_ID and is handed to
 * nft_delrule(). The remaining visible paths call nft_delrule_by_chain(),
 * one of them from a walk over every chain of the table.
 *
 * Lookup failures flag the offending attribute through @extack and return
 * the PTR_ERR() of the failed lookup.
 */
3174 static int nf_tables_delrule(struct net *net, struct sock *nlsk,
3175 struct sk_buff *skb, const struct nlmsghdr *nlh,
3176 const struct nlattr * const nla[],
3177 struct netlink_ext_ack *extack)
3179 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
/* Lookups are done against the next generation. */
3180 u8 genmask = nft_genmask_next(net);
3181 struct nft_table *table;
3182 struct nft_chain *chain = NULL;
3183 struct nft_rule *rule;
3184 int family = nfmsg->nfgen_family, err = 0;
3187 table = nft_table_lookup(net, nla[NFTA_RULE_TABLE], family, genmask);
3188 if (IS_ERR(table)) {
3189 NL_SET_BAD_ATTR(extack, nla[NFTA_RULE_TABLE]);
3190 return PTR_ERR(table);
/* The chain attribute is optional; chain stays NULL without it. */
3193 if (nla[NFTA_RULE_CHAIN]) {
3194 chain = nft_chain_lookup(net, table, nla[NFTA_RULE_CHAIN],
3196 if (IS_ERR(chain)) {
3197 NL_SET_BAD_ATTR(extack, nla[NFTA_RULE_CHAIN]);
3198 return PTR_ERR(chain);
3202 nft_ctx_init(&ctx, net, skb, nlh, family, table, chain, nla);
/* Delete one rule, selected by its handle ... */
3205 if (nla[NFTA_RULE_HANDLE]) {
3206 rule = nft_rule_lookup(chain, nla[NFTA_RULE_HANDLE]);
3208 NL_SET_BAD_ATTR(extack, nla[NFTA_RULE_HANDLE]);
3209 return PTR_ERR(rule);
3212 err = nft_delrule(&ctx, rule);
/* ... or by the ID of a rule added earlier in this transaction. */
3213 } else if (nla[NFTA_RULE_ID]) {
3214 rule = nft_rule_lookup_byid(net, nla[NFTA_RULE_ID]);
3216 NL_SET_BAD_ATTR(extack, nla[NFTA_RULE_ID]);
3217 return PTR_ERR(rule);
3220 err = nft_delrule(&ctx, rule);
3222 err = nft_delrule_by_chain(&ctx);
/* Walk the table's chains, testing each for activity in the next generation. */
3225 list_for_each_entry(chain, &table->chains, list) {
3226 if (!nft_is_active_next(net, chain))
3230 err = nft_delrule_by_chain(&ctx);
/*
 * List of registered set backend types. Entries are added and removed by
 * nft_register_set() / nft_unregister_set() and scanned by
 * nft_select_set_ops().
 */
3243 static LIST_HEAD(nf_tables_set_types);
/*
 * Register a set backend type: append @type to nf_tables_set_types (RCU
 * list insertion) while holding the nfnetlink lock of the nf_tables
 * subsystem. Exported for GPL modules.
 */
3245 int nft_register_set(struct nft_set_type *type)
3247 nfnl_lock(NFNL_SUBSYS_NFTABLES);
3248 list_add_tail_rcu(&type->list, &nf_tables_set_types);
3249 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
3252 EXPORT_SYMBOL_GPL(nft_register_set);
/*
 * Unregister a set backend type: unlink @type from nf_tables_set_types
 * (RCU list removal) while holding the nfnetlink lock of the nf_tables
 * subsystem. Exported for GPL modules.
 */
3254 void nft_unregister_set(struct nft_set_type *type)
3256 nfnl_lock(NFNL_SUBSYS_NFTABLES);
3257 list_del_rcu(&type->list);
3258 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
3260 EXPORT_SYMBOL_GPL(nft_unregister_set);
/*
 * NFT_SET_FEATURES is a mask of set flags; INTERVAL, MAP, TIMEOUT and
 * OBJECT are visible here (the definition continues on a further line).
 *
 * nft_set_ops_candidate() decides whether a set type may serve a set
 * created with @flags: the requested flags that the type advertises in
 * type->features must equal the requested flags that fall inside
 * NFT_SET_FEATURES.
 */
3262 #define NFT_SET_FEATURES (NFT_SET_INTERVAL | NFT_SET_MAP | \
3263 NFT_SET_TIMEOUT | NFT_SET_OBJECT | \
3266 static bool nft_set_ops_candidate(const struct nft_set_type *type, u32 flags)
3268 return (flags & type->features) == (flags & NFT_SET_FEATURES);
/*
 * nft_select_set_ops - choose a set backend for a new set
 * @ctx:    transaction context; its net's commit_mutex must be held
 * @nla:    set attributes; NFTA_SET_FLAGS is read when present
 * @desc:   set description handed to each backend's estimate() callback
 * @policy: NFT_SET_POL_PERFORMANCE or NFT_SET_POL_MEMORY
 *
 * Walks nf_tables_set_types, skipping types rejected by
 * nft_set_ops_candidate() and those whose estimate() returns false, and
 * compares the remaining estimates against the best one so far.
 * Returns ERR_PTR(-EAGAIN) after a module load made a type available and
 * ERR_PTR(-EOPNOTSUPP) on the final visible exit path.
 */
3272 * Select a set implementation based on the data characteristics and the
3273 * given policy. The total memory use might not be known if no size is
3274 * given, in that case the amount of memory per element is used.
3276 static const struct nft_set_ops *
3277 nft_select_set_ops(const struct nft_ctx *ctx,
3278 const struct nlattr * const nla[],
3279 const struct nft_set_desc *desc,
3280 enum nft_set_policies policy)
3282 const struct nft_set_ops *ops, *bops;
3283 struct nft_set_estimate est, best;
3284 const struct nft_set_type *type;
3287 lockdep_assert_held(&ctx->net->nft.commit_mutex);
3288 lockdep_nfnl_nft_mutex_not_held();
3289 #ifdef CONFIG_MODULES
/*
 * No backend registered yet: request the "nft-set" module and, if that
 * made one available, return -EAGAIN.
 */
3290 if (list_empty(&nf_tables_set_types)) {
3291 nft_request_module(ctx->net, "nft-set");
3292 if (!list_empty(&nf_tables_set_types))
3293 return ERR_PTR(-EAGAIN);
3296 if (nla[NFTA_SET_FLAGS] != NULL)
3297 flags = ntohl(nla_get_be32(nla[NFTA_SET_FLAGS]));
3304 list_for_each_entry(type, &nf_tables_set_types, list) {
3307 if (!nft_set_ops_candidate(type, flags))
3309 if (!ops->estimate(desc, flags, &est))
/* Performance policy: lower lookup cost first, space as tie-breaker. */
3313 case NFT_SET_POL_PERFORMANCE:
3314 if (est.lookup < best.lookup)
3316 if (est.lookup == best.lookup &&
3317 est.space < best.space)
/*
 * Memory policy: lower space first, lookup cost as tie-breaker; the
 * else-branch compares est.size instead (its guarding condition is not
 * visible here).
 */
3320 case NFT_SET_POL_MEMORY:
3322 if (est.space < best.space)
3324 if (est.space == best.space &&
3325 est.lookup < best.lookup)
3327 } else if (est.size < best.size || !bops) {
/*
 * Take a reference on the candidate's owning module; the module_put()
 * below presumably drops the reference held for the previous best.
 */
3335 if (!try_module_get(type->owner))
3338 module_put(to_set_type(bops)->owner);
3347 return ERR_PTR(-EOPNOTSUPP);
/*
 * Netlink attribute policy for NFTA_SET_* attributes: the expected type of
 * each attribute and, for the table name, set name and userdata, the
 * maximum accepted length.
 */
3350 static const struct nla_policy nft_set_policy[NFTA_SET_MAX + 1] = {
3351 [NFTA_SET_TABLE] = { .type = NLA_STRING,
3352 .len = NFT_TABLE_MAXNAMELEN - 1 },
3353 [NFTA_SET_NAME] = { .type = NLA_STRING,
3354 .len = NFT_SET_MAXNAMELEN - 1 },
3355 [NFTA_SET_FLAGS] = { .type = NLA_U32 },
3356 [NFTA_SET_KEY_TYPE] = { .type = NLA_U32 },
3357 [NFTA_SET_KEY_LEN] = { .type = NLA_U32 },
3358 [NFTA_SET_DATA_TYPE] = { .type = NLA_U32 },
3359 [NFTA_SET_DATA_LEN] = { .type = NLA_U32 },
3360 [NFTA_SET_POLICY] = { .type = NLA_U32 },
3361 [NFTA_SET_DESC] = { .type = NLA_NESTED },
3362 [NFTA_SET_ID] = { .type = NLA_U32 },
3363 [NFTA_SET_TIMEOUT] = { .type = NLA_U64 },
3364 [NFTA_SET_GC_INTERVAL] = { .type = NLA_U32 },
3365 [NFTA_SET_USERDATA] = { .type = NLA_BINARY,
3366 .len = NFT_USERDATA_MAXLEN },
3367 [NFTA_SET_OBJ_TYPE] = { .type = NLA_U32 },
3368 [NFTA_SET_HANDLE] = { .type = NLA_U64 },
/*
 * Netlink attribute policy for the nested NFTA_SET_DESC attribute; used by
 * nf_tables_set_desc_parse().
 */
3371 static const struct nla_policy nft_set_desc_policy[NFTA_SET_DESC_MAX + 1] = {
3372 [NFTA_SET_DESC_SIZE] = { .type = NLA_U32 },
/*
 * Initialise @ctx for a set request.
 *
 * The table is looked up only when NFTA_SET_TABLE is present; otherwise
 * the context is initialised with a NULL table. The chain is always NULL.
 * A failed table lookup flags NFTA_SET_TABLE through @extack and returns
 * the lookup's error code.
 */
3375 static int nft_ctx_init_from_setattr(struct nft_ctx *ctx, struct net *net,
3376 const struct sk_buff *skb,
3377 const struct nlmsghdr *nlh,
3378 const struct nlattr * const nla[],
3379 struct netlink_ext_ack *extack,
3382 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
3383 int family = nfmsg->nfgen_family;
3384 struct nft_table *table = NULL;
3386 if (nla[NFTA_SET_TABLE] != NULL) {
3387 table = nft_table_lookup(net, nla[NFTA_SET_TABLE], family,
3389 if (IS_ERR(table)) {
3390 NL_SET_BAD_ATTR(extack, nla[NFTA_SET_TABLE]);
3391 return PTR_ERR(table);
3395 nft_ctx_init(ctx, net, skb, nlh, family, table, NULL, nla);
/*
 * Look up a set by name in @table.
 *
 * Traverses table->sets with the RCU list iterator and matches sets whose
 * name equals the string in @nla and that are active in @genmask.
 * Falls back to ERR_PTR(-ENOENT) when no set matches. The condition that
 * guards the ERR_PTR(-EINVAL) return is not visible here (presumably a
 * missing @nla - confirm).
 */
3399 static struct nft_set *nft_set_lookup(const struct nft_table *table,
3400 const struct nlattr *nla, u8 genmask)
3402 struct nft_set *set;
3405 return ERR_PTR(-EINVAL);
3407 list_for_each_entry_rcu(set, &table->sets, list) {
3408 if (!nla_strcmp(nla, set->name) &&
3409 nft_active_genmask(set, genmask))
3412 return ERR_PTR(-ENOENT);
/*
 * Look up a set in @table by its 64-bit handle, carried big-endian in
 * @nla. Only sets active in the given generation mask match.
 * Falls back to ERR_PTR(-ENOENT) when no set matches.
 */
3415 static struct nft_set *nft_set_lookup_byhandle(const struct nft_table *table,
3416 const struct nlattr *nla,
3419 struct nft_set *set;
3421 list_for_each_entry(set, &table->sets, list) {
3422 if (be64_to_cpu(nla_get_be64(nla)) == set->handle &&
3423 nft_active_genmask(set, genmask))
3426 return ERR_PTR(-ENOENT);
/*
 * Look up a set by transaction ID.
 *
 * Reads a big-endian u32 ID from @nla and walks net->nft.commit_list,
 * considering only NFT_MSG_NEWSET transactions whose set ID matches and
 * whose set is active in @genmask. Falls back to ERR_PTR(-ENOENT).
 *
 * NOTE(review): the visible match condition does not compare the set's
 * table with any table argument.
 */
3429 static struct nft_set *nft_set_lookup_byid(const struct net *net,
3430 const struct nlattr *nla, u8 genmask)
3432 struct nft_trans *trans;
3433 u32 id = ntohl(nla_get_be32(nla));
3435 list_for_each_entry(trans, &net->nft.commit_list, list) {
3436 if (trans->msg_type == NFT_MSG_NEWSET) {
3437 struct nft_set *set = nft_trans_set(trans);
3439 if (id == nft_trans_set_id(trans) &&
3440 nft_active_genmask(set, genmask))
3444 return ERR_PTR(-ENOENT);
/*
 * Exported set lookup that combines both lookup methods: by name in
 * @table (nft_set_lookup) and by transaction ID (nft_set_lookup_byid).
 * The conditions between the two calls are not visible here; presumably
 * the ID lookup is the fallback when the name lookup fails - confirm.
 */
3447 struct nft_set *nft_set_lookup_global(const struct net *net,
3448 const struct nft_table *table,
3449 const struct nlattr *nla_set_name,
3450 const struct nlattr *nla_set_id,
3453 struct nft_set *set;
3455 set = nft_set_lookup(table, nla_set_name, genmask);
3460 set = nft_set_lookup_byid(net, nla_set_id, genmask);
3464 EXPORT_SYMBOL_GPL(nft_set_lookup_global);
/*
 * Assign set->name from the name template @name.
 *
 * If the template contains '%', it must be a single "%d" with no further
 * '%'. A zeroed page is used as a bitmap of numbers already taken by sets
 * in ctx->table, covering BITS_PER_BYTE * PAGE_SIZE values starting at
 * 'min'. When the whole window is taken, 'min' advances by one window and
 * the bitmap is cleared. The name is then built with kasprintf() from
 * min + n and compared against the names of the table's existing sets.
 */
3466 static int nf_tables_set_alloc_name(struct nft_ctx *ctx, struct nft_set *set,
3469 const struct nft_set *i;
3471 unsigned long *inuse;
3472 unsigned int n = 0, min = 0;
3474 p = strchr(name, '%');
/* Only a lone "%d" conversion is accepted in the template. */
3476 if (p[1] != 'd' || strchr(p + 2, '%'))
3479 inuse = (unsigned long *)get_zeroed_page(GFP_KERNEL);
3483 list_for_each_entry(i, &ctx->table->sets, list) {
/*
 * NOTE(review): this tests 'set' (the set being named), not the list
 * iterator 'i'; the duplicate-name loop further down tests 'i'.
 * Looks like it should be 'i' - confirm.
 */
3486 if (!nft_is_active_next(ctx->net, set))
/* Extract the number from an existing name using the template itself. */
3488 if (!sscanf(i->name, name, &tmp))
/* Only numbers inside the current bitmap window are recorded. */
3490 if (tmp < min || tmp >= min + BITS_PER_BYTE * PAGE_SIZE)
3493 set_bit(tmp - min, inuse);
3496 n = find_first_zero_bit(inuse, BITS_PER_BYTE * PAGE_SIZE);
/* Window exhausted: move to the next window with an empty bitmap. */
3497 if (n >= BITS_PER_BYTE * PAGE_SIZE) {
3498 min += BITS_PER_BYTE * PAGE_SIZE;
3499 memset(inuse, 0, PAGE_SIZE);
3502 free_page((unsigned long)inuse);
3505 set->name = kasprintf(GFP_KERNEL, name, min + n);
/* Compare the new name against the sets active in the next generation. */
3509 list_for_each_entry(i, &ctx->table->sets, list) {
3510 if (!nft_is_active_next(ctx->net, i))
3512 if (!strcmp(set->name, i->name)) {
/*
 * Convert a big-endian 64-bit millisecond value from @nla to jiffies and
 * store it in *@result. The value is scaled to nanoseconds and passed to
 * nsecs_to_jiffies64(). 'max' is the largest u64 divided by
 * NSEC_PER_MSEC; presumably it bounds 'ms' so the multiplication cannot
 * overflow (the comparison itself is not visible here).
 */
3520 static int nf_msecs_to_jiffies64(const struct nlattr *nla, u64 *result)
3522 u64 ms = be64_to_cpu(nla_get_be64(nla));
3523 u64 max = (u64)(~((u64)0));
3525 max = div_u64(max, NSEC_PER_MSEC);
3529 ms *= NSEC_PER_MSEC;
3530 *result = nsecs_to_jiffies64(ms);
/*
 * Convert a 64-bit jiffies value to milliseconds and return it in
 * big-endian byte order, ready to be placed in a netlink attribute.
 */
3534 static __be64 nf_jiffies64_to_msecs(u64 input)
3536 return cpu_to_be64(jiffies64_to_msecs(input));
/*
 * Serialise a set into a netlink message appended to @skb.
 *
 * Writes the nfgenmsg header (family from @ctx, low 16 bits of the base
 * sequence as res_id), followed by the set's table, name, handle, flags,
 * key and data description, object type, timeout, GC interval, policy,
 * userdata and a nested NFTA_SET_DESC. Several attributes are emitted
 * only conditionally. Any failed put jumps to nla_put_failure; the
 * visible nlmsg_trim() call removes the partial message again.
 */
3539 static int nf_tables_fill_set(struct sk_buff *skb, const struct nft_ctx *ctx,
3540 const struct nft_set *set, u16 event, u16 flags)
3542 struct nfgenmsg *nfmsg;
3543 struct nlmsghdr *nlh;
3544 struct nlattr *desc;
3545 u32 portid = ctx->portid;
3548 event = nfnl_msg_type(NFNL_SUBSYS_NFTABLES, event);
3549 nlh = nlmsg_put(skb, portid, seq, event, sizeof(struct nfgenmsg),
3552 goto nla_put_failure;
3554 nfmsg = nlmsg_data(nlh);
3555 nfmsg->nfgen_family = ctx->family;
3556 nfmsg->version = NFNETLINK_V0;
3557 nfmsg->res_id = htons(ctx->net->nft.base_seq & 0xffff);
3559 if (nla_put_string(skb, NFTA_SET_TABLE, ctx->table->name))
3560 goto nla_put_failure;
3561 if (nla_put_string(skb, NFTA_SET_NAME, set->name))
3562 goto nla_put_failure;
3563 if (nla_put_be64(skb, NFTA_SET_HANDLE, cpu_to_be64(set->handle),
3565 goto nla_put_failure;
/* Flags are omitted from the message when none are set. */
3566 if (set->flags != 0)
3567 if (nla_put_be32(skb, NFTA_SET_FLAGS, htonl(set->flags)))
3568 goto nla_put_failure;
3570 if (nla_put_be32(skb, NFTA_SET_KEY_TYPE, htonl(set->ktype)))
3571 goto nla_put_failure;
3572 if (nla_put_be32(skb, NFTA_SET_KEY_LEN, htonl(set->klen)))
3573 goto nla_put_failure;
/* Data type and length are reported for maps only. */
3574 if (set->flags & NFT_SET_MAP) {
3575 if (nla_put_be32(skb, NFTA_SET_DATA_TYPE, htonl(set->dtype)))
3576 goto nla_put_failure;
3577 if (nla_put_be32(skb, NFTA_SET_DATA_LEN, htonl(set->dlen)))
3578 goto nla_put_failure;
/* Object type is reported for object maps only. */
3580 if (set->flags & NFT_SET_OBJECT &&
3581 nla_put_be32(skb, NFTA_SET_OBJ_TYPE, htonl(set->objtype)))
3582 goto nla_put_failure;
/* The timeout is kept in jiffies and reported in milliseconds. */
3585 nla_put_be64(skb, NFTA_SET_TIMEOUT,
3586 nf_jiffies64_to_msecs(set->timeout),
3588 goto nla_put_failure;
3590 nla_put_be32(skb, NFTA_SET_GC_INTERVAL, htonl(set->gc_int)))
3591 goto nla_put_failure;
/* NFT_SET_POL_PERFORMANCE is treated as the default and not emitted. */
3593 if (set->policy != NFT_SET_POL_PERFORMANCE) {
3594 if (nla_put_be32(skb, NFTA_SET_POLICY, htonl(set->policy)))
3595 goto nla_put_failure;
3598 if (nla_put(skb, NFTA_SET_USERDATA, set->udlen, set->udata))
3599 goto nla_put_failure;
3601 desc = nla_nest_start_noflag(skb, NFTA_SET_DESC);
3603 goto nla_put_failure;
3605 nla_put_be32(skb, NFTA_SET_DESC_SIZE, htonl(set->size)))
3606 goto nla_put_failure;
3607 nla_nest_end(skb, desc);
3609 nlmsg_end(skb, nlh);
3613 nlmsg_trim(skb, nlh);
/*
 * Send a notification about @set for @event to the NFNLGRP_NFTABLES
 * multicast group.
 *
 * Allocates a message, fills it with nf_tables_fill_set() and sends it
 * with nfnetlink_send(). The visible part of the early-exit test checks
 * whether the group has listeners. The error path reports -ENOBUFS to
 * the group through nfnetlink_set_err().
 */
3617 static void nf_tables_set_notify(const struct nft_ctx *ctx,
3618 const struct nft_set *set, int event,
3621 struct sk_buff *skb;
3622 u32 portid = ctx->portid;
3626 !nfnetlink_has_listeners(ctx->net, NFNLGRP_NFTABLES))
3629 skb = nlmsg_new(NLMSG_GOODSIZE, gfp_flags);
3633 err = nf_tables_fill_set(skb, ctx, set, event, 0);
3639 nfnetlink_send(skb, ctx->net, portid, NFNLGRP_NFTABLES, ctx->report,
3643 nfnetlink_set_err(ctx->net, portid, NFNLGRP_NFTABLES, -ENOBUFS);
/*
 * Netlink dump callback that lists sets.
 *
 * Iterates the namespace's tables and each table's sets under RCU list
 * traversal, filtered by the family and table stored in the dump context
 * (cb->data). Resume state lives in cb->args: args[0] is the set index to
 * resume from and args[2] the table being dumped. Each set is serialised
 * with nf_tables_fill_set() using a per-table copy of the context.
 */
3646 static int nf_tables_dump_sets(struct sk_buff *skb, struct netlink_callback *cb)
3648 const struct nft_set *set;
3649 unsigned int idx, s_idx = cb->args[0];
3650 struct nft_table *table, *cur_table = (struct nft_table *)cb->args[2];
3651 struct net *net = sock_net(skb->sk);
3652 struct nft_ctx *ctx = cb->data, ctx_set;
/* Record the generation sequence for the dump consistency check below. */
3658 cb->seq = net->nft.base_seq;
3660 list_for_each_entry_rcu(table, &net->nft.tables, list) {
/* NFPROTO_UNSPEC in the context means "all families". */
3661 if (ctx->family != NFPROTO_UNSPEC &&
3662 ctx->family != table->family)
3665 if (ctx->table && ctx->table != table)
3669 if (cur_table != table)
3675 list_for_each_entry_rcu(set, &table->sets, list) {
3678 if (!nft_is_active(net, set))
3682 ctx_set.table = table;
3683 ctx_set.family = table->family;
3685 if (nf_tables_fill_set(skb, &ctx_set, set,
/* Remember the current table so a later call can resume from it. */
3689 cb->args[2] = (unsigned long) table;
3692 nl_dump_check_consistent(cb, nlmsg_hdr(skb));
/*
 * Dump start callback for set dumps: replace cb->data with a kmemdup()
 * copy (GFP_ATOMIC) of the nft_ctx the caller passed in. Presumably this
 * is needed because the original context does not outlive the request -
 * confirm against the caller.
 */
3705 static int nf_tables_dump_sets_start(struct netlink_callback *cb)
3707 struct nft_ctx *ctx_dump = NULL;
3709 ctx_dump = kmemdup(cb->data, sizeof(*ctx_dump), GFP_ATOMIC);
3710 if (ctx_dump == NULL)
3713 cb->data = ctx_dump;
/*
 * Dump completion callback for set dumps; installed as .done in
 * nf_tables_getset(). The body is not visible here; presumably it frees
 * the context copy made by nf_tables_dump_sets_start() - confirm.
 */
3717 static int nf_tables_dump_sets_done(struct netlink_callback *cb)
/*
 * Netlink handler for set retrieval.
 *
 * With NLM_F_DUMP a dump is started using the nf_tables_dump_sets*
 * callbacks. Otherwise a single set is looked up by NFTA_SET_NAME in the
 * current generation, serialised as NFT_MSG_NEWSET into a freshly
 * allocated skb and unicast back to the requesting port. A non-dump
 * request with family NFPROTO_UNSPEC is rejected with -EAFNOSUPPORT.
 */
3723 /* called with rcu_read_lock held */
3724 static int nf_tables_getset(struct net *net, struct sock *nlsk,
3725 struct sk_buff *skb, const struct nlmsghdr *nlh,
3726 const struct nlattr * const nla[],
3727 struct netlink_ext_ack *extack)
3729 u8 genmask = nft_genmask_cur(net);
3730 const struct nft_set *set;
3732 struct sk_buff *skb2;
3733 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
3736 /* Verify existence before starting dump */
3737 err = nft_ctx_init_from_setattr(&ctx, net, skb, nlh, nla, extack,
3742 if (nlh->nlmsg_flags & NLM_F_DUMP) {
3743 struct netlink_dump_control c = {
3744 .start = nf_tables_dump_sets_start,
3745 .dump = nf_tables_dump_sets,
3746 .done = nf_tables_dump_sets_done,
3748 .module = THIS_MODULE,
3751 return nft_netlink_dump_start_rcu(nlsk, skb, nlh, &c);
3754 /* Only accept unspec with dump */
3755 if (nfmsg->nfgen_family == NFPROTO_UNSPEC)
3756 return -EAFNOSUPPORT;
3757 if (!nla[NFTA_SET_TABLE])
3760 set = nft_set_lookup(ctx.table, nla[NFTA_SET_NAME], genmask);
3762 return PTR_ERR(set);
/* GFP_ATOMIC: per the comment above, this runs under rcu_read_lock. */
3764 skb2 = alloc_skb(NLMSG_GOODSIZE, GFP_ATOMIC);
3768 err = nf_tables_fill_set(skb2, &ctx, set, NFT_MSG_NEWSET, 0);
3772 return nlmsg_unicast(nlsk, skb2, NETLINK_CB(skb).portid);
/*
 * Parse the nested NFTA_SET_DESC attribute @nla against
 * nft_set_desc_policy and, when NFTA_SET_DESC_SIZE is present, store its
 * big-endian u32 value in desc->size. Other fields of @desc are not
 * touched by the visible code.
 */
3779 static int nf_tables_set_desc_parse(struct nft_set_desc *desc,
3780 const struct nlattr *nla)
3782 struct nlattr *da[NFTA_SET_DESC_MAX + 1];
3785 err = nla_parse_nested_deprecated(da, NFTA_SET_DESC_MAX, nla,
3786 nft_set_desc_policy, NULL);
3790 if (da[NFTA_SET_DESC_SIZE] != NULL)
3791 desc->size = ntohl(nla_get_be32(da[NFTA_SET_DESC_SIZE]));
/*
 * Netlink handler that creates a set.
 *
 * Order of work as far as visible here:
 *  1. require the TABLE, NAME, KEY_LEN and ID attributes;
 *  2. parse and range-check key type/length, flags, data type/length,
 *     object type, timeout, GC interval, policy and the set description;
 *  3. look up the table and check whether a set of that name exists,
 *     consulting NLM_F_EXCL / NLM_F_REPLACE / NLM_F_CREATE;
 *  4. select a backend with nft_select_set_ops(), allocate the set with
 *     room for backend private data and userdata, name it, initialise
 *     it through ops->init() and queue an NFT_MSG_NEWSET transaction;
 *  5. link the set into table->sets.
 * The module_put() near the end is presumably the error unwind releasing
 * the backend reference - confirm.
 */
3796 static int nf_tables_newset(struct net *net, struct sock *nlsk,
3797 struct sk_buff *skb, const struct nlmsghdr *nlh,
3798 const struct nlattr * const nla[],
3799 struct netlink_ext_ack *extack)
3801 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
3802 u8 genmask = nft_genmask_next(net);
3803 int family = nfmsg->nfgen_family;
3804 const struct nft_set_ops *ops;
3805 struct nft_table *table;
3806 struct nft_set *set;
3811 u32 ktype, dtype, flags, policy, gc_int, objtype;
3812 struct nft_set_desc desc;
3813 unsigned char *udata;
/* Mandatory attributes. */
3817 if (nla[NFTA_SET_TABLE] == NULL ||
3818 nla[NFTA_SET_NAME] == NULL ||
3819 nla[NFTA_SET_KEY_LEN] == NULL ||
3820 nla[NFTA_SET_ID] == NULL)
3823 memset(&desc, 0, sizeof(desc));
/* Key type defaults to NFT_DATA_VALUE when the attribute is absent. */
3825 ktype = NFT_DATA_VALUE;
3826 if (nla[NFTA_SET_KEY_TYPE] != NULL) {
3827 ktype = ntohl(nla_get_be32(nla[NFTA_SET_KEY_TYPE]));
3828 if ((ktype & NFT_DATA_RESERVED_MASK) == NFT_DATA_RESERVED_MASK)
3832 desc.klen = ntohl(nla_get_be32(nla[NFTA_SET_KEY_LEN]));
3833 if (desc.klen == 0 || desc.klen > NFT_DATA_VALUE_MAXLEN)
3837 if (nla[NFTA_SET_FLAGS] != NULL) {
3838 flags = ntohl(nla_get_be32(nla[NFTA_SET_FLAGS]));
/* Test for flag bits outside the supported set. */
3839 if (flags & ~(NFT_SET_ANONYMOUS | NFT_SET_CONSTANT |
3840 NFT_SET_INTERVAL | NFT_SET_TIMEOUT |
3841 NFT_SET_MAP | NFT_SET_EVAL |
3844 /* Only one of these operations is supported */
3845 if ((flags & (NFT_SET_MAP | NFT_SET_OBJECT)) ==
3846 (NFT_SET_MAP | NFT_SET_OBJECT))
3848 if ((flags & (NFT_SET_EVAL | NFT_SET_OBJECT)) ==
3849 (NFT_SET_EVAL | NFT_SET_OBJECT))
/* A data type is only meaningful for maps. */
3854 if (nla[NFTA_SET_DATA_TYPE] != NULL) {
3855 if (!(flags & NFT_SET_MAP))
3858 dtype = ntohl(nla_get_be32(nla[NFTA_SET_DATA_TYPE]));
3859 if ((dtype & NFT_DATA_RESERVED_MASK) == NFT_DATA_RESERVED_MASK &&
3860 dtype != NFT_DATA_VERDICT)
/* Non-verdict data takes its length from NFTA_SET_DATA_LEN; the
 * sizeof(struct nft_verdict) assignment below is the other branch. */
3863 if (dtype != NFT_DATA_VERDICT) {
3864 if (nla[NFTA_SET_DATA_LEN] == NULL)
3866 desc.dlen = ntohl(nla_get_be32(nla[NFTA_SET_DATA_LEN]));
3867 if (desc.dlen == 0 || desc.dlen > NFT_DATA_VALUE_MAXLEN)
3870 desc.dlen = sizeof(struct nft_verdict);
3871 } else if (flags & NFT_SET_MAP)
/* An object type is only meaningful with NFT_SET_OBJECT. */
3874 if (nla[NFTA_SET_OBJ_TYPE] != NULL) {
3875 if (!(flags & NFT_SET_OBJECT))
3878 objtype = ntohl(nla_get_be32(nla[NFTA_SET_OBJ_TYPE]));
3879 if (objtype == NFT_OBJECT_UNSPEC ||
3880 objtype > NFT_OBJECT_MAX)
3882 } else if (flags & NFT_SET_OBJECT)
3885 objtype = NFT_OBJECT_UNSPEC;
/* Timeout and GC interval both depend on NFT_SET_TIMEOUT. */
3888 if (nla[NFTA_SET_TIMEOUT] != NULL) {
3889 if (!(flags & NFT_SET_TIMEOUT))
3892 err = nf_msecs_to_jiffies64(nla[NFTA_SET_TIMEOUT], &timeout);
3897 if (nla[NFTA_SET_GC_INTERVAL] != NULL) {
3898 if (!(flags & NFT_SET_TIMEOUT))
3900 gc_int = ntohl(nla_get_be32(nla[NFTA_SET_GC_INTERVAL]));
/* Policy defaults to NFT_SET_POL_PERFORMANCE. */
3903 policy = NFT_SET_POL_PERFORMANCE;
3904 if (nla[NFTA_SET_POLICY] != NULL)
3905 policy = ntohl(nla_get_be32(nla[NFTA_SET_POLICY]));
3907 if (nla[NFTA_SET_DESC] != NULL) {
3908 err = nf_tables_set_desc_parse(&desc, nla[NFTA_SET_DESC]);
3913 table = nft_table_lookup(net, nla[NFTA_SET_TABLE], family, genmask);
3914 if (IS_ERR(table)) {
3915 NL_SET_BAD_ATTR(extack, nla[NFTA_SET_TABLE]);
3916 return PTR_ERR(table);
3919 nft_ctx_init(&ctx, net, skb, nlh, family, table, NULL, nla);
/* Existing-set check: -ENOENT from the lookup is handled separately
 * from other lookup errors, which are returned to the caller. */
3921 set = nft_set_lookup(table, nla[NFTA_SET_NAME], genmask);
3923 if (PTR_ERR(set) != -ENOENT) {
3924 NL_SET_BAD_ATTR(extack, nla[NFTA_SET_NAME]);
3925 return PTR_ERR(set);
3928 if (nlh->nlmsg_flags & NLM_F_EXCL) {
3929 NL_SET_BAD_ATTR(extack, nla[NFTA_SET_NAME]);
3932 if (nlh->nlmsg_flags & NLM_F_REPLACE)
3938 if (!(nlh->nlmsg_flags & NLM_F_CREATE))
3941 ops = nft_select_set_ops(&ctx, nla, &desc, policy);
3943 return PTR_ERR(ops);
3946 if (nla[NFTA_SET_USERDATA])
3947 udlen = nla_len(nla[NFTA_SET_USERDATA]);
/* The backend may request private space placed after the set struct. */
3950 if (ops->privsize != NULL)
3951 size = ops->privsize(nla, &desc);
3953 set = kvzalloc(sizeof(*set) + size + udlen, GFP_KERNEL);
3959 name = nla_strdup(nla[NFTA_SET_NAME], GFP_KERNEL);
3965 err = nf_tables_set_alloc_name(&ctx, set, name);
/* Userdata is stored after the backend's private area. */
3972 udata = set->data + size;
3973 nla_memcpy(udata, nla[NFTA_SET_USERDATA], udlen);
3976 INIT_LIST_HEAD(&set->bindings);
3978 write_pnet(&set->net, net);
3981 set->klen = desc.klen;
3983 set->objtype = objtype;
3984 set->dlen = desc.dlen;
3986 set->size = desc.size;
3987 set->policy = policy;
3990 set->timeout = timeout;
3991 set->gc_int = gc_int;
3992 set->handle = nf_tables_alloc_handle(table);
3994 err = ops->init(set, &desc, nla);
3998 err = nft_trans_set_add(&ctx, NFT_MSG_NEWSET, set);
4002 list_add_tail_rcu(&set->list, &table->sets);
4013 module_put(to_set_type(ops)->owner);
/*
 * Destroy a set: call the backend's destroy() callback and drop the
 * module reference on the backend's owner. A set whose use counter is
 * still above zero triggers a WARN_ON (the action taken in that case is
 * not visible here).
 */
4017 static void nft_set_destroy(struct nft_set *set)
4019 if (WARN_ON(set->use > 0))
4022 set->ops->destroy(set);
4023 module_put(to_set_type(set->ops)->owner);
/*
 * Netlink handler that deletes a set.
 *
 * Rejects NFPROTO_UNSPEC with -EAFNOSUPPORT, initialises the context from
 * the set attributes, then finds the set by NFTA_SET_HANDLE when present
 * or by NFTA_SET_NAME otherwise, in the next generation. The attribute
 * used for the lookup is the one reported through @extack on failure.
 * With NLM_F_NONREC, a set that still has elements is refused. Otherwise
 * the set is handed to nft_delset().
 */
4028 static int nf_tables_delset(struct net *net, struct sock *nlsk,
4029 struct sk_buff *skb, const struct nlmsghdr *nlh,
4030 const struct nlattr * const nla[],
4031 struct netlink_ext_ack *extack)
4033 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
4034 u8 genmask = nft_genmask_next(net);
4035 const struct nlattr *attr;
4036 struct nft_set *set;
4040 if (nfmsg->nfgen_family == NFPROTO_UNSPEC)
4041 return -EAFNOSUPPORT;
4042 if (nla[NFTA_SET_TABLE] == NULL)
4045 err = nft_ctx_init_from_setattr(&ctx, net, skb, nlh, nla, extack,
4050 if (nla[NFTA_SET_HANDLE]) {
4051 attr = nla[NFTA_SET_HANDLE];
4052 set = nft_set_lookup_byhandle(ctx.table, attr, genmask);
4054 attr = nla[NFTA_SET_NAME];
4055 set = nft_set_lookup(ctx.table, attr, genmask);
4059 NL_SET_BAD_ATTR(extack, attr);
4060 return PTR_ERR(set);
/* Non-recursive delete: refuse while the set still holds elements. */
4063 (nlh->nlmsg_flags & NLM_F_NONREC && atomic_read(&set->nelems) > 0)) {
4064 NL_SET_BAD_ATTR(extack, attr);
4068 return nft_delset(&ctx, set);
/*
 * Set walk callback used by nf_tables_bind_set(): validate that storing
 * the element's data into the register derived from the set's data type
 * is allowed in @ctx. The data is validated as NFT_DATA_VERDICT when the
 * set's dtype is a verdict and as NFT_DATA_VALUE otherwise.
 */
4071 static int nf_tables_bind_check_setelem(const struct nft_ctx *ctx,
4072 struct nft_set *set,
4073 const struct nft_set_iter *iter,
4074 struct nft_set_elem *elem)
4076 const struct nft_set_ext *ext = nft_set_elem_ext(set, elem->priv);
4077 enum nft_registers dreg;
4079 dreg = nft_type_to_reg(set->dtype);
4080 return nft_validate_register_store(ctx, dreg, nft_set_ext_data(ext),
4081 set->dtype == NFT_DATA_VERDICT ?
4082 NFT_DATA_VERDICT : NFT_DATA_VALUE,
/*
 * Bind @set to an expression through @binding.
 *
 * Visible checks: the set's use counter must not already be UINT_MAX, and
 * an anonymous set that already has a binding is treated specially (the
 * action is not visible here). For NFT_SET_MAP bindings the existing
 * bindings are scanned for one with the map flag on the same chain;
 * failing that, the set's elements are walked with
 * nf_tables_bind_check_setelem() in the next generation. The binding then
 * records ctx->chain, is appended to set->bindings and
 * nft_set_trans_bind() is called. Exported for GPL modules.
 */
4086 int nf_tables_bind_set(const struct nft_ctx *ctx, struct nft_set *set,
4087 struct nft_set_binding *binding)
4089 struct nft_set_binding *i;
4090 struct nft_set_iter iter;
4092 if (set->use == UINT_MAX)
4095 if (!list_empty(&set->bindings) && nft_set_is_anonymous(set))
4098 if (binding->flags & NFT_SET_MAP) {
4099 /* If the set is already bound to the same chain all
4100 * jumps are already validated for that chain.
4102 list_for_each_entry(i, &set->bindings, list) {
4103 if (i->flags & NFT_SET_MAP &&
4104 i->chain == binding->chain)
4108 iter.genmask = nft_genmask_next(ctx->net);
4112 iter.fn = nf_tables_bind_check_setelem;
4114 set->ops->walk(ctx, set, &iter);
4119 binding->chain = ctx->chain;
4120 list_add_tail_rcu(&binding->list, &set->bindings);
4121 nft_set_trans_bind(ctx, set);
4126 EXPORT_SYMBOL_GPL(nf_tables_bind_set);
/*
 * Remove @binding from its set. If that leaves an anonymous set with no
 * bindings, the set is also unlinked from its table's set list and an
 * NFT_MSG_DELSET notification is generated (presumably only when @event
 * is true - the guarding condition is not visible here).
 */
4128 static void nf_tables_unbind_set(const struct nft_ctx *ctx, struct nft_set *set,
4129 struct nft_set_binding *binding, bool event)
4131 list_del_rcu(&binding->list);
4133 if (list_empty(&set->bindings) && nft_set_is_anonymous(set)) {
4134 list_del_rcu(&set->list);
4136 nf_tables_set_notify(ctx, set, NFT_MSG_DELSET,
/*
 * Deactivate a set binding according to the transaction @phase. The
 * PREPARE, ABORT and RELEASE phases have dedicated cases whose bodies are
 * not visible here. The visible nf_tables_unbind_set() call requests a
 * notification only when @phase is NFT_TRANS_COMMIT.
 * Exported for GPL modules.
 */
4141 void nf_tables_deactivate_set(const struct nft_ctx *ctx, struct nft_set *set,
4142 struct nft_set_binding *binding,
4143 enum nft_trans_phase phase)
4146 case NFT_TRANS_PREPARE:
4149 case NFT_TRANS_ABORT:
4150 case NFT_TRANS_RELEASE:
4154 nf_tables_unbind_set(ctx, set, binding,
4155 phase == NFT_TRANS_COMMIT);
4158 EXPORT_SYMBOL_GPL(nf_tables_deactivate_set);
/*
 * Destroy @set if it is anonymous and has no bindings left; any other set
 * is left untouched. @ctx is not used by the visible code.
 * Exported for GPL modules.
 */
4160 void nf_tables_destroy_set(const struct nft_ctx *ctx, struct nft_set *set)
4162 if (list_empty(&set->bindings) && nft_set_is_anonymous(set))
4163 nft_set_destroy(set);
4165 EXPORT_SYMBOL_GPL(nf_tables_destroy_set);
/*
 * Layout table for set element extensions, indexed by NFT_SET_EXT_*.
 * Each entry gives the extension's alignment and, where a .len is visible,
 * its size. Exported for GPL modules.
 */
4167 const struct nft_set_ext_type nft_set_ext_types[] = {
4168 [NFT_SET_EXT_KEY] = {
4169 .align = __alignof__(u32),
4171 [NFT_SET_EXT_DATA] = {
4172 .align = __alignof__(u32),
4174 [NFT_SET_EXT_EXPR] = {
4175 .align = __alignof__(struct nft_expr),
4177 [NFT_SET_EXT_OBJREF] = {
4178 .len = sizeof(struct nft_object *),
4179 .align = __alignof__(struct nft_object *),
4181 [NFT_SET_EXT_FLAGS] = {
4183 .align = __alignof__(u8),
4185 [NFT_SET_EXT_TIMEOUT] = {
4187 .align = __alignof__(u64),
4189 [NFT_SET_EXT_EXPIRATION] = {
4191 .align = __alignof__(u64),
4193 [NFT_SET_EXT_USERDATA] = {
4194 .len = sizeof(struct nft_userdata),
4195 .align = __alignof__(struct nft_userdata),
4198 EXPORT_SYMBOL_GPL(nft_set_ext_types);
/*
 * Netlink attribute policy for a single set element (NFTA_SET_ELEM_*):
 * key, data and expression are nested; flags, timeout and expiration are
 * integers; userdata and the object reference name are length-limited.
 */
4204 static const struct nla_policy nft_set_elem_policy[NFTA_SET_ELEM_MAX + 1] = {
4205 [NFTA_SET_ELEM_KEY] = { .type = NLA_NESTED },
4206 [NFTA_SET_ELEM_DATA] = { .type = NLA_NESTED },
4207 [NFTA_SET_ELEM_FLAGS] = { .type = NLA_U32 },
4208 [NFTA_SET_ELEM_TIMEOUT] = { .type = NLA_U64 },
4209 [NFTA_SET_ELEM_EXPIRATION] = { .type = NLA_U64 },
4210 [NFTA_SET_ELEM_USERDATA] = { .type = NLA_BINARY,
4211 .len = NFT_USERDATA_MAXLEN },
4212 [NFTA_SET_ELEM_EXPR] = { .type = NLA_NESTED },
4213 [NFTA_SET_ELEM_OBJREF] = { .type = NLA_STRING,
4214 .len = NFT_OBJ_MAXNAMELEN - 1 },
/*
 * Netlink attribute policy for set element list messages
 * (NFTA_SET_ELEM_LIST_*): table name, set name, nested element list and
 * the u32 set ID.
 */
4217 static const struct nla_policy nft_set_elem_list_policy[NFTA_SET_ELEM_LIST_MAX + 1] = {
4218 [NFTA_SET_ELEM_LIST_TABLE] = { .type = NLA_STRING,
4219 .len = NFT_TABLE_MAXNAMELEN - 1 },
4220 [NFTA_SET_ELEM_LIST_SET] = { .type = NLA_STRING,
4221 .len = NFT_SET_MAXNAMELEN - 1 },
4222 [NFTA_SET_ELEM_LIST_ELEMENTS] = { .type = NLA_NESTED },
4223 [NFTA_SET_ELEM_LIST_SET_ID] = { .type = NLA_U32 },
/*
 * Initialise @ctx for a set element request. Unlike
 * nft_ctx_init_from_setattr(), the table lookup on
 * NFTA_SET_ELEM_LIST_TABLE is unconditional. A failed lookup flags that
 * attribute through @extack and returns the lookup's error code. The
 * chain in the context is always NULL.
 */
4226 static int nft_ctx_init_from_elemattr(struct nft_ctx *ctx, struct net *net,
4227 const struct sk_buff *skb,
4228 const struct nlmsghdr *nlh,
4229 const struct nlattr * const nla[],
4230 struct netlink_ext_ack *extack,
4233 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
4234 int family = nfmsg->nfgen_family;
4235 struct nft_table *table;
4237 table = nft_table_lookup(net, nla[NFTA_SET_ELEM_LIST_TABLE], family,
4239 if (IS_ERR(table)) {
4240 NL_SET_BAD_ATTR(extack, nla[NFTA_SET_ELEM_LIST_TABLE]);
4241 return PTR_ERR(table);
4244 nft_ctx_init(ctx, net, skb, nlh, family, table, NULL, nla);
/*
 * Serialise one set element into @skb as a nested NFTA_LIST_ELEM.
 *
 * The key is always dumped. Data, expression, object reference, flags,
 * timeout, expiration and userdata are dumped only when the element
 * carries the corresponding extension. Any failure jumps to
 * nla_put_failure. 'b' records the skb tail on entry, presumably so the
 * failure path can trim back to it (that code is not visible here).
 */
4248 static int nf_tables_fill_setelem(struct sk_buff *skb,
4249 const struct nft_set *set,
4250 const struct nft_set_elem *elem)
4252 const struct nft_set_ext *ext = nft_set_elem_ext(set, elem->priv);
4253 unsigned char *b = skb_tail_pointer(skb);
4254 struct nlattr *nest;
4256 nest = nla_nest_start_noflag(skb, NFTA_LIST_ELEM);
4258 goto nla_put_failure;
4260 if (nft_data_dump(skb, NFTA_SET_ELEM_KEY, nft_set_ext_key(ext),
4261 NFT_DATA_VALUE, set->klen) < 0)
4262 goto nla_put_failure;
/* Data is dumped as a verdict or as a plain value, per the set's dtype. */
4264 if (nft_set_ext_exists(ext, NFT_SET_EXT_DATA) &&
4265 nft_data_dump(skb, NFTA_SET_ELEM_DATA, nft_set_ext_data(ext),
4266 set->dtype == NFT_DATA_VERDICT ? NFT_DATA_VERDICT : NFT_DATA_VALUE,
4268 goto nla_put_failure;
4270 if (nft_set_ext_exists(ext, NFT_SET_EXT_EXPR) &&
4271 nft_expr_dump(skb, NFTA_SET_ELEM_EXPR, nft_set_ext_expr(ext)) < 0)
4272 goto nla_put_failure;
/* Object references are reported by the object's name. */
4274 if (nft_set_ext_exists(ext, NFT_SET_EXT_OBJREF) &&
4275 nla_put_string(skb, NFTA_SET_ELEM_OBJREF,
4276 (*nft_set_ext_obj(ext))->key.name) < 0)
4277 goto nla_put_failure;
4279 if (nft_set_ext_exists(ext, NFT_SET_EXT_FLAGS) &&
4280 nla_put_be32(skb, NFTA_SET_ELEM_FLAGS,
4281 htonl(*nft_set_ext_flags(ext))))
4282 goto nla_put_failure;
4284 if (nft_set_ext_exists(ext, NFT_SET_EXT_TIMEOUT) &&
4285 nla_put_be64(skb, NFTA_SET_ELEM_TIMEOUT,
4286 nf_jiffies64_to_msecs(*nft_set_ext_timeout(ext)),
4288 goto nla_put_failure;
/*
 * The stored expiration is compared with the current jiffies64; the
 * adjustment made in each branch is not visible here (presumably it is
 * turned into the remaining time - confirm). It is reported in msecs.
 */
4290 if (nft_set_ext_exists(ext, NFT_SET_EXT_EXPIRATION)) {
4291 u64 expires, now = get_jiffies_64();
4293 expires = *nft_set_ext_expiration(ext);
4294 if (time_before64(now, expires))
4299 if (nla_put_be64(skb, NFTA_SET_ELEM_EXPIRATION,
4300 nf_jiffies64_to_msecs(expires),
4302 goto nla_put_failure;
4305 if (nft_set_ext_exists(ext, NFT_SET_EXT_USERDATA)) {
4306 struct nft_userdata *udata;
4308 udata = nft_set_ext_userdata(ext);
/* The attribute length is udata->len + 1. */
4309 if (nla_put(skb, NFTA_SET_ELEM_USERDATA,
4310 udata->len + 1, udata->data))
4311 goto nla_put_failure;
4314 nla_nest_end(skb, nest);
/*
 * Per-dump state handed to the set walk: the netlink callback, the
 * iterator passed to ops->walk() and the skb being filled.
 * nf_tables_dump_setelem() recovers this structure from the embedded
 * iterator with container_of().
 */
4322 struct nft_set_dump_args {
4323 const struct netlink_callback *cb;
4324 struct nft_set_iter iter;
4325 struct sk_buff *skb;
/*
 * Set walk callback for element dumps: recover the enclosing
 * nft_set_dump_args from @iter and append @elem to its skb with
 * nf_tables_fill_setelem(). @ctx is not used.
 */
4328 static int nf_tables_dump_setelem(const struct nft_ctx *ctx,
4329 struct nft_set *set,
4330 const struct nft_set_iter *iter,
4331 struct nft_set_elem *elem)
4333 struct nft_set_dump_args *args;
4335 args = container_of(iter, struct nft_set_dump_args, iter);
4336 return nf_tables_fill_setelem(args->skb, set, elem);
/*
 * Context carried in cb->data across calls of an element dump: the set
 * being dumped. nf_tables_dump_set() also reads a 'ctx' member of this
 * structure, which is not visible in this listing.
 */
4339 struct nft_set_dump_ctx {
4340 const struct nft_set *set;
/*
 * Netlink dump callback that lists the elements of one set.
 *
 * First searches the namespace's tables and sets under RCU list traversal
 * for the table and set recorded in the dump context, comparing by
 * pointer. It then emits an NFT_MSG_NEWSETELEM message with the table
 * name, the set name and a nested element list filled by walking the set
 * with nf_tables_dump_setelem(). cb->args[0] holds the number of elements
 * already dumped and is passed to the walk as the skip count.
 */
4344 static int nf_tables_dump_set(struct sk_buff *skb, struct netlink_callback *cb)
4346 struct nft_set_dump_ctx *dump_ctx = cb->data;
4347 struct net *net = sock_net(skb->sk);
4348 struct nft_table *table;
4349 struct nft_set *set;
4350 struct nft_set_dump_args args;
4351 bool set_found = false;
4352 struct nfgenmsg *nfmsg;
4353 struct nlmsghdr *nlh;
4354 struct nlattr *nest;
/* Re-locate the table and set recorded when the dump started. */
4359 list_for_each_entry_rcu(table, &net->nft.tables, list) {
4360 if (dump_ctx->ctx.family != NFPROTO_UNSPEC &&
4361 dump_ctx->ctx.family != table->family)
4364 if (table != dump_ctx->ctx.table)
4367 list_for_each_entry_rcu(set, &table->sets, list) {
4368 if (set == dump_ctx->set) {
4381 event = nfnl_msg_type(NFNL_SUBSYS_NFTABLES, NFT_MSG_NEWSETELEM);
4382 portid = NETLINK_CB(cb->skb).portid;
4383 seq = cb->nlh->nlmsg_seq;
4385 nlh = nlmsg_put(skb, portid, seq, event, sizeof(struct nfgenmsg),
4388 goto nla_put_failure;
4390 nfmsg = nlmsg_data(nlh);
4391 nfmsg->nfgen_family = table->family;
4392 nfmsg->version = NFNETLINK_V0;
4393 nfmsg->res_id = htons(net->nft.base_seq & 0xffff);
4395 if (nla_put_string(skb, NFTA_SET_ELEM_LIST_TABLE, table->name))
4396 goto nla_put_failure;
4397 if (nla_put_string(skb, NFTA_SET_ELEM_LIST_SET, set->name))
4398 goto nla_put_failure;
4400 nest = nla_nest_start_noflag(skb, NFTA_SET_ELEM_LIST_ELEMENTS);
4402 goto nla_put_failure;
/* Walk the current generation, skipping elements already dumped. */
4406 args.iter.genmask = nft_genmask_cur(net);
4407 args.iter.skip = cb->args[0];
4408 args.iter.count = 0;
4410 args.iter.fn = nf_tables_dump_setelem;
4411 set->ops->walk(&dump_ctx->ctx, set, &args.iter);
4414 nla_nest_end(skb, nest);
4415 nlmsg_end(skb, nlh);
/* -EMSGSIZE is not returned as an error here; other walk errors are. */
4417 if (args.iter.err && args.iter.err != -EMSGSIZE)
4418 return args.iter.err;
/* No progress since the last call (the action taken is not visible here). */
4419 if (args.iter.count == cb->args[0])
4422 cb->args[0] = args.iter.count;
/*
 * Dump start callback for element dumps: replace cb->data with a
 * kmemdup() copy (GFP_ATOMIC) of the caller's nft_set_dump_ctx.
 * Returns 0 on success and -ENOMEM if the copy could not be allocated.
 */
4430 static int nf_tables_dump_set_start(struct netlink_callback *cb)
4432 struct nft_set_dump_ctx *dump_ctx = cb->data;
4434 cb->data = kmemdup(dump_ctx, sizeof(*dump_ctx), GFP_ATOMIC);
4436 return cb->data ? 0 : -ENOMEM;
/*
 * Dump completion callback for element dumps; installed as .done by
 * nf_tables_getsetelem(). The body is not visible here; presumably it
 * frees the context copy made by nf_tables_dump_set_start() - confirm.
 */
4439 static int nf_tables_dump_set_done(struct netlink_callback *cb)
/*
 * Build a complete netlink message describing a single set element.
 *
 * Writes the nfgenmsg header (family from @ctx, low 16 bits of the base
 * sequence as res_id), the table and set names, and a nested
 * NFTA_SET_ELEM_LIST_ELEMENTS holding @elem as serialised by
 * nf_tables_fill_setelem(). Failures jump to nla_put_failure; the visible
 * nlmsg_trim() call removes the partial message again.
 *
 * NOTE(review): the names are emitted with NFTA_SET_TABLE / NFTA_SET_NAME,
 * while nf_tables_dump_set() uses the NFTA_SET_ELEM_LIST_* constants for
 * the same purpose.
 */
4445 static int nf_tables_fill_setelem_info(struct sk_buff *skb,
4446 const struct nft_ctx *ctx, u32 seq,
4447 u32 portid, int event, u16 flags,
4448 const struct nft_set *set,
4449 const struct nft_set_elem *elem)
4451 struct nfgenmsg *nfmsg;
4452 struct nlmsghdr *nlh;
4453 struct nlattr *nest;
4456 event = nfnl_msg_type(NFNL_SUBSYS_NFTABLES, event);
4457 nlh = nlmsg_put(skb, portid, seq, event, sizeof(struct nfgenmsg),
4460 goto nla_put_failure;
4462 nfmsg = nlmsg_data(nlh);
4463 nfmsg->nfgen_family = ctx->family;
4464 nfmsg->version = NFNETLINK_V0;
4465 nfmsg->res_id = htons(ctx->net->nft.base_seq & 0xffff);
4467 if (nla_put_string(skb, NFTA_SET_TABLE, ctx->table->name))
4468 goto nla_put_failure;
4469 if (nla_put_string(skb, NFTA_SET_NAME, set->name))
4470 goto nla_put_failure;
4472 nest = nla_nest_start_noflag(skb, NFTA_SET_ELEM_LIST_ELEMENTS);
4474 goto nla_put_failure;
4476 err = nf_tables_fill_setelem(skb, set, elem);
4478 goto nla_put_failure;
4480 nla_nest_end(skb, nest);
4482 nlmsg_end(skb, nlh);
4486 nlmsg_trim(skb, nlh);
/*
 * Read the element flags from @attr into *@flags and validate them:
 * NFT_SET_ELEM_INTERVAL_END is the only flag bit tested as acceptable,
 * and it is additionally tested against sets that lack NFT_SET_INTERVAL.
 * The handling of a missing @attr and the error codes returned are not
 * visible here.
 */
4490 static int nft_setelem_parse_flags(const struct nft_set *set,
4491 const struct nlattr *attr, u32 *flags)
4496 *flags = ntohl(nla_get_be32(attr));
4497 if (*flags & ~NFT_SET_ELEM_INTERVAL_END)
4499 if (!(set->flags & NFT_SET_INTERVAL) &&
4500 *flags & NFT_SET_ELEM_INTERVAL_END)
/*
 * Look up the single element described by the nested attribute @attr in
 * @set and unicast it to the requesting socket (ctx->portid) as an
 * NFT_MSG_NEWSETELEM message.
 *
 * The key attribute is mandatory; it must decode to an NFT_DATA_VALUE of
 * exactly set->klen bytes.  The lookup goes through set->ops->get(), whose
 * ERR_PTR result is propagated.  A final -EAGAIN is reported as -ENOBUFS.
 */
4506 static int nft_get_set_elem(struct nft_ctx *ctx, struct nft_set *set,
4507 const struct nlattr *attr)
4509 struct nlattr *nla[NFTA_SET_ELEM_MAX + 1];
4510 struct nft_data_desc desc;
4511 struct nft_set_elem elem;
4512 struct sk_buff *skb;
4517 err = nla_parse_nested_deprecated(nla, NFTA_SET_ELEM_MAX, attr,
4518 nft_set_elem_policy, NULL);
4522 if (!nla[NFTA_SET_ELEM_KEY])
4525 err = nft_setelem_parse_flags(set, nla[NFTA_SET_ELEM_FLAGS], &flags);
4529 err = nft_data_init(ctx, &elem.key.val, sizeof(elem.key), &desc,
4530 nla[NFTA_SET_ELEM_KEY]);
/* Wrong key type or length: release the data initialised above. */
4535 if (desc.type != NFT_DATA_VALUE || desc.len != set->klen) {
4536 nft_data_release(&elem.key.val, desc.type);
4540 priv = set->ops->get(ctx->net, set, &elem, flags);
4542 return PTR_ERR(priv);
/* Reply buffer is allocated without sleeping (GFP_ATOMIC). */
4547 skb = nlmsg_new(NLMSG_GOODSIZE, GFP_ATOMIC);
4551 err = nf_tables_fill_setelem_info(skb, ctx, ctx->seq, ctx->portid,
4552 NFT_MSG_NEWSETELEM, 0, set, &elem);
4556 err = nfnetlink_unicast(skb, ctx->net, ctx->portid, MSG_DONTWAIT);
4557 /* This avoids a loop in nfnetlink. */
4565 /* this avoids a loop in nfnetlink. */
4566 return err == -EAGAIN ? -ENOBUFS : err;
/*
 * Netlink handler for "get set element" requests.
 *
 * Initialises the context from the element attributes and looks the set
 * up in the current generation.  With NLM_F_DUMP a netlink dump is
 * started using nf_tables_dump_set_start / nf_tables_dump_set /
 * nf_tables_dump_set_done.  Otherwise each entry nested in
 * NFTA_SET_ELEM_LIST_ELEMENTS is fetched with nft_get_set_elem().
 */
4569 /* called with rcu_read_lock held */
4570 static int nf_tables_getsetelem(struct net *net, struct sock *nlsk,
4571 struct sk_buff *skb, const struct nlmsghdr *nlh,
4572 const struct nlattr * const nla[],
4573 struct netlink_ext_ack *extack)
4575 u8 genmask = nft_genmask_cur(net);
4576 struct nft_set *set;
4577 struct nlattr *attr;
4581 err = nft_ctx_init_from_elemattr(&ctx, net, skb, nlh, nla, extack,
4586 set = nft_set_lookup(ctx.table, nla[NFTA_SET_ELEM_LIST_SET], genmask);
4588 return PTR_ERR(set);
/* Dump request: hand over to the netlink dump machinery. */
4590 if (nlh->nlmsg_flags & NLM_F_DUMP) {
4591 struct netlink_dump_control c = {
4592 .start = nf_tables_dump_set_start,
4593 .dump = nf_tables_dump_set,
4594 .done = nf_tables_dump_set_done,
4595 .module = THIS_MODULE,
4597 struct nft_set_dump_ctx dump_ctx = {
4603 return nft_netlink_dump_start_rcu(nlsk, skb, nlh, &c);
/* Non-dump request: an explicit element list is checked for here. */
4606 if (!nla[NFTA_SET_ELEM_LIST_ELEMENTS])
4609 nla_for_each_nested(attr, nla[NFTA_SET_ELEM_LIST_ELEMENTS], rem) {
4610 err = nft_get_set_elem(&ctx, set, attr);
/*
 * Send a set element event notification to the NFNLGRP_NFTABLES group.
 *
 * The condition at the top tests for "no report requested and no
 * listeners on the group".  The message is built with
 * nf_tables_fill_setelem_info() (sequence number 0) and sent with
 * nfnetlink_send(); the failure path records -ENOBUFS on the group via
 * nfnetlink_set_err().
 * NOTE(review): the early test presumably returns without doing any
 * work -- confirm.
 */
4618 static void nf_tables_setelem_notify(const struct nft_ctx *ctx,
4619 const struct nft_set *set,
4620 const struct nft_set_elem *elem,
4621 int event, u16 flags)
4623 struct net *net = ctx->net;
4624 u32 portid = ctx->portid;
4625 struct sk_buff *skb;
4628 if (!ctx->report && !nfnetlink_has_listeners(net, NFNLGRP_NFTABLES))
4631 skb = nlmsg_new(NLMSG_GOODSIZE, GFP_KERNEL);
4635 err = nf_tables_fill_setelem_info(skb, ctx, 0, portid, event, flags,
4642 nfnetlink_send(skb, net, portid, NFNLGRP_NFTABLES, ctx->report,
4646 nfnetlink_set_err(net, portid, NFNLGRP_NFTABLES, -ENOBUFS);
/*
 * Allocate a transaction object sized for a struct nft_trans_elem with
 * the given message type and record @set in it.
 */
4649 static struct nft_trans *nft_trans_elem_alloc(struct nft_ctx *ctx,
4651 struct nft_set *set)
4653 struct nft_trans *trans;
4655 trans = nft_trans_alloc(ctx, msg_type, sizeof(struct nft_trans_elem));
4659 nft_trans_elem_set(trans) = set;
/*
 * Allocate and initialise a set element.
 *
 * The element is a zeroed allocation of set->ops->elemsize plus the
 * template length.  Extensions are laid out from @tmpl; the key is always
 * copied (set->klen bytes), the data only when the template has a DATA
 * extension (set->dlen bytes).  When an EXPIRATION extension exists it is
 * set to now (get_jiffies_64()) plus @expiration, and @timeout is added
 * on top when @expiration is 0.  A TIMEOUT extension stores @timeout.
 */
4663 void *nft_set_elem_init(const struct nft_set *set,
4664 const struct nft_set_ext_tmpl *tmpl,
4665 const u32 *key, const u32 *data,
4666 u64 timeout, u64 expiration, gfp_t gfp)
4668 struct nft_set_ext *ext;
4671 elem = kzalloc(set->ops->elemsize + tmpl->len, gfp);
4675 ext = nft_set_elem_ext(set, elem);
4676 nft_set_ext_init(ext, tmpl);
4678 memcpy(nft_set_ext_key(ext), key, set->klen);
4679 if (nft_set_ext_exists(ext, NFT_SET_EXT_DATA))
4680 memcpy(nft_set_ext_data(ext), data, set->dlen);
4681 if (nft_set_ext_exists(ext, NFT_SET_EXT_EXPIRATION)) {
4682 *nft_set_ext_expiration(ext) = get_jiffies_64() + expiration;
/* No explicit expiration given: expire one timeout period from now. */
4683 if (expiration == 0)
4684 *nft_set_ext_expiration(ext) += timeout;
4686 if (nft_set_ext_exists(ext, NFT_SET_EXT_TIMEOUT))
4687 *nft_set_ext_timeout(ext) = timeout;
/*
 * Release everything a set element references.
 *
 * Releases the key data, the data extension (typed by set->dtype) when
 * present, optionally the attached expression (when destroy_expr is set
 * and an EXPR extension exists) and drops the use count of a referenced
 * object when an OBJREF extension exists.  A local nft_ctx is built from
 * the set's netns and table family for the expression callbacks.
 */
4692 void nft_set_elem_destroy(const struct nft_set *set, void *elem,
4695 struct nft_set_ext *ext = nft_set_elem_ext(set, elem);
4696 struct nft_ctx ctx = {
4697 .net = read_pnet(&set->net),
4698 .family = set->table->family,
4701 nft_data_release(nft_set_ext_key(ext), NFT_DATA_VALUE);
4702 if (nft_set_ext_exists(ext, NFT_SET_EXT_DATA))
4703 nft_data_release(nft_set_ext_data(ext), set->dtype);
4704 if (destroy_expr && nft_set_ext_exists(ext, NFT_SET_EXT_EXPR)) {
4705 struct nft_expr *expr = nft_set_ext_expr(ext);
/*
 * Expressions providing destroy_clone are torn down through it and the
 * owning module reference is dropped here.
 * NOTE(review): nf_tables_expr_destroy() below is presumably the
 * alternative branch for expressions without destroy_clone -- confirm.
 */
4707 if (expr->ops->destroy_clone) {
4708 expr->ops->destroy_clone(&ctx, expr);
4709 module_put(expr->ops->type->owner);
4711 nf_tables_expr_destroy(&ctx, expr);
4714 if (nft_set_ext_exists(ext, NFT_SET_EXT_OBJREF))
4715 (*nft_set_ext_obj(ext))->use--;
4718 EXPORT_SYMBOL_GPL(nft_set_elem_destroy);
4720 /* Only called from commit path, nft_set_elem_deactivate() already deals with
4721 * the refcounting from the preparation phase.
/*
 * Destroy the expression attached to a set element, if it has an EXPR
 * extension, using the caller supplied context.
 */
4723 static void nf_tables_set_elem_destroy(const struct nft_ctx *ctx,
4724 const struct nft_set *set, void *elem)
4726 struct nft_set_ext *ext = nft_set_elem_ext(set, elem);
4728 if (nft_set_ext_exists(ext, NFT_SET_EXT_EXPR))
4729 nf_tables_expr_destroy(ctx, nft_set_ext_expr(ext));
/*
 * Add one element, described by the nested attribute @attr, to @set as
 * part of the current transaction.
 *
 * Visible steps, in order:
 *  - parse the nested attributes and the element flags;
 *  - check attribute combinations against the set flags (map data,
 *    interval end markers, timeout/expiration on NFT_SET_TIMEOUT sets);
 *  - initialise the key (must be an NFT_DATA_VALUE of set->klen bytes)
 *    and build the extension template (key, expiration, timeout, object
 *    reference, data, userdata);
 *  - for data, validate the register store against every map binding of
 *    the set and update the validation state for jump/goto verdicts;
 *  - allocate the element, fill in flags, userdata and object reference;
 *  - allocate an NFT_MSG_NEWSETELEM transaction, mark the element busy in
 *    the current generation and insert it through set->ops->insert();
 *  - on -EEXIST compare data/object reference of the new and the reported
 *    element (ext2) and take NLM_F_EXCL into account;
 *  - account the element against set->size and queue the transaction on
 *    the netns commit list.
 * The tail of the function is the error unwinding: the element is removed
 * from the set again and key/data are released.
 * NOTE(review): the exact error codes and unwinding labels are not part
 * of this excerpt.
 */
4733 static int nft_add_set_elem(struct nft_ctx *ctx, struct nft_set *set,
4734 const struct nlattr *attr, u32 nlmsg_flags)
4736 struct nlattr *nla[NFTA_SET_ELEM_MAX + 1];
4737 u8 genmask = nft_genmask_next(ctx->net);
4738 struct nft_data_desc d1, d2;
4739 struct nft_set_ext_tmpl tmpl;
4740 struct nft_set_ext *ext, *ext2;
4741 struct nft_set_elem elem;
4742 struct nft_set_binding *binding;
4743 struct nft_object *obj = NULL;
4744 struct nft_userdata *udata;
4745 struct nft_data data;
4746 enum nft_registers dreg;
4747 struct nft_trans *trans;
4754 err = nla_parse_nested_deprecated(nla, NFTA_SET_ELEM_MAX, attr,
4755 nft_set_elem_policy, NULL);
4759 if (nla[NFTA_SET_ELEM_KEY] == NULL)
4762 nft_set_ext_prepare(&tmpl);
4764 err = nft_setelem_parse_flags(set, nla[NFTA_SET_ELEM_FLAGS], &flags);
4768 nft_set_ext_add(&tmpl, NFT_SET_EXT_FLAGS);
/* Maps: the data attribute may only be absent on interval end markers. */
4770 if (set->flags & NFT_SET_MAP) {
4771 if (nla[NFTA_SET_ELEM_DATA] == NULL &&
4772 !(flags & NFT_SET_ELEM_INTERVAL_END))
4775 if (nla[NFTA_SET_ELEM_DATA] != NULL)
/* Interval end markers are tested for carrying any payload attribute. */
4779 if ((flags & NFT_SET_ELEM_INTERVAL_END) &&
4780 (nla[NFTA_SET_ELEM_DATA] ||
4781 nla[NFTA_SET_ELEM_OBJREF] ||
4782 nla[NFTA_SET_ELEM_TIMEOUT] ||
4783 nla[NFTA_SET_ELEM_EXPIRATION] ||
4784 nla[NFTA_SET_ELEM_USERDATA] ||
4785 nla[NFTA_SET_ELEM_EXPR]))
/* Per-element timeout, falling back to the set default on timeout sets. */
4789 if (nla[NFTA_SET_ELEM_TIMEOUT] != NULL) {
4790 if (!(set->flags & NFT_SET_TIMEOUT))
4792 err = nf_msecs_to_jiffies64(nla[NFTA_SET_ELEM_TIMEOUT],
4796 } else if (set->flags & NFT_SET_TIMEOUT) {
4797 timeout = set->timeout;
4801 if (nla[NFTA_SET_ELEM_EXPIRATION] != NULL) {
4802 if (!(set->flags & NFT_SET_TIMEOUT))
4804 err = nf_msecs_to_jiffies64(nla[NFTA_SET_ELEM_EXPIRATION],
4810 err = nft_data_init(ctx, &elem.key.val, sizeof(elem.key), &d1,
4811 nla[NFTA_SET_ELEM_KEY]);
4815 if (d1.type != NFT_DATA_VALUE || d1.len != set->klen)
4818 nft_set_ext_add_length(&tmpl, NFT_SET_EXT_KEY, d1.len);
/* A TIMEOUT extension is only added when it differs from the set default. */
4820 nft_set_ext_add(&tmpl, NFT_SET_EXT_EXPIRATION);
4821 if (timeout != set->timeout)
4822 nft_set_ext_add(&tmpl, NFT_SET_EXT_TIMEOUT);
/* Object references are looked up in the next generation (genmask). */
4825 if (nla[NFTA_SET_ELEM_OBJREF] != NULL) {
4826 if (!(set->flags & NFT_SET_OBJECT)) {
4830 obj = nft_obj_lookup(ctx->net, ctx->table,
4831 nla[NFTA_SET_ELEM_OBJREF],
4832 set->objtype, genmask);
4837 nft_set_ext_add(&tmpl, NFT_SET_EXT_OBJREF);
4840 if (nla[NFTA_SET_ELEM_DATA] != NULL) {
4841 err = nft_data_init(ctx, &data, sizeof(data), &d2,
4842 nla[NFTA_SET_ELEM_DATA]);
4847 if (set->dtype != NFT_DATA_VERDICT && d2.len != set->dlen)
/* Check the data against each map binding of this set. */
4850 dreg = nft_type_to_reg(set->dtype);
4851 list_for_each_entry(binding, &set->bindings, list) {
4852 struct nft_ctx bind_ctx = {
4854 .family = ctx->family,
4855 .table = ctx->table,
4856 .chain = (struct nft_chain *)binding->chain,
4859 if (!(binding->flags & NFT_SET_MAP))
4862 err = nft_validate_register_store(&bind_ctx, dreg,
4868 if (d2.type == NFT_DATA_VERDICT &&
4869 (data.verdict.code == NFT_GOTO ||
4870 data.verdict.code == NFT_JUMP))
4871 nft_validate_state_update(ctx->net,
4875 nft_set_ext_add_length(&tmpl, NFT_SET_EXT_DATA, d2.len);
4878 /* The full maximum length of userdata can exceed the maximum
4879 * offset value (U8_MAX) for following extensions, therefor it
4880 * must be the last extension added.
4883 if (nla[NFTA_SET_ELEM_USERDATA] != NULL) {
4884 ulen = nla_len(nla[NFTA_SET_ELEM_USERDATA]);
4886 nft_set_ext_add_length(&tmpl, NFT_SET_EXT_USERDATA,
4891 elem.priv = nft_set_elem_init(set, &tmpl, elem.key.val.data, data.data,
4892 timeout, expiration, GFP_KERNEL);
4893 if (elem.priv == NULL)
4896 ext = nft_set_elem_ext(set, elem.priv);
4898 *nft_set_ext_flags(ext) = flags;
4900 udata = nft_set_ext_userdata(ext);
4901 udata->len = ulen - 1;
4902 nla_memcpy(&udata->data, nla[NFTA_SET_ELEM_USERDATA], ulen);
4905 *nft_set_ext_obj(ext) = obj;
4909 trans = nft_trans_elem_alloc(ctx, NFT_MSG_NEWSETELEM, set);
4913 ext->genmask = nft_genmask_cur(ctx->net) | NFT_SET_ELEM_BUSY_MASK;
4914 err = set->ops->insert(ctx->net, set, &elem, &ext2);
4916 if (err == -EEXIST) {
4917 if (nft_set_ext_exists(ext, NFT_SET_EXT_DATA) ^
4918 nft_set_ext_exists(ext2, NFT_SET_EXT_DATA) ||
4919 nft_set_ext_exists(ext, NFT_SET_EXT_OBJREF) ^
4920 nft_set_ext_exists(ext2, NFT_SET_EXT_OBJREF)) {
4924 if ((nft_set_ext_exists(ext, NFT_SET_EXT_DATA) &&
4925 nft_set_ext_exists(ext2, NFT_SET_EXT_DATA) &&
4926 memcmp(nft_set_ext_data(ext),
4927 nft_set_ext_data(ext2), set->dlen) != 0) ||
4928 (nft_set_ext_exists(ext, NFT_SET_EXT_OBJREF) &&
4929 nft_set_ext_exists(ext2, NFT_SET_EXT_OBJREF) &&
4930 *nft_set_ext_obj(ext) != *nft_set_ext_obj(ext2)))
4932 else if (!(nlmsg_flags & NLM_F_EXCL))
4939 !atomic_add_unless(&set->nelems, 1, set->size + set->ndeact)) {
4944 nft_trans_elem(trans) = elem;
4945 list_add_tail(&trans->list, &ctx->net->nft.commit_list);
4949 set->ops->remove(ctx->net, set, &elem);
4957 if (nla[NFTA_SET_ELEM_DATA] != NULL)
4958 nft_data_release(&data, d2.type);
4960 nft_data_release(&elem.key.val, d1.type);
/*
 * Netlink handler for adding elements to a set.
 *
 * Requires NFTA_SET_ELEM_LIST_ELEMENTS.  The set is resolved by name or
 * by set id in the next generation.  A set that is both bound and flagged
 * NFT_SET_CONSTANT is tested for before any element is processed.  Each
 * nested element is added with nft_add_set_elem(); when the netns
 * validation state is NFT_VALIDATE_DO the table is validated afterwards.
 * NOTE(review): the constant-and-bound test presumably rejects the
 * request -- the return statement is not part of this excerpt.
 */
4965 static int nf_tables_newsetelem(struct net *net, struct sock *nlsk,
4966 struct sk_buff *skb, const struct nlmsghdr *nlh,
4967 const struct nlattr * const nla[],
4968 struct netlink_ext_ack *extack)
4970 u8 genmask = nft_genmask_next(net);
4971 const struct nlattr *attr;
4972 struct nft_set *set;
4976 if (nla[NFTA_SET_ELEM_LIST_ELEMENTS] == NULL)
4979 err = nft_ctx_init_from_elemattr(&ctx, net, skb, nlh, nla, extack,
4984 set = nft_set_lookup_global(net, ctx.table, nla[NFTA_SET_ELEM_LIST_SET],
4985 nla[NFTA_SET_ELEM_LIST_SET_ID], genmask);
4987 return PTR_ERR(set);
4989 if (!list_empty(&set->bindings) && set->flags & NFT_SET_CONSTANT)
4992 nla_for_each_nested(attr, nla[NFTA_SET_ELEM_LIST_ELEMENTS], rem) {
4993 err = nft_add_set_elem(&ctx, set, attr, nlh->nlmsg_flags);
4998 if (net->nft.validate_state == NFT_VALIDATE_DO)
4999 return nft_table_validate(net, ctx.table);
5005 * nft_data_hold - hold a nft_data item
5007 * @data: struct nft_data to hold
5008 * @type: type of data
5010 * Hold a nft_data item. NFT_DATA_VALUE types can be silently discarded,
5011 * NFT_DATA_VERDICT bumps the reference to chains in case of NFT_JUMP and
5012 * NFT_GOTO verdicts. This function must be called on active data objects
5013 * from the second phase of the commit protocol.
/*
 * Only NFT_DATA_VERDICT data is acted upon: depending on the verdict
 * code, the use counter of the chain the verdict points to is bumped.
 */
5015 void nft_data_hold(const struct nft_data *data, enum nft_data_types type)
5017 if (type == NFT_DATA_VERDICT) {
5018 switch (data->verdict.code) {
5021 data->verdict.chain->use++;
/*
 * Take the references an element holds: nft_data_hold() on the data
 * extension (typed by set->dtype) when present, and one more use of the
 * referenced object when an OBJREF extension is present.
 */
5027 static void nft_set_elem_activate(const struct net *net,
5028 const struct nft_set *set,
5029 struct nft_set_elem *elem)
5031 const struct nft_set_ext *ext = nft_set_elem_ext(set, elem->priv);
5033 if (nft_set_ext_exists(ext, NFT_SET_EXT_DATA))
5034 nft_data_hold(nft_set_ext_data(ext), set->dtype);
5035 if (nft_set_ext_exists(ext, NFT_SET_EXT_OBJREF))
5036 (*nft_set_ext_obj(ext))->use++;
/*
 * Counterpart of nft_set_elem_activate(): releases the data extension
 * (typed by set->dtype) when present and drops one use of the referenced
 * object when an OBJREF extension is present.
 */
5039 static void nft_set_elem_deactivate(const struct net *net,
5040 const struct nft_set *set,
5041 struct nft_set_elem *elem)
5043 const struct nft_set_ext *ext = nft_set_elem_ext(set, elem->priv);
5045 if (nft_set_ext_exists(ext, NFT_SET_EXT_DATA))
5046 nft_data_release(nft_set_ext_data(ext), set->dtype);
5047 if (nft_set_ext_exists(ext, NFT_SET_EXT_OBJREF))
5048 (*nft_set_ext_obj(ext))->use--;
/*
 * Delete the element described by the nested attribute @attr from @set
 * as part of the current transaction.
 *
 * A temporary element holding only the key (and flags) is built from the
 * request and handed to set->ops->deactivate().  On the success path the
 * element's references are dropped with nft_set_elem_deactivate() and an
 * NFT_MSG_DELSETELEM transaction is queued on the netns commit list.  The
 * last visible statement belongs to the error unwinding and releases the
 * key data.
 * NOTE(review): how the result of ->deactivate() replaces the temporary
 * element is not part of this excerpt.
 */
5051 static int nft_del_setelem(struct nft_ctx *ctx, struct nft_set *set,
5052 const struct nlattr *attr)
5054 struct nlattr *nla[NFTA_SET_ELEM_MAX + 1];
5055 struct nft_set_ext_tmpl tmpl;
5056 struct nft_data_desc desc;
5057 struct nft_set_elem elem;
5058 struct nft_set_ext *ext;
5059 struct nft_trans *trans;
5064 err = nla_parse_nested_deprecated(nla, NFTA_SET_ELEM_MAX, attr,
5065 nft_set_elem_policy, NULL);
5070 if (nla[NFTA_SET_ELEM_KEY] == NULL)
5073 nft_set_ext_prepare(&tmpl);
5075 err = nft_setelem_parse_flags(set, nla[NFTA_SET_ELEM_FLAGS], &flags);
5079 nft_set_ext_add(&tmpl, NFT_SET_EXT_FLAGS);
5081 err = nft_data_init(ctx, &elem.key.val, sizeof(elem.key), &desc,
5082 nla[NFTA_SET_ELEM_KEY]);
5087 if (desc.type != NFT_DATA_VALUE || desc.len != set->klen)
5090 nft_set_ext_add_length(&tmpl, NFT_SET_EXT_KEY, desc.len);
/* Key-only element: no data, timeout 0. */
5093 elem.priv = nft_set_elem_init(set, &tmpl, elem.key.val.data, NULL, 0,
5095 if (elem.priv == NULL)
5098 ext = nft_set_elem_ext(set, elem.priv);
5100 *nft_set_ext_flags(ext) = flags;
5102 trans = nft_trans_elem_alloc(ctx, NFT_MSG_DELSETELEM, set);
5103 if (trans == NULL) {
5108 priv = set->ops->deactivate(ctx->net, set, &elem);
5116 nft_set_elem_deactivate(ctx->net, set, &elem);
5118 nft_trans_elem(trans) = elem;
5119 list_add_tail(&trans->list, &ctx->net->nft.commit_list);
5127 nft_data_release(&elem.key.val, desc.type);
/*
 * Set walk callback (installed as iter.fn by nf_tables_delsetelem()) that
 * deletes one element while flushing a whole set.
 *
 * Allocates an NFT_MSG_DELSETELEM transaction with GFP_ATOMIC, asks the
 * backend to flush the element via set->ops->flush(), drops the element's
 * references and queues the transaction (set + element copy) on the netns
 * commit list.
 */
5132 static int nft_flush_set(const struct nft_ctx *ctx,
5133 struct nft_set *set,
5134 const struct nft_set_iter *iter,
5135 struct nft_set_elem *elem)
5137 struct nft_trans *trans;
5140 trans = nft_trans_alloc_gfp(ctx, NFT_MSG_DELSETELEM,
5141 sizeof(struct nft_trans_elem), GFP_ATOMIC);
/* A false result from ->flush() takes the error branch. */
5145 if (!set->ops->flush(ctx->net, set, elem->priv)) {
5151 nft_set_elem_deactivate(ctx->net, set, elem);
5152 nft_trans_elem_set(trans) = set;
5153 nft_trans_elem(trans) = *elem;
5154 list_add_tail(&trans->list, &ctx->net->nft.commit_list);
/*
 * Netlink handler for deleting set elements.
 *
 * The set is looked up by name in the next generation.  A set that is
 * both bound and flagged NFT_SET_CONSTANT is tested for first.  Without
 * an element list the whole set is walked with nft_flush_set() as the
 * callback; otherwise every nested element is removed with
 * nft_del_setelem().
 */
5162 static int nf_tables_delsetelem(struct net *net, struct sock *nlsk,
5163 struct sk_buff *skb, const struct nlmsghdr *nlh,
5164 const struct nlattr * const nla[],
5165 struct netlink_ext_ack *extack)
5167 u8 genmask = nft_genmask_next(net);
5168 const struct nlattr *attr;
5169 struct nft_set *set;
5173 err = nft_ctx_init_from_elemattr(&ctx, net, skb, nlh, nla, extack,
5178 set = nft_set_lookup(ctx.table, nla[NFTA_SET_ELEM_LIST_SET], genmask);
5180 return PTR_ERR(set);
5181 if (!list_empty(&set->bindings) && set->flags & NFT_SET_CONSTANT)
/* No explicit element list: flush every element of the set. */
5184 if (nla[NFTA_SET_ELEM_LIST_ELEMENTS] == NULL) {
5185 struct nft_set_iter iter = {
5187 .fn = nft_flush_set,
5189 set->ops->walk(&ctx, set, &iter);
5194 nla_for_each_nested(attr, nla[NFTA_SET_ELEM_LIST_ELEMENTS], rem) {
5195 err = nft_del_setelem(&ctx, set, attr);
/*
 * RCU callback releasing a garbage collection batch: recovers the batch
 * from its embedded rcu head and destroys each of the head.cnt collected
 * elements, including their expressions (destroy_expr == true).
 */
5204 void nft_set_gc_batch_release(struct rcu_head *rcu)
5206 struct nft_set_gc_batch *gcb;
5209 gcb = container_of(rcu, struct nft_set_gc_batch, head.rcu);
5210 for (i = 0; i < gcb->head.cnt; i++)
5211 nft_set_elem_destroy(gcb->head.set, gcb->elems[i], true);
5214 EXPORT_SYMBOL_GPL(nft_set_gc_batch_release);
/*
 * Allocate a zeroed garbage collection batch with the given gfp flags and
 * associate it with @set.
 */
5216 struct nft_set_gc_batch *nft_set_gc_batch_alloc(const struct nft_set *set,
5219 struct nft_set_gc_batch *gcb;
5221 gcb = kzalloc(sizeof(*gcb), gfp);
5224 gcb->head.set = set;
5227 EXPORT_SYMBOL_GPL(nft_set_gc_batch_alloc);
5234 * nft_register_obj - register nf_tables stateful object type
5237 * Registers the object type for use with nf_tables. Returns zero on
5238 * success or a negative errno code otherwise.
/*
 * The type id NFT_OBJECT_UNSPEC is tested for up front.  The type is then
 * added to the nf_tables_objects list under the nftables nfnl lock.
 * NOTE(review): NFT_OBJECT_UNSPEC presumably fails the registration.
 */
5240 int nft_register_obj(struct nft_object_type *obj_type)
5242 if (obj_type->type == NFT_OBJECT_UNSPEC)
5245 nfnl_lock(NFNL_SUBSYS_NFTABLES);
5246 list_add_rcu(&obj_type->list, &nf_tables_objects);
5247 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
5250 EXPORT_SYMBOL_GPL(nft_register_obj);
5253 * nft_unregister_obj - unregister nf_tables object type
5256 * Unregisters the object type for use with nf_tables.
/* Removes the type from its list (RCU deletion) under the nftables nfnl lock. */
5258 void nft_unregister_obj(struct nft_object_type *obj_type)
5260 nfnl_lock(NFNL_SUBSYS_NFTABLES);
5261 list_del_rcu(&obj_type->list);
5262 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
5264 EXPORT_SYMBOL_GPL(nft_unregister_obj);
/*
 * Find a stateful object by name within @table.
 *
 * The name attribute is copied into a local buffer of NFT_OBJ_MAXNAMELEN
 * bytes and looked up in the nft_objname_ht hash list table using a key
 * that includes the table.  Among the candidates, the one whose type
 * matches @objtype and that is active in the given generation is
 * selected.  Returns ERR_PTR(-ENOENT) when nothing matches.
 *
 * Emits a one-time warning unless the RCU read lock or the commit lock is
 * held.
 */
5266 struct nft_object *nft_obj_lookup(const struct net *net,
5267 const struct nft_table *table,
5268 const struct nlattr *nla, u32 objtype,
5271 struct nft_object_hash_key k = { .table = table };
5272 char search[NFT_OBJ_MAXNAMELEN];
5273 struct rhlist_head *tmp, *list;
5274 struct nft_object *obj;
5276 nla_strlcpy(search, nla, sizeof(search));
5279 WARN_ON_ONCE(!rcu_read_lock_held() &&
5280 !lockdep_commit_lock_is_held(net));
5283 list = rhltable_lookup(&nft_objname_ht, &k, nft_objname_ht_params);
5287 rhl_for_each_entry_rcu(obj, tmp, list, rhlhead) {
5288 if (objtype == obj->ops->type->type &&
5289 nft_active_genmask(obj, genmask)) {
5296 return ERR_PTR(-ENOENT);
5298 EXPORT_SYMBOL_GPL(nft_obj_lookup);
/*
 * Find a stateful object in @table by its 64-bit handle (big endian in
 * the attribute).  The object must also match @objtype and be active in
 * the given generation.  Returns ERR_PTR(-ENOENT) when nothing matches.
 */
5300 static struct nft_object *nft_obj_lookup_byhandle(const struct nft_table *table,
5301 const struct nlattr *nla,
5302 u32 objtype, u8 genmask)
5304 struct nft_object *obj;
5306 list_for_each_entry(obj, &table->objects, list) {
5307 if (be64_to_cpu(nla_get_be64(nla)) == obj->handle &&
5308 objtype == obj->ops->type->type &&
5309 nft_active_genmask(obj, genmask))
5312 return ERR_PTR(-ENOENT);
/*
 * Netlink attribute policy for NFTA_OBJ_* attributes: table and object
 * names are strings limited to their maximum name length minus one, the
 * type is a u32, the data is a nested attribute and the handle a u64.
 */
5315 static const struct nla_policy nft_obj_policy[NFTA_OBJ_MAX + 1] = {
5316 [NFTA_OBJ_TABLE] = { .type = NLA_STRING,
5317 .len = NFT_TABLE_MAXNAMELEN - 1 },
5318 [NFTA_OBJ_NAME] = { .type = NLA_STRING,
5319 .len = NFT_OBJ_MAXNAMELEN - 1 },
5320 [NFTA_OBJ_TYPE] = { .type = NLA_U32 },
5321 [NFTA_OBJ_DATA] = { .type = NLA_NESTED },
5322 [NFTA_OBJ_HANDLE] = { .type = NLA_U64},
/*
 * Instantiate a stateful object of the given type from the netlink
 * attribute @attr.
 *
 * A temporary attribute table with type->maxattr + 1 slots is allocated
 * and filled by parsing @attr against the type's policy.  The operations
 * come from type->select_ops() when the type provides it.  The object is
 * a zeroed allocation of the base struct plus ops->size and is
 * initialised through ops->init().  Failures are returned as ERR_PTR().
 * NOTE(review): the memset of the table is presumably the branch taken
 * when no attribute is supplied -- confirm.
 */
5325 static struct nft_object *nft_obj_init(const struct nft_ctx *ctx,
5326 const struct nft_object_type *type,
5327 const struct nlattr *attr)
5330 const struct nft_object_ops *ops;
5331 struct nft_object *obj;
5334 tb = kmalloc_array(type->maxattr + 1, sizeof(*tb), GFP_KERNEL);
5339 err = nla_parse_nested_deprecated(tb, type->maxattr, attr,
5340 type->policy, NULL);
5344 memset(tb, 0, sizeof(tb[0]) * (type->maxattr + 1));
5347 if (type->select_ops) {
5348 ops = type->select_ops(ctx, (const struct nlattr * const *)tb);
5358 obj = kzalloc(sizeof(*obj) + ops->size, GFP_KERNEL);
5362 err = ops->init(ctx, (const struct nlattr * const *)tb, obj);
5375 return ERR_PTR(err);
/*
 * Dump the object's private data into a nested attribute of type @attr
 * by calling obj->ops->dump(); @reset is passed through to that callback.
 * Failure to open the nest or a negative result from the callback jumps
 * to nla_put_failure.
 */
5378 static int nft_object_dump(struct sk_buff *skb, unsigned int attr,
5379 struct nft_object *obj, bool reset)
5381 struct nlattr *nest;
5383 nest = nla_nest_start_noflag(skb, attr);
5385 goto nla_put_failure;
5386 if (obj->ops->dump(skb, obj, reset) < 0)
5387 goto nla_put_failure;
5388 nla_nest_end(skb, nest);
/*
 * Search the registered object types (nf_tables_objects) for the one
 * whose type id equals @objtype.  No module reference is taken here.
 */
5395 static const struct nft_object_type *__nft_obj_type_get(u32 objtype)
5397 const struct nft_object_type *type;
5399 list_for_each_entry(type, &nf_tables_objects, list) {
5400 if (objtype == type->type)
/*
 * Look up an object type and take a reference on its owning module.
 *
 * If the type is unknown (or its module cannot be pinned) and module
 * support is configured, loading "nft-obj-<objtype>" is requested; when
 * the type is registered afterwards, ERR_PTR(-EAGAIN) is returned.  In
 * all remaining cases the result is ERR_PTR(-ENOENT).
 */
5406 static const struct nft_object_type *
5407 nft_obj_type_get(struct net *net, u32 objtype)
5409 const struct nft_object_type *type;
5411 type = __nft_obj_type_get(objtype);
5412 if (type != NULL && try_module_get(type->owner))
5415 lockdep_nfnl_nft_mutex_not_held();
5416 #ifdef CONFIG_MODULES
5418 nft_request_module(net, "nft-obj-%u", objtype);
5419 if (__nft_obj_type_get(objtype))
5420 return ERR_PTR(-EAGAIN);
5423 return ERR_PTR(-ENOENT);
/*
 * Queue an update of the existing object @obj.
 *
 * A replacement object is built from @attr with nft_obj_init() and stored
 * in an NFT_MSG_NEWOBJ transaction together with the original object and
 * the update flag; the transaction is appended to the netns commit list.
 * If building the replacement fails, control goes to err_free_trans.
 */
5426 static int nf_tables_updobj(const struct nft_ctx *ctx,
5427 const struct nft_object_type *type,
5428 const struct nlattr *attr,
5429 struct nft_object *obj)
5431 struct nft_object *newobj;
5432 struct nft_trans *trans;
5435 trans = nft_trans_alloc(ctx, NFT_MSG_NEWOBJ,
5436 sizeof(struct nft_trans_obj));
5440 newobj = nft_obj_init(ctx, type, attr);
5441 if (IS_ERR(newobj)) {
5442 err = PTR_ERR(newobj);
5443 goto err_free_trans;
5446 nft_trans_obj(trans) = obj;
5447 nft_trans_obj_update(trans) = true;
5448 nft_trans_obj_newobj(trans) = newobj;
5449 list_add_tail(&trans->list, &ctx->net->nft.commit_list);
/*
 * Netlink handler for creating (or updating) a stateful object.
 *
 * Type, name and data attributes are checked for first.  The table and
 * then the object are looked up in the next generation.  For an existing
 * object, NLM_F_EXCL and NLM_F_REPLACE are inspected and the request is
 * otherwise turned into an update via nf_tables_updobj().  For a new
 * object the type is resolved (taking a module reference), the object is
 * initialised, given the table, a fresh handle and a copy of its name,
 * added to the transaction, inserted into the name hash table and linked
 * into the table's object list.
 *
 * The statements at the end are the error unwinding: the name is freed,
 * the object's destroy callback is invoked when present and the module
 * reference is dropped.
 */
5458 static int nf_tables_newobj(struct net *net, struct sock *nlsk,
5459 struct sk_buff *skb, const struct nlmsghdr *nlh,
5460 const struct nlattr * const nla[],
5461 struct netlink_ext_ack *extack)
5463 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
5464 const struct nft_object_type *type;
5465 u8 genmask = nft_genmask_next(net);
5466 int family = nfmsg->nfgen_family;
5467 struct nft_table *table;
5468 struct nft_object *obj;
5473 if (!nla[NFTA_OBJ_TYPE] ||
5474 !nla[NFTA_OBJ_NAME] ||
5475 !nla[NFTA_OBJ_DATA])
5478 table = nft_table_lookup(net, nla[NFTA_OBJ_TABLE], family, genmask);
5479 if (IS_ERR(table)) {
5480 NL_SET_BAD_ATTR(extack, nla[NFTA_OBJ_TABLE]);
5481 return PTR_ERR(table);
5484 objtype = ntohl(nla_get_be32(nla[NFTA_OBJ_TYPE]));
5485 obj = nft_obj_lookup(net, table, nla[NFTA_OBJ_NAME], objtype, genmask);
/* Lookup errors other than "not found" are attributed to the name. */
5488 if (err != -ENOENT) {
5489 NL_SET_BAD_ATTR(extack, nla[NFTA_OBJ_NAME]);
5493 if (nlh->nlmsg_flags & NLM_F_EXCL) {
5494 NL_SET_BAD_ATTR(extack, nla[NFTA_OBJ_NAME]);
5497 if (nlh->nlmsg_flags & NLM_F_REPLACE)
/* Existing object: no new module reference is taken for the update. */
5500 type = __nft_obj_type_get(objtype);
5501 nft_ctx_init(&ctx, net, skb, nlh, family, table, NULL, nla);
5503 return nf_tables_updobj(&ctx, type, nla[NFTA_OBJ_DATA], obj);
5506 nft_ctx_init(&ctx, net, skb, nlh, family, table, NULL, nla);
5508 type = nft_obj_type_get(net, objtype);
5510 return PTR_ERR(type);
5512 obj = nft_obj_init(&ctx, type, nla[NFTA_OBJ_DATA]);
5517 obj->key.table = table;
5518 obj->handle = nf_tables_alloc_handle(table);
5520 obj->key.name = nla_strdup(nla[NFTA_OBJ_NAME], GFP_KERNEL);
5521 if (!obj->key.name) {
5526 err = nft_trans_obj_add(&ctx, NFT_MSG_NEWOBJ, obj);
5530 err = rhltable_insert(&nft_objname_ht, &obj->rhlhead,
5531 nft_objname_ht_params);
5535 list_add_tail_rcu(&obj->list, &table->objects);
5539 /* queued in transaction log */
5540 INIT_LIST_HEAD(&obj->list);
5543 kfree(obj->key.name);
5545 if (obj->ops->destroy)
5546 obj->ops->destroy(&ctx, obj);
5549 module_put(type->owner);
/*
 * Build one stateful object netlink message in @skb.
 *
 * After the nfgenmsg header (family, NFNETLINK_V0, res_id from the low
 * 16 bits of the netns base_seq) the message carries the table name, the
 * object name, type, use count, the object's private data (through
 * nft_object_dump(), which receives @reset) and the handle.  Any failure
 * jumps to nla_put_failure; the failure path trims the partial message.
 */
5553 static int nf_tables_fill_obj_info(struct sk_buff *skb, struct net *net,
5554 u32 portid, u32 seq, int event, u32 flags,
5555 int family, const struct nft_table *table,
5556 struct nft_object *obj, bool reset)
5558 struct nfgenmsg *nfmsg;
5559 struct nlmsghdr *nlh;
5561 event = nfnl_msg_type(NFNL_SUBSYS_NFTABLES, event);
5562 nlh = nlmsg_put(skb, portid, seq, event, sizeof(struct nfgenmsg), flags);
5564 goto nla_put_failure;
5566 nfmsg = nlmsg_data(nlh);
5567 nfmsg->nfgen_family = family;
5568 nfmsg->version = NFNETLINK_V0;
5569 nfmsg->res_id = htons(net->nft.base_seq & 0xffff);
5571 if (nla_put_string(skb, NFTA_OBJ_TABLE, table->name) ||
5572 nla_put_string(skb, NFTA_OBJ_NAME, obj->key.name) ||
5573 nla_put_be32(skb, NFTA_OBJ_TYPE, htonl(obj->ops->type->type)) ||
5574 nla_put_be32(skb, NFTA_OBJ_USE, htonl(obj->use)) ||
5575 nft_object_dump(skb, NFTA_OBJ_DATA, obj, reset) ||
5576 nla_put_be64(skb, NFTA_OBJ_HANDLE, cpu_to_be64(obj->handle),
5578 goto nla_put_failure;
5580 nlmsg_end(skb, nlh);
5584 nlmsg_trim(skb, nlh);
/*
 * Optional filter for object dumps.  nf_tables_dump_obj() compares its
 * ->table member against the table name and its ->type member against the
 * object type.
 */
5588 struct nft_obj_filter {
/*
 * Netlink dump callback for stateful objects.
 *
 * Walks all tables of the netns (restricted to the requested family
 * unless it is NFPROTO_UNSPEC) and their objects under RCU list
 * iteration.  Objects that are not active, or that do not match the
 * optional filter (table name, object type), are tested for before a
 * message is produced with nf_tables_fill_obj_info().  cb->args[0] holds
 * the index to resume from; cb->seq is set from the netns base_seq for
 * the consistency check.  The request type NFT_MSG_GETOBJ_RESET is
 * detected at the top.
 */
5593 static int nf_tables_dump_obj(struct sk_buff *skb, struct netlink_callback *cb)
5595 const struct nfgenmsg *nfmsg = nlmsg_data(cb->nlh);
5596 const struct nft_table *table;
5597 unsigned int idx = 0, s_idx = cb->args[0];
5598 struct nft_obj_filter *filter = cb->data;
5599 struct net *net = sock_net(skb->sk);
5600 int family = nfmsg->nfgen_family;
5601 struct nft_object *obj;
5604 if (NFNL_MSG_TYPE(cb->nlh->nlmsg_type) == NFT_MSG_GETOBJ_RESET)
5608 cb->seq = net->nft.base_seq;
5610 list_for_each_entry_rcu(table, &net->nft.tables, list) {
5611 if (family != NFPROTO_UNSPEC && family != table->family)
5614 list_for_each_entry_rcu(obj, &table->objects, list) {
5615 if (!nft_is_active(net, obj))
/* Clear every dump argument slot except the first one. */
5620 memset(&cb->args[1], 0,
5621 sizeof(cb->args) - sizeof(cb->args[0]));
5622 if (filter && filter->table &&
5623 strcmp(filter->table, table->name))
5626 filter->type != NFT_OBJECT_UNSPEC &&
5627 obj->ops->type->type != filter->type)
5630 if (nf_tables_fill_obj_info(skb, net, NETLINK_CB(cb->skb).portid,
5633 NLM_F_MULTI | NLM_F_APPEND,
5634 table->family, table,
5638 nl_dump_check_consistent(cb, nlmsg_hdr(skb));
/*
 * Dump start callback for object dumps.
 *
 * On entry cb->data is the request's attribute array.  When a table name
 * or an object type was supplied, a filter is allocated (GFP_ATOMIC) and
 * populated with a copy of the table name and/or the type in host byte
 * order.
 * NOTE(review): the filter is presumably stored back into cb->data, as
 * the dump and done callbacks read it from there -- confirm.
 */
5650 static int nf_tables_dump_obj_start(struct netlink_callback *cb)
5652 const struct nlattr * const *nla = cb->data;
5653 struct nft_obj_filter *filter = NULL;
5655 if (nla[NFTA_OBJ_TABLE] || nla[NFTA_OBJ_TYPE]) {
5656 filter = kzalloc(sizeof(*filter), GFP_ATOMIC);
5660 if (nla[NFTA_OBJ_TABLE]) {
5661 filter->table = nla_strdup(nla[NFTA_OBJ_TABLE], GFP_ATOMIC);
5662 if (!filter->table) {
5668 if (nla[NFTA_OBJ_TYPE])
5669 filter->type = ntohl(nla_get_be32(nla[NFTA_OBJ_TYPE]));
/*
 * Dump completion callback for object dumps: frees the table name copy
 * held by the filter stored in cb->data.
 * NOTE(review): the filter itself is presumably freed here as well.
 */
5676 static int nf_tables_dump_obj_done(struct netlink_callback *cb)
5678 struct nft_obj_filter *filter = cb->data;
5681 kfree(filter->table);
/*
 * Netlink handler for "get object" requests.
 *
 * With NLM_F_DUMP a netlink dump is started with the object dump
 * callbacks and the attribute array as initial callback data.  Otherwise
 * name and type attributes are checked for, table and object are looked
 * up in the current generation, and a single NFT_MSG_NEWOBJ message is
 * built and unicast to the requester.  The request type
 * NFT_MSG_GETOBJ_RESET is detected before the message is filled in.
 */
5688 /* called with rcu_read_lock held */
5689 static int nf_tables_getobj(struct net *net, struct sock *nlsk,
5690 struct sk_buff *skb, const struct nlmsghdr *nlh,
5691 const struct nlattr * const nla[],
5692 struct netlink_ext_ack *extack)
5694 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
5695 u8 genmask = nft_genmask_cur(net);
5696 int family = nfmsg->nfgen_family;
5697 const struct nft_table *table;
5698 struct nft_object *obj;
5699 struct sk_buff *skb2;
5704 if (nlh->nlmsg_flags & NLM_F_DUMP) {
5705 struct netlink_dump_control c = {
5706 .start = nf_tables_dump_obj_start,
5707 .dump = nf_tables_dump_obj,
5708 .done = nf_tables_dump_obj_done,
5709 .module = THIS_MODULE,
5710 .data = (void *)nla,
5713 return nft_netlink_dump_start_rcu(nlsk, skb, nlh, &c);
5716 if (!nla[NFTA_OBJ_NAME] ||
5717 !nla[NFTA_OBJ_TYPE])
5720 table = nft_table_lookup(net, nla[NFTA_OBJ_TABLE], family, genmask);
5721 if (IS_ERR(table)) {
5722 NL_SET_BAD_ATTR(extack, nla[NFTA_OBJ_TABLE]);
5723 return PTR_ERR(table);
5726 objtype = ntohl(nla_get_be32(nla[NFTA_OBJ_TYPE]));
5727 obj = nft_obj_lookup(net, table, nla[NFTA_OBJ_NAME], objtype, genmask);
5729 NL_SET_BAD_ATTR(extack, nla[NFTA_OBJ_NAME]);
5730 return PTR_ERR(obj);
/* Reply buffer is allocated without sleeping (GFP_ATOMIC). */
5733 skb2 = alloc_skb(NLMSG_GOODSIZE, GFP_ATOMIC);
5737 if (NFNL_MSG_TYPE(nlh->nlmsg_type) == NFT_MSG_GETOBJ_RESET)
5740 err = nf_tables_fill_obj_info(skb2, net, NETLINK_CB(skb).portid,
5741 nlh->nlmsg_seq, NFT_MSG_NEWOBJ, 0,
5742 family, table, obj, reset);
5746 return nlmsg_unicast(nlsk, skb2, NETLINK_CB(skb).portid);
/*
 * Tear down a stateful object: invoke its destroy callback when it has
 * one, drop the reference on the module owning its type and free the
 * object name.
 */
5752 static void nft_obj_destroy(const struct nft_ctx *ctx, struct nft_object *obj)
5754 if (obj->ops->destroy)
5755 obj->ops->destroy(ctx, obj);
5757 module_put(obj->ops->type->owner);
5758 kfree(obj->key.name);
/*
 * Netlink handler for deleting a stateful object.
 *
 * The type attribute plus either a name or a handle are checked for.  The
 * object is looked up in the next generation, by handle when one is
 * given and by name otherwise; the attribute used for the lookup is the
 * one reported through extack on failure.  The deletion itself is
 * delegated to nft_delobj().
 * NOTE(review): the second NL_SET_BAD_ATTR presumably belongs to a check
 * that the object is still in use -- confirm.
 */
5762 static int nf_tables_delobj(struct net *net, struct sock *nlsk,
5763 struct sk_buff *skb, const struct nlmsghdr *nlh,
5764 const struct nlattr * const nla[],
5765 struct netlink_ext_ack *extack)
5767 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
5768 u8 genmask = nft_genmask_next(net);
5769 int family = nfmsg->nfgen_family;
5770 const struct nlattr *attr;
5771 struct nft_table *table;
5772 struct nft_object *obj;
5776 if (!nla[NFTA_OBJ_TYPE] ||
5777 (!nla[NFTA_OBJ_NAME] && !nla[NFTA_OBJ_HANDLE]))
5780 table = nft_table_lookup(net, nla[NFTA_OBJ_TABLE], family, genmask);
5781 if (IS_ERR(table)) {
5782 NL_SET_BAD_ATTR(extack, nla[NFTA_OBJ_TABLE]);
5783 return PTR_ERR(table);
5786 objtype = ntohl(nla_get_be32(nla[NFTA_OBJ_TYPE]));
5787 if (nla[NFTA_OBJ_HANDLE]) {
5788 attr = nla[NFTA_OBJ_HANDLE];
5789 obj = nft_obj_lookup_byhandle(table, attr, objtype, genmask);
5791 attr = nla[NFTA_OBJ_NAME];
5792 obj = nft_obj_lookup(net, table, attr, objtype, genmask);
5796 NL_SET_BAD_ATTR(extack, attr);
5797 return PTR_ERR(obj);
5800 NL_SET_BAD_ATTR(extack, attr);
5804 nft_ctx_init(&ctx, net, skb, nlh, family, table, NULL, nla);
5806 return nft_delobj(&ctx, obj);
/*
 * Send an object event notification to the NFNLGRP_NFTABLES group.
 *
 * The message buffer is allocated with the caller supplied gfp flags,
 * filled with nf_tables_fill_obj_info() and sent with nfnetlink_send().
 * The failure path records -ENOBUFS on the group via nfnetlink_set_err().
 * The condition at the top involves the presence of listeners on the
 * group.
 */
5809 void nft_obj_notify(struct net *net, const struct nft_table *table,
5810 struct nft_object *obj, u32 portid, u32 seq, int event,
5811 int family, int report, gfp_t gfp)
5813 struct sk_buff *skb;
5817 !nfnetlink_has_listeners(net, NFNLGRP_NFTABLES))
5820 skb = nlmsg_new(NLMSG_GOODSIZE, gfp);
5824 err = nf_tables_fill_obj_info(skb, net, portid, seq, event, 0, family,
5831 nfnetlink_send(skb, net, portid, NFNLGRP_NFTABLES, report, gfp);
5834 nfnetlink_set_err(net, portid, NFNLGRP_NFTABLES, -ENOBUFS);
5836 EXPORT_SYMBOL_GPL(nft_obj_notify);
/*
 * Convenience wrapper around nft_obj_notify() that takes netns, table,
 * portid, sequence number, family and report flag from @ctx and always
 * allocates with GFP_KERNEL.
 */
5838 static void nf_tables_obj_notify(const struct nft_ctx *ctx,
5839 struct nft_object *obj, int event)
5841 nft_obj_notify(ctx->net, ctx->table, obj, ctx->portid, ctx->seq, event,
5842 ctx->family, ctx->report, GFP_KERNEL);
/*
 * Register a flowtable type: append it to the nf_tables_flowtables list
 * under the nftables nfnl lock.
 */
5848 void nft_register_flowtable_type(struct nf_flowtable_type *type)
5850 nfnl_lock(NFNL_SUBSYS_NFTABLES);
5851 list_add_tail_rcu(&type->list, &nf_tables_flowtables);
5852 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
5854 EXPORT_SYMBOL_GPL(nft_register_flowtable_type);
/*
 * Unregister a flowtable type: remove it from its list (RCU deletion)
 * under the nftables nfnl lock.
 */
5856 void nft_unregister_flowtable_type(struct nf_flowtable_type *type)
5858 nfnl_lock(NFNL_SUBSYS_NFTABLES);
5859 list_del_rcu(&type->list);
5860 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
5862 EXPORT_SYMBOL_GPL(nft_unregister_flowtable_type);
/*
 * Netlink attribute policy for NFTA_FLOWTABLE_* attributes: table and
 * flowtable names are strings of at most NFT_NAME_MAXLEN - 1 bytes, the
 * hook is a nested attribute, the handle a u64 and the flags a u32.
 */
5864 static const struct nla_policy nft_flowtable_policy[NFTA_FLOWTABLE_MAX + 1] = {
5865 [NFTA_FLOWTABLE_TABLE] = { .type = NLA_STRING,
5866 .len = NFT_NAME_MAXLEN - 1 },
5867 [NFTA_FLOWTABLE_NAME] = { .type = NLA_STRING,
5868 .len = NFT_NAME_MAXLEN - 1 },
5869 [NFTA_FLOWTABLE_HOOK] = { .type = NLA_NESTED },
5870 [NFTA_FLOWTABLE_HANDLE] = { .type = NLA_U64 },
5871 [NFTA_FLOWTABLE_FLAGS] = { .type = NLA_U32 },
/*
 * Find a flowtable in @table by name.  The table's flowtable list is
 * walked with RCU list iteration; a match needs an equal name and must be
 * active in the given generation.  Returns ERR_PTR(-ENOENT) when nothing
 * matches.
 */
5874 struct nft_flowtable *nft_flowtable_lookup(const struct nft_table *table,
5875 const struct nlattr *nla, u8 genmask)
5877 struct nft_flowtable *flowtable;
5879 list_for_each_entry_rcu(flowtable, &table->flowtables, list) {
5880 if (!nla_strcmp(nla, flowtable->name) &&
5881 nft_active_genmask(flowtable, genmask))
5884 return ERR_PTR(-ENOENT);
5886 EXPORT_SYMBOL_GPL(nft_flowtable_lookup);
/*
 * Per-phase deactivation hook for a flowtable reference.  The prepare,
 * abort and release phases are listed as cases; the action taken for
 * them is not part of this excerpt.
 * NOTE(review): presumably adjusts the flowtable use count -- confirm.
 */
5888 void nf_tables_deactivate_flowtable(const struct nft_ctx *ctx,
5889 struct nft_flowtable *flowtable,
5890 enum nft_trans_phase phase)
5893 case NFT_TRANS_PREPARE:
5894 case NFT_TRANS_ABORT:
5895 case NFT_TRANS_RELEASE:
5902 EXPORT_SYMBOL_GPL(nf_tables_deactivate_flowtable);
/*
 * Find a flowtable in @table by its 64-bit handle (big endian in the
 * attribute); it must be active in the given generation.  Returns
 * ERR_PTR(-ENOENT) when nothing matches.
 */
5904 static struct nft_flowtable *
5905 nft_flowtable_lookup_byhandle(const struct nft_table *table,
5906 const struct nlattr *nla, u8 genmask)
5908 struct nft_flowtable *flowtable;
5910 list_for_each_entry(flowtable, &table->flowtables, list) {
5911 if (be64_to_cpu(nla_get_be64(nla)) == flowtable->handle &&
5912 nft_active_genmask(flowtable, genmask))
5915 return ERR_PTR(-ENOENT);
/*
 * Netlink attribute policy for the nested flowtable hook description:
 * hook number and priority are u32 values, the device list is nested.
 */
5918 static const struct nla_policy nft_flowtable_hook_policy[NFTA_FLOWTABLE_HOOK_MAX + 1] = {
5919 [NFTA_FLOWTABLE_HOOK_NUM] = { .type = NLA_U32 },
5920 [NFTA_FLOWTABLE_HOOK_PRIORITY] = { .type = NLA_U32 },
5921 [NFTA_FLOWTABLE_HOOK_DEVS] = { .type = NLA_NESTED },
/*
 * Parse the nested hook description of a flowtable.
 *
 * Hook number, priority and device list are all checked for, and the hook
 * number is compared against NF_NETDEV_INGRESS.  The devices are turned
 * into entries on flowtable->hook_list by nf_tables_parse_netdev_hooks().
 * Hook number and priority are stored in the flowtable, and every hook's
 * ops are initialised with the netdev protocol family, the hook number,
 * the priority, the flowtable data as private pointer and the flowtable
 * type's hook function.
 */
5924 static int nf_tables_flowtable_parse_hook(const struct nft_ctx *ctx,
5925 const struct nlattr *attr,
5926 struct nft_flowtable *flowtable)
5928 struct nlattr *tb[NFTA_FLOWTABLE_HOOK_MAX + 1];
5929 struct nft_hook *hook;
5930 int hooknum, priority;
5933 err = nla_parse_nested_deprecated(tb, NFTA_FLOWTABLE_HOOK_MAX, attr,
5934 nft_flowtable_hook_policy, NULL);
5938 if (!tb[NFTA_FLOWTABLE_HOOK_NUM] ||
5939 !tb[NFTA_FLOWTABLE_HOOK_PRIORITY] ||
5940 !tb[NFTA_FLOWTABLE_HOOK_DEVS])
5943 hooknum = ntohl(nla_get_be32(tb[NFTA_FLOWTABLE_HOOK_NUM]));
5944 if (hooknum != NF_NETDEV_INGRESS)
5947 priority = ntohl(nla_get_be32(tb[NFTA_FLOWTABLE_HOOK_PRIORITY]));
5949 err = nf_tables_parse_netdev_hooks(ctx->net,
5950 tb[NFTA_FLOWTABLE_HOOK_DEVS],
5951 &flowtable->hook_list);
5955 flowtable->hooknum = hooknum;
5956 flowtable->data.priority = priority;
5958 list_for_each_entry(hook, &flowtable->hook_list, list) {
5959 hook->ops.pf = NFPROTO_NETDEV;
5960 hook->ops.hooknum = hooknum;
5961 hook->ops.priority = priority;
5962 hook->ops.priv = &flowtable->data;
5963 hook->ops.hook = flowtable->data.type->hook;
/*
 * Search the registered flowtable types (nf_tables_flowtables) for the
 * one whose family equals @family.  No module reference is taken here.
 */
5969 static const struct nf_flowtable_type *__nft_flowtable_type_get(u8 family)
5971 const struct nf_flowtable_type *type;
5973 list_for_each_entry(type, &nf_tables_flowtables, list) {
5974 if (family == type->family)
/*
 * Resolve the flowtable type for @family.
 *
 * A registered type is accepted only if try_module_get() on its owner
 * succeeds.  With CONFIG_MODULES the "nf-flowtable-<family>" module can be
 * requested; if the type is registered afterwards ERR_PTR(-EAGAIN) is
 * returned.  The last statement returns ERR_PTR(-ENOENT).
 */
5980 static const struct nf_flowtable_type *
5981 nft_flowtable_type_get(struct net *net, u8 family)
5983 const struct nf_flowtable_type *type;
5985 type = __nft_flowtable_type_get(family);
5986 if (type != NULL && try_module_get(type->owner))
/* Lockdep assertion, placed ahead of the module request below. */
5989 lockdep_nfnl_nft_mutex_not_held();
5990 #ifdef CONFIG_MODULES
5992 nft_request_module(net, "nf-flowtable-%u", family);
5993 if (__nft_flowtable_type_get(family))
5994 return ERR_PTR(-EAGAIN);
5997 return ERR_PTR(-ENOENT);
/*
 * Tear down a single flowtable hook: unregister its nf_hook_ops from @net,
 * then invoke the flowtable type's setup callback for the hook's device
 * (the remaining arguments of that call are not shown in this excerpt).
 */
6000 /* Only called from error and netdev event paths. */
6001 static void nft_unregister_flowtable_hook(struct net *net,
6002 struct nft_flowtable *flowtable,
6003 struct nft_hook *hook)
6005 nf_unregister_net_hook(net, &hook->ops);
6006 flowtable->data.type->setup(&flowtable->data, hook->ops.dev,
/*
 * Unregister the nf_hook_ops of every hook on @flowtable's hook_list.
 * The hooks stay on the list; nothing is freed here.
 */
6010 static void nft_unregister_flowtable_net_hooks(struct net *net,
6011 struct nft_flowtable *flowtable)
6013 struct nft_hook *hook;
6015 list_for_each_entry(hook, &flowtable->hook_list, list)
6016 nf_unregister_net_hook(net, &hook->ops);
/*
 * Register all hooks of @flowtable with the netfilter core.
 *
 * For each hook, every flowtable already in @table is scanned for a hook
 * on the same device and protocol family; a match jumps to the error path.
 * Otherwise the type's setup callback is invoked and the hook is
 * registered.  The error path walks the hook list, unregistering and
 * freeing hooks.
 */
6019 static int nft_register_flowtable_net_hooks(struct net *net,
6020 struct nft_table *table,
6021 struct nft_flowtable *flowtable)
6023 struct nft_hook *hook, *hook2, *next;
6024 struct nft_flowtable *ft;
6027 list_for_each_entry(hook, &flowtable->hook_list, list) {
/* Duplicate check against all hooks of all flowtables in the table. */
6028 list_for_each_entry(ft, &table->flowtables, list) {
6029 list_for_each_entry(hook2, &ft->hook_list, list) {
6030 if (hook->ops.dev == hook2->ops.dev &&
6031 hook->ops.pf == hook2->ops.pf) {
6033 goto err_unregister_net_hooks;
/* Type-specific setup for this hook, followed by registration. */
6038 err = flowtable->data.type->setup(&flowtable->data,
6042 goto err_unregister_net_hooks;
6044 err = nf_register_net_hook(net, &hook->ops);
/*
 * setup is invoked again between the registration call and the jump to
 * the error path below.
 */
6046 flowtable->data.type->setup(&flowtable->data,
6049 goto err_unregister_net_hooks;
6057 err_unregister_net_hooks:
/* _safe iteration: entries are unlinked and freed while walking. */
6058 list_for_each_entry_safe(hook, next, &flowtable->hook_list, list) {
6062 nft_unregister_flowtable_hook(net, flowtable, hook);
6063 list_del_rcu(&hook->list);
6064 kfree_rcu(hook, rcu);
/*
 * Batch handler that creates a new flowtable.
 *
 * Visible steps: check that table, name and hook attributes are present,
 * look up the table and any existing flowtable of that name, allocate and
 * name the new flowtable, resolve the flowtable type for the family, read
 * the optional flags, initialise the type, parse the hook attribute,
 * register the hooks, queue a NFT_MSG_NEWFLOWTABLE transaction and add the
 * flowtable to the table's list.  The tail of the function releases hooks,
 * type state, the module reference and the name.
 */
6070 static int nf_tables_newflowtable(struct net *net, struct sock *nlsk,
6071 struct sk_buff *skb,
6072 const struct nlmsghdr *nlh,
6073 const struct nlattr * const nla[],
6074 struct netlink_ext_ack *extack)
6076 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
6077 const struct nf_flowtable_type *type;
/* Lookups below use the next generation's mask. */
6078 u8 genmask = nft_genmask_next(net);
6079 int family = nfmsg->nfgen_family;
6080 struct nft_flowtable *flowtable;
6081 struct nft_hook *hook, *next;
6082 struct nft_table *table;
6086 if (!nla[NFTA_FLOWTABLE_TABLE] ||
6087 !nla[NFTA_FLOWTABLE_NAME] ||
6088 !nla[NFTA_FLOWTABLE_HOOK])
6091 table = nft_table_lookup(net, nla[NFTA_FLOWTABLE_TABLE], family,
6093 if (IS_ERR(table)) {
6094 NL_SET_BAD_ATTR(extack, nla[NFTA_FLOWTABLE_TABLE]);
6095 return PTR_ERR(table);
6098 flowtable = nft_flowtable_lookup(table, nla[NFTA_FLOWTABLE_NAME],
/* -ENOENT from the lookup is treated differently from other errors. */
6100 if (IS_ERR(flowtable)) {
6101 err = PTR_ERR(flowtable);
6102 if (err != -ENOENT) {
6103 NL_SET_BAD_ATTR(extack, nla[NFTA_FLOWTABLE_NAME]);
6107 if (nlh->nlmsg_flags & NLM_F_EXCL) {
6108 NL_SET_BAD_ATTR(extack, nla[NFTA_FLOWTABLE_NAME]);
6115 nft_ctx_init(&ctx, net, skb, nlh, family, table, NULL, nla);
6117 flowtable = kzalloc(sizeof(*flowtable), GFP_KERNEL);
6121 flowtable->table = table;
6122 flowtable->handle = nf_tables_alloc_handle(table);
6123 INIT_LIST_HEAD(&flowtable->hook_list);
6125 flowtable->name = nla_strdup(nla[NFTA_FLOWTABLE_NAME], GFP_KERNEL);
6126 if (!flowtable->name) {
6131 type = nft_flowtable_type_get(net, family);
6133 err = PTR_ERR(type);
/*
 * Only NF_FLOWTABLE_HW_OFFLOAD is accepted as a flag bit.
 * NOTE(review): the statement executed when other bits are set is not
 * visible in this excerpt; confirm that it assigns an error code to err
 * before leaving, since no visible line does so on this branch.
 */
6137 if (nla[NFTA_FLOWTABLE_FLAGS]) {
6138 flowtable->data.flags =
6139 ntohl(nla_get_be32(nla[NFTA_FLOWTABLE_FLAGS]));
6140 if (flowtable->data.flags & ~NF_FLOWTABLE_HW_OFFLOAD)
6144 write_pnet(&flowtable->data.net, net);
6145 flowtable->data.type = type;
6146 err = type->init(&flowtable->data);
6150 err = nf_tables_flowtable_parse_hook(&ctx, nla[NFTA_FLOWTABLE_HOOK],
6155 err = nft_register_flowtable_net_hooks(ctx.net, table, flowtable);
6159 err = nft_trans_flowtable_add(&ctx, NFT_MSG_NEWFLOWTABLE, flowtable);
6163 list_add_tail_rcu(&flowtable->list, &table->flowtables);
/* Unwind: drop each hook, then type state, module reference and name. */
6168 list_for_each_entry_safe(hook, next, &flowtable->hook_list, list) {
6169 nft_unregister_flowtable_hook(net, flowtable, hook);
6170 list_del_rcu(&hook->list);
6171 kfree_rcu(hook, rcu);
6174 flowtable->data.type->free(&flowtable->data);
6176 module_put(type->owner);
6178 kfree(flowtable->name);
/*
 * Batch handler that deletes a flowtable.
 *
 * The table attribute and at least one of name or handle are tested for
 * presence.  The flowtable is looked up by handle when a handle attribute
 * is present, otherwise by name.  A flowtable with a non-zero use count is
 * flagged through extack; otherwise the deletion is handed to
 * nft_delflowtable().
 */
6184 static int nf_tables_delflowtable(struct net *net, struct sock *nlsk,
6185 struct sk_buff *skb,
6186 const struct nlmsghdr *nlh,
6187 const struct nlattr * const nla[],
6188 struct netlink_ext_ack *extack)
6190 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
6191 u8 genmask = nft_genmask_next(net);
6192 int family = nfmsg->nfgen_family;
6193 struct nft_flowtable *flowtable;
6194 const struct nlattr *attr;
6195 struct nft_table *table;
6198 if (!nla[NFTA_FLOWTABLE_TABLE] ||
6199 (!nla[NFTA_FLOWTABLE_NAME] &&
6200 !nla[NFTA_FLOWTABLE_HANDLE]))
6203 table = nft_table_lookup(net, nla[NFTA_FLOWTABLE_TABLE], family,
6205 if (IS_ERR(table)) {
6206 NL_SET_BAD_ATTR(extack, nla[NFTA_FLOWTABLE_TABLE]);
6207 return PTR_ERR(table);
/* attr remembers which attribute was used, for error reporting below. */
6210 if (nla[NFTA_FLOWTABLE_HANDLE]) {
6211 attr = nla[NFTA_FLOWTABLE_HANDLE];
6212 flowtable = nft_flowtable_lookup_byhandle(table, attr, genmask);
6214 attr = nla[NFTA_FLOWTABLE_NAME];
6215 flowtable = nft_flowtable_lookup(table, attr, genmask);
6218 if (IS_ERR(flowtable)) {
6219 NL_SET_BAD_ATTR(extack, attr);
6220 return PTR_ERR(flowtable);
/* A flowtable that is still referenced is reported via extack. */
6222 if (flowtable->use > 0) {
6223 NL_SET_BAD_ATTR(extack, attr);
6227 nft_ctx_init(&ctx, net, skb, nlh, family, table, NULL, nla);
6229 return nft_delflowtable(&ctx, flowtable);
/*
 * Serialise @flowtable into a netlink message appended to @skb.
 *
 * The message carries an nfgenmsg header followed by the table name,
 * flowtable name, use count, handle and flags, then a nested hook
 * attribute holding hook number, priority and a nested list of device
 * names.  Failed puts jump to nla_put_failure; nlmsg_trim() at the end
 * of the function removes the partial message.
 */
6232 static int nf_tables_fill_flowtable_info(struct sk_buff *skb, struct net *net,
6233 u32 portid, u32 seq, int event,
6234 u32 flags, int family,
6235 struct nft_flowtable *flowtable)
6237 struct nlattr *nest, *nest_devs;
6238 struct nfgenmsg *nfmsg;
6239 struct nft_hook *hook;
6240 struct nlmsghdr *nlh;
6242 event = nfnl_msg_type(NFNL_SUBSYS_NFTABLES, event);
6243 nlh = nlmsg_put(skb, portid, seq, event, sizeof(struct nfgenmsg), flags);
6245 goto nla_put_failure;
6247 nfmsg = nlmsg_data(nlh);
6248 nfmsg->nfgen_family = family;
6249 nfmsg->version = NFNETLINK_V0;
/* res_id carries the low 16 bits of the current base sequence. */
6250 nfmsg->res_id = htons(net->nft.base_seq & 0xffff);
6252 if (nla_put_string(skb, NFTA_FLOWTABLE_TABLE, flowtable->table->name) ||
6253 nla_put_string(skb, NFTA_FLOWTABLE_NAME, flowtable->name) ||
6254 nla_put_be32(skb, NFTA_FLOWTABLE_USE, htonl(flowtable->use)) ||
6255 nla_put_be64(skb, NFTA_FLOWTABLE_HANDLE, cpu_to_be64(flowtable->handle),
6256 NFTA_FLOWTABLE_PAD) ||
6257 nla_put_be32(skb, NFTA_FLOWTABLE_FLAGS, htonl(flowtable->data.flags)))
6258 goto nla_put_failure;
/* Nested hook description. */
6260 nest = nla_nest_start_noflag(skb, NFTA_FLOWTABLE_HOOK);
6262 goto nla_put_failure;
6263 if (nla_put_be32(skb, NFTA_FLOWTABLE_HOOK_NUM, htonl(flowtable->hooknum)) ||
6264 nla_put_be32(skb, NFTA_FLOWTABLE_HOOK_PRIORITY, htonl(flowtable->data.priority)))
6265 goto nla_put_failure;
/* One device-name attribute per hook, nested inside the hook attribute. */
6267 nest_devs = nla_nest_start_noflag(skb, NFTA_FLOWTABLE_HOOK_DEVS);
6269 goto nla_put_failure;
6271 list_for_each_entry_rcu(hook, &flowtable->hook_list, list) {
6272 if (nla_put_string(skb, NFTA_DEVICE_NAME, hook->ops.dev->name))
6273 goto nla_put_failure;
6275 nla_nest_end(skb, nest_devs);
6276 nla_nest_end(skb, nest);
6278 nlmsg_end(skb, nlh);
6282 nlmsg_trim(skb, nlh);
/*
 * Per-dump filter state for flowtable dumps.  The dump callbacks in this
 * file use a string member named table, which is compared against table
 * names; the member declarations are not shown in this excerpt.
 */
6286 struct nft_flowtable_filter {
/*
 * Netlink dump callback for flowtables.
 *
 * Walks every table of the namespace and every flowtable in it using the
 * RCU list iterators, applying the family from the request header, the
 * nft_is_active() test and the optional table-name filter from cb->data,
 * and emits one NFT_MSG_NEWFLOWTABLE message per selected flowtable.
 * cb->args[0] supplies the starting index (s_idx).
 */
6290 static int nf_tables_dump_flowtable(struct sk_buff *skb,
6291 struct netlink_callback *cb)
6293 const struct nfgenmsg *nfmsg = nlmsg_data(cb->nlh);
6294 struct nft_flowtable_filter *filter = cb->data;
6295 unsigned int idx = 0, s_idx = cb->args[0];
6296 struct net *net = sock_net(skb->sk);
6297 int family = nfmsg->nfgen_family;
6298 struct nft_flowtable *flowtable;
6299 const struct nft_table *table;
/* Record the generation sequence the dump is based on. */
6302 cb->seq = net->nft.base_seq;
6304 list_for_each_entry_rcu(table, &net->nft.tables, list) {
/* NFPROTO_UNSPEC in the request matches tables of any family. */
6305 if (family != NFPROTO_UNSPEC && family != table->family)
6308 list_for_each_entry_rcu(flowtable, &table->flowtables, list) {
6309 if (!nft_is_active(net, flowtable))
/* Clear every cb->args slot after the first. */
6314 memset(&cb->args[1], 0,
6315 sizeof(cb->args) - sizeof(cb->args[0]));
6316 if (filter && filter->table &&
6317 strcmp(filter->table, table->name))
6320 if (nf_tables_fill_flowtable_info(skb, net, NETLINK_CB(cb->skb).portid,
6322 NFT_MSG_NEWFLOWTABLE,
6323 NLM_F_MULTI | NLM_F_APPEND,
6324 table->family, flowtable) < 0)
6327 nl_dump_check_consistent(cb, nlmsg_hdr(skb));
/*
 * Dump start callback.  cb->data initially holds the request's attribute
 * array; when a table attribute is present, a filter is allocated with
 * GFP_ATOMIC and the table name is duplicated into filter->table.
 */
6339 static int nf_tables_dump_flowtable_start(struct netlink_callback *cb)
6341 const struct nlattr * const *nla = cb->data;
6342 struct nft_flowtable_filter *filter = NULL;
6344 if (nla[NFTA_FLOWTABLE_TABLE]) {
6345 filter = kzalloc(sizeof(*filter), GFP_ATOMIC);
6349 filter->table = nla_strdup(nla[NFTA_FLOWTABLE_TABLE],
6351 if (!filter->table) {
/*
 * Dump completion callback: releases the table-name string held by the
 * filter stored in cb->data.
 */
6361 static int nf_tables_dump_flowtable_done(struct netlink_callback *cb)
6363 struct nft_flowtable_filter *filter = cb->data;
6368 kfree(filter->table);
/*
 * Handler for flowtable GET requests.
 *
 * With NLM_F_DUMP set, a netlink dump is started with the flowtable dump
 * callbacks and the attribute array as callback data.  Otherwise the named
 * flowtable is looked up using the current generation mask, serialised
 * into a freshly allocated skb and unicast back to the requesting port.
 */
6374 /* called with rcu_read_lock held */
6375 static int nf_tables_getflowtable(struct net *net, struct sock *nlsk,
6376 struct sk_buff *skb,
6377 const struct nlmsghdr *nlh,
6378 const struct nlattr * const nla[],
6379 struct netlink_ext_ack *extack)
6381 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
6382 u8 genmask = nft_genmask_cur(net);
6383 int family = nfmsg->nfgen_family;
6384 struct nft_flowtable *flowtable;
6385 const struct nft_table *table;
6386 struct sk_buff *skb2;
6389 if (nlh->nlmsg_flags & NLM_F_DUMP) {
6390 struct netlink_dump_control c = {
6391 .start = nf_tables_dump_flowtable_start,
6392 .dump = nf_tables_dump_flowtable,
6393 .done = nf_tables_dump_flowtable_done,
6394 .module = THIS_MODULE,
6395 .data = (void *)nla,
6398 return nft_netlink_dump_start_rcu(nlsk, skb, nlh, &c);
/* Single-object path: the name attribute is tested for presence. */
6401 if (!nla[NFTA_FLOWTABLE_NAME])
6404 table = nft_table_lookup(net, nla[NFTA_FLOWTABLE_TABLE], family,
6407 return PTR_ERR(table);
6409 flowtable = nft_flowtable_lookup(table, nla[NFTA_FLOWTABLE_NAME],
6411 if (IS_ERR(flowtable))
6412 return PTR_ERR(flowtable);
/* Reply buffer is allocated with GFP_ATOMIC. */
6414 skb2 = alloc_skb(NLMSG_GOODSIZE, GFP_ATOMIC);
6418 err = nf_tables_fill_flowtable_info(skb2, net, NETLINK_CB(skb).portid,
6420 NFT_MSG_NEWFLOWTABLE, 0, family,
6425 return nlmsg_unicast(nlsk, skb2, NETLINK_CB(skb).portid);
/*
 * Send a flowtable event to the NFNLGRP_NFTABLES multicast group.
 *
 * A message is built with nf_tables_fill_flowtable_info() and passed to
 * nfnetlink_send().  The final statement reports -ENOBUFS to the group
 * through nfnetlink_set_err().
 */
6431 static void nf_tables_flowtable_notify(struct nft_ctx *ctx,
6432 struct nft_flowtable *flowtable,
6435 struct sk_buff *skb;
/* Part of a condition that also tests for listeners on the group. */
6439 !nfnetlink_has_listeners(ctx->net, NFNLGRP_NFTABLES))
6442 skb = nlmsg_new(NLMSG_GOODSIZE, GFP_KERNEL);
6446 err = nf_tables_fill_flowtable_info(skb, ctx->net, ctx->portid,
6448 ctx->family, flowtable);
6454 nfnetlink_send(skb, ctx->net, ctx->portid, NFNLGRP_NFTABLES,
6455 ctx->report, GFP_KERNEL);
6458 nfnetlink_set_err(ctx->net, ctx->portid, NFNLGRP_NFTABLES, -ENOBUFS);
/*
 * Release a flowtable: call the type's free callback, then for every hook
 * invoke the type's setup callback for its device and unlink the hook,
 * and finally free the name and drop the reference on the type's module.
 */
6461 static void nf_tables_flowtable_destroy(struct nft_flowtable *flowtable)
6463 struct nft_hook *hook, *next;
6465 flowtable->data.type->free(&flowtable->data);
/* _safe iteration because entries are removed during the walk. */
6466 list_for_each_entry_safe(hook, next, &flowtable->hook_list, list) {
6467 flowtable->data.type->setup(&flowtable->data, hook->ops.dev,
6469 list_del_rcu(&hook->list);
6472 kfree(flowtable->name);
6473 module_put(flowtable->data.type->owner);
/*
 * Build an NFT_MSG_NEWGEN message in @skb.
 *
 * The payload holds the namespace's base sequence as generation id plus
 * the pid and command name of the current task.  Failed puts jump to
 * nla_put_failure; nlmsg_trim() at the end of the function removes the
 * partial message.
 */
6477 static int nf_tables_fill_gen_info(struct sk_buff *skb, struct net *net,
6478 u32 portid, u32 seq)
6480 struct nlmsghdr *nlh;
6481 struct nfgenmsg *nfmsg;
/* Scratch buffer for get_task_comm(). */
6482 char buf[TASK_COMM_LEN];
6483 int event = nfnl_msg_type(NFNL_SUBSYS_NFTABLES, NFT_MSG_NEWGEN);
6485 nlh = nlmsg_put(skb, portid, seq, event, sizeof(struct nfgenmsg), 0);
6487 goto nla_put_failure;
6489 nfmsg = nlmsg_data(nlh);
6490 nfmsg->nfgen_family = AF_UNSPEC;
6491 nfmsg->version = NFNETLINK_V0;
6492 nfmsg->res_id = htons(net->nft.base_seq & 0xffff);
6494 if (nla_put_be32(skb, NFTA_GEN_ID, htonl(net->nft.base_seq)) ||
6495 nla_put_be32(skb, NFTA_GEN_PROC_PID, htonl(task_pid_nr(current))) ||
6496 nla_put_string(skb, NFTA_GEN_PROC_NAME, get_task_comm(buf, current)))
6497 goto nla_put_failure;
6499 nlmsg_end(skb, nlh);
6503 nlmsg_trim(skb, nlh);
/*
 * Handle a netdevice event for one flowtable: each hook's device is
 * compared with @dev, and a hook is unregistered in @dev's namespace,
 * unlinked from the hook list and freed after an RCU grace period.
 *
 * NOTE(review): the walk uses the non-_safe list iterator while unlinking
 * an entry; confirm the loop is left right after the removal (the
 * statement following kfree_rcu() is not visible in this excerpt).
 */
6507 static void nft_flowtable_event(unsigned long event, struct net_device *dev,
6508 struct nft_flowtable *flowtable)
6510 struct nft_hook *hook;
6512 list_for_each_entry(hook, &flowtable->hook_list, list) {
6513 if (hook->ops.dev != dev)
6516 /* flow_offload_netdev_event() cleans up entries for us. */
6517 nft_unregister_flowtable_hook(dev_net(dev), flowtable, hook);
6518 list_del_rcu(&hook->list);
6519 kfree_rcu(hook, rcu);
/*
 * Netdevice notifier callback.  The event is tested against
 * NETDEV_UNREGISTER; with the namespace's commit_mutex held, every
 * flowtable of every table is passed to nft_flowtable_event() together
 * with the affected device.
 */
6524 static int nf_tables_flowtable_event(struct notifier_block *this,
6525 unsigned long event, void *ptr)
6527 struct net_device *dev = netdev_notifier_info_to_dev(ptr);
6528 struct nft_flowtable *flowtable;
6529 struct nft_table *table;
6532 if (event != NETDEV_UNREGISTER)
/* Hold commit_mutex while the table and flowtable lists are walked. */
6536 mutex_lock(&net->nft.commit_mutex);
6537 list_for_each_entry(table, &net->nft.tables, list) {
6538 list_for_each_entry(flowtable, &table->flowtables, list) {
6539 nft_flowtable_event(event, dev, flowtable);
6542 mutex_unlock(&net->nft.commit_mutex);
/* Notifier block whose callback is nf_tables_flowtable_event(). */
6547 static struct notifier_block nf_tables_flowtable_notifier = {
6548 .notifier_call = nf_tables_flowtable_event,
/*
 * Send a generation message to the NFNLGRP_NFTABLES group on behalf of
 * the request in @skb.  The message is built with
 * nf_tables_fill_gen_info() into a new skb and sent with
 * nfnetlink_send(); the final statement calls nfnetlink_set_err() for
 * the group.
 */
6551 static void nf_tables_gen_notify(struct net *net, struct sk_buff *skb,
6554 struct nlmsghdr *nlh = nlmsg_hdr(skb);
6555 struct sk_buff *skb2;
/* Condition combining the report flag with the listener check. */
6558 if (nlmsg_report(nlh) &&
6559 !nfnetlink_has_listeners(net, NFNLGRP_NFTABLES))
6562 skb2 = nlmsg_new(NLMSG_GOODSIZE, GFP_KERNEL);
6566 err = nf_tables_fill_gen_info(skb2, net, NETLINK_CB(skb).portid,
6573 nfnetlink_send(skb2, net, NETLINK_CB(skb).portid, NFNLGRP_NFTABLES,
6574 nlmsg_report(nlh), GFP_KERNEL);
6577 nfnetlink_set_err(net, NETLINK_CB(skb).portid, NFNLGRP_NFTABLES,
/*
 * Handler for generation GET requests: builds a generation message with
 * nf_tables_fill_gen_info() in a GFP_ATOMIC-allocated skb and unicasts it
 * to the requesting port.
 */
6581 static int nf_tables_getgen(struct net *net, struct sock *nlsk,
6582 struct sk_buff *skb, const struct nlmsghdr *nlh,
6583 const struct nlattr * const nla[],
6584 struct netlink_ext_ack *extack)
6586 struct sk_buff *skb2;
6589 skb2 = alloc_skb(NLMSG_GOODSIZE, GFP_ATOMIC);
6593 err = nf_tables_fill_gen_info(skb2, net, NETLINK_CB(skb).portid,
6598 return nlmsg_unicast(nlsk, skb2, NETLINK_CB(skb).portid);
/*
 * nfnetlink callback table, indexed by NFT_MSG_* message type.
 *
 * NEW* and DEL* messages are wired to .call_batch handlers, GET* messages
 * to .call_rcu handlers.  Each entry visible here, except NFT_MSG_GETGEN,
 * also names the attribute count and policy used to parse the request.
 */
6604 static const struct nfnl_callback nf_tables_cb[NFT_MSG_MAX] = {
/* Tables */
6605 [NFT_MSG_NEWTABLE] = {
6606 .call_batch = nf_tables_newtable,
6607 .attr_count = NFTA_TABLE_MAX,
6608 .policy = nft_table_policy,
6610 [NFT_MSG_GETTABLE] = {
6611 .call_rcu = nf_tables_gettable,
6612 .attr_count = NFTA_TABLE_MAX,
6613 .policy = nft_table_policy,
6615 [NFT_MSG_DELTABLE] = {
6616 .call_batch = nf_tables_deltable,
6617 .attr_count = NFTA_TABLE_MAX,
6618 .policy = nft_table_policy,
/* Chains */
6620 [NFT_MSG_NEWCHAIN] = {
6621 .call_batch = nf_tables_newchain,
6622 .attr_count = NFTA_CHAIN_MAX,
6623 .policy = nft_chain_policy,
6625 [NFT_MSG_GETCHAIN] = {
6626 .call_rcu = nf_tables_getchain,
6627 .attr_count = NFTA_CHAIN_MAX,
6628 .policy = nft_chain_policy,
6630 [NFT_MSG_DELCHAIN] = {
6631 .call_batch = nf_tables_delchain,
6632 .attr_count = NFTA_CHAIN_MAX,
6633 .policy = nft_chain_policy,
/* Rules */
6635 [NFT_MSG_NEWRULE] = {
6636 .call_batch = nf_tables_newrule,
6637 .attr_count = NFTA_RULE_MAX,
6638 .policy = nft_rule_policy,
6640 [NFT_MSG_GETRULE] = {
6641 .call_rcu = nf_tables_getrule,
6642 .attr_count = NFTA_RULE_MAX,
6643 .policy = nft_rule_policy,
6645 [NFT_MSG_DELRULE] = {
6646 .call_batch = nf_tables_delrule,
6647 .attr_count = NFTA_RULE_MAX,
6648 .policy = nft_rule_policy,
/* Sets */
6650 [NFT_MSG_NEWSET] = {
6651 .call_batch = nf_tables_newset,
6652 .attr_count = NFTA_SET_MAX,
6653 .policy = nft_set_policy,
6655 [NFT_MSG_GETSET] = {
6656 .call_rcu = nf_tables_getset,
6657 .attr_count = NFTA_SET_MAX,
6658 .policy = nft_set_policy,
6660 [NFT_MSG_DELSET] = {
6661 .call_batch = nf_tables_delset,
6662 .attr_count = NFTA_SET_MAX,
6663 .policy = nft_set_policy,
/* Set elements */
6665 [NFT_MSG_NEWSETELEM] = {
6666 .call_batch = nf_tables_newsetelem,
6667 .attr_count = NFTA_SET_ELEM_LIST_MAX,
6668 .policy = nft_set_elem_list_policy,
6670 [NFT_MSG_GETSETELEM] = {
6671 .call_rcu = nf_tables_getsetelem,
6672 .attr_count = NFTA_SET_ELEM_LIST_MAX,
6673 .policy = nft_set_elem_list_policy,
6675 [NFT_MSG_DELSETELEM] = {
6676 .call_batch = nf_tables_delsetelem,
6677 .attr_count = NFTA_SET_ELEM_LIST_MAX,
6678 .policy = nft_set_elem_list_policy,
/* Generation query */
6680 [NFT_MSG_GETGEN] = {
6681 .call_rcu = nf_tables_getgen,
/* Stateful objects; GETOBJ and GETOBJ_RESET share one handler. */
6683 [NFT_MSG_NEWOBJ] = {
6684 .call_batch = nf_tables_newobj,
6685 .attr_count = NFTA_OBJ_MAX,
6686 .policy = nft_obj_policy,
6688 [NFT_MSG_GETOBJ] = {
6689 .call_rcu = nf_tables_getobj,
6690 .attr_count = NFTA_OBJ_MAX,
6691 .policy = nft_obj_policy,
6693 [NFT_MSG_DELOBJ] = {
6694 .call_batch = nf_tables_delobj,
6695 .attr_count = NFTA_OBJ_MAX,
6696 .policy = nft_obj_policy,
6698 [NFT_MSG_GETOBJ_RESET] = {
6699 .call_rcu = nf_tables_getobj,
6700 .attr_count = NFTA_OBJ_MAX,
6701 .policy = nft_obj_policy,
/* Flowtables */
6703 [NFT_MSG_NEWFLOWTABLE] = {
6704 .call_batch = nf_tables_newflowtable,
6705 .attr_count = NFTA_FLOWTABLE_MAX,
6706 .policy = nft_flowtable_policy,
6708 [NFT_MSG_GETFLOWTABLE] = {
6709 .call_rcu = nf_tables_getflowtable,
6710 .attr_count = NFTA_FLOWTABLE_MAX,
6711 .policy = nft_flowtable_policy,
6713 [NFT_MSG_DELFLOWTABLE] = {
6714 .call_batch = nf_tables_delflowtable,
6715 .attr_count = NFTA_FLOWTABLE_MAX,
6716 .policy = nft_flowtable_policy,
/*
 * Validate the ruleset according to the namespace's validate_state.
 *
 * In the NEED state the state is first moved to DO; in the DO state every
 * table of the namespace is checked with nft_table_validate() and a
 * negative result is acted upon.  How the cases chain together (break or
 * fall through) is not visible in this excerpt.
 */
6720 static int nf_tables_validate(struct net *net)
6722 struct nft_table *table;
6724 switch (net->nft.validate_state) {
6725 case NFT_VALIDATE_SKIP:
6727 case NFT_VALIDATE_NEED:
6728 nft_validate_state_update(net, NFT_VALIDATE_DO);
6730 case NFT_VALIDATE_DO:
6731 list_for_each_entry(table, &net->nft.tables, list) {
6732 if (nft_table_validate(net, table) < 0)
/*
 * nft_chain_commit_drop_policy() tests whether the transaction's chain
 * policy is NF_DROP and whether the chain is a base chain, and its last
 * statement sets the base chain's policy to NF_DROP.
 */
6741 /* a drop policy has to be deferred until all rules have been activated,
6742 * otherwise a large ruleset that contains a drop-policy base chain will
6743 * cause all packets to get dropped until the full transaction has been
6746 * We defer the drop policy until the transaction has been finalized.
6748 static void nft_chain_commit_drop_policy(struct nft_trans *trans)
6750 struct nft_base_chain *basechain;
6752 if (nft_trans_chain_policy(trans) != NF_DROP)
6755 if (!nft_is_base_chain(trans->ctx.chain))
6758 basechain = nft_base_chain(trans->ctx.chain);
6759 basechain->policy = NF_DROP;
/*
 * Apply a chain update transaction at commit time.
 *
 * If the transaction carries a new name, the chain is removed from the
 * table's chain hash, its name is swapped with the one held by the
 * transaction (which thereby ends up holding the old name), and the chain
 * is re-inserted under the new key.  Base chains additionally have their
 * stats replaced and, depending on the policy value in the transaction,
 * their policy updated.
 */
6762 static void nft_chain_commit_update(struct nft_trans *trans)
6764 struct nft_base_chain *basechain;
6766 if (nft_trans_chain_name(trans)) {
/* The hash key is the name, so remove before and insert after the swap. */
6767 rhltable_remove(&trans->ctx.table->chains_ht,
6768 &trans->ctx.chain->rhlhead,
6769 nft_chain_ht_params);
6770 swap(trans->ctx.chain->name, nft_trans_chain_name(trans));
6771 rhltable_insert_key(&trans->ctx.table->chains_ht,
6772 trans->ctx.chain->name,
6773 &trans->ctx.chain->rhlhead,
6774 nft_chain_ht_params);
6777 if (!nft_is_base_chain(trans->ctx.chain))
6780 nft_chain_stats_replace(trans);
6782 basechain = nft_base_chain(trans->ctx.chain);
/* The case labels selecting which policies are applied are not shown. */
6784 switch (nft_trans_chain_policy(trans)) {
6787 basechain->policy = nft_trans_chain_policy(trans);
/*
 * Apply an object update transaction: when the object's ops provide an
 * update callback, it is called with the existing object and the new
 * object carried by the transaction.
 */
6792 static void nft_obj_commit_update(struct nft_trans *trans)
6794 struct nft_object *newobj;
6795 struct nft_object *obj;
6797 obj = nft_trans_obj(trans);
6798 newobj = nft_trans_obj_newobj(trans);
6800 if (obj->ops->update)
6801 obj->ops->update(obj, newobj);
/*
 * Release the resources attached to a committed transaction.
 *
 * Dispatches on the message type: deletions destroy the object they
 * removed, and NFT_MSG_NEWCHAIN frees the stats and name held by the
 * transaction.  put_net() on the transaction's namespace appears near the
 * end; whether it is conditional is not visible in this excerpt.
 */
6806 static void nft_commit_release(struct nft_trans *trans)
6808 switch (trans->msg_type) {
6809 case NFT_MSG_DELTABLE:
6810 nf_tables_table_destroy(&trans->ctx);
6812 case NFT_MSG_NEWCHAIN:
6813 free_percpu(nft_trans_chain_stats(trans));
6814 kfree(nft_trans_chain_name(trans));
6816 case NFT_MSG_DELCHAIN:
6817 nf_tables_chain_destroy(&trans->ctx);
6819 case NFT_MSG_DELRULE:
6820 nf_tables_rule_destroy(&trans->ctx, nft_trans_rule(trans));
6822 case NFT_MSG_DELSET:
6823 nft_set_destroy(nft_trans_set(trans));
6825 case NFT_MSG_DELSETELEM:
6826 nf_tables_set_elem_destroy(&trans->ctx,
6827 nft_trans_elem_set(trans),
6828 nft_trans_elem(trans).priv);
6830 case NFT_MSG_DELOBJ:
6831 nft_obj_destroy(&trans->ctx, nft_trans_obj(trans));
6833 case NFT_MSG_DELFLOWTABLE:
6834 nf_tables_flowtable_destroy(nft_trans_flowtable(trans));
6839 put_net(trans->ctx.net);
/*
 * Work item that releases committed transactions.
 *
 * The global destroy list is moved onto a local list head under
 * nf_tables_destroy_list_lock; each transaction on the local list is then
 * unlinked and passed to nft_commit_release().
 */
6844 static void nf_tables_trans_destroy_work(struct work_struct *w)
6846 struct nft_trans *trans, *next;
/* Take the whole pending list in one step so the lock is held briefly. */
6849 spin_lock(&nf_tables_destroy_list_lock);
6850 list_splice_init(&nf_tables_destroy_list, &head);
6851 spin_unlock(&nf_tables_destroy_list_lock);
6853 if (list_empty(&head))
6858 list_for_each_entry_safe(trans, next, &head, list) {
6859 list_del(&trans->list);
6860 nft_commit_release(trans);
/*
 * Build the next-generation rule array for @chain.
 *
 * The chain's rule list is walked twice: once testing each rule with
 * nft_is_active_next() to size the array, and once to store the active
 * rules into chain->rules_next, which is then NULL-terminated.
 */
6864 static int nf_tables_commit_chain_prepare(struct net *net, struct nft_chain *chain)
6866 struct nft_rule *rule;
6867 unsigned int alloc = 0;
6870 /* already handled or inactive chain? */
6871 if (chain->rules_next || !nft_is_active_next(net, chain))
/*
 * Point the cursor at the list head so that the _continue iterator
 * starts with the first rule.
 */
6874 rule = list_entry(&chain->rules, struct nft_rule, list);
6877 list_for_each_entry_continue(rule, &chain->rules, list) {
6878 if (nft_is_active_next(net, rule))
6882 chain->rules_next = nf_tables_chain_alloc_rules(chain, alloc);
6883 if (!chain->rules_next)
6886 list_for_each_entry_continue(rule, &chain->rules, list) {
6887 if (nft_is_active_next(net, rule))
6888 chain->rules_next[i++] = rule;
/* End marker. */
6891 chain->rules_next[i] = NULL;
/*
 * Undo nf_tables_commit_chain_prepare(): for every rule add/delete
 * transaction on the commit list, free the chain's prepared rules_next
 * array and reset the pointer to NULL.
 */
6895 static void nf_tables_commit_chain_prepare_cancel(struct net *net)
6897 struct nft_trans *trans, *next;
6899 list_for_each_entry_safe(trans, next, &net->nft.commit_list, list) {
6900 struct nft_chain *chain = trans->ctx.chain;
6902 if (trans->msg_type == NFT_MSG_NEWRULE ||
6903 trans->msg_type == NFT_MSG_DELRULE) {
/* Resetting to NULL keeps a repeated visit of the same chain harmless. */
6904 kvfree(chain->rules_next);
6905 chain->rules_next = NULL;
/*
 * RCU callback: recovers the struct nft_rules_old that embeds @h.  The
 * statement that consumes it is not shown in this excerpt.
 */
6910 static void __nf_tables_commit_chain_free_rules_old(struct rcu_head *h)
6912 struct nft_rules_old *o = container_of(h, struct nft_rules_old, h);
/*
 * Schedule an old rule array for release via call_rcu().  The cursor is
 * advanced past the end marker to reach the trailing rcu_head container;
 * the loop that finds the marker is not shown in this excerpt.
 */
6917 static void nf_tables_commit_chain_free_rules_old(struct nft_rule **rules)
6919 struct nft_rule **r = rules;
6920 struct nft_rules_old *old;
6925 r++; /* rcu_head is after end marker */
6929 call_rcu(&old->h, __nf_tables_commit_chain_free_rules_old);
/*
 * Publish @chain's rule array for the next generation.
 *
 * Both generation pointers are read under the commit lock.  If no new
 * array was prepared (rules_next is NULL), one generation pointer is made
 * to reference the other generation's array and the replaced array is
 * released.  Otherwise rules_next is published into one of the two
 * generation pointers, rules_next is cleared and an old array is
 * released.  Which pointer is used depends on conditions not visible in
 * this excerpt.
 */
6932 static void nf_tables_commit_chain(struct net *net, struct nft_chain *chain)
6934 struct nft_rule **g0, **g1;
6937 next_genbit = nft_gencursor_next(net);
6939 g0 = rcu_dereference_protected(chain->rules_gen_0,
6940 lockdep_commit_lock_is_held(net));
6941 g1 = rcu_dereference_protected(chain->rules_gen_1,
6942 lockdep_commit_lock_is_held(net));
6944 /* No changes to this chain? */
6945 if (chain->rules_next == NULL) {
6946 /* chain had no change in last or next generation */
6950 * chain had no change in this generation; make sure next
6951 * one uses same rules as current generation.
6954 rcu_assign_pointer(chain->rules_gen_1, g0);
6955 nf_tables_commit_chain_free_rules_old(g1);
6957 rcu_assign_pointer(chain->rules_gen_0, g1);
6958 nf_tables_commit_chain_free_rules_old(g0);
6965 rcu_assign_pointer(chain->rules_gen_1, chain->rules_next);
6967 rcu_assign_pointer(chain->rules_gen_0, chain->rules_next);
6969 chain->rules_next = NULL;
6975 nf_tables_commit_chain_free_rules_old(g1);
6977 nf_tables_commit_chain_free_rules_old(g0);
/*
 * Unlink @obj: remove it from the nft_objname_ht hash table and from the
 * RCU list it is linked on.
 */
6980 static void nft_obj_del(struct nft_object *obj)
6982 rhltable_remove(&nft_objname_ht, &obj->rhlhead, nft_objname_ht_params);
6983 list_del_rcu(&obj->list);
/*
 * Unlink @chain from its table: remove it from the table's chain hash,
 * warning once if the removal reports failure, then remove it from the
 * RCU list it is linked on.
 */
6986 static void nft_chain_del(struct nft_chain *chain)
6988 struct nft_table *table = chain->table;
6990 WARN_ON_ONCE(rhltable_remove(&table->chains_ht, &chain->rhlhead,
6991 nft_chain_ht_params));
6992 list_del_rcu(&chain->list);
/*
 * Hand the committed transactions over to the destroy worker.
 *
 * With an empty commit list only the commit mutex is released.  Otherwise
 * a namespace reference is taken on behalf of the last transaction, which
 * is marked put_net; the commit list is spliced onto the global destroy
 * list under its spinlock, the commit mutex is released and the destroy
 * work is scheduled.
 */
6995 static void nf_tables_commit_release(struct net *net)
6997 struct nft_trans *trans;
6999 /* all side effects have to be made visible.
7000 * For example, if a chain named 'foo' has been deleted, a
7001 * new transaction must not find it anymore.
7003 * Memory reclaim happens asynchronously from work queue
7004 * to prevent expensive synchronize_rcu() in commit phase.
7006 if (list_empty(&net->nft.commit_list)) {
7007 mutex_unlock(&net->nft.commit_mutex);
7011 trans = list_last_entry(&net->nft.commit_list,
7012 struct nft_trans, list);
7013 get_net(trans->ctx.net);
7014 WARN_ON_ONCE(trans->put_net);
7016 trans->put_net = true;
7017 spin_lock(&nf_tables_destroy_list_lock);
7018 list_splice_tail_init(&net->nft.commit_list, &nf_tables_destroy_list);
7019 spin_unlock(&nf_tables_destroy_list_lock);
7021 mutex_unlock(&net->nft.commit_mutex);
7023 schedule_work(&trans_destroy_work);
/*
 * Commit the pending transaction list of @net.
 *
 * Visible phases: validate the ruleset and commit flow rule offloads,
 * prepare next-generation rule arrays for every chain touched by a rule
 * transaction, publish the arrays for all chains, bump base_seq (skipping
 * zero), flip the generation cursor, then walk the commit list applying
 * each transaction by message type and emitting the matching
 * notification.  New objects are activated with nft_clear() and their
 * transaction is destroyed at once; deleted objects are unlinked here and
 * left on the list.  A generation notification is sent last and
 * nf_tables_commit_release() takes over the remaining transactions and
 * releases the commit mutex.
 */
7026 static int nf_tables_commit(struct net *net, struct sk_buff *skb)
7028 struct nft_trans *trans, *next;
7029 struct nft_trans_elem *te;
7030 struct nft_chain *chain;
7031 struct nft_table *table;
/* With nothing queued, only the commit mutex is dropped. */
7034 if (list_empty(&net->nft.commit_list)) {
7035 mutex_unlock(&net->nft.commit_mutex);
7039 /* 0. Validate ruleset, otherwise roll back for error reporting. */
7040 if (nf_tables_validate(net) < 0)
7043 err = nft_flow_rule_offload_commit(net);
7047 /* 1. Allocate space for next generation rules_gen_X[] */
7048 list_for_each_entry_safe(trans, next, &net->nft.commit_list, list) {
7051 if (trans->msg_type == NFT_MSG_NEWRULE ||
7052 trans->msg_type == NFT_MSG_DELRULE) {
7053 chain = trans->ctx.chain;
7055 ret = nf_tables_commit_chain_prepare(net, chain);
7057 nf_tables_commit_chain_prepare_cancel(net);
7063 /* step 2. Make rules_gen_X visible to packet path */
7064 list_for_each_entry(table, &net->nft.tables, list) {
7065 list_for_each_entry(chain, &table->chains, list)
7066 nf_tables_commit_chain(net, chain);
7070 * Bump generation counter, invalidate any dump in progress.
7071 * Cannot fail after this point.
7073 while (++net->nft.base_seq == 0);
7075 /* step 3. Start new generation, rules_gen_X now in use. */
7076 net->nft.gencursor = nft_gencursor_next(net);
7078 list_for_each_entry_safe(trans, next, &net->nft.commit_list, list) {
7079 switch (trans->msg_type) {
7080 case NFT_MSG_NEWTABLE:
7081 if (nft_trans_table_update(trans)) {
7082 if (!nft_trans_table_enable(trans)) {
7083 nf_tables_table_disable(net,
7085 trans->ctx.table->flags |= NFT_TABLE_F_DORMANT;
7088 nft_clear(net, trans->ctx.table);
7090 nf_tables_table_notify(&trans->ctx, NFT_MSG_NEWTABLE);
7091 nft_trans_destroy(trans);
7093 case NFT_MSG_DELTABLE:
7094 list_del_rcu(&trans->ctx.table->list);
7095 nf_tables_table_notify(&trans->ctx, NFT_MSG_DELTABLE);
7097 case NFT_MSG_NEWCHAIN:
7098 if (nft_trans_chain_update(trans)) {
7099 nft_chain_commit_update(trans);
7100 nf_tables_chain_notify(&trans->ctx, NFT_MSG_NEWCHAIN);
7101 /* trans destroyed after rcu grace period */
7103 nft_chain_commit_drop_policy(trans);
7104 nft_clear(net, trans->ctx.chain);
7105 nf_tables_chain_notify(&trans->ctx, NFT_MSG_NEWCHAIN);
7106 nft_trans_destroy(trans);
7109 case NFT_MSG_DELCHAIN:
7110 nft_chain_del(trans->ctx.chain);
7111 nf_tables_chain_notify(&trans->ctx, NFT_MSG_DELCHAIN);
7112 nf_tables_unregister_hook(trans->ctx.net,
7116 case NFT_MSG_NEWRULE:
7117 nft_clear(trans->ctx.net, nft_trans_rule(trans));
7118 nf_tables_rule_notify(&trans->ctx,
7119 nft_trans_rule(trans),
7121 nft_trans_destroy(trans);
7123 case NFT_MSG_DELRULE:
7124 list_del_rcu(&nft_trans_rule(trans)->list);
7125 nf_tables_rule_notify(&trans->ctx,
7126 nft_trans_rule(trans),
7128 nft_rule_expr_deactivate(&trans->ctx,
7129 nft_trans_rule(trans),
7132 case NFT_MSG_NEWSET:
7133 nft_clear(net, nft_trans_set(trans));
7134 /* This avoids hitting -EBUSY when deleting the table
7135 * from the transaction.
7137 if (nft_set_is_anonymous(nft_trans_set(trans)) &&
7138 !list_empty(&nft_trans_set(trans)->bindings))
7139 trans->ctx.table->use--;
7141 nf_tables_set_notify(&trans->ctx, nft_trans_set(trans),
7142 NFT_MSG_NEWSET, GFP_KERNEL);
7143 nft_trans_destroy(trans);
7145 case NFT_MSG_DELSET:
7146 list_del_rcu(&nft_trans_set(trans)->list);
7147 nf_tables_set_notify(&trans->ctx, nft_trans_set(trans),
7148 NFT_MSG_DELSET, GFP_KERNEL);
7150 case NFT_MSG_NEWSETELEM:
7151 te = (struct nft_trans_elem *)trans->data;
7153 te->set->ops->activate(net, te->set, &te->elem);
7154 nf_tables_setelem_notify(&trans->ctx, te->set,
7156 NFT_MSG_NEWSETELEM, 0);
7157 nft_trans_destroy(trans);
7159 case NFT_MSG_DELSETELEM:
7160 te = (struct nft_trans_elem *)trans->data;
7162 nf_tables_setelem_notify(&trans->ctx, te->set,
7164 NFT_MSG_DELSETELEM, 0);
7165 te->set->ops->remove(net, te->set, &te->elem);
7166 atomic_dec(&te->set->nelems);
7169 case NFT_MSG_NEWOBJ:
7170 if (nft_trans_obj_update(trans)) {
7171 nft_obj_commit_update(trans);
7172 nf_tables_obj_notify(&trans->ctx,
7173 nft_trans_obj(trans),
7176 nft_clear(net, nft_trans_obj(trans));
7177 nf_tables_obj_notify(&trans->ctx,
7178 nft_trans_obj(trans),
7180 nft_trans_destroy(trans);
7183 case NFT_MSG_DELOBJ:
7184 nft_obj_del(nft_trans_obj(trans));
7185 nf_tables_obj_notify(&trans->ctx, nft_trans_obj(trans),
7188 case NFT_MSG_NEWFLOWTABLE:
7189 nft_clear(net, nft_trans_flowtable(trans));
7190 nf_tables_flowtable_notify(&trans->ctx,
7191 nft_trans_flowtable(trans),
7192 NFT_MSG_NEWFLOWTABLE);
7193 nft_trans_destroy(trans);
7195 case NFT_MSG_DELFLOWTABLE:
7196 list_del_rcu(&nft_trans_flowtable(trans)->list);
7197 nf_tables_flowtable_notify(&trans->ctx,
7198 nft_trans_flowtable(trans),
7199 NFT_MSG_DELFLOWTABLE);
7200 nft_unregister_flowtable_net_hooks(net,
7201 nft_trans_flowtable(trans));
7206 nf_tables_gen_notify(net, skb, NFT_MSG_NEWGEN);
7207 nf_tables_commit_release(net);
/*
 * Release the object created by an aborted transaction.  Only NEW*
 * message types appear here: each destroys the table, chain, rule, set,
 * set element, object or flowtable that the transaction had added.
 */
7212 static void nf_tables_abort_release(struct nft_trans *trans)
7214 switch (trans->msg_type) {
7215 case NFT_MSG_NEWTABLE:
7216 nf_tables_table_destroy(&trans->ctx);
7218 case NFT_MSG_NEWCHAIN:
7219 nf_tables_chain_destroy(&trans->ctx);
7221 case NFT_MSG_NEWRULE:
7222 nf_tables_rule_destroy(&trans->ctx, nft_trans_rule(trans));
7224 case NFT_MSG_NEWSET:
7225 nft_set_destroy(nft_trans_set(trans));
7227 case NFT_MSG_NEWSETELEM:
7228 nft_set_elem_destroy(nft_trans_elem_set(trans),
7229 nft_trans_elem(trans).priv, true);
7231 case NFT_MSG_NEWOBJ:
7232 nft_obj_destroy(&trans->ctx, nft_trans_obj(trans));
7234 case NFT_MSG_NEWFLOWTABLE:
7235 nf_tables_flowtable_destroy(nft_trans_flowtable(trans));
/*
 * Roll back the pending transaction list of @net.
 *
 * The commit list is walked in reverse.  For NEW* transactions the added
 * object is unlinked and the owner's use counter is decremented; for DEL*
 * transactions the use counter is incremented again, the object is
 * re-activated with nft_clear() and the transaction is destroyed.  A
 * second reverse walk unlinks the remaining transactions and passes them
 * to nf_tables_abort_release().
 */
7241 static int __nf_tables_abort(struct net *net)
7243 struct nft_trans *trans, *next;
7244 struct nft_trans_elem *te;
/* Reverse order: undo the most recently queued change first. */
7246 list_for_each_entry_safe_reverse(trans, next, &net->nft.commit_list,
7248 switch (trans->msg_type) {
7249 case NFT_MSG_NEWTABLE:
7250 if (nft_trans_table_update(trans)) {
7251 if (nft_trans_table_enable(trans)) {
7252 nf_tables_table_disable(net,
7254 trans->ctx.table->flags |= NFT_TABLE_F_DORMANT;
7256 nft_trans_destroy(trans);
7258 list_del_rcu(&trans->ctx.table->list);
7261 case NFT_MSG_DELTABLE:
7262 nft_clear(trans->ctx.net, trans->ctx.table);
7263 nft_trans_destroy(trans);
7265 case NFT_MSG_NEWCHAIN:
/* A chain update only holds stats and a name; a new chain is unlinked. */
7266 if (nft_trans_chain_update(trans)) {
7267 free_percpu(nft_trans_chain_stats(trans));
7268 kfree(nft_trans_chain_name(trans));
7269 nft_trans_destroy(trans);
7271 trans->ctx.table->use--;
7272 nft_chain_del(trans->ctx.chain);
7273 nf_tables_unregister_hook(trans->ctx.net,
7278 case NFT_MSG_DELCHAIN:
7279 trans->ctx.table->use++;
7280 nft_clear(trans->ctx.net, trans->ctx.chain);
7281 nft_trans_destroy(trans);
7283 case NFT_MSG_NEWRULE:
7284 trans->ctx.chain->use--;
7285 list_del_rcu(&nft_trans_rule(trans)->list);
7286 nft_rule_expr_deactivate(&trans->ctx,
7287 nft_trans_rule(trans),
7290 case NFT_MSG_DELRULE:
7291 trans->ctx.chain->use++;
7292 nft_clear(trans->ctx.net, nft_trans_rule(trans));
7293 nft_rule_expr_activate(&trans->ctx, nft_trans_rule(trans));
7294 nft_trans_destroy(trans);
7296 case NFT_MSG_NEWSET:
7297 trans->ctx.table->use--;
/* A bound set only has its transaction destroyed here. */
7298 if (nft_trans_set_bound(trans)) {
7299 nft_trans_destroy(trans);
7302 list_del_rcu(&nft_trans_set(trans)->list);
7304 case NFT_MSG_DELSET:
7305 trans->ctx.table->use++;
7306 nft_clear(trans->ctx.net, nft_trans_set(trans));
7307 nft_trans_destroy(trans);
7309 case NFT_MSG_NEWSETELEM:
7310 if (nft_trans_elem_set_bound(trans)) {
7311 nft_trans_destroy(trans);
7314 te = (struct nft_trans_elem *)trans->data;
7315 te->set->ops->remove(net, te->set, &te->elem);
7316 atomic_dec(&te->set->nelems);
7318 case NFT_MSG_DELSETELEM:
7319 te = (struct nft_trans_elem *)trans->data;
7321 nft_set_elem_activate(net, te->set, &te->elem);
7322 te->set->ops->activate(net, te->set, &te->elem);
7325 nft_trans_destroy(trans);
7327 case NFT_MSG_NEWOBJ:
/* An object update only drops the pending replacement object. */
7328 if (nft_trans_obj_update(trans)) {
7329 kfree(nft_trans_obj_newobj(trans));
7330 nft_trans_destroy(trans);
7332 trans->ctx.table->use--;
7333 nft_obj_del(nft_trans_obj(trans));
7336 case NFT_MSG_DELOBJ:
7337 trans->ctx.table->use++;
7338 nft_clear(trans->ctx.net, nft_trans_obj(trans));
7339 nft_trans_destroy(trans);
7341 case NFT_MSG_NEWFLOWTABLE:
7342 trans->ctx.table->use--;
7343 list_del_rcu(&nft_trans_flowtable(trans)->list);
7344 nft_unregister_flowtable_net_hooks(net,
7345 nft_trans_flowtable(trans));
7347 case NFT_MSG_DELFLOWTABLE:
7348 trans->ctx.table->use++;
7349 nft_clear(trans->ctx.net, nft_trans_flowtable(trans));
7350 nft_trans_destroy(trans);
/* Second pass: release the transactions still left on the list. */
7357 list_for_each_entry_safe_reverse(trans, next,
7358 &net->nft.commit_list, list) {
7359 list_del(&trans->list);
7360 nf_tables_abort_release(trans);
/*
 * Installed as the .cleanup callback of nf_tables_subsys; hands
 * NFT_VALIDATE_SKIP to nft_validate_state_update() for @net.
 */
7366 static void nf_tables_cleanup(struct net *net)
7368 nft_validate_state_update(net, NFT_VALIDATE_SKIP);
/*
 * Installed as the .abort callback of nf_tables_subsys. Runs
 * __nf_tables_abort() for @net and then releases net->nft.commit_mutex
 * (nf_tables_valid_genid() is where that mutex gets locked).
 * @skb is not used by any statement visible here.
 */
7371 static int nf_tables_abort(struct net *net, struct sk_buff *skb)
7373 int ret = __nf_tables_abort(net);
7375 mutex_unlock(&net->nft.commit_mutex);
/*
 * Installed as the .valid_genid callback of nf_tables_subsys. Locks
 * net->nft.commit_mutex and accepts @genid when it is 0 or equal to
 * net->nft.base_seq.
 */
7380 static bool nf_tables_valid_genid(struct net *net, u32 genid)
7384 mutex_lock(&net->nft.commit_mutex);
7386 genid_ok = genid == 0 || net->nft.base_seq == genid;
/* NOTE(review): presumably unlocked here only when the check failed - confirm */
7388 mutex_unlock(&net->nft.commit_mutex);
7390 /* else, commit mutex has to be released by commit or abort function */
/*
 * nfnetlink subsystem descriptor for nf_tables: gives the subsystem name
 * and id, sets cb_count to NFT_MSG_MAX and wires up the commit, abort,
 * cleanup and generation-id callbacks defined in this file.
 */
7394 static const struct nfnetlink_subsystem nf_tables_subsys = {
7395 .name = "nf_tables",
7396 .subsys_id = NFNL_SUBSYS_NFTABLES,
7397 .cb_count = NFT_MSG_MAX,
7399 .commit = nf_tables_commit,
7400 .abort = nf_tables_abort,
7401 .cleanup = nf_tables_cleanup,
7402 .valid_genid = nf_tables_valid_genid,
7403 .owner = THIS_MODULE,
/*
 * Check the chain type of @chain against @type. Only base chains are
 * examined: the basechain's type->type field is compared with @type.
 * NOTE(review): the values returned on match and mismatch are not visible
 * here - confirm against callers.
 */
7406 int nft_chain_validate_dependency(const struct nft_chain *chain,
7407 enum nft_chain_types type)
7409 const struct nft_base_chain *basechain;
7411 if (nft_is_base_chain(chain)) {
7412 basechain = nft_base_chain(chain);
7413 if (basechain->type->type != type)
7418 EXPORT_SYMBOL_GPL(nft_chain_validate_dependency);
/*
 * Check the hook a base chain is attached to against @hook_flags, a bitmask
 * indexed by hook number. Chains that are not base chains skip the test.
 */
7420 int nft_chain_validate_hooks(const struct nft_chain *chain,
7421 unsigned int hook_flags)
7423 struct nft_base_chain *basechain;
7425 if (nft_is_base_chain(chain)) {
7426 basechain = nft_base_chain(chain);
/* Bit (1 << hooknum) set in @hook_flags means the chain's hook is listed. */
7428 if ((1 << basechain->ops.hooknum) & hook_flags)
7436 EXPORT_SYMBOL_GPL(nft_chain_validate_hooks);
7439 * Loop detection - walk through the ruleset beginning at the destination chain
7440 * of a new jump until either the source chain is reached (loop) or all
7441 * reachable chains have been traversed.
7443 * The loop check is performed whenever a new jump verdict is added to an
7444 * expression or verdict map or a verdict map is bound to a new chain.
/* Declared early: nf_tables_loop_check_setelem() calls it before its definition. */
7447 static int nf_tables_check_loops(const struct nft_ctx *ctx,
7448 const struct nft_chain *chain);
/*
 * Per-element callback for walking a set (installed as iter.fn by
 * nf_tables_check_loops()). Looks at the element's flags and data
 * extensions and continues the loop check in the chain the element's
 * verdict points to.
 */
7450 static int nf_tables_loop_check_setelem(const struct nft_ctx *ctx,
7451 struct nft_set *set,
7452 const struct nft_set_iter *iter,
7453 struct nft_set_elem *elem)
7455 const struct nft_set_ext *ext = nft_set_elem_ext(set, elem->priv);
7456 const struct nft_data *data;
/*
 * Elements flagged NFT_SET_ELEM_INTERVAL_END are singled out before the
 * data extension is read. NOTE(review): presumably skipped - confirm
 */
7458 if (nft_set_ext_exists(ext, NFT_SET_EXT_FLAGS) &&
7459 *nft_set_ext_flags(ext) & NFT_SET_ELEM_INTERVAL_END)
7462 data = nft_set_ext_data(ext);
7463 switch (data->verdict.code) {
/* Recurse into the chain named by the element's verdict. */
7466 return nf_tables_check_loops(ctx, data->verdict.chain);
/*
 * Recursive part of loop detection. @chain is the chain currently being
 * inspected; ctx->chain is the chain the walk must not lead back to.
 * Two sources of further chains are followed: verdicts held by "immediate"
 * expressions in @chain's rules, and sets of ctx->table that are verdict
 * maps bound to @chain.
 */
7472 static int nf_tables_check_loops(const struct nft_ctx *ctx,
7473 const struct nft_chain *chain)
7475 const struct nft_rule *rule;
7476 const struct nft_expr *expr, *last;
7477 struct nft_set *set;
7478 struct nft_set_binding *binding;
7479 struct nft_set_iter iter;
/* The walk arrived back at the chain it started from. */
7481 if (ctx->chain == chain)
7484 list_for_each_entry(rule, &chain->rules, list) {
7485 nft_rule_for_each_expr(expr, last, rule) {
7486 struct nft_immediate_expr *priv;
7487 const struct nft_data *data;
/* strcmp() != 0: the expression is not of type "immediate". */
7490 if (strcmp(expr->ops->type->name, "immediate"))
7493 priv = nft_expr_priv(expr);
/* Of interest only when the destination is the verdict register. */
7494 if (priv->dreg != NFT_REG_VERDICT)
7498 switch (data->verdict.code) {
7501 err = nf_tables_check_loops(ctx,
7502 data->verdict.chain);
7511 list_for_each_entry(set, &ctx->table->sets, list) {
/* Test whether the set is active in the next generation. */
7512 if (!nft_is_active_next(ctx->net, set))
/* Test whether the set is a map whose data type is a verdict. */
7514 if (!(set->flags & NFT_SET_MAP) ||
7515 set->dtype != NFT_DATA_VERDICT)
7518 list_for_each_entry(binding, &set->bindings, list) {
/* Test whether this is a map binding attached to @chain. */
7519 if (!(binding->flags & NFT_SET_MAP) ||
7520 binding->chain != chain)
/* Walk the set; nf_tables_loop_check_setelem() is called per element. */
7523 iter.genmask = nft_genmask_next(ctx->net);
7527 iter.fn = nf_tables_loop_check_setelem;
7529 set->ops->walk(ctx, set, &iter);
7539 * nft_parse_u32_check - fetch u32 attribute and check for maximum value
7541 * @attr: netlink attribute to fetch value from
7542 * @max: maximum value to be stored in dest
7543 * @dest: pointer to the variable
7545 * Parse, check and store a given u32 netlink attribute into variable.
7546 * This function returns -ERANGE if the value goes over maximum value.
7547 * Otherwise a 0 is returned and the attribute value is stored in the
7548 * destination variable.
7550 int nft_parse_u32_check(const struct nlattr *attr, int max, u32 *dest)
/* The attribute carries a big-endian u32; convert it to host byte order. */
7554 val = ntohl(nla_get_be32(attr));
7561 EXPORT_SYMBOL_GPL(nft_parse_u32_check);
7564 * nft_parse_register - parse a register value from a netlink attribute
7566 * @attr: netlink attribute
7568 * Parse and translate a register value from a netlink attribute.
7569 * Registers used to be 128 bit wide, these register numbers will be
7570 * mapped to the corresponding 32 bit register numbers.
7572 unsigned int nft_parse_register(const struct nlattr *attr)
7576 reg = ntohl(nla_get_be32(attr));
/*
 * Numbers NFT_REG_VERDICT..NFT_REG_4 name 128 bit registers: scale them by
 * NFT_REG_SIZE / NFT_REG32_SIZE to get the 32 bit register index.
 */
7578 case NFT_REG_VERDICT...NFT_REG_4:
7579 return reg * NFT_REG_SIZE / NFT_REG32_SIZE;
/*
 * Rebase a number counted from NFT_REG32_00, so that NFT_REG32_00 itself
 * maps to index NFT_REG_SIZE / NFT_REG32_SIZE.
 */
7581 return reg + NFT_REG_SIZE / NFT_REG32_SIZE - NFT_REG32_00;
7584 EXPORT_SYMBOL_GPL(nft_parse_register);
7587 * nft_dump_register - dump a register value to a netlink attribute
7589 * @skb: socket buffer
7590 * @attr: attribute number
7591 * @reg: register number
7593 * Construct a netlink attribute containing the register number. For
7594 * compatibility reasons, register numbers being a multiple of 4 are
7595 * translated to the corresponding 128 bit register numbers.
7597 int nft_dump_register(struct sk_buff *skb, unsigned int attr, unsigned int reg)
/*
 * Indices that are a multiple of NFT_REG_SIZE / NFT_REG32_SIZE are divided
 * back down to a 128 bit register number.
 */
7599 if (reg % (NFT_REG_SIZE / NFT_REG32_SIZE) == 0)
7600 reg = reg / (NFT_REG_SIZE / NFT_REG32_SIZE);
/*
 * This form reports the index relative to NFT_REG32_00, the inverse of the
 * rebasing done in nft_parse_register().
 */
7602 reg = reg - NFT_REG_SIZE / NFT_REG32_SIZE + NFT_REG32_00;
/* Register numbers go on the wire as big-endian u32. */
7604 return nla_put_be32(skb, attr, htonl(reg));
7606 EXPORT_SYMBOL_GPL(nft_dump_register);
7609 * nft_validate_register_load - validate a load from a register
7611 * @reg: the register number
7612 * @len: the length of the data
7614 * Validate that the input register is one of the general purpose
7615 * registers and that the length of the load is within the bounds.
7617 int nft_validate_register_load(enum nft_registers reg, unsigned int len)
/* Lower bound: NFT_REG_1 expressed in 32 bit register units. */
7619 if (reg < NFT_REG_1 * NFT_REG_SIZE / NFT_REG32_SIZE)
/* Upper bound: byte offset of @reg plus @len against the size of nft_regs.data. */
7623 if (reg * NFT_REG32_SIZE + len > sizeof_field(struct nft_regs, data))
7628 EXPORT_SYMBOL_GPL(nft_validate_register_load);
7631 * nft_validate_register_store - validate an expression's register store
7633 * @ctx: context of the expression performing the load
7634 * @reg: the destination register number
7635 * @data: the data to load
7636 * @type: the data type
7637 * @len: the length of the data
7639 * Validate that a data load uses the appropriate data type for
7640 * the destination register and the length is within the bounds.
7641 * A value of NULL for the data means that it is runtime gathered
7644 int nft_validate_register_store(const struct nft_ctx *ctx,
7645 enum nft_registers reg,
7646 const struct nft_data *data,
7647 enum nft_data_types type, unsigned int len)
/* Verdict register: the stored type is tested against NFT_DATA_VERDICT. */
7652 case NFT_REG_VERDICT:
7653 if (type != NFT_DATA_VERDICT)
/* A goto or jump verdict triggers loop detection on its target chain. */
7657 (data->verdict.code == NFT_GOTO ||
7658 data->verdict.code == NFT_JUMP)) {
7659 err = nf_tables_check_loops(ctx, data->verdict.chain);
/*
 * Same lower and upper bound tests as nft_validate_register_load().
 * NOTE(review): presumably the branch for all other registers - confirm
 */
7666 if (reg < NFT_REG_1 * NFT_REG_SIZE / NFT_REG32_SIZE)
7670 if (reg * NFT_REG32_SIZE + len >
7671 sizeof_field(struct nft_regs, data))
/* Data known at this point (non-NULL) is tested for type NFT_DATA_VALUE. */
7674 if (data != NULL && type != NFT_DATA_VALUE)
7679 EXPORT_SYMBOL_GPL(nft_validate_register_store);
/*
 * Netlink policy for the attributes nested inside a verdict: the code is a
 * u32, the chain name a string of at most NFT_CHAIN_MAXNAMELEN - 1 bytes.
 */
7681 static const struct nla_policy nft_verdict_policy[NFTA_VERDICT_MAX + 1] = {
7682 [NFTA_VERDICT_CODE] = { .type = NLA_U32 },
7683 [NFTA_VERDICT_CHAIN] = { .type = NLA_STRING,
7684 .len = NFT_CHAIN_MAXNAMELEN - 1 },
/*
 * Parse the nested verdict attribute @nla into data->verdict and describe
 * the result in @desc (length sizeof(data->verdict), type NFT_DATA_VERDICT).
 * Chain lookups use the next-generation genmask of ctx->net.
 */
7687 static int nft_verdict_init(const struct nft_ctx *ctx, struct nft_data *data,
7688 struct nft_data_desc *desc, const struct nlattr *nla)
7690 u8 genmask = nft_genmask_next(ctx->net);
7691 struct nlattr *tb[NFTA_VERDICT_MAX + 1];
7692 struct nft_chain *chain;
7695 err = nla_parse_nested_deprecated(tb, NFTA_VERDICT_MAX, nla,
7696 nft_verdict_policy, NULL);
/* The verdict code attribute is tested for presence before it is read. */
7700 if (!tb[NFTA_VERDICT_CODE])
7702 data->verdict.code = ntohl(nla_get_be32(tb[NFTA_VERDICT_CODE]));
7704 switch (data->verdict.code) {
7706 switch (data->verdict.code & NF_VERDICT_MASK) {
/* Verdicts naming a chain: the name is resolved within ctx->table. */
7721 if (!tb[NFTA_VERDICT_CHAIN])
7723 chain = nft_chain_lookup(ctx->net, ctx->table,
7724 tb[NFTA_VERDICT_CHAIN], genmask);
7726 return PTR_ERR(chain);
/* NOTE(review): base chains are presumably rejected as targets - confirm */
7727 if (nft_is_base_chain(chain))
7731 data->verdict.chain = chain;
7735 desc->len = sizeof(data->verdict);
7736 desc->type = NFT_DATA_VERDICT;
/*
 * Decrements the use counter of data->verdict.chain for the verdict codes
 * selected by the switch. NOTE(review): the case labels are not visible
 * here - presumably the chain-carrying verdicts; confirm.
 */
7740 static void nft_verdict_uninit(const struct nft_data *data)
7742 switch (data->verdict.code) {
7745 data->verdict.chain->use--;
/*
 * Emit verdict @v into @skb as a nested attribute of type @type. The code is
 * written as a big-endian u32; a chain name string is added on the path
 * that reaches the NFTA_VERDICT_CHAIN put. Failed puts jump to
 * nla_put_failure.
 */
7750 int nft_verdict_dump(struct sk_buff *skb, int type, const struct nft_verdict *v)
7752 struct nlattr *nest;
7754 nest = nla_nest_start_noflag(skb, type);
7756 goto nla_put_failure;
7758 if (nla_put_be32(skb, NFTA_VERDICT_CODE, htonl(v->code)))
7759 goto nla_put_failure;
7764 if (nla_put_string(skb, NFTA_VERDICT_CHAIN,
7766 goto nla_put_failure;
7768 nla_nest_end(skb, nest);
/*
 * Fill @data from a raw value attribute: copies len bytes of @nla's payload
 * into data->data and marks @desc as NFT_DATA_VALUE.
 * NOTE(review): how len is derived and checked against @size is not visible
 * here - confirm.
 */
7775 static int nft_value_init(const struct nft_ctx *ctx,
7776 struct nft_data *data, unsigned int size,
7777 struct nft_data_desc *desc, const struct nlattr *nla)
7787 nla_memcpy(data->data, nla, len);
7788 desc->type = NFT_DATA_VALUE;
/* Emit len bytes of data->data into @skb as an NFTA_DATA_VALUE attribute. */
7793 static int nft_value_dump(struct sk_buff *skb, const struct nft_data *data,
7796 return nla_put(skb, NFTA_DATA_VALUE, len, data->data);
/*
 * Netlink policy for data attributes: a raw value is binary, a verdict is a
 * nested attribute.
 */
7799 static const struct nla_policy nft_data_policy[NFTA_DATA_MAX + 1] = {
7800 [NFTA_DATA_VALUE] = { .type = NLA_BINARY },
7801 [NFTA_DATA_VERDICT] = { .type = NLA_NESTED },
7805 * nft_data_init - parse nf_tables data netlink attributes
7807 * @ctx: context of the expression using the data
7808 * @data: destination struct nft_data
7809 * @size: maximum data length
7810 * @desc: data description
7811 * @nla: netlink attribute containing data
7813 * Parse the netlink data attributes and initialize a struct nft_data.
7814 * The type and length of data are returned in the data description.
7816 * The caller can indicate that it only wants to accept data of type
7817 * NFT_DATA_VALUE by passing NULL for the ctx argument.
7819 int nft_data_init(const struct nft_ctx *ctx,
7820 struct nft_data *data, unsigned int size,
7821 struct nft_data_desc *desc, const struct nlattr *nla)
7823 struct nlattr *tb[NFTA_DATA_MAX + 1];
7826 err = nla_parse_nested_deprecated(tb, NFTA_DATA_MAX, nla,
7827 nft_data_policy, NULL);
/* A raw value is checked for first, so it wins over a verdict. */
7831 if (tb[NFTA_DATA_VALUE])
7832 return nft_value_init(ctx, data, size, desc,
7833 tb[NFTA_DATA_VALUE]);
/* Verdicts are parsed only for callers that supplied a ctx. */
7834 if (tb[NFTA_DATA_VERDICT] && ctx != NULL)
7835 return nft_verdict_init(ctx, data, desc, tb[NFTA_DATA_VERDICT]);
7838 EXPORT_SYMBOL_GPL(nft_data_init);
7841 * nft_data_release - release a nft_data item
7843 * @data: struct nft_data to release
7844 * @type: type of data
7846 * Release a nft_data item. NFT_DATA_VALUE types can be silently discarded,
7847 * all others need to be released by calling this function.
7849 void nft_data_release(const struct nft_data *data, enum nft_data_types type)
/* Types ordered before NFT_DATA_VERDICT are tested for first. */
7851 if (type < NFT_DATA_VERDICT)
/* Verdict data is handed to nft_verdict_uninit(). */
7854 case NFT_DATA_VERDICT:
7855 return nft_verdict_uninit(data);
7860 EXPORT_SYMBOL_GPL(nft_data_release);
/*
 * Emit @data into @skb inside a nested attribute @attr. The payload encoder
 * is chosen by @type: nft_value_dump() for NFT_DATA_VALUE (using @len),
 * nft_verdict_dump() for NFT_DATA_VERDICT.
 */
7862 int nft_data_dump(struct sk_buff *skb, int attr, const struct nft_data *data,
7863 enum nft_data_types type, unsigned int len)
7865 struct nlattr *nest;
7868 nest = nla_nest_start_noflag(skb, attr);
7873 case NFT_DATA_VALUE:
7874 err = nft_value_dump(skb, data, len);
7876 case NFT_DATA_VERDICT:
7877 err = nft_verdict_dump(skb, NFTA_DATA_VERDICT, &data->verdict);
7884 nla_nest_end(skb, nest);
7887 EXPORT_SYMBOL_GPL(nft_data_dump);
/*
 * Tear down the base chain in ctx->chain: unregister its hook, unlink and
 * release each of its rules, then delete and destroy the chain. Triggers
 * WARN_ON() when ctx->chain is not a base chain.
 */
7889 int __nft_release_basechain(struct nft_ctx *ctx)
7891 struct nft_rule *rule, *nr;
7893 if (WARN_ON(!nft_is_base_chain(ctx->chain)))
7896 nf_tables_unregister_hook(ctx->net, ctx->chain->table, ctx->chain);
/* _safe iteration: each rule is unlinked while the list is being walked. */
7897 list_for_each_entry_safe(rule, nr, &ctx->chain->rules, list) {
7898 list_del(&rule->list);
7900 nf_tables_rule_release(ctx, rule);
7902 nft_chain_del(ctx->chain);
7904 nf_tables_chain_destroy(ctx);
7908 EXPORT_SYMBOL_GPL(__nft_release_basechain);
/*
 * Release every table of @net together with what the table contains.
 * Per table, chains are first detached from their hooks; then rules,
 * flowtables, sets, objects and chains are torn down in that order, and
 * finally the table itself is unlinked and destroyed.
 */
7910 static void __nft_release_tables(struct net *net)
7912 struct nft_flowtable *flowtable, *nf;
7913 struct nft_table *table, *nt;
7914 struct nft_chain *chain, *nc;
7915 struct nft_object *obj, *ne;
7916 struct nft_rule *rule, *nr;
7917 struct nft_set *set, *ns;
7918 struct nft_ctx ctx = {
7920 .family = NFPROTO_NETDEV,
7923 list_for_each_entry_safe(table, nt, &net->nft.tables, list) {
/* The initial family is replaced by the family of each table. */
7924 ctx.family = table->family;
7926 list_for_each_entry(chain, &table->chains, list)
7927 nf_tables_unregister_hook(net, table, chain);
7928 /* No packets are walking on these chains anymore. */
7930 list_for_each_entry(chain, &table->chains, list) {
7932 list_for_each_entry_safe(rule, nr, &chain->rules, list) {
7933 list_del(&rule->list);
7935 nf_tables_rule_release(&ctx, rule);
7938 list_for_each_entry_safe(flowtable, nf, &table->flowtables, list) {
7939 list_del(&flowtable->list);
7941 nf_tables_flowtable_destroy(flowtable);
7943 list_for_each_entry_safe(set, ns, &table->sets, list) {
7944 list_del(&set->list);
7946 nft_set_destroy(set);
7948 list_for_each_entry_safe(obj, ne, &table->objects, list) {
7951 nft_obj_destroy(&ctx, obj);
7953 list_for_each_entry_safe(chain, nc, &table->chains, list) {
7955 nft_chain_del(chain);
7957 nf_tables_chain_destroy(&ctx);
7959 list_del(&table->list);
7960 nf_tables_table_destroy(&ctx);
/*
 * Per-netns init (nf_tables_net_ops.init): sets up empty table and commit
 * lists and the commit mutex, starts base_seq at 1 and sets validate_state
 * to NFT_VALIDATE_SKIP.
 */
7964 static int __net_init nf_tables_init_net(struct net *net)
7966 INIT_LIST_HEAD(&net->nft.tables);
7967 INIT_LIST_HEAD(&net->nft.commit_list);
7968 mutex_init(&net->nft.commit_mutex);
7969 net->nft.base_seq = 1;
7970 net->nft.validate_state = NFT_VALIDATE_SKIP;
/*
 * Per-netns exit (nf_tables_net_ops.exit): with commit_mutex held, aborts
 * any transactions still on the commit list and releases all tables.
 * Warns once if the table list is not empty afterwards.
 */
7975 static void __net_exit nf_tables_exit_net(struct net *net)
7977 mutex_lock(&net->nft.commit_mutex);
7978 if (!list_empty(&net->nft.commit_list))
7979 __nf_tables_abort(net);
7980 __nft_release_tables(net);
7981 mutex_unlock(&net->nft.commit_mutex);
7982 WARN_ON_ONCE(!list_empty(&net->nft.tables));
/* Per-network-namespace init and exit hooks, registered by nf_tables_module_init(). */
7985 static struct pernet_operations nf_tables_net_ops = {
7986 .init = nf_tables_init_net,
7987 .exit = nf_tables_exit_net,
/*
 * Module init. Brings up, in order: per-netns operations, the filter chain
 * type, the nf_tables core, the flowtable netdevice notifier, the object
 * name hash table, offload support and finally the nfnetlink subsystem.
 * nft_chain_route_init() runs after the nfnetlink registration.
 */
7990 static int __init nf_tables_module_init(void)
7994 spin_lock_init(&nf_tables_destroy_list_lock);
7995 err = register_pernet_subsys(&nf_tables_net_ops);
7999 err = nft_chain_filter_init();
8003 err = nf_tables_core_module_init();
8007 err = register_netdevice_notifier(&nf_tables_flowtable_notifier);
8011 err = rhltable_init(&nft_objname_ht, &nft_objname_ht_params);
8015 err = nft_offload_init();
8020 err = nfnetlink_subsys_register(&nf_tables_subsys);
8024 nft_chain_route_init();
/*
 * The calls below undo the steps above, most recent first.
 * NOTE(review): presumably reached through error labels - confirm
 */
8030 rhltable_destroy(&nft_objname_ht);
8032 unregister_netdevice_notifier(&nf_tables_flowtable_notifier);
8034 nf_tables_core_module_exit();
8036 nft_chain_filter_fini();
8038 unregister_pernet_subsys(&nf_tables_net_ops);
/*
 * Module exit: unregisters from nfnetlink and the netdevice notifier, shuts
 * down the filter and route chain types and the per-netns operations,
 * synchronously cancels trans_destroy_work, then destroys the object name
 * hash table and the nf_tables core.
 */
8042 static void __exit nf_tables_module_exit(void)
8044 nfnetlink_subsys_unregister(&nf_tables_subsys);
8046 unregister_netdevice_notifier(&nf_tables_flowtable_notifier);
8047 nft_chain_filter_fini();
8048 nft_chain_route_fini();
8049 unregister_pernet_subsys(&nf_tables_net_ops);
8050 cancel_work_sync(&trans_destroy_work);
8052 rhltable_destroy(&nft_objname_ht);
8053 nf_tables_core_module_exit();
/* Module entry/exit registration, license, author and nfnetlink subsystem alias. */
8056 module_init(nf_tables_module_init);
8057 module_exit(nf_tables_module_exit);
8059 MODULE_LICENSE("GPL");
8060 MODULE_AUTHOR("Patrick McHardy <kaber@trash.net>");
8061 MODULE_ALIAS_NFNL_SUBSYS(NFNL_SUBSYS_NFTABLES);