2 * Copyright (c) 2007-2009 Patrick McHardy <kaber@trash.net>
4 * This program is free software; you can redistribute it and/or modify
5 * it under the terms of the GNU General Public License version 2 as
6 * published by the Free Software Foundation.
8 * Development of this code funded by Astaro AG (http://www.astaro.com/)
11 #include <linux/module.h>
12 #include <linux/init.h>
13 #include <linux/list.h>
14 #include <linux/skbuff.h>
15 #include <linux/netlink.h>
16 #include <linux/vmalloc.h>
17 #include <linux/netfilter.h>
18 #include <linux/netfilter/nfnetlink.h>
19 #include <linux/netfilter/nf_tables.h>
20 #include <net/netfilter/nf_flow_table.h>
21 #include <net/netfilter/nf_tables_core.h>
22 #include <net/netfilter/nf_tables.h>
23 #include <net/net_namespace.h>
/* File-scope state: three list heads (expressions, objects, flowtables) and
 * a 64-bit counter.  The counter is pre-incremented in nf_tables_newtable()
 * to give each newly created table its handle.
 */
26 static LIST_HEAD(nf_tables_expressions);
27 static LIST_HEAD(nf_tables_objects);
28 static LIST_HEAD(nf_tables_flowtables);
29 static u64 table_handle;
/* Initialise @ctx from an incoming netlink request.
 *
 * The assignments visible here record the sender's netlink port id (taken
 * from @skb), the report flag and the sequence number (both taken from @nlh).
 * NOTE(review): several lines of this function, including part of the
 * parameter list, are missing from this listing; @table, @chain and @nla are
 * presumably stored into @ctx as well -- confirm against the full source.
 */
31 static void nft_ctx_init(struct nft_ctx *ctx,
33 const struct sk_buff *skb,
34 const struct nlmsghdr *nlh,
36 struct nft_table *table,
37 struct nft_chain *chain,
38 const struct nlattr * const *nla)
45 ctx->portid = NETLINK_CB(skb).portid;
46 ctx->report = nlmsg_report(nlh);
47 ctx->seq = nlh->nlmsg_seq;
/* Allocate a zeroed transaction record with @size extra bytes following the
 * struct nft_trans header, using the caller-supplied @gfp flags, and tag it
 * with @msg_type.
 * NOTE(review): the allocation-failure check and the return statement are
 * not visible in this listing.
 */
50 static struct nft_trans *nft_trans_alloc_gfp(const struct nft_ctx *ctx,
51 int msg_type, u32 size, gfp_t gfp)
53 struct nft_trans *trans;
55 trans = kzalloc(sizeof(struct nft_trans) + size, gfp);
59 trans->msg_type = msg_type;
/* Convenience wrapper: nft_trans_alloc_gfp() with the allocation flags fixed
 * to GFP_KERNEL.
 */
65 static struct nft_trans *nft_trans_alloc(const struct nft_ctx *ctx,
66 int msg_type, u32 size)
68 return nft_trans_alloc_gfp(ctx, msg_type, size, GFP_KERNEL);
/* Unlink @trans from the list it is queued on.
 * NOTE(review): the rest of the body is not visible in this listing;
 * presumably @trans is freed afterwards -- confirm.
 */
71 static void nft_trans_destroy(struct nft_trans *trans)
73 list_del(&trans->list);
77 /* removal requests are queued in the commit_list, but not acted upon
78 * until after all new rules are in place.
80 * Therefore, nf_register_net_hook(net, &nat_hook) runs before pending
81 * nf_unregister_net_hook().
83 * nf_register_net_hook thus fails if a nat hook is already in place
84 * even if the conflicting hook is about to be removed.
86 * If a collision is detected, search the commit_list for a DELCHAIN matching
87 * the new nat hooknum; if we find one, the collision is temporary:
89 * Either transaction is aborted (new/colliding hook is removed), or
90 * transaction is committed (old hook is removed).
/* Decide whether a NAT hook collision reported for @ops can be tolerated.
 *
 * Walks @net's pending commit_list and inspects chain transactions
 * (NFT_MSG_NEWCHAIN / NFT_MSG_DELCHAIN) whose base chain carries a NAT hook
 * on the same protocol family and hook number as @ops.
 * NOTE(review): the statements taken on each branch (continue/return) are
 * missing from this listing, so the exact return values cannot be stated
 * from what is visible here.
 */
92 static bool nf_tables_allow_nat_conflict(const struct net *net,
93 const struct nf_hook_ops *ops)
95 const struct nft_trans *trans;
101 list_for_each_entry(trans, &net->nft.commit_list, list) {
102 const struct nf_hook_ops *pending_ops;
103 const struct nft_chain *pending;
105 if (trans->msg_type != NFT_MSG_NEWCHAIN &&
106 trans->msg_type != NFT_MSG_DELCHAIN)
109 pending = trans->ctx.chain;
110 if (!nft_is_base_chain(pending))
113 pending_ops = &nft_base_chain(pending)->ops;
114 if (pending_ops->nat_hook &&
115 pending_ops->pf == ops->pf &&
116 pending_ops->hooknum == ops->hooknum) {
117 /* other hook registration already pending? */
118 if (trans->msg_type == NFT_MSG_NEWCHAIN)
/* Register the netfilter hook of @chain in @net.
 *
 * The first test singles out dormant tables and non-base chains
 * (NOTE(review): the statement taken in that case is not visible here;
 * presumably nothing is registered).  If registration fails with -EBUSY and
 * nf_tables_allow_nat_conflict() accepts the collision, registration is
 * retried with ops->nat_hook cleared for the duration of the call and set
 * back to true afterwards.
 */
128 static int nf_tables_register_hook(struct net *net,
129 const struct nft_table *table,
130 struct nft_chain *chain)
132 struct nf_hook_ops *ops;
135 if (table->flags & NFT_TABLE_F_DORMANT ||
136 !nft_is_base_chain(chain))
139 ops = &nft_base_chain(chain)->ops;
140 ret = nf_register_net_hook(net, ops);
141 if (ret == -EBUSY && nf_tables_allow_nat_conflict(net, ops)) {
142 ops->nat_hook = false;
143 ret = nf_register_net_hook(net, ops);
144 ops->nat_hook = true;
/* Unregister the netfilter hook of @chain's base chain from @net.
 * A dormant-table / non-base-chain test precedes the call
 * (NOTE(review): the statement it guards is not visible in this listing;
 * presumably an early return).
 */
150 static void nf_tables_unregister_hook(struct net *net,
151 const struct nft_table *table,
152 struct nft_chain *chain)
154 if (table->flags & NFT_TABLE_F_DORMANT ||
155 !nft_is_base_chain(chain))
158 nf_unregister_net_hook(net, &nft_base_chain(chain)->ops);
/* Queue a table transaction of type @msg_type on the per-net commit_list.
 * For NFT_MSG_NEWTABLE, nft_activate_next() is applied to ctx->table before
 * the transaction is appended.
 * NOTE(review): the allocation-failure check and the return statement are
 * not visible in this listing.
 */
161 static int nft_trans_table_add(struct nft_ctx *ctx, int msg_type)
163 struct nft_trans *trans;
165 trans = nft_trans_alloc(ctx, msg_type, sizeof(struct nft_trans_table));
169 if (msg_type == NFT_MSG_NEWTABLE)
170 nft_activate_next(ctx->net, ctx->table);
172 list_add_tail(&trans->list, &ctx->net->nft.commit_list);
/* Queue an NFT_MSG_DELTABLE transaction for ctx->table and apply
 * nft_deactivate_next() to the table.
 * NOTE(review): the error check between the two calls and the return
 * statement are not visible in this listing.
 */
176 static int nft_deltable(struct nft_ctx *ctx)
180 err = nft_trans_table_add(ctx, NFT_MSG_DELTABLE);
184 nft_deactivate_next(ctx->net, ctx->table);
/* Queue a chain transaction of type @msg_type on the per-net commit_list.
 * For NFT_MSG_NEWCHAIN, nft_activate_next() is applied to ctx->chain before
 * the transaction is appended.
 * NOTE(review): the allocation-failure check and the return statement are
 * not visible in this listing.
 */
188 static int nft_trans_chain_add(struct nft_ctx *ctx, int msg_type)
190 struct nft_trans *trans;
192 trans = nft_trans_alloc(ctx, msg_type, sizeof(struct nft_trans_chain));
196 if (msg_type == NFT_MSG_NEWCHAIN)
197 nft_activate_next(ctx->net, ctx->chain);
199 list_add_tail(&trans->list, &ctx->net->nft.commit_list);
/* Queue an NFT_MSG_DELCHAIN transaction for ctx->chain and apply
 * nft_deactivate_next() to the chain.
 * NOTE(review): lines between the two calls (error check and possibly
 * other bookkeeping) and the return statement are missing from this listing.
 */
203 static int nft_delchain(struct nft_ctx *ctx)
207 err = nft_trans_chain_add(ctx, NFT_MSG_DELCHAIN);
212 nft_deactivate_next(ctx->net, ctx->chain);
/* Deactivate @rule via nft_deactivate_next(), but only if
 * nft_is_active_next() reports it as active; this is what prevents the same
 * rule from being deleted twice.
 * NOTE(review): the return type line and both return statements are not
 * visible in this listing.
 */
218 nf_tables_delrule_deactivate(struct nft_ctx *ctx, struct nft_rule *rule)
220 /* You cannot delete the same rule twice */
221 if (nft_is_active_next(ctx->net, rule)) {
222 nft_deactivate_next(ctx->net, rule);
/* Allocate a rule transaction of type @msg_type for @rule and append it to
 * the per-net commit_list.
 *
 * For NFT_MSG_NEWRULE requests that carry an NFTA_RULE_ID attribute, the id
 * is converted from network byte order and stored in the transaction.
 * NOTE(review): the allocation-failure check and the return statement are
 * not visible in this listing.
 */
229 static struct nft_trans *nft_trans_rule_add(struct nft_ctx *ctx, int msg_type,
230 struct nft_rule *rule)
232 struct nft_trans *trans;
234 trans = nft_trans_alloc(ctx, msg_type, sizeof(struct nft_trans_rule));
238 if (msg_type == NFT_MSG_NEWRULE && ctx->nla[NFTA_RULE_ID] != NULL) {
239 nft_trans_rule_id(trans) =
240 ntohl(nla_get_be32(ctx->nla[NFTA_RULE_ID]));
242 nft_trans_rule(trans) = rule;
243 list_add_tail(&trans->list, &ctx->net->nft.commit_list);
/* Queue an NFT_MSG_DELRULE transaction for @rule, then deactivate the rule
 * with nf_tables_delrule_deactivate().  The queued transaction is torn down
 * again with nft_trans_destroy() on a path whose condition is not visible
 * here (NOTE(review): presumably when deactivation fails -- confirm).
 */
248 static int nft_delrule(struct nft_ctx *ctx, struct nft_rule *rule)
250 struct nft_trans *trans;
253 trans = nft_trans_rule_add(ctx, NFT_MSG_DELRULE, rule);
257 err = nf_tables_delrule_deactivate(ctx, rule);
259 nft_trans_destroy(trans);
/* Call nft_delrule() on every rule linked on ctx->chain->rules.
 * NOTE(review): the handling of a failing nft_delrule() and the return
 * statement are not visible in this listing.
 */
266 static int nft_delrule_by_chain(struct nft_ctx *ctx)
268 struct nft_rule *rule;
271 list_for_each_entry(rule, &ctx->chain->rules, list) {
272 err = nft_delrule(ctx, rule);
/* Allocate a set transaction of type @msg_type and append it to the per-net
 * commit_list, recording the set it refers to.
 *
 * For NFT_MSG_NEWSET requests that carry NFTA_SET_ID, the id is converted
 * from network byte order and stored, and nft_activate_next() is applied to
 * the set.
 * NOTE(review): part of the parameter list, the allocation-failure check
 * and the return statement are missing from this listing.
 */
279 static int nft_trans_set_add(struct nft_ctx *ctx, int msg_type,
282 struct nft_trans *trans;
284 trans = nft_trans_alloc(ctx, msg_type, sizeof(struct nft_trans_set));
288 if (msg_type == NFT_MSG_NEWSET && ctx->nla[NFTA_SET_ID] != NULL) {
289 nft_trans_set_id(trans) =
290 ntohl(nla_get_be32(ctx->nla[NFTA_SET_ID]));
291 nft_activate_next(ctx->net, set);
293 nft_trans_set(trans) = set;
294 list_add_tail(&trans->list, &ctx->net->nft.commit_list);
/* Queue an NFT_MSG_DELSET transaction for @set and apply
 * nft_deactivate_next() to it.
 * NOTE(review): lines between the two calls and the return statement are
 * missing from this listing.
 */
299 static int nft_delset(struct nft_ctx *ctx, struct nft_set *set)
303 err = nft_trans_set_add(ctx, NFT_MSG_DELSET, set);
307 nft_deactivate_next(ctx->net, set);
/* Allocate an object transaction of type @msg_type for @obj and append it
 * to the per-net commit_list.  For NFT_MSG_NEWOBJ, nft_activate_next() is
 * applied to @obj first.
 * NOTE(review): the allocation-failure check and the return statement are
 * not visible in this listing.
 */
313 static int nft_trans_obj_add(struct nft_ctx *ctx, int msg_type,
314 struct nft_object *obj)
316 struct nft_trans *trans;
318 trans = nft_trans_alloc(ctx, msg_type, sizeof(struct nft_trans_obj));
322 if (msg_type == NFT_MSG_NEWOBJ)
323 nft_activate_next(ctx->net, obj);
325 nft_trans_obj(trans) = obj;
326 list_add_tail(&trans->list, &ctx->net->nft.commit_list);
/* Queue an NFT_MSG_DELOBJ transaction for @obj and apply
 * nft_deactivate_next() to it.
 * NOTE(review): lines between the two calls and the return statement are
 * missing from this listing.
 */
331 static int nft_delobj(struct nft_ctx *ctx, struct nft_object *obj)
335 err = nft_trans_obj_add(ctx, NFT_MSG_DELOBJ, obj);
339 nft_deactivate_next(ctx->net, obj);
/* Allocate a flowtable transaction of type @msg_type for @flowtable and
 * append it to the per-net commit_list.  For NFT_MSG_NEWFLOWTABLE,
 * nft_activate_next() is applied to @flowtable first.
 * NOTE(review): the allocation-failure check and the return statement are
 * not visible in this listing.
 */
345 static int nft_trans_flowtable_add(struct nft_ctx *ctx, int msg_type,
346 struct nft_flowtable *flowtable)
348 struct nft_trans *trans;
350 trans = nft_trans_alloc(ctx, msg_type,
351 sizeof(struct nft_trans_flowtable));
355 if (msg_type == NFT_MSG_NEWFLOWTABLE)
356 nft_activate_next(ctx->net, flowtable);
358 nft_trans_flowtable(trans) = flowtable;
359 list_add_tail(&trans->list, &ctx->net->nft.commit_list);
/* Queue an NFT_MSG_DELFLOWTABLE transaction for @flowtable and apply
 * nft_deactivate_next() to it.
 * NOTE(review): lines between the two calls and the return statement are
 * missing from this listing.
 */
364 static int nft_delflowtable(struct nft_ctx *ctx,
365 struct nft_flowtable *flowtable)
369 err = nft_trans_flowtable_add(ctx, NFT_MSG_DELFLOWTABLE, flowtable);
373 nft_deactivate_next(ctx->net, flowtable);
/* Find a table in @net by name.
 *
 * A table matches when its name equals the string in @nla, its family equals
 * @family and nft_active_genmask() accepts it for @genmask.
 * Returns ERR_PTR(-ENOENT) when the walk over net->nft.tables finds nothing.
 * An ERR_PTR(-EINVAL) return precedes the walk (NOTE(review): its condition
 * is not visible here; presumably a NULL @nla).  The success return is also
 * not visible in this listing.
 */
383 static struct nft_table *nft_table_lookup(const struct net *net,
384 const struct nlattr *nla,
385 u8 family, u8 genmask)
387 struct nft_table *table;
390 return ERR_PTR(-EINVAL);
392 list_for_each_entry(table, &net->nft.tables, list) {
393 if (!nla_strcmp(nla, table->name) &&
394 table->family == family &&
395 nft_active_genmask(table, genmask))
399 return ERR_PTR(-ENOENT);
/* Find a table in @net by handle.
 *
 * The 64-bit handle is read from @nla in big-endian form and compared with
 * table->handle; the table must also be accepted by nft_active_genmask().
 * Returns ERR_PTR(-ENOENT) when no table matches.  No family comparison is
 * visible in this lookup.
 * NOTE(review): part of the parameter list and the success return are
 * missing from this listing.
 */
402 static struct nft_table *nft_table_lookup_byhandle(const struct net *net,
403 const struct nlattr *nla,
406 struct nft_table *table;
408 list_for_each_entry(table, &net->nft.tables, list) {
409 if (be64_to_cpu(nla_get_be64(nla)) == table->handle &&
410 nft_active_genmask(table, genmask))
414 return ERR_PTR(-ENOENT);
/* Hand out the next handle for @table by pre-incrementing its hgenerator
 * counter; the incremented value is returned.
 */
417 static inline u64 nf_tables_alloc_handle(struct nft_table *table)
419 return ++table->hgenerator;
/* Registered chain types, indexed by [family][type]; slots are filled by
 * nft_register_chain_type() and cleared by nft_unregister_chain_type().
 */
422 static const struct nft_chain_type *chain_type[NFPROTO_NUMPROTO][NFT_CHAIN_T_MAX];
/* Scan the registered chain types of @family and return the one whose name
 * equals the string in @nla.
 * NOTE(review): the return taken when nothing matches is not visible in
 * this listing.
 */
424 static const struct nft_chain_type *
425 __nf_tables_chain_type_lookup(const struct nlattr *nla, u8 family)
429 for (i = 0; i < NFT_CHAIN_T_MAX; i++) {
430 if (chain_type[family][i] != NULL &&
431 !nla_strcmp(nla, chain_type[family][i]->name))
432 return chain_type[family][i];
/* Look up a chain type by name, optionally trying to load a module for it.
 *
 * With CONFIG_MODULES, the nfnetlink subsystem lock is dropped around
 * request_module("nft-chain-<family>-<name>") and re-taken afterwards, then
 * the lookup is repeated.  ERR_PTR(-EAGAIN) and ERR_PTR(-ENOENT) are the
 * visible error returns.
 * NOTE(review): the conditions guarding the module request (presumably
 * @autoload) and the -EAGAIN return, as well as the success return, are
 * missing from this listing.
 */
437 static const struct nft_chain_type *
438 nf_tables_chain_type_lookup(const struct nlattr *nla, u8 family, bool autoload)
440 const struct nft_chain_type *type;
442 type = __nf_tables_chain_type_lookup(nla, family);
445 #ifdef CONFIG_MODULES
447 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
448 request_module("nft-chain-%u-%.*s", family,
449 nla_len(nla), (const char *)nla_data(nla));
450 nfnl_lock(NFNL_SUBSYS_NFTABLES);
451 type = __nf_tables_chain_type_lookup(nla, family);
453 return ERR_PTR(-EAGAIN);
456 return ERR_PTR(-ENOENT);
/* Netlink attribute policy for table messages: the name is a string of at
 * most NFT_TABLE_MAXNAMELEN - 1 bytes, the flags are a u32 and the handle is
 * a u64.
 */
459 static const struct nla_policy nft_table_policy[NFTA_TABLE_MAX + 1] = {
460 [NFTA_TABLE_NAME] = { .type = NLA_STRING,
461 .len = NFT_TABLE_MAXNAMELEN - 1 },
462 [NFTA_TABLE_FLAGS] = { .type = NLA_U32 },
463 [NFTA_TABLE_HANDLE] = { .type = NLA_U64 },
/* Serialise @table into a netlink message appended to @skb.
 *
 * The message header is built with nlmsg_put() and carries a struct nfgenmsg
 * holding @family, NFNETLINK_V0 and the low 16 bits of net->nft.base_seq in
 * network byte order.  The attributes emitted are the table name, flags, use
 * count and handle (the latter three in network/big-endian byte order).
 * Any failure jumps to nla_put_failure; nlmsg_trim() is the visible cleanup.
 * NOTE(review): the labels, the nlmsg_end() call and the return statements
 * are missing from this listing.
 */
466 static int nf_tables_fill_table_info(struct sk_buff *skb, struct net *net,
467 u32 portid, u32 seq, int event, u32 flags,
468 int family, const struct nft_table *table)
470 struct nlmsghdr *nlh;
471 struct nfgenmsg *nfmsg;
473 event = nfnl_msg_type(NFNL_SUBSYS_NFTABLES, event);
474 nlh = nlmsg_put(skb, portid, seq, event, sizeof(struct nfgenmsg), flags);
476 goto nla_put_failure;
478 nfmsg = nlmsg_data(nlh);
479 nfmsg->nfgen_family = family;
480 nfmsg->version = NFNETLINK_V0;
481 nfmsg->res_id = htons(net->nft.base_seq & 0xffff);
483 if (nla_put_string(skb, NFTA_TABLE_NAME, table->name) ||
484 nla_put_be32(skb, NFTA_TABLE_FLAGS, htonl(table->flags)) ||
485 nla_put_be32(skb, NFTA_TABLE_USE, htonl(table->use)) ||
486 nla_put_be64(skb, NFTA_TABLE_HANDLE, cpu_to_be64(table->handle),
488 goto nla_put_failure;
494 nlmsg_trim(skb, nlh);
/* Send a table @event notification to the NFNLGRP_NFTABLES multicast group.
 *
 * A new skb is allocated, filled by nf_tables_fill_table_info() from @ctx
 * and handed to nfnetlink_send().  nfnetlink_set_err() with -ENOBUFS is the
 * visible error path.
 * NOTE(review): the first half of the early-exit condition (only the
 * "no listeners" half is visible), the error checks and the labels are
 * missing from this listing.
 */
498 static void nf_tables_table_notify(const struct nft_ctx *ctx, int event)
504 !nfnetlink_has_listeners(ctx->net, NFNLGRP_NFTABLES))
507 skb = nlmsg_new(NLMSG_GOODSIZE, GFP_KERNEL);
511 err = nf_tables_fill_table_info(skb, ctx->net, ctx->portid, ctx->seq,
512 event, 0, ctx->family, ctx->table);
518 nfnetlink_send(skb, ctx->net, ctx->portid, NFNLGRP_NFTABLES,
519 ctx->report, GFP_KERNEL);
522 nfnetlink_set_err(ctx->net, ctx->portid, NFNLGRP_NFTABLES, -ENOBUFS);
/* Netlink dump callback that emits one NFT_MSG_NEWTABLE message per table.
 *
 * The resume index is read from cb->args[0] and cb->seq is set from
 * net->nft.base_seq.  Tables are walked with list_for_each_entry_rcu();
 * a family filter applies unless the request family is NFPROTO_UNSPEC, and
 * nft_is_active() is tested before a table is serialised with NLM_F_MULTI.
 * nl_dump_check_consistent() is called on the message header.
 * NOTE(review): the index bookkeeping, the branch bodies (continue/goto),
 * RCU lock calls and the return statement are missing from this listing.
 */
525 static int nf_tables_dump_tables(struct sk_buff *skb,
526 struct netlink_callback *cb)
528 const struct nfgenmsg *nfmsg = nlmsg_data(cb->nlh);
529 const struct nft_table *table;
530 unsigned int idx = 0, s_idx = cb->args[0];
531 struct net *net = sock_net(skb->sk);
532 int family = nfmsg->nfgen_family;
535 cb->seq = net->nft.base_seq;
537 list_for_each_entry_rcu(table, &net->nft.tables, list) {
538 if (family != NFPROTO_UNSPEC && family != table->family)
/* clear every callback argument slot after args[0] */
544 memset(&cb->args[1], 0,
545 sizeof(cb->args) - sizeof(cb->args[0]));
546 if (!nft_is_active(net, table))
548 if (nf_tables_fill_table_info(skb, net,
549 NETLINK_CB(cb->skb).portid,
551 NFT_MSG_NEWTABLE, NLM_F_MULTI,
552 table->family, table) < 0)
555 nl_dump_check_consistent(cb, nlmsg_hdr(skb));
/* Handler for table "get" requests.
 *
 * With NLM_F_DUMP set, a netlink dump driven by nf_tables_dump_tables() is
 * started.  Otherwise the table named by NFTA_TABLE_NAME is looked up using
 * the current generation mask; on lookup failure the attribute is reported
 * through @extack and the error code is returned.  On success a reply skb is
 * allocated, filled as an NFT_MSG_NEWTABLE message and unicast back to the
 * requesting port.
 * NOTE(review): allocation/fill error handling and some argument lines are
 * missing from this listing.
 */
565 static int nf_tables_gettable(struct net *net, struct sock *nlsk,
566 struct sk_buff *skb, const struct nlmsghdr *nlh,
567 const struct nlattr * const nla[],
568 struct netlink_ext_ack *extack)
570 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
571 u8 genmask = nft_genmask_cur(net);
572 const struct nft_table *table;
573 struct sk_buff *skb2;
574 int family = nfmsg->nfgen_family;
577 if (nlh->nlmsg_flags & NLM_F_DUMP) {
578 struct netlink_dump_control c = {
579 .dump = nf_tables_dump_tables,
581 return netlink_dump_start(nlsk, skb, nlh, &c);
584 table = nft_table_lookup(net, nla[NFTA_TABLE_NAME], family, genmask);
586 NL_SET_BAD_ATTR(extack, nla[NFTA_TABLE_NAME]);
587 return PTR_ERR(table);
590 skb2 = alloc_skb(NLMSG_GOODSIZE, GFP_KERNEL);
594 err = nf_tables_fill_table_info(skb2, net, NETLINK_CB(skb).portid,
595 nlh->nlmsg_seq, NFT_MSG_NEWTABLE, 0,
600 return nlmsg_unicast(nlsk, skb2, NETLINK_CB(skb).portid);
/* Unregister the hooks of @table's base chains.
 *
 * Chains are tested with nft_is_active_next() and nft_is_base_chain() before
 * their hook is unregistered.  A non-zero @cnt bounds the walk: the test
 * "cnt && i++ == cnt" fires once @cnt chains have been counted
 * (NOTE(review): the statement it guards is not visible; presumably a
 * break).  @cnt == 0 means no bound.
 */
607 static void nft_table_disable(struct net *net, struct nft_table *table, u32 cnt)
609 struct nft_chain *chain;
612 list_for_each_entry(chain, &table->chains, list) {
613 if (!nft_is_active_next(net, chain))
615 if (!nft_is_base_chain(chain))
618 if (cnt && i++ == cnt)
621 nf_unregister_net_hook(net, &nft_base_chain(chain)->ops);
/* Register the hooks of @table's base chains.
 *
 * Chains are tested with nft_is_active_next() and nft_is_base_chain() before
 * nf_register_net_hook() is called.  The trailing nft_table_disable(net,
 * table, i) call undoes registrations (NOTE(review): the error check, the
 * counter update and the label leading to it are not visible; presumably
 * this is the failure rollback with i = number of hooks registered so far).
 */
625 static int nf_tables_table_enable(struct net *net, struct nft_table *table)
627 struct nft_chain *chain;
630 list_for_each_entry(chain, &table->chains, list) {
631 if (!nft_is_active_next(net, chain))
633 if (!nft_is_base_chain(chain))
636 err = nf_register_net_hook(net, &nft_base_chain(chain)->ops);
645 nft_table_disable(net, table, i);
/* Disable @table by calling nft_table_disable() with a count of 0, i.e.
 * without the chain-count bound.
 */
649 static void nf_tables_table_disable(struct net *net, struct nft_table *table)
651 nft_table_disable(net, table, 0);
/* Update the flags of an existing table (ctx->table) from NFTA_TABLE_FLAGS.
 *
 * Visible steps: the attribute's presence is tested, the flags are read in
 * host byte order, bits other than NFT_TABLE_F_DORMANT are tested for, and
 * the new flags are compared with the current ones.  An NFT_MSG_NEWTABLE
 * transaction is then allocated.  When the table becomes dormant the
 * transaction records enable = false; when it stops being dormant the
 * table's hooks are registered via nf_tables_table_enable(), the DORMANT
 * bit is cleared and the transaction records enable = true.  The
 * transaction is flagged as an update and queued on the commit_list;
 * nft_trans_destroy() is the visible error cleanup.
 * NOTE(review): the return values of the early tests, the error checks and
 * the labels are missing from this listing.
 */
654 static int nf_tables_updtable(struct nft_ctx *ctx)
656 struct nft_trans *trans;
660 if (!ctx->nla[NFTA_TABLE_FLAGS])
663 flags = ntohl(nla_get_be32(ctx->nla[NFTA_TABLE_FLAGS]));
664 if (flags & ~NFT_TABLE_F_DORMANT)
667 if (flags == ctx->table->flags)
670 trans = nft_trans_alloc(ctx, NFT_MSG_NEWTABLE,
671 sizeof(struct nft_trans_table));
675 if ((flags & NFT_TABLE_F_DORMANT) &&
676 !(ctx->table->flags & NFT_TABLE_F_DORMANT)) {
677 nft_trans_table_enable(trans) = false;
678 } else if (!(flags & NFT_TABLE_F_DORMANT) &&
679 ctx->table->flags & NFT_TABLE_F_DORMANT) {
680 ret = nf_tables_table_enable(ctx->net, ctx->table);
682 ctx->table->flags &= ~NFT_TABLE_F_DORMANT;
683 nft_trans_table_enable(trans) = true;
689 nft_trans_table_update(trans) = true;
690 list_add_tail(&trans->list, &ctx->net->nft.commit_list);
693 nft_trans_destroy(trans);
/* Handler for table creation / update requests.
 *
 * The table named by NFTA_TABLE_NAME is looked up with the next-generation
 * mask.  Lookup errors other than -ENOENT are returned.  The NLM_F_EXCL and
 * NLM_F_REPLACE request flags are tested, and nf_tables_updtable() is used
 * to update a table (NOTE(review): the surrounding branch structure is not
 * visible; presumably this is the "table already exists" path).
 *
 * For a new table: optional NFTA_TABLE_FLAGS are validated against
 * NFT_TABLE_F_DORMANT, the table is allocated zeroed, its name duplicated
 * from the attribute, its four lists initialised, family/flags stored and a
 * handle taken from the pre-incremented global table_handle.  A NEWTABLE
 * transaction is queued and the table is appended to net->nft.tables with
 * list_add_tail_rcu().
 * NOTE(review): error checks, cleanup labels and return statements are
 * missing from this listing.
 */
697 static int nf_tables_newtable(struct net *net, struct sock *nlsk,
698 struct sk_buff *skb, const struct nlmsghdr *nlh,
699 const struct nlattr * const nla[],
700 struct netlink_ext_ack *extack)
702 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
703 u8 genmask = nft_genmask_next(net);
704 int family = nfmsg->nfgen_family;
705 const struct nlattr *attr;
706 struct nft_table *table;
711 attr = nla[NFTA_TABLE_NAME];
712 table = nft_table_lookup(net, attr, family, genmask);
714 if (PTR_ERR(table) != -ENOENT)
715 return PTR_ERR(table);
717 if (nlh->nlmsg_flags & NLM_F_EXCL) {
718 NL_SET_BAD_ATTR(extack, attr);
721 if (nlh->nlmsg_flags & NLM_F_REPLACE)
724 nft_ctx_init(&ctx, net, skb, nlh, family, table, NULL, nla);
725 return nf_tables_updtable(&ctx);
728 if (nla[NFTA_TABLE_FLAGS]) {
729 flags = ntohl(nla_get_be32(nla[NFTA_TABLE_FLAGS]));
730 if (flags & ~NFT_TABLE_F_DORMANT)
735 table = kzalloc(sizeof(*table), GFP_KERNEL);
739 table->name = nla_strdup(attr, GFP_KERNEL);
740 if (table->name == NULL)
743 INIT_LIST_HEAD(&table->chains);
744 INIT_LIST_HEAD(&table->sets);
745 INIT_LIST_HEAD(&table->objects);
746 INIT_LIST_HEAD(&table->flowtables);
747 table->family = family;
748 table->flags = flags;
749 table->handle = ++table_handle;
751 nft_ctx_init(&ctx, net, skb, nlh, family, table, NULL, nla);
752 err = nft_trans_table_add(&ctx, NFT_MSG_NEWTABLE);
756 list_add_tail_rcu(&table->list, &net->nft.tables);
/* Queue deletion of everything contained in ctx->table, then of the table
 * itself.
 *
 * Order of the visible passes: rules (per chain, via nft_delrule_by_chain()),
 * sets, flowtables, objects, chains, and finally nft_deltable().  Chains and
 * sets are tested with nft_is_active_next(); anonymous sets that still have
 * bindings are tested for separately (NOTE(review): the statement taken is
 * not visible; presumably they are skipped).
 * NOTE(review): the assignments of ctx->chain, the error checks and the
 * return statement are missing from this listing.
 */
766 static int nft_flush_table(struct nft_ctx *ctx)
768 struct nft_flowtable *flowtable, *nft;
769 struct nft_chain *chain, *nc;
770 struct nft_object *obj, *ne;
771 struct nft_set *set, *ns;
774 list_for_each_entry(chain, &ctx->table->chains, list) {
775 if (!nft_is_active_next(ctx->net, chain))
780 err = nft_delrule_by_chain(ctx);
785 list_for_each_entry_safe(set, ns, &ctx->table->sets, list) {
786 if (!nft_is_active_next(ctx->net, set))
789 if (nft_set_is_anonymous(set) &&
790 !list_empty(&set->bindings))
793 err = nft_delset(ctx, set);
798 list_for_each_entry_safe(flowtable, nft, &ctx->table->flowtables, list) {
799 err = nft_delflowtable(ctx, flowtable);
804 list_for_each_entry_safe(obj, ne, &ctx->table->objects, list) {
805 err = nft_delobj(ctx, obj);
810 list_for_each_entry_safe(chain, nc, &ctx->table->chains, list) {
811 if (!nft_is_active_next(ctx->net, chain))
816 err = nft_delchain(ctx);
821 err = nft_deltable(ctx);
/* Flush every table of ctx->net that passes the request's filters.
 *
 * A family filter applies unless @family is AF_UNSPEC; ctx->family is set
 * to the family of the table being visited; tables are tested with
 * nft_is_active_next(); and, when NFTA_TABLE_NAME is present, the table name
 * is compared against it.  Surviving tables are passed to nft_flush_table().
 * NOTE(review): the branch bodies, the assignment of ctx->table, error
 * handling and the return statement are missing from this listing.
 */
826 static int nft_flush(struct nft_ctx *ctx, int family)
828 struct nft_table *table, *nt;
829 const struct nlattr * const *nla = ctx->nla;
832 list_for_each_entry_safe(table, nt, &ctx->net->nft.tables, list) {
833 if (family != AF_UNSPEC && table->family != family)
836 ctx->family = table->family;
838 if (!nft_is_active_next(ctx->net, table))
841 if (nla[NFTA_TABLE_NAME] &&
842 nla_strcmp(nla[NFTA_TABLE_NAME], table->name) != 0)
847 err = nft_flush_table(ctx);
/* Handler for table deletion requests.
 *
 * If the request family is AF_UNSPEC, or neither NFTA_TABLE_NAME nor
 * NFTA_TABLE_HANDLE is given, the request is treated as a flush via
 * nft_flush().  Otherwise the table is looked up by handle when
 * NFTA_TABLE_HANDLE is present, else by name, using the next-generation
 * mask; a failed lookup reports the offending attribute through @extack and
 * returns the error.  The table is finally flushed with nft_flush_table().
 * NOTE(review): the second half of the NLM_F_NONREC test, its result, and
 * the assignments of ctx.family / ctx.table are missing from this listing.
 */
855 static int nf_tables_deltable(struct net *net, struct sock *nlsk,
856 struct sk_buff *skb, const struct nlmsghdr *nlh,
857 const struct nlattr * const nla[],
858 struct netlink_ext_ack *extack)
860 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
861 u8 genmask = nft_genmask_next(net);
862 int family = nfmsg->nfgen_family;
863 const struct nlattr *attr;
864 struct nft_table *table;
867 nft_ctx_init(&ctx, net, skb, nlh, 0, NULL, NULL, nla);
868 if (family == AF_UNSPEC ||
869 (!nla[NFTA_TABLE_NAME] && !nla[NFTA_TABLE_HANDLE]))
870 return nft_flush(&ctx, family);
872 if (nla[NFTA_TABLE_HANDLE]) {
873 attr = nla[NFTA_TABLE_HANDLE];
874 table = nft_table_lookup_byhandle(net, attr, genmask);
876 attr = nla[NFTA_TABLE_NAME];
877 table = nft_table_lookup(net, attr, family, genmask);
881 NL_SET_BAD_ATTR(extack, attr);
882 return PTR_ERR(table);
885 if (nlh->nlmsg_flags & NLM_F_NONREC &&
892 return nft_flush_table(&ctx);
/* Release ctx->table.  The table must no longer be in use: a non-zero use
 * count triggers BUG_ON().  The table name is freed here.
 * NOTE(review): the freeing of the table structure itself is not visible in
 * this listing.
 */
895 static void nf_tables_table_destroy(struct nft_ctx *ctx)
897 BUG_ON(ctx->table->use > 0);
899 kfree(ctx->table->name);
/* Register @ctype in the chain_type table at [ctype->family][ctype->type].
 *
 * An out-of-range family and an already occupied slot each raise WARN_ON();
 * in the occupied case the subsystem lock is dropped again before the store
 * (NOTE(review): the return statements on both warning paths are not
 * visible in this listing).  The slot update is done while holding the
 * NFNL_SUBSYS_NFTABLES lock.
 */
903 void nft_register_chain_type(const struct nft_chain_type *ctype)
905 if (WARN_ON(ctype->family >= NFPROTO_NUMPROTO))
908 nfnl_lock(NFNL_SUBSYS_NFTABLES);
909 if (WARN_ON(chain_type[ctype->family][ctype->type] != NULL)) {
910 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
913 chain_type[ctype->family][ctype->type] = ctype;
914 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
916 EXPORT_SYMBOL_GPL(nft_register_chain_type);
/* Clear the chain_type slot at [ctype->family][ctype->type] while holding
 * the NFNL_SUBSYS_NFTABLES lock.  No range check on the family is visible
 * here.
 */
918 void nft_unregister_chain_type(const struct nft_chain_type *ctype)
920 nfnl_lock(NFNL_SUBSYS_NFTABLES);
921 chain_type[ctype->family][ctype->type] = NULL;
922 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
924 EXPORT_SYMBOL_GPL(nft_unregister_chain_type);
/* Find a chain of @table by @handle.  The chain must also be accepted by
 * nft_active_genmask() for @genmask.  Returns ERR_PTR(-ENOENT) when no
 * chain matches.
 * NOTE(review): the success return is not visible in this listing.
 */
930 static struct nft_chain *
931 nft_chain_lookup_byhandle(const struct nft_table *table, u64 handle, u8 genmask)
933 struct nft_chain *chain;
935 list_for_each_entry(chain, &table->chains, list) {
936 if (chain->handle == handle &&
937 nft_active_genmask(chain, genmask))
941 return ERR_PTR(-ENOENT);
/* Find a chain of @table by the name carried in @nla.  The chain must also
 * be accepted by nft_active_genmask() for @genmask.  Returns
 * ERR_PTR(-ENOENT) when no chain matches.  An ERR_PTR(-EINVAL) return
 * precedes the walk (NOTE(review): its condition is not visible here;
 * presumably a NULL @nla).  The success return is also not visible.
 */
944 static struct nft_chain *nft_chain_lookup(const struct nft_table *table,
945 const struct nlattr *nla, u8 genmask)
947 struct nft_chain *chain;
950 return ERR_PTR(-EINVAL);
952 list_for_each_entry(chain, &table->chains, list) {
953 if (!nla_strcmp(nla, chain->name) &&
954 nft_active_genmask(chain, genmask))
958 return ERR_PTR(-ENOENT);
/* Netlink attribute policy for chain messages.  Table and chain names are
 * length-bounded strings, the handle is a u64, the policy a u32, the type an
 * unbounded string, and hook and counters are nested attributes.
 */
961 static const struct nla_policy nft_chain_policy[NFTA_CHAIN_MAX + 1] = {
962 [NFTA_CHAIN_TABLE] = { .type = NLA_STRING,
963 .len = NFT_TABLE_MAXNAMELEN - 1 },
964 [NFTA_CHAIN_HANDLE] = { .type = NLA_U64 },
965 [NFTA_CHAIN_NAME] = { .type = NLA_STRING,
966 .len = NFT_CHAIN_MAXNAMELEN - 1 },
967 [NFTA_CHAIN_HOOK] = { .type = NLA_NESTED },
968 [NFTA_CHAIN_POLICY] = { .type = NLA_U32 },
969 [NFTA_CHAIN_TYPE] = { .type = NLA_STRING },
970 [NFTA_CHAIN_COUNTERS] = { .type = NLA_NESTED },
/* Netlink attribute policy for the nested hook description: hook number and
 * priority are u32 values, the device name is a string of at most
 * IFNAMSIZ - 1 bytes.
 */
973 static const struct nla_policy nft_hook_policy[NFTA_HOOK_MAX + 1] = {
974 [NFTA_HOOK_HOOKNUM] = { .type = NLA_U32 },
975 [NFTA_HOOK_PRIORITY] = { .type = NLA_U32 },
976 [NFTA_HOOK_DEV] = { .type = NLA_STRING,
977 .len = IFNAMSIZ - 1 },
/* Emit the chain counters as a nested NFTA_CHAIN_COUNTERS attribute.
 *
 * The per-CPU counters in @stats are read for every possible CPU inside a
 * u64_stats fetch_begin/fetch_retry loop and summed into a local total,
 * which is then written as big-endian 64-bit packet and byte attributes.
 * NOTE(review): only the byte accumulation is visible; the packet
 * accumulation, the loop opener, the failure label and the return statements
 * are missing from this listing.
 */
980 static int nft_dump_stats(struct sk_buff *skb, struct nft_stats __percpu *stats)
982 struct nft_stats *cpu_stats, total;
988 memset(&total, 0, sizeof(total));
989 for_each_possible_cpu(cpu) {
990 cpu_stats = per_cpu_ptr(stats, cpu);
992 seq = u64_stats_fetch_begin_irq(&cpu_stats->syncp);
993 pkts = cpu_stats->pkts;
994 bytes = cpu_stats->bytes;
995 } while (u64_stats_fetch_retry_irq(&cpu_stats->syncp, seq));
997 total.bytes += bytes;
999 nest = nla_nest_start(skb, NFTA_CHAIN_COUNTERS);
1001 goto nla_put_failure;
1003 if (nla_put_be64(skb, NFTA_COUNTER_PACKETS, cpu_to_be64(total.pkts),
1004 NFTA_COUNTER_PAD) ||
1005 nla_put_be64(skb, NFTA_COUNTER_BYTES, cpu_to_be64(total.bytes),
1007 goto nla_put_failure;
1009 nla_nest_end(skb, nest);
/* Serialise @chain (belonging to @table) into a netlink message on @skb.
 *
 * The header carries a struct nfgenmsg with @family, NFNETLINK_V0 and the
 * low 16 bits of net->nft.base_seq.  Attributes emitted for every chain:
 * table name, chain handle, chain name and use count.  Base chains
 * additionally get a nested NFTA_CHAIN_HOOK (hook number, priority and,
 * when set, the device name), the policy, the chain type name and, if
 * per-CPU stats exist, the counters via nft_dump_stats().
 * Every failure jumps to nla_put_failure, where the message is trimmed.
 * NOTE(review): labels, some argument lines and the return statements are
 * missing from this listing.
 */
1016 static int nf_tables_fill_chain_info(struct sk_buff *skb, struct net *net,
1017 u32 portid, u32 seq, int event, u32 flags,
1018 int family, const struct nft_table *table,
1019 const struct nft_chain *chain)
1021 struct nlmsghdr *nlh;
1022 struct nfgenmsg *nfmsg;
1024 event = nfnl_msg_type(NFNL_SUBSYS_NFTABLES, event);
1025 nlh = nlmsg_put(skb, portid, seq, event, sizeof(struct nfgenmsg), flags);
1027 goto nla_put_failure;
1029 nfmsg = nlmsg_data(nlh);
1030 nfmsg->nfgen_family = family;
1031 nfmsg->version = NFNETLINK_V0;
1032 nfmsg->res_id = htons(net->nft.base_seq & 0xffff);
1034 if (nla_put_string(skb, NFTA_CHAIN_TABLE, table->name))
1035 goto nla_put_failure;
1036 if (nla_put_be64(skb, NFTA_CHAIN_HANDLE, cpu_to_be64(chain->handle),
1038 goto nla_put_failure;
1039 if (nla_put_string(skb, NFTA_CHAIN_NAME, chain->name))
1040 goto nla_put_failure;
/* hook, policy, type and counters only exist for base chains */
1042 if (nft_is_base_chain(chain)) {
1043 const struct nft_base_chain *basechain = nft_base_chain(chain);
1044 const struct nf_hook_ops *ops = &basechain->ops;
1045 struct nlattr *nest;
1047 nest = nla_nest_start(skb, NFTA_CHAIN_HOOK);
1049 goto nla_put_failure;
1050 if (nla_put_be32(skb, NFTA_HOOK_HOOKNUM, htonl(ops->hooknum)))
1051 goto nla_put_failure;
1052 if (nla_put_be32(skb, NFTA_HOOK_PRIORITY, htonl(ops->priority)))
1053 goto nla_put_failure;
1054 if (basechain->dev_name[0] &&
1055 nla_put_string(skb, NFTA_HOOK_DEV, basechain->dev_name))
1056 goto nla_put_failure;
1057 nla_nest_end(skb, nest);
1059 if (nla_put_be32(skb, NFTA_CHAIN_POLICY,
1060 htonl(basechain->policy)))
1061 goto nla_put_failure;
1063 if (nla_put_string(skb, NFTA_CHAIN_TYPE, basechain->type->name))
1064 goto nla_put_failure;
1066 if (basechain->stats && nft_dump_stats(skb, basechain->stats))
1067 goto nla_put_failure;
1070 if (nla_put_be32(skb, NFTA_CHAIN_USE, htonl(chain->use)))
1071 goto nla_put_failure;
1073 nlmsg_end(skb, nlh);
1077 nlmsg_trim(skb, nlh);
/* Send a chain @event notification to the NFNLGRP_NFTABLES multicast group.
 *
 * A new skb is allocated, filled by nf_tables_fill_chain_info() from @ctx
 * and handed to nfnetlink_send().  nfnetlink_set_err() with -ENOBUFS is the
 * visible error path.
 * NOTE(review): the first half of the early-exit condition, the error
 * checks and the labels are missing from this listing.
 */
1081 static void nf_tables_chain_notify(const struct nft_ctx *ctx, int event)
1083 struct sk_buff *skb;
1087 !nfnetlink_has_listeners(ctx->net, NFNLGRP_NFTABLES))
1090 skb = nlmsg_new(NLMSG_GOODSIZE, GFP_KERNEL);
1094 err = nf_tables_fill_chain_info(skb, ctx->net, ctx->portid, ctx->seq,
1095 event, 0, ctx->family, ctx->table,
1102 nfnetlink_send(skb, ctx->net, ctx->portid, NFNLGRP_NFTABLES,
1103 ctx->report, GFP_KERNEL);
1106 nfnetlink_set_err(ctx->net, ctx->portid, NFNLGRP_NFTABLES, -ENOBUFS);
/* Netlink dump callback that emits one message per chain of every table.
 *
 * The resume index is read from cb->args[0] and cb->seq is set from
 * net->nft.base_seq.  Tables and their chains are walked with
 * list_for_each_entry_rcu(); a family filter applies unless the request
 * family is NFPROTO_UNSPEC, and nft_is_active() is tested before a chain is
 * serialised.  nl_dump_check_consistent() is called on the message header.
 * NOTE(review): the index bookkeeping, branch bodies, several argument
 * lines and the return statement are missing from this listing.
 */
1109 static int nf_tables_dump_chains(struct sk_buff *skb,
1110 struct netlink_callback *cb)
1112 const struct nfgenmsg *nfmsg = nlmsg_data(cb->nlh);
1113 const struct nft_table *table;
1114 const struct nft_chain *chain;
1115 unsigned int idx = 0, s_idx = cb->args[0];
1116 struct net *net = sock_net(skb->sk);
1117 int family = nfmsg->nfgen_family;
1120 cb->seq = net->nft.base_seq;
1122 list_for_each_entry_rcu(table, &net->nft.tables, list) {
1123 if (family != NFPROTO_UNSPEC && family != table->family)
1126 list_for_each_entry_rcu(chain, &table->chains, list) {
/* clear every callback argument slot after args[0] */
1130 memset(&cb->args[1], 0,
1131 sizeof(cb->args) - sizeof(cb->args[0]));
1132 if (!nft_is_active(net, chain))
1134 if (nf_tables_fill_chain_info(skb, net,
1135 NETLINK_CB(cb->skb).portid,
1139 table->family, table,
1143 nl_dump_check_consistent(cb, nlmsg_hdr(skb));
/* Handler for chain "get" requests.
 *
 * With NLM_F_DUMP set, a netlink dump driven by nf_tables_dump_chains() is
 * started.  Otherwise the table (NFTA_CHAIN_TABLE) and then the chain
 * (NFTA_CHAIN_NAME) are looked up using the current generation mask; a
 * failed lookup reports the offending attribute through @extack and returns
 * the error code.  On success a reply skb is allocated, filled as an
 * NFT_MSG_NEWCHAIN message and unicast back to the requesting port.
 * NOTE(review): allocation/fill error handling is missing from this
 * listing.
 */
1154 static int nf_tables_getchain(struct net *net, struct sock *nlsk,
1155 struct sk_buff *skb, const struct nlmsghdr *nlh,
1156 const struct nlattr * const nla[],
1157 struct netlink_ext_ack *extack)
1159 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
1160 u8 genmask = nft_genmask_cur(net);
1161 const struct nft_table *table;
1162 const struct nft_chain *chain;
1163 struct sk_buff *skb2;
1164 int family = nfmsg->nfgen_family;
1167 if (nlh->nlmsg_flags & NLM_F_DUMP) {
1168 struct netlink_dump_control c = {
1169 .dump = nf_tables_dump_chains,
1171 return netlink_dump_start(nlsk, skb, nlh, &c);
1174 table = nft_table_lookup(net, nla[NFTA_CHAIN_TABLE], family, genmask);
1175 if (IS_ERR(table)) {
1176 NL_SET_BAD_ATTR(extack, nla[NFTA_CHAIN_TABLE]);
1177 return PTR_ERR(table);
1180 chain = nft_chain_lookup(table, nla[NFTA_CHAIN_NAME], genmask);
1181 if (IS_ERR(chain)) {
1182 NL_SET_BAD_ATTR(extack, nla[NFTA_CHAIN_NAME]);
1183 return PTR_ERR(chain);
1186 skb2 = alloc_skb(NLMSG_GOODSIZE, GFP_KERNEL);
1190 err = nf_tables_fill_chain_info(skb2, net, NETLINK_CB(skb).portid,
1191 nlh->nlmsg_seq, NFT_MSG_NEWCHAIN, 0,
1192 family, table, chain);
1196 return nlmsg_unicast(nlsk, skb2, NETLINK_CB(skb).portid);
/* Netlink attribute policy for the nested counters: packets and bytes are
 * both u64 values.
 */
1203 static const struct nla_policy nft_counter_policy[NFTA_COUNTER_MAX + 1] = {
1204 [NFTA_COUNTER_PACKETS] = { .type = NLA_U64 },
1205 [NFTA_COUNTER_BYTES] = { .type = NLA_U64 },
/* Allocate per-CPU chain statistics and seed them from the nested counter
 * attribute @attr.
 *
 * The nested attribute is parsed against nft_counter_policy; both the byte
 * and the packet counter must be present, otherwise ERR_PTR(-EINVAL) is
 * returned.  A parse error is returned as ERR_PTR(err) and an allocation
 * failure as ERR_PTR(-ENOMEM).  The supplied totals (big-endian 64-bit) are
 * stored into the current CPU's slot only.
 * NOTE(review): the parse-error test, any preemption handling around
 * this_cpu_ptr() and the success return are missing from this listing.
 */
1208 static struct nft_stats __percpu *nft_stats_alloc(const struct nlattr *attr)
1210 struct nlattr *tb[NFTA_COUNTER_MAX+1];
1211 struct nft_stats __percpu *newstats;
1212 struct nft_stats *stats;
1215 err = nla_parse_nested(tb, NFTA_COUNTER_MAX, attr, nft_counter_policy,
1218 return ERR_PTR(err);
1220 if (!tb[NFTA_COUNTER_BYTES] || !tb[NFTA_COUNTER_PACKETS])
1221 return ERR_PTR(-EINVAL);
1223 newstats = netdev_alloc_pcpu_stats(struct nft_stats);
1224 if (newstats == NULL)
1225 return ERR_PTR(-ENOMEM);
1227 /* Restore old counters on this cpu, no problem. Per-cpu statistics
1228 * are not exposed to userspace.
1231 stats = this_cpu_ptr(newstats);
1232 stats->bytes = be64_to_cpu(nla_get_be64(tb[NFTA_COUNTER_BYTES]));
1233 stats->pkts = be64_to_cpu(nla_get_be64(tb[NFTA_COUNTER_PACKETS]));
/* Install @newstats as the statistics of base chain @chain.
 *
 * A NULL @newstats is tested for first (NOTE(review): the statement taken
 * is not visible; presumably an early return).  Two publish paths are
 * visible: one reads the old pointer under the nfnetlink subsystem lock,
 * publishes the new one with rcu_assign_pointer() and frees the old per-CPU
 * area; the other only publishes the new pointer.
 * NOTE(review): the condition choosing between the two paths and any RCU
 * grace-period wait before free_percpu() are missing from this listing.
 */
1239 static void nft_chain_stats_replace(struct nft_base_chain *chain,
1240 struct nft_stats __percpu *newstats)
1242 struct nft_stats __percpu *oldstats;
1244 if (newstats == NULL)
1248 oldstats = nfnl_dereference(chain->stats, NFNL_SUBSYS_NFTABLES);
1249 rcu_assign_pointer(chain->stats, newstats);
1251 free_percpu(oldstats);
1253 rcu_assign_pointer(chain->stats, newstats);
/* Release ctx->chain.  The chain must no longer be in use: a non-zero use
 * count triggers BUG_ON().
 *
 * For base chains, the chain type's optional free() callback is invoked,
 * the reference on the type's owning module is dropped, the per-CPU stats
 * are freed and, if the chain had stats, the nft_counters_enabled static
 * branch is decremented.  The stats pointer is only compared against NULL
 * after free_percpu(); it is not dereferenced.
 * NOTE(review): the freeing of the chain name and structure, and the
 * non-base-chain path, are missing from this listing.
 */
1256 static void nf_tables_chain_destroy(struct nft_ctx *ctx)
1258 struct nft_chain *chain = ctx->chain;
1260 BUG_ON(chain->use > 0);
1262 if (nft_is_base_chain(chain)) {
1263 struct nft_base_chain *basechain = nft_base_chain(chain);
1265 if (basechain->type->free)
1266 basechain->type->free(ctx);
1267 module_put(basechain->type->owner);
1268 free_percpu(basechain->stats);
1269 if (basechain->stats)
1270 static_branch_dec(&nft_counters_enabled);
/* Parsed hook description of a base chain, as produced by
 * nft_chain_parse_hook(): the chain type and, when one was resolved, the
 * network device.
 * NOTE(review): further members (the parser also writes ->num and
 * ->priority) are missing from this listing.
 */
1279 struct nft_chain_hook {
1282 const struct nft_chain_type *type;
1283 struct net_device *dev;
/* Parse the nested NFTA_CHAIN_HOOK attribute into @hook.
 *
 * Hook number and priority are mandatory and are stored in host byte order.
 * The chain type defaults to the family's NFT_CHAIN_T_DEFAULT entry and is
 * replaced by a lookup when NFTA_CHAIN_TYPE is given.  The type must allow
 * the requested hook number (hook_mask), NAT types are tested against
 * priorities at or below NF_IP_PRI_CONNTRACK, and a reference on the type's
 * owning module is taken.  For NFPROTO_NETDEV a device name is required and
 * resolved with __dev_get_by_name(); for other families a device attribute
 * is tested for separately.  Each visible failure after the module
 * reference was taken drops it again with module_put().
 * NOTE(review): the last parameter, the error codes returned by each test,
 * the stores into @hook->type / @hook->dev and the final return are missing
 * from this listing.
 */
1286 static int nft_chain_parse_hook(struct net *net,
1287 const struct nlattr * const nla[],
1288 struct nft_chain_hook *hook, u8 family,
1291 struct nlattr *ha[NFTA_HOOK_MAX + 1];
1292 const struct nft_chain_type *type;
1293 struct net_device *dev;
1296 err = nla_parse_nested(ha, NFTA_HOOK_MAX, nla[NFTA_CHAIN_HOOK],
1297 nft_hook_policy, NULL);
1301 if (ha[NFTA_HOOK_HOOKNUM] == NULL ||
1302 ha[NFTA_HOOK_PRIORITY] == NULL)
1305 hook->num = ntohl(nla_get_be32(ha[NFTA_HOOK_HOOKNUM]));
1306 hook->priority = ntohl(nla_get_be32(ha[NFTA_HOOK_PRIORITY]));
1308 type = chain_type[family][NFT_CHAIN_T_DEFAULT];
1309 if (nla[NFTA_CHAIN_TYPE]) {
1310 type = nf_tables_chain_type_lookup(nla[NFTA_CHAIN_TYPE],
1313 return PTR_ERR(type);
1315 if (!(type->hook_mask & (1 << hook->num)))
1318 if (type->type == NFT_CHAIN_T_NAT &&
1319 hook->priority <= NF_IP_PRI_CONNTRACK)
1322 if (!try_module_get(type->owner))
1328 if (family == NFPROTO_NETDEV) {
1329 char ifname[IFNAMSIZ];
1331 if (!ha[NFTA_HOOK_DEV]) {
1332 module_put(type->owner);
1336 nla_strlcpy(ifname, ha[NFTA_HOOK_DEV], IFNAMSIZ);
1337 dev = __dev_get_by_name(net, ifname);
1339 module_put(type->owner);
1343 } else if (ha[NFTA_HOOK_DEV]) {
1344 module_put(type->owner);
/* Drop the module reference held on the chain type recorded in @hook. */
1351 static void nft_chain_release_hook(struct nft_chain_hook *hook)
1353 module_put(hook->type->owner);
/* Create a new chain in ctx->table.
 *
 * The table's use counter is tested against UINT_MAX first.  When
 * NFTA_CHAIN_HOOK is present a base chain is built: the hook is parsed, the
 * base chain allocated zeroed, the device name copied, optional counters
 * allocated (incrementing the nft_counters_enabled static branch), the
 * chain type's optional init() callback invoked and the hook ops filled in
 * (hook number, priority, hook function, device, and nat_hook for NAT
 * types).  Otherwise a plain chain is allocated.
 *
 * Common tail: the rule list is initialised, a handle is taken from the
 * table, the name is duplicated, the hook is registered, a NEWCHAIN
 * transaction is queued and the chain is appended to table->chains with
 * list_add_tail_rcu().  The visible unwind steps unregister the hook and
 * destroy the chain.
 * NOTE(review): error checks, labels, use-counter updates and return
 * statements are missing from this listing.  The strncpy() of the device
 * name copies up to IFNAMSIZ bytes and does not itself guarantee NUL
 * termination -- worth confirming against the size of dev_name.
 */
1356 static int nf_tables_addchain(struct nft_ctx *ctx, u8 family, u8 genmask,
1357 u8 policy, bool create)
1359 const struct nlattr * const *nla = ctx->nla;
1360 struct nft_table *table = ctx->table;
1361 struct nft_base_chain *basechain;
1362 struct nft_stats __percpu *stats;
1363 struct net *net = ctx->net;
1364 struct nft_chain *chain;
1367 if (table->use == UINT_MAX)
1370 if (nla[NFTA_CHAIN_HOOK]) {
1371 struct nft_chain_hook hook;
1372 struct nf_hook_ops *ops;
1374 err = nft_chain_parse_hook(net, nla, &hook, family, create);
1378 basechain = kzalloc(sizeof(*basechain), GFP_KERNEL);
1379 if (basechain == NULL) {
1380 nft_chain_release_hook(&hook);
1384 if (hook.dev != NULL)
1385 strncpy(basechain->dev_name, hook.dev->name, IFNAMSIZ);
1387 if (nla[NFTA_CHAIN_COUNTERS]) {
1388 stats = nft_stats_alloc(nla[NFTA_CHAIN_COUNTERS]);
1389 if (IS_ERR(stats)) {
1390 nft_chain_release_hook(&hook);
1392 return PTR_ERR(stats);
1394 basechain->stats = stats;
1395 static_branch_inc(&nft_counters_enabled);
1398 basechain->type = hook.type;
1399 if (basechain->type->init)
1400 basechain->type->init(ctx);
1402 chain = &basechain->chain;
1404 ops = &basechain->ops;
1406 ops->hooknum = hook.num;
1407 ops->priority = hook.priority;
1409 ops->hook = hook.type->hooks[ops->hooknum];
1410 ops->dev = hook.dev;
1412 if (basechain->type->type == NFT_CHAIN_T_NAT)
1413 ops->nat_hook = true;
1415 chain->flags |= NFT_BASE_CHAIN;
1416 basechain->policy = policy;
1418 chain = kzalloc(sizeof(*chain), GFP_KERNEL);
1424 INIT_LIST_HEAD(&chain->rules);
1425 chain->handle = nf_tables_alloc_handle(table);
1426 chain->table = table;
1427 chain->name = nla_strdup(nla[NFTA_CHAIN_NAME], GFP_KERNEL);
1433 err = nf_tables_register_hook(net, table, chain);
1437 err = nft_trans_chain_add(ctx, NFT_MSG_NEWCHAIN);
1442 list_add_tail_rcu(&chain->list, &table->chains);
1446 nf_tables_unregister_hook(net, table, chain);
1448 nf_tables_chain_destroy(ctx);
/* Update an existing chain (ctx->chain): counters, policy and/or name.
 *
 * When NFTA_CHAIN_HOOK is supplied, the chain must be a base chain and the
 * parsed hook is compared with the existing one (type, hook number,
 * priority, device); the hook's module reference is released on every
 * visible path.  When both a handle and a name are given, the new name is
 * looked up in the table to detect an existing chain of that name.
 * Counters are only accepted for base chains and are allocated with
 * nft_stats_alloc().
 *
 * A NEWCHAIN transaction flagged as an update is then allocated; it carries
 * the new stats, the policy (or -1 when NFTA_CHAIN_POLICY is absent) and,
 * for a rename, a duplicated copy of the new name.  The transaction is
 * queued on the per-net commit_list.
 * NOTE(review): the last parameter, the error codes returned by each test,
 * the cleanup of @stats / @trans on failure and the return statements are
 * missing from this listing.
 */
1453 static int nf_tables_updchain(struct nft_ctx *ctx, u8 genmask, u8 policy,
1456 const struct nlattr * const *nla = ctx->nla;
1457 struct nft_table *table = ctx->table;
1458 struct nft_chain *chain = ctx->chain;
1459 struct nft_base_chain *basechain;
1460 struct nft_stats *stats = NULL;
1461 struct nft_chain_hook hook;
1462 const struct nlattr *name;
1463 struct nf_hook_ops *ops;
1464 struct nft_trans *trans;
1467 if (nla[NFTA_CHAIN_HOOK]) {
1468 if (!nft_is_base_chain(chain))
1471 err = nft_chain_parse_hook(ctx->net, nla, &hook, ctx->family,
1476 basechain = nft_base_chain(chain);
1477 if (basechain->type != hook.type) {
1478 nft_chain_release_hook(&hook);
1482 ops = &basechain->ops;
1483 if (ops->hooknum != hook.num ||
1484 ops->priority != hook.priority ||
1485 ops->dev != hook.dev) {
1486 nft_chain_release_hook(&hook);
1489 nft_chain_release_hook(&hook);
1492 if (nla[NFTA_CHAIN_HANDLE] &&
1493 nla[NFTA_CHAIN_NAME]) {
1494 struct nft_chain *chain2;
1496 chain2 = nft_chain_lookup(table, nla[NFTA_CHAIN_NAME], genmask);
1497 if (!IS_ERR(chain2))
1501 if (nla[NFTA_CHAIN_COUNTERS]) {
1502 if (!nft_is_base_chain(chain))
1505 stats = nft_stats_alloc(nla[NFTA_CHAIN_COUNTERS]);
1507 return PTR_ERR(stats);
1510 trans = nft_trans_alloc(ctx, NFT_MSG_NEWCHAIN,
1511 sizeof(struct nft_trans_chain));
1512 if (trans == NULL) {
1517 nft_trans_chain_stats(trans) = stats;
1518 nft_trans_chain_update(trans) = true;
1520 if (nla[NFTA_CHAIN_POLICY])
1521 nft_trans_chain_policy(trans) = policy;
1523 nft_trans_chain_policy(trans) = -1;
1525 name = nla[NFTA_CHAIN_NAME];
1526 if (nla[NFTA_CHAIN_HANDLE] && name) {
1527 nft_trans_chain_name(trans) =
1528 nla_strdup(name, GFP_KERNEL);
1529 if (!nft_trans_chain_name(trans)) {
1535 list_add_tail(&trans->list, &ctx->net->nft.commit_list);
/*
 * nf_tables_newchain - netlink handler for a new-chain request.
 *
 * Resolves the table, looks the chain up by handle or by name, reads the
 * optional policy attribute, then dispatches to nf_tables_updchain() when
 * the chain already exists or to nf_tables_addchain() otherwise.
 * Lookups use the next-generation mask (nft_genmask_next()).
 */
1540 static int nf_tables_newchain(struct net *net, struct sock *nlsk,
1541 struct sk_buff *skb, const struct nlmsghdr *nlh,
1542 const struct nlattr * const nla[],
1543 struct netlink_ext_ack *extack)
1545 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
1546 u8 genmask = nft_genmask_next(net);
1547 int family = nfmsg->nfgen_family;
1548 const struct nlattr *attr;
1549 struct nft_table *table;
1550 struct nft_chain *chain;
1551 u8 policy = NF_ACCEPT;
1556 create = nlh->nlmsg_flags & NLM_F_CREATE ? true : false;
/* The table must resolve; on failure the table attribute is reported. */
1558 table = nft_table_lookup(net, nla[NFTA_CHAIN_TABLE], family, genmask);
1559 if (IS_ERR(table)) {
1560 NL_SET_BAD_ATTR(extack, nla[NFTA_CHAIN_TABLE]);
1561 return PTR_ERR(table);
/*
 * 'attr' tracks which attribute identified the chain so that later error
 * reports can point at it: the name by default, the handle when given.
 */
1565 attr = nla[NFTA_CHAIN_NAME];
1567 if (nla[NFTA_CHAIN_HANDLE]) {
1568 handle = be64_to_cpu(nla_get_be64(nla[NFTA_CHAIN_HANDLE]));
1569 chain = nft_chain_lookup_byhandle(table, handle, genmask);
1570 if (IS_ERR(chain)) {
1571 NL_SET_BAD_ATTR(extack, nla[NFTA_CHAIN_HANDLE]);
1572 return PTR_ERR(chain);
1574 attr = nla[NFTA_CHAIN_HANDLE];
/* Name lookup: only errors other than -ENOENT are returned here. */
1576 chain = nft_chain_lookup(table, attr, genmask);
1577 if (IS_ERR(chain)) {
1578 if (PTR_ERR(chain) != -ENOENT) {
1579 NL_SET_BAD_ATTR(extack, attr);
1580 return PTR_ERR(chain);
/*
 * Two policy checks flag the policy attribute as bad: an existing chain
 * that is not a base chain, and a missing chain with no hook attribute.
 */
1586 if (nla[NFTA_CHAIN_POLICY]) {
1587 if (chain != NULL &&
1588 !nft_is_base_chain(chain)) {
1589 NL_SET_BAD_ATTR(extack, nla[NFTA_CHAIN_POLICY]);
1593 if (chain == NULL &&
1594 nla[NFTA_CHAIN_HOOK] == NULL) {
1595 NL_SET_BAD_ATTR(extack, nla[NFTA_CHAIN_POLICY]);
1599 policy = ntohl(nla_get_be32(nla[NFTA_CHAIN_POLICY]));
1609 nft_ctx_init(&ctx, net, skb, nlh, family, table, chain, nla);
/* Existing chain: NLM_F_EXCL and NLM_F_REPLACE are tested before updating. */
1611 if (chain != NULL) {
1612 if (nlh->nlmsg_flags & NLM_F_EXCL) {
1613 NL_SET_BAD_ATTR(extack, attr);
1616 if (nlh->nlmsg_flags & NLM_F_REPLACE)
1619 return nf_tables_updchain(&ctx, genmask, policy, create);
/* No existing chain: create one. */
1622 return nf_tables_addchain(&ctx, family, genmask, policy, create);
/*
 * nf_tables_delchain - netlink handler for a delete-chain request.
 *
 * Resolves the table and then the chain (by handle when the handle
 * attribute is present, by name otherwise). It walks the chain's rules,
 * calling nft_delrule() for rules that pass the nft_is_active_next() test,
 * and finally calls nft_delchain(). An NLM_F_NONREC test precedes the walk;
 * its second operand is not visible in this listing.
 */
1625 static int nf_tables_delchain(struct net *net, struct sock *nlsk,
1626 struct sk_buff *skb, const struct nlmsghdr *nlh,
1627 const struct nlattr * const nla[],
1628 struct netlink_ext_ack *extack)
1630 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
1631 u8 genmask = nft_genmask_next(net);
1632 int family = nfmsg->nfgen_family;
1633 const struct nlattr *attr;
1634 struct nft_table *table;
1635 struct nft_chain *chain;
1636 struct nft_rule *rule;
1642 table = nft_table_lookup(net, nla[NFTA_CHAIN_TABLE], family, genmask);
1643 if (IS_ERR(table)) {
1644 NL_SET_BAD_ATTR(extack, nla[NFTA_CHAIN_TABLE]);
1645 return PTR_ERR(table);
/* 'attr' remembers the identifying attribute for error reporting. */
1648 if (nla[NFTA_CHAIN_HANDLE]) {
1649 attr = nla[NFTA_CHAIN_HANDLE];
1650 handle = be64_to_cpu(nla_get_be64(attr));
1651 chain = nft_chain_lookup_byhandle(table, handle, genmask);
1653 attr = nla[NFTA_CHAIN_NAME];
1654 chain = nft_chain_lookup(table, attr, genmask);
1656 if (IS_ERR(chain)) {
1657 NL_SET_BAD_ATTR(extack, attr);
1658 return PTR_ERR(chain);
1661 if (nlh->nlmsg_flags & NLM_F_NONREC &&
1665 nft_ctx_init(&ctx, net, skb, nlh, family, table, chain, nla);
/* Queue deletion of the chain's rules before deleting the chain itself. */
1668 list_for_each_entry(rule, &chain->rules, list) {
1669 if (!nft_is_active_next(net, rule))
1673 err = nft_delrule(&ctx, rule);
1678 /* There are rules and elements that are still holding references to us,
1679 * we cannot do a recursive removal in this case.
1682 NL_SET_BAD_ATTR(extack, attr);
1686 return nft_delchain(&ctx);
1694 * nft_register_expr - register nf_tables expr type
1697 * Registers the expr type for use with nf_tables. Returns zero on
1698 * success or a negative errno code otherwise.
/*
 * Inserts @type into nf_tables_expressions while holding the
 * NFNL_SUBSYS_NFTABLES nfnetlink lock. Types with family NFPROTO_UNSPEC
 * are appended with list_add_tail_rcu(); the other visible insertion uses
 * list_add_rcu(), which adds at the head, so family-specific types are
 * found before generic ones by a front-to-back walk.
 */
1700 int nft_register_expr(struct nft_expr_type *type)
1702 nfnl_lock(NFNL_SUBSYS_NFTABLES);
1703 if (type->family == NFPROTO_UNSPEC)
1704 list_add_tail_rcu(&type->list, &nf_tables_expressions);
1706 list_add_rcu(&type->list, &nf_tables_expressions);
1707 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
1710 EXPORT_SYMBOL_GPL(nft_register_expr);
1713 * nft_unregister_expr - unregister nf_tables expr type
1716 * Unregisters the expr type for use with nf_tables.
/*
 * Removes @type from its list with list_del_rcu() while holding the
 * NFNL_SUBSYS_NFTABLES nfnetlink lock.
 */
1718 void nft_unregister_expr(struct nft_expr_type *type)
1720 nfnl_lock(NFNL_SUBSYS_NFTABLES);
1721 list_del_rcu(&type->list);
1722 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
1724 EXPORT_SYMBOL_GPL(nft_unregister_expr);
/*
 * Walks nf_tables_expressions looking for a type whose name equals the
 * netlink string attribute and whose family is either zero (matches any
 * family) or equal to @family. The return statements are not visible in
 * this listing.
 */
1726 static const struct nft_expr_type *__nft_expr_type_get(u8 family,
1729 const struct nft_expr_type *type;
1731 list_for_each_entry(type, &nf_tables_expressions, list) {
1732 if (!nla_strcmp(nla, type->name) &&
1733 (!type->family || type->family == family))
/*
 * Looks up an expression type by name and takes a reference on its owning
 * module. Visible error results are ERR_PTR(-EINVAL), ERR_PTR(-EAGAIN) and
 * ERR_PTR(-ENOENT).
 *
 * With CONFIG_MODULES, a failed lookup drops the nfnetlink lock, requests
 * the family-specific module alias and then the generic one, and retakes
 * the lock each time. If the type is present after a module request,
 * -EAGAIN is returned rather than the type -- presumably so the caller
 * restarts after the lock was dropped; TODO confirm against the caller.
 */
1739 static const struct nft_expr_type *nft_expr_type_get(u8 family,
1742 const struct nft_expr_type *type;
1745 return ERR_PTR(-EINVAL);
1747 type = __nft_expr_type_get(family, nla);
1748 if (type != NULL && try_module_get(type->owner))
1751 #ifdef CONFIG_MODULES
/* First attempt: family-specific alias "nft-expr-<family>-<name>". */
1753 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
1754 request_module("nft-expr-%u-%.*s", family,
1755 nla_len(nla), (char *)nla_data(nla));
1756 nfnl_lock(NFNL_SUBSYS_NFTABLES);
1757 if (__nft_expr_type_get(family, nla))
1758 return ERR_PTR(-EAGAIN);
/* Second attempt: family-independent alias "nft-expr-<name>". */
1760 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
1761 request_module("nft-expr-%.*s",
1762 nla_len(nla), (char *)nla_data(nla));
1763 nfnl_lock(NFNL_SUBSYS_NFTABLES);
1764 if (__nft_expr_type_get(family, nla))
1765 return ERR_PTR(-EAGAIN);
1768 return ERR_PTR(-ENOENT);
/*
 * Netlink attribute policy for a single expression: a string name plus a
 * nested, type-specific data attribute.
 */
1771 static const struct nla_policy nft_expr_policy[NFTA_EXPR_MAX + 1] = {
1772 [NFTA_EXPR_NAME] = { .type = NLA_STRING },
1773 [NFTA_EXPR_DATA] = { .type = NLA_NESTED },
/*
 * Emits one expression into @skb: its type name as NFTA_EXPR_NAME and,
 * when the ops provide a dump callback, the callback's output nested
 * inside NFTA_EXPR_DATA. Every visible failure jumps to nla_put_failure;
 * that label and the return values are not visible in this listing.
 */
1776 static int nf_tables_fill_expr_info(struct sk_buff *skb,
1777 const struct nft_expr *expr)
1779 if (nla_put_string(skb, NFTA_EXPR_NAME, expr->ops->type->name))
1780 goto nla_put_failure;
1782 if (expr->ops->dump) {
1783 struct nlattr *data = nla_nest_start(skb, NFTA_EXPR_DATA);
1785 goto nla_put_failure;
1786 if (expr->ops->dump(skb, expr) < 0)
1787 goto nla_put_failure;
1788 nla_nest_end(skb, data);
/*
 * Wraps nf_tables_fill_expr_info() in a nested attribute of type @attr.
 * A negative result from the fill helper jumps to nla_put_failure; the
 * label body is not visible in this listing.
 */
1797 int nft_expr_dump(struct sk_buff *skb, unsigned int attr,
1798 const struct nft_expr *expr)
1800 struct nlattr *nest;
1802 nest = nla_nest_start(skb, attr);
1804 goto nla_put_failure;
1805 if (nf_tables_fill_expr_info(skb, expr) < 0)
1806 goto nla_put_failure;
1807 nla_nest_end(skb, nest);
/*
 * Result of parsing one expression attribute: the selected ops and the
 * expression's own parsed attribute table (filled by nf_tables_expr_parse,
 * consumed by nf_tables_newexpr).
 */
1814 struct nft_expr_info {
1815 const struct nft_expr_ops *ops;
1816 struct nlattr *tb[NFT_EXPR_MAXATTR + 1];
/*
 * Parses one nested expression attribute into @info.
 *
 * The outer attribute is parsed with nft_expr_policy and the type is
 * resolved by name through nft_expr_type_get(), which takes a module
 * reference. The type-specific data is then parsed into info->tb with the
 * type's own policy; a memset() that zeroes info->tb is also visible,
 * presumably for the no-data case. If the type has a select_ops callback
 * it chooses the ops. A module_put() on the type owner is visible near the
 * end, presumably on the error path -- TODO confirm.
 */
1819 static int nf_tables_expr_parse(const struct nft_ctx *ctx,
1820 const struct nlattr *nla,
1821 struct nft_expr_info *info)
1823 const struct nft_expr_type *type;
1824 const struct nft_expr_ops *ops;
1825 struct nlattr *tb[NFTA_EXPR_MAX + 1];
1828 err = nla_parse_nested(tb, NFTA_EXPR_MAX, nla, nft_expr_policy, NULL);
1832 type = nft_expr_type_get(ctx->family, tb[NFTA_EXPR_NAME]);
1834 return PTR_ERR(type);
1836 if (tb[NFTA_EXPR_DATA]) {
1837 err = nla_parse_nested(info->tb, type->maxattr,
1838 tb[NFTA_EXPR_DATA], type->policy, NULL);
1842 memset(info->tb, 0, sizeof(info->tb[0]) * (type->maxattr + 1));
1844 if (type->select_ops != NULL) {
1845 ops = type->select_ops(ctx,
1846 (const struct nlattr * const *)info->tb);
1858 module_put(type->owner);
/*
 * Initialises @expr from parsed @info by calling the ops' init callback
 * and then, if present, the validate callback. A call to ops->destroy is
 * visible afterwards, presumably the cleanup for a validation failure --
 * TODO confirm against the elided control flow.
 */
1862 static int nf_tables_newexpr(const struct nft_ctx *ctx,
1863 const struct nft_expr_info *info,
1864 struct nft_expr *expr)
1866 const struct nft_expr_ops *ops = info->ops;
1871 err = ops->init(ctx, expr, (const struct nlattr **)info->tb);
1876 if (ops->validate) {
1877 const struct nft_data *data = NULL;
1879 err = ops->validate(ctx, expr, &data);
1888 ops->destroy(ctx, expr);
/*
 * Tears down one expression: calls the optional destroy callback, then
 * drops the module reference on the expression type's owner.
 */
1894 static void nf_tables_expr_destroy(const struct nft_ctx *ctx,
1895 struct nft_expr *expr)
1897 if (expr->ops->destroy)
1898 expr->ops->destroy(ctx, expr);
1899 module_put(expr->ops->type->owner);
/*
 * Builds a standalone expression from a netlink attribute: parse, allocate
 * info.ops->size zeroed bytes, then initialise with nf_tables_newexpr().
 * Failure is reported as ERR_PTR(err). The visible module_put() drops the
 * type reference taken during parsing, presumably on an error path.
 */
1902 struct nft_expr *nft_expr_init(const struct nft_ctx *ctx,
1903 const struct nlattr *nla)
1905 struct nft_expr_info info;
1906 struct nft_expr *expr;
1909 err = nf_tables_expr_parse(ctx, nla, &info);
1914 expr = kzalloc(info.ops->size, GFP_KERNEL);
1918 err = nf_tables_newexpr(ctx, &info, expr);
1926 module_put(info.ops->type->owner);
1928 return ERR_PTR(err);
/*
 * Public counterpart of nf_tables_expr_destroy(); any further statements
 * (e.g. freeing @expr) are not visible in this listing.
 */
1931 void nft_expr_destroy(const struct nft_ctx *ctx, struct nft_expr *expr)
1933 nf_tables_expr_destroy(ctx, expr);
/*
 * Finds the rule in @chain whose handle equals the requested handle.
 * Returns ERR_PTR(-ENOENT) when the walk finds no match.
 */
1941 static struct nft_rule *__nft_rule_lookup(const struct nft_chain *chain,
1944 struct nft_rule *rule;
1946 // FIXME: linear walk over chain->rules on every handle lookup
1947 list_for_each_entry(rule, &chain->rules, list) {
1948 if (handle == rule->handle)
1952 return ERR_PTR(-ENOENT);
/*
 * Attribute-based wrapper around __nft_rule_lookup(): the handle is read
 * from @nla as a big-endian 64-bit value. ERR_PTR(-EINVAL) is returned by
 * a guard whose condition is not visible in this listing.
 */
1955 static struct nft_rule *nft_rule_lookup(const struct nft_chain *chain,
1956 const struct nlattr *nla)
1959 return ERR_PTR(-EINVAL);
1961 return __nft_rule_lookup(chain, be64_to_cpu(nla_get_be64(nla)));
/*
 * Netlink attribute policy for rule messages. Table and chain names are
 * length-limited strings, handle and position are 64-bit values, and user
 * data is binary capped at NFT_USERDATA_MAXLEN.
 */
1964 static const struct nla_policy nft_rule_policy[NFTA_RULE_MAX + 1] = {
1965 [NFTA_RULE_TABLE] = { .type = NLA_STRING,
1966 .len = NFT_TABLE_MAXNAMELEN - 1 },
1967 [NFTA_RULE_CHAIN] = { .type = NLA_STRING,
1968 .len = NFT_CHAIN_MAXNAMELEN - 1 },
1969 [NFTA_RULE_HANDLE] = { .type = NLA_U64 },
1970 [NFTA_RULE_EXPRESSIONS] = { .type = NLA_NESTED },
1971 [NFTA_RULE_COMPAT] = { .type = NLA_NESTED },
1972 [NFTA_RULE_POSITION] = { .type = NLA_U64 },
1973 [NFTA_RULE_USERDATA] = { .type = NLA_BINARY,
1974 .len = NFT_USERDATA_MAXLEN },
1975 [NFTA_RULE_ID] = { .type = NLA_U32 },
/*
 * Serialises one rule into a netlink message in @skb.
 *
 * The message carries an nfgenmsg header, the table name, chain name and
 * rule handle, optionally the previous rule's handle as the position, the
 * nested list of expressions, and the rule's user data. Every visible
 * failure jumps to nla_put_failure; nlmsg_trim() is visible there.
 */
1978 static int nf_tables_fill_rule_info(struct sk_buff *skb, struct net *net,
1979 u32 portid, u32 seq, int event,
1980 u32 flags, int family,
1981 const struct nft_table *table,
1982 const struct nft_chain *chain,
1983 const struct nft_rule *rule)
1985 struct nlmsghdr *nlh;
1986 struct nfgenmsg *nfmsg;
1987 const struct nft_expr *expr, *next;
1988 struct nlattr *list;
1989 const struct nft_rule *prule;
1990 u16 type = nfnl_msg_type(NFNL_SUBSYS_NFTABLES, event);
1992 nlh = nlmsg_put(skb, portid, seq, type, sizeof(struct nfgenmsg), flags);
1994 goto nla_put_failure;
/* res_id carries the low 16 bits of the per-net base sequence. */
1996 nfmsg = nlmsg_data(nlh);
1997 nfmsg->nfgen_family = family;
1998 nfmsg->version = NFNETLINK_V0;
1999 nfmsg->res_id = htons(net->nft.base_seq & 0xffff);
2001 if (nla_put_string(skb, NFTA_RULE_TABLE, table->name))
2002 goto nla_put_failure;
2003 if (nla_put_string(skb, NFTA_RULE_CHAIN, chain->name))
2004 goto nla_put_failure;
2005 if (nla_put_be64(skb, NFTA_RULE_HANDLE, cpu_to_be64(rule->handle),
2007 goto nla_put_failure;
/*
 * Position is the handle of the preceding rule; it is skipped for delete
 * events and when this rule is first in the chain.
 */
2009 if ((event != NFT_MSG_DELRULE) && (rule->list.prev != &chain->rules)) {
2010 prule = list_prev_entry(rule, list);
2011 if (nla_put_be64(skb, NFTA_RULE_POSITION,
2012 cpu_to_be64(prule->handle),
2014 goto nla_put_failure;
2017 list = nla_nest_start(skb, NFTA_RULE_EXPRESSIONS);
2019 goto nla_put_failure;
2020 nft_rule_for_each_expr(expr, next, rule) {
2021 if (nft_expr_dump(skb, NFTA_LIST_ELEM, expr) < 0)
2022 goto nla_put_failure;
2024 nla_nest_end(skb, list);
/* The emitted user-data length is the stored udata->len plus one. */
2027 struct nft_userdata *udata = nft_userdata(rule);
2028 if (nla_put(skb, NFTA_RULE_USERDATA, udata->len + 1,
2030 goto nla_put_failure;
2033 nlmsg_end(skb, nlh);
2037 nlmsg_trim(skb, nlh);
/*
 * Sends a rule event notification to the NFNLGRP_NFTABLES group.
 *
 * A listener check via nfnetlink_has_listeners() is visible up front. The
 * message is built with nf_tables_fill_rule_info() and sent with
 * nfnetlink_send(). nfnetlink_set_err() with -ENOBUFS is the visible
 * failure report, presumably reached on allocation or fill failure.
 */
2041 static void nf_tables_rule_notify(const struct nft_ctx *ctx,
2042 const struct nft_rule *rule, int event)
2044 struct sk_buff *skb;
2048 !nfnetlink_has_listeners(ctx->net, NFNLGRP_NFTABLES))
2051 skb = nlmsg_new(NLMSG_GOODSIZE, GFP_KERNEL);
2055 err = nf_tables_fill_rule_info(skb, ctx->net, ctx->portid, ctx->seq,
2056 event, 0, ctx->family, ctx->table,
2063 nfnetlink_send(skb, ctx->net, ctx->portid, NFNLGRP_NFTABLES,
2064 ctx->report, GFP_KERNEL);
2067 nfnetlink_set_err(ctx->net, ctx->portid, NFNLGRP_NFTABLES, -ENOBUFS);
/*
 * Optional filter for a rule dump. nf_tables_dump_rules() compares its
 * ->table and ->chain strings against table and chain names. The member
 * declarations are not visible in this listing.
 */
2070 struct nft_rule_dump_ctx {
/*
 * Netlink dump callback that emits every active rule.
 *
 * Tables are filtered by family (NFPROTO_UNSPEC matches all) and, when a
 * dump context is attached, by table and chain name. cb->args[0] is read
 * as the resume index (s_idx); the skip/advance statements are not visible
 * in this listing. cb->seq is set from the per-net base sequence and
 * nl_dump_check_consistent() is called on emitted messages.
 */
2075 static int nf_tables_dump_rules(struct sk_buff *skb,
2076 struct netlink_callback *cb)
2078 const struct nfgenmsg *nfmsg = nlmsg_data(cb->nlh);
2079 const struct nft_rule_dump_ctx *ctx = cb->data;
2080 const struct nft_table *table;
2081 const struct nft_chain *chain;
2082 const struct nft_rule *rule;
2083 unsigned int idx = 0, s_idx = cb->args[0];
2084 struct net *net = sock_net(skb->sk);
2085 int family = nfmsg->nfgen_family;
2088 cb->seq = net->nft.base_seq;
2090 list_for_each_entry_rcu(table, &net->nft.tables, list) {
2091 if (family != NFPROTO_UNSPEC && family != table->family)
2094 if (ctx && ctx->table && strcmp(ctx->table, table->name) != 0)
2097 list_for_each_entry_rcu(chain, &table->chains, list) {
2098 if (ctx && ctx->chain &&
2099 strcmp(ctx->chain, chain->name) != 0)
2102 list_for_each_entry_rcu(rule, &chain->rules, list) {
2103 if (!nft_is_active(net, rule))
/* Clears every cb->args slot after the first. */
2108 memset(&cb->args[1], 0,
2109 sizeof(cb->args) - sizeof(cb->args[0]));
2110 if (nf_tables_fill_rule_info(skb, net, NETLINK_CB(cb->skb).portid,
2113 NLM_F_MULTI | NLM_F_APPEND,
2115 table, chain, rule) < 0)
2118 nl_dump_check_consistent(cb, nlmsg_hdr(skb));
/*
 * Dump completion callback for rule dumps; picks up the dump context from
 * cb->data. The cleanup statements are not visible in this listing.
 */
2131 static int nf_tables_dump_rules_done(struct netlink_callback *cb)
2133 struct nft_rule_dump_ctx *ctx = cb->data;
/*
 * nf_tables_getrule - netlink handler for a get-rule request.
 *
 * With NLM_F_DUMP it starts a netlink dump, attaching a heap-allocated
 * filter context when a table or chain attribute is present. Otherwise it
 * resolves table, chain and rule against the current generation
 * (nft_genmask_cur()), builds a single NFT_MSG_NEWRULE message and
 * unicasts it to the requester.
 */
2143 static int nf_tables_getrule(struct net *net, struct sock *nlsk,
2144 struct sk_buff *skb, const struct nlmsghdr *nlh,
2145 const struct nlattr * const nla[],
2146 struct netlink_ext_ack *extack)
2148 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
2149 u8 genmask = nft_genmask_cur(net);
2150 const struct nft_table *table;
2151 const struct nft_chain *chain;
2152 const struct nft_rule *rule;
2153 struct sk_buff *skb2;
2154 int family = nfmsg->nfgen_family;
2157 if (nlh->nlmsg_flags & NLM_F_DUMP) {
2158 struct netlink_dump_control c = {
2159 .dump = nf_tables_dump_rules,
2160 .done = nf_tables_dump_rules_done,
/* The filter strings are duplicated from the request attributes. */
2163 if (nla[NFTA_RULE_TABLE] || nla[NFTA_RULE_CHAIN]) {
2164 struct nft_rule_dump_ctx *ctx;
2166 ctx = kzalloc(sizeof(*ctx), GFP_KERNEL);
2170 if (nla[NFTA_RULE_TABLE]) {
2171 ctx->table = nla_strdup(nla[NFTA_RULE_TABLE],
2178 if (nla[NFTA_RULE_CHAIN]) {
2179 ctx->chain = nla_strdup(nla[NFTA_RULE_CHAIN],
2190 return netlink_dump_start(nlsk, skb, nlh, &c);
/* Single-rule path: each failed lookup reports the offending attribute. */
2193 table = nft_table_lookup(net, nla[NFTA_RULE_TABLE], family, genmask);
2194 if (IS_ERR(table)) {
2195 NL_SET_BAD_ATTR(extack, nla[NFTA_RULE_TABLE]);
2196 return PTR_ERR(table);
2199 chain = nft_chain_lookup(table, nla[NFTA_RULE_CHAIN], genmask);
2200 if (IS_ERR(chain)) {
2201 NL_SET_BAD_ATTR(extack, nla[NFTA_RULE_CHAIN]);
2202 return PTR_ERR(chain);
2205 rule = nft_rule_lookup(chain, nla[NFTA_RULE_HANDLE]);
2207 NL_SET_BAD_ATTR(extack, nla[NFTA_RULE_HANDLE]);
2208 return PTR_ERR(rule);
2211 skb2 = alloc_skb(NLMSG_GOODSIZE, GFP_KERNEL);
2215 err = nf_tables_fill_rule_info(skb2, net, NETLINK_CB(skb).portid,
2216 nlh->nlmsg_seq, NFT_MSG_NEWRULE, 0,
2217 family, table, chain, rule);
2221 return nlmsg_unicast(nlsk, skb2, NETLINK_CB(skb).portid);
/*
 * Destroys the expressions of @rule in order. The walk stops at the last
 * expression or at the first one whose ->ops is unset, which covers rules
 * that were only partially initialised. Releasing the rule memory itself
 * is not visible in this listing.
 */
2228 static void nf_tables_rule_destroy(const struct nft_ctx *ctx,
2229 struct nft_rule *rule)
2231 struct nft_expr *expr;
2234 * Careful: some expressions might not be initialized in case this
2235 * is called on error from nf_tables_newrule().
2237 expr = nft_expr_first(rule);
2238 while (expr != nft_expr_last(rule) && expr->ops) {
2239 nf_tables_expr_destroy(ctx, expr);
2240 expr = nft_expr_next(expr);
/*
 * Upper bound on expressions per rule, and the file-scope scratch array
 * nf_tables_newrule() indexes while parsing them. Where 'info' is
 * allocated is not visible in this listing.
 */
2245 #define NFT_RULE_MAXEXPRS 128
2247 static struct nft_expr_info *info;
/*
 * nf_tables_newrule - netlink handler for a new-rule request.
 *
 * Visible flow: resolve table and chain; look up the existing rule when a
 * handle is given, otherwise allocate a fresh handle; resolve the optional
 * position rule; parse every expression into the file-scope 'info' array
 * and sum their sizes; allocate the rule with room for expressions and
 * user data; initialise the expressions; link the rule into the chain
 * according to the REPLACE/APPEND flags and position; record an
 * NFT_MSG_NEWRULE transaction.
 *
 * NOTE(review): many short lines (else, goto, return) are absent from this
 * listing, so branch structure is partly inferred.
 */
2249 static int nf_tables_newrule(struct net *net, struct sock *nlsk,
2250 struct sk_buff *skb, const struct nlmsghdr *nlh,
2251 const struct nlattr * const nla[],
2252 struct netlink_ext_ack *extack)
2254 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
2255 u8 genmask = nft_genmask_next(net);
2256 int family = nfmsg->nfgen_family;
2257 struct nft_table *table;
2258 struct nft_chain *chain;
2259 struct nft_rule *rule, *old_rule = NULL;
2260 struct nft_userdata *udata;
2261 struct nft_trans *trans = NULL;
2262 struct nft_expr *expr;
2265 unsigned int size, i, n, ulen = 0, usize = 0;
2268 u64 handle, pos_handle;
2270 create = nlh->nlmsg_flags & NLM_F_CREATE ? true : false;
2272 table = nft_table_lookup(net, nla[NFTA_RULE_TABLE], family, genmask);
2273 if (IS_ERR(table)) {
2274 NL_SET_BAD_ATTR(extack, nla[NFTA_RULE_TABLE]);
2275 return PTR_ERR(table);
2278 chain = nft_chain_lookup(table, nla[NFTA_RULE_CHAIN], genmask);
2279 if (IS_ERR(chain)) {
2280 NL_SET_BAD_ATTR(extack, nla[NFTA_RULE_CHAIN]);
2281 return PTR_ERR(chain);
/* A handle names an existing rule; EXCL and REPLACE are then tested. */
2284 if (nla[NFTA_RULE_HANDLE]) {
2285 handle = be64_to_cpu(nla_get_be64(nla[NFTA_RULE_HANDLE]));
2286 rule = __nft_rule_lookup(chain, handle);
2288 NL_SET_BAD_ATTR(extack, nla[NFTA_RULE_HANDLE]);
2289 return PTR_ERR(rule);
2292 if (nlh->nlmsg_flags & NLM_F_EXCL) {
2293 NL_SET_BAD_ATTR(extack, nla[NFTA_RULE_HANDLE]);
2296 if (nlh->nlmsg_flags & NLM_F_REPLACE)
/* No handle: the create/REPLACE flags are tested, then a handle allocated. */
2301 if (!create || nlh->nlmsg_flags & NLM_F_REPLACE)
2303 handle = nf_tables_alloc_handle(table);
/* Tests the chain's use counter against UINT_MAX. */
2305 if (chain->use == UINT_MAX)
/* A position attribute names the rule to insert relative to. */
2309 if (nla[NFTA_RULE_POSITION]) {
2310 if (!(nlh->nlmsg_flags & NLM_F_CREATE))
2313 pos_handle = be64_to_cpu(nla_get_be64(nla[NFTA_RULE_POSITION]));
2314 old_rule = __nft_rule_lookup(chain, pos_handle);
2315 if (IS_ERR(old_rule)) {
2316 NL_SET_BAD_ATTR(extack, nla[NFTA_RULE_POSITION]);
2317 return PTR_ERR(old_rule);
2321 nft_ctx_init(&ctx, net, skb, nlh, family, table, chain, nla);
/*
 * Parse each list element into info[n], bounded by NFT_RULE_MAXEXPRS, and
 * accumulate the total expression size.
 */
2325 if (nla[NFTA_RULE_EXPRESSIONS]) {
2326 nla_for_each_nested(tmp, nla[NFTA_RULE_EXPRESSIONS], rem) {
2328 if (nla_type(tmp) != NFTA_LIST_ELEM)
2330 if (n == NFT_RULE_MAXEXPRS)
2332 err = nf_tables_expr_parse(&ctx, tmp, &info[n]);
2335 size += info[n].ops->size;
2339 /* Check for overflow of dlen field */
2341 if (size >= 1 << 12)
2344 if (nla[NFTA_RULE_USERDATA]) {
2345 ulen = nla_len(nla[NFTA_RULE_USERDATA]);
2347 usize = sizeof(struct nft_userdata) + ulen;
/* One allocation holds the rule header, the expressions and user data. */
2351 rule = kzalloc(sizeof(*rule) + size + usize, GFP_KERNEL);
2355 nft_activate_next(net, rule);
2357 rule->handle = handle;
2359 rule->udata = ulen ? 1 : 0;
/* The user-data length is stored as ulen - 1. */
2362 udata = nft_userdata(rule);
2363 udata->len = ulen - 1;
2364 nla_memcpy(udata->data, nla[NFTA_RULE_USERDATA], ulen);
/* Initialise the expressions in place, one after another. */
2367 expr = nft_expr_first(rule);
2368 for (i = 0; i < n; i++) {
2369 err = nf_tables_newexpr(&ctx, &info[i], expr);
2373 expr = nft_expr_next(expr);
/*
 * Replace: when the old rule is active in the next generation, a DELRULE
 * transaction is queued, the old rule is deactivated, and the new rule is
 * linked directly before it.
 */
2376 if (nlh->nlmsg_flags & NLM_F_REPLACE) {
2377 if (nft_is_active_next(net, old_rule)) {
2378 trans = nft_trans_rule_add(&ctx, NFT_MSG_DELRULE,
2380 if (trans == NULL) {
2384 nft_deactivate_next(net, old_rule);
2386 list_add_tail_rcu(&rule->list, &old_rule->list);
/*
 * Append: after the position rule or at the chain tail. The remaining two
 * insertions place the rule before the position rule or at the chain head.
 */
2391 } else if (nlh->nlmsg_flags & NLM_F_APPEND)
2393 list_add_rcu(&rule->list, &old_rule->list);
2395 list_add_tail_rcu(&rule->list, &chain->rules);
2398 list_add_tail_rcu(&rule->list, &old_rule->list);
2400 list_add_rcu(&rule->list, &chain->rules);
2403 if (nft_trans_rule_add(&ctx, NFT_MSG_NEWRULE, rule) == NULL) {
/*
 * Cleanup calls visible below: unlink the rule, destroy it, and drop the
 * module reference for every parsed expression type.
 */
2411 list_del_rcu(&rule->list);
2413 nf_tables_rule_destroy(&ctx, rule);
2415 for (i = 0; i < n; i++) {
2416 if (info[i].ops != NULL)
2417 module_put(info[i].ops->type->owner);
/*
 * Finds a rule added earlier in the pending batch: scans the per-net
 * commit list for an NFT_MSG_NEWRULE transaction whose rule id equals the
 * 32-bit id in @nla. Returns ERR_PTR(-ENOENT) when none matches.
 */
2422 static struct nft_rule *nft_rule_lookup_byid(const struct net *net,
2423 const struct nlattr *nla)
2425 u32 id = ntohl(nla_get_be32(nla));
2426 struct nft_trans *trans;
2428 list_for_each_entry(trans, &net->nft.commit_list, list) {
2429 struct nft_rule *rule = nft_trans_rule(trans);
2431 if (trans->msg_type == NFT_MSG_NEWRULE &&
2432 id == nft_trans_rule_id(trans))
2435 return ERR_PTR(-ENOENT);
/*
 * nf_tables_delrule - netlink handler for a delete-rule request.
 *
 * The table is mandatory and the chain optional. Visible deletion forms:
 * a single rule identified by handle, a single rule identified by batch
 * id, all rules of one chain (nft_delrule_by_chain()), and a walk over
 * every chain of the table that passes nft_is_active_next(). The
 * conditions selecting between these forms are partly elided in this
 * listing.
 */
2438 static int nf_tables_delrule(struct net *net, struct sock *nlsk,
2439 struct sk_buff *skb, const struct nlmsghdr *nlh,
2440 const struct nlattr * const nla[],
2441 struct netlink_ext_ack *extack)
2443 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
2444 u8 genmask = nft_genmask_next(net);
2445 struct nft_table *table;
2446 struct nft_chain *chain = NULL;
2447 struct nft_rule *rule;
2448 int family = nfmsg->nfgen_family, err = 0;
2451 table = nft_table_lookup(net, nla[NFTA_RULE_TABLE], family, genmask);
2452 if (IS_ERR(table)) {
2453 NL_SET_BAD_ATTR(extack, nla[NFTA_RULE_TABLE]);
2454 return PTR_ERR(table);
2457 if (nla[NFTA_RULE_CHAIN]) {
2458 chain = nft_chain_lookup(table, nla[NFTA_RULE_CHAIN], genmask);
2459 if (IS_ERR(chain)) {
2460 NL_SET_BAD_ATTR(extack, nla[NFTA_RULE_CHAIN]);
2461 return PTR_ERR(chain);
2465 nft_ctx_init(&ctx, net, skb, nlh, family, table, chain, nla);
/* Delete by handle. */
2468 if (nla[NFTA_RULE_HANDLE]) {
2469 rule = nft_rule_lookup(chain, nla[NFTA_RULE_HANDLE]);
2471 NL_SET_BAD_ATTR(extack, nla[NFTA_RULE_HANDLE]);
2472 return PTR_ERR(rule);
2475 err = nft_delrule(&ctx, rule);
/* Delete by the id of a rule added earlier in the batch. */
2476 } else if (nla[NFTA_RULE_ID]) {
2477 rule = nft_rule_lookup_byid(net, nla[NFTA_RULE_ID]);
2479 NL_SET_BAD_ATTR(extack, nla[NFTA_RULE_ID]);
2480 return PTR_ERR(rule);
2483 err = nft_delrule(&ctx, rule);
/* Delete every rule of the selected chain. */
2485 err = nft_delrule_by_chain(&ctx);
/* Walk the chains of the table. */
2488 list_for_each_entry(chain, &table->chains, list) {
2489 if (!nft_is_active_next(net, chain))
2493 err = nft_delrule_by_chain(&ctx);
/* Registered set backend types; see nft_register_set(). */
2506 static LIST_HEAD(nf_tables_set_types);
/*
 * Appends @type to nf_tables_set_types while holding the
 * NFNL_SUBSYS_NFTABLES nfnetlink lock.
 */
2508 int nft_register_set(struct nft_set_type *type)
2510 nfnl_lock(NFNL_SUBSYS_NFTABLES);
2511 list_add_tail_rcu(&type->list, &nf_tables_set_types);
2512 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
2515 EXPORT_SYMBOL_GPL(nft_register_set);
/*
 * Removes @type from the set type list with list_del_rcu() while holding
 * the NFNL_SUBSYS_NFTABLES nfnetlink lock.
 */
2517 void nft_unregister_set(struct nft_set_type *type)
2519 nfnl_lock(NFNL_SUBSYS_NFTABLES);
2520 list_del_rcu(&type->list);
2521 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
2523 EXPORT_SYMBOL_GPL(nft_unregister_set);
/*
 * Set flags that nft_set_ops_candidate() requires a backend to support.
 * The final continuation line of this macro is not visible in this listing.
 */
2525 #define NFT_SET_FEATURES (NFT_SET_INTERVAL | NFT_SET_MAP | \
2526 NFT_SET_TIMEOUT | NFT_SET_OBJECT | \
/*
 * A set type is a candidate when it supports every feature flag requested:
 * the requested flags masked by the type's features must equal the
 * requested flags masked by NFT_SET_FEATURES.
 */
2529 static bool nft_set_ops_candidate(const struct nft_set_type *type, u32 flags)
2531 return (flags & type->features) == (flags & NFT_SET_FEATURES);
2535 * Select a set implementation based on the data characteristics and the
2536 * given policy. The total memory use might not be known if no size is
2537 * given, in that case the amount of memory per element is used.
/*
 * Chooses the best set backend for a new set.
 *
 * With CONFIG_MODULES and no backend registered, the "nft-set" module is
 * requested with the nfnetlink lock dropped; if backends exist afterwards
 * ERR_PTR(-EAGAIN) is returned. Each registered type is then filtered by
 * nft_set_ops_candidate() and its estimate callback, and compared with the
 * best so far: NFT_SET_POL_PERFORMANCE ranks by lookup cost then space,
 * NFT_SET_POL_MEMORY by space then lookup cost, with a size-based
 * comparison also visible. A module reference is taken on a newly chosen
 * type and dropped on the one it replaces. ERR_PTR(-EOPNOTSUPP) is the
 * final visible return.
 */
2539 static const struct nft_set_ops *
2540 nft_select_set_ops(const struct nft_ctx *ctx,
2541 const struct nlattr * const nla[],
2542 const struct nft_set_desc *desc,
2543 enum nft_set_policies policy)
2545 const struct nft_set_ops *ops, *bops;
2546 struct nft_set_estimate est, best;
2547 const struct nft_set_type *type;
2550 #ifdef CONFIG_MODULES
2551 if (list_empty(&nf_tables_set_types)) {
2552 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
2553 request_module("nft-set");
2554 nfnl_lock(NFNL_SUBSYS_NFTABLES);
2555 if (!list_empty(&nf_tables_set_types))
2556 return ERR_PTR(-EAGAIN);
2559 if (nla[NFTA_SET_FLAGS] != NULL)
2560 flags = ntohl(nla_get_be32(nla[NFTA_SET_FLAGS]));
2567 list_for_each_entry(type, &nf_tables_set_types, list) {
2570 if (!nft_set_ops_candidate(type, flags))
2572 if (!ops->estimate(desc, flags, &est))
2576 case NFT_SET_POL_PERFORMANCE:
2577 if (est.lookup < best.lookup)
2579 if (est.lookup == best.lookup &&
2580 est.space < best.space)
2583 case NFT_SET_POL_MEMORY:
2585 if (est.space < best.space)
2587 if (est.space == best.space &&
2588 est.lookup < best.lookup)
2590 } else if (est.size < best.size || !bops) {
/* Swap module references when a better candidate replaces the old one. */
2598 if (!try_module_get(type->owner))
2601 module_put(to_set_type(bops)->owner);
2610 return ERR_PTR(-EOPNOTSUPP);
/*
 * Netlink attribute policy for set messages. Names are length-limited
 * strings, the description is nested, timeout and handle are 64-bit, and
 * user data is binary capped at NFT_USERDATA_MAXLEN.
 */
2613 static const struct nla_policy nft_set_policy[NFTA_SET_MAX + 1] = {
2614 [NFTA_SET_TABLE] = { .type = NLA_STRING,
2615 .len = NFT_TABLE_MAXNAMELEN - 1 },
2616 [NFTA_SET_NAME] = { .type = NLA_STRING,
2617 .len = NFT_SET_MAXNAMELEN - 1 },
2618 [NFTA_SET_FLAGS] = { .type = NLA_U32 },
2619 [NFTA_SET_KEY_TYPE] = { .type = NLA_U32 },
2620 [NFTA_SET_KEY_LEN] = { .type = NLA_U32 },
2621 [NFTA_SET_DATA_TYPE] = { .type = NLA_U32 },
2622 [NFTA_SET_DATA_LEN] = { .type = NLA_U32 },
2623 [NFTA_SET_POLICY] = { .type = NLA_U32 },
2624 [NFTA_SET_DESC] = { .type = NLA_NESTED },
2625 [NFTA_SET_ID] = { .type = NLA_U32 },
2626 [NFTA_SET_TIMEOUT] = { .type = NLA_U64 },
2627 [NFTA_SET_GC_INTERVAL] = { .type = NLA_U32 },
2628 [NFTA_SET_USERDATA] = { .type = NLA_BINARY,
2629 .len = NFT_USERDATA_MAXLEN },
2630 [NFTA_SET_OBJ_TYPE] = { .type = NLA_U32 },
2631 [NFTA_SET_HANDLE] = { .type = NLA_U64 },
/* Policy for the nested set description: a single 32-bit size. */
2634 static const struct nla_policy nft_set_desc_policy[NFTA_SET_DESC_MAX + 1] = {
2635 [NFTA_SET_DESC_SIZE] = { .type = NLA_U32 },
/*
 * Initialises @ctx for a set request. The table is looked up only when
 * the table attribute is present; otherwise ctx is initialised with a NULL
 * table. The chain argument passed to nft_ctx_init() is always NULL. A
 * failed table lookup reports the table attribute through @extack.
 */
2638 static int nft_ctx_init_from_setattr(struct nft_ctx *ctx, struct net *net,
2639 const struct sk_buff *skb,
2640 const struct nlmsghdr *nlh,
2641 const struct nlattr * const nla[],
2642 struct netlink_ext_ack *extack,
2645 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
2646 int family = nfmsg->nfgen_family;
2647 struct nft_table *table = NULL;
2649 if (nla[NFTA_SET_TABLE] != NULL) {
2650 table = nft_table_lookup(net, nla[NFTA_SET_TABLE], family,
2652 if (IS_ERR(table)) {
2653 NL_SET_BAD_ATTR(extack, nla[NFTA_SET_TABLE]);
2654 return PTR_ERR(table);
2658 nft_ctx_init(ctx, net, skb, nlh, family, table, NULL, nla);
/*
 * Finds a set in @table by name, restricted to sets active under
 * @genmask. Visible error results are ERR_PTR(-EINVAL), from a guard whose
 * condition is elided, and ERR_PTR(-ENOENT) when no set matches.
 */
2662 static struct nft_set *nft_set_lookup(const struct nft_table *table,
2663 const struct nlattr *nla, u8 genmask)
2665 struct nft_set *set;
2668 return ERR_PTR(-EINVAL);
2670 list_for_each_entry(set, &table->sets, list) {
2671 if (!nla_strcmp(nla, set->name) &&
2672 nft_active_genmask(set, genmask))
2675 return ERR_PTR(-ENOENT);
/*
 * Finds a set in @table by its 64-bit handle (big-endian in @nla),
 * restricted to sets active under the generation mask. Returns
 * ERR_PTR(-ENOENT) when no set matches. The attribute is decoded again on
 * every iteration of the walk.
 */
2678 static struct nft_set *nft_set_lookup_byhandle(const struct nft_table *table,
2679 const struct nlattr *nla,
2682 struct nft_set *set;
2684 list_for_each_entry(set, &table->sets, list) {
2685 if (be64_to_cpu(nla_get_be64(nla)) == set->handle &&
2686 nft_active_genmask(set, genmask))
2689 return ERR_PTR(-ENOENT);
/*
 * Finds a set created earlier in the pending batch: scans the per-net
 * commit list for an NFT_MSG_NEWSET transaction with a matching set id
 * whose set is active under @genmask. Returns ERR_PTR(-ENOENT) otherwise.
 */
2692 static struct nft_set *nft_set_lookup_byid(const struct net *net,
2693 const struct nlattr *nla, u8 genmask)
2695 struct nft_trans *trans;
2696 u32 id = ntohl(nla_get_be32(nla));
2698 list_for_each_entry(trans, &net->nft.commit_list, list) {
2699 struct nft_set *set = nft_trans_set(trans);
2701 if (trans->msg_type == NFT_MSG_NEWSET &&
2702 id == nft_trans_set_id(trans) &&
2703 nft_active_genmask(set, genmask))
2706 return ERR_PTR(-ENOENT);
/*
 * Resolves a set by name first and then by batch id. The condition under
 * which the id lookup runs is not visible in this listing -- presumably
 * when the name lookup failed, TODO confirm.
 */
2709 struct nft_set *nft_set_lookup_global(const struct net *net,
2710 const struct nft_table *table,
2711 const struct nlattr *nla_set_name,
2712 const struct nlattr *nla_set_id,
2715 struct nft_set *set;
2717 set = nft_set_lookup(table, nla_set_name, genmask);
2722 set = nft_set_lookup_byid(net, nla_set_id, genmask);
2726 EXPORT_SYMBOL_GPL(nft_set_lookup_global);
/*
 * nf_tables_set_alloc_name - assign a name to a new set.
 *
 * @name may contain a single "%d" placeholder. In that case the numbers
 * already used by sets in the table are collected in a one-page bitmap,
 * one window of BITS_PER_BYTE * PAGE_SIZE candidates at a time, and the
 * first free number is substituted. The resulting name is then compared
 * with every set that is active in the next generation.
 *
 * Both walks consider only sets that are active in the next generation.
 * The first walk used to test the new set instead of the iterated one,
 * which made the filter a no-op; it now tests the loop cursor, like the
 * second walk.
 */
2728 static int nf_tables_set_alloc_name(struct nft_ctx *ctx, struct nft_set *set,
2731 const struct nft_set *i;
2733 unsigned long *inuse;
2734 unsigned int n = 0, min = 0;
/* Only a single "%d" conversion is accepted in the template. */
2736 p = strchr(name, '%');
2738 if (p[1] != 'd' || strchr(p + 2, '%'))
2741 inuse = (unsigned long *)get_zeroed_page(GFP_KERNEL);
/* Mark the numbers taken by existing sets inside the current window. */
2745 list_for_each_entry(i, &ctx->table->sets, list) {
2748 if (!nft_is_active_next(ctx->net, i))
2750 if (!sscanf(i->name, name, &tmp))
2752 if (tmp < min || tmp >= min + BITS_PER_BYTE * PAGE_SIZE)
2755 set_bit(tmp - min, inuse);
/* A full window moves on to the next one with a cleared bitmap. */
2758 n = find_first_zero_bit(inuse, BITS_PER_BYTE * PAGE_SIZE);
2759 if (n >= BITS_PER_BYTE * PAGE_SIZE) {
2760 min += BITS_PER_BYTE * PAGE_SIZE;
2761 memset(inuse, 0, PAGE_SIZE);
2764 free_page((unsigned long)inuse);
2767 set->name = kasprintf(GFP_KERNEL, name, min + n);
/* Compare the final name with every set active in the next generation. */
2771 list_for_each_entry(i, &ctx->table->sets, list) {
2772 if (!nft_is_active_next(ctx->net, i))
2774 if (!strcmp(set->name, i->name)) {
/*
 * Serialises one set into a netlink message in @skb.
 *
 * Always emitted: nfgenmsg header, table name, set name, handle, key type
 * and key length. Emitted conditionally: flags (when non-zero), data
 * type/length (map sets), object type (object sets), timeout and GC
 * interval, policy (when not NFT_SET_POL_PERFORMANCE), user data, and the
 * nested description with the set size. Several of the conditions are on
 * lines not visible in this listing. Every visible failure jumps to
 * nla_put_failure, where nlmsg_trim() is visible.
 */
2782 static int nf_tables_fill_set(struct sk_buff *skb, const struct nft_ctx *ctx,
2783 const struct nft_set *set, u16 event, u16 flags)
2785 struct nfgenmsg *nfmsg;
2786 struct nlmsghdr *nlh;
2787 struct nlattr *desc;
2788 u32 portid = ctx->portid;
2791 event = nfnl_msg_type(NFNL_SUBSYS_NFTABLES, event);
2792 nlh = nlmsg_put(skb, portid, seq, event, sizeof(struct nfgenmsg),
2795 goto nla_put_failure;
/* res_id carries the low 16 bits of the per-net base sequence. */
2797 nfmsg = nlmsg_data(nlh);
2798 nfmsg->nfgen_family = ctx->family;
2799 nfmsg->version = NFNETLINK_V0;
2800 nfmsg->res_id = htons(ctx->net->nft.base_seq & 0xffff);
2802 if (nla_put_string(skb, NFTA_SET_TABLE, ctx->table->name))
2803 goto nla_put_failure;
2804 if (nla_put_string(skb, NFTA_SET_NAME, set->name))
2805 goto nla_put_failure;
2806 if (nla_put_be64(skb, NFTA_SET_HANDLE, cpu_to_be64(set->handle),
2808 goto nla_put_failure;
2809 if (set->flags != 0)
2810 if (nla_put_be32(skb, NFTA_SET_FLAGS, htonl(set->flags)))
2811 goto nla_put_failure;
2813 if (nla_put_be32(skb, NFTA_SET_KEY_TYPE, htonl(set->ktype)))
2814 goto nla_put_failure;
2815 if (nla_put_be32(skb, NFTA_SET_KEY_LEN, htonl(set->klen)))
2816 goto nla_put_failure;
2817 if (set->flags & NFT_SET_MAP) {
2818 if (nla_put_be32(skb, NFTA_SET_DATA_TYPE, htonl(set->dtype)))
2819 goto nla_put_failure;
2820 if (nla_put_be32(skb, NFTA_SET_DATA_LEN, htonl(set->dlen)))
2821 goto nla_put_failure;
2823 if (set->flags & NFT_SET_OBJECT &&
2824 nla_put_be32(skb, NFTA_SET_OBJ_TYPE, htonl(set->objtype)))
2825 goto nla_put_failure;
2828 nla_put_be64(skb, NFTA_SET_TIMEOUT,
2829 cpu_to_be64(jiffies_to_msecs(set->timeout)),
2831 goto nla_put_failure;
2833 nla_put_be32(skb, NFTA_SET_GC_INTERVAL, htonl(set->gc_int)))
2834 goto nla_put_failure;
2836 if (set->policy != NFT_SET_POL_PERFORMANCE) {
2837 if (nla_put_be32(skb, NFTA_SET_POLICY, htonl(set->policy)))
2838 goto nla_put_failure;
2841 if (nla_put(skb, NFTA_SET_USERDATA, set->udlen, set->udata))
2842 goto nla_put_failure;
2844 desc = nla_nest_start(skb, NFTA_SET_DESC);
2846 goto nla_put_failure;
2848 nla_put_be32(skb, NFTA_SET_DESC_SIZE, htonl(set->size)))
2849 goto nla_put_failure;
2850 nla_nest_end(skb, desc);
2852 nlmsg_end(skb, nlh);
2856 nlmsg_trim(skb, nlh);
/*
 * Sends a set event notification to the NFNLGRP_NFTABLES group.
 *
 * A listener check via nfnetlink_has_listeners() is visible up front. The
 * message is allocated with the caller-supplied gfp flags, built by
 * nf_tables_fill_set() and sent with nfnetlink_send(). nfnetlink_set_err()
 * with -ENOBUFS is the visible failure report.
 */
2860 static void nf_tables_set_notify(const struct nft_ctx *ctx,
2861 const struct nft_set *set, int event,
2864 struct sk_buff *skb;
2865 u32 portid = ctx->portid;
2869 !nfnetlink_has_listeners(ctx->net, NFNLGRP_NFTABLES))
2872 skb = nlmsg_new(NLMSG_GOODSIZE, gfp_flags);
2876 err = nf_tables_fill_set(skb, ctx, set, event, 0);
2882 nfnetlink_send(skb, ctx->net, portid, NFNLGRP_NFTABLES, ctx->report,
2886 nfnetlink_set_err(ctx->net, portid, NFNLGRP_NFTABLES, -ENOBUFS);
/*
 * Netlink dump callback that emits every active set.
 *
 * Tables are filtered by the family and table stored in the dump context
 * (cb->data). Resume state is kept in cb->args: args[0] is read as the
 * start index and args[2] holds the table being dumped (stored as an
 * unsigned long). A per-set context copy (ctx_set) carries the current
 * table and family into nf_tables_fill_set().
 */
2889 static int nf_tables_dump_sets(struct sk_buff *skb, struct netlink_callback *cb)
2891 const struct nft_set *set;
2892 unsigned int idx, s_idx = cb->args[0];
2893 struct nft_table *table, *cur_table = (struct nft_table *)cb->args[2];
2894 struct net *net = sock_net(skb->sk);
2895 struct nft_ctx *ctx = cb->data, ctx_set;
2901 cb->seq = net->nft.base_seq;
2903 list_for_each_entry_rcu(table, &net->nft.tables, list) {
2904 if (ctx->family != NFPROTO_UNSPEC &&
2905 ctx->family != table->family)
2908 if (ctx->table && ctx->table != table)
2912 if (cur_table != table)
2918 list_for_each_entry_rcu(set, &table->sets, list) {
2921 if (!nft_is_active(net, set))
2925 ctx_set.table = table;
2926 ctx_set.family = table->family;
2928 if (nf_tables_fill_set(skb, &ctx_set, set,
2932 cb->args[2] = (unsigned long) table;
2935 nl_dump_check_consistent(cb, nlmsg_hdr(skb));
/*
 * Completion callback registered as .done for set dumps (see
 * nf_tables_getset). The body is not visible in this listing.
 */
2948 static int nf_tables_dump_sets_done(struct netlink_callback *cb)
/*
 * nf_tables_getset - netlink handler for a get-set request.
 *
 * The context is initialised from the request attributes first, so a bad
 * table is rejected before any dump starts. With NLM_F_DUMP a context
 * copy is allocated for the dump callbacks and the dump is started.
 * Otherwise NFPROTO_UNSPEC is rejected with -EAFNOSUPPORT, the table
 * attribute is tested for presence, the set is looked up by name in the
 * current generation, and one NFT_MSG_NEWSET message is unicast back.
 */
2954 static int nf_tables_getset(struct net *net, struct sock *nlsk,
2955 struct sk_buff *skb, const struct nlmsghdr *nlh,
2956 const struct nlattr * const nla[],
2957 struct netlink_ext_ack *extack)
2959 u8 genmask = nft_genmask_cur(net);
2960 const struct nft_set *set;
2962 struct sk_buff *skb2;
2963 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
2966 /* Verify existence before starting dump */
2967 err = nft_ctx_init_from_setattr(&ctx, net, skb, nlh, nla, extack,
2972 if (nlh->nlmsg_flags & NLM_F_DUMP) {
2973 struct netlink_dump_control c = {
2974 .dump = nf_tables_dump_sets,
2975 .done = nf_tables_dump_sets_done,
2977 struct nft_ctx *ctx_dump;
2979 ctx_dump = kmalloc(sizeof(*ctx_dump), GFP_KERNEL);
2980 if (ctx_dump == NULL)
2986 return netlink_dump_start(nlsk, skb, nlh, &c);
2989 /* Only accept unspec with dump */
2990 if (nfmsg->nfgen_family == NFPROTO_UNSPEC)
2991 return -EAFNOSUPPORT;
2992 if (!nla[NFTA_SET_TABLE])
2995 set = nft_set_lookup(ctx.table, nla[NFTA_SET_NAME], genmask);
2997 return PTR_ERR(set);
2999 skb2 = alloc_skb(NLMSG_GOODSIZE, GFP_KERNEL);
3003 err = nf_tables_fill_set(skb2, &ctx, set, NFT_MSG_NEWSET, 0);
3007 return nlmsg_unicast(nlsk, skb2, NETLINK_CB(skb).portid);
/*
 * Parses the nested set description attribute using nft_set_desc_policy
 * and, when a size attribute is present, stores it in desc->size
 * converted from network byte order.
 */
3014 static int nf_tables_set_desc_parse(const struct nft_ctx *ctx,
3015 struct nft_set_desc *desc,
3016 const struct nlattr *nla)
3018 struct nlattr *da[NFTA_SET_DESC_MAX + 1];
3021 err = nla_parse_nested(da, NFTA_SET_DESC_MAX, nla,
3022 nft_set_desc_policy, NULL);
3026 if (da[NFTA_SET_DESC_SIZE] != NULL)
3027 desc->size = ntohl(nla_get_be32(da[NFTA_SET_DESC_SIZE]));
/*
 * Netlink handler that creates a new set in a table.
 *
 * The presence of NFTA_SET_TABLE, NFTA_SET_NAME, NFTA_SET_KEY_LEN and
 * NFTA_SET_ID is checked first. The remaining attributes (key/data type,
 * flags, object type, timeout, GC interval, policy, description, userdata)
 * are then parsed and range-checked, a backend is chosen with
 * nft_select_set_ops(), the set is allocated and filled in, initialised via
 * ops->init(), queued as an NFT_MSG_NEWSET transaction and linked into
 * table->sets.
 */
3032 static int nf_tables_newset(struct net *net, struct sock *nlsk,
3033 struct sk_buff *skb, const struct nlmsghdr *nlh,
3034 const struct nlattr * const nla[],
3035 struct netlink_ext_ack *extack)
3037 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
3038 u8 genmask = nft_genmask_next(net);
3039 int family = nfmsg->nfgen_family;
3040 const struct nft_set_ops *ops;
3041 struct nft_table *table;
3042 struct nft_set *set;
3048 u32 ktype, dtype, flags, policy, gc_int, objtype;
3049 struct nft_set_desc desc;
3050 unsigned char *udata;
/* Attributes every new-set request has to carry. */
3054 if (nla[NFTA_SET_TABLE] == NULL ||
3055 nla[NFTA_SET_NAME] == NULL ||
3056 nla[NFTA_SET_KEY_LEN] == NULL ||
3057 nla[NFTA_SET_ID] == NULL)
3060 memset(&desc, 0, sizeof(desc));
/* Key type defaults to NFT_DATA_VALUE unless NFTA_SET_KEY_TYPE is given. */
3062 ktype = NFT_DATA_VALUE;
3063 if (nla[NFTA_SET_KEY_TYPE] != NULL) {
3064 ktype = ntohl(nla_get_be32(nla[NFTA_SET_KEY_TYPE]));
3065 if ((ktype & NFT_DATA_RESERVED_MASK) == NFT_DATA_RESERVED_MASK)
/* Key length must be non-zero and no larger than NFT_DATA_VALUE_MAXLEN. */
3069 desc.klen = ntohl(nla_get_be32(nla[NFTA_SET_KEY_LEN]));
3070 if (desc.klen == 0 || desc.klen > NFT_DATA_VALUE_MAXLEN)
3074 if (nla[NFTA_SET_FLAGS] != NULL) {
3075 flags = ntohl(nla_get_be32(nla[NFTA_SET_FLAGS]));
3076 if (flags & ~(NFT_SET_ANONYMOUS | NFT_SET_CONSTANT |
3077 NFT_SET_INTERVAL | NFT_SET_TIMEOUT |
3078 NFT_SET_MAP | NFT_SET_EVAL |
3081 /* Only one of these operations is supported.
 * NOTE(review): the test below only matches when MAP, EVAL and OBJECT
 * are all set together; any two of them still pass - confirm intended.
 */
3082 if ((flags & (NFT_SET_MAP | NFT_SET_EVAL | NFT_SET_OBJECT)) ==
3083 (NFT_SET_MAP | NFT_SET_EVAL | NFT_SET_OBJECT))
/* NFTA_SET_DATA_TYPE is tied to the NFT_SET_MAP flag. */
3088 if (nla[NFTA_SET_DATA_TYPE] != NULL) {
3089 if (!(flags & NFT_SET_MAP))
3092 dtype = ntohl(nla_get_be32(nla[NFTA_SET_DATA_TYPE]));
3093 if ((dtype & NFT_DATA_RESERVED_MASK) == NFT_DATA_RESERVED_MASK &&
3094 dtype != NFT_DATA_VERDICT)
3097 if (dtype != NFT_DATA_VERDICT) {
3098 if (nla[NFTA_SET_DATA_LEN] == NULL)
3100 desc.dlen = ntohl(nla_get_be32(nla[NFTA_SET_DATA_LEN]));
3101 if (desc.dlen == 0 || desc.dlen > NFT_DATA_VALUE_MAXLEN)
3104 desc.dlen = sizeof(struct nft_verdict);
3105 } else if (flags & NFT_SET_MAP)
/* NFTA_SET_OBJ_TYPE is tied to the NFT_SET_OBJECT flag. */
3108 if (nla[NFTA_SET_OBJ_TYPE] != NULL) {
3109 if (!(flags & NFT_SET_OBJECT))
3112 objtype = ntohl(nla_get_be32(nla[NFTA_SET_OBJ_TYPE]));
3113 if (objtype == NFT_OBJECT_UNSPEC ||
3114 objtype > NFT_OBJECT_MAX)
3116 } else if (flags & NFT_SET_OBJECT)
3119 objtype = NFT_OBJECT_UNSPEC;
/* Timeout (sent in milliseconds, kept in jiffies) needs NFT_SET_TIMEOUT. */
3122 if (nla[NFTA_SET_TIMEOUT] != NULL) {
3123 if (!(flags & NFT_SET_TIMEOUT))
3125 timeout = msecs_to_jiffies(be64_to_cpu(nla_get_be64(
3126 nla[NFTA_SET_TIMEOUT])));
3129 if (nla[NFTA_SET_GC_INTERVAL] != NULL) {
3130 if (!(flags & NFT_SET_TIMEOUT))
3132 gc_int = ntohl(nla_get_be32(nla[NFTA_SET_GC_INTERVAL]));
/* Performance policy unless NFTA_SET_POLICY says otherwise. */
3135 policy = NFT_SET_POL_PERFORMANCE;
3136 if (nla[NFTA_SET_POLICY] != NULL)
3137 policy = ntohl(nla_get_be32(nla[NFTA_SET_POLICY]));
3139 if (nla[NFTA_SET_DESC] != NULL) {
3140 err = nf_tables_set_desc_parse(&ctx, &desc, nla[NFTA_SET_DESC]);
3145 create = nlh->nlmsg_flags & NLM_F_CREATE ? true : false;
3147 table = nft_table_lookup(net, nla[NFTA_SET_TABLE], family, genmask);
3148 if (IS_ERR(table)) {
3149 NL_SET_BAD_ATTR(extack, nla[NFTA_SET_TABLE]);
3150 return PTR_ERR(table);
3153 nft_ctx_init(&ctx, net, skb, nlh, family, table, NULL, nla);
/* A lookup error other than -ENOENT is passed straight back. */
3155 set = nft_set_lookup(table, nla[NFTA_SET_NAME], genmask);
3157 if (PTR_ERR(set) != -ENOENT) {
3158 NL_SET_BAD_ATTR(extack, nla[NFTA_SET_NAME]);
3159 return PTR_ERR(set);
3162 if (nlh->nlmsg_flags & NLM_F_EXCL) {
3163 NL_SET_BAD_ATTR(extack, nla[NFTA_SET_NAME]);
3166 if (nlh->nlmsg_flags & NLM_F_REPLACE)
3172 if (!(nlh->nlmsg_flags & NLM_F_CREATE))
3175 ops = nft_select_set_ops(&ctx, nla, &desc, policy);
3177 return PTR_ERR(ops);
3180 if (nla[NFTA_SET_USERDATA])
3181 udlen = nla_len(nla[NFTA_SET_USERDATA]);
3184 if (ops->privsize != NULL)
3185 size = ops->privsize(nla, &desc);
/* One allocation covers the set, the backend's private area and userdata. */
3187 set = kvzalloc(sizeof(*set) + size + udlen, GFP_KERNEL);
3193 name = nla_strdup(nla[NFTA_SET_NAME], GFP_KERNEL);
3199 err = nf_tables_set_alloc_name(&ctx, set, name);
/* Userdata sits directly behind the backend's private area. */
3206 udata = set->data + size;
3207 nla_memcpy(udata, nla[NFTA_SET_USERDATA], udlen);
3210 INIT_LIST_HEAD(&set->bindings);
3213 set->klen = desc.klen;
3215 set->objtype = objtype;
3216 set->dlen = desc.dlen;
3218 set->size = desc.size;
3219 set->policy = policy;
3222 set->timeout = timeout;
3223 set->gc_int = gc_int;
3224 set->handle = nf_tables_alloc_handle(table);
3226 err = ops->init(set, &desc, nla);
3230 err = nft_trans_set_add(&ctx, NFT_MSG_NEWSET, set);
3234 list_add_tail_rcu(&set->list, &table->sets);
3243 module_put(to_set_type(ops)->owner);
/*
 * Tear down a set: run the backend's destroy callback, then drop the
 * reference on the module that owns the set type.
 */
3247 static void nft_set_destroy(struct nft_set *set)
3249 set->ops->destroy(set);
3250 module_put(to_set_type(set->ops)->owner);
/*
 * Unlink @set from the RCU list it is on, send an NFT_MSG_DELSET
 * notification (allocated with GFP_ATOMIC) and destroy the set.
 */
3255 static void nf_tables_set_destroy(const struct nft_ctx *ctx, struct nft_set *set)
3257 list_del_rcu(&set->list);
3258 nf_tables_set_notify(ctx, set, NFT_MSG_DELSET, GFP_ATOMIC);
3259 nft_set_destroy(set);
/*
 * Netlink handler that deletes a set.
 *
 * NFPROTO_UNSPEC is refused with -EAFNOSUPPORT. The set is located in the
 * next generation by NFTA_SET_HANDLE when that attribute is present and by
 * NFTA_SET_NAME otherwise; a failed lookup reports the attribute used via
 * extack. A set that still has bindings, or that holds elements while
 * NLM_F_NONREC is set, is likewise reported via extack rather than being
 * passed on to nft_delset().
 */
3262 static int nf_tables_delset(struct net *net, struct sock *nlsk,
3263 struct sk_buff *skb, const struct nlmsghdr *nlh,
3264 const struct nlattr * const nla[],
3265 struct netlink_ext_ack *extack)
3267 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
3268 u8 genmask = nft_genmask_next(net);
3269 const struct nlattr *attr;
3270 struct nft_set *set;
3274 if (nfmsg->nfgen_family == NFPROTO_UNSPEC)
3275 return -EAFNOSUPPORT;
3276 if (nla[NFTA_SET_TABLE] == NULL)
3279 err = nft_ctx_init_from_setattr(&ctx, net, skb, nlh, nla, extack,
/* Prefer the handle when supplied, fall back to the name. */
3284 if (nla[NFTA_SET_HANDLE]) {
3285 attr = nla[NFTA_SET_HANDLE];
3286 set = nft_set_lookup_byhandle(ctx.table, attr, genmask);
3288 attr = nla[NFTA_SET_NAME];
3289 set = nft_set_lookup(ctx.table, attr, genmask);
3293 NL_SET_BAD_ATTR(extack, attr);
3294 return PTR_ERR(set);
3296 if (!list_empty(&set->bindings) ||
3297 (nlh->nlmsg_flags & NLM_F_NONREC && atomic_read(&set->nelems) > 0)) {
3298 NL_SET_BAD_ATTR(extack, attr);
3302 return nft_delset(&ctx, set);
/*
 * Set walk callback installed by nf_tables_bind_set(): validate that storing
 * this element's data into the register derived from the set's data type is
 * permitted in @ctx. The data is validated as NFT_DATA_VERDICT when the set's
 * data type is a verdict, as NFT_DATA_VALUE otherwise.
 */
3305 static int nf_tables_bind_check_setelem(const struct nft_ctx *ctx,
3306 struct nft_set *set,
3307 const struct nft_set_iter *iter,
3308 struct nft_set_elem *elem)
3310 const struct nft_set_ext *ext = nft_set_elem_ext(set, elem->priv);
3311 enum nft_registers dreg;
3313 dreg = nft_type_to_reg(set->dtype);
3314 return nft_validate_register_store(ctx, dreg, nft_set_ext_data(ext),
3315 set->dtype == NFT_DATA_VERDICT ?
3316 NFT_DATA_VERDICT : NFT_DATA_VALUE,
3320 int nf_tables_bind_set(const struct nft_ctx *ctx, struct nft_set *set,
3321 struct nft_set_binding *binding)
3323 struct nft_set_binding *i;
3324 struct nft_set_iter iter;
3326 if (!list_empty(&set->bindings) && nft_set_is_anonymous(set))
3329 if (binding->flags & NFT_SET_MAP) {
3330 /* If the set is already bound to the same chain, all
3331 * jumps are already validated for that chain. */
3333 list_for_each_entry(i, &set->bindings, list) {
3334 if (i->flags & NFT_SET_MAP &&
3335 i->chain == binding->chain)
3339 iter.genmask = nft_genmask_next(ctx->net);
3343 iter.fn = nf_tables_bind_check_setelem;
3345 set->ops->walk(ctx, set, &iter);
3350 binding->chain = ctx->chain;
3351 list_add_tail_rcu(&binding->list, &set->bindings);
3354 EXPORT_SYMBOL_GPL(nf_tables_bind_set);
/*
 * Remove @binding from its set. If that leaves an anonymous set without any
 * bindings, and the set is active in ctx->net, the set itself is destroyed.
 */
3356 void nf_tables_unbind_set(const struct nft_ctx *ctx, struct nft_set *set,
3357 struct nft_set_binding *binding)
3359 list_del_rcu(&binding->list);
3361 if (list_empty(&set->bindings) && nft_set_is_anonymous(set) &&
3362 nft_is_active(ctx->net, set))
3363 nf_tables_set_destroy(ctx, set);
3365 EXPORT_SYMBOL_GPL(nf_tables_unbind_set);
/*
 * Layout description for each set element extension, indexed by
 * NFT_SET_EXT_*: the required alignment and, for the entries that specify
 * one, the length of the extension.
 */
3367 const struct nft_set_ext_type nft_set_ext_types[] = {
3368 [NFT_SET_EXT_KEY] = {
3369 .align = __alignof__(u32),
3371 [NFT_SET_EXT_DATA] = {
3372 .align = __alignof__(u32),
3374 [NFT_SET_EXT_EXPR] = {
3375 .align = __alignof__(struct nft_expr),
3377 [NFT_SET_EXT_OBJREF] = {
3378 .len = sizeof(struct nft_object *),
3379 .align = __alignof__(struct nft_object *),
3381 [NFT_SET_EXT_FLAGS] = {
3383 .align = __alignof__(u8),
3385 [NFT_SET_EXT_TIMEOUT] = {
3387 .align = __alignof__(u64),
3389 [NFT_SET_EXT_EXPIRATION] = {
3390 .len = sizeof(unsigned long),
3391 .align = __alignof__(unsigned long),
3393 [NFT_SET_EXT_USERDATA] = {
3394 .len = sizeof(struct nft_userdata),
3395 .align = __alignof__(struct nft_userdata),
3398 EXPORT_SYMBOL_GPL(nft_set_ext_types);
/*
 * Netlink attribute policy for a single set element (NFTA_SET_ELEM_*).
 * Passed to nla_parse_nested() by the element get, add and delete paths.
 * Userdata is binary and limited to NFT_USERDATA_MAXLEN bytes.
 */
3404 static const struct nla_policy nft_set_elem_policy[NFTA_SET_ELEM_MAX + 1] = {
3405 [NFTA_SET_ELEM_KEY] = { .type = NLA_NESTED },
3406 [NFTA_SET_ELEM_DATA] = { .type = NLA_NESTED },
3407 [NFTA_SET_ELEM_FLAGS] = { .type = NLA_U32 },
3408 [NFTA_SET_ELEM_TIMEOUT] = { .type = NLA_U64 },
3409 [NFTA_SET_ELEM_USERDATA] = { .type = NLA_BINARY,
3410 .len = NFT_USERDATA_MAXLEN },
3411 [NFTA_SET_ELEM_EXPR] = { .type = NLA_NESTED },
3412 [NFTA_SET_ELEM_OBJREF] = { .type = NLA_STRING },
/*
 * Netlink attribute policy for element-list messages (NFTA_SET_ELEM_LIST_*):
 * length-limited table and set names, the nested list of elements and a
 * 32-bit set ID.
 */
3415 static const struct nla_policy nft_set_elem_list_policy[NFTA_SET_ELEM_LIST_MAX + 1] = {
3416 [NFTA_SET_ELEM_LIST_TABLE] = { .type = NLA_STRING,
3417 .len = NFT_TABLE_MAXNAMELEN - 1 },
3418 [NFTA_SET_ELEM_LIST_SET] = { .type = NLA_STRING,
3419 .len = NFT_SET_MAXNAMELEN - 1 },
3420 [NFTA_SET_ELEM_LIST_ELEMENTS] = { .type = NLA_NESTED },
3421 [NFTA_SET_ELEM_LIST_SET_ID] = { .type = NLA_U32 },
/*
 * Resolve the table named by NFTA_SET_ELEM_LIST_TABLE for the family carried
 * in the message header and initialise @ctx for it, with no chain set.
 * If the table lookup fails, the table attribute is reported through
 * @extack and the lookup error is returned.
 */
3424 static int nft_ctx_init_from_elemattr(struct nft_ctx *ctx, struct net *net,
3425 const struct sk_buff *skb,
3426 const struct nlmsghdr *nlh,
3427 const struct nlattr * const nla[],
3428 struct netlink_ext_ack *extack,
3431 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
3432 int family = nfmsg->nfgen_family;
3433 struct nft_table *table;
3435 table = nft_table_lookup(net, nla[NFTA_SET_ELEM_LIST_TABLE], family,
3437 if (IS_ERR(table)) {
3438 NL_SET_BAD_ATTR(extack, nla[NFTA_SET_ELEM_LIST_TABLE]);
3439 return PTR_ERR(table);
3442 nft_ctx_init(ctx, net, skb, nlh, family, table, NULL, nla);
/*
 * Serialise one set element into @skb as a nested NFTA_LIST_ELEM attribute.
 *
 * The key is always emitted. Data, expression, object reference (by name),
 * flags, timeout, expiration and userdata follow for whichever of those
 * extensions the element carries. Any attribute that cannot be appended
 * sends control to the nla_put_failure label.
 */
3446 static int nf_tables_fill_setelem(struct sk_buff *skb,
3447 const struct nft_set *set,
3448 const struct nft_set_elem *elem)
3450 const struct nft_set_ext *ext = nft_set_elem_ext(set, elem->priv);
3451 unsigned char *b = skb_tail_pointer(skb);
3452 struct nlattr *nest;
3454 nest = nla_nest_start(skb, NFTA_LIST_ELEM);
3456 goto nla_put_failure;
3458 if (nft_data_dump(skb, NFTA_SET_ELEM_KEY, nft_set_ext_key(ext),
3459 NFT_DATA_VALUE, set->klen) < 0)
3460 goto nla_put_failure;
/* Data is dumped as a verdict for verdict maps, as a plain value otherwise. */
3462 if (nft_set_ext_exists(ext, NFT_SET_EXT_DATA) &&
3463 nft_data_dump(skb, NFTA_SET_ELEM_DATA, nft_set_ext_data(ext),
3464 set->dtype == NFT_DATA_VERDICT ? NFT_DATA_VERDICT : NFT_DATA_VALUE,
3466 goto nla_put_failure;
3468 if (nft_set_ext_exists(ext, NFT_SET_EXT_EXPR) &&
3469 nft_expr_dump(skb, NFTA_SET_ELEM_EXPR, nft_set_ext_expr(ext)) < 0)
3470 goto nla_put_failure;
3472 if (nft_set_ext_exists(ext, NFT_SET_EXT_OBJREF) &&
3473 nla_put_string(skb, NFTA_SET_ELEM_OBJREF,
3474 (*nft_set_ext_obj(ext))->name) < 0)
3475 goto nla_put_failure;
3477 if (nft_set_ext_exists(ext, NFT_SET_EXT_FLAGS) &&
3478 nla_put_be32(skb, NFTA_SET_ELEM_FLAGS,
3479 htonl(*nft_set_ext_flags(ext))))
3480 goto nla_put_failure;
/* The stored timeout is in jiffies; it is sent as big-endian milliseconds. */
3482 if (nft_set_ext_exists(ext, NFT_SET_EXT_TIMEOUT) &&
3483 nla_put_be64(skb, NFTA_SET_ELEM_TIMEOUT,
3484 cpu_to_be64(jiffies_to_msecs(
3485 *nft_set_ext_timeout(ext))),
3487 goto nla_put_failure;
3489 if (nft_set_ext_exists(ext, NFT_SET_EXT_EXPIRATION)) {
3490 unsigned long expires, now = jiffies;
3492 expires = *nft_set_ext_expiration(ext);
3493 if (time_before(now, expires))
3498 if (nla_put_be64(skb, NFTA_SET_ELEM_EXPIRATION,
3499 cpu_to_be64(jiffies_to_msecs(expires)),
3501 goto nla_put_failure;
3504 if (nft_set_ext_exists(ext, NFT_SET_EXT_USERDATA)) {
3505 struct nft_userdata *udata;
3507 udata = nft_set_ext_userdata(ext);
/* udata->len is stored as length minus one by nft_add_set_elem(), hence + 1. */
3508 if (nla_put(skb, NFTA_SET_ELEM_USERDATA,
3509 udata->len + 1, udata->data))
3510 goto nla_put_failure;
3513 nla_nest_end(skb, nest);
/*
 * Arguments for an element dump walk. The iterator is embedded so that the
 * walk callback can get back to this structure with container_of(); @skb is
 * the message being filled.
 */
3521 struct nft_set_dump_args {
3522 const struct netlink_callback *cb;
3523 struct nft_set_iter iter;
3524 struct sk_buff *skb;
/*
 * Set walk callback for element dumps: recover the enclosing
 * struct nft_set_dump_args from @iter and append @elem to its skb.
 */
3527 static int nf_tables_dump_setelem(const struct nft_ctx *ctx,
3528 struct nft_set *set,
3529 const struct nft_set_iter *iter,
3530 struct nft_set_elem *elem)
3532 struct nft_set_dump_args *args;
3534 args = container_of(iter, struct nft_set_dump_args, iter);
3535 return nf_tables_fill_setelem(args->skb, set, elem);
/*
 * Context of an element dump, reached through cb->data in
 * nf_tables_dump_set(). @set is the set being dumped.
 * NOTE(review): users also access a ->ctx member that is not visible in
 * this listing - confirm the full layout.
 */
3538 struct nft_set_dump_ctx {
3539 const struct nft_set *set;
/*
 * Netlink dump callback that emits the elements of a single set.
 *
 * The tables of the namespace are scanned for the table recorded in the dump
 * context, and that table's sets for the recorded set. An NFT_MSG_NEWSETELEM
 * message is then built with the table name, the set name and a nested
 * NFTA_SET_ELEM_LIST_ELEMENTS attribute, which is filled by walking the set
 * with nf_tables_dump_setelem(). cb->args[0] holds the element count reached
 * so far; it is used as the walk's skip value and updated after the walk.
 */
3543 static int nf_tables_dump_set(struct sk_buff *skb, struct netlink_callback *cb)
3545 struct nft_set_dump_ctx *dump_ctx = cb->data;
3546 struct net *net = sock_net(skb->sk);
3547 struct nft_table *table;
3548 struct nft_set *set;
3549 struct nft_set_dump_args args;
3550 bool set_found = false;
3551 struct nfgenmsg *nfmsg;
3552 struct nlmsghdr *nlh;
3553 struct nlattr *nest;
3558 list_for_each_entry_rcu(table, &net->nft.tables, list) {
3559 if (dump_ctx->ctx.family != NFPROTO_UNSPEC &&
3560 dump_ctx->ctx.family != table->family)
3563 if (table != dump_ctx->ctx.table)
3566 list_for_each_entry_rcu(set, &table->sets, list) {
3567 if (set == dump_ctx->set) {
3580 event = nfnl_msg_type(NFNL_SUBSYS_NFTABLES, NFT_MSG_NEWSETELEM);
3581 portid = NETLINK_CB(cb->skb).portid;
3582 seq = cb->nlh->nlmsg_seq;
3584 nlh = nlmsg_put(skb, portid, seq, event, sizeof(struct nfgenmsg),
3587 goto nla_put_failure;
3589 nfmsg = nlmsg_data(nlh);
3590 nfmsg->nfgen_family = table->family;
3591 nfmsg->version = NFNETLINK_V0;
3592 nfmsg->res_id = htons(net->nft.base_seq & 0xffff);
3594 if (nla_put_string(skb, NFTA_SET_ELEM_LIST_TABLE, table->name))
3595 goto nla_put_failure;
3596 if (nla_put_string(skb, NFTA_SET_ELEM_LIST_SET, set->name))
3597 goto nla_put_failure;
3599 nest = nla_nest_start(skb, NFTA_SET_ELEM_LIST_ELEMENTS);
3601 goto nla_put_failure;
/* Resume after the elements already sent by earlier dump rounds. */
3605 args.iter.genmask = nft_genmask_cur(net);
3606 args.iter.skip = cb->args[0];
3607 args.iter.count = 0;
3609 args.iter.fn = nf_tables_dump_setelem;
3610 set->ops->walk(&dump_ctx->ctx, set, &args.iter);
3613 nla_nest_end(skb, nest);
3614 nlmsg_end(skb, nlh);
/* -EMSGSIZE is not treated as a hard error here. */
3616 if (args.iter.err && args.iter.err != -EMSGSIZE)
3617 return args.iter.err;
3618 if (args.iter.count == cb->args[0])
3621 cb->args[0] = args.iter.count;
3629 static int nf_tables_dump_set_done(struct netlink_callback *cb)
/*
 * Build a complete netlink message of type @event describing one element:
 * an nfgenmsg header taken from @ctx, the table and set names, and the
 * element itself nested under NFTA_SET_ELEM_LIST_ELEMENTS. The message is
 * trimmed back with nlmsg_trim() at the end of the function.
 * NOTE(review): the names are emitted as NFTA_SET_TABLE/NFTA_SET_NAME while
 * nf_tables_dump_set() uses NFTA_SET_ELEM_LIST_TABLE/NFTA_SET_ELEM_LIST_SET;
 * presumably the attribute numbers coincide - confirm.
 */
3635 static int nf_tables_fill_setelem_info(struct sk_buff *skb,
3636 const struct nft_ctx *ctx, u32 seq,
3637 u32 portid, int event, u16 flags,
3638 const struct nft_set *set,
3639 const struct nft_set_elem *elem)
3641 struct nfgenmsg *nfmsg;
3642 struct nlmsghdr *nlh;
3643 struct nlattr *nest;
3646 event = nfnl_msg_type(NFNL_SUBSYS_NFTABLES, event);
3647 nlh = nlmsg_put(skb, portid, seq, event, sizeof(struct nfgenmsg),
3650 goto nla_put_failure;
3652 nfmsg = nlmsg_data(nlh);
3653 nfmsg->nfgen_family = ctx->family;
3654 nfmsg->version = NFNETLINK_V0;
3655 nfmsg->res_id = htons(ctx->net->nft.base_seq & 0xffff);
3657 if (nla_put_string(skb, NFTA_SET_TABLE, ctx->table->name))
3658 goto nla_put_failure;
3659 if (nla_put_string(skb, NFTA_SET_NAME, set->name))
3660 goto nla_put_failure;
3662 nest = nla_nest_start(skb, NFTA_SET_ELEM_LIST_ELEMENTS);
3664 goto nla_put_failure;
3666 err = nf_tables_fill_setelem(skb, set, elem);
3668 goto nla_put_failure;
3670 nla_nest_end(skb, nest);
3672 nlmsg_end(skb, nlh);
3676 nlmsg_trim(skb, nlh);
/*
 * Read the element flags from @attr (network byte order) into *flags and
 * check them: bits other than NFT_SET_ELEM_INTERVAL_END are tested for, as
 * is NFT_SET_ELEM_INTERVAL_END on a set without NFT_SET_INTERVAL.
 */
3680 static int nft_setelem_parse_flags(const struct nft_set *set,
3681 const struct nlattr *attr, u32 *flags)
3686 *flags = ntohl(nla_get_be32(attr));
3687 if (*flags & ~NFT_SET_ELEM_INTERVAL_END)
3689 if (!(set->flags & NFT_SET_INTERVAL) &&
3690 *flags & NFT_SET_ELEM_INTERVAL_END)
/*
 * Look up the element described by @attr in @set and unicast it to the
 * requester as an NFT_MSG_NEWSETELEM message.
 *
 * The parsed key is checked for type NFT_DATA_VALUE and for a length equal
 * to set->klen. The lookup itself is delegated to the backend's get()
 * callback. An -EAGAIN result is reported to the caller as -ENOBUFS.
 */
3696 static int nft_get_set_elem(struct nft_ctx *ctx, struct nft_set *set,
3697 const struct nlattr *attr)
3699 struct nlattr *nla[NFTA_SET_ELEM_MAX + 1];
3700 const struct nft_set_ext *ext;
3701 struct nft_data_desc desc;
3702 struct nft_set_elem elem;
3703 struct sk_buff *skb;
3708 err = nla_parse_nested(nla, NFTA_SET_ELEM_MAX, attr,
3709 nft_set_elem_policy, NULL);
3713 if (!nla[NFTA_SET_ELEM_KEY])
3716 err = nft_setelem_parse_flags(set, nla[NFTA_SET_ELEM_FLAGS], &flags);
3720 err = nft_data_init(ctx, &elem.key.val, sizeof(elem.key), &desc,
3721 nla[NFTA_SET_ELEM_KEY]);
3726 if (desc.type != NFT_DATA_VALUE || desc.len != set->klen)
3729 priv = set->ops->get(ctx->net, set, &elem, flags);
3731 return PTR_ERR(priv);
3734 ext = nft_set_elem_ext(set, &elem);
3737 skb = nlmsg_new(NLMSG_GOODSIZE, GFP_KERNEL);
3741 err = nf_tables_fill_setelem_info(skb, ctx, ctx->seq, ctx->portid,
3742 NFT_MSG_NEWSETELEM, 0, set, &elem);
3746 err = nfnetlink_unicast(skb, ctx->net, ctx->portid, MSG_DONTWAIT);
3747 /* This avoids a loop in nfnetlink. */
3755 /* this avoids a loop in nfnetlink. */
3756 return err == -EAGAIN ? -ENOBUFS : err;
/*
 * Netlink handler for element GET requests.
 *
 * Table and set are resolved in the current generation. With NLM_F_DUMP a
 * dump over the set is started using nf_tables_dump_set() and a separately
 * allocated dump context recording the set and a copy of the ctx. Otherwise
 * every nested attribute in NFTA_SET_ELEM_LIST_ELEMENTS is handed to
 * nft_get_set_elem().
 */
3759 static int nf_tables_getsetelem(struct net *net, struct sock *nlsk,
3760 struct sk_buff *skb, const struct nlmsghdr *nlh,
3761 const struct nlattr * const nla[],
3762 struct netlink_ext_ack *extack)
3764 u8 genmask = nft_genmask_cur(net);
3765 struct nft_set *set;
3766 struct nlattr *attr;
3770 err = nft_ctx_init_from_elemattr(&ctx, net, skb, nlh, nla, extack,
3775 set = nft_set_lookup(ctx.table, nla[NFTA_SET_ELEM_LIST_SET], genmask);
3777 return PTR_ERR(set);
3779 if (nlh->nlmsg_flags & NLM_F_DUMP) {
3780 struct netlink_dump_control c = {
3781 .dump = nf_tables_dump_set,
3782 .done = nf_tables_dump_set_done,
3784 struct nft_set_dump_ctx *dump_ctx;
3786 dump_ctx = kmalloc(sizeof(*dump_ctx), GFP_KERNEL);
3790 dump_ctx->set = set;
3791 dump_ctx->ctx = ctx;
3794 return netlink_dump_start(nlsk, skb, nlh, &c);
3797 if (!nla[NFTA_SET_ELEM_LIST_ELEMENTS])
3800 nla_for_each_nested(attr, nla[NFTA_SET_ELEM_LIST_ELEMENTS], rem) {
3801 err = nft_get_set_elem(&ctx, set, attr);
/*
 * Send an element notification of type @event to the NFNLGRP_NFTABLES
 * multicast group. Whether a report was requested and whether the group has
 * listeners is tested before anything is allocated. The function also
 * contains a nfnetlink_set_err(..., -ENOBUFS) call - presumably the failure
 * path; the labels leading to it are not visible here.
 */
3809 static void nf_tables_setelem_notify(const struct nft_ctx *ctx,
3810 const struct nft_set *set,
3811 const struct nft_set_elem *elem,
3812 int event, u16 flags)
3814 struct net *net = ctx->net;
3815 u32 portid = ctx->portid;
3816 struct sk_buff *skb;
3819 if (!ctx->report && !nfnetlink_has_listeners(net, NFNLGRP_NFTABLES))
3822 skb = nlmsg_new(NLMSG_GOODSIZE, GFP_KERNEL);
3826 err = nf_tables_fill_setelem_info(skb, ctx, 0, portid, event, flags,
3833 nfnetlink_send(skb, net, portid, NFNLGRP_NFTABLES, ctx->report,
3837 nfnetlink_set_err(net, portid, NFNLGRP_NFTABLES, -ENOBUFS);
/*
 * Allocate a transaction of @msg_type with room for a struct nft_trans_elem
 * and record @set in it.
 */
3840 static struct nft_trans *nft_trans_elem_alloc(struct nft_ctx *ctx,
3842 struct nft_set *set)
3844 struct nft_trans *trans;
3846 trans = nft_trans_alloc(ctx, msg_type, sizeof(struct nft_trans_elem));
3850 nft_trans_elem_set(trans) = set;
/*
 * Allocate and initialise a set element.
 *
 * The allocation is zeroed and sized as the backend's per-element size
 * (set->ops->elemsize) plus the extension area described by @tmpl. The key
 * is always copied in (set->klen bytes); data (set->dlen bytes), expiration
 * and timeout are only written when the template contains the matching
 * extension.
 */
3854 void *nft_set_elem_init(const struct nft_set *set,
3855 const struct nft_set_ext_tmpl *tmpl,
3856 const u32 *key, const u32 *data,
3857 u64 timeout, gfp_t gfp)
3859 struct nft_set_ext *ext;
3862 elem = kzalloc(set->ops->elemsize + tmpl->len, gfp);
3866 ext = nft_set_elem_ext(set, elem);
3867 nft_set_ext_init(ext, tmpl);
3869 memcpy(nft_set_ext_key(ext), key, set->klen);
3870 if (nft_set_ext_exists(ext, NFT_SET_EXT_DATA))
3871 memcpy(nft_set_ext_data(ext), data, set->dlen);
3872 if (nft_set_ext_exists(ext, NFT_SET_EXT_EXPIRATION))
3873 *nft_set_ext_expiration(ext) =
3875 if (nft_set_ext_exists(ext, NFT_SET_EXT_TIMEOUT))
3876 *nft_set_ext_timeout(ext) = timeout;
/*
 * Release what an element references: its key, its data when present, its
 * expression when present and @destroy_expr is set, and one use count on a
 * referenced object.
 */
3881 void nft_set_elem_destroy(const struct nft_set *set, void *elem,
3884 struct nft_set_ext *ext = nft_set_elem_ext(set, elem);
3886 nft_data_release(nft_set_ext_key(ext), NFT_DATA_VALUE);
3887 if (nft_set_ext_exists(ext, NFT_SET_EXT_DATA))
3888 nft_data_release(nft_set_ext_data(ext), set->dtype);
3889 if (destroy_expr && nft_set_ext_exists(ext, NFT_SET_EXT_EXPR))
3890 nf_tables_expr_destroy(NULL, nft_set_ext_expr(ext));
3891 if (nft_set_ext_exists(ext, NFT_SET_EXT_OBJREF))
3892 (*nft_set_ext_obj(ext))->use--;
3895 EXPORT_SYMBOL_GPL(nft_set_elem_destroy);
3897 /* Only called from the commit path; nft_set_elem_deactivate() has already
3898 * dealt with the refcounting during the preparation phase. */
3900 static void nf_tables_set_elem_destroy(const struct nft_set *set, void *elem)
3902 struct nft_set_ext *ext = nft_set_elem_ext(set, elem);
/* Tear down the element's expression, if it carries one. */
3904 if (nft_set_ext_exists(ext, NFT_SET_EXT_EXPR))
3905 nf_tables_expr_destroy(NULL, nft_set_ext_expr(ext));
3909 static int nft_add_set_elem(struct nft_ctx *ctx, struct nft_set *set,
3910 const struct nlattr *attr, u32 nlmsg_flags)
3912 struct nlattr *nla[NFTA_SET_ELEM_MAX + 1];
3913 u8 genmask = nft_genmask_next(ctx->net);
3914 struct nft_data_desc d1, d2;
3915 struct nft_set_ext_tmpl tmpl;
3916 struct nft_set_ext *ext, *ext2;
3917 struct nft_set_elem elem;
3918 struct nft_set_binding *binding;
3919 struct nft_object *obj = NULL;
3920 struct nft_userdata *udata;
3921 struct nft_data data;
3922 enum nft_registers dreg;
3923 struct nft_trans *trans;
3929 err = nla_parse_nested(nla, NFTA_SET_ELEM_MAX, attr,
3930 nft_set_elem_policy, NULL);
3934 if (nla[NFTA_SET_ELEM_KEY] == NULL)
3937 nft_set_ext_prepare(&tmpl);
3939 err = nft_setelem_parse_flags(set, nla[NFTA_SET_ELEM_FLAGS], &flags);
3943 nft_set_ext_add(&tmpl, NFT_SET_EXT_FLAGS);
3945 if (set->flags & NFT_SET_MAP) {
3946 if (nla[NFTA_SET_ELEM_DATA] == NULL &&
3947 !(flags & NFT_SET_ELEM_INTERVAL_END))
3949 if (nla[NFTA_SET_ELEM_DATA] != NULL &&
3950 flags & NFT_SET_ELEM_INTERVAL_END)
3953 if (nla[NFTA_SET_ELEM_DATA] != NULL)
3958 if (nla[NFTA_SET_ELEM_TIMEOUT] != NULL) {
3959 if (!(set->flags & NFT_SET_TIMEOUT))
3961 timeout = msecs_to_jiffies(be64_to_cpu(nla_get_be64(
3962 nla[NFTA_SET_ELEM_TIMEOUT])));
3963 } else if (set->flags & NFT_SET_TIMEOUT) {
3964 timeout = set->timeout;
3967 err = nft_data_init(ctx, &elem.key.val, sizeof(elem.key), &d1,
3968 nla[NFTA_SET_ELEM_KEY]);
3972 if (d1.type != NFT_DATA_VALUE || d1.len != set->klen)
3975 nft_set_ext_add_length(&tmpl, NFT_SET_EXT_KEY, d1.len);
3977 nft_set_ext_add(&tmpl, NFT_SET_EXT_EXPIRATION);
3978 if (timeout != set->timeout)
3979 nft_set_ext_add(&tmpl, NFT_SET_EXT_TIMEOUT);
3982 if (nla[NFTA_SET_ELEM_OBJREF] != NULL) {
3983 if (!(set->flags & NFT_SET_OBJECT)) {
3987 obj = nft_obj_lookup(ctx->table, nla[NFTA_SET_ELEM_OBJREF],
3988 set->objtype, genmask);
3993 nft_set_ext_add(&tmpl, NFT_SET_EXT_OBJREF);
3996 if (nla[NFTA_SET_ELEM_DATA] != NULL) {
3997 err = nft_data_init(ctx, &data, sizeof(data), &d2,
3998 nla[NFTA_SET_ELEM_DATA]);
4003 if (set->dtype != NFT_DATA_VERDICT && d2.len != set->dlen)
4006 dreg = nft_type_to_reg(set->dtype);
4007 list_for_each_entry(binding, &set->bindings, list) {
4008 struct nft_ctx bind_ctx = {
4010 .family = ctx->family,
4011 .table = ctx->table,
4012 .chain = (struct nft_chain *)binding->chain,
4015 if (!(binding->flags & NFT_SET_MAP))
4018 err = nft_validate_register_store(&bind_ctx, dreg,
4025 nft_set_ext_add_length(&tmpl, NFT_SET_EXT_DATA, d2.len);
4028 /* The full maximum length of userdata can exceed the maximum
4029 * offset value (U8_MAX) for following extensions, therefore it
4030 * must be the last extension added. */
4033 if (nla[NFTA_SET_ELEM_USERDATA] != NULL) {
4034 ulen = nla_len(nla[NFTA_SET_ELEM_USERDATA]);
4036 nft_set_ext_add_length(&tmpl, NFT_SET_EXT_USERDATA,
4041 elem.priv = nft_set_elem_init(set, &tmpl, elem.key.val.data, data.data,
4042 timeout, GFP_KERNEL);
4043 if (elem.priv == NULL)
4046 ext = nft_set_elem_ext(set, elem.priv);
4048 *nft_set_ext_flags(ext) = flags;
4050 udata = nft_set_ext_userdata(ext);
4051 udata->len = ulen - 1;
4052 nla_memcpy(&udata->data, nla[NFTA_SET_ELEM_USERDATA], ulen);
4055 *nft_set_ext_obj(ext) = obj;
4059 trans = nft_trans_elem_alloc(ctx, NFT_MSG_NEWSETELEM, set);
4063 ext->genmask = nft_genmask_cur(ctx->net) | NFT_SET_ELEM_BUSY_MASK;
4064 err = set->ops->insert(ctx->net, set, &elem, &ext2);
4066 if (err == -EEXIST) {
4067 if (nft_set_ext_exists(ext, NFT_SET_EXT_DATA) ^
4068 nft_set_ext_exists(ext2, NFT_SET_EXT_DATA) ||
4069 nft_set_ext_exists(ext, NFT_SET_EXT_OBJREF) ^
4070 nft_set_ext_exists(ext2, NFT_SET_EXT_OBJREF))
4072 if ((nft_set_ext_exists(ext, NFT_SET_EXT_DATA) &&
4073 nft_set_ext_exists(ext2, NFT_SET_EXT_DATA) &&
4074 memcmp(nft_set_ext_data(ext),
4075 nft_set_ext_data(ext2), set->dlen) != 0) ||
4076 (nft_set_ext_exists(ext, NFT_SET_EXT_OBJREF) &&
4077 nft_set_ext_exists(ext2, NFT_SET_EXT_OBJREF) &&
4078 *nft_set_ext_obj(ext) != *nft_set_ext_obj(ext2)))
4080 else if (!(nlmsg_flags & NLM_F_EXCL))
4087 !atomic_add_unless(&set->nelems, 1, set->size + set->ndeact)) {
4092 nft_trans_elem(trans) = elem;
4093 list_add_tail(&trans->list, &ctx->net->nft.commit_list);
4097 set->ops->remove(ctx->net, set, &elem);
4103 if (nla[NFTA_SET_ELEM_DATA] != NULL)
4104 nft_data_release(&data, d2.type);
4106 nft_data_release(&elem.key.val, d1.type);
/*
 * Netlink handler that adds elements to a set.
 *
 * The presence of NFTA_SET_ELEM_LIST_ELEMENTS is checked first. The set is
 * resolved in the next generation through nft_set_lookup_global(), which is
 * given both the set name and the set ID attribute. A set that has bindings
 * and is flagged NFT_SET_CONSTANT is tested for before any element is
 * processed; each nested attribute is then passed to nft_add_set_elem()
 * together with the message flags.
 */
4111 static int nf_tables_newsetelem(struct net *net, struct sock *nlsk,
4112 struct sk_buff *skb, const struct nlmsghdr *nlh,
4113 const struct nlattr * const nla[],
4114 struct netlink_ext_ack *extack)
4116 u8 genmask = nft_genmask_next(net);
4117 const struct nlattr *attr;
4118 struct nft_set *set;
4122 if (nla[NFTA_SET_ELEM_LIST_ELEMENTS] == NULL)
4125 err = nft_ctx_init_from_elemattr(&ctx, net, skb, nlh, nla, extack,
4130 set = nft_set_lookup_global(net, ctx.table, nla[NFTA_SET_ELEM_LIST_SET],
4131 nla[NFTA_SET_ELEM_LIST_SET_ID], genmask);
4133 return PTR_ERR(set);
4135 if (!list_empty(&set->bindings) && set->flags & NFT_SET_CONSTANT)
4138 nla_for_each_nested(attr, nla[NFTA_SET_ELEM_LIST_ELEMENTS], rem) {
4139 err = nft_add_set_elem(&ctx, set, attr, nlh->nlmsg_flags);
/**
4147 * nft_data_hold - hold a nft_data item
 *
4149 * @data: struct nft_data to hold
4150 * @type: type of data
 *
4152 * Hold a nft_data item. NFT_DATA_VALUE types can be silently discarded,
4153 * NFT_DATA_VERDICT bumps the reference to chains in case of NFT_JUMP and
4154 * NFT_GOTO verdicts. This function must be called on active data objects
4155 * from the second phase of the commit protocol.
 */
4157 static void nft_data_hold(const struct nft_data *data, enum nft_data_types type)
/* Only verdict data can reference a chain; other types need no action here. */
4159 if (type == NFT_DATA_VERDICT) {
4160 switch (data->verdict.code) {
4163 data->verdict.chain->use++;
/*
 * Take the references an element implies: hold its data when it has a data
 * extension and bump the use count of the object it refers to when it has
 * an object reference.
 */
4169 static void nft_set_elem_activate(const struct net *net,
4170 const struct nft_set *set,
4171 struct nft_set_elem *elem)
4173 const struct nft_set_ext *ext = nft_set_elem_ext(set, elem->priv);
4175 if (nft_set_ext_exists(ext, NFT_SET_EXT_DATA))
4176 nft_data_hold(nft_set_ext_data(ext), set->dtype);
4177 if (nft_set_ext_exists(ext, NFT_SET_EXT_OBJREF))
4178 (*nft_set_ext_obj(ext))->use++;
/*
 * Counterpart of nft_set_elem_activate(): release the element's data when
 * it has a data extension and drop the use count of the object it refers to
 * when it has an object reference.
 */
4181 static void nft_set_elem_deactivate(const struct net *net,
4182 const struct nft_set *set,
4183 struct nft_set_elem *elem)
4185 const struct nft_set_ext *ext = nft_set_elem_ext(set, elem->priv);
4187 if (nft_set_ext_exists(ext, NFT_SET_EXT_DATA))
4188 nft_data_release(nft_set_ext_data(ext), set->dtype);
4189 if (nft_set_ext_exists(ext, NFT_SET_EXT_OBJREF))
4190 (*nft_set_ext_obj(ext))->use--;
/*
 * Queue the deletion of the element described by @attr.
 *
 * A temporary element holding only flags and key is built from the
 * attribute and handed to the backend's deactivate() callback. The
 * references implied by the element are dropped with
 * nft_set_elem_deactivate() and an NFT_MSG_DELSETELEM transaction carrying
 * the element is appended to the commit list.
 */
4193 static int nft_del_setelem(struct nft_ctx *ctx, struct nft_set *set,
4194 const struct nlattr *attr)
4196 struct nlattr *nla[NFTA_SET_ELEM_MAX + 1];
4197 struct nft_set_ext_tmpl tmpl;
4198 struct nft_data_desc desc;
4199 struct nft_set_elem elem;
4200 struct nft_set_ext *ext;
4201 struct nft_trans *trans;
4206 err = nla_parse_nested(nla, NFTA_SET_ELEM_MAX, attr,
4207 nft_set_elem_policy, NULL);
4212 if (nla[NFTA_SET_ELEM_KEY] == NULL)
4215 nft_set_ext_prepare(&tmpl);
4217 err = nft_setelem_parse_flags(set, nla[NFTA_SET_ELEM_FLAGS], &flags);
4221 nft_set_ext_add(&tmpl, NFT_SET_EXT_FLAGS);
4223 err = nft_data_init(ctx, &elem.key.val, sizeof(elem.key), &desc,
4224 nla[NFTA_SET_ELEM_KEY]);
/* The key has to be a plain value of exactly the set's key length. */
4229 if (desc.type != NFT_DATA_VALUE || desc.len != set->klen)
4232 nft_set_ext_add_length(&tmpl, NFT_SET_EXT_KEY, desc.len);
4235 elem.priv = nft_set_elem_init(set, &tmpl, elem.key.val.data, NULL, 0,
4237 if (elem.priv == NULL)
4240 ext = nft_set_elem_ext(set, elem.priv);
4242 *nft_set_ext_flags(ext) = flags;
4244 trans = nft_trans_elem_alloc(ctx, NFT_MSG_DELSETELEM, set);
4245 if (trans == NULL) {
4250 priv = set->ops->deactivate(ctx->net, set, &elem);
4258 nft_set_elem_deactivate(ctx->net, set, &elem);
4260 nft_trans_elem(trans) = elem;
4261 list_add_tail(&trans->list, &ctx->net->nft.commit_list);
4269 nft_data_release(&elem.key.val, desc.type);
/*
 * Set walk callback used by nf_tables_delsetelem() to flush a whole set.
 * For each element an NFT_MSG_DELSETELEM transaction is allocated with
 * GFP_ATOMIC and the backend's flush() callback is invoked; the transaction,
 * carrying the set and a copy of the element, is then appended to the commit
 * list. A false return from flush() takes a separate branch.
 */
4274 static int nft_flush_set(const struct nft_ctx *ctx,
4275 struct nft_set *set,
4276 const struct nft_set_iter *iter,
4277 struct nft_set_elem *elem)
4279 struct nft_trans *trans;
4282 trans = nft_trans_alloc_gfp(ctx, NFT_MSG_DELSETELEM,
4283 sizeof(struct nft_trans_elem), GFP_ATOMIC);
4287 if (!set->ops->flush(ctx->net, set, elem->priv)) {
4293 nft_trans_elem_set(trans) = set;
4294 nft_trans_elem(trans) = *elem;
4295 list_add_tail(&trans->list, &ctx->net->nft.commit_list);
/*
 * Netlink handler that removes elements from a set.
 *
 * The set is resolved by name in the next generation. A set that has
 * bindings and is flagged NFT_SET_CONSTANT is tested for first. Without
 * NFTA_SET_ELEM_LIST_ELEMENTS the set is walked with nft_flush_set() as the
 * callback; otherwise every nested attribute is passed to nft_del_setelem().
 */
4303 static int nf_tables_delsetelem(struct net *net, struct sock *nlsk,
4304 struct sk_buff *skb, const struct nlmsghdr *nlh,
4305 const struct nlattr * const nla[],
4306 struct netlink_ext_ack *extack)
4308 u8 genmask = nft_genmask_next(net);
4309 const struct nlattr *attr;
4310 struct nft_set *set;
4314 err = nft_ctx_init_from_elemattr(&ctx, net, skb, nlh, nla, extack,
4319 set = nft_set_lookup(ctx.table, nla[NFTA_SET_ELEM_LIST_SET], genmask);
4321 return PTR_ERR(set);
4322 if (!list_empty(&set->bindings) && set->flags & NFT_SET_CONSTANT)
/* No element list given: flush the entire set. */
4325 if (nla[NFTA_SET_ELEM_LIST_ELEMENTS] == NULL) {
4326 struct nft_set_iter iter = {
4328 .fn = nft_flush_set,
4330 set->ops->walk(&ctx, set, &iter);
4335 nla_for_each_nested(attr, nla[NFTA_SET_ELEM_LIST_ELEMENTS], rem) {
4336 err = nft_del_setelem(&ctx, set, attr);
/*
 * Given the rcu_head embedded in a GC batch, destroy every element collected
 * in that batch, including the elements' expressions (destroy_expr is true).
 */
4345 void nft_set_gc_batch_release(struct rcu_head *rcu)
4347 struct nft_set_gc_batch *gcb;
4350 gcb = container_of(rcu, struct nft_set_gc_batch, head.rcu);
4351 for (i = 0; i < gcb->head.cnt; i++)
4352 nft_set_elem_destroy(gcb->head.set, gcb->elems[i], true);
4355 EXPORT_SYMBOL_GPL(nft_set_gc_batch_release);
/*
 * Allocate a zeroed GC batch using the given gfp flags and associate it
 * with @set.
 */
4357 struct nft_set_gc_batch *nft_set_gc_batch_alloc(const struct nft_set *set,
4360 struct nft_set_gc_batch *gcb;
4362 gcb = kzalloc(sizeof(*gcb), gfp);
4365 gcb->head.set = set;
4368 EXPORT_SYMBOL_GPL(nft_set_gc_batch_alloc);
/**
4375 * nft_register_obj - register nf_tables stateful object type
 * @obj_type: object type
 *
4378 * Registers the object type for use with nf_tables. Returns zero on
4379 * success or a negative errno code otherwise.
 */
4381 int nft_register_obj(struct nft_object_type *obj_type)
/* NFT_OBJECT_UNSPEC is not a registrable type id. */
4383 if (obj_type->type == NFT_OBJECT_UNSPEC)
/* The type list is modified with the nftables subsystem lock held. */
4386 nfnl_lock(NFNL_SUBSYS_NFTABLES);
4387 list_add_rcu(&obj_type->list, &nf_tables_objects);
4388 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
4391 EXPORT_SYMBOL_GPL(nft_register_obj);
/**
4394 * nft_unregister_obj - unregister nf_tables object type
 * @obj_type: object type
 *
4397 * Unregisters the object type for use with nf_tables.
 */
4399 void nft_unregister_obj(struct nft_object_type *obj_type)
/* The type list is modified with the nftables subsystem lock held. */
4401 nfnl_lock(NFNL_SUBSYS_NFTABLES);
4402 list_del_rcu(&obj_type->list);
4403 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
4405 EXPORT_SYMBOL_GPL(nft_unregister_obj);
/*
 * Search @table for an object whose name matches the string in @nla, whose
 * type equals @objtype and which is active in the given generation mask.
 * ERR_PTR(-ENOENT) is returned when no object matches.
 */
4407 struct nft_object *nft_obj_lookup(const struct nft_table *table,
4408 const struct nlattr *nla, u32 objtype,
4411 struct nft_object *obj;
4413 list_for_each_entry(obj, &table->objects, list) {
4414 if (!nla_strcmp(nla, obj->name) &&
4415 objtype == obj->ops->type->type &&
4416 nft_active_genmask(obj, genmask))
4419 return ERR_PTR(-ENOENT);
4421 EXPORT_SYMBOL_GPL(nft_obj_lookup);
/*
 * Like nft_obj_lookup(), but matches on the object's handle instead of its
 * name. The handle is read from @nla as a big-endian 64-bit value.
 * ERR_PTR(-ENOENT) is returned when no object matches.
 */
4423 static struct nft_object *nft_obj_lookup_byhandle(const struct nft_table *table,
4424 const struct nlattr *nla,
4425 u32 objtype, u8 genmask)
4427 struct nft_object *obj;
4429 list_for_each_entry(obj, &table->objects, list) {
4430 if (be64_to_cpu(nla_get_be64(nla)) == obj->handle &&
4431 objtype == obj->ops->type->type &&
4432 nft_active_genmask(obj, genmask))
4435 return ERR_PTR(-ENOENT);
/*
 * Netlink attribute policy for stateful object messages (NFTA_OBJ_*):
 * length-limited table and object names, a 32-bit type, nested
 * type-specific data and a 64-bit handle.
 */
4438 static const struct nla_policy nft_obj_policy[NFTA_OBJ_MAX + 1] = {
4439 [NFTA_OBJ_TABLE] = { .type = NLA_STRING,
4440 .len = NFT_TABLE_MAXNAMELEN - 1 },
4441 [NFTA_OBJ_NAME] = { .type = NLA_STRING,
4442 .len = NFT_OBJ_MAXNAMELEN - 1 },
4443 [NFTA_OBJ_TYPE] = { .type = NLA_U32 },
4444 [NFTA_OBJ_DATA] = { .type = NLA_NESTED },
4445 [NFTA_OBJ_HANDLE] = { .type = NLA_U64},
/*
 * Instantiate an object of @type from the nested attribute @attr.
 *
 * A temporary attribute table with type->maxattr + 1 entries is allocated;
 * it is either filled by nla_parse_nested() using the type's policy or
 * cleared with memset(). The ops are obtained through type->select_ops()
 * when the type provides it. The object is allocated zeroed with ops->size
 * extra bytes and initialised by ops->init(). The visible error exit
 * returns the error as ERR_PTR().
 */
4448 static struct nft_object *nft_obj_init(const struct nft_ctx *ctx,
4449 const struct nft_object_type *type,
4450 const struct nlattr *attr)
4453 const struct nft_object_ops *ops;
4454 struct nft_object *obj;
4457 tb = kmalloc_array(type->maxattr + 1, sizeof(*tb), GFP_KERNEL);
4462 err = nla_parse_nested(tb, type->maxattr, attr, type->policy,
4467 memset(tb, 0, sizeof(tb[0]) * (type->maxattr + 1));
4470 if (type->select_ops) {
4471 ops = type->select_ops(ctx, (const struct nlattr * const *)tb);
4481 obj = kzalloc(sizeof(*obj) + ops->size, GFP_KERNEL);
4485 err = ops->init(ctx, (const struct nlattr * const *)tb, obj);
4498 return ERR_PTR(err);
/*
 * Emit the type-specific state of @obj as a nested attribute @attr.
 *
 * Opens a nest in @skb, lets obj->ops->dump() fill it (passing @reset
 * through) and closes the nest. A negative result from ->dump() jumps to
 * the nla_put_failure label, whose body is not visible in this excerpt.
 */
4501 static int nft_object_dump(struct sk_buff *skb, unsigned int attr,
4502 struct nft_object *obj, bool reset)
4504 struct nlattr *nest;
4506 nest = nla_nest_start(skb, attr);
4508 goto nla_put_failure;
4509 if (obj->ops->dump(skb, obj, reset) < 0)
4510 goto nla_put_failure;
4511 nla_nest_end(skb, nest);
/*
 * Search the nf_tables_objects list for a registered object type whose
 * ->type equals @objtype. Does not take a module reference.
 */
4518 static const struct nft_object_type *__nft_obj_type_get(u32 objtype)
4520 const struct nft_object_type *type;
4522 list_for_each_entry(type, &nf_tables_objects, list) {
4523 if (objtype == type->type)
/*
 * Resolve @objtype to a registered object type and pin its owning module
 * with try_module_get().
 *
 * With CONFIG_MODULES, when the type is not available the subsystem lock
 * is dropped around request_module("nft-obj-%u"), then re-taken; if the
 * type is registered afterwards, ERR_PTR(-EAGAIN) is returned.
 * NOTE(review): presumably -EAGAIN makes the caller replay the request
 * because the lock was released - confirm against the nfnetlink core.
 *
 * Otherwise ERR_PTR(-ENOENT) is returned.
 */
4529 static const struct nft_object_type *nft_obj_type_get(u32 objtype)
4531 const struct nft_object_type *type;
4533 type = __nft_obj_type_get(objtype);
4534 if (type != NULL && try_module_get(type->owner))
4537 #ifdef CONFIG_MODULES
4539 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
4540 request_module("nft-obj-%u", objtype);
4541 nfnl_lock(NFNL_SUBSYS_NFTABLES);
4542 if (__nft_obj_type_get(objtype))
4543 return ERR_PTR(-EAGAIN);
4546 return ERR_PTR(-ENOENT);
/*
 * NFT_MSG_NEWOBJ handler: create a stateful object in a table.
 *
 * Requires NFTA_OBJ_TYPE, NFTA_OBJ_NAME and NFTA_OBJ_DATA. The table is
 * looked up in the next generation (nft_genmask_next()). An existing
 * object with the same name and type is looked up first; lookup errors
 * other than -ENOENT and the NLM_F_EXCL case flag NFTA_OBJ_NAME as the
 * offending attribute via extack.
 *
 * For a new object: the type is resolved (taking a module reference),
 * the object is initialised from NFTA_OBJ_DATA, given a handle and a
 * duplicated name, recorded in a NFT_MSG_NEWOBJ transaction and appended
 * to table->objects.
 *
 * The visible unwind path calls ops->destroy() if set and drops the
 * module reference.
 */
4549 static int nf_tables_newobj(struct net *net, struct sock *nlsk,
4550 struct sk_buff *skb, const struct nlmsghdr *nlh,
4551 const struct nlattr * const nla[],
4552 struct netlink_ext_ack *extack)
4554 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
4555 const struct nft_object_type *type;
4556 u8 genmask = nft_genmask_next(net);
4557 int family = nfmsg->nfgen_family;
4558 struct nft_table *table;
4559 struct nft_object *obj;
4564 if (!nla[NFTA_OBJ_TYPE] ||
4565 !nla[NFTA_OBJ_NAME] ||
4566 !nla[NFTA_OBJ_DATA])
4569 table = nft_table_lookup(net, nla[NFTA_OBJ_TABLE], family, genmask);
4570 if (IS_ERR(table)) {
4571 NL_SET_BAD_ATTR(extack, nla[NFTA_OBJ_TABLE]);
4572 return PTR_ERR(table);
/* The object type arrives in network byte order. */
4575 objtype = ntohl(nla_get_be32(nla[NFTA_OBJ_TYPE]));
4576 obj = nft_obj_lookup(table, nla[NFTA_OBJ_NAME], objtype, genmask);
4579 if (err != -ENOENT) {
4580 NL_SET_BAD_ATTR(extack, nla[NFTA_OBJ_NAME]);
4584 if (nlh->nlmsg_flags & NLM_F_EXCL) {
4585 NL_SET_BAD_ATTR(extack, nla[NFTA_OBJ_NAME]);
4591 nft_ctx_init(&ctx, net, skb, nlh, family, table, NULL, nla);
4593 type = nft_obj_type_get(objtype);
4595 return PTR_ERR(type);
4597 obj = nft_obj_init(&ctx, type, nla[NFTA_OBJ_DATA]);
4603 obj->handle = nf_tables_alloc_handle(table);
4605 obj->name = nla_strdup(nla[NFTA_OBJ_NAME], GFP_KERNEL);
4611 err = nft_trans_obj_add(&ctx, NFT_MSG_NEWOBJ, obj);
4615 list_add_tail_rcu(&obj->list, &table->objects);
/* Error unwinding: undo ops->init() and release the type's module. */
4621 if (obj->ops->destroy)
4622 obj->ops->destroy(obj);
4625 module_put(type->owner);
/*
 * Build one netlink message describing @obj into @skb.
 *
 * The header carries the nfnetlink message type derived from @event, the
 * address @family, NFNETLINK_V0 and the low 16 bits of net->nft.base_seq
 * as res_id. The payload holds table name, object name, type, use
 * counter, the nested type-specific dump (NFTA_OBJ_DATA, honouring
 * @reset) and the 64-bit handle.
 *
 * Any failing put jumps to nla_put_failure, where the partially built
 * message is trimmed off @skb.
 */
4629 static int nf_tables_fill_obj_info(struct sk_buff *skb, struct net *net,
4630 u32 portid, u32 seq, int event, u32 flags,
4631 int family, const struct nft_table *table,
4632 struct nft_object *obj, bool reset)
4634 struct nfgenmsg *nfmsg;
4635 struct nlmsghdr *nlh;
4637 event = nfnl_msg_type(NFNL_SUBSYS_NFTABLES, event);
4638 nlh = nlmsg_put(skb, portid, seq, event, sizeof(struct nfgenmsg), flags);
4640 goto nla_put_failure;
4642 nfmsg = nlmsg_data(nlh);
4643 nfmsg->nfgen_family = family;
4644 nfmsg->version = NFNETLINK_V0;
4645 nfmsg->res_id = htons(net->nft.base_seq & 0xffff);
4647 if (nla_put_string(skb, NFTA_OBJ_TABLE, table->name) ||
4648 nla_put_string(skb, NFTA_OBJ_NAME, obj->name) ||
4649 nla_put_be32(skb, NFTA_OBJ_TYPE, htonl(obj->ops->type->type)) ||
4650 nla_put_be32(skb, NFTA_OBJ_USE, htonl(obj->use)) ||
4651 nft_object_dump(skb, NFTA_OBJ_DATA, obj, reset) ||
4652 nla_put_be64(skb, NFTA_OBJ_HANDLE, cpu_to_be64(obj->handle),
4654 goto nla_put_failure;
4656 nlmsg_end(skb, nlh);
4660 nlmsg_trim(skb, nlh);
/*
 * Optional filter attached to an object dump through cb->data. Other code
 * in this file reads ->table (a table name allocated with nla_strdup())
 * and ->type (an object type, NFT_OBJECT_UNSPEC meaning "any").
 */
4664 struct nft_obj_filter {
4669 static int nf_tables_dump_obj(struct sk_buff *skb, struct netlink_callback *cb)
4671 const struct nfgenmsg *nfmsg = nlmsg_data(cb->nlh);
4672 const struct nft_table *table;
4673 unsigned int idx = 0, s_idx = cb->args[0];
4674 struct nft_obj_filter *filter = cb->data;
4675 struct net *net = sock_net(skb->sk);
4676 int family = nfmsg->nfgen_family;
4677 struct nft_object *obj;
4680 if (NFNL_MSG_TYPE(cb->nlh->nlmsg_type) == NFT_MSG_GETOBJ_RESET)
4684 cb->seq = net->nft.base_seq;
4686 list_for_each_entry_rcu(table, &net->nft.tables, list) {
4687 if (family != NFPROTO_UNSPEC && family != table->family)
4690 list_for_each_entry_rcu(obj, &table->objects, list) {
4691 if (!nft_is_active(net, obj))
4696 memset(&cb->args[1], 0,
4697 sizeof(cb->args) - sizeof(cb->args[0]));
4698 if (filter && filter->table[0] &&
4699 strcmp(filter->table, table->name))
4702 filter->type != NFT_OBJECT_UNSPEC &&
4703 obj->ops->type->type != filter->type)
4706 if (nf_tables_fill_obj_info(skb, net, NETLINK_CB(cb->skb).portid,
4709 NLM_F_MULTI | NLM_F_APPEND,
4710 table->family, table,
4714 nl_dump_check_consistent(cb, nlmsg_hdr(skb));
/*
 * Dump completion callback: releases the filter stored in cb->data.
 * The visible line frees the duplicated table name.
 */
4726 static int nf_tables_dump_obj_done(struct netlink_callback *cb)
4728 struct nft_obj_filter *filter = cb->data;
4731 kfree(filter->table);
/*
 * Allocate a zeroed dump filter from the request attributes.
 *
 * ->table is only set (duplicated with nla_strdup()) when NFTA_OBJ_TABLE
 * is present, so it stays NULL otherwise. ->type is only set when
 * NFTA_OBJ_TYPE is present, converted from network byte order.
 *
 * Returns ERR_PTR(-ENOMEM) when an allocation fails.
 */
4738 static struct nft_obj_filter *
4739 nft_obj_filter_alloc(const struct nlattr * const nla[])
4741 struct nft_obj_filter *filter;
4743 filter = kzalloc(sizeof(*filter), GFP_KERNEL);
4745 return ERR_PTR(-ENOMEM);
4747 if (nla[NFTA_OBJ_TABLE]) {
4748 filter->table = nla_strdup(nla[NFTA_OBJ_TABLE], GFP_KERNEL);
4749 if (!filter->table) {
4751 return ERR_PTR(-ENOMEM);
4754 if (nla[NFTA_OBJ_TYPE])
4755 filter->type = ntohl(nla_get_be32(nla[NFTA_OBJ_TYPE]));
/*
 * NFT_MSG_GETOBJ / NFT_MSG_GETOBJ_RESET handler.
 *
 * With NLM_F_DUMP a netlink dump is started using nf_tables_dump_obj()
 * and nf_tables_dump_obj_done(); a filter is allocated when the request
 * carries NFTA_OBJ_TABLE or NFTA_OBJ_TYPE.
 *
 * Otherwise a single object is fetched: NFTA_OBJ_NAME and NFTA_OBJ_TYPE
 * are required, table and object are looked up in the current generation
 * (nft_genmask_cur()), and the reply is built in a freshly allocated skb
 * and unicast back to the requesting port.
 */
4760 static int nf_tables_getobj(struct net *net, struct sock *nlsk,
4761 struct sk_buff *skb, const struct nlmsghdr *nlh,
4762 const struct nlattr * const nla[],
4763 struct netlink_ext_ack *extack)
4765 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
4766 u8 genmask = nft_genmask_cur(net);
4767 int family = nfmsg->nfgen_family;
4768 const struct nft_table *table;
4769 struct nft_object *obj;
4770 struct sk_buff *skb2;
4775 if (nlh->nlmsg_flags & NLM_F_DUMP) {
4776 struct netlink_dump_control c = {
4777 .dump = nf_tables_dump_obj,
4778 .done = nf_tables_dump_obj_done,
/* A filter is built when either a table or a type restriction is given. */
4781 if (nla[NFTA_OBJ_TABLE] ||
4782 nla[NFTA_OBJ_TYPE]) {
4783 struct nft_obj_filter *filter;
4785 filter = nft_obj_filter_alloc(nla);
4791 return netlink_dump_start(nlsk, skb, nlh, &c);
4794 if (!nla[NFTA_OBJ_NAME] ||
4795 !nla[NFTA_OBJ_TYPE])
4798 table = nft_table_lookup(net, nla[NFTA_OBJ_TABLE], family, genmask);
4799 if (IS_ERR(table)) {
4800 NL_SET_BAD_ATTR(extack, nla[NFTA_OBJ_TABLE]);
4801 return PTR_ERR(table);
4804 objtype = ntohl(nla_get_be32(nla[NFTA_OBJ_TYPE]));
4805 obj = nft_obj_lookup(table, nla[NFTA_OBJ_NAME], objtype, genmask);
4807 NL_SET_BAD_ATTR(extack, nla[NFTA_OBJ_NAME]);
4808 return PTR_ERR(obj);
4811 skb2 = alloc_skb(NLMSG_GOODSIZE, GFP_KERNEL);
4815 if (NFNL_MSG_TYPE(nlh->nlmsg_type) == NFT_MSG_GETOBJ_RESET)
/* The reply is always reported as NFT_MSG_NEWOBJ. */
4818 err = nf_tables_fill_obj_info(skb2, net, NETLINK_CB(skb).portid,
4819 nlh->nlmsg_seq, NFT_MSG_NEWOBJ, 0,
4820 family, table, obj, reset);
4824 return nlmsg_unicast(nlsk, skb2, NETLINK_CB(skb).portid);
/*
 * Tear down a stateful object: run the type's optional ->destroy() hook
 * and drop the reference on the module owning the object type.
 */
4830 static void nft_obj_destroy(struct nft_object *obj)
4832 if (obj->ops->destroy)
4833 obj->ops->destroy(obj);
4835 module_put(obj->ops->type->owner);
/*
 * NFT_MSG_DELOBJ handler: queue removal of a stateful object.
 *
 * Requires NFTA_OBJ_TYPE plus either NFTA_OBJ_NAME or NFTA_OBJ_HANDLE.
 * The table is looked up in the next generation. The object is located
 * by handle when NFTA_OBJ_HANDLE is present, otherwise by name; the
 * attribute used for the lookup is reported through extack on failure.
 *
 * The actual removal is delegated to nft_delobj().
 */
4840 static int nf_tables_delobj(struct net *net, struct sock *nlsk,
4841 struct sk_buff *skb, const struct nlmsghdr *nlh,
4842 const struct nlattr * const nla[],
4843 struct netlink_ext_ack *extack)
4845 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
4846 u8 genmask = nft_genmask_next(net);
4847 int family = nfmsg->nfgen_family;
4848 const struct nlattr *attr;
4849 struct nft_table *table;
4850 struct nft_object *obj;
4854 if (!nla[NFTA_OBJ_TYPE] ||
4855 (!nla[NFTA_OBJ_NAME] && !nla[NFTA_OBJ_HANDLE]))
4858 table = nft_table_lookup(net, nla[NFTA_OBJ_TABLE], family, genmask);
4859 if (IS_ERR(table)) {
4860 NL_SET_BAD_ATTR(extack, nla[NFTA_OBJ_TABLE]);
4861 return PTR_ERR(table);
4864 objtype = ntohl(nla_get_be32(nla[NFTA_OBJ_TYPE]));
/* The handle takes precedence over the name when both are supplied. */
4865 if (nla[NFTA_OBJ_HANDLE]) {
4866 attr = nla[NFTA_OBJ_HANDLE];
4867 obj = nft_obj_lookup_byhandle(table, attr, objtype, genmask);
4869 attr = nla[NFTA_OBJ_NAME];
4870 obj = nft_obj_lookup(table, attr, objtype, genmask);
4874 NL_SET_BAD_ATTR(extack, attr);
4875 return PTR_ERR(obj);
4878 NL_SET_BAD_ATTR(extack, attr);
4882 nft_ctx_init(&ctx, net, skb, nlh, family, table, NULL, nla);
4884 return nft_delobj(&ctx, obj);
/*
 * Send an object event to NFNLGRP_NFTABLES listeners.
 *
 * A message describing @obj is built in a new skb allocated with @gfp
 * and sent through nfnetlink_send(). The first half of the early-exit
 * condition is not visible in this excerpt; the visible half tests that
 * the group has no listeners. On the visible failure path -ENOBUFS is
 * signalled to listeners via nfnetlink_set_err().
 */
4887 void nft_obj_notify(struct net *net, struct nft_table *table,
4888 struct nft_object *obj, u32 portid, u32 seq, int event,
4889 int family, int report, gfp_t gfp)
4891 struct sk_buff *skb;
4895 !nfnetlink_has_listeners(net, NFNLGRP_NFTABLES))
4898 skb = nlmsg_new(NLMSG_GOODSIZE, gfp);
4902 err = nf_tables_fill_obj_info(skb, net, portid, seq, event, 0, family,
4909 nfnetlink_send(skb, net, portid, NFNLGRP_NFTABLES, report, gfp);
4912 nfnetlink_set_err(net, portid, NFNLGRP_NFTABLES, -ENOBUFS);
4914 EXPORT_SYMBOL_GPL(nft_obj_notify);
/*
 * Convenience wrapper around nft_obj_notify() that takes net, table,
 * portid, seq, family and report from the transaction context @ctx and
 * allocates with GFP_KERNEL.
 */
4916 static void nf_tables_obj_notify(const struct nft_ctx *ctx,
4917 struct nft_object *obj, int event)
4919 nft_obj_notify(ctx->net, ctx->table, obj, ctx->portid, ctx->seq, event,
4920 ctx->family, ctx->report, GFP_KERNEL);
/*
 * Register a flowtable type: append it to the nf_tables_flowtables list
 * while holding the nf_tables nfnetlink subsystem lock.
 */
4926 void nft_register_flowtable_type(struct nf_flowtable_type *type)
4928 nfnl_lock(NFNL_SUBSYS_NFTABLES);
4929 list_add_tail_rcu(&type->list, &nf_tables_flowtables);
4930 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
4932 EXPORT_SYMBOL_GPL(nft_register_flowtable_type);
/*
 * Unregister a flowtable type: unlink it from its list while holding the
 * nf_tables nfnetlink subsystem lock.
 */
4934 void nft_unregister_flowtable_type(struct nf_flowtable_type *type)
4936 nfnl_lock(NFNL_SUBSYS_NFTABLES);
4937 list_del_rcu(&type->list);
4938 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
4940 EXPORT_SYMBOL_GPL(nft_unregister_flowtable_type);
/*
 * Netlink attribute validation policy for NFTA_FLOWTABLE_* attributes:
 * length-limited table and flowtable names, a nested hook description
 * and a u64 handle.
 */
4942 static const struct nla_policy nft_flowtable_policy[NFTA_FLOWTABLE_MAX + 1] = {
4943 [NFTA_FLOWTABLE_TABLE] = { .type = NLA_STRING,
4944 .len = NFT_NAME_MAXLEN - 1 },
4945 [NFTA_FLOWTABLE_NAME] = { .type = NLA_STRING,
4946 .len = NFT_NAME_MAXLEN - 1 },
4947 [NFTA_FLOWTABLE_HOOK] = { .type = NLA_NESTED },
4948 [NFTA_FLOWTABLE_HANDLE] = { .type = NLA_U64 },
/*
 * Look up a flowtable in @table by the name carried in @nla.
 *
 * The entry must match the name (nla_strcmp() == 0) and be active in
 * @genmask. Falls through to ERR_PTR(-ENOENT) when nothing matches.
 */
4951 struct nft_flowtable *nft_flowtable_lookup(const struct nft_table *table,
4952 const struct nlattr *nla, u8 genmask)
4954 struct nft_flowtable *flowtable;
4956 list_for_each_entry(flowtable, &table->flowtables, list) {
4957 if (!nla_strcmp(nla, flowtable->name) &&
4958 nft_active_genmask(flowtable, genmask))
4961 return ERR_PTR(-ENOENT);
4963 EXPORT_SYMBOL_GPL(nft_flowtable_lookup);
/*
 * Look up a flowtable in @table by its 64-bit handle.
 *
 * @nla carries the handle in big-endian byte order. The entry must also
 * be active in @genmask. Falls through to ERR_PTR(-ENOENT) when nothing
 * matches.
 */
4965 static struct nft_flowtable *
4966 nft_flowtable_lookup_byhandle(const struct nft_table *table,
4967 const struct nlattr *nla, u8 genmask)
4969 struct nft_flowtable *flowtable;
4971 list_for_each_entry(flowtable, &table->flowtables, list) {
4972 if (be64_to_cpu(nla_get_be64(nla)) == flowtable->handle &&
4973 nft_active_genmask(flowtable, genmask))
4976 return ERR_PTR(-ENOENT);
/*
 * Resolve a nested list of NFTA_DEVICE_NAME attributes to net_device
 * pointers.
 *
 * Each nested attribute is checked to be of type NFTA_DEVICE_NAME, its
 * payload is copied into a local IFNAMSIZ buffer and resolved in
 * ctx->net with __dev_get_by_name(). Resolved devices are stored in
 * @dev_array; the count is compared against NFT_FLOWTABLE_DEVICE_MAX
 * after each store.
 *
 * NOTE(review): __dev_get_by_name() does not take a device reference -
 * presumably callers hold a lock that keeps the devices alive; confirm.
 */
4979 static int nf_tables_parse_devices(const struct nft_ctx *ctx,
4980 const struct nlattr *attr,
4981 struct net_device *dev_array[], int *len)
4983 const struct nlattr *tmp;
4984 struct net_device *dev;
4985 char ifname[IFNAMSIZ];
4986 int rem, n = 0, err;
4988 nla_for_each_nested(tmp, attr, rem) {
4989 if (nla_type(tmp) != NFTA_DEVICE_NAME) {
4994 nla_strlcpy(ifname, tmp, IFNAMSIZ);
4995 dev = __dev_get_by_name(ctx->net, ifname);
5001 dev_array[n++] = dev;
5002 if (n == NFT_FLOWTABLE_DEVICE_MAX) {
/*
 * Netlink attribute validation policy for the nested flowtable hook
 * description: u32 hook number, u32 priority and a nested device list.
 */
5016 static const struct nla_policy nft_flowtable_hook_policy[NFTA_FLOWTABLE_HOOK_MAX + 1] = {
5017 [NFTA_FLOWTABLE_HOOK_NUM] = { .type = NLA_U32 },
5018 [NFTA_FLOWTABLE_HOOK_PRIORITY] = { .type = NLA_U32 },
5019 [NFTA_FLOWTABLE_HOOK_DEVS] = { .type = NLA_NESTED },
/*
 * Parse the nested NFTA_FLOWTABLE_HOOK attribute and set up the hook
 * operations of @flowtable.
 *
 * Hook number, priority and device list are all mandatory; the hook
 * number is compared against NF_NETDEV_INGRESS. One nf_hook_ops entry is
 * allocated per parsed device and filled with the netdev family, hook
 * number, priority, the flowtable data as private pointer, the type's
 * hook function and the device. The device name is duplicated into
 * flowtable->dev_name[i].
 *
 * NOTE(review): no check of the kstrdup() result is visible here, while
 * other code dereferences dev_name[i][0] - confirm allocation failure is
 * handled.
 */
5022 static int nf_tables_flowtable_parse_hook(const struct nft_ctx *ctx,
5023 const struct nlattr *attr,
5024 struct nft_flowtable *flowtable)
5026 struct net_device *dev_array[NFT_FLOWTABLE_DEVICE_MAX];
5027 struct nlattr *tb[NFTA_FLOWTABLE_HOOK_MAX + 1];
5028 struct nf_hook_ops *ops;
5029 int hooknum, priority;
5032 err = nla_parse_nested(tb, NFTA_FLOWTABLE_HOOK_MAX, attr,
5033 nft_flowtable_hook_policy, NULL);
5037 if (!tb[NFTA_FLOWTABLE_HOOK_NUM] ||
5038 !tb[NFTA_FLOWTABLE_HOOK_PRIORITY] ||
5039 !tb[NFTA_FLOWTABLE_HOOK_DEVS])
5042 hooknum = ntohl(nla_get_be32(tb[NFTA_FLOWTABLE_HOOK_NUM]));
5043 if (hooknum != NF_NETDEV_INGRESS)
5046 priority = ntohl(nla_get_be32(tb[NFTA_FLOWTABLE_HOOK_PRIORITY]));
5048 err = nf_tables_parse_devices(ctx, tb[NFTA_FLOWTABLE_HOOK_DEVS],
/* One zeroed nf_hook_ops per device returned by the parser. */
5053 ops = kzalloc(sizeof(struct nf_hook_ops) * n, GFP_KERNEL);
5057 flowtable->hooknum = hooknum;
5058 flowtable->priority = priority;
5059 flowtable->ops = ops;
5060 flowtable->ops_len = n;
5062 for (i = 0; i < n; i++) {
5063 flowtable->ops[i].pf = NFPROTO_NETDEV;
5064 flowtable->ops[i].hooknum = hooknum;
5065 flowtable->ops[i].priority = priority;
5066 flowtable->ops[i].priv = &flowtable->data;
5067 flowtable->ops[i].hook = flowtable->data.type->hook;
5068 flowtable->ops[i].dev = dev_array[i];
5069 flowtable->dev_name[i] = kstrdup(dev_array[i]->name,
/*
 * Search the nf_tables_flowtables list for a registered flowtable type
 * whose ->family equals @family. Does not take a module reference.
 */
5076 static const struct nf_flowtable_type *__nft_flowtable_type_get(u8 family)
5078 const struct nf_flowtable_type *type;
5080 list_for_each_entry(type, &nf_tables_flowtables, list) {
5081 if (family == type->family)
/*
 * Resolve @family to a registered flowtable type and pin its owning
 * module with try_module_get().
 *
 * With CONFIG_MODULES, when the type is not available the subsystem lock
 * is dropped around request_module("nf-flowtable-%u"), then re-taken; if
 * the type is registered afterwards, ERR_PTR(-EAGAIN) is returned.
 * Otherwise ERR_PTR(-ENOENT) is returned.
 */
5087 static const struct nf_flowtable_type *nft_flowtable_type_get(u8 family)
5089 const struct nf_flowtable_type *type;
5091 type = __nft_flowtable_type_get(family);
5092 if (type != NULL && try_module_get(type->owner))
5095 #ifdef CONFIG_MODULES
5097 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
5098 request_module("nf-flowtable-%u", family);
5099 nfnl_lock(NFNL_SUBSYS_NFTABLES);
5100 if (__nft_flowtable_type_get(family))
5101 return ERR_PTR(-EAGAIN);
5104 return ERR_PTR(-ENOENT);
/*
 * Unregister the netfilter hooks of @flowtable in @net.
 *
 * Entries whose ->dev is NULL are tested for separately before the
 * unregister call; nft_flowtable_event() clears ->dev after it has
 * unregistered the hook of a departing device.
 */
5107 static void nft_unregister_flowtable_net_hooks(struct net *net,
5108 struct nft_flowtable *flowtable)
5112 for (i = 0; i < flowtable->ops_len; i++) {
5113 if (!flowtable->ops[i].dev)
5116 nf_unregister_net_hook(net, &flowtable->ops[i]);
/*
 * NFT_MSG_NEWFLOWTABLE handler: create a flowtable in a table.
 *
 * Requires NFTA_FLOWTABLE_TABLE, NFTA_FLOWTABLE_NAME and
 * NFTA_FLOWTABLE_HOOK. The table is looked up in the next generation and
 * an existing flowtable of the same name is looked up first; lookup
 * errors other than -ENOENT and the NLM_F_EXCL case flag the name
 * attribute through extack.
 *
 * For a new flowtable: the structure is allocated, given a handle and a
 * duplicated name, the per-family flowtable type is resolved and
 * initialised, and the hook description is parsed. Each device hook is
 * then compared against the hooks of the flowtables already in the table
 * (same device and same protocol family) before it is registered.
 * Finally the flowtable is recorded in a NFT_MSG_NEWFLOWTABLE transaction
 * and appended to table->flowtables.
 *
 * The visible unwind path frees the duplicated device names, unregisters
 * hooks, frees the ops array, calls the type's ->free(), drops the module
 * reference and frees the name.
 */
5120 static int nf_tables_newflowtable(struct net *net, struct sock *nlsk,
5121 struct sk_buff *skb,
5122 const struct nlmsghdr *nlh,
5123 const struct nlattr * const nla[],
5124 struct netlink_ext_ack *extack)
5126 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
5127 const struct nf_flowtable_type *type;
5128 struct nft_flowtable *flowtable, *ft;
5129 u8 genmask = nft_genmask_next(net);
5130 int family = nfmsg->nfgen_family;
5131 struct nft_table *table;
5135 if (!nla[NFTA_FLOWTABLE_TABLE] ||
5136 !nla[NFTA_FLOWTABLE_NAME] ||
5137 !nla[NFTA_FLOWTABLE_HOOK])
5140 table = nft_table_lookup(net, nla[NFTA_FLOWTABLE_TABLE], family,
5142 if (IS_ERR(table)) {
5143 NL_SET_BAD_ATTR(extack, nla[NFTA_FLOWTABLE_TABLE]);
5144 return PTR_ERR(table);
5147 flowtable = nft_flowtable_lookup(table, nla[NFTA_FLOWTABLE_NAME],
5149 if (IS_ERR(flowtable)) {
5150 err = PTR_ERR(flowtable);
5151 if (err != -ENOENT) {
5152 NL_SET_BAD_ATTR(extack, nla[NFTA_FLOWTABLE_NAME]);
5156 if (nlh->nlmsg_flags & NLM_F_EXCL) {
5157 NL_SET_BAD_ATTR(extack, nla[NFTA_FLOWTABLE_NAME]);
5164 nft_ctx_init(&ctx, net, skb, nlh, family, table, NULL, nla);
5166 flowtable = kzalloc(sizeof(*flowtable), GFP_KERNEL);
5170 flowtable->table = table;
5171 flowtable->handle = nf_tables_alloc_handle(table);
5173 flowtable->name = nla_strdup(nla[NFTA_FLOWTABLE_NAME], GFP_KERNEL);
5174 if (!flowtable->name) {
5179 type = nft_flowtable_type_get(family);
5181 err = PTR_ERR(type);
5185 flowtable->data.type = type;
5186 err = type->init(&flowtable->data);
5190 err = nf_tables_flowtable_parse_hook(&ctx, nla[NFTA_FLOWTABLE_HOOK],
/* Compare each new hook with existing flowtable hooks, then register it. */
5195 for (i = 0; i < flowtable->ops_len; i++) {
5196 if (!flowtable->ops[i].dev)
5199 list_for_each_entry(ft, &table->flowtables, list) {
5200 for (k = 0; k < ft->ops_len; k++) {
5201 if (!ft->ops[k].dev)
5204 if (flowtable->ops[i].dev == ft->ops[k].dev &&
5205 flowtable->ops[i].pf == ft->ops[k].pf) {
5212 err = nf_register_net_hook(net, &flowtable->ops[i]);
5217 err = nft_trans_flowtable_add(&ctx, NFT_MSG_NEWFLOWTABLE, flowtable);
5221 list_add_tail_rcu(&flowtable->list, &table->flowtables);
/* Unwind: the loop below walks from index i - 1 down to 0. */
5226 i = flowtable->ops_len;
5228 for (k = i - 1; k >= 0; k--) {
5229 kfree(flowtable->dev_name[k]);
5230 nf_unregister_net_hook(net, &flowtable->ops[k]);
5233 kfree(flowtable->ops);
5235 flowtable->data.type->free(&flowtable->data);
5237 module_put(type->owner);
5239 kfree(flowtable->name);
/*
 * NFT_MSG_DELFLOWTABLE handler: queue removal of a flowtable.
 *
 * Requires NFTA_FLOWTABLE_TABLE plus either NFTA_FLOWTABLE_NAME or
 * NFTA_FLOWTABLE_HANDLE. The flowtable is located by handle when one is
 * supplied, otherwise by name. A flowtable whose use counter is above
 * zero is rejected with the lookup attribute flagged through extack.
 *
 * The actual removal is delegated to nft_delflowtable().
 */
5245 static int nf_tables_delflowtable(struct net *net, struct sock *nlsk,
5246 struct sk_buff *skb,
5247 const struct nlmsghdr *nlh,
5248 const struct nlattr * const nla[],
5249 struct netlink_ext_ack *extack)
5251 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
5252 u8 genmask = nft_genmask_next(net);
5253 int family = nfmsg->nfgen_family;
5254 struct nft_flowtable *flowtable;
5255 const struct nlattr *attr;
5256 struct nft_table *table;
5259 if (!nla[NFTA_FLOWTABLE_TABLE] ||
5260 (!nla[NFTA_FLOWTABLE_NAME] &&
5261 !nla[NFTA_FLOWTABLE_HANDLE]))
5264 table = nft_table_lookup(net, nla[NFTA_FLOWTABLE_TABLE], family,
5266 if (IS_ERR(table)) {
5267 NL_SET_BAD_ATTR(extack, nla[NFTA_FLOWTABLE_TABLE]);
5268 return PTR_ERR(table);
/* The handle takes precedence over the name when both are supplied. */
5271 if (nla[NFTA_FLOWTABLE_HANDLE]) {
5272 attr = nla[NFTA_FLOWTABLE_HANDLE];
5273 flowtable = nft_flowtable_lookup_byhandle(table, attr, genmask);
5275 attr = nla[NFTA_FLOWTABLE_NAME];
5276 flowtable = nft_flowtable_lookup(table, attr, genmask);
5279 if (IS_ERR(flowtable)) {
5280 NL_SET_BAD_ATTR(extack, attr);
5281 return PTR_ERR(flowtable);
5283 if (flowtable->use > 0) {
5284 NL_SET_BAD_ATTR(extack, attr);
5288 nft_ctx_init(&ctx, net, skb, nlh, family, table, NULL, nla);
5290 return nft_delflowtable(&ctx, flowtable);
5293 static int nf_tables_fill_flowtable_info(struct sk_buff *skb, struct net *net,
5294 u32 portid, u32 seq, int event,
5295 u32 flags, int family,
5296 struct nft_flowtable *flowtable)
5298 struct nlattr *nest, *nest_devs;
5299 struct nfgenmsg *nfmsg;
5300 struct nlmsghdr *nlh;
5303 event = nfnl_msg_type(NFNL_SUBSYS_NFTABLES, event);
5304 nlh = nlmsg_put(skb, portid, seq, event, sizeof(struct nfgenmsg), flags);
5306 goto nla_put_failure;
5308 nfmsg = nlmsg_data(nlh);
5309 nfmsg->nfgen_family = family;
5310 nfmsg->version = NFNETLINK_V0;
5311 nfmsg->res_id = htons(net->nft.base_seq & 0xffff);
5313 if (nla_put_string(skb, NFTA_FLOWTABLE_TABLE, flowtable->table->name) ||
5314 nla_put_string(skb, NFTA_FLOWTABLE_NAME, flowtable->name) ||
5315 nla_put_be32(skb, NFTA_FLOWTABLE_USE, htonl(flowtable->use)) ||
5316 nla_put_be64(skb, NFTA_FLOWTABLE_HANDLE, cpu_to_be64(flowtable->handle),
5317 NFTA_FLOWTABLE_PAD))
5318 goto nla_put_failure;
5320 nest = nla_nest_start(skb, NFTA_FLOWTABLE_HOOK);
5321 if (nla_put_be32(skb, NFTA_FLOWTABLE_HOOK_NUM, htonl(flowtable->hooknum)) ||
5322 nla_put_be32(skb, NFTA_FLOWTABLE_HOOK_PRIORITY, htonl(flowtable->priority)))
5323 goto nla_put_failure;
5325 nest_devs = nla_nest_start(skb, NFTA_FLOWTABLE_HOOK_DEVS);
5327 goto nla_put_failure;
5329 for (i = 0; i < flowtable->ops_len; i++) {
5330 if (flowtable->dev_name[i][0] &&
5331 nla_put_string(skb, NFTA_DEVICE_NAME,
5332 flowtable->dev_name[i]))
5333 goto nla_put_failure;
5335 nla_nest_end(skb, nest_devs);
5336 nla_nest_end(skb, nest);
5338 nlmsg_end(skb, nlh);
5342 nlmsg_trim(skb, nlh);
/*
 * Optional filter attached to a flowtable dump through cb->data. Other
 * code in this file reads ->table, a table name allocated with
 * nla_strdup().
 */
5346 struct nft_flowtable_filter {
/*
 * Netlink dump callback for NFT_MSG_GETFLOWTABLE.
 *
 * Walks the tables of the requested family (all families for
 * NFPROTO_UNSPEC) and emits one NFT_MSG_NEWFLOWTABLE message per active
 * flowtable. cb->args[0] is read as the resume index; the remaining
 * cb->args slots are cleared by the visible memset(). An optional filter
 * in cb->data restricts the dump to one table name.
 *
 * NOTE(review): the filter test dereferences filter->table[0], so it
 * relies on ->table being non-NULL whenever a filter is attached.
 */
5350 static int nf_tables_dump_flowtable(struct sk_buff *skb,
5351 struct netlink_callback *cb)
5353 const struct nfgenmsg *nfmsg = nlmsg_data(cb->nlh);
5354 struct nft_flowtable_filter *filter = cb->data;
5355 unsigned int idx = 0, s_idx = cb->args[0];
5356 struct net *net = sock_net(skb->sk);
5357 int family = nfmsg->nfgen_family;
5358 struct nft_flowtable *flowtable;
5359 const struct nft_table *table;
/* Record the generation so nl_dump_check_consistent() can compare against it. */
5362 cb->seq = net->nft.base_seq;
5364 list_for_each_entry_rcu(table, &net->nft.tables, list) {
5365 if (family != NFPROTO_UNSPEC && family != table->family)
5368 list_for_each_entry_rcu(flowtable, &table->flowtables, list) {
5369 if (!nft_is_active(net, flowtable))
5374 memset(&cb->args[1], 0,
5375 sizeof(cb->args) - sizeof(cb->args[0]));
5376 if (filter && filter->table[0] &&
5377 strcmp(filter->table, table->name))
5380 if (nf_tables_fill_flowtable_info(skb, net, NETLINK_CB(cb->skb).portid,
5382 NFT_MSG_NEWFLOWTABLE,
5383 NLM_F_MULTI | NLM_F_APPEND,
5384 table->family, flowtable) < 0)
5387 nl_dump_check_consistent(cb, nlmsg_hdr(skb));
/*
 * Dump completion callback: releases the filter stored in cb->data.
 * The visible line frees the duplicated table name.
 */
5399 static int nf_tables_dump_flowtable_done(struct netlink_callback *cb)
5401 struct nft_flowtable_filter *filter = cb->data;
5406 kfree(filter->table);
/*
 * Allocate a zeroed flowtable dump filter from the request attributes.
 *
 * ->table is duplicated from NFTA_FLOWTABLE_TABLE when that attribute is
 * present. Returns ERR_PTR(-ENOMEM) when an allocation fails.
 */
5412 static struct nft_flowtable_filter *
5413 nft_flowtable_filter_alloc(const struct nlattr * const nla[])
5415 struct nft_flowtable_filter *filter;
5417 filter = kzalloc(sizeof(*filter), GFP_KERNEL);
5419 return ERR_PTR(-ENOMEM);
5421 if (nla[NFTA_FLOWTABLE_TABLE]) {
5422 filter->table = nla_strdup(nla[NFTA_FLOWTABLE_TABLE],
5424 if (!filter->table) {
5426 return ERR_PTR(-ENOMEM);
/*
 * NFT_MSG_GETFLOWTABLE handler.
 *
 * With NLM_F_DUMP a netlink dump is started using
 * nf_tables_dump_flowtable() and nf_tables_dump_flowtable_done(); a
 * filter is allocated when the request carries NFTA_FLOWTABLE_TABLE.
 *
 * Otherwise a single flowtable is fetched: NFTA_FLOWTABLE_NAME is
 * required, table and flowtable are looked up in the current generation,
 * and the reply is built in a freshly allocated skb and unicast back to
 * the requesting port.
 */
5432 static int nf_tables_getflowtable(struct net *net, struct sock *nlsk,
5433 struct sk_buff *skb,
5434 const struct nlmsghdr *nlh,
5435 const struct nlattr * const nla[],
5436 struct netlink_ext_ack *extack)
5438 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
5439 u8 genmask = nft_genmask_cur(net);
5440 int family = nfmsg->nfgen_family;
5441 struct nft_flowtable *flowtable;
5442 const struct nft_table *table;
5443 struct sk_buff *skb2;
5446 if (nlh->nlmsg_flags & NLM_F_DUMP) {
5447 struct netlink_dump_control c = {
5448 .dump = nf_tables_dump_flowtable,
5449 .done = nf_tables_dump_flowtable_done,
5452 if (nla[NFTA_FLOWTABLE_TABLE]) {
5453 struct nft_flowtable_filter *filter;
5455 filter = nft_flowtable_filter_alloc(nla);
5461 return netlink_dump_start(nlsk, skb, nlh, &c);
5464 if (!nla[NFTA_FLOWTABLE_NAME])
5467 table = nft_table_lookup(net, nla[NFTA_FLOWTABLE_TABLE], family,
5470 return PTR_ERR(table);
5472 flowtable = nft_flowtable_lookup(table, nla[NFTA_FLOWTABLE_NAME],
5474 if (IS_ERR(flowtable))
5475 return PTR_ERR(flowtable);
5477 skb2 = alloc_skb(NLMSG_GOODSIZE, GFP_KERNEL);
/* The reply is always reported as NFT_MSG_NEWFLOWTABLE. */
5481 err = nf_tables_fill_flowtable_info(skb2, net, NETLINK_CB(skb).portid,
5483 NFT_MSG_NEWFLOWTABLE, 0, family,
5488 return nlmsg_unicast(nlsk, skb2, NETLINK_CB(skb).portid);
/*
 * Send a flowtable event to NFNLGRP_NFTABLES listeners.
 *
 * A message describing @flowtable is built in a new GFP_KERNEL skb using
 * the port id and family from @ctx and sent through nfnetlink_send().
 * The first half of the early-exit condition is not visible in this
 * excerpt; the visible half tests that the group has no listeners. On
 * the visible failure path -ENOBUFS is signalled via nfnetlink_set_err().
 */
5494 static void nf_tables_flowtable_notify(struct nft_ctx *ctx,
5495 struct nft_flowtable *flowtable,
5498 struct sk_buff *skb;
5502 !nfnetlink_has_listeners(ctx->net, NFNLGRP_NFTABLES))
5505 skb = nlmsg_new(NLMSG_GOODSIZE, GFP_KERNEL);
5509 err = nf_tables_fill_flowtable_info(skb, ctx->net, ctx->portid,
5511 ctx->family, flowtable);
5517 nfnetlink_send(skb, ctx->net, ctx->portid, NFNLGRP_NFTABLES,
5518 ctx->report, GFP_KERNEL);
5521 nfnetlink_set_err(ctx->net, ctx->portid, NFNLGRP_NFTABLES, -ENOBUFS);
5524 static void nf_tables_flowtable_destroy(struct nft_flowtable *flowtable)
5526 kfree(flowtable->ops);
5527 kfree(flowtable->name);
5528 flowtable->data.type->free(&flowtable->data);
5529 module_put(flowtable->data.type->owner);
/*
 * Build a NFT_MSG_NEWGEN message into @skb.
 *
 * The header uses AF_UNSPEC, NFNETLINK_V0 and the low 16 bits of
 * net->nft.base_seq as res_id. The payload carries the full generation
 * id (base_seq), the pid of the current task and its command name.
 *
 * Any failing put jumps to nla_put_failure, where the partially built
 * message is trimmed off @skb.
 */
5532 static int nf_tables_fill_gen_info(struct sk_buff *skb, struct net *net,
5533 u32 portid, u32 seq)
5535 struct nlmsghdr *nlh;
5536 struct nfgenmsg *nfmsg;
5537 char buf[TASK_COMM_LEN];
5538 int event = nfnl_msg_type(NFNL_SUBSYS_NFTABLES, NFT_MSG_NEWGEN);
5540 nlh = nlmsg_put(skb, portid, seq, event, sizeof(struct nfgenmsg), 0);
5542 goto nla_put_failure;
5544 nfmsg = nlmsg_data(nlh);
5545 nfmsg->nfgen_family = AF_UNSPEC;
5546 nfmsg->version = NFNETLINK_V0;
5547 nfmsg->res_id = htons(net->nft.base_seq & 0xffff);
5549 if (nla_put_be32(skb, NFTA_GEN_ID, htonl(net->nft.base_seq)) ||
5550 nla_put_be32(skb, NFTA_GEN_PROC_PID, htonl(task_pid_nr(current))) ||
5551 nla_put_string(skb, NFTA_GEN_PROC_NAME, get_task_comm(buf, current)))
5552 goto nla_put_failure;
5554 nlmsg_end(skb, nlh);
5558 nlmsg_trim(skb, nlh);
/*
 * Detach @dev from @flowtable.
 *
 * For the hook entry bound to @dev the netfilter hook is unregistered in
 * the device's namespace, the stored device name is truncated to an empty
 * string and the device pointer is cleared. The name buffer itself is
 * not freed here.
 */
5562 static void nft_flowtable_event(unsigned long event, struct net_device *dev,
5563 struct nft_flowtable *flowtable)
5567 for (i = 0; i < flowtable->ops_len; i++) {
5568 if (flowtable->ops[i].dev != dev)
5571 nf_unregister_net_hook(dev_net(dev), &flowtable->ops[i]);
5572 flowtable->dev_name[i][0] = '\0';
5573 flowtable->ops[i].dev = NULL;
/*
 * Netdevice notifier callback for flowtables.
 *
 * The event is compared against NETDEV_UNREGISTER. Under the nf_tables
 * subsystem lock, every flowtable of every table in the device's network
 * namespace is passed to nft_flowtable_event() so that hooks bound to the
 * device are removed.
 */
5578 static int nf_tables_flowtable_event(struct notifier_block *this,
5579 unsigned long event, void *ptr)
5581 struct net_device *dev = netdev_notifier_info_to_dev(ptr);
5582 struct nft_flowtable *flowtable;
5583 struct nft_table *table;
5585 if (event != NETDEV_UNREGISTER)
5588 nfnl_lock(NFNL_SUBSYS_NFTABLES);
5589 list_for_each_entry(table, &dev_net(dev)->nft.tables, list) {
5590 list_for_each_entry(flowtable, &table->flowtables, list) {
5591 nft_flowtable_event(event, dev, flowtable);
5594 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
/* Notifier block that routes netdevice events to nf_tables_flowtable_event(). */
5599 static struct notifier_block nf_tables_flowtable_notifier = {
5600 .notifier_call = nf_tables_flowtable_event,
/*
 * Send a generation-change message to NFNLGRP_NFTABLES listeners.
 *
 * The message is built by nf_tables_fill_gen_info() in a new GFP_KERNEL
 * skb, addressed with the port id of the request @skb, and sent through
 * nfnetlink_send(). On the visible failure path an error is signalled to
 * listeners via nfnetlink_set_err().
 *
 * NOTE(review): the early-exit test requires nlmsg_report(nlh) to be set
 * AND the group to have no listeners - confirm this polarity is intended.
 */
5603 static void nf_tables_gen_notify(struct net *net, struct sk_buff *skb,
5606 struct nlmsghdr *nlh = nlmsg_hdr(skb);
5607 struct sk_buff *skb2;
5610 if (nlmsg_report(nlh) &&
5611 !nfnetlink_has_listeners(net, NFNLGRP_NFTABLES))
5614 skb2 = nlmsg_new(NLMSG_GOODSIZE, GFP_KERNEL);
5618 err = nf_tables_fill_gen_info(skb2, net, NETLINK_CB(skb).portid,
5625 nfnetlink_send(skb2, net, NETLINK_CB(skb).portid, NFNLGRP_NFTABLES,
5626 nlmsg_report(nlh), GFP_KERNEL);
5629 nfnetlink_set_err(net, NETLINK_CB(skb).portid, NFNLGRP_NFTABLES,
/*
 * NFT_MSG_GETGEN handler: build a generation message with
 * nf_tables_fill_gen_info() in a freshly allocated skb and unicast it
 * back to the requesting port.
 */
5633 static int nf_tables_getgen(struct net *net, struct sock *nlsk,
5634 struct sk_buff *skb, const struct nlmsghdr *nlh,
5635 const struct nlattr * const nla[],
5636 struct netlink_ext_ack *extack)
5638 struct sk_buff *skb2;
5641 skb2 = alloc_skb(NLMSG_GOODSIZE, GFP_KERNEL);
5645 err = nf_tables_fill_gen_info(skb2, net, NETLINK_CB(skb).portid,
5650 return nlmsg_unicast(nlsk, skb2, NETLINK_CB(skb).portid);
/*
 * nfnetlink dispatch table for the nf_tables subsystem, indexed by
 * NFT_MSG_* message type.
 *
 * Each entry names the handler together with the highest attribute
 * number and the validation policy used to parse the request. In this
 * table the NEW and DEL messages use .call_batch, while the GET messages
 * (including NFT_MSG_GETOBJ_RESET, which shares nf_tables_getobj) use
 * .call. NFT_MSG_GETGEN takes no attributes.
 */
5656 static const struct nfnl_callback nf_tables_cb[NFT_MSG_MAX] = {
5657 [NFT_MSG_NEWTABLE] = {
5658 .call_batch = nf_tables_newtable,
5659 .attr_count = NFTA_TABLE_MAX,
5660 .policy = nft_table_policy,
5662 [NFT_MSG_GETTABLE] = {
5663 .call = nf_tables_gettable,
5664 .attr_count = NFTA_TABLE_MAX,
5665 .policy = nft_table_policy,
5667 [NFT_MSG_DELTABLE] = {
5668 .call_batch = nf_tables_deltable,
5669 .attr_count = NFTA_TABLE_MAX,
5670 .policy = nft_table_policy,
5672 [NFT_MSG_NEWCHAIN] = {
5673 .call_batch = nf_tables_newchain,
5674 .attr_count = NFTA_CHAIN_MAX,
5675 .policy = nft_chain_policy,
5677 [NFT_MSG_GETCHAIN] = {
5678 .call = nf_tables_getchain,
5679 .attr_count = NFTA_CHAIN_MAX,
5680 .policy = nft_chain_policy,
5682 [NFT_MSG_DELCHAIN] = {
5683 .call_batch = nf_tables_delchain,
5684 .attr_count = NFTA_CHAIN_MAX,
5685 .policy = nft_chain_policy,
5687 [NFT_MSG_NEWRULE] = {
5688 .call_batch = nf_tables_newrule,
5689 .attr_count = NFTA_RULE_MAX,
5690 .policy = nft_rule_policy,
5692 [NFT_MSG_GETRULE] = {
5693 .call = nf_tables_getrule,
5694 .attr_count = NFTA_RULE_MAX,
5695 .policy = nft_rule_policy,
5697 [NFT_MSG_DELRULE] = {
5698 .call_batch = nf_tables_delrule,
5699 .attr_count = NFTA_RULE_MAX,
5700 .policy = nft_rule_policy,
5702 [NFT_MSG_NEWSET] = {
5703 .call_batch = nf_tables_newset,
5704 .attr_count = NFTA_SET_MAX,
5705 .policy = nft_set_policy,
5707 [NFT_MSG_GETSET] = {
5708 .call = nf_tables_getset,
5709 .attr_count = NFTA_SET_MAX,
5710 .policy = nft_set_policy,
5712 [NFT_MSG_DELSET] = {
5713 .call_batch = nf_tables_delset,
5714 .attr_count = NFTA_SET_MAX,
5715 .policy = nft_set_policy,
5717 [NFT_MSG_NEWSETELEM] = {
5718 .call_batch = nf_tables_newsetelem,
5719 .attr_count = NFTA_SET_ELEM_LIST_MAX,
5720 .policy = nft_set_elem_list_policy,
5722 [NFT_MSG_GETSETELEM] = {
5723 .call = nf_tables_getsetelem,
5724 .attr_count = NFTA_SET_ELEM_LIST_MAX,
5725 .policy = nft_set_elem_list_policy,
5727 [NFT_MSG_DELSETELEM] = {
5728 .call_batch = nf_tables_delsetelem,
5729 .attr_count = NFTA_SET_ELEM_LIST_MAX,
5730 .policy = nft_set_elem_list_policy,
5732 [NFT_MSG_GETGEN] = {
5733 .call = nf_tables_getgen,
5735 [NFT_MSG_NEWOBJ] = {
5736 .call_batch = nf_tables_newobj,
5737 .attr_count = NFTA_OBJ_MAX,
5738 .policy = nft_obj_policy,
5740 [NFT_MSG_GETOBJ] = {
5741 .call = nf_tables_getobj,
5742 .attr_count = NFTA_OBJ_MAX,
5743 .policy = nft_obj_policy,
5745 [NFT_MSG_DELOBJ] = {
5746 .call_batch = nf_tables_delobj,
5747 .attr_count = NFTA_OBJ_MAX,
5748 .policy = nft_obj_policy,
5750 [NFT_MSG_GETOBJ_RESET] = {
5751 .call = nf_tables_getobj,
5752 .attr_count = NFTA_OBJ_MAX,
5753 .policy = nft_obj_policy,
5755 [NFT_MSG_NEWFLOWTABLE] = {
5756 .call_batch = nf_tables_newflowtable,
5757 .attr_count = NFTA_FLOWTABLE_MAX,
5758 .policy = nft_flowtable_policy,
5760 [NFT_MSG_GETFLOWTABLE] = {
5761 .call = nf_tables_getflowtable,
5762 .attr_count = NFTA_FLOWTABLE_MAX,
5763 .policy = nft_flowtable_policy,
5765 [NFT_MSG_DELFLOWTABLE] = {
5766 .call_batch = nf_tables_delflowtable,
5767 .attr_count = NFTA_FLOWTABLE_MAX,
5768 .policy = nft_flowtable_policy,
/*
 * Apply a pending chain update at commit time.
 *
 * A new name stored in the transaction is copied over the chain's name.
 * The remaining steps only apply to base chains: the statistics are
 * replaced with the ones stored in the transaction and the policy is
 * taken from the transaction for the cases selected by the switch (the
 * case labels are not visible in this excerpt).
 *
 * NOTE(review): strcpy() assumes the destination is large enough for the
 * new name - confirm how chain->name is sized.
 */
5772 static void nft_chain_commit_update(struct nft_trans *trans)
5774 struct nft_base_chain *basechain;
5776 if (nft_trans_chain_name(trans))
5777 strcpy(trans->ctx.chain->name, nft_trans_chain_name(trans));
5779 if (!nft_is_base_chain(trans->ctx.chain))
5782 basechain = nft_base_chain(trans->ctx.chain);
5783 nft_chain_stats_replace(basechain, nft_trans_chain_stats(trans));
5785 switch (nft_trans_chain_policy(trans)) {
5788 basechain->policy = nft_trans_chain_policy(trans);
/*
 * Final release step for a committed deletion transaction.
 *
 * Dispatches on the transaction's message type and destroys the object
 * the deletion refers to: table, chain, rule, set, set element, stateful
 * object or flowtable.
 */
5793 static void nf_tables_commit_release(struct nft_trans *trans)
5795 switch (trans->msg_type) {
5796 case NFT_MSG_DELTABLE:
5797 nf_tables_table_destroy(&trans->ctx);
5799 case NFT_MSG_DELCHAIN:
5800 nf_tables_chain_destroy(&trans->ctx);
5802 case NFT_MSG_DELRULE:
5803 nf_tables_rule_destroy(&trans->ctx, nft_trans_rule(trans));
5805 case NFT_MSG_DELSET:
5806 nft_set_destroy(nft_trans_set(trans));
5808 case NFT_MSG_DELSETELEM:
5809 nf_tables_set_elem_destroy(nft_trans_elem_set(trans),
5810 nft_trans_elem(trans).priv);
5812 case NFT_MSG_DELOBJ:
5813 nft_obj_destroy(nft_trans_obj(trans));
5815 case NFT_MSG_DELFLOWTABLE:
5816 nf_tables_flowtable_destroy(nft_trans_flowtable(trans));
/*
 * Commit the pending transaction list of @net.
 *
 * The generation counter net->nft.base_seq is incremented, skipping the
 * value 0, and the generation cursor is advanced. The commit list is then
 * walked once: NEW* transactions activate their object with nft_clear()
 * (or apply an update), send the matching notification and are destroyed
 * immediately; DEL* transactions unlink their object with list_del_rcu(),
 * send the notification and, where applicable, unregister hooks or remove
 * the set element. A second walk unlinks each remaining transaction and
 * passes it to nf_tables_commit_release(). Finally a NFT_MSG_NEWGEN
 * notification is sent.
 */
5822 static int nf_tables_commit(struct net *net, struct sk_buff *skb)
5824 struct nft_trans *trans, *next;
5825 struct nft_trans_elem *te;
5827 /* Bump generation counter, invalidate any dump in progress */
5828 while (++net->nft.base_seq == 0);
5830 /* A new generation has just started */
5831 net->nft.gencursor = nft_gencursor_next(net);
5833 /* Make sure all packets have left the previous generation before
5834 * purging old rules.
5838 list_for_each_entry_safe(trans, next, &net->nft.commit_list, list) {
5839 switch (trans->msg_type) {
5840 case NFT_MSG_NEWTABLE:
5841 if (nft_trans_table_update(trans)) {
5842 if (!nft_trans_table_enable(trans)) {
5843 nf_tables_table_disable(net,
5845 trans->ctx.table->flags |= NFT_TABLE_F_DORMANT;
5848 nft_clear(net, trans->ctx.table);
5850 nf_tables_table_notify(&trans->ctx, NFT_MSG_NEWTABLE);
5851 nft_trans_destroy(trans);
5853 case NFT_MSG_DELTABLE:
5854 list_del_rcu(&trans->ctx.table->list);
5855 nf_tables_table_notify(&trans->ctx, NFT_MSG_DELTABLE);
5857 case NFT_MSG_NEWCHAIN:
5858 if (nft_trans_chain_update(trans))
5859 nft_chain_commit_update(trans);
5861 nft_clear(net, trans->ctx.chain);
5863 nf_tables_chain_notify(&trans->ctx, NFT_MSG_NEWCHAIN);
5864 nft_trans_destroy(trans);
5866 case NFT_MSG_DELCHAIN:
5867 list_del_rcu(&trans->ctx.chain->list);
5868 nf_tables_chain_notify(&trans->ctx, NFT_MSG_DELCHAIN);
5869 nf_tables_unregister_hook(trans->ctx.net,
5873 case NFT_MSG_NEWRULE:
5874 nft_clear(trans->ctx.net, nft_trans_rule(trans));
5875 nf_tables_rule_notify(&trans->ctx,
5876 nft_trans_rule(trans),
5878 nft_trans_destroy(trans);
5880 case NFT_MSG_DELRULE:
5881 list_del_rcu(&nft_trans_rule(trans)->list);
5882 nf_tables_rule_notify(&trans->ctx,
5883 nft_trans_rule(trans),
5886 case NFT_MSG_NEWSET:
5887 nft_clear(net, nft_trans_set(trans));
5888 /* This avoids hitting -EBUSY when deleting the table
5889 * from the transaction.
5891 if (nft_set_is_anonymous(nft_trans_set(trans)) &&
5892 !list_empty(&nft_trans_set(trans)->bindings))
5893 trans->ctx.table->use--;
5895 nf_tables_set_notify(&trans->ctx, nft_trans_set(trans),
5896 NFT_MSG_NEWSET, GFP_KERNEL);
5897 nft_trans_destroy(trans);
5899 case NFT_MSG_DELSET:
5900 list_del_rcu(&nft_trans_set(trans)->list);
5901 nf_tables_set_notify(&trans->ctx, nft_trans_set(trans),
5902 NFT_MSG_DELSET, GFP_KERNEL);
5904 case NFT_MSG_NEWSETELEM:
5905 te = (struct nft_trans_elem *)trans->data;
5907 te->set->ops->activate(net, te->set, &te->elem);
5908 nf_tables_setelem_notify(&trans->ctx, te->set,
5910 NFT_MSG_NEWSETELEM, 0);
5911 nft_trans_destroy(trans);
5913 case NFT_MSG_DELSETELEM:
5914 te = (struct nft_trans_elem *)trans->data;
5916 nf_tables_setelem_notify(&trans->ctx, te->set,
5918 NFT_MSG_DELSETELEM, 0);
5919 te->set->ops->remove(net, te->set, &te->elem);
5920 atomic_dec(&te->set->nelems);
5923 case NFT_MSG_NEWOBJ:
5924 nft_clear(net, nft_trans_obj(trans));
5925 nf_tables_obj_notify(&trans->ctx, nft_trans_obj(trans),
5927 nft_trans_destroy(trans);
5929 case NFT_MSG_DELOBJ:
5930 list_del_rcu(&nft_trans_obj(trans)->list);
5931 nf_tables_obj_notify(&trans->ctx, nft_trans_obj(trans),
5934 case NFT_MSG_NEWFLOWTABLE:
5935 nft_clear(net, nft_trans_flowtable(trans));
5936 nf_tables_flowtable_notify(&trans->ctx,
5937 nft_trans_flowtable(trans),
5938 NFT_MSG_NEWFLOWTABLE);
5939 nft_trans_destroy(trans);
5941 case NFT_MSG_DELFLOWTABLE:
5942 list_del_rcu(&nft_trans_flowtable(trans)->list);
5943 nf_tables_flowtable_notify(&trans->ctx,
5944 nft_trans_flowtable(trans),
5945 NFT_MSG_DELFLOWTABLE);
5946 nft_unregister_flowtable_net_hooks(net,
5947 nft_trans_flowtable(trans));
5954 list_for_each_entry_safe(trans, next, &net->nft.commit_list, list) {
5955 list_del(&trans->list);
5956 nf_tables_commit_release(trans);
5959 nf_tables_gen_notify(net, skb, NFT_MSG_NEWGEN);
/*
 * Free the object that an aborted transaction had created.
 *
 * Dispatches on trans->msg_type: each NEW* message type handled below calls
 * the destroy helper for the object carried by the transaction.
 * NOTE(review): parts of this function are not visible here (anything after
 * the switch, such as releasing the transaction itself) - confirm.
 */
5964 static void nf_tables_abort_release(struct nft_trans *trans)
5966 switch (trans->msg_type) {
5967 case NFT_MSG_NEWTABLE:
5968 nf_tables_table_destroy(&trans->ctx);
5970 case NFT_MSG_NEWCHAIN:
5971 nf_tables_chain_destroy(&trans->ctx);
5973 case NFT_MSG_NEWRULE:
5974 nf_tables_rule_destroy(&trans->ctx, nft_trans_rule(trans));
5976 case NFT_MSG_NEWSET:
5977 nft_set_destroy(nft_trans_set(trans));
5979 case NFT_MSG_NEWSETELEM:
/* Destroys the element's private data (priv) within its owning set. */
5980 nft_set_elem_destroy(nft_trans_elem_set(trans),
5981 nft_trans_elem(trans).priv, true);
5983 case NFT_MSG_NEWOBJ:
5984 nft_obj_destroy(nft_trans_obj(trans));
5986 case NFT_MSG_NEWFLOWTABLE:
5987 nf_tables_flowtable_destroy(nft_trans_flowtable(trans));
/*
 * Undo every pending transaction on net->nft.commit_list.
 *
 * First pass (reverse order): per message type, revert the effect the
 * request had when it was queued:
 *  - NEW* requests: unlink the new object with list_del_rcu() and drop the
 *    use counter that was taken on its parent (table or chain).
 *  - DEL* requests: make the object active again via nft_clear(), restore the
 *    parent's use counter and destroy the transaction right away.
 * Second pass (reverse order): unlink each transaction still on the list and
 * pass it to nf_tables_abort_release().
 *
 * NOTE(review): several lines of this function (break statements, the
 * return value, any synchronisation between the two passes) are not visible
 * here - confirm against the full source.
 */
5993 static int nf_tables_abort(struct net *net, struct sk_buff *skb)
5995 struct nft_trans *trans, *next;
5996 struct nft_trans_elem *te;
5998 list_for_each_entry_safe_reverse(trans, next, &net->nft.commit_list,
6000 switch (trans->msg_type) {
6001 case NFT_MSG_NEWTABLE:
/* Table update that enabled the table: disable it and mark it dormant again. */
6002 if (nft_trans_table_update(trans)) {
6003 if (nft_trans_table_enable(trans)) {
6004 nf_tables_table_disable(net,
6006 trans->ctx.table->flags |= NFT_TABLE_F_DORMANT;
6008 nft_trans_destroy(trans);
/* Newly created table: unlink it from the table list. */
6010 list_del_rcu(&trans->ctx.table->list);
6013 case NFT_MSG_DELTABLE:
6014 nft_clear(trans->ctx.net, trans->ctx.table);
6015 nft_trans_destroy(trans);
6017 case NFT_MSG_NEWCHAIN:
/* Chain update: only the per-cpu stats attached to the transaction are freed. */
6018 if (nft_trans_chain_update(trans)) {
6019 free_percpu(nft_trans_chain_stats(trans));
6021 nft_trans_destroy(trans);
/* New chain: drop the table reference, unlink the chain, unregister its hook. */
6023 trans->ctx.table->use--;
6024 list_del_rcu(&trans->ctx.chain->list);
6025 nf_tables_unregister_hook(trans->ctx.net,
6030 case NFT_MSG_DELCHAIN:
6031 trans->ctx.table->use++;
6032 nft_clear(trans->ctx.net, trans->ctx.chain);
6033 nft_trans_destroy(trans);
6035 case NFT_MSG_NEWRULE:
6036 trans->ctx.chain->use--;
6037 list_del_rcu(&nft_trans_rule(trans)->list);
6039 case NFT_MSG_DELRULE:
6040 trans->ctx.chain->use++;
6041 nft_clear(trans->ctx.net, nft_trans_rule(trans));
6042 nft_trans_destroy(trans);
6044 case NFT_MSG_NEWSET:
6045 trans->ctx.table->use--;
6046 list_del_rcu(&nft_trans_set(trans)->list);
6048 case NFT_MSG_DELSET:
6049 trans->ctx.table->use++;
6050 nft_clear(trans->ctx.net, nft_trans_set(trans));
6051 nft_trans_destroy(trans);
6053 case NFT_MSG_NEWSETELEM:
6054 te = (struct nft_trans_elem *)trans->data;
/* Take the new element back out of the set and fix the element count. */
6056 te->set->ops->remove(net, te->set, &te->elem);
6057 atomic_dec(&te->set->nelems);
6059 case NFT_MSG_DELSETELEM:
6060 te = (struct nft_trans_elem *)trans->data;
/* Re-activate the element through the generic helper and the set backend. */
6062 nft_set_elem_activate(net, te->set, &te->elem);
6063 te->set->ops->activate(net, te->set, &te->elem);
6066 nft_trans_destroy(trans);
6068 case NFT_MSG_NEWOBJ:
6069 trans->ctx.table->use--;
6070 list_del_rcu(&nft_trans_obj(trans)->list);
6072 case NFT_MSG_DELOBJ:
6073 trans->ctx.table->use++;
6074 nft_clear(trans->ctx.net, nft_trans_obj(trans));
6075 nft_trans_destroy(trans);
6077 case NFT_MSG_NEWFLOWTABLE:
6078 trans->ctx.table->use--;
6079 list_del_rcu(&nft_trans_flowtable(trans)->list);
6080 nft_unregister_flowtable_net_hooks(net,
6081 nft_trans_flowtable(trans));
6083 case NFT_MSG_DELFLOWTABLE:
6084 trans->ctx.table->use++;
6085 nft_clear(trans->ctx.net, nft_trans_flowtable(trans));
6086 nft_trans_destroy(trans);
/* Second pass: release whatever transactions were left on the list above. */
6093 list_for_each_entry_safe_reverse(trans, next,
6094 &net->nft.commit_list, list) {
6095 list_del(&trans->list);
6096 nf_tables_abort_release(trans);
/*
 * Report whether @genid matches the current generation sequence number
 * (net->nft.base_seq) of this network namespace.
 */
6102 static bool nf_tables_valid_genid(struct net *net, u32 genid)
6104 return net->nft.base_seq == genid;
/*
 * nfnetlink subsystem descriptor for nf_tables: names the subsystem, sizes
 * the callback table by NFT_MSG_MAX and wires up the batch commit/abort
 * handlers and the generation-id check defined in this file.
 * NOTE(review): at least one initializer line is not visible here.
 */
6107 static const struct nfnetlink_subsystem nf_tables_subsys = {
6108 .name = "nf_tables",
6109 .subsys_id = NFNL_SUBSYS_NFTABLES,
6110 .cb_count = NFT_MSG_MAX,
6112 .commit = nf_tables_commit,
6113 .abort = nf_tables_abort,
6114 .valid_genid = nf_tables_valid_genid,
/*
 * Check that @chain, if it is a base chain, is of chain type @type.
 *
 * Only base chains are inspected; the type stored in the base chain is
 * compared with @type.
 * NOTE(review): the return statements are not visible here; presumably a
 * mismatch yields an error code and every other case 0 - confirm.
 */
6117 int nft_chain_validate_dependency(const struct nft_chain *chain,
6118 enum nft_chain_types type)
6120 const struct nft_base_chain *basechain;
6122 if (nft_is_base_chain(chain)) {
6123 basechain = nft_base_chain(chain);
6124 if (basechain->type->type != type)
6129 EXPORT_SYMBOL_GPL(nft_chain_validate_dependency);
/*
 * Check that the hook a base chain is attached to is allowed by @hook_flags.
 *
 * @hook_flags is a bitmask indexed by hook number: bit (1 << hooknum) set
 * means that hook is acceptable. Only base chains are inspected.
 * NOTE(review): the return statements are not visible here - confirm which
 * value is returned for the match / no-match / non-base-chain cases.
 */
6131 int nft_chain_validate_hooks(const struct nft_chain *chain,
6132 unsigned int hook_flags)
6134 struct nft_base_chain *basechain;
6136 if (nft_is_base_chain(chain)) {
6137 basechain = nft_base_chain(chain);
6139 if ((1 << basechain->ops.hooknum) & hook_flags)
6147 EXPORT_SYMBOL_GPL(nft_chain_validate_hooks);
6150 * Loop detection - walk through the ruleset beginning at the destination chain
6151 * of a new jump until either the source chain is reached (loop) or all
6152 * reachable chains have been traversed.
6154 * The loop check is performed whenever a new jump verdict is added to an
6155 * expression or verdict map or a verdict map is bound to a new chain.
/*
 * Forward declaration: nf_tables_loop_check_setelem() below calls
 * nf_tables_check_loops() before its definition appears.
 */
6158 static int nf_tables_check_loops(const struct nft_ctx *ctx,
6159 const struct nft_chain *chain);
/*
 * Set-walk callback used by the loop check (installed as iter.fn in
 * nf_tables_check_loops()).
 *
 * Looks at one set element: elements flagged NFT_SET_ELEM_INTERVAL_END are
 * special-cased, otherwise the element's verdict data is examined and, for
 * the verdict codes handled in the switch, the loop check continues into
 * the verdict's target chain.
 * NOTE(review): the case labels and the plain return paths are not visible
 * here; presumably only jump/goto verdicts recurse - confirm.
 */
6161 static int nf_tables_loop_check_setelem(const struct nft_ctx *ctx,
6162 struct nft_set *set,
6163 const struct nft_set_iter *iter,
6164 struct nft_set_elem *elem)
6166 const struct nft_set_ext *ext = nft_set_elem_ext(set, elem->priv);
6167 const struct nft_data *data;
6169 if (nft_set_ext_exists(ext, NFT_SET_EXT_FLAGS) &&
6170 *nft_set_ext_flags(ext) & NFT_SET_ELEM_INTERVAL_END)
6173 data = nft_set_ext_data(ext);
6174 switch (data->verdict.code) {
6177 return nf_tables_check_loops(ctx, data->verdict.chain);
/*
 * Recursive part of the loop detection.
 *
 * @ctx:   context whose ->chain is the chain the new jump originates from
 * @chain: chain currently being visited
 *
 * Reaching ctx->chain again is the loop condition tested first. Otherwise:
 *  1. every expression of every rule in @chain that has a ->validate
 *     callback is asked for its verdict data, and the check recurses into
 *     the verdict's target chain for the verdict codes handled in the switch;
 *  2. every set of the table that is active in the next generation, is a
 *     verdict map and is bound to @chain as a map is walked with
 *     nf_tables_loop_check_setelem() as the per-element callback.
 * NOTE(review): error propagation, the skip conditions and the return values
 * are not visible here - confirm against the full source.
 */
6183 static int nf_tables_check_loops(const struct nft_ctx *ctx,
6184 const struct nft_chain *chain)
6186 const struct nft_rule *rule;
6187 const struct nft_expr *expr, *last;
6188 struct nft_set *set;
6189 struct nft_set_binding *binding;
6190 struct nft_set_iter iter;
6192 if (ctx->chain == chain)
6195 list_for_each_entry(rule, &chain->rules, list) {
6196 nft_rule_for_each_expr(expr, last, rule) {
6197 const struct nft_data *data = NULL;
6200 if (!expr->ops->validate)
6203 err = expr->ops->validate(ctx, expr, &data);
6210 switch (data->verdict.code) {
6213 err = nf_tables_check_loops(ctx,
6214 data->verdict.chain);
6223 list_for_each_entry(set, &ctx->table->sets, list) {
6224 if (!nft_is_active_next(ctx->net, set))
6226 if (!(set->flags & NFT_SET_MAP) ||
6227 set->dtype != NFT_DATA_VERDICT)
6230 list_for_each_entry(binding, &set->bindings, list) {
6231 if (!(binding->flags & NFT_SET_MAP) ||
6232 binding->chain != chain)
/* Walk the set as seen by the next generation. */
6235 iter.genmask = nft_genmask_next(ctx->net);
6239 iter.fn = nf_tables_loop_check_setelem;
6241 set->ops->walk(ctx, set, &iter);
6251 * nft_parse_u32_check - fetch u32 attribute and check for maximum value
6253 * @attr: netlink attribute to fetch value from
6254 * @max: maximum value to be stored in dest
6255 * @dest: pointer to the variable
6257 * Parse, check and store a given u32 netlink attribute into variable.
6258 * This function returns -ERANGE if the value exceeds the maximum value.
6259 * Otherwise a 0 is returned and the attribute value is stored in the
6260 * destination variable.
/*
 * Read a big-endian 32-bit netlink attribute and convert it to host order.
 * NOTE(review): the comparison against @max and the store to @dest are not
 * visible here. @max is a signed int while the parsed value is presumably a
 * u32 - confirm callers never pass a negative maximum.
 */
6262 int nft_parse_u32_check(const struct nlattr *attr, int max, u32 *dest)
6266 val = ntohl(nla_get_be32(attr));
6273 EXPORT_SYMBOL_GPL(nft_parse_u32_check);
6276 * nft_parse_register - parse a register value from a netlink attribute
6278 * @attr: netlink attribute
6280 * Parse and translate a register value from a netlink attribute.
6281 * Registers used to be 128 bit wide, these register numbers will be
6282 * mapped to the corresponding 32 bit register numbers.
/*
 * Translate a register number received over netlink into an index in
 * 32-bit register units.
 *
 * Numbers in the range NFT_REG_VERDICT..NFT_REG_4 are scaled by
 * NFT_REG_SIZE / NFT_REG32_SIZE; the other visible return rebases the
 * number relative to NFT_REG32_00 and offsets it by one register of
 * NFT_REG_SIZE bytes.
 * NOTE(review): the switch statement and default label are not visible here.
 */
6284 unsigned int nft_parse_register(const struct nlattr *attr)
6288 reg = ntohl(nla_get_be32(attr));
6290 case NFT_REG_VERDICT...NFT_REG_4:
6291 return reg * NFT_REG_SIZE / NFT_REG32_SIZE;
6293 return reg + NFT_REG_SIZE / NFT_REG32_SIZE - NFT_REG32_00;
6296 EXPORT_SYMBOL_GPL(nft_parse_register);
6299 * nft_dump_register - dump a register value to a netlink attribute
6301 * @skb: socket buffer
6302 * @attr: attribute number
6303 * @reg: register number
6305 * Construct a netlink attribute containing the register number. For
6306 * compatibility reasons, register numbers being a multiple of 4 are
6307 * translated to the corresponding 128 bit register numbers.
/*
 * Emit a register number as a big-endian 32-bit netlink attribute.
 *
 * Inverse of the mapping in nft_parse_register(): an index that is a
 * multiple of NFT_REG_SIZE / NFT_REG32_SIZE is divided back down, and the
 * other visible assignment rebases the index onto NFT_REG32_00.
 * NOTE(review): the line joining the two assignments (presumably an else)
 * is not visible here - confirm.
 * Returns the result of nla_put_be32().
 */
6309 int nft_dump_register(struct sk_buff *skb, unsigned int attr, unsigned int reg)
6311 if (reg % (NFT_REG_SIZE / NFT_REG32_SIZE) == 0)
6312 reg = reg / (NFT_REG_SIZE / NFT_REG32_SIZE);
6314 reg = reg - NFT_REG_SIZE / NFT_REG32_SIZE + NFT_REG32_00;
6316 return nla_put_be32(skb, attr, htonl(reg));
6318 EXPORT_SYMBOL_GPL(nft_dump_register);
6321 * nft_validate_register_load - validate a load from a register
6323 * @reg: the register number
6324 * @len: the length of the data
6326 * Validate that the input register is one of the general purpose
6327 * registers and that the length of the load is within the bounds.
/*
 * Bounds-check a register load.
 *
 * Two conditions are tested: @reg lies below the first general purpose
 * register (NFT_REG_1 expressed in 32-bit units), and the byte range
 * [reg * NFT_REG32_SIZE, + len) runs past the data array of struct nft_regs.
 * NOTE(review): the return statements are not visible here; presumably each
 * failed check returns an error and success returns 0 - confirm.
 */
6329 int nft_validate_register_load(enum nft_registers reg, unsigned int len)
6331 if (reg < NFT_REG_1 * NFT_REG_SIZE / NFT_REG32_SIZE)
6335 if (reg * NFT_REG32_SIZE + len > FIELD_SIZEOF(struct nft_regs, data))
6340 EXPORT_SYMBOL_GPL(nft_validate_register_load);
6343 * nft_validate_register_store - validate an expression's register store
6345 * @ctx: context of the expression performing the load
6346 * @reg: the destination register number
6347 * @data: the data to load
6348 * @type: the data type
6349 * @len: the length of the data
6351 * Validate that a data load uses the appropriate data type for
6352 * the destination register and the length is within the bounds.
6353 * A value of NULL for the data means that it is runtime gathered
/*
 * Validate a store to register @reg.
 *
 * Verdict register: @type must be NFT_DATA_VERDICT. For NFT_GOTO/NFT_JUMP
 * verdicts the loop check runs on the target chain, and the target chain's
 * nesting level is raised to ctx->chain->level + 1 when it is currently
 * lower; the NFT_JUMP_STACK_SIZE comparison guards the depth limit.
 *
 * Other registers: same range checks as nft_validate_register_load(), plus
 * a check on constant (non-NULL) data whose type is not NFT_DATA_VALUE.
 *
 * NOTE(review): the switch header, the first half of the condition ending on
 * the NFT_GOTO/NFT_JUMP lines and all return statements are not visible here
 * - confirm error codes against the full source.
 */
6356 int nft_validate_register_store(const struct nft_ctx *ctx,
6357 enum nft_registers reg,
6358 const struct nft_data *data,
6359 enum nft_data_types type, unsigned int len)
6364 case NFT_REG_VERDICT:
6365 if (type != NFT_DATA_VERDICT)
6369 (data->verdict.code == NFT_GOTO ||
6370 data->verdict.code == NFT_JUMP)) {
6371 err = nf_tables_check_loops(ctx, data->verdict.chain);
/* Propagate nesting depth to the jump target, bounded by the jump stack. */
6375 if (ctx->chain->level + 1 >
6376 data->verdict.chain->level) {
6377 if (ctx->chain->level + 1 == NFT_JUMP_STACK_SIZE)
6379 data->verdict.chain->level = ctx->chain->level + 1;
6385 if (reg < NFT_REG_1 * NFT_REG_SIZE / NFT_REG32_SIZE)
6389 if (reg * NFT_REG32_SIZE + len >
6390 FIELD_SIZEOF(struct nft_regs, data))
6393 if (data != NULL && type != NFT_DATA_VALUE)
6398 EXPORT_SYMBOL_GPL(nft_validate_register_store);
/*
 * Netlink attribute policy for a nested verdict: a 32-bit verdict code and
 * a chain name string of at most NFT_CHAIN_MAXNAMELEN - 1 bytes.
 */
6400 static const struct nla_policy nft_verdict_policy[NFTA_VERDICT_MAX + 1] = {
6401 [NFTA_VERDICT_CODE] = { .type = NLA_U32 },
6402 [NFTA_VERDICT_CHAIN] = { .type = NLA_STRING,
6403 .len = NFT_CHAIN_MAXNAMELEN - 1 },
/*
 * Parse a nested verdict attribute into @data and describe it in @desc.
 *
 * The nested attributes are parsed against nft_verdict_policy;
 * NFTA_VERDICT_CODE is mandatory and is stored in host byte order. For the
 * verdict codes that name a chain, NFTA_VERDICT_CHAIN is required, the chain
 * is looked up in ctx->table, base chains are special-cased, and the chain
 * pointer is stored in the verdict. On the visible success path @desc
 * reports sizeof(data->verdict) and NFT_DATA_VERDICT.
 *
 * NOTE(review): the case labels, error returns and any reference counting on
 * the target chain are not visible here - confirm against the full source.
 */
6406 static int nft_verdict_init(const struct nft_ctx *ctx, struct nft_data *data,
6407 struct nft_data_desc *desc, const struct nlattr *nla)
6409 u8 genmask = nft_genmask_next(ctx->net);
6410 struct nlattr *tb[NFTA_VERDICT_MAX + 1];
6411 struct nft_chain *chain;
6414 err = nla_parse_nested(tb, NFTA_VERDICT_MAX, nla, nft_verdict_policy,
6419 if (!tb[NFTA_VERDICT_CODE])
6421 data->verdict.code = ntohl(nla_get_be32(tb[NFTA_VERDICT_CODE]));
6423 switch (data->verdict.code) {
6425 switch (data->verdict.code & NF_VERDICT_MASK) {
6440 if (!tb[NFTA_VERDICT_CHAIN])
6442 chain = nft_chain_lookup(ctx->table, tb[NFTA_VERDICT_CHAIN],
6445 return PTR_ERR(chain);
6446 if (nft_is_base_chain(chain))
6450 data->verdict.chain = chain;
6454 desc->len = sizeof(data->verdict);
6455 desc->type = NFT_DATA_VERDICT;
/*
 * Release a verdict: for the verdict codes handled in the switch, drop one
 * use count on the verdict's target chain.
 * NOTE(review): the case labels are not visible here; presumably they are
 * the jump/goto verdicts - confirm.
 */
6459 static void nft_verdict_uninit(const struct nft_data *data)
6461 switch (data->verdict.code) {
6464 data->verdict.chain->use--;
/*
 * Serialise verdict @v into @skb as a nested attribute of type @type.
 *
 * Opens a nest, writes the verdict code as a big-endian 32-bit attribute,
 * writes the chain name where applicable and closes the nest. Any failed
 * put jumps to the nla_put_failure label.
 * NOTE(review): the condition guarding the chain-name put, the label body
 * and the return values are not visible here.
 */
6469 int nft_verdict_dump(struct sk_buff *skb, int type, const struct nft_verdict *v)
6471 struct nlattr *nest;
6473 nest = nla_nest_start(skb, type);
6475 goto nla_put_failure;
6477 if (nla_put_be32(skb, NFTA_VERDICT_CODE, htonl(v->code)))
6478 goto nla_put_failure;
6483 if (nla_put_string(skb, NFTA_VERDICT_CHAIN,
6485 goto nla_put_failure;
6487 nla_nest_end(skb, nest);
/*
 * Copy a plain value attribute into data->data and mark @desc as
 * NFT_DATA_VALUE.
 * NOTE(review): the computation and validation of the copied length against
 * @size are not visible here - confirm.
 */
6494 static int nft_value_init(const struct nft_ctx *ctx,
6495 struct nft_data *data, unsigned int size,
6496 struct nft_data_desc *desc, const struct nlattr *nla)
6506 nla_memcpy(data->data, nla, len);
6507 desc->type = NFT_DATA_VALUE;
/*
 * Write the raw value bytes of @data as an NFTA_DATA_VALUE attribute and
 * return the result of nla_put().
 * NOTE(review): the line declaring the length parameter is not visible here.
 */
6512 static int nft_value_dump(struct sk_buff *skb, const struct nft_data *data,
6515 return nla_put(skb, NFTA_DATA_VALUE, len, data->data);
/*
 * Netlink attribute policy for nf_tables data: either a binary value or a
 * nested verdict.
 */
6518 static const struct nla_policy nft_data_policy[NFTA_DATA_MAX + 1] = {
6519 [NFTA_DATA_VALUE] = { .type = NLA_BINARY },
6520 [NFTA_DATA_VERDICT] = { .type = NLA_NESTED },
6524 * nft_data_init - parse nf_tables data netlink attributes
6526 * @ctx: context of the expression using the data
6527 * @data: destination struct nft_data
6528 * @size: maximum data length
6529 * @desc: data description
6530 * @nla: netlink attribute containing data
6532 * Parse the netlink data attributes and initialize a struct nft_data.
6533 * The type and length of data are returned in the data description.
6535 * The caller can indicate that it only wants to accept data of type
6536 * NFT_DATA_VALUE by passing NULL for the ctx argument.
/*
 * Dispatch on the nested data attribute: a value attribute goes to
 * nft_value_init(); a verdict attribute goes to nft_verdict_init(), but
 * only when a context was supplied (ctx != NULL).
 * NOTE(review): the error check after parsing and the fall-through return
 * when neither branch applies are not visible here.
 */
6538 int nft_data_init(const struct nft_ctx *ctx,
6539 struct nft_data *data, unsigned int size,
6540 struct nft_data_desc *desc, const struct nlattr *nla)
6542 struct nlattr *tb[NFTA_DATA_MAX + 1];
6545 err = nla_parse_nested(tb, NFTA_DATA_MAX, nla, nft_data_policy, NULL);
6549 if (tb[NFTA_DATA_VALUE])
6550 return nft_value_init(ctx, data, size, desc,
6551 tb[NFTA_DATA_VALUE]);
6552 if (tb[NFTA_DATA_VERDICT] && ctx != NULL)
6553 return nft_verdict_init(ctx, data, desc, tb[NFTA_DATA_VERDICT]);
6556 EXPORT_SYMBOL_GPL(nft_data_init);
6559 * nft_data_release - release a nft_data item
6561 * @data: struct nft_data to release
6562 * @type: type of data
6564 * Release a nft_data item. NFT_DATA_VALUE types can be silently discarded,
6565 * all others need to be released by calling this function.
/*
 * Types ordered below NFT_DATA_VERDICT are special-cased first (per the
 * kernel-doc, plain values need no release); verdict data is handed to
 * nft_verdict_uninit().
 * NOTE(review): the early return, the switch header and the default case
 * are not visible here.
 */
6567 void nft_data_release(const struct nft_data *data, enum nft_data_types type)
6569 if (type < NFT_DATA_VERDICT)
6572 case NFT_DATA_VERDICT:
6573 return nft_verdict_uninit(data);
6578 EXPORT_SYMBOL_GPL(nft_data_release);
/*
 * Serialise @data into @skb inside a nested attribute of type @attr.
 *
 * Value data is written with nft_value_dump() using @len; verdict data is
 * written with nft_verdict_dump() as NFTA_DATA_VERDICT. The nest is closed
 * afterwards.
 * NOTE(review): the nest-start failure check, the default case and the
 * return value are not visible here.
 */
6580 int nft_data_dump(struct sk_buff *skb, int attr, const struct nft_data *data,
6581 enum nft_data_types type, unsigned int len)
6583 struct nlattr *nest;
6586 nest = nla_nest_start(skb, attr);
6591 case NFT_DATA_VALUE:
6592 err = nft_value_dump(skb, data, len);
6594 case NFT_DATA_VERDICT:
6595 err = nft_verdict_dump(skb, NFTA_DATA_VERDICT, &data->verdict);
6602 nla_nest_end(skb, nest);
6605 EXPORT_SYMBOL_GPL(nft_data_dump);
/*
 * Tear down the base chain referenced by ctx->chain.
 *
 * Must be called with a base chain (enforced by BUG_ON). Order of work:
 * unregister the chain's hook, unlink and destroy every rule, then unlink
 * and destroy the chain itself.
 * NOTE(review): use-counter updates and the return value are not visible
 * here - confirm.
 */
6607 int __nft_release_basechain(struct nft_ctx *ctx)
6609 struct nft_rule *rule, *nr;
6611 BUG_ON(!nft_is_base_chain(ctx->chain));
/* Unhook first so no packet can reach the rules being freed below. */
6613 nf_tables_unregister_hook(ctx->net, ctx->chain->table, ctx->chain);
6614 list_for_each_entry_safe(rule, nr, &ctx->chain->rules, list) {
6615 list_del(&rule->list);
6617 nf_tables_rule_destroy(ctx, rule);
6619 list_del(&ctx->chain->list);
6621 nf_tables_chain_destroy(ctx);
6625 EXPORT_SYMBOL_GPL(__nft_release_basechain);
/*
 * Destroy every table of @net together with all objects it contains.
 *
 * Per table, in this order: unregister all chain hooks and flowtable hooks;
 * destroy all rules of all chains; destroy flowtables, sets and stateful
 * objects; destroy the chains; finally unlink and destroy the table.
 * A local nft_ctx is reused for all destroy helpers, with ctx.family set
 * from each table.
 * NOTE(review): the assignments of ctx.table / ctx.chain and the use-counter
 * updates are not visible here - confirm against the full source.
 */
6627 static void __nft_release_tables(struct net *net)
6629 struct nft_flowtable *flowtable, *nf;
6630 struct nft_table *table, *nt;
6631 struct nft_chain *chain, *nc;
6632 struct nft_object *obj, *ne;
6633 struct nft_rule *rule, *nr;
6634 struct nft_set *set, *ns;
6635 struct nft_ctx ctx = {
6637 .family = NFPROTO_NETDEV,
6640 list_for_each_entry_safe(table, nt, &net->nft.tables, list) {
6641 ctx.family = table->family;
6643 list_for_each_entry(chain, &table->chains, list)
6644 nf_tables_unregister_hook(net, table, chain);
6645 list_for_each_entry(flowtable, &table->flowtables, list)
6646 nf_unregister_net_hooks(net, flowtable->ops,
6647 flowtable->ops_len);
6648 /* No packets are walking on these chains anymore. */
6650 list_for_each_entry(chain, &table->chains, list) {
6652 list_for_each_entry_safe(rule, nr, &chain->rules, list) {
6653 list_del(&rule->list);
6655 nf_tables_rule_destroy(&ctx, rule);
6658 list_for_each_entry_safe(flowtable, nf, &table->flowtables, list) {
6659 list_del(&flowtable->list);
6661 nf_tables_flowtable_destroy(flowtable);
6663 list_for_each_entry_safe(set, ns, &table->sets, list) {
6664 list_del(&set->list);
6666 nft_set_destroy(set);
6668 list_for_each_entry_safe(obj, ne, &table->objects, list) {
6669 list_del(&obj->list);
6671 nft_obj_destroy(obj);
/* Chains are destroyed only after their rules were freed in the loop above. */
6673 list_for_each_entry_safe(chain, nc, &table->chains, list) {
6675 list_del(&chain->list);
6677 nf_tables_chain_destroy(&ctx);
6679 list_del(&table->list);
6680 nf_tables_table_destroy(&ctx);
/*
 * Per-namespace init: start with empty table and commit lists and a
 * generation sequence number of 1.
 */
6684 static int __net_init nf_tables_init_net(struct net *net)
6686 INIT_LIST_HEAD(&net->nft.tables);
6687 INIT_LIST_HEAD(&net->nft.commit_list);
6688 net->nft.base_seq = 1;
/*
 * Per-namespace exit: release all tables, then warn (once) if either the
 * table list or the commit list is still non-empty.
 */
6692 static void __net_exit nf_tables_exit_net(struct net *net)
6694 __nft_release_tables(net);
6695 WARN_ON_ONCE(!list_empty(&net->nft.tables));
6696 WARN_ON_ONCE(!list_empty(&net->nft.commit_list));
/* Per-network-namespace init/exit callbacks for nf_tables. */
6699 static struct pernet_operations nf_tables_net_ops = {
6700 .init = nf_tables_init_net,
6701 .exit = nf_tables_exit_net,
/*
 * Module init: set up the chain filter support, allocate the `info` array
 * (NFT_RULE_MAXEXPRS entries of struct nft_expr_info), initialise the
 * nf_tables core, register the nfnetlink subsystem and the flowtable
 * netdevice notifier, and finally register the per-namespace operations.
 *
 * NOTE(review): the return value of register_netdevice_notifier() is not
 * checked here, and the result of register_pernet_subsys() is returned
 * directly, so a failure there does not pass through the unwind path that
 * calls nf_tables_core_module_exit(). Confirm whether the nfnetlink
 * subsystem and the notifier need to be unregistered on that path.
 * NOTE(review): the error labels and allocation-failure handling are not
 * fully visible here.
 */
6704 static int __init nf_tables_module_init(void)
6708 nft_chain_filter_init();
6710 info = kmalloc(sizeof(struct nft_expr_info) * NFT_RULE_MAXEXPRS,
6717 err = nf_tables_core_module_init();
6721 err = nfnetlink_subsys_register(&nf_tables_subsys);
6725 register_netdevice_notifier(&nf_tables_flowtable_notifier);
6727 return register_pernet_subsys(&nf_tables_net_ops);
6729 nf_tables_core_module_exit();
/*
 * Module exit: unregister the per-namespace operations, the nfnetlink
 * subsystem and the flowtable netdevice notifier, then shut down the
 * nf_tables core and the chain filter support.
 * NOTE(review): some lines between these calls are not visible here.
 */
6736 static void __exit nf_tables_module_exit(void)
6738 unregister_pernet_subsys(&nf_tables_net_ops);
6739 nfnetlink_subsys_unregister(&nf_tables_subsys);
6740 unregister_netdevice_notifier(&nf_tables_flowtable_notifier);
6742 nf_tables_core_module_exit();
6744 nft_chain_filter_fini();
/* Module entry/exit points, licence, author and nfnetlink subsystem alias. */
6747 module_init(nf_tables_module_init);
6748 module_exit(nf_tables_module_exit);
6750 MODULE_LICENSE("GPL");
6751 MODULE_AUTHOR("Patrick McHardy <kaber@trash.net>");
6752 MODULE_ALIAS_NFNL_SUBSYS(NFNL_SUBSYS_NFTABLES);