2 * Copyright (c) 2007-2009 Patrick McHardy <kaber@trash.net>
4 * This program is free software; you can redistribute it and/or modify
5 * it under the terms of the GNU General Public License version 2 as
6 * published by the Free Software Foundation.
8 * Development of this code funded by Astaro AG (http://www.astaro.com/)
11 #include <linux/module.h>
12 #include <linux/init.h>
13 #include <linux/list.h>
14 #include <linux/skbuff.h>
15 #include <linux/netlink.h>
16 #include <linux/vmalloc.h>
17 #include <linux/netfilter.h>
18 #include <linux/netfilter/nfnetlink.h>
19 #include <linux/netfilter/nf_tables.h>
20 #include <net/netfilter/nf_tables_core.h>
21 #include <net/netfilter/nf_tables.h>
22 #include <net/net_namespace.h>
/*
 * File-scope registries. nf_tables_expressions holds the registered
 * expression types (see nft_register_expr()); nf_tables_objects is
 * presumably the matching list for object types -- its users are not
 * visible here, confirm.
 */
25 static LIST_HEAD(nf_tables_expressions);
26 static LIST_HEAD(nf_tables_objects);
29 * nft_register_afinfo - register nf_tables address family info
31 * @afi: address family info to register
33 * Register the address family for use with nf_tables. Returns zero on
34 * success or a negative errno code otherwise.
/*
 * Initialise the family's table list, then append the family to the
 * per-netns af_info list. The insertion uses the RCU list primitive and
 * is done while holding the nfnetlink nf_tables subsystem lock.
 */
36 int nft_register_afinfo(struct net *net, struct nft_af_info *afi)
38 INIT_LIST_HEAD(&afi->tables);
39 nfnl_lock(NFNL_SUBSYS_NFTABLES);
40 list_add_tail_rcu(&afi->list, &net->nft.af_info);
41 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
44 EXPORT_SYMBOL_GPL(nft_register_afinfo);
/* Forward declaration; called from nft_unregister_afinfo() below. */
46 static void __nft_release_afinfo(struct net *net, struct nft_af_info *afi);
49 * nft_unregister_afinfo - unregister nf_tables address family info
51 * @afi: address family info to unregister
53 * Unregister the address family for use with nf_tables.
/*
 * Under the nfnetlink nf_tables subsystem lock: call
 * __nft_release_afinfo() for this family, then unlink the family from
 * the per-netns list with the RCU-aware list_del_rcu().
 */
55 void nft_unregister_afinfo(struct net *net, struct nft_af_info *afi)
57 nfnl_lock(NFNL_SUBSYS_NFTABLES);
58 __nft_release_afinfo(net, afi);
59 list_del_rcu(&afi->list);
60 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
62 EXPORT_SYMBOL_GPL(nft_unregister_afinfo);
/*
 * Scan the per-netns af_info list for an entry whose family equals
 * @family. The plain (non-RCU) list iterator is used, so callers
 * presumably hold the nfnl nf_tables lock -- TODO confirm.
 */
64 static struct nft_af_info *nft_afinfo_lookup(struct net *net, int family)
66 struct nft_af_info *afi;
68 list_for_each_entry(afi, &net->nft.af_info, list) {
69 if (afi->family == family)
/*
 * Look up the address family info for @family, optionally trying to
 * load the "nft-afinfo-<family>" module. The nfnl lock is dropped around
 * request_module() and re-taken before the second lookup. Errors are
 * returned as ERR_PTR(): -EAGAIN and -EAFNOSUPPORT are the two codes
 * visible here. NOTE(review): -EAGAIN presumably asks the caller to
 * replay the request after a successful module load -- confirm.
 */
75 static struct nft_af_info *
76 nf_tables_afinfo_lookup(struct net *net, int family, bool autoload)
78 struct nft_af_info *afi;
80 afi = nft_afinfo_lookup(net, family);
85 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
86 request_module("nft-afinfo-%u", family);
87 nfnl_lock(NFNL_SUBSYS_NFTABLES);
88 afi = nft_afinfo_lookup(net, family);
90 return ERR_PTR(-EAGAIN);
93 return ERR_PTR(-EAFNOSUPPORT);
/*
 * Populate a struct nft_ctx from an incoming netlink request. The
 * assignments visible here record the sender's netlink port id, the
 * report flag derived from the message header, and the message
 * sequence number.
 */
96 static void nft_ctx_init(struct nft_ctx *ctx,
98 const struct sk_buff *skb,
99 const struct nlmsghdr *nlh,
100 struct nft_af_info *afi,
101 struct nft_table *table,
102 struct nft_chain *chain,
103 const struct nlattr * const *nla)
110 ctx->portid = NETLINK_CB(skb).portid;
111 ctx->report = nlmsg_report(nlh);
112 ctx->seq = nlh->nlmsg_seq;
/*
 * Allocate a zero-filled transaction object with @size extra bytes
 * following struct nft_trans (room for the per-message-type payload),
 * using allocation flags @gfp, and record @msg_type in it.
 */
115 static struct nft_trans *nft_trans_alloc_gfp(const struct nft_ctx *ctx,
116 int msg_type, u32 size, gfp_t gfp)
118 struct nft_trans *trans;
120 trans = kzalloc(sizeof(struct nft_trans) + size, gfp);
124 trans->msg_type = msg_type;
/* Convenience wrapper: nft_trans_alloc_gfp() with GFP_KERNEL. */
130 static struct nft_trans *nft_trans_alloc(const struct nft_ctx *ctx,
131 int msg_type, u32 size)
133 return nft_trans_alloc_gfp(ctx, msg_type, size, GFP_KERNEL);
/* Unlink the transaction from the list it is queued on. */
136 static void nft_trans_destroy(struct nft_trans *trans)
138 list_del(&trans->list);
/*
 * Register the netfilter hook ops of a base chain in @net and return
 * the result of nf_register_net_hooks(). Dormant tables and non-base
 * chains are special-cased by the check below (presumably nothing is
 * registered for them -- TODO confirm).
 */
142 static int nf_tables_register_hooks(struct net *net,
143 const struct nft_table *table,
144 struct nft_chain *chain,
145 unsigned int hook_nops)
147 if (table->flags & NFT_TABLE_F_DORMANT ||
148 !nft_is_base_chain(chain))
151 return nf_register_net_hooks(net, nft_base_chain(chain)->ops,
/*
 * Counterpart of nf_tables_register_hooks(): unregister @hook_nops hook
 * ops of a base chain from @net. The same dormant-table / non-base-chain
 * check guards the call (presumably skipping it -- TODO confirm).
 */
155 static void nf_tables_unregister_hooks(struct net *net,
156 const struct nft_table *table,
157 struct nft_chain *chain,
158 unsigned int hook_nops)
160 if (table->flags & NFT_TABLE_F_DORMANT ||
161 !nft_is_base_chain(chain))
164 nf_unregister_net_hooks(net, nft_base_chain(chain)->ops, hook_nops);
/*
 * Allocate a table transaction of type @msg_type and append it to the
 * per-netns commit list. For NFT_MSG_NEWTABLE the table is additionally
 * marked active in the next generation.
 */
167 static int nft_trans_table_add(struct nft_ctx *ctx, int msg_type)
169 struct nft_trans *trans;
171 trans = nft_trans_alloc(ctx, msg_type, sizeof(struct nft_trans_table));
175 if (msg_type == NFT_MSG_NEWTABLE)
176 nft_activate_next(ctx->net, ctx->table);
178 list_add_tail(&trans->list, &ctx->net->nft.commit_list);
/*
 * Queue an NFT_MSG_DELTABLE transaction for ctx->table and mark the
 * table inactive in the next generation.
 */
182 static int nft_deltable(struct nft_ctx *ctx)
186 err = nft_trans_table_add(ctx, NFT_MSG_DELTABLE);
190 nft_deactivate_next(ctx->net, ctx->table);
/*
 * Allocate a chain transaction of type @msg_type and append it to the
 * per-netns commit list. For NFT_MSG_NEWCHAIN the chain is additionally
 * marked active in the next generation.
 */
194 static int nft_trans_chain_add(struct nft_ctx *ctx, int msg_type)
196 struct nft_trans *trans;
198 trans = nft_trans_alloc(ctx, msg_type, sizeof(struct nft_trans_chain));
202 if (msg_type == NFT_MSG_NEWCHAIN)
203 nft_activate_next(ctx->net, ctx->chain);
205 list_add_tail(&trans->list, &ctx->net->nft.commit_list);
/*
 * Queue an NFT_MSG_DELCHAIN transaction for ctx->chain and mark the
 * chain inactive in the next generation.
 */
209 static int nft_delchain(struct nft_ctx *ctx)
213 err = nft_trans_chain_add(ctx, NFT_MSG_DELCHAIN);
218 nft_deactivate_next(ctx->net, ctx->chain);
/*
 * Mark @rule inactive in the next generation, but only if it is still
 * active there; a rule that is already inactive takes the other branch
 * of the check below.
 */
224 nf_tables_delrule_deactivate(struct nft_ctx *ctx, struct nft_rule *rule)
226 /* You cannot delete the same rule twice */
227 if (nft_is_active_next(ctx->net, rule)) {
228 nft_deactivate_next(ctx->net, rule);
/*
 * Allocate a rule transaction of type @msg_type, attach @rule to it and
 * append it to the per-netns commit list. For NFT_MSG_NEWRULE requests
 * that carry NFTA_RULE_ID, the id is stored in the transaction after
 * conversion from network byte order.
 */
235 static struct nft_trans *nft_trans_rule_add(struct nft_ctx *ctx, int msg_type,
236 struct nft_rule *rule)
238 struct nft_trans *trans;
240 trans = nft_trans_alloc(ctx, msg_type, sizeof(struct nft_trans_rule));
244 if (msg_type == NFT_MSG_NEWRULE && ctx->nla[NFTA_RULE_ID] != NULL) {
245 nft_trans_rule_id(trans) =
246 ntohl(nla_get_be32(ctx->nla[NFTA_RULE_ID]));
248 nft_trans_rule(trans) = rule;
249 list_add_tail(&trans->list, &ctx->net->nft.commit_list);
/*
 * Queue an NFT_MSG_DELRULE transaction for @rule and then deactivate
 * the rule for the next generation. The transaction is torn down again
 * with nft_trans_destroy() on the path shown below (presumably when the
 * deactivation fails -- TODO confirm).
 */
254 static int nft_delrule(struct nft_ctx *ctx, struct nft_rule *rule)
256 struct nft_trans *trans;
259 trans = nft_trans_rule_add(ctx, NFT_MSG_DELRULE, rule);
263 err = nf_tables_delrule_deactivate(ctx, rule);
265 nft_trans_destroy(trans);
/* Call nft_delrule() for every rule on ctx->chain's rule list. */
272 static int nft_delrule_by_chain(struct nft_ctx *ctx)
274 struct nft_rule *rule;
277 list_for_each_entry(rule, &ctx->chain->rules, list) {
278 err = nft_delrule(ctx, rule);
/*
 * Allocate a set transaction of type @msg_type, attach the set to it
 * and append it to the per-netns commit list. For NFT_MSG_NEWSET
 * requests carrying NFTA_SET_ID, the id (converted from network byte
 * order) is stored and the set is activated for the next generation.
 */
285 static int nft_trans_set_add(struct nft_ctx *ctx, int msg_type,
288 struct nft_trans *trans;
290 trans = nft_trans_alloc(ctx, msg_type, sizeof(struct nft_trans_set));
294 if (msg_type == NFT_MSG_NEWSET && ctx->nla[NFTA_SET_ID] != NULL) {
295 nft_trans_set_id(trans) =
296 ntohl(nla_get_be32(ctx->nla[NFTA_SET_ID]));
297 nft_activate_next(ctx->net, set);
299 nft_trans_set(trans) = set;
300 list_add_tail(&trans->list, &ctx->net->nft.commit_list);
/*
 * Queue an NFT_MSG_DELSET transaction for @set and mark the set
 * inactive in the next generation.
 */
305 static int nft_delset(struct nft_ctx *ctx, struct nft_set *set)
309 err = nft_trans_set_add(ctx, NFT_MSG_DELSET, set);
313 nft_deactivate_next(ctx->net, set);
/*
 * Allocate an object transaction of type @msg_type, attach @obj to it
 * and append it to the per-netns commit list. For NFT_MSG_NEWOBJ the
 * object is additionally marked active in the next generation.
 */
319 static int nft_trans_obj_add(struct nft_ctx *ctx, int msg_type,
320 struct nft_object *obj)
322 struct nft_trans *trans;
324 trans = nft_trans_alloc(ctx, msg_type, sizeof(struct nft_trans_obj));
328 if (msg_type == NFT_MSG_NEWOBJ)
329 nft_activate_next(ctx->net, obj);
331 nft_trans_obj(trans) = obj;
332 list_add_tail(&trans->list, &ctx->net->nft.commit_list);
/*
 * Queue an NFT_MSG_DELOBJ transaction for @obj and mark the object
 * inactive in the next generation.
 */
337 static int nft_delobj(struct nft_ctx *ctx, struct nft_object *obj)
341 err = nft_trans_obj_add(ctx, NFT_MSG_DELOBJ, obj);
345 nft_deactivate_next(ctx->net, obj);
/*
 * Search the family's table list for a table whose name equals the
 * string in netlink attribute @nla and which is active in the given
 * generation mask.
 */
355 static struct nft_table *nft_table_lookup(const struct nft_af_info *afi,
356 const struct nlattr *nla,
359 struct nft_table *table;
361 list_for_each_entry(table, &afi->tables, list) {
362 if (!nla_strcmp(nla, table->name) &&
363 nft_active_genmask(table, genmask))
/*
 * ERR_PTR-returning wrapper around nft_table_lookup(). The error codes
 * visible here are -EINVAL and -ENOENT (presumably for a missing name
 * attribute and for no matching table respectively -- TODO confirm).
 */
369 static struct nft_table *nf_tables_table_lookup(const struct nft_af_info *afi,
370 const struct nlattr *nla,
373 struct nft_table *table;
376 return ERR_PTR(-EINVAL);
378 table = nft_table_lookup(afi, nla, genmask);
382 return ERR_PTR(-ENOENT);
/*
 * Hand out the next handle for @table by pre-incrementing the table's
 * handle generator; the value returned is the incremented one.
 */
385 static inline u64 nf_tables_alloc_handle(struct nft_table *table)
387 return ++table->hgenerator;
/*
 * Registered chain types, indexed by [family][type]. Slots are filled
 * and cleared by nft_register_chain_type() / nft_unregister_chain_type()
 * under the nfnl nf_tables lock.
 */
390 static const struct nf_chain_type *chain_type[NFPROTO_NUMPROTO][NFT_CHAIN_T_MAX];
/*
 * Scan the chain types registered for @family and return the one whose
 * name equals the string in netlink attribute @nla.
 * NOTE(review): @family indexes chain_type[] directly with no bounds
 * check visible here -- confirm callers guarantee it is in range.
 */
392 static const struct nf_chain_type *
393 __nf_tables_chain_type_lookup(int family, const struct nlattr *nla)
397 for (i = 0; i < NFT_CHAIN_T_MAX; i++) {
398 if (chain_type[family][i] != NULL &&
399 !nla_strcmp(nla, chain_type[family][i]->name))
400 return chain_type[family][i];
/*
 * Look up a chain type by name for the given family. When module
 * support is compiled in, the code can request the module
 * "nft-chain-<family>-<name>" with the nfnl lock dropped around
 * request_module(), then look the type up again. Errors are returned as
 * ERR_PTR(): -EAGAIN and -ENOENT are the codes visible here.
 * NOTE(review): -EAGAIN presumably signals that the request should be
 * replayed after the module load -- confirm.
 */
405 static const struct nf_chain_type *
406 nf_tables_chain_type_lookup(const struct nft_af_info *afi,
407 const struct nlattr *nla,
410 const struct nf_chain_type *type;
412 type = __nf_tables_chain_type_lookup(afi->family, nla);
415 #ifdef CONFIG_MODULES
417 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
418 request_module("nft-chain-%u-%.*s", afi->family,
419 nla_len(nla), (const char *)nla_data(nla));
420 nfnl_lock(NFNL_SUBSYS_NFTABLES);
421 type = __nf_tables_chain_type_lookup(afi->family, nla);
423 return ERR_PTR(-EAGAIN);
426 return ERR_PTR(-ENOENT);
/*
 * Netlink attribute policy for NFTA_TABLE_* attributes: the name is a
 * string of at most NFT_TABLE_MAXNAMELEN - 1 bytes, the flags are a
 * 32-bit value.
 */
429 static const struct nla_policy nft_table_policy[NFTA_TABLE_MAX + 1] = {
430 [NFTA_TABLE_NAME] = { .type = NLA_STRING,
431 .len = NFT_TABLE_MAXNAMELEN - 1 },
432 [NFTA_TABLE_FLAGS] = { .type = NLA_U32 },
/*
 * Append one table message to @skb. The message consists of an nfgenmsg
 * header (family, NFNETLINK_V0, res_id = low 16 bits of the netns
 * base_seq in network byte order) followed by the table's name, flags
 * and use counter attributes (the latter two as big-endian 32-bit).
 * @event is first converted to a full nfnetlink message type for the
 * nf_tables subsystem. On the failure path the partially built message
 * is trimmed off the skb again.
 */
435 static int nf_tables_fill_table_info(struct sk_buff *skb, struct net *net,
436 u32 portid, u32 seq, int event, u32 flags,
437 int family, const struct nft_table *table)
439 struct nlmsghdr *nlh;
440 struct nfgenmsg *nfmsg;
442 event = nfnl_msg_type(NFNL_SUBSYS_NFTABLES, event);
443 nlh = nlmsg_put(skb, portid, seq, event, sizeof(struct nfgenmsg), flags);
445 goto nla_put_failure;
447 nfmsg = nlmsg_data(nlh);
448 nfmsg->nfgen_family = family;
449 nfmsg->version = NFNETLINK_V0;
450 nfmsg->res_id = htons(net->nft.base_seq & 0xffff);
452 if (nla_put_string(skb, NFTA_TABLE_NAME, table->name) ||
453 nla_put_be32(skb, NFTA_TABLE_FLAGS, htonl(table->flags)) ||
454 nla_put_be32(skb, NFTA_TABLE_USE, htonl(table->use)))
455 goto nla_put_failure;
461 nlmsg_trim(skb, nlh);
/*
 * Send a table event notification to the NFNLGRP_NFTABLES multicast
 * group. A message is built with nf_tables_fill_table_info() into a
 * freshly allocated skb and handed to nfnetlink_send(); the error path
 * reports -ENOBUFS to the group via nfnetlink_set_err(). The listener
 * check below is part of an early-exit condition.
 */
465 static void nf_tables_table_notify(const struct nft_ctx *ctx, int event)
471 !nfnetlink_has_listeners(ctx->net, NFNLGRP_NFTABLES))
474 skb = nlmsg_new(NLMSG_GOODSIZE, GFP_KERNEL);
478 err = nf_tables_fill_table_info(skb, ctx->net, ctx->portid, ctx->seq,
479 event, 0, ctx->afi->family, ctx->table);
485 nfnetlink_send(skb, ctx->net, ctx->portid, NFNLGRP_NFTABLES,
486 ctx->report, GFP_KERNEL);
489 nfnetlink_set_err(ctx->net, ctx->portid, NFNLGRP_NFTABLES, -ENOBUFS);
/*
 * Netlink dump callback for tables. Walks every registered family
 * (restricted to the requested one unless it is NFPROTO_UNSPEC) and
 * every table of that family with the RCU list iterators, emitting one
 * message per table that nft_is_active() accepts. cb->args[0] is read
 * as the resume index; the remaining cb->args[] slots are zeroed while
 * iterating. cb->seq is set from the netns base_seq and
 * nl_dump_check_consistent() is applied to each emitted message.
 */
492 static int nf_tables_dump_tables(struct sk_buff *skb,
493 struct netlink_callback *cb)
495 const struct nfgenmsg *nfmsg = nlmsg_data(cb->nlh);
496 const struct nft_af_info *afi;
497 const struct nft_table *table;
498 unsigned int idx = 0, s_idx = cb->args[0];
499 struct net *net = sock_net(skb->sk);
500 int family = nfmsg->nfgen_family;
503 cb->seq = net->nft.base_seq;
505 list_for_each_entry_rcu(afi, &net->nft.af_info, list) {
506 if (family != NFPROTO_UNSPEC && family != afi->family)
509 list_for_each_entry_rcu(table, &afi->tables, list) {
513 memset(&cb->args[1], 0,
514 sizeof(cb->args) - sizeof(cb->args[0]));
515 if (!nft_is_active(net, table))
517 if (nf_tables_fill_table_info(skb, net,
518 NETLINK_CB(cb->skb).portid,
522 afi->family, table) < 0)
525 nl_dump_check_consistent(cb, nlmsg_hdr(skb));
/*
 * Handler for table "get" requests. With NLM_F_DUMP set, a netlink dump
 * is started using nf_tables_dump_tables(). Otherwise the family is
 * looked up without module autoload, the table is looked up by name in
 * the current generation, a NEWTABLE-typed reply is built into a new
 * skb and unicast back to the requesting port id.
 */
536 static int nf_tables_gettable(struct net *net, struct sock *nlsk,
537 struct sk_buff *skb, const struct nlmsghdr *nlh,
538 const struct nlattr * const nla[],
539 struct netlink_ext_ack *extack)
541 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
542 u8 genmask = nft_genmask_cur(net);
543 const struct nft_af_info *afi;
544 const struct nft_table *table;
545 struct sk_buff *skb2;
546 int family = nfmsg->nfgen_family;
549 if (nlh->nlmsg_flags & NLM_F_DUMP) {
550 struct netlink_dump_control c = {
551 .dump = nf_tables_dump_tables,
553 return netlink_dump_start(nlsk, skb, nlh, &c);
556 afi = nf_tables_afinfo_lookup(net, family, false);
560 table = nf_tables_table_lookup(afi, nla[NFTA_TABLE_NAME], genmask);
562 return PTR_ERR(table);
564 skb2 = alloc_skb(NLMSG_GOODSIZE, GFP_KERNEL);
568 err = nf_tables_fill_table_info(skb2, net, NETLINK_CB(skb).portid,
569 nlh->nlmsg_seq, NFT_MSG_NEWTABLE, 0,
574 return nlmsg_unicast(nlsk, skb2, NETLINK_CB(skb).portid);
/*
 * Unregister the hooks of the table's base chains that are active in
 * the next generation. NOTE(review): the `cnt && i++ == cnt` check
 * suggests a non-zero count limits how many chains are processed (used
 * for partial rollback), with 0 meaning no limit -- confirm.
 */
581 static void _nf_tables_table_disable(struct net *net,
582 const struct nft_af_info *afi,
583 struct nft_table *table,
586 struct nft_chain *chain;
589 list_for_each_entry(chain, &table->chains, list) {
590 if (!nft_is_active_next(net, chain))
592 if (!nft_is_base_chain(chain))
595 if (cnt && i++ == cnt)
598 nf_unregister_net_hooks(net, nft_base_chain(chain)->ops,
/*
 * Register the hooks of every base chain of @table that is active in
 * the next generation. The trailing _nf_tables_table_disable(..., i)
 * call is the unwind step (presumably undoing the chains registered so
 * far when a registration fails -- TODO confirm).
 */
603 static int nf_tables_table_enable(struct net *net,
604 const struct nft_af_info *afi,
605 struct nft_table *table)
607 struct nft_chain *chain;
610 list_for_each_entry(chain, &table->chains, list) {
611 if (!nft_is_active_next(net, chain))
613 if (!nft_is_base_chain(chain))
616 err = nf_register_net_hooks(net, nft_base_chain(chain)->ops,
626 _nf_tables_table_disable(net, afi, table, i);
/* Wrapper: _nf_tables_table_disable() with a count argument of 0. */
630 static void nf_tables_table_disable(struct net *net,
631 const struct nft_af_info *afi,
632 struct nft_table *table)
634 _nf_tables_table_disable(net, afi, table, 0);
/*
 * Queue a flags update for an existing table. The new flags come from
 * NFTA_TABLE_FLAGS; bits other than NFT_TABLE_F_DORMANT and an
 * unchanged flags value are both special-cased by the checks below.
 * When the table goes dormant, the transaction records enable = false.
 * When it leaves dormant state, hooks are registered right away through
 * nf_tables_table_enable(), the DORMANT bit is cleared and the
 * transaction records enable = true. The transaction is flagged as an
 * update and appended to the commit list; nft_trans_destroy() appears
 * on the unwind path.
 */
637 static int nf_tables_updtable(struct nft_ctx *ctx)
639 struct nft_trans *trans;
643 if (!ctx->nla[NFTA_TABLE_FLAGS])
646 flags = ntohl(nla_get_be32(ctx->nla[NFTA_TABLE_FLAGS]));
647 if (flags & ~NFT_TABLE_F_DORMANT)
650 if (flags == ctx->table->flags)
653 trans = nft_trans_alloc(ctx, NFT_MSG_NEWTABLE,
654 sizeof(struct nft_trans_table));
658 if ((flags & NFT_TABLE_F_DORMANT) &&
659 !(ctx->table->flags & NFT_TABLE_F_DORMANT)) {
660 nft_trans_table_enable(trans) = false;
661 } else if (!(flags & NFT_TABLE_F_DORMANT) &&
662 ctx->table->flags & NFT_TABLE_F_DORMANT) {
663 ret = nf_tables_table_enable(ctx->net, ctx->afi, ctx->table);
665 ctx->table->flags &= ~NFT_TABLE_F_DORMANT;
666 nft_trans_table_enable(trans) = true;
672 nft_trans_table_update(trans) = true;
673 list_add_tail(&trans->list, &ctx->net->nft.commit_list);
676 nft_trans_destroy(trans);
/*
 * Handler for NEWTABLE requests: update an existing table or create a
 * new one. The family is looked up with module autoload enabled and the
 * table is looked up by name in the next generation; a lookup error
 * other than -ENOENT is returned to the caller. For an existing table
 * NLM_F_EXCL and NLM_F_REPLACE are checked before delegating to
 * nf_tables_updtable(). For a new table: flags are validated against
 * NFT_TABLE_F_DORMANT, a reference on the family's module is taken, the
 * table is allocated zeroed, its name is copied (bounded by
 * NFT_TABLE_MAXNAMELEN), its lists are initialised, a NEWTABLE
 * transaction is queued and the table is linked into the family's table
 * list with the RCU list primitive. module_put() is the visible part of
 * the error unwind.
 */
680 static int nf_tables_newtable(struct net *net, struct sock *nlsk,
681 struct sk_buff *skb, const struct nlmsghdr *nlh,
682 const struct nlattr * const nla[],
683 struct netlink_ext_ack *extack)
685 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
686 u8 genmask = nft_genmask_next(net);
687 const struct nlattr *name;
688 struct nft_af_info *afi;
689 struct nft_table *table;
690 int family = nfmsg->nfgen_family;
695 afi = nf_tables_afinfo_lookup(net, family, true);
699 name = nla[NFTA_TABLE_NAME];
700 table = nf_tables_table_lookup(afi, name, genmask);
702 if (PTR_ERR(table) != -ENOENT)
703 return PTR_ERR(table);
705 if (nlh->nlmsg_flags & NLM_F_EXCL)
707 if (nlh->nlmsg_flags & NLM_F_REPLACE)
710 nft_ctx_init(&ctx, net, skb, nlh, afi, table, NULL, nla);
711 return nf_tables_updtable(&ctx);
714 if (nla[NFTA_TABLE_FLAGS]) {
715 flags = ntohl(nla_get_be32(nla[NFTA_TABLE_FLAGS]));
716 if (flags & ~NFT_TABLE_F_DORMANT)
721 if (!try_module_get(afi->owner))
725 table = kzalloc(sizeof(*table), GFP_KERNEL);
729 nla_strlcpy(table->name, name, NFT_TABLE_MAXNAMELEN);
730 INIT_LIST_HEAD(&table->chains);
731 INIT_LIST_HEAD(&table->sets);
732 INIT_LIST_HEAD(&table->objects);
733 table->flags = flags;
735 nft_ctx_init(&ctx, net, skb, nlh, afi, table, NULL, nla);
736 err = nft_trans_table_add(&ctx, NFT_MSG_NEWTABLE);
740 list_add_tail_rcu(&table->list, &afi->tables);
745 module_put(afi->owner);
/*
 * Queue deletion of everything in ctx->table, in this order: the rules
 * of each chain active in the next generation, then sets, then objects,
 * then the chains themselves, and finally the table. Sets and chains
 * that are not active in the next generation are filtered by the
 * nft_is_active_next() checks; anonymous sets that still have bindings
 * are special-cased (presumably skipped -- TODO confirm).
 */
750 static int nft_flush_table(struct nft_ctx *ctx)
753 struct nft_chain *chain, *nc;
754 struct nft_object *obj, *ne;
755 struct nft_set *set, *ns;
757 list_for_each_entry(chain, &ctx->table->chains, list) {
758 if (!nft_is_active_next(ctx->net, chain))
763 err = nft_delrule_by_chain(ctx);
768 list_for_each_entry_safe(set, ns, &ctx->table->sets, list) {
769 if (!nft_is_active_next(ctx->net, set))
772 if (set->flags & NFT_SET_ANONYMOUS &&
773 !list_empty(&set->bindings))
776 err = nft_delset(ctx, set);
781 list_for_each_entry_safe(obj, ne, &ctx->table->objects, list) {
782 err = nft_delobj(ctx, obj);
787 list_for_each_entry_safe(chain, nc, &ctx->table->chains, list) {
788 if (!nft_is_active_next(ctx->net, chain))
793 err = nft_delchain(ctx);
798 err = nft_deltable(ctx);
/*
 * Flush tables across families. Iterates the registered families
 * (restricted to @family unless it is AF_UNSPEC) and their tables,
 * filtering on tables active in the next generation and, when
 * NFTA_TABLE_NAME is present, on a matching table name; matching tables
 * are flushed with nft_flush_table().
 */
803 static int nft_flush(struct nft_ctx *ctx, int family)
805 struct nft_af_info *afi;
806 struct nft_table *table, *nt;
807 const struct nlattr * const *nla = ctx->nla;
810 list_for_each_entry(afi, &ctx->net->nft.af_info, list) {
811 if (family != AF_UNSPEC && afi->family != family)
815 list_for_each_entry_safe(table, nt, &afi->tables, list) {
816 if (!nft_is_active_next(ctx->net, table))
819 if (nla[NFTA_TABLE_NAME] &&
820 nla_strcmp(nla[NFTA_TABLE_NAME], table->name) != 0)
825 err = nft_flush_table(ctx);
/*
 * Handler for DELTABLE requests. If the family is AF_UNSPEC or no table
 * name is given, the request is treated as a flush via nft_flush().
 * Otherwise the family (no autoload) and the named table (next
 * generation) are looked up and that single table is flushed with
 * nft_flush_table().
 */
834 static int nf_tables_deltable(struct net *net, struct sock *nlsk,
835 struct sk_buff *skb, const struct nlmsghdr *nlh,
836 const struct nlattr * const nla[],
837 struct netlink_ext_ack *extack)
839 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
840 u8 genmask = nft_genmask_next(net);
841 struct nft_af_info *afi;
842 struct nft_table *table;
843 int family = nfmsg->nfgen_family;
846 nft_ctx_init(&ctx, net, skb, nlh, NULL, NULL, NULL, nla);
847 if (family == AF_UNSPEC || nla[NFTA_TABLE_NAME] == NULL)
848 return nft_flush(&ctx, family);
850 afi = nf_tables_afinfo_lookup(net, family, false);
854 table = nf_tables_table_lookup(afi, nla[NFTA_TABLE_NAME], genmask);
856 return PTR_ERR(table);
861 return nft_flush_table(&ctx);
/*
 * Final teardown of ctx->table. It is a BUG if the table still has a
 * non-zero use count. Drops the module reference held on the family's
 * owner (the counterpart of the try_module_get() in
 * nf_tables_newtable()).
 */
864 static void nf_tables_table_destroy(struct nft_ctx *ctx)
866 BUG_ON(ctx->table->use > 0);
869 module_put(ctx->afi->owner);
/*
 * Install @ctype in the chain_type table at [family][type] under the
 * nfnl nf_tables lock. An out-of-range family triggers WARN_ON, and an
 * already occupied slot is special-cased before the store (presumably
 * rejected with an error -- TODO confirm).
 */
872 int nft_register_chain_type(const struct nf_chain_type *ctype)
876 if (WARN_ON(ctype->family >= NFPROTO_NUMPROTO))
879 nfnl_lock(NFNL_SUBSYS_NFTABLES);
880 if (chain_type[ctype->family][ctype->type] != NULL) {
884 chain_type[ctype->family][ctype->type] = ctype;
886 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
889 EXPORT_SYMBOL_GPL(nft_register_chain_type);
/*
 * Clear the chain_type slot for @ctype under the nfnl nf_tables lock.
 * NOTE(review): unlike nft_register_chain_type(), no bounds check on
 * ctype->family is visible here -- confirm this is only called for
 * types that were successfully registered.
 */
891 void nft_unregister_chain_type(const struct nf_chain_type *ctype)
893 nfnl_lock(NFNL_SUBSYS_NFTABLES);
894 chain_type[ctype->family][ctype->type] = NULL;
895 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
897 EXPORT_SYMBOL_GPL(nft_unregister_chain_type);
/*
 * Find the chain of @table whose handle equals @handle and which is
 * active in the given generation mask. Returns ERR_PTR(-ENOENT) when
 * the loop finds no match.
 */
903 static struct nft_chain *
904 nf_tables_chain_lookup_byhandle(const struct nft_table *table, u64 handle,
907 struct nft_chain *chain;
909 list_for_each_entry(chain, &table->chains, list) {
910 if (chain->handle == handle &&
911 nft_active_genmask(chain, genmask))
915 return ERR_PTR(-ENOENT);
/*
 * Find the chain of @table whose name equals the string in netlink
 * attribute @nla and which is active in the given generation mask.
 * Errors are returned as ERR_PTR(): -EINVAL (presumably for a missing
 * attribute -- TODO confirm) and -ENOENT when no chain matches.
 */
918 static struct nft_chain *nf_tables_chain_lookup(const struct nft_table *table,
919 const struct nlattr *nla,
922 struct nft_chain *chain;
925 return ERR_PTR(-EINVAL);
927 list_for_each_entry(chain, &table->chains, list) {
928 if (!nla_strcmp(nla, chain->name) &&
929 nft_active_genmask(chain, genmask))
933 return ERR_PTR(-ENOENT);
/*
 * Netlink attribute policy for NFTA_CHAIN_* attributes. Table and chain
 * names are length-limited strings, handle is 64-bit, policy is 32-bit,
 * hook and counters are nested attributes. Note that the chain type
 * string has no length limit in this policy.
 */
936 static const struct nla_policy nft_chain_policy[NFTA_CHAIN_MAX + 1] = {
937 [NFTA_CHAIN_TABLE] = { .type = NLA_STRING,
938 .len = NFT_TABLE_MAXNAMELEN - 1 },
939 [NFTA_CHAIN_HANDLE] = { .type = NLA_U64 },
940 [NFTA_CHAIN_NAME] = { .type = NLA_STRING,
941 .len = NFT_CHAIN_MAXNAMELEN - 1 },
942 [NFTA_CHAIN_HOOK] = { .type = NLA_NESTED },
943 [NFTA_CHAIN_POLICY] = { .type = NLA_U32 },
944 [NFTA_CHAIN_TYPE] = { .type = NLA_STRING },
945 [NFTA_CHAIN_COUNTERS] = { .type = NLA_NESTED },
/*
 * Netlink attribute policy for the nested NFTA_HOOK_* attributes: hook
 * number and priority are 32-bit, the device name is a string of at
 * most IFNAMSIZ - 1 bytes.
 */
948 static const struct nla_policy nft_hook_policy[NFTA_HOOK_MAX + 1] = {
949 [NFTA_HOOK_HOOKNUM] = { .type = NLA_U32 },
950 [NFTA_HOOK_PRIORITY] = { .type = NLA_U32 },
951 [NFTA_HOOK_DEV] = { .type = NLA_STRING,
952 .len = IFNAMSIZ - 1 },
/*
 * Emit a nested NFTA_CHAIN_COUNTERS attribute with packet and byte
 * totals. The per-cpu counters of every possible CPU are read inside a
 * u64_stats fetch/retry loop so each snapshot is consistent, and are
 * accumulated into a local total. The totals are written as big-endian
 * 64-bit attributes.
 */
955 static int nft_dump_stats(struct sk_buff *skb, struct nft_stats __percpu *stats)
957 struct nft_stats *cpu_stats, total;
963 memset(&total, 0, sizeof(total));
964 for_each_possible_cpu(cpu) {
965 cpu_stats = per_cpu_ptr(stats, cpu);
967 seq = u64_stats_fetch_begin_irq(&cpu_stats->syncp);
968 pkts = cpu_stats->pkts;
969 bytes = cpu_stats->bytes;
970 } while (u64_stats_fetch_retry_irq(&cpu_stats->syncp, seq));
972 total.bytes += bytes;
974 nest = nla_nest_start(skb, NFTA_CHAIN_COUNTERS);
976 goto nla_put_failure;
978 if (nla_put_be64(skb, NFTA_COUNTER_PACKETS, cpu_to_be64(total.pkts),
980 nla_put_be64(skb, NFTA_COUNTER_BYTES, cpu_to_be64(total.bytes),
982 goto nla_put_failure;
984 nla_nest_end(skb, nest);
/*
 * Append one chain message to @skb. After the nfgenmsg header (family,
 * NFNETLINK_V0, res_id = low 16 bits of the netns base_seq) the message
 * carries the table name, the chain handle (big-endian 64-bit) and the
 * chain name. For base chains it additionally carries a nested
 * NFTA_CHAIN_HOOK (hook number, priority and, when set, the device
 * name, all taken from the first hook ops entry), the chain policy, the
 * chain type name and the counters from nft_dump_stats(). The chain's
 * use counter is emitted for all chains. Any failure jumps to the
 * nla_put_failure label, where the partial message is trimmed off.
 */
991 static int nf_tables_fill_chain_info(struct sk_buff *skb, struct net *net,
992 u32 portid, u32 seq, int event, u32 flags,
993 int family, const struct nft_table *table,
994 const struct nft_chain *chain)
996 struct nlmsghdr *nlh;
997 struct nfgenmsg *nfmsg;
999 event = nfnl_msg_type(NFNL_SUBSYS_NFTABLES, event);
1000 nlh = nlmsg_put(skb, portid, seq, event, sizeof(struct nfgenmsg), flags);
1002 goto nla_put_failure;
1004 nfmsg = nlmsg_data(nlh);
1005 nfmsg->nfgen_family = family;
1006 nfmsg->version = NFNETLINK_V0;
1007 nfmsg->res_id = htons(net->nft.base_seq & 0xffff);
1009 if (nla_put_string(skb, NFTA_CHAIN_TABLE, table->name))
1010 goto nla_put_failure;
1011 if (nla_put_be64(skb, NFTA_CHAIN_HANDLE, cpu_to_be64(chain->handle),
1013 goto nla_put_failure;
1014 if (nla_put_string(skb, NFTA_CHAIN_NAME, chain->name))
1015 goto nla_put_failure;
/* Base chains carry hook, policy, type and counter information. */
1017 if (nft_is_base_chain(chain)) {
1018 const struct nft_base_chain *basechain = nft_base_chain(chain);
1019 const struct nf_hook_ops *ops = &basechain->ops[0];
1020 struct nlattr *nest;
1022 nest = nla_nest_start(skb, NFTA_CHAIN_HOOK);
1024 goto nla_put_failure;
1025 if (nla_put_be32(skb, NFTA_HOOK_HOOKNUM, htonl(ops->hooknum)))
1026 goto nla_put_failure;
1027 if (nla_put_be32(skb, NFTA_HOOK_PRIORITY, htonl(ops->priority)))
1028 goto nla_put_failure;
1029 if (basechain->dev_name[0] &&
1030 nla_put_string(skb, NFTA_HOOK_DEV, basechain->dev_name))
1031 goto nla_put_failure;
1032 nla_nest_end(skb, nest);
1034 if (nla_put_be32(skb, NFTA_CHAIN_POLICY,
1035 htonl(basechain->policy)))
1036 goto nla_put_failure;
1038 if (nla_put_string(skb, NFTA_CHAIN_TYPE, basechain->type->name))
1039 goto nla_put_failure;
1041 if (nft_dump_stats(skb, nft_base_chain(chain)->stats))
1042 goto nla_put_failure;
1045 if (nla_put_be32(skb, NFTA_CHAIN_USE, htonl(chain->use)))
1046 goto nla_put_failure;
1048 nlmsg_end(skb, nlh);
1052 nlmsg_trim(skb, nlh);
/*
 * Send a chain event notification to the NFNLGRP_NFTABLES multicast
 * group. A message is built with nf_tables_fill_chain_info() into a
 * freshly allocated skb and handed to nfnetlink_send(); the error path
 * reports -ENOBUFS to the group via nfnetlink_set_err(). The listener
 * check below is part of an early-exit condition.
 */
1056 static void nf_tables_chain_notify(const struct nft_ctx *ctx, int event)
1058 struct sk_buff *skb;
1062 !nfnetlink_has_listeners(ctx->net, NFNLGRP_NFTABLES))
1065 skb = nlmsg_new(NLMSG_GOODSIZE, GFP_KERNEL);
1069 err = nf_tables_fill_chain_info(skb, ctx->net, ctx->portid, ctx->seq,
1070 event, 0, ctx->afi->family, ctx->table,
1077 nfnetlink_send(skb, ctx->net, ctx->portid, NFNLGRP_NFTABLES,
1078 ctx->report, GFP_KERNEL);
1081 nfnetlink_set_err(ctx->net, ctx->portid, NFNLGRP_NFTABLES, -ENOBUFS);
/*
 * Netlink dump callback for chains. Walks families (restricted to the
 * requested one unless it is NFPROTO_UNSPEC), their tables and each
 * table's chains with the RCU list iterators, emitting one message per
 * chain that nft_is_active() accepts. cb->args[0] is read as the resume
 * index; the remaining cb->args[] slots are zeroed while iterating.
 * cb->seq is set from the netns base_seq and nl_dump_check_consistent()
 * is applied to each emitted message.
 */
1084 static int nf_tables_dump_chains(struct sk_buff *skb,
1085 struct netlink_callback *cb)
1087 const struct nfgenmsg *nfmsg = nlmsg_data(cb->nlh);
1088 const struct nft_af_info *afi;
1089 const struct nft_table *table;
1090 const struct nft_chain *chain;
1091 unsigned int idx = 0, s_idx = cb->args[0];
1092 struct net *net = sock_net(skb->sk);
1093 int family = nfmsg->nfgen_family;
1096 cb->seq = net->nft.base_seq;
1098 list_for_each_entry_rcu(afi, &net->nft.af_info, list) {
1099 if (family != NFPROTO_UNSPEC && family != afi->family)
1102 list_for_each_entry_rcu(table, &afi->tables, list) {
1103 list_for_each_entry_rcu(chain, &table->chains, list) {
1107 memset(&cb->args[1], 0,
1108 sizeof(cb->args) - sizeof(cb->args[0]));
1109 if (!nft_is_active(net, chain))
1111 if (nf_tables_fill_chain_info(skb, net,
1112 NETLINK_CB(cb->skb).portid,
1116 afi->family, table, chain) < 0)
1119 nl_dump_check_consistent(cb, nlmsg_hdr(skb));
/*
 * Handler for chain "get" requests. With NLM_F_DUMP set, a netlink dump
 * is started using nf_tables_dump_chains(). Otherwise the family (no
 * autoload), the table and the chain are looked up in the current
 * generation, each lookup failure being returned via PTR_ERR(); a
 * NEWCHAIN-typed reply is then built into a new skb and unicast back to
 * the requesting port id.
 */
1131 static int nf_tables_getchain(struct net *net, struct sock *nlsk,
1132 struct sk_buff *skb, const struct nlmsghdr *nlh,
1133 const struct nlattr * const nla[],
1134 struct netlink_ext_ack *extack)
1136 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
1137 u8 genmask = nft_genmask_cur(net);
1138 const struct nft_af_info *afi;
1139 const struct nft_table *table;
1140 const struct nft_chain *chain;
1141 struct sk_buff *skb2;
1142 int family = nfmsg->nfgen_family;
1145 if (nlh->nlmsg_flags & NLM_F_DUMP) {
1146 struct netlink_dump_control c = {
1147 .dump = nf_tables_dump_chains,
1149 return netlink_dump_start(nlsk, skb, nlh, &c);
1152 afi = nf_tables_afinfo_lookup(net, family, false);
1154 return PTR_ERR(afi);
1156 table = nf_tables_table_lookup(afi, nla[NFTA_CHAIN_TABLE], genmask);
1158 return PTR_ERR(table);
1160 chain = nf_tables_chain_lookup(table, nla[NFTA_CHAIN_NAME], genmask);
1162 return PTR_ERR(chain);
1164 skb2 = alloc_skb(NLMSG_GOODSIZE, GFP_KERNEL);
1168 err = nf_tables_fill_chain_info(skb2, net, NETLINK_CB(skb).portid,
1169 nlh->nlmsg_seq, NFT_MSG_NEWCHAIN, 0,
1170 family, table, chain);
1174 return nlmsg_unicast(nlsk, skb2, NETLINK_CB(skb).portid);
/*
 * Netlink attribute policy for the nested NFTA_COUNTER_* attributes:
 * both the packet and the byte counter are 64-bit values.
 */
1181 static const struct nla_policy nft_counter_policy[NFTA_COUNTER_MAX + 1] = {
1182 [NFTA_COUNTER_PACKETS] = { .type = NLA_U64 },
1183 [NFTA_COUNTER_BYTES] = { .type = NLA_U64 },
/*
 * Parse a nested counters attribute and allocate per-cpu chain
 * statistics seeded with its values. Both NFTA_COUNTER_BYTES and
 * NFTA_COUNTER_PACKETS must be present. The supplied totals are stored
 * (converted from big-endian) into the current CPU's slot only. Errors
 * are returned as ERR_PTR(): the parse error, -EINVAL for a missing
 * counter attribute, -ENOMEM when the per-cpu allocation fails.
 */
1186 static struct nft_stats __percpu *nft_stats_alloc(const struct nlattr *attr)
1188 struct nlattr *tb[NFTA_COUNTER_MAX+1];
1189 struct nft_stats __percpu *newstats;
1190 struct nft_stats *stats;
1193 err = nla_parse_nested(tb, NFTA_COUNTER_MAX, attr, nft_counter_policy,
1196 return ERR_PTR(err);
1198 if (!tb[NFTA_COUNTER_BYTES] || !tb[NFTA_COUNTER_PACKETS])
1199 return ERR_PTR(-EINVAL);
1201 newstats = netdev_alloc_pcpu_stats(struct nft_stats);
1202 if (newstats == NULL)
1203 return ERR_PTR(-ENOMEM);
1205 /* Restore old counters on this cpu, no problem. Per-cpu statistics
1206 * are not exposed to userspace.
1209 stats = this_cpu_ptr(newstats);
1210 stats->bytes = be64_to_cpu(nla_get_be64(tb[NFTA_COUNTER_BYTES]));
1211 stats->pkts = be64_to_cpu(nla_get_be64(tb[NFTA_COUNTER_PACKETS]));
/*
 * Install @newstats as the statistics of a base chain. A NULL
 * @newstats is special-cased first. Two publication paths are visible:
 * one reads the old pointer with nft_dereference(), publishes the new
 * one with rcu_assign_pointer() and frees the old per-cpu data; the
 * other only publishes the new pointer (presumably used when no old
 * statistics exist -- TODO confirm). NOTE(review): whether a grace
 * period separates the publish from free_percpu() is not visible here.
 */
1217 static void nft_chain_stats_replace(struct nft_base_chain *chain,
1218 struct nft_stats __percpu *newstats)
1220 if (newstats == NULL)
1224 struct nft_stats __percpu *oldstats =
1225 nft_dereference(chain->stats);
1227 rcu_assign_pointer(chain->stats, newstats);
1229 free_percpu(oldstats);
1231 rcu_assign_pointer(chain->stats, newstats);
/*
 * Final teardown of a chain. It is a BUG if the chain still has a
 * non-zero use count. For base chains the reference on the chain type's
 * module is dropped, the per-cpu statistics are freed and, if the first
 * hook ops entry is bound to a device, that device reference is
 * released.
 */
1234 static void nf_tables_chain_destroy(struct nft_chain *chain)
1236 BUG_ON(chain->use > 0);
1238 if (nft_is_base_chain(chain)) {
1239 struct nft_base_chain *basechain = nft_base_chain(chain);
1241 module_put(basechain->type->owner);
1242 free_percpu(basechain->stats);
1243 if (basechain->ops[0].dev != NULL)
1244 dev_put(basechain->ops[0].dev);
/*
 * Result of parsing a NFTA_CHAIN_HOOK attribute; filled in by
 * nft_chain_parse_hook() and released with nft_chain_release_hook().
 * type: chain type (a module reference is held on its owner);
 * dev: bound network device, may be NULL.
 */
1251 struct nft_chain_hook {
1254 const struct nf_chain_type *type;
1255 struct net_device *dev;
/*
 * Parse the nested NFTA_CHAIN_HOOK attribute into @hook. Hook number
 * and priority are mandatory and are converted from network byte order;
 * the hook number is checked against the family's hook count. The chain
 * type defaults to the family's NFT_CHAIN_T_DEFAULT entry and may be
 * overridden by NFTA_CHAIN_TYPE; the type must support the hook number
 * according to its hook_mask, and a reference on its module is taken.
 * Families flagged NFT_AF_NEEDS_DEV require NFTA_HOOK_DEV and resolve
 * it with dev_get_by_name(); a device attribute on any other family is
 * handled by the last branch. Each failure path after the module
 * reference was taken drops it again with module_put().
 */
1258 static int nft_chain_parse_hook(struct net *net,
1259 const struct nlattr * const nla[],
1260 struct nft_af_info *afi,
1261 struct nft_chain_hook *hook, bool create)
1263 struct nlattr *ha[NFTA_HOOK_MAX + 1];
1264 const struct nf_chain_type *type;
1265 struct net_device *dev;
1268 err = nla_parse_nested(ha, NFTA_HOOK_MAX, nla[NFTA_CHAIN_HOOK],
1269 nft_hook_policy, NULL);
1273 if (ha[NFTA_HOOK_HOOKNUM] == NULL ||
1274 ha[NFTA_HOOK_PRIORITY] == NULL)
1277 hook->num = ntohl(nla_get_be32(ha[NFTA_HOOK_HOOKNUM]));
1278 if (hook->num >= afi->nhooks)
1281 hook->priority = ntohl(nla_get_be32(ha[NFTA_HOOK_PRIORITY]));
1283 type = chain_type[afi->family][NFT_CHAIN_T_DEFAULT];
1284 if (nla[NFTA_CHAIN_TYPE]) {
1285 type = nf_tables_chain_type_lookup(afi, nla[NFTA_CHAIN_TYPE],
1288 return PTR_ERR(type);
1290 if (!(type->hook_mask & (1 << hook->num)))
1292 if (!try_module_get(type->owner))
1298 if (afi->flags & NFT_AF_NEEDS_DEV) {
1299 char ifname[IFNAMSIZ];
1301 if (!ha[NFTA_HOOK_DEV]) {
1302 module_put(type->owner);
1306 nla_strlcpy(ifname, ha[NFTA_HOOK_DEV], IFNAMSIZ);
1307 dev = dev_get_by_name(net, ifname);
1309 module_put(type->owner);
1313 } else if (ha[NFTA_HOOK_DEV]) {
1314 module_put(type->owner);
/*
 * Release what nft_chain_parse_hook() acquired: the module reference on
 * the chain type's owner and, when a device is set, the device (the
 * statement guarded by the NULL check below).
 */
1321 static void nft_chain_release_hook(struct nft_chain_hook *hook)
1323 module_put(hook->type->owner);
1324 if (hook->dev != NULL)
/*
 * Handler for NEWCHAIN requests: update an existing chain or create a
 * new one.
 *
 * The family (with autoload) and table are looked up first, then the
 * chain, by handle when NFTA_CHAIN_HANDLE is present and by name
 * otherwise. NFTA_CHAIN_POLICY is only meaningful for base chains: it
 * is checked against an existing non-base chain and against creation
 * without NFTA_CHAIN_HOOK.
 *
 * Update path (chain != NULL): NLM_F_EXCL / NLM_F_REPLACE are checked;
 * a supplied hook must match the existing base chain's type, hook
 * number, priority and device; a rename (handle plus name) is checked
 * against existing chain names; optional new counters are allocated;
 * finally a NEWCHAIN transaction flagged as update is queued carrying
 * the stats, the policy (-1 when not supplied) and the new name.
 *
 * Create path: with NFTA_CHAIN_HOOK a base chain is allocated, its
 * statistics are either restored from NFTA_CHAIN_COUNTERS or freshly
 * allocated, and the family's afi->nops hook ops entries are filled in;
 * otherwise a plain chain is allocated. The chain receives a new
 * handle, its hooks are registered, a NEWCHAIN transaction is queued
 * and the chain is linked into the table with the RCU list primitive.
 * Hook unregistration and nf_tables_chain_destroy() form the unwind.
 */
1328 static int nf_tables_newchain(struct net *net, struct sock *nlsk,
1329 struct sk_buff *skb, const struct nlmsghdr *nlh,
1330 const struct nlattr * const nla[],
1331 struct netlink_ext_ack *extack)
1333 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
1334 const struct nlattr * uninitialized_var(name);
1335 struct nft_af_info *afi;
1336 struct nft_table *table;
1337 struct nft_chain *chain;
1338 struct nft_base_chain *basechain = NULL;
1339 u8 genmask = nft_genmask_next(net);
1340 int family = nfmsg->nfgen_family;
1341 u8 policy = NF_ACCEPT;
1344 struct nft_stats __percpu *stats;
1349 create = nlh->nlmsg_flags & NLM_F_CREATE ? true : false;
1351 afi = nf_tables_afinfo_lookup(net, family, true);
1353 return PTR_ERR(afi);
1355 table = nf_tables_table_lookup(afi, nla[NFTA_CHAIN_TABLE], genmask);
1357 return PTR_ERR(table);
1360 name = nla[NFTA_CHAIN_NAME];
1362 if (nla[NFTA_CHAIN_HANDLE]) {
1363 handle = be64_to_cpu(nla_get_be64(nla[NFTA_CHAIN_HANDLE]));
1364 chain = nf_tables_chain_lookup_byhandle(table, handle, genmask);
1366 return PTR_ERR(chain);
1368 chain = nf_tables_chain_lookup(table, name, genmask);
1369 if (IS_ERR(chain)) {
1370 if (PTR_ERR(chain) != -ENOENT)
1371 return PTR_ERR(chain);
1376 if (nla[NFTA_CHAIN_POLICY]) {
1377 if (chain != NULL &&
1378 !nft_is_base_chain(chain))
1381 if (chain == NULL &&
1382 nla[NFTA_CHAIN_HOOK] == NULL)
1385 policy = ntohl(nla_get_be32(nla[NFTA_CHAIN_POLICY]));
/* Update path: the chain already exists. */
1395 if (chain != NULL) {
/*
 * NOTE(review): this local shadows the function-scope `stats` and is
 * declared without the __percpu annotation the outer one has.
 */
1396 struct nft_stats *stats = NULL;
1397 struct nft_trans *trans;
1399 if (nlh->nlmsg_flags & NLM_F_EXCL)
1401 if (nlh->nlmsg_flags & NLM_F_REPLACE)
1404 if (nla[NFTA_CHAIN_HOOK]) {
/* NOTE(review): shadows the function-scope `basechain`. */
1405 struct nft_base_chain *basechain;
1406 struct nft_chain_hook hook;
1407 struct nf_hook_ops *ops;
1409 if (!nft_is_base_chain(chain))
1412 err = nft_chain_parse_hook(net, nla, afi, &hook,
1417 basechain = nft_base_chain(chain);
1418 if (basechain->type != hook.type) {
1419 nft_chain_release_hook(&hook);
1423 for (i = 0; i < afi->nops; i++) {
1424 ops = &basechain->ops[i];
1425 if (ops->hooknum != hook.num ||
1426 ops->priority != hook.priority ||
1427 ops->dev != hook.dev) {
1428 nft_chain_release_hook(&hook);
1432 nft_chain_release_hook(&hook);
1435 if (nla[NFTA_CHAIN_HANDLE] && name) {
1436 struct nft_chain *chain2;
1438 chain2 = nf_tables_chain_lookup(table,
1439 nla[NFTA_CHAIN_NAME],
1442 return PTR_ERR(chain2);
1445 if (nla[NFTA_CHAIN_COUNTERS]) {
1446 if (!nft_is_base_chain(chain))
1449 stats = nft_stats_alloc(nla[NFTA_CHAIN_COUNTERS]);
1451 return PTR_ERR(stats);
1454 nft_ctx_init(&ctx, net, skb, nlh, afi, table, chain, nla);
1455 trans = nft_trans_alloc(&ctx, NFT_MSG_NEWCHAIN,
1456 sizeof(struct nft_trans_chain));
1457 if (trans == NULL) {
1462 nft_trans_chain_stats(trans) = stats;
1463 nft_trans_chain_update(trans) = true;
1465 if (nla[NFTA_CHAIN_POLICY])
1466 nft_trans_chain_policy(trans) = policy;
1468 nft_trans_chain_policy(trans) = -1;
1470 if (nla[NFTA_CHAIN_HANDLE] && name) {
1471 nla_strlcpy(nft_trans_chain_name(trans), name,
1472 NFT_CHAIN_MAXNAMELEN);
1474 list_add_tail(&trans->list, &net->nft.commit_list);
/* Create path: guard the table's use counter against overflow. */
1478 if (table->use == UINT_MAX)
1481 if (nla[NFTA_CHAIN_HOOK]) {
1482 struct nft_chain_hook hook;
1483 struct nf_hook_ops *ops;
1486 err = nft_chain_parse_hook(net, nla, afi, &hook, create);
1490 basechain = kzalloc(sizeof(*basechain), GFP_KERNEL);
1491 if (basechain == NULL) {
1492 nft_chain_release_hook(&hook);
/*
 * NOTE(review): strncpy() leaves the destination unterminated when the
 * source is IFNAMSIZ or longer; this relies on hook.dev->name being
 * NUL-terminated within IFNAMSIZ -- confirm.
 */
1496 if (hook.dev != NULL)
1497 strncpy(basechain->dev_name, hook.dev->name, IFNAMSIZ);
1499 if (nla[NFTA_CHAIN_COUNTERS]) {
1500 stats = nft_stats_alloc(nla[NFTA_CHAIN_COUNTERS]);
1501 if (IS_ERR(stats)) {
1502 nft_chain_release_hook(&hook);
1504 return PTR_ERR(stats);
1506 basechain->stats = stats;
1508 stats = netdev_alloc_pcpu_stats(struct nft_stats);
1509 if (stats == NULL) {
1510 nft_chain_release_hook(&hook);
1514 rcu_assign_pointer(basechain->stats, stats);
1517 hookfn = hook.type->hooks[hook.num];
1518 basechain->type = hook.type;
1519 chain = &basechain->chain;
/* Fill in one hook ops entry per op the family defines. */
1521 for (i = 0; i < afi->nops; i++) {
1522 ops = &basechain->ops[i];
1524 ops->hooknum = hook.num;
1525 ops->priority = hook.priority;
1527 ops->hook = afi->hooks[ops->hooknum];
1528 ops->dev = hook.dev;
1531 if (afi->hook_ops_init)
1532 afi->hook_ops_init(ops, i);
1535 chain->flags |= NFT_BASE_CHAIN;
1536 basechain->policy = policy;
1538 chain = kzalloc(sizeof(*chain), GFP_KERNEL);
1543 INIT_LIST_HEAD(&chain->rules);
1544 chain->handle = nf_tables_alloc_handle(table);
1545 chain->table = table;
1546 nla_strlcpy(chain->name, name, NFT_CHAIN_MAXNAMELEN);
1548 err = nf_tables_register_hooks(net, table, chain, afi->nops);
1552 nft_ctx_init(&ctx, net, skb, nlh, afi, table, chain, nla);
1553 err = nft_trans_chain_add(&ctx, NFT_MSG_NEWCHAIN);
1558 list_add_tail_rcu(&chain->list, &table->chains);
1561 nf_tables_unregister_hooks(net, table, chain, afi->nops);
1563 nf_tables_chain_destroy(chain);
1567 static int nf_tables_delchain(struct net *net, struct sock *nlsk,
1568 struct sk_buff *skb, const struct nlmsghdr *nlh,
1569 const struct nlattr * const nla[],
1570 struct netlink_ext_ack *extack)
1572 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
1573 u8 genmask = nft_genmask_next(net);
1574 struct nft_af_info *afi;
1575 struct nft_table *table;
1576 struct nft_chain *chain;
1577 int family = nfmsg->nfgen_family;
1580 afi = nf_tables_afinfo_lookup(net, family, false);
1582 return PTR_ERR(afi);
1584 table = nf_tables_table_lookup(afi, nla[NFTA_CHAIN_TABLE], genmask);
1586 return PTR_ERR(table);
1588 chain = nf_tables_chain_lookup(table, nla[NFTA_CHAIN_NAME], genmask);
1590 return PTR_ERR(chain);
1594 nft_ctx_init(&ctx, net, skb, nlh, afi, table, chain, nla);
1596 return nft_delchain(&ctx);
1604 * nft_register_expr - register nf_tables expr type
1607 * Registers the expr type for use with nf_tables. Returns zero on
1608 * success or a negative errno code otherwise.
1610 int nft_register_expr(struct nft_expr_type *type)
1612 nfnl_lock(NFNL_SUBSYS_NFTABLES);
1613 if (type->family == NFPROTO_UNSPEC)
1614 list_add_tail_rcu(&type->list, &nf_tables_expressions);
1616 list_add_rcu(&type->list, &nf_tables_expressions);
1617 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
1620 EXPORT_SYMBOL_GPL(nft_register_expr);
1623 * nft_unregister_expr - unregister nf_tables expr type
1626 * Unregisters the expr typefor use with nf_tables.
1628 void nft_unregister_expr(struct nft_expr_type *type)
1630 nfnl_lock(NFNL_SUBSYS_NFTABLES);
1631 list_del_rcu(&type->list);
1632 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
1634 EXPORT_SYMBOL_GPL(nft_unregister_expr);
1636 static const struct nft_expr_type *__nft_expr_type_get(u8 family,
1639 const struct nft_expr_type *type;
1641 list_for_each_entry(type, &nf_tables_expressions, list) {
1642 if (!nla_strcmp(nla, type->name) &&
1643 (!type->family || type->family == family))
1649 static const struct nft_expr_type *nft_expr_type_get(u8 family,
1652 const struct nft_expr_type *type;
1655 return ERR_PTR(-EINVAL);
1657 type = __nft_expr_type_get(family, nla);
1658 if (type != NULL && try_module_get(type->owner))
1661 #ifdef CONFIG_MODULES
1663 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
1664 request_module("nft-expr-%u-%.*s", family,
1665 nla_len(nla), (char *)nla_data(nla));
1666 nfnl_lock(NFNL_SUBSYS_NFTABLES);
1667 if (__nft_expr_type_get(family, nla))
1668 return ERR_PTR(-EAGAIN);
1670 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
1671 request_module("nft-expr-%.*s",
1672 nla_len(nla), (char *)nla_data(nla));
1673 nfnl_lock(NFNL_SUBSYS_NFTABLES);
1674 if (__nft_expr_type_get(family, nla))
1675 return ERR_PTR(-EAGAIN);
1678 return ERR_PTR(-ENOENT);
1681 static const struct nla_policy nft_expr_policy[NFTA_EXPR_MAX + 1] = {
1682 [NFTA_EXPR_NAME] = { .type = NLA_STRING },
1683 [NFTA_EXPR_DATA] = { .type = NLA_NESTED },
1686 static int nf_tables_fill_expr_info(struct sk_buff *skb,
1687 const struct nft_expr *expr)
1689 if (nla_put_string(skb, NFTA_EXPR_NAME, expr->ops->type->name))
1690 goto nla_put_failure;
1692 if (expr->ops->dump) {
1693 struct nlattr *data = nla_nest_start(skb, NFTA_EXPR_DATA);
1695 goto nla_put_failure;
1696 if (expr->ops->dump(skb, expr) < 0)
1697 goto nla_put_failure;
1698 nla_nest_end(skb, data);
/*
 * Dump @expr into @skb as a nested attribute of type @attr.
 *
 * Returns 0 on success and -1 when the nest could not be opened or the
 * expression could not be written.
 */
int nft_expr_dump(struct sk_buff *skb, unsigned int attr,
		  const struct nft_expr *expr)
{
	struct nlattr *nest;

	nest = nla_nest_start(skb, attr);
	if (!nest)
		goto nla_put_failure;
	if (nf_tables_fill_expr_info(skb, expr) < 0)
		goto nla_put_failure;
	nla_nest_end(skb, nest);
	return 0;

nla_put_failure:
	return -1;
}
1724 struct nft_expr_info {
1725 const struct nft_expr_ops *ops;
1726 struct nlattr *tb[NFT_EXPR_MAXATTR + 1];
1729 static int nf_tables_expr_parse(const struct nft_ctx *ctx,
1730 const struct nlattr *nla,
1731 struct nft_expr_info *info)
1733 const struct nft_expr_type *type;
1734 const struct nft_expr_ops *ops;
1735 struct nlattr *tb[NFTA_EXPR_MAX + 1];
1738 err = nla_parse_nested(tb, NFTA_EXPR_MAX, nla, nft_expr_policy, NULL);
1742 type = nft_expr_type_get(ctx->afi->family, tb[NFTA_EXPR_NAME]);
1744 return PTR_ERR(type);
1746 if (tb[NFTA_EXPR_DATA]) {
1747 err = nla_parse_nested(info->tb, type->maxattr,
1748 tb[NFTA_EXPR_DATA], type->policy, NULL);
1752 memset(info->tb, 0, sizeof(info->tb[0]) * (type->maxattr + 1));
1754 if (type->select_ops != NULL) {
1755 ops = type->select_ops(ctx,
1756 (const struct nlattr * const *)info->tb);
1768 module_put(type->owner);
1772 static int nf_tables_newexpr(const struct nft_ctx *ctx,
1773 const struct nft_expr_info *info,
1774 struct nft_expr *expr)
1776 const struct nft_expr_ops *ops = info->ops;
1781 err = ops->init(ctx, expr, (const struct nlattr **)info->tb);
1786 if (ops->validate) {
1787 const struct nft_data *data = NULL;
1789 err = ops->validate(ctx, expr, &data);
1798 ops->destroy(ctx, expr);
1804 static void nf_tables_expr_destroy(const struct nft_ctx *ctx,
1805 struct nft_expr *expr)
1807 if (expr->ops->destroy)
1808 expr->ops->destroy(ctx, expr);
1809 module_put(expr->ops->type->owner);
1812 struct nft_expr *nft_expr_init(const struct nft_ctx *ctx,
1813 const struct nlattr *nla)
1815 struct nft_expr_info info;
1816 struct nft_expr *expr;
1819 err = nf_tables_expr_parse(ctx, nla, &info);
1824 expr = kzalloc(info.ops->size, GFP_KERNEL);
1828 err = nf_tables_newexpr(ctx, &info, expr);
1836 module_put(info.ops->type->owner);
1838 return ERR_PTR(err);
/* Tear down a separately allocated expression and free its memory. */
void nft_expr_destroy(const struct nft_ctx *ctx, struct nft_expr *expr)
{
	nf_tables_expr_destroy(ctx, expr);
	kfree(expr);
}
1851 static struct nft_rule *__nf_tables_rule_lookup(const struct nft_chain *chain,
1854 struct nft_rule *rule;
1856 // FIXME: this sucks
1857 list_for_each_entry(rule, &chain->rules, list) {
1858 if (handle == rule->handle)
1862 return ERR_PTR(-ENOENT);
1865 static struct nft_rule *nf_tables_rule_lookup(const struct nft_chain *chain,
1866 const struct nlattr *nla)
1869 return ERR_PTR(-EINVAL);
1871 return __nf_tables_rule_lookup(chain, be64_to_cpu(nla_get_be64(nla)));
1874 static const struct nla_policy nft_rule_policy[NFTA_RULE_MAX + 1] = {
1875 [NFTA_RULE_TABLE] = { .type = NLA_STRING,
1876 .len = NFT_TABLE_MAXNAMELEN - 1 },
1877 [NFTA_RULE_CHAIN] = { .type = NLA_STRING,
1878 .len = NFT_CHAIN_MAXNAMELEN - 1 },
1879 [NFTA_RULE_HANDLE] = { .type = NLA_U64 },
1880 [NFTA_RULE_EXPRESSIONS] = { .type = NLA_NESTED },
1881 [NFTA_RULE_COMPAT] = { .type = NLA_NESTED },
1882 [NFTA_RULE_POSITION] = { .type = NLA_U64 },
1883 [NFTA_RULE_USERDATA] = { .type = NLA_BINARY,
1884 .len = NFT_USERDATA_MAXLEN },
1887 static int nf_tables_fill_rule_info(struct sk_buff *skb, struct net *net,
1888 u32 portid, u32 seq, int event,
1889 u32 flags, int family,
1890 const struct nft_table *table,
1891 const struct nft_chain *chain,
1892 const struct nft_rule *rule)
1894 struct nlmsghdr *nlh;
1895 struct nfgenmsg *nfmsg;
1896 const struct nft_expr *expr, *next;
1897 struct nlattr *list;
1898 const struct nft_rule *prule;
1899 u16 type = nfnl_msg_type(NFNL_SUBSYS_NFTABLES, event);
1901 nlh = nlmsg_put(skb, portid, seq, type, sizeof(struct nfgenmsg), flags);
1903 goto nla_put_failure;
1905 nfmsg = nlmsg_data(nlh);
1906 nfmsg->nfgen_family = family;
1907 nfmsg->version = NFNETLINK_V0;
1908 nfmsg->res_id = htons(net->nft.base_seq & 0xffff);
1910 if (nla_put_string(skb, NFTA_RULE_TABLE, table->name))
1911 goto nla_put_failure;
1912 if (nla_put_string(skb, NFTA_RULE_CHAIN, chain->name))
1913 goto nla_put_failure;
1914 if (nla_put_be64(skb, NFTA_RULE_HANDLE, cpu_to_be64(rule->handle),
1916 goto nla_put_failure;
1918 if ((event != NFT_MSG_DELRULE) && (rule->list.prev != &chain->rules)) {
1919 prule = list_prev_entry(rule, list);
1920 if (nla_put_be64(skb, NFTA_RULE_POSITION,
1921 cpu_to_be64(prule->handle),
1923 goto nla_put_failure;
1926 list = nla_nest_start(skb, NFTA_RULE_EXPRESSIONS);
1928 goto nla_put_failure;
1929 nft_rule_for_each_expr(expr, next, rule) {
1930 if (nft_expr_dump(skb, NFTA_LIST_ELEM, expr) < 0)
1931 goto nla_put_failure;
1933 nla_nest_end(skb, list);
1936 struct nft_userdata *udata = nft_userdata(rule);
1937 if (nla_put(skb, NFTA_RULE_USERDATA, udata->len + 1,
1939 goto nla_put_failure;
1942 nlmsg_end(skb, nlh);
1946 nlmsg_trim(skb, nlh);
1950 static void nf_tables_rule_notify(const struct nft_ctx *ctx,
1951 const struct nft_rule *rule, int event)
1953 struct sk_buff *skb;
1957 !nfnetlink_has_listeners(ctx->net, NFNLGRP_NFTABLES))
1960 skb = nlmsg_new(NLMSG_GOODSIZE, GFP_KERNEL);
1964 err = nf_tables_fill_rule_info(skb, ctx->net, ctx->portid, ctx->seq,
1965 event, 0, ctx->afi->family, ctx->table,
1972 nfnetlink_send(skb, ctx->net, ctx->portid, NFNLGRP_NFTABLES,
1973 ctx->report, GFP_KERNEL);
1976 nfnetlink_set_err(ctx->net, ctx->portid, NFNLGRP_NFTABLES, -ENOBUFS);
1979 struct nft_rule_dump_ctx {
1980 char table[NFT_TABLE_MAXNAMELEN];
1981 char chain[NFT_CHAIN_MAXNAMELEN];
1984 static int nf_tables_dump_rules(struct sk_buff *skb,
1985 struct netlink_callback *cb)
1987 const struct nfgenmsg *nfmsg = nlmsg_data(cb->nlh);
1988 const struct nft_rule_dump_ctx *ctx = cb->data;
1989 const struct nft_af_info *afi;
1990 const struct nft_table *table;
1991 const struct nft_chain *chain;
1992 const struct nft_rule *rule;
1993 unsigned int idx = 0, s_idx = cb->args[0];
1994 struct net *net = sock_net(skb->sk);
1995 int family = nfmsg->nfgen_family;
1998 cb->seq = net->nft.base_seq;
2000 list_for_each_entry_rcu(afi, &net->nft.af_info, list) {
2001 if (family != NFPROTO_UNSPEC && family != afi->family)
2004 list_for_each_entry_rcu(table, &afi->tables, list) {
2005 if (ctx && ctx->table[0] &&
2006 strcmp(ctx->table, table->name) != 0)
2009 list_for_each_entry_rcu(chain, &table->chains, list) {
2010 if (ctx && ctx->chain[0] &&
2011 strcmp(ctx->chain, chain->name) != 0)
2014 list_for_each_entry_rcu(rule, &chain->rules, list) {
2015 if (!nft_is_active(net, rule))
2020 memset(&cb->args[1], 0,
2021 sizeof(cb->args) - sizeof(cb->args[0]));
2022 if (nf_tables_fill_rule_info(skb, net, NETLINK_CB(cb->skb).portid,
2025 NLM_F_MULTI | NLM_F_APPEND,
2026 afi->family, table, chain, rule) < 0)
2029 nl_dump_check_consistent(cb, nlmsg_hdr(skb));
2043 static int nf_tables_dump_rules_done(struct netlink_callback *cb)
2049 static int nf_tables_getrule(struct net *net, struct sock *nlsk,
2050 struct sk_buff *skb, const struct nlmsghdr *nlh,
2051 const struct nlattr * const nla[],
2052 struct netlink_ext_ack *extack)
2054 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
2055 u8 genmask = nft_genmask_cur(net);
2056 const struct nft_af_info *afi;
2057 const struct nft_table *table;
2058 const struct nft_chain *chain;
2059 const struct nft_rule *rule;
2060 struct sk_buff *skb2;
2061 int family = nfmsg->nfgen_family;
2064 if (nlh->nlmsg_flags & NLM_F_DUMP) {
2065 struct netlink_dump_control c = {
2066 .dump = nf_tables_dump_rules,
2067 .done = nf_tables_dump_rules_done,
2070 if (nla[NFTA_RULE_TABLE] || nla[NFTA_RULE_CHAIN]) {
2071 struct nft_rule_dump_ctx *ctx;
2073 ctx = kzalloc(sizeof(*ctx), GFP_KERNEL);
2077 if (nla[NFTA_RULE_TABLE])
2078 nla_strlcpy(ctx->table, nla[NFTA_RULE_TABLE],
2079 sizeof(ctx->table));
2080 if (nla[NFTA_RULE_CHAIN])
2081 nla_strlcpy(ctx->chain, nla[NFTA_RULE_CHAIN],
2082 sizeof(ctx->chain));
2086 return netlink_dump_start(nlsk, skb, nlh, &c);
2089 afi = nf_tables_afinfo_lookup(net, family, false);
2091 return PTR_ERR(afi);
2093 table = nf_tables_table_lookup(afi, nla[NFTA_RULE_TABLE], genmask);
2095 return PTR_ERR(table);
2097 chain = nf_tables_chain_lookup(table, nla[NFTA_RULE_CHAIN], genmask);
2099 return PTR_ERR(chain);
2101 rule = nf_tables_rule_lookup(chain, nla[NFTA_RULE_HANDLE]);
2103 return PTR_ERR(rule);
2105 skb2 = alloc_skb(NLMSG_GOODSIZE, GFP_KERNEL);
2109 err = nf_tables_fill_rule_info(skb2, net, NETLINK_CB(skb).portid,
2110 nlh->nlmsg_seq, NFT_MSG_NEWRULE, 0,
2111 family, table, chain, rule);
2115 return nlmsg_unicast(nlsk, skb2, NETLINK_CB(skb).portid);
2122 static void nf_tables_rule_destroy(const struct nft_ctx *ctx,
2123 struct nft_rule *rule)
2125 struct nft_expr *expr;
2128 * Careful: some expressions might not be initialized in case this
2129 * is called on error from nf_tables_newrule().
2131 expr = nft_expr_first(rule);
2132 while (expr != nft_expr_last(rule) && expr->ops) {
2133 nf_tables_expr_destroy(ctx, expr);
2134 expr = nft_expr_next(expr);
2139 #define NFT_RULE_MAXEXPRS 128
2141 static struct nft_expr_info *info;
2143 static int nf_tables_newrule(struct net *net, struct sock *nlsk,
2144 struct sk_buff *skb, const struct nlmsghdr *nlh,
2145 const struct nlattr * const nla[],
2146 struct netlink_ext_ack *extack)
2148 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
2149 u8 genmask = nft_genmask_next(net);
2150 struct nft_af_info *afi;
2151 struct nft_table *table;
2152 struct nft_chain *chain;
2153 struct nft_rule *rule, *old_rule = NULL;
2154 struct nft_userdata *udata;
2155 struct nft_trans *trans = NULL;
2156 struct nft_expr *expr;
2159 unsigned int size, i, n, ulen = 0, usize = 0;
2162 u64 handle, pos_handle;
2164 create = nlh->nlmsg_flags & NLM_F_CREATE ? true : false;
2166 afi = nf_tables_afinfo_lookup(net, nfmsg->nfgen_family, create);
2168 return PTR_ERR(afi);
2170 table = nf_tables_table_lookup(afi, nla[NFTA_RULE_TABLE], genmask);
2172 return PTR_ERR(table);
2174 chain = nf_tables_chain_lookup(table, nla[NFTA_RULE_CHAIN], genmask);
2176 return PTR_ERR(chain);
2178 if (nla[NFTA_RULE_HANDLE]) {
2179 handle = be64_to_cpu(nla_get_be64(nla[NFTA_RULE_HANDLE]));
2180 rule = __nf_tables_rule_lookup(chain, handle);
2182 return PTR_ERR(rule);
2184 if (nlh->nlmsg_flags & NLM_F_EXCL)
2186 if (nlh->nlmsg_flags & NLM_F_REPLACE)
2191 if (!create || nlh->nlmsg_flags & NLM_F_REPLACE)
2193 handle = nf_tables_alloc_handle(table);
2195 if (chain->use == UINT_MAX)
2199 if (nla[NFTA_RULE_POSITION]) {
2200 if (!(nlh->nlmsg_flags & NLM_F_CREATE))
2203 pos_handle = be64_to_cpu(nla_get_be64(nla[NFTA_RULE_POSITION]));
2204 old_rule = __nf_tables_rule_lookup(chain, pos_handle);
2205 if (IS_ERR(old_rule))
2206 return PTR_ERR(old_rule);
2209 nft_ctx_init(&ctx, net, skb, nlh, afi, table, chain, nla);
2213 if (nla[NFTA_RULE_EXPRESSIONS]) {
2214 nla_for_each_nested(tmp, nla[NFTA_RULE_EXPRESSIONS], rem) {
2216 if (nla_type(tmp) != NFTA_LIST_ELEM)
2218 if (n == NFT_RULE_MAXEXPRS)
2220 err = nf_tables_expr_parse(&ctx, tmp, &info[n]);
2223 size += info[n].ops->size;
2227 /* Check for overflow of dlen field */
2229 if (size >= 1 << 12)
2232 if (nla[NFTA_RULE_USERDATA]) {
2233 ulen = nla_len(nla[NFTA_RULE_USERDATA]);
2235 usize = sizeof(struct nft_userdata) + ulen;
2239 rule = kzalloc(sizeof(*rule) + size + usize, GFP_KERNEL);
2243 nft_activate_next(net, rule);
2245 rule->handle = handle;
2247 rule->udata = ulen ? 1 : 0;
2250 udata = nft_userdata(rule);
2251 udata->len = ulen - 1;
2252 nla_memcpy(udata->data, nla[NFTA_RULE_USERDATA], ulen);
2255 expr = nft_expr_first(rule);
2256 for (i = 0; i < n; i++) {
2257 err = nf_tables_newexpr(&ctx, &info[i], expr);
2261 expr = nft_expr_next(expr);
2264 if (nlh->nlmsg_flags & NLM_F_REPLACE) {
2265 if (nft_is_active_next(net, old_rule)) {
2266 trans = nft_trans_rule_add(&ctx, NFT_MSG_DELRULE,
2268 if (trans == NULL) {
2272 nft_deactivate_next(net, old_rule);
2274 list_add_tail_rcu(&rule->list, &old_rule->list);
2279 } else if (nlh->nlmsg_flags & NLM_F_APPEND)
2281 list_add_rcu(&rule->list, &old_rule->list);
2283 list_add_tail_rcu(&rule->list, &chain->rules);
2286 list_add_tail_rcu(&rule->list, &old_rule->list);
2288 list_add_rcu(&rule->list, &chain->rules);
2291 if (nft_trans_rule_add(&ctx, NFT_MSG_NEWRULE, rule) == NULL) {
2299 list_del_rcu(&rule->list);
2301 nf_tables_rule_destroy(&ctx, rule);
2303 for (i = 0; i < n; i++) {
2304 if (info[i].ops != NULL)
2305 module_put(info[i].ops->type->owner);
2310 static struct nft_rule *nft_rule_lookup_byid(const struct net *net,
2311 const struct nlattr *nla)
2313 u32 id = ntohl(nla_get_be32(nla));
2314 struct nft_trans *trans;
2316 list_for_each_entry(trans, &net->nft.commit_list, list) {
2317 struct nft_rule *rule = nft_trans_rule(trans);
2319 if (trans->msg_type == NFT_MSG_NEWRULE &&
2320 id == nft_trans_rule_id(trans))
2323 return ERR_PTR(-ENOENT);
2326 static int nf_tables_delrule(struct net *net, struct sock *nlsk,
2327 struct sk_buff *skb, const struct nlmsghdr *nlh,
2328 const struct nlattr * const nla[],
2329 struct netlink_ext_ack *extack)
2331 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
2332 u8 genmask = nft_genmask_next(net);
2333 struct nft_af_info *afi;
2334 struct nft_table *table;
2335 struct nft_chain *chain = NULL;
2336 struct nft_rule *rule;
2337 int family = nfmsg->nfgen_family, err = 0;
2340 afi = nf_tables_afinfo_lookup(net, family, false);
2342 return PTR_ERR(afi);
2344 table = nf_tables_table_lookup(afi, nla[NFTA_RULE_TABLE], genmask);
2346 return PTR_ERR(table);
2348 if (nla[NFTA_RULE_CHAIN]) {
2349 chain = nf_tables_chain_lookup(table, nla[NFTA_RULE_CHAIN],
2352 return PTR_ERR(chain);
2355 nft_ctx_init(&ctx, net, skb, nlh, afi, table, chain, nla);
2358 if (nla[NFTA_RULE_HANDLE]) {
2359 rule = nf_tables_rule_lookup(chain,
2360 nla[NFTA_RULE_HANDLE]);
2362 return PTR_ERR(rule);
2364 err = nft_delrule(&ctx, rule);
2365 } else if (nla[NFTA_RULE_ID]) {
2366 rule = nft_rule_lookup_byid(net, nla[NFTA_RULE_ID]);
2368 return PTR_ERR(rule);
2370 err = nft_delrule(&ctx, rule);
2372 err = nft_delrule_by_chain(&ctx);
2375 list_for_each_entry(chain, &table->chains, list) {
2376 if (!nft_is_active_next(net, chain))
2380 err = nft_delrule_by_chain(&ctx);
2393 static LIST_HEAD(nf_tables_set_types);
2395 int nft_register_set(struct nft_set_type *type)
2397 nfnl_lock(NFNL_SUBSYS_NFTABLES);
2398 list_add_tail_rcu(&type->list, &nf_tables_set_types);
2399 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
2402 EXPORT_SYMBOL_GPL(nft_register_set);
2404 void nft_unregister_set(struct nft_set_type *type)
2406 nfnl_lock(NFNL_SUBSYS_NFTABLES);
2407 list_del_rcu(&type->list);
2408 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
2410 EXPORT_SYMBOL_GPL(nft_unregister_set);
2412 #define NFT_SET_FEATURES (NFT_SET_INTERVAL | NFT_SET_MAP | \
2413 NFT_SET_TIMEOUT | NFT_SET_OBJECT)
2415 static bool nft_set_ops_candidate(const struct nft_set_ops *ops, u32 flags)
2417 return (flags & ops->features) == (flags & NFT_SET_FEATURES);
2421 * Select a set implementation based on the data characteristics and the
2422 * given policy. The total memory use might not be known if no size is
2423 * given, in that case the amount of memory per element is used.
2425 static const struct nft_set_ops *
2426 nft_select_set_ops(const struct nft_ctx *ctx,
2427 const struct nlattr * const nla[],
2428 const struct nft_set_desc *desc,
2429 enum nft_set_policies policy)
2431 const struct nft_set_ops *ops, *bops;
2432 struct nft_set_estimate est, best;
2433 const struct nft_set_type *type;
2436 #ifdef CONFIG_MODULES
2437 if (list_empty(&nf_tables_set_types)) {
2438 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
2439 request_module("nft-set");
2440 nfnl_lock(NFNL_SUBSYS_NFTABLES);
2441 if (!list_empty(&nf_tables_set_types))
2442 return ERR_PTR(-EAGAIN);
2445 if (nla[NFTA_SET_FLAGS] != NULL)
2446 flags = ntohl(nla_get_be32(nla[NFTA_SET_FLAGS]));
2453 list_for_each_entry(type, &nf_tables_set_types, list) {
2454 if (!type->select_ops)
2457 ops = type->select_ops(ctx, desc, flags);
2461 if (!nft_set_ops_candidate(ops, flags))
2463 if (!ops->estimate(desc, flags, &est))
2467 case NFT_SET_POL_PERFORMANCE:
2468 if (est.lookup < best.lookup)
2470 if (est.lookup == best.lookup) {
2472 if (est.space < best.space)
2474 } else if (est.size < best.size) {
2479 case NFT_SET_POL_MEMORY:
2481 if (est.space < best.space)
2483 if (est.space == best.space &&
2484 est.lookup < best.lookup)
2486 } else if (est.size < best.size) {
2494 if (!try_module_get(type->owner))
2497 module_put(bops->type->owner);
2506 return ERR_PTR(-EOPNOTSUPP);
2509 static const struct nla_policy nft_set_policy[NFTA_SET_MAX + 1] = {
2510 [NFTA_SET_TABLE] = { .type = NLA_STRING,
2511 .len = NFT_TABLE_MAXNAMELEN - 1 },
2512 [NFTA_SET_NAME] = { .type = NLA_STRING,
2513 .len = NFT_SET_MAXNAMELEN - 1 },
2514 [NFTA_SET_FLAGS] = { .type = NLA_U32 },
2515 [NFTA_SET_KEY_TYPE] = { .type = NLA_U32 },
2516 [NFTA_SET_KEY_LEN] = { .type = NLA_U32 },
2517 [NFTA_SET_DATA_TYPE] = { .type = NLA_U32 },
2518 [NFTA_SET_DATA_LEN] = { .type = NLA_U32 },
2519 [NFTA_SET_POLICY] = { .type = NLA_U32 },
2520 [NFTA_SET_DESC] = { .type = NLA_NESTED },
2521 [NFTA_SET_ID] = { .type = NLA_U32 },
2522 [NFTA_SET_TIMEOUT] = { .type = NLA_U64 },
2523 [NFTA_SET_GC_INTERVAL] = { .type = NLA_U32 },
2524 [NFTA_SET_USERDATA] = { .type = NLA_BINARY,
2525 .len = NFT_USERDATA_MAXLEN },
2526 [NFTA_SET_OBJ_TYPE] = { .type = NLA_U32 },
2529 static const struct nla_policy nft_set_desc_policy[NFTA_SET_DESC_MAX + 1] = {
2530 [NFTA_SET_DESC_SIZE] = { .type = NLA_U32 },
2533 static int nft_ctx_init_from_setattr(struct nft_ctx *ctx, struct net *net,
2534 const struct sk_buff *skb,
2535 const struct nlmsghdr *nlh,
2536 const struct nlattr * const nla[],
2539 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
2540 struct nft_af_info *afi = NULL;
2541 struct nft_table *table = NULL;
2543 if (nfmsg->nfgen_family != NFPROTO_UNSPEC) {
2544 afi = nf_tables_afinfo_lookup(net, nfmsg->nfgen_family, false);
2546 return PTR_ERR(afi);
2549 if (nla[NFTA_SET_TABLE] != NULL) {
2551 return -EAFNOSUPPORT;
2553 table = nf_tables_table_lookup(afi, nla[NFTA_SET_TABLE],
2556 return PTR_ERR(table);
2559 nft_ctx_init(ctx, net, skb, nlh, afi, table, NULL, nla);
2563 static struct nft_set *nf_tables_set_lookup(const struct nft_table *table,
2564 const struct nlattr *nla, u8 genmask)
2566 struct nft_set *set;
2569 return ERR_PTR(-EINVAL);
2571 list_for_each_entry(set, &table->sets, list) {
2572 if (!nla_strcmp(nla, set->name) &&
2573 nft_active_genmask(set, genmask))
2576 return ERR_PTR(-ENOENT);
2579 static struct nft_set *nf_tables_set_lookup_byid(const struct net *net,
2580 const struct nlattr *nla,
2583 struct nft_trans *trans;
2584 u32 id = ntohl(nla_get_be32(nla));
2586 list_for_each_entry(trans, &net->nft.commit_list, list) {
2587 struct nft_set *set = nft_trans_set(trans);
2589 if (trans->msg_type == NFT_MSG_NEWSET &&
2590 id == nft_trans_set_id(trans) &&
2591 nft_active_genmask(set, genmask))
2594 return ERR_PTR(-ENOENT);
2597 struct nft_set *nft_set_lookup(const struct net *net,
2598 const struct nft_table *table,
2599 const struct nlattr *nla_set_name,
2600 const struct nlattr *nla_set_id,
2603 struct nft_set *set;
2605 set = nf_tables_set_lookup(table, nla_set_name, genmask);
2610 set = nf_tables_set_lookup_byid(net, nla_set_id, genmask);
2614 EXPORT_SYMBOL_GPL(nft_set_lookup);
2616 static int nf_tables_set_alloc_name(struct nft_ctx *ctx, struct nft_set *set,
2619 const struct nft_set *i;
2621 unsigned long *inuse;
2622 unsigned int n = 0, min = 0;
2624 p = strnchr(name, NFT_SET_MAXNAMELEN, '%');
2626 if (p[1] != 'd' || strchr(p + 2, '%'))
2629 inuse = (unsigned long *)get_zeroed_page(GFP_KERNEL);
2633 list_for_each_entry(i, &ctx->table->sets, list) {
2636 if (!nft_is_active_next(ctx->net, set))
2638 if (!sscanf(i->name, name, &tmp))
2640 if (tmp < min || tmp >= min + BITS_PER_BYTE * PAGE_SIZE)
2643 set_bit(tmp - min, inuse);
2646 n = find_first_zero_bit(inuse, BITS_PER_BYTE * PAGE_SIZE);
2647 if (n >= BITS_PER_BYTE * PAGE_SIZE) {
2648 min += BITS_PER_BYTE * PAGE_SIZE;
2649 memset(inuse, 0, PAGE_SIZE);
2652 free_page((unsigned long)inuse);
2655 snprintf(set->name, sizeof(set->name), name, min + n);
2656 list_for_each_entry(i, &ctx->table->sets, list) {
2657 if (!nft_is_active_next(ctx->net, i))
2659 if (!strcmp(set->name, i->name))
2665 static int nf_tables_fill_set(struct sk_buff *skb, const struct nft_ctx *ctx,
2666 const struct nft_set *set, u16 event, u16 flags)
2668 struct nfgenmsg *nfmsg;
2669 struct nlmsghdr *nlh;
2670 struct nlattr *desc;
2671 u32 portid = ctx->portid;
2674 event = nfnl_msg_type(NFNL_SUBSYS_NFTABLES, event);
2675 nlh = nlmsg_put(skb, portid, seq, event, sizeof(struct nfgenmsg),
2678 goto nla_put_failure;
2680 nfmsg = nlmsg_data(nlh);
2681 nfmsg->nfgen_family = ctx->afi->family;
2682 nfmsg->version = NFNETLINK_V0;
2683 nfmsg->res_id = htons(ctx->net->nft.base_seq & 0xffff);
2685 if (nla_put_string(skb, NFTA_SET_TABLE, ctx->table->name))
2686 goto nla_put_failure;
2687 if (nla_put_string(skb, NFTA_SET_NAME, set->name))
2688 goto nla_put_failure;
2689 if (set->flags != 0)
2690 if (nla_put_be32(skb, NFTA_SET_FLAGS, htonl(set->flags)))
2691 goto nla_put_failure;
2693 if (nla_put_be32(skb, NFTA_SET_KEY_TYPE, htonl(set->ktype)))
2694 goto nla_put_failure;
2695 if (nla_put_be32(skb, NFTA_SET_KEY_LEN, htonl(set->klen)))
2696 goto nla_put_failure;
2697 if (set->flags & NFT_SET_MAP) {
2698 if (nla_put_be32(skb, NFTA_SET_DATA_TYPE, htonl(set->dtype)))
2699 goto nla_put_failure;
2700 if (nla_put_be32(skb, NFTA_SET_DATA_LEN, htonl(set->dlen)))
2701 goto nla_put_failure;
2703 if (set->flags & NFT_SET_OBJECT &&
2704 nla_put_be32(skb, NFTA_SET_OBJ_TYPE, htonl(set->objtype)))
2705 goto nla_put_failure;
2708 nla_put_be64(skb, NFTA_SET_TIMEOUT,
2709 cpu_to_be64(jiffies_to_msecs(set->timeout)),
2711 goto nla_put_failure;
2713 nla_put_be32(skb, NFTA_SET_GC_INTERVAL, htonl(set->gc_int)))
2714 goto nla_put_failure;
2716 if (set->policy != NFT_SET_POL_PERFORMANCE) {
2717 if (nla_put_be32(skb, NFTA_SET_POLICY, htonl(set->policy)))
2718 goto nla_put_failure;
2721 if (nla_put(skb, NFTA_SET_USERDATA, set->udlen, set->udata))
2722 goto nla_put_failure;
2724 desc = nla_nest_start(skb, NFTA_SET_DESC);
2726 goto nla_put_failure;
2728 nla_put_be32(skb, NFTA_SET_DESC_SIZE, htonl(set->size)))
2729 goto nla_put_failure;
2730 nla_nest_end(skb, desc);
2732 nlmsg_end(skb, nlh);
2736 nlmsg_trim(skb, nlh);
2740 static void nf_tables_set_notify(const struct nft_ctx *ctx,
2741 const struct nft_set *set, int event,
2744 struct sk_buff *skb;
2745 u32 portid = ctx->portid;
2749 !nfnetlink_has_listeners(ctx->net, NFNLGRP_NFTABLES))
2752 skb = nlmsg_new(NLMSG_GOODSIZE, gfp_flags);
2756 err = nf_tables_fill_set(skb, ctx, set, event, 0);
2762 nfnetlink_send(skb, ctx->net, portid, NFNLGRP_NFTABLES, ctx->report,
2766 nfnetlink_set_err(ctx->net, portid, NFNLGRP_NFTABLES, -ENOBUFS);
2769 static int nf_tables_dump_sets(struct sk_buff *skb, struct netlink_callback *cb)
2771 const struct nft_set *set;
2772 unsigned int idx, s_idx = cb->args[0];
2773 struct nft_af_info *afi;
2774 struct nft_table *table, *cur_table = (struct nft_table *)cb->args[2];
2775 struct net *net = sock_net(skb->sk);
2776 int cur_family = cb->args[3];
2777 struct nft_ctx *ctx = cb->data, ctx_set;
2783 cb->seq = net->nft.base_seq;
2785 list_for_each_entry_rcu(afi, &net->nft.af_info, list) {
2786 if (ctx->afi && ctx->afi != afi)
2790 if (afi->family != cur_family)
2795 list_for_each_entry_rcu(table, &afi->tables, list) {
2796 if (ctx->table && ctx->table != table)
2800 if (cur_table != table)
2806 list_for_each_entry_rcu(set, &table->sets, list) {
2809 if (!nft_is_active(net, set))
2813 ctx_set.table = table;
2815 if (nf_tables_fill_set(skb, &ctx_set, set,
2819 cb->args[2] = (unsigned long) table;
2820 cb->args[3] = afi->family;
2823 nl_dump_check_consistent(cb, nlmsg_hdr(skb));
2837 static int nf_tables_dump_sets_done(struct netlink_callback *cb)
2843 static int nf_tables_getset(struct net *net, struct sock *nlsk,
2844 struct sk_buff *skb, const struct nlmsghdr *nlh,
2845 const struct nlattr * const nla[],
2846 struct netlink_ext_ack *extack)
2848 u8 genmask = nft_genmask_cur(net);
2849 const struct nft_set *set;
2851 struct sk_buff *skb2;
2852 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
2855 /* Verify existence before starting dump */
2856 err = nft_ctx_init_from_setattr(&ctx, net, skb, nlh, nla, genmask);
2860 if (nlh->nlmsg_flags & NLM_F_DUMP) {
2861 struct netlink_dump_control c = {
2862 .dump = nf_tables_dump_sets,
2863 .done = nf_tables_dump_sets_done,
2865 struct nft_ctx *ctx_dump;
2867 ctx_dump = kmalloc(sizeof(*ctx_dump), GFP_KERNEL);
2868 if (ctx_dump == NULL)
2874 return netlink_dump_start(nlsk, skb, nlh, &c);
2877 /* Only accept unspec with dump */
2878 if (nfmsg->nfgen_family == NFPROTO_UNSPEC)
2879 return -EAFNOSUPPORT;
2880 if (!nla[NFTA_SET_TABLE])
2883 set = nf_tables_set_lookup(ctx.table, nla[NFTA_SET_NAME], genmask);
2885 return PTR_ERR(set);
2887 skb2 = alloc_skb(NLMSG_GOODSIZE, GFP_KERNEL);
2891 err = nf_tables_fill_set(skb2, &ctx, set, NFT_MSG_NEWSET, 0);
2895 return nlmsg_unicast(nlsk, skb2, NETLINK_CB(skb).portid);
2902 static int nf_tables_set_desc_parse(const struct nft_ctx *ctx,
2903 struct nft_set_desc *desc,
2904 const struct nlattr *nla)
2906 struct nlattr *da[NFTA_SET_DESC_MAX + 1];
2909 err = nla_parse_nested(da, NFTA_SET_DESC_MAX, nla,
2910 nft_set_desc_policy, NULL);
2914 if (da[NFTA_SET_DESC_SIZE] != NULL)
2915 desc->size = ntohl(nla_get_be32(da[NFTA_SET_DESC_SIZE]));
2920 static int nf_tables_newset(struct net *net, struct sock *nlsk,
2921 struct sk_buff *skb, const struct nlmsghdr *nlh,
2922 const struct nlattr * const nla[],
2923 struct netlink_ext_ack *extack)
2925 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
2926 u8 genmask = nft_genmask_next(net);
2927 const struct nft_set_ops *ops;
2928 struct nft_af_info *afi;
2929 struct nft_table *table;
2930 struct nft_set *set;
2932 char name[NFT_SET_MAXNAMELEN];
2936 u32 ktype, dtype, flags, policy, gc_int, objtype;
2937 struct nft_set_desc desc;
2938 unsigned char *udata;
2942 if (nla[NFTA_SET_TABLE] == NULL ||
2943 nla[NFTA_SET_NAME] == NULL ||
2944 nla[NFTA_SET_KEY_LEN] == NULL ||
2945 nla[NFTA_SET_ID] == NULL)
2948 memset(&desc, 0, sizeof(desc));
2950 ktype = NFT_DATA_VALUE;
2951 if (nla[NFTA_SET_KEY_TYPE] != NULL) {
2952 ktype = ntohl(nla_get_be32(nla[NFTA_SET_KEY_TYPE]));
2953 if ((ktype & NFT_DATA_RESERVED_MASK) == NFT_DATA_RESERVED_MASK)
2957 desc.klen = ntohl(nla_get_be32(nla[NFTA_SET_KEY_LEN]));
2958 if (desc.klen == 0 || desc.klen > NFT_DATA_VALUE_MAXLEN)
2962 if (nla[NFTA_SET_FLAGS] != NULL) {
2963 flags = ntohl(nla_get_be32(nla[NFTA_SET_FLAGS]));
2964 if (flags & ~(NFT_SET_ANONYMOUS | NFT_SET_CONSTANT |
2965 NFT_SET_INTERVAL | NFT_SET_TIMEOUT |
2966 NFT_SET_MAP | NFT_SET_EVAL |
2969 /* Only one of these operations is supported */
2970 if ((flags & (NFT_SET_MAP | NFT_SET_EVAL | NFT_SET_OBJECT)) ==
2971 (NFT_SET_MAP | NFT_SET_EVAL | NFT_SET_OBJECT))
2976 if (nla[NFTA_SET_DATA_TYPE] != NULL) {
2977 if (!(flags & NFT_SET_MAP))
2980 dtype = ntohl(nla_get_be32(nla[NFTA_SET_DATA_TYPE]));
2981 if ((dtype & NFT_DATA_RESERVED_MASK) == NFT_DATA_RESERVED_MASK &&
2982 dtype != NFT_DATA_VERDICT)
2985 if (dtype != NFT_DATA_VERDICT) {
2986 if (nla[NFTA_SET_DATA_LEN] == NULL)
2988 desc.dlen = ntohl(nla_get_be32(nla[NFTA_SET_DATA_LEN]));
2989 if (desc.dlen == 0 || desc.dlen > NFT_DATA_VALUE_MAXLEN)
2992 desc.dlen = sizeof(struct nft_verdict);
2993 } else if (flags & NFT_SET_MAP)
2996 if (nla[NFTA_SET_OBJ_TYPE] != NULL) {
2997 if (!(flags & NFT_SET_OBJECT))
3000 objtype = ntohl(nla_get_be32(nla[NFTA_SET_OBJ_TYPE]));
3001 if (objtype == NFT_OBJECT_UNSPEC ||
3002 objtype > NFT_OBJECT_MAX)
3004 } else if (flags & NFT_SET_OBJECT)
3007 objtype = NFT_OBJECT_UNSPEC;
3010 if (nla[NFTA_SET_TIMEOUT] != NULL) {
3011 if (!(flags & NFT_SET_TIMEOUT))
3013 timeout = msecs_to_jiffies(be64_to_cpu(nla_get_be64(
3014 nla[NFTA_SET_TIMEOUT])));
3017 if (nla[NFTA_SET_GC_INTERVAL] != NULL) {
3018 if (!(flags & NFT_SET_TIMEOUT))
3020 gc_int = ntohl(nla_get_be32(nla[NFTA_SET_GC_INTERVAL]));
3023 policy = NFT_SET_POL_PERFORMANCE;
3024 if (nla[NFTA_SET_POLICY] != NULL)
3025 policy = ntohl(nla_get_be32(nla[NFTA_SET_POLICY]));
3027 if (nla[NFTA_SET_DESC] != NULL) {
3028 err = nf_tables_set_desc_parse(&ctx, &desc, nla[NFTA_SET_DESC]);
3033 create = nlh->nlmsg_flags & NLM_F_CREATE ? true : false;
3035 afi = nf_tables_afinfo_lookup(net, nfmsg->nfgen_family, create);
3037 return PTR_ERR(afi);
3039 table = nf_tables_table_lookup(afi, nla[NFTA_SET_TABLE], genmask);
3041 return PTR_ERR(table);
3043 nft_ctx_init(&ctx, net, skb, nlh, afi, table, NULL, nla);
3045 set = nf_tables_set_lookup(table, nla[NFTA_SET_NAME], genmask);
3047 if (PTR_ERR(set) != -ENOENT)
3048 return PTR_ERR(set);
3050 if (nlh->nlmsg_flags & NLM_F_EXCL)
3052 if (nlh->nlmsg_flags & NLM_F_REPLACE)
3057 if (!(nlh->nlmsg_flags & NLM_F_CREATE))
3060 ops = nft_select_set_ops(&ctx, nla, &desc, policy);
3062 return PTR_ERR(ops);
3065 if (nla[NFTA_SET_USERDATA])
3066 udlen = nla_len(nla[NFTA_SET_USERDATA]);
3069 if (ops->privsize != NULL)
3070 size = ops->privsize(nla, &desc);
3072 set = kvzalloc(sizeof(*set) + size + udlen, GFP_KERNEL);
3078 nla_strlcpy(name, nla[NFTA_SET_NAME], sizeof(set->name));
3079 err = nf_tables_set_alloc_name(&ctx, set, name);
3085 udata = set->data + size;
3086 nla_memcpy(udata, nla[NFTA_SET_USERDATA], udlen);
3089 INIT_LIST_HEAD(&set->bindings);
3092 set->klen = desc.klen;
3094 set->objtype = objtype;
3095 set->dlen = desc.dlen;
3097 set->size = desc.size;
3098 set->policy = policy;
3101 set->timeout = timeout;
3102 set->gc_int = gc_int;
3104 err = ops->init(set, &desc, nla);
3108 err = nft_trans_set_add(&ctx, NFT_MSG_NEWSET, set);
3112 list_add_tail_rcu(&set->list, &table->sets);
3121 module_put(ops->type->owner);
/* Destroy a set: run the backend's destroy operation, then drop the
 * reference held on the module that owns the set type.
 * NOTE(review): further statements of this body are absent from this listing.
 */
3125 static void nft_set_destroy(struct nft_set *set)
3127 set->ops->destroy(set);
3128 module_put(set->ops->type->owner);
/* Unlink @set from the list it is on (RCU-aware removal), emit an
 * NFT_MSG_DELSET notification and then destroy the set.
 */
3132 static void nf_tables_set_destroy(const struct nft_ctx *ctx, struct nft_set *set)
3134 list_del_rcu(&set->list);
/* The notification is allocated with GFP_ATOMIC. */
3135 nf_tables_set_notify(ctx, set, NFT_MSG_DELSET, GFP_ATOMIC);
3136 nft_set_destroy(set);
/* Handler for a "delete set" request.
 *
 * Rejects NFPROTO_UNSPEC with -EAFNOSUPPORT, checks that the table
 * attribute is present, builds the context from the set attributes, looks
 * the set up by name using the next-generation mask and finally calls
 * nft_delset().
 *
 * NOTE(review): the statements guarded by the NFTA_SET_TABLE check and by
 * the "set still has bindings" check are not shown in this listing.
 */
3139 static int nf_tables_delset(struct net *net, struct sock *nlsk,
3140 struct sk_buff *skb, const struct nlmsghdr *nlh,
3141 const struct nlattr * const nla[],
3142 struct netlink_ext_ack *extack)
3144 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
3145 u8 genmask = nft_genmask_next(net);
3146 struct nft_set *set;
3150 if (nfmsg->nfgen_family == NFPROTO_UNSPEC)
3151 return -EAFNOSUPPORT;
3152 if (nla[NFTA_SET_TABLE] == NULL)
3155 err = nft_ctx_init_from_setattr(&ctx, net, skb, nlh, nla, genmask);
3159 set = nf_tables_set_lookup(ctx.table, nla[NFTA_SET_NAME], genmask);
3161 return PTR_ERR(set);
/* A set that still has bindings is treated specially before deletion. */
3162 if (!list_empty(&set->bindings))
3165 return nft_delset(&ctx, set);
/* Per-element walk callback (installed as iter.fn by nf_tables_bind_set()).
 *
 * Validates that the element's data may be stored into the register derived
 * from the set's data type; the data is checked as NFT_DATA_VERDICT when the
 * set's dtype is a verdict and as NFT_DATA_VALUE otherwise.
 */
3168 static int nf_tables_bind_check_setelem(const struct nft_ctx *ctx,
3169 struct nft_set *set,
3170 const struct nft_set_iter *iter,
3171 struct nft_set_elem *elem)
3173 const struct nft_set_ext *ext = nft_set_elem_ext(set, elem->priv);
3174 enum nft_registers dreg;
3176 dreg = nft_type_to_reg(set->dtype);
3177 return nft_validate_register_store(ctx, dreg, nft_set_ext_data(ext),
3178 set->dtype == NFT_DATA_VERDICT ?
3179 NFT_DATA_VERDICT : NFT_DATA_VALUE,
/* Bind @set to @binding on behalf of the chain in @ctx.
 *
 * An anonymous set whose bindings list is already non-empty is checked
 * first (the resulting statement is not shown in this listing). For map
 * bindings, existing bindings are scanned for a map binding on the same
 * chain, and the set is walked with nf_tables_bind_check_setelem() as the
 * per-element callback using the next-generation mask. Finally the binding
 * records ctx->chain and is appended to set->bindings.
 */
3183 int nf_tables_bind_set(const struct nft_ctx *ctx, struct nft_set *set,
3184 struct nft_set_binding *binding)
3186 struct nft_set_binding *i;
3187 struct nft_set_iter iter;
3189 if (!list_empty(&set->bindings) && set->flags & NFT_SET_ANONYMOUS)
3192 if (binding->flags & NFT_SET_MAP) {
3193 /* If the set is already bound to the same chain all
3194 * jumps are already validated for that chain.
3196 list_for_each_entry(i, &set->bindings, list) {
3197 if (i->flags & NFT_SET_MAP &&
3198 i->chain == binding->chain)
3202 iter.genmask = nft_genmask_next(ctx->net);
3206 iter.fn = nf_tables_bind_check_setelem;
3208 set->ops->walk(ctx, set, &iter);
3213 binding->chain = ctx->chain;
3214 list_add_tail_rcu(&binding->list, &set->bindings);
3217 EXPORT_SYMBOL_GPL(nf_tables_bind_set);
/* Remove @binding from @set. If that leaves an anonymous set with no
 * bindings and the set is active in @ctx's network namespace, the set is
 * destroyed via nf_tables_set_destroy().
 */
3219 void nf_tables_unbind_set(const struct nft_ctx *ctx, struct nft_set *set,
3220 struct nft_set_binding *binding)
3222 list_del_rcu(&binding->list);
3224 if (list_empty(&set->bindings) && set->flags & NFT_SET_ANONYMOUS &&
3225 nft_is_active(ctx->net, set))
3226 nf_tables_set_destroy(ctx, set);
3228 EXPORT_SYMBOL_GPL(nf_tables_unbind_set);
/* Per-extension-type descriptor table, indexed by NFT_SET_EXT_*.
 * Each entry gives the alignment of the extension and, for the entries
 * where it is listed, its fixed length.
 * NOTE(review): several entries show no .len line in this listing; whether
 * that line was dropped or the length is variable cannot be told from here.
 */
3230 const struct nft_set_ext_type nft_set_ext_types[] = {
3231 [NFT_SET_EXT_KEY] = {
3232 .align = __alignof__(u32),
3234 [NFT_SET_EXT_DATA] = {
3235 .align = __alignof__(u32),
3237 [NFT_SET_EXT_EXPR] = {
3238 .align = __alignof__(struct nft_expr),
3240 [NFT_SET_EXT_OBJREF] = {
3241 .len = sizeof(struct nft_object *),
3242 .align = __alignof__(struct nft_object *),
3244 [NFT_SET_EXT_FLAGS] = {
3246 .align = __alignof__(u8),
3248 [NFT_SET_EXT_TIMEOUT] = {
3250 .align = __alignof__(u64),
3252 [NFT_SET_EXT_EXPIRATION] = {
3253 .len = sizeof(unsigned long),
3254 .align = __alignof__(unsigned long),
3256 [NFT_SET_EXT_USERDATA] = {
3257 .len = sizeof(struct nft_userdata),
3258 .align = __alignof__(struct nft_userdata),
3261 EXPORT_SYMBOL_GPL(nft_set_ext_types);
/* Netlink attribute policy for a single set element (NFTA_SET_ELEM_*).
 * Userdata is binary and bounded by NFT_USERDATA_MAXLEN.
 * NOTE(review): nft_add_set_elem() reads nla[NFTA_SET_ELEM_OBJREF], but no
 * policy entry for that attribute appears here - confirm whether it should
 * be validated as a string.
 */
3267 static const struct nla_policy nft_set_elem_policy[NFTA_SET_ELEM_MAX + 1] = {
3268 [NFTA_SET_ELEM_KEY] = { .type = NLA_NESTED },
3269 [NFTA_SET_ELEM_DATA] = { .type = NLA_NESTED },
3270 [NFTA_SET_ELEM_FLAGS] = { .type = NLA_U32 },
3271 [NFTA_SET_ELEM_TIMEOUT] = { .type = NLA_U64 },
3272 [NFTA_SET_ELEM_USERDATA] = { .type = NLA_BINARY,
3273 .len = NFT_USERDATA_MAXLEN },
/* Netlink attribute policy for set element list messages
 * (NFTA_SET_ELEM_LIST_*): table and set names are strings bounded by their
 * respective maximum name lengths minus one, the element list is nested and
 * the set id is a 32-bit value.
 */
3276 static const struct nla_policy nft_set_elem_list_policy[NFTA_SET_ELEM_LIST_MAX + 1] = {
3277 [NFTA_SET_ELEM_LIST_TABLE] = { .type = NLA_STRING,
3278 .len = NFT_TABLE_MAXNAMELEN - 1 },
3279 [NFTA_SET_ELEM_LIST_SET] = { .type = NLA_STRING,
3280 .len = NFT_SET_MAXNAMELEN - 1 },
3281 [NFTA_SET_ELEM_LIST_ELEMENTS] = { .type = NLA_NESTED },
3282 [NFTA_SET_ELEM_LIST_SET_ID] = { .type = NLA_U32 },
/* Initialise @ctx for a set-element request: resolve the address family
 * from the message header (without the "autoload" flag, i.e. passing
 * false), resolve the table named by NFTA_SET_ELEM_LIST_TABLE, and fill in
 * the context with a NULL chain.
 * Lookup failures are propagated as the PTR_ERR() of the failed lookup.
 */
3285 static int nft_ctx_init_from_elemattr(struct nft_ctx *ctx, struct net *net,
3286 const struct sk_buff *skb,
3287 const struct nlmsghdr *nlh,
3288 const struct nlattr * const nla[],
3291 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
3292 struct nft_af_info *afi;
3293 struct nft_table *table;
3295 afi = nf_tables_afinfo_lookup(net, nfmsg->nfgen_family, false);
3297 return PTR_ERR(afi);
3299 table = nf_tables_table_lookup(afi, nla[NFTA_SET_ELEM_LIST_TABLE],
3302 return PTR_ERR(table);
3304 nft_ctx_init(ctx, net, skb, nlh, afi, table, NULL, nla);
/* Serialise one set element into @skb as a nested NFTA_LIST_ELEM attribute.
 *
 * The key is always emitted; data, expression, object reference (by name),
 * flags, timeout, expiration and userdata are emitted only when the
 * corresponding extension exists on the element. Any failure jumps to the
 * nla_put_failure label (label body not shown in this listing).
 */
3308 static int nf_tables_fill_setelem(struct sk_buff *skb,
3309 const struct nft_set *set,
3310 const struct nft_set_elem *elem)
3312 const struct nft_set_ext *ext = nft_set_elem_ext(set, elem->priv);
/* Remember the current tail of the skb before anything is appended. */
3313 unsigned char *b = skb_tail_pointer(skb);
3314 struct nlattr *nest;
3316 nest = nla_nest_start(skb, NFTA_LIST_ELEM);
3318 goto nla_put_failure;
3320 if (nft_data_dump(skb, NFTA_SET_ELEM_KEY, nft_set_ext_key(ext),
3321 NFT_DATA_VALUE, set->klen) < 0)
3322 goto nla_put_failure;
/* Data is dumped as a verdict only when the set's dtype is a verdict. */
3324 if (nft_set_ext_exists(ext, NFT_SET_EXT_DATA) &&
3325 nft_data_dump(skb, NFTA_SET_ELEM_DATA, nft_set_ext_data(ext),
3326 set->dtype == NFT_DATA_VERDICT ? NFT_DATA_VERDICT : NFT_DATA_VALUE,
3328 goto nla_put_failure;
3330 if (nft_set_ext_exists(ext, NFT_SET_EXT_EXPR) &&
3331 nft_expr_dump(skb, NFTA_SET_ELEM_EXPR, nft_set_ext_expr(ext)) < 0)
3332 goto nla_put_failure;
3334 if (nft_set_ext_exists(ext, NFT_SET_EXT_OBJREF) &&
3335 nla_put_string(skb, NFTA_SET_ELEM_OBJREF,
3336 (*nft_set_ext_obj(ext))->name) < 0)
3337 goto nla_put_failure;
3339 if (nft_set_ext_exists(ext, NFT_SET_EXT_FLAGS) &&
3340 nla_put_be32(skb, NFTA_SET_ELEM_FLAGS,
3341 htonl(*nft_set_ext_flags(ext))))
3342 goto nla_put_failure;
/* Timeouts are kept in jiffies and reported in milliseconds. */
3344 if (nft_set_ext_exists(ext, NFT_SET_EXT_TIMEOUT) &&
3345 nla_put_be64(skb, NFTA_SET_ELEM_TIMEOUT,
3346 cpu_to_be64(jiffies_to_msecs(
3347 *nft_set_ext_timeout(ext))),
3349 goto nla_put_failure;
3351 if (nft_set_ext_exists(ext, NFT_SET_EXT_EXPIRATION)) {
3352 unsigned long expires, now = jiffies;
3354 expires = *nft_set_ext_expiration(ext);
/* NOTE(review): the adjustment of "expires" depending on this comparison
 * is on lines not shown in this listing.
 */
3355 if (time_before(now, expires))
3360 if (nla_put_be64(skb, NFTA_SET_ELEM_EXPIRATION,
3361 cpu_to_be64(jiffies_to_msecs(expires)),
3363 goto nla_put_failure;
3366 if (nft_set_ext_exists(ext, NFT_SET_EXT_USERDATA)) {
3367 struct nft_userdata *udata;
3369 udata = nft_set_ext_userdata(ext);
/* udata->len + 1 bytes are emitted; nft_add_set_elem() stores the length
 * as the attribute length minus one.
 */
3370 if (nla_put(skb, NFTA_SET_ELEM_USERDATA,
3371 udata->len + 1, udata->data))
3372 goto nla_put_failure;
3375 nla_nest_end(skb, nest);
/* Arguments for dumping set elements: the netlink callback, the set
 * iterator (nf_tables_dump_setelem() recovers this structure from it via
 * container_of()) and the skb being filled.
 */
3383 struct nft_set_dump_args {
3384 const struct netlink_callback *cb;
3385 struct nft_set_iter iter;
3386 struct sk_buff *skb;
/* Per-element walk callback used while dumping a set: recovers the
 * enclosing nft_set_dump_args from @iter and serialises @elem into its skb.
 */
3389 static int nf_tables_dump_setelem(const struct nft_ctx *ctx,
3390 struct nft_set *set,
3391 const struct nft_set_iter *iter,
3392 struct nft_set_elem *elem)
3394 struct nft_set_dump_args *args;
3396 args = container_of(iter, struct nft_set_dump_args, iter);
3397 return nf_tables_fill_setelem(args->skb, set, elem);
/* State carried across a set-element dump via cb->data: the set being
 * dumped. nf_tables_getsetelem() also assigns a "ctx" member, whose
 * declaration is not shown in this listing.
 */
3400 struct nft_set_dump_ctx {
3401 const struct nft_set *set;
/* Netlink dump callback for the elements of one set.
 *
 * Searches the namespace's address families, tables and sets (RCU list
 * iteration) for the afi/table/set recorded in the dump context, writes an
 * NFT_MSG_NEWSETELEM message header followed by the table and set names,
 * then walks the set with nf_tables_dump_setelem(), skipping the first
 * cb->args[0] elements. The number of elements visited is stored back into
 * cb->args[0] so a later invocation can resume.
 *
 * NOTE(review): the bodies of the "not the wanted afi/table" checks, the
 * handling of set_found and the final return statements are not shown in
 * this listing.
 */
3405 static int nf_tables_dump_set(struct sk_buff *skb, struct netlink_callback *cb)
3407 struct nft_set_dump_ctx *dump_ctx = cb->data;
3408 struct net *net = sock_net(skb->sk);
3409 struct nft_af_info *afi;
3410 struct nft_table *table;
3411 struct nft_set *set;
3412 struct nft_set_dump_args args;
3413 bool set_found = false;
3414 struct nfgenmsg *nfmsg;
3415 struct nlmsghdr *nlh;
3416 struct nlattr *nest;
3421 list_for_each_entry_rcu(afi, &net->nft.af_info, list) {
3422 if (afi != dump_ctx->ctx.afi)
3425 list_for_each_entry_rcu(table, &afi->tables, list) {
3426 if (table != dump_ctx->ctx.table)
3429 list_for_each_entry_rcu(set, &table->sets, list) {
3430 if (set == dump_ctx->set) {
3445 event = nfnl_msg_type(NFNL_SUBSYS_NFTABLES, NFT_MSG_NEWSETELEM);
3446 portid = NETLINK_CB(cb->skb).portid;
3447 seq = cb->nlh->nlmsg_seq;
3449 nlh = nlmsg_put(skb, portid, seq, event, sizeof(struct nfgenmsg),
3452 goto nla_put_failure;
3454 nfmsg = nlmsg_data(nlh);
3455 nfmsg->nfgen_family = afi->family;
3456 nfmsg->version = NFNETLINK_V0;
/* Low 16 bits of the ruleset base sequence, in network byte order. */
3457 nfmsg->res_id = htons(net->nft.base_seq & 0xffff);
3459 if (nla_put_string(skb, NFTA_SET_ELEM_LIST_TABLE, table->name))
3460 goto nla_put_failure;
3461 if (nla_put_string(skb, NFTA_SET_ELEM_LIST_SET, set->name))
3462 goto nla_put_failure;
3464 nest = nla_nest_start(skb, NFTA_SET_ELEM_LIST_ELEMENTS);
3466 goto nla_put_failure;
/* Walk the current generation, resuming after cb->args[0] elements. */
3470 args.iter.genmask = nft_genmask_cur(net);
3471 args.iter.skip = cb->args[0];
3472 args.iter.count = 0;
3474 args.iter.fn = nf_tables_dump_setelem;
3475 set->ops->walk(&dump_ctx->ctx, set, &args.iter);
3478 nla_nest_end(skb, nest);
3479 nlmsg_end(skb, nlh);
/* -EMSGSIZE from the walk is not returned as an error here. */
3481 if (args.iter.err && args.iter.err != -EMSGSIZE)
3482 return args.iter.err;
/* No progress since the previous invocation. */
3483 if (args.iter.count == cb->args[0])
3486 cb->args[0] = args.iter.count;
/* Completion callback for the set-element dump; installed as .done of the
 * netlink_dump_control in nf_tables_getsetelem().
 * NOTE(review): the body is not shown in this listing.
 */
3494 static int nf_tables_dump_set_done(struct netlink_callback *cb)
/* Handler for a "get set elements" request.
 *
 * Builds the context from the element attributes, looks the set up by name
 * using the current-generation mask and, for NLM_F_DUMP requests, allocates
 * a nft_set_dump_ctx holding the set and a copy of the context before
 * starting a netlink dump with nf_tables_dump_set()/_done() as callbacks.
 *
 * NOTE(review): error checks, the hand-over of dump_ctx to the dump control
 * and the non-dump return path are not shown in this listing.
 */
3500 static int nf_tables_getsetelem(struct net *net, struct sock *nlsk,
3501 struct sk_buff *skb, const struct nlmsghdr *nlh,
3502 const struct nlattr * const nla[],
3503 struct netlink_ext_ack *extack)
3505 u8 genmask = nft_genmask_cur(net);
3506 const struct nft_set *set;
3510 err = nft_ctx_init_from_elemattr(&ctx, net, skb, nlh, nla, genmask);
3514 set = nf_tables_set_lookup(ctx.table, nla[NFTA_SET_ELEM_LIST_SET],
3517 return PTR_ERR(set);
3519 if (nlh->nlmsg_flags & NLM_F_DUMP) {
3520 struct netlink_dump_control c = {
3521 .dump = nf_tables_dump_set,
3522 .done = nf_tables_dump_set_done,
3524 struct nft_set_dump_ctx *dump_ctx;
3526 dump_ctx = kmalloc(sizeof(*dump_ctx), GFP_KERNEL);
3530 dump_ctx->set = set;
3531 dump_ctx->ctx = ctx;
3534 return netlink_dump_start(nlsk, skb, nlh, &c);
/* Build a complete netlink message describing a single set element.
 *
 * Writes the nfnetlink header (family from the context, NFNETLINK_V0, low
 * 16 bits of base_seq as res_id), the table and set names, and a nested
 * NFTA_SET_ELEM_LIST_ELEMENTS attribute containing @elem. The message is
 * finalised with nlmsg_end(); the nlmsg_trim() call belongs to the failure
 * path (label and return values not shown in this listing).
 */
3539 static int nf_tables_fill_setelem_info(struct sk_buff *skb,
3540 const struct nft_ctx *ctx, u32 seq,
3541 u32 portid, int event, u16 flags,
3542 const struct nft_set *set,
3543 const struct nft_set_elem *elem)
3545 struct nfgenmsg *nfmsg;
3546 struct nlmsghdr *nlh;
3547 struct nlattr *nest;
3550 event = nfnl_msg_type(NFNL_SUBSYS_NFTABLES, event);
3551 nlh = nlmsg_put(skb, portid, seq, event, sizeof(struct nfgenmsg),
3554 goto nla_put_failure;
3556 nfmsg = nlmsg_data(nlh);
3557 nfmsg->nfgen_family = ctx->afi->family;
3558 nfmsg->version = NFNETLINK_V0;
3559 nfmsg->res_id = htons(ctx->net->nft.base_seq & 0xffff);
3561 if (nla_put_string(skb, NFTA_SET_TABLE, ctx->table->name))
3562 goto nla_put_failure;
3563 if (nla_put_string(skb, NFTA_SET_NAME, set->name))
3564 goto nla_put_failure;
3566 nest = nla_nest_start(skb, NFTA_SET_ELEM_LIST_ELEMENTS);
3568 goto nla_put_failure;
3570 err = nf_tables_fill_setelem(skb, set, elem);
3572 goto nla_put_failure;
3574 nla_nest_end(skb, nest);
3576 nlmsg_end(skb, nlh);
3580 nlmsg_trim(skb, nlh);
/* Send a notification about a set element event to NFNLGRP_NFTABLES.
 *
 * Nothing is built when the request did not ask for a report and the group
 * has no listeners. Otherwise a message is allocated, filled by
 * nf_tables_fill_setelem_info() and sent; the nfnetlink_set_err() call
 * reports -ENOBUFS to the group (it sits on the error path, whose label is
 * not shown in this listing).
 */
3584 static void nf_tables_setelem_notify(const struct nft_ctx *ctx,
3585 const struct nft_set *set,
3586 const struct nft_set_elem *elem,
3587 int event, u16 flags)
3589 struct net *net = ctx->net;
3590 u32 portid = ctx->portid;
3591 struct sk_buff *skb;
3594 if (!ctx->report && !nfnetlink_has_listeners(net, NFNLGRP_NFTABLES))
3597 skb = nlmsg_new(NLMSG_GOODSIZE, GFP_KERNEL);
3601 err = nf_tables_fill_setelem_info(skb, ctx, 0, portid, event, flags,
3608 nfnetlink_send(skb, net, portid, NFNLGRP_NFTABLES, ctx->report,
3612 nfnetlink_set_err(net, portid, NFNLGRP_NFTABLES, -ENOBUFS);
/* Allocate a transaction with room for a struct nft_trans_elem and record
 * @set in it.
 * NOTE(review): the msg_type parameter, the allocation failure check and
 * the return statement are not shown in this listing.
 */
3615 static struct nft_trans *nft_trans_elem_alloc(struct nft_ctx *ctx,
3617 struct nft_set *set)
3619 struct nft_trans *trans;
3621 trans = nft_trans_alloc(ctx, msg_type, sizeof(struct nft_trans_elem));
3625 nft_trans_elem_set(trans) = set;
/* Allocate and initialise a set element.
 *
 * The element is a zeroed allocation of the backend's elemsize plus the
 * template length. The extension area is initialised from @tmpl, @key is
 * copied (set->klen bytes), and @data (set->dlen bytes), the expiration and
 * @timeout are filled in only when the template contains the corresponding
 * extension.
 *
 * NOTE(review): the allocation failure check, the value assigned to the
 * expiration and the return statement are not shown in this listing.
 */
3629 void *nft_set_elem_init(const struct nft_set *set,
3630 const struct nft_set_ext_tmpl *tmpl,
3631 const u32 *key, const u32 *data,
3632 u64 timeout, gfp_t gfp)
3634 struct nft_set_ext *ext;
3637 elem = kzalloc(set->ops->elemsize + tmpl->len, gfp);
3641 ext = nft_set_elem_ext(set, elem);
3642 nft_set_ext_init(ext, tmpl);
3644 memcpy(nft_set_ext_key(ext), key, set->klen);
3645 if (nft_set_ext_exists(ext, NFT_SET_EXT_DATA))
3646 memcpy(nft_set_ext_data(ext), data, set->dlen);
3647 if (nft_set_ext_exists(ext, NFT_SET_EXT_EXPIRATION))
3648 *nft_set_ext_expiration(ext) =
3650 if (nft_set_ext_exists(ext, NFT_SET_EXT_TIMEOUT))
3651 *nft_set_ext_timeout(ext) = timeout;
/* Release everything a set element refers to: the key, the data (if
 * present, released according to the set's dtype), the expression (only
 * when destroy_expr is set and the extension exists) and the use count of
 * a referenced object.
 * NOTE(review): the declaration of the destroy_expr parameter and any final
 * statements of the body are not shown in this listing.
 */
3656 void nft_set_elem_destroy(const struct nft_set *set, void *elem,
3659 struct nft_set_ext *ext = nft_set_elem_ext(set, elem);
3661 nft_data_release(nft_set_ext_key(ext), NFT_DATA_VALUE);
3662 if (nft_set_ext_exists(ext, NFT_SET_EXT_DATA))
3663 nft_data_release(nft_set_ext_data(ext), set->dtype);
3664 if (destroy_expr && nft_set_ext_exists(ext, NFT_SET_EXT_EXPR))
3665 nf_tables_expr_destroy(NULL, nft_set_ext_expr(ext));
3666 if (nft_set_ext_exists(ext, NFT_SET_EXT_OBJREF))
3667 (*nft_set_ext_obj(ext))->use--;
3670 EXPORT_SYMBOL_GPL(nft_set_elem_destroy);
/* Destroy the expression attached to an element, if any. Unlike
 * nft_set_elem_destroy(), the visible statements do not touch the key,
 * data or object reference.
 * NOTE(review): any further statements of the body are not shown in this
 * listing.
 */
3672 /* Only called from commit path, nft_set_elem_deactivate() already deals with
3673 * the refcounting from the preparation phase.
3675 static void nf_tables_set_elem_destroy(const struct nft_set *set, void *elem)
3677 struct nft_set_ext *ext = nft_set_elem_ext(set, elem);
3679 if (nft_set_ext_exists(ext, NFT_SET_EXT_EXPR))
3680 nf_tables_expr_destroy(NULL, nft_set_ext_expr(ext));
/* Parse the element flags attribute into *flags and validate it: only
 * NFT_SET_ELEM_INTERVAL_END is an accepted bit, and that bit is accepted
 * only for sets created with NFT_SET_INTERVAL.
 * NOTE(review): the handling of a missing attribute and the returned error
 * codes are not shown in this listing.
 */
3684 static int nft_setelem_parse_flags(const struct nft_set *set,
3685 const struct nlattr *attr, u32 *flags)
3690 *flags = ntohl(nla_get_be32(attr));
3691 if (*flags & ~NFT_SET_ELEM_INTERVAL_END)
3693 if (!(set->flags & NFT_SET_INTERVAL) &&
3694 *flags & NFT_SET_ELEM_INTERVAL_END)
/* Parse one element attribute and add the element to @set as part of the
 * pending transaction.
 *
 * Steps visible in this listing, in order:
 *  - parse the nested attributes against nft_set_elem_policy and require a
 *    key;
 *  - parse the flags and apply the data-presence rules for maps versus
 *    interval-end elements;
 *  - resolve the timeout: explicit attribute (only for NFT_SET_TIMEOUT
 *    sets, converted from milliseconds to jiffies), else the set default;
 *  - initialise the key and check that it is an NFT_DATA_VALUE of exactly
 *    set->klen bytes;
 *  - build the extension template (key, expiration, per-element timeout
 *    when it differs from the set default, object reference, data,
 *    userdata);
 *  - for data, check the length against set->dlen for non-verdict sets and
 *    validate the register store against every map binding of the set;
 *  - allocate the element and the NFT_MSG_NEWSETELEM transaction, mark the
 *    element busy in the current generation and insert it via the backend;
 *  - on -EEXIST, compare presence and contents of data/object reference
 *    with the existing element, taking NLM_F_EXCL into account;
 *  - account the element against the set size with atomic_add_unless() and
 *    queue the transaction on the commit list.
 * The trailing remove/release calls belong to the error unwinding path.
 *
 * NOTE(review): error codes, goto labels and several guards are on lines
 * not shown in this listing, so the exact failure behaviour cannot be
 * confirmed from here.
 */
3700 static int nft_add_set_elem(struct nft_ctx *ctx, struct nft_set *set,
3701 const struct nlattr *attr, u32 nlmsg_flags)
3703 struct nlattr *nla[NFTA_SET_ELEM_MAX + 1];
3704 u8 genmask = nft_genmask_next(ctx->net);
3705 struct nft_data_desc d1, d2;
3706 struct nft_set_ext_tmpl tmpl;
3707 struct nft_set_ext *ext, *ext2;
3708 struct nft_set_elem elem;
3709 struct nft_set_binding *binding;
3710 struct nft_object *obj = NULL;
3711 struct nft_userdata *udata;
3712 struct nft_data data;
3713 enum nft_registers dreg;
3714 struct nft_trans *trans;
3720 err = nla_parse_nested(nla, NFTA_SET_ELEM_MAX, attr,
3721 nft_set_elem_policy, NULL);
3725 if (nla[NFTA_SET_ELEM_KEY] == NULL)
3728 nft_set_ext_prepare(&tmpl);
3730 err = nft_setelem_parse_flags(set, nla[NFTA_SET_ELEM_FLAGS], &flags);
3734 nft_set_ext_add(&tmpl, NFT_SET_EXT_FLAGS);
3736 if (set->flags & NFT_SET_MAP) {
3737 if (nla[NFTA_SET_ELEM_DATA] == NULL &&
3738 !(flags & NFT_SET_ELEM_INTERVAL_END))
3740 if (nla[NFTA_SET_ELEM_DATA] != NULL &&
3741 flags & NFT_SET_ELEM_INTERVAL_END)
3744 if (nla[NFTA_SET_ELEM_DATA] != NULL)
3749 if (nla[NFTA_SET_ELEM_TIMEOUT] != NULL) {
3750 if (!(set->flags & NFT_SET_TIMEOUT))
3752 timeout = msecs_to_jiffies(be64_to_cpu(nla_get_be64(
3753 nla[NFTA_SET_ELEM_TIMEOUT])));
3754 } else if (set->flags & NFT_SET_TIMEOUT) {
3755 timeout = set->timeout;
3758 err = nft_data_init(ctx, &elem.key.val, sizeof(elem.key), &d1,
3759 nla[NFTA_SET_ELEM_KEY]);
3763 if (d1.type != NFT_DATA_VALUE || d1.len != set->klen)
3766 nft_set_ext_add_length(&tmpl, NFT_SET_EXT_KEY, d1.len);
3768 nft_set_ext_add(&tmpl, NFT_SET_EXT_EXPIRATION);
3769 if (timeout != set->timeout)
3770 nft_set_ext_add(&tmpl, NFT_SET_EXT_TIMEOUT);
3773 if (nla[NFTA_SET_ELEM_OBJREF] != NULL) {
3774 if (!(set->flags & NFT_SET_OBJECT)) {
3778 obj = nf_tables_obj_lookup(ctx->table, nla[NFTA_SET_ELEM_OBJREF],
3779 set->objtype, genmask);
3784 nft_set_ext_add(&tmpl, NFT_SET_EXT_OBJREF);
3787 if (nla[NFTA_SET_ELEM_DATA] != NULL) {
3788 err = nft_data_init(ctx, &data, sizeof(data), &d2,
3789 nla[NFTA_SET_ELEM_DATA]);
3794 if (set->dtype != NFT_DATA_VERDICT && d2.len != set->dlen)
3797 dreg = nft_type_to_reg(set->dtype);
3798 list_for_each_entry(binding, &set->bindings, list) {
3799 struct nft_ctx bind_ctx = {
3802 .table = ctx->table,
3803 .chain = (struct nft_chain *)binding->chain,
3806 if (!(binding->flags & NFT_SET_MAP))
3809 err = nft_validate_register_store(&bind_ctx, dreg,
3816 nft_set_ext_add_length(&tmpl, NFT_SET_EXT_DATA, d2.len);
3819 /* The full maximum length of userdata can exceed the maximum
3820 * offset value (U8_MAX) for following extensions, therefor it
3821 * must be the last extension added.
3824 if (nla[NFTA_SET_ELEM_USERDATA] != NULL) {
3825 ulen = nla_len(nla[NFTA_SET_ELEM_USERDATA]);
3827 nft_set_ext_add_length(&tmpl, NFT_SET_EXT_USERDATA,
3832 elem.priv = nft_set_elem_init(set, &tmpl, elem.key.val.data, data.data,
3833 timeout, GFP_KERNEL);
3834 if (elem.priv == NULL)
3837 ext = nft_set_elem_ext(set, elem.priv);
3839 *nft_set_ext_flags(ext) = flags;
3841 udata = nft_set_ext_userdata(ext);
3842 udata->len = ulen - 1;
3843 nla_memcpy(&udata->data, nla[NFTA_SET_ELEM_USERDATA], ulen);
3846 *nft_set_ext_obj(ext) = obj;
3850 trans = nft_trans_elem_alloc(ctx, NFT_MSG_NEWSETELEM, set);
3854 ext->genmask = nft_genmask_cur(ctx->net) | NFT_SET_ELEM_BUSY_MASK;
3855 err = set->ops->insert(ctx->net, set, &elem, &ext2);
3857 if (err == -EEXIST) {
3858 if (nft_set_ext_exists(ext, NFT_SET_EXT_DATA) ^
3859 nft_set_ext_exists(ext2, NFT_SET_EXT_DATA) ||
3860 nft_set_ext_exists(ext, NFT_SET_EXT_OBJREF) ^
3861 nft_set_ext_exists(ext2, NFT_SET_EXT_OBJREF))
3863 if ((nft_set_ext_exists(ext, NFT_SET_EXT_DATA) &&
3864 nft_set_ext_exists(ext2, NFT_SET_EXT_DATA) &&
3865 memcmp(nft_set_ext_data(ext),
3866 nft_set_ext_data(ext2), set->dlen) != 0) ||
3867 (nft_set_ext_exists(ext, NFT_SET_EXT_OBJREF) &&
3868 nft_set_ext_exists(ext2, NFT_SET_EXT_OBJREF) &&
3869 *nft_set_ext_obj(ext) != *nft_set_ext_obj(ext2)))
3871 else if (!(nlmsg_flags & NLM_F_EXCL))
3878 !atomic_add_unless(&set->nelems, 1, set->size + set->ndeact)) {
3883 nft_trans_elem(trans) = elem;
3884 list_add_tail(&trans->list, &ctx->net->nft.commit_list);
3888 set->ops->remove(ctx->net, set, &elem);
3894 if (nla[NFTA_SET_ELEM_DATA] != NULL)
3895 nft_data_release(&data, d2.type);
3897 nft_data_release(&elem.key.val, d1.type);
/* Handler for a "new set elements" request.
 *
 * Requires the element list attribute, builds the context, resolves the
 * set by name and, when NFTA_SET_ELEM_LIST_SET_ID is supplied, by
 * transaction id. A bound set flagged NFT_SET_CONSTANT is checked before
 * any element is processed. Each nested element is then handed to
 * nft_add_set_elem() together with the request's netlink flags.
 *
 * NOTE(review): the condition under which the by-id lookup is attempted,
 * the statements guarded by the checks and the loop's error handling are
 * not shown in this listing.
 */
3902 static int nf_tables_newsetelem(struct net *net, struct sock *nlsk,
3903 struct sk_buff *skb, const struct nlmsghdr *nlh,
3904 const struct nlattr * const nla[],
3905 struct netlink_ext_ack *extack)
3907 u8 genmask = nft_genmask_next(net);
3908 const struct nlattr *attr;
3909 struct nft_set *set;
3913 if (nla[NFTA_SET_ELEM_LIST_ELEMENTS] == NULL)
3916 err = nft_ctx_init_from_elemattr(&ctx, net, skb, nlh, nla, genmask);
3920 set = nf_tables_set_lookup(ctx.table, nla[NFTA_SET_ELEM_LIST_SET],
3923 if (nla[NFTA_SET_ELEM_LIST_SET_ID]) {
3924 set = nf_tables_set_lookup_byid(net,
3925 nla[NFTA_SET_ELEM_LIST_SET_ID],
3929 return PTR_ERR(set);
3932 if (!list_empty(&set->bindings) && set->flags & NFT_SET_CONSTANT)
3935 nla_for_each_nested(attr, nla[NFTA_SET_ELEM_LIST_ELEMENTS], rem) {
3936 err = nft_add_set_elem(&ctx, set, attr, nlh->nlmsg_flags);
3944 * nft_data_hold - hold a nft_data item
3946 * @data: struct nft_data to hold
3947 * @type: type of data
3949 * Hold a nft_data item. NFT_DATA_VALUE types can be silently discarded,
3950 * NFT_DATA_VERDICT bumps the reference to chains in case of NFT_JUMP and
3951 * NFT_GOTO verdicts. This function must be called on active data objects
3952 * from the second phase of the commit protocol.
/* For verdict data, increment the use counter of the chain the verdict
 * refers to; other data types are left untouched.
 * NOTE(review): the case labels selecting which verdict codes take the
 * reference are not shown in this listing.
 */
3954 static void nft_data_hold(const struct nft_data *data, enum nft_data_types type)
3956 if (type == NFT_DATA_VERDICT) {
3957 switch (data->verdict.code) {
3960 data->verdict.chain->use++;
/* Take the references an element implies: hold its data (according to the
 * set's dtype) and increment the use counter of a referenced object.
 * Counterpart of nft_set_elem_deactivate().
 */
3966 static void nft_set_elem_activate(const struct net *net,
3967 const struct nft_set *set,
3968 struct nft_set_elem *elem)
3970 const struct nft_set_ext *ext = nft_set_elem_ext(set, elem->priv);
3972 if (nft_set_ext_exists(ext, NFT_SET_EXT_DATA))
3973 nft_data_hold(nft_set_ext_data(ext), set->dtype);
3974 if (nft_set_ext_exists(ext, NFT_SET_EXT_OBJREF))
3975 (*nft_set_ext_obj(ext))->use++;
/* Drop the references an element implies: release its data (according to
 * the set's dtype) and decrement the use counter of a referenced object.
 * Counterpart of nft_set_elem_activate().
 */
3978 static void nft_set_elem_deactivate(const struct net *net,
3979 const struct nft_set *set,
3980 struct nft_set_elem *elem)
3982 const struct nft_set_ext *ext = nft_set_elem_ext(set, elem->priv);
3984 if (nft_set_ext_exists(ext, NFT_SET_EXT_DATA))
3985 nft_data_release(nft_set_ext_data(ext), set->dtype);
3986 if (nft_set_ext_exists(ext, NFT_SET_EXT_OBJREF))
3987 (*nft_set_ext_obj(ext))->use--;
/* Parse one element attribute and schedule deletion of the matching
 * element of @set.
 *
 * A temporary element carrying only the key (and flags) is built from the
 * request, an NFT_MSG_DELSETELEM transaction is allocated, and the backend
 * is asked to deactivate the matching element. The element's references
 * are then dropped with nft_set_elem_deactivate() and the transaction is
 * queued on the commit list. The trailing nft_data_release() of the key
 * belongs to the error unwinding path.
 *
 * NOTE(review): how the result of ->deactivate() ("priv") is used, the
 * error codes and the goto labels are not shown in this listing.
 */
3990 static int nft_del_setelem(struct nft_ctx *ctx, struct nft_set *set,
3991 const struct nlattr *attr)
3993 struct nlattr *nla[NFTA_SET_ELEM_MAX + 1];
3994 struct nft_set_ext_tmpl tmpl;
3995 struct nft_data_desc desc;
3996 struct nft_set_elem elem;
3997 struct nft_set_ext *ext;
3998 struct nft_trans *trans;
4003 err = nla_parse_nested(nla, NFTA_SET_ELEM_MAX, attr,
4004 nft_set_elem_policy, NULL);
4009 if (nla[NFTA_SET_ELEM_KEY] == NULL)
4012 nft_set_ext_prepare(&tmpl);
4014 err = nft_setelem_parse_flags(set, nla[NFTA_SET_ELEM_FLAGS], &flags);
4018 nft_set_ext_add(&tmpl, NFT_SET_EXT_FLAGS);
4020 err = nft_data_init(ctx, &elem.key.val, sizeof(elem.key), &desc,
4021 nla[NFTA_SET_ELEM_KEY]);
/* The key must be a plain value of exactly the set's key length. */
4026 if (desc.type != NFT_DATA_VALUE || desc.len != set->klen)
4029 nft_set_ext_add_length(&tmpl, NFT_SET_EXT_KEY, desc.len);
/* No data and a zero timeout: this element only serves as a lookup key. */
4032 elem.priv = nft_set_elem_init(set, &tmpl, elem.key.val.data, NULL, 0,
4034 if (elem.priv == NULL)
4037 ext = nft_set_elem_ext(set, elem.priv);
4039 *nft_set_ext_flags(ext) = flags;
4041 trans = nft_trans_elem_alloc(ctx, NFT_MSG_DELSETELEM, set);
4042 if (trans == NULL) {
4047 priv = set->ops->deactivate(ctx->net, set, &elem);
4055 nft_set_elem_deactivate(ctx->net, set, &elem);
4057 nft_trans_elem(trans) = elem;
4058 list_add_tail(&trans->list, &ctx->net->nft.commit_list);
4066 nft_data_release(&elem.key.val, desc.type);
/* Per-element walk callback used when flushing a whole set (installed as
 * iter.fn by nf_tables_delsetelem()).
 *
 * Allocates an NFT_MSG_DELSETELEM transaction with GFP_ATOMIC, asks the
 * backend to flush the element and, on the path where the transaction is
 * kept, records the set and a copy of the element in it and queues it on
 * the commit list.
 *
 * NOTE(review): the handling of allocation failure and of a false return
 * from ->flush() is not shown in this listing.
 */
4071 static int nft_flush_set(const struct nft_ctx *ctx,
4072 struct nft_set *set,
4073 const struct nft_set_iter *iter,
4074 struct nft_set_elem *elem)
4076 struct nft_trans *trans;
4079 trans = nft_trans_alloc_gfp(ctx, NFT_MSG_DELSETELEM,
4080 sizeof(struct nft_trans_elem), GFP_ATOMIC);
4084 if (!set->ops->flush(ctx->net, set, elem->priv)) {
4090 nft_trans_elem_set(trans) = set;
4091 nft_trans_elem(trans) = *elem;
4092 list_add_tail(&trans->list, &ctx->net->nft.commit_list);
/* Handler for a "delete set elements" request.
 *
 * Builds the context, looks the set up by name using the next-generation
 * mask and checks for a bound NFT_SET_CONSTANT set. Without an element
 * list attribute the whole set is walked with nft_flush_set() as callback;
 * otherwise each nested element is passed to nft_del_setelem().
 *
 * NOTE(review): the statements guarded by the checks, the remaining
 * iterator fields and the return values are not shown in this listing.
 */
4100 static int nf_tables_delsetelem(struct net *net, struct sock *nlsk,
4101 struct sk_buff *skb, const struct nlmsghdr *nlh,
4102 const struct nlattr * const nla[],
4103 struct netlink_ext_ack *extack)
4105 u8 genmask = nft_genmask_next(net);
4106 const struct nlattr *attr;
4107 struct nft_set *set;
4111 err = nft_ctx_init_from_elemattr(&ctx, net, skb, nlh, nla, genmask);
4115 set = nf_tables_set_lookup(ctx.table, nla[NFTA_SET_ELEM_LIST_SET],
4118 return PTR_ERR(set);
4119 if (!list_empty(&set->bindings) && set->flags & NFT_SET_CONSTANT)
4122 if (nla[NFTA_SET_ELEM_LIST_ELEMENTS] == NULL) {
4123 struct nft_set_iter iter = {
4125 .fn = nft_flush_set,
4127 set->ops->walk(&ctx, set, &iter);
4132 nla_for_each_nested(attr, nla[NFTA_SET_ELEM_LIST_ELEMENTS], rem) {
4133 err = nft_del_setelem(&ctx, set, attr);
/* RCU callback releasing a garbage-collection batch: recovers the batch
 * from its embedded rcu_head and destroys each of its head.cnt elements,
 * including their expressions (destroy_expr is true).
 * NOTE(review): any statement releasing the batch itself is not shown in
 * this listing.
 */
4142 void nft_set_gc_batch_release(struct rcu_head *rcu)
4144 struct nft_set_gc_batch *gcb;
4147 gcb = container_of(rcu, struct nft_set_gc_batch, head.rcu);
4148 for (i = 0; i < gcb->head.cnt; i++)
4149 nft_set_elem_destroy(gcb->head.set, gcb->elems[i], true);
4152 EXPORT_SYMBOL_GPL(nft_set_gc_batch_release);
/* Allocate a zeroed garbage-collection batch and associate it with @set.
 * NOTE(review): the gfp parameter declaration, the allocation failure
 * check and the return statement are not shown in this listing.
 */
4154 struct nft_set_gc_batch *nft_set_gc_batch_alloc(const struct nft_set *set,
4157 struct nft_set_gc_batch *gcb;
4159 gcb = kzalloc(sizeof(*gcb), gfp);
4162 gcb->head.set = set;
4165 EXPORT_SYMBOL_GPL(nft_set_gc_batch_alloc);
4172 * nft_register_obj - register nf_tables stateful object type
4175 * Registers the object type for use with nf_tables. Returns zero on
4176 * success or a negative errno code otherwise.
/* Add @obj_type to the global nf_tables_objects list under the nfnetlink
 * subsystem lock. A type of NFT_OBJECT_UNSPEC is checked for first (the
 * statement taken in that case is not shown in this listing).
 */
4178 int nft_register_obj(struct nft_object_type *obj_type)
4180 if (obj_type->type == NFT_OBJECT_UNSPEC)
4183 nfnl_lock(NFNL_SUBSYS_NFTABLES);
4184 list_add_rcu(&obj_type->list, &nf_tables_objects);
4185 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
4188 EXPORT_SYMBOL_GPL(nft_register_obj);
4191 * nft_unregister_obj - unregister nf_tables object type
4194 * Unregisters the object type for use with nf_tables.
/* Remove @obj_type from the list of registered object types (RCU-aware
 * removal) while holding the nfnetlink subsystem lock.
 */
4196 void nft_unregister_obj(struct nft_object_type *obj_type)
4198 nfnl_lock(NFNL_SUBSYS_NFTABLES);
4199 list_del_rcu(&obj_type->list);
4200 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
4202 EXPORT_SYMBOL_GPL(nft_unregister_obj);
/* Find an object in @table whose name equals the string attribute @nla,
 * whose type equals @objtype and which is active in the generation given
 * by @genmask. Returns ERR_PTR(-ENOENT) when no object matches.
 * NOTE(review): the statement returning the matching object is not shown
 * in this listing.
 */
4204 struct nft_object *nf_tables_obj_lookup(const struct nft_table *table,
4205 const struct nlattr *nla,
4206 u32 objtype, u8 genmask)
4208 struct nft_object *obj;
4210 list_for_each_entry(obj, &table->objects, list) {
4211 if (!nla_strcmp(nla, obj->name) &&
4212 objtype == obj->type->type &&
4213 nft_active_genmask(obj, genmask))
4216 return ERR_PTR(-ENOENT);
4218 EXPORT_SYMBOL_GPL(nf_tables_obj_lookup);
/* Netlink attribute policy for stateful objects (NFTA_OBJ_*): table and
 * object names are bounded strings, the type is a 32-bit value and the
 * type-specific data is a nested attribute.
 */
4220 static const struct nla_policy nft_obj_policy[NFTA_OBJ_MAX + 1] = {
4221 [NFTA_OBJ_TABLE] = { .type = NLA_STRING,
4222 .len = NFT_TABLE_MAXNAMELEN - 1 },
4223 [NFTA_OBJ_NAME] = { .type = NLA_STRING,
4224 .len = NFT_OBJ_MAXNAMELEN - 1 },
4225 [NFTA_OBJ_TYPE] = { .type = NLA_U32 },
4226 [NFTA_OBJ_DATA] = { .type = NLA_NESTED },
/* Create an object of the given type from its nested data attribute.
 *
 * The attribute table is a variable-length array sized by the type's
 * maxattr. It is either filled by parsing @attr against the type's policy
 * or cleared with memset (the condition choosing between the two is not
 * shown in this listing). The object is a zeroed allocation of the generic
 * header plus the type's private size, initialised by the type's init
 * operation. Failures are returned as ERR_PTR(err).
 */
4229 static struct nft_object *nft_obj_init(const struct nft_ctx *ctx,
4230 const struct nft_object_type *type,
4231 const struct nlattr *attr)
4233 struct nlattr *tb[type->maxattr + 1];
4234 struct nft_object *obj;
4238 err = nla_parse_nested(tb, type->maxattr, attr, type->policy,
4243 memset(tb, 0, sizeof(tb[0]) * (type->maxattr + 1));
4247 obj = kzalloc(sizeof(struct nft_object) + type->size, GFP_KERNEL);
4251 err = type->init(ctx, (const struct nlattr * const *)tb, obj);
4260 return ERR_PTR(err);
/* Dump an object's type-specific state into @skb as a nested attribute of
 * type @attr by calling the object type's dump operation; @reset is passed
 * through to that operation.
 * NOTE(review): the failure label and return values are not shown in this
 * listing.
 */
4263 static int nft_object_dump(struct sk_buff *skb, unsigned int attr,
4264 struct nft_object *obj, bool reset)
4266 struct nlattr *nest;
4268 nest = nla_nest_start(skb, attr);
4270 goto nla_put_failure;
4271 if (obj->type->dump(skb, obj, reset) < 0)
4272 goto nla_put_failure;
4273 nla_nest_end(skb, nest);
/* Search the registered object types (nf_tables_objects) for one whose
 * type equals @objtype.
 * NOTE(review): the return statements are not shown in this listing.
 */
4280 static const struct nft_object_type *__nft_obj_type_get(u32 objtype)
4282 const struct nft_object_type *type;
4284 list_for_each_entry(type, &nf_tables_objects, list) {
4285 if (objtype == type->type)
/* Look up an object type and take a reference on its owning module.
 *
 * With CONFIG_MODULES, the nfnetlink subsystem lock is dropped around a
 * request_module("nft-obj-%u") call and re-taken afterwards; if the type is
 * registered at that point, ERR_PTR(-EAGAIN) is returned.
 * ERR_PTR(-ENOENT) is the final fallback.
 *
 * NOTE(review): the successful return and the condition guarding the
 * module request are not shown in this listing.
 */
4291 static const struct nft_object_type *nft_obj_type_get(u32 objtype)
4293 const struct nft_object_type *type;
4295 type = __nft_obj_type_get(objtype);
4296 if (type != NULL && try_module_get(type->owner))
4299 #ifdef CONFIG_MODULES
4301 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
4302 request_module("nft-obj-%u", objtype);
4303 nfnl_lock(NFNL_SUBSYS_NFTABLES);
4304 if (__nft_obj_type_get(objtype))
4305 return ERR_PTR(-EAGAIN);
4308 return ERR_PTR(-ENOENT);
/* Handler for a "new object" request.
 *
 * Requires the type, name and data attributes, resolves the address family
 * (passing true as the lookup's last argument) and the table, and looks
 * for an existing object of that name and type. Otherwise it gets the
 * object type, creates the object from NFTA_OBJ_DATA, copies the name,
 * records an NFT_MSG_NEWOBJ transaction and appends the object to the
 * table's object list. The trailing destroy/module_put calls belong to the
 * error unwinding path.
 *
 * NOTE(review): the branches taken when the object already exists
 * (including the NLM_F_EXCL case), the error codes and the goto labels are
 * not shown in this listing.
 */
4311 static int nf_tables_newobj(struct net *net, struct sock *nlsk,
4312 struct sk_buff *skb, const struct nlmsghdr *nlh,
4313 const struct nlattr * const nla[],
4314 struct netlink_ext_ack *extack)
4316 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
4317 const struct nft_object_type *type;
4318 u8 genmask = nft_genmask_next(net);
4319 int family = nfmsg->nfgen_family;
4320 struct nft_af_info *afi;
4321 struct nft_table *table;
4322 struct nft_object *obj;
4327 if (!nla[NFTA_OBJ_TYPE] ||
4328 !nla[NFTA_OBJ_NAME] ||
4329 !nla[NFTA_OBJ_DATA])
4332 afi = nf_tables_afinfo_lookup(net, family, true);
4334 return PTR_ERR(afi);
4336 table = nf_tables_table_lookup(afi, nla[NFTA_OBJ_TABLE], genmask);
4338 return PTR_ERR(table);
4340 objtype = ntohl(nla_get_be32(nla[NFTA_OBJ_TYPE]));
4341 obj = nf_tables_obj_lookup(table, nla[NFTA_OBJ_NAME], objtype, genmask);
4348 if (nlh->nlmsg_flags & NLM_F_EXCL)
4354 nft_ctx_init(&ctx, net, skb, nlh, afi, table, NULL, nla);
4356 type = nft_obj_type_get(objtype);
4358 return PTR_ERR(type);
4360 obj = nft_obj_init(&ctx, type, nla[NFTA_OBJ_DATA]);
4366 nla_strlcpy(obj->name, nla[NFTA_OBJ_NAME], NFT_OBJ_MAXNAMELEN);
4368 err = nft_trans_obj_add(&ctx, NFT_MSG_NEWOBJ, obj);
4372 list_add_tail_rcu(&obj->list, &table->objects);
/* The destroy operation is optional for an object type. */
4376 if (obj->type->destroy)
4377 obj->type->destroy(obj);
4380 module_put(type->owner);
/* Build a netlink message describing one stateful object.
 *
 * Writes the nfnetlink header (given family, NFNETLINK_V0, low 16 bits of
 * base_seq as res_id) followed by the table name, object name, object
 * type, use counter and the nested type-specific dump; @reset is passed on
 * to nft_object_dump(). The nlmsg_trim() call belongs to the failure path
 * (label and return values not shown in this listing).
 */
4384 static int nf_tables_fill_obj_info(struct sk_buff *skb, struct net *net,
4385 u32 portid, u32 seq, int event, u32 flags,
4386 int family, const struct nft_table *table,
4387 struct nft_object *obj, bool reset)
4389 struct nfgenmsg *nfmsg;
4390 struct nlmsghdr *nlh;
4392 event = nfnl_msg_type(NFNL_SUBSYS_NFTABLES, event);
4393 nlh = nlmsg_put(skb, portid, seq, event, sizeof(struct nfgenmsg), flags);
4395 goto nla_put_failure;
4397 nfmsg = nlmsg_data(nlh);
4398 nfmsg->nfgen_family = family;
4399 nfmsg->version = NFNETLINK_V0;
4400 nfmsg->res_id = htons(net->nft.base_seq & 0xffff);
4402 if (nla_put_string(skb, NFTA_OBJ_TABLE, table->name) ||
4403 nla_put_string(skb, NFTA_OBJ_NAME, obj->name) ||
4404 nla_put_be32(skb, NFTA_OBJ_TYPE, htonl(obj->type->type)) ||
4405 nla_put_be32(skb, NFTA_OBJ_USE, htonl(obj->use)) ||
4406 nft_object_dump(skb, NFTA_OBJ_DATA, obj, reset))
4407 goto nla_put_failure;
4409 nlmsg_end(skb, nlh);
4413 nlmsg_trim(skb, nlh);
/* Optional filter for object dumps: the table name to restrict the dump
 * to. nft_obj_filter_alloc() and nf_tables_dump_obj() also use a "type"
 * member, whose declaration is not shown in this listing.
 * NOTE(review): the table buffer is sized with NFT_OBJ_MAXNAMELEN, while
 * nft_obj_filter_alloc() bounds the copy with NFT_TABLE_MAXNAMELEN -
 * confirm the two constants cannot diverge, or size the buffer by the
 * table name limit.
 */
4417 struct nft_obj_filter {
4418 char table[NFT_OBJ_MAXNAMELEN];
/* Netlink dump callback for stateful objects.
 *
 * Iterates (RCU list iteration) over every address family matching the
 * request's family (NFPROTO_UNSPEC matches all), every table and every
 * object. Objects inactive in the namespace are checked for, and the
 * optional filter from cb->data restricts the dump by table name and by
 * object type. Each selected object is emitted with
 * nf_tables_fill_obj_info() as an NFT_MSG_NEWOBJ-style multipart message.
 * A request of type NFT_MSG_GETOBJ_RESET is detected up front.
 *
 * NOTE(review): the index bookkeeping against s_idx, the assignment of
 * "reset", the skip/continue statements and the return value are not shown
 * in this listing.
 */
4422 static int nf_tables_dump_obj(struct sk_buff *skb, struct netlink_callback *cb)
4424 const struct nfgenmsg *nfmsg = nlmsg_data(cb->nlh);
4425 const struct nft_af_info *afi;
4426 const struct nft_table *table;
4427 unsigned int idx = 0, s_idx = cb->args[0];
4428 struct nft_obj_filter *filter = cb->data;
4429 struct net *net = sock_net(skb->sk);
4430 int family = nfmsg->nfgen_family;
4431 struct nft_object *obj;
4434 if (NFNL_MSG_TYPE(cb->nlh->nlmsg_type) == NFT_MSG_GETOBJ_RESET)
4438 cb->seq = net->nft.base_seq;
4440 list_for_each_entry_rcu(afi, &net->nft.af_info, list) {
4441 if (family != NFPROTO_UNSPEC && family != afi->family)
4444 list_for_each_entry_rcu(table, &afi->tables, list) {
4445 list_for_each_entry_rcu(obj, &table->objects, list) {
4446 if (!nft_is_active(net, obj))
/* Clear every callback argument slot except the first. */
4451 memset(&cb->args[1], 0,
4452 sizeof(cb->args) - sizeof(cb->args[0]));
4453 if (filter && filter->table[0] &&
4454 strcmp(filter->table, table->name))
4457 filter->type != NFT_OBJECT_UNSPEC &&
4458 obj->type->type != filter->type)
4461 if (nf_tables_fill_obj_info(skb, net, NETLINK_CB(cb->skb).portid,
4464 NLM_F_MULTI | NLM_F_APPEND,
4465 afi->family, table, obj, reset) < 0)
4468 nl_dump_check_consistent(cb, nlmsg_hdr(skb));
/* Completion callback for the object dump; installed as .done of the
 * netlink_dump_control in nf_tables_getobj().
 * NOTE(review): the body is not shown in this listing.
 */
4481 static int nf_tables_dump_obj_done(struct netlink_callback *cb)
/* Allocate a zeroed object dump filter and populate it from the request:
 * the table name is copied when NFTA_OBJ_TABLE is present and the type is
 * read when NFTA_OBJ_TYPE is present. Returns ERR_PTR(-ENOMEM) on the
 * allocation failure path.
 * NOTE(review): the copy is bounded by NFT_TABLE_MAXNAMELEN, while the
 * destination buffer is declared with NFT_OBJ_MAXNAMELEN - confirm these
 * cannot diverge. The successful return is not shown in this listing.
 */
4488 static struct nft_obj_filter *
4489 nft_obj_filter_alloc(const struct nlattr * const nla[])
4491 struct nft_obj_filter *filter;
4493 filter = kzalloc(sizeof(*filter), GFP_KERNEL);
4495 return ERR_PTR(-ENOMEM);
4497 if (nla[NFTA_OBJ_TABLE])
4498 nla_strlcpy(filter->table, nla[NFTA_OBJ_TABLE],
4499 NFT_TABLE_MAXNAMELEN);
4500 if (nla[NFTA_OBJ_TYPE])
4501 filter->type = ntohl(nla_get_be32(nla[NFTA_OBJ_TYPE]));
/* Handler for a "get object" request.
 *
 * For NLM_F_DUMP requests a netlink dump is started with
 * nf_tables_dump_obj()/_done() as callbacks; when a table or type
 * attribute is supplied, a filter is allocated first. Otherwise both name
 * and type are required, the address family, table and object are resolved
 * using the current-generation mask, a reply skb is allocated and filled
 * as an NFT_MSG_NEWOBJ message and unicast to the requesting port.
 * A request of type NFT_MSG_GETOBJ_RESET is detected before filling.
 *
 * NOTE(review): the hand-over of the filter to the dump control, the
 * assignment of "reset", error checks and the error unwinding path are not
 * shown in this listing.
 */
4506 static int nf_tables_getobj(struct net *net, struct sock *nlsk,
4507 struct sk_buff *skb, const struct nlmsghdr *nlh,
4508 const struct nlattr * const nla[],
4509 struct netlink_ext_ack *extack)
4511 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
4512 u8 genmask = nft_genmask_cur(net);
4513 int family = nfmsg->nfgen_family;
4514 const struct nft_af_info *afi;
4515 const struct nft_table *table;
4516 struct nft_object *obj;
4517 struct sk_buff *skb2;
4522 if (nlh->nlmsg_flags & NLM_F_DUMP) {
4523 struct netlink_dump_control c = {
4524 .dump = nf_tables_dump_obj,
4525 .done = nf_tables_dump_obj_done,
4528 if (nla[NFTA_OBJ_TABLE] ||
4529 nla[NFTA_OBJ_TYPE]) {
4530 struct nft_obj_filter *filter;
4532 filter = nft_obj_filter_alloc(nla);
4538 return netlink_dump_start(nlsk, skb, nlh, &c);
4541 if (!nla[NFTA_OBJ_NAME] ||
4542 !nla[NFTA_OBJ_TYPE])
4545 afi = nf_tables_afinfo_lookup(net, family, false);
4547 return PTR_ERR(afi);
4549 table = nf_tables_table_lookup(afi, nla[NFTA_OBJ_TABLE], genmask);
4551 return PTR_ERR(table);
4553 objtype = ntohl(nla_get_be32(nla[NFTA_OBJ_TYPE]));
4554 obj = nf_tables_obj_lookup(table, nla[NFTA_OBJ_NAME], objtype, genmask);
4556 return PTR_ERR(obj);
4558 skb2 = alloc_skb(NLMSG_GOODSIZE, GFP_KERNEL);
4562 if (NFNL_MSG_TYPE(nlh->nlmsg_type) == NFT_MSG_GETOBJ_RESET)
4565 err = nf_tables_fill_obj_info(skb2, net, NETLINK_CB(skb).portid,
4566 nlh->nlmsg_seq, NFT_MSG_NEWOBJ, 0,
4567 family, table, obj, reset);
4571 return nlmsg_unicast(nlsk, skb2, NETLINK_CB(skb).portid);
4577 static void nft_obj_destroy(struct nft_object *obj)
4579 if (obj->type->destroy)
4580 obj->type->destroy(obj);
4582 module_put(obj->type->owner);
4586 static int nf_tables_delobj(struct net *net, struct sock *nlsk,
4587 struct sk_buff *skb, const struct nlmsghdr *nlh,
4588 const struct nlattr * const nla[],
4589 struct netlink_ext_ack *extack)
4591 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
4592 u8 genmask = nft_genmask_next(net);
4593 int family = nfmsg->nfgen_family;
4594 struct nft_af_info *afi;
4595 struct nft_table *table;
4596 struct nft_object *obj;
4600 if (!nla[NFTA_OBJ_TYPE] ||
4601 !nla[NFTA_OBJ_NAME])
4604 afi = nf_tables_afinfo_lookup(net, family, true);
4606 return PTR_ERR(afi);
4608 table = nf_tables_table_lookup(afi, nla[NFTA_OBJ_TABLE], genmask);
4610 return PTR_ERR(table);
4612 objtype = ntohl(nla_get_be32(nla[NFTA_OBJ_TYPE]));
4613 obj = nf_tables_obj_lookup(table, nla[NFTA_OBJ_NAME], objtype, genmask);
4615 return PTR_ERR(obj);
4619 nft_ctx_init(&ctx, net, skb, nlh, afi, table, NULL, nla);
4621 return nft_delobj(&ctx, obj);
4624 void nft_obj_notify(struct net *net, struct nft_table *table,
4625 struct nft_object *obj, u32 portid, u32 seq, int event,
4626 int family, int report, gfp_t gfp)
4628 struct sk_buff *skb;
4632 !nfnetlink_has_listeners(net, NFNLGRP_NFTABLES))
4635 skb = nlmsg_new(NLMSG_GOODSIZE, gfp);
4639 err = nf_tables_fill_obj_info(skb, net, portid, seq, event, 0, family,
4646 nfnetlink_send(skb, net, portid, NFNLGRP_NFTABLES, report, gfp);
4649 nfnetlink_set_err(net, portid, NFNLGRP_NFTABLES, -ENOBUFS);
4651 EXPORT_SYMBOL_GPL(nft_obj_notify);
4653 static void nf_tables_obj_notify(const struct nft_ctx *ctx,
4654 struct nft_object *obj, int event)
4656 nft_obj_notify(ctx->net, ctx->table, obj, ctx->portid, ctx->seq, event,
4657 ctx->afi->family, ctx->report, GFP_KERNEL);
4660 static int nf_tables_fill_gen_info(struct sk_buff *skb, struct net *net,
4661 u32 portid, u32 seq)
4663 struct nlmsghdr *nlh;
4664 struct nfgenmsg *nfmsg;
4665 int event = nfnl_msg_type(NFNL_SUBSYS_NFTABLES, NFT_MSG_NEWGEN);
4667 nlh = nlmsg_put(skb, portid, seq, event, sizeof(struct nfgenmsg), 0);
4669 goto nla_put_failure;
4671 nfmsg = nlmsg_data(nlh);
4672 nfmsg->nfgen_family = AF_UNSPEC;
4673 nfmsg->version = NFNETLINK_V0;
4674 nfmsg->res_id = htons(net->nft.base_seq & 0xffff);
4676 if (nla_put_be32(skb, NFTA_GEN_ID, htonl(net->nft.base_seq)))
4677 goto nla_put_failure;
4679 nlmsg_end(skb, nlh);
4683 nlmsg_trim(skb, nlh);
4687 static void nf_tables_gen_notify(struct net *net, struct sk_buff *skb,
4690 struct nlmsghdr *nlh = nlmsg_hdr(skb);
4691 struct sk_buff *skb2;
4694 if (nlmsg_report(nlh) &&
4695 !nfnetlink_has_listeners(net, NFNLGRP_NFTABLES))
4698 skb2 = nlmsg_new(NLMSG_GOODSIZE, GFP_KERNEL);
4702 err = nf_tables_fill_gen_info(skb2, net, NETLINK_CB(skb).portid,
4709 nfnetlink_send(skb2, net, NETLINK_CB(skb).portid, NFNLGRP_NFTABLES,
4710 nlmsg_report(nlh), GFP_KERNEL);
4713 nfnetlink_set_err(net, NETLINK_CB(skb).portid, NFNLGRP_NFTABLES,
4717 static int nf_tables_getgen(struct net *net, struct sock *nlsk,
4718 struct sk_buff *skb, const struct nlmsghdr *nlh,
4719 const struct nlattr * const nla[],
4720 struct netlink_ext_ack *extack)
4722 struct sk_buff *skb2;
4725 skb2 = alloc_skb(NLMSG_GOODSIZE, GFP_KERNEL);
4729 err = nf_tables_fill_gen_info(skb2, net, NETLINK_CB(skb).portid,
4734 return nlmsg_unicast(nlsk, skb2, NETLINK_CB(skb).portid);
4740 static const struct nfnl_callback nf_tables_cb[NFT_MSG_MAX] = {
4741 [NFT_MSG_NEWTABLE] = {
4742 .call_batch = nf_tables_newtable,
4743 .attr_count = NFTA_TABLE_MAX,
4744 .policy = nft_table_policy,
4746 [NFT_MSG_GETTABLE] = {
4747 .call = nf_tables_gettable,
4748 .attr_count = NFTA_TABLE_MAX,
4749 .policy = nft_table_policy,
4751 [NFT_MSG_DELTABLE] = {
4752 .call_batch = nf_tables_deltable,
4753 .attr_count = NFTA_TABLE_MAX,
4754 .policy = nft_table_policy,
4756 [NFT_MSG_NEWCHAIN] = {
4757 .call_batch = nf_tables_newchain,
4758 .attr_count = NFTA_CHAIN_MAX,
4759 .policy = nft_chain_policy,
4761 [NFT_MSG_GETCHAIN] = {
4762 .call = nf_tables_getchain,
4763 .attr_count = NFTA_CHAIN_MAX,
4764 .policy = nft_chain_policy,
4766 [NFT_MSG_DELCHAIN] = {
4767 .call_batch = nf_tables_delchain,
4768 .attr_count = NFTA_CHAIN_MAX,
4769 .policy = nft_chain_policy,
4771 [NFT_MSG_NEWRULE] = {
4772 .call_batch = nf_tables_newrule,
4773 .attr_count = NFTA_RULE_MAX,
4774 .policy = nft_rule_policy,
4776 [NFT_MSG_GETRULE] = {
4777 .call = nf_tables_getrule,
4778 .attr_count = NFTA_RULE_MAX,
4779 .policy = nft_rule_policy,
4781 [NFT_MSG_DELRULE] = {
4782 .call_batch = nf_tables_delrule,
4783 .attr_count = NFTA_RULE_MAX,
4784 .policy = nft_rule_policy,
4786 [NFT_MSG_NEWSET] = {
4787 .call_batch = nf_tables_newset,
4788 .attr_count = NFTA_SET_MAX,
4789 .policy = nft_set_policy,
4791 [NFT_MSG_GETSET] = {
4792 .call = nf_tables_getset,
4793 .attr_count = NFTA_SET_MAX,
4794 .policy = nft_set_policy,
4796 [NFT_MSG_DELSET] = {
4797 .call_batch = nf_tables_delset,
4798 .attr_count = NFTA_SET_MAX,
4799 .policy = nft_set_policy,
4801 [NFT_MSG_NEWSETELEM] = {
4802 .call_batch = nf_tables_newsetelem,
4803 .attr_count = NFTA_SET_ELEM_LIST_MAX,
4804 .policy = nft_set_elem_list_policy,
4806 [NFT_MSG_GETSETELEM] = {
4807 .call = nf_tables_getsetelem,
4808 .attr_count = NFTA_SET_ELEM_LIST_MAX,
4809 .policy = nft_set_elem_list_policy,
4811 [NFT_MSG_DELSETELEM] = {
4812 .call_batch = nf_tables_delsetelem,
4813 .attr_count = NFTA_SET_ELEM_LIST_MAX,
4814 .policy = nft_set_elem_list_policy,
4816 [NFT_MSG_GETGEN] = {
4817 .call = nf_tables_getgen,
4819 [NFT_MSG_NEWOBJ] = {
4820 .call_batch = nf_tables_newobj,
4821 .attr_count = NFTA_OBJ_MAX,
4822 .policy = nft_obj_policy,
4824 [NFT_MSG_GETOBJ] = {
4825 .call = nf_tables_getobj,
4826 .attr_count = NFTA_OBJ_MAX,
4827 .policy = nft_obj_policy,
4829 [NFT_MSG_DELOBJ] = {
4830 .call_batch = nf_tables_delobj,
4831 .attr_count = NFTA_OBJ_MAX,
4832 .policy = nft_obj_policy,
4834 [NFT_MSG_GETOBJ_RESET] = {
4835 .call = nf_tables_getobj,
4836 .attr_count = NFTA_OBJ_MAX,
4837 .policy = nft_obj_policy,
4841 static void nft_chain_commit_update(struct nft_trans *trans)
4843 struct nft_base_chain *basechain;
4845 if (nft_trans_chain_name(trans)[0])
4846 strcpy(trans->ctx.chain->name, nft_trans_chain_name(trans));
4848 if (!nft_is_base_chain(trans->ctx.chain))
4851 basechain = nft_base_chain(trans->ctx.chain);
4852 nft_chain_stats_replace(basechain, nft_trans_chain_stats(trans));
4854 switch (nft_trans_chain_policy(trans)) {
4857 basechain->policy = nft_trans_chain_policy(trans);
4862 static void nf_tables_commit_release(struct nft_trans *trans)
4864 switch (trans->msg_type) {
4865 case NFT_MSG_DELTABLE:
4866 nf_tables_table_destroy(&trans->ctx);
4868 case NFT_MSG_DELCHAIN:
4869 nf_tables_chain_destroy(trans->ctx.chain);
4871 case NFT_MSG_DELRULE:
4872 nf_tables_rule_destroy(&trans->ctx, nft_trans_rule(trans));
4874 case NFT_MSG_DELSET:
4875 nft_set_destroy(nft_trans_set(trans));
4877 case NFT_MSG_DELSETELEM:
4878 nf_tables_set_elem_destroy(nft_trans_elem_set(trans),
4879 nft_trans_elem(trans).priv);
4881 case NFT_MSG_DELOBJ:
4882 nft_obj_destroy(nft_trans_obj(trans));
4888 static int nf_tables_commit(struct net *net, struct sk_buff *skb)
4890 struct nft_trans *trans, *next;
4891 struct nft_trans_elem *te;
4893 /* Bump generation counter, invalidate any dump in progress */
4894 while (++net->nft.base_seq == 0);
4896 /* A new generation has just started */
4897 net->nft.gencursor = nft_gencursor_next(net);
4899 /* Make sure all packets have left the previous generation before
4900 * purging old rules.
4904 list_for_each_entry_safe(trans, next, &net->nft.commit_list, list) {
4905 switch (trans->msg_type) {
4906 case NFT_MSG_NEWTABLE:
4907 if (nft_trans_table_update(trans)) {
4908 if (!nft_trans_table_enable(trans)) {
4909 nf_tables_table_disable(net,
4912 trans->ctx.table->flags |= NFT_TABLE_F_DORMANT;
4915 nft_clear(net, trans->ctx.table);
4917 nf_tables_table_notify(&trans->ctx, NFT_MSG_NEWTABLE);
4918 nft_trans_destroy(trans);
4920 case NFT_MSG_DELTABLE:
4921 list_del_rcu(&trans->ctx.table->list);
4922 nf_tables_table_notify(&trans->ctx, NFT_MSG_DELTABLE);
4924 case NFT_MSG_NEWCHAIN:
4925 if (nft_trans_chain_update(trans))
4926 nft_chain_commit_update(trans);
4928 nft_clear(net, trans->ctx.chain);
4930 nf_tables_chain_notify(&trans->ctx, NFT_MSG_NEWCHAIN);
4931 nft_trans_destroy(trans);
4933 case NFT_MSG_DELCHAIN:
4934 list_del_rcu(&trans->ctx.chain->list);
4935 nf_tables_chain_notify(&trans->ctx, NFT_MSG_DELCHAIN);
4936 nf_tables_unregister_hooks(trans->ctx.net,
4939 trans->ctx.afi->nops);
4941 case NFT_MSG_NEWRULE:
4942 nft_clear(trans->ctx.net, nft_trans_rule(trans));
4943 nf_tables_rule_notify(&trans->ctx,
4944 nft_trans_rule(trans),
4946 nft_trans_destroy(trans);
4948 case NFT_MSG_DELRULE:
4949 list_del_rcu(&nft_trans_rule(trans)->list);
4950 nf_tables_rule_notify(&trans->ctx,
4951 nft_trans_rule(trans),
4954 case NFT_MSG_NEWSET:
4955 nft_clear(net, nft_trans_set(trans));
4956 /* This avoids hitting -EBUSY when deleting the table
4957 * from the transaction.
4959 if (nft_trans_set(trans)->flags & NFT_SET_ANONYMOUS &&
4960 !list_empty(&nft_trans_set(trans)->bindings))
4961 trans->ctx.table->use--;
4963 nf_tables_set_notify(&trans->ctx, nft_trans_set(trans),
4964 NFT_MSG_NEWSET, GFP_KERNEL);
4965 nft_trans_destroy(trans);
4967 case NFT_MSG_DELSET:
4968 list_del_rcu(&nft_trans_set(trans)->list);
4969 nf_tables_set_notify(&trans->ctx, nft_trans_set(trans),
4970 NFT_MSG_DELSET, GFP_KERNEL);
4972 case NFT_MSG_NEWSETELEM:
4973 te = (struct nft_trans_elem *)trans->data;
4975 te->set->ops->activate(net, te->set, &te->elem);
4976 nf_tables_setelem_notify(&trans->ctx, te->set,
4978 NFT_MSG_NEWSETELEM, 0);
4979 nft_trans_destroy(trans);
4981 case NFT_MSG_DELSETELEM:
4982 te = (struct nft_trans_elem *)trans->data;
4984 nf_tables_setelem_notify(&trans->ctx, te->set,
4986 NFT_MSG_DELSETELEM, 0);
4987 te->set->ops->remove(net, te->set, &te->elem);
4988 atomic_dec(&te->set->nelems);
4991 case NFT_MSG_NEWOBJ:
4992 nft_clear(net, nft_trans_obj(trans));
4993 nf_tables_obj_notify(&trans->ctx, nft_trans_obj(trans),
4995 nft_trans_destroy(trans);
4997 case NFT_MSG_DELOBJ:
4998 list_del_rcu(&nft_trans_obj(trans)->list);
4999 nf_tables_obj_notify(&trans->ctx, nft_trans_obj(trans),
5007 list_for_each_entry_safe(trans, next, &net->nft.commit_list, list) {
5008 list_del(&trans->list);
5009 nf_tables_commit_release(trans);
5012 nf_tables_gen_notify(net, skb, NFT_MSG_NEWGEN);
5017 static void nf_tables_abort_release(struct nft_trans *trans)
5019 switch (trans->msg_type) {
5020 case NFT_MSG_NEWTABLE:
5021 nf_tables_table_destroy(&trans->ctx);
5023 case NFT_MSG_NEWCHAIN:
5024 nf_tables_chain_destroy(trans->ctx.chain);
5026 case NFT_MSG_NEWRULE:
5027 nf_tables_rule_destroy(&trans->ctx, nft_trans_rule(trans));
5029 case NFT_MSG_NEWSET:
5030 nft_set_destroy(nft_trans_set(trans));
5032 case NFT_MSG_NEWSETELEM:
5033 nft_set_elem_destroy(nft_trans_elem_set(trans),
5034 nft_trans_elem(trans).priv, true);
5036 case NFT_MSG_NEWOBJ:
5037 nft_obj_destroy(nft_trans_obj(trans));
5043 static int nf_tables_abort(struct net *net, struct sk_buff *skb)
5045 struct nft_trans *trans, *next;
5046 struct nft_trans_elem *te;
5048 list_for_each_entry_safe_reverse(trans, next, &net->nft.commit_list,
5050 switch (trans->msg_type) {
5051 case NFT_MSG_NEWTABLE:
5052 if (nft_trans_table_update(trans)) {
5053 if (nft_trans_table_enable(trans)) {
5054 nf_tables_table_disable(net,
5057 trans->ctx.table->flags |= NFT_TABLE_F_DORMANT;
5059 nft_trans_destroy(trans);
5061 list_del_rcu(&trans->ctx.table->list);
5064 case NFT_MSG_DELTABLE:
5065 nft_clear(trans->ctx.net, trans->ctx.table);
5066 nft_trans_destroy(trans);
5068 case NFT_MSG_NEWCHAIN:
5069 if (nft_trans_chain_update(trans)) {
5070 free_percpu(nft_trans_chain_stats(trans));
5072 nft_trans_destroy(trans);
5074 trans->ctx.table->use--;
5075 list_del_rcu(&trans->ctx.chain->list);
5076 nf_tables_unregister_hooks(trans->ctx.net,
5079 trans->ctx.afi->nops);
5082 case NFT_MSG_DELCHAIN:
5083 trans->ctx.table->use++;
5084 nft_clear(trans->ctx.net, trans->ctx.chain);
5085 nft_trans_destroy(trans);
5087 case NFT_MSG_NEWRULE:
5088 trans->ctx.chain->use--;
5089 list_del_rcu(&nft_trans_rule(trans)->list);
5091 case NFT_MSG_DELRULE:
5092 trans->ctx.chain->use++;
5093 nft_clear(trans->ctx.net, nft_trans_rule(trans));
5094 nft_trans_destroy(trans);
5096 case NFT_MSG_NEWSET:
5097 trans->ctx.table->use--;
5098 list_del_rcu(&nft_trans_set(trans)->list);
5100 case NFT_MSG_DELSET:
5101 trans->ctx.table->use++;
5102 nft_clear(trans->ctx.net, nft_trans_set(trans));
5103 nft_trans_destroy(trans);
5105 case NFT_MSG_NEWSETELEM:
5106 te = (struct nft_trans_elem *)trans->data;
5108 te->set->ops->remove(net, te->set, &te->elem);
5109 atomic_dec(&te->set->nelems);
5111 case NFT_MSG_DELSETELEM:
5112 te = (struct nft_trans_elem *)trans->data;
5114 nft_set_elem_activate(net, te->set, &te->elem);
5115 te->set->ops->activate(net, te->set, &te->elem);
5118 nft_trans_destroy(trans);
5120 case NFT_MSG_NEWOBJ:
5121 trans->ctx.table->use--;
5122 list_del_rcu(&nft_trans_obj(trans)->list);
5124 case NFT_MSG_DELOBJ:
5125 trans->ctx.table->use++;
5126 nft_clear(trans->ctx.net, nft_trans_obj(trans));
5127 nft_trans_destroy(trans);
5134 list_for_each_entry_safe_reverse(trans, next,
5135 &net->nft.commit_list, list) {
5136 list_del(&trans->list);
5137 nf_tables_abort_release(trans);
5143 static bool nf_tables_valid_genid(struct net *net, u32 genid)
5145 return net->nft.base_seq == genid;
5148 static const struct nfnetlink_subsystem nf_tables_subsys = {
5149 .name = "nf_tables",
5150 .subsys_id = NFNL_SUBSYS_NFTABLES,
5151 .cb_count = NFT_MSG_MAX,
5153 .commit = nf_tables_commit,
5154 .abort = nf_tables_abort,
5155 .valid_genid = nf_tables_valid_genid,
5158 int nft_chain_validate_dependency(const struct nft_chain *chain,
5159 enum nft_chain_type type)
5161 const struct nft_base_chain *basechain;
5163 if (nft_is_base_chain(chain)) {
5164 basechain = nft_base_chain(chain);
5165 if (basechain->type->type != type)
5170 EXPORT_SYMBOL_GPL(nft_chain_validate_dependency);
5172 int nft_chain_validate_hooks(const struct nft_chain *chain,
5173 unsigned int hook_flags)
5175 struct nft_base_chain *basechain;
5177 if (nft_is_base_chain(chain)) {
5178 basechain = nft_base_chain(chain);
5180 if ((1 << basechain->ops[0].hooknum) & hook_flags)
5188 EXPORT_SYMBOL_GPL(nft_chain_validate_hooks);
/*
 * Loop detection - walk through the ruleset beginning at the destination chain
 * of a new jump until either the source chain is reached (loop) or all
 * reachable chains have been traversed.
 *
 * The loop check is performed whenever a new jump verdict is added to an
 * expression or verdict map or a verdict map is bound to a new chain.
 */

/* Declared ahead of its definition: the set element callback below calls it. */
static int nf_tables_check_loops(const struct nft_ctx *ctx,
				 const struct nft_chain *chain);
5202 static int nf_tables_loop_check_setelem(const struct nft_ctx *ctx,
5203 struct nft_set *set,
5204 const struct nft_set_iter *iter,
5205 struct nft_set_elem *elem)
5207 const struct nft_set_ext *ext = nft_set_elem_ext(set, elem->priv);
5208 const struct nft_data *data;
5210 if (nft_set_ext_exists(ext, NFT_SET_EXT_FLAGS) &&
5211 *nft_set_ext_flags(ext) & NFT_SET_ELEM_INTERVAL_END)
5214 data = nft_set_ext_data(ext);
5215 switch (data->verdict.code) {
5218 return nf_tables_check_loops(ctx, data->verdict.chain);
5224 static int nf_tables_check_loops(const struct nft_ctx *ctx,
5225 const struct nft_chain *chain)
5227 const struct nft_rule *rule;
5228 const struct nft_expr *expr, *last;
5229 struct nft_set *set;
5230 struct nft_set_binding *binding;
5231 struct nft_set_iter iter;
5233 if (ctx->chain == chain)
5236 list_for_each_entry(rule, &chain->rules, list) {
5237 nft_rule_for_each_expr(expr, last, rule) {
5238 const struct nft_data *data = NULL;
5241 if (!expr->ops->validate)
5244 err = expr->ops->validate(ctx, expr, &data);
5251 switch (data->verdict.code) {
5254 err = nf_tables_check_loops(ctx,
5255 data->verdict.chain);
5264 list_for_each_entry(set, &ctx->table->sets, list) {
5265 if (!nft_is_active_next(ctx->net, set))
5267 if (!(set->flags & NFT_SET_MAP) ||
5268 set->dtype != NFT_DATA_VERDICT)
5271 list_for_each_entry(binding, &set->bindings, list) {
5272 if (!(binding->flags & NFT_SET_MAP) ||
5273 binding->chain != chain)
5276 iter.genmask = nft_genmask_next(ctx->net);
5280 iter.fn = nf_tables_loop_check_setelem;
5282 set->ops->walk(ctx, set, &iter);
5292 * nft_parse_u32_check - fetch u32 attribute and check for maximum value
5294 * @attr: netlink attribute to fetch value from
5295 * @max: maximum value to be stored in dest
5296 * @dest: pointer to the variable
5298 * Parse, check and store a given u32 netlink attribute into variable.
5299 * This function returns -ERANGE if the value goes over maximum value.
5300 * Otherwise a 0 is returned and the attribute value is stored in the
5301 * destination variable.
5303 int nft_parse_u32_check(const struct nlattr *attr, int max, u32 *dest)
5307 val = ntohl(nla_get_be32(attr));
5314 EXPORT_SYMBOL_GPL(nft_parse_u32_check);
5317 * nft_parse_register - parse a register value from a netlink attribute
5319 * @attr: netlink attribute
5321 * Parse and translate a register value from a netlink attribute.
5322 * Registers used to be 128 bit wide, these register numbers will be
5323 * mapped to the corresponding 32 bit register numbers.
5325 unsigned int nft_parse_register(const struct nlattr *attr)
5329 reg = ntohl(nla_get_be32(attr));
5331 case NFT_REG_VERDICT...NFT_REG_4:
5332 return reg * NFT_REG_SIZE / NFT_REG32_SIZE;
5334 return reg + NFT_REG_SIZE / NFT_REG32_SIZE - NFT_REG32_00;
5337 EXPORT_SYMBOL_GPL(nft_parse_register);
5340 * nft_dump_register - dump a register value to a netlink attribute
5342 * @skb: socket buffer
5343 * @attr: attribute number
5344 * @reg: register number
5346 * Construct a netlink attribute containing the register number. For
5347 * compatibility reasons, register numbers being a multiple of 4 are
5348 * translated to the corresponding 128 bit register numbers.
5350 int nft_dump_register(struct sk_buff *skb, unsigned int attr, unsigned int reg)
5352 if (reg % (NFT_REG_SIZE / NFT_REG32_SIZE) == 0)
5353 reg = reg / (NFT_REG_SIZE / NFT_REG32_SIZE);
5355 reg = reg - NFT_REG_SIZE / NFT_REG32_SIZE + NFT_REG32_00;
5357 return nla_put_be32(skb, attr, htonl(reg));
5359 EXPORT_SYMBOL_GPL(nft_dump_register);
5362 * nft_validate_register_load - validate a load from a register
5364 * @reg: the register number
5365 * @len: the length of the data
5367 * Validate that the input register is one of the general purpose
5368 * registers and that the length of the load is within the bounds.
5370 int nft_validate_register_load(enum nft_registers reg, unsigned int len)
5372 if (reg < NFT_REG_1 * NFT_REG_SIZE / NFT_REG32_SIZE)
5376 if (reg * NFT_REG32_SIZE + len > FIELD_SIZEOF(struct nft_regs, data))
5381 EXPORT_SYMBOL_GPL(nft_validate_register_load);
5384 * nft_validate_register_store - validate an expressions' register store
5386 * @ctx: context of the expression performing the load
5387 * @reg: the destination register number
5388 * @data: the data to load
5389 * @type: the data type
5390 * @len: the length of the data
5392 * Validate that a data load uses the appropriate data type for
5393 * the destination register and the length is within the bounds.
5394 * A value of NULL for the data means that its runtime gathered
5397 int nft_validate_register_store(const struct nft_ctx *ctx,
5398 enum nft_registers reg,
5399 const struct nft_data *data,
5400 enum nft_data_types type, unsigned int len)
5405 case NFT_REG_VERDICT:
5406 if (type != NFT_DATA_VERDICT)
5410 (data->verdict.code == NFT_GOTO ||
5411 data->verdict.code == NFT_JUMP)) {
5412 err = nf_tables_check_loops(ctx, data->verdict.chain);
5416 if (ctx->chain->level + 1 >
5417 data->verdict.chain->level) {
5418 if (ctx->chain->level + 1 == NFT_JUMP_STACK_SIZE)
5420 data->verdict.chain->level = ctx->chain->level + 1;
5426 if (reg < NFT_REG_1 * NFT_REG_SIZE / NFT_REG32_SIZE)
5430 if (reg * NFT_REG32_SIZE + len >
5431 FIELD_SIZEOF(struct nft_regs, data))
5434 if (data != NULL && type != NFT_DATA_VALUE)
5439 EXPORT_SYMBOL_GPL(nft_validate_register_store);
5441 static const struct nla_policy nft_verdict_policy[NFTA_VERDICT_MAX + 1] = {
5442 [NFTA_VERDICT_CODE] = { .type = NLA_U32 },
5443 [NFTA_VERDICT_CHAIN] = { .type = NLA_STRING,
5444 .len = NFT_CHAIN_MAXNAMELEN - 1 },
5447 static int nft_verdict_init(const struct nft_ctx *ctx, struct nft_data *data,
5448 struct nft_data_desc *desc, const struct nlattr *nla)
5450 u8 genmask = nft_genmask_next(ctx->net);
5451 struct nlattr *tb[NFTA_VERDICT_MAX + 1];
5452 struct nft_chain *chain;
5455 err = nla_parse_nested(tb, NFTA_VERDICT_MAX, nla, nft_verdict_policy,
5460 if (!tb[NFTA_VERDICT_CODE])
5462 data->verdict.code = ntohl(nla_get_be32(tb[NFTA_VERDICT_CODE]));
5464 switch (data->verdict.code) {
5466 switch (data->verdict.code & NF_VERDICT_MASK) {
5481 if (!tb[NFTA_VERDICT_CHAIN])
5483 chain = nf_tables_chain_lookup(ctx->table,
5484 tb[NFTA_VERDICT_CHAIN], genmask);
5486 return PTR_ERR(chain);
5487 if (nft_is_base_chain(chain))
5491 data->verdict.chain = chain;
5495 desc->len = sizeof(data->verdict);
5496 desc->type = NFT_DATA_VERDICT;
5500 static void nft_verdict_uninit(const struct nft_data *data)
5502 switch (data->verdict.code) {
5505 data->verdict.chain->use--;
5510 int nft_verdict_dump(struct sk_buff *skb, int type, const struct nft_verdict *v)
5512 struct nlattr *nest;
5514 nest = nla_nest_start(skb, type);
5516 goto nla_put_failure;
5518 if (nla_put_be32(skb, NFTA_VERDICT_CODE, htonl(v->code)))
5519 goto nla_put_failure;
5524 if (nla_put_string(skb, NFTA_VERDICT_CHAIN,
5526 goto nla_put_failure;
5528 nla_nest_end(skb, nest);
5535 static int nft_value_init(const struct nft_ctx *ctx,
5536 struct nft_data *data, unsigned int size,
5537 struct nft_data_desc *desc, const struct nlattr *nla)
5547 nla_memcpy(data->data, nla, len);
5548 desc->type = NFT_DATA_VALUE;
5553 static int nft_value_dump(struct sk_buff *skb, const struct nft_data *data,
5556 return nla_put(skb, NFTA_DATA_VALUE, len, data->data);
5559 static const struct nla_policy nft_data_policy[NFTA_DATA_MAX + 1] = {
5560 [NFTA_DATA_VALUE] = { .type = NLA_BINARY },
5561 [NFTA_DATA_VERDICT] = { .type = NLA_NESTED },
5565 * nft_data_init - parse nf_tables data netlink attributes
5567 * @ctx: context of the expression using the data
5568 * @data: destination struct nft_data
5569 * @size: maximum data length
5570 * @desc: data description
5571 * @nla: netlink attribute containing data
5573 * Parse the netlink data attributes and initialize a struct nft_data.
5574 * The type and length of data are returned in the data description.
5576 * The caller can indicate that it only wants to accept data of type
5577 * NFT_DATA_VALUE by passing NULL for the ctx argument.
5579 int nft_data_init(const struct nft_ctx *ctx,
5580 struct nft_data *data, unsigned int size,
5581 struct nft_data_desc *desc, const struct nlattr *nla)
5583 struct nlattr *tb[NFTA_DATA_MAX + 1];
5586 err = nla_parse_nested(tb, NFTA_DATA_MAX, nla, nft_data_policy, NULL);
5590 if (tb[NFTA_DATA_VALUE])
5591 return nft_value_init(ctx, data, size, desc,
5592 tb[NFTA_DATA_VALUE]);
5593 if (tb[NFTA_DATA_VERDICT] && ctx != NULL)
5594 return nft_verdict_init(ctx, data, desc, tb[NFTA_DATA_VERDICT]);
5597 EXPORT_SYMBOL_GPL(nft_data_init);
5600 * nft_data_release - release a nft_data item
5602 * @data: struct nft_data to release
5603 * @type: type of data
5605 * Release a nft_data item. NFT_DATA_VALUE types can be silently discarded,
5606 * all others need to be released by calling this function.
5608 void nft_data_release(const struct nft_data *data, enum nft_data_types type)
5610 if (type < NFT_DATA_VERDICT)
5613 case NFT_DATA_VERDICT:
5614 return nft_verdict_uninit(data);
5619 EXPORT_SYMBOL_GPL(nft_data_release);
5621 int nft_data_dump(struct sk_buff *skb, int attr, const struct nft_data *data,
5622 enum nft_data_types type, unsigned int len)
5624 struct nlattr *nest;
5627 nest = nla_nest_start(skb, attr);
5632 case NFT_DATA_VALUE:
5633 err = nft_value_dump(skb, data, len);
5635 case NFT_DATA_VERDICT:
5636 err = nft_verdict_dump(skb, NFTA_DATA_VERDICT, &data->verdict);
5643 nla_nest_end(skb, nest);
5646 EXPORT_SYMBOL_GPL(nft_data_dump);
5648 static int __net_init nf_tables_init_net(struct net *net)
5650 INIT_LIST_HEAD(&net->nft.af_info);
5651 INIT_LIST_HEAD(&net->nft.commit_list);
5652 net->nft.base_seq = 1;
5656 int __nft_release_basechain(struct nft_ctx *ctx)
5658 struct nft_rule *rule, *nr;
5660 BUG_ON(!nft_is_base_chain(ctx->chain));
5662 nf_tables_unregister_hooks(ctx->net, ctx->chain->table, ctx->chain,
5664 list_for_each_entry_safe(rule, nr, &ctx->chain->rules, list) {
5665 list_del(&rule->list);
5667 nf_tables_rule_destroy(ctx, rule);
5669 list_del(&ctx->chain->list);
5671 nf_tables_chain_destroy(ctx->chain);
5675 EXPORT_SYMBOL_GPL(__nft_release_basechain);
5677 /* Called by nft_unregister_afinfo() from __net_exit path, nfnl_lock is held. */
5678 static void __nft_release_afinfo(struct net *net, struct nft_af_info *afi)
5680 struct nft_table *table, *nt;
5681 struct nft_chain *chain, *nc;
5682 struct nft_object *obj, *ne;
5683 struct nft_rule *rule, *nr;
5684 struct nft_set *set, *ns;
5685 struct nft_ctx ctx = {
5690 list_for_each_entry_safe(table, nt, &afi->tables, list) {
5691 list_for_each_entry(chain, &table->chains, list)
5692 nf_tables_unregister_hooks(net, table, chain,
5694 /* No packets are walking on these chains anymore. */
5696 list_for_each_entry(chain, &table->chains, list) {
5698 list_for_each_entry_safe(rule, nr, &chain->rules, list) {
5699 list_del(&rule->list);
5701 nf_tables_rule_destroy(&ctx, rule);
5704 list_for_each_entry_safe(set, ns, &table->sets, list) {
5705 list_del(&set->list);
5707 nft_set_destroy(set);
5709 list_for_each_entry_safe(obj, ne, &table->objects, list) {
5710 list_del(&obj->list);
5712 nft_obj_destroy(obj);
5714 list_for_each_entry_safe(chain, nc, &table->chains, list) {
5715 list_del(&chain->list);
5717 nf_tables_chain_destroy(chain);
5719 list_del(&table->list);
5720 nf_tables_table_destroy(&ctx);
5724 static struct pernet_operations nf_tables_net_ops = {
5725 .init = nf_tables_init_net,
5728 static int __init nf_tables_module_init(void)
5732 info = kmalloc(sizeof(struct nft_expr_info) * NFT_RULE_MAXEXPRS,
5739 err = nf_tables_core_module_init();
5743 err = nfnetlink_subsys_register(&nf_tables_subsys);
5747 pr_info("nf_tables: (c) 2007-2009 Patrick McHardy <kaber@trash.net>\n");
5748 return register_pernet_subsys(&nf_tables_net_ops);
5750 nf_tables_core_module_exit();
5757 static void __exit nf_tables_module_exit(void)
5759 unregister_pernet_subsys(&nf_tables_net_ops);
5760 nfnetlink_subsys_unregister(&nf_tables_subsys);
5762 nf_tables_core_module_exit();
5766 module_init(nf_tables_module_init);
5767 module_exit(nf_tables_module_exit);
5769 MODULE_LICENSE("GPL");
5770 MODULE_AUTHOR("Patrick McHardy <kaber@trash.net>");
5771 MODULE_ALIAS_NFNL_SUBSYS(NFNL_SUBSYS_NFTABLES);