2 * Copyright (c) 2007-2009 Patrick McHardy <kaber@trash.net>
4 * This program is free software; you can redistribute it and/or modify
5 * it under the terms of the GNU General Public License version 2 as
6 * published by the Free Software Foundation.
8 * Development of this code funded by Astaro AG (http://www.astaro.com/)
11 #include <linux/module.h>
12 #include <linux/init.h>
13 #include <linux/list.h>
14 #include <linux/skbuff.h>
15 #include <linux/netlink.h>
16 #include <linux/netfilter.h>
17 #include <linux/netfilter/nfnetlink.h>
18 #include <linux/netfilter/nf_tables.h>
19 #include <net/netfilter/nf_tables_core.h>
20 #include <net/netfilter/nf_tables.h>
21 #include <net/net_namespace.h>
/* List of expression types: nft_register_expr() links entries onto it,
 * nft_unregister_expr() removes them and __nft_expr_type_get() walks it.
 */
24 static LIST_HEAD(nf_tables_expressions);
27 * nft_register_afinfo - register nf_tables address family info
29 * @afi: address family info to register
31 * Register the address family for use with nf_tables. Returns zero on
32 * success or a negative errno code otherwise.
/*
 * @net: namespace whose nft.af_info list receives the entry
 * @afi: address family info to link in
 *
 * Initialises afi's own table list, then appends afi to the namespace's
 * af_info list with the RCU list-add primitive while holding the
 * NFNL_SUBSYS_NFTABLES nfnetlink lock.
 */
34 int nft_register_afinfo(struct net *net, struct nft_af_info *afi)
36 INIT_LIST_HEAD(&afi->tables);
37 nfnl_lock(NFNL_SUBSYS_NFTABLES);
38 list_add_tail_rcu(&afi->list, &net->nft.af_info);
39 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
42 EXPORT_SYMBOL_GPL(nft_register_afinfo);
45 * nft_unregister_afinfo - unregister nf_tables address family info
47 * @afi: address family info to unregister
49 * Unregister the address family for use with nf_tables.
/*
 * Unlinks afi from whichever list it is on using list_del_rcu(), with the
 * NFNL_SUBSYS_NFTABLES nfnetlink lock held around the removal.
 */
51 void nft_unregister_afinfo(struct nft_af_info *afi)
53 nfnl_lock(NFNL_SUBSYS_NFTABLES);
54 list_del_rcu(&afi->list);
55 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
57 EXPORT_SYMBOL_GPL(nft_unregister_afinfo);
/*
 * Walks net->nft.af_info and compares each entry's family with @family.
 * NOTE(review): the statement taken on a match and the not-found result
 * are not visible in this listing - presumably the matching entry or
 * NULL; confirm against the full file.
 */
59 static struct nft_af_info *nft_afinfo_lookup(struct net *net, int family)
61 struct nft_af_info *afi;
63 list_for_each_entry(afi, &net->nft.af_info, list) {
64 if (afi->family == family)
/*
 * Looks up the address family info for @family in @net, with an optional
 * module-load retry. Visible results besides a found entry are
 * ERR_PTR(-EAGAIN) and ERR_PTR(-EAFNOSUPPORT).
 * NOTE(review): the conditions guarding each step, including how
 * @autoload is consulted, are on lines not visible here - confirm.
 */
70 static struct nft_af_info *
71 nf_tables_afinfo_lookup(struct net *net, int family, bool autoload)
73 struct nft_af_info *afi;
75 afi = nft_afinfo_lookup(net, family);
/* request_module() runs with the nfnl lock released; the lock is taken
 * again before the list is searched a second time.
 */
80 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
81 request_module("nft-afinfo-%u", family);
82 nfnl_lock(NFNL_SUBSYS_NFTABLES);
83 afi = nft_afinfo_lookup(net, family);
85 return ERR_PTR(-EAGAIN);
88 return ERR_PTR(-EAFNOSUPPORT);
/*
 * Fills a struct nft_ctx from a netlink request: the namespace comes from
 * the skb's socket, the port id from the skb's netlink control block, and
 * the report flag and sequence number from the message header.
 * NOTE(review): no assignment of afi/table/chain/nla is visible in this
 * listing - presumably they are stored on elided lines; confirm.
 */
91 static void nft_ctx_init(struct nft_ctx *ctx,
92 const struct sk_buff *skb,
93 const struct nlmsghdr *nlh,
94 struct nft_af_info *afi,
95 struct nft_table *table,
96 struct nft_chain *chain,
97 const struct nlattr * const *nla)
99 ctx->net = sock_net(skb->sk);
104 ctx->portid = NETLINK_CB(skb).portid;
105 ctx->report = nlmsg_report(nlh);
106 ctx->seq = nlh->nlmsg_seq;
/*
 * Allocates a zeroed transaction record (GFP_KERNEL) made of a
 * struct nft_trans followed by `size` extra bytes, and stores msg_type.
 * NOTE(review): the rest of the parameter list, the allocation-failure
 * check and the return statement are not visible in this listing.
 */
109 static struct nft_trans *nft_trans_alloc(struct nft_ctx *ctx, int msg_type,
112 struct nft_trans *trans;
114 trans = kzalloc(sizeof(struct nft_trans) + size, GFP_KERNEL);
118 trans->msg_type = msg_type;
/*
 * Unlinks the transaction from the list it is queued on.
 * NOTE(review): releasing the memory is presumably done on a line not
 * visible here - confirm.
 */
124 static void nft_trans_destroy(struct nft_trans *trans)
126 list_del(&trans->list);
/*
 * Unregisters hook_nops hook ops of a chain, but only when the table is
 * not flagged NFT_TABLE_F_DORMANT and the chain carries NFT_BASE_CHAIN.
 * In every other case nothing is done.
 */
130 static void nf_tables_unregister_hooks(const struct nft_table *table,
131 const struct nft_chain *chain,
132 unsigned int hook_nops)
134 if (!(table->flags & NFT_TABLE_F_DORMANT) &&
135 chain->flags & NFT_BASE_CHAIN)
136 nf_unregister_hooks(nft_base_chain(chain)->ops, hook_nops);
/* Bit 15 of table->flags. nft_trans_table_add() sets it for
 * NFT_MSG_NEWTABLE; the table get/new/delete handlers test it.
 */
139 /* Internal table flags */
140 #define NFT_TABLE_INACTIVE (1 << 15)
/*
 * Queues a table transaction of type msg_type: allocates a record sized
 * for struct nft_trans_table, marks ctx->table NFT_TABLE_INACTIVE when
 * the message is NFT_MSG_NEWTABLE, and appends the record to the
 * namespace's commit_list.
 * NOTE(review): the allocation-failure check and return values are on
 * lines not visible here.
 */
142 static int nft_trans_table_add(struct nft_ctx *ctx, int msg_type)
144 struct nft_trans *trans;
146 trans = nft_trans_alloc(ctx, msg_type, sizeof(struct nft_trans_table));
150 if (msg_type == NFT_MSG_NEWTABLE)
151 ctx->table->flags |= NFT_TABLE_INACTIVE;
153 list_add_tail(&trans->list, &ctx->net->nft.commit_list);
/*
 * Queues an NFT_MSG_DELTABLE transaction for ctx->table, then unlinks the
 * table from its list with list_del_rcu().
 * NOTE(review): the error check between the two steps is not visible.
 */
157 static int nft_deltable(struct nft_ctx *ctx)
161 err = nft_trans_table_add(ctx, NFT_MSG_DELTABLE);
165 list_del_rcu(&ctx->table->list);
/*
 * Queues a chain transaction of type msg_type: allocates a record sized
 * for struct nft_trans_chain, marks ctx->chain NFT_CHAIN_INACTIVE when
 * the message is NFT_MSG_NEWCHAIN, and appends the record to the
 * namespace's commit_list.
 * NOTE(review): the allocation-failure check and return values are on
 * lines not visible here.
 */
169 static int nft_trans_chain_add(struct nft_ctx *ctx, int msg_type)
171 struct nft_trans *trans;
173 trans = nft_trans_alloc(ctx, msg_type, sizeof(struct nft_trans_chain));
177 if (msg_type == NFT_MSG_NEWCHAIN)
178 ctx->chain->flags |= NFT_CHAIN_INACTIVE;
180 list_add_tail(&trans->list, &ctx->net->nft.commit_list);
/*
 * Queues an NFT_MSG_DELCHAIN transaction for ctx->chain, then unlinks the
 * chain from its list with list_del_rcu().
 * NOTE(review): lines between the two visible statements are elided
 * (error check and possibly more) - confirm against the full file.
 */
184 static int nft_delchain(struct nft_ctx *ctx)
188 err = nft_trans_chain_add(ctx, NFT_MSG_DELCHAIN);
193 list_del_rcu(&ctx->chain->list);
/* A rule counts as active when its genmask shares no bit with the
 * current-generation mask of the namespace.
 */
199 nft_rule_is_active(struct net *net, const struct nft_rule *rule)
201 return (rule->genmask & nft_genmask_cur(net)) == 0;
/* Same test as nft_rule_is_active() but against the next-generation
 * mask: true when the rule's genmask shares no bit with it.
 */
205 nft_rule_is_active_next(struct net *net, const struct nft_rule *rule)
207 return (rule->genmask & nft_genmask_next(net)) == 0;
/* Overwrites the rule's genmask with the current-generation mask, which
 * makes nft_rule_is_active() false for the current generation.
 */
211 nft_rule_activate_next(struct net *net, struct nft_rule *rule)
213 /* Now inactive, will be active in the future */
214 rule->genmask = nft_genmask_cur(net);
/* Overwrites the rule's genmask with the next-generation mask, so
 * nft_rule_is_active_next() reports the rule as inactive.
 */
218 nft_rule_deactivate_next(struct net *net, struct nft_rule *rule)
220 rule->genmask = nft_genmask_next(net);
/* Clears the next-generation bits from the rule's genmask and leaves all
 * other bits untouched.
 */
223 static inline void nft_rule_clear(struct net *net, struct nft_rule *rule)
225 rule->genmask &= ~nft_genmask_next(net);
/*
 * Deactivates a rule for the next generation, but only when it is still
 * active there; this is what prevents deleting the same rule twice.
 * NOTE(review): the return values for both outcomes are not visible.
 */
229 nf_tables_delrule_deactivate(struct nft_ctx *ctx, struct nft_rule *rule)
231 /* You cannot delete the same rule twice */
232 if (nft_rule_is_active_next(ctx->net, rule)) {
233 nft_rule_deactivate_next(ctx->net, rule);
/*
 * Allocates a transaction record sized for struct nft_trans_rule, stores
 * the rule pointer in it and appends it to the namespace's commit_list.
 * NOTE(review): the allocation-failure check and the return statement
 * are on lines not visible here.
 */
240 static struct nft_trans *nft_trans_rule_add(struct nft_ctx *ctx, int msg_type,
241 struct nft_rule *rule)
243 struct nft_trans *trans;
245 trans = nft_trans_alloc(ctx, msg_type, sizeof(struct nft_trans_rule));
249 nft_trans_rule(trans) = rule;
250 list_add_tail(&trans->list, &ctx->net->nft.commit_list);
/*
 * Queues an NFT_MSG_DELRULE transaction for the rule and then
 * deactivates the rule for the next generation.
 * NOTE(review): nft_trans_destroy() is presumably reached only when the
 * deactivation fails - the guarding condition is not visible; confirm.
 */
255 static int nft_delrule(struct nft_ctx *ctx, struct nft_rule *rule)
257 struct nft_trans *trans;
260 trans = nft_trans_rule_add(ctx, NFT_MSG_DELRULE, rule);
264 err = nf_tables_delrule_deactivate(ctx, rule);
266 nft_trans_destroy(trans);
/*
 * Calls nft_delrule() on every rule linked on ctx->chain->rules.
 * NOTE(review): how a failing nft_delrule() is handled is not visible.
 */
273 static int nft_delrule_by_chain(struct nft_ctx *ctx)
275 struct nft_rule *rule;
278 list_for_each_entry(rule, &ctx->chain->rules, list) {
279 err = nft_delrule(ctx, rule);
/* Bit 15 of set->flags, set by nft_trans_set_add(). */
286 /* Internal set flag */
287 #define NFT_SET_INACTIVE (1 << 15)
/*
 * Queues a set transaction of type msg_type. For NFT_MSG_NEWSET with an
 * NFTA_SET_ID attribute present, the id is converted from network byte
 * order and stored in the record, and the set is flagged
 * NFT_SET_INACTIVE. The set pointer is then stored and the record is
 * appended to the namespace's commit_list.
 * NOTE(review): the remainder of the parameter list (which supplies
 * `set`), the allocation-failure check and the return values are on
 * lines not visible here.
 */
289 static int nft_trans_set_add(struct nft_ctx *ctx, int msg_type,
292 struct nft_trans *trans;
294 trans = nft_trans_alloc(ctx, msg_type, sizeof(struct nft_trans_set));
298 if (msg_type == NFT_MSG_NEWSET && ctx->nla[NFTA_SET_ID] != NULL) {
299 nft_trans_set_id(trans) =
300 ntohl(nla_get_be32(ctx->nla[NFTA_SET_ID]));
301 set->flags |= NFT_SET_INACTIVE;
303 nft_trans_set(trans) = set;
304 list_add_tail(&trans->list, &ctx->net->nft.commit_list);
/*
 * Queues an NFT_MSG_DELSET transaction for the set, then unlinks the set
 * from its list with list_del_rcu().
 * NOTE(review): lines between and after the two visible statements are
 * elided (error check and possibly more) - confirm.
 */
309 static int nft_delset(struct nft_ctx *ctx, struct nft_set *set)
313 err = nft_trans_set_add(ctx, NFT_MSG_DELSET, set);
317 list_del_rcu(&set->list);
/*
 * Walks afi->tables and compares the netlink string attribute with each
 * table's name; nla_strcmp() returning zero means the names match.
 * NOTE(review): the result for a match and for no match is not visible
 * in this listing - presumably the table or NULL; confirm.
 */
327 static struct nft_table *nft_table_lookup(const struct nft_af_info *afi,
328 const struct nlattr *nla)
330 struct nft_table *table;
332 list_for_each_entry(table, &afi->tables, list) {
333 if (!nla_strcmp(nla, table->name))
/*
 * ERR_PTR-returning wrapper around nft_table_lookup(). The visible error
 * results are -EINVAL and -ENOENT.
 * NOTE(review): the conditions selecting each result are elided -
 * presumably -EINVAL for a missing attribute and -ENOENT when no table
 * matches; confirm.
 */
339 static struct nft_table *nf_tables_table_lookup(const struct nft_af_info *afi,
340 const struct nlattr *nla)
342 struct nft_table *table;
345 return ERR_PTR(-EINVAL);
347 table = nft_table_lookup(afi, nla);
351 return ERR_PTR(-ENOENT);
/* Pre-increments the table's handle generator and returns the new
 * value, so successive calls on one table yield increasing handles.
 */
354 static inline u64 nf_tables_alloc_handle(struct nft_table *table)
356 return ++table->hgenerator;
/* Registered chain types indexed by [family][type]. Slots are written by
 * nft_register_chain_type() and nft_unregister_chain_type().
 */
359 static const struct nf_chain_type *chain_type[AF_MAX][NFT_CHAIN_T_MAX];
/*
 * Scans chain_type[family][0 .. NFT_CHAIN_T_MAX - 1] and returns the
 * first non-NULL entry whose name equals the netlink string attribute.
 * NOTE(review): the result when nothing matches is not visible here -
 * presumably NULL; confirm.
 */
361 static const struct nf_chain_type *
362 __nf_tables_chain_type_lookup(int family, const struct nlattr *nla)
366 for (i = 0; i < NFT_CHAIN_T_MAX; i++) {
367 if (chain_type[family][i] != NULL &&
368 !nla_strcmp(nla, chain_type[family][i]->name))
369 return chain_type[family][i];
/*
 * Looks up a chain type by name for afi->family, with a module-load
 * retry. Visible error results are ERR_PTR(-EAGAIN) and
 * ERR_PTR(-ENOENT).
 * NOTE(review): the last parameter and the conditions guarding each step
 * are on lines not visible here - confirm.
 */
374 static const struct nf_chain_type *
375 nf_tables_chain_type_lookup(const struct nft_af_info *afi,
376 const struct nlattr *nla,
379 const struct nf_chain_type *type;
381 type = __nf_tables_chain_type_lookup(afi->family, nla);
384 #ifdef CONFIG_MODULES
/* The module request is made with the nfnl lock released. The name is
 * passed with an explicit length ("%.*s" with nla_len()), so the
 * attribute payload need not be NUL-terminated.
 */
386 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
387 request_module("nft-chain-%u-%.*s", afi->family,
388 nla_len(nla), (const char *)nla_data(nla));
389 nfnl_lock(NFNL_SUBSYS_NFTABLES);
390 type = __nf_tables_chain_type_lookup(afi->family, nla);
392 return ERR_PTR(-EAGAIN);
395 return ERR_PTR(-ENOENT);
/* Netlink attribute policy for table messages: the name is a string of
 * at most NFT_TABLE_MAXNAMELEN - 1 bytes, the flags are a 32-bit value.
 */
398 static const struct nla_policy nft_table_policy[NFTA_TABLE_MAX + 1] = {
399 [NFTA_TABLE_NAME] = { .type = NLA_STRING,
400 .len = NFT_TABLE_MAXNAMELEN - 1 },
401 [NFTA_TABLE_FLAGS] = { .type = NLA_U32 },
/*
 * Writes one table message into skb. The message type is `event` with
 * the nftables subsystem id in bits 8 and up. The nfgenmsg header carries
 * the family, NFNETLINK_V0 and the low 16 bits of net->nft.base_seq in
 * network byte order. Attributes written: NFTA_TABLE_NAME,
 * NFTA_TABLE_FLAGS and NFTA_TABLE_USE (both 32-bit, network byte order).
 * NOTE(review): the success return, the nla_put_failure label and its
 * return value are not visible - the nlmsg_trim() below presumably
 * belongs to the failure path; confirm.
 */
404 static int nf_tables_fill_table_info(struct sk_buff *skb, struct net *net,
405 u32 portid, u32 seq, int event, u32 flags,
406 int family, const struct nft_table *table)
408 struct nlmsghdr *nlh;
409 struct nfgenmsg *nfmsg;
411 event |= NFNL_SUBSYS_NFTABLES << 8;
412 nlh = nlmsg_put(skb, portid, seq, event, sizeof(struct nfgenmsg), flags);
414 goto nla_put_failure;
416 nfmsg = nlmsg_data(nlh);
417 nfmsg->nfgen_family = family;
418 nfmsg->version = NFNETLINK_V0;
419 nfmsg->res_id = htons(net->nft.base_seq & 0xffff);
421 if (nla_put_string(skb, NFTA_TABLE_NAME, table->name) ||
422 nla_put_be32(skb, NFTA_TABLE_FLAGS, htonl(table->flags)) ||
423 nla_put_be32(skb, NFTA_TABLE_USE, htonl(table->use)))
424 goto nla_put_failure;
430 nlmsg_trim(skb, nlh);
/*
 * Sends a table event to the NFNLGRP_NFTABLES multicast group: allocates
 * a message skb, fills it with nf_tables_fill_table_info() for
 * ctx->table and hands it to nfnetlink_send().
 * NOTE(review): the first half of the listener test, the error checks
 * and the arguments completing nfnetlink_set_err() are on elided lines;
 * nfnetlink_set_err() is presumably the failure path - confirm.
 */
434 static int nf_tables_table_notify(const struct nft_ctx *ctx, int event)
440 !nfnetlink_has_listeners(ctx->net, NFNLGRP_NFTABLES))
444 skb = nlmsg_new(NLMSG_GOODSIZE, GFP_KERNEL);
448 err = nf_tables_fill_table_info(skb, ctx->net, ctx->portid, ctx->seq,
449 event, 0, ctx->afi->family, ctx->table);
455 err = nfnetlink_send(skb, ctx->net, ctx->portid, NFNLGRP_NFTABLES,
456 ctx->report, GFP_KERNEL);
459 nfnetlink_set_err(ctx->net, ctx->portid, NFNLGRP_NFTABLES,
/*
 * Netlink dump callback for tables (installed as .dump by
 * nf_tables_gettable()). Iterates the namespace's af_info list and each
 * family's tables with the RCU list iterators, filtering on the request
 * family unless it is NFPROTO_UNSPEC, and writes one message per table
 * with nf_tables_fill_table_info(). cb->seq is loaded from
 * net->nft.base_seq and nl_dump_check_consistent() is called on the
 * skb's message header.
 * NOTE(review): the RCU read-side locking, the use of idx/s_idx for
 * resuming, and the exit path are on lines not visible here.
 */
465 static int nf_tables_dump_tables(struct sk_buff *skb,
466 struct netlink_callback *cb)
468 const struct nfgenmsg *nfmsg = nlmsg_data(cb->nlh);
469 const struct nft_af_info *afi;
470 const struct nft_table *table;
471 unsigned int idx = 0, s_idx = cb->args[0];
472 struct net *net = sock_net(skb->sk);
473 int family = nfmsg->nfgen_family;
476 cb->seq = net->nft.base_seq;
478 list_for_each_entry_rcu(afi, &net->nft.af_info, list) {
479 if (family != NFPROTO_UNSPEC && family != afi->family)
482 list_for_each_entry_rcu(table, &afi->tables, list) {
/* Zeroes every cb->args slot except args[0]. */
486 memset(&cb->args[1], 0,
487 sizeof(cb->args) - sizeof(cb->args[0]));
488 if (nf_tables_fill_table_info(skb, net,
489 NETLINK_CB(cb->skb).portid,
493 afi->family, table) < 0)
496 nl_dump_check_consistent(cb, nlmsg_hdr(skb));
/*
 * Handler for a table GET request. With NLM_F_DUMP set it starts a
 * netlink dump driven by nf_tables_dump_tables(). Otherwise it looks up
 * the address family (autoload disabled) and the table named by
 * NFTA_TABLE_NAME, tests the table's NFT_TABLE_INACTIVE flag, fills an
 * NFT_MSG_NEWTABLE message into a newly allocated skb and unicasts it to
 * the requester's port id.
 * NOTE(review): the error checks after the lookups, the result for an
 * inactive table and the failure cleanup are on elided lines.
 */
507 static int nf_tables_gettable(struct sock *nlsk, struct sk_buff *skb,
508 const struct nlmsghdr *nlh,
509 const struct nlattr * const nla[])
511 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
512 const struct nft_af_info *afi;
513 const struct nft_table *table;
514 struct sk_buff *skb2;
515 struct net *net = sock_net(skb->sk);
516 int family = nfmsg->nfgen_family;
519 if (nlh->nlmsg_flags & NLM_F_DUMP) {
520 struct netlink_dump_control c = {
521 .dump = nf_tables_dump_tables,
523 return netlink_dump_start(nlsk, skb, nlh, &c);
526 afi = nf_tables_afinfo_lookup(net, family, false);
530 table = nf_tables_table_lookup(afi, nla[NFTA_TABLE_NAME]);
532 return PTR_ERR(table);
533 if (table->flags & NFT_TABLE_INACTIVE)
536 skb2 = alloc_skb(NLMSG_GOODSIZE, GFP_KERNEL);
540 err = nf_tables_fill_table_info(skb2, net, NETLINK_CB(skb).portid,
541 nlh->nlmsg_seq, NFT_MSG_NEWTABLE, 0,
546 return nlmsg_unicast(nlsk, skb2, NETLINK_CB(skb).portid);
/*
 * Registers the hook ops (afi->nops of them) of base chains in the
 * table. Both loops test each chain's NFT_BASE_CHAIN flag.
 * NOTE(review): the second loop, which unregisters hooks, is presumably
 * the rollback taken when a registration fails - the branch structure
 * and the loop termination are not visible; confirm.
 */
553 static int nf_tables_table_enable(const struct nft_af_info *afi,
554 struct nft_table *table)
556 struct nft_chain *chain;
559 list_for_each_entry(chain, &table->chains, list) {
560 if (!(chain->flags & NFT_BASE_CHAIN))
563 err = nf_register_hooks(nft_base_chain(chain)->ops, afi->nops);
571 list_for_each_entry(chain, &table->chains, list) {
572 if (!(chain->flags & NFT_BASE_CHAIN))
578 nf_unregister_hooks(nft_base_chain(chain)->ops, afi->nops);
/*
 * Unregisters the hook ops of every chain in the table that carries the
 * NFT_BASE_CHAIN flag.
 * NOTE(review): the count argument of nf_unregister_hooks() is on a line
 * not visible here.
 */
583 static void nf_tables_table_disable(const struct nft_af_info *afi,
584 struct nft_table *table)
586 struct nft_chain *chain;
588 list_for_each_entry(chain, &table->chains, list) {
589 if (chain->flags & NFT_BASE_CHAIN)
590 nf_unregister_hooks(nft_base_chain(chain)->ops,
/*
 * Queues a flags update for an existing table (ctx->table). The
 * requested flags come from NFTA_TABLE_FLAGS; NFT_TABLE_F_DORMANT is the
 * only bit that passes the mask test. The update is recorded in an
 * NFT_MSG_NEWTABLE transaction flagged as an update and appended to the
 * commit list.
 * NOTE(review): the results for a missing attribute, unsupported bits,
 * unchanged flags and allocation failure are on elided lines;
 * nft_trans_destroy() at the end is presumably the error path.
 */
595 static int nf_tables_updtable(struct nft_ctx *ctx)
597 struct nft_trans *trans;
601 if (!ctx->nla[NFTA_TABLE_FLAGS])
604 flags = ntohl(nla_get_be32(ctx->nla[NFTA_TABLE_FLAGS]));
605 if (flags & ~NFT_TABLE_F_DORMANT)
608 if (flags == ctx->table->flags)
611 trans = nft_trans_alloc(ctx, NFT_MSG_NEWTABLE,
612 sizeof(struct nft_trans_table));
/* Going dormant: only recorded in the transaction here. Leaving
 * dormant: hooks are registered right away and the flag is cleared on
 * the table before the transaction is queued.
 */
616 if ((flags & NFT_TABLE_F_DORMANT) &&
617 !(ctx->table->flags & NFT_TABLE_F_DORMANT)) {
618 nft_trans_table_enable(trans) = false;
619 } else if (!(flags & NFT_TABLE_F_DORMANT) &&
620 ctx->table->flags & NFT_TABLE_F_DORMANT) {
621 ret = nf_tables_table_enable(ctx->afi, ctx->table);
623 ctx->table->flags &= ~NFT_TABLE_F_DORMANT;
624 nft_trans_table_enable(trans) = true;
630 nft_trans_table_update(trans) = true;
631 list_add_tail(&trans->list, &ctx->net->nft.commit_list);
634 nft_trans_destroy(trans);
/*
 * Handler for a NEWTABLE request. Looks up the address family with
 * autoload enabled, then the table named by NFTA_TABLE_NAME. A lookup
 * error other than -ENOENT is returned as-is. For an existing table the
 * INACTIVE flag and the NLM_F_EXCL / NLM_F_REPLACE request flags are
 * tested and the request is handed to nf_tables_updtable(). Otherwise a
 * new zeroed table is allocated, named, given empty chain and set lists,
 * queued through nft_trans_table_add() and linked onto afi->tables.
 * NOTE(review): the results of the individual flag tests and the
 * failure cleanup are on elided lines; module_put() at the end
 * presumably undoes try_module_get() on failure - confirm.
 */
638 static int nf_tables_newtable(struct sock *nlsk, struct sk_buff *skb,
639 const struct nlmsghdr *nlh,
640 const struct nlattr * const nla[])
642 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
643 const struct nlattr *name;
644 struct nft_af_info *afi;
645 struct nft_table *table;
646 struct net *net = sock_net(skb->sk);
647 int family = nfmsg->nfgen_family;
652 afi = nf_tables_afinfo_lookup(net, family, true);
656 name = nla[NFTA_TABLE_NAME];
657 table = nf_tables_table_lookup(afi, name);
659 if (PTR_ERR(table) != -ENOENT)
660 return PTR_ERR(table);
665 if (table->flags & NFT_TABLE_INACTIVE)
667 if (nlh->nlmsg_flags & NLM_F_EXCL)
669 if (nlh->nlmsg_flags & NLM_F_REPLACE)
672 nft_ctx_init(&ctx, skb, nlh, afi, table, NULL, nla);
673 return nf_tables_updtable(&ctx);
/* Creation path: NFT_TABLE_F_DORMANT is the only flag bit that passes
 * the mask test.
 */
676 if (nla[NFTA_TABLE_FLAGS]) {
677 flags = ntohl(nla_get_be32(nla[NFTA_TABLE_FLAGS]));
678 if (flags & ~NFT_TABLE_F_DORMANT)
/* A reference on the family's owning module is taken before the table
 * is allocated.
 */
682 if (!try_module_get(afi->owner))
683 return -EAFNOSUPPORT;
686 table = kzalloc(sizeof(*table), GFP_KERNEL);
690 nla_strlcpy(table->name, name, NFT_TABLE_MAXNAMELEN);
691 INIT_LIST_HEAD(&table->chains);
692 INIT_LIST_HEAD(&table->sets);
693 table->flags = flags;
695 nft_ctx_init(&ctx, skb, nlh, afi, table, NULL, nla);
696 err = nft_trans_table_add(&ctx, NFT_MSG_NEWTABLE);
700 list_add_tail_rcu(&table->list, &afi->tables);
705 module_put(afi->owner);
/*
 * Queues deletion of everything in ctx->table, in this order: the rules
 * of each chain, the sets, the chains, then the table itself. The set
 * and chain deletion loops use the _safe iterator because nft_delset()
 * and nft_delchain() unlink the entry being visited.
 * NOTE(review): the lines that point ctx->chain at the current chain,
 * the action for a bound anonymous set and the error handling between
 * steps are not visible here.
 */
709 static int nft_flush_table(struct nft_ctx *ctx)
712 struct nft_chain *chain, *nc;
713 struct nft_set *set, *ns;
715 list_for_each_entry(chain, &ctx->table->chains, list) {
718 err = nft_delrule_by_chain(ctx);
723 list_for_each_entry_safe(set, ns, &ctx->table->sets, list) {
724 if (set->flags & NFT_SET_ANONYMOUS &&
725 !list_empty(&set->bindings))
728 err = nft_delset(ctx, set);
733 list_for_each_entry_safe(chain, nc, &ctx->table->chains, list) {
736 err = nft_delchain(ctx);
741 err = nft_deltable(ctx);
/*
 * Flushes tables across address families. Families are filtered on
 * @family unless it is AF_UNSPEC; tables are filtered on
 * NFTA_TABLE_NAME when that attribute is present. nft_flush_table() is
 * called for the tables that pass. The table loop uses the _safe
 * iterator.
 * NOTE(review): the lines that store afi/table into ctx before the
 * flush call and the error handling are not visible here.
 */
746 static int nft_flush(struct nft_ctx *ctx, int family)
748 struct nft_af_info *afi;
749 struct nft_table *table, *nt;
750 const struct nlattr * const *nla = ctx->nla;
753 list_for_each_entry(afi, &ctx->net->nft.af_info, list) {
754 if (family != AF_UNSPEC && afi->family != family)
758 list_for_each_entry_safe(table, nt, &afi->tables, list) {
759 if (nla[NFTA_TABLE_NAME] &&
760 nla_strcmp(nla[NFTA_TABLE_NAME], table->name) != 0)
765 err = nft_flush_table(ctx);
/*
 * Handler for a DELTABLE request. When the family is AF_UNSPEC or no
 * table name is given, the request becomes a flush via nft_flush().
 * Otherwise the family (autoload disabled) and the named table are
 * looked up, the table's INACTIVE flag is tested and nft_flush_table()
 * queues its removal.
 * NOTE(review): the context is first initialised with NULL afi and
 * table; the lines that fill them in before nft_flush_table(), and the
 * results of the visible tests, are elided - confirm.
 */
774 static int nf_tables_deltable(struct sock *nlsk, struct sk_buff *skb,
775 const struct nlmsghdr *nlh,
776 const struct nlattr * const nla[])
778 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
779 struct nft_af_info *afi;
780 struct nft_table *table;
781 struct net *net = sock_net(skb->sk);
782 int family = nfmsg->nfgen_family;
785 nft_ctx_init(&ctx, skb, nlh, NULL, NULL, NULL, nla);
786 if (family == AF_UNSPEC || nla[NFTA_TABLE_NAME] == NULL)
787 return nft_flush(&ctx, family);
789 afi = nf_tables_afinfo_lookup(net, family, false);
793 table = nf_tables_table_lookup(afi, nla[NFTA_TABLE_NAME]);
795 return PTR_ERR(table);
796 if (table->flags & NFT_TABLE_INACTIVE)
802 return nft_flush_table(&ctx);
/*
 * Final teardown of ctx->table: asserts that the table's use counter is
 * zero and drops a reference on the family's owning module.
 * NOTE(review): freeing the table itself is presumably done on the
 * elided lines in between - confirm.
 */
805 static void nf_tables_table_destroy(struct nft_ctx *ctx)
807 BUG_ON(ctx->table->use > 0);
810 module_put(ctx->afi->owner);
/*
 * Stores ctype in chain_type[ctype->family][ctype->type] under the
 * NFNL_SUBSYS_NFTABLES lock, after testing whether the slot is already
 * occupied.
 * NOTE(review): the action for an occupied slot and the return values
 * are on lines not visible here.
 */
813 int nft_register_chain_type(const struct nf_chain_type *ctype)
817 nfnl_lock(NFNL_SUBSYS_NFTABLES);
818 if (chain_type[ctype->family][ctype->type] != NULL) {
822 chain_type[ctype->family][ctype->type] = ctype;
824 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
827 EXPORT_SYMBOL_GPL(nft_register_chain_type);
/* Clears the chain_type slot selected by ctype's family and type, under
 * the NFNL_SUBSYS_NFTABLES lock. The slot is reset without checking that
 * it currently holds ctype.
 */
829 void nft_unregister_chain_type(const struct nf_chain_type *ctype)
831 nfnl_lock(NFNL_SUBSYS_NFTABLES);
832 chain_type[ctype->family][ctype->type] = NULL;
833 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
835 EXPORT_SYMBOL_GPL(nft_unregister_chain_type);
/*
 * Searches the table's chain list for a chain whose handle equals
 * @handle; ERR_PTR(-ENOENT) when the loop finds none.
 * NOTE(review): the statement executed on a match is not visible -
 * presumably it returns the chain; confirm.
 */
841 static struct nft_chain *
842 nf_tables_chain_lookup_byhandle(const struct nft_table *table, u64 handle)
844 struct nft_chain *chain;
846 list_for_each_entry(chain, &table->chains, list) {
847 if (chain->handle == handle)
851 return ERR_PTR(-ENOENT);
/*
 * Searches the table's chain list for a chain whose name equals the
 * netlink string attribute; ERR_PTR(-ENOENT) when the loop finds none.
 * NOTE(review): the condition guarding ERR_PTR(-EINVAL) and the
 * statement executed on a match are elided - presumably a missing
 * attribute and returning the chain; confirm.
 */
854 static struct nft_chain *nf_tables_chain_lookup(const struct nft_table *table,
855 const struct nlattr *nla)
857 struct nft_chain *chain;
860 return ERR_PTR(-EINVAL);
862 list_for_each_entry(chain, &table->chains, list) {
863 if (!nla_strcmp(nla, chain->name))
867 return ERR_PTR(-ENOENT);
/* Netlink attribute policy for chain messages. Only NFTA_CHAIN_NAME has
 * a length bound (NFT_CHAIN_MAXNAMELEN - 1); the table and type strings
 * carry no .len limit in this policy.
 */
870 static const struct nla_policy nft_chain_policy[NFTA_CHAIN_MAX + 1] = {
871 [NFTA_CHAIN_TABLE] = { .type = NLA_STRING },
872 [NFTA_CHAIN_HANDLE] = { .type = NLA_U64 },
873 [NFTA_CHAIN_NAME] = { .type = NLA_STRING,
874 .len = NFT_CHAIN_MAXNAMELEN - 1 },
875 [NFTA_CHAIN_HOOK] = { .type = NLA_NESTED },
876 [NFTA_CHAIN_POLICY] = { .type = NLA_U32 },
877 [NFTA_CHAIN_TYPE] = { .type = NLA_STRING },
878 [NFTA_CHAIN_COUNTERS] = { .type = NLA_NESTED },
/* Policy for the attributes nested inside NFTA_CHAIN_HOOK: hook number
 * and priority, both 32-bit values.
 */
881 static const struct nla_policy nft_hook_policy[NFTA_HOOK_MAX + 1] = {
882 [NFTA_HOOK_HOOKNUM] = { .type = NLA_U32 },
883 [NFTA_HOOK_PRIORITY] = { .type = NLA_U32 },
/*
 * Sums the per-cpu chain counters over all possible CPUs and writes the
 * totals as a nested NFTA_CHAIN_COUNTERS attribute holding
 * NFTA_COUNTER_PACKETS and NFTA_COUNTER_BYTES as big-endian 64-bit
 * values.
 * NOTE(review): only the bytes accumulation is visible; the packets
 * accumulation and the return paths are on elided lines.
 */
886 static int nft_dump_stats(struct sk_buff *skb, struct nft_stats __percpu *stats)
888 struct nft_stats *cpu_stats, total;
894 memset(&total, 0, sizeof(total));
895 for_each_possible_cpu(cpu) {
896 cpu_stats = per_cpu_ptr(stats, cpu);
/* Each CPU's pair is read between u64_stats_fetch_begin_irq() and the
 * retry check, so pkts and bytes form a consistent snapshot.
 */
898 seq = u64_stats_fetch_begin_irq(&cpu_stats->syncp);
899 pkts = cpu_stats->pkts;
900 bytes = cpu_stats->bytes;
901 } while (u64_stats_fetch_retry_irq(&cpu_stats->syncp, seq));
903 total.bytes += bytes;
905 nest = nla_nest_start(skb, NFTA_CHAIN_COUNTERS);
907 goto nla_put_failure;
909 if (nla_put_be64(skb, NFTA_COUNTER_PACKETS, cpu_to_be64(total.pkts)) ||
910 nla_put_be64(skb, NFTA_COUNTER_BYTES, cpu_to_be64(total.bytes)))
911 goto nla_put_failure;
913 nla_nest_end(skb, nest);
/*
 * Writes one chain message into skb. The header is built the same way
 * as for tables (event tagged with the nftables subsystem id, nfgenmsg
 * with family, NFNETLINK_V0 and the low 16 bits of base_seq). Always
 * written: table name, chain handle (big-endian 64-bit), chain name and
 * NFTA_CHAIN_USE. For base chains additionally: a nested
 * NFTA_CHAIN_HOOK with hook number and priority taken from the first
 * hook ops entry, the policy, the chain type name and the counters via
 * nft_dump_stats().
 * NOTE(review): the success return and the nla_put_failure label are
 * not visible - the final nlmsg_trim() presumably belongs to the
 * failure path; confirm.
 */
920 static int nf_tables_fill_chain_info(struct sk_buff *skb, struct net *net,
921 u32 portid, u32 seq, int event, u32 flags,
922 int family, const struct nft_table *table,
923 const struct nft_chain *chain)
925 struct nlmsghdr *nlh;
926 struct nfgenmsg *nfmsg;
928 event |= NFNL_SUBSYS_NFTABLES << 8;
929 nlh = nlmsg_put(skb, portid, seq, event, sizeof(struct nfgenmsg), flags);
931 goto nla_put_failure;
933 nfmsg = nlmsg_data(nlh);
934 nfmsg->nfgen_family = family;
935 nfmsg->version = NFNETLINK_V0;
936 nfmsg->res_id = htons(net->nft.base_seq & 0xffff);
938 if (nla_put_string(skb, NFTA_CHAIN_TABLE, table->name))
939 goto nla_put_failure;
940 if (nla_put_be64(skb, NFTA_CHAIN_HANDLE, cpu_to_be64(chain->handle)))
941 goto nla_put_failure;
942 if (nla_put_string(skb, NFTA_CHAIN_NAME, chain->name))
943 goto nla_put_failure;
945 if (chain->flags & NFT_BASE_CHAIN) {
946 const struct nft_base_chain *basechain = nft_base_chain(chain);
947 const struct nf_hook_ops *ops = &basechain->ops[0];
950 nest = nla_nest_start(skb, NFTA_CHAIN_HOOK);
952 goto nla_put_failure;
953 if (nla_put_be32(skb, NFTA_HOOK_HOOKNUM, htonl(ops->hooknum)))
954 goto nla_put_failure;
955 if (nla_put_be32(skb, NFTA_HOOK_PRIORITY, htonl(ops->priority)))
956 goto nla_put_failure;
957 nla_nest_end(skb, nest);
959 if (nla_put_be32(skb, NFTA_CHAIN_POLICY,
960 htonl(basechain->policy)))
961 goto nla_put_failure;
963 if (nla_put_string(skb, NFTA_CHAIN_TYPE, basechain->type->name))
964 goto nla_put_failure;
966 if (nft_dump_stats(skb, nft_base_chain(chain)->stats))
967 goto nla_put_failure;
970 if (nla_put_be32(skb, NFTA_CHAIN_USE, htonl(chain->use)))
971 goto nla_put_failure;
977 nlmsg_trim(skb, nlh);
/*
 * Sends a chain event to the NFNLGRP_NFTABLES multicast group: allocates
 * a message skb, fills it with nf_tables_fill_chain_info() and hands it
 * to nfnetlink_send().
 * NOTE(review): the first half of the listener test, the final argument
 * of the fill call, the error checks and the arguments completing
 * nfnetlink_set_err() are on elided lines; nfnetlink_set_err() is
 * presumably the failure path - confirm.
 */
981 static int nf_tables_chain_notify(const struct nft_ctx *ctx, int event)
987 !nfnetlink_has_listeners(ctx->net, NFNLGRP_NFTABLES))
991 skb = nlmsg_new(NLMSG_GOODSIZE, GFP_KERNEL);
995 err = nf_tables_fill_chain_info(skb, ctx->net, ctx->portid, ctx->seq,
996 event, 0, ctx->afi->family, ctx->table,
1003 err = nfnetlink_send(skb, ctx->net, ctx->portid, NFNLGRP_NFTABLES,
1004 ctx->report, GFP_KERNEL);
1007 nfnetlink_set_err(ctx->net, ctx->portid, NFNLGRP_NFTABLES,
/*
 * Netlink dump callback for chains (installed as .dump by
 * nf_tables_getchain()). Iterates families, their tables and each
 * table's chains with the RCU list iterators, filtering on the request
 * family unless it is NFPROTO_UNSPEC, and writes one message per chain
 * with nf_tables_fill_chain_info(). cb->seq is loaded from
 * net->nft.base_seq and nl_dump_check_consistent() is called on the
 * skb's message header.
 * NOTE(review): the RCU read-side locking, the use of idx/s_idx for
 * resuming, and the exit path are on lines not visible here.
 */
1013 static int nf_tables_dump_chains(struct sk_buff *skb,
1014 struct netlink_callback *cb)
1016 const struct nfgenmsg *nfmsg = nlmsg_data(cb->nlh);
1017 const struct nft_af_info *afi;
1018 const struct nft_table *table;
1019 const struct nft_chain *chain;
1020 unsigned int idx = 0, s_idx = cb->args[0];
1021 struct net *net = sock_net(skb->sk);
1022 int family = nfmsg->nfgen_family;
1025 cb->seq = net->nft.base_seq;
1027 list_for_each_entry_rcu(afi, &net->nft.af_info, list) {
1028 if (family != NFPROTO_UNSPEC && family != afi->family)
1031 list_for_each_entry_rcu(table, &afi->tables, list) {
1032 list_for_each_entry_rcu(chain, &table->chains, list) {
/* Zeroes every cb->args slot except args[0]. */
1036 memset(&cb->args[1], 0,
1037 sizeof(cb->args) - sizeof(cb->args[0]));
1038 if (nf_tables_fill_chain_info(skb, net,
1039 NETLINK_CB(cb->skb).portid,
1043 afi->family, table, chain) < 0)
1046 nl_dump_check_consistent(cb, nlmsg_hdr(skb));
/*
 * Handler for a chain GET request. With NLM_F_DUMP set it starts a
 * netlink dump driven by nf_tables_dump_chains(). Otherwise it resolves
 * family (autoload disabled), table (NFTA_CHAIN_TABLE) and chain
 * (NFTA_CHAIN_NAME), tests the INACTIVE flag of table and chain, fills
 * an NFT_MSG_NEWCHAIN message into a newly allocated skb and unicasts it
 * to the requester's port id.
 * NOTE(review): the IS_ERR tests guarding the PTR_ERR returns, the
 * results for inactive objects and the failure cleanup are on elided
 * lines.
 */
1058 static int nf_tables_getchain(struct sock *nlsk, struct sk_buff *skb,
1059 const struct nlmsghdr *nlh,
1060 const struct nlattr * const nla[])
1062 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
1063 const struct nft_af_info *afi;
1064 const struct nft_table *table;
1065 const struct nft_chain *chain;
1066 struct sk_buff *skb2;
1067 struct net *net = sock_net(skb->sk);
1068 int family = nfmsg->nfgen_family;
1071 if (nlh->nlmsg_flags & NLM_F_DUMP) {
1072 struct netlink_dump_control c = {
1073 .dump = nf_tables_dump_chains,
1075 return netlink_dump_start(nlsk, skb, nlh, &c);
1078 afi = nf_tables_afinfo_lookup(net, family, false);
1080 return PTR_ERR(afi);
1082 table = nf_tables_table_lookup(afi, nla[NFTA_CHAIN_TABLE]);
1084 return PTR_ERR(table);
1085 if (table->flags & NFT_TABLE_INACTIVE)
1088 chain = nf_tables_chain_lookup(table, nla[NFTA_CHAIN_NAME]);
1090 return PTR_ERR(chain);
1091 if (chain->flags & NFT_CHAIN_INACTIVE)
1094 skb2 = alloc_skb(NLMSG_GOODSIZE, GFP_KERNEL);
1098 err = nf_tables_fill_chain_info(skb2, net, NETLINK_CB(skb).portid,
1099 nlh->nlmsg_seq, NFT_MSG_NEWCHAIN, 0,
1100 family, table, chain);
1104 return nlmsg_unicast(nlsk, skb2, NETLINK_CB(skb).portid);
/* Policy for the attributes nested inside NFTA_CHAIN_COUNTERS: packet
 * and byte counters, both 64-bit values.
 */
1111 static const struct nla_policy nft_counter_policy[NFTA_COUNTER_MAX + 1] = {
1112 [NFTA_COUNTER_PACKETS] = { .type = NLA_U64 },
1113 [NFTA_COUNTER_BYTES] = { .type = NLA_U64 },
/*
 * Builds a per-cpu counter block from a nested counters attribute. The
 * attribute is parsed against nft_counter_policy; a parse error is
 * passed back as ERR_PTR(err), a missing bytes or packets attribute
 * gives ERR_PTR(-EINVAL) and an allocation failure gives
 * ERR_PTR(-ENOMEM). The supplied totals (big-endian 64-bit) are written
 * into the executing CPU's slot only, which is sufficient because
 * readers sum all CPUs.
 * NOTE(review): the statements around the this_cpu_ptr() access and the
 * final return are on lines not visible here.
 */
1116 static struct nft_stats __percpu *nft_stats_alloc(const struct nlattr *attr)
1118 struct nlattr *tb[NFTA_COUNTER_MAX+1];
1119 struct nft_stats __percpu *newstats;
1120 struct nft_stats *stats;
1123 err = nla_parse_nested(tb, NFTA_COUNTER_MAX, attr, nft_counter_policy);
1125 return ERR_PTR(err);
1127 if (!tb[NFTA_COUNTER_BYTES] || !tb[NFTA_COUNTER_PACKETS])
1128 return ERR_PTR(-EINVAL);
1130 newstats = netdev_alloc_pcpu_stats(struct nft_stats);
1131 if (newstats == NULL)
1132 return ERR_PTR(-ENOMEM);
1134 /* Restore old counters on this cpu, no problem. Per-cpu statistics
1135 * are not exposed to userspace.
1138 stats = this_cpu_ptr(newstats);
1139 stats->bytes = be64_to_cpu(nla_get_be64(tb[NFTA_COUNTER_BYTES]));
1140 stats->pkts = be64_to_cpu(nla_get_be64(tb[NFTA_COUNTER_PACKETS]));
/*
 * Installs a new per-cpu counter block on a base chain. Two publication
 * paths are visible: one fetches the old block, publishes the new one
 * with rcu_assign_pointer() and frees the old block; the other only
 * publishes.
 * NOTE(review): the action for newstats == NULL, the condition choosing
 * between the two paths and any grace-period wait before free_percpu()
 * are on lines not visible here - confirm.
 */
1146 static void nft_chain_stats_replace(struct nft_base_chain *chain,
1147 struct nft_stats __percpu *newstats)
1149 if (newstats == NULL)
1153 struct nft_stats __percpu *oldstats =
1154 nft_dereference(chain->stats);
1156 rcu_assign_pointer(chain->stats, newstats);
1158 free_percpu(oldstats);
1160 rcu_assign_pointer(chain->stats, newstats);
/*
 * Releases a chain whose use counter is zero (enforced with BUG_ON).
 * For a base chain this drops the chain type's module reference, frees
 * the per-cpu counters and frees the enclosing nft_base_chain.
 * NOTE(review): the branch for non-base chains is not visible here.
 */
1163 static void nf_tables_chain_destroy(struct nft_chain *chain)
1165 BUG_ON(chain->use > 0);
1167 if (chain->flags & NFT_BASE_CHAIN) {
1168 module_put(nft_base_chain(chain)->type->owner);
1169 free_percpu(nft_base_chain(chain)->stats);
1170 kfree(nft_base_chain(chain));
/*
 * Handler for a NEWCHAIN request; covers both creating a chain and
 * updating an existing one.
 *
 * Visible flow: resolve family (autoload enabled) and table; find the
 * chain by NFTA_CHAIN_HANDLE if given, else by name; read an optional
 * policy; for an existing chain queue an update transaction (counters,
 * policy, optional rename); otherwise build a base chain (when
 * NFTA_CHAIN_HOOK is present) or a plain chain, register hooks unless
 * the table is dormant, queue an NFT_MSG_NEWCHAIN transaction and link
 * the chain onto the table.
 *
 * NOTE(review): many short lines (error returns, else branches, labels,
 * closing braces) are not visible in this listing, so the exact result
 * of each test below has to be confirmed against the full file.
 */
1176 static int nf_tables_newchain(struct sock *nlsk, struct sk_buff *skb,
1177 const struct nlmsghdr *nlh,
1178 const struct nlattr * const nla[])
1180 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
1181 const struct nlattr * uninitialized_var(name);
1182 struct nft_af_info *afi;
1183 struct nft_table *table;
1184 struct nft_chain *chain;
1185 struct nft_base_chain *basechain = NULL;
1186 struct nlattr *ha[NFTA_HOOK_MAX + 1];
1187 struct net *net = sock_net(skb->sk);
1188 int family = nfmsg->nfgen_family;
1189 u8 policy = NF_ACCEPT;
1192 struct nft_stats __percpu *stats;
1197 create = nlh->nlmsg_flags & NLM_F_CREATE ? true : false;
1199 afi = nf_tables_afinfo_lookup(net, family, true);
1201 return PTR_ERR(afi);
1203 table = nf_tables_table_lookup(afi, nla[NFTA_CHAIN_TABLE]);
1205 return PTR_ERR(table);
1208 name = nla[NFTA_CHAIN_NAME];
/* Lookup by handle when one is supplied, otherwise by name. For the
 * by-name lookup only errors other than -ENOENT are returned.
 */
1210 if (nla[NFTA_CHAIN_HANDLE]) {
1211 handle = be64_to_cpu(nla_get_be64(nla[NFTA_CHAIN_HANDLE]));
1212 chain = nf_tables_chain_lookup_byhandle(table, handle);
1214 return PTR_ERR(chain);
1216 chain = nf_tables_chain_lookup(table, name);
1217 if (IS_ERR(chain)) {
1218 if (PTR_ERR(chain) != -ENOENT)
1219 return PTR_ERR(chain);
/* A policy is tested against two cases: an existing chain that is not
 * a base chain, and a new chain without a hook.
 * NOTE(review): the 32-bit attribute value is stored into the u8
 * `policy`, so its upper 24 bits are dropped before any range check on
 * the elided lines can see them - confirm this is intended.
 */
1224 if (nla[NFTA_CHAIN_POLICY]) {
1225 if ((chain != NULL &&
1226 !(chain->flags & NFT_BASE_CHAIN)))
1229 if (chain == NULL &&
1230 nla[NFTA_CHAIN_HOOK] == NULL)
1233 policy = ntohl(nla_get_be32(nla[NFTA_CHAIN_POLICY]));
/* Update of an existing chain.
 * NOTE(review): this `stats` shadows the function-level `stats` and is
 * declared without the __percpu annotation, although it receives the
 * result of nft_stats_alloc().
 */
1243 if (chain != NULL) {
1244 struct nft_stats *stats = NULL;
1245 struct nft_trans *trans;
1247 if (chain->flags & NFT_CHAIN_INACTIVE)
1249 if (nlh->nlmsg_flags & NLM_F_EXCL)
1251 if (nlh->nlmsg_flags & NLM_F_REPLACE)
/* Rename request (handle plus name): tested against an existing chain
 * that already carries the new name.
 */
1254 if (nla[NFTA_CHAIN_HANDLE] && name &&
1255 !IS_ERR(nf_tables_chain_lookup(table, nla[NFTA_CHAIN_NAME])))
1258 if (nla[NFTA_CHAIN_COUNTERS]) {
1259 if (!(chain->flags & NFT_BASE_CHAIN))
1262 stats = nft_stats_alloc(nla[NFTA_CHAIN_COUNTERS]);
1264 return PTR_ERR(stats);
1267 nft_ctx_init(&ctx, skb, nlh, afi, table, chain, nla);
1268 trans = nft_trans_alloc(&ctx, NFT_MSG_NEWCHAIN,
1269 sizeof(struct nft_trans_chain));
1270 if (trans == NULL) {
1275 nft_trans_chain_stats(trans) = stats;
1276 nft_trans_chain_update(trans) = true;
/* A policy of -1 in the transaction marks "no policy supplied". */
1278 if (nla[NFTA_CHAIN_POLICY])
1279 nft_trans_chain_policy(trans) = policy;
1281 nft_trans_chain_policy(trans) = -1;
1283 if (nla[NFTA_CHAIN_HANDLE] && name) {
1284 nla_strlcpy(nft_trans_chain_name(trans), name,
1285 NFT_CHAIN_MAXNAMELEN);
1287 list_add_tail(&trans->list, &net->nft.commit_list);
/* Creation of a new chain. */
1291 if (table->use == UINT_MAX)
/* Base chain: a hook attribute is present. The type starts as the
 * family's NFT_CHAIN_T_DEFAULT entry and is replaced when
 * NFTA_CHAIN_TYPE names one.
 */
1294 if (nla[NFTA_CHAIN_HOOK]) {
1295 const struct nf_chain_type *type;
1296 struct nf_hook_ops *ops;
1298 u32 hooknum, priority;
1300 type = chain_type[family][NFT_CHAIN_T_DEFAULT];
1301 if (nla[NFTA_CHAIN_TYPE]) {
1302 type = nf_tables_chain_type_lookup(afi,
1303 nla[NFTA_CHAIN_TYPE],
1306 return PTR_ERR(type);
1309 err = nla_parse_nested(ha, NFTA_HOOK_MAX, nla[NFTA_CHAIN_HOOK],
1313 if (ha[NFTA_HOOK_HOOKNUM] == NULL ||
1314 ha[NFTA_HOOK_PRIORITY] == NULL)
1317 hooknum = ntohl(nla_get_be32(ha[NFTA_HOOK_HOOKNUM]));
1318 if (hooknum >= afi->nhooks)
1320 priority = ntohl(nla_get_be32(ha[NFTA_HOOK_PRIORITY]));
/* The hook number was bounded by afi->nhooks above before it is used as
 * a shift count and as an index into type->hooks.
 */
1322 if (!(type->hook_mask & (1 << hooknum)))
1324 if (!try_module_get(type->owner))
1326 hookfn = type->hooks[hooknum];
1328 basechain = kzalloc(sizeof(*basechain), GFP_KERNEL);
1329 if (basechain == NULL) {
1330 module_put(type->owner);
/* Counters: restored from the request when supplied, otherwise freshly
 * allocated.
 * NOTE(review): the restored case stores the pointer with a plain
 * assignment while the fresh case uses rcu_assign_pointer().
 */
1334 if (nla[NFTA_CHAIN_COUNTERS]) {
1335 stats = nft_stats_alloc(nla[NFTA_CHAIN_COUNTERS]);
1336 if (IS_ERR(stats)) {
1337 module_put(type->owner);
1339 return PTR_ERR(stats);
1341 basechain->stats = stats;
1343 stats = netdev_alloc_pcpu_stats(struct nft_stats);
1344 if (stats == NULL) {
1345 module_put(type->owner);
1349 rcu_assign_pointer(basechain->stats, stats);
1352 write_pnet(&basechain->pnet, net);
1353 basechain->type = type;
1354 chain = &basechain->chain;
/* Every one of the family's afi->nops hook ops gets the same hook
 * number and priority; the family may adjust an entry through
 * hook_ops_init().
 */
1356 for (i = 0; i < afi->nops; i++) {
1357 ops = &basechain->ops[i];
1359 ops->owner = afi->owner;
1360 ops->hooknum = hooknum;
1361 ops->priority = priority;
1363 ops->hook = afi->hooks[ops->hooknum];
1366 if (afi->hook_ops_init)
1367 afi->hook_ops_init(ops, i);
1370 chain->flags |= NFT_BASE_CHAIN;
1371 basechain->policy = policy;
/* Plain (non-base) chain. */
1373 chain = kzalloc(sizeof(*chain), GFP_KERNEL);
1378 INIT_LIST_HEAD(&chain->rules);
1379 chain->handle = nf_tables_alloc_handle(table);
1380 chain->table = table;
1381 nla_strlcpy(chain->name, name, NFT_CHAIN_MAXNAMELEN);
/* Hooks are registered right away unless the table is dormant. */
1383 if (!(table->flags & NFT_TABLE_F_DORMANT) &&
1384 chain->flags & NFT_BASE_CHAIN) {
1385 err = nf_register_hooks(nft_base_chain(chain)->ops, afi->nops);
1390 nft_ctx_init(&ctx, skb, nlh, afi, table, chain, nla);
1391 err = nft_trans_chain_add(&ctx, NFT_MSG_NEWCHAIN);
1396 list_add_tail_rcu(&chain->list, &table->chains);
/* NOTE(review): the two calls below are presumably the error unwinding
 * (labels not visible): undo the hook registration, then free the
 * chain.
 */
1399 nf_tables_unregister_hooks(table, chain, afi->nops);
1401 nf_tables_chain_destroy(chain);
/*
 * Handler for a DELCHAIN request: resolves family (autoload disabled),
 * table and chain by name, tests the INACTIVE flag of both, then queues
 * the removal with nft_delchain().
 * NOTE(review): the IS_ERR tests, the results for inactive objects and
 * any further precondition between the lookup and nft_ctx_init() are on
 * lines not visible here.
 */
1405 static int nf_tables_delchain(struct sock *nlsk, struct sk_buff *skb,
1406 const struct nlmsghdr *nlh,
1407 const struct nlattr * const nla[])
1409 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
1410 struct nft_af_info *afi;
1411 struct nft_table *table;
1412 struct nft_chain *chain;
1413 struct net *net = sock_net(skb->sk);
1414 int family = nfmsg->nfgen_family;
1417 afi = nf_tables_afinfo_lookup(net, family, false);
1419 return PTR_ERR(afi);
1421 table = nf_tables_table_lookup(afi, nla[NFTA_CHAIN_TABLE]);
1423 return PTR_ERR(table);
1424 if (table->flags & NFT_TABLE_INACTIVE)
1427 chain = nf_tables_chain_lookup(table, nla[NFTA_CHAIN_NAME]);
1429 return PTR_ERR(chain);
1430 if (chain->flags & NFT_CHAIN_INACTIVE)
1435 nft_ctx_init(&ctx, skb, nlh, afi, table, chain, nla);
1437 return nft_delchain(&ctx);
1445 * nft_register_expr - register nf_tables expr type
1448 * Registers the expr type for use with nf_tables. Returns zero on
1449 * success or a negative errno code otherwise.
/*
 * Links an expression type onto nf_tables_expressions under the
 * NFNL_SUBSYS_NFTABLES lock. Family-independent types (NFPROTO_UNSPEC)
 * go to the tail and the other call inserts at the head, so a list walk
 * from the head meets family-specific types before generic ones.
 * NOTE(review): the else keyword and the return statement are on lines
 * not visible here.
 */
1451 int nft_register_expr(struct nft_expr_type *type)
1453 nfnl_lock(NFNL_SUBSYS_NFTABLES);
1454 if (type->family == NFPROTO_UNSPEC)
1455 list_add_tail_rcu(&type->list, &nf_tables_expressions);
1457 list_add_rcu(&type->list, &nf_tables_expressions);
1458 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
1461 EXPORT_SYMBOL_GPL(nft_register_expr);
1464 * nft_unregister_expr - unregister nf_tables expr type
1467 * Unregisters the expr type for use with nf_tables.
/* Removes the expression type from the list it is linked on using
 * list_del_rcu(), with the NFNL_SUBSYS_NFTABLES lock held.
 */
1469 void nft_unregister_expr(struct nft_expr_type *type)
1471 nfnl_lock(NFNL_SUBSYS_NFTABLES);
1472 list_del_rcu(&type->list);
1473 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
1475 EXPORT_SYMBOL_GPL(nft_unregister_expr);
/*
 * Walks nf_tables_expressions looking for a type whose name equals the
 * netlink string attribute and whose family is either zero or equal to
 * @family.
 * NOTE(review): the second parameter line and the results for a match
 * and for no match are not visible - presumably the type or NULL (the
 * caller tests against NULL); confirm.
 */
1477 static const struct nft_expr_type *__nft_expr_type_get(u8 family,
1480 const struct nft_expr_type *type;
1482 list_for_each_entry(type, &nf_tables_expressions, list) {
1483 if (!nla_strcmp(nla, type->name) &&
1484 (!type->family || type->family == family))
/*
 * Resolves an expression type by name and takes a reference on its
 * owning module. If the first lookup does not yield a usable type, two
 * module requests are attempted in turn: a family-specific alias
 * ("nft-expr-<family>-<name>") and then a generic one
 * ("nft-expr-<name>"). When a request makes the type appear,
 * ERR_PTR(-EAGAIN) is returned rather than the type itself. Other
 * visible error results: -EINVAL and -ENOENT.
 * NOTE(review): the second parameter line and the conditions guarding
 * -EINVAL and the module-loading section are on lines not visible here.
 */
1490 static const struct nft_expr_type *nft_expr_type_get(u8 family,
1493 const struct nft_expr_type *type;
1496 return ERR_PTR(-EINVAL);
1498 type = __nft_expr_type_get(family, nla);
1499 if (type != NULL && try_module_get(type->owner))
1502 #ifdef CONFIG_MODULES
/* Each request_module() call is made with the nfnl lock released, and
 * the lock is taken again before the list is searched.
 */
1504 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
1505 request_module("nft-expr-%u-%.*s", family,
1506 nla_len(nla), (char *)nla_data(nla));
1507 nfnl_lock(NFNL_SUBSYS_NFTABLES);
1508 if (__nft_expr_type_get(family, nla))
1509 return ERR_PTR(-EAGAIN);
1511 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
1512 request_module("nft-expr-%.*s",
1513 nla_len(nla), (char *)nla_data(nla));
1514 nfnl_lock(NFNL_SUBSYS_NFTABLES);
1515 if (__nft_expr_type_get(family, nla))
1516 return ERR_PTR(-EAGAIN);
1519 return ERR_PTR(-ENOENT);
/* Policy for one expression attribute: a name string and a nested data
 * blob whose contents are validated later against the type's own policy.
 */
1522 static const struct nla_policy nft_expr_policy[NFTA_EXPR_MAX + 1] = {
1523 [NFTA_EXPR_NAME] = { .type = NLA_STRING },
1524 [NFTA_EXPR_DATA] = { .type = NLA_NESTED },
/*
 * Writes an expression into skb: the type name as NFTA_EXPR_NAME and,
 * when the ops provide a dump callback, that callback's output nested
 * inside NFTA_EXPR_DATA. A negative return from the callback counts as
 * failure.
 * NOTE(review): the return statements and the failure label are on
 * lines not visible here.
 */
1527 static int nf_tables_fill_expr_info(struct sk_buff *skb,
1528 const struct nft_expr *expr)
1530 if (nla_put_string(skb, NFTA_EXPR_NAME, expr->ops->type->name))
1531 goto nla_put_failure;
1533 if (expr->ops->dump) {
1534 struct nlattr *data = nla_nest_start(skb, NFTA_EXPR_DATA);
1536 goto nla_put_failure;
1537 if (expr->ops->dump(skb, expr) < 0)
1538 goto nla_put_failure;
1539 nla_nest_end(skb, data);
/*
 * Dump @expr into @skb wrapped in a nested attribute of type @attr.
 * The nest is opened with nla_nest_start(), filled by
 * nf_tables_fill_expr_info() and closed with nla_nest_end(); failures jump
 * to the nla_put_failure label.
 */
1548 int nft_expr_dump(struct sk_buff *skb, unsigned int attr,
1549 const struct nft_expr *expr)
1551 struct nlattr *nest;
1553 nest = nla_nest_start(skb, attr);
1555 goto nla_put_failure;
1556 if (nf_tables_fill_expr_info(skb, expr) < 0)
1557 goto nla_put_failure;
1558 nla_nest_end(skb, nest);
/*
 * Result of parsing one expression attribute: the ops chosen for the
 * expression and the table of its parsed data attributes (filled by
 * nf_tables_expr_parse(), consumed by nf_tables_newexpr()).
 */
1565 struct nft_expr_info {
1566 const struct nft_expr_ops *ops;
1567 struct nlattr *tb[NFT_EXPR_MAXATTR + 1];
/*
 * Parse the nested expression attribute @nla into @info.
 *
 * Steps visible here: parse the outer attributes against nft_expr_policy,
 * resolve the type by name for ctx->afi->family (which takes a module
 * reference), then either parse NFTA_EXPR_DATA into info->tb using the
 * type's own policy or zero the first maxattr + 1 slots of info->tb when no
 * data is present. If the type provides select_ops it is called with the
 * parsed attributes to pick the ops. The module_put() at the end releases
 * the type's module reference (presumably on the error path - the label is
 * not shown in this listing).
 */
1570 static int nf_tables_expr_parse(const struct nft_ctx *ctx,
1571 const struct nlattr *nla,
1572 struct nft_expr_info *info)
1574 const struct nft_expr_type *type;
1575 const struct nft_expr_ops *ops;
1576 struct nlattr *tb[NFTA_EXPR_MAX + 1];
1579 err = nla_parse_nested(tb, NFTA_EXPR_MAX, nla, nft_expr_policy);
1583 type = nft_expr_type_get(ctx->afi->family, tb[NFTA_EXPR_NAME]);
1585 return PTR_ERR(type);
1587 if (tb[NFTA_EXPR_DATA]) {
1588 err = nla_parse_nested(info->tb, type->maxattr,
1589 tb[NFTA_EXPR_DATA], type->policy);
1593 memset(info->tb, 0, sizeof(info->tb[0]) * (type->maxattr + 1));
1595 if (type->select_ops != NULL) {
1596 ops = type->select_ops(ctx,
1597 (const struct nlattr * const *)info->tb);
1609 module_put(type->owner);
/*
 * Initialize @expr from previously parsed @info by calling the selected
 * ops' init callback with the parsed attribute table.
 */
1613 static int nf_tables_newexpr(const struct nft_ctx *ctx,
1614 const struct nft_expr_info *info,
1615 struct nft_expr *expr)
1617 const struct nft_expr_ops *ops = info->ops;
1622 err = ops->init(ctx, expr, (const struct nlattr **)info->tb);
/*
 * Tear down an expression: invoke the optional destroy callback, then drop
 * the module reference held on the expression type's owner.
 */
1634 static void nf_tables_expr_destroy(const struct nft_ctx *ctx,
1635 struct nft_expr *expr)
1637 if (expr->ops->destroy)
1638 expr->ops->destroy(ctx, expr);
1639 module_put(expr->ops->type->owner);
/*
 * Allocate and initialize a standalone expression from attribute @nla.
 * The attribute is parsed with nf_tables_expr_parse(), the expression is
 * allocated zeroed with the size given by the selected ops, and then
 * initialized via nf_tables_newexpr(). The visible failure path drops the
 * type's module reference and returns ERR_PTR(err).
 */
1642 struct nft_expr *nft_expr_init(const struct nft_ctx *ctx,
1643 const struct nlattr *nla)
1645 struct nft_expr_info info;
1646 struct nft_expr *expr;
1649 err = nf_tables_expr_parse(ctx, nla, &info);
1654 expr = kzalloc(info.ops->size, GFP_KERNEL);
1658 err = nf_tables_newexpr(ctx, &info, expr);
1664 module_put(info.ops->type->owner);
1666 return ERR_PTR(err);
/*
 * Public counterpart of nf_tables_expr_destroy(): runs the expression's
 * teardown. Any further cleanup (e.g. freeing @expr) is not shown in this
 * listing.
 */
1669 void nft_expr_destroy(const struct nft_ctx *ctx, struct nft_expr *expr)
1671 nf_tables_expr_destroy(ctx, expr);
/*
 * Find the rule in @chain whose handle equals the requested handle.
 * Returns ERR_PTR(-ENOENT) when no rule in the chain matches.
 */
1679 static struct nft_rule *__nf_tables_rule_lookup(const struct nft_chain *chain,
1682 struct nft_rule *rule;
1684 // FIXME: linear scan over every rule in the chain for each lookup
1685 list_for_each_entry(rule, &chain->rules, list) {
1686 if (handle == rule->handle)
1690 return ERR_PTR(-ENOENT);
/*
 * Look up a rule by the handle carried in netlink attribute @nla.
 * The attribute holds a big-endian 64-bit handle, converted to CPU order
 * before the lookup. ERR_PTR(-EINVAL) is returned by an early guard whose
 * condition is not shown in this listing (presumably a missing attribute).
 */
1693 static struct nft_rule *nf_tables_rule_lookup(const struct nft_chain *chain,
1694 const struct nlattr *nla)
1697 return ERR_PTR(-EINVAL);
1699 return __nf_tables_rule_lookup(chain, be64_to_cpu(nla_get_be64(nla)));
/*
 * Netlink attribute policy for rule messages. The chain name is bounded to
 * NFT_CHAIN_MAXNAMELEN - 1 bytes and user data to NFT_USERDATA_MAXLEN bytes;
 * handle and position are 64-bit values; expressions and compat data are
 * nested attributes.
 */
1702 static const struct nla_policy nft_rule_policy[NFTA_RULE_MAX + 1] = {
1703 [NFTA_RULE_TABLE] = { .type = NLA_STRING },
1704 [NFTA_RULE_CHAIN] = { .type = NLA_STRING,
1705 .len = NFT_CHAIN_MAXNAMELEN - 1 },
1706 [NFTA_RULE_HANDLE] = { .type = NLA_U64 },
1707 [NFTA_RULE_EXPRESSIONS] = { .type = NLA_NESTED },
1708 [NFTA_RULE_COMPAT] = { .type = NLA_NESTED },
1709 [NFTA_RULE_POSITION] = { .type = NLA_U64 },
1710 [NFTA_RULE_USERDATA] = { .type = NLA_BINARY,
1711 .len = NFT_USERDATA_MAXLEN },
/*
 * Build one rule message in @skb.
 *
 * The netlink message type is @event combined with the nftables subsystem
 * id in the upper byte. The nfgenmsg header carries @family, NFNETLINK_V0
 * and the low 16 bits of the per-netns base sequence. The payload contains
 * the table name, chain name and rule handle (big-endian), followed by:
 *   - NFTA_RULE_POSITION with the handle of the preceding rule, emitted
 *     only for events other than NFT_MSG_DELRULE and only when the rule is
 *     not the first entry of the chain;
 *   - a nested NFTA_RULE_EXPRESSIONS list with one NFTA_LIST_ELEM per
 *     expression;
 *   - NFTA_RULE_USERDATA, under a condition not shown in this listing.
 * On success the message is finalized with nlmsg_end(); the failure label
 * trims the partially built message with nlmsg_trim().
 */
1714 static int nf_tables_fill_rule_info(struct sk_buff *skb, struct net *net,
1715 u32 portid, u32 seq, int event,
1716 u32 flags, int family,
1717 const struct nft_table *table,
1718 const struct nft_chain *chain,
1719 const struct nft_rule *rule)
1721 struct nlmsghdr *nlh;
1722 struct nfgenmsg *nfmsg;
1723 const struct nft_expr *expr, *next;
1724 struct nlattr *list;
1725 const struct nft_rule *prule;
1726 int type = event | NFNL_SUBSYS_NFTABLES << 8;
1728 nlh = nlmsg_put(skb, portid, seq, type, sizeof(struct nfgenmsg),
1731 goto nla_put_failure;
1733 nfmsg = nlmsg_data(nlh);
1734 nfmsg->nfgen_family = family;
1735 nfmsg->version = NFNETLINK_V0;
1736 nfmsg->res_id = htons(net->nft.base_seq & 0xffff);
1738 if (nla_put_string(skb, NFTA_RULE_TABLE, table->name))
1739 goto nla_put_failure;
1740 if (nla_put_string(skb, NFTA_RULE_CHAIN, chain->name))
1741 goto nla_put_failure;
1742 if (nla_put_be64(skb, NFTA_RULE_HANDLE, cpu_to_be64(rule->handle)))
1743 goto nla_put_failure;
/* rule->list.prev == &chain->rules means this rule is first in the chain. */
1745 if ((event != NFT_MSG_DELRULE) && (rule->list.prev != &chain->rules)) {
1746 prule = list_entry(rule->list.prev, struct nft_rule, list);
1747 if (nla_put_be64(skb, NFTA_RULE_POSITION,
1748 cpu_to_be64(prule->handle)))
1749 goto nla_put_failure;
1752 list = nla_nest_start(skb, NFTA_RULE_EXPRESSIONS);
1754 goto nla_put_failure;
1755 nft_rule_for_each_expr(expr, next, rule) {
1756 if (nft_expr_dump(skb, NFTA_LIST_ELEM, expr) < 0)
1757 goto nla_put_failure;
1759 nla_nest_end(skb, list);
/* udata->len is stored as (length - 1), hence the + 1 when emitting. */
1762 struct nft_userdata *udata = nft_userdata(rule);
1763 if (nla_put(skb, NFTA_RULE_USERDATA, udata->len + 1,
1765 goto nla_put_failure;
1768 nlmsg_end(skb, nlh);
1772 nlmsg_trim(skb, nlh);
/*
 * Send a rule event notification to the NFNLGRP_NFTABLES multicast group.
 * A check involving nfnetlink_has_listeners() precedes the work (the full
 * condition is not shown in this listing). The message is allocated with
 * nlmsg_new(NLMSG_GOODSIZE, GFP_KERNEL), filled by
 * nf_tables_fill_rule_info() and sent with nfnetlink_send(); the trailing
 * nfnetlink_set_err() call reports an error to the group (presumably on
 * the failure path - confirm).
 */
1776 static int nf_tables_rule_notify(const struct nft_ctx *ctx,
1777 const struct nft_rule *rule,
1780 struct sk_buff *skb;
1784 !nfnetlink_has_listeners(ctx->net, NFNLGRP_NFTABLES))
1788 skb = nlmsg_new(NLMSG_GOODSIZE, GFP_KERNEL);
1792 err = nf_tables_fill_rule_info(skb, ctx->net, ctx->portid, ctx->seq,
1793 event, 0, ctx->afi->family, ctx->table,
1800 err = nfnetlink_send(skb, ctx->net, ctx->portid, NFNLGRP_NFTABLES,
1801 ctx->report, GFP_KERNEL);
1804 nfnetlink_set_err(ctx->net, ctx->portid, NFNLGRP_NFTABLES,
/*
 * Netlink dump callback that emits every active rule.
 *
 * Iterates, with the RCU list iterators, over address families (optionally
 * filtered by the family in the request header), their tables, chains and
 * rules. Rules failing nft_rule_is_active() are filtered. cb->args[0]
 * holds the resume index (s_idx); cb->args[1..] are cleared before filling
 * an entry. cb->seq is set from the per-netns base sequence and
 * nl_dump_check_consistent() is called for each emitted message.
 * NOTE(review): the RCU read-side locking and the idx bookkeeping lines are
 * not shown in this listing.
 */
1810 static int nf_tables_dump_rules(struct sk_buff *skb,
1811 struct netlink_callback *cb)
1813 const struct nfgenmsg *nfmsg = nlmsg_data(cb->nlh);
1814 const struct nft_af_info *afi;
1815 const struct nft_table *table;
1816 const struct nft_chain *chain;
1817 const struct nft_rule *rule;
1818 unsigned int idx = 0, s_idx = cb->args[0];
1819 struct net *net = sock_net(skb->sk);
1820 int family = nfmsg->nfgen_family;
1823 cb->seq = net->nft.base_seq;
1825 list_for_each_entry_rcu(afi, &net->nft.af_info, list) {
1826 if (family != NFPROTO_UNSPEC && family != afi->family)
1829 list_for_each_entry_rcu(table, &afi->tables, list) {
1830 list_for_each_entry_rcu(chain, &table->chains, list) {
1831 list_for_each_entry_rcu(rule, &chain->rules, list) {
1832 if (!nft_rule_is_active(net, rule))
1837 memset(&cb->args[1], 0,
1838 sizeof(cb->args) - sizeof(cb->args[0]));
1839 if (nf_tables_fill_rule_info(skb, net, NETLINK_CB(cb->skb).portid,
1842 NLM_F_MULTI | NLM_F_APPEND,
1843 afi->family, table, chain, rule) < 0)
1846 nl_dump_check_consistent(cb, nlmsg_hdr(skb));
/*
 * NFT_MSG_GETRULE handler.
 *
 * With NLM_F_DUMP set, starts a netlink dump driven by
 * nf_tables_dump_rules(). Otherwise resolves family -> table -> chain ->
 * rule from the request attributes (tables and chains carrying the
 * INACTIVE flag are tested explicitly; the action taken is not shown in
 * this listing), builds a NFT_MSG_NEWRULE message for the rule in a freshly
 * allocated skb and unicasts it back to the requesting port id.
 */
1860 static int nf_tables_getrule(struct sock *nlsk, struct sk_buff *skb,
1861 const struct nlmsghdr *nlh,
1862 const struct nlattr * const nla[])
1864 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
1865 const struct nft_af_info *afi;
1866 const struct nft_table *table;
1867 const struct nft_chain *chain;
1868 const struct nft_rule *rule;
1869 struct sk_buff *skb2;
1870 struct net *net = sock_net(skb->sk);
1871 int family = nfmsg->nfgen_family;
1874 if (nlh->nlmsg_flags & NLM_F_DUMP) {
1875 struct netlink_dump_control c = {
1876 .dump = nf_tables_dump_rules,
1878 return netlink_dump_start(nlsk, skb, nlh, &c);
/* Lookup only: autoload is disabled (false) for GET requests. */
1881 afi = nf_tables_afinfo_lookup(net, family, false);
1883 return PTR_ERR(afi);
1885 table = nf_tables_table_lookup(afi, nla[NFTA_RULE_TABLE]);
1887 return PTR_ERR(table);
1888 if (table->flags & NFT_TABLE_INACTIVE)
1891 chain = nf_tables_chain_lookup(table, nla[NFTA_RULE_CHAIN]);
1893 return PTR_ERR(chain);
1894 if (chain->flags & NFT_CHAIN_INACTIVE)
1897 rule = nf_tables_rule_lookup(chain, nla[NFTA_RULE_HANDLE]);
1899 return PTR_ERR(rule);
1901 skb2 = alloc_skb(NLMSG_GOODSIZE, GFP_KERNEL);
1905 err = nf_tables_fill_rule_info(skb2, net, NETLINK_CB(skb).portid,
1906 nlh->nlmsg_seq, NFT_MSG_NEWRULE, 0,
1907 family, table, chain, rule);
1911 return nlmsg_unicast(nlsk, skb2, NETLINK_CB(skb).portid);
/*
 * Destroy the expressions of @rule, walking from nft_expr_first() until
 * nft_expr_last() is reached. The loop also stops at the first expression
 * whose ops pointer is NULL, which covers partially initialized rules.
 * Freeing of the rule itself is not shown in this listing.
 */
1918 static void nf_tables_rule_destroy(const struct nft_ctx *ctx,
1919 struct nft_rule *rule)
1921 struct nft_expr *expr;
1924 * Careful: some expressions might not be initialized in case this
1925 * is called on error from nf_tables_newrule().
1927 expr = nft_expr_first(rule);
1928 while (expr->ops && expr != nft_expr_last(rule)) {
1929 nf_tables_expr_destroy(ctx, expr);
1930 expr = nft_expr_next(expr);
/*
 * Maximum number of expressions accepted in a single rule; checked by
 * nf_tables_newrule() while parsing. 'info' is the file-scope scratch array
 * that nf_tables_newrule() indexes as info[n] for parsed expressions.
 * NOTE(review): where 'info' is allocated is not visible here; it is shared
 * state, so callers presumably rely on the nfnl lock - confirm.
 */
1935 #define NFT_RULE_MAXEXPRS 128
1937 static struct nft_expr_info *info;
/*
 * NFT_MSG_NEWRULE handler: create a rule, or replace an existing one.
 *
 * Visible flow:
 *   1. Resolve family (autoload allowed only with NLM_F_CREATE), table and
 *      chain.
 *   2. If NFTA_RULE_HANDLE is given, look up the existing rule and test
 *      NLM_F_EXCL / NLM_F_REPLACE; otherwise test create/replace flags,
 *      allocate a fresh handle and test chain->use against UINT_MAX. The
 *      outcomes of these tests are not shown in this listing.
 *   3. If NFTA_RULE_POSITION is given (tested together with NLM_F_CREATE),
 *      look up the rule to insert relative to.
 *   4. Parse each NFTA_LIST_ELEM expression into the shared info[] array,
 *      bounded by NFT_RULE_MAXEXPRS, accumulating the total expression size,
 *      which is then tested against 1 << 12.
 *   5. Allocate the rule with room for expressions and optional user data,
 *      activate it for the next generation, and initialize each expression.
 *   6. For NLM_F_REPLACE, queue a DELRULE transaction for the old rule and
 *      deactivate it; otherwise link the new rule at the position selected
 *      by NLM_F_APPEND / NFTA_RULE_POSITION.
 *   7. Queue the NEWRULE transaction.
 * The trailing statements are the unwind path: unlink the rule, destroy it,
 * and drop module references for every parsed expression.
 */
1939 static int nf_tables_newrule(struct sock *nlsk, struct sk_buff *skb,
1940 const struct nlmsghdr *nlh,
1941 const struct nlattr * const nla[])
1943 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
1944 struct nft_af_info *afi;
1945 struct net *net = sock_net(skb->sk);
1946 struct nft_table *table;
1947 struct nft_chain *chain;
1948 struct nft_rule *rule, *old_rule = NULL;
1949 struct nft_userdata *udata;
1950 struct nft_trans *trans = NULL;
1951 struct nft_expr *expr;
1954 unsigned int size, i, n, ulen = 0, usize = 0;
1957 u64 handle, pos_handle;
1959 create = nlh->nlmsg_flags & NLM_F_CREATE ? true : false;
1961 afi = nf_tables_afinfo_lookup(net, nfmsg->nfgen_family, create);
1963 return PTR_ERR(afi);
1965 table = nf_tables_table_lookup(afi, nla[NFTA_RULE_TABLE]);
1967 return PTR_ERR(table);
1969 chain = nf_tables_chain_lookup(table, nla[NFTA_RULE_CHAIN]);
1971 return PTR_ERR(chain);
1973 if (nla[NFTA_RULE_HANDLE]) {
1974 handle = be64_to_cpu(nla_get_be64(nla[NFTA_RULE_HANDLE]));
1975 rule = __nf_tables_rule_lookup(chain, handle);
1977 return PTR_ERR(rule);
1979 if (nlh->nlmsg_flags & NLM_F_EXCL)
1981 if (nlh->nlmsg_flags & NLM_F_REPLACE)
1986 if (!create || nlh->nlmsg_flags & NLM_F_REPLACE)
1988 handle = nf_tables_alloc_handle(table);
1990 if (chain->use == UINT_MAX)
1994 if (nla[NFTA_RULE_POSITION]) {
1995 if (!(nlh->nlmsg_flags & NLM_F_CREATE))
1998 pos_handle = be64_to_cpu(nla_get_be64(nla[NFTA_RULE_POSITION]));
1999 old_rule = __nf_tables_rule_lookup(chain, pos_handle);
2000 if (IS_ERR(old_rule))
2001 return PTR_ERR(old_rule);
2004 nft_ctx_init(&ctx, skb, nlh, afi, table, chain, nla);
2008 if (nla[NFTA_RULE_EXPRESSIONS]) {
2009 nla_for_each_nested(tmp, nla[NFTA_RULE_EXPRESSIONS], rem) {
2011 if (nla_type(tmp) != NFTA_LIST_ELEM)
2013 if (n == NFT_RULE_MAXEXPRS)
2015 err = nf_tables_expr_parse(&ctx, tmp, &info[n]);
2018 size += info[n].ops->size;
2022 /* Check for overflow of dlen field */
2024 if (size >= 1 << 12)
2027 if (nla[NFTA_RULE_USERDATA]) {
2028 ulen = nla_len(nla[NFTA_RULE_USERDATA]);
2030 usize = sizeof(struct nft_userdata) + ulen;
2034 rule = kzalloc(sizeof(*rule) + size + usize, GFP_KERNEL);
2038 nft_rule_activate_next(net, rule);
2040 rule->handle = handle;
2042 rule->udata = ulen ? 1 : 0;
/* Length is stored minus one; nf_tables_fill_rule_info() emits len + 1. */
2045 udata = nft_userdata(rule);
2046 udata->len = ulen - 1;
2047 nla_memcpy(udata->data, nla[NFTA_RULE_USERDATA], ulen);
2050 expr = nft_expr_first(rule);
2051 for (i = 0; i < n; i++) {
2052 err = nf_tables_newexpr(&ctx, &info[i], expr);
2056 expr = nft_expr_next(expr);
2059 if (nlh->nlmsg_flags & NLM_F_REPLACE) {
2060 if (nft_rule_is_active_next(net, old_rule)) {
2061 trans = nft_trans_rule_add(&ctx, NFT_MSG_DELRULE,
2063 if (trans == NULL) {
2067 nft_rule_deactivate_next(net, old_rule);
2069 list_add_tail_rcu(&rule->list, &old_rule->list);
2074 } else if (nlh->nlmsg_flags & NLM_F_APPEND)
2076 list_add_rcu(&rule->list, &old_rule->list);
2078 list_add_tail_rcu(&rule->list, &chain->rules);
2081 list_add_tail_rcu(&rule->list, &old_rule->list);
2083 list_add_rcu(&rule->list, &chain->rules);
2086 if (nft_trans_rule_add(&ctx, NFT_MSG_NEWRULE, rule) == NULL) {
2094 list_del_rcu(&rule->list);
2096 nf_tables_rule_destroy(&ctx, rule);
2098 for (i = 0; i < n; i++) {
2099 if (info[i].ops != NULL)
2100 module_put(info[i].ops->type->owner);
/*
 * NFT_MSG_DELRULE handler.
 *
 * Resolves family and table (the table's INACTIVE flag is tested) and
 * optionally the chain. Three deletion forms are visible:
 *   - a handle is given: delete that single rule via nft_delrule();
 *   - no handle: delete by chain via nft_delrule_by_chain();
 *   - iterate over every chain in the table, calling
 *     nft_delrule_by_chain() for each (presumably when no chain attribute
 *     was supplied - the branching lines are not shown in this listing).
 */
2105 static int nf_tables_delrule(struct sock *nlsk, struct sk_buff *skb,
2106 const struct nlmsghdr *nlh,
2107 const struct nlattr * const nla[])
2109 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
2110 struct nft_af_info *afi;
2111 struct net *net = sock_net(skb->sk);
2112 struct nft_table *table;
2113 struct nft_chain *chain = NULL;
2114 struct nft_rule *rule;
2115 int family = nfmsg->nfgen_family, err = 0;
2118 afi = nf_tables_afinfo_lookup(net, family, false);
2120 return PTR_ERR(afi);
2122 table = nf_tables_table_lookup(afi, nla[NFTA_RULE_TABLE]);
2124 return PTR_ERR(table);
2125 if (table->flags & NFT_TABLE_INACTIVE)
2128 if (nla[NFTA_RULE_CHAIN]) {
2129 chain = nf_tables_chain_lookup(table, nla[NFTA_RULE_CHAIN]);
2131 return PTR_ERR(chain);
2134 nft_ctx_init(&ctx, skb, nlh, afi, table, chain, nla);
2137 if (nla[NFTA_RULE_HANDLE]) {
2138 rule = nf_tables_rule_lookup(chain,
2139 nla[NFTA_RULE_HANDLE]);
2141 return PTR_ERR(rule);
2143 err = nft_delrule(&ctx, rule);
2145 err = nft_delrule_by_chain(&ctx);
2148 list_for_each_entry(chain, &table->chains, list) {
2150 err = nft_delrule_by_chain(&ctx);
/* List of registered set implementations (struct nft_set_ops). */
2163 static LIST_HEAD(nf_tables_set_ops);
/*
 * Register a set implementation by appending @ops to nf_tables_set_ops
 * with list_add_tail_rcu() under the NFNL_SUBSYS_NFTABLES nfnetlink lock.
 * Exported GPL-only.
 */
2165 int nft_register_set(struct nft_set_ops *ops)
2167 nfnl_lock(NFNL_SUBSYS_NFTABLES);
2168 list_add_tail_rcu(&ops->list, &nf_tables_set_ops);
2169 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
2172 EXPORT_SYMBOL_GPL(nft_register_set);
/*
 * Unregister a set implementation: unlink @ops with list_del_rcu() under
 * the NFNL_SUBSYS_NFTABLES nfnetlink lock. Exported GPL-only.
 */
2174 void nft_unregister_set(struct nft_set_ops *ops)
2176 nfnl_lock(NFNL_SUBSYS_NFTABLES);
2177 list_del_rcu(&ops->list);
2178 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
2180 EXPORT_SYMBOL_GPL(nft_unregister_set);
2183 * Select a set implementation based on the data characteristics and the
2184 * given policy. The total memory use might not be known if no size is
2185 * given, in that case the amount of memory per element is used.
/*
 * Pick the best registered set implementation for the requested features.
 *
 * With CONFIG_MODULES, an empty registry triggers request_module("nft-set")
 * with the nfnl lock dropped; if implementations appear, ERR_PTR(-EAGAIN)
 * is returned. The required feature mask is taken from NFTA_SET_FLAGS,
 * restricted to INTERVAL | MAP | TIMEOUT. Each candidate must provide all
 * required features and a successful estimate(). Candidates are compared
 * against the current best according to @policy:
 *   - NFT_SET_POL_PERFORMANCE: lower class first, then smaller size;
 *   - NFT_SET_POL_MEMORY: smaller size first, then lower class.
 * A module reference is taken on a candidate via try_module_get() and the
 * previous best's reference is released with module_put(). Returns
 * ERR_PTR(-EOPNOTSUPP) on the final fall-through (presumably when no
 * candidate qualified).
 */
2187 static const struct nft_set_ops *
2188 nft_select_set_ops(const struct nlattr * const nla[],
2189 const struct nft_set_desc *desc,
2190 enum nft_set_policies policy)
2192 const struct nft_set_ops *ops, *bops;
2193 struct nft_set_estimate est, best;
2196 #ifdef CONFIG_MODULES
2197 if (list_empty(&nf_tables_set_ops)) {
2198 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
2199 request_module("nft-set");
2200 nfnl_lock(NFNL_SUBSYS_NFTABLES);
2201 if (!list_empty(&nf_tables_set_ops))
2202 return ERR_PTR(-EAGAIN);
2206 if (nla[NFTA_SET_FLAGS] != NULL) {
2207 features = ntohl(nla_get_be32(nla[NFTA_SET_FLAGS]));
2208 features &= NFT_SET_INTERVAL | NFT_SET_MAP | NFT_SET_TIMEOUT;
2215 list_for_each_entry(ops, &nf_tables_set_ops, list) {
2216 if ((ops->features & features) != features)
2218 if (!ops->estimate(desc, features, &est))
2222 case NFT_SET_POL_PERFORMANCE:
2223 if (est.class < best.class)
2225 if (est.class == best.class && est.size < best.size)
2228 case NFT_SET_POL_MEMORY:
2229 if (est.size < best.size)
2231 if (est.size == best.size && est.class < best.class)
2238 if (!try_module_get(ops->owner))
2241 module_put(bops->owner);
2250 return ERR_PTR(-EOPNOTSUPP);
/*
 * Netlink attribute policy for set messages. The set name is limited to
 * IFNAMSIZ - 1 bytes; the timeout is a 64-bit value; the description is a
 * nested attribute; the remaining numeric attributes are 32-bit.
 */
2253 static const struct nla_policy nft_set_policy[NFTA_SET_MAX + 1] = {
2254 [NFTA_SET_TABLE] = { .type = NLA_STRING },
2255 [NFTA_SET_NAME] = { .type = NLA_STRING,
2256 .len = IFNAMSIZ - 1 },
2257 [NFTA_SET_FLAGS] = { .type = NLA_U32 },
2258 [NFTA_SET_KEY_TYPE] = { .type = NLA_U32 },
2259 [NFTA_SET_KEY_LEN] = { .type = NLA_U32 },
2260 [NFTA_SET_DATA_TYPE] = { .type = NLA_U32 },
2261 [NFTA_SET_DATA_LEN] = { .type = NLA_U32 },
2262 [NFTA_SET_POLICY] = { .type = NLA_U32 },
2263 [NFTA_SET_DESC] = { .type = NLA_NESTED },
2264 [NFTA_SET_ID] = { .type = NLA_U32 },
2265 [NFTA_SET_TIMEOUT] = { .type = NLA_U64 },
2266 [NFTA_SET_GC_INTERVAL] = { .type = NLA_U32 },
/* Policy for the nested set description: only a 32-bit size is defined. */
2269 static const struct nla_policy nft_set_desc_policy[NFTA_SET_DESC_MAX + 1] = {
2270 [NFTA_SET_DESC_SIZE] = { .type = NLA_U32 },
/*
 * Initialize @ctx from the attributes of a set request.
 *
 * The address family is looked up (without autoload) only when the request
 * family is not NFPROTO_UNSPEC. When a table attribute is present, the
 * table is looked up and its INACTIVE flag tested; -EAFNOSUPPORT is
 * returned by a guard in that branch (its condition is not shown in this
 * listing; presumably a table was given without a family). Both afi and
 * table may therefore remain NULL in the resulting context, and the chain
 * is always NULL.
 */
2273 static int nft_ctx_init_from_setattr(struct nft_ctx *ctx,
2274 const struct sk_buff *skb,
2275 const struct nlmsghdr *nlh,
2276 const struct nlattr * const nla[])
2278 struct net *net = sock_net(skb->sk);
2279 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
2280 struct nft_af_info *afi = NULL;
2281 struct nft_table *table = NULL;
2283 if (nfmsg->nfgen_family != NFPROTO_UNSPEC) {
2284 afi = nf_tables_afinfo_lookup(net, nfmsg->nfgen_family, false);
2286 return PTR_ERR(afi);
2289 if (nla[NFTA_SET_TABLE] != NULL) {
2291 return -EAFNOSUPPORT;
2293 table = nf_tables_table_lookup(afi, nla[NFTA_SET_TABLE]);
2295 return PTR_ERR(table);
2296 if (table->flags & NFT_TABLE_INACTIVE)
2300 nft_ctx_init(ctx, skb, nlh, afi, table, NULL, nla);
/*
 * Find a set in @table by the name carried in attribute @nla.
 * Returns ERR_PTR(-ENOENT) when no set name matches. An early guard
 * returns ERR_PTR(-EINVAL); its condition is not shown in this listing
 * (presumably a missing attribute).
 */
2304 struct nft_set *nf_tables_set_lookup(const struct nft_table *table,
2305 const struct nlattr *nla)
2307 struct nft_set *set;
2310 return ERR_PTR(-EINVAL);
2312 list_for_each_entry(set, &table->sets, list) {
2313 if (!nla_strcmp(nla, set->name))
2316 return ERR_PTR(-ENOENT);
/*
 * Find a set that is being created in the current batch by its
 * transaction id. Scans the per-netns commit list for an NFT_MSG_NEWSET
 * transaction whose set id equals the big-endian 32-bit id in @nla.
 * Returns the transaction's set, or ERR_PTR(-ENOENT) if none matches.
 */
2319 struct nft_set *nf_tables_set_lookup_byid(const struct net *net,
2320 const struct nlattr *nla)
2322 struct nft_trans *trans;
2323 u32 id = ntohl(nla_get_be32(nla));
2325 list_for_each_entry(trans, &net->nft.commit_list, list) {
2326 if (trans->msg_type == NFT_MSG_NEWSET &&
2327 id == nft_trans_set_id(trans))
2328 return nft_trans_set(trans);
2330 return ERR_PTR(-ENOENT);
/*
 * Fill in set->name from the template @name.
 *
 * If the template contains '%' (searched within IFNAMSIZ bytes), the
 * conversion is checked to be exactly "%d" with no further '%'. A zeroed
 * page is then used as a bitmap of numbers already taken: every existing
 * set name in the table is matched against the template with sscanf(), and
 * numbers inside the current window [min, min + BITS_PER_BYTE * PAGE_SIZE)
 * are marked. The first clear bit gives the number to use; if the window
 * is full, it is advanced by one page worth of bits and the bitmap cleared
 * (the retry jump is not shown in this listing). The name is then
 * formatted with snprintf() and compared against all existing set names
 * (the result of a match is not shown in this listing).
 */
2333 static int nf_tables_set_alloc_name(struct nft_ctx *ctx, struct nft_set *set,
2336 const struct nft_set *i;
2338 unsigned long *inuse;
2339 unsigned int n = 0, min = 0;
2341 p = strnchr(name, IFNAMSIZ, '%');
2343 if (p[1] != 'd' || strchr(p + 2, '%'))
2346 inuse = (unsigned long *)get_zeroed_page(GFP_KERNEL);
2350 list_for_each_entry(i, &ctx->table->sets, list) {
2353 if (!sscanf(i->name, name, &tmp))
2355 if (tmp < min || tmp >= min + BITS_PER_BYTE * PAGE_SIZE)
2358 set_bit(tmp - min, inuse);
2361 n = find_first_zero_bit(inuse, BITS_PER_BYTE * PAGE_SIZE);
2362 if (n >= BITS_PER_BYTE * PAGE_SIZE) {
2363 min += BITS_PER_BYTE * PAGE_SIZE;
2364 memset(inuse, 0, PAGE_SIZE);
2367 free_page((unsigned long)inuse);
2370 snprintf(set->name, sizeof(set->name), name, min + n);
2371 list_for_each_entry(i, &ctx->table->sets, list) {
2372 if (!strcmp(set->name, i->name))
/*
 * Build one set message in @skb.
 *
 * The message type is @event combined with the nftables subsystem id in
 * the upper byte. The nfgenmsg header carries the context's family,
 * NFNETLINK_V0 and the low 16 bits of the per-netns base sequence.
 * Attributes emitted:
 *   - table name and set name (always);
 *   - flags, only when non-zero;
 *   - key type and key length (always);
 *   - data type and data length, only for maps (NFT_SET_MAP);
 *   - timeout and GC interval, each under a condition not shown in this
 *     listing;
 *   - policy, only when it differs from NFT_SET_POL_PERFORMANCE;
 *   - a nested NFTA_SET_DESC holding the size (the condition guarding the
 *     size attribute is not shown in this listing).
 * The failure label trims the partially built message with nlmsg_trim().
 */
2378 static int nf_tables_fill_set(struct sk_buff *skb, const struct nft_ctx *ctx,
2379 const struct nft_set *set, u16 event, u16 flags)
2381 struct nfgenmsg *nfmsg;
2382 struct nlmsghdr *nlh;
2383 struct nlattr *desc;
2384 u32 portid = ctx->portid;
2387 event |= NFNL_SUBSYS_NFTABLES << 8;
2388 nlh = nlmsg_put(skb, portid, seq, event, sizeof(struct nfgenmsg),
2391 goto nla_put_failure;
2393 nfmsg = nlmsg_data(nlh);
2394 nfmsg->nfgen_family = ctx->afi->family;
2395 nfmsg->version = NFNETLINK_V0;
2396 nfmsg->res_id = htons(ctx->net->nft.base_seq & 0xffff);
2398 if (nla_put_string(skb, NFTA_SET_TABLE, ctx->table->name))
2399 goto nla_put_failure;
2400 if (nla_put_string(skb, NFTA_SET_NAME, set->name))
2401 goto nla_put_failure;
2402 if (set->flags != 0)
2403 if (nla_put_be32(skb, NFTA_SET_FLAGS, htonl(set->flags)))
2404 goto nla_put_failure;
2406 if (nla_put_be32(skb, NFTA_SET_KEY_TYPE, htonl(set->ktype)))
2407 goto nla_put_failure;
2408 if (nla_put_be32(skb, NFTA_SET_KEY_LEN, htonl(set->klen)))
2409 goto nla_put_failure;
2410 if (set->flags & NFT_SET_MAP) {
2411 if (nla_put_be32(skb, NFTA_SET_DATA_TYPE, htonl(set->dtype)))
2412 goto nla_put_failure;
2413 if (nla_put_be32(skb, NFTA_SET_DATA_LEN, htonl(set->dlen)))
2414 goto nla_put_failure;
2418 nla_put_be64(skb, NFTA_SET_TIMEOUT, cpu_to_be64(set->timeout)))
2419 goto nla_put_failure;
2421 nla_put_be32(skb, NFTA_SET_GC_INTERVAL, htonl(set->gc_int)))
2422 goto nla_put_failure;
2424 if (set->policy != NFT_SET_POL_PERFORMANCE) {
2425 if (nla_put_be32(skb, NFTA_SET_POLICY, htonl(set->policy)))
2426 goto nla_put_failure;
2429 desc = nla_nest_start(skb, NFTA_SET_DESC);
2431 goto nla_put_failure;
2433 nla_put_be32(skb, NFTA_SET_DESC_SIZE, htonl(set->size)))
2434 goto nla_put_failure;
2435 nla_nest_end(skb, desc);
2437 nlmsg_end(skb, nlh);
2441 nlmsg_trim(skb, nlh);
/*
 * Send a set event notification to the NFNLGRP_NFTABLES multicast group.
 * The allocation mode is chosen by the caller through @gfp_flags and is
 * used for both the skb allocation and nfnetlink_send(). A check involving
 * nfnetlink_has_listeners() precedes the work (full condition not shown in
 * this listing). The trailing nfnetlink_set_err() reports @err to the group
 * (presumably on the failure path - confirm).
 */
2445 static int nf_tables_set_notify(const struct nft_ctx *ctx,
2446 const struct nft_set *set,
2447 int event, gfp_t gfp_flags)
2449 struct sk_buff *skb;
2450 u32 portid = ctx->portid;
2454 !nfnetlink_has_listeners(ctx->net, NFNLGRP_NFTABLES))
2458 skb = nlmsg_new(NLMSG_GOODSIZE, gfp_flags);
2462 err = nf_tables_fill_set(skb, ctx, set, event, 0);
2468 err = nfnetlink_send(skb, ctx->net, portid, NFNLGRP_NFTABLES,
2469 ctx->report, gfp_flags);
2472 nfnetlink_set_err(ctx->net, portid, NFNLGRP_NFTABLES, err);
/*
 * Netlink dump callback that emits sets.
 *
 * The filter context comes from cb->data: when ctx->afi or ctx->table is
 * set, only that family/table is considered. Resume state is kept in the
 * callback args: args[0] is the set index, args[2] the table pointer and
 * args[3] the family at which the previous pass stopped; families and
 * tables are compared against those saved values while iterating. Each
 * set is serialized through a per-table copy of the context (ctx_set) by
 * nf_tables_fill_set(). nl_dump_check_consistent() is called against
 * cb->seq, which is set from the per-netns base sequence.
 * NOTE(review): the RCU read-side locking and the idx bookkeeping lines are
 * not shown in this listing.
 */
2476 static int nf_tables_dump_sets(struct sk_buff *skb, struct netlink_callback *cb)
2478 const struct nft_set *set;
2479 unsigned int idx, s_idx = cb->args[0];
2480 struct nft_af_info *afi;
2481 struct nft_table *table, *cur_table = (struct nft_table *)cb->args[2];
2482 struct net *net = sock_net(skb->sk);
2483 int cur_family = cb->args[3];
2484 struct nft_ctx *ctx = cb->data, ctx_set;
2490 cb->seq = net->nft.base_seq;
2492 list_for_each_entry_rcu(afi, &net->nft.af_info, list) {
2493 if (ctx->afi && ctx->afi != afi)
2497 if (afi->family != cur_family)
2502 list_for_each_entry_rcu(table, &afi->tables, list) {
2503 if (ctx->table && ctx->table != table)
2507 if (cur_table != table)
2513 list_for_each_entry_rcu(set, &table->sets, list) {
2518 ctx_set.table = table;
2520 if (nf_tables_fill_set(skb, &ctx_set, set,
2524 cb->args[2] = (unsigned long) table;
2525 cb->args[3] = afi->family;
2528 nl_dump_check_consistent(cb, nlmsg_hdr(skb));
/*
 * Dump completion callback registered as .done by nf_tables_getset().
 * NOTE(review): the body is not shown in this listing; presumably it frees
 * the context allocated by nf_tables_getset() - confirm.
 */
2542 static int nf_tables_dump_sets_done(struct netlink_callback *cb)
/*
 * NFT_MSG_GETSET handler.
 *
 * The context is always initialized from the request attributes first, so
 * a nonexistent family/table is rejected before a dump starts. With
 * NLM_F_DUMP, a heap copy of the context is allocated for the dump
 * callbacks (how it is attached to the dump control is not shown in this
 * listing) and the dump is started. Without NLM_F_DUMP, NFPROTO_UNSPEC is
 * rejected with -EAFNOSUPPORT, the set is looked up by name (its INACTIVE
 * flag is tested), and a NFT_MSG_NEWSET message describing it is unicast
 * back to the requesting port id.
 */
2548 static int nf_tables_getset(struct sock *nlsk, struct sk_buff *skb,
2549 const struct nlmsghdr *nlh,
2550 const struct nlattr * const nla[])
2552 const struct nft_set *set;
2554 struct sk_buff *skb2;
2555 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
2558 /* Verify existence before starting dump */
2559 err = nft_ctx_init_from_setattr(&ctx, skb, nlh, nla);
2563 if (nlh->nlmsg_flags & NLM_F_DUMP) {
2564 struct netlink_dump_control c = {
2565 .dump = nf_tables_dump_sets,
2566 .done = nf_tables_dump_sets_done,
2568 struct nft_ctx *ctx_dump;
2570 ctx_dump = kmalloc(sizeof(*ctx_dump), GFP_KERNEL);
2571 if (ctx_dump == NULL)
2577 return netlink_dump_start(nlsk, skb, nlh, &c);
2580 /* Only accept unspec with dump */
2581 if (nfmsg->nfgen_family == NFPROTO_UNSPEC)
2582 return -EAFNOSUPPORT;
2584 set = nf_tables_set_lookup(ctx.table, nla[NFTA_SET_NAME]);
2586 return PTR_ERR(set);
2587 if (set->flags & NFT_SET_INACTIVE)
2590 skb2 = alloc_skb(NLMSG_GOODSIZE, GFP_KERNEL);
2594 err = nf_tables_fill_set(skb2, &ctx, set, NFT_MSG_NEWSET, 0);
2598 return nlmsg_unicast(nlsk, skb2, NETLINK_CB(skb).portid);
/*
 * Parse the nested NFTA_SET_DESC attribute @nla into @desc.
 * Only NFTA_SET_DESC_SIZE is handled: when present, its big-endian 32-bit
 * value is stored in desc->size; other fields of @desc are left untouched.
 */
2605 static int nf_tables_set_desc_parse(const struct nft_ctx *ctx,
2606 struct nft_set_desc *desc,
2607 const struct nlattr *nla)
2609 struct nlattr *da[NFTA_SET_DESC_MAX + 1];
2612 err = nla_parse_nested(da, NFTA_SET_DESC_MAX, nla, nft_set_desc_policy);
2616 if (da[NFTA_SET_DESC_SIZE] != NULL)
2617 desc->size = ntohl(nla_get_be32(da[NFTA_SET_DESC_SIZE]));
/*
 * NFT_MSG_NEWSET handler: validate the request and create a set.
 *
 * Visible flow:
 *   1. Table, name, key length and set id attributes are tested for
 *      presence together.
 *   2. Key type defaults to NFT_DATA_VALUE; a supplied type is tested
 *      against the reserved mask. Key length is tested for 0 and for
 *      exceeding NFT_DATA_VALUE_MAXLEN.
 *   3. Flags are tested against the known flag set, and MAP and EVAL are
 *      tested for being set together.
 *   4. Data type is examined together with the MAP flag; for non-verdict
 *      data the data length is read and range-tested, for verdicts dlen is
 *      sizeof(struct nft_verdict).
 *   5. Timeout and GC interval are each examined together with
 *      NFT_SET_TIMEOUT.
 *   6. Policy defaults to NFT_SET_POL_PERFORMANCE; an optional description
 *      is parsed into desc.
 *   7. Family (autoload only with NLM_F_CREATE) and table are resolved; an
 *      existing set with the same name is handled according to
 *      NLM_F_EXCL / NLM_F_REPLACE.
 *   8. An implementation is selected, the set is allocated with the
 *      implementation's private size appended, named, initialized, queued
 *      as a NEWSET transaction and linked into the table.
 * The outcomes of the validation tests are not shown in this listing. The
 * trailing module_put() releases the implementation's module reference
 * (presumably on the error path - confirm).
 */
2622 static int nf_tables_newset(struct sock *nlsk, struct sk_buff *skb,
2623 const struct nlmsghdr *nlh,
2624 const struct nlattr * const nla[])
2626 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
2627 const struct nft_set_ops *ops;
2628 struct nft_af_info *afi;
2629 struct net *net = sock_net(skb->sk);
2630 struct nft_table *table;
2631 struct nft_set *set;
2633 char name[IFNAMSIZ];
2637 u32 ktype, dtype, flags, policy, gc_int;
2638 struct nft_set_desc desc;
2641 if (nla[NFTA_SET_TABLE] == NULL ||
2642 nla[NFTA_SET_NAME] == NULL ||
2643 nla[NFTA_SET_KEY_LEN] == NULL ||
2644 nla[NFTA_SET_ID] == NULL)
2647 memset(&desc, 0, sizeof(desc));
2649 ktype = NFT_DATA_VALUE;
2650 if (nla[NFTA_SET_KEY_TYPE] != NULL) {
2651 ktype = ntohl(nla_get_be32(nla[NFTA_SET_KEY_TYPE]));
2652 if ((ktype & NFT_DATA_RESERVED_MASK) == NFT_DATA_RESERVED_MASK)
2656 desc.klen = ntohl(nla_get_be32(nla[NFTA_SET_KEY_LEN]));
2657 if (desc.klen == 0 || desc.klen > NFT_DATA_VALUE_MAXLEN)
2661 if (nla[NFTA_SET_FLAGS] != NULL) {
2662 flags = ntohl(nla_get_be32(nla[NFTA_SET_FLAGS]));
2663 if (flags & ~(NFT_SET_ANONYMOUS | NFT_SET_CONSTANT |
2664 NFT_SET_INTERVAL | NFT_SET_TIMEOUT |
2665 NFT_SET_MAP | NFT_SET_EVAL))
2667 /* Only one of both operations is supported */
2668 if ((flags & (NFT_SET_MAP | NFT_SET_EVAL)) ==
2669 (NFT_SET_MAP | NFT_SET_EVAL))
2674 if (nla[NFTA_SET_DATA_TYPE] != NULL) {
2675 if (!(flags & NFT_SET_MAP))
2678 dtype = ntohl(nla_get_be32(nla[NFTA_SET_DATA_TYPE]));
2679 if ((dtype & NFT_DATA_RESERVED_MASK) == NFT_DATA_RESERVED_MASK &&
2680 dtype != NFT_DATA_VERDICT)
2683 if (dtype != NFT_DATA_VERDICT) {
2684 if (nla[NFTA_SET_DATA_LEN] == NULL)
2686 desc.dlen = ntohl(nla_get_be32(nla[NFTA_SET_DATA_LEN]));
2687 if (desc.dlen == 0 || desc.dlen > NFT_DATA_VALUE_MAXLEN)
2690 desc.dlen = sizeof(struct nft_verdict);
2691 } else if (flags & NFT_SET_MAP)
2695 if (nla[NFTA_SET_TIMEOUT] != NULL) {
2696 if (!(flags & NFT_SET_TIMEOUT))
2698 timeout = be64_to_cpu(nla_get_be64(nla[NFTA_SET_TIMEOUT]));
2701 if (nla[NFTA_SET_GC_INTERVAL] != NULL) {
2702 if (!(flags & NFT_SET_TIMEOUT))
2704 gc_int = ntohl(nla_get_be32(nla[NFTA_SET_GC_INTERVAL]));
2707 policy = NFT_SET_POL_PERFORMANCE;
2708 if (nla[NFTA_SET_POLICY] != NULL)
2709 policy = ntohl(nla_get_be32(nla[NFTA_SET_POLICY]));
2711 if (nla[NFTA_SET_DESC] != NULL) {
2712 err = nf_tables_set_desc_parse(&ctx, &desc, nla[NFTA_SET_DESC]);
2717 create = nlh->nlmsg_flags & NLM_F_CREATE ? true : false;
2719 afi = nf_tables_afinfo_lookup(net, nfmsg->nfgen_family, create);
2721 return PTR_ERR(afi);
2723 table = nf_tables_table_lookup(afi, nla[NFTA_SET_TABLE]);
2725 return PTR_ERR(table);
2727 nft_ctx_init(&ctx, skb, nlh, afi, table, NULL, nla);
2729 set = nf_tables_set_lookup(table, nla[NFTA_SET_NAME]);
/* -ENOENT just means the name is free; any other error is fatal. */
2731 if (PTR_ERR(set) != -ENOENT)
2732 return PTR_ERR(set);
2737 if (nlh->nlmsg_flags & NLM_F_EXCL)
2739 if (nlh->nlmsg_flags & NLM_F_REPLACE)
2744 if (!(nlh->nlmsg_flags & NLM_F_CREATE))
2747 ops = nft_select_set_ops(nla, &desc, policy);
2749 return PTR_ERR(ops);
2752 if (ops->privsize != NULL)
2753 size = ops->privsize(nla);
2756 set = kzalloc(sizeof(*set) + size, GFP_KERNEL);
2760 nla_strlcpy(name, nla[NFTA_SET_NAME], sizeof(set->name));
2761 err = nf_tables_set_alloc_name(&ctx, set, name);
2765 INIT_LIST_HEAD(&set->bindings);
2766 write_pnet(&set->pnet, net);
2769 set->klen = desc.klen;
2771 set->dlen = desc.dlen;
2773 set->size = desc.size;
2774 set->policy = policy;
2775 set->timeout = timeout;
2776 set->gc_int = gc_int;
2778 err = ops->init(set, &desc, nla);
2782 err = nft_trans_set_add(&ctx, NFT_MSG_NEWSET, set);
2786 list_add_tail_rcu(&set->list, &table->sets);
2793 module_put(ops->owner);
/*
 * Release a set: call the implementation's destroy callback and drop the
 * module reference on its owner. Freeing of the set memory is not shown
 * in this listing.
 */
2797 static void nft_set_destroy(struct nft_set *set)
2799 set->ops->destroy(set);
2800 module_put(set->ops->owner);
/*
 * Immediately remove a set outside the transaction path: unlink it from
 * its table list, send a NFT_MSG_DELSET notification (allocated with
 * GFP_ATOMIC), then destroy it.
 */
2804 static void nf_tables_set_destroy(const struct nft_ctx *ctx, struct nft_set *set)
2806 list_del_rcu(&set->list);
2807 nf_tables_set_notify(ctx, set, NFT_MSG_DELSET, GFP_ATOMIC);
2808 nft_set_destroy(set);
/*
 * NFT_MSG_DELSET handler.
 *
 * NFPROTO_UNSPEC is rejected with -EAFNOSUPPORT and the table attribute is
 * tested for presence. After the context is initialized, the set is looked
 * up by name; its INACTIVE flag and whether it still has bindings are
 * tested before deletion (the results of those tests are not shown in this
 * listing). The deletion itself is delegated to nft_delset().
 */
2811 static int nf_tables_delset(struct sock *nlsk, struct sk_buff *skb,
2812 const struct nlmsghdr *nlh,
2813 const struct nlattr * const nla[])
2815 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
2816 struct nft_set *set;
2820 if (nfmsg->nfgen_family == NFPROTO_UNSPEC)
2821 return -EAFNOSUPPORT;
2822 if (nla[NFTA_SET_TABLE] == NULL)
2825 err = nft_ctx_init_from_setattr(&ctx, skb, nlh, nla);
2829 set = nf_tables_set_lookup(ctx.table, nla[NFTA_SET_NAME]);
2831 return PTR_ERR(set);
2832 if (set->flags & NFT_SET_INACTIVE)
2834 if (!list_empty(&set->bindings))
2837 return nft_delset(&ctx, set);
/*
 * Set-walk callback used by nf_tables_bind_set(): validates that storing
 * the element's data into the register derived from the set's data type is
 * permitted. The data is treated as a verdict when the set's dtype is
 * NFT_DATA_VERDICT and as a plain value otherwise.
 */
2840 static int nf_tables_bind_check_setelem(const struct nft_ctx *ctx,
2841 const struct nft_set *set,
2842 const struct nft_set_iter *iter,
2843 const struct nft_set_elem *elem)
2845 const struct nft_set_ext *ext = nft_set_elem_ext(set, elem->priv);
2846 enum nft_registers dreg;
2848 dreg = nft_type_to_reg(set->dtype);
2849 return nft_validate_register_store(ctx, dreg, nft_set_ext_data(ext),
2850 set->dtype == NFT_DATA_VERDICT ?
2851 NFT_DATA_VERDICT : NFT_DATA_VALUE,
/*
 * Bind @set to a rule through @binding.
 *
 * An anonymous set that already has a binding is tested for first (the
 * result is not shown in this listing). For map bindings, existing
 * bindings are scanned for one on the same chain; otherwise the set is
 * walked with nf_tables_bind_check_setelem() to validate its elements.
 * If validation fails, an anonymous set is destroyed. On success the
 * binding records ctx->chain and is appended to set->bindings.
 */
2855 int nf_tables_bind_set(const struct nft_ctx *ctx, struct nft_set *set,
2856 struct nft_set_binding *binding)
2858 struct nft_set_binding *i;
2859 struct nft_set_iter iter;
2861 if (!list_empty(&set->bindings) && set->flags & NFT_SET_ANONYMOUS)
2864 if (binding->flags & NFT_SET_MAP) {
2865 /* If the set is already bound to the same chain all
2866 * jumps are already validated for that chain.
2868 list_for_each_entry(i, &set->bindings, list) {
2869 if (binding->flags & NFT_SET_MAP &&
2870 i->chain == binding->chain)
2877 iter.fn = nf_tables_bind_check_setelem;
2879 set->ops->walk(ctx, set, &iter);
2881 /* Destroy anonymous sets if binding fails */
2882 if (set->flags & NFT_SET_ANONYMOUS)
2883 nf_tables_set_destroy(ctx, set);
2889 binding->chain = ctx->chain;
2890 list_add_tail_rcu(&binding->list, &set->bindings);
/*
 * Remove @binding from @set. When this was the last binding of an
 * anonymous set that is not flagged INACTIVE, the set is destroyed
 * immediately.
 */
2894 void nf_tables_unbind_set(const struct nft_ctx *ctx, struct nft_set *set,
2895 struct nft_set_binding *binding)
2897 list_del_rcu(&binding->list);
2899 if (list_empty(&set->bindings) && set->flags & NFT_SET_ANONYMOUS &&
2900 !(set->flags & NFT_SET_INACTIVE))
2901 nf_tables_set_destroy(ctx, set);
/*
 * Per-extension layout descriptors for set elements, indexed by extension
 * id. Each entry gives the alignment and, where shown, the fixed length of
 * the extension. Key and data are u32-aligned; entries without a visible
 * .len either have it on a line missing from this listing or are variable
 * length - confirm against the full source. Exported GPL-only.
 */
2904 const struct nft_set_ext_type nft_set_ext_types[] = {
2905 [NFT_SET_EXT_KEY] = {
2906 .align = __alignof__(u32),
2908 [NFT_SET_EXT_DATA] = {
2909 .align = __alignof__(u32),
2911 [NFT_SET_EXT_EXPR] = {
2912 .align = __alignof__(struct nft_expr),
2914 [NFT_SET_EXT_FLAGS] = {
2916 .align = __alignof__(u8),
2918 [NFT_SET_EXT_TIMEOUT] = {
2920 .align = __alignof__(u64),
2922 [NFT_SET_EXT_EXPIRATION] = {
2923 .len = sizeof(unsigned long),
2924 .align = __alignof__(unsigned long),
2926 [NFT_SET_EXT_USERDATA] = {
2927 .len = sizeof(struct nft_userdata),
2928 .align = __alignof__(struct nft_userdata),
2931 EXPORT_SYMBOL_GPL(nft_set_ext_types);
/*
 * Netlink attribute policy for a single set element. Key and data are
 * nested attributes; user data is binary, bounded by NFT_USERDATA_MAXLEN.
 */
2937 static const struct nla_policy nft_set_elem_policy[NFTA_SET_ELEM_MAX + 1] = {
2938 [NFTA_SET_ELEM_KEY] = { .type = NLA_NESTED },
2939 [NFTA_SET_ELEM_DATA] = { .type = NLA_NESTED },
2940 [NFTA_SET_ELEM_FLAGS] = { .type = NLA_U32 },
2941 [NFTA_SET_ELEM_TIMEOUT] = { .type = NLA_U64 },
2942 [NFTA_SET_ELEM_USERDATA] = { .type = NLA_BINARY,
2943 .len = NFT_USERDATA_MAXLEN },
/*
 * Netlink attribute policy for set element list messages: table and set
 * names, a nested list of elements, and a 32-bit set id.
 */
2946 static const struct nla_policy nft_set_elem_list_policy[NFTA_SET_ELEM_LIST_MAX + 1] = {
2947 [NFTA_SET_ELEM_LIST_TABLE] = { .type = NLA_STRING },
2948 [NFTA_SET_ELEM_LIST_SET] = { .type = NLA_STRING },
2949 [NFTA_SET_ELEM_LIST_ELEMENTS] = { .type = NLA_NESTED },
2950 [NFTA_SET_ELEM_LIST_SET_ID] = { .type = NLA_U32 },
/*
 * Initialize @ctx from the attributes of a set element request.
 * The family is looked up without autoload and the table by the
 * NFTA_SET_ELEM_LIST_TABLE attribute. The table's INACTIVE flag is only
 * tested when the 'trans' argument is false (the result of that test is
 * not shown in this listing). The context's chain is NULL.
 */
2953 static int nft_ctx_init_from_elemattr(struct nft_ctx *ctx,
2954 const struct sk_buff *skb,
2955 const struct nlmsghdr *nlh,
2956 const struct nlattr * const nla[],
2959 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
2960 struct nft_af_info *afi;
2961 struct nft_table *table;
2962 struct net *net = sock_net(skb->sk);
2964 afi = nf_tables_afinfo_lookup(net, nfmsg->nfgen_family, false);
2966 return PTR_ERR(afi);
2968 table = nf_tables_table_lookup(afi, nla[NFTA_SET_ELEM_LIST_TABLE]);
2970 return PTR_ERR(table);
2971 if (!trans && (table->flags & NFT_TABLE_INACTIVE))
2974 nft_ctx_init(ctx, skb, nlh, afi, table, NULL, nla);
/*
 * Serialize one set element into @skb as a nested NFTA_LIST_ELEM.
 *
 * The key is always dumped (as a value of set->klen bytes). Each further
 * attribute is emitted only when the corresponding extension exists on the
 * element: data (verdict or value depending on set->dtype), expression,
 * flags, timeout, expiration and user data. The expiration is derived from
 * the stored jiffies value and the current jiffies, then converted to
 * milliseconds (the adjustment lines are not shown in this listing). User
 * data is emitted with udata->len + 1 bytes. Any failure jumps to the
 * nla_put_failure label.
 */
2978 static int nf_tables_fill_setelem(struct sk_buff *skb,
2979 const struct nft_set *set,
2980 const struct nft_set_elem *elem)
2982 const struct nft_set_ext *ext = nft_set_elem_ext(set, elem->priv);
2983 unsigned char *b = skb_tail_pointer(skb);
2984 struct nlattr *nest;
2986 nest = nla_nest_start(skb, NFTA_LIST_ELEM);
2988 goto nla_put_failure;
2990 if (nft_data_dump(skb, NFTA_SET_ELEM_KEY, nft_set_ext_key(ext),
2991 NFT_DATA_VALUE, set->klen) < 0)
2992 goto nla_put_failure;
2994 if (nft_set_ext_exists(ext, NFT_SET_EXT_DATA) &&
2995 nft_data_dump(skb, NFTA_SET_ELEM_DATA, nft_set_ext_data(ext),
2996 set->dtype == NFT_DATA_VERDICT ? NFT_DATA_VERDICT : NFT_DATA_VALUE,
2998 goto nla_put_failure;
3000 if (nft_set_ext_exists(ext, NFT_SET_EXT_EXPR) &&
3001 nft_expr_dump(skb, NFTA_SET_ELEM_EXPR, nft_set_ext_expr(ext)) < 0)
3002 goto nla_put_failure;
3004 if (nft_set_ext_exists(ext, NFT_SET_EXT_FLAGS) &&
3005 nla_put_be32(skb, NFTA_SET_ELEM_FLAGS,
3006 htonl(*nft_set_ext_flags(ext))))
3007 goto nla_put_failure;
3009 if (nft_set_ext_exists(ext, NFT_SET_EXT_TIMEOUT) &&
3010 nla_put_be64(skb, NFTA_SET_ELEM_TIMEOUT,
3011 cpu_to_be64(*nft_set_ext_timeout(ext))))
3012 goto nla_put_failure;
3014 if (nft_set_ext_exists(ext, NFT_SET_EXT_EXPIRATION)) {
3015 unsigned long expires, now = jiffies;
3017 expires = *nft_set_ext_expiration(ext);
3018 if (time_before(now, expires))
3023 if (nla_put_be64(skb, NFTA_SET_ELEM_EXPIRATION,
3024 cpu_to_be64(jiffies_to_msecs(expires))))
3025 goto nla_put_failure;
3028 if (nft_set_ext_exists(ext, NFT_SET_EXT_USERDATA)) {
3029 struct nft_userdata *udata;
3031 udata = nft_set_ext_userdata(ext);
3032 if (nla_put(skb, NFTA_SET_ELEM_USERDATA,
3033 udata->len + 1, udata->data))
3034 goto nla_put_failure;
3037 nla_nest_end(skb, nest);
3045 struct nft_set_dump_args {
3046 const struct netlink_callback *cb;
3047 struct nft_set_iter iter;
3048 struct sk_buff *skb;
3051 static int nf_tables_dump_setelem(const struct nft_ctx *ctx,
3052 const struct nft_set *set,
3053 const struct nft_set_iter *iter,
3054 const struct nft_set_elem *elem)
3056 struct nft_set_dump_args *args;
3058 args = container_of(iter, struct nft_set_dump_args, iter);
3059 return nf_tables_fill_setelem(args->skb, set, elem);
3062 static int nf_tables_dump_set(struct sk_buff *skb, struct netlink_callback *cb)
3064 const struct nft_set *set;
3065 struct nft_set_dump_args args;
3067 struct nlattr *nla[NFTA_SET_ELEM_LIST_MAX + 1];
3068 struct nfgenmsg *nfmsg;
3069 struct nlmsghdr *nlh;
3070 struct nlattr *nest;
3074 err = nlmsg_parse(cb->nlh, sizeof(struct nfgenmsg), nla,
3075 NFTA_SET_ELEM_LIST_MAX, nft_set_elem_list_policy);
3079 err = nft_ctx_init_from_elemattr(&ctx, cb->skb, cb->nlh, (void *)nla,
3084 set = nf_tables_set_lookup(ctx.table, nla[NFTA_SET_ELEM_LIST_SET]);
3086 return PTR_ERR(set);
3087 if (set->flags & NFT_SET_INACTIVE)
3090 event = NFT_MSG_NEWSETELEM;
3091 event |= NFNL_SUBSYS_NFTABLES << 8;
3092 portid = NETLINK_CB(cb->skb).portid;
3093 seq = cb->nlh->nlmsg_seq;
3095 nlh = nlmsg_put(skb, portid, seq, event, sizeof(struct nfgenmsg),
3098 goto nla_put_failure;
3100 nfmsg = nlmsg_data(nlh);
3101 nfmsg->nfgen_family = ctx.afi->family;
3102 nfmsg->version = NFNETLINK_V0;
3103 nfmsg->res_id = htons(ctx.net->nft.base_seq & 0xffff);
3105 if (nla_put_string(skb, NFTA_SET_ELEM_LIST_TABLE, ctx.table->name))
3106 goto nla_put_failure;
3107 if (nla_put_string(skb, NFTA_SET_ELEM_LIST_SET, set->name))
3108 goto nla_put_failure;
3110 nest = nla_nest_start(skb, NFTA_SET_ELEM_LIST_ELEMENTS);
3112 goto nla_put_failure;
3116 args.iter.skip = cb->args[0];
3117 args.iter.count = 0;
3119 args.iter.fn = nf_tables_dump_setelem;
3120 set->ops->walk(&ctx, set, &args.iter);
3122 nla_nest_end(skb, nest);
3123 nlmsg_end(skb, nlh);
3125 if (args.iter.err && args.iter.err != -EMSGSIZE)
3126 return args.iter.err;
3127 if (args.iter.count == cb->args[0])
3130 cb->args[0] = args.iter.count;
3137 static int nf_tables_getsetelem(struct sock *nlsk, struct sk_buff *skb,
3138 const struct nlmsghdr *nlh,
3139 const struct nlattr * const nla[])
3141 const struct nft_set *set;
3145 err = nft_ctx_init_from_elemattr(&ctx, skb, nlh, nla, false);
3149 set = nf_tables_set_lookup(ctx.table, nla[NFTA_SET_ELEM_LIST_SET]);
3151 return PTR_ERR(set);
3152 if (set->flags & NFT_SET_INACTIVE)
3155 if (nlh->nlmsg_flags & NLM_F_DUMP) {
3156 struct netlink_dump_control c = {
3157 .dump = nf_tables_dump_set,
3159 return netlink_dump_start(nlsk, skb, nlh, &c);
3164 static int nf_tables_fill_setelem_info(struct sk_buff *skb,
3165 const struct nft_ctx *ctx, u32 seq,
3166 u32 portid, int event, u16 flags,
3167 const struct nft_set *set,
3168 const struct nft_set_elem *elem)
3170 struct nfgenmsg *nfmsg;
3171 struct nlmsghdr *nlh;
3172 struct nlattr *nest;
3175 event |= NFNL_SUBSYS_NFTABLES << 8;
3176 nlh = nlmsg_put(skb, portid, seq, event, sizeof(struct nfgenmsg),
3179 goto nla_put_failure;
3181 nfmsg = nlmsg_data(nlh);
3182 nfmsg->nfgen_family = ctx->afi->family;
3183 nfmsg->version = NFNETLINK_V0;
3184 nfmsg->res_id = htons(ctx->net->nft.base_seq & 0xffff);
3186 if (nla_put_string(skb, NFTA_SET_TABLE, ctx->table->name))
3187 goto nla_put_failure;
3188 if (nla_put_string(skb, NFTA_SET_NAME, set->name))
3189 goto nla_put_failure;
3191 nest = nla_nest_start(skb, NFTA_SET_ELEM_LIST_ELEMENTS);
3193 goto nla_put_failure;
3195 err = nf_tables_fill_setelem(skb, set, elem);
3197 goto nla_put_failure;
3199 nla_nest_end(skb, nest);
3201 nlmsg_end(skb, nlh);
3205 nlmsg_trim(skb, nlh);
3209 static int nf_tables_setelem_notify(const struct nft_ctx *ctx,
3210 const struct nft_set *set,
3211 const struct nft_set_elem *elem,
3212 int event, u16 flags)
3214 struct net *net = ctx->net;
3215 u32 portid = ctx->portid;
3216 struct sk_buff *skb;
3219 if (!ctx->report && !nfnetlink_has_listeners(net, NFNLGRP_NFTABLES))
3223 skb = nlmsg_new(NLMSG_GOODSIZE, GFP_KERNEL);
3227 err = nf_tables_fill_setelem_info(skb, ctx, 0, portid, event, flags,
3234 err = nfnetlink_send(skb, net, portid, NFNLGRP_NFTABLES, ctx->report,
3238 nfnetlink_set_err(net, portid, NFNLGRP_NFTABLES, err);
3242 static struct nft_trans *nft_trans_elem_alloc(struct nft_ctx *ctx,
3244 struct nft_set *set)
3246 struct nft_trans *trans;
3248 trans = nft_trans_alloc(ctx, msg_type, sizeof(struct nft_trans_elem));
3252 nft_trans_elem_set(trans) = set;
3256 void *nft_set_elem_init(const struct nft_set *set,
3257 const struct nft_set_ext_tmpl *tmpl,
3258 const u32 *key, const u32 *data,
3259 u64 timeout, gfp_t gfp)
3261 struct nft_set_ext *ext;
3264 elem = kzalloc(set->ops->elemsize + tmpl->len, gfp);
3268 ext = nft_set_elem_ext(set, elem);
3269 nft_set_ext_init(ext, tmpl);
3271 memcpy(nft_set_ext_key(ext), key, set->klen);
3272 if (nft_set_ext_exists(ext, NFT_SET_EXT_DATA))
3273 memcpy(nft_set_ext_data(ext), data, set->dlen);
3274 if (nft_set_ext_exists(ext, NFT_SET_EXT_EXPIRATION))
3275 *nft_set_ext_expiration(ext) =
3276 jiffies + msecs_to_jiffies(timeout);
3277 if (nft_set_ext_exists(ext, NFT_SET_EXT_TIMEOUT))
3278 *nft_set_ext_timeout(ext) = timeout;
3283 void nft_set_elem_destroy(const struct nft_set *set, void *elem)
3285 struct nft_set_ext *ext = nft_set_elem_ext(set, elem);
3287 nft_data_uninit(nft_set_ext_key(ext), NFT_DATA_VALUE);
3288 if (nft_set_ext_exists(ext, NFT_SET_EXT_DATA))
3289 nft_data_uninit(nft_set_ext_data(ext), set->dtype);
3290 if (nft_set_ext_exists(ext, NFT_SET_EXT_EXPR))
3291 nf_tables_expr_destroy(NULL, nft_set_ext_expr(ext));
3295 EXPORT_SYMBOL_GPL(nft_set_elem_destroy);
3297 static int nft_add_set_elem(struct nft_ctx *ctx, struct nft_set *set,
3298 const struct nlattr *attr)
3300 struct nlattr *nla[NFTA_SET_ELEM_MAX + 1];
3301 struct nft_data_desc d1, d2;
3302 struct nft_set_ext_tmpl tmpl;
3303 struct nft_set_ext *ext;
3304 struct nft_set_elem elem;
3305 struct nft_set_binding *binding;
3306 struct nft_userdata *udata;
3307 struct nft_data data;
3308 enum nft_registers dreg;
3309 struct nft_trans *trans;
3315 err = nla_parse_nested(nla, NFTA_SET_ELEM_MAX, attr,
3316 nft_set_elem_policy);
3320 if (nla[NFTA_SET_ELEM_KEY] == NULL)
3323 nft_set_ext_prepare(&tmpl);
3326 if (nla[NFTA_SET_ELEM_FLAGS] != NULL) {
3327 flags = ntohl(nla_get_be32(nla[NFTA_SET_ELEM_FLAGS]));
3328 if (flags & ~NFT_SET_ELEM_INTERVAL_END)
3330 if (!(set->flags & NFT_SET_INTERVAL) &&
3331 flags & NFT_SET_ELEM_INTERVAL_END)
3334 nft_set_ext_add(&tmpl, NFT_SET_EXT_FLAGS);
3337 if (set->flags & NFT_SET_MAP) {
3338 if (nla[NFTA_SET_ELEM_DATA] == NULL &&
3339 !(flags & NFT_SET_ELEM_INTERVAL_END))
3341 if (nla[NFTA_SET_ELEM_DATA] != NULL &&
3342 flags & NFT_SET_ELEM_INTERVAL_END)
3345 if (nla[NFTA_SET_ELEM_DATA] != NULL)
3350 if (nla[NFTA_SET_ELEM_TIMEOUT] != NULL) {
3351 if (!(set->flags & NFT_SET_TIMEOUT))
3353 timeout = be64_to_cpu(nla_get_be64(nla[NFTA_SET_ELEM_TIMEOUT]));
3354 } else if (set->flags & NFT_SET_TIMEOUT) {
3355 timeout = set->timeout;
3358 err = nft_data_init(ctx, &elem.key.val, sizeof(elem.key), &d1,
3359 nla[NFTA_SET_ELEM_KEY]);
3363 if (d1.type != NFT_DATA_VALUE || d1.len != set->klen)
3366 nft_set_ext_add_length(&tmpl, NFT_SET_EXT_KEY, d1.len);
3368 nft_set_ext_add(&tmpl, NFT_SET_EXT_EXPIRATION);
3369 if (timeout != set->timeout)
3370 nft_set_ext_add(&tmpl, NFT_SET_EXT_TIMEOUT);
3373 if (nla[NFTA_SET_ELEM_DATA] != NULL) {
3374 err = nft_data_init(ctx, &data, sizeof(data), &d2,
3375 nla[NFTA_SET_ELEM_DATA]);
3380 if (set->dtype != NFT_DATA_VERDICT && d2.len != set->dlen)
3383 dreg = nft_type_to_reg(set->dtype);
3384 list_for_each_entry(binding, &set->bindings, list) {
3385 struct nft_ctx bind_ctx = {
3387 .table = ctx->table,
3388 .chain = (struct nft_chain *)binding->chain,
3391 if (!(binding->flags & NFT_SET_MAP))
3394 err = nft_validate_register_store(&bind_ctx, dreg,
3401 nft_set_ext_add_length(&tmpl, NFT_SET_EXT_DATA, d2.len);
3404 /* The full maximum length of userdata can exceed the maximum
3405 * offset value (U8_MAX) for following extensions, therefor it
3406 * must be the last extension added.
3409 if (nla[NFTA_SET_ELEM_USERDATA] != NULL) {
3410 ulen = nla_len(nla[NFTA_SET_ELEM_USERDATA]);
3412 nft_set_ext_add_length(&tmpl, NFT_SET_EXT_USERDATA,
3417 elem.priv = nft_set_elem_init(set, &tmpl, elem.key.val.data, data.data,
3418 timeout, GFP_KERNEL);
3419 if (elem.priv == NULL)
3422 ext = nft_set_elem_ext(set, elem.priv);
3424 *nft_set_ext_flags(ext) = flags;
3426 udata = nft_set_ext_userdata(ext);
3427 udata->len = ulen - 1;
3428 nla_memcpy(&udata->data, nla[NFTA_SET_ELEM_USERDATA], ulen);
3431 trans = nft_trans_elem_alloc(ctx, NFT_MSG_NEWSETELEM, set);
3435 ext->genmask = nft_genmask_cur(ctx->net) | NFT_SET_ELEM_BUSY_MASK;
3436 err = set->ops->insert(set, &elem);
3440 nft_trans_elem(trans) = elem;
3441 list_add_tail(&trans->list, &ctx->net->nft.commit_list);
3449 if (nla[NFTA_SET_ELEM_DATA] != NULL)
3450 nft_data_uninit(&data, d2.type);
3452 nft_data_uninit(&elem.key.val, d1.type);
3457 static int nf_tables_newsetelem(struct sock *nlsk, struct sk_buff *skb,
3458 const struct nlmsghdr *nlh,
3459 const struct nlattr * const nla[])
3461 struct net *net = sock_net(skb->sk);
3462 const struct nlattr *attr;
3463 struct nft_set *set;
3467 if (nla[NFTA_SET_ELEM_LIST_ELEMENTS] == NULL)
3470 err = nft_ctx_init_from_elemattr(&ctx, skb, nlh, nla, true);
3474 set = nf_tables_set_lookup(ctx.table, nla[NFTA_SET_ELEM_LIST_SET]);
3476 if (nla[NFTA_SET_ELEM_LIST_SET_ID]) {
3477 set = nf_tables_set_lookup_byid(net,
3478 nla[NFTA_SET_ELEM_LIST_SET_ID]);
3481 return PTR_ERR(set);
3484 if (!list_empty(&set->bindings) && set->flags & NFT_SET_CONSTANT)
3487 nla_for_each_nested(attr, nla[NFTA_SET_ELEM_LIST_ELEMENTS], rem) {
3489 !atomic_add_unless(&set->nelems, 1, set->size + set->ndeact))
3492 err = nft_add_set_elem(&ctx, set, attr);
3494 atomic_dec(&set->nelems);
3501 static int nft_del_setelem(struct nft_ctx *ctx, struct nft_set *set,
3502 const struct nlattr *attr)
3504 struct nlattr *nla[NFTA_SET_ELEM_MAX + 1];
3505 struct nft_data_desc desc;
3506 struct nft_set_elem elem;
3507 struct nft_trans *trans;
3510 err = nla_parse_nested(nla, NFTA_SET_ELEM_MAX, attr,
3511 nft_set_elem_policy);
3516 if (nla[NFTA_SET_ELEM_KEY] == NULL)
3519 err = nft_data_init(ctx, &elem.key.val, sizeof(elem.key), &desc,
3520 nla[NFTA_SET_ELEM_KEY]);
3525 if (desc.type != NFT_DATA_VALUE || desc.len != set->klen)
3528 trans = nft_trans_elem_alloc(ctx, NFT_MSG_DELSETELEM, set);
3529 if (trans == NULL) {
3534 elem.priv = set->ops->deactivate(set, &elem);
3535 if (elem.priv == NULL) {
3540 nft_trans_elem(trans) = elem;
3541 list_add_tail(&trans->list, &ctx->net->nft.commit_list);
3547 nft_data_uninit(&elem.key.val, desc.type);
3552 static int nf_tables_delsetelem(struct sock *nlsk, struct sk_buff *skb,
3553 const struct nlmsghdr *nlh,
3554 const struct nlattr * const nla[])
3556 const struct nlattr *attr;
3557 struct nft_set *set;
3561 if (nla[NFTA_SET_ELEM_LIST_ELEMENTS] == NULL)
3564 err = nft_ctx_init_from_elemattr(&ctx, skb, nlh, nla, false);
3568 set = nf_tables_set_lookup(ctx.table, nla[NFTA_SET_ELEM_LIST_SET]);
3570 return PTR_ERR(set);
3571 if (!list_empty(&set->bindings) && set->flags & NFT_SET_CONSTANT)
3574 nla_for_each_nested(attr, nla[NFTA_SET_ELEM_LIST_ELEMENTS], rem) {
3575 err = nft_del_setelem(&ctx, set, attr);
3584 void nft_set_gc_batch_release(struct rcu_head *rcu)
3586 struct nft_set_gc_batch *gcb;
3589 gcb = container_of(rcu, struct nft_set_gc_batch, head.rcu);
3590 for (i = 0; i < gcb->head.cnt; i++)
3591 nft_set_elem_destroy(gcb->head.set, gcb->elems[i]);
3594 EXPORT_SYMBOL_GPL(nft_set_gc_batch_release);
3596 struct nft_set_gc_batch *nft_set_gc_batch_alloc(const struct nft_set *set,
3599 struct nft_set_gc_batch *gcb;
3601 gcb = kzalloc(sizeof(*gcb), gfp);
3604 gcb->head.set = set;
3607 EXPORT_SYMBOL_GPL(nft_set_gc_batch_alloc);
3609 static int nf_tables_fill_gen_info(struct sk_buff *skb, struct net *net,
3610 u32 portid, u32 seq)
3612 struct nlmsghdr *nlh;
3613 struct nfgenmsg *nfmsg;
3614 int event = (NFNL_SUBSYS_NFTABLES << 8) | NFT_MSG_NEWGEN;
3616 nlh = nlmsg_put(skb, portid, seq, event, sizeof(struct nfgenmsg), 0);
3618 goto nla_put_failure;
3620 nfmsg = nlmsg_data(nlh);
3621 nfmsg->nfgen_family = AF_UNSPEC;
3622 nfmsg->version = NFNETLINK_V0;
3623 nfmsg->res_id = htons(net->nft.base_seq & 0xffff);
3625 if (nla_put_be32(skb, NFTA_GEN_ID, htonl(net->nft.base_seq)))
3626 goto nla_put_failure;
3628 nlmsg_end(skb, nlh);
3632 nlmsg_trim(skb, nlh);
3636 static int nf_tables_gen_notify(struct net *net, struct sk_buff *skb, int event)
3638 struct nlmsghdr *nlh = nlmsg_hdr(skb);
3639 struct sk_buff *skb2;
3642 if (nlmsg_report(nlh) &&
3643 !nfnetlink_has_listeners(net, NFNLGRP_NFTABLES))
3647 skb2 = nlmsg_new(NLMSG_GOODSIZE, GFP_KERNEL);
3651 err = nf_tables_fill_gen_info(skb2, net, NETLINK_CB(skb).portid,
3658 err = nfnetlink_send(skb2, net, NETLINK_CB(skb).portid,
3659 NFNLGRP_NFTABLES, nlmsg_report(nlh), GFP_KERNEL);
3662 nfnetlink_set_err(net, NETLINK_CB(skb).portid, NFNLGRP_NFTABLES,
3668 static int nf_tables_getgen(struct sock *nlsk, struct sk_buff *skb,
3669 const struct nlmsghdr *nlh,
3670 const struct nlattr * const nla[])
3672 struct net *net = sock_net(skb->sk);
3673 struct sk_buff *skb2;
3676 skb2 = alloc_skb(NLMSG_GOODSIZE, GFP_KERNEL);
3680 err = nf_tables_fill_gen_info(skb2, net, NETLINK_CB(skb).portid,
3685 return nlmsg_unicast(nlsk, skb2, NETLINK_CB(skb).portid);
3691 static const struct nfnl_callback nf_tables_cb[NFT_MSG_MAX] = {
3692 [NFT_MSG_NEWTABLE] = {
3693 .call_batch = nf_tables_newtable,
3694 .attr_count = NFTA_TABLE_MAX,
3695 .policy = nft_table_policy,
3697 [NFT_MSG_GETTABLE] = {
3698 .call = nf_tables_gettable,
3699 .attr_count = NFTA_TABLE_MAX,
3700 .policy = nft_table_policy,
3702 [NFT_MSG_DELTABLE] = {
3703 .call_batch = nf_tables_deltable,
3704 .attr_count = NFTA_TABLE_MAX,
3705 .policy = nft_table_policy,
3707 [NFT_MSG_NEWCHAIN] = {
3708 .call_batch = nf_tables_newchain,
3709 .attr_count = NFTA_CHAIN_MAX,
3710 .policy = nft_chain_policy,
3712 [NFT_MSG_GETCHAIN] = {
3713 .call = nf_tables_getchain,
3714 .attr_count = NFTA_CHAIN_MAX,
3715 .policy = nft_chain_policy,
3717 [NFT_MSG_DELCHAIN] = {
3718 .call_batch = nf_tables_delchain,
3719 .attr_count = NFTA_CHAIN_MAX,
3720 .policy = nft_chain_policy,
3722 [NFT_MSG_NEWRULE] = {
3723 .call_batch = nf_tables_newrule,
3724 .attr_count = NFTA_RULE_MAX,
3725 .policy = nft_rule_policy,
3727 [NFT_MSG_GETRULE] = {
3728 .call = nf_tables_getrule,
3729 .attr_count = NFTA_RULE_MAX,
3730 .policy = nft_rule_policy,
3732 [NFT_MSG_DELRULE] = {
3733 .call_batch = nf_tables_delrule,
3734 .attr_count = NFTA_RULE_MAX,
3735 .policy = nft_rule_policy,
3737 [NFT_MSG_NEWSET] = {
3738 .call_batch = nf_tables_newset,
3739 .attr_count = NFTA_SET_MAX,
3740 .policy = nft_set_policy,
3742 [NFT_MSG_GETSET] = {
3743 .call = nf_tables_getset,
3744 .attr_count = NFTA_SET_MAX,
3745 .policy = nft_set_policy,
3747 [NFT_MSG_DELSET] = {
3748 .call_batch = nf_tables_delset,
3749 .attr_count = NFTA_SET_MAX,
3750 .policy = nft_set_policy,
3752 [NFT_MSG_NEWSETELEM] = {
3753 .call_batch = nf_tables_newsetelem,
3754 .attr_count = NFTA_SET_ELEM_LIST_MAX,
3755 .policy = nft_set_elem_list_policy,
3757 [NFT_MSG_GETSETELEM] = {
3758 .call = nf_tables_getsetelem,
3759 .attr_count = NFTA_SET_ELEM_LIST_MAX,
3760 .policy = nft_set_elem_list_policy,
3762 [NFT_MSG_DELSETELEM] = {
3763 .call_batch = nf_tables_delsetelem,
3764 .attr_count = NFTA_SET_ELEM_LIST_MAX,
3765 .policy = nft_set_elem_list_policy,
3767 [NFT_MSG_GETGEN] = {
3768 .call = nf_tables_getgen,
3772 static void nft_chain_commit_update(struct nft_trans *trans)
3774 struct nft_base_chain *basechain;
3776 if (nft_trans_chain_name(trans)[0])
3777 strcpy(trans->ctx.chain->name, nft_trans_chain_name(trans));
3779 if (!(trans->ctx.chain->flags & NFT_BASE_CHAIN))
3782 basechain = nft_base_chain(trans->ctx.chain);
3783 nft_chain_stats_replace(basechain, nft_trans_chain_stats(trans));
3785 switch (nft_trans_chain_policy(trans)) {
3788 basechain->policy = nft_trans_chain_policy(trans);
3793 static void nf_tables_commit_release(struct nft_trans *trans)
3795 switch (trans->msg_type) {
3796 case NFT_MSG_DELTABLE:
3797 nf_tables_table_destroy(&trans->ctx);
3799 case NFT_MSG_DELCHAIN:
3800 nf_tables_chain_destroy(trans->ctx.chain);
3802 case NFT_MSG_DELRULE:
3803 nf_tables_rule_destroy(&trans->ctx, nft_trans_rule(trans));
3805 case NFT_MSG_DELSET:
3806 nft_set_destroy(nft_trans_set(trans));
3808 case NFT_MSG_DELSETELEM:
3809 nft_set_elem_destroy(nft_trans_elem_set(trans),
3810 nft_trans_elem(trans).priv);
3816 static int nf_tables_commit(struct sk_buff *skb)
3818 struct net *net = sock_net(skb->sk);
3819 struct nft_trans *trans, *next;
3820 struct nft_trans_elem *te;
3822 /* Bump generation counter, invalidate any dump in progress */
3823 while (++net->nft.base_seq == 0);
3825 /* A new generation has just started */
3826 net->nft.gencursor = nft_gencursor_next(net);
3828 /* Make sure all packets have left the previous generation before
3829 * purging old rules.
3833 list_for_each_entry_safe(trans, next, &net->nft.commit_list, list) {
3834 switch (trans->msg_type) {
3835 case NFT_MSG_NEWTABLE:
3836 if (nft_trans_table_update(trans)) {
3837 if (!nft_trans_table_enable(trans)) {
3838 nf_tables_table_disable(trans->ctx.afi,
3840 trans->ctx.table->flags |= NFT_TABLE_F_DORMANT;
3843 trans->ctx.table->flags &= ~NFT_TABLE_INACTIVE;
3845 nf_tables_table_notify(&trans->ctx, NFT_MSG_NEWTABLE);
3846 nft_trans_destroy(trans);
3848 case NFT_MSG_DELTABLE:
3849 nf_tables_table_notify(&trans->ctx, NFT_MSG_DELTABLE);
3851 case NFT_MSG_NEWCHAIN:
3852 if (nft_trans_chain_update(trans))
3853 nft_chain_commit_update(trans);
3855 trans->ctx.chain->flags &= ~NFT_CHAIN_INACTIVE;
3857 nf_tables_chain_notify(&trans->ctx, NFT_MSG_NEWCHAIN);
3858 nft_trans_destroy(trans);
3860 case NFT_MSG_DELCHAIN:
3861 nf_tables_chain_notify(&trans->ctx, NFT_MSG_DELCHAIN);
3862 nf_tables_unregister_hooks(trans->ctx.table,
3864 trans->ctx.afi->nops);
3866 case NFT_MSG_NEWRULE:
3867 nft_rule_clear(trans->ctx.net, nft_trans_rule(trans));
3868 nf_tables_rule_notify(&trans->ctx,
3869 nft_trans_rule(trans),
3871 nft_trans_destroy(trans);
3873 case NFT_MSG_DELRULE:
3874 list_del_rcu(&nft_trans_rule(trans)->list);
3875 nf_tables_rule_notify(&trans->ctx,
3876 nft_trans_rule(trans),
3879 case NFT_MSG_NEWSET:
3880 nft_trans_set(trans)->flags &= ~NFT_SET_INACTIVE;
3881 /* This avoids hitting -EBUSY when deleting the table
3882 * from the transaction.
3884 if (nft_trans_set(trans)->flags & NFT_SET_ANONYMOUS &&
3885 !list_empty(&nft_trans_set(trans)->bindings))
3886 trans->ctx.table->use--;
3888 nf_tables_set_notify(&trans->ctx, nft_trans_set(trans),
3889 NFT_MSG_NEWSET, GFP_KERNEL);
3890 nft_trans_destroy(trans);
3892 case NFT_MSG_DELSET:
3893 nf_tables_set_notify(&trans->ctx, nft_trans_set(trans),
3894 NFT_MSG_DELSET, GFP_KERNEL);
3896 case NFT_MSG_NEWSETELEM:
3897 te = (struct nft_trans_elem *)trans->data;
3899 te->set->ops->activate(te->set, &te->elem);
3900 nf_tables_setelem_notify(&trans->ctx, te->set,
3902 NFT_MSG_NEWSETELEM, 0);
3903 nft_trans_destroy(trans);
3905 case NFT_MSG_DELSETELEM:
3906 te = (struct nft_trans_elem *)trans->data;
3908 nf_tables_setelem_notify(&trans->ctx, te->set,
3910 NFT_MSG_DELSETELEM, 0);
3911 te->set->ops->remove(te->set, &te->elem);
3912 atomic_dec(&te->set->nelems);
3920 list_for_each_entry_safe(trans, next, &net->nft.commit_list, list) {
3921 list_del(&trans->list);
3922 nf_tables_commit_release(trans);
3925 nf_tables_gen_notify(net, skb, NFT_MSG_NEWGEN);
3930 static void nf_tables_abort_release(struct nft_trans *trans)
3932 switch (trans->msg_type) {
3933 case NFT_MSG_NEWTABLE:
3934 nf_tables_table_destroy(&trans->ctx);
3936 case NFT_MSG_NEWCHAIN:
3937 nf_tables_chain_destroy(trans->ctx.chain);
3939 case NFT_MSG_NEWRULE:
3940 nf_tables_rule_destroy(&trans->ctx, nft_trans_rule(trans));
3942 case NFT_MSG_NEWSET:
3943 nft_set_destroy(nft_trans_set(trans));
3945 case NFT_MSG_NEWSETELEM:
3946 nft_set_elem_destroy(nft_trans_elem_set(trans),
3947 nft_trans_elem(trans).priv);
3953 static int nf_tables_abort(struct sk_buff *skb)
3955 struct net *net = sock_net(skb->sk);
3956 struct nft_trans *trans, *next;
3957 struct nft_trans_elem *te;
3959 list_for_each_entry_safe(trans, next, &net->nft.commit_list, list) {
3960 switch (trans->msg_type) {
3961 case NFT_MSG_NEWTABLE:
3962 if (nft_trans_table_update(trans)) {
3963 if (nft_trans_table_enable(trans)) {
3964 nf_tables_table_disable(trans->ctx.afi,
3966 trans->ctx.table->flags |= NFT_TABLE_F_DORMANT;
3968 nft_trans_destroy(trans);
3970 list_del_rcu(&trans->ctx.table->list);
3973 case NFT_MSG_DELTABLE:
3974 list_add_tail_rcu(&trans->ctx.table->list,
3975 &trans->ctx.afi->tables);
3976 nft_trans_destroy(trans);
3978 case NFT_MSG_NEWCHAIN:
3979 if (nft_trans_chain_update(trans)) {
3980 free_percpu(nft_trans_chain_stats(trans));
3982 nft_trans_destroy(trans);
3984 trans->ctx.table->use--;
3985 list_del_rcu(&trans->ctx.chain->list);
3986 nf_tables_unregister_hooks(trans->ctx.table,
3988 trans->ctx.afi->nops);
3991 case NFT_MSG_DELCHAIN:
3992 trans->ctx.table->use++;
3993 list_add_tail_rcu(&trans->ctx.chain->list,
3994 &trans->ctx.table->chains);
3995 nft_trans_destroy(trans);
3997 case NFT_MSG_NEWRULE:
3998 trans->ctx.chain->use--;
3999 list_del_rcu(&nft_trans_rule(trans)->list);
4001 case NFT_MSG_DELRULE:
4002 trans->ctx.chain->use++;
4003 nft_rule_clear(trans->ctx.net, nft_trans_rule(trans));
4004 nft_trans_destroy(trans);
4006 case NFT_MSG_NEWSET:
4007 trans->ctx.table->use--;
4008 list_del_rcu(&nft_trans_set(trans)->list);
4010 case NFT_MSG_DELSET:
4011 trans->ctx.table->use++;
4012 list_add_tail_rcu(&nft_trans_set(trans)->list,
4013 &trans->ctx.table->sets);
4014 nft_trans_destroy(trans);
4016 case NFT_MSG_NEWSETELEM:
4017 te = (struct nft_trans_elem *)trans->data;
4019 te->set->ops->remove(te->set, &te->elem);
4020 atomic_dec(&te->set->nelems);
4022 case NFT_MSG_DELSETELEM:
4023 te = (struct nft_trans_elem *)trans->data;
4025 te->set->ops->activate(te->set, &te->elem);
4028 nft_trans_destroy(trans);
4035 list_for_each_entry_safe_reverse(trans, next,
4036 &net->nft.commit_list, list) {
4037 list_del(&trans->list);
4038 nf_tables_abort_release(trans);
4044 static const struct nfnetlink_subsystem nf_tables_subsys = {
4045 .name = "nf_tables",
4046 .subsys_id = NFNL_SUBSYS_NFTABLES,
4047 .cb_count = NFT_MSG_MAX,
4049 .commit = nf_tables_commit,
4050 .abort = nf_tables_abort,
4053 int nft_chain_validate_dependency(const struct nft_chain *chain,
4054 enum nft_chain_type type)
4056 const struct nft_base_chain *basechain;
4058 if (chain->flags & NFT_BASE_CHAIN) {
4059 basechain = nft_base_chain(chain);
4060 if (basechain->type->type != type)
4065 EXPORT_SYMBOL_GPL(nft_chain_validate_dependency);
4067 int nft_chain_validate_hooks(const struct nft_chain *chain,
4068 unsigned int hook_flags)
4070 struct nft_base_chain *basechain;
4072 if (chain->flags & NFT_BASE_CHAIN) {
4073 basechain = nft_base_chain(chain);
4075 if ((1 << basechain->ops[0].hooknum) & hook_flags)
4083 EXPORT_SYMBOL_GPL(nft_chain_validate_hooks);
4086 * Loop detection - walk through the ruleset beginning at the destination chain
4087 * of a new jump until either the source chain is reached (loop) or all
4088 * reachable chains have been traversed.
4090 * The loop check is performed whenever a new jump verdict is added to an
4091 * expression or verdict map or a verdict map is bound to a new chain.
4094 static int nf_tables_check_loops(const struct nft_ctx *ctx,
4095 const struct nft_chain *chain);
4097 static int nf_tables_loop_check_setelem(const struct nft_ctx *ctx,
4098 const struct nft_set *set,
4099 const struct nft_set_iter *iter,
4100 const struct nft_set_elem *elem)
4102 const struct nft_set_ext *ext = nft_set_elem_ext(set, elem->priv);
4103 const struct nft_data *data;
4105 if (nft_set_ext_exists(ext, NFT_SET_EXT_FLAGS) &&
4106 *nft_set_ext_flags(ext) & NFT_SET_ELEM_INTERVAL_END)
4109 data = nft_set_ext_data(ext);
4110 switch (data->verdict.code) {
4113 return nf_tables_check_loops(ctx, data->verdict.chain);
4119 static int nf_tables_check_loops(const struct nft_ctx *ctx,
4120 const struct nft_chain *chain)
4122 const struct nft_rule *rule;
4123 const struct nft_expr *expr, *last;
4124 const struct nft_set *set;
4125 struct nft_set_binding *binding;
4126 struct nft_set_iter iter;
4128 if (ctx->chain == chain)
4131 list_for_each_entry(rule, &chain->rules, list) {
4132 nft_rule_for_each_expr(expr, last, rule) {
4133 const struct nft_data *data = NULL;
4136 if (!expr->ops->validate)
4139 err = expr->ops->validate(ctx, expr, &data);
4146 switch (data->verdict.code) {
4149 err = nf_tables_check_loops(ctx,
4150 data->verdict.chain);
4159 list_for_each_entry(set, &ctx->table->sets, list) {
4160 if (!(set->flags & NFT_SET_MAP) ||
4161 set->dtype != NFT_DATA_VERDICT)
4164 list_for_each_entry(binding, &set->bindings, list) {
4165 if (!(binding->flags & NFT_SET_MAP) ||
4166 binding->chain != chain)
4172 iter.fn = nf_tables_loop_check_setelem;
4174 set->ops->walk(ctx, set, &iter);
4184 * nft_parse_register - parse a register value from a netlink attribute
4186 * @attr: netlink attribute
4188 * Parse and translate a register value from a netlink attribute.
4189 * Registers used to be 128 bit wide, these register numbers will be
4190 * mapped to the corresponding 32 bit register numbers.
4192 unsigned int nft_parse_register(const struct nlattr *attr)
4196 reg = ntohl(nla_get_be32(attr));
4198 case NFT_REG_VERDICT...NFT_REG_4:
4199 return reg * NFT_REG_SIZE / NFT_REG32_SIZE;
4201 return reg + NFT_REG_SIZE / NFT_REG32_SIZE - NFT_REG32_00;
4204 EXPORT_SYMBOL_GPL(nft_parse_register);
4207 * nft_dump_register - dump a register value to a netlink attribute
4209 * @skb: socket buffer
4210 * @attr: attribute number
4211 * @reg: register number
4213 * Construct a netlink attribute containing the register number. For
4214 * compatibility reasons, register numbers being a multiple of 4 are
4215 * translated to the corresponding 128 bit register numbers.
4217 int nft_dump_register(struct sk_buff *skb, unsigned int attr, unsigned int reg)
4219 if (reg % (NFT_REG_SIZE / NFT_REG32_SIZE) == 0)
4220 reg = reg / (NFT_REG_SIZE / NFT_REG32_SIZE);
4222 reg = reg - NFT_REG_SIZE / NFT_REG32_SIZE + NFT_REG32_00;
4224 return nla_put_be32(skb, attr, htonl(reg));
4226 EXPORT_SYMBOL_GPL(nft_dump_register);
4229 * nft_validate_register_load - validate a load from a register
4231 * @reg: the register number
4232 * @len: the length of the data
4234 * Validate that the input register is one of the general purpose
4235 * registers and that the length of the load is within the bounds.
4237 int nft_validate_register_load(enum nft_registers reg, unsigned int len)
4239 if (reg < NFT_REG_1 * NFT_REG_SIZE / NFT_REG32_SIZE)
4243 if (reg * NFT_REG32_SIZE + len > FIELD_SIZEOF(struct nft_regs, data))
4248 EXPORT_SYMBOL_GPL(nft_validate_register_load);
4251 * nft_validate_register_store - validate an expressions' register store
4253 * @ctx: context of the expression performing the load
4254 * @reg: the destination register number
4255 * @data: the data to load
4256 * @type: the data type
4257 * @len: the length of the data
4259 * Validate that a data load uses the appropriate data type for
4260 * the destination register and the length is within the bounds.
4261 * A value of NULL for the data means that its runtime gathered
4264 int nft_validate_register_store(const struct nft_ctx *ctx,
4265 enum nft_registers reg,
4266 const struct nft_data *data,
4267 enum nft_data_types type, unsigned int len)
4272 case NFT_REG_VERDICT:
4273 if (type != NFT_DATA_VERDICT)
4277 (data->verdict.code == NFT_GOTO ||
4278 data->verdict.code == NFT_JUMP)) {
4279 err = nf_tables_check_loops(ctx, data->verdict.chain);
4283 if (ctx->chain->level + 1 >
4284 data->verdict.chain->level) {
4285 if (ctx->chain->level + 1 == NFT_JUMP_STACK_SIZE)
4287 data->verdict.chain->level = ctx->chain->level + 1;
4293 if (reg < NFT_REG_1 * NFT_REG_SIZE / NFT_REG32_SIZE)
4297 if (reg * NFT_REG32_SIZE + len >
4298 FIELD_SIZEOF(struct nft_regs, data))
4301 if (data != NULL && type != NFT_DATA_VALUE)
4306 EXPORT_SYMBOL_GPL(nft_validate_register_store);
4308 static const struct nla_policy nft_verdict_policy[NFTA_VERDICT_MAX + 1] = {
4309 [NFTA_VERDICT_CODE] = { .type = NLA_U32 },
4310 [NFTA_VERDICT_CHAIN] = { .type = NLA_STRING,
4311 .len = NFT_CHAIN_MAXNAMELEN - 1 },
4314 static int nft_verdict_init(const struct nft_ctx *ctx, struct nft_data *data,
4315 struct nft_data_desc *desc, const struct nlattr *nla)
4317 struct nlattr *tb[NFTA_VERDICT_MAX + 1];
4318 struct nft_chain *chain;
4321 err = nla_parse_nested(tb, NFTA_VERDICT_MAX, nla, nft_verdict_policy);
4325 if (!tb[NFTA_VERDICT_CODE])
4327 data->verdict.code = ntohl(nla_get_be32(tb[NFTA_VERDICT_CODE]));
4329 switch (data->verdict.code) {
4331 switch (data->verdict.code & NF_VERDICT_MASK) {
4343 desc->len = sizeof(data->verdict);
4347 if (!tb[NFTA_VERDICT_CHAIN])
4349 chain = nf_tables_chain_lookup(ctx->table,
4350 tb[NFTA_VERDICT_CHAIN]);
4352 return PTR_ERR(chain);
4353 if (chain->flags & NFT_BASE_CHAIN)
4357 data->verdict.chain = chain;
4358 desc->len = sizeof(data);
4362 desc->type = NFT_DATA_VERDICT;
4366 static void nft_verdict_uninit(const struct nft_data *data)
4368 switch (data->verdict.code) {
4371 data->verdict.chain->use--;
4376 static int nft_verdict_dump(struct sk_buff *skb, const struct nft_data *data)
4378 struct nlattr *nest;
4380 nest = nla_nest_start(skb, NFTA_DATA_VERDICT);
4382 goto nla_put_failure;
4384 if (nla_put_be32(skb, NFTA_VERDICT_CODE, htonl(data->verdict.code)))
4385 goto nla_put_failure;
4387 switch (data->verdict.code) {
4390 if (nla_put_string(skb, NFTA_VERDICT_CHAIN,
4391 data->verdict.chain->name))
4392 goto nla_put_failure;
4394 nla_nest_end(skb, nest);
4401 static int nft_value_init(const struct nft_ctx *ctx,
4402 struct nft_data *data, unsigned int size,
4403 struct nft_data_desc *desc, const struct nlattr *nla)
4413 nla_memcpy(data->data, nla, len);
4414 desc->type = NFT_DATA_VALUE;
4419 static int nft_value_dump(struct sk_buff *skb, const struct nft_data *data,
4422 return nla_put(skb, NFTA_DATA_VALUE, len, data->data);
4425 static const struct nla_policy nft_data_policy[NFTA_DATA_MAX + 1] = {
4426 [NFTA_DATA_VALUE] = { .type = NLA_BINARY },
4427 [NFTA_DATA_VERDICT] = { .type = NLA_NESTED },
4431 * nft_data_init - parse nf_tables data netlink attributes
4433 * @ctx: context of the expression using the data
4434 * @data: destination struct nft_data
4435 * @size: maximum data length
4436 * @desc: data description
4437 * @nla: netlink attribute containing data
4439 * Parse the netlink data attributes and initialize a struct nft_data.
4440 * The type and length of data are returned in the data description.
4442 * The caller can indicate that it only wants to accept data of type
4443 * NFT_DATA_VALUE by passing NULL for the ctx argument.
4445 int nft_data_init(const struct nft_ctx *ctx,
4446 struct nft_data *data, unsigned int size,
4447 struct nft_data_desc *desc, const struct nlattr *nla)
4449 struct nlattr *tb[NFTA_DATA_MAX + 1];
4452 err = nla_parse_nested(tb, NFTA_DATA_MAX, nla, nft_data_policy);
4456 if (tb[NFTA_DATA_VALUE])
4457 return nft_value_init(ctx, data, size, desc,
4458 tb[NFTA_DATA_VALUE]);
4459 if (tb[NFTA_DATA_VERDICT] && ctx != NULL)
4460 return nft_verdict_init(ctx, data, desc, tb[NFTA_DATA_VERDICT]);
4463 EXPORT_SYMBOL_GPL(nft_data_init);
4466 * nft_data_uninit - release a nft_data item
4468 * @data: struct nft_data to release
4469 * @type: type of data
4471 * Release a nft_data item. NFT_DATA_VALUE types can be silently discarded,
4472 * all others need to be released by calling this function.
4474 void nft_data_uninit(const struct nft_data *data, enum nft_data_types type)
4477 case NFT_DATA_VALUE:
4479 case NFT_DATA_VERDICT:
4480 return nft_verdict_uninit(data);
4485 EXPORT_SYMBOL_GPL(nft_data_uninit);
4487 int nft_data_dump(struct sk_buff *skb, int attr, const struct nft_data *data,
4488 enum nft_data_types type, unsigned int len)
4490 struct nlattr *nest;
4493 nest = nla_nest_start(skb, attr);
4498 case NFT_DATA_VALUE:
4499 err = nft_value_dump(skb, data, len);
4501 case NFT_DATA_VERDICT:
4502 err = nft_verdict_dump(skb, data);
4509 nla_nest_end(skb, nest);
4512 EXPORT_SYMBOL_GPL(nft_data_dump);
4514 static int nf_tables_init_net(struct net *net)
4516 INIT_LIST_HEAD(&net->nft.af_info);
4517 INIT_LIST_HEAD(&net->nft.commit_list);
4518 net->nft.base_seq = 1;
4522 static struct pernet_operations nf_tables_net_ops = {
4523 .init = nf_tables_init_net,
4526 static int __init nf_tables_module_init(void)
4530 info = kmalloc(sizeof(struct nft_expr_info) * NFT_RULE_MAXEXPRS,
4537 err = nf_tables_core_module_init();
4541 err = nfnetlink_subsys_register(&nf_tables_subsys);
4545 pr_info("nf_tables: (c) 2007-2009 Patrick McHardy <kaber@trash.net>\n");
4546 return register_pernet_subsys(&nf_tables_net_ops);
4548 nf_tables_core_module_exit();
4555 static void __exit nf_tables_module_exit(void)
4557 unregister_pernet_subsys(&nf_tables_net_ops);
4558 nfnetlink_subsys_unregister(&nf_tables_subsys);
4560 nf_tables_core_module_exit();
4564 module_init(nf_tables_module_init);
4565 module_exit(nf_tables_module_exit);
4567 MODULE_LICENSE("GPL");
4568 MODULE_AUTHOR("Patrick McHardy <kaber@trash.net>");
4569 MODULE_ALIAS_NFNL_SUBSYS(NFNL_SUBSYS_NFTABLES);