2 * Copyright (c) 2007-2009 Patrick McHardy <kaber@trash.net>
4 * This program is free software; you can redistribute it and/or modify
5 * it under the terms of the GNU General Public License version 2 as
6 * published by the Free Software Foundation.
8 * Development of this code funded by Astaro AG (http://www.astaro.com/)
11 #include <linux/module.h>
12 #include <linux/init.h>
13 #include <linux/list.h>
14 #include <linux/skbuff.h>
15 #include <linux/netlink.h>
16 #include <linux/vmalloc.h>
17 #include <linux/netfilter.h>
18 #include <linux/netfilter/nfnetlink.h>
19 #include <linux/netfilter/nf_tables.h>
20 #include <net/netfilter/nf_tables_core.h>
21 #include <net/netfilter/nf_tables.h>
22 #include <net/net_namespace.h>
/* File-scope list heads. Presumably the registries of expression and
 * object types; their users are not in this part of the file -- confirm.
 */
25 static LIST_HEAD(nf_tables_expressions);
26 static LIST_HEAD(nf_tables_objects);
29 * nft_register_afinfo - register nf_tables address family info
31 * @afi: address family info to register
33 * Register the address family for use with nf_tables. Returns zero on
34 * success or a negative errno code otherwise.
/* Initialise the family's table list and append @afi to the per-netns
 * af_info list while holding the nfnetlink nftables subsystem lock.
 */
36 int nft_register_afinfo(struct net *net, struct nft_af_info *afi)
38 INIT_LIST_HEAD(&afi->tables);
39 nfnl_lock(NFNL_SUBSYS_NFTABLES);
/* RCU insertion: the dump callbacks in this file walk net->nft.af_info
 * with list_for_each_entry_rcu().
 */
40 list_add_tail_rcu(&afi->list, &net->nft.af_info);
41 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
44 EXPORT_SYMBOL_GPL(nft_register_afinfo);
/* Forward declaration; called from nft_unregister_afinfo(). The definition
 * is not in this part of the file.
 */
46 static void __nft_release_afinfo(struct net *net, struct nft_af_info *afi);
49 * nft_unregister_afinfo - unregister nf_tables address family info
51 * @afi: address family info to unregister
53 * Unregister the address family for use with nf_tables.
/* Remove @afi from the per-netns family list. Both the release step and
 * the unlink run under the nfnetlink nftables subsystem lock.
 */
55 void nft_unregister_afinfo(struct net *net, struct nft_af_info *afi)
57 nfnl_lock(NFNL_SUBSYS_NFTABLES);
/* Presumably tears down whatever the family still owns; the helper's body
 * is not visible here -- confirm.
 */
58 __nft_release_afinfo(net, afi);
59 list_del_rcu(&afi->list);
60 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
62 EXPORT_SYMBOL_GPL(nft_unregister_afinfo);
/* Scan the netns af_info list for an entry whose ->family equals @family.
 * NOTE(review): the return statements are not visible in this extract.
 */
64 static struct nft_af_info *nft_afinfo_lookup(struct net *net, int family)
66 struct nft_af_info *afi;
68 list_for_each_entry(afi, &net->nft.af_info, list) {
69 if (afi->family == family)
/* Look up the address family, optionally trying to load a module named
 * "nft-afinfo-<family>" when the first lookup does not find it.
 *
 * Visible error returns are ERR_PTR(-EAGAIN) and ERR_PTR(-EAFNOSUPPORT).
 * NOTE(review): the conditions guarding the autoload branch and each return
 * are not visible here; presumably -EAGAIN is returned when the retry after
 * request_module() succeeds -- confirm.
 */
75 static struct nft_af_info *
76 nf_tables_afinfo_lookup(struct net *net, int family, bool autoload)
78 struct nft_af_info *afi;
80 afi = nft_afinfo_lookup(net, family);
/* The subsystem lock is dropped around request_module() and re-taken
 * before looking the family up again.
 */
85 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
86 request_module("nft-afinfo-%u", family);
87 nfnl_lock(NFNL_SUBSYS_NFTABLES);
88 afi = nft_afinfo_lookup(net, family);
90 return ERR_PTR(-EAGAIN);
93 return ERR_PTR(-EAFNOSUPPORT);
/* Populate an nft_ctx from a netlink request. The visible assignments
 * record the sender's portid, the report flag derived from the netlink
 * header, and the message sequence number.
 * NOTE(review): the remaining field assignments are not visible here.
 */
96 static void nft_ctx_init(struct nft_ctx *ctx,
98 const struct sk_buff *skb,
99 const struct nlmsghdr *nlh,
100 struct nft_af_info *afi,
101 struct nft_table *table,
102 struct nft_chain *chain,
103 const struct nlattr * const *nla)
110 ctx->portid = NETLINK_CB(skb).portid;
111 ctx->report = nlmsg_report(nlh);
112 ctx->seq = nlh->nlmsg_seq;
/* Allocate a zeroed transaction record with @size extra bytes following
 * struct nft_trans, using the caller-supplied @gfp flags, and tag it with
 * @msg_type.
 */
115 static struct nft_trans *nft_trans_alloc_gfp(const struct nft_ctx *ctx,
116 int msg_type, u32 size, gfp_t gfp)
118 struct nft_trans *trans;
/* @size is the per-message payload appended to the common header. */
120 trans = kzalloc(sizeof(struct nft_trans) + size, gfp);
124 trans->msg_type = msg_type;
/* Convenience wrapper: allocate a transaction record with GFP_KERNEL. */
130 static struct nft_trans *nft_trans_alloc(const struct nft_ctx *ctx,
131 int msg_type, u32 size)
133 return nft_trans_alloc_gfp(ctx, msg_type, size, GFP_KERNEL);
/* Unlink @trans from the list it is queued on.
 * NOTE(review): any freeing of @trans is not visible in this extract.
 */
136 static void nft_trans_destroy(struct nft_trans *trans)
138 list_del(&trans->list);
/* Register the netfilter hook ops of @chain in @net.
 * The registration call is reached only for base chains of tables that are
 * not dormant; what is returned for the other cases is not visible here.
 */
142 static int nf_tables_register_hooks(struct net *net,
143 const struct nft_table *table,
144 struct nft_chain *chain,
145 unsigned int hook_nops)
/* Dormant tables and non-base chains take the early-exit branch. */
147 if (table->flags & NFT_TABLE_F_DORMANT ||
148 !nft_is_base_chain(chain))
151 return nf_register_net_hooks(net, nft_base_chain(chain)->ops,
/* Counterpart of nf_tables_register_hooks(): unregister @hook_nops hook
 * ops of @chain. Uses the same dormant-table / non-base-chain test as the
 * register side.
 */
155 static void nf_tables_unregister_hooks(struct net *net,
156 const struct nft_table *table,
157 struct nft_chain *chain,
158 unsigned int hook_nops)
160 if (table->flags & NFT_TABLE_F_DORMANT ||
161 !nft_is_base_chain(chain))
164 nf_unregister_net_hooks(net, nft_base_chain(chain)->ops, hook_nops);
/* Queue a table transaction of @msg_type on the netns commit list.
 * For NFT_MSG_NEWTABLE the table is additionally activated in the next
 * generation.
 */
167 static int nft_trans_table_add(struct nft_ctx *ctx, int msg_type)
169 struct nft_trans *trans;
171 trans = nft_trans_alloc(ctx, msg_type, sizeof(struct nft_trans_table));
175 if (msg_type == NFT_MSG_NEWTABLE)
176 nft_activate_next(ctx->net, ctx->table);
178 list_add_tail(&trans->list, &ctx->net->nft.commit_list);
/* Queue deletion of ctx->table: record an NFT_MSG_DELTABLE transaction,
 * then deactivate the table in the next generation.
 */
182 static int nft_deltable(struct nft_ctx *ctx)
186 err = nft_trans_table_add(ctx, NFT_MSG_DELTABLE);
190 nft_deactivate_next(ctx->net, ctx->table);
/* Queue a chain transaction of @msg_type on the netns commit list.
 * For NFT_MSG_NEWCHAIN the chain is additionally activated in the next
 * generation.
 */
194 static int nft_trans_chain_add(struct nft_ctx *ctx, int msg_type)
196 struct nft_trans *trans;
198 trans = nft_trans_alloc(ctx, msg_type, sizeof(struct nft_trans_chain));
202 if (msg_type == NFT_MSG_NEWCHAIN)
203 nft_activate_next(ctx->net, ctx->chain);
205 list_add_tail(&trans->list, &ctx->net->nft.commit_list);
/* Queue deletion of ctx->chain: record an NFT_MSG_DELCHAIN transaction,
 * then deactivate the chain in the next generation.
 */
209 static int nft_delchain(struct nft_ctx *ctx)
213 err = nft_trans_chain_add(ctx, NFT_MSG_DELCHAIN);
218 nft_deactivate_next(ctx->net, ctx->chain);
/* Deactivate @rule in the next generation, but only if it is still active
 * there.
 * NOTE(review): the return values for both outcomes are not visible here.
 */
224 nf_tables_delrule_deactivate(struct nft_ctx *ctx, struct nft_rule *rule)
226 /* You cannot delete the same rule twice */
227 if (nft_is_active_next(ctx->net, rule)) {
228 nft_deactivate_next(ctx->net, rule);
/* Allocate a rule transaction for @rule and queue it on the commit list.
 * For NFT_MSG_NEWRULE, an NFTA_RULE_ID attribute supplied by userspace is
 * stored in the transaction (converted from network byte order).
 */
235 static struct nft_trans *nft_trans_rule_add(struct nft_ctx *ctx, int msg_type,
236 struct nft_rule *rule)
238 struct nft_trans *trans;
240 trans = nft_trans_alloc(ctx, msg_type, sizeof(struct nft_trans_rule));
244 if (msg_type == NFT_MSG_NEWRULE && ctx->nla[NFTA_RULE_ID] != NULL) {
245 nft_trans_rule_id(trans) =
246 ntohl(nla_get_be32(ctx->nla[NFTA_RULE_ID]));
248 nft_trans_rule(trans) = rule;
249 list_add_tail(&trans->list, &ctx->net->nft.commit_list);
/* Queue deletion of @rule: the NFT_MSG_DELRULE transaction is added first,
 * then the rule is deactivated.
 */
254 static int nft_delrule(struct nft_ctx *ctx, struct nft_rule *rule)
256 struct nft_trans *trans;
259 trans = nft_trans_rule_add(ctx, NFT_MSG_DELRULE, rule);
263 err = nf_tables_delrule_deactivate(ctx, rule);
/* Presumably reached only when deactivation failed, to undo the queued
 * transaction -- the guarding condition is not visible here.
 */
265 nft_trans_destroy(trans);
/* Queue deletion of every rule on ctx->chain via nft_delrule().
 * NOTE(review): no per-rule activity check is visible before the call;
 * error handling inside the loop is not visible either.
 */
272 static int nft_delrule_by_chain(struct nft_ctx *ctx)
274 struct nft_rule *rule;
277 list_for_each_entry(rule, &ctx->chain->rules, list) {
278 err = nft_delrule(ctx, rule);
/* Allocate a set transaction and queue it on the commit list.
 * For NFT_MSG_NEWSET with an NFTA_SET_ID attribute, the id is stored in
 * the transaction (converted from network byte order).
 */
285 static int nft_trans_set_add(struct nft_ctx *ctx, int msg_type,
288 struct nft_trans *trans;
290 trans = nft_trans_alloc(ctx, msg_type, sizeof(struct nft_trans_set));
294 if (msg_type == NFT_MSG_NEWSET && ctx->nla[NFTA_SET_ID] != NULL) {
295 nft_trans_set_id(trans) =
296 ntohl(nla_get_be32(ctx->nla[NFTA_SET_ID]));
/* NOTE(review): the activation directly follows the id assignment, so it
 * appears to sit inside the same conditional -- confirm against the
 * complete file.
 */
297 nft_activate_next(ctx->net, set);
299 nft_trans_set(trans) = set;
300 list_add_tail(&trans->list, &ctx->net->nft.commit_list);
/* Queue deletion of @set: record an NFT_MSG_DELSET transaction, then
 * deactivate the set in the next generation.
 */
305 static int nft_delset(struct nft_ctx *ctx, struct nft_set *set)
309 err = nft_trans_set_add(ctx, NFT_MSG_DELSET, set);
313 nft_deactivate_next(ctx->net, set);
/* Allocate an object transaction for @obj and queue it on the commit list.
 * For NFT_MSG_NEWOBJ the object is additionally activated in the next
 * generation.
 */
319 static int nft_trans_obj_add(struct nft_ctx *ctx, int msg_type,
320 struct nft_object *obj)
322 struct nft_trans *trans;
324 trans = nft_trans_alloc(ctx, msg_type, sizeof(struct nft_trans_obj));
328 if (msg_type == NFT_MSG_NEWOBJ)
329 nft_activate_next(ctx->net, obj);
331 nft_trans_obj(trans) = obj;
332 list_add_tail(&trans->list, &ctx->net->nft.commit_list);
/* Queue deletion of @obj: record an NFT_MSG_DELOBJ transaction, then
 * deactivate the object in the next generation.
 */
337 static int nft_delobj(struct nft_ctx *ctx, struct nft_object *obj)
341 err = nft_trans_obj_add(ctx, NFT_MSG_DELOBJ, obj);
345 nft_deactivate_next(ctx->net, obj);
/* Search the family's table list for a table whose name equals the string
 * attribute @nla and which is active in @genmask.
 * NOTE(review): the return statements are not visible in this extract.
 */
355 static struct nft_table *nft_table_lookup(const struct nft_af_info *afi,
356 const struct nlattr *nla,
359 struct nft_table *table;
361 list_for_each_entry(table, &afi->tables, list) {
/* nla_strcmp() returns 0 on a match, hence the negation. */
362 if (!nla_strcmp(nla, table->name) &&
363 nft_active_genmask(table, genmask))
/* Error-pointer flavoured table lookup built on nft_table_lookup().
 * Visible error returns are ERR_PTR(-EINVAL) and ERR_PTR(-ENOENT).
 * NOTE(review): the guarding conditions are not visible; presumably
 * -EINVAL covers a missing attribute and -ENOENT an unknown table --
 * confirm.
 */
369 static struct nft_table *nf_tables_table_lookup(const struct nft_af_info *afi,
370 const struct nlattr *nla,
373 struct nft_table *table;
376 return ERR_PTR(-EINVAL);
378 table = nft_table_lookup(afi, nla, genmask);
382 return ERR_PTR(-ENOENT);
/* Hand out the next handle for @table. The generator is pre-incremented,
 * so the returned value is the updated counter.
 */
385 static inline u64 nf_tables_alloc_handle(struct nft_table *table)
387 return ++table->hgenerator;
/* Registered chain types, indexed by [family][type]. Slots are filled by
 * nft_register_chain_type() and cleared by nft_unregister_chain_type().
 */
390 static const struct nf_chain_type *chain_type[NFPROTO_NUMPROTO][NFT_CHAIN_T_MAX];
/* Return the registered chain type of @family whose name equals the string
 * attribute @nla. Empty slots are skipped.
 * NOTE(review): the not-found return is not visible in this extract.
 */
392 static const struct nf_chain_type *
393 __nf_tables_chain_type_lookup(int family, const struct nlattr *nla)
397 for (i = 0; i < NFT_CHAIN_T_MAX; i++) {
398 if (chain_type[family][i] != NULL &&
399 !nla_strcmp(nla, chain_type[family][i]->name))
400 return chain_type[family][i];
/* Chain type lookup with optional module autoloading.
 * When built with CONFIG_MODULES, a module named
 * "nft-chain-<family>-<name>" is requested and the lookup is retried.
 * Visible error returns are ERR_PTR(-EAGAIN) and ERR_PTR(-ENOENT).
 * NOTE(review): the conditions guarding the autoload attempt and each
 * return are not visible here.
 */
405 static const struct nf_chain_type *
406 nf_tables_chain_type_lookup(const struct nft_af_info *afi,
407 const struct nlattr *nla,
410 const struct nf_chain_type *type;
412 type = __nf_tables_chain_type_lookup(afi->family, nla);
415 #ifdef CONFIG_MODULES
/* The subsystem lock is dropped around request_module(). */
417 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
/* "%.*s" prints at most nla_len() bytes of the attribute payload;
 * presumably because the payload need not be NUL-terminated -- confirm.
 */
418 request_module("nft-chain-%u-%.*s", afi->family,
419 nla_len(nla), (const char *)nla_data(nla));
420 nfnl_lock(NFNL_SUBSYS_NFTABLES);
421 type = __nf_tables_chain_type_lookup(afi->family, nla);
423 return ERR_PTR(-EAGAIN);
426 return ERR_PTR(-ENOENT);
/* Netlink attribute policy for table messages: the name is a string of at
 * most NFT_TABLE_MAXNAMELEN - 1 bytes, the flags are a 32-bit value.
 */
429 static const struct nla_policy nft_table_policy[NFTA_TABLE_MAX + 1] = {
430 [NFTA_TABLE_NAME] = { .type = NLA_STRING,
431 .len = NFT_TABLE_MAXNAMELEN - 1 },
432 [NFTA_TABLE_FLAGS] = { .type = NLA_U32 },
/* Serialise @table into @skb as an nfnetlink message: an nfgenmsg header
 * followed by the table's name, flags and use count.
 * Attribute failures jump to nla_put_failure, where the message is
 * trimmed back to @nlh.
 * NOTE(review): the success/failure return statements are not visible.
 */
435 static int nf_tables_fill_table_info(struct sk_buff *skb, struct net *net,
436 u32 portid, u32 seq, int event, u32 flags,
437 int family, const struct nft_table *table)
439 struct nlmsghdr *nlh;
440 struct nfgenmsg *nfmsg;
/* Combine the subsystem id with the event to form the message type. */
442 event = nfnl_msg_type(NFNL_SUBSYS_NFTABLES, event);
443 nlh = nlmsg_put(skb, portid, seq, event, sizeof(struct nfgenmsg), flags);
445 goto nla_put_failure;
447 nfmsg = nlmsg_data(nlh);
448 nfmsg->nfgen_family = family;
449 nfmsg->version = NFNETLINK_V0;
/* res_id carries the low 16 bits of the netns base sequence. */
450 nfmsg->res_id = htons(net->nft.base_seq & 0xffff);
452 if (nla_put_string(skb, NFTA_TABLE_NAME, table->name) ||
453 nla_put_be32(skb, NFTA_TABLE_FLAGS, htonl(table->flags)) ||
454 nla_put_be32(skb, NFTA_TABLE_USE, htonl(table->use)))
455 goto nla_put_failure;
461 nlmsg_trim(skb, nlh);
/* Send a table @event notification to the NFNLGRP_NFTABLES multicast
 * group. The message is built with nf_tables_fill_table_info() and sent
 * with nfnetlink_send(); nfnetlink_set_err() reports -ENOBUFS to the
 * group (presumably on the failure path -- the labels are not visible).
 */
465 static void nf_tables_table_notify(const struct nft_ctx *ctx, int event)
/* Second half of a condition whose first half is not visible here. */
471 !nfnetlink_has_listeners(ctx->net, NFNLGRP_NFTABLES))
474 skb = nlmsg_new(NLMSG_GOODSIZE, GFP_KERNEL);
478 err = nf_tables_fill_table_info(skb, ctx->net, ctx->portid, ctx->seq,
479 event, 0, ctx->afi->family, ctx->table);
485 nfnetlink_send(skb, ctx->net, ctx->portid, NFNLGRP_NFTABLES,
486 ctx->report, GFP_KERNEL);
489 nfnetlink_set_err(ctx->net, ctx->portid, NFNLGRP_NFTABLES, -ENOBUFS);
/* Netlink dump callback emitting one message per table.
 * cb->args[0] is read as the resume index (s_idx); cb->seq is set from the
 * netns base sequence so nl_dump_check_consistent() can flag a dump that
 * spans a ruleset change.
 * NOTE(review): the index bookkeeping, RCU read-side markers and the
 * return value are not visible in this extract.
 */
492 static int nf_tables_dump_tables(struct sk_buff *skb,
493 struct netlink_callback *cb)
495 const struct nfgenmsg *nfmsg = nlmsg_data(cb->nlh);
496 const struct nft_af_info *afi;
497 const struct nft_table *table;
498 unsigned int idx = 0, s_idx = cb->args[0];
499 struct net *net = sock_net(skb->sk);
500 int family = nfmsg->nfgen_family;
503 cb->seq = net->nft.base_seq;
505 list_for_each_entry_rcu(afi, &net->nft.af_info, list) {
/* NFPROTO_UNSPEC in the request matches every family. */
506 if (family != NFPROTO_UNSPEC && family != afi->family)
509 list_for_each_entry_rcu(table, &afi->tables, list) {
/* Clear every callback argument except args[0]. */
513 memset(&cb->args[1], 0,
514 sizeof(cb->args) - sizeof(cb->args[0]));
515 if (!nft_is_active(net, table))
517 if (nf_tables_fill_table_info(skb, net,
518 NETLINK_CB(cb->skb).portid,
522 afi->family, table) < 0)
525 nl_dump_check_consistent(cb, nlmsg_hdr(skb));
/* NFT_MSG_GETTABLE handler.
 * With NLM_F_DUMP the request is handed to netlink_dump_start() with
 * nf_tables_dump_tables() as the dump callback. Otherwise the family
 * (no autoload) and the table are looked up in the current generation,
 * serialised as NFT_MSG_NEWTABLE into a fresh skb, and unicast back to
 * the requesting portid.
 */
536 static int nf_tables_gettable(struct net *net, struct sock *nlsk,
537 struct sk_buff *skb, const struct nlmsghdr *nlh,
538 const struct nlattr * const nla[],
539 struct netlink_ext_ack *extack)
541 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
542 u8 genmask = nft_genmask_cur(net);
543 const struct nft_af_info *afi;
544 const struct nft_table *table;
545 struct sk_buff *skb2;
546 int family = nfmsg->nfgen_family;
549 if (nlh->nlmsg_flags & NLM_F_DUMP) {
550 struct netlink_dump_control c = {
551 .dump = nf_tables_dump_tables,
553 return netlink_dump_start(nlsk, skb, nlh, &c);
556 afi = nf_tables_afinfo_lookup(net, family, false);
560 table = nf_tables_table_lookup(afi, nla[NFTA_TABLE_NAME], genmask);
562 return PTR_ERR(table);
564 skb2 = alloc_skb(NLMSG_GOODSIZE, GFP_KERNEL);
568 err = nf_tables_fill_table_info(skb2, net, NETLINK_CB(skb).portid,
569 nlh->nlmsg_seq, NFT_MSG_NEWTABLE, 0,
574 return nlmsg_unicast(nlsk, skb2, NETLINK_CB(skb).portid);
/* Unregister the hooks of the table's base chains that are active in the
 * next generation.
 * The visible test "cnt && i++ == cnt" only takes effect when the count
 * argument is non-zero; nf_tables_table_disable() passes 0 and
 * nf_tables_table_enable() passes its running counter.
 * NOTE(review): the action taken when that test fires is not visible
 * (presumably the loop stops) -- confirm.
 */
581 static void _nf_tables_table_disable(struct net *net,
582 const struct nft_af_info *afi,
583 struct nft_table *table,
586 struct nft_chain *chain;
589 list_for_each_entry(chain, &table->chains, list) {
590 if (!nft_is_active_next(net, chain))
592 if (!nft_is_base_chain(chain))
595 if (cnt && i++ == cnt)
598 nf_unregister_net_hooks(net, nft_base_chain(chain)->ops,
/* Register the hooks of every base chain of @table that is active in the
 * next generation.
 * The trailing _nf_tables_table_disable(..., i) call is presumably the
 * error path that rolls back the chains registered so far -- the label
 * and the counter update are not visible here.
 */
603 static int nf_tables_table_enable(struct net *net,
604 const struct nft_af_info *afi,
605 struct nft_table *table)
607 struct nft_chain *chain;
610 list_for_each_entry(chain, &table->chains, list) {
611 if (!nft_is_active_next(net, chain))
613 if (!nft_is_base_chain(chain))
616 err = nf_register_net_hooks(net, nft_base_chain(chain)->ops,
626 _nf_tables_table_disable(net, afi, table, i);
/* Disable the whole table: calls the helper with a count of 0, which
 * leaves its count test inactive.
 */
630 static void nf_tables_table_disable(struct net *net,
631 const struct nft_af_info *afi,
632 struct nft_table *table)
634 _nf_tables_table_disable(net, afi, table, 0);
/* Update the flags of an existing table (ctx->table) from
 * NFTA_TABLE_FLAGS and queue an NFT_MSG_NEWTABLE update transaction.
 *
 * Only NFT_TABLE_F_DORMANT is tested as a valid bit. Switching to dormant
 * is merely recorded in the transaction; switching from dormant registers
 * the hooks immediately and clears the flag on the table.
 * NOTE(review): the early-return values and the error label preceding the
 * final nft_trans_destroy() are not visible in this extract.
 */
637 static int nf_tables_updtable(struct nft_ctx *ctx)
639 struct nft_trans *trans;
643 if (!ctx->nla[NFTA_TABLE_FLAGS])
646 flags = ntohl(nla_get_be32(ctx->nla[NFTA_TABLE_FLAGS]));
/* Any bit other than DORMANT takes this branch. */
647 if (flags & ~NFT_TABLE_F_DORMANT)
/* Requested flags already match the table. */
650 if (flags == ctx->table->flags)
653 trans = nft_trans_alloc(ctx, NFT_MSG_NEWTABLE,
654 sizeof(struct nft_trans_table));
/* active -> dormant */
658 if ((flags & NFT_TABLE_F_DORMANT) &&
659 !(ctx->table->flags & NFT_TABLE_F_DORMANT)) {
660 nft_trans_table_enable(trans) = false;
/* dormant -> active */
661 } else if (!(flags & NFT_TABLE_F_DORMANT) &&
662 ctx->table->flags & NFT_TABLE_F_DORMANT) {
663 ret = nf_tables_table_enable(ctx->net, ctx->afi, ctx->table);
665 ctx->table->flags &= ~NFT_TABLE_F_DORMANT;
666 nft_trans_table_enable(trans) = true;
672 nft_trans_table_update(trans) = true;
673 list_add_tail(&trans->list, &ctx->net->nft.commit_list);
676 nft_trans_destroy(trans);
/* NFT_MSG_NEWTABLE handler: update an existing table or create a new one.
 *
 * Lookups use the next-generation mask and the family lookup may autoload.
 * If the table already exists, NLM_F_EXCL and NLM_F_REPLACE are tested
 * (their outcomes are not visible here) and the request is forwarded to
 * nf_tables_updtable(). Otherwise a table is allocated, named from the
 * attribute, queued as a transaction, and linked into the family's list.
 * A reference on the family's owner module is taken before allocation;
 * the trailing module_put() is presumably part of the error unwinding --
 * the labels are not visible.
 */
680 static int nf_tables_newtable(struct net *net, struct sock *nlsk,
681 struct sk_buff *skb, const struct nlmsghdr *nlh,
682 const struct nlattr * const nla[],
683 struct netlink_ext_ack *extack)
685 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
686 u8 genmask = nft_genmask_next(net);
687 const struct nlattr *name;
688 struct nft_af_info *afi;
689 struct nft_table *table;
690 int family = nfmsg->nfgen_family;
695 afi = nf_tables_afinfo_lookup(net, family, true);
699 name = nla[NFTA_TABLE_NAME];
700 table = nf_tables_table_lookup(afi, name, genmask);
/* Errors other than "no such table" are passed back to the caller. */
702 if (PTR_ERR(table) != -ENOENT)
703 return PTR_ERR(table);
705 if (nlh->nlmsg_flags & NLM_F_EXCL)
707 if (nlh->nlmsg_flags & NLM_F_REPLACE)
710 nft_ctx_init(&ctx, net, skb, nlh, afi, table, NULL, nla);
711 return nf_tables_updtable(&ctx);
/* Creation path: only the DORMANT bit is tested as a valid flag. */
714 if (nla[NFTA_TABLE_FLAGS]) {
715 flags = ntohl(nla_get_be32(nla[NFTA_TABLE_FLAGS]));
716 if (flags & ~NFT_TABLE_F_DORMANT)
721 if (!try_module_get(afi->owner))
725 table = kzalloc(sizeof(*table), GFP_KERNEL);
729 table->name = nla_strdup(name, GFP_KERNEL);
730 if (table->name == NULL)
733 INIT_LIST_HEAD(&table->chains);
734 INIT_LIST_HEAD(&table->sets);
735 INIT_LIST_HEAD(&table->objects);
736 table->flags = flags;
738 nft_ctx_init(&ctx, net, skb, nlh, afi, table, NULL, nla);
739 err = nft_trans_table_add(&ctx, NFT_MSG_NEWTABLE);
743 list_add_tail_rcu(&table->list, &afi->tables);
750 module_put(afi->owner);
/* Queue deletion of everything inside ctx->table and then of the table
 * itself, in this order: rules of each chain, sets, objects, chains,
 * table. Chains and sets that are not active in the next generation take
 * the skip branch.
 * NOTE(review): the ctx->chain assignments and error exits are not
 * visible in this extract.
 */
755 static int nft_flush_table(struct nft_ctx *ctx)
758 struct nft_chain *chain, *nc;
759 struct nft_object *obj, *ne;
760 struct nft_set *set, *ns;
762 list_for_each_entry(chain, &ctx->table->chains, list) {
763 if (!nft_is_active_next(ctx->net, chain))
768 err = nft_delrule_by_chain(ctx);
773 list_for_each_entry_safe(set, ns, &ctx->table->sets, list) {
774 if (!nft_is_active_next(ctx->net, set))
/* Anonymous sets that still have bindings get special treatment here;
 * presumably they are skipped -- the branch body is not visible.
 */
777 if (set->flags & NFT_SET_ANONYMOUS &&
778 !list_empty(&set->bindings))
781 err = nft_delset(ctx, set);
786 list_for_each_entry_safe(obj, ne, &ctx->table->objects, list) {
787 err = nft_delobj(ctx, obj);
792 list_for_each_entry_safe(chain, nc, &ctx->table->chains, list) {
793 if (!nft_is_active_next(ctx->net, chain))
798 err = nft_delchain(ctx);
803 err = nft_deltable(ctx);
/* Flush tables across families. @family == AF_UNSPEC matches every
 * family; when NFTA_TABLE_NAME is present only tables with that name are
 * flushed. Tables not active in the next generation take the skip branch.
 * NOTE(review): the ctx->afi / ctx->table assignments and error exits are
 * not visible in this extract.
 */
808 static int nft_flush(struct nft_ctx *ctx, int family)
810 struct nft_af_info *afi;
811 struct nft_table *table, *nt;
812 const struct nlattr * const *nla = ctx->nla;
815 list_for_each_entry(afi, &ctx->net->nft.af_info, list) {
816 if (family != AF_UNSPEC && afi->family != family)
820 list_for_each_entry_safe(table, nt, &afi->tables, list) {
821 if (!nft_is_active_next(ctx->net, table))
824 if (nla[NFTA_TABLE_NAME] &&
825 nla_strcmp(nla[NFTA_TABLE_NAME], table->name) != 0)
830 err = nft_flush_table(ctx);
/* NFT_MSG_DELTABLE handler.
 * Without a specific family or without a table name the request becomes a
 * bulk flush via nft_flush(). Otherwise the named table is looked up in
 * the next generation and flushed with nft_flush_table().
 * NOTE(review): the second half of the NLM_F_NONREC condition and the ctx
 * updates before the final flush are not visible in this extract.
 */
839 static int nf_tables_deltable(struct net *net, struct sock *nlsk,
840 struct sk_buff *skb, const struct nlmsghdr *nlh,
841 const struct nlattr * const nla[],
842 struct netlink_ext_ack *extack)
844 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
845 u8 genmask = nft_genmask_next(net);
846 struct nft_af_info *afi;
847 struct nft_table *table;
848 int family = nfmsg->nfgen_family;
/* afi, table and chain are passed as NULL at this point. */
851 nft_ctx_init(&ctx, net, skb, nlh, NULL, NULL, NULL, nla);
852 if (family == AF_UNSPEC || nla[NFTA_TABLE_NAME] == NULL)
853 return nft_flush(&ctx, family);
855 afi = nf_tables_afinfo_lookup(net, family, false);
859 table = nf_tables_table_lookup(afi, nla[NFTA_TABLE_NAME], genmask);
861 return PTR_ERR(table);
863 if (nlh->nlmsg_flags & NLM_F_NONREC &&
870 return nft_flush_table(&ctx);
/* Final teardown of ctx->table. The table must no longer be in use
 * (BUG otherwise). Frees the name and drops the reference on the family's
 * owner module, matching the try_module_get() in nf_tables_newtable().
 * NOTE(review): freeing of the table structure itself is not visible.
 */
873 static void nf_tables_table_destroy(struct nft_ctx *ctx)
875 BUG_ON(ctx->table->use > 0);
877 kfree(ctx->table->name);
879 module_put(ctx->afi->owner);
/* Register @ctype in the chain_type table at [family][type], under the
 * nfnetlink nftables subsystem lock. An already occupied slot takes the
 * error branch (its body is not visible here).
 * NOTE(review): only ctype->family is visibly range-checked; no bound
 * check on ctype->type against NFT_CHAIN_T_MAX is visible -- confirm.
 */
882 int nft_register_chain_type(const struct nf_chain_type *ctype)
886 if (WARN_ON(ctype->family >= NFPROTO_NUMPROTO))
889 nfnl_lock(NFNL_SUBSYS_NFTABLES);
890 if (chain_type[ctype->family][ctype->type] != NULL) {
894 chain_type[ctype->family][ctype->type] = ctype;
896 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
899 EXPORT_SYMBOL_GPL(nft_register_chain_type);
/* Clear the chain_type slot occupied by @ctype, under the nfnetlink
 * nftables subsystem lock.
 */
901 void nft_unregister_chain_type(const struct nf_chain_type *ctype)
903 nfnl_lock(NFNL_SUBSYS_NFTABLES);
904 chain_type[ctype->family][ctype->type] = NULL;
905 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
907 EXPORT_SYMBOL_GPL(nft_unregister_chain_type);
/* Find the chain of @table with the given @handle that is active in the
 * supplied generation mask. Returns ERR_PTR(-ENOENT) when the list walk
 * finds nothing.
 */
913 static struct nft_chain *
914 nf_tables_chain_lookup_byhandle(const struct nft_table *table, u64 handle,
917 struct nft_chain *chain;
919 list_for_each_entry(chain, &table->chains, list) {
920 if (chain->handle == handle &&
921 nft_active_genmask(chain, genmask))
925 return ERR_PTR(-ENOENT);
/* Find the chain of @table whose name equals the string attribute @nla
 * and which is active in the supplied generation mask.
 * Returns ERR_PTR(-ENOENT) when nothing matches; ERR_PTR(-EINVAL) is
 * returned earlier, presumably for a missing attribute (the condition is
 * not visible here).
 */
928 static struct nft_chain *nf_tables_chain_lookup(const struct nft_table *table,
929 const struct nlattr *nla,
932 struct nft_chain *chain;
935 return ERR_PTR(-EINVAL);
937 list_for_each_entry(chain, &table->chains, list) {
938 if (!nla_strcmp(nla, chain->name) &&
939 nft_active_genmask(chain, genmask))
943 return ERR_PTR(-ENOENT);
/* Netlink attribute policy for chain messages. Table and chain names are
 * length-limited strings; the chain type string carries no length limit
 * in this policy. Hook and counters are nested attributes.
 */
946 static const struct nla_policy nft_chain_policy[NFTA_CHAIN_MAX + 1] = {
947 [NFTA_CHAIN_TABLE] = { .type = NLA_STRING,
948 .len = NFT_TABLE_MAXNAMELEN - 1 },
949 [NFTA_CHAIN_HANDLE] = { .type = NLA_U64 },
950 [NFTA_CHAIN_NAME] = { .type = NLA_STRING,
951 .len = NFT_CHAIN_MAXNAMELEN - 1 },
952 [NFTA_CHAIN_HOOK] = { .type = NLA_NESTED },
953 [NFTA_CHAIN_POLICY] = { .type = NLA_U32 },
954 [NFTA_CHAIN_TYPE] = { .type = NLA_STRING },
955 [NFTA_CHAIN_COUNTERS] = { .type = NLA_NESTED },
/* Policy for the attributes nested inside NFTA_CHAIN_HOOK. The device
 * name is limited to IFNAMSIZ - 1 bytes.
 */
958 static const struct nla_policy nft_hook_policy[NFTA_HOOK_MAX + 1] = {
959 [NFTA_HOOK_HOOKNUM] = { .type = NLA_U32 },
960 [NFTA_HOOK_PRIORITY] = { .type = NLA_U32 },
961 [NFTA_HOOK_DEV] = { .type = NLA_STRING,
962 .len = IFNAMSIZ - 1 },
/* Emit the chain counters as a nested NFTA_CHAIN_COUNTERS attribute.
 * Per-cpu values are read inside a u64_stats fetch/retry loop and summed
 * into a local total before being written as big-endian 64-bit values.
 * NOTE(review): the packet accumulation line, the padding arguments of
 * nla_put_be64() and the return statements are not visible here.
 */
965 static int nft_dump_stats(struct sk_buff *skb, struct nft_stats __percpu *stats)
967 struct nft_stats *cpu_stats, total;
973 memset(&total, 0, sizeof(total));
974 for_each_possible_cpu(cpu) {
975 cpu_stats = per_cpu_ptr(stats, cpu);
/* Re-read both counters if a writer updated them during the snapshot. */
977 seq = u64_stats_fetch_begin_irq(&cpu_stats->syncp);
978 pkts = cpu_stats->pkts;
979 bytes = cpu_stats->bytes;
980 } while (u64_stats_fetch_retry_irq(&cpu_stats->syncp, seq));
982 total.bytes += bytes;
984 nest = nla_nest_start(skb, NFTA_CHAIN_COUNTERS);
986 goto nla_put_failure;
988 if (nla_put_be64(skb, NFTA_COUNTER_PACKETS, cpu_to_be64(total.pkts),
990 nla_put_be64(skb, NFTA_COUNTER_BYTES, cpu_to_be64(total.bytes),
992 goto nla_put_failure;
994 nla_nest_end(skb, nest);
/* Serialise @chain into @skb as an nfnetlink message.
 * Every chain gets table name, handle, chain name and use count. Base
 * chains additionally get a nested hook description (hook number,
 * priority, optional device name), the policy, the chain type name and,
 * when present, the counters.
 * Any attribute failure jumps to nla_put_failure, where the message is
 * trimmed back to @nlh.
 * NOTE(review): the return statements are not visible in this extract.
 */
1001 static int nf_tables_fill_chain_info(struct sk_buff *skb, struct net *net,
1002 u32 portid, u32 seq, int event, u32 flags,
1003 int family, const struct nft_table *table,
1004 const struct nft_chain *chain)
1006 struct nlmsghdr *nlh;
1007 struct nfgenmsg *nfmsg;
1009 event = nfnl_msg_type(NFNL_SUBSYS_NFTABLES, event);
1010 nlh = nlmsg_put(skb, portid, seq, event, sizeof(struct nfgenmsg), flags);
1012 goto nla_put_failure;
1014 nfmsg = nlmsg_data(nlh);
1015 nfmsg->nfgen_family = family;
1016 nfmsg->version = NFNETLINK_V0;
/* res_id carries the low 16 bits of the netns base sequence. */
1017 nfmsg->res_id = htons(net->nft.base_seq & 0xffff);
1019 if (nla_put_string(skb, NFTA_CHAIN_TABLE, table->name))
1020 goto nla_put_failure;
1021 if (nla_put_be64(skb, NFTA_CHAIN_HANDLE, cpu_to_be64(chain->handle),
1023 goto nla_put_failure;
1024 if (nla_put_string(skb, NFTA_CHAIN_NAME, chain->name))
1025 goto nla_put_failure;
1027 if (nft_is_base_chain(chain)) {
1028 const struct nft_base_chain *basechain = nft_base_chain(chain);
/* Hook number and priority are reported from the first ops entry. */
1029 const struct nf_hook_ops *ops = &basechain->ops[0];
1030 struct nlattr *nest;
1032 nest = nla_nest_start(skb, NFTA_CHAIN_HOOK);
1034 goto nla_put_failure;
1035 if (nla_put_be32(skb, NFTA_HOOK_HOOKNUM, htonl(ops->hooknum)))
1036 goto nla_put_failure;
1037 if (nla_put_be32(skb, NFTA_HOOK_PRIORITY, htonl(ops->priority)))
1038 goto nla_put_failure;
/* The device attribute is only emitted for a non-empty dev_name. */
1039 if (basechain->dev_name[0] &&
1040 nla_put_string(skb, NFTA_HOOK_DEV, basechain->dev_name))
1041 goto nla_put_failure;
1042 nla_nest_end(skb, nest);
1044 if (nla_put_be32(skb, NFTA_CHAIN_POLICY,
1045 htonl(basechain->policy)))
1046 goto nla_put_failure;
1048 if (nla_put_string(skb, NFTA_CHAIN_TYPE, basechain->type->name))
1049 goto nla_put_failure;
1051 if (basechain->stats && nft_dump_stats(skb, basechain->stats))
1052 goto nla_put_failure;
1055 if (nla_put_be32(skb, NFTA_CHAIN_USE, htonl(chain->use)))
1056 goto nla_put_failure;
1058 nlmsg_end(skb, nlh);
1062 nlmsg_trim(skb, nlh);
/* Send a chain @event notification to the NFNLGRP_NFTABLES multicast
 * group. The message is built with nf_tables_fill_chain_info() and sent
 * with nfnetlink_send(); nfnetlink_set_err() reports -ENOBUFS to the
 * group (presumably on the failure path -- the labels are not visible).
 */
1066 static void nf_tables_chain_notify(const struct nft_ctx *ctx, int event)
1068 struct sk_buff *skb;
/* Second half of a condition whose first half is not visible here. */
1072 !nfnetlink_has_listeners(ctx->net, NFNLGRP_NFTABLES))
1075 skb = nlmsg_new(NLMSG_GOODSIZE, GFP_KERNEL);
1079 err = nf_tables_fill_chain_info(skb, ctx->net, ctx->portid, ctx->seq,
1080 event, 0, ctx->afi->family, ctx->table,
1087 nfnetlink_send(skb, ctx->net, ctx->portid, NFNLGRP_NFTABLES,
1088 ctx->report, GFP_KERNEL);
1091 nfnetlink_set_err(ctx->net, ctx->portid, NFNLGRP_NFTABLES, -ENOBUFS);
/* Netlink dump callback emitting one message per chain, walking
 * families, then tables, then chains with the RCU list iterators.
 * cb->args[0] is read as the resume index (s_idx); cb->seq is set from
 * the netns base sequence for nl_dump_check_consistent().
 * NOTE(review): the index bookkeeping, RCU read-side markers and the
 * return value are not visible in this extract.
 */
1094 static int nf_tables_dump_chains(struct sk_buff *skb,
1095 struct netlink_callback *cb)
1097 const struct nfgenmsg *nfmsg = nlmsg_data(cb->nlh);
1098 const struct nft_af_info *afi;
1099 const struct nft_table *table;
1100 const struct nft_chain *chain;
1101 unsigned int idx = 0, s_idx = cb->args[0];
1102 struct net *net = sock_net(skb->sk);
1103 int family = nfmsg->nfgen_family;
1106 cb->seq = net->nft.base_seq;
1108 list_for_each_entry_rcu(afi, &net->nft.af_info, list) {
/* NFPROTO_UNSPEC in the request matches every family. */
1109 if (family != NFPROTO_UNSPEC && family != afi->family)
1112 list_for_each_entry_rcu(table, &afi->tables, list) {
1113 list_for_each_entry_rcu(chain, &table->chains, list) {
/* Clear every callback argument except args[0]. */
1117 memset(&cb->args[1], 0,
1118 sizeof(cb->args) - sizeof(cb->args[0]));
1119 if (!nft_is_active(net, chain))
1121 if (nf_tables_fill_chain_info(skb, net,
1122 NETLINK_CB(cb->skb).portid,
1126 afi->family, table, chain) < 0)
1129 nl_dump_check_consistent(cb, nlmsg_hdr(skb));
/* NFT_MSG_GETCHAIN handler.
 * With NLM_F_DUMP the request is handed to netlink_dump_start() with
 * nf_tables_dump_chains() as the dump callback. Otherwise family (no
 * autoload), table and chain are looked up in the current generation, the
 * chain is serialised as NFT_MSG_NEWCHAIN into a fresh skb, and the
 * reply is unicast to the requesting portid.
 */
1141 static int nf_tables_getchain(struct net *net, struct sock *nlsk,
1142 struct sk_buff *skb, const struct nlmsghdr *nlh,
1143 const struct nlattr * const nla[],
1144 struct netlink_ext_ack *extack)
1146 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
1147 u8 genmask = nft_genmask_cur(net);
1148 const struct nft_af_info *afi;
1149 const struct nft_table *table;
1150 const struct nft_chain *chain;
1151 struct sk_buff *skb2;
1152 int family = nfmsg->nfgen_family;
1155 if (nlh->nlmsg_flags & NLM_F_DUMP) {
1156 struct netlink_dump_control c = {
1157 .dump = nf_tables_dump_chains,
1159 return netlink_dump_start(nlsk, skb, nlh, &c);
1162 afi = nf_tables_afinfo_lookup(net, family, false);
1164 return PTR_ERR(afi);
1166 table = nf_tables_table_lookup(afi, nla[NFTA_CHAIN_TABLE], genmask);
1168 return PTR_ERR(table);
1170 chain = nf_tables_chain_lookup(table, nla[NFTA_CHAIN_NAME], genmask);
1172 return PTR_ERR(chain);
1174 skb2 = alloc_skb(NLMSG_GOODSIZE, GFP_KERNEL);
1178 err = nf_tables_fill_chain_info(skb2, net, NETLINK_CB(skb).portid,
1179 nlh->nlmsg_seq, NFT_MSG_NEWCHAIN, 0,
1180 family, table, chain);
1184 return nlmsg_unicast(nlsk, skb2, NETLINK_CB(skb).portid);
/* Policy for the attributes nested inside NFTA_CHAIN_COUNTERS: both
 * counters are 64-bit values.
 */
1191 static const struct nla_policy nft_counter_policy[NFTA_COUNTER_MAX + 1] = {
1192 [NFTA_COUNTER_PACKETS] = { .type = NLA_U64 },
1193 [NFTA_COUNTER_BYTES] = { .type = NLA_U64 },
/* Allocate per-cpu chain counters and seed them from the nested counter
 * attribute @attr.
 * Both NFTA_COUNTER_BYTES and NFTA_COUNTER_PACKETS must be present,
 * otherwise ERR_PTR(-EINVAL) is returned; allocation failure yields
 * ERR_PTR(-ENOMEM); a parse error is passed through as ERR_PTR(err).
 * The supplied totals are stored into the current CPU's slot only.
 * NOTE(review): the success return is not visible in this extract.
 */
1196 static struct nft_stats __percpu *nft_stats_alloc(const struct nlattr *attr)
1198 struct nlattr *tb[NFTA_COUNTER_MAX+1];
1199 struct nft_stats __percpu *newstats;
1200 struct nft_stats *stats;
1203 err = nla_parse_nested(tb, NFTA_COUNTER_MAX, attr, nft_counter_policy,
1206 return ERR_PTR(err);
1208 if (!tb[NFTA_COUNTER_BYTES] || !tb[NFTA_COUNTER_PACKETS])
1209 return ERR_PTR(-EINVAL);
1211 newstats = netdev_alloc_pcpu_stats(struct nft_stats);
1212 if (newstats == NULL)
1213 return ERR_PTR(-ENOMEM);
1215 /* Restore old counters on this cpu, no problem. Per-cpu statistics
1216 * are not exposed to userspace.
1219 stats = this_cpu_ptr(newstats);
1220 stats->bytes = be64_to_cpu(nla_get_be64(tb[NFTA_COUNTER_BYTES]));
1221 stats->pkts = be64_to_cpu(nla_get_be64(tb[NFTA_COUNTER_PACKETS]));
/* Publish @newstats as the counters of @chain. A NULL @newstats takes the
 * early branch. One path saves the old pointer, publishes the new one and
 * frees the old per-cpu area; the other only publishes the new pointer.
 * NOTE(review): the condition selecting between the two paths and any
 * grace-period wait between publishing and free_percpu() are not visible
 * in this extract -- confirm against the complete file.
 */
1227 static void nft_chain_stats_replace(struct nft_base_chain *chain,
1228 struct nft_stats __percpu *newstats)
1230 if (newstats == NULL)
1234 struct nft_stats __percpu *oldstats =
1235 nft_dereference(chain->stats);
1237 rcu_assign_pointer(chain->stats, newstats);
1239 free_percpu(oldstats);
1241 rcu_assign_pointer(chain->stats, newstats);
/* Final teardown of @chain; the chain must no longer be in use (BUG
 * otherwise). For base chains this drops the chain type's module
 * reference, frees the per-cpu counters, decrements the
 * nft_counters_enabled static branch when counters existed, and releases
 * the device reference held in ops[0].
 * NOTE(review): freeing of the chain name and structure is not visible
 * in this extract.
 */
1244 static void nf_tables_chain_destroy(struct nft_chain *chain)
1246 BUG_ON(chain->use > 0);
1248 if (nft_is_base_chain(chain)) {
1249 struct nft_base_chain *basechain = nft_base_chain(chain);
1251 module_put(basechain->type->owner);
1252 free_percpu(basechain->stats);
/* Only the pointer value is tested after the free; it is not
 * dereferenced here.
 */
1253 if (basechain->stats)
1254 static_branch_dec(&nft_counters_enabled);
1255 if (basechain->ops[0].dev != NULL)
1256 dev_put(basechain->ops[0].dev);
/* Parsed hook description produced by nft_chain_parse_hook(). The code
 * in this file also accesses ->num and ->priority members whose
 * declarations are not visible in this extract.
 */
1265 struct nft_chain_hook {
1268 const struct nf_chain_type *type;
1269 struct net_device *dev;
/* Parse the nested NFTA_CHAIN_HOOK attribute into @hook.
 *
 * Hook number and priority attributes are both tested for presence; the
 * hook number is compared against afi->nhooks. The chain type defaults to
 * the family's NFT_CHAIN_T_DEFAULT entry and can be overridden by
 * NFTA_CHAIN_TYPE; the type's hook_mask is tested for the requested hook.
 * A reference on the type's owner module is taken; every later failure
 * branch visible here drops it again with module_put().
 * Families flagged NFT_AF_NEEDS_DEV look the device up by name; for other
 * families a supplied NFTA_HOOK_DEV takes a failure branch.
 * NOTE(review): the error codes and the final assignments to @hook are
 * not visible in this extract.
 */
1272 static int nft_chain_parse_hook(struct net *net,
1273 const struct nlattr * const nla[],
1274 struct nft_af_info *afi,
1275 struct nft_chain_hook *hook, bool create)
1277 struct nlattr *ha[NFTA_HOOK_MAX + 1];
1278 const struct nf_chain_type *type;
1279 struct net_device *dev;
1282 err = nla_parse_nested(ha, NFTA_HOOK_MAX, nla[NFTA_CHAIN_HOOK],
1283 nft_hook_policy, NULL);
1287 if (ha[NFTA_HOOK_HOOKNUM] == NULL ||
1288 ha[NFTA_HOOK_PRIORITY] == NULL)
1291 hook->num = ntohl(nla_get_be32(ha[NFTA_HOOK_HOOKNUM]));
1292 if (hook->num >= afi->nhooks)
1295 hook->priority = ntohl(nla_get_be32(ha[NFTA_HOOK_PRIORITY]));
1297 type = chain_type[afi->family][NFT_CHAIN_T_DEFAULT];
1298 if (nla[NFTA_CHAIN_TYPE]) {
1299 type = nf_tables_chain_type_lookup(afi, nla[NFTA_CHAIN_TYPE],
1302 return PTR_ERR(type);
/* The chain type must list this hook number in its hook_mask. */
1304 if (!(type->hook_mask & (1 << hook->num)))
1306 if (!try_module_get(type->owner))
1312 if (afi->flags & NFT_AF_NEEDS_DEV) {
1313 char ifname[IFNAMSIZ];
1315 if (!ha[NFTA_HOOK_DEV]) {
1316 module_put(type->owner);
1320 nla_strlcpy(ifname, ha[NFTA_HOOK_DEV], IFNAMSIZ);
1321 dev = dev_get_by_name(net, ifname);
1323 module_put(type->owner);
1327 } else if (ha[NFTA_HOOK_DEV]) {
1328 module_put(type->owner);
/* Drop the references held by a parsed hook: the chain type's owner
 * module and, when a device is set, the device (the release call itself
 * is not visible in this extract).
 */
1335 static void nft_chain_release_hook(struct nft_chain_hook *hook)
1337 module_put(hook->type->owner);
1338 if (hook->dev != NULL)
/* Create a new chain in ctx->table.
 *
 * With NFTA_CHAIN_HOOK the chain is a base chain: the hook is parsed, a
 * nft_base_chain is allocated, optional counters are installed (bumping
 * nft_counters_enabled), and each of the family's afi->nops hook ops is
 * filled in. Otherwise a plain nft_chain is allocated.
 * The chain then gets a handle and a name, its hooks are registered, a
 * NFT_MSG_NEWCHAIN transaction is queued and the chain is linked into the
 * table's list. The trailing unregister/destroy calls are presumably the
 * error unwinding -- the labels are not visible.
 * NOTE(review): error codes, several frees and the use of the local
 * hookfn after it is assigned are not visible in this extract.
 */
1342 static int nf_tables_addchain(struct nft_ctx *ctx, u8 family, u8 genmask,
1343 u8 policy, bool create)
1345 const struct nlattr * const *nla = ctx->nla;
1346 struct nft_table *table = ctx->table;
1347 struct nft_af_info *afi = ctx->afi;
1348 struct nft_base_chain *basechain;
1349 struct nft_stats __percpu *stats;
1350 struct net *net = ctx->net;
1351 struct nft_chain *chain;
/* Guard against the table use counter being at its maximum. */
1355 if (table->use == UINT_MAX)
1358 if (nla[NFTA_CHAIN_HOOK]) {
1359 struct nft_chain_hook hook;
1360 struct nf_hook_ops *ops;
1363 err = nft_chain_parse_hook(net, nla, afi, &hook, create);
1367 basechain = kzalloc(sizeof(*basechain), GFP_KERNEL);
1368 if (basechain == NULL) {
1369 nft_chain_release_hook(&hook);
1373 if (hook.dev != NULL)
1374 strncpy(basechain->dev_name, hook.dev->name, IFNAMSIZ);
1376 if (nla[NFTA_CHAIN_COUNTERS]) {
1377 stats = nft_stats_alloc(nla[NFTA_CHAIN_COUNTERS]);
1378 if (IS_ERR(stats)) {
1379 nft_chain_release_hook(&hook);
1381 return PTR_ERR(stats);
1383 basechain->stats = stats;
1384 static_branch_inc(&nft_counters_enabled);
1387 hookfn = hook.type->hooks[hook.num];
1388 basechain->type = hook.type;
1389 chain = &basechain->chain;
/* Every ops entry shares the same hook number, priority and device. */
1391 for (i = 0; i < afi->nops; i++) {
1392 ops = &basechain->ops[i];
1394 ops->hooknum = hook.num;
1395 ops->priority = hook.priority;
1397 ops->hook = afi->hooks[ops->hooknum];
1398 ops->dev = hook.dev;
1401 if (afi->hook_ops_init)
1402 afi->hook_ops_init(ops, i);
1405 chain->flags |= NFT_BASE_CHAIN;
1406 basechain->policy = policy;
1408 chain = kzalloc(sizeof(*chain), GFP_KERNEL);
1412 INIT_LIST_HEAD(&chain->rules);
1413 chain->handle = nf_tables_alloc_handle(table);
1414 chain->table = table;
1415 chain->name = nla_strdup(nla[NFTA_CHAIN_NAME], GFP_KERNEL);
1421 err = nf_tables_register_hooks(net, table, chain, afi->nops);
1426 err = nft_trans_chain_add(ctx, NFT_MSG_NEWCHAIN);
1431 list_add_tail_rcu(&chain->list, &table->chains);
1435 nf_tables_unregister_hooks(net, table, chain, afi->nops);
1437 nf_tables_chain_destroy(chain);
/* Update an existing chain (ctx->chain) and queue the change as a
 * NFT_MSG_NEWCHAIN update transaction.
 *
 * A supplied NFTA_CHAIN_HOOK is parsed only to be compared against the
 * existing base chain (type, hook number, priority, device for every
 * ops entry); the parsed hook is released on every visible path.
 * When both handle and name are supplied the name is looked up first; a
 * successful lookup takes a failure branch (presumably "name already
 * exists"), and later the name is duplicated into the transaction.
 * Counters are tested against the chain being a base chain.
 * NOTE(review): error codes and the cleanup on allocation failures are
 * not visible in this extract.
 */
1442 static int nf_tables_updchain(struct nft_ctx *ctx, u8 genmask, u8 policy,
1445 const struct nlattr * const *nla = ctx->nla;
1446 struct nft_table *table = ctx->table;
1447 struct nft_chain *chain = ctx->chain;
1448 struct nft_af_info *afi = ctx->afi;
1449 struct nft_base_chain *basechain;
1450 struct nft_stats *stats = NULL;
1451 struct nft_chain_hook hook;
1452 const struct nlattr *name;
1453 struct nf_hook_ops *ops;
1454 struct nft_trans *trans;
1457 if (nla[NFTA_CHAIN_HOOK]) {
1458 if (!nft_is_base_chain(chain))
1461 err = nft_chain_parse_hook(ctx->net, nla, ctx->afi, &hook,
1466 basechain = nft_base_chain(chain);
1467 if (basechain->type != hook.type) {
1468 nft_chain_release_hook(&hook);
1472 for (i = 0; i < afi->nops; i++) {
1473 ops = &basechain->ops[i];
1474 if (ops->hooknum != hook.num ||
1475 ops->priority != hook.priority ||
1476 ops->dev != hook.dev) {
1477 nft_chain_release_hook(&hook);
1481 nft_chain_release_hook(&hook);
/* Rename request: handle selects the chain, name is the new name. */
1484 if (nla[NFTA_CHAIN_HANDLE] &&
1485 nla[NFTA_CHAIN_NAME]) {
1486 struct nft_chain *chain2;
1488 chain2 = nf_tables_chain_lookup(table, nla[NFTA_CHAIN_NAME],
1490 if (!IS_ERR(chain2))
1494 if (nla[NFTA_CHAIN_COUNTERS]) {
1495 if (!nft_is_base_chain(chain))
1498 stats = nft_stats_alloc(nla[NFTA_CHAIN_COUNTERS]);
1500 return PTR_ERR(stats);
1503 trans = nft_trans_alloc(ctx, NFT_MSG_NEWCHAIN,
1504 sizeof(struct nft_trans_chain));
1505 if (trans == NULL) {
1510 nft_trans_chain_stats(trans) = stats;
1511 nft_trans_chain_update(trans) = true;
/* Without a policy attribute the transaction stores -1; presumably a
 * "leave policy unchanged" marker for the commit path -- confirm.
 */
1513 if (nla[NFTA_CHAIN_POLICY])
1514 nft_trans_chain_policy(trans) = policy;
1516 nft_trans_chain_policy(trans) = -1;
1518 name = nla[NFTA_CHAIN_NAME];
1519 if (nla[NFTA_CHAIN_HANDLE] && name) {
1520 nft_trans_chain_name(trans) =
1521 nla_strdup(name, GFP_KERNEL);
1522 if (!nft_trans_chain_name(trans)) {
1528 list_add_tail(&trans->list, &ctx->net->nft.commit_list);
/* NFT_MSG_NEWCHAIN handler: dispatch to chain update or chain creation.
 *
 * The family (autoload allowed) and table are looked up in the next
 * generation. The chain is located by handle when NFTA_CHAIN_HANDLE is
 * present, otherwise by name; a by-name result other than -ENOENT is
 * returned as an error. A policy attribute is tested against the chain
 * being (or becoming, via NFTA_CHAIN_HOOK) a base chain.
 * An existing chain goes to nf_tables_updchain() after the NLM_F_EXCL /
 * NLM_F_REPLACE tests; otherwise nf_tables_addchain() creates it.
 * NOTE(review): error codes, policy value validation and the place where
 * chain is reset for the not-found case are not visible in this extract.
 */
1533 static int nf_tables_newchain(struct net *net, struct sock *nlsk,
1534 struct sk_buff *skb, const struct nlmsghdr *nlh,
1535 const struct nlattr * const nla[],
1536 struct netlink_ext_ack *extack)
1538 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
1539 const struct nlattr * uninitialized_var(name);
1540 u8 genmask = nft_genmask_next(net);
1541 int family = nfmsg->nfgen_family;
1542 struct nft_af_info *afi;
1543 struct nft_table *table;
1544 struct nft_chain *chain;
/* Default policy when no NFTA_CHAIN_POLICY attribute is supplied. */
1545 u8 policy = NF_ACCEPT;
1550 create = nlh->nlmsg_flags & NLM_F_CREATE ? true : false;
1552 afi = nf_tables_afinfo_lookup(net, family, true);
1554 return PTR_ERR(afi);
1556 table = nf_tables_table_lookup(afi, nla[NFTA_CHAIN_TABLE], genmask);
1558 return PTR_ERR(table);
1561 name = nla[NFTA_CHAIN_NAME];
1563 if (nla[NFTA_CHAIN_HANDLE]) {
1564 handle = be64_to_cpu(nla_get_be64(nla[NFTA_CHAIN_HANDLE]));
1565 chain = nf_tables_chain_lookup_byhandle(table, handle, genmask);
1567 return PTR_ERR(chain);
1569 chain = nf_tables_chain_lookup(table, name, genmask);
1570 if (IS_ERR(chain)) {
1571 if (PTR_ERR(chain) != -ENOENT)
1572 return PTR_ERR(chain);
1577 if (nla[NFTA_CHAIN_POLICY]) {
1578 if (chain != NULL &&
1579 !nft_is_base_chain(chain))
1582 if (chain == NULL &&
1583 nla[NFTA_CHAIN_HOOK] == NULL)
1586 policy = ntohl(nla_get_be32(nla[NFTA_CHAIN_POLICY]));
1596 nft_ctx_init(&ctx, net, skb, nlh, afi, table, chain, nla);
1598 if (chain != NULL) {
1599 if (nlh->nlmsg_flags & NLM_F_EXCL)
1601 if (nlh->nlmsg_flags & NLM_F_REPLACE)
1604 return nf_tables_updchain(&ctx, genmask, policy, create);
1607 return nf_tables_addchain(&ctx, family, genmask, policy, create);
/*
 * nf_tables_delchain - netlink handler that deletes a chain.
 *
 * Resolves the address family, the table and the chain (by NFTA_CHAIN_NAME)
 * against the next generation, walks the chain's rules calling nft_delrule()
 * and finally calls nft_delchain(). Failed lookups are reported with
 * PTR_ERR().
 *
 * NOTE(review): the second half of the NLM_F_NONREC condition, the statement
 * following the nft_is_active_next() test (presumably a "continue") and the
 * error handling after nft_delrule() are not present in this listing.
 */
1610 static int nf_tables_delchain(struct net *net, struct sock *nlsk,
1611 struct sk_buff *skb, const struct nlmsghdr *nlh,
1612 const struct nlattr * const nla[],
1613 struct netlink_ext_ack *extack)
1615 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
1616 u8 genmask = nft_genmask_next(net);
1617 struct nft_af_info *afi;
1618 struct nft_table *table;
1619 struct nft_chain *chain;
1620 struct nft_rule *rule;
1621 int family = nfmsg->nfgen_family;
1626 afi = nf_tables_afinfo_lookup(net, family, false);
1628 return PTR_ERR(afi);
1630 table = nf_tables_table_lookup(afi, nla[NFTA_CHAIN_TABLE], genmask);
1632 return PTR_ERR(table);
1634 chain = nf_tables_chain_lookup(table, nla[NFTA_CHAIN_NAME], genmask);
1636 return PTR_ERR(chain);
1638 if (nlh->nlmsg_flags & NLM_F_NONREC &&
1642 nft_ctx_init(&ctx, net, skb, nlh, afi, table, chain, nla);
/* Queue the removal of the chain's rules before the chain itself. */
1645 list_for_each_entry(rule, &chain->rules, list) {
1646 if (!nft_is_active_next(net, rule))
1650 err = nft_delrule(&ctx, rule);
1655 /* There are rules and elements that are still holding references to us,
1656 * we cannot do a recursive removal in this case.
1661 return nft_delchain(&ctx);
1669 * nft_register_expr - register nf_tables expr type
1672 * Registers the expr type for use with nf_tables. Returns zero on
1673 * success or a negative errno code otherwise.
1675 int nft_register_expr(struct nft_expr_type *type)
/* The expression type list is modified under the nftables nfnl lock. */
1677 nfnl_lock(NFNL_SUBSYS_NFTABLES);
/*
 * NFPROTO_UNSPEC types are appended at the tail of the list. The
 * list_add_rcu() call below inserts at the head; presumably it is the else
 * branch for family-specific types (the "else" line is not in this
 * listing), which would make them precede the generic types on lookup.
 */
1678 if (type->family == NFPROTO_UNSPEC)
1679 list_add_tail_rcu(&type->list, &nf_tables_expressions);
1681 list_add_rcu(&type->list, &nf_tables_expressions);
1682 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
1685 EXPORT_SYMBOL_GPL(nft_register_expr);
1688 * nft_unregister_expr - unregister nf_tables expr type
1691 * Unregisters the expr type for use with nf_tables.
1693 void nft_unregister_expr(struct nft_expr_type *type)
/* Unlink the type from nf_tables_expressions under the nftables nfnl lock. */
1695 nfnl_lock(NFNL_SUBSYS_NFTABLES);
1696 list_del_rcu(&type->list);
1697 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
1699 EXPORT_SYMBOL_GPL(nft_unregister_expr);
/*
 * __nft_expr_type_get - find a registered expression type.
 *
 * Walks nf_tables_expressions and matches an entry whose name equals the
 * netlink string attribute (nla_strcmp() == 0) and whose family is either
 * zero or equal to @family. The return statements are not present in this
 * listing; callers in this file test the result against NULL.
 */
1701 static const struct nft_expr_type *__nft_expr_type_get(u8 family,
1704 const struct nft_expr_type *type;
1706 list_for_each_entry(type, &nf_tables_expressions, list) {
1707 if (!nla_strcmp(nla, type->name) &&
1708 (!type->family || type->family == family))
/*
 * nft_expr_type_get - resolve an expression type, loading a module on demand.
 *
 * Looks the type up with __nft_expr_type_get() and takes a reference on the
 * owning module with try_module_get(). With CONFIG_MODULES, when that did
 * not succeed, the nftables nfnl lock is dropped around request_module(),
 * first for the family-specific alias "nft-expr-<family>-<name>" and then for
 * the generic alias "nft-expr-<name>". If the type is registered after either
 * request, ERR_PTR(-EAGAIN) is returned; otherwise the result is
 * ERR_PTR(-ENOENT).
 *
 * NOTE(review): the condition guarding the ERR_PTR(-EINVAL) return and the
 * success return are not present in this listing.
 */
1714 static const struct nft_expr_type *nft_expr_type_get(u8 family,
1717 const struct nft_expr_type *type;
1720 return ERR_PTR(-EINVAL);
1722 type = __nft_expr_type_get(family, nla);
1723 if (type != NULL && try_module_get(type->owner))
1726 #ifdef CONFIG_MODULES
/* request_module() is called with the nfnl lock released. */
1728 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
1729 request_module("nft-expr-%u-%.*s", family,
1730 nla_len(nla), (char *)nla_data(nla));
1731 nfnl_lock(NFNL_SUBSYS_NFTABLES);
1732 if (__nft_expr_type_get(family, nla))
1733 return ERR_PTR(-EAGAIN);
/* Second attempt with the family-independent module alias. */
1735 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
1736 request_module("nft-expr-%.*s",
1737 nla_len(nla), (char *)nla_data(nla));
1738 nfnl_lock(NFNL_SUBSYS_NFTABLES);
1739 if (__nft_expr_type_get(family, nla))
1740 return ERR_PTR(-EAGAIN);
1743 return ERR_PTR(-ENOENT);
/*
 * Netlink policy for one expression: a string name and a nested attribute
 * carrying the expression-specific data.
 */
1746 static const struct nla_policy nft_expr_policy[NFTA_EXPR_MAX + 1] = {
1747 [NFTA_EXPR_NAME] = { .type = NLA_STRING },
1748 [NFTA_EXPR_DATA] = { .type = NLA_NESTED },
/*
 * nf_tables_fill_expr_info - write one expression into a netlink message.
 *
 * Emits NFTA_EXPR_NAME from the expression type's name and, when the ops
 * provide a dump callback, an NFTA_EXPR_DATA nest filled by that callback.
 * Every failure jumps to the nla_put_failure label; the label itself and the
 * return statements are not present in this listing.
 */
1751 static int nf_tables_fill_expr_info(struct sk_buff *skb,
1752 const struct nft_expr *expr)
1754 if (nla_put_string(skb, NFTA_EXPR_NAME, expr->ops->type->name))
1755 goto nla_put_failure;
/* The data nest is only emitted for expressions that implement ->dump(). */
1757 if (expr->ops->dump) {
1758 struct nlattr *data = nla_nest_start(skb, NFTA_EXPR_DATA);
1760 goto nla_put_failure;
1761 if (expr->ops->dump(skb, expr) < 0)
1762 goto nla_put_failure;
1763 nla_nest_end(skb, data);
/*
 * nft_expr_dump - dump an expression wrapped in a nested attribute.
 *
 * Opens a nest of type @attr, fills it with nf_tables_fill_expr_info() and
 * closes it. Failures jump to nla_put_failure; the label and the return
 * statements are not present in this listing.
 */
1772 int nft_expr_dump(struct sk_buff *skb, unsigned int attr,
1773 const struct nft_expr *expr)
1775 struct nlattr *nest;
1777 nest = nla_nest_start(skb, attr);
1779 goto nla_put_failure;
1780 if (nf_tables_fill_expr_info(skb, expr) < 0)
1781 goto nla_put_failure;
1782 nla_nest_end(skb, nest);
/*
 * Result of parsing one expression from netlink: the ops chosen for it and
 * the attribute table that nf_tables_expr_parse() fills from NFTA_EXPR_DATA
 * and that nf_tables_newexpr() later passes to ops->init().
 */
1789 struct nft_expr_info {
1790 const struct nft_expr_ops *ops;
1791 struct nlattr *tb[NFT_EXPR_MAXATTR + 1];
/*
 * nf_tables_expr_parse - parse one expression attribute into @info.
 *
 * Parses @nla against nft_expr_policy, resolves the expression type for the
 * context's address family from NFTA_EXPR_NAME and parses NFTA_EXPR_DATA
 * into info->tb using the type's own policy and maxattr. A type that
 * provides select_ops() is asked to choose the ops from the parsed
 * attributes.
 *
 * NOTE(review): the error checks, the "else" that presumably guards the
 * memset(), the assignment of info->ops and the label preceding module_put()
 * (presumably the error path dropping the reference taken by
 * nft_expr_type_get()) are not present in this listing.
 */
1794 static int nf_tables_expr_parse(const struct nft_ctx *ctx,
1795 const struct nlattr *nla,
1796 struct nft_expr_info *info)
1798 const struct nft_expr_type *type;
1799 const struct nft_expr_ops *ops;
1800 struct nlattr *tb[NFTA_EXPR_MAX + 1];
1803 err = nla_parse_nested(tb, NFTA_EXPR_MAX, nla, nft_expr_policy, NULL);
1807 type = nft_expr_type_get(ctx->afi->family, tb[NFTA_EXPR_NAME]);
1809 return PTR_ERR(type);
1811 if (tb[NFTA_EXPR_DATA]) {
1812 err = nla_parse_nested(info->tb, type->maxattr,
1813 tb[NFTA_EXPR_DATA], type->policy, NULL);
/* Clears the first maxattr + 1 slots of the attribute table. */
1817 memset(info->tb, 0, sizeof(info->tb[0]) * (type->maxattr + 1));
1819 if (type->select_ops != NULL) {
1820 ops = type->select_ops(ctx,
1821 (const struct nlattr * const *)info->tb);
1833 module_put(type->owner);
/*
 * nf_tables_newexpr - initialise an expression from parsed attributes.
 *
 * Calls ops->init() with the attribute table stored in @info and, when the
 * ops implement it, ops->validate().
 *
 * NOTE(review): the error checks, the labels and the guard around the
 * ops->destroy() call (presumably the unwind path after a failed validate)
 * are not present in this listing.
 */
1837 static int nf_tables_newexpr(const struct nft_ctx *ctx,
1838 const struct nft_expr_info *info,
1839 struct nft_expr *expr)
1841 const struct nft_expr_ops *ops = info->ops;
1846 err = ops->init(ctx, expr, (const struct nlattr **)info->tb);
1851 if (ops->validate) {
1852 const struct nft_data *data = NULL;
1854 err = ops->validate(ctx, expr, &data);
1863 ops->destroy(ctx, expr);
/*
 * nf_tables_expr_destroy - tear down an initialised expression.
 *
 * Runs the optional ops->destroy() callback and then drops one reference on
 * the module owning the expression type.
 */
1869 static void nf_tables_expr_destroy(const struct nft_ctx *ctx,
1870 struct nft_expr *expr)
1872 if (expr->ops->destroy)
1873 expr->ops->destroy(ctx, expr);
1874 module_put(expr->ops->type->owner);
/*
 * nft_expr_init - parse, allocate and initialise a standalone expression.
 *
 * Parses @nla with nf_tables_expr_parse(), allocates info.ops->size zeroed
 * bytes for the expression and initialises it with nf_tables_newexpr(). On
 * the failure path visible here the module reference is dropped and
 * ERR_PTR(err) is returned.
 *
 * NOTE(review): the error checks, the labels, any freeing of @expr on failure
 * and the success return are not present in this listing.
 */
1877 struct nft_expr *nft_expr_init(const struct nft_ctx *ctx,
1878 const struct nlattr *nla)
1880 struct nft_expr_info info;
1881 struct nft_expr *expr;
1884 err = nf_tables_expr_parse(ctx, nla, &info);
1889 expr = kzalloc(info.ops->size, GFP_KERNEL);
1893 err = nf_tables_newexpr(ctx, &info, expr);
1901 module_put(info.ops->type->owner);
1903 return ERR_PTR(err);
/*
 * nft_expr_destroy - destroy an expression via nf_tables_expr_destroy().
 *
 * NOTE(review): any further statement (e.g. freeing @expr itself) is not
 * present in this listing.
 */
1906 void nft_expr_destroy(const struct nft_ctx *ctx, struct nft_expr *expr)
1908 nf_tables_expr_destroy(ctx, expr);
/*
 * __nf_tables_rule_lookup - find a rule of @chain by its handle.
 *
 * Returns ERR_PTR(-ENOENT) when no rule carries the handle. The statement
 * executed on a match (presumably "return rule;") is not present in this
 * listing.
 */
1916 static struct nft_rule *__nf_tables_rule_lookup(const struct nft_chain *chain,
1919 struct nft_rule *rule;
1921 // FIXME: every lookup is a linear walk over the chain's rule list
1922 list_for_each_entry(rule, &chain->rules, list) {
1923 if (handle == rule->handle)
1927 return ERR_PTR(-ENOENT);
/*
 * nf_tables_rule_lookup - find a rule of @chain from a handle attribute.
 *
 * Converts the big-endian 64-bit payload of @nla to a host-order handle and
 * defers to __nf_tables_rule_lookup(). The condition guarding the
 * ERR_PTR(-EINVAL) return (presumably a missing attribute) is not present in
 * this listing.
 */
1930 static struct nft_rule *nf_tables_rule_lookup(const struct nft_chain *chain,
1931 const struct nlattr *nla)
1934 return ERR_PTR(-EINVAL);
1936 return __nf_tables_rule_lookup(chain, be64_to_cpu(nla_get_be64(nla)));
/*
 * Netlink policy for rule messages. Table and chain names are strings bounded
 * by their respective MAXNAMELEN - 1, handle and position are 64-bit values,
 * expressions and compat data are nested, and user data is a binary blob of
 * at most NFT_USERDATA_MAXLEN bytes.
 */
1939 static const struct nla_policy nft_rule_policy[NFTA_RULE_MAX + 1] = {
1940 [NFTA_RULE_TABLE] = { .type = NLA_STRING,
1941 .len = NFT_TABLE_MAXNAMELEN - 1 },
1942 [NFTA_RULE_CHAIN] = { .type = NLA_STRING,
1943 .len = NFT_CHAIN_MAXNAMELEN - 1 },
1944 [NFTA_RULE_HANDLE] = { .type = NLA_U64 },
1945 [NFTA_RULE_EXPRESSIONS] = { .type = NLA_NESTED },
1946 [NFTA_RULE_COMPAT] = { .type = NLA_NESTED },
1947 [NFTA_RULE_POSITION] = { .type = NLA_U64 },
1948 [NFTA_RULE_USERDATA] = { .type = NLA_BINARY,
1949 .len = NFT_USERDATA_MAXLEN },
/*
 * nf_tables_fill_rule_info - serialise one rule into a netlink message.
 *
 * Writes the nfgenmsg header (family, NFNETLINK_V0, low 16 bits of the
 * per-net base_seq as res_id) followed by the table name, chain name, rule
 * handle, optionally the handle of the preceding rule as NFTA_RULE_POSITION,
 * the list of expressions and the rule's user data. Failures jump to
 * nla_put_failure, where the message is trimmed back to @nlh.
 *
 * NOTE(review): the NULL checks, the condition guarding the user data block,
 * the labels and the return statements are not present in this listing.
 */
1952 static int nf_tables_fill_rule_info(struct sk_buff *skb, struct net *net,
1953 u32 portid, u32 seq, int event,
1954 u32 flags, int family,
1955 const struct nft_table *table,
1956 const struct nft_chain *chain,
1957 const struct nft_rule *rule)
1959 struct nlmsghdr *nlh;
1960 struct nfgenmsg *nfmsg;
1961 const struct nft_expr *expr, *next;
1962 struct nlattr *list;
1963 const struct nft_rule *prule;
1964 u16 type = nfnl_msg_type(NFNL_SUBSYS_NFTABLES, event);
1966 nlh = nlmsg_put(skb, portid, seq, type, sizeof(struct nfgenmsg), flags);
1968 goto nla_put_failure;
1970 nfmsg = nlmsg_data(nlh);
1971 nfmsg->nfgen_family = family;
1972 nfmsg->version = NFNETLINK_V0;
1973 nfmsg->res_id = htons(net->nft.base_seq & 0xffff);
1975 if (nla_put_string(skb, NFTA_RULE_TABLE, table->name))
1976 goto nla_put_failure;
1977 if (nla_put_string(skb, NFTA_RULE_CHAIN, chain->name))
1978 goto nla_put_failure;
1979 if (nla_put_be64(skb, NFTA_RULE_HANDLE, cpu_to_be64(rule->handle),
1981 goto nla_put_failure;
/*
 * The position is only reported for events other than NFT_MSG_DELRULE and
 * only when the rule is not the first entry of the chain's rule list.
 */
1983 if ((event != NFT_MSG_DELRULE) && (rule->list.prev != &chain->rules)) {
1984 prule = list_prev_entry(rule, list);
1985 if (nla_put_be64(skb, NFTA_RULE_POSITION,
1986 cpu_to_be64(prule->handle),
1988 goto nla_put_failure;
1991 list = nla_nest_start(skb, NFTA_RULE_EXPRESSIONS);
1993 goto nla_put_failure;
/* Each expression becomes one NFTA_LIST_ELEM nest inside the list. */
1994 nft_rule_for_each_expr(expr, next, rule) {
1995 if (nft_expr_dump(skb, NFTA_LIST_ELEM, expr) < 0)
1996 goto nla_put_failure;
1998 nla_nest_end(skb, list);
/* The stored length field is one less than the number of user data bytes. */
2001 struct nft_userdata *udata = nft_userdata(rule);
2002 if (nla_put(skb, NFTA_RULE_USERDATA, udata->len + 1,
2004 goto nla_put_failure;
2007 nlmsg_end(skb, nlh);
2011 nlmsg_trim(skb, nlh);
/*
 * nf_tables_rule_notify - send a rule event to NFNLGRP_NFTABLES listeners.
 *
 * Allocates a message, fills it with nf_tables_fill_rule_info() and sends it
 * with nfnetlink_send(). The nfnetlink_set_err() call reports -ENOBUFS to the
 * group; presumably it is the error path (its label is not in this listing).
 *
 * NOTE(review): the first half of the listener check, the allocation and
 * fill error checks and the returns are not present in this listing.
 */
2015 static void nf_tables_rule_notify(const struct nft_ctx *ctx,
2016 const struct nft_rule *rule, int event)
2018 struct sk_buff *skb;
2022 !nfnetlink_has_listeners(ctx->net, NFNLGRP_NFTABLES))
2025 skb = nlmsg_new(NLMSG_GOODSIZE, GFP_KERNEL);
2029 err = nf_tables_fill_rule_info(skb, ctx->net, ctx->portid, ctx->seq,
2030 event, 0, ctx->afi->family, ctx->table,
2037 nfnetlink_send(skb, ctx->net, ctx->portid, NFNLGRP_NFTABLES,
2038 ctx->report, GFP_KERNEL);
2041 nfnetlink_set_err(ctx->net, ctx->portid, NFNLGRP_NFTABLES, -ENOBUFS);
/*
 * Optional filter for rule dumps, allocated by nf_tables_getrule() and read
 * by nf_tables_dump_rules(). Those users access members named "table" and
 * "chain"; the member declarations themselves are not present in this
 * listing.
 */
2044 struct nft_rule_dump_ctx {
/*
 * nf_tables_dump_rules - netlink dump callback listing rules.
 *
 * Iterates over address families, tables, chains and rules, and emits every
 * rule that is active in the current generation with
 * nf_tables_fill_rule_info(). The family from the request header and the
 * optional table/chain names in the dump context (cb->data) restrict what is
 * visited. cb->args[0] holds the resume index of an interrupted dump.
 *
 * The chain filter tests the ctx->chain pointer itself. The context is
 * zero-allocated by nf_tables_getrule() and its chain member is only set when
 * NFTA_RULE_CHAIN was supplied, so a table-only filter leaves it NULL; the
 * previous "ctx->chain[0]" test dereferenced that NULL pointer.
 *
 * NOTE(review): the "continue" statements, the index bookkeeping, the labels
 * and the return are not present in this listing.
 */
2049 static int nf_tables_dump_rules(struct sk_buff *skb,
2050 struct netlink_callback *cb)
2052 const struct nfgenmsg *nfmsg = nlmsg_data(cb->nlh);
2053 const struct nft_rule_dump_ctx *ctx = cb->data;
2054 const struct nft_af_info *afi;
2055 const struct nft_table *table;
2056 const struct nft_chain *chain;
2057 const struct nft_rule *rule;
2058 unsigned int idx = 0, s_idx = cb->args[0];
2059 struct net *net = sock_net(skb->sk);
2060 int family = nfmsg->nfgen_family;
/* Snapshot of the generation sequence used for the consistency check below. */
2063 cb->seq = net->nft.base_seq;
2065 list_for_each_entry_rcu(afi, &net->nft.af_info, list) {
/* NFPROTO_UNSPEC in the request selects every address family. */
2066 if (family != NFPROTO_UNSPEC && family != afi->family)
2069 list_for_each_entry_rcu(table, &afi->tables, list) {
2070 if (ctx && ctx->table &&
2071 strcmp(ctx->table, table->name) != 0)
2074 list_for_each_entry_rcu(chain, &table->chains, list) {
/* ctx->chain may be NULL when only a table filter was given. */
2075 if (ctx && ctx->chain &&
2076 strcmp(ctx->chain, chain->name) != 0)
2079 list_for_each_entry_rcu(rule, &chain->rules, list) {
2080 if (!nft_is_active(net, rule))
/* Clears every cb->args[] slot except the resume index in slot 0. */
2085 memset(&cb->args[1], 0,
2086 sizeof(cb->args) - sizeof(cb->args[0]));
2087 if (nf_tables_fill_rule_info(skb, net, NETLINK_CB(cb->skb).portid,
2090 NLM_F_MULTI | NLM_F_APPEND,
2091 afi->family, table, chain, rule) < 0)
2094 nl_dump_check_consistent(cb, nlmsg_hdr(skb));
/*
 * nf_tables_dump_rules_done - ".done" callback of the rule dump.
 *
 * Fetches the dump context from cb->data. The rest of the body (presumably
 * releasing the context allocated in nf_tables_getrule()) is not present in
 * this listing.
 */
2108 static int nf_tables_dump_rules_done(struct netlink_callback *cb)
2110 struct nft_rule_dump_ctx *ctx = cb->data;
/*
 * nf_tables_getrule - netlink handler for rule retrieval.
 *
 * With NLM_F_DUMP a dump is started using nf_tables_dump_rules() and
 * nf_tables_dump_rules_done(); when a table or chain name is supplied, a
 * zeroed nft_rule_dump_ctx is allocated and the supplied names are
 * duplicated into it. Without NLM_F_DUMP the family, table, chain and rule
 * (by NFTA_RULE_HANDLE) are resolved against the current generation and a
 * single NFT_MSG_NEWRULE message is unicast to the requester.
 *
 * NOTE(review): allocation failure handling, the hand-over of the context to
 * the dump control and the error labels are not present in this listing.
 */
2120 static int nf_tables_getrule(struct net *net, struct sock *nlsk,
2121 struct sk_buff *skb, const struct nlmsghdr *nlh,
2122 const struct nlattr * const nla[],
2123 struct netlink_ext_ack *extack)
2125 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
2126 u8 genmask = nft_genmask_cur(net);
2127 const struct nft_af_info *afi;
2128 const struct nft_table *table;
2129 const struct nft_chain *chain;
2130 const struct nft_rule *rule;
2131 struct sk_buff *skb2;
2132 int family = nfmsg->nfgen_family;
2135 if (nlh->nlmsg_flags & NLM_F_DUMP) {
2136 struct netlink_dump_control c = {
2137 .dump = nf_tables_dump_rules,
2138 .done = nf_tables_dump_rules_done,
/* A filter context is only built when at least one name was supplied. */
2141 if (nla[NFTA_RULE_TABLE] || nla[NFTA_RULE_CHAIN]) {
2142 struct nft_rule_dump_ctx *ctx;
2144 ctx = kzalloc(sizeof(*ctx), GFP_KERNEL);
2148 if (nla[NFTA_RULE_TABLE]) {
2149 ctx->table = nla_strdup(nla[NFTA_RULE_TABLE],
2156 if (nla[NFTA_RULE_CHAIN]) {
2157 ctx->chain = nla_strdup(nla[NFTA_RULE_CHAIN],
2168 return netlink_dump_start(nlsk, skb, nlh, &c);
/* Single-rule request: resolve family, table, chain and rule in turn. */
2171 afi = nf_tables_afinfo_lookup(net, family, false);
2173 return PTR_ERR(afi);
2175 table = nf_tables_table_lookup(afi, nla[NFTA_RULE_TABLE], genmask);
2177 return PTR_ERR(table);
2179 chain = nf_tables_chain_lookup(table, nla[NFTA_RULE_CHAIN], genmask);
2181 return PTR_ERR(chain);
2183 rule = nf_tables_rule_lookup(chain, nla[NFTA_RULE_HANDLE]);
2185 return PTR_ERR(rule);
2187 skb2 = alloc_skb(NLMSG_GOODSIZE, GFP_KERNEL);
2191 err = nf_tables_fill_rule_info(skb2, net, NETLINK_CB(skb).portid,
2192 nlh->nlmsg_seq, NFT_MSG_NEWRULE, 0,
2193 family, table, chain, rule);
2197 return nlmsg_unicast(nlsk, skb2, NETLINK_CB(skb).portid);
/*
 * nf_tables_rule_destroy - destroy the expressions of a rule.
 *
 * Walks the rule's expressions from first to last and destroys each with
 * nf_tables_expr_destroy(). The walk also stops at the first expression
 * whose ops pointer is NULL.
 *
 * NOTE(review): any statement after the loop (e.g. freeing @rule) is not
 * present in this listing.
 */
2204 static void nf_tables_rule_destroy(const struct nft_ctx *ctx,
2205 struct nft_rule *rule)
2207 struct nft_expr *expr;
2210 * Careful: some expressions might not be initialized in case this
2211 * is called on error from nf_tables_newrule().
2213 expr = nft_expr_first(rule);
2214 while (expr != nft_expr_last(rule) && expr->ops) {
2215 nf_tables_expr_destroy(ctx, expr);
2216 expr = nft_expr_next(expr);
/* Upper bound on the number of expressions nf_tables_newrule() parses per rule. */
2221 #define NFT_RULE_MAXEXPRS 128
/*
 * File-scope scratch array indexed by expression number in
 * nf_tables_newrule(); its allocation is not visible in this part of the
 * file.
 */
2223 static struct nft_expr_info *info;
/*
 * nf_tables_newrule - netlink handler that adds or replaces a rule.
 *
 * Visible steps, in order:
 *  - resolve the address family, table and chain against the next generation;
 *  - with NFTA_RULE_HANDLE look up the referenced rule, otherwise allocate a
 *    new handle with nf_tables_alloc_handle();
 *  - with NFTA_RULE_POSITION look up the rule the new one is placed relative
 *    to (stored in old_rule);
 *  - parse up to NFT_RULE_MAXEXPRS expressions into the file-scope info[]
 *    array, summing their sizes;
 *  - allocate the rule with room for the expressions and the optional user
 *    data, activate it for the next generation and initialise each
 *    expression with nf_tables_newexpr();
 *  - link the rule into the chain and record an NFT_MSG_NEWRULE transaction
 *    (plus an NFT_MSG_DELRULE transaction for the replaced rule).
 * On the unwind path visible at the end, the rule is unlinked and destroyed
 * and the module references of the parsed expression types are dropped.
 *
 * NOTE(review): many lines (error returns, braces, "else" keywords, labels,
 * some local declarations) are not present in this listing; in particular the
 * conditions selecting between the list_add*_rcu() calls cannot be fully
 * reconstructed from here.
 */
2225 static int nf_tables_newrule(struct net *net, struct sock *nlsk,
2226 struct sk_buff *skb, const struct nlmsghdr *nlh,
2227 const struct nlattr * const nla[],
2228 struct netlink_ext_ack *extack)
2230 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
2231 u8 genmask = nft_genmask_next(net);
2232 struct nft_af_info *afi;
2233 struct nft_table *table;
2234 struct nft_chain *chain;
2235 struct nft_rule *rule, *old_rule = NULL;
2236 struct nft_userdata *udata;
2237 struct nft_trans *trans = NULL;
2238 struct nft_expr *expr;
2241 unsigned int size, i, n, ulen = 0, usize = 0;
2244 u64 handle, pos_handle;
2246 create = nlh->nlmsg_flags & NLM_F_CREATE ? true : false;
2248 afi = nf_tables_afinfo_lookup(net, nfmsg->nfgen_family, create);
2250 return PTR_ERR(afi);
2252 table = nf_tables_table_lookup(afi, nla[NFTA_RULE_TABLE], genmask);
2254 return PTR_ERR(table);
2256 chain = nf_tables_chain_lookup(table, nla[NFTA_RULE_CHAIN], genmask);
2258 return PTR_ERR(chain);
/* A handle refers to an existing rule of this chain. */
2260 if (nla[NFTA_RULE_HANDLE]) {
2261 handle = be64_to_cpu(nla_get_be64(nla[NFTA_RULE_HANDLE]));
2262 rule = __nf_tables_rule_lookup(chain, handle);
2264 return PTR_ERR(rule);
2266 if (nlh->nlmsg_flags & NLM_F_EXCL)
2268 if (nlh->nlmsg_flags & NLM_F_REPLACE)
2273 if (!create || nlh->nlmsg_flags & NLM_F_REPLACE)
2275 handle = nf_tables_alloc_handle(table);
/* Guards the chain use counter against wrapping. */
2277 if (chain->use == UINT_MAX)
2281 if (nla[NFTA_RULE_POSITION]) {
2282 if (!(nlh->nlmsg_flags & NLM_F_CREATE))
2285 pos_handle = be64_to_cpu(nla_get_be64(nla[NFTA_RULE_POSITION]));
2286 old_rule = __nf_tables_rule_lookup(chain, pos_handle);
2287 if (IS_ERR(old_rule))
2288 return PTR_ERR(old_rule);
2291 nft_ctx_init(&ctx, net, skb, nlh, afi, table, chain, nla);
/* First pass: parse every expression and accumulate the space they need. */
2295 if (nla[NFTA_RULE_EXPRESSIONS]) {
2296 nla_for_each_nested(tmp, nla[NFTA_RULE_EXPRESSIONS], rem) {
2298 if (nla_type(tmp) != NFTA_LIST_ELEM)
2300 if (n == NFT_RULE_MAXEXPRS)
2302 err = nf_tables_expr_parse(&ctx, tmp, &info[n]);
2305 size += info[n].ops->size;
2309 /* Check for overflow of dlen field */
2311 if (size >= 1 << 12)
2314 if (nla[NFTA_RULE_USERDATA]) {
2315 ulen = nla_len(nla[NFTA_RULE_USERDATA]);
2317 usize = sizeof(struct nft_userdata) + ulen;
/* One allocation holds the rule header, the expressions and the user data. */
2321 rule = kzalloc(sizeof(*rule) + size + usize, GFP_KERNEL);
2325 nft_activate_next(net, rule);
2327 rule->handle = handle;
2329 rule->udata = ulen ? 1 : 0;
/* The length is stored minus one; the dump side adds the one back. */
2332 udata = nft_userdata(rule);
2333 udata->len = ulen - 1;
2334 nla_memcpy(udata->data, nla[NFTA_RULE_USERDATA], ulen);
/* Second pass: initialise the expressions in place inside the rule. */
2337 expr = nft_expr_first(rule);
2338 for (i = 0; i < n; i++) {
2339 err = nf_tables_newexpr(&ctx, &info[i], expr);
2343 expr = nft_expr_next(expr);
/*
 * Replacement: the old rule, if still active in the next generation, gets a
 * DELRULE transaction and is deactivated; the new rule is linked next to it.
 */
2346 if (nlh->nlmsg_flags & NLM_F_REPLACE) {
2347 if (nft_is_active_next(net, old_rule)) {
2348 trans = nft_trans_rule_add(&ctx, NFT_MSG_DELRULE,
2350 if (trans == NULL) {
2354 nft_deactivate_next(net, old_rule);
2356 list_add_tail_rcu(&rule->list, &old_rule->list);
2361 } else if (nlh->nlmsg_flags & NLM_F_APPEND)
2363 list_add_rcu(&rule->list, &old_rule->list);
2365 list_add_tail_rcu(&rule->list, &chain->rules);
2368 list_add_tail_rcu(&rule->list, &old_rule->list);
2370 list_add_rcu(&rule->list, &chain->rules);
2373 if (nft_trans_rule_add(&ctx, NFT_MSG_NEWRULE, rule) == NULL) {
2381 list_del_rcu(&rule->list);
2383 nf_tables_rule_destroy(&ctx, rule);
/* Drop the module references taken while parsing the expressions. */
2385 for (i = 0; i < n; i++) {
2386 if (info[i].ops != NULL)
2387 module_put(info[i].ops->type->owner);
/*
 * nft_rule_lookup_byid - find a rule added earlier in the pending batch.
 *
 * Scans the per-net commit list for an NFT_MSG_NEWRULE transaction whose rule
 * id equals the 32-bit id carried by @nla. Returns ERR_PTR(-ENOENT) when none
 * matches; the statement executed on a match (presumably "return rule;") is
 * not present in this listing.
 */
2392 static struct nft_rule *nft_rule_lookup_byid(const struct net *net,
2393 const struct nlattr *nla)
2395 u32 id = ntohl(nla_get_be32(nla));
2396 struct nft_trans *trans;
2398 list_for_each_entry(trans, &net->nft.commit_list, list) {
2399 struct nft_rule *rule = nft_trans_rule(trans);
2401 if (trans->msg_type == NFT_MSG_NEWRULE &&
2402 id == nft_trans_rule_id(trans))
2405 return ERR_PTR(-ENOENT);
/*
 * nf_tables_delrule - netlink handler that deletes rules.
 *
 * After resolving family and table (and the chain when NFTA_RULE_CHAIN is
 * given) the visible code distinguishes:
 *  - NFTA_RULE_HANDLE: delete the rule with that handle;
 *  - NFTA_RULE_ID: delete the rule added under that id in the pending batch;
 *  - neither: delete rules via nft_delrule_by_chain().
 * The loop over table->chains also calls nft_delrule_by_chain() for chains
 * that are active in the next generation; presumably this is the path taken
 * when no chain was given.
 *
 * NOTE(review): the "if (chain)" / "else" structure, the assignment of
 * ctx.chain inside the loop, the error checks and the return are not present
 * in this listing.
 */
2408 static int nf_tables_delrule(struct net *net, struct sock *nlsk,
2409 struct sk_buff *skb, const struct nlmsghdr *nlh,
2410 const struct nlattr * const nla[],
2411 struct netlink_ext_ack *extack)
2413 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
2414 u8 genmask = nft_genmask_next(net);
2415 struct nft_af_info *afi;
2416 struct nft_table *table;
2417 struct nft_chain *chain = NULL;
2418 struct nft_rule *rule;
2419 int family = nfmsg->nfgen_family, err = 0;
2422 afi = nf_tables_afinfo_lookup(net, family, false);
2424 return PTR_ERR(afi);
2426 table = nf_tables_table_lookup(afi, nla[NFTA_RULE_TABLE], genmask);
2428 return PTR_ERR(table);
/* The chain is optional; it stays NULL when NFTA_RULE_CHAIN is absent. */
2430 if (nla[NFTA_RULE_CHAIN]) {
2431 chain = nf_tables_chain_lookup(table, nla[NFTA_RULE_CHAIN],
2434 return PTR_ERR(chain);
2437 nft_ctx_init(&ctx, net, skb, nlh, afi, table, chain, nla);
2440 if (nla[NFTA_RULE_HANDLE]) {
2441 rule = nf_tables_rule_lookup(chain,
2442 nla[NFTA_RULE_HANDLE]);
2444 return PTR_ERR(rule);
2446 err = nft_delrule(&ctx, rule);
2447 } else if (nla[NFTA_RULE_ID]) {
2448 rule = nft_rule_lookup_byid(net, nla[NFTA_RULE_ID]);
2450 return PTR_ERR(rule);
2452 err = nft_delrule(&ctx, rule);
2454 err = nft_delrule_by_chain(&ctx);
2457 list_for_each_entry(chain, &table->chains, list) {
2458 if (!nft_is_active_next(net, chain))
2462 err = nft_delrule_by_chain(&ctx);
/* Registered set backends; modified by nft_register_set()/nft_unregister_set(). */
2475 static LIST_HEAD(nf_tables_set_types);
/*
 * nft_register_set - add a set type to the tail of nf_tables_set_types.
 *
 * The list is modified under the nftables nfnl lock. The return statement is
 * not present in this listing.
 */
2477 int nft_register_set(struct nft_set_type *type)
2479 nfnl_lock(NFNL_SUBSYS_NFTABLES);
2480 list_add_tail_rcu(&type->list, &nf_tables_set_types);
2481 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
2484 EXPORT_SYMBOL_GPL(nft_register_set);
/*
 * nft_unregister_set - remove a set type from nf_tables_set_types under the
 * nftables nfnl lock.
 */
2486 void nft_unregister_set(struct nft_set_type *type)
2488 nfnl_lock(NFNL_SUBSYS_NFTABLES);
2489 list_del_rcu(&type->list);
2490 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
2492 EXPORT_SYMBOL_GPL(nft_unregister_set);
/* Set flags that nft_set_ops_candidate() requires a backend to advertise. */
2494 #define NFT_SET_FEATURES (NFT_SET_INTERVAL | NFT_SET_MAP | \
2495 NFT_SET_TIMEOUT | NFT_SET_OBJECT)
/*
 * nft_set_ops_candidate - check whether a backend supports the requested
 * feature flags.
 *
 * True when the requested flags that the backend advertises in ops->features
 * are exactly the requested flags that belong to NFT_SET_FEATURES, i.e. the
 * backend covers every requested feature flag.
 */
2497 static bool nft_set_ops_candidate(const struct nft_set_ops *ops, u32 flags)
2499 return (flags & ops->features) == (flags & NFT_SET_FEATURES);
2503 * Select a set implementation based on the data characteristics and the
2504 * given policy. The total memory use might not be known if no size is
2505 * given, in that case the amount of memory per element is used.
/*
 * nft_select_set_ops - pick the set backend for a new set.
 *
 * With CONFIG_MODULES and no registered set type, the nfnl lock is dropped to
 * request the "nft-set" module; if types are registered afterwards
 * ERR_PTR(-EAGAIN) is returned. Every registered type that implements
 * select_ops() is then asked for ops; ops that fail
 * nft_set_ops_candidate() or whose estimate() callback returns false are
 * not considered. The remaining estimates are compared against the best one
 * so far according to @policy, and the module reference is moved from the
 * previous best to the new one. ERR_PTR(-EOPNOTSUPP) is returned on the final
 * visible path.
 *
 * NOTE(review): the "continue"/"break" statements, the switch header, the
 * statements taken when a comparison succeeds and the success return are not
 * present in this listing, so the exact tie-breaking rules cannot be stated
 * from here.
 */
2507 static const struct nft_set_ops *
2508 nft_select_set_ops(const struct nft_ctx *ctx,
2509 const struct nlattr * const nla[],
2510 const struct nft_set_desc *desc,
2511 enum nft_set_policies policy)
2513 const struct nft_set_ops *ops, *bops;
2514 struct nft_set_estimate est, best;
2515 const struct nft_set_type *type;
2518 #ifdef CONFIG_MODULES
/* request_module() is called with the nfnl lock released. */
2519 if (list_empty(&nf_tables_set_types)) {
2520 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
2521 request_module("nft-set");
2522 nfnl_lock(NFNL_SUBSYS_NFTABLES);
2523 if (!list_empty(&nf_tables_set_types))
2524 return ERR_PTR(-EAGAIN);
2527 if (nla[NFTA_SET_FLAGS] != NULL)
2528 flags = ntohl(nla_get_be32(nla[NFTA_SET_FLAGS]));
2535 list_for_each_entry(type, &nf_tables_set_types, list) {
2536 if (!type->select_ops)
2539 ops = type->select_ops(ctx, desc, flags);
2543 if (!nft_set_ops_candidate(ops, flags))
2545 if (!ops->estimate(desc, flags, &est))
2549 case NFT_SET_POL_PERFORMANCE:
2550 if (est.lookup < best.lookup)
2552 if (est.lookup == best.lookup) {
2554 if (est.space < best.space)
2556 } else if (est.size < best.size) {
2561 case NFT_SET_POL_MEMORY:
2563 if (est.space < best.space)
2565 if (est.space == best.space &&
2566 est.lookup < best.lookup)
2568 } else if (est.size < best.size) {
/* Take a reference on the new best type before releasing the previous one. */
2576 if (!try_module_get(type->owner))
2579 module_put(bops->type->owner);
2588 return ERR_PTR(-EOPNOTSUPP);
/*
 * Netlink policy for set messages. Table and set names are strings bounded
 * by their respective MAXNAMELEN - 1, the timeout is a 64-bit value, the
 * description is nested, user data is a binary blob of at most
 * NFT_USERDATA_MAXLEN bytes and all remaining attributes are 32-bit values.
 */
2591 static const struct nla_policy nft_set_policy[NFTA_SET_MAX + 1] = {
2592 [NFTA_SET_TABLE] = { .type = NLA_STRING,
2593 .len = NFT_TABLE_MAXNAMELEN - 1 },
2594 [NFTA_SET_NAME] = { .type = NLA_STRING,
2595 .len = NFT_SET_MAXNAMELEN - 1 },
2596 [NFTA_SET_FLAGS] = { .type = NLA_U32 },
2597 [NFTA_SET_KEY_TYPE] = { .type = NLA_U32 },
2598 [NFTA_SET_KEY_LEN] = { .type = NLA_U32 },
2599 [NFTA_SET_DATA_TYPE] = { .type = NLA_U32 },
2600 [NFTA_SET_DATA_LEN] = { .type = NLA_U32 },
2601 [NFTA_SET_POLICY] = { .type = NLA_U32 },
2602 [NFTA_SET_DESC] = { .type = NLA_NESTED },
2603 [NFTA_SET_ID] = { .type = NLA_U32 },
2604 [NFTA_SET_TIMEOUT] = { .type = NLA_U64 },
2605 [NFTA_SET_GC_INTERVAL] = { .type = NLA_U32 },
2606 [NFTA_SET_USERDATA] = { .type = NLA_BINARY,
2607 .len = NFT_USERDATA_MAXLEN },
2608 [NFTA_SET_OBJ_TYPE] = { .type = NLA_U32 },
/* Netlink policy for the nested set description: a single 32-bit size. */
2611 static const struct nla_policy nft_set_desc_policy[NFTA_SET_DESC_MAX + 1] = {
2612 [NFTA_SET_DESC_SIZE] = { .type = NLA_U32 },
/*
 * nft_ctx_init_from_setattr - build an nft_ctx from set message attributes.
 *
 * The address family is only resolved when the request's family is not
 * NFPROTO_UNSPEC, and the table only when NFTA_SET_TABLE is present; either
 * may therefore stay NULL in the initialised context. Lookup failures are
 * reported with PTR_ERR().
 *
 * NOTE(review): the last parameter of the signature, the condition guarding
 * the -EAFNOSUPPORT return (presumably a table given without a family) and
 * the success return are not present in this listing.
 */
2615 static int nft_ctx_init_from_setattr(struct nft_ctx *ctx, struct net *net,
2616 const struct sk_buff *skb,
2617 const struct nlmsghdr *nlh,
2618 const struct nlattr * const nla[],
2621 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
2622 struct nft_af_info *afi = NULL;
2623 struct nft_table *table = NULL;
2625 if (nfmsg->nfgen_family != NFPROTO_UNSPEC) {
2626 afi = nf_tables_afinfo_lookup(net, nfmsg->nfgen_family, false);
2628 return PTR_ERR(afi);
2631 if (nla[NFTA_SET_TABLE] != NULL) {
2633 return -EAFNOSUPPORT;
2635 table = nf_tables_table_lookup(afi, nla[NFTA_SET_TABLE],
2638 return PTR_ERR(table);
2641 nft_ctx_init(ctx, net, skb, nlh, afi, table, NULL, nla);
/*
 * nf_tables_set_lookup - find a set of @table by name.
 *
 * Matches a set whose name equals the netlink string attribute and which is
 * active under @genmask. Returns ERR_PTR(-ENOENT) when none matches.
 *
 * NOTE(review): the condition guarding the ERR_PTR(-EINVAL) return
 * (presumably a missing attribute) and the statement executed on a match are
 * not present in this listing.
 */
2645 static struct nft_set *nf_tables_set_lookup(const struct nft_table *table,
2646 const struct nlattr *nla, u8 genmask)
2648 struct nft_set *set;
2651 return ERR_PTR(-EINVAL);
2653 list_for_each_entry(set, &table->sets, list) {
2654 if (!nla_strcmp(nla, set->name) &&
2655 nft_active_genmask(set, genmask))
2658 return ERR_PTR(-ENOENT);
/*
 * nf_tables_set_lookup_byid - find a set created earlier in the pending batch.
 *
 * Scans the per-net commit list for an NFT_MSG_NEWSET transaction whose set
 * id equals the 32-bit id in @nla and whose set is active under the given
 * generation mask. Returns ERR_PTR(-ENOENT) when none matches; the statement
 * executed on a match is not present in this listing.
 */
2661 static struct nft_set *nf_tables_set_lookup_byid(const struct net *net,
2662 const struct nlattr *nla,
2665 struct nft_trans *trans;
2666 u32 id = ntohl(nla_get_be32(nla));
2668 list_for_each_entry(trans, &net->nft.commit_list, list) {
2669 struct nft_set *set = nft_trans_set(trans);
2671 if (trans->msg_type == NFT_MSG_NEWSET &&
2672 id == nft_trans_set_id(trans) &&
2673 nft_active_genmask(set, genmask))
2676 return ERR_PTR(-ENOENT);
/*
 * nft_set_lookup - look a set up by name and, as visible below, by id.
 *
 * The by-name lookup runs first. The condition under which the by-id lookup
 * is attempted (presumably a failed name lookup together with a supplied id
 * attribute) and the return statement are not present in this listing.
 */
2679 struct nft_set *nft_set_lookup(const struct net *net,
2680 const struct nft_table *table,
2681 const struct nlattr *nla_set_name,
2682 const struct nlattr *nla_set_id,
2685 struct nft_set *set;
2687 set = nf_tables_set_lookup(table, nla_set_name, genmask);
2692 set = nf_tables_set_lookup_byid(net, nla_set_id, genmask);
2696 EXPORT_SYMBOL_GPL(nft_set_lookup);
/*
 * nf_tables_set_alloc_name - assign the name of a new set.
 *
 * @name may contain one "%d" conversion. In that case the numbers already
 * taken by the sets of the table are collected in a zeroed page used as a
 * bitmap, one window of BITS_PER_BYTE * PAGE_SIZE numbers at a time, and the
 * first free number is substituted into the name with kasprintf(). The
 * resulting name is finally compared with the names of the sets that are
 * active in the next generation.
 *
 * The scan for taken numbers skips sets that are not active in the next
 * generation by testing the iterated set "i". It previously tested "set",
 * the set being named, which is loop-invariant and therefore never skipped
 * anything, unlike the duplicate-name loop at the end, which already tests
 * "i".
 *
 * NOTE(review): the rest of the signature, the "continue" statements, the
 * allocation failure checks, the retry when a window is full and the return
 * statements are not present in this listing.
 */
2698 static int nf_tables_set_alloc_name(struct nft_ctx *ctx, struct nft_set *set,
2701 const struct nft_set *i;
2703 unsigned long *inuse;
2704 unsigned int n = 0, min = 0;
2706 p = strchr(name, '%');
/* Only a single "%d" conversion is examined by this check. */
2708 if (p[1] != 'd' || strchr(p + 2, '%'))
2711 inuse = (unsigned long *)get_zeroed_page(GFP_KERNEL);
2715 list_for_each_entry(i, &ctx->table->sets, list) {
/* Test the set being visited, not the set being named. */
2718 if (!nft_is_active_next(ctx->net, i))
2720 if (!sscanf(i->name, name, &tmp))
/* Numbers outside the current bitmap window are not recorded. */
2722 if (tmp < min || tmp >= min + BITS_PER_BYTE * PAGE_SIZE)
2725 set_bit(tmp - min, inuse);
2728 n = find_first_zero_bit(inuse, BITS_PER_BYTE * PAGE_SIZE);
/* Window exhausted: advance to the next window of numbers. */
2729 if (n >= BITS_PER_BYTE * PAGE_SIZE) {
2730 min += BITS_PER_BYTE * PAGE_SIZE;
2731 memset(inuse, 0, PAGE_SIZE);
2734 free_page((unsigned long)inuse);
2737 set->name = kasprintf(GFP_KERNEL, name, min + n);
2741 list_for_each_entry(i, &ctx->table->sets, list) {
2742 if (!nft_is_active_next(ctx->net, i))
2744 if (!strcmp(set->name, i->name)) {
/*
 * nf_tables_fill_set - serialise one set into a netlink message.
 *
 * Writes the nfgenmsg header (family of ctx->afi, NFNETLINK_V0, low 16 bits
 * of the per-net base_seq as res_id) followed by the table name, set name,
 * flags (when non-zero), key type and length, data type and length for maps,
 * the object type for object sets, timeout (converted from jiffies to
 * milliseconds), GC interval, policy (when it is not
 * NFT_SET_POL_PERFORMANCE), user data and a nested description holding the
 * set size. Failures jump to nla_put_failure, where the message is trimmed
 * back to @nlh.
 *
 * NOTE(review): the conditions guarding the timeout, GC interval, user data
 * and size attributes, the declaration of "seq", the labels and the return
 * statements are not present in this listing.
 */
2752 static int nf_tables_fill_set(struct sk_buff *skb, const struct nft_ctx *ctx,
2753 const struct nft_set *set, u16 event, u16 flags)
2755 struct nfgenmsg *nfmsg;
2756 struct nlmsghdr *nlh;
2757 struct nlattr *desc;
2758 u32 portid = ctx->portid;
2761 event = nfnl_msg_type(NFNL_SUBSYS_NFTABLES, event);
2762 nlh = nlmsg_put(skb, portid, seq, event, sizeof(struct nfgenmsg),
2765 goto nla_put_failure;
2767 nfmsg = nlmsg_data(nlh);
2768 nfmsg->nfgen_family = ctx->afi->family;
2769 nfmsg->version = NFNETLINK_V0;
2770 nfmsg->res_id = htons(ctx->net->nft.base_seq & 0xffff);
2772 if (nla_put_string(skb, NFTA_SET_TABLE, ctx->table->name))
2773 goto nla_put_failure;
2774 if (nla_put_string(skb, NFTA_SET_NAME, set->name))
2775 goto nla_put_failure;
2776 if (set->flags != 0)
2777 if (nla_put_be32(skb, NFTA_SET_FLAGS, htonl(set->flags)))
2778 goto nla_put_failure;
2780 if (nla_put_be32(skb, NFTA_SET_KEY_TYPE, htonl(set->ktype)))
2781 goto nla_put_failure;
2782 if (nla_put_be32(skb, NFTA_SET_KEY_LEN, htonl(set->klen)))
2783 goto nla_put_failure;
/* Data type and length are only reported for maps. */
2784 if (set->flags & NFT_SET_MAP) {
2785 if (nla_put_be32(skb, NFTA_SET_DATA_TYPE, htonl(set->dtype)))
2786 goto nla_put_failure;
2787 if (nla_put_be32(skb, NFTA_SET_DATA_LEN, htonl(set->dlen)))
2788 goto nla_put_failure;
2790 if (set->flags & NFT_SET_OBJECT &&
2791 nla_put_be32(skb, NFTA_SET_OBJ_TYPE, htonl(set->objtype)))
2792 goto nla_put_failure;
2795 nla_put_be64(skb, NFTA_SET_TIMEOUT,
2796 cpu_to_be64(jiffies_to_msecs(set->timeout)),
2798 goto nla_put_failure;
2800 nla_put_be32(skb, NFTA_SET_GC_INTERVAL, htonl(set->gc_int)))
2801 goto nla_put_failure;
/* The performance policy is not reported explicitly. */
2803 if (set->policy != NFT_SET_POL_PERFORMANCE) {
2804 if (nla_put_be32(skb, NFTA_SET_POLICY, htonl(set->policy)))
2805 goto nla_put_failure;
2808 if (nla_put(skb, NFTA_SET_USERDATA, set->udlen, set->udata))
2809 goto nla_put_failure;
2811 desc = nla_nest_start(skb, NFTA_SET_DESC);
2813 goto nla_put_failure;
2815 nla_put_be32(skb, NFTA_SET_DESC_SIZE, htonl(set->size)))
2816 goto nla_put_failure;
2817 nla_nest_end(skb, desc);
2819 nlmsg_end(skb, nlh);
2823 nlmsg_trim(skb, nlh);
/*
 * nf_tables_set_notify - send a set event to NFNLGRP_NFTABLES listeners.
 *
 * Allocates a message with the caller-supplied gfp flags, fills it with
 * nf_tables_fill_set() and sends it with nfnetlink_send(). The
 * nfnetlink_set_err() call reports -ENOBUFS to the group; presumably it is
 * the error path (its label is not in this listing).
 *
 * NOTE(review): the last parameter of the signature, the first half of the
 * listener check, the error checks and the returns are not present in this
 * listing.
 */
2827 static void nf_tables_set_notify(const struct nft_ctx *ctx,
2828 const struct nft_set *set, int event,
2831 struct sk_buff *skb;
2832 u32 portid = ctx->portid;
2836 !nfnetlink_has_listeners(ctx->net, NFNLGRP_NFTABLES))
2839 skb = nlmsg_new(NLMSG_GOODSIZE, gfp_flags);
2843 err = nf_tables_fill_set(skb, ctx, set, event, 0);
2849 nfnetlink_send(skb, ctx->net, portid, NFNLGRP_NFTABLES, ctx->report,
2853 nfnetlink_set_err(ctx->net, portid, NFNLGRP_NFTABLES, -ENOBUFS);
/*
 * nf_tables_dump_sets - netlink dump callback listing sets.
 *
 * Iterates over address families, tables and sets, restricted by the family
 * and table stored in the dump context (cb->data) when those are set, and
 * emits every set that is active in the current generation with
 * nf_tables_fill_set(). The resume state lives in cb->args[]: slot 0 is the
 * set index, slot 2 the table pointer and slot 3 the family at which the
 * previous pass stopped.
 *
 * NOTE(review): the "continue" statements, the conditions around the
 * cur_family/cur_table comparisons, the setup of ctx_set apart from its table
 * member, the labels and the return are not present in this listing.
 */
2856 static int nf_tables_dump_sets(struct sk_buff *skb, struct netlink_callback *cb)
2858 const struct nft_set *set;
2859 unsigned int idx, s_idx = cb->args[0];
2860 struct nft_af_info *afi;
2861 struct nft_table *table, *cur_table = (struct nft_table *)cb->args[2];
2862 struct net *net = sock_net(skb->sk);
2863 int cur_family = cb->args[3];
2864 struct nft_ctx *ctx = cb->data, ctx_set;
/* Snapshot of the generation sequence used for the consistency check below. */
2870 cb->seq = net->nft.base_seq;
2872 list_for_each_entry_rcu(afi, &net->nft.af_info, list) {
2873 if (ctx->afi && ctx->afi != afi)
2877 if (afi->family != cur_family)
2882 list_for_each_entry_rcu(table, &afi->tables, list) {
2883 if (ctx->table && ctx->table != table)
2887 if (cur_table != table)
2893 list_for_each_entry_rcu(set, &table->sets, list) {
2896 if (!nft_is_active(net, set))
/* A per-set context is passed to the fill routine with the current table. */
2900 ctx_set.table = table;
2902 if (nf_tables_fill_set(skb, &ctx_set, set,
/* Remember where to resume when the message buffer is full. */
2906 cb->args[2] = (unsigned long) table;
2907 cb->args[3] = afi->family;
2910 nl_dump_check_consistent(cb, nlmsg_hdr(skb));
/*
 * nf_tables_dump_sets_done - ".done" callback of the set dump, registered in
 * nf_tables_getset(). The body is not present in this listing.
 */
2924 static int nf_tables_dump_sets_done(struct netlink_callback *cb)
/*
 * nf_tables_getset - netlink handler for set retrieval.
 *
 * The context is first initialised from the message attributes against the
 * current generation. With NLM_F_DUMP a dump is started using
 * nf_tables_dump_sets() and nf_tables_dump_sets_done() with a heap-allocated
 * context. Without NLM_F_DUMP, NFPROTO_UNSPEC is rejected with
 * -EAFNOSUPPORT, the set is looked up by NFTA_SET_NAME in the context's table
 * and a single NFT_MSG_NEWSET message is unicast to the requester.
 *
 * NOTE(review): the declaration of "ctx", the error checks, the copy of the
 * context into ctx_dump, the return taken when NFTA_SET_TABLE is missing and
 * the error labels are not present in this listing.
 */
2930 static int nf_tables_getset(struct net *net, struct sock *nlsk,
2931 struct sk_buff *skb, const struct nlmsghdr *nlh,
2932 const struct nlattr * const nla[],
2933 struct netlink_ext_ack *extack)
2935 u8 genmask = nft_genmask_cur(net);
2936 const struct nft_set *set;
2938 struct sk_buff *skb2;
2939 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
2942 /* Verify existence before starting dump */
2943 err = nft_ctx_init_from_setattr(&ctx, net, skb, nlh, nla, genmask);
2947 if (nlh->nlmsg_flags & NLM_F_DUMP) {
2948 struct netlink_dump_control c = {
2949 .dump = nf_tables_dump_sets,
2950 .done = nf_tables_dump_sets_done,
2952 struct nft_ctx *ctx_dump;
2954 ctx_dump = kmalloc(sizeof(*ctx_dump), GFP_KERNEL);
2955 if (ctx_dump == NULL)
2961 return netlink_dump_start(nlsk, skb, nlh, &c);
2964 /* Only accept unspec with dump */
2965 if (nfmsg->nfgen_family == NFPROTO_UNSPEC)
2966 return -EAFNOSUPPORT;
2967 if (!nla[NFTA_SET_TABLE])
2970 set = nf_tables_set_lookup(ctx.table, nla[NFTA_SET_NAME], genmask);
2972 return PTR_ERR(set);
2974 skb2 = alloc_skb(NLMSG_GOODSIZE, GFP_KERNEL);
2978 err = nf_tables_fill_set(skb2, &ctx, set, NFT_MSG_NEWSET, 0);
2982 return nlmsg_unicast(nlsk, skb2, NETLINK_CB(skb).portid);
/*
 * nf_tables_set_desc_parse - parse the nested set description.
 *
 * Parses @nla against nft_set_desc_policy and, when NFTA_SET_DESC_SIZE is
 * present, stores its host-order value in desc->size. The error check after
 * parsing and the return statements are not present in this listing.
 */
2989 static int nf_tables_set_desc_parse(const struct nft_ctx *ctx,
2990 struct nft_set_desc *desc,
2991 const struct nlattr *nla)
2993 struct nlattr *da[NFTA_SET_DESC_MAX + 1];
2996 err = nla_parse_nested(da, NFTA_SET_DESC_MAX, nla,
2997 nft_set_desc_policy, NULL);
3001 if (da[NFTA_SET_DESC_SIZE] != NULL)
3002 desc->size = ntohl(nla_get_be32(da[NFTA_SET_DESC_SIZE]));
/*
 * nf_tables_newset - netlink handler that creates a new set in a table.
 *
 * Parses and validates the NFTA_SET_* attributes (key type/length, flags,
 * data type/length, object type, timeout, GC interval, policy and the
 * optional nested description), resolves the address family and table,
 * picks a backend with nft_select_set_ops(), allocates the set and queues
 * an NFT_MSG_NEWSET transaction before linking the set into table->sets.
 */
3007 static int nf_tables_newset(struct net *net, struct sock *nlsk,
3008 struct sk_buff *skb, const struct nlmsghdr *nlh,
3009 const struct nlattr * const nla[],
3010 struct netlink_ext_ack *extack)
3012 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
3013 u8 genmask = nft_genmask_next(net);
3014 const struct nft_set_ops *ops;
3015 struct nft_af_info *afi;
3016 struct nft_table *table;
3017 struct nft_set *set;
3023 u32 ktype, dtype, flags, policy, gc_int, objtype;
3024 struct nft_set_desc desc;
3025 unsigned char *udata;
/* Table, name, key length and set ID are checked for presence first. */
3029 if (nla[NFTA_SET_TABLE] == NULL ||
3030 nla[NFTA_SET_NAME] == NULL ||
3031 nla[NFTA_SET_KEY_LEN] == NULL ||
3032 nla[NFTA_SET_ID] == NULL)
3035 memset(&desc, 0, sizeof(desc));
/* Key type defaults to NFT_DATA_VALUE when the attribute is absent. */
3037 ktype = NFT_DATA_VALUE;
3038 if (nla[NFTA_SET_KEY_TYPE] != NULL) {
3039 ktype = ntohl(nla_get_be32(nla[NFTA_SET_KEY_TYPE]));
3040 if ((ktype & NFT_DATA_RESERVED_MASK) == NFT_DATA_RESERVED_MASK)
3044 desc.klen = ntohl(nla_get_be32(nla[NFTA_SET_KEY_LEN]));
3045 if (desc.klen == 0 || desc.klen > NFT_DATA_VALUE_MAXLEN)
3049 if (nla[NFTA_SET_FLAGS] != NULL) {
3050 flags = ntohl(nla_get_be32(nla[NFTA_SET_FLAGS]));
3051 if (flags & ~(NFT_SET_ANONYMOUS | NFT_SET_CONSTANT |
3052 NFT_SET_INTERVAL | NFT_SET_TIMEOUT |
3053 NFT_SET_MAP | NFT_SET_EVAL |
3056 /* Only one of these operations is supported */
3057 if ((flags & (NFT_SET_MAP | NFT_SET_EVAL | NFT_SET_OBJECT)) ==
3058 (NFT_SET_MAP | NFT_SET_EVAL | NFT_SET_OBJECT))
/* A data type is only accepted together with NFT_SET_MAP. */
3063 if (nla[NFTA_SET_DATA_TYPE] != NULL) {
3064 if (!(flags & NFT_SET_MAP))
3067 dtype = ntohl(nla_get_be32(nla[NFTA_SET_DATA_TYPE]));
3068 if ((dtype & NFT_DATA_RESERVED_MASK) == NFT_DATA_RESERVED_MASK &&
3069 dtype != NFT_DATA_VERDICT)
3072 if (dtype != NFT_DATA_VERDICT) {
3073 if (nla[NFTA_SET_DATA_LEN] == NULL)
3075 desc.dlen = ntohl(nla_get_be32(nla[NFTA_SET_DATA_LEN]));
3076 if (desc.dlen == 0 || desc.dlen > NFT_DATA_VALUE_MAXLEN)
3079 desc.dlen = sizeof(struct nft_verdict);
3080 } else if (flags & NFT_SET_MAP)
/* Likewise, an object type is only accepted together with NFT_SET_OBJECT. */
3083 if (nla[NFTA_SET_OBJ_TYPE] != NULL) {
3084 if (!(flags & NFT_SET_OBJECT))
3087 objtype = ntohl(nla_get_be32(nla[NFTA_SET_OBJ_TYPE]));
3088 if (objtype == NFT_OBJECT_UNSPEC ||
3089 objtype > NFT_OBJECT_MAX)
3091 } else if (flags & NFT_SET_OBJECT)
3094 objtype = NFT_OBJECT_UNSPEC;
/* Timeout (milliseconds on the wire, jiffies internally) and GC interval
 * both depend on NFT_SET_TIMEOUT being set in flags.
 */
3097 if (nla[NFTA_SET_TIMEOUT] != NULL) {
3098 if (!(flags & NFT_SET_TIMEOUT))
3100 timeout = msecs_to_jiffies(be64_to_cpu(nla_get_be64(
3101 nla[NFTA_SET_TIMEOUT])));
3104 if (nla[NFTA_SET_GC_INTERVAL] != NULL) {
3105 if (!(flags & NFT_SET_TIMEOUT))
3107 gc_int = ntohl(nla_get_be32(nla[NFTA_SET_GC_INTERVAL]));
3110 policy = NFT_SET_POL_PERFORMANCE;
3111 if (nla[NFTA_SET_POLICY] != NULL)
3112 policy = ntohl(nla_get_be32(nla[NFTA_SET_POLICY]));
3114 if (nla[NFTA_SET_DESC] != NULL) {
3115 err = nf_tables_set_desc_parse(&ctx, &desc, nla[NFTA_SET_DESC]);
3120 create = nlh->nlmsg_flags & NLM_F_CREATE ? true : false;
3122 afi = nf_tables_afinfo_lookup(net, nfmsg->nfgen_family, create);
3124 return PTR_ERR(afi);
3126 table = nf_tables_table_lookup(afi, nla[NFTA_SET_TABLE], genmask);
3128 return PTR_ERR(table);
3130 nft_ctx_init(&ctx, net, skb, nlh, afi, table, NULL, nla);
/* Look for an existing set of that name; any lookup error other than
 * -ENOENT is propagated, and NLM_F_EXCL / NLM_F_REPLACE are examined.
 */
3132 set = nf_tables_set_lookup(table, nla[NFTA_SET_NAME], genmask);
3134 if (PTR_ERR(set) != -ENOENT)
3135 return PTR_ERR(set);
3137 if (nlh->nlmsg_flags & NLM_F_EXCL)
3139 if (nlh->nlmsg_flags & NLM_F_REPLACE)
3144 if (!(nlh->nlmsg_flags & NLM_F_CREATE))
3147 ops = nft_select_set_ops(&ctx, nla, &desc, policy);
3149 return PTR_ERR(ops);
3152 if (nla[NFTA_SET_USERDATA])
3153 udlen = nla_len(nla[NFTA_SET_USERDATA]);
3156 if (ops->privsize != NULL)
3157 size = ops->privsize(nla, &desc);
/* One allocation holds the set, the backend's private area and userdata. */
3159 set = kvzalloc(sizeof(*set) + size + udlen, GFP_KERNEL);
3165 name = nla_strdup(nla[NFTA_SET_NAME], GFP_KERNEL);
3171 err = nf_tables_set_alloc_name(&ctx, set, name);
/* Userdata is placed directly after the backend's private area. */
3178 udata = set->data + size;
3179 nla_memcpy(udata, nla[NFTA_SET_USERDATA], udlen);
3182 INIT_LIST_HEAD(&set->bindings);
3185 set->klen = desc.klen;
3187 set->objtype = objtype;
3188 set->dlen = desc.dlen;
3190 set->size = desc.size;
3191 set->policy = policy;
3194 set->timeout = timeout;
3195 set->gc_int = gc_int;
3197 err = ops->init(set, &desc, nla);
3201 err = nft_trans_set_add(&ctx, NFT_MSG_NEWSET, set);
3205 list_add_tail_rcu(&set->list, &table->sets);
3214 module_put(ops->type->owner);
/*
 * nft_set_destroy - tear down a set: run the backend's ->destroy() hook and
 * drop the reference on the module that owns the set type.
 */
3218 static void nft_set_destroy(struct nft_set *set)
3220 set->ops->destroy(set);
3221 module_put(set->ops->type->owner);
/*
 * nf_tables_set_destroy - unlink a set from its list, emit an NFT_MSG_DELSET
 * notification (allocated with GFP_ATOMIC) and destroy the set.
 */
3226 static void nf_tables_set_destroy(const struct nft_ctx *ctx, struct nft_set *set)
3228 list_del_rcu(&set->list);
3229 nf_tables_set_notify(ctx, set, NFT_MSG_DELSET, GFP_ATOMIC);
3230 nft_set_destroy(set);
/*
 * nf_tables_delset - netlink handler that deletes a set.
 *
 * Requests with family NFPROTO_UNSPEC fail with -EAFNOSUPPORT. The context
 * is built from the set attributes, the set is looked up by name in the
 * next generation, and deletion is delegated to nft_delset().
 */
3233 static int nf_tables_delset(struct net *net, struct sock *nlsk,
3234 struct sk_buff *skb, const struct nlmsghdr *nlh,
3235 const struct nlattr * const nla[],
3236 struct netlink_ext_ack *extack)
3238 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
3239 u8 genmask = nft_genmask_next(net);
3240 struct nft_set *set;
3244 if (nfmsg->nfgen_family == NFPROTO_UNSPEC)
3245 return -EAFNOSUPPORT;
3246 if (nla[NFTA_SET_TABLE] == NULL)
3249 err = nft_ctx_init_from_setattr(&ctx, net, skb, nlh, nla, genmask);
3253 set = nf_tables_set_lookup(ctx.table, nla[NFTA_SET_NAME], genmask);
3255 return PTR_ERR(set);
/* Special-cases a set that still has bindings, or a non-empty set when
 * NLM_F_NONREC was requested (presumably refused - TODO confirm).
 */
3257 if (!list_empty(&set->bindings) ||
3258 (nlh->nlmsg_flags & NLM_F_NONREC && atomic_read(&set->nelems) > 0))
3261 return nft_delset(&ctx, set);
/*
 * nf_tables_bind_check_setelem - set walk callback used when binding a map.
 *
 * Validates that the element's data can be stored into the register that
 * corresponds to the set's data type, treating the data as a verdict when
 * set->dtype is NFT_DATA_VERDICT and as a plain value otherwise.
 */
3264 static int nf_tables_bind_check_setelem(const struct nft_ctx *ctx,
3265 struct nft_set *set,
3266 const struct nft_set_iter *iter,
3267 struct nft_set_elem *elem)
3269 const struct nft_set_ext *ext = nft_set_elem_ext(set, elem->priv);
3270 enum nft_registers dreg;
3272 dreg = nft_type_to_reg(set->dtype);
3273 return nft_validate_register_store(ctx, dreg, nft_set_ext_data(ext),
3274 set->dtype == NFT_DATA_VERDICT ?
3275 NFT_DATA_VERDICT : NFT_DATA_VALUE,
/*
 * nf_tables_bind_set - attach a binding to a set.
 *
 * An anonymous set that already has a binding is special-cased up front.
 * For map bindings the existing bindings are scanned for a map binding to
 * the same chain; otherwise the set is walked with
 * nf_tables_bind_check_setelem() against the next generation. Finally the
 * binding records ctx->chain and is appended to set->bindings.
 */
3279 int nf_tables_bind_set(const struct nft_ctx *ctx, struct nft_set *set,
3280 struct nft_set_binding *binding)
3282 struct nft_set_binding *i;
3283 struct nft_set_iter iter;
3285 if (!list_empty(&set->bindings) && set->flags & NFT_SET_ANONYMOUS)
3288 if (binding->flags & NFT_SET_MAP) {
3289 /* If the set is already bound to the same chain all
3290 * jumps are already validated for that chain.
3292 list_for_each_entry(i, &set->bindings, list) {
3293 if (i->flags & NFT_SET_MAP &&
3294 i->chain == binding->chain)
3298 iter.genmask = nft_genmask_next(ctx->net);
3302 iter.fn = nf_tables_bind_check_setelem;
3304 set->ops->walk(ctx, set, &iter);
3309 binding->chain = ctx->chain;
3310 list_add_tail_rcu(&binding->list, &set->bindings);
3313 EXPORT_SYMBOL_GPL(nf_tables_bind_set);
/*
 * nf_tables_unbind_set - remove a binding from a set.
 *
 * Once the last binding is gone, an anonymous set that is active in the
 * current generation is destroyed via nf_tables_set_destroy().
 */
3315 void nf_tables_unbind_set(const struct nft_ctx *ctx, struct nft_set *set,
3316 struct nft_set_binding *binding)
3318 list_del_rcu(&binding->list);
3320 if (list_empty(&set->bindings) && set->flags & NFT_SET_ANONYMOUS &&
3321 nft_is_active(ctx->net, set))
3322 nf_tables_set_destroy(ctx, set);
3324 EXPORT_SYMBOL_GPL(nf_tables_unbind_set);
/*
 * Layout descriptors for set element extensions, indexed by NFT_SET_EXT_*:
 * each entry gives the alignment and, for some extensions, a length.
 */
3326 const struct nft_set_ext_type nft_set_ext_types[] = {
3327 [NFT_SET_EXT_KEY] = {
3328 .align = __alignof__(u32),
3330 [NFT_SET_EXT_DATA] = {
3331 .align = __alignof__(u32),
3333 [NFT_SET_EXT_EXPR] = {
3334 .align = __alignof__(struct nft_expr),
3336 [NFT_SET_EXT_OBJREF] = {
3337 .len = sizeof(struct nft_object *),
3338 .align = __alignof__(struct nft_object *),
3340 [NFT_SET_EXT_FLAGS] = {
3342 .align = __alignof__(u8),
3344 [NFT_SET_EXT_TIMEOUT] = {
3346 .align = __alignof__(u64),
3348 [NFT_SET_EXT_EXPIRATION] = {
3349 .len = sizeof(unsigned long),
3350 .align = __alignof__(unsigned long),
3352 [NFT_SET_EXT_USERDATA] = {
3353 .len = sizeof(struct nft_userdata),
3354 .align = __alignof__(struct nft_userdata),
3357 EXPORT_SYMBOL_GPL(nft_set_ext_types);
/*
 * Netlink attribute policy for a single set element (NFTA_SET_ELEM_*);
 * userdata is binary and bounded by NFT_USERDATA_MAXLEN.
 */
3363 static const struct nla_policy nft_set_elem_policy[NFTA_SET_ELEM_MAX + 1] = {
3364 [NFTA_SET_ELEM_KEY] = { .type = NLA_NESTED },
3365 [NFTA_SET_ELEM_DATA] = { .type = NLA_NESTED },
3366 [NFTA_SET_ELEM_FLAGS] = { .type = NLA_U32 },
3367 [NFTA_SET_ELEM_TIMEOUT] = { .type = NLA_U64 },
3368 [NFTA_SET_ELEM_USERDATA] = { .type = NLA_BINARY,
3369 .len = NFT_USERDATA_MAXLEN },
/*
 * Netlink attribute policy for set element list messages
 * (NFTA_SET_ELEM_LIST_*): table and set names are length-bounded strings,
 * the elements are a nested attribute and the set ID is a u32.
 */
3372 static const struct nla_policy nft_set_elem_list_policy[NFTA_SET_ELEM_LIST_MAX + 1] = {
3373 [NFTA_SET_ELEM_LIST_TABLE] = { .type = NLA_STRING,
3374 .len = NFT_TABLE_MAXNAMELEN - 1 },
3375 [NFTA_SET_ELEM_LIST_SET] = { .type = NLA_STRING,
3376 .len = NFT_SET_MAXNAMELEN - 1 },
3377 [NFTA_SET_ELEM_LIST_ELEMENTS] = { .type = NLA_NESTED },
3378 [NFTA_SET_ELEM_LIST_SET_ID] = { .type = NLA_U32 },
/*
 * nft_ctx_init_from_elemattr - build an nft_ctx for a set element request.
 *
 * Looks up the address family named in the nfgenmsg header (without
 * autoloading: the last lookup argument is false) and the table named by
 * NFTA_SET_ELEM_LIST_TABLE, then initialises @ctx with no chain. Lookup
 * failures are returned as negative errno values via PTR_ERR().
 */
3381 static int nft_ctx_init_from_elemattr(struct nft_ctx *ctx, struct net *net,
3382 const struct sk_buff *skb,
3383 const struct nlmsghdr *nlh,
3384 const struct nlattr * const nla[],
3387 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
3388 struct nft_af_info *afi;
3389 struct nft_table *table;
3391 afi = nf_tables_afinfo_lookup(net, nfmsg->nfgen_family, false);
3393 return PTR_ERR(afi);
3395 table = nf_tables_table_lookup(afi, nla[NFTA_SET_ELEM_LIST_TABLE],
3398 return PTR_ERR(table);
3400 nft_ctx_init(ctx, net, skb, nlh, afi, table, NULL, nla);
/*
 * nf_tables_fill_setelem - serialise one set element into @skb.
 *
 * Opens an NFTA_LIST_ELEM nest and emits the key followed by whichever
 * optional extensions the element carries: data, expression, object
 * reference (by name), flags, timeout, expiration and userdata. Any failed
 * put jumps to the nla_put_failure label.
 */
3404 static int nf_tables_fill_setelem(struct sk_buff *skb,
3405 const struct nft_set *set,
3406 const struct nft_set_elem *elem)
3408 const struct nft_set_ext *ext = nft_set_elem_ext(set, elem->priv);
3409 unsigned char *b = skb_tail_pointer(skb);
3410 struct nlattr *nest;
3412 nest = nla_nest_start(skb, NFTA_LIST_ELEM);
3414 goto nla_put_failure;
3416 if (nft_data_dump(skb, NFTA_SET_ELEM_KEY, nft_set_ext_key(ext),
3417 NFT_DATA_VALUE, set->klen) < 0)
3418 goto nla_put_failure;
3420 if (nft_set_ext_exists(ext, NFT_SET_EXT_DATA) &&
3421 nft_data_dump(skb, NFTA_SET_ELEM_DATA, nft_set_ext_data(ext),
3422 set->dtype == NFT_DATA_VERDICT ? NFT_DATA_VERDICT : NFT_DATA_VALUE,
3424 goto nla_put_failure;
3426 if (nft_set_ext_exists(ext, NFT_SET_EXT_EXPR) &&
3427 nft_expr_dump(skb, NFTA_SET_ELEM_EXPR, nft_set_ext_expr(ext)) < 0)
3428 goto nla_put_failure;
3430 if (nft_set_ext_exists(ext, NFT_SET_EXT_OBJREF) &&
3431 nla_put_string(skb, NFTA_SET_ELEM_OBJREF,
3432 (*nft_set_ext_obj(ext))->name) < 0)
3433 goto nla_put_failure;
3435 if (nft_set_ext_exists(ext, NFT_SET_EXT_FLAGS) &&
3436 nla_put_be32(skb, NFTA_SET_ELEM_FLAGS,
3437 htonl(*nft_set_ext_flags(ext))))
3438 goto nla_put_failure;
/* The timeout is kept in jiffies and reported in milliseconds. */
3440 if (nft_set_ext_exists(ext, NFT_SET_EXT_TIMEOUT) &&
3441 nla_put_be64(skb, NFTA_SET_ELEM_TIMEOUT,
3442 cpu_to_be64(jiffies_to_msecs(
3443 *nft_set_ext_timeout(ext))),
3445 goto nla_put_failure;
3447 if (nft_set_ext_exists(ext, NFT_SET_EXT_EXPIRATION)) {
3448 unsigned long expires, now = jiffies;
3450 expires = *nft_set_ext_expiration(ext);
3451 if (time_before(now, expires))
3456 if (nla_put_be64(skb, NFTA_SET_ELEM_EXPIRATION,
3457 cpu_to_be64(jiffies_to_msecs(expires)),
3459 goto nla_put_failure;
3462 if (nft_set_ext_exists(ext, NFT_SET_EXT_USERDATA)) {
3463 struct nft_userdata *udata;
/* udata->len holds the length minus one (nft_add_set_elem stores
 * ulen - 1), hence the + 1 when emitting the attribute.
 */
3465 udata = nft_set_ext_userdata(ext);
3466 if (nla_put(skb, NFTA_SET_ELEM_USERDATA,
3467 udata->len + 1, udata->data))
3468 goto nla_put_failure;
3471 nla_nest_end(skb, nest);
/*
 * Per-walk state for dumping set elements: the walk iterator is embedded so
 * that the callback can recover this structure (and its skb) with
 * container_of().
 */
3479 struct nft_set_dump_args {
3480 const struct netlink_callback *cb;
3481 struct nft_set_iter iter;
3482 struct sk_buff *skb;
/*
 * nf_tables_dump_setelem - set walk callback for element dumps.
 *
 * Recovers the enclosing nft_set_dump_args from @iter and serialises @elem
 * into its skb; returns the result of nf_tables_fill_setelem().
 */
3485 static int nf_tables_dump_setelem(const struct nft_ctx *ctx,
3486 struct nft_set *set,
3487 const struct nft_set_iter *iter,
3488 struct nft_set_elem *elem)
3490 struct nft_set_dump_args *args;
3492 args = container_of(iter, struct nft_set_dump_args, iter);
3493 return nf_tables_fill_setelem(args->skb, set, elem);
/*
 * State carried across a set element dump: the set being dumped (users of
 * this structure in this file also access a ctx member).
 */
3496 struct nft_set_dump_ctx {
3497 const struct nft_set *set;
/*
 * nf_tables_dump_set - netlink dump callback that lists a set's elements.
 *
 * Re-locates the family, table and set recorded in the dump context by
 * iterating the RCU-protected lists, then emits one NFT_MSG_NEWSETELEM
 * message carrying the table name, set name and a nested element list
 * produced by walking the set in the current generation. cb->args[0] holds
 * the number of elements already dumped and is used as the walk's skip
 * count on the next invocation.
 */
3501 static int nf_tables_dump_set(struct sk_buff *skb, struct netlink_callback *cb)
3503 struct nft_set_dump_ctx *dump_ctx = cb->data;
3504 struct net *net = sock_net(skb->sk);
3505 struct nft_af_info *afi;
3506 struct nft_table *table;
3507 struct nft_set *set;
3508 struct nft_set_dump_args args;
3509 bool set_found = false;
3510 struct nfgenmsg *nfmsg;
3511 struct nlmsghdr *nlh;
3512 struct nlattr *nest;
3517 list_for_each_entry_rcu(afi, &net->nft.af_info, list) {
3518 if (afi != dump_ctx->ctx.afi)
3521 list_for_each_entry_rcu(table, &afi->tables, list) {
3522 if (table != dump_ctx->ctx.table)
3525 list_for_each_entry_rcu(set, &table->sets, list) {
3526 if (set == dump_ctx->set) {
3541 event = nfnl_msg_type(NFNL_SUBSYS_NFTABLES, NFT_MSG_NEWSETELEM);
3542 portid = NETLINK_CB(cb->skb).portid;
3543 seq = cb->nlh->nlmsg_seq;
3545 nlh = nlmsg_put(skb, portid, seq, event, sizeof(struct nfgenmsg),
3548 goto nla_put_failure;
3550 nfmsg = nlmsg_data(nlh);
3551 nfmsg->nfgen_family = afi->family;
3552 nfmsg->version = NFNETLINK_V0;
3553 nfmsg->res_id = htons(net->nft.base_seq & 0xffff);
3555 if (nla_put_string(skb, NFTA_SET_ELEM_LIST_TABLE, table->name))
3556 goto nla_put_failure;
3557 if (nla_put_string(skb, NFTA_SET_ELEM_LIST_SET, set->name))
3558 goto nla_put_failure;
3560 nest = nla_nest_start(skb, NFTA_SET_ELEM_LIST_ELEMENTS);
3562 goto nla_put_failure;
3566 args.iter.genmask = nft_genmask_cur(net);
3567 args.iter.skip = cb->args[0];
3568 args.iter.count = 0;
3570 args.iter.fn = nf_tables_dump_setelem;
3571 set->ops->walk(&dump_ctx->ctx, set, &args.iter);
3574 nla_nest_end(skb, nest);
3575 nlmsg_end(skb, nlh);
/* -EMSGSIZE from the walk is not treated as a hard error here; other
 * walk errors are returned to the caller.
 */
3577 if (args.iter.err && args.iter.err != -EMSGSIZE)
3578 return args.iter.err;
3579 if (args.iter.count == cb->args[0])
3582 cb->args[0] = args.iter.count;
/*
 * nf_tables_dump_set_done - netlink dump ->done callback for set element
 * dumps; installed by nf_tables_getsetelem().
 */
3590 static int nf_tables_dump_set_done(struct netlink_callback *cb)
/*
 * nf_tables_getsetelem - netlink handler for set element retrieval.
 *
 * Resolves the context and the set named by NFTA_SET_ELEM_LIST_SET in the
 * current generation. For NLM_F_DUMP requests a dump context holding the
 * set and a copy of the nft_ctx is allocated and a netlink dump is started
 * with nf_tables_dump_set() / nf_tables_dump_set_done().
 */
3596 static int nf_tables_getsetelem(struct net *net, struct sock *nlsk,
3597 struct sk_buff *skb, const struct nlmsghdr *nlh,
3598 const struct nlattr * const nla[],
3599 struct netlink_ext_ack *extack)
3601 u8 genmask = nft_genmask_cur(net);
3602 const struct nft_set *set;
3606 err = nft_ctx_init_from_elemattr(&ctx, net, skb, nlh, nla, genmask);
3610 set = nf_tables_set_lookup(ctx.table, nla[NFTA_SET_ELEM_LIST_SET],
3613 return PTR_ERR(set);
3615 if (nlh->nlmsg_flags & NLM_F_DUMP) {
3616 struct netlink_dump_control c = {
3617 .dump = nf_tables_dump_set,
3618 .done = nf_tables_dump_set_done,
3620 struct nft_set_dump_ctx *dump_ctx;
3622 dump_ctx = kmalloc(sizeof(*dump_ctx), GFP_KERNEL);
3626 dump_ctx->set = set;
3627 dump_ctx->ctx = ctx;
3630 return netlink_dump_start(nlsk, skb, nlh, &c);
/*
 * nf_tables_fill_setelem_info - build a complete netlink message describing
 * one set element (used for notifications).
 *
 * Writes the nfgenmsg header, the table and set names, and a nested
 * NFTA_SET_ELEM_LIST_ELEMENTS attribute containing the element. On failure
 * the partially built message is trimmed from @skb.
 */
3635 static int nf_tables_fill_setelem_info(struct sk_buff *skb,
3636 const struct nft_ctx *ctx, u32 seq,
3637 u32 portid, int event, u16 flags,
3638 const struct nft_set *set,
3639 const struct nft_set_elem *elem)
3641 struct nfgenmsg *nfmsg;
3642 struct nlmsghdr *nlh;
3643 struct nlattr *nest;
3646 event = nfnl_msg_type(NFNL_SUBSYS_NFTABLES, event);
3647 nlh = nlmsg_put(skb, portid, seq, event, sizeof(struct nfgenmsg),
3650 goto nla_put_failure;
3652 nfmsg = nlmsg_data(nlh);
3653 nfmsg->nfgen_family = ctx->afi->family;
3654 nfmsg->version = NFNETLINK_V0;
3655 nfmsg->res_id = htons(ctx->net->nft.base_seq & 0xffff);
3657 if (nla_put_string(skb, NFTA_SET_TABLE, ctx->table->name))
3658 goto nla_put_failure;
3659 if (nla_put_string(skb, NFTA_SET_NAME, set->name))
3660 goto nla_put_failure;
3662 nest = nla_nest_start(skb, NFTA_SET_ELEM_LIST_ELEMENTS);
3664 goto nla_put_failure;
3666 err = nf_tables_fill_setelem(skb, set, elem);
3668 goto nla_put_failure;
3670 nla_nest_end(skb, nest);
3672 nlmsg_end(skb, nlh);
3676 nlmsg_trim(skb, nlh);
/*
 * nf_tables_setelem_notify - send a set element event to listeners.
 *
 * Checks whether a report was requested or NFNLGRP_NFTABLES has listeners,
 * builds the message with nf_tables_fill_setelem_info() and sends it via
 * nfnetlink_send(). The error path reports -ENOBUFS to the group with
 * nfnetlink_set_err().
 */
3680 static void nf_tables_setelem_notify(const struct nft_ctx *ctx,
3681 const struct nft_set *set,
3682 const struct nft_set_elem *elem,
3683 int event, u16 flags)
3685 struct net *net = ctx->net;
3686 u32 portid = ctx->portid;
3687 struct sk_buff *skb;
3690 if (!ctx->report && !nfnetlink_has_listeners(net, NFNLGRP_NFTABLES))
3693 skb = nlmsg_new(NLMSG_GOODSIZE, GFP_KERNEL);
3697 err = nf_tables_fill_setelem_info(skb, ctx, 0, portid, event, flags,
3704 nfnetlink_send(skb, net, portid, NFNLGRP_NFTABLES, ctx->report,
3708 nfnetlink_set_err(net, portid, NFNLGRP_NFTABLES, -ENOBUFS);
/*
 * nft_trans_elem_alloc - allocate a transaction sized for a set element
 * operation and record the set it applies to.
 */
3711 static struct nft_trans *nft_trans_elem_alloc(struct nft_ctx *ctx,
3713 struct nft_set *set)
3715 struct nft_trans *trans;
3717 trans = nft_trans_alloc(ctx, msg_type, sizeof(struct nft_trans_elem));
3721 nft_trans_elem_set(trans) = set;
/*
 * nft_set_elem_init - allocate and populate a set element.
 * @set: set the element belongs to (supplies elemsize, klen and dlen)
 * @tmpl: extension template describing which extensions are present
 * @key: key bytes, set->klen long
 * @data: data bytes, set->dlen long; only read if the DATA extension exists
 * @timeout: per-element timeout stored in the TIMEOUT extension, if present
 * @gfp: allocation flags
 *
 * The element is a single zeroed allocation of the backend's element size
 * plus the template's extension area.
 */
3725 void *nft_set_elem_init(const struct nft_set *set,
3726 const struct nft_set_ext_tmpl *tmpl,
3727 const u32 *key, const u32 *data,
3728 u64 timeout, gfp_t gfp)
3730 struct nft_set_ext *ext;
3733 elem = kzalloc(set->ops->elemsize + tmpl->len, gfp);
3737 ext = nft_set_elem_ext(set, elem);
3738 nft_set_ext_init(ext, tmpl);
3740 memcpy(nft_set_ext_key(ext), key, set->klen);
3741 if (nft_set_ext_exists(ext, NFT_SET_EXT_DATA))
3742 memcpy(nft_set_ext_data(ext), data, set->dlen);
3743 if (nft_set_ext_exists(ext, NFT_SET_EXT_EXPIRATION))
3744 *nft_set_ext_expiration(ext) =
3746 if (nft_set_ext_exists(ext, NFT_SET_EXT_TIMEOUT))
3747 *nft_set_ext_timeout(ext) = timeout;
/*
 * nft_set_elem_destroy - release the resources held by a set element.
 *
 * Releases the key and, if present, the data; destroys the expression
 * extension only when destroy_expr is set; and drops the use count of a
 * referenced object.
 */
3752 void nft_set_elem_destroy(const struct nft_set *set, void *elem,
3755 struct nft_set_ext *ext = nft_set_elem_ext(set, elem);
3757 nft_data_release(nft_set_ext_key(ext), NFT_DATA_VALUE);
3758 if (nft_set_ext_exists(ext, NFT_SET_EXT_DATA))
3759 nft_data_release(nft_set_ext_data(ext), set->dtype);
3760 if (destroy_expr && nft_set_ext_exists(ext, NFT_SET_EXT_EXPR))
3761 nf_tables_expr_destroy(NULL, nft_set_ext_expr(ext));
3762 if (nft_set_ext_exists(ext, NFT_SET_EXT_OBJREF))
3763 (*nft_set_ext_obj(ext))->use--;
3766 EXPORT_SYMBOL_GPL(nft_set_elem_destroy);
3768 /* Only called from commit path, nft_set_elem_deactivate() already deals with
3769 * the refcounting from the preparation phase.
/* Destroys the element's expression extension when one is present; unlike
 * nft_set_elem_destroy() it does not touch key, data or object references.
 */
3771 static void nf_tables_set_elem_destroy(const struct nft_set *set, void *elem)
3773 struct nft_set_ext *ext = nft_set_elem_ext(set, elem);
3775 if (nft_set_ext_exists(ext, NFT_SET_EXT_EXPR))
3776 nf_tables_expr_destroy(NULL, nft_set_ext_expr(ext));
/*
 * nft_setelem_parse_flags - decode and validate element flags.
 *
 * Reads the big-endian u32 from @attr into *flags. Two conditions are
 * checked: any bit other than NFT_SET_ELEM_INTERVAL_END, and
 * NFT_SET_ELEM_INTERVAL_END on a set that lacks NFT_SET_INTERVAL.
 */
3780 static int nft_setelem_parse_flags(const struct nft_set *set,
3781 const struct nlattr *attr, u32 *flags)
3786 *flags = ntohl(nla_get_be32(attr));
3787 if (*flags & ~NFT_SET_ELEM_INTERVAL_END)
3789 if (!(set->flags & NFT_SET_INTERVAL) &&
3790 *flags & NFT_SET_ELEM_INTERVAL_END)
/*
 * nft_add_set_elem - parse one element attribute and insert it into a set.
 *
 * Parses the nested NFTA_SET_ELEM_* attributes, builds an extension
 * template (flags, key, expiration/timeout, object reference, data,
 * userdata), allocates the element, allocates an NFT_MSG_NEWSETELEM
 * transaction and calls the backend's ->insert(). An -EEXIST result is
 * examined by comparing the new element's data/object reference against
 * the existing one. On success the transaction is appended to the commit
 * list; the tail of the function releases key/data on error.
 */
3796 static int nft_add_set_elem(struct nft_ctx *ctx, struct nft_set *set,
3797 const struct nlattr *attr, u32 nlmsg_flags)
3799 struct nlattr *nla[NFTA_SET_ELEM_MAX + 1];
3800 u8 genmask = nft_genmask_next(ctx->net);
3801 struct nft_data_desc d1, d2;
3802 struct nft_set_ext_tmpl tmpl;
3803 struct nft_set_ext *ext, *ext2;
3804 struct nft_set_elem elem;
3805 struct nft_set_binding *binding;
3806 struct nft_object *obj = NULL;
3807 struct nft_userdata *udata;
3808 struct nft_data data;
3809 enum nft_registers dreg;
3810 struct nft_trans *trans;
3816 err = nla_parse_nested(nla, NFTA_SET_ELEM_MAX, attr,
3817 nft_set_elem_policy, NULL);
3821 if (nla[NFTA_SET_ELEM_KEY] == NULL)
3824 nft_set_ext_prepare(&tmpl);
3826 err = nft_setelem_parse_flags(set, nla[NFTA_SET_ELEM_FLAGS], &flags);
3830 nft_set_ext_add(&tmpl, NFT_SET_EXT_FLAGS);
/* For maps, the presence of data is checked against whether the element
 * is an interval end.
 */
3832 if (set->flags & NFT_SET_MAP) {
3833 if (nla[NFTA_SET_ELEM_DATA] == NULL &&
3834 !(flags & NFT_SET_ELEM_INTERVAL_END))
3836 if (nla[NFTA_SET_ELEM_DATA] != NULL &&
3837 flags & NFT_SET_ELEM_INTERVAL_END)
3840 if (nla[NFTA_SET_ELEM_DATA] != NULL)
/* An explicit element timeout requires a timeout-capable set; otherwise
 * such sets fall back to the set-wide default.
 */
3845 if (nla[NFTA_SET_ELEM_TIMEOUT] != NULL) {
3846 if (!(set->flags & NFT_SET_TIMEOUT))
3848 timeout = msecs_to_jiffies(be64_to_cpu(nla_get_be64(
3849 nla[NFTA_SET_ELEM_TIMEOUT])));
3850 } else if (set->flags & NFT_SET_TIMEOUT) {
3851 timeout = set->timeout;
3854 err = nft_data_init(ctx, &elem.key.val, sizeof(elem.key), &d1,
3855 nla[NFTA_SET_ELEM_KEY]);
3859 if (d1.type != NFT_DATA_VALUE || d1.len != set->klen)
3862 nft_set_ext_add_length(&tmpl, NFT_SET_EXT_KEY, d1.len);
/* The per-element TIMEOUT extension is only added when it differs from
 * the set's default.
 */
3864 nft_set_ext_add(&tmpl, NFT_SET_EXT_EXPIRATION);
3865 if (timeout != set->timeout)
3866 nft_set_ext_add(&tmpl, NFT_SET_EXT_TIMEOUT);
3869 if (nla[NFTA_SET_ELEM_OBJREF] != NULL) {
3870 if (!(set->flags & NFT_SET_OBJECT)) {
3874 obj = nf_tables_obj_lookup(ctx->table, nla[NFTA_SET_ELEM_OBJREF],
3875 set->objtype, genmask);
3880 nft_set_ext_add(&tmpl, NFT_SET_EXT_OBJREF);
3883 if (nla[NFTA_SET_ELEM_DATA] != NULL) {
3884 err = nft_data_init(ctx, &data, sizeof(data), &d2,
3885 nla[NFTA_SET_ELEM_DATA]);
3890 if (set->dtype != NFT_DATA_VERDICT && d2.len != set->dlen)
/* Validate the new data against every chain the map is bound to. */
3893 dreg = nft_type_to_reg(set->dtype);
3894 list_for_each_entry(binding, &set->bindings, list) {
3895 struct nft_ctx bind_ctx = {
3898 .table = ctx->table,
3899 .chain = (struct nft_chain *)binding->chain,
3902 if (!(binding->flags & NFT_SET_MAP))
3905 err = nft_validate_register_store(&bind_ctx, dreg,
3912 nft_set_ext_add_length(&tmpl, NFT_SET_EXT_DATA, d2.len);
3915 /* The full maximum length of userdata can exceed the maximum
3916 * offset value (U8_MAX) for following extensions, therefore it
3917 * must be the last extension added.
3920 if (nla[NFTA_SET_ELEM_USERDATA] != NULL) {
3921 ulen = nla_len(nla[NFTA_SET_ELEM_USERDATA]);
3923 nft_set_ext_add_length(&tmpl, NFT_SET_EXT_USERDATA,
3928 elem.priv = nft_set_elem_init(set, &tmpl, elem.key.val.data, data.data,
3929 timeout, GFP_KERNEL);
3930 if (elem.priv == NULL)
3933 ext = nft_set_elem_ext(set, elem.priv);
3935 *nft_set_ext_flags(ext) = flags;
3937 udata = nft_set_ext_userdata(ext);
3938 udata->len = ulen - 1;
3939 nla_memcpy(&udata->data, nla[NFTA_SET_ELEM_USERDATA], ulen);
3942 *nft_set_ext_obj(ext) = obj;
3946 trans = nft_trans_elem_alloc(ctx, NFT_MSG_NEWSETELEM, set);
3950 ext->genmask = nft_genmask_cur(ctx->net) | NFT_SET_ELEM_BUSY_MASK;
3951 err = set->ops->insert(ctx->net, set, &elem, &ext2);
3953 if (err == -EEXIST) {
3954 if (nft_set_ext_exists(ext, NFT_SET_EXT_DATA) ^
3955 nft_set_ext_exists(ext2, NFT_SET_EXT_DATA) ||
3956 nft_set_ext_exists(ext, NFT_SET_EXT_OBJREF) ^
3957 nft_set_ext_exists(ext2, NFT_SET_EXT_OBJREF))
3959 if ((nft_set_ext_exists(ext, NFT_SET_EXT_DATA) &&
3960 nft_set_ext_exists(ext2, NFT_SET_EXT_DATA) &&
3961 memcmp(nft_set_ext_data(ext),
3962 nft_set_ext_data(ext2), set->dlen) != 0) ||
3963 (nft_set_ext_exists(ext, NFT_SET_EXT_OBJREF) &&
3964 nft_set_ext_exists(ext2, NFT_SET_EXT_OBJREF) &&
3965 *nft_set_ext_obj(ext) != *nft_set_ext_obj(ext2)))
3967 else if (!(nlmsg_flags & NLM_F_EXCL))
3974 !atomic_add_unless(&set->nelems, 1, set->size + set->ndeact)) {
3979 nft_trans_elem(trans) = elem;
3980 list_add_tail(&trans->list, &ctx->net->nft.commit_list);
3984 set->ops->remove(ctx->net, set, &elem);
3990 if (nla[NFTA_SET_ELEM_DATA] != NULL)
3991 nft_data_release(&data, d2.type);
3993 nft_data_release(&elem.key.val, d1.type);
/*
 * nf_tables_newsetelem - netlink handler that adds elements to a set.
 *
 * Requires NFTA_SET_ELEM_LIST_ELEMENTS. The set is looked up by name in the
 * next generation and, when NFTA_SET_ELEM_LIST_SET_ID is supplied, by its
 * transaction ID. A bound constant set is special-cased before each nested
 * element attribute is handed to nft_add_set_elem().
 */
3998 static int nf_tables_newsetelem(struct net *net, struct sock *nlsk,
3999 struct sk_buff *skb, const struct nlmsghdr *nlh,
4000 const struct nlattr * const nla[],
4001 struct netlink_ext_ack *extack)
4003 u8 genmask = nft_genmask_next(net);
4004 const struct nlattr *attr;
4005 struct nft_set *set;
4009 if (nla[NFTA_SET_ELEM_LIST_ELEMENTS] == NULL)
4012 err = nft_ctx_init_from_elemattr(&ctx, net, skb, nlh, nla, genmask);
4016 set = nf_tables_set_lookup(ctx.table, nla[NFTA_SET_ELEM_LIST_SET],
4019 if (nla[NFTA_SET_ELEM_LIST_SET_ID]) {
4020 set = nf_tables_set_lookup_byid(net,
4021 nla[NFTA_SET_ELEM_LIST_SET_ID],
4025 return PTR_ERR(set);
4028 if (!list_empty(&set->bindings) && set->flags & NFT_SET_CONSTANT)
4031 nla_for_each_nested(attr, nla[NFTA_SET_ELEM_LIST_ELEMENTS], rem) {
4032 err = nft_add_set_elem(&ctx, set, attr, nlh->nlmsg_flags);
4040 * nft_data_hold - hold a nft_data item
4042 * @data: struct nft_data to hold
4043 * @type: type of data
4045 * Hold a nft_data item. NFT_DATA_VALUE types can be silently discarded,
4046 * NFT_DATA_VERDICT bumps the reference to chains in case of NFT_JUMP and
4047 * NFT_GOTO verdicts. This function must be called on active data objects
4048 * from the second phase of the commit protocol.
/* For verdict data, dispatches on the verdict code and bumps the use count
 * of the chain the verdict refers to; other data types are left untouched.
 */
4050 static void nft_data_hold(const struct nft_data *data, enum nft_data_types type)
4052 if (type == NFT_DATA_VERDICT) {
4053 switch (data->verdict.code) {
4056 data->verdict.chain->use++;
/*
 * nft_set_elem_activate - take the references an element holds: the data
 * (via nft_data_hold()) and the use count of a referenced object. This is
 * the counterpart of nft_set_elem_deactivate().
 */
4062 static void nft_set_elem_activate(const struct net *net,
4063 const struct nft_set *set,
4064 struct nft_set_elem *elem)
4066 const struct nft_set_ext *ext = nft_set_elem_ext(set, elem->priv);
4068 if (nft_set_ext_exists(ext, NFT_SET_EXT_DATA))
4069 nft_data_hold(nft_set_ext_data(ext), set->dtype);
4070 if (nft_set_ext_exists(ext, NFT_SET_EXT_OBJREF))
4071 (*nft_set_ext_obj(ext))->use++;
/*
 * nft_set_elem_deactivate - drop the references an element holds: the data
 * (via nft_data_release()) and the use count of a referenced object. This
 * is the counterpart of nft_set_elem_activate().
 */
4074 static void nft_set_elem_deactivate(const struct net *net,
4075 const struct nft_set *set,
4076 struct nft_set_elem *elem)
4078 const struct nft_set_ext *ext = nft_set_elem_ext(set, elem->priv);
4080 if (nft_set_ext_exists(ext, NFT_SET_EXT_DATA))
4081 nft_data_release(nft_set_ext_data(ext), set->dtype);
4082 if (nft_set_ext_exists(ext, NFT_SET_EXT_OBJREF))
4083 (*nft_set_ext_obj(ext))->use--;
/*
 * nft_del_setelem - parse one element attribute and queue its deletion.
 *
 * Builds a temporary element holding only the flags and key, allocates an
 * NFT_MSG_DELSETELEM transaction, asks the backend to ->deactivate() the
 * matching element, drops that element's references with
 * nft_set_elem_deactivate() and appends the transaction to the commit list.
 */
4086 static int nft_del_setelem(struct nft_ctx *ctx, struct nft_set *set,
4087 const struct nlattr *attr)
4089 struct nlattr *nla[NFTA_SET_ELEM_MAX + 1];
4090 struct nft_set_ext_tmpl tmpl;
4091 struct nft_data_desc desc;
4092 struct nft_set_elem elem;
4093 struct nft_set_ext *ext;
4094 struct nft_trans *trans;
4099 err = nla_parse_nested(nla, NFTA_SET_ELEM_MAX, attr,
4100 nft_set_elem_policy, NULL);
4105 if (nla[NFTA_SET_ELEM_KEY] == NULL)
4108 nft_set_ext_prepare(&tmpl);
4110 err = nft_setelem_parse_flags(set, nla[NFTA_SET_ELEM_FLAGS], &flags);
4114 nft_set_ext_add(&tmpl, NFT_SET_EXT_FLAGS);
4116 err = nft_data_init(ctx, &elem.key.val, sizeof(elem.key), &desc,
4117 nla[NFTA_SET_ELEM_KEY]);
4122 if (desc.type != NFT_DATA_VALUE || desc.len != set->klen)
4125 nft_set_ext_add_length(&tmpl, NFT_SET_EXT_KEY, desc.len);
/* No data and a zero timeout: this element only serves as a lookup key. */
4128 elem.priv = nft_set_elem_init(set, &tmpl, elem.key.val.data, NULL, 0,
4130 if (elem.priv == NULL)
4133 ext = nft_set_elem_ext(set, elem.priv);
4135 *nft_set_ext_flags(ext) = flags;
4137 trans = nft_trans_elem_alloc(ctx, NFT_MSG_DELSETELEM, set);
4138 if (trans == NULL) {
4143 priv = set->ops->deactivate(ctx->net, set, &elem);
4151 nft_set_elem_deactivate(ctx->net, set, &elem);
4153 nft_trans_elem(trans) = elem;
4154 list_add_tail(&trans->list, &ctx->net->nft.commit_list);
4162 nft_data_release(&elem.key.val, desc.type);
/*
 * nft_flush_set - set walk callback that queues deletion of one element.
 *
 * Allocates an NFT_MSG_DELSETELEM transaction with GFP_ATOMIC, asks the
 * backend to ->flush() the element and, when that succeeds, records the set
 * and element in the transaction and appends it to the commit list.
 */
4167 static int nft_flush_set(const struct nft_ctx *ctx,
4168 struct nft_set *set,
4169 const struct nft_set_iter *iter,
4170 struct nft_set_elem *elem)
4172 struct nft_trans *trans;
4175 trans = nft_trans_alloc_gfp(ctx, NFT_MSG_DELSETELEM,
4176 sizeof(struct nft_trans_elem), GFP_ATOMIC);
4180 if (!set->ops->flush(ctx->net, set, elem->priv)) {
4186 nft_trans_elem_set(trans) = set;
4187 nft_trans_elem(trans) = *elem;
4188 list_add_tail(&trans->list, &ctx->net->nft.commit_list);
/*
 * nf_tables_delsetelem - netlink handler that removes elements from a set.
 *
 * Without NFTA_SET_ELEM_LIST_ELEMENTS the whole set is flushed by walking
 * it with nft_flush_set(); otherwise each nested element attribute is
 * passed to nft_del_setelem(). A bound constant set is special-cased first.
 */
4196 static int nf_tables_delsetelem(struct net *net, struct sock *nlsk,
4197 struct sk_buff *skb, const struct nlmsghdr *nlh,
4198 const struct nlattr * const nla[],
4199 struct netlink_ext_ack *extack)
4201 u8 genmask = nft_genmask_next(net);
4202 const struct nlattr *attr;
4203 struct nft_set *set;
4207 err = nft_ctx_init_from_elemattr(&ctx, net, skb, nlh, nla, genmask);
4211 set = nf_tables_set_lookup(ctx.table, nla[NFTA_SET_ELEM_LIST_SET],
4214 return PTR_ERR(set);
4215 if (!list_empty(&set->bindings) && set->flags & NFT_SET_CONSTANT)
4218 if (nla[NFTA_SET_ELEM_LIST_ELEMENTS] == NULL) {
4219 struct nft_set_iter iter = {
4221 .fn = nft_flush_set,
4223 set->ops->walk(&ctx, set, &iter);
4228 nla_for_each_nested(attr, nla[NFTA_SET_ELEM_LIST_ELEMENTS], rem) {
4229 err = nft_del_setelem(&ctx, set, attr);
/*
 * nft_set_gc_batch_release - RCU callback that destroys every element
 * collected in a garbage-collection batch, including their expressions
 * (destroy_expr is passed as true).
 */
4238 void nft_set_gc_batch_release(struct rcu_head *rcu)
4240 struct nft_set_gc_batch *gcb;
4243 gcb = container_of(rcu, struct nft_set_gc_batch, head.rcu);
4244 for (i = 0; i < gcb->head.cnt; i++)
4245 nft_set_elem_destroy(gcb->head.set, gcb->elems[i], true);
4248 EXPORT_SYMBOL_GPL(nft_set_gc_batch_release);
/*
 * nft_set_gc_batch_alloc - allocate a zeroed garbage-collection batch and
 * record the set it belongs to.
 */
4250 struct nft_set_gc_batch *nft_set_gc_batch_alloc(const struct nft_set *set,
4253 struct nft_set_gc_batch *gcb;
4255 gcb = kzalloc(sizeof(*gcb), gfp);
4258 gcb->head.set = set;
4261 EXPORT_SYMBOL_GPL(nft_set_gc_batch_alloc);
4268 * nft_register_obj - register nf_tables stateful object type
4271 * Registers the object type for use with nf_tables. Returns zero on
4272 * success or a negative errno code otherwise.
/* Checks for the NFT_OBJECT_UNSPEC type, then adds the type to the global
 * nf_tables_objects list while holding the nftables nfnetlink subsystem lock.
 */
4274 int nft_register_obj(struct nft_object_type *obj_type)
4276 if (obj_type->type == NFT_OBJECT_UNSPEC)
4279 nfnl_lock(NFNL_SUBSYS_NFTABLES);
4280 list_add_rcu(&obj_type->list, &nf_tables_objects);
4281 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
4284 EXPORT_SYMBOL_GPL(nft_register_obj);
4287 * nft_unregister_obj - unregister nf_tables object type
4290 * Unregisters the object type for use with nf_tables.
/* Removes the type from the global list while holding the nftables
 * nfnetlink subsystem lock.
 */
4292 void nft_unregister_obj(struct nft_object_type *obj_type)
4294 nfnl_lock(NFNL_SUBSYS_NFTABLES);
4295 list_del_rcu(&obj_type->list);
4296 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
4298 EXPORT_SYMBOL_GPL(nft_unregister_obj);
/*
 * nf_tables_obj_lookup - find a stateful object in a table.
 *
 * An object matches when its name equals the string in @nla, its type
 * equals @objtype and it is active in @genmask. Returns ERR_PTR(-ENOENT)
 * when no object matches.
 */
4300 struct nft_object *nf_tables_obj_lookup(const struct nft_table *table,
4301 const struct nlattr *nla,
4302 u32 objtype, u8 genmask)
4304 struct nft_object *obj;
4306 list_for_each_entry(obj, &table->objects, list) {
4307 if (!nla_strcmp(nla, obj->name) &&
4308 objtype == obj->ops->type->type &&
4309 nft_active_genmask(obj, genmask))
4312 return ERR_PTR(-ENOENT);
4314 EXPORT_SYMBOL_GPL(nf_tables_obj_lookup);
/*
 * Netlink attribute policy for stateful object messages (NFTA_OBJ_*):
 * length-bounded table and object names, a u32 type and nested data.
 */
4316 static const struct nla_policy nft_obj_policy[NFTA_OBJ_MAX + 1] = {
4317 [NFTA_OBJ_TABLE] = { .type = NLA_STRING,
4318 .len = NFT_TABLE_MAXNAMELEN - 1 },
4319 [NFTA_OBJ_NAME] = { .type = NLA_STRING,
4320 .len = NFT_OBJ_MAXNAMELEN - 1 },
4321 [NFTA_OBJ_TYPE] = { .type = NLA_U32 },
4322 [NFTA_OBJ_DATA] = { .type = NLA_NESTED },
/*
 * nft_obj_init - allocate and initialise a stateful object of @type.
 *
 * The type-specific attributes are parsed from the nested @attr into a
 * table sized by type->maxattr (the table is zeroed instead on another
 * path, presumably when @attr is absent - TODO confirm). If the type
 * provides select_ops() it is called with the parsed attributes. The
 * object is allocated with ops->size extra bytes and handed to
 * ops->init(); failures are returned as ERR_PTR().
 */
4325 static struct nft_object *nft_obj_init(const struct nft_ctx *ctx,
4326 const struct nft_object_type *type,
4327 const struct nlattr *attr)
4329 struct nlattr *tb[type->maxattr + 1];
4330 const struct nft_object_ops *ops;
4331 struct nft_object *obj;
4335 err = nla_parse_nested(tb, type->maxattr, attr, type->policy,
4340 memset(tb, 0, sizeof(tb[0]) * (type->maxattr + 1));
4343 if (type->select_ops) {
4344 ops = type->select_ops(ctx, (const struct nlattr * const *)tb);
4354 obj = kzalloc(sizeof(*obj) + ops->size, GFP_KERNEL);
4358 err = ops->init(ctx, (const struct nlattr * const *)tb, obj);
4368 return ERR_PTR(err);
/*
 * nft_object_dump - emit an object's type-specific state as a nested
 * attribute of type @attr, using the object's ->dump() hook; @reset is
 * passed through to that hook.
 */
4371 static int nft_object_dump(struct sk_buff *skb, unsigned int attr,
4372 struct nft_object *obj, bool reset)
4374 struct nlattr *nest;
4376 nest = nla_nest_start(skb, attr);
4378 goto nla_put_failure;
4379 if (obj->ops->dump(skb, obj, reset) < 0)
4380 goto nla_put_failure;
4381 nla_nest_end(skb, nest);
/* Searches the registered object types for one whose type equals @objtype;
 * takes no module reference.
 */
4388 static const struct nft_object_type *__nft_obj_type_get(u32 objtype)
4390 const struct nft_object_type *type;
4392 list_for_each_entry(type, &nf_tables_objects, list) {
4393 if (objtype == type->type)
/*
 * nft_obj_type_get - look up an object type and pin its owning module.
 *
 * With CONFIG_MODULES, a miss triggers request_module("nft-obj-%u") with
 * the nftables subsystem lock dropped around the call; if the type has
 * appeared afterwards -EAGAIN is returned. Otherwise the result is -ENOENT.
 */
4399 static const struct nft_object_type *nft_obj_type_get(u32 objtype)
4401 const struct nft_object_type *type;
4403 type = __nft_obj_type_get(objtype);
4404 if (type != NULL && try_module_get(type->owner))
4407 #ifdef CONFIG_MODULES
4409 nfnl_unlock(NFNL_SUBSYS_NFTABLES);
4410 request_module("nft-obj-%u", objtype);
4411 nfnl_lock(NFNL_SUBSYS_NFTABLES);
4412 if (__nft_obj_type_get(objtype))
4413 return ERR_PTR(-EAGAIN);
4416 return ERR_PTR(-ENOENT);
/*
 * nf_tables_newobj - netlink handler that creates a stateful object.
 *
 * Checks for the type, name and data attributes, resolves family and
 * table, and looks for an existing object of that name and type (NLM_F_EXCL
 * is examined). It then pins the object type, initialises the object from
 * NFTA_OBJ_DATA, duplicates the name, queues an NFT_MSG_NEWOBJ transaction
 * and links the object into table->objects. The error tail invokes the
 * object's ->destroy() hook, if any, and drops the module reference.
 */
4419 static int nf_tables_newobj(struct net *net, struct sock *nlsk,
4420 struct sk_buff *skb, const struct nlmsghdr *nlh,
4421 const struct nlattr * const nla[],
4422 struct netlink_ext_ack *extack)
4424 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
4425 const struct nft_object_type *type;
4426 u8 genmask = nft_genmask_next(net);
4427 int family = nfmsg->nfgen_family;
4428 struct nft_af_info *afi;
4429 struct nft_table *table;
4430 struct nft_object *obj;
4435 if (!nla[NFTA_OBJ_TYPE] ||
4436 !nla[NFTA_OBJ_NAME] ||
4437 !nla[NFTA_OBJ_DATA])
4440 afi = nf_tables_afinfo_lookup(net, family, true);
4442 return PTR_ERR(afi);
4444 table = nf_tables_table_lookup(afi, nla[NFTA_OBJ_TABLE], genmask);
4446 return PTR_ERR(table);
4448 objtype = ntohl(nla_get_be32(nla[NFTA_OBJ_TYPE]));
4449 obj = nf_tables_obj_lookup(table, nla[NFTA_OBJ_NAME], objtype, genmask);
4456 if (nlh->nlmsg_flags & NLM_F_EXCL)
4462 nft_ctx_init(&ctx, net, skb, nlh, afi, table, NULL, nla);
4464 type = nft_obj_type_get(objtype);
4466 return PTR_ERR(type);
4468 obj = nft_obj_init(&ctx, type, nla[NFTA_OBJ_DATA]);
4474 obj->name = nla_strdup(nla[NFTA_OBJ_NAME], GFP_KERNEL);
4480 err = nft_trans_obj_add(&ctx, NFT_MSG_NEWOBJ, obj);
4484 list_add_tail_rcu(&obj->list, &table->objects);
4490 if (obj->ops->destroy)
4491 obj->ops->destroy(obj);
4494 module_put(type->owner);
/*
 * nf_tables_fill_obj_info - build a netlink message describing one object.
 *
 * Writes the nfgenmsg header followed by the table name, object name, type,
 * use count and the nested type-specific data (@reset is forwarded to the
 * object's dump hook). On failure the partial message is trimmed from @skb.
 */
4498 static int nf_tables_fill_obj_info(struct sk_buff *skb, struct net *net,
4499 u32 portid, u32 seq, int event, u32 flags,
4500 int family, const struct nft_table *table,
4501 struct nft_object *obj, bool reset)
4503 struct nfgenmsg *nfmsg;
4504 struct nlmsghdr *nlh;
4506 event = nfnl_msg_type(NFNL_SUBSYS_NFTABLES, event);
4507 nlh = nlmsg_put(skb, portid, seq, event, sizeof(struct nfgenmsg), flags);
4509 goto nla_put_failure;
4511 nfmsg = nlmsg_data(nlh);
4512 nfmsg->nfgen_family = family;
4513 nfmsg->version = NFNETLINK_V0;
4514 nfmsg->res_id = htons(net->nft.base_seq & 0xffff);
4516 if (nla_put_string(skb, NFTA_OBJ_TABLE, table->name) ||
4517 nla_put_string(skb, NFTA_OBJ_NAME, obj->name) ||
4518 nla_put_be32(skb, NFTA_OBJ_TYPE, htonl(obj->ops->type->type)) ||
4519 nla_put_be32(skb, NFTA_OBJ_USE, htonl(obj->use)) ||
4520 nft_object_dump(skb, NFTA_OBJ_DATA, obj, reset))
4521 goto nla_put_failure;
4523 nlmsg_end(skb, nlh);
4527 nlmsg_trim(skb, nlh);
/*
 * Optional filter for object dumps; its users in this file read a table
 * name (->table) and an object type (->type).
 */
4531 struct nft_obj_filter {
/*
 * nf_tables_dump_obj - netlink dump callback that lists stateful objects.
 *
 * Iterates every family (restricted to the requested one unless it is
 * NFPROTO_UNSPEC), table and object using RCU list iteration, considering
 * only objects active in the current generation. cb->data may hold an
 * optional nft_obj_filter (it can be NULL) restricting the dump by table
 * name and/or object type. NFT_MSG_GETOBJ_RESET requests are detected up
 * front, and a reset flag is passed on to nf_tables_fill_obj_info().
 */
4536 static int nf_tables_dump_obj(struct sk_buff *skb, struct netlink_callback *cb)
4538 const struct nfgenmsg *nfmsg = nlmsg_data(cb->nlh);
4539 const struct nft_af_info *afi;
4540 const struct nft_table *table;
4541 unsigned int idx = 0, s_idx = cb->args[0];
4542 struct nft_obj_filter *filter = cb->data;
4543 struct net *net = sock_net(skb->sk);
4544 int family = nfmsg->nfgen_family;
4545 struct nft_object *obj;
4548 if (NFNL_MSG_TYPE(cb->nlh->nlmsg_type) == NFT_MSG_GETOBJ_RESET)
4552 cb->seq = net->nft.base_seq;
4554 list_for_each_entry_rcu(afi, &net->nft.af_info, list) {
4555 if (family != NFPROTO_UNSPEC && family != afi->family)
4558 list_for_each_entry_rcu(table, &afi->tables, list) {
4559 list_for_each_entry_rcu(obj, &table->objects, list) {
4560 if (!nft_is_active(net, obj))
4565 memset(&cb->args[1], 0,
4566 sizeof(cb->args) - sizeof(cb->args[0]));
4567 if (filter && filter->table[0] &&
4568 strcmp(filter->table, table->name))
4571 filter->type != NFT_OBJECT_UNSPEC &&
4572 obj->ops->type->type != filter->type)
4575 if (nf_tables_fill_obj_info(skb, net, NETLINK_CB(cb->skb).portid,
4578 NLM_F_MULTI | NLM_F_APPEND,
4579 afi->family, table, obj, reset) < 0)
4582 nl_dump_check_consistent(cb, nlmsg_hdr(skb));
4595 static int nf_tables_dump_obj_done(struct netlink_callback *cb)
4597 struct nft_obj_filter *filter = cb->data;
4599 kfree(filter->table);
/*
 * nft_obj_filter_alloc - build a dump filter from the request attributes
 *
 * The filter is zero-allocated, so ->table stays NULL unless NFTA_OBJ_TABLE
 * is present and ->type stays 0 unless NFTA_OBJ_TYPE is present. The table
 * name is duplicated with nla_strdup().
 *
 * Returns ERR_PTR(-ENOMEM) if either allocation fails.
 */
4605 static struct nft_obj_filter *
4606 nft_obj_filter_alloc(const struct nlattr * const nla[])
4608 struct nft_obj_filter *filter;
4610 filter = kzalloc(sizeof(*filter), GFP_KERNEL);
4612 return ERR_PTR(-ENOMEM);
4614 if (nla[NFTA_OBJ_TABLE]) {
4615 filter->table = nla_strdup(nla[NFTA_OBJ_TABLE], GFP_KERNEL);
4616 if (!filter->table) {
4618 return ERR_PTR(-ENOMEM);
4621 if (nla[NFTA_OBJ_TYPE])
4622 filter->type = ntohl(nla_get_be32(nla[NFTA_OBJ_TYPE]));
/*
 * nf_tables_getobj - handle NFT_MSG_GETOBJ and NFT_MSG_GETOBJ_RESET
 *
 * Two modes:
 *  - NLM_F_DUMP set: start a netlink dump driven by nf_tables_dump_obj() and
 *    nf_tables_dump_obj_done(). A filter is allocated only when the request
 *    carries NFTA_OBJ_TABLE or NFTA_OBJ_TYPE.
 *  - otherwise: NFTA_OBJ_NAME and NFTA_OBJ_TYPE are mandatory. The address
 *    family, table and object are looked up in the current generation, the
 *    object is serialised into a freshly allocated skb and unicast back to
 *    the requesting port.
 *
 * Lookup failures are propagated with PTR_ERR().
 */
4627 static int nf_tables_getobj(struct net *net, struct sock *nlsk,
4628 struct sk_buff *skb, const struct nlmsghdr *nlh,
4629 const struct nlattr * const nla[],
4630 struct netlink_ext_ack *extack)
4632 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
4633 u8 genmask = nft_genmask_cur(net);
4634 int family = nfmsg->nfgen_family;
4635 const struct nft_af_info *afi;
4636 const struct nft_table *table;
4637 struct nft_object *obj;
4638 struct sk_buff *skb2;
4643 if (nlh->nlmsg_flags & NLM_F_DUMP) {
4644 struct netlink_dump_control c = {
4645 .dump = nf_tables_dump_obj,
4646 .done = nf_tables_dump_obj_done,
4649 if (nla[NFTA_OBJ_TABLE] ||
4650 nla[NFTA_OBJ_TYPE]) {
4651 struct nft_obj_filter *filter;
4653 filter = nft_obj_filter_alloc(nla);
4659 return netlink_dump_start(nlsk, skb, nlh, &c);
/* Single-object request: both the name and the type must be given. */
4662 if (!nla[NFTA_OBJ_NAME] ||
4663 !nla[NFTA_OBJ_TYPE])
4666 afi = nf_tables_afinfo_lookup(net, family, false);
4668 return PTR_ERR(afi);
4670 table = nf_tables_table_lookup(afi, nla[NFTA_OBJ_TABLE], genmask);
4672 return PTR_ERR(table);
4674 objtype = ntohl(nla_get_be32(nla[NFTA_OBJ_TYPE]));
4675 obj = nf_tables_obj_lookup(table, nla[NFTA_OBJ_NAME], objtype, genmask);
4677 return PTR_ERR(obj);
4679 skb2 = alloc_skb(NLMSG_GOODSIZE, GFP_KERNEL);
4683 if (NFNL_MSG_TYPE(nlh->nlmsg_type) == NFT_MSG_GETOBJ_RESET)
4686 err = nf_tables_fill_obj_info(skb2, net, NETLINK_CB(skb).portid,
4687 nlh->nlmsg_seq, NFT_MSG_NEWOBJ, 0,
4688 family, table, obj, reset);
4692 return nlmsg_unicast(nlsk, skb2, NETLINK_CB(skb).portid);
/*
 * nft_obj_destroy - tear down a stateful object
 *
 * Calls the type-specific ->destroy hook when one is provided and drops the
 * module reference held on the object type's owner.
 */
4698 static void nft_obj_destroy(struct nft_object *obj)
4700 if (obj->ops->destroy)
4701 obj->ops->destroy(obj);
4703 module_put(obj->ops->type->owner);
/*
 * nf_tables_delobj - handle NFT_MSG_DELOBJ
 *
 * Requires NFTA_OBJ_TYPE and NFTA_OBJ_NAME. Looks up the address family,
 * table and object using the next-generation mask, then hands the object to
 * nft_delobj() with a context built by nft_ctx_init().
 *
 * Lookup failures are propagated with PTR_ERR(); otherwise the result of
 * nft_delobj() is returned.
 */
4708 static int nf_tables_delobj(struct net *net, struct sock *nlsk,
4709 struct sk_buff *skb, const struct nlmsghdr *nlh,
4710 const struct nlattr * const nla[],
4711 struct netlink_ext_ack *extack)
4713 const struct nfgenmsg *nfmsg = nlmsg_data(nlh);
4714 u8 genmask = nft_genmask_next(net);
4715 int family = nfmsg->nfgen_family;
4716 struct nft_af_info *afi;
4717 struct nft_table *table;
4718 struct nft_object *obj;
4722 if (!nla[NFTA_OBJ_TYPE] ||
4723 !nla[NFTA_OBJ_NAME])
4726 afi = nf_tables_afinfo_lookup(net, family, true);
4728 return PTR_ERR(afi);
4730 table = nf_tables_table_lookup(afi, nla[NFTA_OBJ_TABLE], genmask);
4732 return PTR_ERR(table);
4734 objtype = ntohl(nla_get_be32(nla[NFTA_OBJ_TYPE]));
4735 obj = nf_tables_obj_lookup(table, nla[NFTA_OBJ_NAME], objtype, genmask);
4737 return PTR_ERR(obj);
4741 nft_ctx_init(&ctx, net, skb, nlh, afi, table, NULL, nla);
4743 return nft_delobj(&ctx, obj);
/*
 * nft_obj_notify - send an object event to NFNLGRP_NFTABLES
 *
 * Allocates a message with @gfp, fills it with nf_tables_fill_obj_info() and
 * sends it through nfnetlink_send(). The nfnetlink_has_listeners() test near
 * the top is part of an early-exit condition whose first half is not visible
 * here. The visible error path reports -ENOBUFS to the group via
 * nfnetlink_set_err().
 *
 * Exported for use by other modules.
 */
4746 void nft_obj_notify(struct net *net, struct nft_table *table,
4747 struct nft_object *obj, u32 portid, u32 seq, int event,
4748 int family, int report, gfp_t gfp)
4750 struct sk_buff *skb;
4754 !nfnetlink_has_listeners(net, NFNLGRP_NFTABLES))
4757 skb = nlmsg_new(NLMSG_GOODSIZE, gfp);
4761 err = nf_tables_fill_obj_info(skb, net, portid, seq, event, 0, family,
4768 nfnetlink_send(skb, net, portid, NFNLGRP_NFTABLES, report, gfp);
4771 nfnetlink_set_err(net, portid, NFNLGRP_NFTABLES, -ENOBUFS);
4773 EXPORT_SYMBOL_GPL(nft_obj_notify);
/*
 * Convenience wrapper: unpack the transaction context @ctx and forward to
 * nft_obj_notify() using GFP_KERNEL.
 */
4775 static void nf_tables_obj_notify(const struct nft_ctx *ctx,
4776 struct nft_object *obj, int event)
4778 nft_obj_notify(ctx->net, ctx->table, obj, ctx->portid, ctx->seq, event,
4779 ctx->afi->family, ctx->report, GFP_KERNEL);
/*
 * nf_tables_fill_gen_info - append an NFT_MSG_NEWGEN message to @skb
 *
 * The message carries the current generation id (net->nft.base_seq) together
 * with the pid and command name of the task executing this function.
 * The nfgenmsg header uses AF_UNSPEC as family.
 *
 * Any failed put jumps to nla_put_failure; the nlmsg_trim() call visible near
 * the end removes the partially built message again.
 */
4782 static int nf_tables_fill_gen_info(struct sk_buff *skb, struct net *net,
4783 u32 portid, u32 seq)
4785 struct nlmsghdr *nlh;
4786 struct nfgenmsg *nfmsg;
4787 char buf[TASK_COMM_LEN];
4788 int event = nfnl_msg_type(NFNL_SUBSYS_NFTABLES, NFT_MSG_NEWGEN);
4790 nlh = nlmsg_put(skb, portid, seq, event, sizeof(struct nfgenmsg), 0);
4792 goto nla_put_failure;
4794 nfmsg = nlmsg_data(nlh);
4795 nfmsg->nfgen_family = AF_UNSPEC;
4796 nfmsg->version = NFNETLINK_V0;
4797 nfmsg->res_id = htons(net->nft.base_seq & 0xffff);
4799 if (nla_put_be32(skb, NFTA_GEN_ID, htonl(net->nft.base_seq)) ||
4800 nla_put_be32(skb, NFTA_GEN_PROC_PID, htonl(task_pid_nr(current))) ||
4801 nla_put_string(skb, NFTA_GEN_PROC_NAME, get_task_comm(buf, current)))
4802 goto nla_put_failure;
4804 nlmsg_end(skb, nlh);
4808 nlmsg_trim(skb, nlh);
/*
 * nf_tables_gen_notify - announce a new ruleset generation
 *
 * Builds a generation message with nf_tables_fill_gen_info() and sends it to
 * NFNLGRP_NFTABLES on behalf of the sender of @skb. The visible error path
 * reports a failure to the group through nfnetlink_set_err().
 *
 * NOTE(review): the early-exit test below fires when a report WAS requested
 * and nobody listens; nft_obj_notify() appears to use the opposite polarity
 * for its report flag. Confirm which one is intended.
 */
4812 static void nf_tables_gen_notify(struct net *net, struct sk_buff *skb,
4815 struct nlmsghdr *nlh = nlmsg_hdr(skb);
4816 struct sk_buff *skb2;
4819 if (nlmsg_report(nlh) &&
4820 !nfnetlink_has_listeners(net, NFNLGRP_NFTABLES))
4823 skb2 = nlmsg_new(NLMSG_GOODSIZE, GFP_KERNEL);
4827 err = nf_tables_fill_gen_info(skb2, net, NETLINK_CB(skb).portid,
4834 nfnetlink_send(skb2, net, NETLINK_CB(skb).portid, NFNLGRP_NFTABLES,
4835 nlmsg_report(nlh), GFP_KERNEL);
4838 nfnetlink_set_err(net, NETLINK_CB(skb).portid, NFNLGRP_NFTABLES,
/*
 * nf_tables_getgen - handle NFT_MSG_GETGEN
 *
 * Allocates a reply skb, fills it with the current generation information
 * and unicasts it to the requesting port.
 */
4842 static int nf_tables_getgen(struct net *net, struct sock *nlsk,
4843 struct sk_buff *skb, const struct nlmsghdr *nlh,
4844 const struct nlattr * const nla[],
4845 struct netlink_ext_ack *extack)
4847 struct sk_buff *skb2;
4850 skb2 = alloc_skb(NLMSG_GOODSIZE, GFP_KERNEL);
4854 err = nf_tables_fill_gen_info(skb2, net, NETLINK_CB(skb).portid,
4859 return nlmsg_unicast(nlsk, skb2, NETLINK_CB(skb).portid);
/*
 * Dispatch table mapping each nf_tables message type to its handler, the
 * highest attribute number to parse and the attribute policy.
 *
 * In this table every NEW and DEL message uses .call_batch, while every GET
 * message (including NFT_MSG_GETOBJ_RESET) uses .call. NFT_MSG_GETOBJ and
 * NFT_MSG_GETOBJ_RESET share nf_tables_getobj().
 */
4865 static const struct nfnl_callback nf_tables_cb[NFT_MSG_MAX] = {
4866 [NFT_MSG_NEWTABLE] = {
4867 .call_batch = nf_tables_newtable,
4868 .attr_count = NFTA_TABLE_MAX,
4869 .policy = nft_table_policy,
4871 [NFT_MSG_GETTABLE] = {
4872 .call = nf_tables_gettable,
4873 .attr_count = NFTA_TABLE_MAX,
4874 .policy = nft_table_policy,
4876 [NFT_MSG_DELTABLE] = {
4877 .call_batch = nf_tables_deltable,
4878 .attr_count = NFTA_TABLE_MAX,
4879 .policy = nft_table_policy,
4881 [NFT_MSG_NEWCHAIN] = {
4882 .call_batch = nf_tables_newchain,
4883 .attr_count = NFTA_CHAIN_MAX,
4884 .policy = nft_chain_policy,
4886 [NFT_MSG_GETCHAIN] = {
4887 .call = nf_tables_getchain,
4888 .attr_count = NFTA_CHAIN_MAX,
4889 .policy = nft_chain_policy,
4891 [NFT_MSG_DELCHAIN] = {
4892 .call_batch = nf_tables_delchain,
4893 .attr_count = NFTA_CHAIN_MAX,
4894 .policy = nft_chain_policy,
4896 [NFT_MSG_NEWRULE] = {
4897 .call_batch = nf_tables_newrule,
4898 .attr_count = NFTA_RULE_MAX,
4899 .policy = nft_rule_policy,
4901 [NFT_MSG_GETRULE] = {
4902 .call = nf_tables_getrule,
4903 .attr_count = NFTA_RULE_MAX,
4904 .policy = nft_rule_policy,
4906 [NFT_MSG_DELRULE] = {
4907 .call_batch = nf_tables_delrule,
4908 .attr_count = NFTA_RULE_MAX,
4909 .policy = nft_rule_policy,
4911 [NFT_MSG_NEWSET] = {
4912 .call_batch = nf_tables_newset,
4913 .attr_count = NFTA_SET_MAX,
4914 .policy = nft_set_policy,
4916 [NFT_MSG_GETSET] = {
4917 .call = nf_tables_getset,
4918 .attr_count = NFTA_SET_MAX,
4919 .policy = nft_set_policy,
4921 [NFT_MSG_DELSET] = {
4922 .call_batch = nf_tables_delset,
4923 .attr_count = NFTA_SET_MAX,
4924 .policy = nft_set_policy,
4926 [NFT_MSG_NEWSETELEM] = {
4927 .call_batch = nf_tables_newsetelem,
4928 .attr_count = NFTA_SET_ELEM_LIST_MAX,
4929 .policy = nft_set_elem_list_policy,
4931 [NFT_MSG_GETSETELEM] = {
4932 .call = nf_tables_getsetelem,
4933 .attr_count = NFTA_SET_ELEM_LIST_MAX,
4934 .policy = nft_set_elem_list_policy,
4936 [NFT_MSG_DELSETELEM] = {
4937 .call_batch = nf_tables_delsetelem,
4938 .attr_count = NFTA_SET_ELEM_LIST_MAX,
4939 .policy = nft_set_elem_list_policy,
4941 [NFT_MSG_GETGEN] = {
4942 .call = nf_tables_getgen,
4944 [NFT_MSG_NEWOBJ] = {
4945 .call_batch = nf_tables_newobj,
4946 .attr_count = NFTA_OBJ_MAX,
4947 .policy = nft_obj_policy,
4949 [NFT_MSG_GETOBJ] = {
4950 .call = nf_tables_getobj,
4951 .attr_count = NFTA_OBJ_MAX,
4952 .policy = nft_obj_policy,
4954 [NFT_MSG_DELOBJ] = {
4955 .call_batch = nf_tables_delobj,
4956 .attr_count = NFTA_OBJ_MAX,
4957 .policy = nft_obj_policy,
4959 [NFT_MSG_GETOBJ_RESET] = {
4960 .call = nf_tables_getobj,
4961 .attr_count = NFTA_OBJ_MAX,
4962 .policy = nft_obj_policy,
/*
 * nft_chain_commit_update - apply a pending chain update at commit time
 *
 * If the transaction carries a new name it is copied over the chain's name.
 * For base chains the per-chain statistics are replaced and the policy stored
 * in the transaction is applied; the switch below selects which policy values
 * are accepted (its case labels are not visible here).
 *
 * NOTE(review): strcpy() is unbounded — confirm that the destination buffer
 * is always large enough for the new name.
 */
4966 static void nft_chain_commit_update(struct nft_trans *trans)
4968 struct nft_base_chain *basechain;
4970 if (nft_trans_chain_name(trans))
4971 strcpy(trans->ctx.chain->name, nft_trans_chain_name(trans));
4973 if (!nft_is_base_chain(trans->ctx.chain))
4976 basechain = nft_base_chain(trans->ctx.chain);
4977 nft_chain_stats_replace(basechain, nft_trans_chain_stats(trans));
4979 switch (nft_trans_chain_policy(trans)) {
4982 basechain->policy = nft_trans_chain_policy(trans);
/*
 * nf_tables_commit_release - destroy what a committed DEL transaction removed
 *
 * Dispatches on the transaction's message type and calls the matching
 * destructor for the table, chain, rule, set, set element or object that the
 * transaction refers to.
 */
4987 static void nf_tables_commit_release(struct nft_trans *trans)
4989 switch (trans->msg_type) {
4990 case NFT_MSG_DELTABLE:
4991 nf_tables_table_destroy(&trans->ctx);
4993 case NFT_MSG_DELCHAIN:
4994 nf_tables_chain_destroy(trans->ctx.chain);
4996 case NFT_MSG_DELRULE:
4997 nf_tables_rule_destroy(&trans->ctx, nft_trans_rule(trans));
4999 case NFT_MSG_DELSET:
5000 nft_set_destroy(nft_trans_set(trans));
5002 case NFT_MSG_DELSETELEM:
5003 nf_tables_set_elem_destroy(nft_trans_elem_set(trans),
5004 nft_trans_elem(trans).priv);
5006 case NFT_MSG_DELOBJ:
5007 nft_obj_destroy(nft_trans_obj(trans));
/*
 * nf_tables_commit - make the pending transaction list take effect
 *
 * Visible steps, in order:
 *  1. Increment net->nft.base_seq, skipping the value 0.
 *  2. Switch net->nft.gencursor to the next generation.
 *  3. Walk net->nft.commit_list. NEW transactions activate their object
 *     (nft_clear() or the set's ->activate hook), send a notification and
 *     are destroyed right away. DEL transactions unlink their object, send
 *     a notification and stay on the list.
 *  4. Walk the list again: every remaining transaction is unlinked and
 *     passed to nf_tables_commit_release().
 *  5. Send the new-generation notification.
 *
 * Installed as the .commit hook of nf_tables_subsys.
 */
5013 static int nf_tables_commit(struct net *net, struct sk_buff *skb)
5015 struct nft_trans *trans, *next;
5016 struct nft_trans_elem *te;
5018 /* Bump generation counter, invalidate any dump in progress */
5019 while (++net->nft.base_seq == 0);
5021 /* A new generation has just started */
5022 net->nft.gencursor = nft_gencursor_next(net);
5024 /* Make sure all packets have left the previous generation before
5025 * purging old rules.
5029 list_for_each_entry_safe(trans, next, &net->nft.commit_list, list) {
5030 switch (trans->msg_type) {
5031 case NFT_MSG_NEWTABLE:
5032 if (nft_trans_table_update(trans)) {
5033 if (!nft_trans_table_enable(trans)) {
5034 nf_tables_table_disable(net,
5037 trans->ctx.table->flags |= NFT_TABLE_F_DORMANT;
5040 nft_clear(net, trans->ctx.table);
5042 nf_tables_table_notify(&trans->ctx, NFT_MSG_NEWTABLE);
5043 nft_trans_destroy(trans);
5045 case NFT_MSG_DELTABLE:
5046 list_del_rcu(&trans->ctx.table->list);
5047 nf_tables_table_notify(&trans->ctx, NFT_MSG_DELTABLE);
5049 case NFT_MSG_NEWCHAIN:
5050 if (nft_trans_chain_update(trans))
5051 nft_chain_commit_update(trans);
5053 nft_clear(net, trans->ctx.chain);
5055 nf_tables_chain_notify(&trans->ctx, NFT_MSG_NEWCHAIN);
5056 nft_trans_destroy(trans);
5058 case NFT_MSG_DELCHAIN:
5059 list_del_rcu(&trans->ctx.chain->list);
5060 nf_tables_chain_notify(&trans->ctx, NFT_MSG_DELCHAIN);
5061 nf_tables_unregister_hooks(trans->ctx.net,
5064 trans->ctx.afi->nops);
5066 case NFT_MSG_NEWRULE:
5067 nft_clear(trans->ctx.net, nft_trans_rule(trans));
5068 nf_tables_rule_notify(&trans->ctx,
5069 nft_trans_rule(trans),
5071 nft_trans_destroy(trans);
5073 case NFT_MSG_DELRULE:
5074 list_del_rcu(&nft_trans_rule(trans)->list);
5075 nf_tables_rule_notify(&trans->ctx,
5076 nft_trans_rule(trans),
5079 case NFT_MSG_NEWSET:
5080 nft_clear(net, nft_trans_set(trans));
5081 /* This avoids hitting -EBUSY when deleting the table
5082 * from the transaction.
5084 if (nft_trans_set(trans)->flags & NFT_SET_ANONYMOUS &&
5085 !list_empty(&nft_trans_set(trans)->bindings))
5086 trans->ctx.table->use--;
5088 nf_tables_set_notify(&trans->ctx, nft_trans_set(trans),
5089 NFT_MSG_NEWSET, GFP_KERNEL);
5090 nft_trans_destroy(trans);
5092 case NFT_MSG_DELSET:
5093 list_del_rcu(&nft_trans_set(trans)->list);
5094 nf_tables_set_notify(&trans->ctx, nft_trans_set(trans),
5095 NFT_MSG_DELSET, GFP_KERNEL);
5097 case NFT_MSG_NEWSETELEM:
5098 te = (struct nft_trans_elem *)trans->data;
5100 te->set->ops->activate(net, te->set, &te->elem);
5101 nf_tables_setelem_notify(&trans->ctx, te->set,
5103 NFT_MSG_NEWSETELEM, 0);
5104 nft_trans_destroy(trans);
5106 case NFT_MSG_DELSETELEM:
5107 te = (struct nft_trans_elem *)trans->data;
5109 nf_tables_setelem_notify(&trans->ctx, te->set,
5111 NFT_MSG_DELSETELEM, 0);
5112 te->set->ops->remove(net, te->set, &te->elem);
5113 atomic_dec(&te->set->nelems);
5116 case NFT_MSG_NEWOBJ:
5117 nft_clear(net, nft_trans_obj(trans));
5118 nf_tables_obj_notify(&trans->ctx, nft_trans_obj(trans),
5120 nft_trans_destroy(trans);
5122 case NFT_MSG_DELOBJ:
5123 list_del_rcu(&nft_trans_obj(trans)->list);
5124 nf_tables_obj_notify(&trans->ctx, nft_trans_obj(trans),
5132 list_for_each_entry_safe(trans, next, &net->nft.commit_list, list) {
5133 list_del(&trans->list);
5134 nf_tables_commit_release(trans);
5137 nf_tables_gen_notify(net, skb, NFT_MSG_NEWGEN);
/*
 * nf_tables_abort_release - destroy what an aborted NEW transaction created
 *
 * Mirror image of nf_tables_commit_release(): dispatches on the message type
 * and destroys the table, chain, rule, set, set element or object that the
 * aborted transaction had added.
 */
5142 static void nf_tables_abort_release(struct nft_trans *trans)
5144 switch (trans->msg_type) {
5145 case NFT_MSG_NEWTABLE:
5146 nf_tables_table_destroy(&trans->ctx);
5148 case NFT_MSG_NEWCHAIN:
5149 nf_tables_chain_destroy(trans->ctx.chain);
5151 case NFT_MSG_NEWRULE:
5152 nf_tables_rule_destroy(&trans->ctx, nft_trans_rule(trans));
5154 case NFT_MSG_NEWSET:
5155 nft_set_destroy(nft_trans_set(trans));
5157 case NFT_MSG_NEWSETELEM:
5158 nft_set_elem_destroy(nft_trans_elem_set(trans),
5159 nft_trans_elem(trans).priv, true);
5161 case NFT_MSG_NEWOBJ:
5162 nft_obj_destroy(nft_trans_obj(trans));
/*
 * nf_tables_abort - roll back the pending transaction list
 *
 * Walks net->nft.commit_list in reverse order, undoing each entry:
 *  - NEW entries unlink what they added (list_del_rcu() or the set's
 *    ->remove hook) and, where one was taken, give back the use count on
 *    the parent table, chain or set.
 *  - DEL entries restore the use count, re-activate the object with
 *    nft_clear() (or the set's ->activate hook) and are destroyed at once.
 *  - Table and chain updates are reverted in place and destroyed at once.
 *
 * A second reverse walk unlinks whatever is still queued and passes it to
 * nf_tables_abort_release().
 *
 * Installed as the .abort hook of nf_tables_subsys.
 */
5168 static int nf_tables_abort(struct net *net, struct sk_buff *skb)
5170 struct nft_trans *trans, *next;
5171 struct nft_trans_elem *te;
5173 list_for_each_entry_safe_reverse(trans, next, &net->nft.commit_list,
5175 switch (trans->msg_type) {
5176 case NFT_MSG_NEWTABLE:
5177 if (nft_trans_table_update(trans)) {
5178 if (nft_trans_table_enable(trans)) {
5179 nf_tables_table_disable(net,
5182 trans->ctx.table->flags |= NFT_TABLE_F_DORMANT;
5184 nft_trans_destroy(trans);
5186 list_del_rcu(&trans->ctx.table->list);
5189 case NFT_MSG_DELTABLE:
5190 nft_clear(trans->ctx.net, trans->ctx.table);
5191 nft_trans_destroy(trans);
5193 case NFT_MSG_NEWCHAIN:
5194 if (nft_trans_chain_update(trans)) {
5195 free_percpu(nft_trans_chain_stats(trans));
5197 nft_trans_destroy(trans);
5199 trans->ctx.table->use--;
5200 list_del_rcu(&trans->ctx.chain->list);
5201 nf_tables_unregister_hooks(trans->ctx.net,
5204 trans->ctx.afi->nops);
5207 case NFT_MSG_DELCHAIN:
5208 trans->ctx.table->use++;
5209 nft_clear(trans->ctx.net, trans->ctx.chain);
5210 nft_trans_destroy(trans);
5212 case NFT_MSG_NEWRULE:
5213 trans->ctx.chain->use--;
5214 list_del_rcu(&nft_trans_rule(trans)->list);
5216 case NFT_MSG_DELRULE:
5217 trans->ctx.chain->use++;
5218 nft_clear(trans->ctx.net, nft_trans_rule(trans));
5219 nft_trans_destroy(trans);
5221 case NFT_MSG_NEWSET:
5222 trans->ctx.table->use--;
5223 list_del_rcu(&nft_trans_set(trans)->list);
5225 case NFT_MSG_DELSET:
5226 trans->ctx.table->use++;
5227 nft_clear(trans->ctx.net, nft_trans_set(trans));
5228 nft_trans_destroy(trans);
5230 case NFT_MSG_NEWSETELEM:
5231 te = (struct nft_trans_elem *)trans->data;
5233 te->set->ops->remove(net, te->set, &te->elem);
5234 atomic_dec(&te->set->nelems);
5236 case NFT_MSG_DELSETELEM:
5237 te = (struct nft_trans_elem *)trans->data;
5239 nft_set_elem_activate(net, te->set, &te->elem);
5240 te->set->ops->activate(net, te->set, &te->elem);
5243 nft_trans_destroy(trans);
5245 case NFT_MSG_NEWOBJ:
5246 trans->ctx.table->use--;
5247 list_del_rcu(&nft_trans_obj(trans)->list);
5249 case NFT_MSG_DELOBJ:
5250 trans->ctx.table->use++;
5251 nft_clear(trans->ctx.net, nft_trans_obj(trans));
5252 nft_trans_destroy(trans);
5259 list_for_each_entry_safe_reverse(trans, next,
5260 &net->nft.commit_list, list) {
5261 list_del(&trans->list);
5262 nf_tables_abort_release(trans);
/*
 * Returns true when @genid equals the namespace's current generation
 * sequence (net->nft.base_seq).
 */
5268 static bool nf_tables_valid_genid(struct net *net, u32 genid)
5270 return net->nft.base_seq == genid;
/*
 * nfnetlink subsystem descriptor for nf_tables: names the subsystem, sizes
 * the callback table and wires up the commit, abort and generation-id
 * validation hooks defined in this file.
 */
5273 static const struct nfnetlink_subsystem nf_tables_subsys = {
5274 .name = "nf_tables",
5275 .subsys_id = NFNL_SUBSYS_NFTABLES,
5276 .cb_count = NFT_MSG_MAX,
5278 .commit = nf_tables_commit,
5279 .abort = nf_tables_abort,
5280 .valid_genid = nf_tables_valid_genid,
/*
 * nft_chain_validate_dependency - check a chain against a required type
 *
 * Only base chains are inspected: the base chain's type is compared with
 * @type. The return statements are not visible here; presumably a mismatch
 * yields a negative errno and everything else 0 — confirm.
 */
5283 int nft_chain_validate_dependency(const struct nft_chain *chain,
5284 enum nft_chain_type type)
5286 const struct nft_base_chain *basechain;
5288 if (nft_is_base_chain(chain)) {
5289 basechain = nft_base_chain(chain);
5290 if (basechain->type->type != type)
5295 EXPORT_SYMBOL_GPL(nft_chain_validate_dependency);
/*
 * nft_chain_validate_hooks - check a base chain's hook against a bitmask
 *
 * @hook_flags is a bitmask indexed by hook number. For base chains the bit
 * of the chain's first hook (ops[0].hooknum) is tested against it. The
 * return statements are not visible here.
 */
5297 int nft_chain_validate_hooks(const struct nft_chain *chain,
5298 unsigned int hook_flags)
5300 struct nft_base_chain *basechain;
5302 if (nft_is_base_chain(chain)) {
5303 basechain = nft_base_chain(chain);
5305 if ((1 << basechain->ops[0].hooknum) & hook_flags)
5313 EXPORT_SYMBOL_GPL(nft_chain_validate_hooks);
5316 * Loop detection - walk through the ruleset beginning at the destination chain
5317 * of a new jump until either the source chain is reached (loop) or all
5318 * reachable chains have been traversed.
5320 * The loop check is performed whenever a new jump verdict is added to an
5321 * expression or verdict map or a verdict map is bound to a new chain.
/* Forward declaration: the set-element callback below recurses into it. */
5324 static int nf_tables_check_loops(const struct nft_ctx *ctx,
5325 const struct nft_chain *chain);
/*
 * Set-walk callback used by the loop check: inspects one element of a
 * verdict map. Elements flagged NFT_SET_ELEM_INTERVAL_END are tested first
 * (the action taken for them is not visible here). For the verdict codes
 * selected by the switch, the check recurses into the verdict's target chain.
 */
5327 static int nf_tables_loop_check_setelem(const struct nft_ctx *ctx,
5328 struct nft_set *set,
5329 const struct nft_set_iter *iter,
5330 struct nft_set_elem *elem)
5332 const struct nft_set_ext *ext = nft_set_elem_ext(set, elem->priv);
5333 const struct nft_data *data;
5335 if (nft_set_ext_exists(ext, NFT_SET_EXT_FLAGS) &&
5336 *nft_set_ext_flags(ext) & NFT_SET_ELEM_INTERVAL_END)
5339 data = nft_set_ext_data(ext);
5340 switch (data->verdict.code) {
5343 return nf_tables_check_loops(ctx, data->verdict.chain);
/*
 * nf_tables_check_loops - recursive loop detection starting at @chain
 *
 * First compares @chain with the chain of @ctx (the origin of the new jump).
 * Then:
 *  - every expression of every rule in @chain that has a ->validate hook is
 *    validated; when it yields verdict data with one of the codes selected
 *    by the switch, the check recurses into that verdict's chain;
 *  - every set of the table that is active in the next generation, is a map
 *    and has verdict data is examined: for each binding to @chain the set is
 *    walked with nf_tables_loop_check_setelem() as callback.
 */
5349 static int nf_tables_check_loops(const struct nft_ctx *ctx,
5350 const struct nft_chain *chain)
5352 const struct nft_rule *rule;
5353 const struct nft_expr *expr, *last;
5354 struct nft_set *set;
5355 struct nft_set_binding *binding;
5356 struct nft_set_iter iter;
5358 if (ctx->chain == chain)
5361 list_for_each_entry(rule, &chain->rules, list) {
5362 nft_rule_for_each_expr(expr, last, rule) {
5363 const struct nft_data *data = NULL;
5366 if (!expr->ops->validate)
5369 err = expr->ops->validate(ctx, expr, &data);
5376 switch (data->verdict.code) {
5379 err = nf_tables_check_loops(ctx,
5380 data->verdict.chain);
5389 list_for_each_entry(set, &ctx->table->sets, list) {
5390 if (!nft_is_active_next(ctx->net, set))
5392 if (!(set->flags & NFT_SET_MAP) ||
5393 set->dtype != NFT_DATA_VERDICT)
5396 list_for_each_entry(binding, &set->bindings, list) {
5397 if (!(binding->flags & NFT_SET_MAP) ||
5398 binding->chain != chain)
5401 iter.genmask = nft_genmask_next(ctx->net);
5405 iter.fn = nf_tables_loop_check_setelem;
5407 set->ops->walk(ctx, set, &iter);
5417 * nft_parse_u32_check - fetch u32 attribute and check for maximum value
5419 * @attr: netlink attribute to fetch value from
5420 * @max: maximum value to be stored in dest
5421 * @dest: pointer to the variable
5423 * Parse, check and store a given u32 netlink attribute into variable.
5424 * This function returns -ERANGE if the value goes over maximum value.
5425 * Otherwise a 0 is returned and the attribute value is stored in the
5426 * destination variable.
5428 int nft_parse_u32_check(const struct nlattr *attr, int max, u32 *dest)
/* The attribute is big-endian on the wire; convert to host order first. */
5432 val = ntohl(nla_get_be32(attr));
5439 EXPORT_SYMBOL_GPL(nft_parse_u32_check);
5442 * nft_parse_register - parse a register value from a netlink attribute
5444 * @attr: netlink attribute
5446 * Parse and translate a register value from a netlink attribute.
5447 * Registers used to be 128 bit wide, these register numbers will be
5448 * mapped to the corresponding 32 bit register numbers.
5450 unsigned int nft_parse_register(const struct nlattr *attr)
5454 reg = ntohl(nla_get_be32(attr));
/*
 * Numbers in the NFT_REG_VERDICT..NFT_REG_4 range are scaled by
 * NFT_REG_SIZE / NFT_REG32_SIZE; the other visible return rebases the
 * number from NFT_REG32_00 so that it starts right after that range.
 */
5456 case NFT_REG_VERDICT...NFT_REG_4:
5457 return reg * NFT_REG_SIZE / NFT_REG32_SIZE;
5459 return reg + NFT_REG_SIZE / NFT_REG32_SIZE - NFT_REG32_00;
5462 EXPORT_SYMBOL_GPL(nft_parse_register);
5465 * nft_dump_register - dump a register value to a netlink attribute
5467 * @skb: socket buffer
5468 * @attr: attribute number
5469 * @reg: register number
5471 * Construct a netlink attribute containing the register number. For
5472 * compatibility reasons, register numbers being a multiple of 4 are
5473 * translated to the corresponding 128 bit register numbers.
5475 int nft_dump_register(struct sk_buff *skb, unsigned int attr, unsigned int reg)
/*
 * Inverse of the two mappings in nft_parse_register(): register numbers
 * divisible by NFT_REG_SIZE / NFT_REG32_SIZE are scaled back down, the rest
 * are rebased onto NFT_REG32_00.
 */
5477 if (reg % (NFT_REG_SIZE / NFT_REG32_SIZE) == 0)
5478 reg = reg / (NFT_REG_SIZE / NFT_REG32_SIZE);
5480 reg = reg - NFT_REG_SIZE / NFT_REG32_SIZE + NFT_REG32_00;
5482 return nla_put_be32(skb, attr, htonl(reg));
5484 EXPORT_SYMBOL_GPL(nft_dump_register);
5487 * nft_validate_register_load - validate a load from a register
5489 * @reg: the register number
5490 * @len: the length of the data
5492 * Validate that the input register is one of the general purpose
5493 * registers and that the length of the load is within the bounds.
5495 int nft_validate_register_load(enum nft_registers reg, unsigned int len)
/* Register numbers below the first general purpose register are tested first. */
5497 if (reg < NFT_REG_1 * NFT_REG_SIZE / NFT_REG32_SIZE)
/* The load must end inside the data area of struct nft_regs. */
5501 if (reg * NFT_REG32_SIZE + len > FIELD_SIZEOF(struct nft_regs, data))
5506 EXPORT_SYMBOL_GPL(nft_validate_register_load);
5509 * nft_validate_register_store - validate an expression's register store
5511 * @ctx: context of the expression performing the store
5512 * @reg: the destination register number
5513 * @data: the data to load
5514 * @type: the data type
5515 * @len: the length of the data
5517 * Validate that a data load uses the appropriate data type for
5518 * the destination register and the length is within the bounds.
5519 * A value of NULL for the data means that it is runtime gathered
5522 int nft_validate_register_store(const struct nft_ctx *ctx,
5523 enum nft_registers reg,
5524 const struct nft_data *data,
5525 enum nft_data_types type, unsigned int len)
/* Stores to the verdict register are only checked against NFT_DATA_VERDICT. */
5530 case NFT_REG_VERDICT:
5531 if (type != NFT_DATA_VERDICT)
/* Jump and goto verdicts get a loop check on their target chain. */
5535 (data->verdict.code == NFT_GOTO ||
5536 data->verdict.code == NFT_JUMP)) {
5537 err = nf_tables_check_loops(ctx, data->verdict.chain);
/*
 * Propagate the nesting depth: the target chain ends up at least one level
 * below the current chain, with NFT_JUMP_STACK_SIZE as the limit tested.
 */
5541 if (ctx->chain->level + 1 >
5542 data->verdict.chain->level) {
5543 if (ctx->chain->level + 1 == NFT_JUMP_STACK_SIZE)
5545 data->verdict.chain->level = ctx->chain->level + 1;
/* All other registers: same range and bounds tests as for register loads. */
5551 if (reg < NFT_REG_1 * NFT_REG_SIZE / NFT_REG32_SIZE)
5555 if (reg * NFT_REG32_SIZE + len >
5556 FIELD_SIZEOF(struct nft_regs, data))
5559 if (data != NULL && type != NFT_DATA_VALUE)
5564 EXPORT_SYMBOL_GPL(nft_validate_register_store);
/*
 * Netlink attribute policy for nested verdict attributes: the verdict code
 * is a u32, the chain name a string of at most NFT_CHAIN_MAXNAMELEN - 1
 * bytes.
 */
5566 static const struct nla_policy nft_verdict_policy[NFTA_VERDICT_MAX + 1] = {
5567 [NFTA_VERDICT_CODE] = { .type = NLA_U32 },
5568 [NFTA_VERDICT_CHAIN] = { .type = NLA_STRING,
5569 .len = NFT_CHAIN_MAXNAMELEN - 1 },
/*
 * nft_verdict_init - parse a nested verdict attribute into @data
 *
 * Parses @nla against nft_verdict_policy; NFTA_VERDICT_CODE is mandatory.
 * For the verdict codes that name a chain, NFTA_VERDICT_CHAIN is required as
 * well: the chain is looked up in the context's table using the
 * next-generation mask, tested for being a base chain, and stored in the
 * verdict. On success @desc describes the result as NFT_DATA_VERDICT with
 * length sizeof(data->verdict).
 */
5572 static int nft_verdict_init(const struct nft_ctx *ctx, struct nft_data *data,
5573 struct nft_data_desc *desc, const struct nlattr *nla)
5575 u8 genmask = nft_genmask_next(ctx->net);
5576 struct nlattr *tb[NFTA_VERDICT_MAX + 1];
5577 struct nft_chain *chain;
5580 err = nla_parse_nested(tb, NFTA_VERDICT_MAX, nla, nft_verdict_policy,
5585 if (!tb[NFTA_VERDICT_CODE])
5587 data->verdict.code = ntohl(nla_get_be32(tb[NFTA_VERDICT_CODE]));
5589 switch (data->verdict.code) {
5591 switch (data->verdict.code & NF_VERDICT_MASK) {
5606 if (!tb[NFTA_VERDICT_CHAIN])
5608 chain = nf_tables_chain_lookup(ctx->table,
5609 tb[NFTA_VERDICT_CHAIN], genmask);
5611 return PTR_ERR(chain);
5612 if (nft_is_base_chain(chain))
5616 data->verdict.chain = chain;
5620 desc->len = sizeof(data->verdict);
5621 desc->type = NFT_DATA_VERDICT;
/*
 * nft_verdict_uninit - release a verdict
 *
 * For the verdict codes selected by the switch, drops one use count on the
 * chain the verdict points to.
 */
5625 static void nft_verdict_uninit(const struct nft_data *data)
5627 switch (data->verdict.code) {
5630 data->verdict.chain->use--;
/*
 * nft_verdict_dump - serialise a verdict as a nested attribute of @type
 *
 * Opens a nest, writes the verdict code and, in the branch that handles
 * chain verdicts, the chain name, then closes the nest. Every failed put
 * jumps to nla_put_failure.
 */
5635 int nft_verdict_dump(struct sk_buff *skb, int type, const struct nft_verdict *v)
5637 struct nlattr *nest;
5639 nest = nla_nest_start(skb, type);
5641 goto nla_put_failure;
5643 if (nla_put_be32(skb, NFTA_VERDICT_CODE, htonl(v->code)))
5644 goto nla_put_failure;
5649 if (nla_put_string(skb, NFTA_VERDICT_CHAIN,
5651 goto nla_put_failure;
5653 nla_nest_end(skb, nest);
/*
 * nft_value_init - copy a raw value attribute into @data
 *
 * Copies the attribute payload into data->data with nla_memcpy() and marks
 * the result as NFT_DATA_VALUE in @desc. The length checks against @size are
 * not visible here.
 */
5660 static int nft_value_init(const struct nft_ctx *ctx,
5661 struct nft_data *data, unsigned int size,
5662 struct nft_data_desc *desc, const struct nlattr *nla)
5672 nla_memcpy(data->data, nla, len);
5673 desc->type = NFT_DATA_VALUE;
/* Emit the raw bytes of @data as an NFTA_DATA_VALUE attribute. */
5678 static int nft_value_dump(struct sk_buff *skb, const struct nft_data *data,
5681 return nla_put(skb, NFTA_DATA_VALUE, len, data->data);
/*
 * Netlink attribute policy for data attributes: a binary value or a nested
 * verdict.
 */
5684 static const struct nla_policy nft_data_policy[NFTA_DATA_MAX + 1] = {
5685 [NFTA_DATA_VALUE] = { .type = NLA_BINARY },
5686 [NFTA_DATA_VERDICT] = { .type = NLA_NESTED },
5690 * nft_data_init - parse nf_tables data netlink attributes
5692 * @ctx: context of the expression using the data
5693 * @data: destination struct nft_data
5694 * @size: maximum data length
5695 * @desc: data description
5696 * @nla: netlink attribute containing data
5698 * Parse the netlink data attributes and initialize a struct nft_data.
5699 * The type and length of data are returned in the data description.
5701 * The caller can indicate that it only wants to accept data of type
5702 * NFT_DATA_VALUE by passing NULL for the ctx argument.
5704 int nft_data_init(const struct nft_ctx *ctx,
5705 struct nft_data *data, unsigned int size,
5706 struct nft_data_desc *desc, const struct nlattr *nla)
5708 struct nlattr *tb[NFTA_DATA_MAX + 1];
5711 err = nla_parse_nested(tb, NFTA_DATA_MAX, nla, nft_data_policy, NULL);
/* A value attribute takes precedence over a verdict attribute. */
5715 if (tb[NFTA_DATA_VALUE])
5716 return nft_value_init(ctx, data, size, desc,
5717 tb[NFTA_DATA_VALUE]);
/* Verdicts are only parsed when the caller supplied a context. */
5718 if (tb[NFTA_DATA_VERDICT] && ctx != NULL)
5719 return nft_verdict_init(ctx, data, desc, tb[NFTA_DATA_VERDICT]);
5722 EXPORT_SYMBOL_GPL(nft_data_init);
5725 * nft_data_release - release a nft_data item
5727 * @data: struct nft_data to release
5728 * @type: type of data
5730 * Release a nft_data item. NFT_DATA_VALUE types can be silently discarded,
5731 * all others need to be released by calling this function.
5733 void nft_data_release(const struct nft_data *data, enum nft_data_types type)
/* Types ordered before NFT_DATA_VERDICT are tested first, ahead of the switch. */
5735 if (type < NFT_DATA_VERDICT)
5738 case NFT_DATA_VERDICT:
5739 return nft_verdict_uninit(data);
5744 EXPORT_SYMBOL_GPL(nft_data_release);
/*
 * nft_data_dump - serialise @data as a nested attribute @attr
 *
 * Opens a nest and, depending on @type, emits either the raw value (@len
 * bytes) or the verdict, then closes the nest.
 *
 * Exported for use by other modules.
 */
5746 int nft_data_dump(struct sk_buff *skb, int attr, const struct nft_data *data,
5747 enum nft_data_types type, unsigned int len)
5749 struct nlattr *nest;
5752 nest = nla_nest_start(skb, attr);
5757 case NFT_DATA_VALUE:
5758 err = nft_value_dump(skb, data, len);
5760 case NFT_DATA_VERDICT:
5761 err = nft_verdict_dump(skb, NFTA_DATA_VERDICT, &data->verdict);
5768 nla_nest_end(skb, nest);
5771 EXPORT_SYMBOL_GPL(nft_data_dump);
/*
 * Per-network-namespace initialisation: start with empty address family and
 * commit lists and a generation sequence of 1.
 */
5773 static int __net_init nf_tables_init_net(struct net *net)
5775 INIT_LIST_HEAD(&net->nft.af_info);
5776 INIT_LIST_HEAD(&net->nft.commit_list);
5777 net->nft.base_seq = 1;
/*
 * __nft_release_basechain - tear down the base chain in @ctx
 *
 * BUGs if ctx->chain is not a base chain. Unregisters the chain's hooks,
 * unlinks and destroys every rule, then unlinks and destroys the chain
 * itself.
 *
 * Exported for use by other modules.
 */
5781 int __nft_release_basechain(struct nft_ctx *ctx)
5783 struct nft_rule *rule, *nr;
5785 BUG_ON(!nft_is_base_chain(ctx->chain));
5787 nf_tables_unregister_hooks(ctx->net, ctx->chain->table, ctx->chain,
5789 list_for_each_entry_safe(rule, nr, &ctx->chain->rules, list) {
5790 list_del(&rule->list);
5792 nf_tables_rule_destroy(ctx, rule);
5794 list_del(&ctx->chain->list);
5796 nf_tables_chain_destroy(ctx->chain);
5800 EXPORT_SYMBOL_GPL(__nft_release_basechain);
5802 /* Called by nft_unregister_afinfo() from __net_exit path, nfnl_lock is held. */
/*
 * Destroy every table registered for @afi, in this order per table:
 * unregister the hooks of all chains, destroy all rules, all sets, all
 * stateful objects, then the chains themselves and finally the table.
 */
5803 static void __nft_release_afinfo(struct net *net, struct nft_af_info *afi)
5805 struct nft_table *table, *nt;
5806 struct nft_chain *chain, *nc;
5807 struct nft_object *obj, *ne;
5808 struct nft_rule *rule, *nr;
5809 struct nft_set *set, *ns;
5810 struct nft_ctx ctx = {
5815 list_for_each_entry_safe(table, nt, &afi->tables, list) {
5816 list_for_each_entry(chain, &table->chains, list)
5817 nf_tables_unregister_hooks(net, table, chain,
5819 /* No packets are walking on these chains anymore. */
5821 list_for_each_entry(chain, &table->chains, list) {
5823 list_for_each_entry_safe(rule, nr, &chain->rules, list) {
5824 list_del(&rule->list);
5826 nf_tables_rule_destroy(&ctx, rule);
5829 list_for_each_entry_safe(set, ns, &table->sets, list) {
5830 list_del(&set->list);
5832 nft_set_destroy(set);
5834 list_for_each_entry_safe(obj, ne, &table->objects, list) {
5835 list_del(&obj->list);
5837 nft_obj_destroy(obj);
5839 list_for_each_entry_safe(chain, nc, &table->chains, list) {
5840 list_del(&chain->list);
5842 nf_tables_chain_destroy(chain);
5844 list_del(&table->list);
5845 nf_tables_table_destroy(&ctx);
/* Per-network-namespace operations; only an init hook is visible here. */
5849 static struct pernet_operations nf_tables_net_ops = {
5850 .init = nf_tables_init_net,
5853 static int __init nf_tables_module_init(void)
5857 info = kmalloc(sizeof(struct nft_expr_info) * NFT_RULE_MAXEXPRS,
5864 err = nf_tables_core_module_init();
5868 err = nfnetlink_subsys_register(&nf_tables_subsys);
5872 pr_info("nf_tables: (c) 2007-2009 Patrick McHardy <kaber@trash.net>\n");
5873 return register_pernet_subsys(&nf_tables_net_ops);
5875 nf_tables_core_module_exit();
/*
 * Module exit: undo registration in reverse order of nf_tables_module_init()
 * — per-netns operations first, then the nfnetlink subsystem, then the
 * nf_tables core.
 */
5882 static void __exit nf_tables_module_exit(void)
5884 unregister_pernet_subsys(&nf_tables_net_ops);
5885 nfnetlink_subsys_unregister(&nf_tables_subsys);
5887 nf_tables_core_module_exit();
5891 module_init(nf_tables_module_init);
5892 module_exit(nf_tables_module_exit);
5894 MODULE_LICENSE("GPL");
5895 MODULE_AUTHOR("Patrick McHardy <kaber@trash.net>");
5896 MODULE_ALIAS_NFNL_SUBSYS(NFNL_SUBSYS_NFTABLES);