2 * Copyright (c) 2007-2009 Patrick McHardy <kaber@trash.net>
4 * This program is free software; you can redistribute it and/or modify
5 * it under the terms of the GNU General Public License version 2 as
6 * published by the Free Software Foundation.
8 * Development of this code funded by Astaro AG (http://www.astaro.com/)
11 #include <linux/module.h>
12 #include <linux/init.h>
13 #include <linux/list.h>
14 #include <linux/skbuff.h>
15 #include <linux/netlink.h>
16 #include <linux/netfilter.h>
17 #include <linux/netfilter/nfnetlink.h>
18 #include <linux/netfilter/nf_tables.h>
19 #include <net/netfilter/nf_tables_core.h>
20 #include <net/netfilter/nf_tables.h>
21 #include <net/net_namespace.h>
24 static LIST_HEAD(nf_tables_expressions
);
27 * nft_register_afinfo - register nf_tables address family info
29 * @afi: address family info to register
31 * Register the address family for use with nf_tables. Returns zero on
32 * success or a negative errno code otherwise.
34 int nft_register_afinfo(struct net
*net
, struct nft_af_info
*afi
)
36 INIT_LIST_HEAD(&afi
->tables
);
37 nfnl_lock(NFNL_SUBSYS_NFTABLES
);
38 list_add_tail_rcu(&afi
->list
, &net
->nft
.af_info
);
39 nfnl_unlock(NFNL_SUBSYS_NFTABLES
);
42 EXPORT_SYMBOL_GPL(nft_register_afinfo
);
45 * nft_unregister_afinfo - unregister nf_tables address family info
47 * @afi: address family info to unregister
49 * Unregister the address family for use with nf_tables.
51 void nft_unregister_afinfo(struct nft_af_info
*afi
)
53 nfnl_lock(NFNL_SUBSYS_NFTABLES
);
54 list_del_rcu(&afi
->list
);
55 nfnl_unlock(NFNL_SUBSYS_NFTABLES
);
57 EXPORT_SYMBOL_GPL(nft_unregister_afinfo
);
59 static struct nft_af_info
*nft_afinfo_lookup(struct net
*net
, int family
)
61 struct nft_af_info
*afi
;
63 list_for_each_entry(afi
, &net
->nft
.af_info
, list
) {
64 if (afi
->family
== family
)
70 static struct nft_af_info
*
71 nf_tables_afinfo_lookup(struct net
*net
, int family
, bool autoload
)
73 struct nft_af_info
*afi
;
75 afi
= nft_afinfo_lookup(net
, family
);
80 nfnl_unlock(NFNL_SUBSYS_NFTABLES
);
81 request_module("nft-afinfo-%u", family
);
82 nfnl_lock(NFNL_SUBSYS_NFTABLES
);
83 afi
= nft_afinfo_lookup(net
, family
);
85 return ERR_PTR(-EAGAIN
);
88 return ERR_PTR(-EAFNOSUPPORT
);
91 static void nft_ctx_init(struct nft_ctx
*ctx
,
92 const struct sk_buff
*skb
,
93 const struct nlmsghdr
*nlh
,
94 struct nft_af_info
*afi
,
95 struct nft_table
*table
,
96 struct nft_chain
*chain
,
97 const struct nlattr
* const *nla
)
99 ctx
->net
= sock_net(skb
->sk
);
104 ctx
->portid
= NETLINK_CB(skb
).portid
;
105 ctx
->report
= nlmsg_report(nlh
);
106 ctx
->seq
= nlh
->nlmsg_seq
;
109 static struct nft_trans
*nft_trans_alloc(struct nft_ctx
*ctx
, int msg_type
,
112 struct nft_trans
*trans
;
114 trans
= kzalloc(sizeof(struct nft_trans
) + size
, GFP_KERNEL
);
118 trans
->msg_type
= msg_type
;
124 static void nft_trans_destroy(struct nft_trans
*trans
)
126 list_del(&trans
->list
);
130 static void nf_tables_unregister_hooks(const struct nft_table
*table
,
131 const struct nft_chain
*chain
,
132 unsigned int hook_nops
)
134 if (!(table
->flags
& NFT_TABLE_F_DORMANT
) &&
135 chain
->flags
& NFT_BASE_CHAIN
)
136 nf_unregister_hooks(nft_base_chain(chain
)->ops
, hook_nops
);
139 /* Internal table flags */
140 #define NFT_TABLE_INACTIVE (1 << 15)
142 static int nft_trans_table_add(struct nft_ctx
*ctx
, int msg_type
)
144 struct nft_trans
*trans
;
146 trans
= nft_trans_alloc(ctx
, msg_type
, sizeof(struct nft_trans_table
));
150 if (msg_type
== NFT_MSG_NEWTABLE
)
151 ctx
->table
->flags
|= NFT_TABLE_INACTIVE
;
153 list_add_tail(&trans
->list
, &ctx
->net
->nft
.commit_list
);
157 static int nft_deltable(struct nft_ctx
*ctx
)
161 err
= nft_trans_table_add(ctx
, NFT_MSG_DELTABLE
);
165 list_del_rcu(&ctx
->table
->list
);
169 static int nft_trans_chain_add(struct nft_ctx
*ctx
, int msg_type
)
171 struct nft_trans
*trans
;
173 trans
= nft_trans_alloc(ctx
, msg_type
, sizeof(struct nft_trans_chain
));
177 if (msg_type
== NFT_MSG_NEWCHAIN
)
178 ctx
->chain
->flags
|= NFT_CHAIN_INACTIVE
;
180 list_add_tail(&trans
->list
, &ctx
->net
->nft
.commit_list
);
184 static int nft_delchain(struct nft_ctx
*ctx
)
188 err
= nft_trans_chain_add(ctx
, NFT_MSG_DELCHAIN
);
193 list_del_rcu(&ctx
->chain
->list
);
199 nft_rule_is_active(struct net
*net
, const struct nft_rule
*rule
)
201 return (rule
->genmask
& nft_genmask_cur(net
)) == 0;
205 nft_rule_is_active_next(struct net
*net
, const struct nft_rule
*rule
)
207 return (rule
->genmask
& nft_genmask_next(net
)) == 0;
211 nft_rule_activate_next(struct net
*net
, struct nft_rule
*rule
)
213 /* Now inactive, will be active in the future */
214 rule
->genmask
= nft_genmask_cur(net
);
218 nft_rule_deactivate_next(struct net
*net
, struct nft_rule
*rule
)
220 rule
->genmask
= nft_genmask_next(net
);
223 static inline void nft_rule_clear(struct net
*net
, struct nft_rule
*rule
)
225 rule
->genmask
&= ~nft_genmask_next(net
);
229 nf_tables_delrule_deactivate(struct nft_ctx
*ctx
, struct nft_rule
*rule
)
231 /* You cannot delete the same rule twice */
232 if (nft_rule_is_active_next(ctx
->net
, rule
)) {
233 nft_rule_deactivate_next(ctx
->net
, rule
);
240 static struct nft_trans
*nft_trans_rule_add(struct nft_ctx
*ctx
, int msg_type
,
241 struct nft_rule
*rule
)
243 struct nft_trans
*trans
;
245 trans
= nft_trans_alloc(ctx
, msg_type
, sizeof(struct nft_trans_rule
));
249 nft_trans_rule(trans
) = rule
;
250 list_add_tail(&trans
->list
, &ctx
->net
->nft
.commit_list
);
255 static int nft_delrule(struct nft_ctx
*ctx
, struct nft_rule
*rule
)
257 struct nft_trans
*trans
;
260 trans
= nft_trans_rule_add(ctx
, NFT_MSG_DELRULE
, rule
);
264 err
= nf_tables_delrule_deactivate(ctx
, rule
);
266 nft_trans_destroy(trans
);
273 static int nft_delrule_by_chain(struct nft_ctx
*ctx
)
275 struct nft_rule
*rule
;
278 list_for_each_entry(rule
, &ctx
->chain
->rules
, list
) {
279 err
= nft_delrule(ctx
, rule
);
286 /* Internal set flag */
287 #define NFT_SET_INACTIVE (1 << 15)
289 static int nft_trans_set_add(struct nft_ctx
*ctx
, int msg_type
,
292 struct nft_trans
*trans
;
294 trans
= nft_trans_alloc(ctx
, msg_type
, sizeof(struct nft_trans_set
));
298 if (msg_type
== NFT_MSG_NEWSET
&& ctx
->nla
[NFTA_SET_ID
] != NULL
) {
299 nft_trans_set_id(trans
) =
300 ntohl(nla_get_be32(ctx
->nla
[NFTA_SET_ID
]));
301 set
->flags
|= NFT_SET_INACTIVE
;
303 nft_trans_set(trans
) = set
;
304 list_add_tail(&trans
->list
, &ctx
->net
->nft
.commit_list
);
309 static int nft_delset(struct nft_ctx
*ctx
, struct nft_set
*set
)
313 err
= nft_trans_set_add(ctx
, NFT_MSG_DELSET
, set
);
317 list_del_rcu(&set
->list
);
327 static struct nft_table
*nft_table_lookup(const struct nft_af_info
*afi
,
328 const struct nlattr
*nla
)
330 struct nft_table
*table
;
332 list_for_each_entry(table
, &afi
->tables
, list
) {
333 if (!nla_strcmp(nla
, table
->name
))
339 static struct nft_table
*nf_tables_table_lookup(const struct nft_af_info
*afi
,
340 const struct nlattr
*nla
)
342 struct nft_table
*table
;
345 return ERR_PTR(-EINVAL
);
347 table
= nft_table_lookup(afi
, nla
);
351 return ERR_PTR(-ENOENT
);
354 static inline u64
nf_tables_alloc_handle(struct nft_table
*table
)
356 return ++table
->hgenerator
;
359 static const struct nf_chain_type
*chain_type
[AF_MAX
][NFT_CHAIN_T_MAX
];
361 static const struct nf_chain_type
*
362 __nf_tables_chain_type_lookup(int family
, const struct nlattr
*nla
)
366 for (i
= 0; i
< NFT_CHAIN_T_MAX
; i
++) {
367 if (chain_type
[family
][i
] != NULL
&&
368 !nla_strcmp(nla
, chain_type
[family
][i
]->name
))
369 return chain_type
[family
][i
];
374 static const struct nf_chain_type
*
375 nf_tables_chain_type_lookup(const struct nft_af_info
*afi
,
376 const struct nlattr
*nla
,
379 const struct nf_chain_type
*type
;
381 type
= __nf_tables_chain_type_lookup(afi
->family
, nla
);
384 #ifdef CONFIG_MODULES
386 nfnl_unlock(NFNL_SUBSYS_NFTABLES
);
387 request_module("nft-chain-%u-%.*s", afi
->family
,
388 nla_len(nla
), (const char *)nla_data(nla
));
389 nfnl_lock(NFNL_SUBSYS_NFTABLES
);
390 type
= __nf_tables_chain_type_lookup(afi
->family
, nla
);
392 return ERR_PTR(-EAGAIN
);
395 return ERR_PTR(-ENOENT
);
398 static const struct nla_policy nft_table_policy
[NFTA_TABLE_MAX
+ 1] = {
399 [NFTA_TABLE_NAME
] = { .type
= NLA_STRING
,
400 .len
= NFT_TABLE_MAXNAMELEN
- 1 },
401 [NFTA_TABLE_FLAGS
] = { .type
= NLA_U32
},
404 static int nf_tables_fill_table_info(struct sk_buff
*skb
, struct net
*net
,
405 u32 portid
, u32 seq
, int event
, u32 flags
,
406 int family
, const struct nft_table
*table
)
408 struct nlmsghdr
*nlh
;
409 struct nfgenmsg
*nfmsg
;
411 event
|= NFNL_SUBSYS_NFTABLES
<< 8;
412 nlh
= nlmsg_put(skb
, portid
, seq
, event
, sizeof(struct nfgenmsg
), flags
);
414 goto nla_put_failure
;
416 nfmsg
= nlmsg_data(nlh
);
417 nfmsg
->nfgen_family
= family
;
418 nfmsg
->version
= NFNETLINK_V0
;
419 nfmsg
->res_id
= htons(net
->nft
.base_seq
& 0xffff);
421 if (nla_put_string(skb
, NFTA_TABLE_NAME
, table
->name
) ||
422 nla_put_be32(skb
, NFTA_TABLE_FLAGS
, htonl(table
->flags
)) ||
423 nla_put_be32(skb
, NFTA_TABLE_USE
, htonl(table
->use
)))
424 goto nla_put_failure
;
430 nlmsg_trim(skb
, nlh
);
434 static int nf_tables_table_notify(const struct nft_ctx
*ctx
, int event
)
440 !nfnetlink_has_listeners(ctx
->net
, NFNLGRP_NFTABLES
))
444 skb
= nlmsg_new(NLMSG_GOODSIZE
, GFP_KERNEL
);
448 err
= nf_tables_fill_table_info(skb
, ctx
->net
, ctx
->portid
, ctx
->seq
,
449 event
, 0, ctx
->afi
->family
, ctx
->table
);
455 err
= nfnetlink_send(skb
, ctx
->net
, ctx
->portid
, NFNLGRP_NFTABLES
,
456 ctx
->report
, GFP_KERNEL
);
459 nfnetlink_set_err(ctx
->net
, ctx
->portid
, NFNLGRP_NFTABLES
,
465 static int nf_tables_dump_tables(struct sk_buff
*skb
,
466 struct netlink_callback
*cb
)
468 const struct nfgenmsg
*nfmsg
= nlmsg_data(cb
->nlh
);
469 const struct nft_af_info
*afi
;
470 const struct nft_table
*table
;
471 unsigned int idx
= 0, s_idx
= cb
->args
[0];
472 struct net
*net
= sock_net(skb
->sk
);
473 int family
= nfmsg
->nfgen_family
;
476 cb
->seq
= net
->nft
.base_seq
;
478 list_for_each_entry_rcu(afi
, &net
->nft
.af_info
, list
) {
479 if (family
!= NFPROTO_UNSPEC
&& family
!= afi
->family
)
482 list_for_each_entry_rcu(table
, &afi
->tables
, list
) {
486 memset(&cb
->args
[1], 0,
487 sizeof(cb
->args
) - sizeof(cb
->args
[0]));
488 if (nf_tables_fill_table_info(skb
, net
,
489 NETLINK_CB(cb
->skb
).portid
,
493 afi
->family
, table
) < 0)
496 nl_dump_check_consistent(cb
, nlmsg_hdr(skb
));
507 static int nf_tables_gettable(struct sock
*nlsk
, struct sk_buff
*skb
,
508 const struct nlmsghdr
*nlh
,
509 const struct nlattr
* const nla
[])
511 const struct nfgenmsg
*nfmsg
= nlmsg_data(nlh
);
512 const struct nft_af_info
*afi
;
513 const struct nft_table
*table
;
514 struct sk_buff
*skb2
;
515 struct net
*net
= sock_net(skb
->sk
);
516 int family
= nfmsg
->nfgen_family
;
519 if (nlh
->nlmsg_flags
& NLM_F_DUMP
) {
520 struct netlink_dump_control c
= {
521 .dump
= nf_tables_dump_tables
,
523 return netlink_dump_start(nlsk
, skb
, nlh
, &c
);
526 afi
= nf_tables_afinfo_lookup(net
, family
, false);
530 table
= nf_tables_table_lookup(afi
, nla
[NFTA_TABLE_NAME
]);
532 return PTR_ERR(table
);
533 if (table
->flags
& NFT_TABLE_INACTIVE
)
536 skb2
= alloc_skb(NLMSG_GOODSIZE
, GFP_KERNEL
);
540 err
= nf_tables_fill_table_info(skb2
, net
, NETLINK_CB(skb
).portid
,
541 nlh
->nlmsg_seq
, NFT_MSG_NEWTABLE
, 0,
546 return nlmsg_unicast(nlsk
, skb2
, NETLINK_CB(skb
).portid
);
553 static int nf_tables_table_enable(const struct nft_af_info
*afi
,
554 struct nft_table
*table
)
556 struct nft_chain
*chain
;
559 list_for_each_entry(chain
, &table
->chains
, list
) {
560 if (!(chain
->flags
& NFT_BASE_CHAIN
))
563 err
= nf_register_hooks(nft_base_chain(chain
)->ops
, afi
->nops
);
571 list_for_each_entry(chain
, &table
->chains
, list
) {
572 if (!(chain
->flags
& NFT_BASE_CHAIN
))
578 nf_unregister_hooks(nft_base_chain(chain
)->ops
, afi
->nops
);
583 static void nf_tables_table_disable(const struct nft_af_info
*afi
,
584 struct nft_table
*table
)
586 struct nft_chain
*chain
;
588 list_for_each_entry(chain
, &table
->chains
, list
) {
589 if (chain
->flags
& NFT_BASE_CHAIN
)
590 nf_unregister_hooks(nft_base_chain(chain
)->ops
,
595 static int nf_tables_updtable(struct nft_ctx
*ctx
)
597 struct nft_trans
*trans
;
601 if (!ctx
->nla
[NFTA_TABLE_FLAGS
])
604 flags
= ntohl(nla_get_be32(ctx
->nla
[NFTA_TABLE_FLAGS
]));
605 if (flags
& ~NFT_TABLE_F_DORMANT
)
608 if (flags
== ctx
->table
->flags
)
611 trans
= nft_trans_alloc(ctx
, NFT_MSG_NEWTABLE
,
612 sizeof(struct nft_trans_table
));
616 if ((flags
& NFT_TABLE_F_DORMANT
) &&
617 !(ctx
->table
->flags
& NFT_TABLE_F_DORMANT
)) {
618 nft_trans_table_enable(trans
) = false;
619 } else if (!(flags
& NFT_TABLE_F_DORMANT
) &&
620 ctx
->table
->flags
& NFT_TABLE_F_DORMANT
) {
621 ret
= nf_tables_table_enable(ctx
->afi
, ctx
->table
);
623 ctx
->table
->flags
&= ~NFT_TABLE_F_DORMANT
;
624 nft_trans_table_enable(trans
) = true;
630 nft_trans_table_update(trans
) = true;
631 list_add_tail(&trans
->list
, &ctx
->net
->nft
.commit_list
);
634 nft_trans_destroy(trans
);
638 static int nf_tables_newtable(struct sock
*nlsk
, struct sk_buff
*skb
,
639 const struct nlmsghdr
*nlh
,
640 const struct nlattr
* const nla
[])
642 const struct nfgenmsg
*nfmsg
= nlmsg_data(nlh
);
643 const struct nlattr
*name
;
644 struct nft_af_info
*afi
;
645 struct nft_table
*table
;
646 struct net
*net
= sock_net(skb
->sk
);
647 int family
= nfmsg
->nfgen_family
;
652 afi
= nf_tables_afinfo_lookup(net
, family
, true);
656 name
= nla
[NFTA_TABLE_NAME
];
657 table
= nf_tables_table_lookup(afi
, name
);
659 if (PTR_ERR(table
) != -ENOENT
)
660 return PTR_ERR(table
);
665 if (table
->flags
& NFT_TABLE_INACTIVE
)
667 if (nlh
->nlmsg_flags
& NLM_F_EXCL
)
669 if (nlh
->nlmsg_flags
& NLM_F_REPLACE
)
672 nft_ctx_init(&ctx
, skb
, nlh
, afi
, table
, NULL
, nla
);
673 return nf_tables_updtable(&ctx
);
676 if (nla
[NFTA_TABLE_FLAGS
]) {
677 flags
= ntohl(nla_get_be32(nla
[NFTA_TABLE_FLAGS
]));
678 if (flags
& ~NFT_TABLE_F_DORMANT
)
682 if (!try_module_get(afi
->owner
))
683 return -EAFNOSUPPORT
;
686 table
= kzalloc(sizeof(*table
), GFP_KERNEL
);
690 nla_strlcpy(table
->name
, name
, NFT_TABLE_MAXNAMELEN
);
691 INIT_LIST_HEAD(&table
->chains
);
692 INIT_LIST_HEAD(&table
->sets
);
693 table
->flags
= flags
;
695 nft_ctx_init(&ctx
, skb
, nlh
, afi
, table
, NULL
, nla
);
696 err
= nft_trans_table_add(&ctx
, NFT_MSG_NEWTABLE
);
700 list_add_tail_rcu(&table
->list
, &afi
->tables
);
705 module_put(afi
->owner
);
709 static int nft_flush_table(struct nft_ctx
*ctx
)
712 struct nft_chain
*chain
, *nc
;
713 struct nft_set
*set
, *ns
;
715 list_for_each_entry(chain
, &ctx
->table
->chains
, list
) {
718 err
= nft_delrule_by_chain(ctx
);
723 list_for_each_entry_safe(set
, ns
, &ctx
->table
->sets
, list
) {
724 if (set
->flags
& NFT_SET_ANONYMOUS
&&
725 !list_empty(&set
->bindings
))
728 err
= nft_delset(ctx
, set
);
733 list_for_each_entry_safe(chain
, nc
, &ctx
->table
->chains
, list
) {
736 err
= nft_delchain(ctx
);
741 err
= nft_deltable(ctx
);
746 static int nft_flush(struct nft_ctx
*ctx
, int family
)
748 struct nft_af_info
*afi
;
749 struct nft_table
*table
, *nt
;
750 const struct nlattr
* const *nla
= ctx
->nla
;
753 list_for_each_entry(afi
, &ctx
->net
->nft
.af_info
, list
) {
754 if (family
!= AF_UNSPEC
&& afi
->family
!= family
)
758 list_for_each_entry_safe(table
, nt
, &afi
->tables
, list
) {
759 if (nla
[NFTA_TABLE_NAME
] &&
760 nla_strcmp(nla
[NFTA_TABLE_NAME
], table
->name
) != 0)
765 err
= nft_flush_table(ctx
);
774 static int nf_tables_deltable(struct sock
*nlsk
, struct sk_buff
*skb
,
775 const struct nlmsghdr
*nlh
,
776 const struct nlattr
* const nla
[])
778 const struct nfgenmsg
*nfmsg
= nlmsg_data(nlh
);
779 struct nft_af_info
*afi
;
780 struct nft_table
*table
;
781 struct net
*net
= sock_net(skb
->sk
);
782 int family
= nfmsg
->nfgen_family
;
785 nft_ctx_init(&ctx
, skb
, nlh
, NULL
, NULL
, NULL
, nla
);
786 if (family
== AF_UNSPEC
|| nla
[NFTA_TABLE_NAME
] == NULL
)
787 return nft_flush(&ctx
, family
);
789 afi
= nf_tables_afinfo_lookup(net
, family
, false);
793 table
= nf_tables_table_lookup(afi
, nla
[NFTA_TABLE_NAME
]);
795 return PTR_ERR(table
);
796 if (table
->flags
& NFT_TABLE_INACTIVE
)
802 return nft_flush_table(&ctx
);
805 static void nf_tables_table_destroy(struct nft_ctx
*ctx
)
807 BUG_ON(ctx
->table
->use
> 0);
810 module_put(ctx
->afi
->owner
);
813 int nft_register_chain_type(const struct nf_chain_type
*ctype
)
817 nfnl_lock(NFNL_SUBSYS_NFTABLES
);
818 if (chain_type
[ctype
->family
][ctype
->type
] != NULL
) {
822 chain_type
[ctype
->family
][ctype
->type
] = ctype
;
824 nfnl_unlock(NFNL_SUBSYS_NFTABLES
);
827 EXPORT_SYMBOL_GPL(nft_register_chain_type
);
829 void nft_unregister_chain_type(const struct nf_chain_type
*ctype
)
831 nfnl_lock(NFNL_SUBSYS_NFTABLES
);
832 chain_type
[ctype
->family
][ctype
->type
] = NULL
;
833 nfnl_unlock(NFNL_SUBSYS_NFTABLES
);
835 EXPORT_SYMBOL_GPL(nft_unregister_chain_type
);
841 static struct nft_chain
*
842 nf_tables_chain_lookup_byhandle(const struct nft_table
*table
, u64 handle
)
844 struct nft_chain
*chain
;
846 list_for_each_entry(chain
, &table
->chains
, list
) {
847 if (chain
->handle
== handle
)
851 return ERR_PTR(-ENOENT
);
854 static struct nft_chain
*nf_tables_chain_lookup(const struct nft_table
*table
,
855 const struct nlattr
*nla
)
857 struct nft_chain
*chain
;
860 return ERR_PTR(-EINVAL
);
862 list_for_each_entry(chain
, &table
->chains
, list
) {
863 if (!nla_strcmp(nla
, chain
->name
))
867 return ERR_PTR(-ENOENT
);
870 static const struct nla_policy nft_chain_policy
[NFTA_CHAIN_MAX
+ 1] = {
871 [NFTA_CHAIN_TABLE
] = { .type
= NLA_STRING
},
872 [NFTA_CHAIN_HANDLE
] = { .type
= NLA_U64
},
873 [NFTA_CHAIN_NAME
] = { .type
= NLA_STRING
,
874 .len
= NFT_CHAIN_MAXNAMELEN
- 1 },
875 [NFTA_CHAIN_HOOK
] = { .type
= NLA_NESTED
},
876 [NFTA_CHAIN_POLICY
] = { .type
= NLA_U32
},
877 [NFTA_CHAIN_TYPE
] = { .type
= NLA_STRING
},
878 [NFTA_CHAIN_COUNTERS
] = { .type
= NLA_NESTED
},
881 static const struct nla_policy nft_hook_policy
[NFTA_HOOK_MAX
+ 1] = {
882 [NFTA_HOOK_HOOKNUM
] = { .type
= NLA_U32
},
883 [NFTA_HOOK_PRIORITY
] = { .type
= NLA_U32
},
886 static int nft_dump_stats(struct sk_buff
*skb
, struct nft_stats __percpu
*stats
)
888 struct nft_stats
*cpu_stats
, total
;
894 memset(&total
, 0, sizeof(total
));
895 for_each_possible_cpu(cpu
) {
896 cpu_stats
= per_cpu_ptr(stats
, cpu
);
898 seq
= u64_stats_fetch_begin_irq(&cpu_stats
->syncp
);
899 pkts
= cpu_stats
->pkts
;
900 bytes
= cpu_stats
->bytes
;
901 } while (u64_stats_fetch_retry_irq(&cpu_stats
->syncp
, seq
));
903 total
.bytes
+= bytes
;
905 nest
= nla_nest_start(skb
, NFTA_CHAIN_COUNTERS
);
907 goto nla_put_failure
;
909 if (nla_put_be64(skb
, NFTA_COUNTER_PACKETS
, cpu_to_be64(total
.pkts
)) ||
910 nla_put_be64(skb
, NFTA_COUNTER_BYTES
, cpu_to_be64(total
.bytes
)))
911 goto nla_put_failure
;
913 nla_nest_end(skb
, nest
);
920 static int nf_tables_fill_chain_info(struct sk_buff
*skb
, struct net
*net
,
921 u32 portid
, u32 seq
, int event
, u32 flags
,
922 int family
, const struct nft_table
*table
,
923 const struct nft_chain
*chain
)
925 struct nlmsghdr
*nlh
;
926 struct nfgenmsg
*nfmsg
;
928 event
|= NFNL_SUBSYS_NFTABLES
<< 8;
929 nlh
= nlmsg_put(skb
, portid
, seq
, event
, sizeof(struct nfgenmsg
), flags
);
931 goto nla_put_failure
;
933 nfmsg
= nlmsg_data(nlh
);
934 nfmsg
->nfgen_family
= family
;
935 nfmsg
->version
= NFNETLINK_V0
;
936 nfmsg
->res_id
= htons(net
->nft
.base_seq
& 0xffff);
938 if (nla_put_string(skb
, NFTA_CHAIN_TABLE
, table
->name
))
939 goto nla_put_failure
;
940 if (nla_put_be64(skb
, NFTA_CHAIN_HANDLE
, cpu_to_be64(chain
->handle
)))
941 goto nla_put_failure
;
942 if (nla_put_string(skb
, NFTA_CHAIN_NAME
, chain
->name
))
943 goto nla_put_failure
;
945 if (chain
->flags
& NFT_BASE_CHAIN
) {
946 const struct nft_base_chain
*basechain
= nft_base_chain(chain
);
947 const struct nf_hook_ops
*ops
= &basechain
->ops
[0];
950 nest
= nla_nest_start(skb
, NFTA_CHAIN_HOOK
);
952 goto nla_put_failure
;
953 if (nla_put_be32(skb
, NFTA_HOOK_HOOKNUM
, htonl(ops
->hooknum
)))
954 goto nla_put_failure
;
955 if (nla_put_be32(skb
, NFTA_HOOK_PRIORITY
, htonl(ops
->priority
)))
956 goto nla_put_failure
;
957 nla_nest_end(skb
, nest
);
959 if (nla_put_be32(skb
, NFTA_CHAIN_POLICY
,
960 htonl(basechain
->policy
)))
961 goto nla_put_failure
;
963 if (nla_put_string(skb
, NFTA_CHAIN_TYPE
, basechain
->type
->name
))
964 goto nla_put_failure
;
966 if (nft_dump_stats(skb
, nft_base_chain(chain
)->stats
))
967 goto nla_put_failure
;
970 if (nla_put_be32(skb
, NFTA_CHAIN_USE
, htonl(chain
->use
)))
971 goto nla_put_failure
;
977 nlmsg_trim(skb
, nlh
);
981 static int nf_tables_chain_notify(const struct nft_ctx
*ctx
, int event
)
987 !nfnetlink_has_listeners(ctx
->net
, NFNLGRP_NFTABLES
))
991 skb
= nlmsg_new(NLMSG_GOODSIZE
, GFP_KERNEL
);
995 err
= nf_tables_fill_chain_info(skb
, ctx
->net
, ctx
->portid
, ctx
->seq
,
996 event
, 0, ctx
->afi
->family
, ctx
->table
,
1003 err
= nfnetlink_send(skb
, ctx
->net
, ctx
->portid
, NFNLGRP_NFTABLES
,
1004 ctx
->report
, GFP_KERNEL
);
1007 nfnetlink_set_err(ctx
->net
, ctx
->portid
, NFNLGRP_NFTABLES
,
1013 static int nf_tables_dump_chains(struct sk_buff
*skb
,
1014 struct netlink_callback
*cb
)
1016 const struct nfgenmsg
*nfmsg
= nlmsg_data(cb
->nlh
);
1017 const struct nft_af_info
*afi
;
1018 const struct nft_table
*table
;
1019 const struct nft_chain
*chain
;
1020 unsigned int idx
= 0, s_idx
= cb
->args
[0];
1021 struct net
*net
= sock_net(skb
->sk
);
1022 int family
= nfmsg
->nfgen_family
;
1025 cb
->seq
= net
->nft
.base_seq
;
1027 list_for_each_entry_rcu(afi
, &net
->nft
.af_info
, list
) {
1028 if (family
!= NFPROTO_UNSPEC
&& family
!= afi
->family
)
1031 list_for_each_entry_rcu(table
, &afi
->tables
, list
) {
1032 list_for_each_entry_rcu(chain
, &table
->chains
, list
) {
1036 memset(&cb
->args
[1], 0,
1037 sizeof(cb
->args
) - sizeof(cb
->args
[0]));
1038 if (nf_tables_fill_chain_info(skb
, net
,
1039 NETLINK_CB(cb
->skb
).portid
,
1043 afi
->family
, table
, chain
) < 0)
1046 nl_dump_check_consistent(cb
, nlmsg_hdr(skb
));
1058 static int nf_tables_getchain(struct sock
*nlsk
, struct sk_buff
*skb
,
1059 const struct nlmsghdr
*nlh
,
1060 const struct nlattr
* const nla
[])
1062 const struct nfgenmsg
*nfmsg
= nlmsg_data(nlh
);
1063 const struct nft_af_info
*afi
;
1064 const struct nft_table
*table
;
1065 const struct nft_chain
*chain
;
1066 struct sk_buff
*skb2
;
1067 struct net
*net
= sock_net(skb
->sk
);
1068 int family
= nfmsg
->nfgen_family
;
1071 if (nlh
->nlmsg_flags
& NLM_F_DUMP
) {
1072 struct netlink_dump_control c
= {
1073 .dump
= nf_tables_dump_chains
,
1075 return netlink_dump_start(nlsk
, skb
, nlh
, &c
);
1078 afi
= nf_tables_afinfo_lookup(net
, family
, false);
1080 return PTR_ERR(afi
);
1082 table
= nf_tables_table_lookup(afi
, nla
[NFTA_CHAIN_TABLE
]);
1084 return PTR_ERR(table
);
1085 if (table
->flags
& NFT_TABLE_INACTIVE
)
1088 chain
= nf_tables_chain_lookup(table
, nla
[NFTA_CHAIN_NAME
]);
1090 return PTR_ERR(chain
);
1091 if (chain
->flags
& NFT_CHAIN_INACTIVE
)
1094 skb2
= alloc_skb(NLMSG_GOODSIZE
, GFP_KERNEL
);
1098 err
= nf_tables_fill_chain_info(skb2
, net
, NETLINK_CB(skb
).portid
,
1099 nlh
->nlmsg_seq
, NFT_MSG_NEWCHAIN
, 0,
1100 family
, table
, chain
);
1104 return nlmsg_unicast(nlsk
, skb2
, NETLINK_CB(skb
).portid
);
1111 static const struct nla_policy nft_counter_policy
[NFTA_COUNTER_MAX
+ 1] = {
1112 [NFTA_COUNTER_PACKETS
] = { .type
= NLA_U64
},
1113 [NFTA_COUNTER_BYTES
] = { .type
= NLA_U64
},
1116 static struct nft_stats __percpu
*nft_stats_alloc(const struct nlattr
*attr
)
1118 struct nlattr
*tb
[NFTA_COUNTER_MAX
+1];
1119 struct nft_stats __percpu
*newstats
;
1120 struct nft_stats
*stats
;
1123 err
= nla_parse_nested(tb
, NFTA_COUNTER_MAX
, attr
, nft_counter_policy
);
1125 return ERR_PTR(err
);
1127 if (!tb
[NFTA_COUNTER_BYTES
] || !tb
[NFTA_COUNTER_PACKETS
])
1128 return ERR_PTR(-EINVAL
);
1130 newstats
= netdev_alloc_pcpu_stats(struct nft_stats
);
1131 if (newstats
== NULL
)
1132 return ERR_PTR(-ENOMEM
);
1134 /* Restore old counters on this cpu, no problem. Per-cpu statistics
1135 * are not exposed to userspace.
1138 stats
= this_cpu_ptr(newstats
);
1139 stats
->bytes
= be64_to_cpu(nla_get_be64(tb
[NFTA_COUNTER_BYTES
]));
1140 stats
->pkts
= be64_to_cpu(nla_get_be64(tb
[NFTA_COUNTER_PACKETS
]));
1146 static void nft_chain_stats_replace(struct nft_base_chain
*chain
,
1147 struct nft_stats __percpu
*newstats
)
1149 if (newstats
== NULL
)
1153 struct nft_stats __percpu
*oldstats
=
1154 nft_dereference(chain
->stats
);
1156 rcu_assign_pointer(chain
->stats
, newstats
);
1158 free_percpu(oldstats
);
1160 rcu_assign_pointer(chain
->stats
, newstats
);
1163 static void nf_tables_chain_destroy(struct nft_chain
*chain
)
1165 BUG_ON(chain
->use
> 0);
1167 if (chain
->flags
& NFT_BASE_CHAIN
) {
1168 module_put(nft_base_chain(chain
)->type
->owner
);
1169 free_percpu(nft_base_chain(chain
)->stats
);
1170 kfree(nft_base_chain(chain
));
1176 static int nf_tables_newchain(struct sock
*nlsk
, struct sk_buff
*skb
,
1177 const struct nlmsghdr
*nlh
,
1178 const struct nlattr
* const nla
[])
1180 const struct nfgenmsg
*nfmsg
= nlmsg_data(nlh
);
1181 const struct nlattr
* uninitialized_var(name
);
1182 struct nft_af_info
*afi
;
1183 struct nft_table
*table
;
1184 struct nft_chain
*chain
;
1185 struct nft_base_chain
*basechain
= NULL
;
1186 struct nlattr
*ha
[NFTA_HOOK_MAX
+ 1];
1187 struct net
*net
= sock_net(skb
->sk
);
1188 int family
= nfmsg
->nfgen_family
;
1189 u8 policy
= NF_ACCEPT
;
1192 struct nft_stats __percpu
*stats
;
1197 create
= nlh
->nlmsg_flags
& NLM_F_CREATE
? true : false;
1199 afi
= nf_tables_afinfo_lookup(net
, family
, true);
1201 return PTR_ERR(afi
);
1203 table
= nf_tables_table_lookup(afi
, nla
[NFTA_CHAIN_TABLE
]);
1205 return PTR_ERR(table
);
1208 name
= nla
[NFTA_CHAIN_NAME
];
1210 if (nla
[NFTA_CHAIN_HANDLE
]) {
1211 handle
= be64_to_cpu(nla_get_be64(nla
[NFTA_CHAIN_HANDLE
]));
1212 chain
= nf_tables_chain_lookup_byhandle(table
, handle
);
1214 return PTR_ERR(chain
);
1216 chain
= nf_tables_chain_lookup(table
, name
);
1217 if (IS_ERR(chain
)) {
1218 if (PTR_ERR(chain
) != -ENOENT
)
1219 return PTR_ERR(chain
);
1224 if (nla
[NFTA_CHAIN_POLICY
]) {
1225 if ((chain
!= NULL
&&
1226 !(chain
->flags
& NFT_BASE_CHAIN
)))
1229 if (chain
== NULL
&&
1230 nla
[NFTA_CHAIN_HOOK
] == NULL
)
1233 policy
= ntohl(nla_get_be32(nla
[NFTA_CHAIN_POLICY
]));
1243 if (chain
!= NULL
) {
1244 struct nft_stats
*stats
= NULL
;
1245 struct nft_trans
*trans
;
1247 if (chain
->flags
& NFT_CHAIN_INACTIVE
)
1249 if (nlh
->nlmsg_flags
& NLM_F_EXCL
)
1251 if (nlh
->nlmsg_flags
& NLM_F_REPLACE
)
1254 if (nla
[NFTA_CHAIN_HANDLE
] && name
&&
1255 !IS_ERR(nf_tables_chain_lookup(table
, nla
[NFTA_CHAIN_NAME
])))
1258 if (nla
[NFTA_CHAIN_COUNTERS
]) {
1259 if (!(chain
->flags
& NFT_BASE_CHAIN
))
1262 stats
= nft_stats_alloc(nla
[NFTA_CHAIN_COUNTERS
]);
1264 return PTR_ERR(stats
);
1267 nft_ctx_init(&ctx
, skb
, nlh
, afi
, table
, chain
, nla
);
1268 trans
= nft_trans_alloc(&ctx
, NFT_MSG_NEWCHAIN
,
1269 sizeof(struct nft_trans_chain
));
1270 if (trans
== NULL
) {
1275 nft_trans_chain_stats(trans
) = stats
;
1276 nft_trans_chain_update(trans
) = true;
1278 if (nla
[NFTA_CHAIN_POLICY
])
1279 nft_trans_chain_policy(trans
) = policy
;
1281 nft_trans_chain_policy(trans
) = -1;
1283 if (nla
[NFTA_CHAIN_HANDLE
] && name
) {
1284 nla_strlcpy(nft_trans_chain_name(trans
), name
,
1285 NFT_CHAIN_MAXNAMELEN
);
1287 list_add_tail(&trans
->list
, &net
->nft
.commit_list
);
1291 if (table
->use
== UINT_MAX
)
1294 if (nla
[NFTA_CHAIN_HOOK
]) {
1295 const struct nf_chain_type
*type
;
1296 struct nf_hook_ops
*ops
;
1298 u32 hooknum
, priority
;
1300 type
= chain_type
[family
][NFT_CHAIN_T_DEFAULT
];
1301 if (nla
[NFTA_CHAIN_TYPE
]) {
1302 type
= nf_tables_chain_type_lookup(afi
,
1303 nla
[NFTA_CHAIN_TYPE
],
1306 return PTR_ERR(type
);
1309 err
= nla_parse_nested(ha
, NFTA_HOOK_MAX
, nla
[NFTA_CHAIN_HOOK
],
1313 if (ha
[NFTA_HOOK_HOOKNUM
] == NULL
||
1314 ha
[NFTA_HOOK_PRIORITY
] == NULL
)
1317 hooknum
= ntohl(nla_get_be32(ha
[NFTA_HOOK_HOOKNUM
]));
1318 if (hooknum
>= afi
->nhooks
)
1320 priority
= ntohl(nla_get_be32(ha
[NFTA_HOOK_PRIORITY
]));
1322 if (!(type
->hook_mask
& (1 << hooknum
)))
1324 if (!try_module_get(type
->owner
))
1326 hookfn
= type
->hooks
[hooknum
];
1328 basechain
= kzalloc(sizeof(*basechain
), GFP_KERNEL
);
1329 if (basechain
== NULL
) {
1330 module_put(type
->owner
);
1334 if (nla
[NFTA_CHAIN_COUNTERS
]) {
1335 stats
= nft_stats_alloc(nla
[NFTA_CHAIN_COUNTERS
]);
1336 if (IS_ERR(stats
)) {
1337 module_put(type
->owner
);
1339 return PTR_ERR(stats
);
1341 basechain
->stats
= stats
;
1343 stats
= netdev_alloc_pcpu_stats(struct nft_stats
);
1344 if (stats
== NULL
) {
1345 module_put(type
->owner
);
1349 rcu_assign_pointer(basechain
->stats
, stats
);
1352 write_pnet(&basechain
->pnet
, net
);
1353 basechain
->type
= type
;
1354 chain
= &basechain
->chain
;
1356 for (i
= 0; i
< afi
->nops
; i
++) {
1357 ops
= &basechain
->ops
[i
];
1359 ops
->owner
= afi
->owner
;
1360 ops
->hooknum
= hooknum
;
1361 ops
->priority
= priority
;
1363 ops
->hook
= afi
->hooks
[ops
->hooknum
];
1366 if (afi
->hook_ops_init
)
1367 afi
->hook_ops_init(ops
, i
);
1370 chain
->flags
|= NFT_BASE_CHAIN
;
1371 basechain
->policy
= policy
;
1373 chain
= kzalloc(sizeof(*chain
), GFP_KERNEL
);
1378 INIT_LIST_HEAD(&chain
->rules
);
1379 chain
->handle
= nf_tables_alloc_handle(table
);
1380 chain
->table
= table
;
1381 nla_strlcpy(chain
->name
, name
, NFT_CHAIN_MAXNAMELEN
);
1383 if (!(table
->flags
& NFT_TABLE_F_DORMANT
) &&
1384 chain
->flags
& NFT_BASE_CHAIN
) {
1385 err
= nf_register_hooks(nft_base_chain(chain
)->ops
, afi
->nops
);
1390 nft_ctx_init(&ctx
, skb
, nlh
, afi
, table
, chain
, nla
);
1391 err
= nft_trans_chain_add(&ctx
, NFT_MSG_NEWCHAIN
);
1396 list_add_tail_rcu(&chain
->list
, &table
->chains
);
1399 nf_tables_unregister_hooks(table
, chain
, afi
->nops
);
1401 nf_tables_chain_destroy(chain
);
1405 static int nf_tables_delchain(struct sock
*nlsk
, struct sk_buff
*skb
,
1406 const struct nlmsghdr
*nlh
,
1407 const struct nlattr
* const nla
[])
1409 const struct nfgenmsg
*nfmsg
= nlmsg_data(nlh
);
1410 struct nft_af_info
*afi
;
1411 struct nft_table
*table
;
1412 struct nft_chain
*chain
;
1413 struct net
*net
= sock_net(skb
->sk
);
1414 int family
= nfmsg
->nfgen_family
;
1417 afi
= nf_tables_afinfo_lookup(net
, family
, false);
1419 return PTR_ERR(afi
);
1421 table
= nf_tables_table_lookup(afi
, nla
[NFTA_CHAIN_TABLE
]);
1423 return PTR_ERR(table
);
1424 if (table
->flags
& NFT_TABLE_INACTIVE
)
1427 chain
= nf_tables_chain_lookup(table
, nla
[NFTA_CHAIN_NAME
]);
1429 return PTR_ERR(chain
);
1430 if (chain
->flags
& NFT_CHAIN_INACTIVE
)
1435 nft_ctx_init(&ctx
, skb
, nlh
, afi
, table
, chain
, nla
);
1437 return nft_delchain(&ctx
);
1445 * nft_register_expr - register nf_tables expr type
1448 * Registers the expr type for use with nf_tables. Returns zero on
1449 * success or a negative errno code otherwise.
1451 int nft_register_expr(struct nft_expr_type
*type
)
1453 nfnl_lock(NFNL_SUBSYS_NFTABLES
);
1454 if (type
->family
== NFPROTO_UNSPEC
)
1455 list_add_tail_rcu(&type
->list
, &nf_tables_expressions
);
1457 list_add_rcu(&type
->list
, &nf_tables_expressions
);
1458 nfnl_unlock(NFNL_SUBSYS_NFTABLES
);
1461 EXPORT_SYMBOL_GPL(nft_register_expr
);
1464 * nft_unregister_expr - unregister nf_tables expr type
1467 * Unregisters the expr type for use with nf_tables.
1469 void nft_unregister_expr(struct nft_expr_type
*type
)
1471 nfnl_lock(NFNL_SUBSYS_NFTABLES
);
1472 list_del_rcu(&type
->list
);
1473 nfnl_unlock(NFNL_SUBSYS_NFTABLES
);
1475 EXPORT_SYMBOL_GPL(nft_unregister_expr
);
1477 static const struct nft_expr_type
*__nft_expr_type_get(u8 family
,
1480 const struct nft_expr_type
*type
;
1482 list_for_each_entry(type
, &nf_tables_expressions
, list
) {
1483 if (!nla_strcmp(nla
, type
->name
) &&
1484 (!type
->family
|| type
->family
== family
))
1490 static const struct nft_expr_type
*nft_expr_type_get(u8 family
,
1493 const struct nft_expr_type
*type
;
1496 return ERR_PTR(-EINVAL
);
1498 type
= __nft_expr_type_get(family
, nla
);
1499 if (type
!= NULL
&& try_module_get(type
->owner
))
1502 #ifdef CONFIG_MODULES
1504 nfnl_unlock(NFNL_SUBSYS_NFTABLES
);
1505 request_module("nft-expr-%u-%.*s", family
,
1506 nla_len(nla
), (char *)nla_data(nla
));
1507 nfnl_lock(NFNL_SUBSYS_NFTABLES
);
1508 if (__nft_expr_type_get(family
, nla
))
1509 return ERR_PTR(-EAGAIN
);
1511 nfnl_unlock(NFNL_SUBSYS_NFTABLES
);
1512 request_module("nft-expr-%.*s",
1513 nla_len(nla
), (char *)nla_data(nla
));
1514 nfnl_lock(NFNL_SUBSYS_NFTABLES
);
1515 if (__nft_expr_type_get(family
, nla
))
1516 return ERR_PTR(-EAGAIN
);
1519 return ERR_PTR(-ENOENT
);
1522 static const struct nla_policy nft_expr_policy
[NFTA_EXPR_MAX
+ 1] = {
1523 [NFTA_EXPR_NAME
] = { .type
= NLA_STRING
},
1524 [NFTA_EXPR_DATA
] = { .type
= NLA_NESTED
},
1527 static int nf_tables_fill_expr_info(struct sk_buff
*skb
,
1528 const struct nft_expr
*expr
)
1530 if (nla_put_string(skb
, NFTA_EXPR_NAME
, expr
->ops
->type
->name
))
1531 goto nla_put_failure
;
1533 if (expr
->ops
->dump
) {
1534 struct nlattr
*data
= nla_nest_start(skb
, NFTA_EXPR_DATA
);
1536 goto nla_put_failure
;
1537 if (expr
->ops
->dump(skb
, expr
) < 0)
1538 goto nla_put_failure
;
1539 nla_nest_end(skb
, data
);
/*
 * Dump @expr into @skb as a nested attribute of type @attr.
 * Returns 0 on success, -1 on failure.
 */
int nft_expr_dump(struct sk_buff *skb, unsigned int attr,
		  const struct nft_expr *expr)
{
	struct nlattr *nest;

	nest = nla_nest_start(skb, attr);
	if (!nest)
		goto nla_put_failure;
	if (nf_tables_fill_expr_info(skb, expr) < 0)
		goto nla_put_failure;
	nla_nest_end(skb, nest);
	return 0;

nla_put_failure:
	return -1;
}
1565 struct nft_expr_info
{
1566 const struct nft_expr_ops
*ops
;
1567 struct nlattr
*tb
[NFT_EXPR_MAXATTR
+ 1];
1570 static int nf_tables_expr_parse(const struct nft_ctx
*ctx
,
1571 const struct nlattr
*nla
,
1572 struct nft_expr_info
*info
)
1574 const struct nft_expr_type
*type
;
1575 const struct nft_expr_ops
*ops
;
1576 struct nlattr
*tb
[NFTA_EXPR_MAX
+ 1];
1579 err
= nla_parse_nested(tb
, NFTA_EXPR_MAX
, nla
, nft_expr_policy
);
1583 type
= nft_expr_type_get(ctx
->afi
->family
, tb
[NFTA_EXPR_NAME
]);
1585 return PTR_ERR(type
);
1587 if (tb
[NFTA_EXPR_DATA
]) {
1588 err
= nla_parse_nested(info
->tb
, type
->maxattr
,
1589 tb
[NFTA_EXPR_DATA
], type
->policy
);
1593 memset(info
->tb
, 0, sizeof(info
->tb
[0]) * (type
->maxattr
+ 1));
1595 if (type
->select_ops
!= NULL
) {
1596 ops
= type
->select_ops(ctx
,
1597 (const struct nlattr
* const *)info
->tb
);
1609 module_put(type
->owner
);
1613 static int nf_tables_newexpr(const struct nft_ctx
*ctx
,
1614 const struct nft_expr_info
*info
,
1615 struct nft_expr
*expr
)
1617 const struct nft_expr_ops
*ops
= info
->ops
;
1622 err
= ops
->init(ctx
, expr
, (const struct nlattr
**)info
->tb
);
1634 static void nf_tables_expr_destroy(const struct nft_ctx
*ctx
,
1635 struct nft_expr
*expr
)
1637 if (expr
->ops
->destroy
)
1638 expr
->ops
->destroy(ctx
, expr
);
1639 module_put(expr
->ops
->type
->owner
);
1642 struct nft_expr
*nft_expr_init(const struct nft_ctx
*ctx
,
1643 const struct nlattr
*nla
)
1645 struct nft_expr_info info
;
1646 struct nft_expr
*expr
;
1649 err
= nf_tables_expr_parse(ctx
, nla
, &info
);
1654 expr
= kzalloc(info
.ops
->size
, GFP_KERNEL
);
1658 err
= nf_tables_newexpr(ctx
, &info
, expr
);
1664 module_put(info
.ops
->type
->owner
);
1666 return ERR_PTR(err
);
/* Destroy an expression and free its memory. */
void nft_expr_destroy(const struct nft_ctx *ctx, struct nft_expr *expr)
{
	nf_tables_expr_destroy(ctx, expr);
	kfree(expr);
}
1679 static struct nft_rule
*__nf_tables_rule_lookup(const struct nft_chain
*chain
,
1682 struct nft_rule
*rule
;
1684 // FIXME: this sucks
1685 list_for_each_entry(rule
, &chain
->rules
, list
) {
1686 if (handle
== rule
->handle
)
1690 return ERR_PTR(-ENOENT
);
1693 static struct nft_rule
*nf_tables_rule_lookup(const struct nft_chain
*chain
,
1694 const struct nlattr
*nla
)
1697 return ERR_PTR(-EINVAL
);
1699 return __nf_tables_rule_lookup(chain
, be64_to_cpu(nla_get_be64(nla
)));
1702 static const struct nla_policy nft_rule_policy
[NFTA_RULE_MAX
+ 1] = {
1703 [NFTA_RULE_TABLE
] = { .type
= NLA_STRING
},
1704 [NFTA_RULE_CHAIN
] = { .type
= NLA_STRING
,
1705 .len
= NFT_CHAIN_MAXNAMELEN
- 1 },
1706 [NFTA_RULE_HANDLE
] = { .type
= NLA_U64
},
1707 [NFTA_RULE_EXPRESSIONS
] = { .type
= NLA_NESTED
},
1708 [NFTA_RULE_COMPAT
] = { .type
= NLA_NESTED
},
1709 [NFTA_RULE_POSITION
] = { .type
= NLA_U64
},
1710 [NFTA_RULE_USERDATA
] = { .type
= NLA_BINARY
,
1711 .len
= NFT_USERDATA_MAXLEN
},
1714 static int nf_tables_fill_rule_info(struct sk_buff
*skb
, struct net
*net
,
1715 u32 portid
, u32 seq
, int event
,
1716 u32 flags
, int family
,
1717 const struct nft_table
*table
,
1718 const struct nft_chain
*chain
,
1719 const struct nft_rule
*rule
)
1721 struct nlmsghdr
*nlh
;
1722 struct nfgenmsg
*nfmsg
;
1723 const struct nft_expr
*expr
, *next
;
1724 struct nlattr
*list
;
1725 const struct nft_rule
*prule
;
1726 int type
= event
| NFNL_SUBSYS_NFTABLES
<< 8;
1728 nlh
= nlmsg_put(skb
, portid
, seq
, type
, sizeof(struct nfgenmsg
),
1731 goto nla_put_failure
;
1733 nfmsg
= nlmsg_data(nlh
);
1734 nfmsg
->nfgen_family
= family
;
1735 nfmsg
->version
= NFNETLINK_V0
;
1736 nfmsg
->res_id
= htons(net
->nft
.base_seq
& 0xffff);
1738 if (nla_put_string(skb
, NFTA_RULE_TABLE
, table
->name
))
1739 goto nla_put_failure
;
1740 if (nla_put_string(skb
, NFTA_RULE_CHAIN
, chain
->name
))
1741 goto nla_put_failure
;
1742 if (nla_put_be64(skb
, NFTA_RULE_HANDLE
, cpu_to_be64(rule
->handle
)))
1743 goto nla_put_failure
;
1745 if ((event
!= NFT_MSG_DELRULE
) && (rule
->list
.prev
!= &chain
->rules
)) {
1746 prule
= list_entry(rule
->list
.prev
, struct nft_rule
, list
);
1747 if (nla_put_be64(skb
, NFTA_RULE_POSITION
,
1748 cpu_to_be64(prule
->handle
)))
1749 goto nla_put_failure
;
1752 list
= nla_nest_start(skb
, NFTA_RULE_EXPRESSIONS
);
1754 goto nla_put_failure
;
1755 nft_rule_for_each_expr(expr
, next
, rule
) {
1756 if (nft_expr_dump(skb
, NFTA_LIST_ELEM
, expr
) < 0)
1757 goto nla_put_failure
;
1759 nla_nest_end(skb
, list
);
1762 struct nft_userdata
*udata
= nft_userdata(rule
);
1763 if (nla_put(skb
, NFTA_RULE_USERDATA
, udata
->len
+ 1,
1765 goto nla_put_failure
;
1768 nlmsg_end(skb
, nlh
);
1772 nlmsg_trim(skb
, nlh
);
1776 static int nf_tables_rule_notify(const struct nft_ctx
*ctx
,
1777 const struct nft_rule
*rule
,
1780 struct sk_buff
*skb
;
1784 !nfnetlink_has_listeners(ctx
->net
, NFNLGRP_NFTABLES
))
1788 skb
= nlmsg_new(NLMSG_GOODSIZE
, GFP_KERNEL
);
1792 err
= nf_tables_fill_rule_info(skb
, ctx
->net
, ctx
->portid
, ctx
->seq
,
1793 event
, 0, ctx
->afi
->family
, ctx
->table
,
1800 err
= nfnetlink_send(skb
, ctx
->net
, ctx
->portid
, NFNLGRP_NFTABLES
,
1801 ctx
->report
, GFP_KERNEL
);
1804 nfnetlink_set_err(ctx
->net
, ctx
->portid
, NFNLGRP_NFTABLES
,
1810 static int nf_tables_dump_rules(struct sk_buff
*skb
,
1811 struct netlink_callback
*cb
)
1813 const struct nfgenmsg
*nfmsg
= nlmsg_data(cb
->nlh
);
1814 const struct nft_af_info
*afi
;
1815 const struct nft_table
*table
;
1816 const struct nft_chain
*chain
;
1817 const struct nft_rule
*rule
;
1818 unsigned int idx
= 0, s_idx
= cb
->args
[0];
1819 struct net
*net
= sock_net(skb
->sk
);
1820 int family
= nfmsg
->nfgen_family
;
1823 cb
->seq
= net
->nft
.base_seq
;
1825 list_for_each_entry_rcu(afi
, &net
->nft
.af_info
, list
) {
1826 if (family
!= NFPROTO_UNSPEC
&& family
!= afi
->family
)
1829 list_for_each_entry_rcu(table
, &afi
->tables
, list
) {
1830 list_for_each_entry_rcu(chain
, &table
->chains
, list
) {
1831 list_for_each_entry_rcu(rule
, &chain
->rules
, list
) {
1832 if (!nft_rule_is_active(net
, rule
))
1837 memset(&cb
->args
[1], 0,
1838 sizeof(cb
->args
) - sizeof(cb
->args
[0]));
1839 if (nf_tables_fill_rule_info(skb
, net
, NETLINK_CB(cb
->skb
).portid
,
1842 NLM_F_MULTI
| NLM_F_APPEND
,
1843 afi
->family
, table
, chain
, rule
) < 0)
1846 nl_dump_check_consistent(cb
, nlmsg_hdr(skb
));
1860 static int nf_tables_getrule(struct sock
*nlsk
, struct sk_buff
*skb
,
1861 const struct nlmsghdr
*nlh
,
1862 const struct nlattr
* const nla
[])
1864 const struct nfgenmsg
*nfmsg
= nlmsg_data(nlh
);
1865 const struct nft_af_info
*afi
;
1866 const struct nft_table
*table
;
1867 const struct nft_chain
*chain
;
1868 const struct nft_rule
*rule
;
1869 struct sk_buff
*skb2
;
1870 struct net
*net
= sock_net(skb
->sk
);
1871 int family
= nfmsg
->nfgen_family
;
1874 if (nlh
->nlmsg_flags
& NLM_F_DUMP
) {
1875 struct netlink_dump_control c
= {
1876 .dump
= nf_tables_dump_rules
,
1878 return netlink_dump_start(nlsk
, skb
, nlh
, &c
);
1881 afi
= nf_tables_afinfo_lookup(net
, family
, false);
1883 return PTR_ERR(afi
);
1885 table
= nf_tables_table_lookup(afi
, nla
[NFTA_RULE_TABLE
]);
1887 return PTR_ERR(table
);
1888 if (table
->flags
& NFT_TABLE_INACTIVE
)
1891 chain
= nf_tables_chain_lookup(table
, nla
[NFTA_RULE_CHAIN
]);
1893 return PTR_ERR(chain
);
1894 if (chain
->flags
& NFT_CHAIN_INACTIVE
)
1897 rule
= nf_tables_rule_lookup(chain
, nla
[NFTA_RULE_HANDLE
]);
1899 return PTR_ERR(rule
);
1901 skb2
= alloc_skb(NLMSG_GOODSIZE
, GFP_KERNEL
);
1905 err
= nf_tables_fill_rule_info(skb2
, net
, NETLINK_CB(skb
).portid
,
1906 nlh
->nlmsg_seq
, NFT_MSG_NEWRULE
, 0,
1907 family
, table
, chain
, rule
);
1911 return nlmsg_unicast(nlsk
, skb2
, NETLINK_CB(skb
).portid
);
1918 static void nf_tables_rule_destroy(const struct nft_ctx
*ctx
,
1919 struct nft_rule
*rule
)
1921 struct nft_expr
*expr
;
1924 * Careful: some expressions might not be initialized in case this
1925 * is called on error from nf_tables_newrule().
1927 expr
= nft_expr_first(rule
);
1928 while (expr
->ops
&& expr
!= nft_expr_last(rule
)) {
1929 nf_tables_expr_destroy(ctx
, expr
);
1930 expr
= nft_expr_next(expr
);
1935 #define NFT_RULE_MAXEXPRS 128
1937 static struct nft_expr_info
*info
;
1939 static int nf_tables_newrule(struct sock
*nlsk
, struct sk_buff
*skb
,
1940 const struct nlmsghdr
*nlh
,
1941 const struct nlattr
* const nla
[])
1943 const struct nfgenmsg
*nfmsg
= nlmsg_data(nlh
);
1944 struct nft_af_info
*afi
;
1945 struct net
*net
= sock_net(skb
->sk
);
1946 struct nft_table
*table
;
1947 struct nft_chain
*chain
;
1948 struct nft_rule
*rule
, *old_rule
= NULL
;
1949 struct nft_userdata
*udata
;
1950 struct nft_trans
*trans
= NULL
;
1951 struct nft_expr
*expr
;
1954 unsigned int size
, i
, n
, ulen
= 0, usize
= 0;
1957 u64 handle
, pos_handle
;
1959 create
= nlh
->nlmsg_flags
& NLM_F_CREATE
? true : false;
1961 afi
= nf_tables_afinfo_lookup(net
, nfmsg
->nfgen_family
, create
);
1963 return PTR_ERR(afi
);
1965 table
= nf_tables_table_lookup(afi
, nla
[NFTA_RULE_TABLE
]);
1967 return PTR_ERR(table
);
1969 chain
= nf_tables_chain_lookup(table
, nla
[NFTA_RULE_CHAIN
]);
1971 return PTR_ERR(chain
);
1973 if (nla
[NFTA_RULE_HANDLE
]) {
1974 handle
= be64_to_cpu(nla_get_be64(nla
[NFTA_RULE_HANDLE
]));
1975 rule
= __nf_tables_rule_lookup(chain
, handle
);
1977 return PTR_ERR(rule
);
1979 if (nlh
->nlmsg_flags
& NLM_F_EXCL
)
1981 if (nlh
->nlmsg_flags
& NLM_F_REPLACE
)
1986 if (!create
|| nlh
->nlmsg_flags
& NLM_F_REPLACE
)
1988 handle
= nf_tables_alloc_handle(table
);
1990 if (chain
->use
== UINT_MAX
)
1994 if (nla
[NFTA_RULE_POSITION
]) {
1995 if (!(nlh
->nlmsg_flags
& NLM_F_CREATE
))
1998 pos_handle
= be64_to_cpu(nla_get_be64(nla
[NFTA_RULE_POSITION
]));
1999 old_rule
= __nf_tables_rule_lookup(chain
, pos_handle
);
2000 if (IS_ERR(old_rule
))
2001 return PTR_ERR(old_rule
);
2004 nft_ctx_init(&ctx
, skb
, nlh
, afi
, table
, chain
, nla
);
2008 if (nla
[NFTA_RULE_EXPRESSIONS
]) {
2009 nla_for_each_nested(tmp
, nla
[NFTA_RULE_EXPRESSIONS
], rem
) {
2011 if (nla_type(tmp
) != NFTA_LIST_ELEM
)
2013 if (n
== NFT_RULE_MAXEXPRS
)
2015 err
= nf_tables_expr_parse(&ctx
, tmp
, &info
[n
]);
2018 size
+= info
[n
].ops
->size
;
2022 /* Check for overflow of dlen field */
2024 if (size
>= 1 << 12)
2027 if (nla
[NFTA_RULE_USERDATA
]) {
2028 ulen
= nla_len(nla
[NFTA_RULE_USERDATA
]);
2030 usize
= sizeof(struct nft_userdata
) + ulen
;
2034 rule
= kzalloc(sizeof(*rule
) + size
+ usize
, GFP_KERNEL
);
2038 nft_rule_activate_next(net
, rule
);
2040 rule
->handle
= handle
;
2042 rule
->udata
= ulen
? 1 : 0;
2045 udata
= nft_userdata(rule
);
2046 udata
->len
= ulen
- 1;
2047 nla_memcpy(udata
->data
, nla
[NFTA_RULE_USERDATA
], ulen
);
2050 expr
= nft_expr_first(rule
);
2051 for (i
= 0; i
< n
; i
++) {
2052 err
= nf_tables_newexpr(&ctx
, &info
[i
], expr
);
2056 expr
= nft_expr_next(expr
);
2059 if (nlh
->nlmsg_flags
& NLM_F_REPLACE
) {
2060 if (nft_rule_is_active_next(net
, old_rule
)) {
2061 trans
= nft_trans_rule_add(&ctx
, NFT_MSG_DELRULE
,
2063 if (trans
== NULL
) {
2067 nft_rule_deactivate_next(net
, old_rule
);
2069 list_add_tail_rcu(&rule
->list
, &old_rule
->list
);
2074 } else if (nlh
->nlmsg_flags
& NLM_F_APPEND
)
2076 list_add_rcu(&rule
->list
, &old_rule
->list
);
2078 list_add_tail_rcu(&rule
->list
, &chain
->rules
);
2081 list_add_tail_rcu(&rule
->list
, &old_rule
->list
);
2083 list_add_rcu(&rule
->list
, &chain
->rules
);
2086 if (nft_trans_rule_add(&ctx
, NFT_MSG_NEWRULE
, rule
) == NULL
) {
2094 list_del_rcu(&rule
->list
);
2096 nf_tables_rule_destroy(&ctx
, rule
);
2098 for (i
= 0; i
< n
; i
++) {
2099 if (info
[i
].ops
!= NULL
)
2100 module_put(info
[i
].ops
->type
->owner
);
2105 static int nf_tables_delrule(struct sock
*nlsk
, struct sk_buff
*skb
,
2106 const struct nlmsghdr
*nlh
,
2107 const struct nlattr
* const nla
[])
2109 const struct nfgenmsg
*nfmsg
= nlmsg_data(nlh
);
2110 struct nft_af_info
*afi
;
2111 struct net
*net
= sock_net(skb
->sk
);
2112 struct nft_table
*table
;
2113 struct nft_chain
*chain
= NULL
;
2114 struct nft_rule
*rule
;
2115 int family
= nfmsg
->nfgen_family
, err
= 0;
2118 afi
= nf_tables_afinfo_lookup(net
, family
, false);
2120 return PTR_ERR(afi
);
2122 table
= nf_tables_table_lookup(afi
, nla
[NFTA_RULE_TABLE
]);
2124 return PTR_ERR(table
);
2125 if (table
->flags
& NFT_TABLE_INACTIVE
)
2128 if (nla
[NFTA_RULE_CHAIN
]) {
2129 chain
= nf_tables_chain_lookup(table
, nla
[NFTA_RULE_CHAIN
]);
2131 return PTR_ERR(chain
);
2134 nft_ctx_init(&ctx
, skb
, nlh
, afi
, table
, chain
, nla
);
2137 if (nla
[NFTA_RULE_HANDLE
]) {
2138 rule
= nf_tables_rule_lookup(chain
,
2139 nla
[NFTA_RULE_HANDLE
]);
2141 return PTR_ERR(rule
);
2143 err
= nft_delrule(&ctx
, rule
);
2145 err
= nft_delrule_by_chain(&ctx
);
2148 list_for_each_entry(chain
, &table
->chains
, list
) {
2150 err
= nft_delrule_by_chain(&ctx
);
2163 static LIST_HEAD(nf_tables_set_ops
);
2165 int nft_register_set(struct nft_set_ops
*ops
)
2167 nfnl_lock(NFNL_SUBSYS_NFTABLES
);
2168 list_add_tail_rcu(&ops
->list
, &nf_tables_set_ops
);
2169 nfnl_unlock(NFNL_SUBSYS_NFTABLES
);
2172 EXPORT_SYMBOL_GPL(nft_register_set
);
2174 void nft_unregister_set(struct nft_set_ops
*ops
)
2176 nfnl_lock(NFNL_SUBSYS_NFTABLES
);
2177 list_del_rcu(&ops
->list
);
2178 nfnl_unlock(NFNL_SUBSYS_NFTABLES
);
2180 EXPORT_SYMBOL_GPL(nft_unregister_set
);
2183 * Select a set implementation based on the data characteristics and the
2184 * given policy. The total memory use might not be known if no size is
2185 * given, in that case the amount of memory per element is used.
2187 static const struct nft_set_ops
*
2188 nft_select_set_ops(const struct nlattr
* const nla
[],
2189 const struct nft_set_desc
*desc
,
2190 enum nft_set_policies policy
)
2192 const struct nft_set_ops
*ops
, *bops
;
2193 struct nft_set_estimate est
, best
;
2196 #ifdef CONFIG_MODULES
2197 if (list_empty(&nf_tables_set_ops
)) {
2198 nfnl_unlock(NFNL_SUBSYS_NFTABLES
);
2199 request_module("nft-set");
2200 nfnl_lock(NFNL_SUBSYS_NFTABLES
);
2201 if (!list_empty(&nf_tables_set_ops
))
2202 return ERR_PTR(-EAGAIN
);
2206 if (nla
[NFTA_SET_FLAGS
] != NULL
) {
2207 features
= ntohl(nla_get_be32(nla
[NFTA_SET_FLAGS
]));
2208 features
&= NFT_SET_INTERVAL
| NFT_SET_MAP
| NFT_SET_TIMEOUT
;
2215 list_for_each_entry(ops
, &nf_tables_set_ops
, list
) {
2216 if ((ops
->features
& features
) != features
)
2218 if (!ops
->estimate(desc
, features
, &est
))
2222 case NFT_SET_POL_PERFORMANCE
:
2223 if (est
.class < best
.class)
2225 if (est
.class == best
.class && est
.size
< best
.size
)
2228 case NFT_SET_POL_MEMORY
:
2229 if (est
.size
< best
.size
)
2231 if (est
.size
== best
.size
&& est
.class < best
.class)
2238 if (!try_module_get(ops
->owner
))
2241 module_put(bops
->owner
);
2250 return ERR_PTR(-EOPNOTSUPP
);
2253 static const struct nla_policy nft_set_policy
[NFTA_SET_MAX
+ 1] = {
2254 [NFTA_SET_TABLE
] = { .type
= NLA_STRING
},
2255 [NFTA_SET_NAME
] = { .type
= NLA_STRING
,
2256 .len
= IFNAMSIZ
- 1 },
2257 [NFTA_SET_FLAGS
] = { .type
= NLA_U32
},
2258 [NFTA_SET_KEY_TYPE
] = { .type
= NLA_U32
},
2259 [NFTA_SET_KEY_LEN
] = { .type
= NLA_U32
},
2260 [NFTA_SET_DATA_TYPE
] = { .type
= NLA_U32
},
2261 [NFTA_SET_DATA_LEN
] = { .type
= NLA_U32
},
2262 [NFTA_SET_POLICY
] = { .type
= NLA_U32
},
2263 [NFTA_SET_DESC
] = { .type
= NLA_NESTED
},
2264 [NFTA_SET_ID
] = { .type
= NLA_U32
},
2265 [NFTA_SET_TIMEOUT
] = { .type
= NLA_U64
},
2266 [NFTA_SET_GC_INTERVAL
] = { .type
= NLA_U32
},
2269 static const struct nla_policy nft_set_desc_policy
[NFTA_SET_DESC_MAX
+ 1] = {
2270 [NFTA_SET_DESC_SIZE
] = { .type
= NLA_U32
},
2273 static int nft_ctx_init_from_setattr(struct nft_ctx
*ctx
,
2274 const struct sk_buff
*skb
,
2275 const struct nlmsghdr
*nlh
,
2276 const struct nlattr
* const nla
[])
2278 struct net
*net
= sock_net(skb
->sk
);
2279 const struct nfgenmsg
*nfmsg
= nlmsg_data(nlh
);
2280 struct nft_af_info
*afi
= NULL
;
2281 struct nft_table
*table
= NULL
;
2283 if (nfmsg
->nfgen_family
!= NFPROTO_UNSPEC
) {
2284 afi
= nf_tables_afinfo_lookup(net
, nfmsg
->nfgen_family
, false);
2286 return PTR_ERR(afi
);
2289 if (nla
[NFTA_SET_TABLE
] != NULL
) {
2291 return -EAFNOSUPPORT
;
2293 table
= nf_tables_table_lookup(afi
, nla
[NFTA_SET_TABLE
]);
2295 return PTR_ERR(table
);
2296 if (table
->flags
& NFT_TABLE_INACTIVE
)
2300 nft_ctx_init(ctx
, skb
, nlh
, afi
, table
, NULL
, nla
);
2304 struct nft_set
*nf_tables_set_lookup(const struct nft_table
*table
,
2305 const struct nlattr
*nla
)
2307 struct nft_set
*set
;
2310 return ERR_PTR(-EINVAL
);
2312 list_for_each_entry(set
, &table
->sets
, list
) {
2313 if (!nla_strcmp(nla
, set
->name
))
2316 return ERR_PTR(-ENOENT
);
2319 struct nft_set
*nf_tables_set_lookup_byid(const struct net
*net
,
2320 const struct nlattr
*nla
)
2322 struct nft_trans
*trans
;
2323 u32 id
= ntohl(nla_get_be32(nla
));
2325 list_for_each_entry(trans
, &net
->nft
.commit_list
, list
) {
2326 if (trans
->msg_type
== NFT_MSG_NEWSET
&&
2327 id
== nft_trans_set_id(trans
))
2328 return nft_trans_set(trans
);
2330 return ERR_PTR(-ENOENT
);
2333 static int nf_tables_set_alloc_name(struct nft_ctx
*ctx
, struct nft_set
*set
,
2336 const struct nft_set
*i
;
2338 unsigned long *inuse
;
2339 unsigned int n
= 0, min
= 0;
2341 p
= strnchr(name
, IFNAMSIZ
, '%');
2343 if (p
[1] != 'd' || strchr(p
+ 2, '%'))
2346 inuse
= (unsigned long *)get_zeroed_page(GFP_KERNEL
);
2350 list_for_each_entry(i
, &ctx
->table
->sets
, list
) {
2353 if (!sscanf(i
->name
, name
, &tmp
))
2355 if (tmp
< min
|| tmp
>= min
+ BITS_PER_BYTE
* PAGE_SIZE
)
2358 set_bit(tmp
- min
, inuse
);
2361 n
= find_first_zero_bit(inuse
, BITS_PER_BYTE
* PAGE_SIZE
);
2362 if (n
>= BITS_PER_BYTE
* PAGE_SIZE
) {
2363 min
+= BITS_PER_BYTE
* PAGE_SIZE
;
2364 memset(inuse
, 0, PAGE_SIZE
);
2367 free_page((unsigned long)inuse
);
2370 snprintf(set
->name
, sizeof(set
->name
), name
, min
+ n
);
2371 list_for_each_entry(i
, &ctx
->table
->sets
, list
) {
2372 if (!strcmp(set
->name
, i
->name
))
2378 static int nf_tables_fill_set(struct sk_buff
*skb
, const struct nft_ctx
*ctx
,
2379 const struct nft_set
*set
, u16 event
, u16 flags
)
2381 struct nfgenmsg
*nfmsg
;
2382 struct nlmsghdr
*nlh
;
2383 struct nlattr
*desc
;
2384 u32 portid
= ctx
->portid
;
2387 event
|= NFNL_SUBSYS_NFTABLES
<< 8;
2388 nlh
= nlmsg_put(skb
, portid
, seq
, event
, sizeof(struct nfgenmsg
),
2391 goto nla_put_failure
;
2393 nfmsg
= nlmsg_data(nlh
);
2394 nfmsg
->nfgen_family
= ctx
->afi
->family
;
2395 nfmsg
->version
= NFNETLINK_V0
;
2396 nfmsg
->res_id
= htons(ctx
->net
->nft
.base_seq
& 0xffff);
2398 if (nla_put_string(skb
, NFTA_SET_TABLE
, ctx
->table
->name
))
2399 goto nla_put_failure
;
2400 if (nla_put_string(skb
, NFTA_SET_NAME
, set
->name
))
2401 goto nla_put_failure
;
2402 if (set
->flags
!= 0)
2403 if (nla_put_be32(skb
, NFTA_SET_FLAGS
, htonl(set
->flags
)))
2404 goto nla_put_failure
;
2406 if (nla_put_be32(skb
, NFTA_SET_KEY_TYPE
, htonl(set
->ktype
)))
2407 goto nla_put_failure
;
2408 if (nla_put_be32(skb
, NFTA_SET_KEY_LEN
, htonl(set
->klen
)))
2409 goto nla_put_failure
;
2410 if (set
->flags
& NFT_SET_MAP
) {
2411 if (nla_put_be32(skb
, NFTA_SET_DATA_TYPE
, htonl(set
->dtype
)))
2412 goto nla_put_failure
;
2413 if (nla_put_be32(skb
, NFTA_SET_DATA_LEN
, htonl(set
->dlen
)))
2414 goto nla_put_failure
;
2418 nla_put_be64(skb
, NFTA_SET_TIMEOUT
, cpu_to_be64(set
->timeout
)))
2419 goto nla_put_failure
;
2421 nla_put_be32(skb
, NFTA_SET_GC_INTERVAL
, htonl(set
->gc_int
)))
2422 goto nla_put_failure
;
2424 if (set
->policy
!= NFT_SET_POL_PERFORMANCE
) {
2425 if (nla_put_be32(skb
, NFTA_SET_POLICY
, htonl(set
->policy
)))
2426 goto nla_put_failure
;
2429 desc
= nla_nest_start(skb
, NFTA_SET_DESC
);
2431 goto nla_put_failure
;
2433 nla_put_be32(skb
, NFTA_SET_DESC_SIZE
, htonl(set
->size
)))
2434 goto nla_put_failure
;
2435 nla_nest_end(skb
, desc
);
2437 nlmsg_end(skb
, nlh
);
2441 nlmsg_trim(skb
, nlh
);
2445 static int nf_tables_set_notify(const struct nft_ctx
*ctx
,
2446 const struct nft_set
*set
,
2447 int event
, gfp_t gfp_flags
)
2449 struct sk_buff
*skb
;
2450 u32 portid
= ctx
->portid
;
2454 !nfnetlink_has_listeners(ctx
->net
, NFNLGRP_NFTABLES
))
2458 skb
= nlmsg_new(NLMSG_GOODSIZE
, gfp_flags
);
2462 err
= nf_tables_fill_set(skb
, ctx
, set
, event
, 0);
2468 err
= nfnetlink_send(skb
, ctx
->net
, portid
, NFNLGRP_NFTABLES
,
2469 ctx
->report
, gfp_flags
);
2472 nfnetlink_set_err(ctx
->net
, portid
, NFNLGRP_NFTABLES
, err
);
2476 static int nf_tables_dump_sets(struct sk_buff
*skb
, struct netlink_callback
*cb
)
2478 const struct nft_set
*set
;
2479 unsigned int idx
, s_idx
= cb
->args
[0];
2480 struct nft_af_info
*afi
;
2481 struct nft_table
*table
, *cur_table
= (struct nft_table
*)cb
->args
[2];
2482 struct net
*net
= sock_net(skb
->sk
);
2483 int cur_family
= cb
->args
[3];
2484 struct nft_ctx
*ctx
= cb
->data
, ctx_set
;
2490 cb
->seq
= net
->nft
.base_seq
;
2492 list_for_each_entry_rcu(afi
, &net
->nft
.af_info
, list
) {
2493 if (ctx
->afi
&& ctx
->afi
!= afi
)
2497 if (afi
->family
!= cur_family
)
2502 list_for_each_entry_rcu(table
, &afi
->tables
, list
) {
2503 if (ctx
->table
&& ctx
->table
!= table
)
2507 if (cur_table
!= table
)
2513 list_for_each_entry_rcu(set
, &table
->sets
, list
) {
2518 ctx_set
.table
= table
;
2520 if (nf_tables_fill_set(skb
, &ctx_set
, set
,
2524 cb
->args
[2] = (unsigned long) table
;
2525 cb
->args
[3] = afi
->family
;
2528 nl_dump_check_consistent(cb
, nlmsg_hdr(skb
));
2542 static int nf_tables_dump_sets_done(struct netlink_callback
*cb
)
2548 static int nf_tables_getset(struct sock
*nlsk
, struct sk_buff
*skb
,
2549 const struct nlmsghdr
*nlh
,
2550 const struct nlattr
* const nla
[])
2552 const struct nft_set
*set
;
2554 struct sk_buff
*skb2
;
2555 const struct nfgenmsg
*nfmsg
= nlmsg_data(nlh
);
2558 /* Verify existence before starting dump */
2559 err
= nft_ctx_init_from_setattr(&ctx
, skb
, nlh
, nla
);
2563 if (nlh
->nlmsg_flags
& NLM_F_DUMP
) {
2564 struct netlink_dump_control c
= {
2565 .dump
= nf_tables_dump_sets
,
2566 .done
= nf_tables_dump_sets_done
,
2568 struct nft_ctx
*ctx_dump
;
2570 ctx_dump
= kmalloc(sizeof(*ctx_dump
), GFP_KERNEL
);
2571 if (ctx_dump
== NULL
)
2577 return netlink_dump_start(nlsk
, skb
, nlh
, &c
);
2580 /* Only accept unspec with dump */
2581 if (nfmsg
->nfgen_family
== NFPROTO_UNSPEC
)
2582 return -EAFNOSUPPORT
;
2584 set
= nf_tables_set_lookup(ctx
.table
, nla
[NFTA_SET_NAME
]);
2586 return PTR_ERR(set
);
2587 if (set
->flags
& NFT_SET_INACTIVE
)
2590 skb2
= alloc_skb(NLMSG_GOODSIZE
, GFP_KERNEL
);
2594 err
= nf_tables_fill_set(skb2
, &ctx
, set
, NFT_MSG_NEWSET
, 0);
2598 return nlmsg_unicast(nlsk
, skb2
, NETLINK_CB(skb
).portid
);
2605 static int nf_tables_set_desc_parse(const struct nft_ctx
*ctx
,
2606 struct nft_set_desc
*desc
,
2607 const struct nlattr
*nla
)
2609 struct nlattr
*da
[NFTA_SET_DESC_MAX
+ 1];
2612 err
= nla_parse_nested(da
, NFTA_SET_DESC_MAX
, nla
, nft_set_desc_policy
);
2616 if (da
[NFTA_SET_DESC_SIZE
] != NULL
)
2617 desc
->size
= ntohl(nla_get_be32(da
[NFTA_SET_DESC_SIZE
]));
2622 static int nf_tables_newset(struct sock
*nlsk
, struct sk_buff
*skb
,
2623 const struct nlmsghdr
*nlh
,
2624 const struct nlattr
* const nla
[])
2626 const struct nfgenmsg
*nfmsg
= nlmsg_data(nlh
);
2627 const struct nft_set_ops
*ops
;
2628 struct nft_af_info
*afi
;
2629 struct net
*net
= sock_net(skb
->sk
);
2630 struct nft_table
*table
;
2631 struct nft_set
*set
;
2633 char name
[IFNAMSIZ
];
2637 u32 ktype
, dtype
, flags
, policy
, gc_int
;
2638 struct nft_set_desc desc
;
2641 if (nla
[NFTA_SET_TABLE
] == NULL
||
2642 nla
[NFTA_SET_NAME
] == NULL
||
2643 nla
[NFTA_SET_KEY_LEN
] == NULL
||
2644 nla
[NFTA_SET_ID
] == NULL
)
2647 memset(&desc
, 0, sizeof(desc
));
2649 ktype
= NFT_DATA_VALUE
;
2650 if (nla
[NFTA_SET_KEY_TYPE
] != NULL
) {
2651 ktype
= ntohl(nla_get_be32(nla
[NFTA_SET_KEY_TYPE
]));
2652 if ((ktype
& NFT_DATA_RESERVED_MASK
) == NFT_DATA_RESERVED_MASK
)
2656 desc
.klen
= ntohl(nla_get_be32(nla
[NFTA_SET_KEY_LEN
]));
2657 if (desc
.klen
== 0 || desc
.klen
> NFT_DATA_VALUE_MAXLEN
)
2661 if (nla
[NFTA_SET_FLAGS
] != NULL
) {
2662 flags
= ntohl(nla_get_be32(nla
[NFTA_SET_FLAGS
]));
2663 if (flags
& ~(NFT_SET_ANONYMOUS
| NFT_SET_CONSTANT
|
2664 NFT_SET_INTERVAL
| NFT_SET_TIMEOUT
|
2665 NFT_SET_MAP
| NFT_SET_EVAL
))
2667 /* Only one of both operations is supported */
2668 if ((flags
& (NFT_SET_MAP
| NFT_SET_EVAL
)) ==
2669 (NFT_SET_MAP
| NFT_SET_EVAL
))
2674 if (nla
[NFTA_SET_DATA_TYPE
] != NULL
) {
2675 if (!(flags
& NFT_SET_MAP
))
2678 dtype
= ntohl(nla_get_be32(nla
[NFTA_SET_DATA_TYPE
]));
2679 if ((dtype
& NFT_DATA_RESERVED_MASK
) == NFT_DATA_RESERVED_MASK
&&
2680 dtype
!= NFT_DATA_VERDICT
)
2683 if (dtype
!= NFT_DATA_VERDICT
) {
2684 if (nla
[NFTA_SET_DATA_LEN
] == NULL
)
2686 desc
.dlen
= ntohl(nla_get_be32(nla
[NFTA_SET_DATA_LEN
]));
2687 if (desc
.dlen
== 0 || desc
.dlen
> NFT_DATA_VALUE_MAXLEN
)
2690 desc
.dlen
= sizeof(struct nft_verdict
);
2691 } else if (flags
& NFT_SET_MAP
)
2695 if (nla
[NFTA_SET_TIMEOUT
] != NULL
) {
2696 if (!(flags
& NFT_SET_TIMEOUT
))
2698 timeout
= be64_to_cpu(nla_get_be64(nla
[NFTA_SET_TIMEOUT
]));
2701 if (nla
[NFTA_SET_GC_INTERVAL
] != NULL
) {
2702 if (!(flags
& NFT_SET_TIMEOUT
))
2704 gc_int
= ntohl(nla_get_be32(nla
[NFTA_SET_GC_INTERVAL
]));
2707 policy
= NFT_SET_POL_PERFORMANCE
;
2708 if (nla
[NFTA_SET_POLICY
] != NULL
)
2709 policy
= ntohl(nla_get_be32(nla
[NFTA_SET_POLICY
]));
2711 if (nla
[NFTA_SET_DESC
] != NULL
) {
2712 err
= nf_tables_set_desc_parse(&ctx
, &desc
, nla
[NFTA_SET_DESC
]);
2717 create
= nlh
->nlmsg_flags
& NLM_F_CREATE
? true : false;
2719 afi
= nf_tables_afinfo_lookup(net
, nfmsg
->nfgen_family
, create
);
2721 return PTR_ERR(afi
);
2723 table
= nf_tables_table_lookup(afi
, nla
[NFTA_SET_TABLE
]);
2725 return PTR_ERR(table
);
2727 nft_ctx_init(&ctx
, skb
, nlh
, afi
, table
, NULL
, nla
);
2729 set
= nf_tables_set_lookup(table
, nla
[NFTA_SET_NAME
]);
2731 if (PTR_ERR(set
) != -ENOENT
)
2732 return PTR_ERR(set
);
2737 if (nlh
->nlmsg_flags
& NLM_F_EXCL
)
2739 if (nlh
->nlmsg_flags
& NLM_F_REPLACE
)
2744 if (!(nlh
->nlmsg_flags
& NLM_F_CREATE
))
2747 ops
= nft_select_set_ops(nla
, &desc
, policy
);
2749 return PTR_ERR(ops
);
2752 if (ops
->privsize
!= NULL
)
2753 size
= ops
->privsize(nla
);
2756 set
= kzalloc(sizeof(*set
) + size
, GFP_KERNEL
);
2760 nla_strlcpy(name
, nla
[NFTA_SET_NAME
], sizeof(set
->name
));
2761 err
= nf_tables_set_alloc_name(&ctx
, set
, name
);
2765 INIT_LIST_HEAD(&set
->bindings
);
2766 write_pnet(&set
->pnet
, net
);
2769 set
->klen
= desc
.klen
;
2771 set
->dlen
= desc
.dlen
;
2773 set
->size
= desc
.size
;
2774 set
->policy
= policy
;
2775 set
->timeout
= timeout
;
2776 set
->gc_int
= gc_int
;
2778 err
= ops
->init(set
, &desc
, nla
);
2782 err
= nft_trans_set_add(&ctx
, NFT_MSG_NEWSET
, set
);
2786 list_add_tail_rcu(&set
->list
, &table
->sets
);
2793 module_put(ops
->owner
);
2797 static void nft_set_destroy(struct nft_set
*set
)
2799 set
->ops
->destroy(set
);
2800 module_put(set
->ops
->owner
);
2804 static void nf_tables_set_destroy(const struct nft_ctx
*ctx
, struct nft_set
*set
)
2806 list_del_rcu(&set
->list
);
2807 nf_tables_set_notify(ctx
, set
, NFT_MSG_DELSET
, GFP_ATOMIC
);
2808 nft_set_destroy(set
);
2811 static int nf_tables_delset(struct sock
*nlsk
, struct sk_buff
*skb
,
2812 const struct nlmsghdr
*nlh
,
2813 const struct nlattr
* const nla
[])
2815 const struct nfgenmsg
*nfmsg
= nlmsg_data(nlh
);
2816 struct nft_set
*set
;
2820 if (nfmsg
->nfgen_family
== NFPROTO_UNSPEC
)
2821 return -EAFNOSUPPORT
;
2822 if (nla
[NFTA_SET_TABLE
] == NULL
)
2825 err
= nft_ctx_init_from_setattr(&ctx
, skb
, nlh
, nla
);
2829 set
= nf_tables_set_lookup(ctx
.table
, nla
[NFTA_SET_NAME
]);
2831 return PTR_ERR(set
);
2832 if (set
->flags
& NFT_SET_INACTIVE
)
2834 if (!list_empty(&set
->bindings
))
2837 return nft_delset(&ctx
, set
);
2840 static int nf_tables_bind_check_setelem(const struct nft_ctx
*ctx
,
2841 const struct nft_set
*set
,
2842 const struct nft_set_iter
*iter
,
2843 const struct nft_set_elem
*elem
)
2845 const struct nft_set_ext
*ext
= nft_set_elem_ext(set
, elem
->priv
);
2846 enum nft_registers dreg
;
2848 dreg
= nft_type_to_reg(set
->dtype
);
2849 return nft_validate_register_store(ctx
, dreg
, nft_set_ext_data(ext
),
2850 set
->dtype
== NFT_DATA_VERDICT
?
2851 NFT_DATA_VERDICT
: NFT_DATA_VALUE
,
2855 int nf_tables_bind_set(const struct nft_ctx
*ctx
, struct nft_set
*set
,
2856 struct nft_set_binding
*binding
)
2858 struct nft_set_binding
*i
;
2859 struct nft_set_iter iter
;
2861 if (!list_empty(&set
->bindings
) && set
->flags
& NFT_SET_ANONYMOUS
)
2864 if (binding
->flags
& NFT_SET_MAP
) {
2865 /* If the set is already bound to the same chain all
2866 * jumps are already validated for that chain.
2868 list_for_each_entry(i
, &set
->bindings
, list
) {
2869 if (binding
->flags
& NFT_SET_MAP
&&
2870 i
->chain
== binding
->chain
)
2877 iter
.fn
= nf_tables_bind_check_setelem
;
2879 set
->ops
->walk(ctx
, set
, &iter
);
2881 /* Destroy anonymous sets if binding fails */
2882 if (set
->flags
& NFT_SET_ANONYMOUS
)
2883 nf_tables_set_destroy(ctx
, set
);
2889 binding
->chain
= ctx
->chain
;
2890 list_add_tail_rcu(&binding
->list
, &set
->bindings
);
2894 void nf_tables_unbind_set(const struct nft_ctx
*ctx
, struct nft_set
*set
,
2895 struct nft_set_binding
*binding
)
2897 list_del_rcu(&binding
->list
);
2899 if (list_empty(&set
->bindings
) && set
->flags
& NFT_SET_ANONYMOUS
&&
2900 !(set
->flags
& NFT_SET_INACTIVE
))
2901 nf_tables_set_destroy(ctx
, set
);
2904 const struct nft_set_ext_type nft_set_ext_types
[] = {
2905 [NFT_SET_EXT_KEY
] = {
2906 .align
= __alignof__(u32
),
2908 [NFT_SET_EXT_DATA
] = {
2909 .align
= __alignof__(u32
),
2911 [NFT_SET_EXT_EXPR
] = {
2912 .align
= __alignof__(struct nft_expr
),
2914 [NFT_SET_EXT_FLAGS
] = {
2916 .align
= __alignof__(u8
),
2918 [NFT_SET_EXT_TIMEOUT
] = {
2920 .align
= __alignof__(u64
),
2922 [NFT_SET_EXT_EXPIRATION
] = {
2923 .len
= sizeof(unsigned long),
2924 .align
= __alignof__(unsigned long),
2926 [NFT_SET_EXT_USERDATA
] = {
2927 .len
= sizeof(struct nft_userdata
),
2928 .align
= __alignof__(struct nft_userdata
),
2931 EXPORT_SYMBOL_GPL(nft_set_ext_types
);
2937 static const struct nla_policy nft_set_elem_policy
[NFTA_SET_ELEM_MAX
+ 1] = {
2938 [NFTA_SET_ELEM_KEY
] = { .type
= NLA_NESTED
},
2939 [NFTA_SET_ELEM_DATA
] = { .type
= NLA_NESTED
},
2940 [NFTA_SET_ELEM_FLAGS
] = { .type
= NLA_U32
},
2941 [NFTA_SET_ELEM_TIMEOUT
] = { .type
= NLA_U64
},
2942 [NFTA_SET_ELEM_USERDATA
] = { .type
= NLA_BINARY
,
2943 .len
= NFT_USERDATA_MAXLEN
},
2946 static const struct nla_policy nft_set_elem_list_policy
[NFTA_SET_ELEM_LIST_MAX
+ 1] = {
2947 [NFTA_SET_ELEM_LIST_TABLE
] = { .type
= NLA_STRING
},
2948 [NFTA_SET_ELEM_LIST_SET
] = { .type
= NLA_STRING
},
2949 [NFTA_SET_ELEM_LIST_ELEMENTS
] = { .type
= NLA_NESTED
},
2950 [NFTA_SET_ELEM_LIST_SET_ID
] = { .type
= NLA_U32
},
2953 static int nft_ctx_init_from_elemattr(struct nft_ctx
*ctx
,
2954 const struct sk_buff
*skb
,
2955 const struct nlmsghdr
*nlh
,
2956 const struct nlattr
* const nla
[],
2959 const struct nfgenmsg
*nfmsg
= nlmsg_data(nlh
);
2960 struct nft_af_info
*afi
;
2961 struct nft_table
*table
;
2962 struct net
*net
= sock_net(skb
->sk
);
2964 afi
= nf_tables_afinfo_lookup(net
, nfmsg
->nfgen_family
, false);
2966 return PTR_ERR(afi
);
2968 table
= nf_tables_table_lookup(afi
, nla
[NFTA_SET_ELEM_LIST_TABLE
]);
2970 return PTR_ERR(table
);
2971 if (!trans
&& (table
->flags
& NFT_TABLE_INACTIVE
))
2974 nft_ctx_init(ctx
, skb
, nlh
, afi
, table
, NULL
, nla
);
2978 static int nf_tables_fill_setelem(struct sk_buff
*skb
,
2979 const struct nft_set
*set
,
2980 const struct nft_set_elem
*elem
)
2982 const struct nft_set_ext
*ext
= nft_set_elem_ext(set
, elem
->priv
);
2983 unsigned char *b
= skb_tail_pointer(skb
);
2984 struct nlattr
*nest
;
2986 nest
= nla_nest_start(skb
, NFTA_LIST_ELEM
);
2988 goto nla_put_failure
;
2990 if (nft_data_dump(skb
, NFTA_SET_ELEM_KEY
, nft_set_ext_key(ext
),
2991 NFT_DATA_VALUE
, set
->klen
) < 0)
2992 goto nla_put_failure
;
2994 if (nft_set_ext_exists(ext
, NFT_SET_EXT_DATA
) &&
2995 nft_data_dump(skb
, NFTA_SET_ELEM_DATA
, nft_set_ext_data(ext
),
2996 set
->dtype
== NFT_DATA_VERDICT
? NFT_DATA_VERDICT
: NFT_DATA_VALUE
,
2998 goto nla_put_failure
;
3000 if (nft_set_ext_exists(ext
, NFT_SET_EXT_EXPR
) &&
3001 nft_expr_dump(skb
, NFTA_SET_ELEM_EXPR
, nft_set_ext_expr(ext
)) < 0)
3002 goto nla_put_failure
;
3004 if (nft_set_ext_exists(ext
, NFT_SET_EXT_FLAGS
) &&
3005 nla_put_be32(skb
, NFTA_SET_ELEM_FLAGS
,
3006 htonl(*nft_set_ext_flags(ext
))))
3007 goto nla_put_failure
;
3009 if (nft_set_ext_exists(ext
, NFT_SET_EXT_TIMEOUT
) &&
3010 nla_put_be64(skb
, NFTA_SET_ELEM_TIMEOUT
,
3011 cpu_to_be64(*nft_set_ext_timeout(ext
))))
3012 goto nla_put_failure
;
3014 if (nft_set_ext_exists(ext
, NFT_SET_EXT_EXPIRATION
)) {
3015 unsigned long expires
, now
= jiffies
;
3017 expires
= *nft_set_ext_expiration(ext
);
3018 if (time_before(now
, expires
))
3023 if (nla_put_be64(skb
, NFTA_SET_ELEM_EXPIRATION
,
3024 cpu_to_be64(jiffies_to_msecs(expires
))))
3025 goto nla_put_failure
;
3028 if (nft_set_ext_exists(ext
, NFT_SET_EXT_USERDATA
)) {
3029 struct nft_userdata
*udata
;
3031 udata
= nft_set_ext_userdata(ext
);
3032 if (nla_put(skb
, NFTA_SET_ELEM_USERDATA
,
3033 udata
->len
+ 1, udata
->data
))
3034 goto nla_put_failure
;
3037 nla_nest_end(skb
, nest
);
3045 struct nft_set_dump_args
{
3046 const struct netlink_callback
*cb
;
3047 struct nft_set_iter iter
;
3048 struct sk_buff
*skb
;
3051 static int nf_tables_dump_setelem(const struct nft_ctx
*ctx
,
3052 const struct nft_set
*set
,
3053 const struct nft_set_iter
*iter
,
3054 const struct nft_set_elem
*elem
)
3056 struct nft_set_dump_args
*args
;
3058 args
= container_of(iter
, struct nft_set_dump_args
, iter
);
3059 return nf_tables_fill_setelem(args
->skb
, set
, elem
);
3062 static int nf_tables_dump_set(struct sk_buff
*skb
, struct netlink_callback
*cb
)
3064 const struct nft_set
*set
;
3065 struct nft_set_dump_args args
;
3067 struct nlattr
*nla
[NFTA_SET_ELEM_LIST_MAX
+ 1];
3068 struct nfgenmsg
*nfmsg
;
3069 struct nlmsghdr
*nlh
;
3070 struct nlattr
*nest
;
3074 err
= nlmsg_parse(cb
->nlh
, sizeof(struct nfgenmsg
), nla
,
3075 NFTA_SET_ELEM_LIST_MAX
, nft_set_elem_list_policy
);
3079 err
= nft_ctx_init_from_elemattr(&ctx
, cb
->skb
, cb
->nlh
, (void *)nla
,
3084 set
= nf_tables_set_lookup(ctx
.table
, nla
[NFTA_SET_ELEM_LIST_SET
]);
3086 return PTR_ERR(set
);
3087 if (set
->flags
& NFT_SET_INACTIVE
)
3090 event
= NFT_MSG_NEWSETELEM
;
3091 event
|= NFNL_SUBSYS_NFTABLES
<< 8;
3092 portid
= NETLINK_CB(cb
->skb
).portid
;
3093 seq
= cb
->nlh
->nlmsg_seq
;
3095 nlh
= nlmsg_put(skb
, portid
, seq
, event
, sizeof(struct nfgenmsg
),
3098 goto nla_put_failure
;
3100 nfmsg
= nlmsg_data(nlh
);
3101 nfmsg
->nfgen_family
= ctx
.afi
->family
;
3102 nfmsg
->version
= NFNETLINK_V0
;
3103 nfmsg
->res_id
= htons(ctx
.net
->nft
.base_seq
& 0xffff);
3105 if (nla_put_string(skb
, NFTA_SET_ELEM_LIST_TABLE
, ctx
.table
->name
))
3106 goto nla_put_failure
;
3107 if (nla_put_string(skb
, NFTA_SET_ELEM_LIST_SET
, set
->name
))
3108 goto nla_put_failure
;
3110 nest
= nla_nest_start(skb
, NFTA_SET_ELEM_LIST_ELEMENTS
);
3112 goto nla_put_failure
;
3116 args
.iter
.skip
= cb
->args
[0];
3117 args
.iter
.count
= 0;
3119 args
.iter
.fn
= nf_tables_dump_setelem
;
3120 set
->ops
->walk(&ctx
, set
, &args
.iter
);
3122 nla_nest_end(skb
, nest
);
3123 nlmsg_end(skb
, nlh
);
3125 if (args
.iter
.err
&& args
.iter
.err
!= -EMSGSIZE
)
3126 return args
.iter
.err
;
3127 if (args
.iter
.count
== cb
->args
[0])
3130 cb
->args
[0] = args
.iter
.count
;
3137 static int nf_tables_getsetelem(struct sock
*nlsk
, struct sk_buff
*skb
,
3138 const struct nlmsghdr
*nlh
,
3139 const struct nlattr
* const nla
[])
3141 const struct nft_set
*set
;
3145 err
= nft_ctx_init_from_elemattr(&ctx
, skb
, nlh
, nla
, false);
3149 set
= nf_tables_set_lookup(ctx
.table
, nla
[NFTA_SET_ELEM_LIST_SET
]);
3151 return PTR_ERR(set
);
3152 if (set
->flags
& NFT_SET_INACTIVE
)
3155 if (nlh
->nlmsg_flags
& NLM_F_DUMP
) {
3156 struct netlink_dump_control c
= {
3157 .dump
= nf_tables_dump_set
,
3159 return netlink_dump_start(nlsk
, skb
, nlh
, &c
);
3164 static int nf_tables_fill_setelem_info(struct sk_buff
*skb
,
3165 const struct nft_ctx
*ctx
, u32 seq
,
3166 u32 portid
, int event
, u16 flags
,
3167 const struct nft_set
*set
,
3168 const struct nft_set_elem
*elem
)
3170 struct nfgenmsg
*nfmsg
;
3171 struct nlmsghdr
*nlh
;
3172 struct nlattr
*nest
;
3175 event
|= NFNL_SUBSYS_NFTABLES
<< 8;
3176 nlh
= nlmsg_put(skb
, portid
, seq
, event
, sizeof(struct nfgenmsg
),
3179 goto nla_put_failure
;
3181 nfmsg
= nlmsg_data(nlh
);
3182 nfmsg
->nfgen_family
= ctx
->afi
->family
;
3183 nfmsg
->version
= NFNETLINK_V0
;
3184 nfmsg
->res_id
= htons(ctx
->net
->nft
.base_seq
& 0xffff);
3186 if (nla_put_string(skb
, NFTA_SET_TABLE
, ctx
->table
->name
))
3187 goto nla_put_failure
;
3188 if (nla_put_string(skb
, NFTA_SET_NAME
, set
->name
))
3189 goto nla_put_failure
;
3191 nest
= nla_nest_start(skb
, NFTA_SET_ELEM_LIST_ELEMENTS
);
3193 goto nla_put_failure
;
3195 err
= nf_tables_fill_setelem(skb
, set
, elem
);
3197 goto nla_put_failure
;
3199 nla_nest_end(skb
, nest
);
3201 nlmsg_end(skb
, nlh
);
3205 nlmsg_trim(skb
, nlh
);
3209 static int nf_tables_setelem_notify(const struct nft_ctx
*ctx
,
3210 const struct nft_set
*set
,
3211 const struct nft_set_elem
*elem
,
3212 int event
, u16 flags
)
3214 struct net
*net
= ctx
->net
;
3215 u32 portid
= ctx
->portid
;
3216 struct sk_buff
*skb
;
3219 if (!ctx
->report
&& !nfnetlink_has_listeners(net
, NFNLGRP_NFTABLES
))
3223 skb
= nlmsg_new(NLMSG_GOODSIZE
, GFP_KERNEL
);
3227 err
= nf_tables_fill_setelem_info(skb
, ctx
, 0, portid
, event
, flags
,
3234 err
= nfnetlink_send(skb
, net
, portid
, NFNLGRP_NFTABLES
, ctx
->report
,
3238 nfnetlink_set_err(net
, portid
, NFNLGRP_NFTABLES
, err
);
3242 static struct nft_trans
*nft_trans_elem_alloc(struct nft_ctx
*ctx
,
3244 struct nft_set
*set
)
3246 struct nft_trans
*trans
;
3248 trans
= nft_trans_alloc(ctx
, msg_type
, sizeof(struct nft_trans_elem
));
3252 nft_trans_elem_set(trans
) = set
;
3256 void *nft_set_elem_init(const struct nft_set
*set
,
3257 const struct nft_set_ext_tmpl
*tmpl
,
3258 const u32
*key
, const u32
*data
,
3259 u64 timeout
, gfp_t gfp
)
3261 struct nft_set_ext
*ext
;
3264 elem
= kzalloc(set
->ops
->elemsize
+ tmpl
->len
, gfp
);
3268 ext
= nft_set_elem_ext(set
, elem
);
3269 nft_set_ext_init(ext
, tmpl
);
3271 memcpy(nft_set_ext_key(ext
), key
, set
->klen
);
3272 if (nft_set_ext_exists(ext
, NFT_SET_EXT_DATA
))
3273 memcpy(nft_set_ext_data(ext
), data
, set
->dlen
);
3274 if (nft_set_ext_exists(ext
, NFT_SET_EXT_EXPIRATION
))
3275 *nft_set_ext_expiration(ext
) =
3276 jiffies
+ msecs_to_jiffies(timeout
);
3277 if (nft_set_ext_exists(ext
, NFT_SET_EXT_TIMEOUT
))
3278 *nft_set_ext_timeout(ext
) = timeout
;
3283 void nft_set_elem_destroy(const struct nft_set
*set
, void *elem
)
3285 struct nft_set_ext
*ext
= nft_set_elem_ext(set
, elem
);
3287 nft_data_uninit(nft_set_ext_key(ext
), NFT_DATA_VALUE
);
3288 if (nft_set_ext_exists(ext
, NFT_SET_EXT_DATA
))
3289 nft_data_uninit(nft_set_ext_data(ext
), set
->dtype
);
3290 if (nft_set_ext_exists(ext
, NFT_SET_EXT_EXPR
))
3291 nf_tables_expr_destroy(NULL
, nft_set_ext_expr(ext
));
3295 EXPORT_SYMBOL_GPL(nft_set_elem_destroy
);
3297 static int nft_add_set_elem(struct nft_ctx
*ctx
, struct nft_set
*set
,
3298 const struct nlattr
*attr
)
3300 struct nlattr
*nla
[NFTA_SET_ELEM_MAX
+ 1];
3301 struct nft_data_desc d1
, d2
;
3302 struct nft_set_ext_tmpl tmpl
;
3303 struct nft_set_ext
*ext
;
3304 struct nft_set_elem elem
;
3305 struct nft_set_binding
*binding
;
3306 struct nft_userdata
*udata
;
3307 struct nft_data data
;
3308 enum nft_registers dreg
;
3309 struct nft_trans
*trans
;
3315 err
= nla_parse_nested(nla
, NFTA_SET_ELEM_MAX
, attr
,
3316 nft_set_elem_policy
);
3320 if (nla
[NFTA_SET_ELEM_KEY
] == NULL
)
3323 nft_set_ext_prepare(&tmpl
);
3326 if (nla
[NFTA_SET_ELEM_FLAGS
] != NULL
) {
3327 flags
= ntohl(nla_get_be32(nla
[NFTA_SET_ELEM_FLAGS
]));
3328 if (flags
& ~NFT_SET_ELEM_INTERVAL_END
)
3330 if (!(set
->flags
& NFT_SET_INTERVAL
) &&
3331 flags
& NFT_SET_ELEM_INTERVAL_END
)
3334 nft_set_ext_add(&tmpl
, NFT_SET_EXT_FLAGS
);
3337 if (set
->flags
& NFT_SET_MAP
) {
3338 if (nla
[NFTA_SET_ELEM_DATA
] == NULL
&&
3339 !(flags
& NFT_SET_ELEM_INTERVAL_END
))
3341 if (nla
[NFTA_SET_ELEM_DATA
] != NULL
&&
3342 flags
& NFT_SET_ELEM_INTERVAL_END
)
3345 if (nla
[NFTA_SET_ELEM_DATA
] != NULL
)
3350 if (nla
[NFTA_SET_ELEM_TIMEOUT
] != NULL
) {
3351 if (!(set
->flags
& NFT_SET_TIMEOUT
))
3353 timeout
= be64_to_cpu(nla_get_be64(nla
[NFTA_SET_ELEM_TIMEOUT
]));
3354 } else if (set
->flags
& NFT_SET_TIMEOUT
) {
3355 timeout
= set
->timeout
;
3358 err
= nft_data_init(ctx
, &elem
.key
.val
, sizeof(elem
.key
), &d1
,
3359 nla
[NFTA_SET_ELEM_KEY
]);
3363 if (d1
.type
!= NFT_DATA_VALUE
|| d1
.len
!= set
->klen
)
3366 nft_set_ext_add_length(&tmpl
, NFT_SET_EXT_KEY
, d1
.len
);
3368 nft_set_ext_add(&tmpl
, NFT_SET_EXT_EXPIRATION
);
3369 if (timeout
!= set
->timeout
)
3370 nft_set_ext_add(&tmpl
, NFT_SET_EXT_TIMEOUT
);
3373 if (nla
[NFTA_SET_ELEM_DATA
] != NULL
) {
3374 err
= nft_data_init(ctx
, &data
, sizeof(data
), &d2
,
3375 nla
[NFTA_SET_ELEM_DATA
]);
3380 if (set
->dtype
!= NFT_DATA_VERDICT
&& d2
.len
!= set
->dlen
)
3383 dreg
= nft_type_to_reg(set
->dtype
);
3384 list_for_each_entry(binding
, &set
->bindings
, list
) {
3385 struct nft_ctx bind_ctx
= {
3387 .table
= ctx
->table
,
3388 .chain
= (struct nft_chain
*)binding
->chain
,
3391 if (!(binding
->flags
& NFT_SET_MAP
))
3394 err
= nft_validate_register_store(&bind_ctx
, dreg
,
3401 nft_set_ext_add_length(&tmpl
, NFT_SET_EXT_DATA
, d2
.len
);
3404 /* The full maximum length of userdata can exceed the maximum
3405 * offset value (U8_MAX) for following extensions, therefor it
3406 * must be the last extension added.
3409 if (nla
[NFTA_SET_ELEM_USERDATA
] != NULL
) {
3410 ulen
= nla_len(nla
[NFTA_SET_ELEM_USERDATA
]);
3412 nft_set_ext_add_length(&tmpl
, NFT_SET_EXT_USERDATA
,
3417 elem
.priv
= nft_set_elem_init(set
, &tmpl
, elem
.key
.val
.data
, data
.data
,
3418 timeout
, GFP_KERNEL
);
3419 if (elem
.priv
== NULL
)
3422 ext
= nft_set_elem_ext(set
, elem
.priv
);
3424 *nft_set_ext_flags(ext
) = flags
;
3426 udata
= nft_set_ext_userdata(ext
);
3427 udata
->len
= ulen
- 1;
3428 nla_memcpy(&udata
->data
, nla
[NFTA_SET_ELEM_USERDATA
], ulen
);
3431 trans
= nft_trans_elem_alloc(ctx
, NFT_MSG_NEWSETELEM
, set
);
3435 ext
->genmask
= nft_genmask_cur(ctx
->net
) | NFT_SET_ELEM_BUSY_MASK
;
3436 err
= set
->ops
->insert(set
, &elem
);
3440 nft_trans_elem(trans
) = elem
;
3441 list_add_tail(&trans
->list
, &ctx
->net
->nft
.commit_list
);
3449 if (nla
[NFTA_SET_ELEM_DATA
] != NULL
)
3450 nft_data_uninit(&data
, d2
.type
);
3452 nft_data_uninit(&elem
.key
.val
, d1
.type
);
3457 static int nf_tables_newsetelem(struct sock
*nlsk
, struct sk_buff
*skb
,
3458 const struct nlmsghdr
*nlh
,
3459 const struct nlattr
* const nla
[])
3461 struct net
*net
= sock_net(skb
->sk
);
3462 const struct nlattr
*attr
;
3463 struct nft_set
*set
;
3467 if (nla
[NFTA_SET_ELEM_LIST_ELEMENTS
] == NULL
)
3470 err
= nft_ctx_init_from_elemattr(&ctx
, skb
, nlh
, nla
, true);
3474 set
= nf_tables_set_lookup(ctx
.table
, nla
[NFTA_SET_ELEM_LIST_SET
]);
3476 if (nla
[NFTA_SET_ELEM_LIST_SET_ID
]) {
3477 set
= nf_tables_set_lookup_byid(net
,
3478 nla
[NFTA_SET_ELEM_LIST_SET_ID
]);
3481 return PTR_ERR(set
);
3484 if (!list_empty(&set
->bindings
) && set
->flags
& NFT_SET_CONSTANT
)
3487 nla_for_each_nested(attr
, nla
[NFTA_SET_ELEM_LIST_ELEMENTS
], rem
) {
3489 !atomic_add_unless(&set
->nelems
, 1, set
->size
+ set
->ndeact
))
3492 err
= nft_add_set_elem(&ctx
, set
, attr
);
3494 atomic_dec(&set
->nelems
);
3501 static int nft_del_setelem(struct nft_ctx
*ctx
, struct nft_set
*set
,
3502 const struct nlattr
*attr
)
3504 struct nlattr
*nla
[NFTA_SET_ELEM_MAX
+ 1];
3505 struct nft_data_desc desc
;
3506 struct nft_set_elem elem
;
3507 struct nft_trans
*trans
;
3510 err
= nla_parse_nested(nla
, NFTA_SET_ELEM_MAX
, attr
,
3511 nft_set_elem_policy
);
3516 if (nla
[NFTA_SET_ELEM_KEY
] == NULL
)
3519 err
= nft_data_init(ctx
, &elem
.key
.val
, sizeof(elem
.key
), &desc
,
3520 nla
[NFTA_SET_ELEM_KEY
]);
3525 if (desc
.type
!= NFT_DATA_VALUE
|| desc
.len
!= set
->klen
)
3528 trans
= nft_trans_elem_alloc(ctx
, NFT_MSG_DELSETELEM
, set
);
3529 if (trans
== NULL
) {
3534 elem
.priv
= set
->ops
->deactivate(set
, &elem
);
3535 if (elem
.priv
== NULL
) {
3540 nft_trans_elem(trans
) = elem
;
3541 list_add_tail(&trans
->list
, &ctx
->net
->nft
.commit_list
);
3547 nft_data_uninit(&elem
.key
.val
, desc
.type
);
3552 static int nf_tables_delsetelem(struct sock
*nlsk
, struct sk_buff
*skb
,
3553 const struct nlmsghdr
*nlh
,
3554 const struct nlattr
* const nla
[])
3556 const struct nlattr
*attr
;
3557 struct nft_set
*set
;
3561 if (nla
[NFTA_SET_ELEM_LIST_ELEMENTS
] == NULL
)
3564 err
= nft_ctx_init_from_elemattr(&ctx
, skb
, nlh
, nla
, false);
3568 set
= nf_tables_set_lookup(ctx
.table
, nla
[NFTA_SET_ELEM_LIST_SET
]);
3570 return PTR_ERR(set
);
3571 if (!list_empty(&set
->bindings
) && set
->flags
& NFT_SET_CONSTANT
)
3574 nla_for_each_nested(attr
, nla
[NFTA_SET_ELEM_LIST_ELEMENTS
], rem
) {
3575 err
= nft_del_setelem(&ctx
, set
, attr
);
3584 void nft_set_gc_batch_release(struct rcu_head
*rcu
)
3586 struct nft_set_gc_batch
*gcb
;
3589 gcb
= container_of(rcu
, struct nft_set_gc_batch
, head
.rcu
);
3590 for (i
= 0; i
< gcb
->head
.cnt
; i
++)
3591 nft_set_elem_destroy(gcb
->head
.set
, gcb
->elems
[i
]);
3594 EXPORT_SYMBOL_GPL(nft_set_gc_batch_release
);
3596 struct nft_set_gc_batch
*nft_set_gc_batch_alloc(const struct nft_set
*set
,
3599 struct nft_set_gc_batch
*gcb
;
3601 gcb
= kzalloc(sizeof(*gcb
), gfp
);
3604 gcb
->head
.set
= set
;
3607 EXPORT_SYMBOL_GPL(nft_set_gc_batch_alloc
);
3609 static int nf_tables_fill_gen_info(struct sk_buff
*skb
, struct net
*net
,
3610 u32 portid
, u32 seq
)
3612 struct nlmsghdr
*nlh
;
3613 struct nfgenmsg
*nfmsg
;
3614 int event
= (NFNL_SUBSYS_NFTABLES
<< 8) | NFT_MSG_NEWGEN
;
3616 nlh
= nlmsg_put(skb
, portid
, seq
, event
, sizeof(struct nfgenmsg
), 0);
3618 goto nla_put_failure
;
3620 nfmsg
= nlmsg_data(nlh
);
3621 nfmsg
->nfgen_family
= AF_UNSPEC
;
3622 nfmsg
->version
= NFNETLINK_V0
;
3623 nfmsg
->res_id
= htons(net
->nft
.base_seq
& 0xffff);
3625 if (nla_put_be32(skb
, NFTA_GEN_ID
, htonl(net
->nft
.base_seq
)))
3626 goto nla_put_failure
;
3628 nlmsg_end(skb
, nlh
);
3632 nlmsg_trim(skb
, nlh
);
3636 static int nf_tables_gen_notify(struct net
*net
, struct sk_buff
*skb
, int event
)
3638 struct nlmsghdr
*nlh
= nlmsg_hdr(skb
);
3639 struct sk_buff
*skb2
;
3642 if (nlmsg_report(nlh
) &&
3643 !nfnetlink_has_listeners(net
, NFNLGRP_NFTABLES
))
3647 skb2
= nlmsg_new(NLMSG_GOODSIZE
, GFP_KERNEL
);
3651 err
= nf_tables_fill_gen_info(skb2
, net
, NETLINK_CB(skb
).portid
,
3658 err
= nfnetlink_send(skb2
, net
, NETLINK_CB(skb
).portid
,
3659 NFNLGRP_NFTABLES
, nlmsg_report(nlh
), GFP_KERNEL
);
3662 nfnetlink_set_err(net
, NETLINK_CB(skb
).portid
, NFNLGRP_NFTABLES
,
3668 static int nf_tables_getgen(struct sock
*nlsk
, struct sk_buff
*skb
,
3669 const struct nlmsghdr
*nlh
,
3670 const struct nlattr
* const nla
[])
3672 struct net
*net
= sock_net(skb
->sk
);
3673 struct sk_buff
*skb2
;
3676 skb2
= alloc_skb(NLMSG_GOODSIZE
, GFP_KERNEL
);
3680 err
= nf_tables_fill_gen_info(skb2
, net
, NETLINK_CB(skb
).portid
,
3685 return nlmsg_unicast(nlsk
, skb2
, NETLINK_CB(skb
).portid
);
3691 static const struct nfnl_callback nf_tables_cb
[NFT_MSG_MAX
] = {
3692 [NFT_MSG_NEWTABLE
] = {
3693 .call_batch
= nf_tables_newtable
,
3694 .attr_count
= NFTA_TABLE_MAX
,
3695 .policy
= nft_table_policy
,
3697 [NFT_MSG_GETTABLE
] = {
3698 .call
= nf_tables_gettable
,
3699 .attr_count
= NFTA_TABLE_MAX
,
3700 .policy
= nft_table_policy
,
3702 [NFT_MSG_DELTABLE
] = {
3703 .call_batch
= nf_tables_deltable
,
3704 .attr_count
= NFTA_TABLE_MAX
,
3705 .policy
= nft_table_policy
,
3707 [NFT_MSG_NEWCHAIN
] = {
3708 .call_batch
= nf_tables_newchain
,
3709 .attr_count
= NFTA_CHAIN_MAX
,
3710 .policy
= nft_chain_policy
,
3712 [NFT_MSG_GETCHAIN
] = {
3713 .call
= nf_tables_getchain
,
3714 .attr_count
= NFTA_CHAIN_MAX
,
3715 .policy
= nft_chain_policy
,
3717 [NFT_MSG_DELCHAIN
] = {
3718 .call_batch
= nf_tables_delchain
,
3719 .attr_count
= NFTA_CHAIN_MAX
,
3720 .policy
= nft_chain_policy
,
3722 [NFT_MSG_NEWRULE
] = {
3723 .call_batch
= nf_tables_newrule
,
3724 .attr_count
= NFTA_RULE_MAX
,
3725 .policy
= nft_rule_policy
,
3727 [NFT_MSG_GETRULE
] = {
3728 .call
= nf_tables_getrule
,
3729 .attr_count
= NFTA_RULE_MAX
,
3730 .policy
= nft_rule_policy
,
3732 [NFT_MSG_DELRULE
] = {
3733 .call_batch
= nf_tables_delrule
,
3734 .attr_count
= NFTA_RULE_MAX
,
3735 .policy
= nft_rule_policy
,
3737 [NFT_MSG_NEWSET
] = {
3738 .call_batch
= nf_tables_newset
,
3739 .attr_count
= NFTA_SET_MAX
,
3740 .policy
= nft_set_policy
,
3742 [NFT_MSG_GETSET
] = {
3743 .call
= nf_tables_getset
,
3744 .attr_count
= NFTA_SET_MAX
,
3745 .policy
= nft_set_policy
,
3747 [NFT_MSG_DELSET
] = {
3748 .call_batch
= nf_tables_delset
,
3749 .attr_count
= NFTA_SET_MAX
,
3750 .policy
= nft_set_policy
,
3752 [NFT_MSG_NEWSETELEM
] = {
3753 .call_batch
= nf_tables_newsetelem
,
3754 .attr_count
= NFTA_SET_ELEM_LIST_MAX
,
3755 .policy
= nft_set_elem_list_policy
,
3757 [NFT_MSG_GETSETELEM
] = {
3758 .call
= nf_tables_getsetelem
,
3759 .attr_count
= NFTA_SET_ELEM_LIST_MAX
,
3760 .policy
= nft_set_elem_list_policy
,
3762 [NFT_MSG_DELSETELEM
] = {
3763 .call_batch
= nf_tables_delsetelem
,
3764 .attr_count
= NFTA_SET_ELEM_LIST_MAX
,
3765 .policy
= nft_set_elem_list_policy
,
3767 [NFT_MSG_GETGEN
] = {
3768 .call
= nf_tables_getgen
,
3772 static void nft_chain_commit_update(struct nft_trans
*trans
)
3774 struct nft_base_chain
*basechain
;
3776 if (nft_trans_chain_name(trans
)[0])
3777 strcpy(trans
->ctx
.chain
->name
, nft_trans_chain_name(trans
));
3779 if (!(trans
->ctx
.chain
->flags
& NFT_BASE_CHAIN
))
3782 basechain
= nft_base_chain(trans
->ctx
.chain
);
3783 nft_chain_stats_replace(basechain
, nft_trans_chain_stats(trans
));
3785 switch (nft_trans_chain_policy(trans
)) {
3788 basechain
->policy
= nft_trans_chain_policy(trans
);
3793 static void nf_tables_commit_release(struct nft_trans
*trans
)
3795 switch (trans
->msg_type
) {
3796 case NFT_MSG_DELTABLE
:
3797 nf_tables_table_destroy(&trans
->ctx
);
3799 case NFT_MSG_DELCHAIN
:
3800 nf_tables_chain_destroy(trans
->ctx
.chain
);
3802 case NFT_MSG_DELRULE
:
3803 nf_tables_rule_destroy(&trans
->ctx
, nft_trans_rule(trans
));
3805 case NFT_MSG_DELSET
:
3806 nft_set_destroy(nft_trans_set(trans
));
3808 case NFT_MSG_DELSETELEM
:
3809 nft_set_elem_destroy(nft_trans_elem_set(trans
),
3810 nft_trans_elem(trans
).priv
);
3816 static int nf_tables_commit(struct sk_buff
*skb
)
3818 struct net
*net
= sock_net(skb
->sk
);
3819 struct nft_trans
*trans
, *next
;
3820 struct nft_trans_elem
*te
;
3822 /* Bump generation counter, invalidate any dump in progress */
3823 while (++net
->nft
.base_seq
== 0);
3825 /* A new generation has just started */
3826 net
->nft
.gencursor
= nft_gencursor_next(net
);
3828 /* Make sure all packets have left the previous generation before
3829 * purging old rules.
3833 list_for_each_entry_safe(trans
, next
, &net
->nft
.commit_list
, list
) {
3834 switch (trans
->msg_type
) {
3835 case NFT_MSG_NEWTABLE
:
3836 if (nft_trans_table_update(trans
)) {
3837 if (!nft_trans_table_enable(trans
)) {
3838 nf_tables_table_disable(trans
->ctx
.afi
,
3840 trans
->ctx
.table
->flags
|= NFT_TABLE_F_DORMANT
;
3843 trans
->ctx
.table
->flags
&= ~NFT_TABLE_INACTIVE
;
3845 nf_tables_table_notify(&trans
->ctx
, NFT_MSG_NEWTABLE
);
3846 nft_trans_destroy(trans
);
3848 case NFT_MSG_DELTABLE
:
3849 nf_tables_table_notify(&trans
->ctx
, NFT_MSG_DELTABLE
);
3851 case NFT_MSG_NEWCHAIN
:
3852 if (nft_trans_chain_update(trans
))
3853 nft_chain_commit_update(trans
);
3855 trans
->ctx
.chain
->flags
&= ~NFT_CHAIN_INACTIVE
;
3857 nf_tables_chain_notify(&trans
->ctx
, NFT_MSG_NEWCHAIN
);
3858 nft_trans_destroy(trans
);
3860 case NFT_MSG_DELCHAIN
:
3861 nf_tables_chain_notify(&trans
->ctx
, NFT_MSG_DELCHAIN
);
3862 nf_tables_unregister_hooks(trans
->ctx
.table
,
3864 trans
->ctx
.afi
->nops
);
3866 case NFT_MSG_NEWRULE
:
3867 nft_rule_clear(trans
->ctx
.net
, nft_trans_rule(trans
));
3868 nf_tables_rule_notify(&trans
->ctx
,
3869 nft_trans_rule(trans
),
3871 nft_trans_destroy(trans
);
3873 case NFT_MSG_DELRULE
:
3874 list_del_rcu(&nft_trans_rule(trans
)->list
);
3875 nf_tables_rule_notify(&trans
->ctx
,
3876 nft_trans_rule(trans
),
3879 case NFT_MSG_NEWSET
:
3880 nft_trans_set(trans
)->flags
&= ~NFT_SET_INACTIVE
;
3881 /* This avoids hitting -EBUSY when deleting the table
3882 * from the transaction.
3884 if (nft_trans_set(trans
)->flags
& NFT_SET_ANONYMOUS
&&
3885 !list_empty(&nft_trans_set(trans
)->bindings
))
3886 trans
->ctx
.table
->use
--;
3888 nf_tables_set_notify(&trans
->ctx
, nft_trans_set(trans
),
3889 NFT_MSG_NEWSET
, GFP_KERNEL
);
3890 nft_trans_destroy(trans
);
3892 case NFT_MSG_DELSET
:
3893 nf_tables_set_notify(&trans
->ctx
, nft_trans_set(trans
),
3894 NFT_MSG_DELSET
, GFP_KERNEL
);
3896 case NFT_MSG_NEWSETELEM
:
3897 te
= (struct nft_trans_elem
*)trans
->data
;
3899 te
->set
->ops
->activate(te
->set
, &te
->elem
);
3900 nf_tables_setelem_notify(&trans
->ctx
, te
->set
,
3902 NFT_MSG_NEWSETELEM
, 0);
3903 nft_trans_destroy(trans
);
3905 case NFT_MSG_DELSETELEM
:
3906 te
= (struct nft_trans_elem
*)trans
->data
;
3908 nf_tables_setelem_notify(&trans
->ctx
, te
->set
,
3910 NFT_MSG_DELSETELEM
, 0);
3911 te
->set
->ops
->remove(te
->set
, &te
->elem
);
3912 atomic_dec(&te
->set
->nelems
);
3920 list_for_each_entry_safe(trans
, next
, &net
->nft
.commit_list
, list
) {
3921 list_del(&trans
->list
);
3922 nf_tables_commit_release(trans
);
3925 nf_tables_gen_notify(net
, skb
, NFT_MSG_NEWGEN
);
3930 static void nf_tables_abort_release(struct nft_trans
*trans
)
3932 switch (trans
->msg_type
) {
3933 case NFT_MSG_NEWTABLE
:
3934 nf_tables_table_destroy(&trans
->ctx
);
3936 case NFT_MSG_NEWCHAIN
:
3937 nf_tables_chain_destroy(trans
->ctx
.chain
);
3939 case NFT_MSG_NEWRULE
:
3940 nf_tables_rule_destroy(&trans
->ctx
, nft_trans_rule(trans
));
3942 case NFT_MSG_NEWSET
:
3943 nft_set_destroy(nft_trans_set(trans
));
3945 case NFT_MSG_NEWSETELEM
:
3946 nft_set_elem_destroy(nft_trans_elem_set(trans
),
3947 nft_trans_elem(trans
).priv
);
3953 static int nf_tables_abort(struct sk_buff
*skb
)
3955 struct net
*net
= sock_net(skb
->sk
);
3956 struct nft_trans
*trans
, *next
;
3957 struct nft_trans_elem
*te
;
3959 list_for_each_entry_safe(trans
, next
, &net
->nft
.commit_list
, list
) {
3960 switch (trans
->msg_type
) {
3961 case NFT_MSG_NEWTABLE
:
3962 if (nft_trans_table_update(trans
)) {
3963 if (nft_trans_table_enable(trans
)) {
3964 nf_tables_table_disable(trans
->ctx
.afi
,
3966 trans
->ctx
.table
->flags
|= NFT_TABLE_F_DORMANT
;
3968 nft_trans_destroy(trans
);
3970 list_del_rcu(&trans
->ctx
.table
->list
);
3973 case NFT_MSG_DELTABLE
:
3974 list_add_tail_rcu(&trans
->ctx
.table
->list
,
3975 &trans
->ctx
.afi
->tables
);
3976 nft_trans_destroy(trans
);
3978 case NFT_MSG_NEWCHAIN
:
3979 if (nft_trans_chain_update(trans
)) {
3980 free_percpu(nft_trans_chain_stats(trans
));
3982 nft_trans_destroy(trans
);
3984 trans
->ctx
.table
->use
--;
3985 list_del_rcu(&trans
->ctx
.chain
->list
);
3986 nf_tables_unregister_hooks(trans
->ctx
.table
,
3988 trans
->ctx
.afi
->nops
);
3991 case NFT_MSG_DELCHAIN
:
3992 trans
->ctx
.table
->use
++;
3993 list_add_tail_rcu(&trans
->ctx
.chain
->list
,
3994 &trans
->ctx
.table
->chains
);
3995 nft_trans_destroy(trans
);
3997 case NFT_MSG_NEWRULE
:
3998 trans
->ctx
.chain
->use
--;
3999 list_del_rcu(&nft_trans_rule(trans
)->list
);
4001 case NFT_MSG_DELRULE
:
4002 trans
->ctx
.chain
->use
++;
4003 nft_rule_clear(trans
->ctx
.net
, nft_trans_rule(trans
));
4004 nft_trans_destroy(trans
);
4006 case NFT_MSG_NEWSET
:
4007 trans
->ctx
.table
->use
--;
4008 list_del_rcu(&nft_trans_set(trans
)->list
);
4010 case NFT_MSG_DELSET
:
4011 trans
->ctx
.table
->use
++;
4012 list_add_tail_rcu(&nft_trans_set(trans
)->list
,
4013 &trans
->ctx
.table
->sets
);
4014 nft_trans_destroy(trans
);
4016 case NFT_MSG_NEWSETELEM
:
4017 te
= (struct nft_trans_elem
*)trans
->data
;
4019 te
->set
->ops
->remove(te
->set
, &te
->elem
);
4020 atomic_dec(&te
->set
->nelems
);
4022 case NFT_MSG_DELSETELEM
:
4023 te
= (struct nft_trans_elem
*)trans
->data
;
4025 te
->set
->ops
->activate(te
->set
, &te
->elem
);
4028 nft_trans_destroy(trans
);
4035 list_for_each_entry_safe_reverse(trans
, next
,
4036 &net
->nft
.commit_list
, list
) {
4037 list_del(&trans
->list
);
4038 nf_tables_abort_release(trans
);
4044 static const struct nfnetlink_subsystem nf_tables_subsys
= {
4045 .name
= "nf_tables",
4046 .subsys_id
= NFNL_SUBSYS_NFTABLES
,
4047 .cb_count
= NFT_MSG_MAX
,
4049 .commit
= nf_tables_commit
,
4050 .abort
= nf_tables_abort
,
4053 int nft_chain_validate_dependency(const struct nft_chain
*chain
,
4054 enum nft_chain_type type
)
4056 const struct nft_base_chain
*basechain
;
4058 if (chain
->flags
& NFT_BASE_CHAIN
) {
4059 basechain
= nft_base_chain(chain
);
4060 if (basechain
->type
->type
!= type
)
4065 EXPORT_SYMBOL_GPL(nft_chain_validate_dependency
);
4067 int nft_chain_validate_hooks(const struct nft_chain
*chain
,
4068 unsigned int hook_flags
)
4070 struct nft_base_chain
*basechain
;
4072 if (chain
->flags
& NFT_BASE_CHAIN
) {
4073 basechain
= nft_base_chain(chain
);
4075 if ((1 << basechain
->ops
[0].hooknum
) & hook_flags
)
4083 EXPORT_SYMBOL_GPL(nft_chain_validate_hooks
);
/*
 * Loop detection - walk through the ruleset beginning at the destination chain
 * of a new jump until either the source chain is reached (loop) or all
 * reachable chains have been traversed.
 *
 * The loop check is performed whenever a new jump verdict is added to an
 * expression or verdict map or a verdict map is bound to a new chain.
 */
4094 static int nf_tables_check_loops(const struct nft_ctx
*ctx
,
4095 const struct nft_chain
*chain
);
4097 static int nf_tables_loop_check_setelem(const struct nft_ctx
*ctx
,
4098 const struct nft_set
*set
,
4099 const struct nft_set_iter
*iter
,
4100 const struct nft_set_elem
*elem
)
4102 const struct nft_set_ext
*ext
= nft_set_elem_ext(set
, elem
->priv
);
4103 const struct nft_data
*data
;
4105 if (nft_set_ext_exists(ext
, NFT_SET_EXT_FLAGS
) &&
4106 *nft_set_ext_flags(ext
) & NFT_SET_ELEM_INTERVAL_END
)
4109 data
= nft_set_ext_data(ext
);
4110 switch (data
->verdict
.code
) {
4113 return nf_tables_check_loops(ctx
, data
->verdict
.chain
);
4119 static int nf_tables_check_loops(const struct nft_ctx
*ctx
,
4120 const struct nft_chain
*chain
)
4122 const struct nft_rule
*rule
;
4123 const struct nft_expr
*expr
, *last
;
4124 const struct nft_set
*set
;
4125 struct nft_set_binding
*binding
;
4126 struct nft_set_iter iter
;
4128 if (ctx
->chain
== chain
)
4131 list_for_each_entry(rule
, &chain
->rules
, list
) {
4132 nft_rule_for_each_expr(expr
, last
, rule
) {
4133 const struct nft_data
*data
= NULL
;
4136 if (!expr
->ops
->validate
)
4139 err
= expr
->ops
->validate(ctx
, expr
, &data
);
4146 switch (data
->verdict
.code
) {
4149 err
= nf_tables_check_loops(ctx
,
4150 data
->verdict
.chain
);
4159 list_for_each_entry(set
, &ctx
->table
->sets
, list
) {
4160 if (!(set
->flags
& NFT_SET_MAP
) ||
4161 set
->dtype
!= NFT_DATA_VERDICT
)
4164 list_for_each_entry(binding
, &set
->bindings
, list
) {
4165 if (!(binding
->flags
& NFT_SET_MAP
) ||
4166 binding
->chain
!= chain
)
4172 iter
.fn
= nf_tables_loop_check_setelem
;
4174 set
->ops
->walk(ctx
, set
, &iter
);
4184 * nft_parse_register - parse a register value from a netlink attribute
4186 * @attr: netlink attribute
4188 * Parse and translate a register value from a netlink attribute.
4189 * Registers used to be 128 bit wide, these register numbers will be
4190 * mapped to the corresponding 32 bit register numbers.
4192 unsigned int nft_parse_register(const struct nlattr
*attr
)
4196 reg
= ntohl(nla_get_be32(attr
));
4198 case NFT_REG_VERDICT
...NFT_REG_4
:
4199 return reg
* NFT_REG_SIZE
/ NFT_REG32_SIZE
;
4201 return reg
+ NFT_REG_SIZE
/ NFT_REG32_SIZE
- NFT_REG32_00
;
4204 EXPORT_SYMBOL_GPL(nft_parse_register
);
4207 * nft_dump_register - dump a register value to a netlink attribute
4209 * @skb: socket buffer
4210 * @attr: attribute number
4211 * @reg: register number
4213 * Construct a netlink attribute containing the register number. For
4214 * compatibility reasons, register numbers being a multiple of 4 are
4215 * translated to the corresponding 128 bit register numbers.
4217 int nft_dump_register(struct sk_buff
*skb
, unsigned int attr
, unsigned int reg
)
4219 if (reg
% (NFT_REG_SIZE
/ NFT_REG32_SIZE
) == 0)
4220 reg
= reg
/ (NFT_REG_SIZE
/ NFT_REG32_SIZE
);
4222 reg
= reg
- NFT_REG_SIZE
/ NFT_REG32_SIZE
+ NFT_REG32_00
;
4224 return nla_put_be32(skb
, attr
, htonl(reg
));
4226 EXPORT_SYMBOL_GPL(nft_dump_register
);
4229 * nft_validate_register_load - validate a load from a register
4231 * @reg: the register number
4232 * @len: the length of the data
4234 * Validate that the input register is one of the general purpose
4235 * registers and that the length of the load is within the bounds.
4237 int nft_validate_register_load(enum nft_registers reg
, unsigned int len
)
4239 if (reg
< NFT_REG_1
* NFT_REG_SIZE
/ NFT_REG32_SIZE
)
4243 if (reg
* NFT_REG32_SIZE
+ len
> FIELD_SIZEOF(struct nft_regs
, data
))
4248 EXPORT_SYMBOL_GPL(nft_validate_register_load
);
4251 * nft_validate_register_store - validate an expressions' register store
4253 * @ctx: context of the expression performing the load
4254 * @reg: the destination register number
4255 * @data: the data to load
4256 * @type: the data type
4257 * @len: the length of the data
4259 * Validate that a data load uses the appropriate data type for
4260 * the destination register and the length is within the bounds.
4261 * A value of NULL for the data means that its runtime gathered
4264 int nft_validate_register_store(const struct nft_ctx
*ctx
,
4265 enum nft_registers reg
,
4266 const struct nft_data
*data
,
4267 enum nft_data_types type
, unsigned int len
)
4272 case NFT_REG_VERDICT
:
4273 if (type
!= NFT_DATA_VERDICT
)
4277 (data
->verdict
.code
== NFT_GOTO
||
4278 data
->verdict
.code
== NFT_JUMP
)) {
4279 err
= nf_tables_check_loops(ctx
, data
->verdict
.chain
);
4283 if (ctx
->chain
->level
+ 1 >
4284 data
->verdict
.chain
->level
) {
4285 if (ctx
->chain
->level
+ 1 == NFT_JUMP_STACK_SIZE
)
4287 data
->verdict
.chain
->level
= ctx
->chain
->level
+ 1;
4293 if (reg
< NFT_REG_1
* NFT_REG_SIZE
/ NFT_REG32_SIZE
)
4297 if (reg
* NFT_REG32_SIZE
+ len
>
4298 FIELD_SIZEOF(struct nft_regs
, data
))
4301 if (data
!= NULL
&& type
!= NFT_DATA_VALUE
)
4306 EXPORT_SYMBOL_GPL(nft_validate_register_store
);
4308 static const struct nla_policy nft_verdict_policy
[NFTA_VERDICT_MAX
+ 1] = {
4309 [NFTA_VERDICT_CODE
] = { .type
= NLA_U32
},
4310 [NFTA_VERDICT_CHAIN
] = { .type
= NLA_STRING
,
4311 .len
= NFT_CHAIN_MAXNAMELEN
- 1 },
4314 static int nft_verdict_init(const struct nft_ctx
*ctx
, struct nft_data
*data
,
4315 struct nft_data_desc
*desc
, const struct nlattr
*nla
)
4317 struct nlattr
*tb
[NFTA_VERDICT_MAX
+ 1];
4318 struct nft_chain
*chain
;
4321 err
= nla_parse_nested(tb
, NFTA_VERDICT_MAX
, nla
, nft_verdict_policy
);
4325 if (!tb
[NFTA_VERDICT_CODE
])
4327 data
->verdict
.code
= ntohl(nla_get_be32(tb
[NFTA_VERDICT_CODE
]));
4329 switch (data
->verdict
.code
) {
4331 switch (data
->verdict
.code
& NF_VERDICT_MASK
) {
4343 desc
->len
= sizeof(data
->verdict
);
4347 if (!tb
[NFTA_VERDICT_CHAIN
])
4349 chain
= nf_tables_chain_lookup(ctx
->table
,
4350 tb
[NFTA_VERDICT_CHAIN
]);
4352 return PTR_ERR(chain
);
4353 if (chain
->flags
& NFT_BASE_CHAIN
)
4357 data
->verdict
.chain
= chain
;
4358 desc
->len
= sizeof(data
);
4362 desc
->type
= NFT_DATA_VERDICT
;
4366 static void nft_verdict_uninit(const struct nft_data
*data
)
4368 switch (data
->verdict
.code
) {
4371 data
->verdict
.chain
->use
--;
4376 static int nft_verdict_dump(struct sk_buff
*skb
, const struct nft_data
*data
)
4378 struct nlattr
*nest
;
4380 nest
= nla_nest_start(skb
, NFTA_DATA_VERDICT
);
4382 goto nla_put_failure
;
4384 if (nla_put_be32(skb
, NFTA_VERDICT_CODE
, htonl(data
->verdict
.code
)))
4385 goto nla_put_failure
;
4387 switch (data
->verdict
.code
) {
4390 if (nla_put_string(skb
, NFTA_VERDICT_CHAIN
,
4391 data
->verdict
.chain
->name
))
4392 goto nla_put_failure
;
4394 nla_nest_end(skb
, nest
);
4401 static int nft_value_init(const struct nft_ctx
*ctx
,
4402 struct nft_data
*data
, unsigned int size
,
4403 struct nft_data_desc
*desc
, const struct nlattr
*nla
)
4413 nla_memcpy(data
->data
, nla
, len
);
4414 desc
->type
= NFT_DATA_VALUE
;
4419 static int nft_value_dump(struct sk_buff
*skb
, const struct nft_data
*data
,
4422 return nla_put(skb
, NFTA_DATA_VALUE
, len
, data
->data
);
4425 static const struct nla_policy nft_data_policy
[NFTA_DATA_MAX
+ 1] = {
4426 [NFTA_DATA_VALUE
] = { .type
= NLA_BINARY
},
4427 [NFTA_DATA_VERDICT
] = { .type
= NLA_NESTED
},
4431 * nft_data_init - parse nf_tables data netlink attributes
4433 * @ctx: context of the expression using the data
4434 * @data: destination struct nft_data
4435 * @size: maximum data length
4436 * @desc: data description
4437 * @nla: netlink attribute containing data
4439 * Parse the netlink data attributes and initialize a struct nft_data.
4440 * The type and length of data are returned in the data description.
4442 * The caller can indicate that it only wants to accept data of type
4443 * NFT_DATA_VALUE by passing NULL for the ctx argument.
4445 int nft_data_init(const struct nft_ctx
*ctx
,
4446 struct nft_data
*data
, unsigned int size
,
4447 struct nft_data_desc
*desc
, const struct nlattr
*nla
)
4449 struct nlattr
*tb
[NFTA_DATA_MAX
+ 1];
4452 err
= nla_parse_nested(tb
, NFTA_DATA_MAX
, nla
, nft_data_policy
);
4456 if (tb
[NFTA_DATA_VALUE
])
4457 return nft_value_init(ctx
, data
, size
, desc
,
4458 tb
[NFTA_DATA_VALUE
]);
4459 if (tb
[NFTA_DATA_VERDICT
] && ctx
!= NULL
)
4460 return nft_verdict_init(ctx
, data
, desc
, tb
[NFTA_DATA_VERDICT
]);
4463 EXPORT_SYMBOL_GPL(nft_data_init
);
4466 * nft_data_uninit - release a nft_data item
4468 * @data: struct nft_data to release
4469 * @type: type of data
4471 * Release a nft_data item. NFT_DATA_VALUE types can be silently discarded,
4472 * all others need to be released by calling this function.
4474 void nft_data_uninit(const struct nft_data
*data
, enum nft_data_types type
)
4477 case NFT_DATA_VALUE
:
4479 case NFT_DATA_VERDICT
:
4480 return nft_verdict_uninit(data
);
4485 EXPORT_SYMBOL_GPL(nft_data_uninit
);
4487 int nft_data_dump(struct sk_buff
*skb
, int attr
, const struct nft_data
*data
,
4488 enum nft_data_types type
, unsigned int len
)
4490 struct nlattr
*nest
;
4493 nest
= nla_nest_start(skb
, attr
);
4498 case NFT_DATA_VALUE
:
4499 err
= nft_value_dump(skb
, data
, len
);
4501 case NFT_DATA_VERDICT
:
4502 err
= nft_verdict_dump(skb
, data
);
4509 nla_nest_end(skb
, nest
);
4512 EXPORT_SYMBOL_GPL(nft_data_dump
);
4514 static int nf_tables_init_net(struct net
*net
)
4516 INIT_LIST_HEAD(&net
->nft
.af_info
);
4517 INIT_LIST_HEAD(&net
->nft
.commit_list
);
4518 net
->nft
.base_seq
= 1;
4522 static struct pernet_operations nf_tables_net_ops
= {
4523 .init
= nf_tables_init_net
,
4526 static int __init
nf_tables_module_init(void)
4530 info
= kmalloc(sizeof(struct nft_expr_info
) * NFT_RULE_MAXEXPRS
,
4537 err
= nf_tables_core_module_init();
4541 err
= nfnetlink_subsys_register(&nf_tables_subsys
);
4545 pr_info("nf_tables: (c) 2007-2009 Patrick McHardy <kaber@trash.net>\n");
4546 return register_pernet_subsys(&nf_tables_net_ops
);
4548 nf_tables_core_module_exit();
4555 static void __exit
nf_tables_module_exit(void)
4557 unregister_pernet_subsys(&nf_tables_net_ops
);
4558 nfnetlink_subsys_unregister(&nf_tables_subsys
);
4560 nf_tables_core_module_exit();
4564 module_init(nf_tables_module_init
);
4565 module_exit(nf_tables_module_exit
);
4567 MODULE_LICENSE("GPL");
4568 MODULE_AUTHOR("Patrick McHardy <kaber@trash.net>");
4569 MODULE_ALIAS_NFNL_SUBSYS(NFNL_SUBSYS_NFTABLES
);