netfilter: nft_compat: use .release_ops and remove list of extension

Add .release_ops, that is called in case of error at a later stage in
the expression initialization path, ie. .select_ops() has been already
set up operations and that needs to be undone. This allows us to unwind
.select_ops from the error path, ie. release the dynamic operations for
this extension.

Moreover, allocate one single operation instead of recycling them, this
comes at the cost of consuming a bit more memory per rule, but it
simplifies the infrastructure.

Signed-off-by: Pablo Neira Ayuso <pablo@netfilter.org>
This commit is contained in:
Pablo Neira Ayuso 2019-02-13 13:18:36 +01:00
parent ff8285f818
commit b8e2040063
3 changed files with 64 additions and 227 deletions

View File

@ -690,10 +690,12 @@ static inline void nft_set_gc_batch_add(struct nft_set_gc_batch *gcb,
gcb->elems[gcb->head.cnt++] = elem; gcb->elems[gcb->head.cnt++] = elem;
} }
struct nft_expr_ops;
/** /**
* struct nft_expr_type - nf_tables expression type * struct nft_expr_type - nf_tables expression type
* *
* @select_ops: function to select nft_expr_ops * @select_ops: function to select nft_expr_ops
* @release_ops: release nft_expr_ops
* @ops: default ops, used when no select_ops functions is present * @ops: default ops, used when no select_ops functions is present
* @list: used internally * @list: used internally
* @name: Identifier * @name: Identifier
@ -706,6 +708,7 @@ static inline void nft_set_gc_batch_add(struct nft_set_gc_batch *gcb,
struct nft_expr_type { struct nft_expr_type {
const struct nft_expr_ops *(*select_ops)(const struct nft_ctx *, const struct nft_expr_ops *(*select_ops)(const struct nft_ctx *,
const struct nlattr * const tb[]); const struct nlattr * const tb[]);
void (*release_ops)(const struct nft_expr_ops *ops);
const struct nft_expr_ops *ops; const struct nft_expr_ops *ops;
struct list_head list; struct list_head list;
const char *name; const char *name;

View File

@ -2172,6 +2172,7 @@ struct nft_expr *nft_expr_init(const struct nft_ctx *ctx,
{ {
struct nft_expr_info info; struct nft_expr_info info;
struct nft_expr *expr; struct nft_expr *expr;
struct module *owner;
int err; int err;
err = nf_tables_expr_parse(ctx, nla, &info); err = nf_tables_expr_parse(ctx, nla, &info);
@ -2191,7 +2192,11 @@ struct nft_expr *nft_expr_init(const struct nft_ctx *ctx,
err3: err3:
kfree(expr); kfree(expr);
err2: err2:
module_put(info.ops->type->owner); owner = info.ops->type->owner;
if (info.ops->type->release_ops)
info.ops->type->release_ops(info.ops);
module_put(owner);
err1: err1:
return ERR_PTR(err); return ERR_PTR(err);
} }

View File

@ -22,23 +22,6 @@
#include <linux/netfilter_bridge/ebtables.h> #include <linux/netfilter_bridge/ebtables.h>
#include <linux/netfilter_arp/arp_tables.h> #include <linux/netfilter_arp/arp_tables.h>
#include <net/netfilter/nf_tables.h> #include <net/netfilter/nf_tables.h>
#include <net/netns/generic.h>
struct nft_xt {
struct list_head head;
struct nft_expr_ops ops;
refcount_t refcnt;
/* used only when transaction mutex is locked */
unsigned int listcnt;
/* Unlike other expressions, ops doesn't have static storage duration.
* nft core assumes they do. We use kfree_rcu so that nft core can
* can check expr->ops->size even after nft_compat->destroy() frees
* the nft_xt struct that holds the ops structure.
*/
struct rcu_head rcu_head;
};
/* Used for matches where *info is larger than X byte */ /* Used for matches where *info is larger than X byte */
#define NFT_MATCH_LARGE_THRESH 192 #define NFT_MATCH_LARGE_THRESH 192
@ -47,46 +30,6 @@ struct nft_xt_match_priv {
void *info; void *info;
}; };
struct nft_compat_net {
struct list_head nft_target_list;
struct list_head nft_match_list;
};
static unsigned int nft_compat_net_id __read_mostly;
static struct nft_expr_type nft_match_type;
static struct nft_expr_type nft_target_type;
static struct nft_compat_net *nft_compat_pernet(struct net *net)
{
return net_generic(net, nft_compat_net_id);
}
static void nft_xt_get(struct nft_xt *xt)
{
/* refcount_inc() warns on 0 -> 1 transition, but we can't
* init the reference count to 1 in .select_ops -- we can't
* undo such an increase when another expression inside the same
* rule fails afterwards.
*/
if (xt->listcnt == 0)
refcount_set(&xt->refcnt, 1);
else
refcount_inc(&xt->refcnt);
xt->listcnt++;
}
static bool nft_xt_put(struct nft_xt *xt)
{
if (refcount_dec_and_test(&xt->refcnt)) {
WARN_ON_ONCE(!list_empty(&xt->head));
kfree_rcu(xt, rcu_head);
return true;
}
return false;
}
static int nft_compat_chain_validate_dependency(const struct nft_ctx *ctx, static int nft_compat_chain_validate_dependency(const struct nft_ctx *ctx,
const char *tablename) const char *tablename)
{ {
@ -281,7 +224,6 @@ nft_target_init(const struct nft_ctx *ctx, const struct nft_expr *expr,
struct xt_target *target = expr->ops->data; struct xt_target *target = expr->ops->data;
struct xt_tgchk_param par; struct xt_tgchk_param par;
size_t size = XT_ALIGN(nla_len(tb[NFTA_TARGET_INFO])); size_t size = XT_ALIGN(nla_len(tb[NFTA_TARGET_INFO]));
struct nft_xt *nft_xt;
u16 proto = 0; u16 proto = 0;
bool inv = false; bool inv = false;
union nft_entry e = {}; union nft_entry e = {};
@ -305,8 +247,6 @@ nft_target_init(const struct nft_ctx *ctx, const struct nft_expr *expr,
if (!target->target) if (!target->target)
return -EINVAL; return -EINVAL;
nft_xt = container_of(expr->ops, struct nft_xt, ops);
nft_xt_get(nft_xt);
return 0; return 0;
} }
@ -325,8 +265,8 @@ nft_target_destroy(const struct nft_ctx *ctx, const struct nft_expr *expr)
if (par.target->destroy != NULL) if (par.target->destroy != NULL)
par.target->destroy(&par); par.target->destroy(&par);
if (nft_xt_put(container_of(expr->ops, struct nft_xt, ops))) module_put(me);
module_put(me); kfree(expr->ops);
} }
static int nft_extension_dump_info(struct sk_buff *skb, int attr, static int nft_extension_dump_info(struct sk_buff *skb, int attr,
@ -499,7 +439,6 @@ __nft_match_init(const struct nft_ctx *ctx, const struct nft_expr *expr,
struct xt_match *match = expr->ops->data; struct xt_match *match = expr->ops->data;
struct xt_mtchk_param par; struct xt_mtchk_param par;
size_t size = XT_ALIGN(nla_len(tb[NFTA_MATCH_INFO])); size_t size = XT_ALIGN(nla_len(tb[NFTA_MATCH_INFO]));
struct nft_xt *nft_xt;
u16 proto = 0; u16 proto = 0;
bool inv = false; bool inv = false;
union nft_entry e = {}; union nft_entry e = {};
@ -515,13 +454,7 @@ __nft_match_init(const struct nft_ctx *ctx, const struct nft_expr *expr,
nft_match_set_mtchk_param(&par, ctx, match, info, &e, proto, inv); nft_match_set_mtchk_param(&par, ctx, match, info, &e, proto, inv);
ret = xt_check_match(&par, size, proto, inv); return xt_check_match(&par, size, proto, inv);
if (ret < 0)
return ret;
nft_xt = container_of(expr->ops, struct nft_xt, ops);
nft_xt_get(nft_xt);
return 0;
} }
static int static int
@ -564,8 +497,8 @@ __nft_match_destroy(const struct nft_ctx *ctx, const struct nft_expr *expr,
if (par.match->destroy != NULL) if (par.match->destroy != NULL)
par.match->destroy(&par); par.match->destroy(&par);
if (nft_xt_put(container_of(expr->ops, struct nft_xt, ops))) module_put(me);
module_put(me); kfree(expr->ops);
} }
static void static void
@ -574,18 +507,6 @@ nft_match_destroy(const struct nft_ctx *ctx, const struct nft_expr *expr)
__nft_match_destroy(ctx, expr, nft_expr_priv(expr)); __nft_match_destroy(ctx, expr, nft_expr_priv(expr));
} }
static void nft_compat_deactivate(const struct nft_ctx *ctx,
const struct nft_expr *expr,
enum nft_trans_phase phase)
{
struct nft_xt *xt = container_of(expr->ops, struct nft_xt, ops);
if (phase == NFT_TRANS_ABORT || phase == NFT_TRANS_COMMIT) {
if (--xt->listcnt == 0)
list_del_init(&xt->head);
}
}
static void static void
nft_match_large_destroy(const struct nft_ctx *ctx, const struct nft_expr *expr) nft_match_large_destroy(const struct nft_ctx *ctx, const struct nft_expr *expr)
{ {
@ -780,19 +701,13 @@ static const struct nfnetlink_subsystem nfnl_compat_subsys = {
.cb = nfnl_nft_compat_cb, .cb = nfnl_nft_compat_cb,
}; };
static bool nft_match_cmp(const struct xt_match *match, static struct nft_expr_type nft_match_type;
const char *name, u32 rev, u32 family)
{
return strcmp(match->name, name) == 0 && match->revision == rev &&
(match->family == NFPROTO_UNSPEC || match->family == family);
}
static const struct nft_expr_ops * static const struct nft_expr_ops *
nft_match_select_ops(const struct nft_ctx *ctx, nft_match_select_ops(const struct nft_ctx *ctx,
const struct nlattr * const tb[]) const struct nlattr * const tb[])
{ {
struct nft_compat_net *cn; struct nft_expr_ops *ops;
struct nft_xt *nft_match;
struct xt_match *match; struct xt_match *match;
unsigned int matchsize; unsigned int matchsize;
char *mt_name; char *mt_name;
@ -808,16 +723,6 @@ nft_match_select_ops(const struct nft_ctx *ctx,
rev = ntohl(nla_get_be32(tb[NFTA_MATCH_REV])); rev = ntohl(nla_get_be32(tb[NFTA_MATCH_REV]));
family = ctx->family; family = ctx->family;
cn = nft_compat_pernet(ctx->net);
/* Re-use the existing match if it's already loaded. */
list_for_each_entry(nft_match, &cn->nft_match_list, head) {
struct xt_match *match = nft_match->ops.data;
if (nft_match_cmp(match, mt_name, rev, family))
return &nft_match->ops;
}
match = xt_request_find_match(family, mt_name, rev); match = xt_request_find_match(family, mt_name, rev);
if (IS_ERR(match)) if (IS_ERR(match))
return ERR_PTR(-ENOENT); return ERR_PTR(-ENOENT);
@ -827,65 +732,62 @@ nft_match_select_ops(const struct nft_ctx *ctx,
goto err; goto err;
} }
/* This is the first time we use this match, allocate operations */ ops = kzalloc(sizeof(struct nft_expr_ops), GFP_KERNEL);
nft_match = kzalloc(sizeof(struct nft_xt), GFP_KERNEL); if (!ops) {
if (nft_match == NULL) {
err = -ENOMEM; err = -ENOMEM;
goto err; goto err;
} }
refcount_set(&nft_match->refcnt, 0); ops->type = &nft_match_type;
nft_match->ops.type = &nft_match_type; ops->eval = nft_match_eval;
nft_match->ops.eval = nft_match_eval; ops->init = nft_match_init;
nft_match->ops.init = nft_match_init; ops->destroy = nft_match_destroy;
nft_match->ops.destroy = nft_match_destroy; ops->dump = nft_match_dump;
nft_match->ops.deactivate = nft_compat_deactivate; ops->validate = nft_match_validate;
nft_match->ops.dump = nft_match_dump; ops->data = match;
nft_match->ops.validate = nft_match_validate;
nft_match->ops.data = match;
matchsize = NFT_EXPR_SIZE(XT_ALIGN(match->matchsize)); matchsize = NFT_EXPR_SIZE(XT_ALIGN(match->matchsize));
if (matchsize > NFT_MATCH_LARGE_THRESH) { if (matchsize > NFT_MATCH_LARGE_THRESH) {
matchsize = NFT_EXPR_SIZE(sizeof(struct nft_xt_match_priv)); matchsize = NFT_EXPR_SIZE(sizeof(struct nft_xt_match_priv));
nft_match->ops.eval = nft_match_large_eval; ops->eval = nft_match_large_eval;
nft_match->ops.init = nft_match_large_init; ops->init = nft_match_large_init;
nft_match->ops.destroy = nft_match_large_destroy; ops->destroy = nft_match_large_destroy;
nft_match->ops.dump = nft_match_large_dump; ops->dump = nft_match_large_dump;
} }
nft_match->ops.size = matchsize; ops->size = matchsize;
nft_match->listcnt = 0; return ops;
list_add(&nft_match->head, &cn->nft_match_list);
return &nft_match->ops;
err: err:
module_put(match->me); module_put(match->me);
return ERR_PTR(err); return ERR_PTR(err);
} }
static void nft_match_release_ops(const struct nft_expr_ops *ops)
{
struct xt_match *match = ops->data;
module_put(match->me);
kfree(ops);
}
static struct nft_expr_type nft_match_type __read_mostly = { static struct nft_expr_type nft_match_type __read_mostly = {
.name = "match", .name = "match",
.select_ops = nft_match_select_ops, .select_ops = nft_match_select_ops,
.release_ops = nft_match_release_ops,
.policy = nft_match_policy, .policy = nft_match_policy,
.maxattr = NFTA_MATCH_MAX, .maxattr = NFTA_MATCH_MAX,
.owner = THIS_MODULE, .owner = THIS_MODULE,
}; };
static bool nft_target_cmp(const struct xt_target *tg, static struct nft_expr_type nft_target_type;
const char *name, u32 rev, u32 family)
{
return strcmp(tg->name, name) == 0 && tg->revision == rev &&
(tg->family == NFPROTO_UNSPEC || tg->family == family);
}
static const struct nft_expr_ops * static const struct nft_expr_ops *
nft_target_select_ops(const struct nft_ctx *ctx, nft_target_select_ops(const struct nft_ctx *ctx,
const struct nlattr * const tb[]) const struct nlattr * const tb[])
{ {
struct nft_compat_net *cn; struct nft_expr_ops *ops;
struct nft_xt *nft_target;
struct xt_target *target; struct xt_target *target;
char *tg_name; char *tg_name;
u32 rev, family; u32 rev, family;
@ -905,18 +807,6 @@ nft_target_select_ops(const struct nft_ctx *ctx,
strcmp(tg_name, "standard") == 0) strcmp(tg_name, "standard") == 0)
return ERR_PTR(-EINVAL); return ERR_PTR(-EINVAL);
cn = nft_compat_pernet(ctx->net);
/* Re-use the existing target if it's already loaded. */
list_for_each_entry(nft_target, &cn->nft_target_list, head) {
struct xt_target *target = nft_target->ops.data;
if (!target->target)
continue;
if (nft_target_cmp(target, tg_name, rev, family))
return &nft_target->ops;
}
target = xt_request_find_target(family, tg_name, rev); target = xt_request_find_target(family, tg_name, rev);
if (IS_ERR(target)) if (IS_ERR(target))
return ERR_PTR(-ENOENT); return ERR_PTR(-ENOENT);
@ -931,113 +821,55 @@ nft_target_select_ops(const struct nft_ctx *ctx,
goto err; goto err;
} }
/* This is the first time we use this target, allocate operations */ ops = kzalloc(sizeof(struct nft_expr_ops), GFP_KERNEL);
nft_target = kzalloc(sizeof(struct nft_xt), GFP_KERNEL); if (!ops) {
if (nft_target == NULL) {
err = -ENOMEM; err = -ENOMEM;
goto err; goto err;
} }
refcount_set(&nft_target->refcnt, 0); ops->type = &nft_target_type;
nft_target->ops.type = &nft_target_type; ops->size = NFT_EXPR_SIZE(XT_ALIGN(target->targetsize));
nft_target->ops.size = NFT_EXPR_SIZE(XT_ALIGN(target->targetsize)); ops->init = nft_target_init;
nft_target->ops.init = nft_target_init; ops->destroy = nft_target_destroy;
nft_target->ops.destroy = nft_target_destroy; ops->dump = nft_target_dump;
nft_target->ops.deactivate = nft_compat_deactivate; ops->validate = nft_target_validate;
nft_target->ops.dump = nft_target_dump; ops->data = target;
nft_target->ops.validate = nft_target_validate;
nft_target->ops.data = target;
if (family == NFPROTO_BRIDGE) if (family == NFPROTO_BRIDGE)
nft_target->ops.eval = nft_target_eval_bridge; ops->eval = nft_target_eval_bridge;
else else
nft_target->ops.eval = nft_target_eval_xt; ops->eval = nft_target_eval_xt;
nft_target->listcnt = 0; return ops;
list_add(&nft_target->head, &cn->nft_target_list);
return &nft_target->ops;
err: err:
module_put(target->me); module_put(target->me);
return ERR_PTR(err); return ERR_PTR(err);
} }
static void nft_target_release_ops(const struct nft_expr_ops *ops)
{
struct xt_target *target = ops->data;
module_put(target->me);
kfree(ops);
}
static struct nft_expr_type nft_target_type __read_mostly = { static struct nft_expr_type nft_target_type __read_mostly = {
.name = "target", .name = "target",
.select_ops = nft_target_select_ops, .select_ops = nft_target_select_ops,
.release_ops = nft_target_release_ops,
.policy = nft_target_policy, .policy = nft_target_policy,
.maxattr = NFTA_TARGET_MAX, .maxattr = NFTA_TARGET_MAX,
.owner = THIS_MODULE, .owner = THIS_MODULE,
}; };
static int __net_init nft_compat_init_net(struct net *net)
{
struct nft_compat_net *cn = nft_compat_pernet(net);
INIT_LIST_HEAD(&cn->nft_target_list);
INIT_LIST_HEAD(&cn->nft_match_list);
return 0;
}
static void __net_exit nft_compat_exit_net(struct net *net)
{
struct nft_compat_net *cn = nft_compat_pernet(net);
struct nft_xt *xt, *next;
if (list_empty(&cn->nft_match_list) &&
list_empty(&cn->nft_target_list))
return;
/* If there was an error that caused nft_xt expr to not be initialized
* fully and noone else requested the same expression later, the lists
* contain 0-refcount entries that still hold module reference.
*
* Clean them here.
*/
mutex_lock(&net->nft.commit_mutex);
list_for_each_entry_safe(xt, next, &cn->nft_target_list, head) {
struct xt_target *target = xt->ops.data;
list_del_init(&xt->head);
if (refcount_read(&xt->refcnt))
continue;
module_put(target->me);
kfree(xt);
}
list_for_each_entry_safe(xt, next, &cn->nft_match_list, head) {
struct xt_match *match = xt->ops.data;
list_del_init(&xt->head);
if (refcount_read(&xt->refcnt))
continue;
module_put(match->me);
kfree(xt);
}
mutex_unlock(&net->nft.commit_mutex);
}
static struct pernet_operations nft_compat_net_ops = {
.init = nft_compat_init_net,
.exit = nft_compat_exit_net,
.id = &nft_compat_net_id,
.size = sizeof(struct nft_compat_net),
};
static int __init nft_compat_module_init(void) static int __init nft_compat_module_init(void)
{ {
int ret; int ret;
ret = register_pernet_subsys(&nft_compat_net_ops);
if (ret < 0)
goto err_target;
ret = nft_register_expr(&nft_match_type); ret = nft_register_expr(&nft_match_type);
if (ret < 0) if (ret < 0)
goto err_pernet; return ret;
ret = nft_register_expr(&nft_target_type); ret = nft_register_expr(&nft_target_type);
if (ret < 0) if (ret < 0)
@ -1054,8 +886,6 @@ err_target:
nft_unregister_expr(&nft_target_type); nft_unregister_expr(&nft_target_type);
err_match: err_match:
nft_unregister_expr(&nft_match_type); nft_unregister_expr(&nft_match_type);
err_pernet:
unregister_pernet_subsys(&nft_compat_net_ops);
return ret; return ret;
} }
@ -1064,7 +894,6 @@ static void __exit nft_compat_module_exit(void)
nfnetlink_subsys_unregister(&nfnl_compat_subsys); nfnetlink_subsys_unregister(&nfnl_compat_subsys);
nft_unregister_expr(&nft_target_type); nft_unregister_expr(&nft_target_type);
nft_unregister_expr(&nft_match_type); nft_unregister_expr(&nft_match_type);
unregister_pernet_subsys(&nft_compat_net_ops);
} }
MODULE_ALIAS_NFNL_SUBSYS(NFNL_SUBSYS_NFT_COMPAT); MODULE_ALIAS_NFNL_SUBSYS(NFNL_SUBSYS_NFT_COMPAT);