From: Pablo Neira Ayuso <pablo@xxxxxxxxxxxxx> commit fa23e0d4b756d25829e124d6b670a4c6bbd4bf7e upstream. Sven Auhagen reports transaction failures with following error: ./main.nft:13:1-26: Error: Could not process rule: Cannot allocate memory percpu: allocation failed, size=16 align=8 atomic=1, atomic alloc failed, no space left This points to failing pcpu allocation with GFP_ATOMIC flag. However, transactions happen from user context and are allowed to sleep. One case where we can call into percpu allocator with GFP_ATOMIC is nft_counter expression. Normally this happens from control plane, so this could use GFP_KERNEL instead. But one use case, element insertion from packet path, needs to use GFP_ATOMIC allocations (nft_dynset expression). At this time, .clone callbacks always use GFP_ATOMIC for this reason. Add gfp_t argument to the .clone function and pass GFP_KERNEL or GFP_ATOMIC flag depending on context, this allows all clone memory allocations to sleep for the normal (transaction) case. Cc: Sven Auhagen <sven.auhagen@xxxxxxxxxxxx> Signed-off-by: Florian Westphal <fw@xxxxxxxxx> Signed-off-by: Pablo Neira Ayuso <pablo@xxxxxxxxxxxxx> Signed-off-by: Greg Kroah-Hartman <gregkh@xxxxxxxxxxxxxxxxxxx> --- include/net/netfilter/nf_tables.h | 4 ++-- net/netfilter/nf_tables_api.c | 8 ++++---- net/netfilter/nft_connlimit.c | 2 +- net/netfilter/nft_counter.c | 4 ++-- net/netfilter/nft_dynset.c | 2 +- 5 files changed, 10 insertions(+), 10 deletions(-) --- a/include/net/netfilter/nf_tables.h +++ b/include/net/netfilter/nf_tables.h @@ -786,7 +786,7 @@ struct nft_expr_ops { struct nft_regs *regs, const struct nft_pktinfo *pkt); int (*clone)(struct nft_expr *dst, - const struct nft_expr *src); + const struct nft_expr *src, gfp_t gfp); unsigned int size; int (*init)(const struct nft_ctx *ctx, @@ -837,7 +837,7 @@ static inline void *nft_expr_priv(const return (void *)expr->data; } -int nft_expr_clone(struct nft_expr *dst, struct nft_expr *src); +int nft_expr_clone(struct nft_expr *dst, struct nft_expr *src, gfp_t gfp); void nft_expr_destroy(const struct nft_ctx *ctx, struct nft_expr *expr); int nft_expr_dump(struct sk_buff *skb, unsigned int attr, const struct nft_expr *expr); --- a/net/netfilter/nf_tables_api.c +++ b/net/netfilter/nf_tables_api.c @@ -2968,13 +2968,13 @@ err_expr_parse: return ERR_PTR(err); } -int nft_expr_clone(struct nft_expr *dst, struct nft_expr *src) +int nft_expr_clone(struct nft_expr *dst, struct nft_expr *src, gfp_t gfp) { int err; if (src->ops->clone) { dst->ops = src->ops; - err = src->ops->clone(dst, src); + err = src->ops->clone(dst, src, gfp); if (err < 0) return err; } else { @@ -5524,7 +5524,7 @@ static int nft_set_elem_expr_setup(struc if (expr == NULL) return 0; - err = nft_expr_clone(elem_expr, expr); + err = nft_expr_clone(elem_expr, expr, GFP_KERNEL); if (err < 0) return -ENOMEM; @@ -5632,7 +5632,7 @@ static int nft_add_set_elem(struct nft_c if (!expr) return -ENOMEM; - err = nft_expr_clone(expr, set->expr); + err = nft_expr_clone(expr, set->expr, GFP_KERNEL); if (err < 0) goto err_set_elem_expr; } --- a/net/netfilter/nft_connlimit.c +++ b/net/netfilter/nft_connlimit.c @@ -195,7 +195,7 @@ static void nft_connlimit_destroy(const nft_connlimit_do_destroy(ctx, priv); } -static int nft_connlimit_clone(struct nft_expr *dst, const struct nft_expr *src) +static int nft_connlimit_clone(struct nft_expr *dst, const struct nft_expr *src, gfp_t gfp) { struct nft_connlimit *priv_dst = nft_expr_priv(dst); struct nft_connlimit *priv_src = nft_expr_priv(src); --- a/net/netfilter/nft_counter.c +++ b/net/netfilter/nft_counter.c @@ -224,7 +224,7 @@ static void nft_counter_destroy(const st nft_counter_do_destroy(priv); } -static int nft_counter_clone(struct nft_expr *dst, const struct nft_expr *src) +static int nft_counter_clone(struct nft_expr *dst, const struct nft_expr *src, gfp_t gfp) { struct nft_counter_percpu_priv *priv = nft_expr_priv(src); struct nft_counter_percpu_priv *priv_clone = nft_expr_priv(dst); @@ -234,7 +234,7 @@ static int nft_counter_clone(struct nft_ nft_counter_fetch(priv, &total); - cpu_stats = alloc_percpu_gfp(struct nft_counter, GFP_ATOMIC); + cpu_stats = alloc_percpu_gfp(struct nft_counter, gfp); if (cpu_stats == NULL) return -ENOMEM; --- a/net/netfilter/nft_dynset.c +++ b/net/netfilter/nft_dynset.c @@ -48,7 +48,7 @@ static void *nft_dynset_new(struct nft_s ext = nft_set_elem_ext(set, elem); if (priv->expr != NULL && - nft_expr_clone(nft_set_ext_expr(ext), priv->expr) < 0) + nft_expr_clone(nft_set_ext_expr(ext), priv->expr, GFP_ATOMIC) < 0) goto err2; return elem; Patches currently in stable-queue which might be from kroah.com@xxxxxxxxxxxxxxx are queue-5.10/samples-make-fs-monitor-depend-on-libc-and-headers.patch queue-5.10/pci-dpc-fix-use-after-free-on-concurrent-dpc-and-hot-removal.patch queue-5.10/netfilter-nf_tables-set-element-extended-ack-reporting-support.patch queue-5.10/samples-add-fs-error-monitoring-example.patch queue-5.10/mptcp-fix-nl-pm-announced-address-accounting.patch queue-5.10/mptcp-distinguish-rcv-vs-sent-backup-flag-in-requests.patch queue-5.10/mptcp-pm-fix-backup-support-in-signal-endpoints.patch queue-5.10/netfilter-nf_tables-prefer-nft_chain_validate.patch queue-5.10/mptcp-mib-count-mpj-with-backup-flag.patch queue-5.10/mptcp-sched-check-both-directions-for-backup.patch queue-5.10/netfilter-nf_tables-allow-clone-callbacks-to-sleep.patch queue-5.10/add-gitignore-file-for-samples-fanotify-subdirectory.patch queue-5.10/mptcp-export-local_address.patch queue-5.10/netfilter-nf_tables-use-timestamp-to-check-for-set-element-timeout.patch