A rule may be added before or after another one using index keyword. To support for the other rule being added within the same batch, one has to make use of NFTNL_RULE_ID and NFTNL_RULE_POSITION_ID attributes. This patch does just that among a few more crucial things: * Fetch full kernel ruleset upon encountering a rule which references another one. Any earlier rule add/insert commands are then restored by cache_add_commands(). * Avoid cache updates for rules not referencing another one by index, but add them immediately to cache if cache is already complete - otherwise they are not inserted if a later one with index reference is added. * Reduce rule_translate_index() to its core code which is the actual linking of rules and consequently rename the function. The removed bits are pulled into the calling rule_evaluate() to reduce code duplication in between cache inserts with and without rule reference. * Pass the current command op to rule_evaluate() as indicator whether to insert before or after a referenced rule or at beginning or end of chain in cache. Exploit this from chain_evaluate() to avoid adding the chain's rules a second time. Signed-off-by: Phil Sutter <phil@xxxxxx> --- Changes since v4: - Move whole rule reference finding and linking code into rule_cache_update() to simplify callers. - Move rule_cache_update() to right before cache_add_rule_cmd(). - Fix the code regarding which handle and which rule pointer to use, resolves The segfault Eric mentioned. - Skip cache updates for rule delete and replace commands, this restores old behaviour regarding "guessed" rule handles. - Also simplify skp logic itself: If cache is complete, add all rules while evaluating them. Previous cache completeness level lowering was problematic after cache flush command. - Add additional test case for delete/replace commands. Changes since v1: - Move rule list manipulation into a dedicated function rule_cache_update(). - Restore old performance for simple commands by fetching a full rule cache only if the currently evaluated rule references another one. - Extend 0024rule_0 test a bit to make sure things work with interactive nft also. --- include/rule.h | 4 + src/evaluate.c | 60 ++++-------- src/mnl.c | 4 + src/rule.c | 98 +++++++++++++++++++ .../shell/testcases/cache/0003_cache_update_0 | 7 ++ tests/shell/testcases/transactions/0024rule_0 | 17 ++++ tests/shell/testcases/transactions/0025rule_0 | 21 ++++ .../transactions/dumps/0024rule_0.nft | 8 ++ .../transactions/dumps/0025rule_0.nft | 6 ++ 9 files changed, 182 insertions(+), 43 deletions(-) create mode 100755 tests/shell/testcases/transactions/0024rule_0 create mode 100755 tests/shell/testcases/transactions/0025rule_0 create mode 100644 tests/shell/testcases/transactions/dumps/0024rule_0.nft create mode 100644 tests/shell/testcases/transactions/dumps/0025rule_0.nft diff --git a/include/rule.h b/include/rule.h index aa8881d375b96..87ea8b8a25b96 100644 --- a/include/rule.h +++ b/include/rule.h @@ -73,6 +73,8 @@ struct handle { struct position_spec position; struct position_spec index; uint32_t set_id; + uint32_t rule_id; + uint32_t position_id; }; extern void handle_merge(struct handle *dst, const struct handle *src); @@ -639,6 +641,8 @@ extern void cache_flush(struct nft_ctx *ctx, enum cmd_ops cmd, struct list_head *msgs); extern void cache_release(struct nft_cache *cache); extern bool cache_is_complete(struct nft_cache *cache, enum cmd_ops cmd); +extern int rule_cache_update(struct eval_ctx *ectx, struct rule *rule, + enum cmd_ops op); struct timeout_protocol { uint32_t array_size; diff --git a/src/evaluate.c b/src/evaluate.c index 358f5b7152634..4fa4a0c73e9ca 100644 --- a/src/evaluate.c +++ b/src/evaluate.c @@ -3177,46 +3177,11 @@ static int flowtable_evaluate(struct eval_ctx *ctx, struct flowtable *ft) return 0; } -/* Convert rule's handle.index into handle.position. */ -static int rule_translate_index(struct eval_ctx *ctx, struct rule *rule) -{ - struct table *table; - struct chain *chain; - uint64_t index = 0; - struct rule *r; - int ret; - - /* update cache with CMD_LIST so that rules are fetched, too */ - ret = cache_update(ctx->nft, CMD_LIST, ctx->msgs); - if (ret < 0) - return ret; - - table = table_lookup(&rule->handle, &ctx->nft->cache); - if (!table) - return table_not_found(ctx); - - chain = chain_lookup(table, &rule->handle); - if (!chain) - return chain_not_found(ctx); - - list_for_each_entry(r, &chain->rules, list) { - if (++index < rule->handle.index.id) - continue; - rule->handle.position.id = r->handle.handle.id; - rule->handle.position.location = rule->handle.index.location; - break; - } - if (!rule->handle.position.id) - return cmd_error(ctx, &rule->handle.index.location, - "Could not process rule: %s", - strerror(ENOENT)); - return 0; -} - -static int rule_evaluate(struct eval_ctx *ctx, struct rule *rule) +static int rule_evaluate(struct eval_ctx *ctx, struct rule *rule, enum cmd_ops op) { struct stmt *stmt, *tstmt = NULL; struct error_record *erec; + int ret; proto_ctx_init(&ctx->pctx, rule->handle.family, ctx->nft->debug_mask); memset(&ctx->ectx, 0, sizeof(ctx->ectx)); @@ -3241,11 +3206,20 @@ static int rule_evaluate(struct eval_ctx *ctx, struct rule *rule) return -1; } - if (rule->handle.index.id && - rule_translate_index(ctx, rule)) - return -1; + /* Cache update may be avoided if the rule doesn't reference another + * one by index: If later rules containing a reference by index will + * cause a cache update, the current one will be inserted from command + * list. */ + if (!rule->handle.index.id && + !cache_is_complete(&ctx->nft->cache, CMD_LIST)) + return 0; - return 0; + /* update cache with CMD_LIST so that rules are fetched, too */ + ret = cache_update(ctx->nft, CMD_LIST, ctx->msgs); + if (ret < 0) + return ret; + + return rule_cache_update(ctx, rule, op); } static uint32_t str2hooknum(uint32_t family, const char *hook) @@ -3326,7 +3300,7 @@ static int chain_evaluate(struct eval_ctx *ctx, struct chain *chain) list_for_each_entry(rule, &chain->rules, list) { handle_merge(&rule->handle, &chain->handle); - if (rule_evaluate(ctx, rule) < 0) + if (rule_evaluate(ctx, rule, CMD_INVALID) < 0) return -1; } return 0; @@ -3423,7 +3397,7 @@ static int cmd_evaluate_add(struct eval_ctx *ctx, struct cmd *cmd) return set_evaluate(ctx, cmd->set); case CMD_OBJ_RULE: handle_merge(&cmd->rule->handle, &cmd->handle); - return rule_evaluate(ctx, cmd->rule); + return rule_evaluate(ctx, cmd->rule, cmd->op); case CMD_OBJ_CHAIN: ret = cache_update(ctx->nft, cmd->op, ctx->msgs); if (ret < 0) diff --git a/src/mnl.c b/src/mnl.c index 579210e4736a4..a38a4b4d3dd51 100644 --- a/src/mnl.c +++ b/src/mnl.c @@ -373,6 +373,10 @@ int mnl_nft_rule_add(struct netlink_ctx *ctx, const struct cmd *cmd, nftnl_rule_set_str(nlr, NFTNL_RULE_CHAIN, h->chain.name); if (h->position.id) nftnl_rule_set_u64(nlr, NFTNL_RULE_POSITION, h->position.id); + if (h->rule_id) + nftnl_rule_set_u32(nlr, NFTNL_RULE_ID, h->rule_id); + if (h->position_id) + nftnl_rule_set_u32(nlr, NFTNL_RULE_POSITION_ID, h->position_id); netlink_linearize_rule(ctx, nlr, rule); nlh = nftnl_nlmsg_build_hdr(nftnl_batch_buffer(ctx->batch), diff --git a/src/rule.c b/src/rule.c index 8343614a9d9c5..699efca2a6e11 100644 --- a/src/rule.c +++ b/src/rule.c @@ -24,6 +24,7 @@ #include <mnl.h> #include <misspell.h> #include <json.h> +#include <erec.h> #include <libnftnl/common.h> #include <libnftnl/ruleset.h> @@ -295,6 +296,98 @@ static int cache_add_set_cmd(struct eval_ctx *ectx) return 0; } +/* make src point at dst, either via handle.position or handle.position_id */ +static void link_rules(struct rule *src, struct rule *dst) +{ + static uint32_t ref_id = 0; + + if (dst->handle.handle.id) { + /* dst is in kernel, make src reference it by handle */ + src->handle.position.id = dst->handle.handle.id; + src->handle.position.location = src->handle.index.location; + return; + } + + /* dst is not in kernel, make src reference it by per-transaction ID */ + if (!dst->handle.rule_id) + dst->handle.rule_id = ++ref_id; + src->handle.position_id = dst->handle.rule_id; +} + +int rule_cache_update(struct eval_ctx *ectx, struct rule *rule, enum cmd_ops op) +{ + struct handle *handle = rule ? &rule->handle : &ectx->cmd->handle; + struct rule *ref = NULL; + struct table *table; + struct chain *chain; + + if (!rule) + rule = ectx->cmd->rule; + + table = table_lookup(handle, &ectx->nft->cache); + if (!table) + return table_not_found(ectx); + + chain = chain_lookup(table, handle); + if (!chain) + return chain_not_found(ectx); + + if (handle->index.id) { + ref = rule_lookup_by_index(chain, handle->index.id); + if (!ref) + return cmd_error(ectx, &handle->index.location, + "Could not process rule: %s", + strerror(ENOENT)); + + link_rules(rule, ref); + } else if (handle->handle.id) { + ref = rule_lookup(chain, handle->handle.id); + if (!ref) + return cmd_error(ectx, &handle->handle.location, + "Could not process rule: %s", + strerror(ENOENT)); + } else if (handle->position.id) { + ref = rule_lookup(chain, handle->position.id); + if (!ref) + return cmd_error(ectx, &handle->position.location, + "Could not process rule: %s", + strerror(ENOENT)); + } + + switch (op) { + case CMD_INSERT: + rule_get(rule); + if (ref) + list_add_tail(&rule->list, &ref->list); + else + list_add(&rule->list, &chain->rules); + break; + case CMD_ADD: + rule_get(rule); + if (ref) + list_add(&rule->list, &ref->list); + else + list_add_tail(&rule->list, &chain->rules); + break; + case CMD_REPLACE: + rule_get(rule); + list_add(&rule->list, &ref->list); + /* fall through */ + case CMD_DELETE: + list_del(&ref->list); + rule_free(ref); + break; + default: + break; + } + return 0; +} + +static int cache_add_rule_cmd(struct eval_ctx *ectx) +{ + return rule_cache_update(ectx, ectx->cmd->rule, ectx->cmd->op); +} + static int cache_add_commands(struct nft_ctx *nft, struct list_head *msgs) { struct eval_ctx ectx = { @@ -316,6 +409,11 @@ static int cache_add_commands(struct nft_ctx *nft, struct list_head *msgs) continue; ret = cache_add_set_cmd(&ectx); break; + case CMD_OBJ_RULE: + if (!cache_is_complete(&nft->cache, CMD_LIST)) + continue; + ret = cache_add_rule_cmd(&ectx); + break; default: break; } diff --git a/tests/shell/testcases/cache/0003_cache_update_0 b/tests/shell/testcases/cache/0003_cache_update_0 index fa9b5df380a41..05edc9c7c33eb 100755 --- a/tests/shell/testcases/cache/0003_cache_update_0 +++ b/tests/shell/testcases/cache/0003_cache_update_0 @@ -34,6 +34,9 @@ EOF # add rule ip t4 c meta l4proto icmp accept -> rule to reference in next step # add rule ip t4 c index 0 drop -> index 0 is not found due to rule cache not # being updated +# add rule ip t4 c index 2 drop -> index 2 is not found due to igmp rule being +# in same transaction and therefore not having +# an allocated handle $NFT -i >/dev/null <<EOF add table ip t4; add chain ip t4 c add rule ip t4 c meta l4proto icmp accept @@ -41,3 +44,7 @@ EOF $NFT -f - >/dev/null <<EOF add rule ip t4 c index 0 drop EOF +$NFT -f - >/dev/null <<EOF +add rule ip t4 c meta l4proto igmp accept +add rule ip t4 c index 2 drop +EOF diff --git a/tests/shell/testcases/transactions/0024rule_0 b/tests/shell/testcases/transactions/0024rule_0 new file mode 100755 index 0000000000000..4c1ac41db3b47 --- /dev/null +++ b/tests/shell/testcases/transactions/0024rule_0 @@ -0,0 +1,17 @@ +#!/bin/bash + +RULESET="flush ruleset +add table x +add chain x y +add rule x y accept comment rule1 +add rule x y accept comment rule4 +add rule x y index 0 accept comment rule2 +insert rule x y index 2 accept comment rule3" + +$NFT -f - <<< "$RULESET" && \ + $NFT -f - <<< "$RULESET" && \ + echo "$RULESET" | tr '\n' ';' | $NFT -i >/dev/null && \ + exit 0 +echo "E: intra-transaction rule reference failed" +exit 1 + diff --git a/tests/shell/testcases/transactions/0025rule_0 b/tests/shell/testcases/transactions/0025rule_0 new file mode 100755 index 0000000000000..d72d5cfcc75d4 --- /dev/null +++ b/tests/shell/testcases/transactions/0025rule_0 @@ -0,0 +1,21 @@ +#!/bin/bash + +# make sure stored delete/replace rule commands are correctly applied + +set -e + +$NFT -f - <<EOF +flush ruleset +table x { + chain y { + accept + log + } +} +EOF + +$NFT -f - <<EOF +replace rule x y handle 2 log +delete rule x y handle 3 +add rule x y index 0 drop +EOF diff --git a/tests/shell/testcases/transactions/dumps/0024rule_0.nft b/tests/shell/testcases/transactions/dumps/0024rule_0.nft new file mode 100644 index 0000000000000..7860ff654c5e2 --- /dev/null +++ b/tests/shell/testcases/transactions/dumps/0024rule_0.nft @@ -0,0 +1,8 @@ +table ip x { + chain y { + accept comment "rule1" + accept comment "rule2" + accept comment "rule3" + accept comment "rule4" + } +} diff --git a/tests/shell/testcases/transactions/dumps/0025rule_0.nft b/tests/shell/testcases/transactions/dumps/0025rule_0.nft new file mode 100644 index 0000000000000..dcb61ae65fbde --- /dev/null +++ b/tests/shell/testcases/transactions/dumps/0025rule_0.nft @@ -0,0 +1,6 @@ +table ip x { + chain y { + log + drop + } +} -- 2.21.0