Re: [PATCH bpf-next v4 2/8] bpf: x86: Support in-register struct arguments in trampoline programs

[Date Prev][Date Next][Thread Prev][Thread Next][Date Index][Thread Index]

 





On 9/6/22 9:40 AM, Kui-Feng Lee wrote:
On Wed, 2022-08-31 at 08:26 -0700, Yonghong Song wrote:
In C, struct value can be passed as a function argument.
For small structs, struct value may be passed in
one or more registers. For trampoline based bpf programs,
this would cause complication since one-to-one mapping between
function argument and arch argument register is not valid
any more.

The latest llvm16 added bpf support to pass by values
for struct up to 16 bytes ([1]). This is also true for
x86_64 architecture where two registers will hold
the struct value if the struct size is >8 and <= 16.
This may not be true if one of struct member is 'double'
type but in current linux source code we don't have
such instance yet, so we assume all >8 && <= 16 struct
holds two general purpose argument registers.

Also change on-stack nr_args value to the number
of registers holding the arguments. This will
permit bpf_get_func_arg() helper to get all
argument values.

  [1] https://reviews.llvm.org/D132144

Signed-off-by: Yonghong Song <yhs@xxxxxx>
---
  arch/x86/net/bpf_jit_comp.c | 68 +++++++++++++++++++++++++++--------
--
  1 file changed, 51 insertions(+), 17 deletions(-)

diff --git a/arch/x86/net/bpf_jit_comp.c
b/arch/x86/net/bpf_jit_comp.c
index c1f6c1c51d99..ae89f4143eb4 100644
--- a/arch/x86/net/bpf_jit_comp.c
+++ b/arch/x86/net/bpf_jit_comp.c
@@ -1751,34 +1751,60 @@ st:                     if (is_imm8(insn-
off))
  static void save_regs(const struct btf_func_model *m, u8 **prog, int
nr_args,
                       int stack_size)
  {
-       int i;
+       int i, j, arg_size, nr_regs;
         /* Store function arguments to stack.
          * For a function that accepts two pointers the sequence will
be:
          * mov QWORD PTR [rbp-0x10],rdi
          * mov QWORD PTR [rbp-0x8],rsi
          */
-       for (i = 0; i < min(nr_args, 6); i++)
-               emit_stx(prog, bytes_to_bpf_size(m->arg_size[i]),
-                        BPF_REG_FP,
-                        i == 5 ? X86_REG_R9 : BPF_REG_1 + i,
-                        -(stack_size - i * 8));
+       for (i = 0, j = 0; i < min(nr_args, 6); i++) {

Is 6 still correct since an argument can take more than one register
now?  Perphaps j < min(...)?

'min(nr_args, 6)' probably a historical artifact. It can be
replaced with 'nr_args' since in the beginning of function
arch_prepare_bpf_trampoline(), we have

/* x86-64 supports up to 6 arguments. 7+ can be added in the future */
        if (nr_args > 6)
                return -ENOTSUPP;

so nr_args <= 6 is true.


I am not sure how to deal with a corner case that a 16 bytes struct
arguement happens to be at 6th place.  Does that mean first 8 bytes are
in a register and the reset bytes are in the stack?

This won't happen, see below change in arch_prepare_bpf_trampoline()
where it is checked to ensure the number of registers holding
all arguments mush be <= 6.



+               if (m->arg_flags[i] & BTF_FMODEL_STRUCT_ARG) {
+                       nr_regs = (m->arg_size[i] + 7) / 8;
+                       arg_size = 8;
+               } else {
+                       nr_regs = 1;
+                       arg_size = m->arg_size[i];
+               }
+
+               while (nr_regs) {
+                       emit_stx(prog, bytes_to_bpf_size(arg_size),
+                                BPF_REG_FP,
+                                j == 5 ? X86_REG_R9 : BPF_REG_1 + j,
+                                -(stack_size - j * 8));
+                       nr_regs--;
+                       j++;
+               }
+       }
  }
 static void restore_regs(const struct btf_func_model *m, u8 **prog,
int nr_args,
                          int stack_size)
  {
-       int i;
+       int i, j, arg_size, nr_regs;
        /* Restore function arguments from stack.
          * For a function that accepts two pointers the sequence will
be:
          * EMIT4(0x48, 0x8B, 0x7D, 0xF0); mov rdi,QWORD PTR [rbp-
0x10]
          * EMIT4(0x48, 0x8B, 0x75, 0xF8); mov rsi,QWORD PTR [rbp-0x8]
          */
-       for (i = 0; i < min(nr_args, 6); i++)
-               emit_ldx(prog, bytes_to_bpf_size(m->arg_size[i]),
-                        i == 5 ? X86_REG_R9 : BPF_REG_1 + i,
-                        BPF_REG_FP,
-                        -(stack_size - i * 8));
+       for (i = 0, j = 0; i < min(nr_args, 6); i++) {
+               if (m->arg_flags[i] & BTF_FMODEL_STRUCT_ARG) {
+                       nr_regs = (m->arg_size[i] + 7) / 8;
+                       arg_size = 8;
+               } else {
+                       nr_regs = 1;
+                       arg_size = m->arg_size[i];
+               }
+
+               while (nr_regs) {
+                       emit_ldx(prog, bytes_to_bpf_size(arg_size),
+                                j == 5 ? X86_REG_R9 : BPF_REG_1 + j,
+                                BPF_REG_FP,
+                                -(stack_size - j * 8));
+                       nr_regs--;
+                       j++;
+               }
+       }
  }
 static int invoke_bpf_prog(const struct btf_func_model *m, u8
**pprog,
@@ -2015,7 +2041,7 @@ int arch_prepare_bpf_trampoline(struct
bpf_tramp_image *im, void *image, void *i
                                 struct bpf_tramp_links *tlinks,
                                 void *orig_call)
  {
-       int ret, i, nr_args = m->nr_args;
+       int ret, i, nr_args = m->nr_args, extra_nregs = 0;
         int regs_off, ip_off, args_off, stack_size = nr_args * 8,
run_ctx_off;
         struct bpf_tramp_links *fentry = &tlinks[BPF_TRAMP_FENTRY];
         struct bpf_tramp_links *fexit = &tlinks[BPF_TRAMP_FEXIT];
@@ -2028,6 +2054,14 @@ int arch_prepare_bpf_trampoline(struct
bpf_tramp_image *im, void *image, void *i
         if (nr_args > 6)
                 return -ENOTSUPP;
+       for (i = 0; i < MAX_BPF_FUNC_ARGS; i++) {
+               if (m->arg_flags[i] & BTF_FMODEL_STRUCT_ARG)
+                       extra_nregs += (m->arg_size[i] + 7) / 8 - 1;
+       }
+       if (nr_args + extra_nregs > 6)
+               return -ENOTSUPP;

Here to ensure the number of registers holding all arguments
must be <= 6.

+       stack_size += extra_nregs * 8;
+
         /* Generated trampoline stack layout:
          *
          * RBP + 8         [ return address  ]
[...]



[Index of Archives]     [Linux Samsung SoC]     [Linux Rockchip SoC]     [Linux Actions SoC]     [Linux for Synopsys ARC Processors]     [Linux NFS]     [Linux NILFS]     [Linux USB Devel]     [Video for Linux]     [Linux Audio Users]     [Yosemite News]     [Linux Kernel]     [Linux SCSI]


  Powered by Linux