On Thu, 19 Mar 2015 18:59:43 -0700 Alexei Starovoitov <ast@xxxxxxxxxxxx> wrote: > Debugging of BPF programs needs some form of printk from the program, > so let programs call limited trace_printk() with %d %u %x %p modifiers only. > > Similar to kernel modules, during program load verifier checks whether program > is calling bpf_trace_printk() and if so, kernel allocates trace_printk buffers > and emits big 'this is debug only' banner. > > Signed-off-by: Alexei Starovoitov <ast@xxxxxxxxxxxx> > --- > include/uapi/linux/bpf.h | 1 + > kernel/trace/bpf_trace.c | 75 ++++++++++++++++++++++++++++++++++++++++++++++ > 2 files changed, 76 insertions(+) > > diff --git a/include/uapi/linux/bpf.h b/include/uapi/linux/bpf.h > index 238c6883877b..cc47ef41076a 100644 > --- a/include/uapi/linux/bpf.h > +++ b/include/uapi/linux/bpf.h > @@ -166,6 +166,7 @@ enum bpf_func_id { > BPF_FUNC_map_delete_elem, /* int map_delete_elem(&map, &key) */ > BPF_FUNC_probe_read, /* int bpf_probe_read(void *dst, int size, void *src) */ > BPF_FUNC_ktime_get_ns, /* u64 bpf_ktime_get_ns(void) */ > + BPF_FUNC_trace_printk, /* int bpf_trace_printk(const char *fmt, int fmt_size, ...) */ > __BPF_FUNC_MAX_ID, > }; > > diff --git a/kernel/trace/bpf_trace.c b/kernel/trace/bpf_trace.c > index 769c577a1fc8..d5b6284edd75 100644 > --- a/kernel/trace/bpf_trace.c > +++ b/kernel/trace/bpf_trace.c > @@ -10,6 +10,7 @@ > #include <linux/bpf.h> > #include <linux/filter.h> > #include <linux/uaccess.h> > +#include <linux/ctype.h> > #include "trace.h" > > static DEFINE_PER_CPU(int, bpf_prog_active); > @@ -83,6 +84,72 @@ static const struct bpf_func_proto bpf_ktime_get_ns_proto = { > .ret_type = RET_INTEGER, > }; > > +/* limited trace_printk() > + * only %d %u %x %ld %lu %lx %lld %llu %llx %p conversion specifiers allowed > + */ Ah! Again, don't contaminate the rest of the kernel with net comment styles! :-) I change my comment style when I submit net patches. So patches that go into tracing must conform to the tracing style. 
> +static u64 bpf_trace_printk(u64 r1, u64 fmt_size, u64 r3, u64 r4, u64 r5) > +{ > + char *fmt = (char *) (long) r1; > + int mod[3] = {}; > + int fmt_cnt = 0; > + int i; > + > + /* bpf_check()->check_func_arg()->check_stack_boundary() It spreads like a disease! > + * guarantees that fmt points to bpf program stack, > + * fmt_size bytes of it were initialized and fmt_size > 0 > + */ > + if (fmt[--fmt_size] != 0) > + return -EINVAL; > + > + /* check format string for allowed specifiers */ > + for (i = 0; i < fmt_size; i++) { > + if ((!isprint(fmt[i]) && !isspace(fmt[i])) || !isascii(fmt[i])) > + return -EINVAL; > + > + if (fmt[i] != '%') > + continue; > + > + if (fmt_cnt >= 3) > + return -EINVAL; > + > + /* fmt[i] != 0 && fmt[last] == 0, so we can access fmt[i + 1] */ > + i++; > + if (fmt[i] == 'l') { > + mod[fmt_cnt]++; > + i++; > + } else if (fmt[i] == 'p') { > + mod[fmt_cnt]++; > + i++; > + if (!isspace(fmt[i]) && fmt[i] != 0) I wonder if we should allow punctuation here too? Non-alphanumeric characters? > + return -EINVAL; > + fmt_cnt++; > + continue; > + } > + > + if (fmt[i] == 'l') { > + mod[fmt_cnt]++; > + i++; > + } > + > + if (fmt[i] != 'd' && fmt[i] != 'u' && fmt[i] != 'x') > + return -EINVAL; > + fmt_cnt++; > + } > + > + return __trace_printk(1/* fake ip will not be printed */, fmt, > + mod[0] == 2 ? r3 : mod[0] == 1 ? (long) r3 : (u32) r3, > + mod[1] == 2 ? r4 : mod[1] == 1 ? (long) r4 : (u32) r4, > + mod[2] == 2 ? r5 : mod[2] == 1 ? (long) r5 : (u32) r5); Nice trick. Except for the net-contaminated-comments, the rest looks good. 
Reviewed-by: Steven Rostedt <rostedt@xxxxxxxxxxx> -- Steve > +} > + > +static const struct bpf_func_proto bpf_trace_printk_proto = { > + .func = bpf_trace_printk, > + .gpl_only = true, > + .ret_type = RET_INTEGER, > + .arg1_type = ARG_PTR_TO_STACK, > + .arg2_type = ARG_CONST_STACK_SIZE, > +}; > + > static const struct bpf_func_proto *kprobe_prog_func_proto(enum bpf_func_id func_id) > { > switch (func_id) { > @@ -96,6 +163,14 @@ static const struct bpf_func_proto *kprobe_prog_func_proto(enum bpf_func_id func > return &bpf_probe_read_proto; > case BPF_FUNC_ktime_get_ns: > return &bpf_ktime_get_ns_proto; > + > + case BPF_FUNC_trace_printk: > + /* this program might be calling bpf_trace_printk, > + * so allocate per-cpu printk buffers > + */ > + trace_printk_init_buffers(); > + > + return &bpf_trace_printk_proto; > default: > return NULL; > } -- To unsubscribe from this list: send the line "unsubscribe linux-api" in the body of a message to majordomo@xxxxxxxxxxxxxxx More majordomo info at http://vger.kernel.org/majordomo-info.html