On Wed, 1 May 2019 15:11:17 +0200 Peter Zijlstra <peterz@xxxxxxxxxxxxx> wrote: > On Tue, Apr 30, 2019 at 11:33:21AM -0700, Linus Torvalds wrote: > > Anyway, since Andy really likes the entry code change, can we have > > that patch in parallel and judge the difference that way? Iirc, that > > was x86-64 specific too. > > Here goes, compile tested only... > > It obviously needs a self-test, but that shoulnd't be too hard to > arrange. > I was able to get it applied (with slight tweaking) but it then crashed. But that was due to incorrect updates in the ftrace_int3_handler(). > --- > arch/x86/entry/entry_32.S | 7 +++++++ > arch/x86/entry/entry_64.S | 14 ++++++++++++-- > arch/x86/include/asm/text-patching.h | 20 ++++++++++++++++++++ > arch/x86/kernel/ftrace.c | 24 +++++++++++++++++++----- > 4 files changed, 58 insertions(+), 7 deletions(-) > #endif /* _ASM_X86_TEXT_PATCHING_H */ > diff --git a/arch/x86/kernel/ftrace.c b/arch/x86/kernel/ftrace.c > index ef49517f6bb2..90d319687d7e 100644 > --- a/arch/x86/kernel/ftrace.c > +++ b/arch/x86/kernel/ftrace.c > @@ -29,6 +29,7 @@ > #include <asm/kprobes.h> > #include <asm/ftrace.h> > #include <asm/nops.h> > +#include <asm/text-patching.h> > > #ifdef CONFIG_DYNAMIC_FTRACE > > @@ -231,6 +232,7 @@ int ftrace_modify_call(struct dyn_ftrace *rec, > unsigned long old_addr, } > > static unsigned long ftrace_update_func; > +static unsigned long ftrace_update_func_call; > > static int update_ftrace_func(unsigned long ip, void *new) > { > @@ -259,6 +261,8 @@ int ftrace_update_ftrace_func(ftrace_func_t func) > unsigned char *new; > int ret; > > + ftrace_update_func_call = (unsigned long)func; > + > new = ftrace_call_replace(ip, (unsigned long)func); > ret = update_ftrace_func(ip, new); > > @@ -295,12 +299,19 @@ int ftrace_int3_handler(struct pt_regs *regs) > return 0; > > ip = regs->ip - 1; > - if (!ftrace_location(ip) && !is_ftrace_caller(ip)) > - return 0; > - > - regs->ip += MCOUNT_INSN_SIZE - 1; > + if (ftrace_location(ip)) { > + int3_emulate_call(regs, ftrace_update_func_call); Should be: int3_emulate_call(regs, (unsigned long)ftrace_regs_caller); > + return 1; > + } else if (is_ftrace_caller(ip)) { > + if (!ftrace_update_func_call) { > + int3_emulate_jmp(regs, regs->ip - INT3_INSN_SIZE + CALL_INSN_SIZE); I see what you did here, but I think: int3_emulate_jmp(regs, ip + CALL_INSN_SIZE); looks better. But that said, we could in the beginning do: ip = regs->ip - INT3_INSN_SIZE; instead of ip = regs->ip - 1; I made these updates and posted them to Linus. -- Steve > + return 1; > + } > + int3_emulate_call(regs, ftrace_update_func_call); > + return 1; > + } > > - return 1; > + return 0; > } > NOKPROBE_SYMBOL(ftrace_int3_handler); > > @@ -859,6 +870,8 @@ void arch_ftrace_update_trampoline(struct > ftrace_ops *ops) > func = ftrace_ops_get_func(ops); > > + ftrace_update_func_call = (unsigned long)func; > + > /* Do a safe modify in case the trampoline is executing */ > new = ftrace_call_replace(ip, (unsigned long)func); > ret = update_ftrace_func(ip, new); > @@ -960,6 +973,7 @@ static int ftrace_mod_jmp(unsigned long ip, void > *func) { > unsigned char *new; > > + ftrace_update_func_call = 0UL; > new = ftrace_jmp_replace(ip, (unsigned long)func); > > return update_ftrace_func(ip, new);