On 3/2/16, Peter Zijlstra <peterz@xxxxxxxxxxxxx> wrote: > On Wed, Mar 02, 2016 at 04:53:36PM +0100, Sedat Dilek wrote: >> ffffffff8110f570 <del_timer_sync>: >> ffffffff8110f570: 55 push %rbp >> ffffffff8110f571: 48 89 e5 mov %rsp,%rbp >> ffffffff8110f574: 41 57 push %r15 >> ffffffff8110f576: 41 56 push %r14 >> ffffffff8110f578: 53 push %rbx >> ffffffff8110f579: 48 83 ec 28 sub $0x28,%rsp > > stack offset is 0x28 bytes [*] > >> ffffffff8110f57d: 48 89 fb mov %rdi,%rbx >> ffffffff8110f580: e8 6b 6e 80 00 callq ffffffff819163f0 <mcount> >> ffffffff8110f585: e8 66 6e 80 00 callq ffffffff819163f0 <mcount> >> ffffffff8110f58a: e8 61 6e 80 00 callq ffffffff819163f0 <mcount> >> ffffffff8110f58f: e8 5c 6e 80 00 callq ffffffff819163f0 <mcount> > > Your compiler is on drugs! > >> ffffffff8110f594: 9c pushfq >> ffffffff8110f595: 8f 45 e0 popq -0x20(%rbp) > > Saves flags in -0x20(%rbp) > >> ffffffff8110f598: 4c 8b 7d e0 mov -0x20(%rbp),%r15 > > And in %r15 > > /me wonders what's wrong with: popf %r15 > >> ffffffff8110f59c: e8 4f 6e 80 00 callq ffffffff819163f0 <mcount> >> ffffffff8110f5a1: e8 4a 6e 80 00 callq ffffffff819163f0 <mcount> >> ffffffff8110f5a6: fa cli >> ffffffff8110f5a7: e8 84 cb fc ff callq ffffffff810dc130 >> <trace_hardirqs_off> >> ffffffff8110f5ac: 4c 8d 73 50 lea 0x50(%rbx),%r14 >> ffffffff8110f5b0: 48 c7 04 24 b0 f5 10 movq $0xffffffff8110f5b0,(%rsp) >> ffffffff8110f5b7: 81 >> ffffffff8110f5b8: 31 f6 xor %esi,%esi >> ffffffff8110f5ba: 31 d2 xor %edx,%edx >> ffffffff8110f5bc: 31 c9 xor %ecx,%ecx >> ffffffff8110f5be: 41 b8 01 00 00 00 mov $0x1,%r8d >> ffffffff8110f5c4: 45 31 c9 xor %r9d,%r9d >> ffffffff8110f5c7: 4c 89 f7 mov %r14,%rdi >> ffffffff8110f5ca: e8 c1 e5 fc ff callq ffffffff810ddb90 >> <lock_acquire> >> ffffffff8110f5cf: be 01 00 00 00 mov $0x1,%esi >> ffffffff8110f5d4: 48 c7 c2 cf f5 10 81 mov $0xffffffff8110f5cf,%rdx >> ffffffff8110f5db: 4c 89 f7 mov %r14,%rdi >> ffffffff8110f5de: e8 8d 08 fd ff callq ffffffff810dfe70 >> <lock_release> >> ffffffff8110f5e3: e8 08 6e 80 00 callq ffffffff819163f0 <mcount> > >> ffffffff8110f5e8: 4c 89 f8 mov %r15,%rax >> ffffffff8110f5eb: 49 89 c6 mov %rax,%r14 > > Moves r15 into r14 through rax > > >> ffffffff8110f5ee: f6 c4 02 test $0x2,%ah >> ffffffff8110f5f1: 75 19 jne ffffffff8110f60c >> <del_timer_sync+0x9c> >> ffffffff8110f5f3: e8 f8 6d 80 00 callq ffffffff819163f0 <mcount> >> ffffffff8110f5f8: e8 f3 6d 80 00 callq ffffffff819163f0 <mcount> > > >> ffffffff8110f5fd: 4c 89 75 d0 mov %r14,-0x30(%rbp) >> ffffffff8110f601: ff 75 d0 pushq -0x30(%rbp) >> ffffffff8110f604: 9d popfq > > put r14 into -0x30(rbp) and pushes/pops that, see [*] this is 8 bytes > over stack ?! > >> ffffffff8110f605: e8 26 cb fc ff callq ffffffff810dc130 >> <trace_hardirqs_off> >> ffffffff8110f60a: eb 17 jmp ffffffff8110f623 >> <del_timer_sync+0xb3> >> ffffffff8110f60c: e8 2f cb fc ff callq ffffffff810dc140 >> <trace_hardirqs_on> >> ffffffff8110f611: e8 da 6d 80 00 callq ffffffff819163f0 <mcount> >> ffffffff8110f616: e8 d5 6d 80 00 callq ffffffff819163f0 <mcount> >> ffffffff8110f61b: 4c 89 75 d8 mov %r14,-0x28(%rbp) >> ffffffff8110f61f: ff 75 d8 pushq -0x28(%rbp) >> ffffffff8110f622: 9d popfq > > puts r14 into -0x28(rbp) and pushes/pops that > >> ffffffff8110f623: e8 c8 6d 80 00 callq ffffffff819163f0 <mcount> >> ffffffff8110f628: 65 8b 04 25 d4 ae 00 mov %gs:0xaed4,%eax >> ffffffff8110f62f: 00 >> ffffffff8110f630: a9 00 00 0f 00 test $0xf0000,%eax >> ffffffff8110f635: 74 25 je ffffffff8110f65c >> <del_timer_sync+0xec> >> ffffffff8110f637: f6 43 2a 20 testb $0x20,0x2a(%rbx) >> ffffffff8110f63b: 75 1f jne ffffffff8110f65c >> <del_timer_sync+0xec> >> ffffffff8110f63d: 48 c7 c7 04 54 c5 81 mov $0xffffffff81c55404,%rdi >> ffffffff8110f644: be 61 04 00 00 mov $0x461,%esi >> ffffffff8110f649: e8 12 c4 f6 ff callq ffffffff8107ba60 >> <warn_slowpath_null> >> ffffffff8110f64e: eb 0c jmp ffffffff8110f65c >> <del_timer_sync+0xec> >> ffffffff8110f650: e8 9b 6d 80 00 callq ffffffff819163f0 <mcount> >> ffffffff8110f655: e8 96 6d 80 00 callq ffffffff819163f0 <mcount> >> ffffffff8110f65a: f3 90 pause >> ffffffff8110f65c: 48 89 df mov %rbx,%rdi >> ffffffff8110f65f: e8 4c fe ff ff callq ffffffff8110f4b0 >> <try_to_del_timer_sync> >> ffffffff8110f664: 85 c0 test %eax,%eax >> ffffffff8110f666: 78 e8 js ffffffff8110f650 >> <del_timer_sync+0xe0> >> ffffffff8110f668: 48 83 c4 28 add $0x28,%rsp >> ffffffff8110f66c: 5b pop %rbx >> ffffffff8110f66d: 41 5e pop %r14 >> ffffffff8110f66f: 41 5f pop %r15 >> ffffffff8110f671: 5d pop %rbp >> ffffffff8110f672: c3 retq >> ffffffff8110f673: 66 66 66 66 2e 0f 1f data32 data32 data32 nopw >> %cs:0x0(%rax,%rax,1) >> ffffffff8110f67a: 84 00 00 00 00 00 > > > That LLVM generate disgusting code, as a contrast, this is what my GCC > makes of this: > > ffffffff81155f50 <del_timer_sync>: > ffffffff81155f50: e8 bb 02 9c 00 callq ffffffff81b16210 > <__fentry__> > ffffffff81155f55: 55 push %rbp > ffffffff81155f56: 48 89 e5 mov %rsp,%rbp > ffffffff81155f59: 41 55 push %r13 > ffffffff81155f5b: 41 54 push %r12 > ffffffff81155f5d: 53 push %rbx > ffffffff81155f5e: 48 89 fb mov %rdi,%rbx > ffffffff81155f61: 48 83 ec 08 sub $0x8,%rsp > ffffffff81155f65: 9c pushfq > ffffffff81155f66: 41 5c pop %r12 > ffffffff81155f68: fa cli > ffffffff81155f69: e8 72 5c fd ff callq ffffffff8112bbe0 > <trace_hardirqs_off> > ffffffff81155f6e: 4c 8d 6b 50 lea 0x50(%rbx),%r13 > ffffffff81155f72: 45 31 c9 xor %r9d,%r9d > ffffffff81155f75: 31 c9 xor %ecx,%ecx > ffffffff81155f77: 31 d2 xor %edx,%edx > ffffffff81155f79: 31 f6 xor %esi,%esi > ffffffff81155f7b: 4c 89 ef mov %r13,%rdi > ffffffff81155f7e: 48 c7 04 24 55 5f 15 movq > $0xffffffff81155f55,(%rsp) > ffffffff81155f85: 81 > ffffffff81155f86: 41 b8 01 00 00 00 mov $0x1,%r8d > ffffffff81155f8c: e8 3f b3 fd ff callq ffffffff811312d0 > <lock_acquire> > ffffffff81155f91: 48 c7 c2 55 5f 15 81 mov > $0xffffffff81155f55,%rdx > ffffffff81155f98: be 01 00 00 00 mov $0x1,%esi > ffffffff81155f9d: 4c 89 ef mov %r13,%rdi > ffffffff81155fa0: e8 0b b5 fd ff callq ffffffff811314b0 > <lock_release> > ffffffff81155fa5: 41 f7 c4 00 02 00 00 test $0x200,%r12d > ffffffff81155fac: 75 52 jne ffffffff81156000 > <del_timer_sync+0xb0> > ffffffff81155fae: 41 54 push %r12 > ffffffff81155fb0: 9d popfq > ffffffff81155fb1: e8 2a 5c fd ff callq ffffffff8112bbe0 > <trace_hardirqs_off> > ffffffff81155fb6: 65 8b 05 5b 66 eb 7e mov > %gs:0x7eeb665b(%rip),%eax # c618 <__preempt_count> > ffffffff81155fbd: a9 00 00 0f 00 test $0xf0000,%eax > ffffffff81155fc2: 74 25 je ffffffff81155fe9 > <del_timer_sync+0x99> > ffffffff81155fc4: f6 43 2a 20 testb $0x20,0x2a(%rbx) > ffffffff81155fc8: 75 1f jne ffffffff81155fe9 > <del_timer_sync+0x99> > ffffffff81155fca: be 61 04 00 00 mov $0x461,%esi > ffffffff81155fcf: 48 c7 c7 09 87 f3 81 mov > $0xffffffff81f38709,%rdi > ffffffff81155fd6: e8 15 03 f8 ff callq ffffffff810d62f0 > <warn_slowpath_null> > ffffffff81155fdb: 48 89 df mov %rbx,%rdi > ffffffff81155fde: e8 fd fe ff ff callq ffffffff81155ee0 > <try_to_del_timer_sync> > ffffffff81155fe3: 85 c0 test %eax,%eax > ffffffff81155fe5: 79 0e jns ffffffff81155ff5 > <del_timer_sync+0xa5> > ffffffff81155fe7: f3 90 pause > ffffffff81155fe9: 48 89 df mov %rbx,%rdi > ffffffff81155fec: e8 ef fe ff ff callq ffffffff81155ee0 > <try_to_del_timer_sync> > ffffffff81155ff1: 85 c0 test %eax,%eax > ffffffff81155ff3: 78 f2 js ffffffff81155fe7 > <del_timer_sync+0x97> > ffffffff81155ff5: 48 83 c4 08 add $0x8,%rsp > ffffffff81155ff9: 5b pop %rbx > ffffffff81155ffa: 41 5c pop %r12 > ffffffff81155ffc: 41 5d pop %r13 > ffffffff81155ffe: 5d pop %rbp > ffffffff81155fff: c3 retq > ffffffff81156000: e8 4b 8b fd ff callq ffffffff8112eb50 > <trace_hardirqs_on> > ffffffff81156005: 41 54 push %r12 > ffffffff81156007: 9d popfq > ffffffff81156008: eb ac jmp ffffffff81155fb6 > <del_timer_sync+0x66> > ffffffff8115600a: 66 0f 1f 44 00 00 nopw 0x0(%rax,%rax,1) > OK, I cannot say much to your analysis. The full make-lines look differently. GCC for example has '-mfentry -DCC_USING_FENTRY'. [ CLANG ] mycompiler -Wp,-MD,kernel/.workqueue.o.d -nostdinc -isystem /opt/llvm-toolchain-3.8.0rc3/bin/../lib/clang/3.8.0/include -nostdinc -isystem /opt/llvm-toolchain-3.8.0rc3/bin/../lib/clang/3.8.0/include -I./arch/x86/include -Iarch/x86/include/generated/uapi -Iarch/x86/include/generated -Iinclude -I./arch/x86/include/uapi -Iarch/x86/include/generated/uapi -I./include/uapi -Iinclude/generated/uapi -include ./include/linux/kconfig.h -D__KERNEL__ -Qunused-arguments -Wno-unknown-warning-option -Wall -Wundef -Wstrict-prototypes -Wno-trigraphs -fno-strict-aliasing -fno-common -Werror-implicit-function-declaration -Wno-format-security -std=gnu89 -no-integrated-as -mno-sse -mno-mmx -mno-sse2 -mno-3dnow -mno-avx -m64 -mtune=generic -mno-red-zone -mcmodel=kernel -funit-at-a-time -DCONFIG_X86_X32_ABI -DCONFIG_AS_CFI=1 -DCONFIG_AS_CFI_SIGNAL_FRAME=1 -DCONFIG_AS_CFI_SECTIONS=1 -DCONFIG_AS_FXSAVEQ=1 -DCONFIG_AS_SSSE3=1 -DCONFIG_AS_CRC32=1 -DCONFIG_AS_AVX=1 -DCONFIG_AS_AVX2=1 -pipe -Wno-sign-compare -fno-asynchronous-unwind-tables -O2 -Wframe-larger-than=1024 -fno-stack-protector -Wno-unused-variable -Wno-format-invalid-specifier -Wno-gnu -Wno-asm-operand-widths -Wno-initializer-overrides -fno-builtin -Wno-tautological-compare -mno-global-merge -fno-omit-frame-pointer -fno-optimize-sibling-calls -pg -Wdeclaration-after-statement -Wno-pointer-sign -fno-strict-overflow -Werror=implicit-int -Werror=strict-prototypes -Werror=date-time -Wno-initializer-overrides -Wno-unused-value -Wno-format -Wno-unknown-warning-option -Wno-sign-compare -Wno-format-zero-length -Wno-uninitialized -D"KBUILD_STR(s)=#s" -D"KBUILD_BASENAME=KBUILD_STR(workqueue)" -D"KBUILD_MODNAME=KBUILD_STR(workqueue)" -c -o kernel/.tmp_workqueue.o kernel/workqueue.c mycompiler -Wp,-MD,kernel/time/.timer.o.d -nostdinc -isystem /opt/llvm-toolchain-3.8.0rc3/bin/../lib/clang/3.8.0/include -nostdinc -isystem /opt/llvm-toolchain-3.8.0rc3/bin/../lib/clang/3.8.0/include -I./arch/x86/include -Iarch/x86/include/generated/uapi -Iarch/x86/include/generated -Iinclude -I./arch/x86/include/uapi -Iarch/x86/include/generated/uapi -I./include/uapi -Iinclude/generated/uapi -include ./include/linux/kconfig.h -D__KERNEL__ -Qunused-arguments -Wno-unknown-warning-option -Wall -Wundef -Wstrict-prototypes -Wno-trigraphs -fno-strict-aliasing -fno-common -Werror-implicit-function-declaration -Wno-format-security -std=gnu89 -no-integrated-as -mno-sse -mno-mmx -mno-sse2 -mno-3dnow -mno-avx -m64 -mtune=generic -mno-red-zone -mcmodel=kernel -funit-at-a-time -DCONFIG_X86_X32_ABI -DCONFIG_AS_CFI=1 -DCONFIG_AS_CFI_SIGNAL_FRAME=1 -DCONFIG_AS_CFI_SECTIONS=1 -DCONFIG_AS_FXSAVEQ=1 -DCONFIG_AS_SSSE3=1 -DCONFIG_AS_CRC32=1 -DCONFIG_AS_AVX=1 -DCONFIG_AS_AVX2=1 -pipe -Wno-sign-compare -fno-asynchronous-unwind-tables -O2 -Wframe-larger-than=1024 -fno-stack-protector -Wno-unused-variable -Wno-format-invalid-specifier -Wno-gnu -Wno-asm-operand-widths -Wno-initializer-overrides -fno-builtin -Wno-tautological-compare -mno-global-merge -fno-omit-frame-pointer -fno-optimize-sibling-calls -pg -Wdeclaration-after-statement -Wno-pointer-sign -fno-strict-overflow -Werror=implicit-int -Werror=strict-prototypes -Werror=date-time -Wno-initializer-overrides -Wno-unused-value -Wno-format -Wno-unknown-warning-option -Wno-sign-compare -Wno-format-zero-length -Wno-uninitialized -D"KBUILD_STR(s)=#s" -D"KBUILD_BASENAME=KBUILD_STR(timer)" -D"KBUILD_MODNAME=KBUILD_STR(timer)" -c -o kernel/time/.tmp_timer.o kernel/time/timer.c [ GCC ] mycompiler -Wp,-MD,kernel/.workqueue.o.d -nostdinc -isystem /usr/lib/gcc/x86_64-linux-gnu/4.9/include -nostdinc -isystem /usr/lib/gcc/x86_64-linux-gnu/4.9/include -I./arch/x86/include -Iarch/x86/include/generated/uapi -Iarch/x86/include/generated -Iinclude -I./arch/x86/include/uapi -Iarch/x86/include/generated/uapi -I./include/uapi -Iinclude/generated/uapi -include ./include/linux/kconfig.h -D__KERNEL__ -Wall -Wundef -Wstrict-prototypes -Wno-trigraphs -fno-strict-aliasing -fno-common -Werror-implicit-function-declaration -Wno-format-security -std=gnu89 -mno-sse -mno-mmx -mno-sse2 -mno-3dnow -mno-avx -m64 -falign-jumps=1 -falign-loops=1 -mno-80387 -mno-fp-ret-in-387 -mpreferred-stack-boundary=3 -mtune=generic -mno-red-zone -mcmodel=kernel -funit-at-a-time -maccumulate-outgoing-args -DCONFIG_X86_X32_ABI -DCONFIG_AS_CFI=1 -DCONFIG_AS_CFI_SIGNAL_FRAME=1 -DCONFIG_AS_CFI_SECTIONS=1 -DCONFIG_AS_FXSAVEQ=1 -DCONFIG_AS_SSSE3=1 -DCONFIG_AS_CRC32=1 -DCONFIG_AS_AVX=1 -DCONFIG_AS_AVX2=1 -pipe -Wno-sign-compare -fno-asynchronous-unwind-tables -fno-delete-null-pointer-checks -O2 --param=allow-store-data-races=0 -Wframe-larger-than=1024 -fno-stack-protector -Wno-unused-but-set-variable -fno-omit-frame-pointer -fno-optimize-sibling-calls -fno-var-tracking-assignments -pg -mfentry -DCC_USING_FENTRY -Wdeclaration-after-statement -Wno-pointer-sign -fno-strict-overflow -fconserve-stack -Werror=implicit-int -Werror=strict-prototypes -Werror=date-time -DCC_HAVE_ASM_GOTO -D"KBUILD_STR(s)=#s" -D"KBUILD_BASENAME=KBUILD_STR(workqueue)" -D"KBUILD_MODNAME=KBUILD_STR(workqueue)" -c -o kernel/.tmp_workqueue.o kernel/workqueue.c mycompiler -Wp,-MD,kernel/time/.timer.o.d -nostdinc -isystem /usr/lib/gcc/x86_64-linux-gnu/4.9/include -nostdinc -isystem /usr/lib/gcc/x86_64-linux-gnu/4.9/include -I./arch/x86/include -Iarch/x86/include/generated/uapi -Iarch/x86/include/generated -Iinclude -I./arch/x86/include/uapi -Iarch/x86/include/generated/uapi -I./include/uapi -Iinclude/generated/uapi -include ./include/linux/kconfig.h -D__KERNEL__ -Wall -Wundef -Wstrict-prototypes -Wno-trigraphs -fno-strict-aliasing -fno-common -Werror-implicit-function-declaration -Wno-format-security -std=gnu89 -mno-sse -mno-mmx -mno-sse2 -mno-3dnow -mno-avx -m64 -falign-jumps=1 -falign-loops=1 -mno-80387 -mno-fp-ret-in-387 -mpreferred-stack-boundary=3 -mtune=generic -mno-red-zone -mcmodel=kernel -funit-at-a-time -maccumulate-outgoing-args -DCONFIG_X86_X32_ABI -DCONFIG_AS_CFI=1 -DCONFIG_AS_CFI_SIGNAL_FRAME=1 -DCONFIG_AS_CFI_SECTIONS=1 -DCONFIG_AS_FXSAVEQ=1 -DCONFIG_AS_SSSE3=1 -DCONFIG_AS_CRC32=1 -DCONFIG_AS_AVX=1 -DCONFIG_AS_AVX2=1 -pipe -Wno-sign-compare -fno-asynchronous-unwind-tables -fno-delete-null-pointer-checks -O2 --param=allow-store-data-races=0 -Wframe-larger-than=1024 -fno-stack-protector -Wno-unused-but-set-variable -fno-omit-frame-pointer -fno-optimize-sibling-calls -fno-var-tracking-assignments -pg -mfentry -DCC_USING_FENTRY -Wdeclaration-after-statement -Wno-pointer-sign -fno-strict-overflow -fconserve-stack -Werror=implicit-int -Werror=strict-prototypes -Werror=date-time -DCC_HAVE_ASM_GOTO -D"KBUILD_STR(s)=#s" -D"KBUILD_BASENAME=KBUILD_STR(timer)" -D"KBUILD_MODNAME=KBUILD_STR(timer)" -c -o kernel/time/.tmp_timer.o kernel/time/timer.c I can try to use the make-line of GCC and re-compile. - Sedat - -- To unsubscribe from this list: send the line "unsubscribe linux-usb" in the body of a message to majordomo@xxxxxxxxxxxxxxx More majordomo info at http://vger.kernel.org/majordomo-info.html