From: Ard Biesheuvel <ardb@xxxxxxxxxx>

kallsyms is a directory of all the symbols in the vmlinux binary, and so creating it poses somewhat of a chicken-and-egg problem, as its non-zero size affects the layout of the binary, and therefore the values of the symbols.

For this reason, the kernel is linked more than once, and the first pass does not include any kallsyms data at all. For the linker to accept this, the symbol declarations describing the kallsyms metadata are emitted as having weak linkage, so they can remain unsatisfied. During the subsequent passes, the weak references are satisfied by the kallsyms metadata that was constructed based on information gathered from the preceding passes.

Weak references lead to somewhat worse codegen, because taking their address may need to produce NULL (if the reference was unsatisfied), and this is not usually supported by RIP- or PC-relative symbol references.

Given that these references are ultimately always satisfied in the final link, let's drop the weak annotation on the declarations, and instead, provide fallback definitions with weak linkage. This informs the compiler that ultimately, the reference will always be satisfied.

While at it, drop the FRV-specific annotation that these symbols reside in .rodata - FRV is long gone.

Cc: Masahiro Yamada <masahiroy@xxxxxxxxxx> Cc: linux-kbuild@xxxxxxxxxxxxxxx Acked-by: Nick Desaulniers <ndesaulniers@xxxxxxxxxx> Acked-by: Kees Cook <keescook@xxxxxxxxxxxx> Acked-by: Arnd Bergmann <arnd@xxxxxxxx> Link: https://lore.kernel.org/all/20240415075837.2349766-5-ardb+git@xxxxxxxxxx Signed-off-by: Ard Biesheuvel <ardb@xxxxxxxxxx> --- v5: - avoid PROVIDE() in the linker script, use weak definitions instead - drop tested-by, replace reviewed-by with acked-by kernel/kallsyms.c | 31 ++++++++++++++++---- kernel/kallsyms_internal.h | 25 ++++++---------- 2 files changed, 34 insertions(+), 22 deletions(-) diff --git a/kernel/kallsyms.c b/kernel/kallsyms.c index 18edd57b5fe8..fada7fbb24cf 100644 --- a/kernel/kallsyms.c +++ b/kernel/kallsyms.c @@ -34,6 +34,31 @@ #include "kallsyms_internal.h" +/* + * The real definitions of the symbols below will not exist yet during the + * first pass of the link, but are guaranteed to exist in the final link. + * Provide preliminary weak definitions that will be superseded in the final + * link, to avoid having to rely on weak references, which require a GOT when + * used in position independent code. + */ + +#ifndef CONFIG_KALLSYMS_BASE_RELATIVE +const unsigned long __weak kallsyms_addresses[1]; +#else +const int __weak kallsyms_offsets[1]; +const unsigned long __weak kallsyms_relative_base; +#endif + +const u8 __weak kallsyms_names[1]; + +const unsigned int __weak kallsyms_num_syms; + +const char __weak kallsyms_token_table[1]; +const u16 __weak kallsyms_token_index[1]; + +const unsigned int __weak kallsyms_markers[1]; +const u8 __weak kallsyms_seqs_of_names[3]; + /* * Expand a compressed symbol data into the resulting uncompressed string, * if uncompressed string is too long (>= maxlen), it will be truncated, @@ -325,12 +350,6 @@ static unsigned long get_symbol_pos(unsigned long addr, unsigned long symbol_start = 0, symbol_end = 0; unsigned long i, low, high, mid; - /* This kernel should never had been booted. 
*/ - if (!IS_ENABLED(CONFIG_KALLSYMS_BASE_RELATIVE)) - BUG_ON(!kallsyms_addresses); - else - BUG_ON(!kallsyms_offsets); - /* Do a binary search on the sorted kallsyms_addresses array. */ low = 0; high = kallsyms_num_syms; diff --git a/kernel/kallsyms_internal.h b/kernel/kallsyms_internal.h index 27fabdcc40f5..cf4124dbcc5b 100644 --- a/kernel/kallsyms_internal.h +++ b/kernel/kallsyms_internal.h @@ -8,24 +8,17 @@ * These will be re-linked against their real values * during the second link stage. */ -extern const unsigned long kallsyms_addresses[] __weak; -extern const int kallsyms_offsets[] __weak; -extern const u8 kallsyms_names[] __weak; +extern const unsigned long kallsyms_addresses[]; +extern const int kallsyms_offsets[]; +extern const u8 kallsyms_names[]; -/* - * Tell the compiler that the count isn't in the small data section if the arch - * has one (eg: FRV). - */ -extern const unsigned int kallsyms_num_syms -__section(".rodata") __attribute__((weak)); - -extern const unsigned long kallsyms_relative_base -__section(".rodata") __attribute__((weak)); +extern const unsigned int kallsyms_num_syms; +extern const unsigned long kallsyms_relative_base; -extern const char kallsyms_token_table[] __weak; -extern const u16 kallsyms_token_index[] __weak; +extern const char kallsyms_token_table[]; +extern const u16 kallsyms_token_index[]; -extern const unsigned int kallsyms_markers[] __weak; -extern const u8 kallsyms_seqs_of_names[] __weak; +extern const unsigned int kallsyms_markers[]; +extern const u8 kallsyms_seqs_of_names[]; #endif // LINUX_KALLSYMS_INTERNAL_H_ -- 2.44.0.769.g3c40516874-goog