On Thu, Aug 15, 2024 at 9:27 PM Alexandre Ghiti <alex@xxxxxxxx> wrote: > > Hi Andrew, > > On 01/08/2024 08:53, Alexandre Ghiti wrote: > > On Wed, Jul 31, 2024 at 5:29 PM Andrew Jones <ajones@xxxxxxxxxxxxxxxx> wrote: > >> On Wed, Jul 31, 2024 at 09:24:05AM GMT, Alexandre Ghiti wrote: > >>> In order to produce a generic kernel, a user can select > >>> CONFIG_COMBO_SPINLOCKS which will fallback at runtime to the ticket > >>> spinlock implementation if Zabha or Ziccrse are not present. > >>> > >>> Note that we can't use alternatives here because the discovery of > >>> extensions is done too late and we need to start with the qspinlock > >>> implementation because the ticket spinlock implementation would pollute > >>> the spinlock value, so let's use static keys. > >>> > >>> This is largely based on Guo's work and Leonardo reviews at [1]. > >>> > >>> Link: https://lore.kernel.org/linux-riscv/20231225125847.2778638-1-guoren@xxxxxxxxxx/ [1] > >>> Signed-off-by: Guo Ren <guoren@xxxxxxxxxx> > >>> Signed-off-by: Alexandre Ghiti <alexghiti@xxxxxxxxxxxx> > >>> --- > >>> .../locking/queued-spinlocks/arch-support.txt | 2 +- > >>> arch/riscv/Kconfig | 29 +++++++++++++ > >>> arch/riscv/include/asm/Kbuild | 4 +- > >>> arch/riscv/include/asm/spinlock.h | 43 +++++++++++++++++++ > >>> arch/riscv/kernel/setup.c | 38 ++++++++++++++++ > >>> include/asm-generic/qspinlock.h | 2 + > >>> include/asm-generic/ticket_spinlock.h | 2 + > >>> 7 files changed, 118 insertions(+), 2 deletions(-) > >>> create mode 100644 arch/riscv/include/asm/spinlock.h > >>> > >>> diff --git a/Documentation/features/locking/queued-spinlocks/arch-support.txt b/Documentation/features/locking/queued-spinlocks/arch-support.txt > >>> index 22f2990392ff..cf26042480e2 100644 > >>> --- a/Documentation/features/locking/queued-spinlocks/arch-support.txt > >>> +++ b/Documentation/features/locking/queued-spinlocks/arch-support.txt > >>> @@ -20,7 +20,7 @@ > >>> | openrisc: | ok | > >>> | parisc: | TODO | > >>> | powerpc: | ok | > >>> - | riscv: | TODO | > >>> + | riscv: | ok | > >>> | s390: | TODO | > >>> | sh: | TODO | > >>> | sparc: | ok | > >>> diff --git a/arch/riscv/Kconfig b/arch/riscv/Kconfig > >>> index ef55ab94027e..c9ff8081efc1 100644 > >>> --- a/arch/riscv/Kconfig > >>> +++ b/arch/riscv/Kconfig > >>> @@ -79,6 +79,7 @@ config RISCV > >>> select ARCH_WANT_OPTIMIZE_HUGETLB_VMEMMAP > >>> select ARCH_WANTS_NO_INSTR > >>> select ARCH_WANTS_THP_SWAP if HAVE_ARCH_TRANSPARENT_HUGEPAGE > >>> + select ARCH_WEAK_RELEASE_ACQUIRE if ARCH_USE_QUEUED_SPINLOCKS > >> Why do we need this? Also, we presumably would prefer not to have it > >> when we end up using ticket spinlocks when combo spinlocks is selected. > >> Is there no way to avoid it? > > I'll let Andrea answer this as he asked for it. > > > >>> select BINFMT_FLAT_NO_DATA_START_OFFSET if !MMU > >>> select BUILDTIME_TABLE_SORT if MMU > >>> select CLINT_TIMER if RISCV_M_MODE > >>> @@ -488,6 +489,34 @@ config NODES_SHIFT > >>> Specify the maximum number of NUMA Nodes available on the target > >>> system. Increases memory reserved to accommodate various tables. > >>> > >>> +choice > >>> + prompt "RISC-V spinlock type" > >>> + default RISCV_COMBO_SPINLOCKS > >>> + > >>> +config RISCV_TICKET_SPINLOCKS > >>> + bool "Using ticket spinlock" > >>> + > >>> +config RISCV_QUEUED_SPINLOCKS > >>> + bool "Using queued spinlock" > >>> + depends on SMP && MMU && NONPORTABLE > >>> + select ARCH_USE_QUEUED_SPINLOCKS > >>> + help > >>> + The queued spinlock implementation requires the forward progress > >>> + guarantee of cmpxchg()/xchg() atomic operations: CAS with Zabha or > >>> + LR/SC with Ziccrse provide such guarantee. > >>> + > >>> + Select this if and only if Zabha or Ziccrse is available on your > >>> + platform. > >> Maybe some text recommending combo spinlocks here? As it stands it sounds > >> like enabling queued spinlocks is a bad idea for anybody that doesn't know > >> what platforms will run the kernel they're building, which is all distros. > > That's NONPORTABLE, so people enabling this config are supposed to > > know that right? > > > >>> + > >>> +config RISCV_COMBO_SPINLOCKS > >>> + bool "Using combo spinlock" > >>> + depends on SMP && MMU > >>> + select ARCH_USE_QUEUED_SPINLOCKS > >>> + help > >>> + Embed both queued spinlock and ticket lock so that the spinlock > >>> + implementation can be chosen at runtime. > >> nit: Add a blank line here > > Done > > > >>> +endchoice > >>> + > >>> config RISCV_ALTERNATIVE > >>> bool > >>> depends on !XIP_KERNEL > >>> diff --git a/arch/riscv/include/asm/Kbuild b/arch/riscv/include/asm/Kbuild > >>> index 5c589770f2a8..1c2618c964f0 100644 > >>> --- a/arch/riscv/include/asm/Kbuild > >>> +++ b/arch/riscv/include/asm/Kbuild > >>> @@ -5,10 +5,12 @@ syscall-y += syscall_table_64.h > >>> generic-y += early_ioremap.h > >>> generic-y += flat.h > >>> generic-y += kvm_para.h > >>> +generic-y += mcs_spinlock.h > >>> generic-y += parport.h > >>> -generic-y += spinlock.h > >>> generic-y += spinlock_types.h > >>> +generic-y += ticket_spinlock.h > >>> generic-y += qrwlock.h > >>> generic-y += qrwlock_types.h > >>> +generic-y += qspinlock.h > >>> generic-y += user.h > >>> generic-y += vmlinux.lds.h > >>> diff --git a/arch/riscv/include/asm/spinlock.h b/arch/riscv/include/asm/spinlock.h > >>> new file mode 100644 > >>> index 000000000000..503aef31db83 > >>> --- /dev/null > >>> +++ b/arch/riscv/include/asm/spinlock.h > >>> @@ -0,0 +1,43 @@ > >>> +/* SPDX-License-Identifier: GPL-2.0 */ > >>> + > >>> +#ifndef __ASM_RISCV_SPINLOCK_H > >>> +#define __ASM_RISCV_SPINLOCK_H > >>> + > >>> +#ifdef CONFIG_RISCV_COMBO_SPINLOCKS > >>> +#define _Q_PENDING_LOOPS (1 << 9) > >>> + > >>> +#define __no_arch_spinlock_redefine > >>> +#include <asm/ticket_spinlock.h> > >>> +#include <asm/qspinlock.h> > >>> +#include <asm/alternative.h> > >> We need asm/jump_label.h instead of asm/alternative.h, but... > >> > >>> + > >>> +DECLARE_STATIC_KEY_TRUE(qspinlock_key); > >>> + > >>> +#define SPINLOCK_BASE_DECLARE(op, type, type_lock) \ > >>> +static __always_inline type arch_spin_##op(type_lock lock) \ > >>> +{ \ > >>> + if (static_branch_unlikely(&qspinlock_key)) \ > >>> + return queued_spin_##op(lock); \ > >>> + return ticket_spin_##op(lock); \ > >>> +} > >> ...do you know what impact this inlined static key check has on the > >> kernel size? > > No, I'll check, thanks. > > > So I have just checked the size of the jump table section: > > * defconfig: > > - ticket: 26928 bytes > - combo: 28320 bytes > > So that's a ~5% increase. > > * ubuntu config > > - ticket: 107840 bytes > - combo: 174752 bytes > > And that's a ~62% increase. The size of the jump table section has increased from 5% to 62%. I think some configuration triggers the jump table's debug code. If it's not a debugging configuration, that's a bug of the Ubuntu config. > > This is the ELF size difference between ticket and combo spinlocks: > > * ticket: 776915592 bytes > * combo: 786958968 bytes > > So that's an increase of ~1.3% on the ELF. > > And the .text section size: > > * ticket: 12290960 bytes > * combo: 12366644 bytes > > And that's a ~0.6% increase! > > Finally, I'd say the impact is very limited :) > > Thanks, > > Alex > > > > > >> Actually, why not use ALTERNATIVE with any nonzero cpufeature value. > >> Then add code to riscv_cpufeature_patch_check() to return true when > >> qspinlocks should be enabled (based on the value of some global set > >> during riscv_spinlock_init)? > > As discussed with Guo in the previous iteration, the patching of the > > alternatives intervenes far after the first use of the spinlocks and > > the ticket spinlock implementation pollutes the spinlock value, so > > we'd have to unconditionally start with the qspinlock implementation > > and after switch to the ticket implementation if not supported by the > > platform. It works but it's dirty, I really don't like this hack. > > > > We could though: > > - add an initial value to the alternatives (not sure it's feasible though) > > - make the patching of alternatives happen sooner by parsing the isa > > string sooner, either in DT or ACPI (I have a working PoC for very > > early parsing of ACPI). > > > > I intend to do the latter as I think we should be aware of the > > extensions sooner in the boot process, so I'll change that to the > > alternatives when it's done. WDYT, any other idea? > > > > > >>> + > >>> +SPINLOCK_BASE_DECLARE(lock, void, arch_spinlock_t *) > >>> +SPINLOCK_BASE_DECLARE(unlock, void, arch_spinlock_t *) > >>> +SPINLOCK_BASE_DECLARE(is_locked, int, arch_spinlock_t *) > >>> +SPINLOCK_BASE_DECLARE(is_contended, int, arch_spinlock_t *) > >>> +SPINLOCK_BASE_DECLARE(trylock, bool, arch_spinlock_t *) > >>> +SPINLOCK_BASE_DECLARE(value_unlocked, int, arch_spinlock_t) > >>> + > >>> +#elif defined(CONFIG_RISCV_QUEUED_SPINLOCKS) > >>> + > >>> +#include <asm/qspinlock.h> > >>> + > >>> +#else > >>> + > >>> +#include <asm/ticket_spinlock.h> > >>> + > >>> +#endif > >>> + > >>> +#include <asm/qrwlock.h> > >>> + > >>> +#endif /* __ASM_RISCV_SPINLOCK_H */ > >>> diff --git a/arch/riscv/kernel/setup.c b/arch/riscv/kernel/setup.c > >>> index a2cde65b69e9..b811fa331982 100644 > >>> --- a/arch/riscv/kernel/setup.c > >>> +++ b/arch/riscv/kernel/setup.c > >>> @@ -244,6 +244,43 @@ static void __init parse_dtb(void) > >>> #endif > >>> } > >>> > >>> +#if defined(CONFIG_RISCV_COMBO_SPINLOCKS) > >>> +DEFINE_STATIC_KEY_TRUE(qspinlock_key); > >>> +EXPORT_SYMBOL(qspinlock_key); > >>> +#endif > >>> + > >>> +static void __init riscv_spinlock_init(void) > >>> +{ > >>> + char *using_ext = NULL; > >>> + > >>> + if (IS_ENABLED(CONFIG_RISCV_TICKET_SPINLOCKS)) { > >>> + pr_info("Ticket spinlock: enabled\n"); > >>> + return; > >>> + } > >>> + > >>> + if (IS_ENABLED(CONFIG_RISCV_ISA_ZABHA) && > >>> + IS_ENABLED(CONFIG_RISCV_ISA_ZACAS) && > >>> + riscv_isa_extension_available(NULL, ZABHA) && > >>> + riscv_isa_extension_available(NULL, ZACAS)) { > >>> + using_ext = "using Zabha"; > >>> + } else if (riscv_isa_extension_available(NULL, ZICCRSE)) { > >>> + using_ext = "using Ziccrse"; > >>> + } > >>> +#if defined(CONFIG_RISCV_COMBO_SPINLOCKS) > >>> + else { > >> else if (IS_ENABLED(CONFIG_RISCV_COMBO_SPINLOCKS)) > >> > >>> + static_branch_disable(&qspinlock_key); > >>> + pr_info("Ticket spinlock: enabled\n"); > >>> + > >> nit: remove this blank line > >> > >>> + return; > >>> + } > >>> +#endif > >>> + > >>> + if (!using_ext) > >>> + pr_err("Queued spinlock without Zabha or Ziccrse"); > >>> + else > >>> + pr_info("Queued spinlock %s: enabled\n", using_ext); > >>> +} > >>> + > >>> extern void __init init_rt_signal_env(void); > >>> > >>> void __init setup_arch(char **cmdline_p) > >>> @@ -297,6 +334,7 @@ void __init setup_arch(char **cmdline_p) > >>> riscv_set_dma_cache_alignment(); > >>> > >>> riscv_user_isa_enable(); > >>> + riscv_spinlock_init(); > >>> } > >>> > >>> bool arch_cpu_is_hotpluggable(int cpu) > >>> diff --git a/include/asm-generic/qspinlock.h b/include/asm-generic/qspinlock.h > >>> index 0655aa5b57b2..bf47cca2c375 100644 > >>> --- a/include/asm-generic/qspinlock.h > >>> +++ b/include/asm-generic/qspinlock.h > >>> @@ -136,6 +136,7 @@ static __always_inline bool virt_spin_lock(struct qspinlock *lock) > >>> } > >>> #endif > >>> > >>> +#ifndef __no_arch_spinlock_redefine > >> I'm not sure what's better/worse, but instead of inventing this > >> __no_arch_spinlock_redefine thing we could just name all the functions > >> something like __arch_spin* and then add defines for both to asm/spinlock.h, > >> i.e. > >> > >> #define queued_spin_lock(l) __arch_spin_lock(l) > >> ... > >> > >> #define ticket_spin_lock(l) __arch_spin_lock(l) > >> ... > >> > >> Besides not having to touch asm-generic/qspinlock.h and > >> asm-generic/ticket_spinlock.h it allows one to find the implementations > >> a bit easier as following a tag to arch_spin_lock() will take them to > >> queued_spin_lock() which will then take them to > >> arch/riscv/include/asm/spinlock.h and there they'll figure out how > >> __arch_spin_lock() was defined. > >> > >>> /* > >>> * Remapping spinlock architecture specific functions to the corresponding > >>> * queued spinlock functions. > >>> @@ -146,5 +147,6 @@ static __always_inline bool virt_spin_lock(struct qspinlock *lock) > >>> #define arch_spin_lock(l) queued_spin_lock(l) > >>> #define arch_spin_trylock(l) queued_spin_trylock(l) > >>> #define arch_spin_unlock(l) queued_spin_unlock(l) > >>> +#endif > >>> > >>> #endif /* __ASM_GENERIC_QSPINLOCK_H */ > >>> diff --git a/include/asm-generic/ticket_spinlock.h b/include/asm-generic/ticket_spinlock.h > >>> index cfcff22b37b3..325779970d8a 100644 > >>> --- a/include/asm-generic/ticket_spinlock.h > >>> +++ b/include/asm-generic/ticket_spinlock.h > >>> @@ -89,6 +89,7 @@ static __always_inline int ticket_spin_is_contended(arch_spinlock_t *lock) > >>> return (s16)((val >> 16) - (val & 0xffff)) > 1; > >>> } > >>> > >>> +#ifndef __no_arch_spinlock_redefine > >>> /* > >>> * Remapping spinlock architecture specific functions to the corresponding > >>> * ticket spinlock functions. > >>> @@ -99,5 +100,6 @@ static __always_inline int ticket_spin_is_contended(arch_spinlock_t *lock) > >>> #define arch_spin_lock(l) ticket_spin_lock(l) > >>> #define arch_spin_trylock(l) ticket_spin_trylock(l) > >>> #define arch_spin_unlock(l) ticket_spin_unlock(l) > >>> +#endif > >>> > >>> #endif /* __ASM_GENERIC_TICKET_SPINLOCK_H */ > >>> -- > >>> 2.39.2 > >>> > >> Thanks, > >> drew > > _______________________________________________ > > linux-riscv mailing list > > linux-riscv@xxxxxxxxxxxxxxxxxxx > > http://lists.infradead.org/mailman/listinfo/linux-riscv -- Best Regards Guo Ren