On Mon, Jun 26, 2023 at 12:19:45PM +0100, Conor Dooley wrote: > Before adding more complexity to it, split riscv_fill_hwcap() into 3 > distinct sections: > - riscv_fill_hwcap() still is the top level function, into which the > additional complexity will be added. > - riscv_fill_hwcap_from_isa_string() handles getting the information > from the riscv,isa/ACPI equivalent across harts & the various quirks > there > - riscv_parse_isa_string() does what it says on the tin. > > Signed-off-by: Conor Dooley <conor.dooley@xxxxxxxxxxxxx> > --- > arch/riscv/kernel/cpufeature.c | 350 +++++++++++++++++---------------- > 1 file changed, 182 insertions(+), 168 deletions(-) > > diff --git a/arch/riscv/kernel/cpufeature.c b/arch/riscv/kernel/cpufeature.c > index 5405d8a58537..366477ba1eea 100644 > --- a/arch/riscv/kernel/cpufeature.c > +++ b/arch/riscv/kernel/cpufeature.c > @@ -180,29 +180,172 @@ const struct riscv_isa_ext_data riscv_isa_ext[] = { > > const size_t riscv_isa_ext_count = ARRAY_SIZE(riscv_isa_ext); > > -void __init riscv_fill_hwcap(void) > +static void __init riscv_parse_isa_string(unsigned long *this_hwcap, struct riscv_isainfo *isainfo, > + unsigned long *isa2hwcap, const char *isa) > +{ > + /* > + * For all possible cpus, we have already validated in > + * the boot process that they at least contain "rv" and > + * whichever of "32"/"64" this kernel supports, and so this > + * section can be skipped. > + */ > + isa += 4; > + > + while (*isa) { > + const char *ext = isa++; > + const char *ext_end = isa; > + bool ext_long = false, ext_err = false; > + > + switch (*ext) { > + case 's': > + /* > + * Workaround for invalid single-letter 's' & 'u'(QEMU). > + * No need to set the bit in riscv_isa as 's' & 'u' are > + * not valid ISA extensions. It works until multi-letter > + * extension starting with "Su" appears. > + */ > + if (ext[-1] != '_' && ext[1] == 'u') { > + ++isa; > + ext_err = true; > + break; > + } > + fallthrough; > + case 'S': > + case 'x': > + case 'X': > + case 'z': > + case 'Z': > + /* > + * Before attempting to parse the extension itself, we find its end. > + * As multi-letter extensions must be split from other multi-letter > + * extensions with an "_", the end of a multi-letter extension will > + * either be the null character or the "_" at the start of the next > + * multi-letter extension. > + * > + * Next, as the extensions version is currently ignored, we > + * eliminate that portion. This is done by parsing backwards from > + * the end of the extension, removing any numbers. This may be a > + * major or minor number however, so the process is repeated if a > + * minor number was found. > + * > + * ext_end is intended to represent the first character *after* the > + * name portion of an extension, but will be decremented to the last > + * character itself while eliminating the extensions version number. > + * A simple re-increment solves this problem. > + */ > + ext_long = true; > + for (; *isa && *isa != '_'; ++isa) > + if (unlikely(!isalnum(*isa))) > + ext_err = true; > + > + ext_end = isa; > + if (unlikely(ext_err)) > + break; > + > + if (!isdigit(ext_end[-1])) > + break; > + > + while (isdigit(*--ext_end)) > + ; > + > + if (tolower(ext_end[0]) != 'p' || !isdigit(ext_end[-1])) { > + ++ext_end; > + break; > + } > + > + while (isdigit(*--ext_end)) > + ; > + > + ++ext_end; > + break; > + default: > + /* > + * Things are a little easier for single-letter extensions, as they > + * are parsed forwards. > + * > + * After checking that our starting position is valid, we need to > + * ensure that, when isa was incremented at the start of the loop, > + * that it arrived at the start of the next extension. > + * > + * If we are already on a non-digit, there is nothing to do. Either > + * we have a multi-letter extension's _, or the start of an > + * extension. > + * > + * Otherwise we have found the current extension's major version > + * number. Parse past it, and a subsequent p/minor version number > + * if present. The `p` extension must not appear immediately after > + * a number, so there is no fear of missing it. > + * > + */ > + if (unlikely(!isalpha(*ext))) { > + ext_err = true; > + break; > + } > + > + if (!isdigit(*isa)) > + break; > + > + while (isdigit(*++isa)) > + ; > + > + if (tolower(*isa) != 'p') > + break; > + > + if (!isdigit(*++isa)) { > + --isa; > + break; > + } > + > + while (isdigit(*++isa)) > + ; > + > + break; > + } > + > + /* > + * The parser expects that at the start of an iteration isa points to the > + * first character of the next extension. As we stop parsing an extension > + * on meeting a non-alphanumeric character, an extra increment is needed > + * where the succeeding extension is a multi-letter prefixed with an "_". > + */ > + if (*isa == '_') > + ++isa; > + > +#define SET_ISA_EXT_MAP(name, bit) \ > + do { \ > + if ((ext_end - ext == sizeof(name) - 1) && \ > + !strncasecmp(ext, name, sizeof(name) - 1) && \ > + riscv_isa_extension_check(bit)) \ > + set_bit(bit, isainfo->isa); \ > + } while (false) \ > + > + if (unlikely(ext_err)) > + continue; > + if (!ext_long) { > + int nr = tolower(*ext) - 'a'; > + > + if (riscv_isa_extension_check(nr)) { > + *this_hwcap |= isa2hwcap[nr]; > + set_bit(nr, isainfo->isa); > + } > + } else { > + for (int i = 0; i < riscv_isa_ext_count; i++) > + SET_ISA_EXT_MAP(riscv_isa_ext[i].name, > + riscv_isa_ext[i].id); > + } > +#undef SET_ISA_EXT_MAP > + } > +} > + > +static void __init riscv_fill_hwcap_from_isa_string(unsigned long *isa2hwcap) > { > struct device_node *node; > const char *isa; > - char print_str[NUM_ALPHA_EXTS + 1]; > - int i, j, rc; > - unsigned long isa2hwcap[26] = {0}; > + int rc; > struct acpi_table_header *rhct; > acpi_status status; > unsigned int cpu; > > - isa2hwcap['i' - 'a'] = COMPAT_HWCAP_ISA_I; > - isa2hwcap['m' - 'a'] = COMPAT_HWCAP_ISA_M; > - isa2hwcap['a' - 'a'] = COMPAT_HWCAP_ISA_A; > - isa2hwcap['f' - 'a'] = COMPAT_HWCAP_ISA_F; > - isa2hwcap['d' - 'a'] = COMPAT_HWCAP_ISA_D; > - isa2hwcap['c' - 'a'] = COMPAT_HWCAP_ISA_C; > - isa2hwcap['v' - 'a'] = COMPAT_HWCAP_ISA_V; > - > - elf_hwcap = 0; > - > - bitmap_zero(riscv_isa, RISCV_ISA_EXT_MAX); > - > if (!acpi_disabled) { > status = acpi_get_table(ACPI_SIG_RHCT, 0, &rhct); > if (ACPI_FAILURE(status)) > @@ -234,158 +377,7 @@ void __init riscv_fill_hwcap(void) > } > } > > - /* > - * For all possible cpus, we have already validated in > - * the boot process that they at least contain "rv" and > - * whichever of "32"/"64" this kernel supports, and so this > - * section can be skipped. > - */ > - isa += 4; > - > - while (*isa) { > - const char *ext = isa++; > - const char *ext_end = isa; > - bool ext_long = false, ext_err = false; > - > - switch (*ext) { > - case 's': > - /* > - * Workaround for invalid single-letter 's' & 'u'(QEMU). > - * No need to set the bit in riscv_isa as 's' & 'u' are > - * not valid ISA extensions. It works until multi-letter > - * extension starting with "Su" appears. > - */ > - if (ext[-1] != '_' && ext[1] == 'u') { > - ++isa; > - ext_err = true; > - break; > - } > - fallthrough; > - case 'S': > - case 'x': > - case 'X': > - case 'z': > - case 'Z': > - /* > - * Before attempting to parse the extension itself, we find its end. > - * As multi-letter extensions must be split from other multi-letter > - * extensions with an "_", the end of a multi-letter extension will > - * either be the null character or the "_" at the start of the next > - * multi-letter extension. > - * > - * Next, as the extensions version is currently ignored, we > - * eliminate that portion. This is done by parsing backwards from > - * the end of the extension, removing any numbers. This may be a > - * major or minor number however, so the process is repeated if a > - * minor number was found. > - * > - * ext_end is intended to represent the first character *after* the > - * name portion of an extension, but will be decremented to the last > - * character itself while eliminating the extensions version number. > - * A simple re-increment solves this problem. > - */ > - ext_long = true; > - for (; *isa && *isa != '_'; ++isa) > - if (unlikely(!isalnum(*isa))) > - ext_err = true; > - > - ext_end = isa; > - if (unlikely(ext_err)) > - break; > - > - if (!isdigit(ext_end[-1])) > - break; > - > - while (isdigit(*--ext_end)) > - ; > - > - if (tolower(ext_end[0]) != 'p' || !isdigit(ext_end[-1])) { > - ++ext_end; > - break; > - } > - > - while (isdigit(*--ext_end)) > - ; > - > - ++ext_end; > - break; > - default: > - /* > - * Things are a little easier for single-letter extensions, as they > - * are parsed forwards. > - * > - * After checking that our starting position is valid, we need to > - * ensure that, when isa was incremented at the start of the loop, > - * that it arrived at the start of the next extension. > - * > - * If we are already on a non-digit, there is nothing to do. Either > - * we have a multi-letter extension's _, or the start of an > - * extension. > - * > - * Otherwise we have found the current extension's major version > - * number. Parse past it, and a subsequent p/minor version number > - * if present. The `p` extension must not appear immediately after > - * a number, so there is no fear of missing it. > - * > - */ > - if (unlikely(!isalpha(*ext))) { > - ext_err = true; > - break; > - } > - > - if (!isdigit(*isa)) > - break; > - > - while (isdigit(*++isa)) > - ; > - > - if (tolower(*isa) != 'p') > - break; > - > - if (!isdigit(*++isa)) { > - --isa; > - break; > - } > - > - while (isdigit(*++isa)) > - ; > - > - break; > - } > - > - /* > - * The parser expects that at the start of an iteration isa points to the > - * first character of the next extension. As we stop parsing an extension > - * on meeting a non-alphanumeric character, an extra increment is needed > - * where the succeeding extension is a multi-letter prefixed with an "_". > - */ > - if (*isa == '_') > - ++isa; > - > -#define SET_ISA_EXT_MAP(name, bit) \ > - do { \ > - if ((ext_end - ext == sizeof(name) - 1) && \ > - !strncasecmp(ext, name, sizeof(name) - 1) && \ > - riscv_isa_extension_check(bit)) \ > - set_bit(bit, isainfo->isa); \ > - } while (false) \ > - > - if (unlikely(ext_err)) > - continue; > - if (!ext_long) { > - int nr = tolower(*ext) - 'a'; > - > - if (riscv_isa_extension_check(nr)) { > - this_hwcap |= isa2hwcap[nr]; > - set_bit(nr, isainfo->isa); > - } > - } else { > - for (int i = 0; i < riscv_isa_ext_count; i++) > - SET_ISA_EXT_MAP(riscv_isa_ext[i].name, > - riscv_isa_ext[i].id); > - } > -#undef SET_ISA_EXT_MAP > - } > + riscv_parse_isa_string(&this_hwcap, isainfo, isa2hwcap, isa); > > /* > * Linux requires the following extensions, so we may as well > @@ -422,6 +414,28 @@ void __init riscv_fill_hwcap(void) > > if (!acpi_disabled && rhct) > acpi_put_table((struct acpi_table_header *)rhct); > +} > + > +void __init riscv_fill_hwcap(void) > +{ > + struct device_node *node; > + const char *isa; > + char print_str[NUM_ALPHA_EXTS + 1]; > + int i, j, rc; > + unsigned long isa2hwcap[26] = {0}; > + struct acpi_table_header *rhct; > + acpi_status status; > + unsigned int cpu; I see all these unused variables get removed in the next patch, but they should get removed here, lest they trigger some warnings and bots come after you! > + > + isa2hwcap['i' - 'a'] = COMPAT_HWCAP_ISA_I; > + isa2hwcap['m' - 'a'] = COMPAT_HWCAP_ISA_M; > + isa2hwcap['a' - 'a'] = COMPAT_HWCAP_ISA_A; > + isa2hwcap['f' - 'a'] = COMPAT_HWCAP_ISA_F; > + isa2hwcap['d' - 'a'] = COMPAT_HWCAP_ISA_D; > + isa2hwcap['c' - 'a'] = COMPAT_HWCAP_ISA_C; > + isa2hwcap['v' - 'a'] = COMPAT_HWCAP_ISA_V; > + > + riscv_fill_hwcap_from_isa_string(isa2hwcap); > > /* We don't support systems with F but without D, so mask those out > * here. */ > -- > 2.40.1 > Otherwise, Reviewed-by: Andrew Jones <ajones@xxxxxxxxxxxxxxxx> Thanks, drew