On Thu, May 06, 2021 at 06:16:47PM -0400, Eduardo Habkost wrote: > On Fri, Feb 26, 2021 at 10:20:54AM +0800, Yang Weijiang wrote: > > Currently, CPUID.(EAX=0DH,ECX=01H) doesn't enumerate features in > > XSS properly, add the support here. XCR0 bits indicate user-mode XSAVE > > components, and XSS bits indicate supervisor-mode XSAVE components. > > > > Signed-off-by: Yang Weijiang <weijiang.yang@xxxxxxxxx> > > --- > > target/i386/cpu.c | 48 ++++++++++++++++++++++++++++++++++++++++++----- > > target/i386/cpu.h | 12 ++++++++++++ > > 2 files changed, 55 insertions(+), 5 deletions(-) > > [...] > > @@ -1478,6 +1496,9 @@ static uint32_t xsave_area_size(uint64_t mask) > > for (i = 0; i < ARRAY_SIZE(x86_ext_save_areas); i++) { > > const ExtSaveArea *esa = &x86_ext_save_areas[i]; > > if ((mask >> i) & 1) { > > + if (i >= 2 && !esa->offset) { > > Maybe a few comments at the definition of ExtSaveArea to explain > that offset can now be zero (and what it means when it's zero) > would be helpful. I took a while to understand why this is safe. > Thanks Eduardo! Sure, I'll add some comments in next version. > Would it be valid to say "ExtSaveArea.offset has a valid offset > only if the component is in CPUID_XSTATE_XCR0_MASK"? If so, > can't this check be simply replaced with: > if ((1 << i) & CPUID_XSTATE_XCR0_MASK) > ? > > Or maybe this function should just contain a: > assert(!(mask & CPUID_XSTATE_XCR0_MASK)); > at the beginning? > Maybe I need to modifiy the function a bit to accommodate compacted format size calculation for CPUID(0xD,1).EBX. > > > + continue; > > + } > > ret = MAX(ret, esa->offset + esa->size); > > } > > } > > @@ -1489,12 +1510,18 @@ static inline bool accel_uses_host_cpuid(void) > > return kvm_enabled() || hvf_enabled(); > > } [...] > > > > @@ -5716,7 +5743,7 @@ void cpu_x86_cpuid(CPUX86State *env, uint32_t index, uint32_t count, > > } > > > > if (count == 0) { > > - *ecx = xsave_area_size(x86_cpu_xsave_components(cpu)); > > + *ecx = xsave_area_size(x86_cpu_xsave_xcr0_components(cpu)); > > *eax = env->features[FEAT_XSAVE_XCR0_LO]; > > *edx = env->features[FEAT_XSAVE_XCR0_HI]; > > /* > > @@ -5728,11 +5755,17 @@ void cpu_x86_cpuid(CPUX86State *env, uint32_t index, uint32_t count, > > *ebx = kvm_enabled() ? *ecx : xsave_area_size(env->xcr0); > > } else if (count == 1) { > > *eax = env->features[FEAT_XSAVE]; > > + *ecx = env->features[FEAT_XSAVE_XSS_LO]; > > + *edx = env->features[FEAT_XSAVE_XSS_HI]; > > What about EBX? It is documented as "The size in bytes of the > XSAVE area containing all states enabled by XCRO | IA32_XSS". > > The Intel SDM is not clear, but I assume this would be > necessarily the size of the area in compacted format? Yes, I'll add ebx assignment. > > > > } else if (count < ARRAY_SIZE(x86_ext_save_areas)) { > > - if ((x86_cpu_xsave_components(cpu) >> count) & 1) { > > - const ExtSaveArea *esa = &x86_ext_save_areas[count]; > > + const ExtSaveArea *esa = &x86_ext_save_areas[count]; > > + if ((x86_cpu_xsave_xcr0_components(cpu) >> count) & 1) { > > *eax = esa->size; > > *ebx = esa->offset; > > + } else if ((x86_cpu_xsave_xss_components(cpu) >> count) & 1) { > > + *eax = esa->size; > > + *ebx = 0; > > + *ecx = 1; > > } > > } > > break; > > @@ -6059,6 +6092,9 @@ static void x86_cpu_reset(DeviceState *dev) > > } > > for (i = 2; i < ARRAY_SIZE(x86_ext_save_areas); i++) { > > const ExtSaveArea *esa = &x86_ext_save_areas[i]; > > + if (!esa->offset) { > > + continue; > > Most of the comments at the xsave_area_size() hunk would apply > here. I miss some clarity on what esa->offset==0 really means. > > Would it be valid to replace this with a check for > ((1 << i) & CPUID_XSTATE_XCR0_MASK) > ? Sure, I'll use this check to make things clearer, thanks for the comments! > > > + } > > if (env->features[esa->feature] & esa->bits) { > > xcr0 |= 1ull << i; > > } [...] > > +/* CPUID feature bits available in XCR0 */ > > +#define CPUID_XSTATE_XCR0_MASK (XSTATE_FP_MASK | XSTATE_SSE_MASK | \ > > + XSTATE_YMM_MASK | XSTATE_BNDREGS_MASK | \ > > + XSTATE_BNDCSR_MASK | XSTATE_OPMASK_MASK | \ > > + XSTATE_ZMM_Hi256_MASK | \ > > + XSTATE_Hi16_ZMM_MASK | XSTATE_PKRU_MASK) > > + > > +/* CPUID feature bits available in XSS */ > > +#define CPUID_XSTATE_XSS_MASK 0 > > Do you expect this to be used outside target/i386/cpu.c? If not, > maybe it could be moved close to the x86_ext_save_areas[] > definition, as any updates to x86_ext_save_areas will require an > update to these macros. > > > + > > /* CPUID feature words */ > > typedef enum FeatureWord { > > FEAT_1_EDX, /* CPUID[1].EDX */ > > @@ -541,6 +551,8 @@ typedef enum FeatureWord { > > FEAT_VMX_EPT_VPID_CAPS, > > FEAT_VMX_BASIC, > > FEAT_VMX_VMFUNC, > > + FEAT_XSAVE_XSS_LO, /* CPUID[EAX=0xd,ECX=1].ECX */ > > + FEAT_XSAVE_XSS_HI, /* CPUID[EAX=0xd,ECX=1].EDX */ > > FEATURE_WORDS, > > } FeatureWord; > > > > -- > > 2.26.2 > > > > > > -- > Eduardo