We currently always shift APIC ID as if APIC was in xAPIC mode. x2APIC mode wants to use more bits and storing a hardware-compabible value is the the sanest option. VMX can stop intercepting the APIC ID register then. KVM API to set the lapic expects that bottom 8 bits of APIC ID are in top 8 bits of APIC_ID register. Definite that x2APIC IDs are byte swapped to keep compatibility without new toggles. Signed-off-by: Radim Krčmář <rkrcmar@xxxxxxxxxx> --- Documentation/virtual/kvm/api.txt | 6 ++++++ arch/x86/kvm/lapic.c | 44 ++++++++++++++++++++++++++++----------- arch/x86/kvm/lapic.h | 7 ++++++- arch/x86/kvm/vmx.c | 4 ---- arch/x86/kvm/x86.c | 2 ++ 5 files changed, 46 insertions(+), 17 deletions(-) diff --git a/Documentation/virtual/kvm/api.txt b/Documentation/virtual/kvm/api.txt index 07bcedc0ba09..b1ddea38e6b9 100644 --- a/Documentation/virtual/kvm/api.txt +++ b/Documentation/virtual/kvm/api.txt @@ -1583,6 +1583,11 @@ struct kvm_lapic_state { Reads the Local APIC registers and copies them into the input argument. The data format and layout are the same as documented in the architecture manual. +Note that the APIC ID is stored in APIC_ID register in big endian format. +This makes no difference for xAPIC APIC ID, which is still in the top 8 bits, +but x2APIC ID needs to be byteswapped. The reason is compatibility with KVM's +definition of x2APIC. (The hardware stores x2APIC ID as little endian.) + 4.58 KVM_SET_LAPIC @@ -1600,6 +1605,7 @@ struct kvm_lapic_state { Copies the input argument into the Local APIC registers. The data format and layout are the same as documented in the architecture manual. +See the note about APIC_ID register in KVM_GET_LAPIC. 4.59 KVM_IOEVENTFD diff --git a/arch/x86/kvm/lapic.c b/arch/x86/kvm/lapic.c index 615067b41dde..25702584d65c 100644 --- a/arch/x86/kvm/lapic.c +++ b/arch/x86/kvm/lapic.c @@ -239,7 +239,7 @@ static inline void apic_set_spiv(struct kvm_lapic *apic, u32 val) } } -static inline void kvm_apic_set_id(struct kvm_lapic *apic, u8 id) +static inline void kvm_apic_set_xapic_id(struct kvm_lapic *apic, u8 id) { apic_set_reg(apic, APIC_ID, id << 24); recalculate_apic_map(apic->vcpu->kvm); @@ -251,11 +251,11 @@ static inline void kvm_apic_set_ldr(struct kvm_lapic *apic, u32 id) recalculate_apic_map(apic->vcpu->kvm); } -static inline void kvm_apic_set_x2apic_id(struct kvm_lapic *apic, u8 id) +static inline void kvm_apic_set_x2apic_id(struct kvm_lapic *apic, u32 id) { u32 ldr = ((id >> 4) << 16) | (1 << (id & 0xf)); - apic_set_reg(apic, APIC_ID, id << 24); + apic_set_reg(apic, APIC_ID, id); apic_set_reg(apic, APIC_LDR, ldr); recalculate_apic_map(apic->vcpu->kvm); } @@ -1116,12 +1116,6 @@ static u32 __apic_read(struct kvm_lapic *apic, unsigned int offset) return 0; switch (offset) { - case APIC_ID: - if (apic_x2apic_mode(apic)) - val = kvm_apic_id(apic); - else - val = kvm_apic_id(apic) << 24; - break; case APIC_ARBPRI: apic_debug("Access APIC ARBPRI register which is for P6\n"); break; @@ -1400,7 +1394,7 @@ static int apic_reg_write(struct kvm_lapic *apic, u32 reg, u32 val) switch (reg) { case APIC_ID: /* Local APIC ID */ if (!apic_x2apic_mode(apic)) - kvm_apic_set_id(apic, val >> 24); + kvm_apic_set_xapic_id(apic, val >> 24); else ret = 1; break; @@ -1671,8 +1665,10 @@ void kvm_lapic_set_base(struct kvm_vcpu *vcpu, u64 value) if (value & X2APIC_ENABLE) { kvm_apic_set_x2apic_id(apic, vcpu->vcpu_id); kvm_x86_ops->set_virtual_x2apic_mode(vcpu, true); - } else + } else { + kvm_apic_set_xapic_id(apic, vcpu->vcpu_id); kvm_x86_ops->set_virtual_x2apic_mode(vcpu, false); + } } apic->base_address = apic->vcpu->arch.apic_base & @@ -1703,7 +1699,7 @@ void kvm_lapic_reset(struct kvm_vcpu *vcpu, bool init_event) hrtimer_cancel(&apic->lapic_timer.timer); if (!init_event) - kvm_apic_set_id(apic, vcpu->vcpu_id); + kvm_apic_set_xapic_id(apic, vcpu->vcpu_id); kvm_apic_set_version(apic->vcpu); for (i = 0; i < APIC_LVT_NUM; i++) @@ -1924,6 +1920,30 @@ int kvm_get_apic_interrupt(struct kvm_vcpu *vcpu) return vector; } +static void __kvm_apic_state_fixup(struct kvm_vcpu *vcpu, + struct kvm_lapic_state *s, bool restore) +{ + if (apic_x2apic_mode(vcpu->arch.apic)) { + u32 *id = (u32 *)(s->regs + APIC_ID); + if (restore) + *id = be32_to_cpu(*id); + else + *id = cpu_to_be32(*id); + } +} + +void kvm_apic_state_get_fixup(struct kvm_vcpu *vcpu, + struct kvm_lapic_state *s) +{ + __kvm_apic_state_fixup(vcpu, s, false); +} + +void kvm_apic_state_set_fixup(struct kvm_vcpu *vcpu, + struct kvm_lapic_state *s) +{ + __kvm_apic_state_fixup(vcpu, s, true); +} + void kvm_apic_post_state_restore(struct kvm_vcpu *vcpu, struct kvm_lapic_state *s) { diff --git a/arch/x86/kvm/lapic.h b/arch/x86/kvm/lapic.h index d818a36ce24e..435606dd916f 100644 --- a/arch/x86/kvm/lapic.h +++ b/arch/x86/kvm/lapic.h @@ -71,6 +71,10 @@ bool kvm_irq_delivery_to_apic_fast(struct kvm *kvm, struct kvm_lapic *src, u64 kvm_get_apic_base(struct kvm_vcpu *vcpu); int kvm_set_apic_base(struct kvm_vcpu *vcpu, struct msr_data *msr_info); +void kvm_apic_state_get_fixup(struct kvm_vcpu *vcpu, + struct kvm_lapic_state *s); +void kvm_apic_state_set_fixup(struct kvm_vcpu *vcpu, + struct kvm_lapic_state *s); void kvm_apic_post_state_restore(struct kvm_vcpu *vcpu, struct kvm_lapic_state *s); int kvm_lapic_find_highest_irr(struct kvm_vcpu *vcpu); @@ -169,7 +173,8 @@ static inline int kvm_lapic_latched_init(struct kvm_vcpu *vcpu) static inline u32 kvm_apic_id(struct kvm_lapic *apic) { - return (kvm_apic_get_reg(apic, APIC_ID) >> 24) & 0xff; + u32 id = kvm_apic_get_reg(apic, APIC_ID); + return apic_x2apic_mode(apic) ? id : id >> 24; } bool kvm_apic_pending_eoi(struct kvm_vcpu *vcpu, int vector); diff --git a/arch/x86/kvm/vmx.c b/arch/x86/kvm/vmx.c index 35df8d757d1d..12beb83c61d6 100644 --- a/arch/x86/kvm/vmx.c +++ b/arch/x86/kvm/vmx.c @@ -6337,10 +6337,6 @@ static __init int hardware_setup(void) for (msr = 0x800; msr <= 0x8ff; msr++) vmx_disable_intercept_msr_read_x2apic(msr); - /* According SDM, in x2apic mode, the whole id reg is used. - * But in KVM, it only use the highest eight bits. Need to - * intercept it */ - vmx_enable_intercept_msr_read_x2apic(0x802); /* TMCCT */ vmx_enable_intercept_msr_read_x2apic(0x839); /* TPR */ diff --git a/arch/x86/kvm/x86.c b/arch/x86/kvm/x86.c index 86d1eb1c9d8b..2a2446240320 100644 --- a/arch/x86/kvm/x86.c +++ b/arch/x86/kvm/x86.c @@ -2769,6 +2769,7 @@ static int kvm_vcpu_ioctl_get_lapic(struct kvm_vcpu *vcpu, kvm_x86_ops->sync_pir_to_irr(vcpu); memcpy(s->regs, vcpu->arch.apic->regs, sizeof *s); + kvm_apic_state_get_fixup(vcpu, s); return 0; } @@ -2776,6 +2777,7 @@ static int kvm_vcpu_ioctl_get_lapic(struct kvm_vcpu *vcpu, static int kvm_vcpu_ioctl_set_lapic(struct kvm_vcpu *vcpu, struct kvm_lapic_state *s) { + kvm_apic_state_set_fixup(vcpu, s); kvm_apic_post_state_restore(vcpu, s); update_cr8_intercept(vcpu); -- 2.8.2 -- To unsubscribe from this list: send the line "unsubscribe kvm" in the body of a message to majordomo@xxxxxxxxxxxxxxx More majordomo info at http://vger.kernel.org/majordomo-info.html