On Tue, Oct 16, 2018 at 12:53 AM Wanpeng Li <kernellwp@xxxxxxxxx> wrote: > > On Thu, 11 Oct 2018 at 06:59, Peter Shier <pshier@xxxxxxxxxx> wrote: > > > > kvm_vcpu_ioctl_get_lapic (implements KVM_GET_LAPIC ioctl) does a bulk copy > > of the LAPIC registers but must take into account that the one-shot and > > periodic timer current count register is computed upon reads and is not > > present in register state. When restoring LAPIC state (e.g. after > > migration), restart timers from their their current count values at time of > > save. > > > > Note: When a one-shot timer expires, the code in arch/x86/kvm/lapic.c does > > not zero the value of the LAPIC initial count register (emulating HW > > behavior). If no other timer is run and pending prior to a subsequent > > KVM_GET_LAPIC call, the returned register set will include the expired > > one-shot initial count. On a subsequent KVM_SET_LAPIC call the code will > > see a non-zero initial count and start a new one-shot timer using the > > expired timer's count. This is a prior existing bug and will be addressed > > in a separate patch. Thanks to jmattson@xxxxxxxxxx for this find. > > > > Signed-off-by: Peter Shier <pshier@xxxxxxxxxx> > > Reviewed-by: Jim Mattson <jmattson@xxxxxxxxxx> > > Reviewed-by: Wanpeng Li <wanpengli@xxxxxxxxxxx> > > > --- > > arch/x86/kvm/lapic.c | 64 +++++++++++++++++++++++++++++++++++--------- > > arch/x86/kvm/lapic.h | 7 ++++- > > 2 files changed, 58 insertions(+), 13 deletions(-) > > > > diff --git a/arch/x86/kvm/lapic.c b/arch/x86/kvm/lapic.c > > index fbb0e6df121b2..8e7f3cf552871 100644 > > --- a/arch/x86/kvm/lapic.c > > +++ b/arch/x86/kvm/lapic.c > > @@ -1524,13 +1524,18 @@ static void start_sw_tscdeadline(struct kvm_lapic *apic) > > local_irq_restore(flags); > > } > > > > +static inline u64 tmict_to_ns(struct kvm_lapic *apic, u32 tmict) > > +{ > > + return (u64)tmict * APIC_BUS_CYCLE_NS * (u64)apic->divide_count; > > +} > > + > > static void update_target_expiration(struct kvm_lapic *apic, uint32_t old_divisor) > > { > > ktime_t now, remaining; > > u64 ns_remaining_old, ns_remaining_new; > > > > - apic->lapic_timer.period = (u64)kvm_lapic_get_reg(apic, APIC_TMICT) > > - * APIC_BUS_CYCLE_NS * apic->divide_count; > > + apic->lapic_timer.period = > > + tmict_to_ns(apic, kvm_lapic_get_reg(apic, APIC_TMICT)); > > limit_periodic_timer_frequency(apic); > > > > now = ktime_get(); > > @@ -1548,14 +1553,15 @@ static void update_target_expiration(struct kvm_lapic *apic, uint32_t old_diviso > > apic->lapic_timer.target_expiration = ktime_add_ns(now, ns_remaining_new); > > } > > > > -static bool set_target_expiration(struct kvm_lapic *apic) > > +static bool set_target_expiration(struct kvm_lapic *apic, u32 count_reg) > > { > > ktime_t now; > > u64 tscl = rdtsc(); > > + s64 deadline; > > > > now = ktime_get(); > > - apic->lapic_timer.period = (u64)kvm_lapic_get_reg(apic, APIC_TMICT) > > - * APIC_BUS_CYCLE_NS * apic->divide_count; > > + apic->lapic_timer.period = > > + tmict_to_ns(apic, kvm_lapic_get_reg(apic, APIC_TMICT)); > > > > if (!apic->lapic_timer.period) { > > apic->lapic_timer.tscdeadline = 0; > > @@ -1563,6 +1569,28 @@ static bool set_target_expiration(struct kvm_lapic *apic) > > } > > > > limit_periodic_timer_frequency(apic); > > + deadline = apic->lapic_timer.period; > > + > > + if (apic_lvtt_period(apic) || apic_lvtt_oneshot(apic)) { > > + if (unlikely(count_reg != APIC_TMICT)) { > > + deadline = tmict_to_ns(apic, > > + kvm_lapic_get_reg(apic, count_reg)); > > + if (unlikely(deadline <= 0)) > > + deadline = apic->lapic_timer.period; > > + else if (unlikely(deadline > apic->lapic_timer.period)) { > > + pr_info_ratelimited( > > + "kvm: vcpu %i: requested lapic timer restore with " > > + "starting count register %#x=%u (%lld ns) > initial count (%lld ns). " > > + "Using initial count to start timer.\n", > > + apic->vcpu->vcpu_id, > > + count_reg, > > + kvm_lapic_get_reg(apic, count_reg), > > + deadline, apic->lapic_timer.period); > > + kvm_lapic_set_reg(apic, count_reg, 0); > > + deadline = apic->lapic_timer.period; > > + } > > + } > > + } > > > > apic_debug("%s: bus cycle is %" PRId64 "ns, now 0x%016" > > PRIx64 ", " > > @@ -1571,12 +1599,11 @@ static bool set_target_expiration(struct kvm_lapic *apic) > > APIC_BUS_CYCLE_NS, ktime_to_ns(now), > > kvm_lapic_get_reg(apic, APIC_TMICT), > > apic->lapic_timer.period, > > - ktime_to_ns(ktime_add_ns(now, > > - apic->lapic_timer.period))); > > + ktime_to_ns(ktime_add_ns(now, deadline))); > > > > apic->lapic_timer.tscdeadline = kvm_read_l1_tsc(apic->vcpu, tscl) + > > - nsec_to_cycles(apic->vcpu, apic->lapic_timer.period); > > - apic->lapic_timer.target_expiration = ktime_add_ns(now, apic->lapic_timer.period); > > + nsec_to_cycles(apic->vcpu, deadline); > > + apic->lapic_timer.target_expiration = ktime_add_ns(now, deadline); > > > > return true; > > } > > @@ -1748,17 +1775,22 @@ void kvm_lapic_restart_hv_timer(struct kvm_vcpu *vcpu) > > restart_apic_timer(apic); > > } > > > > -static void start_apic_timer(struct kvm_lapic *apic) > > +static void __start_apic_timer(struct kvm_lapic *apic, u32 count_reg) > > { > > atomic_set(&apic->lapic_timer.pending, 0); > > > > if ((apic_lvtt_period(apic) || apic_lvtt_oneshot(apic)) > > - && !set_target_expiration(apic)) > > + && !set_target_expiration(apic, count_reg)) > > return; > > > > restart_apic_timer(apic); > > } > > > > +static void start_apic_timer(struct kvm_lapic *apic) > > +{ > > + __start_apic_timer(apic, APIC_TMICT); > > +} > > + > > static void apic_manage_nmi_watchdog(struct kvm_lapic *apic, u32 lvt0_val) > > { > > bool lvt0_in_nmi_mode = apic_lvt_nmi_mode(lvt0_val); > > @@ -2370,6 +2402,14 @@ static int kvm_apic_state_fixup(struct kvm_vcpu *vcpu, > > int kvm_apic_get_state(struct kvm_vcpu *vcpu, struct kvm_lapic_state *s) > > { > > memcpy(s->regs, vcpu->arch.apic->regs, sizeof(*s)); > > + > > + /* > > + * Get calculated timer current count for remaining timer period (if > > + * any) and store it in the returned register set. > > + */ > > + __kvm_lapic_set_reg(s->regs, APIC_TMCCT, > > + __apic_read(vcpu->arch.apic, APIC_TMCCT)); > > + > > return kvm_apic_state_fixup(vcpu, s, false); > > } > > > > @@ -2396,7 +2436,7 @@ int kvm_apic_set_state(struct kvm_vcpu *vcpu, struct kvm_lapic_state *s) > > apic_update_lvtt(apic); > > apic_manage_nmi_watchdog(apic, kvm_lapic_get_reg(apic, APIC_LVT0)); > > update_divide_count(apic); > > - start_apic_timer(apic); > > + __start_apic_timer(apic, APIC_TMCCT); > > apic->irr_pending = true; > > apic->isr_count = vcpu->arch.apicv_active ? > > 1 : count_vectors(apic->regs + APIC_ISR); > > diff --git a/arch/x86/kvm/lapic.h b/arch/x86/kvm/lapic.h > > index ed0ed39abd369..fadefa1a9d678 100644 > > --- a/arch/x86/kvm/lapic.h > > +++ b/arch/x86/kvm/lapic.h > > @@ -147,9 +147,14 @@ static inline u32 kvm_lapic_get_reg(struct kvm_lapic *apic, int reg_off) > > return *((u32 *) (apic->regs + reg_off)); > > } > > > > +static inline void __kvm_lapic_set_reg(char *regs, int reg_off, u32 val) > > +{ > > + *((u32 *) (regs + reg_off)) = val; > > +} > > + > > static inline void kvm_lapic_set_reg(struct kvm_lapic *apic, int reg_off, u32 val) > > { > > - *((u32 *) (apic->regs + reg_off)) = val; > > + __kvm_lapic_set_reg(apic->regs, reg_off, val); > > } > > > > extern struct static_key kvm_no_apic_vcpu; > > -- > > 2.19.0.605.g01d371f741-goog > > Ping?