Hi Sasha, [adding the kvm list; not sure why it was dropped] On Wed, Oct 28, 2015 at 01:34:25PM +0000, Will Deacon wrote: > On Wed, Oct 28, 2015 at 09:00:07AM -0400, Sasha Levin wrote: > > On 10/28/2015 08:27 AM, Will Deacon wrote: > > > On Tue, Oct 27, 2015 at 10:08:44PM -0400, Sasha Levin wrote: > > >> > On 10/27/2015 12:08 PM, Will Deacon wrote: > > >>>> > >> for (i = 0; i < kvm->nrcpus; i++) > > >>>>> > >> > - pthread_kill(kvm->cpus[i]->thread, SIGKVMPAUSE); > > >>>>> > >> > + if (kvm->cpus[i]->is_running) > > >>>>> > >> > + pthread_kill(kvm->cpus[i]->thread, SIGKVMPAUSE); > > >>>>> > >> > + else > > >>>>> > >> > + paused_vcpus++; > > >>> > > What serialises the test of kvm->cpus[i]->is_running against a concurrent > > >>> > > SIGKVMEXIT? > > >> > > > >> > If there's a pause signal pending we'd still end up marking it as paused > > >> > and do the whole process even though the vcpu is actually dead, so while > > >> > we can race with SIGKVMEXIT, it'll just mean we'd go through the whole > > >> > pausing procedure even though the vcpu is dead. > > >> > > > >> > Or did you mean something else? > > > I couldn't convince myself there was an issue here (hence the question ;), > > > but I was wondering about something like: > > > > > > 1. The VCPUn thread takes SIGKVMEXIT (e.g. due to kvm_cpu__reboot) > > > 2. The IPC thread handles a pause event and reads kvm->cpus[n]->is_running > > > as true > > > 3. VCPUn sets kvm->cpus[n]->is_running to false > > > 4. VCPUn exits > > > 5. The IPC thread trues to pthread_kill on an exited thread > > > > > > am I missing some obvious synchronisation here? > > > > Can we take two signals in parallel? (I'm really not sure). If yes, than > > what you've described is a problem (and has been for a while). If not, > > then no :) > > Regardless, isn't the pause event coming from polling the IPC file > descriptor as opposed to a signal? It looks like lkvm is currently SEGVing on exit due to the original issue. Digging deeper, it looks like we should be taking the pause_lock for the SIGKVMEXIT case too, so that we can serialise access to is_running. What do you think about the patch below? Will --->8 diff --git a/hw/i8042.c b/hw/i8042.c index 3801e20a675d..288b7d1108ac 100644 --- a/hw/i8042.c +++ b/hw/i8042.c @@ -163,7 +163,7 @@ static void kbd_write_command(struct kvm *kvm, u8 val) state.mode &= ~MODE_DISABLE_AUX; break; case I8042_CMD_SYSTEM_RESET: - kvm_cpu__reboot(kvm); + kvm__reboot(kvm); break; default: break; diff --git a/include/kvm/kvm-cpu.h b/include/kvm/kvm-cpu.h index aa0cb543f8fb..c4c9cca449eb 100644 --- a/include/kvm/kvm-cpu.h +++ b/include/kvm/kvm-cpu.h @@ -12,7 +12,6 @@ void kvm_cpu__reset_vcpu(struct kvm_cpu *vcpu); void kvm_cpu__setup_cpuid(struct kvm_cpu *vcpu); void kvm_cpu__enable_singlestep(struct kvm_cpu *vcpu); void kvm_cpu__run(struct kvm_cpu *vcpu); -void kvm_cpu__reboot(struct kvm *kvm); int kvm_cpu__start(struct kvm_cpu *cpu); bool kvm_cpu__handle_exit(struct kvm_cpu *vcpu); int kvm_cpu__get_endianness(struct kvm_cpu *vcpu); diff --git a/include/kvm/kvm.h b/include/kvm/kvm.h index 37155dbc132b..a474dae6c2cf 100644 --- a/include/kvm/kvm.h +++ b/include/kvm/kvm.h @@ -93,6 +93,7 @@ int kvm__register_mmio(struct kvm *kvm, u64 phys_addr, u64 phys_addr_len, bool c void (*mmio_fn)(struct kvm_cpu *vcpu, u64 addr, u8 *data, u32 len, u8 is_write, void *ptr), void *ptr); bool kvm__deregister_mmio(struct kvm *kvm, u64 phys_addr); +void kvm__reboot(struct kvm *kvm); void kvm__pause(struct kvm *kvm); void kvm__continue(struct kvm *kvm); void kvm__notify_paused(void); diff --git a/kvm-cpu.c b/kvm-cpu.c index ad4441b1d96c..3e2037e3ccb3 100644 --- a/kvm-cpu.c +++ b/kvm-cpu.c @@ -45,10 +45,8 @@ void kvm_cpu__run(struct kvm_cpu *vcpu) static void kvm_cpu_signal_handler(int signum) { if (signum == SIGKVMEXIT) { - if (current_kvm_cpu && current_kvm_cpu->is_running) { + if (current_kvm_cpu && current_kvm_cpu->is_running) current_kvm_cpu->is_running = false; - kvm__continue(current_kvm_cpu->kvm); - } } else if (signum == SIGKVMPAUSE) { current_kvm_cpu->paused = 1; } @@ -70,19 +68,6 @@ static void kvm_cpu__handle_coalesced_mmio(struct kvm_cpu *cpu) } } -void kvm_cpu__reboot(struct kvm *kvm) -{ - int i; - - /* The kvm->cpus array contains a null pointer in the last location */ - for (i = 0; ; i++) { - if (kvm->cpus[i]) - pthread_kill(kvm->cpus[i]->thread, SIGKVMEXIT); - else - break; - } -} - int kvm_cpu__start(struct kvm_cpu *cpu) { sigset_t sigset; @@ -177,7 +162,7 @@ int kvm_cpu__start(struct kvm_cpu *cpu) * Ensure that all VCPUs are torn down, * regardless of which CPU generated the event. */ - kvm_cpu__reboot(cpu->kvm); + kvm__reboot(cpu->kvm); goto exit_kvm; }; break; diff --git a/kvm-ipc.c b/kvm-ipc.c index 857b0dc943e5..1ef3c3e4c5bc 100644 --- a/kvm-ipc.c +++ b/kvm-ipc.c @@ -341,7 +341,7 @@ static void handle_stop(struct kvm *kvm, int fd, u32 type, u32 len, u8 *msg) if (WARN_ON(type != KVM_IPC_STOP || len)) return; - kvm_cpu__reboot(kvm); + kvm__reboot(kvm); } /* Pause/resume the guest using SIGUSR2 */ diff --git a/kvm.c b/kvm.c index 10ed2300ed71..db301a3ae0fc 100644 --- a/kvm.c +++ b/kvm.c @@ -428,6 +428,27 @@ void kvm__dump_mem(struct kvm *kvm, unsigned long addr, unsigned long size, int } } +void kvm__reboot(struct kvm *kvm) +{ + int i; + + /* Check if the guest is running */ + if (!kvm->cpus[0] || kvm->cpus[0]->thread == 0) + return; + + mutex_lock(&pause_lock); + + /* The kvm->cpus array contains a null pointer in the last location */ + for (i = 0; ; i++) { + if (kvm->cpus[i]) + pthread_kill(kvm->cpus[i]->thread, SIGKVMEXIT); + else + break; + } + + kvm__continue(kvm); +} + void kvm__pause(struct kvm *kvm) { int i, paused_vcpus = 0; @@ -441,8 +462,12 @@ void kvm__pause(struct kvm *kvm) pause_event = eventfd(0, 0); if (pause_event < 0) die("Failed creating pause notification event"); - for (i = 0; i < kvm->nrcpus; i++) - pthread_kill(kvm->cpus[i]->thread, SIGKVMPAUSE); + for (i = 0; i < kvm->nrcpus; i++) { + if (kvm->cpus[i]->is_running) + pthread_kill(kvm->cpus[i]->thread, SIGKVMPAUSE); + else + paused_vcpus++; + } while (paused_vcpus < kvm->nrcpus) { u64 cur_read; diff --git a/powerpc/spapr_rtas.c b/powerpc/spapr_rtas.c index 38d899c7f561..b898ff20ba5a 100644 --- a/powerpc/spapr_rtas.c +++ b/powerpc/spapr_rtas.c @@ -118,7 +118,7 @@ static void rtas_power_off(struct kvm_cpu *vcpu, rtas_st(vcpu->kvm, rets, 0, -3); return; } - kvm_cpu__reboot(vcpu->kvm); + kvm__reboot(vcpu->kvm); } static void rtas_system_reboot(struct kvm_cpu *vcpu, @@ -131,7 +131,7 @@ static void rtas_system_reboot(struct kvm_cpu *vcpu, } /* NB this actually halts the VM */ - kvm_cpu__reboot(vcpu->kvm); + kvm__reboot(vcpu->kvm); } static void rtas_query_cpu_stopped_state(struct kvm_cpu *vcpu, diff --git a/term.c b/term.c index aebd174597b1..58f66a0c0ea5 100644 --- a/term.c +++ b/term.c @@ -37,7 +37,7 @@ int term_getc(struct kvm *kvm, int term) if (term_got_escape) { term_got_escape = false; if (c == 'x') - kvm_cpu__reboot(kvm); + kvm__reboot(kvm); if (c == term_escape_char) return c; } diff --git a/ui/sdl.c b/ui/sdl.c index f97a5112eca9..5035405bb488 100644 --- a/ui/sdl.c +++ b/ui/sdl.c @@ -266,7 +266,7 @@ static void *sdl__thread(void *p) } exit: done = true; - kvm_cpu__reboot(fb->kvm); + kvm__reboot(fb->kvm); return NULL; } -- To unsubscribe from this list: send the line "unsubscribe kvm" in the body of a message to majordomo@xxxxxxxxxxxxxxx More majordomo info at http://vger.kernel.org/majordomo-info.html