Skip to content

Commit 0acc723

Browse files
oupton authored and Marc Zyngier committed
KVM: arm64: Avoid vcpu->mutex v. kvm->lock inversion in CPU_ON
KVM/arm64 had the lock ordering backwards on vcpu->mutex and kvm->lock from the very beginning. One such example is the way vCPU resets are handled: the kvm->lock is acquired while handling a guest CPU_ON PSCI call.

Add a dedicated lock to serialize writes to kvm_vcpu_arch::{mp_state, reset_state}. Promote all accessors of mp_state to {READ,WRITE}_ONCE() as readers do not acquire the mp_state_lock. While at it, plug yet another race by taking the mp_state_lock in the KVM_SET_MP_STATE ioctl handler.

As changes to MP state are now guarded with a dedicated lock, drop the kvm->lock acquisition from the PSCI CPU_ON path. Similarly, move the reader of reset_state outside of the kvm->lock and instead protect it with the mp_state_lock. Note that writes to reset_state::reset have been demoted to regular stores as both readers and writers acquire the mp_state_lock.

While the kvm->lock inversion still exists in kvm_reset_vcpu(), at least now PSCI CPU_ON no longer depends on it for serializing vCPU reset.

Cc: stable@vger.kernel.org
Tested-by: Jeremy Linton <jeremy.linton@arm.com>
Signed-off-by: Oliver Upton <oliver.upton@linux.dev>
Signed-off-by: Marc Zyngier <maz@kernel.org>
Link: https://lore.kernel.org/r/20230327164747.2466958-2-oliver.upton@linux.dev
1 parent 197b6b6 commit 0acc723

4 files changed

Lines changed: 44 additions & 25 deletions

File tree

arch/arm64/include/asm/kvm_host.h

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -522,6 +522,7 @@ struct kvm_vcpu_arch {
522522

523523
/* vcpu power state */
524524
struct kvm_mp_state mp_state;
525+
spinlock_t mp_state_lock;
525526

526527
/* Cache some mmu pages needed inside spinlock regions */
527528
struct kvm_mmu_memory_cache mmu_page_cache;

arch/arm64/kvm/arm.c

Lines changed: 22 additions & 9 deletions
Original file line numberDiff line numberDiff line change
@@ -326,6 +326,8 @@ int kvm_arch_vcpu_create(struct kvm_vcpu *vcpu)
326326
{
327327
int err;
328328

329+
spin_lock_init(&vcpu->arch.mp_state_lock);
330+
329331
/* Force users to call KVM_ARM_VCPU_INIT */
330332
vcpu->arch.target = -1;
331333
bitmap_zero(vcpu->arch.features, KVM_VCPU_MAX_FEATURES);
@@ -443,34 +445,41 @@ void kvm_arch_vcpu_put(struct kvm_vcpu *vcpu)
443445
vcpu->cpu = -1;
444446
}
445447

446-
void kvm_arm_vcpu_power_off(struct kvm_vcpu *vcpu)
448+
static void __kvm_arm_vcpu_power_off(struct kvm_vcpu *vcpu)
447449
{
448-
vcpu->arch.mp_state.mp_state = KVM_MP_STATE_STOPPED;
450+
WRITE_ONCE(vcpu->arch.mp_state.mp_state, KVM_MP_STATE_STOPPED);
449451
kvm_make_request(KVM_REQ_SLEEP, vcpu);
450452
kvm_vcpu_kick(vcpu);
451453
}
452454

455+
void kvm_arm_vcpu_power_off(struct kvm_vcpu *vcpu)
456+
{
457+
spin_lock(&vcpu->arch.mp_state_lock);
458+
__kvm_arm_vcpu_power_off(vcpu);
459+
spin_unlock(&vcpu->arch.mp_state_lock);
460+
}
461+
453462
bool kvm_arm_vcpu_stopped(struct kvm_vcpu *vcpu)
454463
{
455-
return vcpu->arch.mp_state.mp_state == KVM_MP_STATE_STOPPED;
464+
return READ_ONCE(vcpu->arch.mp_state.mp_state) == KVM_MP_STATE_STOPPED;
456465
}
457466

458467
static void kvm_arm_vcpu_suspend(struct kvm_vcpu *vcpu)
459468
{
460-
vcpu->arch.mp_state.mp_state = KVM_MP_STATE_SUSPENDED;
469+
WRITE_ONCE(vcpu->arch.mp_state.mp_state, KVM_MP_STATE_SUSPENDED);
461470
kvm_make_request(KVM_REQ_SUSPEND, vcpu);
462471
kvm_vcpu_kick(vcpu);
463472
}
464473

465474
static bool kvm_arm_vcpu_suspended(struct kvm_vcpu *vcpu)
466475
{
467-
return vcpu->arch.mp_state.mp_state == KVM_MP_STATE_SUSPENDED;
476+
return READ_ONCE(vcpu->arch.mp_state.mp_state) == KVM_MP_STATE_SUSPENDED;
468477
}
469478

470479
int kvm_arch_vcpu_ioctl_get_mpstate(struct kvm_vcpu *vcpu,
471480
struct kvm_mp_state *mp_state)
472481
{
473-
*mp_state = vcpu->arch.mp_state;
482+
*mp_state = READ_ONCE(vcpu->arch.mp_state);
474483

475484
return 0;
476485
}
@@ -480,12 +489,14 @@ int kvm_arch_vcpu_ioctl_set_mpstate(struct kvm_vcpu *vcpu,
480489
{
481490
int ret = 0;
482491

492+
spin_lock(&vcpu->arch.mp_state_lock);
493+
483494
switch (mp_state->mp_state) {
484495
case KVM_MP_STATE_RUNNABLE:
485-
vcpu->arch.mp_state = *mp_state;
496+
WRITE_ONCE(vcpu->arch.mp_state, *mp_state);
486497
break;
487498
case KVM_MP_STATE_STOPPED:
488-
kvm_arm_vcpu_power_off(vcpu);
499+
__kvm_arm_vcpu_power_off(vcpu);
489500
break;
490501
case KVM_MP_STATE_SUSPENDED:
491502
kvm_arm_vcpu_suspend(vcpu);
@@ -494,6 +505,8 @@ int kvm_arch_vcpu_ioctl_set_mpstate(struct kvm_vcpu *vcpu,
494505
ret = -EINVAL;
495506
}
496507

508+
spin_unlock(&vcpu->arch.mp_state_lock);
509+
497510
return ret;
498511
}
499512

@@ -1213,7 +1226,7 @@ static int kvm_arch_vcpu_ioctl_vcpu_init(struct kvm_vcpu *vcpu,
12131226
if (test_bit(KVM_ARM_VCPU_POWER_OFF, vcpu->arch.features))
12141227
kvm_arm_vcpu_power_off(vcpu);
12151228
else
1216-
vcpu->arch.mp_state.mp_state = KVM_MP_STATE_RUNNABLE;
1229+
WRITE_ONCE(vcpu->arch.mp_state.mp_state, KVM_MP_STATE_RUNNABLE);
12171230

12181231
return 0;
12191232
}

arch/arm64/kvm/psci.c

Lines changed: 16 additions & 12 deletions
Original file line numberDiff line numberDiff line change
@@ -62,6 +62,7 @@ static unsigned long kvm_psci_vcpu_on(struct kvm_vcpu *source_vcpu)
6262
struct vcpu_reset_state *reset_state;
6363
struct kvm *kvm = source_vcpu->kvm;
6464
struct kvm_vcpu *vcpu = NULL;
65+
int ret = PSCI_RET_SUCCESS;
6566
unsigned long cpu_id;
6667

6768
cpu_id = smccc_get_arg1(source_vcpu);
@@ -76,11 +77,15 @@ static unsigned long kvm_psci_vcpu_on(struct kvm_vcpu *source_vcpu)
7677
*/
7778
if (!vcpu)
7879
return PSCI_RET_INVALID_PARAMS;
80+
81+
spin_lock(&vcpu->arch.mp_state_lock);
7982
if (!kvm_arm_vcpu_stopped(vcpu)) {
8083
if (kvm_psci_version(source_vcpu) != KVM_ARM_PSCI_0_1)
81-
return PSCI_RET_ALREADY_ON;
84+
ret = PSCI_RET_ALREADY_ON;
8285
else
83-
return PSCI_RET_INVALID_PARAMS;
86+
ret = PSCI_RET_INVALID_PARAMS;
87+
88+
goto out_unlock;
8489
}
8590

8691
reset_state = &vcpu->arch.reset_state;
@@ -96,7 +101,7 @@ static unsigned long kvm_psci_vcpu_on(struct kvm_vcpu *source_vcpu)
96101
*/
97102
reset_state->r0 = smccc_get_arg3(source_vcpu);
98103

99-
WRITE_ONCE(reset_state->reset, true);
104+
reset_state->reset = true;
100105
kvm_make_request(KVM_REQ_VCPU_RESET, vcpu);
101106

102107
/*
@@ -108,7 +113,9 @@ static unsigned long kvm_psci_vcpu_on(struct kvm_vcpu *source_vcpu)
108113
vcpu->arch.mp_state.mp_state = KVM_MP_STATE_RUNNABLE;
109114
kvm_vcpu_wake_up(vcpu);
110115

111-
return PSCI_RET_SUCCESS;
116+
out_unlock:
117+
spin_unlock(&vcpu->arch.mp_state_lock);
118+
return ret;
112119
}
113120

114121
static unsigned long kvm_psci_vcpu_affinity_info(struct kvm_vcpu *vcpu)
@@ -168,8 +175,11 @@ static void kvm_prepare_system_event(struct kvm_vcpu *vcpu, u32 type, u64 flags)
168175
* after this call is handled and before the VCPUs have been
169176
* re-initialized.
170177
*/
171-
kvm_for_each_vcpu(i, tmp, vcpu->kvm)
172-
tmp->arch.mp_state.mp_state = KVM_MP_STATE_STOPPED;
178+
kvm_for_each_vcpu(i, tmp, vcpu->kvm) {
179+
spin_lock(&tmp->arch.mp_state_lock);
180+
WRITE_ONCE(tmp->arch.mp_state.mp_state, KVM_MP_STATE_STOPPED);
181+
spin_unlock(&tmp->arch.mp_state_lock);
182+
}
173183
kvm_make_all_cpus_request(vcpu->kvm, KVM_REQ_SLEEP);
174184

175185
memset(&vcpu->run->system_event, 0, sizeof(vcpu->run->system_event));
@@ -229,7 +239,6 @@ static unsigned long kvm_psci_check_allowed_function(struct kvm_vcpu *vcpu, u32
229239

230240
static int kvm_psci_0_2_call(struct kvm_vcpu *vcpu)
231241
{
232-
struct kvm *kvm = vcpu->kvm;
233242
u32 psci_fn = smccc_get_function(vcpu);
234243
unsigned long val;
235244
int ret = 1;
@@ -254,9 +263,7 @@ static int kvm_psci_0_2_call(struct kvm_vcpu *vcpu)
254263
kvm_psci_narrow_to_32bit(vcpu);
255264
fallthrough;
256265
case PSCI_0_2_FN64_CPU_ON:
257-
mutex_lock(&kvm->lock);
258266
val = kvm_psci_vcpu_on(vcpu);
259-
mutex_unlock(&kvm->lock);
260267
break;
261268
case PSCI_0_2_FN_AFFINITY_INFO:
262269
kvm_psci_narrow_to_32bit(vcpu);
@@ -395,7 +402,6 @@ static int kvm_psci_1_x_call(struct kvm_vcpu *vcpu, u32 minor)
395402

396403
static int kvm_psci_0_1_call(struct kvm_vcpu *vcpu)
397404
{
398-
struct kvm *kvm = vcpu->kvm;
399405
u32 psci_fn = smccc_get_function(vcpu);
400406
unsigned long val;
401407

@@ -405,9 +411,7 @@ static int kvm_psci_0_1_call(struct kvm_vcpu *vcpu)
405411
val = PSCI_RET_SUCCESS;
406412
break;
407413
case KVM_PSCI_FN_CPU_ON:
408-
mutex_lock(&kvm->lock);
409414
val = kvm_psci_vcpu_on(vcpu);
410-
mutex_unlock(&kvm->lock);
411415
break;
412416
default:
413417
val = PSCI_RET_NOT_SUPPORTED;

arch/arm64/kvm/reset.c

Lines changed: 5 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -264,15 +264,16 @@ int kvm_reset_vcpu(struct kvm_vcpu *vcpu)
264264

265265
mutex_lock(&vcpu->kvm->lock);
266266
ret = kvm_set_vm_width(vcpu);
267-
if (!ret) {
268-
reset_state = vcpu->arch.reset_state;
269-
WRITE_ONCE(vcpu->arch.reset_state.reset, false);
270-
}
271267
mutex_unlock(&vcpu->kvm->lock);
272268

273269
if (ret)
274270
return ret;
275271

272+
spin_lock(&vcpu->arch.mp_state_lock);
273+
reset_state = vcpu->arch.reset_state;
274+
vcpu->arch.reset_state.reset = false;
275+
spin_unlock(&vcpu->arch.mp_state_lock);
276+
276277
/* Reset PMU outside of the non-preemptible section */
277278
kvm_pmu_vcpu_reset(vcpu);
278279

0 commit comments

Comments
 (0)