Skip to content

Commit eb0461c

Browse files
dwmw2gregkh
authored andcommitted
KVM: x86: switch pvclock_gtod_sync_lock to a raw spinlock
commit 8228c77 upstream. On the preemption path when updating a Xen guest's runstate times, this lock is taken inside the scheduler rq->lock, which is a raw spinlock. This was shown in a lockdep warning: [ 89.138354] ============================= [ 89.138356] [ BUG: Invalid wait context ] [ 89.138358] 5.15.0-rc5+ #834 Tainted: G S I E [ 89.138360] ----------------------------- [ 89.138361] xen_shinfo_test/2575 is trying to lock: [ 89.138363] ffffa34a0364efd8 (&kvm->arch.pvclock_gtod_sync_lock){....}-{3:3}, at: get_kvmclock_ns+0x1f/0x130 [kvm] [ 89.138442] other info that might help us debug this: [ 89.138444] context-{5:5} [ 89.138445] 4 locks held by xen_shinfo_test/2575: [ 89.138447] #0: ffff972bdc3b8108 (&vcpu->mutex){+.+.}-{4:4}, at: kvm_vcpu_ioctl+0x77/0x6f0 [kvm] [ 89.138483] #1: ffffa34a03662e90 (&kvm->srcu){....}-{0:0}, at: kvm_arch_vcpu_ioctl_run+0xdc/0x8b0 [kvm] [ 89.138526] #2: ffff97331fdbac98 (&rq->__lock){-.-.}-{2:2}, at: __schedule+0xff/0xbd0 [ 89.138534] #3: ffffa34a03662e90 (&kvm->srcu){....}-{0:0}, at: kvm_arch_vcpu_put+0x26/0x170 [kvm] ... [ 89.138695] get_kvmclock_ns+0x1f/0x130 [kvm] [ 89.138734] kvm_xen_update_runstate+0x14/0x90 [kvm] [ 89.138783] kvm_xen_update_runstate_guest+0x15/0xd0 [kvm] [ 89.138830] kvm_arch_vcpu_put+0xe6/0x170 [kvm] [ 89.138870] kvm_sched_out+0x2f/0x40 [kvm] [ 89.138900] __schedule+0x5de/0xbd0 Cc: [email protected] Reported-by: [email protected] Fixes: 30b5c85 ("KVM: x86/xen: Add support for vCPU runstate information") Signed-off-by: David Woodhouse <[email protected]> Message-Id: <[email protected]> Signed-off-by: Paolo Bonzini <[email protected]> Signed-off-by: Greg Kroah-Hartman <[email protected]>
1 parent 10242cc commit eb0461c

File tree

2 files changed

+15
-15
lines changed

2 files changed

+15
-15
lines changed

arch/x86/include/asm/kvm_host.h

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1084,7 +1084,7 @@ struct kvm_arch {
10841084
u64 cur_tsc_generation;
10851085
int nr_vcpus_matched_tsc;
10861086

1087-
spinlock_t pvclock_gtod_sync_lock;
1087+
raw_spinlock_t pvclock_gtod_sync_lock;
10881088
bool use_master_clock;
10891089
u64 master_kernel_ns;
10901090
u64 master_cycle_now;

arch/x86/kvm/x86.c

Lines changed: 14 additions & 14 deletions
Original file line numberDiff line numberDiff line change
@@ -2537,15 +2537,15 @@ static void kvm_synchronize_tsc(struct kvm_vcpu *vcpu, u64 data)
25372537
kvm_vcpu_write_tsc_offset(vcpu, offset);
25382538
raw_spin_unlock_irqrestore(&kvm->arch.tsc_write_lock, flags);
25392539

2540-
spin_lock_irqsave(&kvm->arch.pvclock_gtod_sync_lock, flags);
2540+
raw_spin_lock_irqsave(&kvm->arch.pvclock_gtod_sync_lock, flags);
25412541
if (!matched) {
25422542
kvm->arch.nr_vcpus_matched_tsc = 0;
25432543
} else if (!already_matched) {
25442544
kvm->arch.nr_vcpus_matched_tsc++;
25452545
}
25462546

25472547
kvm_track_tsc_matching(vcpu);
2548-
spin_unlock_irqrestore(&kvm->arch.pvclock_gtod_sync_lock, flags);
2548+
raw_spin_unlock_irqrestore(&kvm->arch.pvclock_gtod_sync_lock, flags);
25492549
}
25502550

25512551
static inline void adjust_tsc_offset_guest(struct kvm_vcpu *vcpu,
@@ -2775,9 +2775,9 @@ static void kvm_gen_update_masterclock(struct kvm *kvm)
27752775
kvm_make_mclock_inprogress_request(kvm);
27762776

27772777
/* no guest entries from this point */
2778-
spin_lock_irqsave(&ka->pvclock_gtod_sync_lock, flags);
2778+
raw_spin_lock_irqsave(&ka->pvclock_gtod_sync_lock, flags);
27792779
pvclock_update_vm_gtod_copy(kvm);
2780-
spin_unlock_irqrestore(&ka->pvclock_gtod_sync_lock, flags);
2780+
raw_spin_unlock_irqrestore(&ka->pvclock_gtod_sync_lock, flags);
27812781

27822782
kvm_for_each_vcpu(i, vcpu, kvm)
27832783
kvm_make_request(KVM_REQ_CLOCK_UPDATE, vcpu);
@@ -2795,15 +2795,15 @@ u64 get_kvmclock_ns(struct kvm *kvm)
27952795
unsigned long flags;
27962796
u64 ret;
27972797

2798-
spin_lock_irqsave(&ka->pvclock_gtod_sync_lock, flags);
2798+
raw_spin_lock_irqsave(&ka->pvclock_gtod_sync_lock, flags);
27992799
if (!ka->use_master_clock) {
2800-
spin_unlock_irqrestore(&ka->pvclock_gtod_sync_lock, flags);
2800+
raw_spin_unlock_irqrestore(&ka->pvclock_gtod_sync_lock, flags);
28012801
return get_kvmclock_base_ns() + ka->kvmclock_offset;
28022802
}
28032803

28042804
hv_clock.tsc_timestamp = ka->master_cycle_now;
28052805
hv_clock.system_time = ka->master_kernel_ns + ka->kvmclock_offset;
2806-
spin_unlock_irqrestore(&ka->pvclock_gtod_sync_lock, flags);
2806+
raw_spin_unlock_irqrestore(&ka->pvclock_gtod_sync_lock, flags);
28072807

28082808
/* both __this_cpu_read() and rdtsc() should be on the same cpu */
28092809
get_cpu();
@@ -2897,13 +2897,13 @@ static int kvm_guest_time_update(struct kvm_vcpu *v)
28972897
* If the host uses TSC clock, then passthrough TSC as stable
28982898
* to the guest.
28992899
*/
2900-
spin_lock_irqsave(&ka->pvclock_gtod_sync_lock, flags);
2900+
raw_spin_lock_irqsave(&ka->pvclock_gtod_sync_lock, flags);
29012901
use_master_clock = ka->use_master_clock;
29022902
if (use_master_clock) {
29032903
host_tsc = ka->master_cycle_now;
29042904
kernel_ns = ka->master_kernel_ns;
29052905
}
2906-
spin_unlock_irqrestore(&ka->pvclock_gtod_sync_lock, flags);
2906+
raw_spin_unlock_irqrestore(&ka->pvclock_gtod_sync_lock, flags);
29072907

29082908
/* Keep irq disabled to prevent changes to the clock */
29092909
local_irq_save(flags);
@@ -6101,13 +6101,13 @@ long kvm_arch_vm_ioctl(struct file *filp,
61016101
* is slightly ahead) here we risk going negative on unsigned
61026102
* 'system_time' when 'user_ns.clock' is very small.
61036103
*/
6104-
spin_lock_irq(&ka->pvclock_gtod_sync_lock);
6104+
raw_spin_lock_irq(&ka->pvclock_gtod_sync_lock);
61056105
if (kvm->arch.use_master_clock)
61066106
now_ns = ka->master_kernel_ns;
61076107
else
61086108
now_ns = get_kvmclock_base_ns();
61096109
ka->kvmclock_offset = user_ns.clock - now_ns;
6110-
spin_unlock_irq(&ka->pvclock_gtod_sync_lock);
6110+
raw_spin_unlock_irq(&ka->pvclock_gtod_sync_lock);
61116111

61126112
kvm_make_all_cpus_request(kvm, KVM_REQ_CLOCK_UPDATE);
61136113
break;
@@ -8157,9 +8157,9 @@ static void kvm_hyperv_tsc_notifier(void)
81578157
list_for_each_entry(kvm, &vm_list, vm_list) {
81588158
struct kvm_arch *ka = &kvm->arch;
81598159

8160-
spin_lock_irqsave(&ka->pvclock_gtod_sync_lock, flags);
8160+
raw_spin_lock_irqsave(&ka->pvclock_gtod_sync_lock, flags);
81618161
pvclock_update_vm_gtod_copy(kvm);
8162-
spin_unlock_irqrestore(&ka->pvclock_gtod_sync_lock, flags);
8162+
raw_spin_unlock_irqrestore(&ka->pvclock_gtod_sync_lock, flags);
81638163

81648164
kvm_for_each_vcpu(cpu, vcpu, kvm)
81658165
kvm_make_request(KVM_REQ_CLOCK_UPDATE, vcpu);
@@ -11148,7 +11148,7 @@ int kvm_arch_init_vm(struct kvm *kvm, unsigned long type)
1114811148

1114911149
raw_spin_lock_init(&kvm->arch.tsc_write_lock);
1115011150
mutex_init(&kvm->arch.apic_map_lock);
11151-
spin_lock_init(&kvm->arch.pvclock_gtod_sync_lock);
11151+
raw_spin_lock_init(&kvm->arch.pvclock_gtod_sync_lock);
1115211152

1115311153
kvm->arch.kvmclock_offset = -get_kvmclock_base_ns();
1115411154
pvclock_update_vm_gtod_copy(kvm);

0 commit comments

Comments
 (0)