Skip to content

Commit 3a025de

Browse files
yisun-git authored and KAGA-KOKO committed
x86/hyperv: Enable PV qspinlock for Hyper-V
Implement the required wait and kick callbacks to support PV spinlocks in
Hyper-V guests.

[ tglx: Document the requirement for disabling interrupts in the wait()
  callback. Remove goto and unnecessary includes. Add prototype for
  hv_vcpu_is_preempted(). Adapted to pending paravirt changes. ]

Signed-off-by: Yi Sun <yi.y.sun@linux.intel.com>
Signed-off-by: Thomas Gleixner <tglx@linutronix.de>
Reviewed-by: Juergen Gross <jgross@suse.com>
Cc: "K. Y. Srinivasan" <kys@microsoft.com>
Cc: Haiyang Zhang <haiyangz@microsoft.com>
Cc: Stephen Hemminger <sthemmin@microsoft.com>
Cc: Michael Kelley (EOSG) <Michael.H.Kelley@microsoft.com>
Cc: chao.p.peng@intel.com
Cc: chao.gao@intel.com
Cc: isaku.yamahata@intel.com
Cc: tianyu.lan@microsoft.com
Link: https://lkml.kernel.org/r/1538987374-51217-3-git-send-email-yi.y.sun@linux.intel.com
1 parent f726c46 commit 3a025de

File tree

5 files changed

+113
-0
lines changed

5 files changed

+113
-0
lines changed

Documentation/admin-guide/kernel-parameters.txt

Lines changed: 5 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -1385,6 +1385,11 @@
13851385
hvc_iucv_allow= [S390] Comma-separated list of z/VM user IDs.
13861386
If specified, z/VM IUCV HVC accepts connections
13871387
from listed z/VM user IDs only.
1388+
1389+
hv_nopvspin [X86,HYPER_V] Disables the paravirt spinlock optimizations
1390+
which allow the hypervisor to 'idle' the
1391+
guest on lock contention.
1392+
13881393
keep_bootcon [KNL]
13891394
Do not unregister boot console at start. This is only
13901395
useful for debugging when something happens in the window

arch/x86/hyperv/Makefile

Lines changed: 4 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -1,2 +1,6 @@
11
obj-y := hv_init.o mmu.o nested.o
22
obj-$(CONFIG_X86_64) += hv_apic.o
3+
4+
ifdef CONFIG_X86_64
5+
obj-$(CONFIG_PARAVIRT_SPINLOCKS) += hv_spinlock.o
6+
endif

arch/x86/hyperv/hv_spinlock.c

Lines changed: 88 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,88 @@
1+
// SPDX-License-Identifier: GPL-2.0
2+
3+
/*
4+
* Hyper-V specific spinlock code.
5+
*
6+
* Copyright (C) 2018, Intel, Inc.
7+
*
8+
* Author : Yi Sun <yi.y.sun@intel.com>
9+
*/
10+
11+
#define pr_fmt(fmt) "Hyper-V: " fmt
12+
13+
#include <linux/spinlock.h>
14+
15+
#include <asm/mshyperv.h>
16+
#include <asm/paravirt.h>
17+
#include <asm/apic.h>
18+
19+
/*
 * Boot-time switch for the Hyper-V PV spinlock support. Defaults to on;
 * the "hv_nopvspin" early parameter handler clears it, in which case
 * hv_init_spinlocks() reports PV spinlocks as disabled and returns.
 */
static bool __initdata hv_pvspin = true;
20+
21+
static void hv_qlock_kick(int cpu)
22+
{
23+
apic->send_IPI(cpu, X86_PLATFORM_IPI_VECTOR);
24+
}
25+
26+
/*
 * PV qspinlock wait callback: ask the hypervisor to idle this vCPU for as
 * long as *@byte still holds @val.
 *
 * Returns immediately, without waiting, when called from NMI context.
 */
static void hv_qlock_wait(u8 *byte, u8 val)
{
	unsigned long irq_state;

	if (in_nmi())
		return;

	/*
	 * A read of the HV_X64_MSR_GUEST_IDLE MSR signals to the hypervisor
	 * that this vCPU may be placed into 'idle' state. An IPI, normally
	 * the one sent by hv_qlock_kick(), ends that state even while
	 * interrupts are disabled on the vCPU.
	 *
	 * Interrupts must be off before the MSR is accessed in order to
	 * close a race with the unlock path: should the IPI from
	 * hv_qlock_kick() land after the lock value check but before the
	 * rdmsrl(), the hypervisor might idle the vCPU and keep it in that
	 * state for an unspecified amount of time.
	 */
	local_irq_save(irq_state);

	/* Request idle only while the lock state is still unchanged. */
	if (READ_ONCE(*byte) == val) {
		unsigned long msr_val;

		rdmsrl(HV_X64_MSR_GUEST_IDLE, msr_val);
		/* Only the MSR access matters; the value read is not used. */
		(void)msr_val;
	}

	local_irq_restore(irq_state);
}
55+
56+
/*
57+
* Hyper-V does not support this so far.
58+
*/
59+
bool hv_vcpu_is_preempted(int vcpu)
60+
{
61+
return false;
62+
}
63+
PV_CALLEE_SAVE_REGS_THUNK(hv_vcpu_is_preempted);
64+
65+
/*
 * Install the paravirt qspinlock callbacks for Hyper-V guests.
 *
 * PV spinlocks are enabled only when all of the following hold:
 *  - they have not been turned off via hv_pvspin,
 *  - an APIC driver is set (the kick callback sends an IPI through it),
 *  - ms_hyperv.hints has HV_X64_CLUSTER_IPI_RECOMMENDED set,
 *  - ms_hyperv.features has HV_X64_MSR_GUEST_IDLE_AVAILABLE set (the wait
 *    callback reads that MSR).
 *
 * Otherwise pv_ops.lock is left untouched. The outcome is logged either way.
 */
void __init hv_init_spinlocks(void)
{
	bool usable;

	usable = hv_pvspin && apic &&
		 (ms_hyperv.hints & HV_X64_CLUSTER_IPI_RECOMMENDED) &&
		 (ms_hyperv.features & HV_X64_MSR_GUEST_IDLE_AVAILABLE);

	if (!usable) {
		pr_info("PV spinlocks disabled\n");
		return;
	}

	pr_info("PV spinlocks enabled\n");

	__pv_init_lock_hash();

	/* Generic PV qspinlock slow path and unlock. */
	pv_ops.lock.queued_spin_lock_slowpath = __pv_queued_spin_lock_slowpath;
	pv_ops.lock.queued_spin_unlock = PV_CALLEE_SAVE(__pv_queued_spin_unlock);

	/* Hyper-V specific callbacks. */
	pv_ops.lock.wait = hv_qlock_wait;
	pv_ops.lock.kick = hv_qlock_kick;
	pv_ops.lock.vcpu_is_preempted = PV_CALLEE_SAVE(hv_vcpu_is_preempted);
}
82+
83+
static __init int hv_parse_nopvspin(char *arg)
84+
{
85+
hv_pvspin = false;
86+
return 0;
87+
}
88+
early_param("hv_nopvspin", hv_parse_nopvspin);

arch/x86/include/asm/mshyperv.h

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -351,6 +351,8 @@ int hyperv_flush_guest_mapping(u64 as);
351351

352352
#ifdef CONFIG_X86_64
353353
void hv_apic_init(void);
354+
void __init hv_init_spinlocks(void);
355+
bool hv_vcpu_is_preempted(int vcpu);
354356
#else
355357
static inline void hv_apic_init(void) {}
356358
#endif

arch/x86/kernel/cpu/mshyperv.c

Lines changed: 14 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -199,6 +199,16 @@ static unsigned long hv_get_tsc_khz(void)
199199
return freq / 1000;
200200
}
201201

202+
#if defined(CONFIG_SMP) && IS_ENABLED(CONFIG_HYPERV)
/*
 * Boot CPU preparation for Hyper-V guests: run the native preparation
 * first, then, on 64-bit kernels built with CONFIG_PARAVIRT_SPINLOCKS,
 * call hv_init_spinlocks().
 */
static void __init hv_smp_prepare_boot_cpu(void)
{
	native_smp_prepare_boot_cpu();

#if defined(CONFIG_X86_64) && defined(CONFIG_PARAVIRT_SPINLOCKS)
	hv_init_spinlocks();
#endif /* CONFIG_X86_64 && CONFIG_PARAVIRT_SPINLOCKS */
}
#endif /* CONFIG_SMP && CONFIG_HYPERV */
211+
202212
static void __init ms_hyperv_init_platform(void)
203213
{
204214
int hv_host_info_eax;
@@ -303,6 +313,10 @@ static void __init ms_hyperv_init_platform(void)
303313
if (ms_hyperv.misc_features & HV_STIMER_DIRECT_MODE_AVAILABLE)
304314
alloc_intr_gate(HYPERV_STIMER0_VECTOR,
305315
hv_stimer0_callback_vector);
316+
317+
# ifdef CONFIG_SMP
318+
smp_ops.smp_prepare_boot_cpu = hv_smp_prepare_boot_cpu;
319+
# endif
306320
#endif
307321
}
308322

0 commit comments

Comments
 (0)