mirror of
				git://git.kernel.org/pub/scm/linux/kernel/git/torvalds/linux.git
				synced 2025-09-04 20:19:47 +08:00 
			
		
		
		
	 a2b7861bb3
			
		
	
	
		a2b7861bb3
		
	
	
	
	
		
			
			Currently, in a PREEMPT_COUNT=n kernel, kvm_async_pf_task_wait() can call schedule() to reschedule in some cases. This can accidentally end the current RCU read-side critical section early, causing random memory corruption in the guest, or otherwise preempt the currently running task in the middle of a preempt_disable()/preempt_enable() section. The difficulty in handling this well is that, with PREEMPT_COUNT=n, we cannot tell whether an async PF was delivered in a preemptible section or in an RCU read-side critical section, since preempt_disable()/preempt_enable() and rcu_read_lock()/rcu_read_unlock() are both no-ops in that case. To cure this, we treat any async PF that interrupts a kernel context as one that cannot be preempted, preventing kvm_async_pf_task_wait() from choosing the schedule() path in that case. To do so, a second parameter is added to kvm_async_pf_task_wait() so that it knows whether it was called from a context interrupting the kernel, and the parameter is set properly at all the call sites. Cc: "Paul E. McKenney" <paulmck@linux.vnet.ibm.com> Cc: Peter Zijlstra <peterz@infradead.org> Cc: Wanpeng Li <wanpeng.li@hotmail.com> Cc: stable@vger.kernel.org Signed-off-by: Boqun Feng <boqun.feng@gmail.com> Signed-off-by: Radim Krčmář <rkrcmar@redhat.com>
		
			
				
	
	
		
			131 lines
		
	
	
		
			3.0 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
			
		
		
	
	
			131 lines
		
	
	
		
			3.0 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
| #ifndef _ASM_X86_KVM_PARA_H
 | |
| #define _ASM_X86_KVM_PARA_H
 | |
| 
 | |
| #include <asm/processor.h>
 | |
| #include <asm/alternative.h>
 | |
| #include <uapi/asm/kvm_para.h>
 | |
| 
 | |
/* Declarations only; both functions are defined outside this header. */
void kvmclock_init(void);
int kvm_register_clock(char *txt);
 | |
| 
 | |
/*
 * kvm_check_and_clear_guest_paused() is an out-of-line function when the
 * kernel is built with CONFIG_KVM_GUEST.  Without it, callers get an inline
 * stub that always returns false, so they need no #ifdef of their own.
 */
#ifndef CONFIG_KVM_GUEST
static inline bool kvm_check_and_clear_guest_paused(void)
{
	return false;
}
#else /* CONFIG_KVM_GUEST */
bool kvm_check_and_clear_guest_paused(void);
#endif /* CONFIG_KVM_GUEST */
 | |
| 
 | |
/*
 * Instruction sequence used for KVM hypercalls: three bytes encoding either
 * the vmcall or the vmmcall instruction, with the choice between the two
 * keyed on X86_FEATURE_VMMCALL through ALTERNATIVE().
 */
#define KVM_HYPERCALL \
	ALTERNATIVE(".byte 0x0f,0x01,0xc1", \
		    ".byte 0x0f,0x01,0xd9", \
		    X86_FEATURE_VMMCALL)

/*
 * Calling convention for the kvm_hypercallN() helpers below.
 *
 * The hypervisor may replace the hypercall instruction with something else,
 * but only vmcall and vmmcall themselves are guaranteed to be supported.
 *
 * Up to four arguments may be passed in rbx, rcx, rdx, and rsi respectively.
 * The hypercall number should be placed in rax and the return value will be
 * placed in rax.  No other registers will be clobbered unless explicitly
 * noted by the particular hypercall.
 */
 | |
| 
 | |
| static inline long kvm_hypercall0(unsigned int nr)
 | |
| {
 | |
| 	long ret;
 | |
| 	asm volatile(KVM_HYPERCALL
 | |
| 		     : "=a"(ret)
 | |
| 		     : "a"(nr)
 | |
| 		     : "memory");
 | |
| 	return ret;
 | |
| }
 | |
| 
 | |
| static inline long kvm_hypercall1(unsigned int nr, unsigned long p1)
 | |
| {
 | |
| 	long ret;
 | |
| 	asm volatile(KVM_HYPERCALL
 | |
| 		     : "=a"(ret)
 | |
| 		     : "a"(nr), "b"(p1)
 | |
| 		     : "memory");
 | |
| 	return ret;
 | |
| }
 | |
| 
 | |
| static inline long kvm_hypercall2(unsigned int nr, unsigned long p1,
 | |
| 				  unsigned long p2)
 | |
| {
 | |
| 	long ret;
 | |
| 	asm volatile(KVM_HYPERCALL
 | |
| 		     : "=a"(ret)
 | |
| 		     : "a"(nr), "b"(p1), "c"(p2)
 | |
| 		     : "memory");
 | |
| 	return ret;
 | |
| }
 | |
| 
 | |
| static inline long kvm_hypercall3(unsigned int nr, unsigned long p1,
 | |
| 				  unsigned long p2, unsigned long p3)
 | |
| {
 | |
| 	long ret;
 | |
| 	asm volatile(KVM_HYPERCALL
 | |
| 		     : "=a"(ret)
 | |
| 		     : "a"(nr), "b"(p1), "c"(p2), "d"(p3)
 | |
| 		     : "memory");
 | |
| 	return ret;
 | |
| }
 | |
| 
 | |
| static inline long kvm_hypercall4(unsigned int nr, unsigned long p1,
 | |
| 				  unsigned long p2, unsigned long p3,
 | |
| 				  unsigned long p4)
 | |
| {
 | |
| 	long ret;
 | |
| 	asm volatile(KVM_HYPERCALL
 | |
| 		     : "=a"(ret)
 | |
| 		     : "a"(nr), "b"(p1), "c"(p2), "d"(p3), "S"(p4)
 | |
| 		     : "memory");
 | |
| 	return ret;
 | |
| }
 | |
| 
 | |
| #ifdef CONFIG_KVM_GUEST
 | |
| bool kvm_para_available(void);
 | |
| unsigned int kvm_arch_para_features(void);
 | |
| void __init kvm_guest_init(void);
 | |
| void kvm_async_pf_task_wait(u32 token, int interrupt_kernel);
 | |
| void kvm_async_pf_task_wake(u32 token);
 | |
| u32 kvm_read_and_reset_pf_reason(void);
 | |
| extern void kvm_disable_steal_time(void);
 | |
| 
 | |
/*
 * kvm_spinlock_init() is an out-of-line __init function only when
 * CONFIG_PARAVIRT_SPINLOCKS is enabled; otherwise it is an empty inline
 * stub, so callers need no #ifdef of their own.
 */
#ifndef CONFIG_PARAVIRT_SPINLOCKS
static inline void kvm_spinlock_init(void)
{
	/* Nothing to set up without paravirt spinlocks. */
}
#else /* CONFIG_PARAVIRT_SPINLOCKS */
void __init kvm_spinlock_init(void);
#endif /* CONFIG_PARAVIRT_SPINLOCKS */
 | |
| 
 | |
| #else /* CONFIG_KVM_GUEST */
 | |
/*
 * !CONFIG_KVM_GUEST: these entry points collapse to empty statements.
 * The macro arguments are discarded without being evaluated.
 */
#define kvm_guest_init()		do { } while (0)
#define kvm_async_pf_task_wait(T, I)	do { } while (0)
#define kvm_async_pf_task_wake(T)	do { } while (0)
 | |
| 
 | |
/* !CONFIG_KVM_GUEST stub: always reports false. */
static inline bool kvm_para_available(void)
{
	return false;
}
 | |
| 
 | |
/* !CONFIG_KVM_GUEST stub: always returns an empty (zero) feature value. */
static inline unsigned int kvm_arch_para_features(void)
{
	return 0U;
}
 | |
| 
 | |
| static inline u32 kvm_read_and_reset_pf_reason(void)
 | |
| {
 | |
| 	return 0;
 | |
| }
 | |
| 
 | |
/* !CONFIG_KVM_GUEST stub: does nothing. */
static inline void kvm_disable_steal_time(void)
{
}
 | |
| #endif
 | |
| 
 | |
| #endif /* _ASM_X86_KVM_PARA_H */
 |