diff options
Diffstat (limited to 'arch/x86/include')
61 files changed, 616 insertions, 719 deletions
| diff --git a/arch/x86/include/asm/alternative.h b/arch/x86/include/asm/alternative.h index e77a6443104f..1b020381ab38 100644 --- a/arch/x86/include/asm/alternative.h +++ b/arch/x86/include/asm/alternative.h @@ -217,10 +217,14 @@ static inline int alternatives_text_reserved(void *start, void *end)   */  #define alternative_call_2(oldfunc, newfunc1, feature1, newfunc2, feature2,   \  			   output, input...)				      \ +{									      \ +	register void *__sp asm(_ASM_SP);				      \  	asm volatile (ALTERNATIVE_2("call %P[old]", "call %P[new1]", feature1,\  		"call %P[new2]", feature2)				      \ -		: output : [old] "i" (oldfunc), [new1] "i" (newfunc1),	      \ -		[new2] "i" (newfunc2), ## input) +		: output, "+r" (__sp)					      \ +		: [old] "i" (oldfunc), [new1] "i" (newfunc1),		      \ +		  [new2] "i" (newfunc2), ## input);			      \ +}  /*   * use this macro(s) if you need more than one output parameter diff --git a/arch/x86/include/asm/apic.h b/arch/x86/include/asm/apic.h index 124357773ffa..f5aaf6c83222 100644 --- a/arch/x86/include/asm/apic.h +++ b/arch/x86/include/asm/apic.h @@ -650,8 +650,8 @@ static inline void entering_ack_irq(void)  static inline void ipi_entering_ack_irq(void)  { -	ack_APIC_irq();  	irq_enter(); +	ack_APIC_irq();  }  static inline void exiting_irq(void) @@ -661,9 +661,8 @@ static inline void exiting_irq(void)  static inline void exiting_ack_irq(void)  { -	irq_exit(); -	/* Ack only at the end to avoid potential reentry */  	ack_APIC_irq(); +	irq_exit();  }  extern void ioapic_zap_locks(void); diff --git a/arch/x86/include/asm/cacheflush.h b/arch/x86/include/asm/cacheflush.h index 61518cf79437..872877d930de 100644 --- a/arch/x86/include/asm/cacheflush.h +++ b/arch/x86/include/asm/cacheflush.h @@ -4,7 +4,6 @@  /* Caches aren't brain-dead on the intel. */  #include <asm-generic/cacheflush.h>  #include <asm/special_insns.h> -#include <asm/uaccess.h>  /*   * The set_memory_* API can be used to change various attributes of a virtual diff --git a/arch/x86/include/asm/cmpxchg.h b/arch/x86/include/asm/cmpxchg.h index 9733361fed6f..97848cdfcb1a 100644 --- a/arch/x86/include/asm/cmpxchg.h +++ b/arch/x86/include/asm/cmpxchg.h @@ -158,53 +158,9 @@ extern void __add_wrong_size(void)   * value of "*ptr".   *   * xadd() is locked when multiple CPUs are online - * xadd_sync() is always locked - * xadd_local() is never locked   */  #define __xadd(ptr, inc, lock)	__xchg_op((ptr), (inc), xadd, lock)  #define xadd(ptr, inc)		__xadd((ptr), (inc), LOCK_PREFIX) -#define xadd_sync(ptr, inc)	__xadd((ptr), (inc), "lock; ") -#define xadd_local(ptr, inc)	__xadd((ptr), (inc), "") - -#define __add(ptr, inc, lock)						\ -	({								\ -	        __typeof__ (*(ptr)) __ret = (inc);			\ -		switch (sizeof(*(ptr))) {				\ -		case __X86_CASE_B:					\ -			asm volatile (lock "addb %b1, %0\n"		\ -				      : "+m" (*(ptr)) : "qi" (inc)	\ -				      : "memory", "cc");		\ -			break;						\ -		case __X86_CASE_W:					\ -			asm volatile (lock "addw %w1, %0\n"		\ -				      : "+m" (*(ptr)) : "ri" (inc)	\ -				      : "memory", "cc");		\ -			break;						\ -		case __X86_CASE_L:					\ -			asm volatile (lock "addl %1, %0\n"		\ -				      : "+m" (*(ptr)) : "ri" (inc)	\ -				      : "memory", "cc");		\ -			break;						\ -		case __X86_CASE_Q:					\ -			asm volatile (lock "addq %1, %0\n"		\ -				      : "+m" (*(ptr)) : "ri" (inc)	\ -				      : "memory", "cc");		\ -			break;						\ -		default:						\ -			__add_wrong_size();				\ -		}							\ -		__ret;							\ -	}) - -/* - * add_*() adds "inc" to "*ptr" - * - * __add() takes a lock prefix - * add_smp() is locked when multiple CPUs are online - * add_sync() is always locked - */ -#define add_smp(ptr, inc)	__add((ptr), (inc), LOCK_PREFIX) -#define add_sync(ptr, inc)	__add((ptr), (inc), "lock; ")  #define __cmpxchg_double(pfx, p1, p2, o1, o2, n1, n2)			\  ({									\ diff --git a/arch/x86/include/asm/compat.h b/arch/x86/include/asm/compat.h index a18806165fe4..03d269bed941 100644 --- a/arch/x86/include/asm/compat.h +++ b/arch/x86/include/asm/compat.h @@ -275,10 +275,10 @@ struct compat_shmid64_ds {  #ifdef CONFIG_X86_X32_ABI  typedef struct user_regs_struct compat_elf_gregset_t; -#define PR_REG_SIZE(S) (test_thread_flag(TIF_IA32) ? 68 : 216) -#define PRSTATUS_SIZE(S) (test_thread_flag(TIF_IA32) ? 144 : 296) -#define SET_PR_FPVALID(S,V) \ -  do { *(int *) (((void *) &((S)->pr_reg)) + PR_REG_SIZE(0)) = (V); } \ +/* Full regset -- prstatus on x32, otherwise on ia32 */ +#define PRSTATUS_SIZE(S, R) (R != sizeof(S.pr_reg) ? 144 : 296) +#define SET_PR_FPVALID(S, V, R) \ +  do { *(int *) (((void *) &((S)->pr_reg)) + R) = (V); } \    while (0)  #define COMPAT_USE_64BIT_TIME \ diff --git a/arch/x86/include/asm/cpufeatures.h b/arch/x86/include/asm/cpufeatures.h index 92a8308b96f6..a39629206864 100644 --- a/arch/x86/include/asm/cpufeatures.h +++ b/arch/x86/include/asm/cpufeatures.h @@ -106,7 +106,6 @@  #define X86_FEATURE_APERFMPERF	( 3*32+28) /* APERFMPERF */  #define X86_FEATURE_EAGER_FPU	( 3*32+29) /* "eagerfpu" Non lazy FPU restore */  #define X86_FEATURE_NONSTOP_TSC_S3 ( 3*32+30) /* TSC doesn't stop in S3 state */ -#define X86_FEATURE_MCE_RECOVERY ( 3*32+31) /* cpu has recoverable machine checks */  /* Intel-defined CPU features, CPUID level 0x00000001 (ecx), word 4 */  #define X86_FEATURE_XMM3	( 4*32+ 0) /* "pni" SSE-3 */ @@ -195,6 +194,8 @@  #define X86_FEATURE_PROC_FEEDBACK ( 7*32+ 9) /* AMD ProcFeedbackInterface */  #define X86_FEATURE_INTEL_PT	( 7*32+15) /* Intel Processor Trace */ +#define X86_FEATURE_AVX512_4VNNIW (7*32+16) /* AVX-512 Neural Network Instructions */ +#define X86_FEATURE_AVX512_4FMAPS (7*32+17) /* AVX-512 Multiply Accumulation Single precision */  /* Virtualization flags: Linux defined, word 8 */  #define X86_FEATURE_TPR_SHADOW  ( 8*32+ 0) /* Intel TPR Shadow */ diff --git a/arch/x86/include/asm/desc.h b/arch/x86/include/asm/desc.h index 4e10d73cf018..12080d87da3b 100644 --- a/arch/x86/include/asm/desc.h +++ b/arch/x86/include/asm/desc.h @@ -36,7 +36,7 @@ static inline void fill_ldt(struct desc_struct *desc, const struct user_desc *in  extern struct desc_ptr idt_descr;  extern gate_desc idt_table[]; -extern struct desc_ptr debug_idt_descr; +extern const struct desc_ptr debug_idt_descr;  extern gate_desc debug_idt_table[];  struct gdt_page { diff --git a/arch/x86/include/asm/e820.h b/arch/x86/include/asm/e820.h index 3ab0537872fb..476b574de99e 100644 --- a/arch/x86/include/asm/e820.h +++ b/arch/x86/include/asm/e820.h @@ -10,8 +10,8 @@  #include <uapi/asm/e820.h>  #ifndef __ASSEMBLY__  /* see comment in arch/x86/kernel/e820.c */ -extern struct e820map e820; -extern struct e820map e820_saved; +extern struct e820map *e820; +extern struct e820map *e820_saved;  extern unsigned long pci_mem_start;  extern int e820_any_mapped(u64 start, u64 end, unsigned type); @@ -53,6 +53,8 @@ extern void e820_reserve_resources_late(void);  extern void setup_memory_map(void);  extern char *default_machine_specific_memory_setup(void); +extern void e820_reallocate_tables(void); +  /*   * Returns true iff the specified range [s,e) is completely contained inside   * the ISA region. diff --git a/arch/x86/include/asm/efi.h b/arch/x86/include/asm/efi.h index d0bb76d81402..389d700b961e 100644 --- a/arch/x86/include/asm/efi.h +++ b/arch/x86/include/asm/efi.h @@ -117,7 +117,6 @@ extern int __init efi_memblock_x86_reserve_range(void);  extern pgd_t * __init efi_call_phys_prolog(void);  extern void __init efi_call_phys_epilog(pgd_t *save_pgd);  extern void __init efi_print_memmap(void); -extern void __init efi_unmap_memmap(void);  extern void __init efi_memory_uc(u64 addr, unsigned long size);  extern void __init efi_map_region(efi_memory_desc_t *md);  extern void __init efi_map_region_fixed(efi_memory_desc_t *md); @@ -192,14 +191,7 @@ static inline efi_status_t efi_thunk_set_virtual_address_map(  struct efi_config {  	u64 image_handle;  	u64 table; -	u64 allocate_pool; -	u64 allocate_pages; -	u64 get_memory_map; -	u64 free_pool; -	u64 free_pages; -	u64 locate_handle; -	u64 handle_protocol; -	u64 exit_boot_services; +	u64 boot_services;  	u64 text_output;  	efi_status_t (*call)(unsigned long, ...);  	bool is64; @@ -207,14 +199,27 @@ struct efi_config {  __pure const struct efi_config *__efi_early(void); +static inline bool efi_is_64bit(void) +{ +	if (!IS_ENABLED(CONFIG_X86_64)) +		return false; + +	if (!IS_ENABLED(CONFIG_EFI_MIXED)) +		return true; + +	return __efi_early()->is64; +} +  #define efi_call_early(f, ...)						\ -	__efi_early()->call(__efi_early()->f, __VA_ARGS__); +	__efi_early()->call(efi_is_64bit() ?				\ +		((efi_boot_services_64_t *)(unsigned long)		\ +			__efi_early()->boot_services)->f :		\ +		((efi_boot_services_32_t *)(unsigned long)		\ +			__efi_early()->boot_services)->f, __VA_ARGS__)  #define __efi_call_early(f, ...)					\  	__efi_early()->call((unsigned long)f, __VA_ARGS__); -#define efi_is_64bit()		__efi_early()->is64 -  extern bool efi_reboot_required(void);  #else diff --git a/arch/x86/include/asm/export.h b/arch/x86/include/asm/export.h new file mode 100644 index 000000000000..138de56b13eb --- /dev/null +++ b/arch/x86/include/asm/export.h @@ -0,0 +1,4 @@ +#ifdef CONFIG_64BIT +#define KSYM_ALIGN 16 +#endif +#include <asm-generic/export.h> diff --git a/arch/x86/include/asm/extable.h b/arch/x86/include/asm/extable.h new file mode 100644 index 000000000000..b8ad261d11dc --- /dev/null +++ b/arch/x86/include/asm/extable.h @@ -0,0 +1,35 @@ +#ifndef _ASM_X86_EXTABLE_H +#define _ASM_X86_EXTABLE_H +/* + * The exception table consists of triples of addresses relative to the + * exception table entry itself. The first address is of an instruction + * that is allowed to fault, the second is the target at which the program + * should continue. The third is a handler function to deal with the fault + * caused by the instruction in the first field. + * + * All the routines below use bits of fixup code that are out of line + * with the main instruction path.  This means when everything is well, + * we don't even have to jump over them.  Further, they do not intrude + * on our cache or tlb entries. + */ + +struct exception_table_entry { +	int insn, fixup, handler; +}; +struct pt_regs; + +#define ARCH_HAS_RELATIVE_EXTABLE + +#define swap_ex_entry_fixup(a, b, tmp, delta)			\ +	do {							\ +		(a)->fixup = (b)->fixup + (delta);		\ +		(b)->fixup = (tmp).fixup - (delta);		\ +		(a)->handler = (b)->handler + (delta);		\ +		(b)->handler = (tmp).handler - (delta);		\ +	} while (0) + +extern int fixup_exception(struct pt_regs *regs, int trapnr); +extern bool ex_has_fault_handler(unsigned long ip); +extern void early_fixup_exception(struct pt_regs *regs, int trapnr); + +#endif diff --git a/arch/x86/include/asm/fpu/signal.h b/arch/x86/include/asm/fpu/signal.h index 0e970d00dfcd..20a1fbf7fe4e 100644 --- a/arch/x86/include/asm/fpu/signal.h +++ b/arch/x86/include/asm/fpu/signal.h @@ -19,6 +19,12 @@ int ia32_setup_frame(int sig, struct ksignal *ksig,  # define ia32_setup_rt_frame	__setup_rt_frame  #endif +#ifdef CONFIG_COMPAT +int __copy_siginfo_to_user32(compat_siginfo_t __user *to, +		const siginfo_t *from, bool x32_ABI); +#endif + +  extern void convert_from_fxsr(struct user_i387_ia32_struct *env,  			      struct task_struct *tsk);  extern void convert_to_fxsr(struct task_struct *tsk, diff --git a/arch/x86/include/asm/fpu/xstate.h b/arch/x86/include/asm/fpu/xstate.h index ae55a43e09c0..430bacf73074 100644 --- a/arch/x86/include/asm/fpu/xstate.h +++ b/arch/x86/include/asm/fpu/xstate.h @@ -27,11 +27,12 @@  				 XFEATURE_MASK_YMM | \  				 XFEATURE_MASK_OPMASK | \  				 XFEATURE_MASK_ZMM_Hi256 | \ -				 XFEATURE_MASK_Hi16_ZMM	 | \ -				 XFEATURE_MASK_PKRU) +				 XFEATURE_MASK_Hi16_ZMM)  /* Supported features which require eager state saving */ -#define XFEATURE_MASK_EAGER	(XFEATURE_MASK_BNDREGS | XFEATURE_MASK_BNDCSR) +#define XFEATURE_MASK_EAGER	(XFEATURE_MASK_BNDREGS | \ +				 XFEATURE_MASK_BNDCSR | \ +				 XFEATURE_MASK_PKRU)  /* All currently supported features */  #define XCNTXT_MASK	(XFEATURE_MASK_LAZY | XFEATURE_MASK_EAGER) @@ -45,7 +46,8 @@  extern u64 xfeatures_mask;  extern u64 xstate_fx_sw_bytes[USER_XSTATE_FX_SW_WORDS]; -extern void update_regset_xstate_info(unsigned int size, u64 xstate_mask); +extern void __init update_regset_xstate_info(unsigned int size, +					     u64 xstate_mask);  void fpu__xstate_clear_all_cpu_caps(void);  void *get_xsave_addr(struct xregs_state *xsave, int xstate); diff --git a/arch/x86/include/asm/ftrace.h b/arch/x86/include/asm/ftrace.h index a4820d4df617..eccd0ac6bc38 100644 --- a/arch/x86/include/asm/ftrace.h +++ b/arch/x86/include/asm/ftrace.h @@ -6,6 +6,7 @@  # define MCOUNT_ADDR		((unsigned long)(__fentry__))  #else  # define MCOUNT_ADDR		((unsigned long)(mcount)) +# define HAVE_FUNCTION_GRAPH_FP_TEST  #endif  #define MCOUNT_INSN_SIZE	5 /* sizeof mcount call */ @@ -13,6 +14,8 @@  #define ARCH_SUPPORTS_FTRACE_OPS 1  #endif +#define HAVE_FUNCTION_GRAPH_RET_ADDR_PTR +  #ifndef __ASSEMBLY__  extern void mcount(void);  extern atomic_t modifying_ftrace_code; diff --git a/arch/x86/include/asm/hypervisor.h b/arch/x86/include/asm/hypervisor.h index 055ea9941dd5..67942b6ad4b7 100644 --- a/arch/x86/include/asm/hypervisor.h +++ b/arch/x86/include/asm/hypervisor.h @@ -43,6 +43,9 @@ struct hypervisor_x86 {  	/* X2APIC detection (run once per boot) */  	bool		(*x2apic_available)(void); + +	/* pin current vcpu to specified physical cpu (run rarely) */ +	void		(*pin_vcpu)(int);  };  extern const struct hypervisor_x86 *x86_hyper; @@ -56,6 +59,7 @@ extern const struct hypervisor_x86 x86_hyper_kvm;  extern void init_hypervisor(struct cpuinfo_x86 *c);  extern void init_hypervisor_platform(void);  extern bool hypervisor_x2apic_available(void); +extern void hypervisor_pin_vcpu(int cpu);  #else  static inline void init_hypervisor(struct cpuinfo_x86 *c) { }  static inline void init_hypervisor_platform(void) { } diff --git a/arch/x86/include/asm/intel-family.h b/arch/x86/include/asm/intel-family.h index 627719475457..34a46dc076d3 100644 --- a/arch/x86/include/asm/intel-family.h +++ b/arch/x86/include/asm/intel-family.h @@ -56,13 +56,14 @@  #define INTEL_FAM6_ATOM_SILVERMONT1	0x37 /* BayTrail/BYT / Valleyview */  #define INTEL_FAM6_ATOM_SILVERMONT2	0x4D /* Avaton/Rangely */  #define INTEL_FAM6_ATOM_AIRMONT		0x4C /* CherryTrail / Braswell */ -#define INTEL_FAM6_ATOM_MERRIFIELD1	0x4A /* Tangier */ -#define INTEL_FAM6_ATOM_MERRIFIELD2	0x5A /* Annidale */ +#define INTEL_FAM6_ATOM_MERRIFIELD	0x4A /* Tangier */ +#define INTEL_FAM6_ATOM_MOOREFIELD	0x5A /* Annidale */  #define INTEL_FAM6_ATOM_GOLDMONT	0x5C  #define INTEL_FAM6_ATOM_DENVERTON	0x5F /* Goldmont Microserver */  /* Xeon Phi */  #define INTEL_FAM6_XEON_PHI_KNL		0x57 /* Knights Landing */ +#define INTEL_FAM6_XEON_PHI_KNM		0x85 /* Knights Mill */  #endif /* _ASM_X86_INTEL_FAMILY_H */ diff --git a/arch/x86/include/asm/intel-mid.h b/arch/x86/include/asm/intel-mid.h index 9d6b097aa73d..49da9f497b90 100644 --- a/arch/x86/include/asm/intel-mid.h +++ b/arch/x86/include/asm/intel-mid.h @@ -17,6 +17,9 @@  extern int intel_mid_pci_init(void);  extern int intel_mid_pci_set_power_state(struct pci_dev *pdev, pci_power_t state); +extern pci_power_t intel_mid_pci_get_power_state(struct pci_dev *pdev); + +extern void intel_mid_pwr_power_off(void);  #define INTEL_MID_PWR_LSS_OFFSET	4  #define INTEL_MID_PWR_LSS_TYPE		(1 << 7) diff --git a/arch/x86/include/asm/intel_scu_ipc.h b/arch/x86/include/asm/intel_scu_ipc.h index 925b605eb5c6..4fb1d0abef95 100644 --- a/arch/x86/include/asm/intel_scu_ipc.h +++ b/arch/x86/include/asm/intel_scu_ipc.h @@ -3,6 +3,8 @@  #include <linux/notifier.h> +#define IPCMSG_COLD_OFF		0x80	/* Only for Tangier */ +  #define IPCMSG_WARM_RESET	0xF0  #define IPCMSG_COLD_RESET	0xF1  #define IPCMSG_SOFT_RESET	0xF2 diff --git a/arch/x86/include/asm/io.h b/arch/x86/include/asm/io.h index de25aad07853..d34bd370074b 100644 --- a/arch/x86/include/asm/io.h +++ b/arch/x86/include/asm/io.h @@ -351,4 +351,10 @@ extern void arch_phys_wc_del(int handle);  #define arch_phys_wc_add arch_phys_wc_add  #endif +#ifdef CONFIG_X86_PAT +extern int arch_io_reserve_memtype_wc(resource_size_t start, resource_size_t size); +extern void arch_io_free_memtype_wc(resource_size_t start, resource_size_t size); +#define arch_io_reserve_memtype_wc arch_io_reserve_memtype_wc +#endif +  #endif /* _ASM_X86_IO_H */ diff --git a/arch/x86/include/asm/irq.h b/arch/x86/include/asm/irq.h index e7de5c9a4fbd..16d3fa211962 100644 --- a/arch/x86/include/asm/irq.h +++ b/arch/x86/include/asm/irq.h @@ -50,8 +50,9 @@ extern int vector_used_by_percpu_irq(unsigned int vector);  extern void init_ISA_irqs(void);  #ifdef CONFIG_X86_LOCAL_APIC -void arch_trigger_all_cpu_backtrace(bool); -#define arch_trigger_all_cpu_backtrace arch_trigger_all_cpu_backtrace +void arch_trigger_cpumask_backtrace(const struct cpumask *mask, +				    bool exclude_self); +#define arch_trigger_cpumask_backtrace arch_trigger_cpumask_backtrace  #endif  #endif /* _ASM_X86_IRQ_H */ diff --git a/arch/x86/include/asm/irqflags.h b/arch/x86/include/asm/irqflags.h index b77f5edb03b0..ac7692dcfa2e 100644 --- a/arch/x86/include/asm/irqflags.h +++ b/arch/x86/include/asm/irqflags.h @@ -4,6 +4,10 @@  #include <asm/processor-flags.h>  #ifndef __ASSEMBLY__ + +/* Provide __cpuidle; we can't safely include <linux/cpu.h> */ +#define __cpuidle __attribute__((__section__(".cpuidle.text"))) +  /*   * Interrupt control:   */ @@ -44,12 +48,12 @@ static inline void native_irq_enable(void)  	asm volatile("sti": : :"memory");  } -static inline void native_safe_halt(void) +static inline __cpuidle void native_safe_halt(void)  {  	asm volatile("sti; hlt": : :"memory");  } -static inline void native_halt(void) +static inline __cpuidle void native_halt(void)  {  	asm volatile("hlt": : :"memory");  } @@ -86,7 +90,7 @@ static inline notrace void arch_local_irq_enable(void)   * Used in the idle loop; sti takes one instruction cycle   * to complete:   */ -static inline void arch_safe_halt(void) +static inline __cpuidle void arch_safe_halt(void)  {  	native_safe_halt();  } @@ -95,7 +99,7 @@ static inline void arch_safe_halt(void)   * Used when interrupts are already enabled or to   * shutdown the processor:   */ -static inline void halt(void) +static inline __cpuidle void halt(void)  {  	native_halt();  } diff --git a/arch/x86/include/asm/kaslr.h b/arch/x86/include/asm/kaslr.h index 2674ee3de748..1052a797d71d 100644 --- a/arch/x86/include/asm/kaslr.h +++ b/arch/x86/include/asm/kaslr.h @@ -6,6 +6,7 @@ unsigned long kaslr_get_random_long(const char *purpose);  #ifdef CONFIG_RANDOMIZE_MEMORY  extern unsigned long page_offset_base;  extern unsigned long vmalloc_base; +extern unsigned long vmemmap_base;  void kernel_randomize_memory(void);  #else diff --git a/arch/x86/include/asm/kdebug.h b/arch/x86/include/asm/kdebug.h index 1ef9d581b5d9..d31881188431 100644 --- a/arch/x86/include/asm/kdebug.h +++ b/arch/x86/include/asm/kdebug.h @@ -24,8 +24,6 @@ enum die_val {  extern void printk_address(unsigned long address);  extern void die(const char *, struct pt_regs *,long);  extern int __must_check __die(const char *, struct pt_regs *, long); -extern void show_trace(struct task_struct *t, struct pt_regs *regs, -		       unsigned long *sp, unsigned long bp);  extern void show_stack_regs(struct pt_regs *regs);  extern void __show_regs(struct pt_regs *regs, int all);  extern unsigned long oops_begin(void); diff --git a/arch/x86/include/asm/kexec.h b/arch/x86/include/asm/kexec.h index d2434c1cad05..282630e4c6ea 100644 --- a/arch/x86/include/asm/kexec.h +++ b/arch/x86/include/asm/kexec.h @@ -210,6 +210,7 @@ struct kexec_entry64_regs {  typedef void crash_vmclear_fn(void);  extern crash_vmclear_fn __rcu *crash_vmclear_loaded_vmcss; +extern void kdump_nmi_shootdown_cpus(void);  #endif /* __ASSEMBLY__ */ diff --git a/arch/x86/include/asm/kvm_host.h b/arch/x86/include/asm/kvm_host.h index 33ae3a4d0159..bdde80731f49 100644 --- a/arch/x86/include/asm/kvm_host.h +++ b/arch/x86/include/asm/kvm_host.h @@ -568,6 +568,7 @@ struct kvm_vcpu_arch {  		struct kvm_steal_time steal;  	} st; +	u64 tsc_offset;  	u64 last_guest_tsc;  	u64 last_host_tsc;  	u64 tsc_offset_adjustment; @@ -701,6 +702,8 @@ struct kvm_hv {  	/* Hyper-v based guest crash (NT kernel bugcheck) parameters */  	u64 hv_crash_param[HV_X64_MSR_CRASH_PARAMS];  	u64 hv_crash_ctl; + +	HV_REFERENCE_TSC_PAGE tsc_ref;  };  struct kvm_arch { @@ -781,54 +784,56 @@ struct kvm_arch {  	bool disabled_lapic_found;  	/* Struct members for AVIC */ +	u32 avic_vm_id;  	u32 ldr_mode;  	struct page *avic_logical_id_table_page;  	struct page *avic_physical_id_table_page; +	struct hlist_node hnode;  	bool x2apic_format;  	bool x2apic_broadcast_quirk_disabled;  };  struct kvm_vm_stat { -	u32 mmu_shadow_zapped; -	u32 mmu_pte_write; -	u32 mmu_pte_updated; -	u32 mmu_pde_zapped; -	u32 mmu_flooded; -	u32 mmu_recycled; -	u32 mmu_cache_miss; -	u32 mmu_unsync; -	u32 remote_tlb_flush; -	u32 lpages; +	ulong mmu_shadow_zapped; +	ulong mmu_pte_write; +	ulong mmu_pte_updated; +	ulong mmu_pde_zapped; +	ulong mmu_flooded; +	ulong mmu_recycled; +	ulong mmu_cache_miss; +	ulong mmu_unsync; +	ulong remote_tlb_flush; +	ulong lpages;  };  struct kvm_vcpu_stat { -	u32 pf_fixed; -	u32 pf_guest; -	u32 tlb_flush; -	u32 invlpg; - -	u32 exits; -	u32 io_exits; -	u32 mmio_exits; -	u32 signal_exits; -	u32 irq_window_exits; -	u32 nmi_window_exits; -	u32 halt_exits; -	u32 halt_successful_poll; -	u32 halt_attempted_poll; -	u32 halt_poll_invalid; -	u32 halt_wakeup; -	u32 request_irq_exits; -	u32 irq_exits; -	u32 host_state_reload; -	u32 efer_reload; -	u32 fpu_reload; -	u32 insn_emulation; -	u32 insn_emulation_fail; -	u32 hypercalls; -	u32 irq_injections; -	u32 nmi_injections; +	u64 pf_fixed; +	u64 pf_guest; +	u64 tlb_flush; +	u64 invlpg; + +	u64 exits; +	u64 io_exits; +	u64 mmio_exits; +	u64 signal_exits; +	u64 irq_window_exits; +	u64 nmi_window_exits; +	u64 halt_exits; +	u64 halt_successful_poll; +	u64 halt_attempted_poll; +	u64 halt_poll_invalid; +	u64 halt_wakeup; +	u64 request_irq_exits; +	u64 irq_exits; +	u64 host_state_reload; +	u64 efer_reload; +	u64 fpu_reload; +	u64 insn_emulation; +	u64 insn_emulation_fail; +	u64 hypercalls; +	u64 irq_injections; +	u64 nmi_injections;  };  struct x86_instruction_info; @@ -943,7 +948,6 @@ struct kvm_x86_ops {  	int (*get_lpage_level)(void);  	bool (*rdtscp_supported)(void);  	bool (*invpcid_supported)(void); -	void (*adjust_tsc_offset_guest)(struct kvm_vcpu *vcpu, s64 adjustment);  	void (*set_tdp_cr3)(struct kvm_vcpu *vcpu, unsigned long cr3); @@ -951,11 +955,8 @@ struct kvm_x86_ops {  	bool (*has_wbinvd_exit)(void); -	u64 (*read_tsc_offset)(struct kvm_vcpu *vcpu);  	void (*write_tsc_offset)(struct kvm_vcpu *vcpu, u64 offset); -	u64 (*read_l1_tsc)(struct kvm_vcpu *vcpu, u64 host_tsc); -  	void (*get_exit_info)(struct kvm_vcpu *vcpu, u64 *info1, u64 *info2);  	int (*check_intercept)(struct kvm_vcpu *vcpu, diff --git a/arch/x86/include/asm/mce.h b/arch/x86/include/asm/mce.h index 8bf766ef0e18..9bd7ff5ffbcc 100644 --- a/arch/x86/include/asm/mce.h +++ b/arch/x86/include/asm/mce.h @@ -40,9 +40,10 @@  #define MCI_STATUS_AR	 (1ULL<<55)  /* Action required */  /* AMD-specific bits */ +#define MCI_STATUS_TCC		(1ULL<<55)  /* Task context corrupt */ +#define MCI_STATUS_SYNDV	(1ULL<<53)  /* synd reg. valid */  #define MCI_STATUS_DEFERRED	(1ULL<<44)  /* uncorrected error, deferred exception */  #define MCI_STATUS_POISON	(1ULL<<43)  /* access poisonous data */ -#define MCI_STATUS_TCC		(1ULL<<55)  /* Task context corrupt */  /*   * McaX field if set indicates a given bank supports MCA extensions: @@ -110,6 +111,7 @@  #define MSR_AMD64_SMCA_MC0_MISC0	0xc0002003  #define MSR_AMD64_SMCA_MC0_CONFIG	0xc0002004  #define MSR_AMD64_SMCA_MC0_IPID		0xc0002005 +#define MSR_AMD64_SMCA_MC0_SYND		0xc0002006  #define MSR_AMD64_SMCA_MC0_DESTAT	0xc0002008  #define MSR_AMD64_SMCA_MC0_DEADDR	0xc0002009  #define MSR_AMD64_SMCA_MC0_MISC1	0xc000200a @@ -119,6 +121,7 @@  #define MSR_AMD64_SMCA_MCx_MISC(x)	(MSR_AMD64_SMCA_MC0_MISC0 + 0x10*(x))  #define MSR_AMD64_SMCA_MCx_CONFIG(x)	(MSR_AMD64_SMCA_MC0_CONFIG + 0x10*(x))  #define MSR_AMD64_SMCA_MCx_IPID(x)	(MSR_AMD64_SMCA_MC0_IPID + 0x10*(x)) +#define MSR_AMD64_SMCA_MCx_SYND(x)	(MSR_AMD64_SMCA_MC0_SYND + 0x10*(x))  #define MSR_AMD64_SMCA_MCx_DESTAT(x)	(MSR_AMD64_SMCA_MC0_DESTAT + 0x10*(x))  #define MSR_AMD64_SMCA_MCx_DEADDR(x)	(MSR_AMD64_SMCA_MC0_DEADDR + 0x10*(x))  #define MSR_AMD64_SMCA_MCx_MISCy(x, y)	((MSR_AMD64_SMCA_MC0_MISC1 + y) + (0x10*(x))) @@ -334,44 +337,47 @@ extern void apei_mce_report_mem_error(int corrected,   * Scalable MCA.   */  #ifdef CONFIG_X86_MCE_AMD -enum amd_ip_types { -	SMCA_F17H_CORE = 0,	/* Core errors */ -	SMCA_DF,		/* Data Fabric */ -	SMCA_UMC,		/* Unified Memory Controller */ -	SMCA_PB,		/* Parameter Block */ -	SMCA_PSP,		/* Platform Security Processor */ -	SMCA_SMU,		/* System Management Unit */ -	N_AMD_IP_TYPES -}; - -struct amd_hwid { -	const char *name; -	unsigned int hwid; -}; - -extern struct amd_hwid amd_hwids[N_AMD_IP_TYPES]; -enum amd_core_mca_blocks { +/* These may be used by multiple smca_hwid_mcatypes */ +enum smca_bank_types {  	SMCA_LS = 0,	/* Load Store */  	SMCA_IF,	/* Instruction Fetch */ -	SMCA_L2_CACHE,	/* L2 cache */ -	SMCA_DE,	/* Decoder unit */ -	RES,		/* Reserved */ -	SMCA_EX,	/* Execution unit */ +	SMCA_L2_CACHE,	/* L2 Cache */ +	SMCA_DE,	/* Decoder Unit */ +	SMCA_EX,	/* Execution Unit */  	SMCA_FP,	/* Floating Point */ -	SMCA_L3_CACHE,	/* L3 cache */ -	N_CORE_MCA_BLOCKS +	SMCA_L3_CACHE,	/* L3 Cache */ +	SMCA_CS,	/* Coherent Slave */ +	SMCA_PIE,	/* Power, Interrupts, etc. */ +	SMCA_UMC,	/* Unified Memory Controller */ +	SMCA_PB,	/* Parameter Block */ +	SMCA_PSP,	/* Platform Security Processor */ +	SMCA_SMU,	/* System Management Unit */ +	N_SMCA_BANK_TYPES  }; -extern const char * const amd_core_mcablock_names[N_CORE_MCA_BLOCKS]; +struct smca_bank_name { +	const char *name;	/* Short name for sysfs */ +	const char *long_name;	/* Long name for pretty-printing */ +}; + +extern struct smca_bank_name smca_bank_names[N_SMCA_BANK_TYPES]; + +#define HWID_MCATYPE(hwid, mcatype) ((hwid << 16) | mcatype) -enum amd_df_mca_blocks { -	SMCA_CS = 0,	/* Coherent Slave */ -	SMCA_PIE,	/* Power management, Interrupts, etc */ -	N_DF_BLOCKS +struct smca_hwid_mcatype { +	unsigned int bank_type;	/* Use with smca_bank_types for easy indexing. */ +	u32 hwid_mcatype;	/* (hwid,mcatype) tuple */ +	u32 xec_bitmap;		/* Bitmap of valid ExtErrorCodes; current max is 21. */  }; -extern const char * const amd_df_mcablock_names[N_DF_BLOCKS]; +struct smca_bank_info { +	struct smca_hwid_mcatype *type; +	u32 type_instance; +}; + +extern struct smca_bank_info smca_banks[MAX_NR_BANKS]; +  #endif  #endif /* _ASM_X86_MCE_H */ diff --git a/arch/x86/include/asm/mmu.h b/arch/x86/include/asm/mmu.h index 1ea0baef1175..72198c64e646 100644 --- a/arch/x86/include/asm/mmu.h +++ b/arch/x86/include/asm/mmu.h @@ -23,6 +23,14 @@ typedef struct {  	const struct vdso_image *vdso_image;	/* vdso image in use */  	atomic_t perf_rdpmc_allowed;	/* nonzero if rdpmc is allowed */ +#ifdef CONFIG_X86_INTEL_MEMORY_PROTECTION_KEYS +	/* +	 * One bit per protection key says whether userspace can +	 * use it or not.  protected by mmap_sem. +	 */ +	u16 pkey_allocation_map; +	s16 execute_only_pkey; +#endif  } mm_context_t;  #ifdef CONFIG_SMP diff --git a/arch/x86/include/asm/mmu_context.h b/arch/x86/include/asm/mmu_context.h index d8abfcf524d1..8e0a9fe86de4 100644 --- a/arch/x86/include/asm/mmu_context.h +++ b/arch/x86/include/asm/mmu_context.h @@ -4,6 +4,7 @@  #include <asm/desc.h>  #include <linux/atomic.h>  #include <linux/mm_types.h> +#include <linux/pkeys.h>  #include <trace/events/tlb.h> @@ -107,7 +108,16 @@ static inline void enter_lazy_tlb(struct mm_struct *mm, struct task_struct *tsk)  static inline int init_new_context(struct task_struct *tsk,  				   struct mm_struct *mm)  { +	#ifdef CONFIG_X86_INTEL_MEMORY_PROTECTION_KEYS +	if (cpu_feature_enabled(X86_FEATURE_OSPKE)) { +		/* pkey 0 is the default and always allocated */ +		mm->context.pkey_allocation_map = 0x1; +		/* -1 means unallocated or invalid */ +		mm->context.execute_only_pkey = -1; +	} +	#endif  	init_new_context_ldt(tsk, mm); +  	return 0;  }  static inline void destroy_context(struct mm_struct *mm) @@ -195,16 +205,20 @@ static inline void arch_unmap(struct mm_struct *mm, struct vm_area_struct *vma,  		mpx_notify_unmap(mm, vma, start, end);  } +#ifdef CONFIG_X86_INTEL_MEMORY_PROTECTION_KEYS  static inline int vma_pkey(struct vm_area_struct *vma)  { -	u16 pkey = 0; -#ifdef CONFIG_X86_INTEL_MEMORY_PROTECTION_KEYS  	unsigned long vma_pkey_mask = VM_PKEY_BIT0 | VM_PKEY_BIT1 |  				      VM_PKEY_BIT2 | VM_PKEY_BIT3; -	pkey = (vma->vm_flags & vma_pkey_mask) >> VM_PKEY_SHIFT; -#endif -	return pkey; + +	return (vma->vm_flags & vma_pkey_mask) >> VM_PKEY_SHIFT; +} +#else +static inline int vma_pkey(struct vm_area_struct *vma) +{ +	return 0;  } +#endif  static inline bool __pkru_allows_pkey(u16 pkey, bool write)  { @@ -258,5 +272,4 @@ static inline bool arch_pte_access_permitted(pte_t pte, bool write)  {  	return __pkru_allows_pkey(pte_flags_pkey(pte_flags(pte)), write);  } -  #endif /* _ASM_X86_MMU_CONTEXT_H */ diff --git a/arch/x86/include/asm/mpspec.h b/arch/x86/include/asm/mpspec.h index b07233b64578..32007041ef8c 100644 --- a/arch/x86/include/asm/mpspec.h +++ b/arch/x86/include/asm/mpspec.h @@ -6,7 +6,6 @@  #include <asm/x86_init.h>  #include <asm/apicdef.h> -extern int apic_version[];  extern int pic_mode;  #ifdef CONFIG_X86_32 @@ -40,6 +39,7 @@ extern int mp_bus_id_to_type[MAX_MP_BUSSES];  extern DECLARE_BITMAP(mp_bus_not_pci, MAX_MP_BUSSES);  extern unsigned int boot_cpu_physical_apicid; +extern u8 boot_cpu_apic_version;  extern unsigned long mp_lapic_addr;  #ifdef CONFIG_X86_LOCAL_APIC @@ -86,6 +86,7 @@ static inline void early_reserve_e820_mpc_new(void) { }  #endif  int generic_processor_info(int apicid, int version); +int __generic_processor_info(int apicid, int version, bool enabled);  #define PHYSID_ARRAY_SIZE	BITS_TO_LONGS(MAX_LOCAL_APIC) diff --git a/arch/x86/include/asm/msr-index.h b/arch/x86/include/asm/msr-index.h index 56f4c6676b29..78f3760ca1f2 100644 --- a/arch/x86/include/asm/msr-index.h +++ b/arch/x86/include/asm/msr-index.h @@ -88,7 +88,6 @@  #define MSR_IA32_RTIT_CTL		0x00000570  #define MSR_IA32_RTIT_STATUS		0x00000571 -#define MSR_IA32_RTIT_STATUS		0x00000571  #define MSR_IA32_RTIT_ADDR0_A		0x00000580  #define MSR_IA32_RTIT_ADDR0_B		0x00000581  #define MSR_IA32_RTIT_ADDR1_A		0x00000582 diff --git a/arch/x86/include/asm/paravirt.h b/arch/x86/include/asm/paravirt.h index 2970d22d7766..ce932812f142 100644 --- a/arch/x86/include/asm/paravirt.h +++ b/arch/x86/include/asm/paravirt.h @@ -80,10 +80,6 @@ static inline unsigned long __read_cr4(void)  {  	return PVOP_CALL0(unsigned long, pv_cpu_ops.read_cr4);  } -static inline unsigned long __read_cr4_safe(void) -{ -	return PVOP_CALL0(unsigned long, pv_cpu_ops.read_cr4_safe); -}  static inline void __write_cr4(unsigned long x)  { @@ -661,8 +657,6 @@ static inline void __set_fixmap(unsigned /* enum fixed_addresses */ idx,  #if defined(CONFIG_SMP) && defined(CONFIG_PARAVIRT_SPINLOCKS) -#ifdef CONFIG_QUEUED_SPINLOCKS -  static __always_inline void pv_queued_spin_lock_slowpath(struct qspinlock *lock,  							u32 val)  { @@ -684,22 +678,6 @@ static __always_inline void pv_kick(int cpu)  	PVOP_VCALL1(pv_lock_ops.kick, cpu);  } -#else /* !CONFIG_QUEUED_SPINLOCKS */ - -static __always_inline void __ticket_lock_spinning(struct arch_spinlock *lock, -							__ticket_t ticket) -{ -	PVOP_VCALLEE2(pv_lock_ops.lock_spinning, lock, ticket); -} - -static __always_inline void __ticket_unlock_kick(struct arch_spinlock *lock, -							__ticket_t ticket) -{ -	PVOP_VCALL2(pv_lock_ops.unlock_kick, lock, ticket); -} - -#endif /* CONFIG_QUEUED_SPINLOCKS */ -  #endif /* SMP && PARAVIRT_SPINLOCKS */  #ifdef CONFIG_X86_32 diff --git a/arch/x86/include/asm/paravirt_types.h b/arch/x86/include/asm/paravirt_types.h index 7fa9e7740ba3..0f400c0e4979 100644 --- a/arch/x86/include/asm/paravirt_types.h +++ b/arch/x86/include/asm/paravirt_types.h @@ -108,7 +108,6 @@ struct pv_cpu_ops {  	unsigned long (*read_cr0)(void);  	void (*write_cr0)(unsigned long); -	unsigned long (*read_cr4_safe)(void);  	unsigned long (*read_cr4)(void);  	void (*write_cr4)(unsigned long); @@ -301,23 +300,16 @@ struct pv_mmu_ops {  struct arch_spinlock;  #ifdef CONFIG_SMP  #include <asm/spinlock_types.h> -#else -typedef u16 __ticket_t;  #endif  struct qspinlock;  struct pv_lock_ops { -#ifdef CONFIG_QUEUED_SPINLOCKS  	void (*queued_spin_lock_slowpath)(struct qspinlock *lock, u32 val);  	struct paravirt_callee_save queued_spin_unlock;  	void (*wait)(u8 *ptr, u8 val);  	void (*kick)(int cpu); -#else /* !CONFIG_QUEUED_SPINLOCKS */ -	struct paravirt_callee_save lock_spinning; -	void (*unlock_kick)(struct arch_spinlock *lock, __ticket_t ticket); -#endif /* !CONFIG_QUEUED_SPINLOCKS */  };  /* This contains all the paravirt structures: we get a convenient diff --git a/arch/x86/include/asm/pci.h b/arch/x86/include/asm/pci.h index 9ab7507ca1c2..1411dbed5e5e 100644 --- a/arch/x86/include/asm/pci.h +++ b/arch/x86/include/asm/pci.h @@ -23,6 +23,9 @@ struct pci_sysdata {  #ifdef CONFIG_PCI_MSI_IRQ_DOMAIN  	void		*fwnode;	/* IRQ domain for MSI assignment */  #endif +#if IS_ENABLED(CONFIG_VMD) +	bool vmd_domain;		/* True if in Intel VMD domain */ +#endif  };  extern int pci_routeirq; @@ -56,6 +59,17 @@ static inline void *_pci_root_bus_fwnode(struct pci_bus *bus)  #define pci_root_bus_fwnode	_pci_root_bus_fwnode  #endif +static inline bool is_vmd(struct pci_bus *bus) +{ +#if IS_ENABLED(CONFIG_VMD) +	struct pci_sysdata *sd = bus->sysdata; + +	return sd->vmd_domain; +#else +	return false; +#endif +} +  /* Can be used to override the logic in pci_scan_bus for skipping     already-configured bus numbers - to be used for buggy BIOSes     or architectures with incomplete PCI setup by the loader */ diff --git a/arch/x86/include/asm/percpu.h b/arch/x86/include/asm/percpu.h index e02e3f80d363..84f58de08c2b 100644 --- a/arch/x86/include/asm/percpu.h +++ b/arch/x86/include/asm/percpu.h @@ -521,7 +521,8 @@ do {									\  static __always_inline bool x86_this_cpu_constant_test_bit(unsigned int nr,                          const unsigned long __percpu *addr)  { -	unsigned long __percpu *a = (unsigned long *)addr + nr / BITS_PER_LONG; +	unsigned long __percpu *a = +		(unsigned long __percpu *)addr + nr / BITS_PER_LONG;  #ifdef CONFIG_X86_64  	return ((1UL << (nr % BITS_PER_LONG)) & raw_cpu_read_8(*a)) != 0; @@ -538,7 +539,7 @@ static inline bool x86_this_cpu_variable_test_bit(int nr,  	asm volatile("bt "__percpu_arg(2)",%1\n\t"  			CC_SET(c)  			: CC_OUT(c) (oldbit) -			: "m" (*(unsigned long *)addr), "Ir" (nr)); +			: "m" (*(unsigned long __percpu *)addr), "Ir" (nr));  	return oldbit;  } diff --git a/arch/x86/include/asm/pgtable_64_types.h b/arch/x86/include/asm/pgtable_64_types.h index 6fdef9eef2d5..3a264200c62f 100644 --- a/arch/x86/include/asm/pgtable_64_types.h +++ b/arch/x86/include/asm/pgtable_64_types.h @@ -57,11 +57,13 @@ typedef struct { pteval_t pte; } pte_t;  #define MAXMEM		_AC(__AC(1, UL) << MAX_PHYSMEM_BITS, UL)  #define VMALLOC_SIZE_TB	_AC(32, UL)  #define __VMALLOC_BASE	_AC(0xffffc90000000000, UL) -#define VMEMMAP_START	_AC(0xffffea0000000000, UL) +#define __VMEMMAP_BASE	_AC(0xffffea0000000000, UL)  #ifdef CONFIG_RANDOMIZE_MEMORY  #define VMALLOC_START	vmalloc_base +#define VMEMMAP_START	vmemmap_base  #else  #define VMALLOC_START	__VMALLOC_BASE +#define VMEMMAP_START	__VMEMMAP_BASE  #endif /* CONFIG_RANDOMIZE_MEMORY */  #define VMALLOC_END	(VMALLOC_START + _AC((VMALLOC_SIZE_TB << 40) - 1, UL))  #define MODULES_VADDR    (__START_KERNEL_map + KERNEL_IMAGE_SIZE) diff --git a/arch/x86/include/asm/pgtable_types.h b/arch/x86/include/asm/pgtable_types.h index f1218f512f62..8b4de22d6429 100644 --- a/arch/x86/include/asm/pgtable_types.h +++ b/arch/x86/include/asm/pgtable_types.h @@ -439,8 +439,6 @@ extern pgprot_t pgprot_writethrough(pgprot_t prot);  struct file;  pgprot_t phys_mem_access_prot(struct file *file, unsigned long pfn,                                unsigned long size, pgprot_t vma_prot); -int phys_mem_access_prot_allowed(struct file *file, unsigned long pfn, -                              unsigned long size, pgprot_t *vma_prot);  /* Install a pte for a particular vaddr in kernel space. */  void set_pte_vaddr(unsigned long vaddr, pte_t pte); diff --git a/arch/x86/include/asm/pkeys.h b/arch/x86/include/asm/pkeys.h index 7b84565c916c..34684adb6899 100644 --- a/arch/x86/include/asm/pkeys.h +++ b/arch/x86/include/asm/pkeys.h @@ -10,7 +10,6 @@ extern int arch_set_user_pkey_access(struct task_struct *tsk, int pkey,   * Try to dedicate one of the protection keys to be used as an   * execute-only protection key.   */ -#define PKEY_DEDICATED_EXECUTE_ONLY 15  extern int __execute_only_pkey(struct mm_struct *mm);  static inline int execute_only_pkey(struct mm_struct *mm)  { @@ -31,4 +30,76 @@ static inline int arch_override_mprotect_pkey(struct vm_area_struct *vma,  	return __arch_override_mprotect_pkey(vma, prot, pkey);  } +extern int __arch_set_user_pkey_access(struct task_struct *tsk, int pkey, +		unsigned long init_val); + +#define ARCH_VM_PKEY_FLAGS (VM_PKEY_BIT0 | VM_PKEY_BIT1 | VM_PKEY_BIT2 | VM_PKEY_BIT3) + +#define mm_pkey_allocation_map(mm)	(mm->context.pkey_allocation_map) +#define mm_set_pkey_allocated(mm, pkey) do {		\ +	mm_pkey_allocation_map(mm) |= (1U << pkey);	\ +} while (0) +#define mm_set_pkey_free(mm, pkey) do {			\ +	mm_pkey_allocation_map(mm) &= ~(1U << pkey);	\ +} while (0) + +static inline +bool mm_pkey_is_allocated(struct mm_struct *mm, int pkey) +{ +	return mm_pkey_allocation_map(mm) & (1U << pkey); +} + +/* + * Returns a positive, 4-bit key on success, or -1 on failure. + */ +static inline +int mm_pkey_alloc(struct mm_struct *mm) +{ +	/* +	 * Note: this is the one and only place we make sure +	 * that the pkey is valid as far as the hardware is +	 * concerned.  The rest of the kernel trusts that +	 * only good, valid pkeys come out of here. +	 */ +	u16 all_pkeys_mask = ((1U << arch_max_pkey()) - 1); +	int ret; + +	/* +	 * Are we out of pkeys?  We must handle this specially +	 * because ffz() behavior is undefined if there are no +	 * zeros. +	 */ +	if (mm_pkey_allocation_map(mm) == all_pkeys_mask) +		return -1; + +	ret = ffz(mm_pkey_allocation_map(mm)); + +	mm_set_pkey_allocated(mm, ret); + +	return ret; +} + +static inline +int mm_pkey_free(struct mm_struct *mm, int pkey) +{ +	/* +	 * pkey 0 is special, always allocated and can never +	 * be freed. +	 */ +	if (!pkey) +		return -EINVAL; +	if (!mm_pkey_is_allocated(mm, pkey)) +		return -EINVAL; + +	mm_set_pkey_free(mm, pkey); + +	return 0; +} + +extern int arch_set_user_pkey_access(struct task_struct *tsk, int pkey, +		unsigned long init_val); +extern int __arch_set_user_pkey_access(struct task_struct *tsk, int pkey, +		unsigned long init_val); +extern void copy_init_pkru_to_fpregs(void); +  #endif /*_ASM_X86_PKEYS_H */ diff --git a/arch/x86/include/asm/pmem.h b/arch/x86/include/asm/pmem.h index 643eba42d620..2c1ebeb4d737 100644 --- a/arch/x86/include/asm/pmem.h +++ b/arch/x86/include/asm/pmem.h @@ -46,10 +46,7 @@ static inline void arch_memcpy_to_pmem(void *dst, const void *src, size_t n)  static inline int arch_memcpy_from_pmem(void *dst, const void *src, size_t n)  { -	if (static_cpu_has(X86_FEATURE_MCE_RECOVERY)) -		return memcpy_mcsafe(dst, src, n); -	memcpy(dst, src, n); -	return 0; +	return memcpy_mcsafe(dst, src, n);  }  /** diff --git a/arch/x86/include/asm/processor.h b/arch/x86/include/asm/processor.h index 63def9537a2d..984a7bf17f6a 100644 --- a/arch/x86/include/asm/processor.h +++ b/arch/x86/include/asm/processor.h @@ -389,9 +389,9 @@ struct thread_struct {  	unsigned short		fsindex;  	unsigned short		gsindex;  #endif -#ifdef CONFIG_X86_32 -	unsigned long		ip; -#endif + +	u32			status;		/* thread synchronous flags */ +  #ifdef CONFIG_X86_64  	unsigned long		fsbase;  	unsigned long		gsbase; @@ -438,6 +438,15 @@ struct thread_struct {  };  /* + * Thread-synchronous status. + * + * This is different from the flags in that nobody else + * ever touches our thread-synchronous status, so we don't + * have to worry about atomic accesses. + */ +#define TS_COMPAT		0x0002	/* 32bit syscall active (64BIT)*/ + +/*   * Set IOPL bits in EFLAGS from given mask   */  static inline void native_set_iopl_mask(unsigned mask) @@ -724,8 +733,6 @@ static inline void spin_lock_prefetch(const void *x)  	.addr_limit		= KERNEL_DS,				  \  } -extern unsigned long thread_saved_pc(struct task_struct *tsk); -  /*   * TOP_OF_KERNEL_STACK_PADDING reserves 8 bytes on top of the ring0 stack.   * This is necessary to guarantee that the entire "struct pt_regs" @@ -776,17 +783,13 @@ extern unsigned long thread_saved_pc(struct task_struct *tsk);  	.addr_limit		= KERNEL_DS,			\  } -/* - * Return saved PC of a blocked thread. - * What is this good for? it will be always the scheduler or ret_from_fork. - */ -#define thread_saved_pc(t)	READ_ONCE_NOCHECK(*(unsigned long *)((t)->thread.sp - 8)) -  #define task_pt_regs(tsk)	((struct pt_regs *)(tsk)->thread.sp0 - 1)  extern unsigned long KSTK_ESP(struct task_struct *task);  #endif /* CONFIG_X86_64 */ +extern unsigned long thread_saved_pc(struct task_struct *tsk); +  extern void start_thread(struct pt_regs *regs, unsigned long new_ip,  					       unsigned long new_sp); diff --git a/arch/x86/include/asm/pvclock.h b/arch/x86/include/asm/pvclock.h index d019f0cc80ec..3ad741b84072 100644 --- a/arch/x86/include/asm/pvclock.h +++ b/arch/x86/include/asm/pvclock.h @@ -87,9 +87,10 @@ static inline u64 pvclock_scale_delta(u64 delta, u32 mul_frac, int shift)  }  static __always_inline -cycle_t __pvclock_read_cycles(const struct pvclock_vcpu_time_info *src) +cycle_t __pvclock_read_cycles(const struct pvclock_vcpu_time_info *src, +			      u64 tsc)  { -	u64 delta = rdtsc_ordered() - src->tsc_timestamp; +	u64 delta = tsc - src->tsc_timestamp;  	cycle_t offset = pvclock_scale_delta(delta, src->tsc_to_system_mul,  					     src->tsc_shift);  	return src->system_time + offset; diff --git a/arch/x86/include/asm/realmode.h b/arch/x86/include/asm/realmode.h index b2988c0ed829..230e1903acf0 100644 --- a/arch/x86/include/asm/realmode.h +++ b/arch/x86/include/asm/realmode.h @@ -44,9 +44,9 @@ struct trampoline_header {  extern struct real_mode_header *real_mode_header;  extern unsigned char real_mode_blob_end[]; -extern unsigned long init_rsp;  extern unsigned long initial_code;  extern unsigned long initial_gs; +extern unsigned long initial_stack;  extern unsigned char real_mode_blob[];  extern unsigned char real_mode_relocs[]; diff --git a/arch/x86/include/asm/rwsem.h b/arch/x86/include/asm/rwsem.h index 8dbc762ad132..a34e0d4b957d 100644 --- a/arch/x86/include/asm/rwsem.h +++ b/arch/x86/include/asm/rwsem.h @@ -103,8 +103,10 @@ static inline bool __down_read_trylock(struct rw_semaphore *sem)  ({							\  	long tmp;					\  	struct rw_semaphore* ret;			\ +	register void *__sp asm(_ASM_SP);		\ +							\  	asm volatile("# beginning down_write\n\t"	\ -		     LOCK_PREFIX "  xadd      %1,(%3)\n\t"	\ +		     LOCK_PREFIX "  xadd      %1,(%4)\n\t"	\  		     /* adds 0xffff0001, returns the old value */ \  		     "  test " __ASM_SEL(%w1,%k1) "," __ASM_SEL(%w1,%k1) "\n\t" \  		     /* was the active mask 0 before? */\ @@ -112,7 +114,7 @@ static inline bool __down_read_trylock(struct rw_semaphore *sem)  		     "  call " slow_path "\n"		\  		     "1:\n"				\  		     "# ending down_write"		\ -		     : "+m" (sem->count), "=d" (tmp), "=a" (ret)	\ +		     : "+m" (sem->count), "=d" (tmp), "=a" (ret), "+r" (__sp) \  		     : "a" (sem), "1" (RWSEM_ACTIVE_WRITE_BIAS) \  		     : "memory", "cc");			\  	ret;						\ @@ -154,7 +156,7 @@ static inline bool __down_write_trylock(struct rw_semaphore *sem)  		     : "+m" (sem->count), "=&a" (tmp0), "=&r" (tmp1),  		       CC_OUT(e) (result)  		     : "er" (RWSEM_ACTIVE_WRITE_BIAS) -		     : "memory", "cc"); +		     : "memory");  	return result;  } diff --git a/arch/x86/include/asm/sections.h b/arch/x86/include/asm/sections.h index 13b6cdd0af57..2f75f30cb2f6 100644 --- a/arch/x86/include/asm/sections.h +++ b/arch/x86/include/asm/sections.h @@ -2,7 +2,7 @@  #define _ASM_X86_SECTIONS_H  #include <asm-generic/sections.h> -#include <asm/uaccess.h> +#include <asm/extable.h>  extern char __brk_base[], __brk_limit[];  extern struct exception_table_entry __stop___ex_table[]; diff --git a/arch/x86/include/asm/signal.h b/arch/x86/include/asm/signal.h index dd1e7d6387ab..8af22be0fe61 100644 --- a/arch/x86/include/asm/signal.h +++ b/arch/x86/include/asm/signal.h @@ -23,6 +23,10 @@ typedef struct {  	unsigned long sig[_NSIG_WORDS];  } sigset_t; +/* non-uapi in-kernel SA_FLAGS for those indicates ABI for a signal frame */ +#define SA_IA32_ABI	0x02000000u +#define SA_X32_ABI	0x01000000u +  #ifndef CONFIG_COMPAT  typedef sigset_t compat_sigset_t;  #endif diff --git a/arch/x86/include/asm/smp.h b/arch/x86/include/asm/smp.h index ebd0c164cd4e..026ea82ecc60 100644 --- a/arch/x86/include/asm/smp.h +++ b/arch/x86/include/asm/smp.h @@ -39,9 +39,6 @@ DECLARE_EARLY_PER_CPU_READ_MOSTLY(u16, x86_bios_cpu_apicid);  DECLARE_EARLY_PER_CPU_READ_MOSTLY(int, x86_cpu_to_logical_apicid);  #endif -/* Static state in head.S used to set up a CPU */ -extern unsigned long stack_start; /* Initial stack pointer address */ -  struct task_struct;  struct smp_ops { @@ -50,6 +47,7 @@ struct smp_ops {  	void (*smp_cpus_done)(unsigned max_cpus);  	void (*stop_other_cpus)(int wait); +	void (*crash_stop_other_cpus)(void);  	void (*smp_send_reschedule)(int cpu);  	int (*cpu_up)(unsigned cpu, struct task_struct *tidle); diff --git a/arch/x86/include/asm/special_insns.h b/arch/x86/include/asm/special_insns.h index 587d7914ea4b..19a2224f9e16 100644 --- a/arch/x86/include/asm/special_insns.h +++ b/arch/x86/include/asm/special_insns.h @@ -59,22 +59,19 @@ static inline void native_write_cr3(unsigned long val)  static inline unsigned long native_read_cr4(void)  {  	unsigned long val; -	asm volatile("mov %%cr4,%0\n\t" : "=r" (val), "=m" (__force_order)); -	return val; -} - -static inline unsigned long native_read_cr4_safe(void) -{ -	unsigned long val; -	/* This could fault if %cr4 does not exist. In x86_64, a cr4 always -	 * exists, so it will never fail. */  #ifdef CONFIG_X86_32 +	/* +	 * This could fault if CR4 does not exist.  Non-existent CR4 +	 * is functionally equivalent to CR4 == 0.  Keep it simple and pretend +	 * that CR4 == 0 on CPUs that don't have CR4. +	 */  	asm volatile("1: mov %%cr4, %0\n"  		     "2:\n"  		     _ASM_EXTABLE(1b, 2b)  		     : "=r" (val), "=m" (__force_order) : "0" (0));  #else -	val = native_read_cr4(); +	/* CR4 always exists on x86_64. */ +	asm volatile("mov %%cr4,%0\n\t" : "=r" (val), "=m" (__force_order));  #endif  	return val;  } @@ -182,11 +179,6 @@ static inline unsigned long __read_cr4(void)  	return native_read_cr4();  } -static inline unsigned long __read_cr4_safe(void) -{ -	return native_read_cr4_safe(); -} -  static inline void __write_cr4(unsigned long x)  {  	native_write_cr4(x); diff --git a/arch/x86/include/asm/spinlock.h b/arch/x86/include/asm/spinlock.h index be0a05913b91..921bea7a2708 100644 --- a/arch/x86/include/asm/spinlock.h +++ b/arch/x86/include/asm/spinlock.h @@ -20,187 +20,13 @@   * (the type definitions are in asm/spinlock_types.h)   */ -#ifdef CONFIG_X86_32 -# define LOCK_PTR_REG "a" -#else -# define LOCK_PTR_REG "D" -#endif - -#if defined(CONFIG_X86_32) && (defined(CONFIG_X86_PPRO_FENCE)) -/* - * On PPro SMP, we use a locked operation to unlock - * (PPro errata 66, 92) - */ -# define UNLOCK_LOCK_PREFIX LOCK_PREFIX -#else -# define UNLOCK_LOCK_PREFIX -#endif -  /* How long a lock should spin before we consider blocking */  #define SPIN_THRESHOLD	(1 << 15)  extern struct static_key paravirt_ticketlocks_enabled;  static __always_inline bool static_key_false(struct static_key *key); -#ifdef CONFIG_QUEUED_SPINLOCKS  #include <asm/qspinlock.h> -#else - -#ifdef CONFIG_PARAVIRT_SPINLOCKS - -static inline void __ticket_enter_slowpath(arch_spinlock_t *lock) -{ -	set_bit(0, (volatile unsigned long *)&lock->tickets.head); -} - -#else  /* !CONFIG_PARAVIRT_SPINLOCKS */ -static __always_inline void __ticket_lock_spinning(arch_spinlock_t *lock, -							__ticket_t ticket) -{ -} -static inline void __ticket_unlock_kick(arch_spinlock_t *lock, -							__ticket_t ticket) -{ -} - -#endif /* CONFIG_PARAVIRT_SPINLOCKS */ -static inline int  __tickets_equal(__ticket_t one, __ticket_t two) -{ -	return !((one ^ two) & ~TICKET_SLOWPATH_FLAG); -} - -static inline void __ticket_check_and_clear_slowpath(arch_spinlock_t *lock, -							__ticket_t head) -{ -	if (head & TICKET_SLOWPATH_FLAG) { -		arch_spinlock_t old, new; - -		old.tickets.head = head; -		new.tickets.head = head & ~TICKET_SLOWPATH_FLAG; -		old.tickets.tail = new.tickets.head + TICKET_LOCK_INC; -		new.tickets.tail = old.tickets.tail; - -		/* try to clear slowpath flag when there are no contenders */ -		cmpxchg(&lock->head_tail, old.head_tail, new.head_tail); -	} -} - -static __always_inline int arch_spin_value_unlocked(arch_spinlock_t lock) -{ -	return __tickets_equal(lock.tickets.head, lock.tickets.tail); -} - -/* - * Ticket locks are conceptually two parts, one indicating the current head of - * the queue, and the other indicating the current tail. The lock is acquired - * by atomically noting the tail and incrementing it by one (thus adding - * ourself to the queue and noting our position), then waiting until the head - * becomes equal to the the initial value of the tail. - * - * We use an xadd covering *both* parts of the lock, to increment the tail and - * also load the position of the head, which takes care of memory ordering - * issues and should be optimal for the uncontended case. Note the tail must be - * in the high part, because a wide xadd increment of the low part would carry - * up and contaminate the high part. - */ -static __always_inline void arch_spin_lock(arch_spinlock_t *lock) -{ -	register struct __raw_tickets inc = { .tail = TICKET_LOCK_INC }; - -	inc = xadd(&lock->tickets, inc); -	if (likely(inc.head == inc.tail)) -		goto out; - -	for (;;) { -		unsigned count = SPIN_THRESHOLD; - -		do { -			inc.head = READ_ONCE(lock->tickets.head); -			if (__tickets_equal(inc.head, inc.tail)) -				goto clear_slowpath; -			cpu_relax(); -		} while (--count); -		__ticket_lock_spinning(lock, inc.tail); -	} -clear_slowpath: -	__ticket_check_and_clear_slowpath(lock, inc.head); -out: -	barrier();	/* make sure nothing creeps before the lock is taken */ -} - -static __always_inline int arch_spin_trylock(arch_spinlock_t *lock) -{ -	arch_spinlock_t old, new; - -	old.tickets = READ_ONCE(lock->tickets); -	if (!__tickets_equal(old.tickets.head, old.tickets.tail)) -		return 0; - -	new.head_tail = old.head_tail + (TICKET_LOCK_INC << TICKET_SHIFT); -	new.head_tail &= ~TICKET_SLOWPATH_FLAG; - -	/* cmpxchg is a full barrier, so nothing can move before it */ -	return cmpxchg(&lock->head_tail, old.head_tail, new.head_tail) == old.head_tail; -} - -static __always_inline void arch_spin_unlock(arch_spinlock_t *lock) -{ -	if (TICKET_SLOWPATH_FLAG && -		static_key_false(¶virt_ticketlocks_enabled)) { -		__ticket_t head; - -		BUILD_BUG_ON(((__ticket_t)NR_CPUS) != NR_CPUS); - -		head = xadd(&lock->tickets.head, TICKET_LOCK_INC); - -		if (unlikely(head & TICKET_SLOWPATH_FLAG)) { -			head &= ~TICKET_SLOWPATH_FLAG; -			__ticket_unlock_kick(lock, (head + TICKET_LOCK_INC)); -		} -	} else -		__add(&lock->tickets.head, TICKET_LOCK_INC, UNLOCK_LOCK_PREFIX); -} - -static inline int arch_spin_is_locked(arch_spinlock_t *lock) -{ -	struct __raw_tickets tmp = READ_ONCE(lock->tickets); - -	return !__tickets_equal(tmp.tail, tmp.head); -} - -static inline int arch_spin_is_contended(arch_spinlock_t *lock) -{ -	struct __raw_tickets tmp = READ_ONCE(lock->tickets); - -	tmp.head &= ~TICKET_SLOWPATH_FLAG; -	return (__ticket_t)(tmp.tail - tmp.head) > TICKET_LOCK_INC; -} -#define arch_spin_is_contended	arch_spin_is_contended - -static __always_inline void arch_spin_lock_flags(arch_spinlock_t *lock, -						  unsigned long flags) -{ -	arch_spin_lock(lock); -} - -static inline void arch_spin_unlock_wait(arch_spinlock_t *lock) -{ -	__ticket_t head = READ_ONCE(lock->tickets.head); - -	for (;;) { -		struct __raw_tickets tmp = READ_ONCE(lock->tickets); -		/* -		 * We need to check "unlocked" in a loop, tmp.head == head -		 * can be false positive because of overflow. -		 */ -		if (__tickets_equal(tmp.head, tmp.tail) || -				!__tickets_equal(tmp.head, head)) -			break; - -		cpu_relax(); -	} -} -#endif /* CONFIG_QUEUED_SPINLOCKS */  /*   * Read-write spinlocks, allowing multiple readers diff --git a/arch/x86/include/asm/spinlock_types.h b/arch/x86/include/asm/spinlock_types.h index 65c3e37f879a..25311ebb446c 100644 --- a/arch/x86/include/asm/spinlock_types.h +++ b/arch/x86/include/asm/spinlock_types.h @@ -23,20 +23,7 @@ typedef u32 __ticketpair_t;  #define TICKET_SHIFT	(sizeof(__ticket_t) * 8) -#ifdef CONFIG_QUEUED_SPINLOCKS  #include <asm-generic/qspinlock_types.h> -#else -typedef struct arch_spinlock { -	union { -		__ticketpair_t head_tail; -		struct __raw_tickets { -			__ticket_t head, tail; -		} tickets; -	}; -} arch_spinlock_t; - -#define __ARCH_SPIN_LOCK_UNLOCKED	{ { 0 } } -#endif /* CONFIG_QUEUED_SPINLOCKS */  #include <asm-generic/qrwlock_types.h> diff --git a/arch/x86/include/asm/stacktrace.h b/arch/x86/include/asm/stacktrace.h index 0944218af9e2..37f2e0b377ad 100644 --- a/arch/x86/include/asm/stacktrace.h +++ b/arch/x86/include/asm/stacktrace.h @@ -8,86 +8,86 @@  #include <linux/uaccess.h>  #include <linux/ptrace.h> +#include <asm/switch_to.h> + +enum stack_type { +	STACK_TYPE_UNKNOWN, +	STACK_TYPE_TASK, +	STACK_TYPE_IRQ, +	STACK_TYPE_SOFTIRQ, +	STACK_TYPE_EXCEPTION, +	STACK_TYPE_EXCEPTION_LAST = STACK_TYPE_EXCEPTION + N_EXCEPTION_STACKS-1, +}; -extern int kstack_depth_to_print; - -struct thread_info; -struct stacktrace_ops; - -typedef unsigned long (*walk_stack_t)(struct task_struct *task, -				      unsigned long *stack, -				      unsigned long bp, -				      const struct stacktrace_ops *ops, -				      void *data, -				      unsigned long *end, -				      int *graph); - -extern unsigned long -print_context_stack(struct task_struct *task, -		    unsigned long *stack, unsigned long bp, -		    const struct stacktrace_ops *ops, void *data, -		    unsigned long *end, int *graph); - -extern unsigned long -print_context_stack_bp(struct task_struct *task, -		       unsigned long *stack, unsigned long bp, -		       const struct stacktrace_ops *ops, void *data, -		       unsigned long *end, int *graph); - -/* Generic stack tracer with callbacks */ - -struct stacktrace_ops { -	int (*address)(void *data, unsigned long address, int reliable); -	/* On negative return stop dumping */ -	int (*stack)(void *data, char *name); -	walk_stack_t	walk_stack; +struct stack_info { +	enum stack_type type; +	unsigned long *begin, *end, *next_sp;  }; -void dump_trace(struct task_struct *tsk, struct pt_regs *regs, -		unsigned long *stack, unsigned long bp, -		const struct stacktrace_ops *ops, void *data); +bool in_task_stack(unsigned long *stack, struct task_struct *task, +		   struct stack_info *info); + +int get_stack_info(unsigned long *stack, struct task_struct *task, +		   struct stack_info *info, unsigned long *visit_mask); + +void stack_type_str(enum stack_type type, const char **begin, +		    const char **end); + +static inline bool on_stack(struct stack_info *info, void *addr, size_t len) +{ +	void *begin = info->begin; +	void *end   = info->end; + +	return (info->type != STACK_TYPE_UNKNOWN && +		addr >= begin && addr < end && +		addr + len > begin && addr + len <= end); +} + +extern int kstack_depth_to_print;  #ifdef CONFIG_X86_32  #define STACKSLOTS_PER_LINE 8 -#define get_bp(bp) asm("movl %%ebp, %0" : "=r" (bp) :)  #else  #define STACKSLOTS_PER_LINE 4 -#define get_bp(bp) asm("movq %%rbp, %0" : "=r" (bp) :)  #endif  #ifdef CONFIG_FRAME_POINTER -static inline unsigned long -stack_frame(struct task_struct *task, struct pt_regs *regs) +static inline unsigned long * +get_frame_pointer(struct task_struct *task, struct pt_regs *regs)  { -	unsigned long bp; -  	if (regs) -		return regs->bp; +		return (unsigned long *)regs->bp; -	if (task == current) { -		/* Grab bp right from our regs */ -		get_bp(bp); -		return bp; -	} +	if (task == current) +		return __builtin_frame_address(0); -	/* bp is the last reg pushed by switch_to */ -	return *(unsigned long *)task->thread.sp; +	return (unsigned long *)((struct inactive_task_frame *)task->thread.sp)->bp;  }  #else -static inline unsigned long -stack_frame(struct task_struct *task, struct pt_regs *regs) +static inline unsigned long * +get_frame_pointer(struct task_struct *task, struct pt_regs *regs)  { -	return 0; +	return NULL; +} +#endif /* CONFIG_FRAME_POINTER */ + +static inline unsigned long * +get_stack_pointer(struct task_struct *task, struct pt_regs *regs) +{ +	if (regs) +		return (unsigned long *)kernel_stack_pointer(regs); + +	if (task == current) +		return __builtin_frame_address(0); + +	return (unsigned long *)task->thread.sp;  } -#endif -extern void -show_trace_log_lvl(struct task_struct *task, struct pt_regs *regs, -		   unsigned long *stack, unsigned long bp, char *log_lvl); +void show_trace_log_lvl(struct task_struct *task, struct pt_regs *regs, +			unsigned long *stack, char *log_lvl); -extern void -show_stack_log_lvl(struct task_struct *task, struct pt_regs *regs, -		   unsigned long *sp, unsigned long bp, char *log_lvl); +void show_stack_log_lvl(struct task_struct *task, struct pt_regs *regs, +			unsigned long *sp, char *log_lvl);  extern unsigned int code_bytes; @@ -106,7 +106,7 @@ static inline unsigned long caller_frame_pointer(void)  {  	struct stack_frame *frame; -	get_bp(frame); +	frame = __builtin_frame_address(0);  #ifdef CONFIG_FRAME_POINTER  	frame = frame->next_frame; diff --git a/arch/x86/include/asm/string_64.h b/arch/x86/include/asm/string_64.h index 90dbbd9666d4..a164862d77e3 100644 --- a/arch/x86/include/asm/string_64.h +++ b/arch/x86/include/asm/string_64.h @@ -2,6 +2,7 @@  #define _ASM_X86_STRING_64_H  #ifdef __KERNEL__ +#include <linux/jump_label.h>  /* Written 2002 by Andi Kleen */ @@ -78,6 +79,9 @@ int strcmp(const char *cs, const char *ct);  #define memset(s, c, n) __memset(s, c, n)  #endif +__must_check int memcpy_mcsafe_unrolled(void *dst, const void *src, size_t cnt); +DECLARE_STATIC_KEY_FALSE(mcsafe_key); +  /**   * memcpy_mcsafe - copy memory with indication if a machine check happened   * @@ -86,10 +90,23 @@ int strcmp(const char *cs, const char *ct);   * @cnt:	number of bytes to copy   *   * Low level memory copy function that catches machine checks + * We only call into the "safe" function on systems that can + * actually do machine check recovery. Everyone else can just + * use memcpy().   *   * Return 0 for success, -EFAULT for fail   */ -int memcpy_mcsafe(void *dst, const void *src, size_t cnt); +static __always_inline __must_check int +memcpy_mcsafe(void *dst, const void *src, size_t cnt) +{ +#ifdef CONFIG_X86_MCE +	if (static_branch_unlikely(&mcsafe_key)) +		return memcpy_mcsafe_unrolled(dst, src, cnt); +	else +#endif +		memcpy(dst, src, cnt); +	return 0; +}  #endif /* __KERNEL__ */ diff --git a/arch/x86/include/asm/switch_to.h b/arch/x86/include/asm/switch_to.h index 8f321a1b03a1..5cb436acd463 100644 --- a/arch/x86/include/asm/switch_to.h +++ b/arch/x86/include/asm/switch_to.h @@ -2,130 +2,66 @@  #define _ASM_X86_SWITCH_TO_H  struct task_struct; /* one of the stranger aspects of C forward declarations */ + +struct task_struct *__switch_to_asm(struct task_struct *prev, +				    struct task_struct *next); +  __visible struct task_struct *__switch_to(struct task_struct *prev, -					   struct task_struct *next); +					  struct task_struct *next);  struct tss_struct;  void __switch_to_xtra(struct task_struct *prev_p, struct task_struct *next_p,  		      struct tss_struct *tss); -#ifdef CONFIG_X86_32 +/* This runs runs on the previous thread's stack. */ +static inline void prepare_switch_to(struct task_struct *prev, +				     struct task_struct *next) +{ +#ifdef CONFIG_VMAP_STACK +	/* +	 * If we switch to a stack that has a top-level paging entry +	 * that is not present in the current mm, the resulting #PF will +	 * will be promoted to a double-fault and we'll panic.  Probe +	 * the new stack now so that vmalloc_fault can fix up the page +	 * tables if needed.  This can only happen if we use a stack +	 * in vmap space. +	 * +	 * We assume that the stack is aligned so that it never spans +	 * more than one top-level paging entry. +	 * +	 * To minimize cache pollution, just follow the stack pointer. +	 */ +	READ_ONCE(*(unsigned char *)next->thread.sp); +#endif +} + +asmlinkage void ret_from_fork(void); + +/* data that is pointed to by thread.sp */ +struct inactive_task_frame { +#ifdef CONFIG_X86_64 +	unsigned long r15; +	unsigned long r14; +	unsigned long r13; +	unsigned long r12; +#else +	unsigned long si; +	unsigned long di; +#endif +	unsigned long bx; +	unsigned long bp; +	unsigned long ret_addr; +}; -#ifdef CONFIG_CC_STACKPROTECTOR -#define __switch_canary							\ -	"movl %P[task_canary](%[next]), %%ebx\n\t"			\ -	"movl %%ebx, "__percpu_arg([stack_canary])"\n\t" -#define __switch_canary_oparam						\ -	, [stack_canary] "=m" (stack_canary.canary) -#define __switch_canary_iparam						\ -	, [task_canary] "i" (offsetof(struct task_struct, stack_canary)) -#else	/* CC_STACKPROTECTOR */ -#define __switch_canary -#define __switch_canary_oparam -#define __switch_canary_iparam -#endif	/* CC_STACKPROTECTOR */ +struct fork_frame { +	struct inactive_task_frame frame; +	struct pt_regs regs; +}; -/* - * Saving eflags is important. It switches not only IOPL between tasks, - * it also protects other tasks from NT leaking through sysenter etc. - */  #define switch_to(prev, next, last)					\  do {									\ -	/*								\ -	 * Context-switching clobbers all registers, so we clobber	\ -	 * them explicitly, via unused output variables.		\ -	 * (EAX and EBP is not listed because EBP is saved/restored	\ -	 * explicitly for wchan access and EAX is the return value of	\ -	 * __switch_to())						\ -	 */								\ -	unsigned long ebx, ecx, edx, esi, edi;				\ -									\ -	asm volatile("pushl %%ebp\n\t"		/* save    EBP   */	\ -		     "movl %%esp,%[prev_sp]\n\t"	/* save    ESP   */ \ -		     "movl %[next_sp],%%esp\n\t"	/* restore ESP   */ \ -		     "movl $1f,%[prev_ip]\n\t"	/* save    EIP   */	\ -		     "pushl %[next_ip]\n\t"	/* restore EIP   */	\ -		     __switch_canary					\ -		     "jmp __switch_to\n"	/* regparm call  */	\ -		     "1:\t"						\ -		     "popl %%ebp\n\t"		/* restore EBP   */	\ -									\ -		     /* output parameters */				\ -		     : [prev_sp] "=m" (prev->thread.sp),		\ -		       [prev_ip] "=m" (prev->thread.ip),		\ -		       "=a" (last),					\ -									\ -		       /* clobbered output registers: */		\ -		       "=b" (ebx), "=c" (ecx), "=d" (edx),		\ -		       "=S" (esi), "=D" (edi)				\ -		       							\ -		       __switch_canary_oparam				\ -									\ -		       /* input parameters: */				\ -		     : [next_sp]  "m" (next->thread.sp),		\ -		       [next_ip]  "m" (next->thread.ip),		\ -		       							\ -		       /* regparm parameters for __switch_to(): */	\ -		       [prev]     "a" (prev),				\ -		       [next]     "d" (next)				\ +	prepare_switch_to(prev, next);					\  									\ -		       __switch_canary_iparam				\ -									\ -		     : /* reloaded segment registers */			\ -			"memory");					\ +	((last) = __switch_to_asm((prev), (next)));			\  } while (0) -#else /* CONFIG_X86_32 */ - -/* frame pointer must be last for get_wchan */ -#define SAVE_CONTEXT    "pushq %%rbp ; movq %%rsi,%%rbp\n\t" -#define RESTORE_CONTEXT "movq %%rbp,%%rsi ; popq %%rbp\t" - -#define __EXTRA_CLOBBER  \ -	, "rcx", "rbx", "rdx", "r8", "r9", "r10", "r11", \ -	  "r12", "r13", "r14", "r15", "flags" - -#ifdef CONFIG_CC_STACKPROTECTOR -#define __switch_canary							  \ -	"movq %P[task_canary](%%rsi),%%r8\n\t"				  \ -	"movq %%r8,"__percpu_arg([gs_canary])"\n\t" -#define __switch_canary_oparam						  \ -	, [gs_canary] "=m" (irq_stack_union.stack_canary) -#define __switch_canary_iparam						  \ -	, [task_canary] "i" (offsetof(struct task_struct, stack_canary)) -#else	/* CC_STACKPROTECTOR */ -#define __switch_canary -#define __switch_canary_oparam -#define __switch_canary_iparam -#endif	/* CC_STACKPROTECTOR */ - -/* - * There is no need to save or restore flags, because flags are always - * clean in kernel mode, with the possible exception of IOPL.  Kernel IOPL - * has no effect. - */ -#define switch_to(prev, next, last) \ -	asm volatile(SAVE_CONTEXT					  \ -	     "movq %%rsp,%P[threadrsp](%[prev])\n\t" /* save RSP */	  \ -	     "movq %P[threadrsp](%[next]),%%rsp\n\t" /* restore RSP */	  \ -	     "call __switch_to\n\t"					  \ -	     "movq "__percpu_arg([current_task])",%%rsi\n\t"		  \ -	     __switch_canary						  \ -	     "movq %P[thread_info](%%rsi),%%r8\n\t"			  \ -	     "movq %%rax,%%rdi\n\t" 					  \ -	     "testl  %[_tif_fork],%P[ti_flags](%%r8)\n\t"		  \ -	     "jnz   ret_from_fork\n\t"					  \ -	     RESTORE_CONTEXT						  \ -	     : "=a" (last)					  	  \ -	       __switch_canary_oparam					  \ -	     : [next] "S" (next), [prev] "D" (prev),			  \ -	       [threadrsp] "i" (offsetof(struct task_struct, thread.sp)), \ -	       [ti_flags] "i" (offsetof(struct thread_info, flags)),	  \ -	       [_tif_fork] "i" (_TIF_FORK),			  	  \ -	       [thread_info] "i" (offsetof(struct task_struct, stack)),   \ -	       [current_task] "m" (current_task)			  \ -	       __switch_canary_iparam					  \ -	     : "memory", "cc" __EXTRA_CLOBBER) - -#endif /* CONFIG_X86_32 */ -  #endif /* _ASM_X86_SWITCH_TO_H */ diff --git a/arch/x86/include/asm/syscall.h b/arch/x86/include/asm/syscall.h index 4e23dd15c661..e3c95e8e61c5 100644 --- a/arch/x86/include/asm/syscall.h +++ b/arch/x86/include/asm/syscall.h @@ -60,7 +60,7 @@ static inline long syscall_get_error(struct task_struct *task,  	 * TS_COMPAT is set for 32-bit syscall entries and then  	 * remains set until we return to user mode.  	 */ -	if (task_thread_info(task)->status & (TS_COMPAT|TS_I386_REGS_POKED)) +	if (task->thread.status & (TS_COMPAT|TS_I386_REGS_POKED))  		/*  		 * Sign-extend the value so (int)-EFOO becomes (long)-EFOO  		 * and will match correctly in comparisons. @@ -116,7 +116,7 @@ static inline void syscall_get_arguments(struct task_struct *task,  					 unsigned long *args)  {  # ifdef CONFIG_IA32_EMULATION -	if (task_thread_info(task)->status & TS_COMPAT) +	if (task->thread.status & TS_COMPAT)  		switch (i) {  		case 0:  			if (!n--) break; @@ -177,7 +177,7 @@ static inline void syscall_set_arguments(struct task_struct *task,  					 const unsigned long *args)  {  # ifdef CONFIG_IA32_EMULATION -	if (task_thread_info(task)->status & TS_COMPAT) +	if (task->thread.status & TS_COMPAT)  		switch (i) {  		case 0:  			if (!n--) break; @@ -234,18 +234,8 @@ static inline void syscall_set_arguments(struct task_struct *task,  static inline int syscall_get_arch(void)  { -#ifdef CONFIG_IA32_EMULATION -	/* -	 * TS_COMPAT is set for 32-bit syscall entry and then -	 * remains set until we return to user mode. -	 * -	 * x32 tasks should be considered AUDIT_ARCH_X86_64. -	 */ -	if (task_thread_info(current)->status & TS_COMPAT) -		return AUDIT_ARCH_I386; -#endif -	/* Both x32 and x86_64 are considered "64-bit". */ -	return AUDIT_ARCH_X86_64; +	/* x32 tasks should be considered AUDIT_ARCH_X86_64. */ +	return in_ia32_syscall() ? AUDIT_ARCH_I386 : AUDIT_ARCH_X86_64;  }  #endif	/* CONFIG_X86_32 */ diff --git a/arch/x86/include/asm/thread_info.h b/arch/x86/include/asm/thread_info.h index 8b7c8d8e0852..ad6f5eb07a95 100644 --- a/arch/x86/include/asm/thread_info.h +++ b/arch/x86/include/asm/thread_info.h @@ -53,20 +53,14 @@ struct task_struct;  #include <linux/atomic.h>  struct thread_info { -	struct task_struct	*task;		/* main task structure */ -	__u32			flags;		/* low level flags */ -	__u32			status;		/* thread synchronous flags */ -	__u32			cpu;		/* current CPU */ +	unsigned long		flags;		/* low level flags */  };  #define INIT_THREAD_INFO(tsk)			\  {						\ -	.task		= &tsk,			\  	.flags		= 0,			\ -	.cpu		= 0,			\  } -#define init_thread_info	(init_thread_union.thread_info)  #define init_stack		(init_thread_union.stack)  #else /* !__ASSEMBLY__ */ @@ -95,7 +89,6 @@ struct thread_info {  #define TIF_UPROBE		12	/* breakpointed or singlestepping */  #define TIF_NOTSC		16	/* TSC is not accessible in userland */  #define TIF_IA32		17	/* IA32 compatibility process */ -#define TIF_FORK		18	/* ret_from_fork */  #define TIF_NOHZ		19	/* in adaptive nohz mode */  #define TIF_MEMDIE		20	/* is terminating due to OOM killer */  #define TIF_POLLING_NRFLAG	21	/* idle is polling for TIF_NEED_RESCHED */ @@ -119,7 +112,6 @@ struct thread_info {  #define _TIF_UPROBE		(1 << TIF_UPROBE)  #define _TIF_NOTSC		(1 << TIF_NOTSC)  #define _TIF_IA32		(1 << TIF_IA32) -#define _TIF_FORK		(1 << TIF_FORK)  #define _TIF_NOHZ		(1 << TIF_NOHZ)  #define _TIF_POLLING_NRFLAG	(1 << TIF_POLLING_NRFLAG)  #define _TIF_IO_BITMAP		(1 << TIF_IO_BITMAP) @@ -160,11 +152,6 @@ struct thread_info {   */  #ifndef __ASSEMBLY__ -static inline struct thread_info *current_thread_info(void) -{ -	return (struct thread_info *)(current_top_of_stack() - THREAD_SIZE); -} -  static inline unsigned long current_stack_pointer(void)  {  	unsigned long sp; @@ -226,60 +213,19 @@ static inline int arch_within_stack_frames(const void * const stack,  # define cpu_current_top_of_stack (cpu_tss + TSS_sp0)  #endif -/* - * ASM operand which evaluates to a 'thread_info' address of - * the current task, if it is known that "reg" is exactly "off" - * bytes below the top of the stack currently. - * - * ( The kernel stack's size is known at build time, it is usually - *   2 or 4 pages, and the bottom  of the kernel stack contains - *   the thread_info structure. So to access the thread_info very - *   quickly from assembly code we can calculate down from the - *   top of the kernel stack to the bottom, using constant, - *   build-time calculations only. ) - * - * For example, to fetch the current thread_info->flags value into %eax - * on x86-64 defconfig kernels, in syscall entry code where RSP is - * currently at exactly SIZEOF_PTREGS bytes away from the top of the - * stack: - * - *      mov ASM_THREAD_INFO(TI_flags, %rsp, SIZEOF_PTREGS), %eax - * - * will translate to: - * - *      8b 84 24 b8 c0 ff ff      mov    -0x3f48(%rsp), %eax - * - * which is below the current RSP by almost 16K. - */ -#define ASM_THREAD_INFO(field, reg, off) ((field)+(off)-THREAD_SIZE)(reg) -  #endif -/* - * Thread-synchronous status. - * - * This is different from the flags in that nobody else - * ever touches our thread-synchronous status, so we don't - * have to worry about atomic accesses. - */ -#define TS_COMPAT		0x0002	/* 32bit syscall active (64BIT)*/  #ifdef CONFIG_COMPAT  #define TS_I386_REGS_POKED	0x0004	/* regs poked by 32-bit ptracer */  #endif -  #ifndef __ASSEMBLY__ -static inline bool in_ia32_syscall(void) -{  #ifdef CONFIG_X86_32 -	return true; -#endif -#ifdef CONFIG_IA32_EMULATION -	if (current_thread_info()->status & TS_COMPAT) -		return true; +#define in_ia32_syscall() true +#else +#define in_ia32_syscall() (IS_ENABLED(CONFIG_IA32_EMULATION) && \ +			   current->thread.status & TS_COMPAT)  #endif -	return false; -}  /*   * Force syscall return via IRET by making it look as if there was diff --git a/arch/x86/include/asm/traps.h b/arch/x86/include/asm/traps.h index c3496619740a..01fd0a7f48cd 100644 --- a/arch/x86/include/asm/traps.h +++ b/arch/x86/include/asm/traps.h @@ -117,6 +117,12 @@ extern void ist_exit(struct pt_regs *regs);  extern void ist_begin_non_atomic(struct pt_regs *regs);  extern void ist_end_non_atomic(void); +#ifdef CONFIG_VMAP_STACK +void __noreturn handle_stack_overflow(const char *message, +				      struct pt_regs *regs, +				      unsigned long fault_address); +#endif +  /* Interrupts/Exceptions */  enum {  	X86_TRAP_DE = 0,	/*  0, Divide-by-zero */ diff --git a/arch/x86/include/asm/uaccess.h b/arch/x86/include/asm/uaccess.h index 2131c4ce7d8a..faf3687f1035 100644 --- a/arch/x86/include/asm/uaccess.h +++ b/arch/x86/include/asm/uaccess.h @@ -11,6 +11,7 @@  #include <asm/asm.h>  #include <asm/page.h>  #include <asm/smap.h> +#include <asm/extable.h>  #define VERIFY_READ 0  #define VERIFY_WRITE 1 @@ -91,37 +92,6 @@ static inline bool __chk_range_not_ok(unsigned long addr, unsigned long size, un  	likely(!__range_not_ok(addr, size, user_addr_max()))  /* - * The exception table consists of triples of addresses relative to the - * exception table entry itself. The first address is of an instruction - * that is allowed to fault, the second is the target at which the program - * should continue. The third is a handler function to deal with the fault - * caused by the instruction in the first field. - * - * All the routines below use bits of fixup code that are out of line - * with the main instruction path.  This means when everything is well, - * we don't even have to jump over them.  Further, they do not intrude - * on our cache or tlb entries. - */ - -struct exception_table_entry { -	int insn, fixup, handler; -}; - -#define ARCH_HAS_RELATIVE_EXTABLE - -#define swap_ex_entry_fixup(a, b, tmp, delta)			\ -	do {							\ -		(a)->fixup = (b)->fixup + (delta);		\ -		(b)->fixup = (tmp).fixup - (delta);		\ -		(a)->handler = (b)->handler + (delta);		\ -		(b)->handler = (tmp).handler - (delta);		\ -	} while (0) - -extern int fixup_exception(struct pt_regs *regs, int trapnr); -extern bool ex_has_fault_handler(unsigned long ip); -extern void early_fixup_exception(struct pt_regs *regs, int trapnr); - -/*   * These are the main single-value transfer routines.  They automatically   * use the right size if we just have the right pointer type.   * diff --git a/arch/x86/include/asm/unwind.h b/arch/x86/include/asm/unwind.h new file mode 100644 index 000000000000..46de9ac4b990 --- /dev/null +++ b/arch/x86/include/asm/unwind.h @@ -0,0 +1,63 @@ +#ifndef _ASM_X86_UNWIND_H +#define _ASM_X86_UNWIND_H + +#include <linux/sched.h> +#include <linux/ftrace.h> +#include <asm/ptrace.h> +#include <asm/stacktrace.h> + +struct unwind_state { +	struct stack_info stack_info; +	unsigned long stack_mask; +	struct task_struct *task; +	int graph_idx; +#ifdef CONFIG_FRAME_POINTER +	unsigned long *bp; +#else +	unsigned long *sp; +#endif +}; + +void __unwind_start(struct unwind_state *state, struct task_struct *task, +		    struct pt_regs *regs, unsigned long *first_frame); + +bool unwind_next_frame(struct unwind_state *state); + +unsigned long unwind_get_return_address(struct unwind_state *state); + +static inline bool unwind_done(struct unwind_state *state) +{ +	return state->stack_info.type == STACK_TYPE_UNKNOWN; +} + +static inline +void unwind_start(struct unwind_state *state, struct task_struct *task, +		  struct pt_regs *regs, unsigned long *first_frame) +{ +	first_frame = first_frame ? : get_stack_pointer(task, regs); + +	__unwind_start(state, task, regs, first_frame); +} + +#ifdef CONFIG_FRAME_POINTER + +static inline +unsigned long *unwind_get_return_address_ptr(struct unwind_state *state) +{ +	if (unwind_done(state)) +		return NULL; + +	return state->bp + 1; +} + +#else /* !CONFIG_FRAME_POINTER */ + +static inline +unsigned long *unwind_get_return_address_ptr(struct unwind_state *state) +{ +	return NULL; +} + +#endif /* CONFIG_FRAME_POINTER */ + +#endif /* _ASM_X86_UNWIND_H */ diff --git a/arch/x86/include/asm/uv/uv_bau.h b/arch/x86/include/asm/uv/uv_bau.h index cc44d926c17e..57ab86d94d64 100644 --- a/arch/x86/include/asm/uv/uv_bau.h +++ b/arch/x86/include/asm/uv/uv_bau.h @@ -49,14 +49,12 @@  #define UV_NET_ENDPOINT_INTD		(is_uv1_hub() ?			\  			UV1_NET_ENDPOINT_INTD : UV2_NET_ENDPOINT_INTD)  #define UV_DESC_PSHIFT			49 -#define UV_PAYLOADQ_PNODE_SHIFT		49 +#define UV_PAYLOADQ_GNODE_SHIFT		49  #define UV_PTC_BASENAME			"sgi_uv/ptc_statistics"  #define UV_BAU_BASENAME			"sgi_uv/bau_tunables"  #define UV_BAU_TUNABLES_DIR		"sgi_uv"  #define UV_BAU_TUNABLES_FILE		"bau_tunables"  #define WHITESPACE			" \t\n" -#define uv_mmask			((1UL << uv_hub_info->m_val) - 1) -#define uv_physnodeaddr(x)		((__pa((unsigned long)(x)) & uv_mmask))  #define cpubit_isset(cpu, bau_local_cpumask) \  	test_bit((cpu), (bau_local_cpumask).bits) @@ -387,6 +385,17 @@ struct uv2_3_bau_msg_header {  	/* bits 127:120 */  }; +/* Abstracted BAU functions */ +struct bau_operations { +	unsigned long (*read_l_sw_ack)(void); +	unsigned long (*read_g_sw_ack)(int pnode); +	unsigned long (*bau_gpa_to_offset)(unsigned long vaddr); +	void (*write_l_sw_ack)(unsigned long mmr); +	void (*write_g_sw_ack)(int pnode, unsigned long mmr); +	void (*write_payload_first)(int pnode, unsigned long mmr); +	void (*write_payload_last)(int pnode, unsigned long mmr); +}; +  /*   * The activation descriptor:   * The format of the message to send, plus all accompanying control @@ -655,6 +664,16 @@ static inline void write_gmmr_activation(int pnode, unsigned long mmr_image)  	write_gmmr(pnode, UVH_LB_BAU_SB_ACTIVATION_CONTROL, mmr_image);  } +static inline void write_mmr_proc_payload_first(int pnode, unsigned long mmr_image) +{ +	write_gmmr(pnode, UV4H_LB_PROC_INTD_QUEUE_FIRST, mmr_image); +} + +static inline void write_mmr_proc_payload_last(int pnode, unsigned long mmr_image) +{ +	write_gmmr(pnode, UV4H_LB_PROC_INTD_QUEUE_LAST, mmr_image); +} +  static inline void write_mmr_payload_first(int pnode, unsigned long mmr_image)  {  	write_gmmr(pnode, UVH_LB_BAU_INTD_PAYLOAD_QUEUE_FIRST, mmr_image); @@ -700,6 +719,26 @@ static inline unsigned long read_gmmr_sw_ack(int pnode)  	return read_gmmr(pnode, UVH_LB_BAU_INTD_SOFTWARE_ACKNOWLEDGE);  } +static inline void write_mmr_proc_sw_ack(unsigned long mr) +{ +	uv_write_local_mmr(UV4H_LB_PROC_INTD_SOFT_ACK_CLEAR, mr); +} + +static inline void write_gmmr_proc_sw_ack(int pnode, unsigned long mr) +{ +	write_gmmr(pnode, UV4H_LB_PROC_INTD_SOFT_ACK_CLEAR, mr); +} + +static inline unsigned long read_mmr_proc_sw_ack(void) +{ +	return read_lmmr(UV4H_LB_PROC_INTD_SOFT_ACK_PENDING); +} + +static inline unsigned long read_gmmr_proc_sw_ack(int pnode) +{ +	return read_gmmr(pnode, UV4H_LB_PROC_INTD_SOFT_ACK_PENDING); +} +  static inline void write_mmr_data_config(int pnode, unsigned long mr)  {  	uv_write_global_mmr64(pnode, UVH_BAU_DATA_CONFIG, mr); diff --git a/arch/x86/include/asm/vdso.h b/arch/x86/include/asm/vdso.h index 43dc55be524e..2444189cbe28 100644 --- a/arch/x86/include/asm/vdso.h +++ b/arch/x86/include/asm/vdso.h @@ -41,6 +41,8 @@ extern const struct vdso_image vdso_image_32;  extern void __init init_vdso_image(const struct vdso_image *image); +extern int map_vdso_once(const struct vdso_image *image, unsigned long addr); +  #endif /* __ASSEMBLER__ */  #endif /* _ASM_X86_VDSO_H */ diff --git a/arch/x86/include/asm/xen/events.h b/arch/x86/include/asm/xen/events.h index e6911caf5bbf..608a79d5a466 100644 --- a/arch/x86/include/asm/xen/events.h +++ b/arch/x86/include/asm/xen/events.h @@ -20,15 +20,4 @@ static inline int xen_irqs_disabled(struct pt_regs *regs)  /* No need for a barrier -- XCHG is a barrier on x86. */  #define xchg_xen_ulong(ptr, val) xchg((ptr), (val)) -extern int xen_have_vector_callback; - -/* - * Events delivered via platform PCI interrupts are always - * routed to vcpu 0 and hence cannot be rebound. - */ -static inline bool xen_support_evtchn_rebind(void) -{ -	return (!xen_hvm_domain() || xen_have_vector_callback); -} -  #endif /* _ASM_X86_XEN_EVENTS_H */ diff --git a/arch/x86/include/uapi/asm/mce.h b/arch/x86/include/uapi/asm/mce.h index 2184943341bf..69a6e07e3149 100644 --- a/arch/x86/include/uapi/asm/mce.h +++ b/arch/x86/include/uapi/asm/mce.h @@ -26,6 +26,8 @@ struct mce {  	__u32 socketid;	/* CPU socket ID */  	__u32 apicid;	/* CPU initial apic ID */  	__u64 mcgcap;	/* MCGCAP MSR: machine check capabilities of CPU */ +	__u64 synd;	/* MCA_SYND MSR: only valid on SMCA systems */ +	__u64 ipid;	/* MCA_IPID MSR: only valid on SMCA systems */  };  #define MCE_GET_RECORD_LEN   _IOR('M', 1, int) diff --git a/arch/x86/include/uapi/asm/prctl.h b/arch/x86/include/uapi/asm/prctl.h index 3ac5032fae09..ae135de547f5 100644 --- a/arch/x86/include/uapi/asm/prctl.h +++ b/arch/x86/include/uapi/asm/prctl.h @@ -6,4 +6,10 @@  #define ARCH_GET_FS 0x1003  #define ARCH_GET_GS 0x1004 +#ifdef CONFIG_CHECKPOINT_RESTORE +# define ARCH_MAP_VDSO_X32	0x2001 +# define ARCH_MAP_VDSO_32	0x2002 +# define ARCH_MAP_VDSO_64	0x2003 +#endif +  #endif /* _ASM_X86_PRCTL_H */ |