diff options
Diffstat (limited to 'arch/x86/lib')
| -rw-r--r-- | arch/x86/lib/Makefile | 1 | ||||
| -rw-r--r-- | arch/x86/lib/checksum_32.S | 7 | ||||
| -rw-r--r-- | arch/x86/lib/delay.c | 4 | ||||
| -rw-r--r-- | arch/x86/lib/retpoline.S | 49 | ||||
| -rw-r--r-- | arch/x86/lib/x86-opcode-map.txt | 13 | 
5 files changed, 67 insertions, 7 deletions
| diff --git a/arch/x86/lib/Makefile b/arch/x86/lib/Makefile index 7b181b61170e..f23934bbaf4e 100644 --- a/arch/x86/lib/Makefile +++ b/arch/x86/lib/Makefile @@ -26,6 +26,7 @@ lib-y += memcpy_$(BITS).o  lib-$(CONFIG_RWSEM_XCHGADD_ALGORITHM) += rwsem.o  lib-$(CONFIG_INSTRUCTION_DECODER) += insn.o inat.o insn-eval.o  lib-$(CONFIG_RANDOMIZE_BASE) += kaslr.o +lib-$(CONFIG_RETPOLINE) += retpoline.o  obj-y += msr.o msr-reg.o msr-reg-export.o hweight.o diff --git a/arch/x86/lib/checksum_32.S b/arch/x86/lib/checksum_32.S index 4d34bb548b41..46e71a74e612 100644 --- a/arch/x86/lib/checksum_32.S +++ b/arch/x86/lib/checksum_32.S @@ -29,7 +29,8 @@  #include <asm/errno.h>  #include <asm/asm.h>  #include <asm/export.h> -				 +#include <asm/nospec-branch.h> +  /*   * computes a partial checksum, e.g. for TCP/UDP fragments   */ @@ -156,7 +157,7 @@ ENTRY(csum_partial)  	negl %ebx  	lea 45f(%ebx,%ebx,2), %ebx  	testl %esi, %esi -	jmp *%ebx +	JMP_NOSPEC %ebx  	# Handle 2-byte-aligned regions  20:	addw (%esi), %ax @@ -439,7 +440,7 @@ ENTRY(csum_partial_copy_generic)  	andl $-32,%edx  	lea 3f(%ebx,%ebx), %ebx  	testl %esi, %esi  -	jmp *%ebx +	JMP_NOSPEC %ebx  1:	addl $64,%esi  	addl $64,%edi   	SRC(movb -32(%edx),%bl)	; SRC(movb (%edx),%bl) diff --git a/arch/x86/lib/delay.c b/arch/x86/lib/delay.c index 553f8fd23cc4..4846eff7e4c8 100644 --- a/arch/x86/lib/delay.c +++ b/arch/x86/lib/delay.c @@ -107,10 +107,10 @@ static void delay_mwaitx(unsigned long __loops)  		delay = min_t(u64, MWAITX_MAX_LOOPS, loops);  		/* -		 * Use cpu_tss as a cacheline-aligned, seldomly +		 * Use cpu_tss_rw as a cacheline-aligned, seldomly  		 * accessed per-cpu variable as the monitor target.  		 */ -		__monitorx(raw_cpu_ptr(&cpu_tss), 0, 0); +		__monitorx(raw_cpu_ptr(&cpu_tss_rw), 0, 0);  		/*  		 * AMD, like Intel, supports the EAX hint and EAX=0xf diff --git a/arch/x86/lib/retpoline.S b/arch/x86/lib/retpoline.S new file mode 100644 index 000000000000..dfb2ba91b670 --- /dev/null +++ b/arch/x86/lib/retpoline.S @@ -0,0 +1,49 @@ +/* SPDX-License-Identifier: GPL-2.0 */ + +#include <linux/stringify.h> +#include <linux/linkage.h> +#include <asm/dwarf2.h> +#include <asm/cpufeatures.h> +#include <asm/alternative-asm.h> +#include <asm/export.h> +#include <asm/nospec-branch.h> + +.macro THUNK reg +	.section .text.__x86.indirect_thunk + +ENTRY(__x86_indirect_thunk_\reg) +	CFI_STARTPROC +	JMP_NOSPEC %\reg +	CFI_ENDPROC +ENDPROC(__x86_indirect_thunk_\reg) +.endm + +/* + * Despite being an assembler file we can't just use .irp here + * because __KSYM_DEPS__ only uses the C preprocessor and would + * only see one instance of "__x86_indirect_thunk_\reg" rather + * than one per register with the correct names. So we do it + * the simple and nasty way... + */ +#define __EXPORT_THUNK(sym) _ASM_NOKPROBE(sym); EXPORT_SYMBOL(sym) +#define EXPORT_THUNK(reg) __EXPORT_THUNK(__x86_indirect_thunk_ ## reg) +#define GENERATE_THUNK(reg) THUNK reg ; EXPORT_THUNK(reg) + +GENERATE_THUNK(_ASM_AX) +GENERATE_THUNK(_ASM_BX) +GENERATE_THUNK(_ASM_CX) +GENERATE_THUNK(_ASM_DX) +GENERATE_THUNK(_ASM_SI) +GENERATE_THUNK(_ASM_DI) +GENERATE_THUNK(_ASM_BP) +GENERATE_THUNK(_ASM_SP) +#ifdef CONFIG_64BIT +GENERATE_THUNK(r8) +GENERATE_THUNK(r9) +GENERATE_THUNK(r10) +GENERATE_THUNK(r11) +GENERATE_THUNK(r12) +GENERATE_THUNK(r13) +GENERATE_THUNK(r14) +GENERATE_THUNK(r15) +#endif diff --git a/arch/x86/lib/x86-opcode-map.txt b/arch/x86/lib/x86-opcode-map.txt index c4d55919fac1..e0b85930dd77 100644 --- a/arch/x86/lib/x86-opcode-map.txt +++ b/arch/x86/lib/x86-opcode-map.txt @@ -607,7 +607,7 @@ fb: psubq Pq,Qq | vpsubq Vx,Hx,Wx (66),(v1)  fc: paddb Pq,Qq | vpaddb Vx,Hx,Wx (66),(v1)  fd: paddw Pq,Qq | vpaddw Vx,Hx,Wx (66),(v1)  fe: paddd Pq,Qq | vpaddd Vx,Hx,Wx (66),(v1) -ff: +ff: UD0  EndTable  Table: 3-byte opcode 1 (0x0f 0x38) @@ -717,7 +717,7 @@ AVXcode: 2  7e: vpermt2d/q Vx,Hx,Wx (66),(ev)  7f: vpermt2ps/d Vx,Hx,Wx (66),(ev)  80: INVEPT Gy,Mdq (66) -81: INVPID Gy,Mdq (66) +81: INVVPID Gy,Mdq (66)  82: INVPCID Gy,Mdq (66)  83: vpmultishiftqb Vx,Hx,Wx (66),(ev)  88: vexpandps/d Vpd,Wpd (66),(ev) @@ -970,6 +970,15 @@ GrpTable: Grp9  EndTable  GrpTable: Grp10 +# all are UD1 +0: UD1 +1: UD1 +2: UD1 +3: UD1 +4: UD1 +5: UD1 +6: UD1 +7: UD1  EndTable  # Grp11A and Grp11B are expressed as Grp11 in Intel SDM |