/* linux/arch/x86/include/asm/special_insns.h */

#ifndef _ASM_X86_SPECIAL_INSNS_H
#define _ASM_X86_SPECIAL_INSNS_H


#ifdef __KERNEL__

#include <asm/nops.h>

/* Execute the CLTS instruction (see clts(), which clears the 'TS' bit). */
static inline void native_clts(void)
{
	asm volatile("clts");
}

/*
 * Volatile isn't enough to prevent the compiler from reordering the
 * read/write functions for the control registers and messing everything up.
 * A memory clobber would solve the problem, but would prevent reordering of
 * all loads and stores around it, which can hurt performance. The solution
 * is to use a variable and mimic reads and writes to it to enforce
 * serialization.
 */
extern unsigned long __force_order;

/*
 * Read control register CR0 and return its value.
 *
 * __force_order is listed as a dummy "=m" output so that the compiler
 * orders this asm against the CR write helpers, which name the same
 * variable as an "m" input.
 */
static inline unsigned long native_read_cr0(void)
{
	unsigned long val;
	asm volatile("mov %%cr0,%0\n\t" : "=r" (val), "=m" (__force_order));
	return val;
}

/*
 * Load @val into control register CR0.
 *
 * __force_order is passed as a dummy "m" input so the compiler keeps this
 * asm ordered with respect to the CR read helpers that "write" it.
 */
static inline void native_write_cr0(unsigned long val)
{
	asm volatile("mov %0,%%cr0": : "r" (val), "m" (__force_order));
}

/*
 * Read control register CR2 and return its value.
 *
 * The "=m" (__force_order) output is a dummy operand used only to order
 * this asm against the other control-register accessors.
 */
static inline unsigned long native_read_cr2(void)
{
	unsigned long val;
	asm volatile("mov %%cr2,%0\n\t" : "=r" (val), "=m" (__force_order));
	return val;
}

/*
 * Load @val into control register CR2.
 *
 * The "m" (__force_order) input is a dummy operand used only to order
 * this asm against the other control-register accessors.
 */
static inline void native_write_cr2(unsigned long val)
{
	asm volatile("mov %0,%%cr2": : "r" (val), "m" (__force_order));
}

/*
 * Read control register CR3 and return its value.
 *
 * As with the other CR readers, __force_order appears as a dummy "=m"
 * output purely to constrain compiler reordering.
 */
static inline unsigned long native_read_cr3(void)
{
	unsigned long val;
	asm volatile("mov %%cr3,%0\n\t" : "=r" (val), "=m" (__force_order));
	return val;
}

/*
 * Load @val into control register CR3.
 *
 * As with the other CR writers, __force_order appears as a dummy "m"
 * input purely to constrain compiler reordering.
 */
static inline void native_write_cr3(unsigned long val)
{
	asm volatile("mov %0,%%cr3": : "r" (val), "m" (__force_order));
}

/*
 * Read control register CR4 and return its value.
 *
 * This variant has no fault handling; native_read_cr4_safe() is the
 * version that copes with a CPU that lacks CR4. __force_order is a dummy
 * "=m" output used only for ordering.
 */
static inline unsigned long native_read_cr4(void)
{
	unsigned long val;
	asm volatile("mov %%cr4,%0\n\t" : "=r" (val), "=m" (__force_order));
	return val;
}

/*
 * Read CR4 in a way that tolerates the register not existing.
 *
 * On CONFIG_X86_32 the mov at label 1 gets an exception-table entry
 * (_ASM_EXTABLE(1b, 2b)) that points at label 2, and the "0" (0) matching
 * input preloads the output register with 0 before the read is attempted.
 * NOTE(review): so a faulting read presumably returns 0 -- the fixup
 * semantics live in _ASM_EXTABLE, which is not defined in this file.
 *
 * On other configurations this is simply native_read_cr4().
 */
static inline unsigned long native_read_cr4_safe(void)
{
	unsigned long val;
	/* This could fault if %cr4 does not exist. In x86_64, a cr4 always
	 * exists, so it will never fail. */
#ifdef CONFIG_X86_32
	asm volatile("1: mov %%cr4, %0\n"
		     "2:\n"
		     _ASM_EXTABLE(1b, 2b)
		     : "=r" (val), "=m" (__force_order) : "0" (0));
#else
	val = native_read_cr4();
#endif
	return val;
}

/*
 * Load @val into control register CR4.
 *
 * __force_order is a dummy "m" input that keeps the compiler from
 * reordering this asm with the control-register read helpers.
 */
static inline void native_write_cr4(unsigned long val)
{
	asm volatile("mov %0,%%cr4": : "r" (val), "m" (__force_order));
}

#ifdef CONFIG_X86_64
/*
 * Read control register CR8 and return its value (only built when
 * CONFIG_X86_64 is set).
 *
 * Note: unlike the CR0-CR4 readers, this asm does not reference
 * __force_order; it relies on "asm volatile" alone.
 */
static inline unsigned long native_read_cr8(void)
{
	unsigned long cr8;
	asm volatile("movq %%cr8,%0" : "=r" (cr8));
	return cr8;
}

/*
 * Load @val into control register CR8 (only built when CONFIG_X86_64 is
 * set).
 *
 * Note: this uses a full "memory" clobber rather than the __force_order
 * dummy operand used by the CR0-CR4 writers.
 */
static inline void native_write_cr8(unsigned long val)
{
	asm volatile("movq %0,%%cr8" :: "r" (val) : "memory");
}
#endif

/*
 * Execute the WBINVD instruction.
 *
 * The "memory" clobber tells the compiler not to move or cache memory
 * accesses across the instruction.
 */
static inline void native_wbinvd(void)
{
	asm volatile("wbinvd": : :"memory");
}

extern asmlinkage void native_load_gs_index(unsigned);

#ifdef CONFIG_PARAVIRT
#include <asm/paravirt.h>
#else

/*
 * read_cr0 - CR0 accessor used when CONFIG_PARAVIRT is not set.
 *
 * Returns the value reported by native_read_cr0().
 */
static inline unsigned long read_cr0(void)
{
	unsigned long cr0 = native_read_cr0();

	return cr0;
}

/*
 * Write @x to CR0. In this non-CONFIG_PARAVIRT branch the call goes
 * straight to native_write_cr0().
 */
static inline void write_cr0(unsigned long x)
{
	native_write_cr0(x);
}

/*
 * read_cr2 - CR2 accessor used when CONFIG_PARAVIRT is not set.
 *
 * Returns the value reported by native_read_cr2().
 */
static inline unsigned long read_cr2(void)
{
	unsigned long cr2 = native_read_cr2();

	return cr2;
}

/*
 * Write @x to CR2. In this non-CONFIG_PARAVIRT branch the call goes
 * straight to native_write_cr2().
 */
static inline void write_cr2(unsigned long x)
{
	native_write_cr2(x);
}

/*
 * read_cr3 - CR3 accessor used when CONFIG_PARAVIRT is not set.
 *
 * Returns the value reported by native_read_cr3().
 */
static inline unsigned long read_cr3(void)
{
	unsigned long cr3 = native_read_cr3();

	return cr3;
}

/*
 * Write @x to CR3. In this non-CONFIG_PARAVIRT branch the call goes
 * straight to native_write_cr3().
 */
static inline void write_cr3(unsigned long x)
{
	native_write_cr3(x);
}

/*
 * __read_cr4 - CR4 accessor used when CONFIG_PARAVIRT is not set.
 *
 * Returns the value reported by native_read_cr4().
 */
static inline unsigned long __read_cr4(void)
{
	unsigned long cr4 = native_read_cr4();

	return cr4;
}

/*
 * __read_cr4_safe - fault-tolerant CR4 accessor used when CONFIG_PARAVIRT
 * is not set.
 *
 * Returns the value reported by native_read_cr4_safe().
 */
static inline unsigned long __read_cr4_safe(void)
{
	unsigned long cr4 = native_read_cr4_safe();

	return cr4;
}

/*
 * Write @x to CR4. In this non-CONFIG_PARAVIRT branch the call goes
 * straight to native_write_cr4().
 */
static inline void __write_cr4(unsigned long x)
{
	native_write_cr4(x);
}

/*
 * Execute WBINVD. In this non-CONFIG_PARAVIRT branch the call goes
 * straight to native_wbinvd().
 */
static inline void wbinvd(void)
{
	native_wbinvd();
}

#ifdef CONFIG_X86_64

/*
 * read_cr8 - CR8 accessor for CONFIG_X86_64 builds without CONFIG_PARAVIRT.
 *
 * Returns the value reported by native_read_cr8().
 */
static inline unsigned long read_cr8(void)
{
	unsigned long cr8 = native_read_cr8();

	return cr8;
}

/*
 * Write @x to CR8 (CONFIG_X86_64 only). In this non-CONFIG_PARAVIRT
 * branch the call goes straight to native_write_cr8().
 */
static inline void write_cr8(unsigned long x)
{
	native_write_cr8(x);
}

/*
 * Forward @selector to native_load_gs_index(), which is declared earlier in
 * this header as an extern asmlinkage function (CONFIG_X86_64 only,
 * non-CONFIG_PARAVIRT branch).
 */
static inline void load_gs_index(unsigned selector)
{
	native_load_gs_index(selector);
}

#endif

/*
 * Clear the 'TS' bit.
 *
 * In this non-CONFIG_PARAVIRT branch the call goes straight to
 * native_clts(). stts() is the counterpart that sets X86_CR0_TS in CR0.
 */
static inline void clts(void)
{
	native_clts();
}

#endif/* CONFIG_PARAVIRT */

/* Set the 'TS' bit: read CR0, OR in X86_CR0_TS and write the result back. */
#define stts() write_cr0(read_cr0() | X86_CR0_TS)

/*
 * Issue CLFLUSH on the address @__p.
 *
 * The byte at @__p is passed as a read-write memory operand ("+m") so the
 * compiler treats the instruction as accessing that location.
 */
static inline void clflush(volatile void *__p)
{
	asm volatile("clflush %0" : "+m" (*(volatile char __force *)__p));
}

/*
 * Flush the address @__p, selecting the instruction via alternative_io()
 * keyed on X86_FEATURE_CLFLUSHOPT.
 *
 * Both alternatives are one prefix byte followed by "clflush %P0": the
 * first uses NOP_DS_PREFIX, the second uses 0x66.
 * NOTE(review): the 0x66-prefixed form is presumably the CLFLUSHOPT
 * encoding, patched in when the feature bit is set -- confirm against
 * alternative_io() and the instruction reference.
 *
 * The byte at @__p is a read-write memory operand ("+m").
 */
static inline void clflushopt(volatile void *__p)
{
	alternative_io(".byte " __stringify(NOP_DS_PREFIX) "; clflush %P0",
		       ".byte 0x66; clflush %P0",
		       X86_FEATURE_CLFLUSHOPT,
		       "+m" (*(volatile char __force *)__p));
}

/*
 * Emit pcommit followed by sfence as a single alternative() keyed on
 * X86_FEATURE_PCOMMIT; the other alternative is ASM_NOP7.
 *
 * pcommit is emitted as raw bytes (.byte 0x66, 0x0f, 0xae, 0xf8) rather
 * than by mnemonic.
 * NOTE(review): ASM_NOP7 is presumably sized to match the four pcommit
 * bytes plus the sfence encoding -- confirm if either side changes.
 */
static inline void pcommit_sfence(void)
{
	alternative(ASM_NOP7,
		    ".byte 0x66, 0x0f, 0xae, 0xf8\n\t" /* pcommit */
		    "sfence",
		    X86_FEATURE_PCOMMIT);
}

#define nop() asm volatile ("nop")


#endif /* __KERNEL__ */

#endif /* _ASM_X86_SPECIAL_INSNS_H */
Disintegrate asm/system.h for X86 Disintegrate asm/system.h for X86. Signed-off-by: David Howells <dhowells@redhat.com> Acked-by: H. Peter Anvin <hpa@zytor.com> cc: x86@kernel.org 2012-03-29 01:11:12 +08:00			`#ifndef _ASM_X86_SPECIAL_INSNS_H`
			`#define _ASM_X86_SPECIAL_INSNS_H`


			`#ifdef __KERNEL__`

x86/asm: Add support for the pcommit instruction Add support for the new pcommit (persistent commit) instruction. This instruction was announced in the document "Intel Architecture Instruction Set Extensions Programming Reference" with reference number 319433-022: https://software.intel.com/sites/default/files/managed/0d/53/319433-022.pdf The pcommit instruction ensures that data that has been flushed from the processor's cache hierarchy with clwb, clflushopt or clflush is accepted to memory and is durable on the DIMM. The primary use case for this is persistent memory. This function shows how to properly use clwb/clflushopt/clflush and pcommit with appropriate fencing: void flush_and_commit_buffer(void *vaddr, unsigned int size) { void *vend = vaddr + size - 1; for (; vaddr < vend; vaddr += boot_cpu_data.x86_clflush_size) clwb(vaddr); /* Flush any possible final partial cacheline */ clwb(vend); /* * sfence to order clwb/clflushopt/clflush cache flushes * mfence via mb() also works */ wmb(); /* pcommit and the required sfence for ordering */ pcommit_sfence(); } After this function completes the data pointed to by vaddr has been accepted to memory and will be durable if the vaddr points to persistent memory. Pcommit must always be ordered by an mfence or sfence, so to help simplify things we include both the pcommit and the required sfence in the alternatives generated by pcommit_sfence(). 
The other option is to keep them separated, but on platforms that don't support pcommit this would then turn into: void flush_and_commit_buffer(void *vaddr, unsigned int size) { void *vend = vaddr + size - 1; for (; vaddr < vend; vaddr += boot_cpu_data.x86_clflush_size) clwb(vaddr); /* Flush any possible final partial cacheline */ clwb(vend); /* * sfence to order clwb/clflushopt/clflush cache flushes * mfence via mb() also works */ wmb(); nop(); /* from pcommit(), via alternatives */ /* * sfence to order pcommit * mfence via mb() also works */ wmb(); } This is still correct, but now you've got two fences separated by only a nop. With the commit and the fence together in pcommit_sfence() you avoid the final unneeded fence. Signed-off-by: Ross Zwisler <ross.zwisler@linux.intel.com> Acked-by: Borislav Petkov <bp@suse.de> Acked-by: H. Peter Anvin <hpa@linux.intel.com> Cc: Linus Torvalds <torvalds@linux-foundation.org> Cc: Thomas Gleixner <tglx@linutronix.de> Link: http://lkml.kernel.org/r/1424367448-24254-1-git-send-email-ross.zwisler@linux.intel.com Signed-off-by: Ingo Molnar <mingo@kernel.org> 2015-02-20 01:37:28 +08:00			`#include <asm/nops.h>`

Disintegrate asm/system.h for X86 Disintegrate asm/system.h for X86. Signed-off-by: David Howells <dhowells@redhat.com> Acked-by: H. Peter Anvin <hpa@zytor.com> cc: x86@kernel.org 2012-03-29 01:11:12 +08:00			`static inline void native_clts(void)`
			`{`
			`asm volatile("clts");`
			`}`

			`/*`
			`* Volatile isn't enough to prevent the compiler from reordering the`
			`* read/write functions for the control registers and messing everything up.`
			`* A memory clobber would solve the problem, but would prevent reordering of`
			`* all loads stores around it, which can hurt performance. Solution is to`
			`* use a variable and mimic reads and writes to it to enforce serialization`
			`*/`
x86: __force_order doesn't need to be an actual variable It being static causes over a dozen instances to be scattered across the kernel image, with none of them ever being referenced in any way. Making the variable extern without ever defining it works as well - all we need is to have the compiler think the variable is being accessed. Signed-off-by: Jan Beulich <jbeulich@suse.com> Link: http://lkml.kernel.org/r/51A610B802000078000D99A0@nat28.tlf.novell.com Signed-off-by: Ingo Molnar <mingo@kernel.org> 2013-05-29 20:29:12 +08:00			`extern unsigned long __force_order;`
Disintegrate asm/system.h for X86 Disintegrate asm/system.h for X86. Signed-off-by: David Howells <dhowells@redhat.com> Acked-by: H. Peter Anvin <hpa@zytor.com> cc: x86@kernel.org 2012-03-29 01:11:12 +08:00
			`static inline unsigned long native_read_cr0(void)`
			`{`
			`unsigned long val;`
			`asm volatile("mov %%cr0,%0\n\t" : "=r" (val), "=m" (__force_order));`
			`return val;`
			`}`

			`static inline void native_write_cr0(unsigned long val)`
			`{`
			`asm volatile("mov %0,%%cr0": : "r" (val), "m" (__force_order));`
			`}`

			`static inline unsigned long native_read_cr2(void)`
			`{`
			`unsigned long val;`
			`asm volatile("mov %%cr2,%0\n\t" : "=r" (val), "=m" (__force_order));`
			`return val;`
			`}`

			`static inline void native_write_cr2(unsigned long val)`
			`{`
			`asm volatile("mov %0,%%cr2": : "r" (val), "m" (__force_order));`
			`}`

			`static inline unsigned long native_read_cr3(void)`
			`{`
			`unsigned long val;`
			`asm volatile("mov %%cr3,%0\n\t" : "=r" (val), "=m" (__force_order));`
			`return val;`
			`}`

			`static inline void native_write_cr3(unsigned long val)`
			`{`
			`asm volatile("mov %0,%%cr3": : "r" (val), "m" (__force_order));`
			`}`

			`static inline unsigned long native_read_cr4(void)`
			`{`
			`unsigned long val;`
			`asm volatile("mov %%cr4,%0\n\t" : "=r" (val), "=m" (__force_order));`
			`return val;`
			`}`

			`static inline unsigned long native_read_cr4_safe(void)`
			`{`
			`unsigned long val;`
			`/* This could fault if %cr4 does not exist. In x86_64, a cr4 always`
			`* exists, so it will never fail. */`
			`#ifdef CONFIG_X86_32`
			`asm volatile("1: mov %%cr4, %0\n"`
			`"2:\n"`
			`_ASM_EXTABLE(1b, 2b)`
			`: "=r" (val), "=m" (__force_order) : "0" (0));`
			`#else`
			`val = native_read_cr4();`
			`#endif`
			`return val;`
			`}`

			`static inline void native_write_cr4(unsigned long val)`
			`{`
			`asm volatile("mov %0,%%cr4": : "r" (val), "m" (__force_order));`
			`}`

			`#ifdef CONFIG_X86_64`
			`static inline unsigned long native_read_cr8(void)`
			`{`
			`unsigned long cr8;`
			`asm volatile("movq %%cr8,%0" : "=r" (cr8));`
			`return cr8;`
			`}`

			`static inline void native_write_cr8(unsigned long val)`
			`{`
			`asm volatile("movq %0,%%cr8" :: "r" (val) : "memory");`
			`}`
			`#endif`

			`static inline void native_wbinvd(void)`
			`{`
			`asm volatile("wbinvd": : :"memory");`
			`}`

x86, asmlinkage: Make several variables used from assembler/linker script visible Plus one function, load_gs_index(). Signed-off-by: Andi Kleen <ak@linux.intel.com> Link: http://lkml.kernel.org/r/1375740170-7446-10-git-send-email-andi@firstfloor.org Signed-off-by: H. Peter Anvin <hpa@linux.intel.com> 2013-08-06 06:02:43 +08:00			`extern asmlinkage void native_load_gs_index(unsigned);`
Disintegrate asm/system.h for X86 Disintegrate asm/system.h for X86. Signed-off-by: David Howells <dhowells@redhat.com> Acked-by: H. Peter Anvin <hpa@zytor.com> cc: x86@kernel.org 2012-03-29 01:11:12 +08:00
			`#ifdef CONFIG_PARAVIRT`
			`#include <asm/paravirt.h>`
			`#else`

			`static inline unsigned long read_cr0(void)`
			`{`
			`return native_read_cr0();`
			`}`

			`static inline void write_cr0(unsigned long x)`
			`{`
			`native_write_cr0(x);`
			`}`

			`static inline unsigned long read_cr2(void)`
			`{`
			`return native_read_cr2();`
			`}`

			`static inline void write_cr2(unsigned long x)`
			`{`
			`native_write_cr2(x);`
			`}`

			`static inline unsigned long read_cr3(void)`
			`{`
			`return native_read_cr3();`
			`}`

			`static inline void write_cr3(unsigned long x)`
			`{`
			`native_write_cr3(x);`
			`}`

x86: Store a per-cpu shadow copy of CR4 Context switches and TLB flushes can change individual bits of CR4. CR4 reads take several cycles, so store a shadow copy of CR4 in a per-cpu variable. To avoid wasting a cache line, I added the CR4 shadow to cpu_tlbstate, which is already touched in switch_mm. The heaviest users of the cr4 shadow will be switch_mm and __switch_to_xtra, and __switch_to_xtra is called shortly after switch_mm during context switch, so the cacheline is likely to be hot. Signed-off-by: Andy Lutomirski <luto@amacapital.net> Reviewed-by: Thomas Gleixner <tglx@linutronix.de> Signed-off-by: Peter Zijlstra (Intel) <peterz@infradead.org> Cc: Kees Cook <keescook@chromium.org> Cc: Andrea Arcangeli <aarcange@redhat.com> Cc: Vince Weaver <vince@deater.net> Cc: "hillf.zj" <hillf.zj@alibaba-inc.com> Cc: Valdis Kletnieks <Valdis.Kletnieks@vt.edu> Cc: Paul Mackerras <paulus@samba.org> Cc: Arnaldo Carvalho de Melo <acme@kernel.org> Cc: Linus Torvalds <torvalds@linux-foundation.org> Link: http://lkml.kernel.org/r/3a54dd3353fffbf84804398e00dfdc5b7c1afd7d.1414190806.git.luto@amacapital.net Signed-off-by: Ingo Molnar <mingo@kernel.org> 2014-10-25 06:58:08 +08:00			`static inline unsigned long __read_cr4(void)`
Disintegrate asm/system.h for X86 Disintegrate asm/system.h for X86. Signed-off-by: David Howells <dhowells@redhat.com> Acked-by: H. Peter Anvin <hpa@zytor.com> cc: x86@kernel.org 2012-03-29 01:11:12 +08:00			`{`
			`return native_read_cr4();`
			`}`

x86: Store a per-cpu shadow copy of CR4 Context switches and TLB flushes can change individual bits of CR4. CR4 reads take several cycles, so store a shadow copy of CR4 in a per-cpu variable. To avoid wasting a cache line, I added the CR4 shadow to cpu_tlbstate, which is already touched in switch_mm. The heaviest users of the cr4 shadow will be switch_mm and __switch_to_xtra, and __switch_to_xtra is called shortly after switch_mm during context switch, so the cacheline is likely to be hot. Signed-off-by: Andy Lutomirski <luto@amacapital.net> Reviewed-by: Thomas Gleixner <tglx@linutronix.de> Signed-off-by: Peter Zijlstra (Intel) <peterz@infradead.org> Cc: Kees Cook <keescook@chromium.org> Cc: Andrea Arcangeli <aarcange@redhat.com> Cc: Vince Weaver <vince@deater.net> Cc: "hillf.zj" <hillf.zj@alibaba-inc.com> Cc: Valdis Kletnieks <Valdis.Kletnieks@vt.edu> Cc: Paul Mackerras <paulus@samba.org> Cc: Arnaldo Carvalho de Melo <acme@kernel.org> Cc: Linus Torvalds <torvalds@linux-foundation.org> Link: http://lkml.kernel.org/r/3a54dd3353fffbf84804398e00dfdc5b7c1afd7d.1414190806.git.luto@amacapital.net Signed-off-by: Ingo Molnar <mingo@kernel.org> 2014-10-25 06:58:08 +08:00			`static inline unsigned long __read_cr4_safe(void)`
Disintegrate asm/system.h for X86 Disintegrate asm/system.h for X86. Signed-off-by: David Howells <dhowells@redhat.com> Acked-by: H. Peter Anvin <hpa@zytor.com> cc: x86@kernel.org 2012-03-29 01:11:12 +08:00			`{`
			`return native_read_cr4_safe();`
			`}`

x86: Store a per-cpu shadow copy of CR4 Context switches and TLB flushes can change individual bits of CR4. CR4 reads take several cycles, so store a shadow copy of CR4 in a per-cpu variable. To avoid wasting a cache line, I added the CR4 shadow to cpu_tlbstate, which is already touched in switch_mm. The heaviest users of the cr4 shadow will be switch_mm and __switch_to_xtra, and __switch_to_xtra is called shortly after switch_mm during context switch, so the cacheline is likely to be hot. Signed-off-by: Andy Lutomirski <luto@amacapital.net> Reviewed-by: Thomas Gleixner <tglx@linutronix.de> Signed-off-by: Peter Zijlstra (Intel) <peterz@infradead.org> Cc: Kees Cook <keescook@chromium.org> Cc: Andrea Arcangeli <aarcange@redhat.com> Cc: Vince Weaver <vince@deater.net> Cc: "hillf.zj" <hillf.zj@alibaba-inc.com> Cc: Valdis Kletnieks <Valdis.Kletnieks@vt.edu> Cc: Paul Mackerras <paulus@samba.org> Cc: Arnaldo Carvalho de Melo <acme@kernel.org> Cc: Linus Torvalds <torvalds@linux-foundation.org> Link: http://lkml.kernel.org/r/3a54dd3353fffbf84804398e00dfdc5b7c1afd7d.1414190806.git.luto@amacapital.net Signed-off-by: Ingo Molnar <mingo@kernel.org> 2014-10-25 06:58:08 +08:00			`static inline void __write_cr4(unsigned long x)`
Disintegrate asm/system.h for X86 Disintegrate asm/system.h for X86. Signed-off-by: David Howells <dhowells@redhat.com> Acked-by: H. Peter Anvin <hpa@zytor.com> cc: x86@kernel.org 2012-03-29 01:11:12 +08:00			`{`
			`native_write_cr4(x);`
			`}`

			`static inline void wbinvd(void)`
			`{`
			`native_wbinvd();`
			`}`

			`#ifdef CONFIG_X86_64`

			`static inline unsigned long read_cr8(void)`
			`{`
			`return native_read_cr8();`
			`}`

			`static inline void write_cr8(unsigned long x)`
			`{`
			`native_write_cr8(x);`
			`}`

			`static inline void load_gs_index(unsigned selector)`
			`{`
			`native_load_gs_index(selector);`
			`}`

			`#endif`

			`/* Clear the 'TS' bit */`
			`static inline void clts(void)`
			`{`
			`native_clts();`
			`}`

			`#endif/* CONFIG_PARAVIRT */`

			`#define stts() write_cr0(read_cr0() | X86_CR0_TS)`

			`static inline void clflush(volatile void *__p)`
			`{`
			`asm volatile("clflush %0" : "+m" (*(volatile char __force *)__p));`
			`}`

x86: Add support for the clflushopt instruction Add support for the new clflushopt instruction. This instruction was announced in the document "Intel Architecture Instruction Set Extensions Programming Reference" with Ref # 319433-018. http://download-software.intel.com/sites/default/files/managed/50/1a/319433-018.pdf [ hpa: changed the feature flag to simply X86_FEATURE_CLFLUSHOPT - if that is what we want to report in /proc/cpuinfo anyway... ] Signed-off-by: Ross Zwisler <ross.zwisler@linux.intel.com> Link: http://lkml.kernel.org/r/1393441612-19729-2-git-send-email-ross.zwisler@linux.intel.com Signed-off-by: H. Peter Anvin <hpa@linux.intel.com> 2014-02-27 03:06:49 +08:00			`static inline void clflushopt(volatile void *__p)`
			`{`
			`alternative_io(".byte " __stringify(NOP_DS_PREFIX) "; clflush %P0",`
			`".byte 0x66; clflush %P0",`
			`X86_FEATURE_CLFLUSHOPT,`
			`"+m" (*(volatile char __force *)__p));`
			`}`

x86/asm: Add support for the pcommit instruction Add support for the new pcommit (persistent commit) instruction. This instruction was announced in the document "Intel Architecture Instruction Set Extensions Programming Reference" with reference number 319433-022: https://software.intel.com/sites/default/files/managed/0d/53/319433-022.pdf The pcommit instruction ensures that data that has been flushed from the processor's cache hierarchy with clwb, clflushopt or clflush is accepted to memory and is durable on the DIMM. The primary use case for this is persistent memory. This function shows how to properly use clwb/clflushopt/clflush and pcommit with appropriate fencing: void flush_and_commit_buffer(void *vaddr, unsigned int size) { void *vend = vaddr + size - 1; for (; vaddr < vend; vaddr += boot_cpu_data.x86_clflush_size) clwb(vaddr); /* Flush any possible final partial cacheline */ clwb(vend); /* * sfence to order clwb/clflushopt/clflush cache flushes * mfence via mb() also works */ wmb(); /* pcommit and the required sfence for ordering */ pcommit_sfence(); } After this function completes the data pointed to by vaddr has been accepted to memory and will be durable if the vaddr points to persistent memory. Pcommit must always be ordered by an mfence or sfence, so to help simplify things we include both the pcommit and the required sfence in the alternatives generated by pcommit_sfence(). 
The other option is to keep them separated, but on platforms that don't support pcommit this would then turn into: void flush_and_commit_buffer(void *vaddr, unsigned int size) { void *vend = vaddr + size - 1; for (; vaddr < vend; vaddr += boot_cpu_data.x86_clflush_size) clwb(vaddr); /* Flush any possible final partial cacheline */ clwb(vend); /* * sfence to order clwb/clflushopt/clflush cache flushes * mfence via mb() also works */ wmb(); nop(); /* from pcommit(), via alternatives */ /* * sfence to order pcommit * mfence via mb() also works */ wmb(); } This is still correct, but now you've got two fences separated by only a nop. With the commit and the fence together in pcommit_sfence() you avoid the final unneeded fence. Signed-off-by: Ross Zwisler <ross.zwisler@linux.intel.com> Acked-by: Borislav Petkov <bp@suse.de> Acked-by: H. Peter Anvin <hpa@linux.intel.com> Cc: Linus Torvalds <torvalds@linux-foundation.org> Cc: Thomas Gleixner <tglx@linutronix.de> Link: http://lkml.kernel.org/r/1424367448-24254-1-git-send-email-ross.zwisler@linux.intel.com Signed-off-by: Ingo Molnar <mingo@kernel.org> 2015-02-20 01:37:28 +08:00			`static inline void pcommit_sfence(void)`
			`{`
			`alternative(ASM_NOP7,`
			`".byte 0x66, 0x0f, 0xae, 0xf8\n\t" /* pcommit */`
			`"sfence",`
			`X86_FEATURE_PCOMMIT);`
			`}`

Disintegrate asm/system.h for X86 Disintegrate asm/system.h for X86. Signed-off-by: David Howells <dhowells@redhat.com> Acked-by: H. Peter Anvin <hpa@zytor.com> cc: x86@kernel.org 2012-03-29 01:11:12 +08:00			`#define nop() asm volatile ("nop")`


			`#endif /* __KERNEL__ */`

			`#endif /* _ASM_X86_SPECIAL_INSNS_H */`