2010-09-18 06:36:40 +08:00
|
|
|
#ifndef _ASM_X86_MWAIT_H
|
|
|
|
#define _ASM_X86_MWAIT_H
|
|
|
|
|
2013-12-12 22:08:36 +08:00
|
|
|
#include <linux/sched.h>
|
|
|
|
|
2016-01-27 05:12:04 +08:00
|
|
|
#include <asm/cpufeature.h>
|
|
|
|
|
2010-09-18 06:36:40 +08:00
|
|
|
/*
 * Layout of an MWAIT hint value, as decoded by the helpers below:
 *   bits [3:0] - sub-state
 *   bits [7:4] - C-state
 */
#define MWAIT_SUBSTATE_MASK		0xf
#define MWAIT_CSTATE_MASK		0xf
#define MWAIT_SUBSTATE_SIZE		4

/* Extract the C-state field (the bits above the sub-state field). */
#define MWAIT_HINT2CSTATE(hint)		(((hint) >> MWAIT_SUBSTATE_SIZE) & MWAIT_CSTATE_MASK)
/*
 * Extract the sub-state field (the low MWAIT_SUBSTATE_SIZE bits).
 * Masks with MWAIT_SUBSTATE_MASK: the sub-state field must not depend on
 * the width of the C-state field, even though both masks are 0xf today.
 */
#define MWAIT_HINT2SUBSTATE(hint)	((hint) & MWAIT_SUBSTATE_MASK)

/* CPUID leaf number used for MONITOR/MWAIT enumeration, and ECX flag bits. */
#define CPUID_MWAIT_LEAF		5
#define CPUID5_ECX_EXTENSIONS_SUPPORTED	0x1
#define CPUID5_ECX_INTERRUPT_BREAK	0x2

/* Flag passed in ECX to MWAIT (bit 0). */
#define MWAIT_ECX_INTERRUPT_BREAK	0x1

/* MWAITX ECX[1]: enable timer if set. */
#define MWAITX_ECX_TIMER_ENABLE		BIT(1)
/* Largest 32-bit value; NOTE(review): presumably the EBX wait-time ceiling. */
#define MWAITX_MAX_LOOPS		((u32)-1)
#define MWAITX_DISABLE_CSTATES		0xf
|
2010-09-18 06:36:40 +08:00
|
|
|
|
2013-12-12 22:08:36 +08:00
|
|
|
static inline void __monitor(const void *eax, unsigned long ecx,
|
|
|
|
unsigned long edx)
|
|
|
|
{
|
|
|
|
/* "monitor %eax, %ecx, %edx;" */
|
|
|
|
asm volatile(".byte 0x0f, 0x01, 0xc8;"
|
|
|
|
:: "a" (eax), "c" (ecx), "d"(edx));
|
|
|
|
}
|
|
|
|
|
2015-08-10 18:19:53 +08:00
|
|
|
static inline void __monitorx(const void *eax, unsigned long ecx,
|
|
|
|
unsigned long edx)
|
|
|
|
{
|
|
|
|
/* "monitorx %eax, %ecx, %edx;" */
|
|
|
|
asm volatile(".byte 0x0f, 0x01, 0xfa;"
|
|
|
|
:: "a" (eax), "c" (ecx), "d"(edx));
|
|
|
|
}
|
|
|
|
|
2013-12-12 22:08:36 +08:00
|
|
|
static inline void __mwait(unsigned long eax, unsigned long ecx)
|
|
|
|
{
|
|
|
|
/* "mwait %eax, %ecx;" */
|
|
|
|
asm volatile(".byte 0x0f, 0x01, 0xc9;"
|
|
|
|
:: "a" (eax), "c" (ecx));
|
|
|
|
}
|
|
|
|
|
2015-08-10 18:19:53 +08:00
|
|
|
/*
|
|
|
|
* MWAITX allows for a timer expiration to get the core out a wait state in
|
|
|
|
* addition to the default MWAIT exit condition of a store appearing at a
|
|
|
|
* monitored virtual address.
|
|
|
|
*
|
|
|
|
* Registers:
|
|
|
|
*
|
|
|
|
* MWAITX ECX[1]: enable timer if set
|
|
|
|
* MWAITX EBX[31:0]: max wait time expressed in SW P0 clocks. The software P0
|
|
|
|
* frequency is the same as the TSC frequency.
|
|
|
|
*
|
|
|
|
* Below is a comparison between MWAIT and MWAITX on AMD processors:
|
|
|
|
*
|
|
|
|
* MWAIT MWAITX
|
|
|
|
* opcode 0f 01 c9 | 0f 01 fb
|
|
|
|
* ECX[0] value of RFLAGS.IF seen by instruction
|
|
|
|
* ECX[1] unused/#GP if set | enable timer if set
|
|
|
|
* ECX[31:2] unused/#GP if set
|
|
|
|
* EAX unused (reserve for hint)
|
|
|
|
* EBX[31:0] unused | max wait time (P0 clocks)
|
|
|
|
*
|
|
|
|
* MONITOR MONITORX
|
|
|
|
* opcode 0f 01 c8 | 0f 01 fa
|
|
|
|
* EAX (logical) address to monitor
|
|
|
|
* ECX #GP if not zero
|
|
|
|
*/
|
|
|
|
static inline void __mwaitx(unsigned long eax, unsigned long ebx,
|
|
|
|
unsigned long ecx)
|
|
|
|
{
|
|
|
|
/* "mwaitx %eax, %ebx, %ecx;" */
|
|
|
|
asm volatile(".byte 0x0f, 0x01, 0xfb;"
|
|
|
|
:: "a" (eax), "b" (ebx), "c" (ecx));
|
|
|
|
}
|
|
|
|
|
sched/idle/x86: Restore mwait_idle() to fix boot hangs, to improve power savings and to improve performance
In Linux-3.9 we removed the mwait_idle() loop:
69fb3676df33 ("x86 idle: remove mwait_idle() and "idle=mwait" cmdline param")
The reasoning was that modern machines should be sufficiently
happy during the boot process using the default_idle() HALT
loop, until cpuidle loads and either acpi_idle or intel_idle
invoke the newer MWAIT-with-hints idle loop.
But two machines reported problems:
1. Certain Core2-era machines support MWAIT-C1 and HALT only.
MWAIT-C1 is preferred for optimal power and performance.
But if they support just C1, cpuidle never loads and
so they use the boot-time default idle loop forever.
2. Some laptops will boot-hang if HALT is used,
but will boot successfully if MWAIT is used.
This appears to be a hidden assumption in BIOS SMI,
that is presumably valid on the proprietary OS
where the BIOS was validated.
https://bugzilla.kernel.org/show_bug.cgi?id=60770
So here we effectively revert the patch above, restoring
the mwait_idle() loop. However, we don't bother restoring
the idle=mwait cmdline parameter, since it appears to add
no value.
Maintainer notes:
For 3.9, simply revert 69fb3676df
for 3.10, patch -F3 applies, fuzz needed due to __cpuinit use in
context For 3.11, 3.12, 3.13, this patch applies cleanly
Tested-by: Mike Galbraith <bitbucket@online.de>
Signed-off-by: Len Brown <len.brown@intel.com>
Acked-by: Mike Galbraith <bitbucket@online.de>
Cc: <stable@vger.kernel.org> # 3.9+
Cc: Borislav Petkov <bp@alien8.de>
Cc: H. Peter Anvin <hpa@zytor.com>
Cc: Ian Malone <ibmalone@gmail.com>
Cc: Josh Boyer <jwboyer@redhat.com>
Cc: Linus Torvalds <torvalds@linux-foundation.org>
Cc: Mike Galbraith <efault@gmx.de>
Cc: Peter Zijlstra <peterz@infradead.org>
Cc: Thomas Gleixner <tglx@linutronix.de>
Link: http://lkml.kernel.org/r/345254a551eb5a6a866e048d7ab570fd2193aca4.1389763084.git.len.brown@intel.com
[ Ported to recent kernels. ]
Signed-off-by: Ingo Molnar <mingo@kernel.org>
2014-01-15 13:37:34 +08:00
|
|
|
static inline void __sti_mwait(unsigned long eax, unsigned long ecx)
|
|
|
|
{
|
|
|
|
trace_hardirqs_on();
|
|
|
|
/* "mwait %eax, %ecx;" */
|
|
|
|
asm volatile("sti; .byte 0x0f, 0x01, 0xc9;"
|
|
|
|
:: "a" (eax), "c" (ecx));
|
|
|
|
}
|
|
|
|
|
2013-12-12 22:08:36 +08:00
|
|
|
/*
|
|
|
|
* This uses new MONITOR/MWAIT instructions on P4 processors with PNI,
|
|
|
|
* which can obviate IPI to trigger checking of need_resched.
|
|
|
|
* We execute MONITOR against need_resched and enter optimized wait state
|
|
|
|
* through MWAIT. Whenever someone changes need_resched, we would be woken
|
|
|
|
* up from MWAIT (without an IPI).
|
|
|
|
*
|
|
|
|
* New with Core Duo processors, MWAIT can take some hints based on CPU
|
|
|
|
* capability.
|
|
|
|
*/
|
|
|
|
static inline void mwait_idle_with_hints(unsigned long eax, unsigned long ecx)
|
|
|
|
{
|
2016-07-19 02:41:10 +08:00
|
|
|
if (static_cpu_has_bug(X86_BUG_MONITOR) || !current_set_polling_and_test()) {
|
2014-06-18 06:06:23 +08:00
|
|
|
if (static_cpu_has_bug(X86_BUG_CLFLUSH_MONITOR)) {
|
2013-12-20 03:58:16 +08:00
|
|
|
mb();
|
2013-12-12 22:08:36 +08:00
|
|
|
clflush((void *)¤t_thread_info()->flags);
|
2013-12-20 03:58:16 +08:00
|
|
|
mb();
|
|
|
|
}
|
2013-12-12 22:08:36 +08:00
|
|
|
|
|
|
|
__monitor((void *)¤t_thread_info()->flags, 0, 0);
|
|
|
|
if (!need_resched())
|
|
|
|
__mwait(eax, ecx);
|
|
|
|
}
|
2013-11-20 19:22:37 +08:00
|
|
|
current_clr_polling();
|
2013-12-12 22:08:36 +08:00
|
|
|
}
|
|
|
|
|
2010-09-18 06:36:40 +08:00
|
|
|
#endif /* _ASM_X86_MWAIT_H */
|