Commit 64f8e73d authored by Linus Torvalds's avatar Linus Torvalds

Merge tag 'x86-splitlock-2021-04-26' of git://git.kernel.org/pub/scm/linux/kernel/git/tip/tip

Pull x86 bus lock detection updates from Thomas Gleixner:
 "Support for enhanced split lock detection:

  Newer CPUs provide a second mechanism to detect operations with lock
  prefix which go accross a cache line boundary. Such operations have to
  take bus lock which causes a system wide performance degradation when
  these operations happen frequently.

  The new mechanism is not using the #AC exception. It triggers #DB and
  is restricted to operations in user space. Kernel side split lock
  access can only be detected by the #AC based variant.

  Contrary to the #AC based mechanism the #DB based variant triggers
  _after_ the instruction was executed. The mechanism is CPUID
  enumerated and contrary to the #AC version which is based on the magic
  TEST_CTRL_MSR and model/family based enumeration on the way to become
  architectural"

* tag 'x86-splitlock-2021-04-26' of git://git.kernel.org/pub/scm/linux/kernel/git/tip/tip:
  Documentation/admin-guide: Change doc for split_lock_detect parameter
  x86/traps: Handle #DB for bus lock
  x86/cpufeatures: Enumerate #DB for bus lock detection
parents eea2647e ebca1770
...@@ -5111,27 +5111,37 @@ ...@@ -5111,27 +5111,37 @@
spia_peddr= spia_peddr=
split_lock_detect= split_lock_detect=
[X86] Enable split lock detection [X86] Enable split lock detection or bus lock detection
When enabled (and if hardware support is present), atomic When enabled (and if hardware support is present), atomic
instructions that access data across cache line instructions that access data across cache line
boundaries will result in an alignment check exception. boundaries will result in an alignment check exception
for split lock detection or a debug exception for
bus lock detection.
off - not enabled off - not enabled
warn - the kernel will emit rate limited warnings warn - the kernel will emit rate-limited warnings
about applications triggering the #AC about applications triggering the #AC
exception. This mode is the default on CPUs exception or the #DB exception. This mode is
that supports split lock detection. the default on CPUs that support split lock
detection or bus lock detection. Default
behavior is by #AC if both features are
enabled in hardware.
fatal - the kernel will send SIGBUS to applications fatal - the kernel will send SIGBUS to applications
that trigger the #AC exception. that trigger the #AC exception or the #DB
exception. Default behavior is by #AC if
both features are enabled in hardware.
If an #AC exception is hit in the kernel or in If an #AC exception is hit in the kernel or in
firmware (i.e. not while executing in user mode) firmware (i.e. not while executing in user mode)
the kernel will oops in either "warn" or "fatal" the kernel will oops in either "warn" or "fatal"
mode. mode.
#DB exception for bus lock is triggered only when
CPL > 0.
srbds= [X86,INTEL] srbds= [X86,INTEL]
Control the Special Register Buffer Data Sampling Control the Special Register Buffer Data Sampling
(SRBDS) mitigation. (SRBDS) mitigation.
......
...@@ -41,12 +41,13 @@ unsigned int x86_family(unsigned int sig); ...@@ -41,12 +41,13 @@ unsigned int x86_family(unsigned int sig);
unsigned int x86_model(unsigned int sig); unsigned int x86_model(unsigned int sig);
unsigned int x86_stepping(unsigned int sig); unsigned int x86_stepping(unsigned int sig);
#ifdef CONFIG_CPU_SUP_INTEL #ifdef CONFIG_CPU_SUP_INTEL
extern void __init cpu_set_core_cap_bits(struct cpuinfo_x86 *c); extern void __init sld_setup(struct cpuinfo_x86 *c);
extern void switch_to_sld(unsigned long tifn); extern void switch_to_sld(unsigned long tifn);
extern bool handle_user_split_lock(struct pt_regs *regs, long error_code); extern bool handle_user_split_lock(struct pt_regs *regs, long error_code);
extern bool handle_guest_split_lock(unsigned long ip); extern bool handle_guest_split_lock(unsigned long ip);
extern void handle_bus_lock(struct pt_regs *regs);
#else #else
static inline void __init cpu_set_core_cap_bits(struct cpuinfo_x86 *c) {} static inline void __init sld_setup(struct cpuinfo_x86 *c) {}
static inline void switch_to_sld(unsigned long tifn) {} static inline void switch_to_sld(unsigned long tifn) {}
static inline bool handle_user_split_lock(struct pt_regs *regs, long error_code) static inline bool handle_user_split_lock(struct pt_regs *regs, long error_code)
{ {
...@@ -57,6 +58,8 @@ static inline bool handle_guest_split_lock(unsigned long ip) ...@@ -57,6 +58,8 @@ static inline bool handle_guest_split_lock(unsigned long ip)
{ {
return false; return false;
} }
static inline void handle_bus_lock(struct pt_regs *regs) {}
#endif #endif
#ifdef CONFIG_IA32_FEAT_CTL #ifdef CONFIG_IA32_FEAT_CTL
void init_ia32_feat_ctl(struct cpuinfo_x86 *c); void init_ia32_feat_ctl(struct cpuinfo_x86 *c);
......
...@@ -358,6 +358,7 @@ ...@@ -358,6 +358,7 @@
#define X86_FEATURE_AVX512_VPOPCNTDQ (16*32+14) /* POPCNT for vectors of DW/QW */ #define X86_FEATURE_AVX512_VPOPCNTDQ (16*32+14) /* POPCNT for vectors of DW/QW */
#define X86_FEATURE_LA57 (16*32+16) /* 5-level page tables */ #define X86_FEATURE_LA57 (16*32+16) /* 5-level page tables */
#define X86_FEATURE_RDPID (16*32+22) /* RDPID instruction */ #define X86_FEATURE_RDPID (16*32+22) /* RDPID instruction */
#define X86_FEATURE_BUS_LOCK_DETECT (16*32+24) /* Bus Lock detect */
#define X86_FEATURE_CLDEMOTE (16*32+25) /* CLDEMOTE instruction */ #define X86_FEATURE_CLDEMOTE (16*32+25) /* CLDEMOTE instruction */
#define X86_FEATURE_MOVDIRI (16*32+27) /* MOVDIRI instruction */ #define X86_FEATURE_MOVDIRI (16*32+27) /* MOVDIRI instruction */
#define X86_FEATURE_MOVDIR64B (16*32+28) /* MOVDIR64B instruction */ #define X86_FEATURE_MOVDIR64B (16*32+28) /* MOVDIR64B instruction */
......
...@@ -265,6 +265,7 @@ ...@@ -265,6 +265,7 @@
#define DEBUGCTLMSR_LBR (1UL << 0) /* last branch recording */ #define DEBUGCTLMSR_LBR (1UL << 0) /* last branch recording */
#define DEBUGCTLMSR_BTF_SHIFT 1 #define DEBUGCTLMSR_BTF_SHIFT 1
#define DEBUGCTLMSR_BTF (1UL << 1) /* single-step on branches */ #define DEBUGCTLMSR_BTF (1UL << 1) /* single-step on branches */
#define DEBUGCTLMSR_BUS_LOCK_DETECT (1UL << 2)
#define DEBUGCTLMSR_TR (1UL << 6) #define DEBUGCTLMSR_TR (1UL << 6)
#define DEBUGCTLMSR_BTS (1UL << 7) #define DEBUGCTLMSR_BTS (1UL << 7)
#define DEBUGCTLMSR_BTINT (1UL << 8) #define DEBUGCTLMSR_BTINT (1UL << 8)
......
...@@ -24,6 +24,7 @@ ...@@ -24,6 +24,7 @@
#define DR_TRAP3 (0x8) /* db3 */ #define DR_TRAP3 (0x8) /* db3 */
#define DR_TRAP_BITS (DR_TRAP0|DR_TRAP1|DR_TRAP2|DR_TRAP3) #define DR_TRAP_BITS (DR_TRAP0|DR_TRAP1|DR_TRAP2|DR_TRAP3)
#define DR_BUS_LOCK (0x800) /* bus_lock */
#define DR_STEP (0x4000) /* single-step */ #define DR_STEP (0x4000) /* single-step */
#define DR_SWITCH (0x8000) /* task switch */ #define DR_SWITCH (0x8000) /* task switch */
......
...@@ -1330,7 +1330,7 @@ static void __init early_identify_cpu(struct cpuinfo_x86 *c) ...@@ -1330,7 +1330,7 @@ static void __init early_identify_cpu(struct cpuinfo_x86 *c)
cpu_set_bug_bits(c); cpu_set_bug_bits(c);
cpu_set_core_cap_bits(c); sld_setup(c);
fpu__init_system(c); fpu__init_system(c);
......
...@@ -44,9 +44,9 @@ enum split_lock_detect_state { ...@@ -44,9 +44,9 @@ enum split_lock_detect_state {
}; };
/* /*
* Default to sld_off because most systems do not support split lock detection * Default to sld_off because most systems do not support split lock detection.
* split_lock_setup() will switch this to sld_warn on systems that support * sld_state_setup() will switch this to sld_warn on systems that support
* split lock detect, unless there is a command line override. * split lock/bus lock detect, unless there is a command line override.
*/ */
static enum split_lock_detect_state sld_state __ro_after_init = sld_off; static enum split_lock_detect_state sld_state __ro_after_init = sld_off;
static u64 msr_test_ctrl_cache __ro_after_init; static u64 msr_test_ctrl_cache __ro_after_init;
...@@ -603,6 +603,7 @@ static void init_intel_misc_features(struct cpuinfo_x86 *c) ...@@ -603,6 +603,7 @@ static void init_intel_misc_features(struct cpuinfo_x86 *c)
} }
static void split_lock_init(void); static void split_lock_init(void);
static void bus_lock_init(void);
static void init_intel(struct cpuinfo_x86 *c) static void init_intel(struct cpuinfo_x86 *c)
{ {
...@@ -720,6 +721,7 @@ static void init_intel(struct cpuinfo_x86 *c) ...@@ -720,6 +721,7 @@ static void init_intel(struct cpuinfo_x86 *c)
tsx_disable(); tsx_disable();
split_lock_init(); split_lock_init();
bus_lock_init();
intel_init_thermal(c); intel_init_thermal(c);
} }
...@@ -1020,16 +1022,15 @@ static bool split_lock_verify_msr(bool on) ...@@ -1020,16 +1022,15 @@ static bool split_lock_verify_msr(bool on)
return ctrl == tmp; return ctrl == tmp;
} }
static void __init split_lock_setup(void) static void __init sld_state_setup(void)
{ {
enum split_lock_detect_state state = sld_warn; enum split_lock_detect_state state = sld_warn;
char arg[20]; char arg[20];
int i, ret; int i, ret;
if (!split_lock_verify_msr(false)) { if (!boot_cpu_has(X86_FEATURE_SPLIT_LOCK_DETECT) &&
pr_info("MSR access failed: Disabled\n"); !boot_cpu_has(X86_FEATURE_BUS_LOCK_DETECT))
return; return;
}
ret = cmdline_find_option(boot_command_line, "split_lock_detect", ret = cmdline_find_option(boot_command_line, "split_lock_detect",
arg, sizeof(arg)); arg, sizeof(arg));
...@@ -1041,17 +1042,14 @@ static void __init split_lock_setup(void) ...@@ -1041,17 +1042,14 @@ static void __init split_lock_setup(void)
} }
} }
} }
sld_state = state;
}
switch (state) { static void __init __split_lock_setup(void)
case sld_off: {
pr_info("disabled\n"); if (!split_lock_verify_msr(false)) {
pr_info("MSR access failed: Disabled\n");
return; return;
case sld_warn:
pr_info("warning about user-space split_locks\n");
break;
case sld_fatal:
pr_info("sending SIGBUS on user-space split_locks\n");
break;
} }
rdmsrl(MSR_TEST_CTRL, msr_test_ctrl_cache); rdmsrl(MSR_TEST_CTRL, msr_test_ctrl_cache);
...@@ -1061,7 +1059,9 @@ static void __init split_lock_setup(void) ...@@ -1061,7 +1059,9 @@ static void __init split_lock_setup(void)
return; return;
} }
sld_state = state; /* Restore the MSR to its cached value. */
wrmsrl(MSR_TEST_CTRL, msr_test_ctrl_cache);
setup_force_cpu_cap(X86_FEATURE_SPLIT_LOCK_DETECT); setup_force_cpu_cap(X86_FEATURE_SPLIT_LOCK_DETECT);
} }
...@@ -1118,6 +1118,29 @@ bool handle_guest_split_lock(unsigned long ip) ...@@ -1118,6 +1118,29 @@ bool handle_guest_split_lock(unsigned long ip)
} }
EXPORT_SYMBOL_GPL(handle_guest_split_lock); EXPORT_SYMBOL_GPL(handle_guest_split_lock);
static void bus_lock_init(void)
{
u64 val;
/*
* Warn and fatal are handled by #AC for split lock if #AC for
* split lock is supported.
*/
if (!boot_cpu_has(X86_FEATURE_BUS_LOCK_DETECT) ||
(boot_cpu_has(X86_FEATURE_SPLIT_LOCK_DETECT) &&
(sld_state == sld_warn || sld_state == sld_fatal)) ||
sld_state == sld_off)
return;
/*
* Enable #DB for bus lock. All bus locks are handled in #DB except
* split locks are handled in #AC in the fatal case.
*/
rdmsrl(MSR_IA32_DEBUGCTLMSR, val);
val |= DEBUGCTLMSR_BUS_LOCK_DETECT;
wrmsrl(MSR_IA32_DEBUGCTLMSR, val);
}
bool handle_user_split_lock(struct pt_regs *regs, long error_code) bool handle_user_split_lock(struct pt_regs *regs, long error_code)
{ {
if ((regs->flags & X86_EFLAGS_AC) || sld_state == sld_fatal) if ((regs->flags & X86_EFLAGS_AC) || sld_state == sld_fatal)
...@@ -1126,6 +1149,21 @@ bool handle_user_split_lock(struct pt_regs *regs, long error_code) ...@@ -1126,6 +1149,21 @@ bool handle_user_split_lock(struct pt_regs *regs, long error_code)
return true; return true;
} }
void handle_bus_lock(struct pt_regs *regs)
{
switch (sld_state) {
case sld_off:
break;
case sld_warn:
pr_warn_ratelimited("#DB: %s/%d took a bus_lock trap at address: 0x%lx\n",
current->comm, current->pid, regs->ip);
break;
case sld_fatal:
force_sig_fault(SIGBUS, BUS_ADRALN, NULL);
break;
}
}
/* /*
* This function is called only when switching between tasks with * This function is called only when switching between tasks with
* different split-lock detection modes. It sets the MSR for the * different split-lock detection modes. It sets the MSR for the
...@@ -1166,7 +1204,7 @@ static const struct x86_cpu_id split_lock_cpu_ids[] __initconst = { ...@@ -1166,7 +1204,7 @@ static const struct x86_cpu_id split_lock_cpu_ids[] __initconst = {
{} {}
}; };
void __init cpu_set_core_cap_bits(struct cpuinfo_x86 *c) static void __init split_lock_setup(struct cpuinfo_x86 *c)
{ {
const struct x86_cpu_id *m; const struct x86_cpu_id *m;
u64 ia32_core_caps; u64 ia32_core_caps;
...@@ -1193,5 +1231,40 @@ void __init cpu_set_core_cap_bits(struct cpuinfo_x86 *c) ...@@ -1193,5 +1231,40 @@ void __init cpu_set_core_cap_bits(struct cpuinfo_x86 *c)
} }
cpu_model_supports_sld = true; cpu_model_supports_sld = true;
split_lock_setup(); __split_lock_setup();
}
static void sld_state_show(void)
{
if (!boot_cpu_has(X86_FEATURE_BUS_LOCK_DETECT) &&
!boot_cpu_has(X86_FEATURE_SPLIT_LOCK_DETECT))
return;
switch (sld_state) {
case sld_off:
pr_info("disabled\n");
break;
case sld_warn:
if (boot_cpu_has(X86_FEATURE_SPLIT_LOCK_DETECT))
pr_info("#AC: crashing the kernel on kernel split_locks and warning on user-space split_locks\n");
else if (boot_cpu_has(X86_FEATURE_BUS_LOCK_DETECT))
pr_info("#DB: warning on user-space bus_locks\n");
break;
case sld_fatal:
if (boot_cpu_has(X86_FEATURE_SPLIT_LOCK_DETECT)) {
pr_info("#AC: crashing the kernel on kernel split_locks and sending SIGBUS on user-space split_locks\n");
} else if (boot_cpu_has(X86_FEATURE_BUS_LOCK_DETECT)) {
pr_info("#DB: sending SIGBUS on user-space bus_locks%s\n",
boot_cpu_has(X86_FEATURE_SPLIT_LOCK_DETECT) ?
" from non-WB" : "");
}
break;
}
}
void __init sld_setup(struct cpuinfo_x86 *c)
{
split_lock_setup(c);
sld_state_setup();
sld_state_show();
} }
...@@ -978,6 +978,10 @@ static __always_inline void exc_debug_user(struct pt_regs *regs, ...@@ -978,6 +978,10 @@ static __always_inline void exc_debug_user(struct pt_regs *regs,
goto out_irq; goto out_irq;
} }
/* #DB for bus lock can only be triggered from userspace. */
if (dr6 & DR_BUS_LOCK)
handle_bus_lock(regs);
/* Add the virtual_dr6 bits for signals. */ /* Add the virtual_dr6 bits for signals. */
dr6 |= current->thread.virtual_dr6; dr6 |= current->thread.virtual_dr6;
if (dr6 & (DR_STEP | DR_TRAP_BITS) || icebp) if (dr6 & (DR_STEP | DR_TRAP_BITS) || icebp)
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment