Commit 37b6cb47 authored by Ingo Molnar

Merge branch 'uprobes/core' of git://git.kernel.org/pub/scm/linux/kernel/git/oleg/misc into perf/core

Pull uprobes fixes and cleanups from Oleg Nesterov:

  "Any probed jmp/call can kill the application, see the changelog in 11/15."
Signed-off-by: Ingo Molnar <mingo@kernel.org>
parents b3d5fc3c 6cc5e7ff
arch/x86/include/asm/uprobes.h
@@ -33,15 +33,27 @@ typedef u8 uprobe_opcode_t;
 #define UPROBE_SWBP_INSN		0xcc
 #define UPROBE_SWBP_INSN_SIZE		1

+struct uprobe_xol_ops;
+
 struct arch_uprobe {
-	u16				fixups;
 	union {
 		u8			insn[MAX_UINSN_BYTES];
 		u8			ixol[MAX_UINSN_BYTES];
 	};
+
+	u16				fixups;
+	const struct uprobe_xol_ops	*ops;
+
+	union {
 #ifdef CONFIG_X86_64
-	unsigned long			rip_rela_target_address;
+		unsigned long		rip_rela_target_address;
 #endif
+		struct {
+			s32	offs;
+			u8	ilen;
+			u8	opc1;
+		}			branch;
+	};
 };

 struct arch_uprobe_task {
...
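As a reading aid (a sketch, not part of the diff): for a probed two-byte conditional jump, branch_setup_xol_ops() in the arch/x86/kernel/uprobes.c hunks below fills the new branch member like this:

	/* Illustration only: probing "je .+0x10" (bytes 74 0e). */
	auprobe->branch.opc1 = 0x74;	/* OPCODE1(insn): short jz/je */
	auprobe->branch.ilen = 2;	/* insn->length */
	auprobe->branch.offs = 0x0e;	/* insn->immediate.value */
	/* branch_emulate_op(): regs->ip += ilen, then += offs iff ZF is set */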
arch/x86/kernel/uprobes.c
@@ -53,7 +53,7 @@
 #define OPCODE1(insn)		 ((insn)->opcode.bytes[0])
 #define OPCODE2(insn)		 ((insn)->opcode.bytes[1])
 #define OPCODE3(insn)		 ((insn)->opcode.bytes[2])
-#define MODRM_REG(insn)		 X86_MODRM_REG(insn->modrm.value)
+#define MODRM_REG(insn)		 X86_MODRM_REG((insn)->modrm.value)

 #define W(row, b0, b1, b2, b3, b4, b5, b6, b7, b8, b9, ba, bb, bc, bd, be, bf)\
 	(((b0##UL << 0x0)|(b1##UL << 0x1)|(b2##UL << 0x2)|(b3##UL << 0x3) |   \
...
@@ -229,63 +229,6 @@ static int validate_insn_32bits(struct arch_uprobe *auprobe, struct insn *insn)
 	return -ENOTSUPP;
 }

-/*
- * Figure out which fixups arch_uprobe_post_xol() will need to perform, and
- * annotate arch_uprobe->fixups accordingly. To start with,
- * arch_uprobe->fixups is either zero or it reflects rip-related fixups.
- */
-static void prepare_fixups(struct arch_uprobe *auprobe, struct insn *insn)
-{
-	bool fix_ip = true, fix_call = false;	/* defaults */
-	int reg;
-
-	insn_get_opcode(insn);	/* should be a nop */
-
-	switch (OPCODE1(insn)) {
-	case 0x9d:
-		/* popf */
-		auprobe->fixups |= UPROBE_FIX_SETF;
-		break;
-	case 0xc3:		/* ret/lret */
-	case 0xcb:
-	case 0xc2:
-	case 0xca:
-		/* ip is correct */
-		fix_ip = false;
-		break;
-	case 0xe8:		/* call relative - Fix return addr */
-		fix_call = true;
-		break;
-	case 0x9a:		/* call absolute - Fix return addr, not ip */
-		fix_call = true;
-		fix_ip = false;
-		break;
-	case 0xff:
-		insn_get_modrm(insn);
-		reg = MODRM_REG(insn);
-		if (reg == 2 || reg == 3) {
-			/* call or lcall, indirect */
-			/* Fix return addr; ip is correct. */
-			fix_call = true;
-			fix_ip = false;
-		} else if (reg == 4 || reg == 5) {
-			/* jmp or ljmp, indirect */
-			/* ip is correct. */
-			fix_ip = false;
-		}
-		break;
-	case 0xea:		/* jmp absolute -- ip is correct */
-		fix_ip = false;
-		break;
-	default:
-		break;
-	}
-	if (fix_ip)
-		auprobe->fixups |= UPROBE_FIX_IP;
-	if (fix_call)
-		auprobe->fixups |= UPROBE_FIX_CALL;
-}
-
 #ifdef CONFIG_X86_64
 /*
  * If arch_uprobe->insn doesn't use rip-relative addressing, return
...
@@ -310,15 +253,11 @@ static void prepare_fixups(struct arch_uprobe *auprobe, struct insn *insn)
  * - The displacement is always 4 bytes.
  */
 static void
-handle_riprel_insn(struct arch_uprobe *auprobe, struct mm_struct *mm, struct insn *insn)
+handle_riprel_insn(struct arch_uprobe *auprobe, struct insn *insn)
 {
 	u8 *cursor;
 	u8 reg;

-	if (mm->context.ia32_compat)
-		return;
-
-	auprobe->rip_rela_target_address = 0x0;
 	if (!insn_rip_relative(insn))
 		return;
...
@@ -372,7 +311,48 @@ handle_riprel_insn(struct arch_uprobe *auprobe, struct insn *insn)
 		cursor++;
 		memmove(cursor, cursor + insn->displacement.nbytes, insn->immediate.nbytes);
 	}
-	return;
+}
+
+/*
+ * If we're emulating a rip-relative instruction, save the contents
+ * of the scratch register and store the target address in that register.
+ */
+static void
+pre_xol_rip_insn(struct arch_uprobe *auprobe, struct pt_regs *regs,
+				struct arch_uprobe_task *autask)
+{
+	if (auprobe->fixups & UPROBE_FIX_RIP_AX) {
+		autask->saved_scratch_register = regs->ax;
+		regs->ax = current->utask->vaddr;
+		regs->ax += auprobe->rip_rela_target_address;
+	} else if (auprobe->fixups & UPROBE_FIX_RIP_CX) {
+		autask->saved_scratch_register = regs->cx;
+		regs->cx = current->utask->vaddr;
+		regs->cx += auprobe->rip_rela_target_address;
+	}
+}
+
+static void
+handle_riprel_post_xol(struct arch_uprobe *auprobe, struct pt_regs *regs, long *correction)
+{
+	if (auprobe->fixups & (UPROBE_FIX_RIP_AX | UPROBE_FIX_RIP_CX)) {
+		struct arch_uprobe_task *autask;
+
+		autask = &current->utask->autask;
+		if (auprobe->fixups & UPROBE_FIX_RIP_AX)
+			regs->ax = autask->saved_scratch_register;
+		else
+			regs->cx = autask->saved_scratch_register;
+
+		/*
+		 * The original instruction includes a displacement, and so
+		 * is 4 bytes longer than what we've just single-stepped.
+		 * Caller may need to apply other fixups to handle stuff
+		 * like "jmpq *...(%rip)" and "callq *...(%rip)".
+		 */
+		if (correction)
+			*correction += 4;
+	}
 }

 static int validate_insn_64bits(struct arch_uprobe *auprobe, struct insn *insn)
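The two helpers above implement a save/replace/restore protocol for the scratch register that the rewritten RIP-relative copy addresses through. A minimal sketch of the pre-XOL half, with stand-in names for the kernel structures (illustration only, not part of the diff):

	static unsigned long demo_riprel_pre_xol(
		unsigned long vaddr,		/* address of the probed insn */
		unsigned long rela_target,	/* auprobe->rip_rela_target_address:
						 * insn length + signed displacement */
		unsigned long *scratch,		/* regs->ax or regs->cx */
		unsigned long *saved)		/* autask->saved_scratch_register */
	{
		*saved = *scratch;		/* preserve the task's register value */
		*scratch = vaddr + rela_target;	/* absolute target of the %rip form */
		return *scratch;		/* the XOL copy addresses via this reg */
	}

After the single-step, handle_riprel_post_xol() restores the register and widens the ip correction by the 4 displacement bytes the rewritten copy dropped.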
...
@@ -401,9 +381,19 @@ static int validate_insn_bits(struct arch_uprobe *auprobe, struct mm_struct *mm, struct insn *insn)
 	return validate_insn_64bits(auprobe, insn);
 }
 #else /* 32-bit: */
-static void handle_riprel_insn(struct arch_uprobe *auprobe, struct mm_struct *mm, struct insn *insn)
+/*
+ * No RIP-relative addressing on 32-bit
+ */
+static void handle_riprel_insn(struct arch_uprobe *auprobe, struct insn *insn)
+{
+}
+static void pre_xol_rip_insn(struct arch_uprobe *auprobe, struct pt_regs *regs,
+				struct arch_uprobe_task *autask)
+{
+}
+static void handle_riprel_post_xol(struct arch_uprobe *auprobe, struct pt_regs *regs,
+					long *correction)
 {
-	/* No RIP-relative addressing on 32-bit */
 }
 static int validate_insn_bits(struct arch_uprobe *auprobe, struct mm_struct *mm, struct insn *insn)
...
@@ -412,141 +402,311 @@ static int validate_insn_bits(struct arch_uprobe *auprobe, struct mm_struct *mm, struct insn *insn)
 }
 #endif /* CONFIG_X86_64 */

+struct uprobe_xol_ops {
+	bool	(*emulate)(struct arch_uprobe *, struct pt_regs *);
+	int	(*pre_xol)(struct arch_uprobe *, struct pt_regs *);
+	int	(*post_xol)(struct arch_uprobe *, struct pt_regs *);
+};
+
+static inline int sizeof_long(void)
+{
+	return is_ia32_task() ? 4 : 8;
+}
+
+static int default_pre_xol_op(struct arch_uprobe *auprobe, struct pt_regs *regs)
+{
+	pre_xol_rip_insn(auprobe, regs, &current->utask->autask);
+	return 0;
+}
+
+/*
+ * Adjust the return address pushed by a call insn executed out of line.
+ */
+static int adjust_ret_addr(unsigned long sp, long correction)
+{
+	int rasize = sizeof_long();
+	long ra;
+
+	if (copy_from_user(&ra, (void __user *)sp, rasize))
+		return -EFAULT;
+
+	ra += correction;
+	if (copy_to_user((void __user *)sp, &ra, rasize))
+		return -EFAULT;
+
+	return 0;
+}
+
+static int default_post_xol_op(struct arch_uprobe *auprobe, struct pt_regs *regs)
+{
+	struct uprobe_task *utask = current->utask;
+	long correction = (long)(utask->vaddr - utask->xol_vaddr);
+
+	handle_riprel_post_xol(auprobe, regs, &correction);
+	if (auprobe->fixups & UPROBE_FIX_IP)
+		regs->ip += correction;
+
+	if (auprobe->fixups & UPROBE_FIX_CALL) {
+		if (adjust_ret_addr(regs->sp, correction)) {
+			regs->sp += sizeof_long();
+			return -ERESTART;
+		}
+	}
+
+	return 0;
+}
+
+static struct uprobe_xol_ops default_xol_ops = {
+	.pre_xol  = default_pre_xol_op,
+	.post_xol = default_post_xol_op,
+};
+
+static bool branch_is_call(struct arch_uprobe *auprobe)
+{
+	return auprobe->branch.opc1 == 0xe8;
+}
+
+#define CASE_COND					\
+	COND(70, 71, XF(OF))				\
+	COND(72, 73, XF(CF))				\
+	COND(74, 75, XF(ZF))				\
+	COND(78, 79, XF(SF))				\
+	COND(7a, 7b, XF(PF))				\
+	COND(76, 77, XF(CF) || XF(ZF))			\
+	COND(7c, 7d, XF(SF) != XF(OF))			\
+	COND(7e, 7f, XF(ZF) || XF(SF) != XF(OF))
+
+#define COND(op_y, op_n, expr)				\
+	case 0x ## op_y: DO((expr) != 0)		\
+	case 0x ## op_n: DO((expr) == 0)
+
+#define XF(xf)	(!!(flags & X86_EFLAGS_ ## xf))
+
+static bool is_cond_jmp_opcode(u8 opcode)
+{
+	switch (opcode) {
+	#define DO(expr)	\
+		return true;
+	CASE_COND
+	#undef	DO
+
+	default:
+		return false;
+	}
+}
+
+static bool check_jmp_cond(struct arch_uprobe *auprobe, struct pt_regs *regs)
+{
+	unsigned long flags = regs->flags;
+
+	switch (auprobe->branch.opc1) {
+	#define DO(expr)	\
+		return expr;
+	CASE_COND
+	#undef	DO
+
+	default:	/* not a conditional jmp */
+		return true;
+	}
+}
+
+#undef	XF
+#undef	COND
+#undef	CASE_COND
+
+static bool branch_emulate_op(struct arch_uprobe *auprobe, struct pt_regs *regs)
+{
+	unsigned long new_ip = regs->ip += auprobe->branch.ilen;
+	unsigned long offs = (long)auprobe->branch.offs;
+
+	if (branch_is_call(auprobe)) {
+		unsigned long new_sp = regs->sp - sizeof_long();
+		/*
+		 * If it fails we execute this (mangled, see the comment in
+		 * branch_clear_offset) insn out-of-line. In the likely case
+		 * this should trigger the trap, and the probed application
+		 * should die or restart the same insn after it handles the
+		 * signal, arch_uprobe_post_xol() won't be even called.
+		 *
+		 * But there is corner case, see the comment in ->post_xol().
+		 */
+		if (copy_to_user((void __user *)new_sp, &new_ip, sizeof_long()))
+			return false;
+		regs->sp = new_sp;
+	} else if (!check_jmp_cond(auprobe, regs)) {
+		offs = 0;
+	}
+
+	regs->ip = new_ip + offs;
+	return true;
+}
+
+static int branch_post_xol_op(struct arch_uprobe *auprobe, struct pt_regs *regs)
+{
+	BUG_ON(!branch_is_call(auprobe));
+	/*
+	 * We can only get here if branch_emulate_op() failed to push the ret
+	 * address _and_ another thread expanded our stack before the (mangled)
+	 * "call" insn was executed out-of-line. Just restore ->sp and restart.
+	 * We could also restore ->ip and try to call branch_emulate_op() again.
+	 */
+	regs->sp += sizeof_long();
+	return -ERESTART;
+}
+
+static void branch_clear_offset(struct arch_uprobe *auprobe, struct insn *insn)
+{
+	/*
+	 * Turn this insn into "call 1f; 1:", this is what we will execute
+	 * out-of-line if ->emulate() fails. We only need this to generate
+	 * a trap, so that the probed task receives the correct signal with
+	 * the properly filled siginfo.
+	 *
+	 * But see the comment in ->post_xol(), in the unlikely case it can
+	 * succeed. So we need to ensure that the new ->ip can not fall into
+	 * the non-canonical area and trigger #GP.
+	 *
+	 * We could turn it into (say) "pushf", but then we would need to
+	 * divorce ->insn[] and ->ixol[]. We need to preserve the 1st byte
+	 * of ->insn[] for set_orig_insn().
+	 */
+	memset(auprobe->insn + insn_offset_immediate(insn),
+		0, insn->immediate.nbytes);
+}
+
+static struct uprobe_xol_ops branch_xol_ops = {
+	.emulate  = branch_emulate_op,
+	.post_xol = branch_post_xol_op,
+};
+
+/* Returns -ENOSYS if branch_xol_ops doesn't handle this insn */
+static int branch_setup_xol_ops(struct arch_uprobe *auprobe, struct insn *insn)
+{
+	u8 opc1 = OPCODE1(insn);
+
+	/* has the side-effect of processing the entire instruction */
+	insn_get_length(insn);
+	if (WARN_ON_ONCE(!insn_complete(insn)))
+		return -ENOEXEC;
+
+	switch (opc1) {
+	case 0xeb:	/* jmp 8 */
+	case 0xe9:	/* jmp 32 */
+	case 0x90:	/* prefix* + nop; same as jmp with .offs = 0 */
+		break;
+
+	case 0xe8:	/* call relative */
+		branch_clear_offset(auprobe, insn);
+		break;
+
+	case 0x0f:
+		if (insn->opcode.nbytes != 2)
+			return -ENOSYS;
+		/*
+		 * If it is a "near" conditional jmp, OPCODE2() - 0x10 matches
+		 * OPCODE1() of the "short" jmp which checks the same condition.
+		 */
+		opc1 = OPCODE2(insn) - 0x10;
+	default:
+		if (!is_cond_jmp_opcode(opc1))
+			return -ENOSYS;
+	}
+
+	auprobe->branch.opc1 = opc1;
+	auprobe->branch.ilen = insn->length;
+	auprobe->branch.offs = insn->immediate.value;
+
+	auprobe->ops = &branch_xol_ops;
+	return 0;
+}
+
 /**
  * arch_uprobe_analyze_insn - instruction analysis including validity and fixups.
  * @mm: the probed address space.
  * @arch_uprobe: the probepoint information.
  * @addr: virtual address at which to install the probepoint
  * Return 0 on success or a -ve number on error.
  */
 int arch_uprobe_analyze_insn(struct arch_uprobe *auprobe, struct mm_struct *mm, unsigned long addr)
 {
-	int ret;
 	struct insn insn;
+	bool fix_ip = true, fix_call = false;
+	int ret;

-	auprobe->fixups = 0;
 	ret = validate_insn_bits(auprobe, mm, &insn);
-	if (ret != 0)
+	if (ret)
 		return ret;

-	handle_riprel_insn(auprobe, mm, &insn);
-	prepare_fixups(auprobe, &insn);
+	ret = branch_setup_xol_ops(auprobe, &insn);
+	if (ret != -ENOSYS)
+		return ret;
+
+	/*
+	 * Figure out which fixups arch_uprobe_post_xol() will need to perform,
+	 * and annotate arch_uprobe->fixups accordingly. To start with, ->fixups
+	 * is either zero or it reflects rip-related fixups.
+	 */
+	switch (OPCODE1(&insn)) {
+	case 0x9d:		/* popf */
+		auprobe->fixups |= UPROBE_FIX_SETF;
+		break;
+	case 0xc3:		/* ret or lret -- ip is correct */
+	case 0xcb:
+	case 0xc2:
+	case 0xca:
+		fix_ip = false;
+		break;
+	case 0x9a:		/* call absolute - Fix return addr, not ip */
+		fix_call = true;
+		fix_ip = false;
+		break;
+	case 0xea:		/* jmp absolute -- ip is correct */
+		fix_ip = false;
+		break;
+	case 0xff:
+		insn_get_modrm(&insn);
+		switch (MODRM_REG(&insn)) {
+		case 2: case 3:			/* call or lcall, indirect */
+			fix_call = true;
+		case 4: case 5:			/* jmp or ljmp, indirect */
+			fix_ip = false;
+		}
+		/* fall through */
+	default:
+		handle_riprel_insn(auprobe, &insn);
+	}
+
+	if (fix_ip)
+		auprobe->fixups |= UPROBE_FIX_IP;
+	if (fix_call)
+		auprobe->fixups |= UPROBE_FIX_CALL;

+	auprobe->ops = &default_xol_ops;
 	return 0;
 }

-#ifdef CONFIG_X86_64
-/*
- * If we're emulating a rip-relative instruction, save the contents
- * of the scratch register and store the target address in that register.
- */
-static void
-pre_xol_rip_insn(struct arch_uprobe *auprobe, struct pt_regs *regs,
-				struct arch_uprobe_task *autask)
-{
-	if (auprobe->fixups & UPROBE_FIX_RIP_AX) {
-		autask->saved_scratch_register = regs->ax;
-		regs->ax = current->utask->vaddr;
-		regs->ax += auprobe->rip_rela_target_address;
-	} else if (auprobe->fixups & UPROBE_FIX_RIP_CX) {
-		autask->saved_scratch_register = regs->cx;
-		regs->cx = current->utask->vaddr;
-		regs->cx += auprobe->rip_rela_target_address;
-	}
-}
-#else
-static void
-pre_xol_rip_insn(struct arch_uprobe *auprobe, struct pt_regs *regs,
-				struct arch_uprobe_task *autask)
-{
-	/* No RIP-relative addressing on 32-bit */
-}
-#endif
-
 /*
  * arch_uprobe_pre_xol - prepare to execute out of line.
  * @auprobe: the probepoint information.
  * @regs: reflects the saved user state of current task.
  */
 int arch_uprobe_pre_xol(struct arch_uprobe *auprobe, struct pt_regs *regs)
 {
-	struct arch_uprobe_task *autask;
+	struct uprobe_task *utask = current->utask;

-	autask = &current->utask->autask;
-	autask->saved_trap_nr = current->thread.trap_nr;
+	regs->ip = utask->xol_vaddr;
+	utask->autask.saved_trap_nr = current->thread.trap_nr;
 	current->thread.trap_nr = UPROBE_TRAP_NR;
-	regs->ip = current->utask->xol_vaddr;
-	pre_xol_rip_insn(auprobe, regs, autask);

-	autask->saved_tf = !!(regs->flags & X86_EFLAGS_TF);
+	utask->autask.saved_tf = !!(regs->flags & X86_EFLAGS_TF);
 	regs->flags |= X86_EFLAGS_TF;
 	if (test_tsk_thread_flag(current, TIF_BLOCKSTEP))
 		set_task_blockstep(current, false);

+	if (auprobe->ops->pre_xol)
+		return auprobe->ops->pre_xol(auprobe, regs);
 	return 0;
 }

-/*
- * This function is called by arch_uprobe_post_xol() to adjust the return
- * address pushed by a call instruction executed out of line.
- */
-static int adjust_ret_addr(unsigned long sp, long correction)
-{
-	int rasize, ncopied;
-	long ra = 0;
-
-	if (is_ia32_task())
-		rasize = 4;
-	else
-		rasize = 8;
-
-	ncopied = copy_from_user(&ra, (void __user *)sp, rasize);
-	if (unlikely(ncopied))
-		return -EFAULT;
-
-	ra += correction;
-	ncopied = copy_to_user((void __user *)sp, &ra, rasize);
-	if (unlikely(ncopied))
-		return -EFAULT;
-
-	return 0;
-}
-
-#ifdef CONFIG_X86_64
-static bool is_riprel_insn(struct arch_uprobe *auprobe)
-{
-	return ((auprobe->fixups & (UPROBE_FIX_RIP_AX | UPROBE_FIX_RIP_CX)) != 0);
-}
-
-static void
-handle_riprel_post_xol(struct arch_uprobe *auprobe, struct pt_regs *regs, long *correction)
-{
-	if (is_riprel_insn(auprobe)) {
-		struct arch_uprobe_task *autask;
-
-		autask = &current->utask->autask;
-		if (auprobe->fixups & UPROBE_FIX_RIP_AX)
-			regs->ax = autask->saved_scratch_register;
-		else
-			regs->cx = autask->saved_scratch_register;
-
-		/*
-		 * The original instruction includes a displacement, and so
-		 * is 4 bytes longer than what we've just single-stepped.
-		 * Fall through to handle stuff like "jmpq *...(%rip)" and
-		 * "callq *...(%rip)".
-		 */
-		if (correction)
-			*correction += 4;
-	}
-}
-#else
-static void
-handle_riprel_post_xol(struct arch_uprobe *auprobe, struct pt_regs *regs, long *correction)
-{
-	/* No RIP-relative addressing on 32-bit */
-}
-#endif

 /*
  * If xol insn itself traps and generates a signal(Say,
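To audit the CASE_COND/COND/XF machinery above, it helps to expand one entry by hand. Inside check_jmp_cond(), COND(74, 75, XF(ZF)) with DO(expr) defined as "return expr;" becomes (a sketch, not part of the diff):

	case 0x74:	/* jz/je: taken when ZF is set */
		return ((!!(flags & X86_EFLAGS_ZF)) != 0);
	case 0x75:	/* jnz/jne: taken when ZF is clear */
		return ((!!(flags & X86_EFLAGS_ZF)) == 0);

In is_cond_jmp_opcode() the same cases expand with DO(expr) defined as "return true;", so every recognized conditional-jump opcode simply reports true.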
...
@@ -592,22 +752,25 @@ bool arch_uprobe_xol_was_trapped(struct task_struct *t)
  */
 int arch_uprobe_post_xol(struct arch_uprobe *auprobe, struct pt_regs *regs)
 {
-	struct uprobe_task *utask;
-	long correction;
-	int result = 0;
+	struct uprobe_task *utask = current->utask;

 	WARN_ON_ONCE(current->thread.trap_nr != UPROBE_TRAP_NR);

-	utask = current->utask;
-	current->thread.trap_nr = utask->autask.saved_trap_nr;
-	correction = (long)(utask->vaddr - utask->xol_vaddr);
-	handle_riprel_post_xol(auprobe, regs, &correction);
-	if (auprobe->fixups & UPROBE_FIX_IP)
-		regs->ip += correction;
-
-	if (auprobe->fixups & UPROBE_FIX_CALL)
-		result = adjust_ret_addr(regs->sp, correction);
+	if (auprobe->ops->post_xol) {
+		int err = auprobe->ops->post_xol(auprobe, regs);
+		if (err) {
+			arch_uprobe_abort_xol(auprobe, regs);
+			/*
+			 * Restart the probed insn. ->post_xol() must ensure
+			 * this is really possible if it returns -ERESTART.
+			 */
+			if (err == -ERESTART)
+				return 0;
+			return err;
+		}
+	}

+	current->thread.trap_nr = utask->autask.saved_trap_nr;
 	/*
 	 * arch_uprobe_pre_xol() doesn't save the state of TIF_BLOCKSTEP
 	 * so we can get an extra SIGTRAP if we do not clear TF. We need
...
@@ -618,7 +781,7 @@ int arch_uprobe_post_xol(struct arch_uprobe *auprobe, struct pt_regs *regs)
 	else if (!(auprobe->fixups & UPROBE_FIX_SETF))
 		regs->flags &= ~X86_EFLAGS_TF;

-	return result;
+	return 0;
 }
 /* callback routine for handling exceptions. */
...
@@ -652,8 +815,9 @@ int arch_uprobe_exception_notify(struct notifier_block *self, unsigned long val,
 /*
  * This function gets called when XOL instruction either gets trapped or
- * the thread has a fatal signal, so reset the instruction pointer to its
- * probed address.
+ * the thread has a fatal signal, or if arch_uprobe_post_xol() failed.
+ * Reset the instruction pointer to its probed address for the potential
+ * restart or for post mortem analysis.
  */
 void arch_uprobe_abort_xol(struct arch_uprobe *auprobe, struct pt_regs *regs)
 {
...
@@ -668,25 +832,10 @@ void arch_uprobe_abort_xol(struct arch_uprobe *auprobe, struct pt_regs *regs)
 	regs->flags &= ~X86_EFLAGS_TF;
 }

-/*
- * Skip these instructions as per the currently known x86 ISA.
- * rep=0x66*; nop=0x90
- */
 static bool __skip_sstep(struct arch_uprobe *auprobe, struct pt_regs *regs)
 {
-	int i;
-
-	for (i = 0; i < MAX_UINSN_BYTES; i++) {
-		if (auprobe->insn[i] == 0x66)
-			continue;
-
-		if (auprobe->insn[i] == 0x90) {
-			regs->ip += i + 1;
-			return true;
-		}
-
-		break;
-	}
+	if (auprobe->ops->emulate)
+		return auprobe->ops->emulate(auprobe, regs);
 	return false;
 }
...
@@ -701,23 +850,21 @@ bool arch_uprobe_skip_sstep(struct arch_uprobe *auprobe, struct pt_regs *regs)
 unsigned long
 arch_uretprobe_hijack_return_addr(unsigned long trampoline_vaddr, struct pt_regs *regs)
 {
-	int rasize, ncopied;
+	int rasize = sizeof_long(), nleft;
 	unsigned long orig_ret_vaddr = 0; /* clear high bits for 32-bit apps */

-	rasize = is_ia32_task() ? 4 : 8;
-	ncopied = copy_from_user(&orig_ret_vaddr, (void __user *)regs->sp, rasize);
-	if (unlikely(ncopied))
+	if (copy_from_user(&orig_ret_vaddr, (void __user *)regs->sp, rasize))
 		return -1;

 	/* check whether address has been already hijacked */
 	if (orig_ret_vaddr == trampoline_vaddr)
 		return orig_ret_vaddr;

-	ncopied = copy_to_user((void __user *)regs->sp, &trampoline_vaddr, rasize);
-	if (likely(!ncopied))
+	nleft = copy_to_user((void __user *)regs->sp, &trampoline_vaddr, rasize);
+	if (likely(!nleft))
 		return orig_ret_vaddr;

-	if (ncopied != rasize) {
+	if (nleft != rasize) {
 		pr_err("uprobe: return address clobbered: pid=%d, %%sp=%#lx, "
 			"%%ip=%#lx\n", current->pid, regs->sp, regs->ip);
...
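A worked example (illustrative addresses, not part of the diff) of the correction arithmetic shared by default_post_xol_op() and adjust_ret_addr() above:

	/*
	 * A 5-byte "call rel32" probed at vaddr = 0x400100 is stepped from
	 * an XOL slot at xol_vaddr = 0x7f0000001000:
	 *
	 *	correction = (long)(vaddr - xol_vaddr);
	 *
	 * UPROBE_FIX_IP:   regs->ip stopped at 0x7f0000001005 (slot + 5);
	 *                  adding correction yields 0x400105, the insn after
	 *                  the original call.
	 * UPROBE_FIX_CALL: the XOL copy pushed 0x7f0000001005 as the return
	 *                  address; adjust_ret_addr() adds the same
	 *                  correction, rewriting it to 0x400105.
	 */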
kernel/events/uprobes.c
@@ -60,8 +60,6 @@ static struct percpu_rw_semaphore dup_mmap_sem;
 /* Have a copy of original instruction */
 #define UPROBE_COPY_INSN	0
-/* Can skip singlestep */
-#define UPROBE_SKIP_SSTEP	1

 struct uprobe {
 	struct rb_node		rb_node;	/* node in the rb tree */
...
@@ -491,12 +489,9 @@ static struct uprobe *alloc_uprobe(struct inode *inode, loff_t offset)
 	uprobe->offset = offset;
 	init_rwsem(&uprobe->register_rwsem);
 	init_rwsem(&uprobe->consumer_rwsem);
-	/* For now assume that the instruction need not be single-stepped */
-	__set_bit(UPROBE_SKIP_SSTEP, &uprobe->flags);

 	/* add to uprobes_tree, sorted on inode:offset */
 	cur_uprobe = insert_uprobe(uprobe);
 	/* a uprobe exists for this inode:offset combination */
 	if (cur_uprobe) {
 		kfree(uprobe);
...
@@ -1628,20 +1623,6 @@ bool uprobe_deny_signal(void)
 	return true;
 }

-/*
- * Avoid singlestepping the original instruction if the original instruction
- * is a NOP or can be emulated.
- */
-static bool can_skip_sstep(struct uprobe *uprobe, struct pt_regs *regs)
-{
-	if (test_bit(UPROBE_SKIP_SSTEP, &uprobe->flags)) {
-		if (arch_uprobe_skip_sstep(&uprobe->arch, regs))
-			return true;
-		clear_bit(UPROBE_SKIP_SSTEP, &uprobe->flags);
-	}
-	return false;
-}
-
 static void mmf_recalc_uprobes(struct mm_struct *mm)
 {
 	struct vm_area_struct *vma;
...
@@ -1868,13 +1849,13 @@ static void handle_swbp(struct pt_regs *regs)
 	handler_chain(uprobe, regs);

-	if (can_skip_sstep(uprobe, regs))
+	if (arch_uprobe_skip_sstep(&uprobe->arch, regs))
 		goto out;

 	if (!pre_ssout(uprobe, regs, bp_vaddr))
 		return;

-	/* can_skip_sstep() succeeded, or restart if can't singlestep */
+	/* arch_uprobe_skip_sstep() succeeded, or restart if can't singlestep */
 out:
 	put_uprobe(uprobe);
 }
...
@@ -1886,10 +1867,11 @@ static void handle_swbp(struct pt_regs *regs)
 static void handle_singlestep(struct uprobe_task *utask, struct pt_regs *regs)
 {
 	struct uprobe *uprobe;
+	int err = 0;

 	uprobe = utask->active_uprobe;
 	if (utask->state == UTASK_SSTEP_ACK)
-		arch_uprobe_post_xol(&uprobe->arch, regs);
+		err = arch_uprobe_post_xol(&uprobe->arch, regs);
 	else if (utask->state == UTASK_SSTEP_TRAPPED)
 		arch_uprobe_abort_xol(&uprobe->arch, regs);
 	else
...
@@ -1903,6 +1885,11 @@ static void handle_singlestep(struct uprobe_task *utask, struct pt_regs *regs)
 	spin_lock_irq(&current->sighand->siglock);
 	recalc_sigpending(); /* see uprobe_deny_signal() */
 	spin_unlock_irq(&current->sighand->siglock);
+
+	if (unlikely(err)) {
+		uprobe_warn(current, "execute the probed insn, sending SIGILL.");
+		force_sig_info(SIGILL, SEND_SIG_FORCED, current);
+	}
 }

 /*
...
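Summarizing the error contract these hunks establish between the x86 hooks and the generic single-step path (a sketch, not part of the diff):

	/*
	 * ->post_xol() returns -ERESTART:
	 *	arch_uprobe_post_xol() calls arch_uprobe_abort_xol(), which
	 *	resets regs->ip to the probed address, then returns 0; the
	 *	task re-hits the breakpoint and the insn is retried.
	 *
	 * ->post_xol() returns any other error:
	 *	the error reaches handle_singlestep(), which warns via
	 *	uprobe_warn() and kills the task with SIGILL.
	 */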