This is the mail archive of the
systemtap@sourceware.org
mailing list for the systemtap project.
Re: [PATCH] Kprobes- robust fault handling for i386
- From: Prasanna S Panchamukhi <prasanna at in dot ibm dot com>
- To: "Mao, Bibo" <bibo dot mao at intel dot com>
- Cc: systemtap at sources dot redhat dot com
- Date: Thu, 23 Feb 2006 14:29:35 +0530
- Subject: Re: [PATCH] Kprobes- robust fault handling for i386
- References: <9FBCE015AF479F46B3B410499F3AE05BC4BF0C@pdsmsx405>
- Reply-to: prasanna at in dot ibm dot com
Bibo,
You are right, the esp might be a local variable; we are working on
it. For now, here is a patch to fix the broken kprobes fault handling.
It is only for i386; once we freeze on this prototype, it
can be ported to other architectures.
Thanks
Prasanna
This patch provides proper kprobes fault handling when a user-specified
pre/post handler tries to access user address space through
copy_from_user(), get_user(), etc. The user-specified fault handler
gets called only if the fault occurs while executing the user-specified
handlers. In such a case the user-specified fault handler is allowed to
fix it first; if the user-specified fault handler does not fix it, we
try to fix it by calling fixup_exception(). We also set the "FAULTED"
status (KPROBE_HIT_FAULT) if the user-specified pre-handler faults, so
that the corresponding user-specified post_handler can be skipped. The
user-specified fault handler will not be called if the fault happens
while single-stepping the original instruction; instead we reset the
current probe and allow the system page fault handler to fix it up.
Signed-off-by: Prasanna S Panchamukhi <prasanna@in.ibm.com>
arch/i386/kernel/kprobes.c | 78 ++++++++++++++++++++++++++++++++++++++-------
include/linux/kprobes.h | 2 +
2 files changed, 69 insertions(+), 11 deletions(-)
diff -puN arch/i386/kernel/kprobes.c~kprobes-i386-pagefault-handling arch/i386/kernel/kprobes.c
--- linux-2.6.16-rc3-mm1/arch/i386/kernel/kprobes.c~kprobes-i386-pagefault-handling 2006-02-23 11:41:29.000000000 +0530
+++ linux-2.6.16-rc3-mm1-prasanna/arch/i386/kernel/kprobes.c 2006-02-23 14:09:15.000000000 +0530
@@ -35,6 +35,7 @@
#include <asm/cacheflush.h>
#include <asm/kdebug.h>
#include <asm/desc.h>
+#include <asm/uaccess.h>
void jprobe_return_end(void);
@@ -220,8 +221,9 @@ static int __kprobes kprobe_handler(stru
if (kprobe_running()) {
p = get_kprobe(addr);
if (p) {
- if (kcb->kprobe_status == KPROBE_HIT_SS &&
- *p->ainsn.insn == BREAKPOINT_INSTRUCTION) {
+ if (((kcb->kprobe_status == KPROBE_HIT_SS) ||
+ (kcb->kprobe_status == KPROBE_HIT_FAULT_SS)) &&
+ (*p->ainsn.insn == BREAKPOINT_INSTRUCTION)) {
regs->eflags &= ~TF_MASK;
regs->eflags |= kcb->kprobe_saved_eflags;
goto no_kprobe;
@@ -308,7 +310,10 @@ static int __kprobes kprobe_handler(stru
ss_probe:
prepare_singlestep(p, regs);
- kcb->kprobe_status = KPROBE_HIT_SS;
+ if (kcb->kprobe_status != KPROBE_HIT_FAULT)
+ kcb->kprobe_status = KPROBE_HIT_SS;
+ else
+ kcb->kprobe_status = KPROBE_HIT_FAULT_SS;
return 1;
no_kprobe:
@@ -509,7 +514,9 @@ static inline int post_kprobe_handler(st
if (!cur)
return 0;
- if ((kcb->kprobe_status != KPROBE_REENTER) && cur->post_handler) {
+ if ((kcb->kprobe_status != KPROBE_REENTER)
+ && (kcb->kprobe_status != KPROBE_HIT_FAULT_SS)
+ && cur->post_handler) {
kcb->kprobe_status = KPROBE_HIT_SSDONE;
cur->post_handler(cur, regs, 0);
}
@@ -542,15 +549,64 @@ static inline int kprobe_fault_handler(s
struct kprobe *cur = kprobe_running();
struct kprobe_ctlblk *kcb = get_kprobe_ctlblk();
- if (cur->fault_handler && cur->fault_handler(cur, regs, trapnr))
- return 1;
-
- if (kcb->kprobe_status & KPROBE_HIT_SS) {
- resume_execution(cur, regs, kcb);
+ switch(kcb->kprobe_status) {
+ case KPROBE_HIT_SS:
+ case KPROBE_REENTER:
+ case KPROBE_HIT_FAULT_SS:
+ /*
+ * We are here because the instruction being single
+ * stepped caused a page fault. We reset the current
+ * kprobe and the eip points back to the probe address
+ * and allow the page fault handler to continue as a
+ * normal page fault.
+ */
+ regs->eip = (unsigned long)cur->addr;
regs->eflags |= kcb->kprobe_old_eflags;
-
- reset_current_kprobe();
+ if (kcb->kprobe_status == KPROBE_REENTER)
+ restore_previous_kprobe(kcb);
+ else
+ reset_current_kprobe();
preempt_enable_no_resched();
+ break;
+ case KPROBE_HIT_ACTIVE:
+ /*
+ * We set the status as "FAULTED", so that subsequent
+ * user specified post handler can be avoided.
+ */
+ kcb->kprobe_status = KPROBE_HIT_FAULT;
+ /* fall down and fixup the exception*/
+ case KPROBE_HIT_SSDONE:
+ /*
+ * We increment the nmissed count for accounting,
+ * we can also use npre/npostfault count for accouting
+ * these specific fault cases.
+ */
+ kprobes_inc_nmissed_count(cur);
+
+ /*
+ * We come here because instructions in the pre/post
+ * handler caused the page_fault, this could happen
+ * if handler tries to access user space by
+ * copy_from_user(), get_user() etc. Let the
+ * user-specified handler try to fix it first.
+ */
+ if (cur->fault_handler && cur->fault_handler(cur, regs, trapnr))
+ return 1;
+
+ /*
+ * In case the user-specified fault handler returned
+ * zero, try to fix up.
+ */
+ if (fixup_exception(regs))
+ return 1;
+
+ /*
+ * fixup_exception() could not handle it,
+ * Let do_page_fault() fix it.
+ */
+ break;
+ default:
+ break;
}
return 0;
}
diff -puN include/linux/kprobes.h~kprobes-i386-pagefault-handling include/linux/kprobes.h
--- linux-2.6.16-rc3-mm1/include/linux/kprobes.h~kprobes-i386-pagefault-handling 2006-02-23 12:08:07.000000000 +0530
+++ linux-2.6.16-rc3-mm1-prasanna/include/linux/kprobes.h 2006-02-23 12:31:21.000000000 +0530
@@ -46,6 +46,8 @@
#define KPROBE_HIT_SS 0x00000002
#define KPROBE_REENTER 0x00000004
#define KPROBE_HIT_SSDONE 0x00000008
+#define KPROBE_HIT_FAULT 0x00000010
+#define KPROBE_HIT_FAULT_SS 0x00000020
/* Attach to insert probes on any functions which should be ignored*/
#define __kprobes __attribute__((__section__(".kprobes.text")))
_
--
Prasanna S Panchamukhi
Linux Technology Center
India Software Labs, IBM Bangalore
Email: prasanna@in.ibm.com
Ph: 91-80-51776329