Return-Path: Received: (majordomo@vger.kernel.org) by vger.kernel.org via listexpand id S1755913AbbBLM3u (ORCPT ); Thu, 12 Feb 2015 07:29:50 -0500 Received: from szxga01-in.huawei.com ([119.145.14.64]:37969 "EHLO szxga01-in.huawei.com" rhost-flags-OK-OK-OK-OK) by vger.kernel.org with ESMTP id S1755854AbbBLM3r (ORCPT ); Thu, 12 Feb 2015 07:29:47 -0500 From: Wang Nan To: , , , , , , , , , , , , , , , , , , , , , , , , , , , , , , CC: , , , Subject: [RFC PATCH v2 20/26] early kprobes: core logic of eraly kprobes. Date: Thu, 12 Feb 2015 20:21:05 +0800 Message-ID: <1423743665-12897-1-git-send-email-wangnan0@huawei.com> X-Mailer: git-send-email 1.8.4 In-Reply-To: <1423743476-11927-1-git-send-email-wangnan0@huawei.com> References: <1423743476-11927-1-git-send-email-wangnan0@huawei.com> MIME-Version: 1.0 Content-Type: text/plain X-Originating-IP: [10.107.197.247] X-CFilter-Loop: Reflected Sender: linux-kernel-owner@vger.kernel.org List-ID: X-Mailing-List: linux-kernel@vger.kernel.org Content-Length: 7522 Lines: 272 This patch is the main logic of early kprobe. If register_kprobe() is called before kprobes_initialized, an early kprobe is allocated. Try to utilize existing OPTPROBE mechanism to replace the target instruction by a branch instead of breakpoint, because interrupt handlers may not been initialized yet. All resources required by early kprobes are allocated statically. CONFIG_NR_EARLY_KPROBES_SLOTS is used to control number of possible early kprobes. Signed-off-by: Wang Nan --- include/linux/kprobes.h | 4 ++ kernel/kprobes.c | 150 ++++++++++++++++++++++++++++++++++++++++++++++-- 2 files changed, 148 insertions(+), 6 deletions(-) diff --git a/include/linux/kprobes.h b/include/linux/kprobes.h index 6100678..0c64df8 100644 --- a/include/linux/kprobes.h +++ b/include/linux/kprobes.h @@ -450,6 +450,10 @@ extern int proc_kprobes_optimization_handler(struct ctl_table *table, size_t *length, loff_t *ppos); #endif +struct early_kprobe_slot { + struct optimized_kprobe op; +}; + #endif /* CONFIG_OPTPROBES */ #ifdef CONFIG_KPROBES_ON_FTRACE extern void kprobe_ftrace_handler(unsigned long ip, unsigned long parent_ip, diff --git a/kernel/kprobes.c b/kernel/kprobes.c index b83c406..131a71a 100644 --- a/kernel/kprobes.c +++ b/kernel/kprobes.c @@ -77,6 +77,10 @@ int kprobes_is_early(void) static struct hlist_head kprobe_table[KPROBE_TABLE_SIZE]; static struct hlist_head kretprobe_inst_table[KPROBE_TABLE_SIZE]; +#ifdef CONFIG_EARLY_KPROBES +static HLIST_HEAD(early_kprobe_hlist); +#endif + /* NOTE: change this value only with kprobe_mutex held */ static bool kprobes_all_disarmed; @@ -87,6 +91,8 @@ static struct { raw_spinlock_t lock ____cacheline_aligned_in_smp; } kretprobe_table_locks[KPROBE_TABLE_SIZE]; +DEFINE_EKPROBE_ALLOC_OPS(struct early_kprobe_slot, early_kprobe, static) + static raw_spinlock_t *kretprobe_table_lock_ptr(unsigned long hash) { return &(kretprobe_table_locks[hash].lock); @@ -326,7 +332,12 @@ struct kprobe *get_kprobe(void *addr) struct hlist_head *head; struct kprobe *p; - head = &kprobe_table[hash_ptr(addr, KPROBE_HASH_BITS)]; +#ifdef CONFIG_EARLY_KPROBES + if (kprobes_is_early()) + head = &early_kprobe_hlist; + else +#endif + head = &kprobe_table[hash_ptr(addr, KPROBE_HASH_BITS)]; hlist_for_each_entry_rcu(p, head, hlist) { if (p->addr == addr) return p; @@ -386,11 +397,14 @@ NOKPROBE_SYMBOL(opt_pre_handler); static void free_aggr_kprobe(struct kprobe *p) { struct optimized_kprobe *op; + struct early_kprobe_slot *ep; op = container_of(p, struct optimized_kprobe, kp); arch_remove_optimized_kprobe(op); arch_remove_kprobe(p); - kfree(op); + ep = container_of(op, struct early_kprobe_slot, op); + if (likely(!ek_free_early_kprobe(ep))) + kfree(op); } /* Return true(!0) if the kprobe is ready for optimization. */ @@ -607,9 +621,15 @@ static void optimize_kprobe(struct kprobe *p) struct optimized_kprobe *op; /* Check if the kprobe is disabled or not ready for optimization. */ - if (!kprobe_optready(p) || !kprobes_allow_optimization || - (kprobe_disabled(p) || kprobes_all_disarmed)) - return; + if (unlikely(kprobes_is_early())) { + BUG_ON(!(p->flags & KPROBE_FLAG_EARLY)); + if (!kprobe_optready(p) || kprobe_disabled(p)) + return; + } else { + if (!kprobe_optready(p) || !kprobes_allow_optimization || + (kprobe_disabled(p) || kprobes_all_disarmed)) + return; + } /* Both of break_handler and post_handler are not supported. */ if (p->break_handler || p->post_handler) @@ -631,7 +651,10 @@ static void optimize_kprobe(struct kprobe *p) list_del_init(&op->list); else { list_add(&op->list, &optimizing_list); - kick_kprobe_optimizer(); + if (kprobes_is_early()) + arch_optimize_kprobes(&optimizing_list); + else + kick_kprobe_optimizer(); } } @@ -1505,6 +1528,8 @@ out: return ret; } +static int register_early_kprobe(struct kprobe *p); + int register_kprobe(struct kprobe *p) { int ret; @@ -1518,6 +1543,14 @@ int register_kprobe(struct kprobe *p) return PTR_ERR(addr); p->addr = addr; + if (unlikely(kprobes_is_early())) { + p->flags |= KPROBE_FLAG_EARLY; + return register_early_kprobe(p); + } + + WARN(p->flags & KPROBE_FLAG_EARLY, + "register early kprobe after kprobes initialized\n"); + ret = check_kprobe_rereg(p); if (ret) return ret; @@ -2156,6 +2189,8 @@ static struct notifier_block kprobe_module_nb = { extern unsigned long __start_kprobe_blacklist[]; extern unsigned long __stop_kprobe_blacklist[]; +static void convert_early_kprobes(void); + static int __init init_kprobes(void) { int i, err = 0; @@ -2204,6 +2239,7 @@ static int __init init_kprobes(void) if (!err) err = register_module_notifier(&kprobe_module_nb); + convert_early_kprobes(); kprobes_initialized = (err == 0); if (!err) @@ -2497,3 +2533,105 @@ module_init(init_kprobes); /* defined in arch/.../kernel/kprobes.c */ EXPORT_SYMBOL_GPL(jprobe_return); + +#ifdef CONFIG_EARLY_KPROBES + +static int register_early_kprobe(struct kprobe *p) +{ + struct early_kprobe_slot *slot; + int err; + + if (p->break_handler || p->post_handler) + return -EINVAL; + if (p->flags & KPROBE_FLAG_DISABLED) + return -EINVAL; + + slot = ek_alloc_early_kprobe(); + if (!slot) { + pr_err("No enough early kprobe slots.\n"); + return -ENOMEM; + } + + p->flags &= KPROBE_FLAG_DISABLED; + p->flags |= KPROBE_FLAG_EARLY; + p->nmissed = 0; + + err = arch_prepare_kprobe(p); + if (err) { + pr_err("arch_prepare_kprobe failed\n"); + goto free_slot; + } + + INIT_LIST_HEAD(&p->list); + INIT_HLIST_NODE(&p->hlist); + INIT_LIST_HEAD(&slot->op.list); + slot->op.kp.addr = p->addr; + slot->op.kp.flags = p->flags | KPROBE_FLAG_EARLY; + + err = arch_prepare_optimized_kprobe(&slot->op, p); + if (err) { + pr_err("Failed to prepare optimized kprobe.\n"); + goto remove_optimized; + } + + if (!arch_prepared_optinsn(&slot->op.optinsn)) { + pr_err("Failed to prepare optinsn.\n"); + err = -ENOMEM; + goto remove_optimized; + } + + hlist_add_head_rcu(&p->hlist, &early_kprobe_hlist); + init_aggr_kprobe(&slot->op.kp, p); + optimize_kprobe(&slot->op.kp); + return 0; + +remove_optimized: + arch_remove_optimized_kprobe(&slot->op); +free_slot: + ek_free_early_kprobe(slot); + return err; +} + +static void +convert_early_kprobe(struct kprobe *kp) +{ + struct module *probed_mod; + int err; + + BUG_ON(!kprobe_aggrprobe(kp)); + + err = check_kprobe_address_safe(kp, &probed_mod); + if (err) + panic("Insert kprobe at %p is not safe!", kp->addr); + + /* + * FIXME: + * convert kprobe to ftrace if CONFIG_KPROBES_ON_FTRACE is on + * and kp is on ftrace location. + */ + + mutex_lock(&kprobe_mutex); + hlist_del_rcu(&kp->hlist); + + INIT_HLIST_NODE(&kp->hlist); + hlist_add_head_rcu(&kp->hlist, + &kprobe_table[hash_ptr(kp->addr, KPROBE_HASH_BITS)]); + mutex_unlock(&kprobe_mutex); + + if (probed_mod) + module_put(probed_mod); +} + +static void +convert_early_kprobes(void) +{ + struct kprobe *p; + struct hlist_node *tmp; + + hlist_for_each_entry_safe(p, tmp, &early_kprobe_hlist, hlist) + convert_early_kprobe(p); +}; +#else +static int register_early_kprobe(struct kprobe *p) { return -ENOSYS; } +static void convert_early_kprobes(void) {}; +#endif -- 1.8.4 -- To unsubscribe from this list: send the line "unsubscribe linux-kernel" in the body of a message to majordomo@vger.kernel.org More majordomo info at http://vger.kernel.org/majordomo-info.html Please read the FAQ at http://www.tux.org/lkml/