This patch is the main logic of early kprobe.

If register_kprobe() is called before kprobes_initialized, an early
kprobe is allocated. Try to utilize existing OPTPROBE mechanism to
replace the target instruction by a branch instead of breakpoint,
because interrupt handlers may not been initialized yet.

All resources required by early kprobes are allocated statically.
CONFIG_NR_EARLY_KPROBES_SLOTS is used to control number of possible
early kprobes.

Signed-off-by: Wang Nan <wangn...@huawei.com>
---
 include/linux/kprobes.h |   4 ++
 kernel/kprobes.c        | 150 ++++++++++++++++++++++++++++++++++++++++++++++--
 2 files changed, 148 insertions(+), 6 deletions(-)

diff --git a/include/linux/kprobes.h b/include/linux/kprobes.h
index 6100678..0c64df8 100644
--- a/include/linux/kprobes.h
+++ b/include/linux/kprobes.h
@@ -450,6 +450,10 @@ extern int proc_kprobes_optimization_handler(struct 
ctl_table *table,
                                             size_t *length, loff_t *ppos);
 #endif
 
+struct early_kprobe_slot {
+       struct optimized_kprobe op;
+};
+
 #endif /* CONFIG_OPTPROBES */
 #ifdef CONFIG_KPROBES_ON_FTRACE
 extern void kprobe_ftrace_handler(unsigned long ip, unsigned long parent_ip,
diff --git a/kernel/kprobes.c b/kernel/kprobes.c
index b83c406..131a71a 100644
--- a/kernel/kprobes.c
+++ b/kernel/kprobes.c
@@ -77,6 +77,10 @@ int kprobes_is_early(void)
 static struct hlist_head kprobe_table[KPROBE_TABLE_SIZE];
 static struct hlist_head kretprobe_inst_table[KPROBE_TABLE_SIZE];
 
+#ifdef CONFIG_EARLY_KPROBES
+static HLIST_HEAD(early_kprobe_hlist);
+#endif
+
 /* NOTE: change this value only with kprobe_mutex held */
 static bool kprobes_all_disarmed;
 
@@ -87,6 +91,8 @@ static struct {
        raw_spinlock_t lock ____cacheline_aligned_in_smp;
 } kretprobe_table_locks[KPROBE_TABLE_SIZE];
 
+DEFINE_EKPROBE_ALLOC_OPS(struct early_kprobe_slot, early_kprobe, static)
+
 static raw_spinlock_t *kretprobe_table_lock_ptr(unsigned long hash)
 {
        return &(kretprobe_table_locks[hash].lock);
@@ -326,7 +332,12 @@ struct kprobe *get_kprobe(void *addr)
        struct hlist_head *head;
        struct kprobe *p;
 
-       head = &kprobe_table[hash_ptr(addr, KPROBE_HASH_BITS)];
+#ifdef CONFIG_EARLY_KPROBES
+       if (kprobes_is_early())
+               head = &early_kprobe_hlist;
+       else
+#endif
+               head = &kprobe_table[hash_ptr(addr, KPROBE_HASH_BITS)];
        hlist_for_each_entry_rcu(p, head, hlist) {
                if (p->addr == addr)
                        return p;
@@ -386,11 +397,14 @@ NOKPROBE_SYMBOL(opt_pre_handler);
 static void free_aggr_kprobe(struct kprobe *p)
 {
        struct optimized_kprobe *op;
+       struct early_kprobe_slot *ep;
 
        op = container_of(p, struct optimized_kprobe, kp);
        arch_remove_optimized_kprobe(op);
        arch_remove_kprobe(p);
-       kfree(op);
+       ep = container_of(op, struct early_kprobe_slot, op);
+       if (likely(!ek_free_early_kprobe(ep)))
+               kfree(op);
 }
 
 /* Return true(!0) if the kprobe is ready for optimization. */
@@ -607,9 +621,15 @@ static void optimize_kprobe(struct kprobe *p)
        struct optimized_kprobe *op;
 
        /* Check if the kprobe is disabled or not ready for optimization. */
-       if (!kprobe_optready(p) || !kprobes_allow_optimization ||
-           (kprobe_disabled(p) || kprobes_all_disarmed))
-               return;
+       if (unlikely(kprobes_is_early())) {
+               BUG_ON(!(p->flags & KPROBE_FLAG_EARLY));
+               if (!kprobe_optready(p) || kprobe_disabled(p))
+                       return;
+       } else {
+               if (!kprobe_optready(p) || !kprobes_allow_optimization ||
+                   (kprobe_disabled(p) || kprobes_all_disarmed))
+                       return;
+       }
 
        /* Both of break_handler and post_handler are not supported. */
        if (p->break_handler || p->post_handler)
@@ -631,7 +651,10 @@ static void optimize_kprobe(struct kprobe *p)
                list_del_init(&op->list);
        else {
                list_add(&op->list, &optimizing_list);
-               kick_kprobe_optimizer();
+               if (kprobes_is_early())
+                       arch_optimize_kprobes(&optimizing_list);
+               else
+                       kick_kprobe_optimizer();
        }
 }
 
@@ -1505,6 +1528,8 @@ out:
        return ret;
 }
 
+static int register_early_kprobe(struct kprobe *p);
+
 int register_kprobe(struct kprobe *p)
 {
        int ret;
@@ -1518,6 +1543,14 @@ int register_kprobe(struct kprobe *p)
                return PTR_ERR(addr);
        p->addr = addr;
 
+       if (unlikely(kprobes_is_early())) {
+               p->flags |= KPROBE_FLAG_EARLY;
+               return register_early_kprobe(p);
+       }
+
+       WARN(p->flags & KPROBE_FLAG_EARLY,
+               "register early kprobe after kprobes initialized\n");
+
        ret = check_kprobe_rereg(p);
        if (ret)
                return ret;
@@ -2156,6 +2189,8 @@ static struct notifier_block kprobe_module_nb = {
 extern unsigned long __start_kprobe_blacklist[];
 extern unsigned long __stop_kprobe_blacklist[];
 
+static void convert_early_kprobes(void);
+
 static int __init init_kprobes(void)
 {
        int i, err = 0;
@@ -2204,6 +2239,7 @@ static int __init init_kprobes(void)
        if (!err)
                err = register_module_notifier(&kprobe_module_nb);
 
+       convert_early_kprobes();
        kprobes_initialized = (err == 0);
 
        if (!err)
@@ -2497,3 +2533,105 @@ module_init(init_kprobes);
 
 /* defined in arch/.../kernel/kprobes.c */
 EXPORT_SYMBOL_GPL(jprobe_return);
+
+#ifdef CONFIG_EARLY_KPROBES
+
+static int register_early_kprobe(struct kprobe *p)
+{
+       struct early_kprobe_slot *slot;
+       int err;
+
+       if (p->break_handler || p->post_handler)
+               return -EINVAL;
+       if (p->flags & KPROBE_FLAG_DISABLED)
+               return -EINVAL;
+
+       slot = ek_alloc_early_kprobe();
+       if (!slot) {
+               pr_err("No enough early kprobe slots.\n");
+               return -ENOMEM;
+       }
+
+       p->flags &= KPROBE_FLAG_DISABLED;
+       p->flags |= KPROBE_FLAG_EARLY;
+       p->nmissed = 0;
+
+       err = arch_prepare_kprobe(p);
+       if (err) {
+               pr_err("arch_prepare_kprobe failed\n");
+               goto free_slot;
+       }
+
+       INIT_LIST_HEAD(&p->list);
+       INIT_HLIST_NODE(&p->hlist);
+       INIT_LIST_HEAD(&slot->op.list);
+       slot->op.kp.addr = p->addr;
+       slot->op.kp.flags = p->flags | KPROBE_FLAG_EARLY;
+
+       err = arch_prepare_optimized_kprobe(&slot->op, p);
+       if (err) {
+               pr_err("Failed to prepare optimized kprobe.\n");
+               goto remove_optimized;
+       }
+
+       if (!arch_prepared_optinsn(&slot->op.optinsn)) {
+               pr_err("Failed to prepare optinsn.\n");
+               err = -ENOMEM;
+               goto remove_optimized;
+       }
+
+       hlist_add_head_rcu(&p->hlist, &early_kprobe_hlist);
+       init_aggr_kprobe(&slot->op.kp, p);
+       optimize_kprobe(&slot->op.kp);
+       return 0;
+
+remove_optimized:
+       arch_remove_optimized_kprobe(&slot->op);
+free_slot:
+       ek_free_early_kprobe(slot);
+       return err;
+}
+
+static void
+convert_early_kprobe(struct kprobe *kp)
+{
+       struct module *probed_mod;
+       int err;
+
+       BUG_ON(!kprobe_aggrprobe(kp));
+
+       err = check_kprobe_address_safe(kp, &probed_mod);
+       if (err)
+               panic("Insert kprobe at %p is not safe!", kp->addr);
+
+       /*
+        * FIXME:
+        * convert kprobe to ftrace if CONFIG_KPROBES_ON_FTRACE is on
+        * and kp is on ftrace location.
+        */
+
+       mutex_lock(&kprobe_mutex);
+       hlist_del_rcu(&kp->hlist);
+
+       INIT_HLIST_NODE(&kp->hlist);
+       hlist_add_head_rcu(&kp->hlist,
+                      &kprobe_table[hash_ptr(kp->addr, KPROBE_HASH_BITS)]);
+       mutex_unlock(&kprobe_mutex);
+
+       if (probed_mod)
+               module_put(probed_mod);
+}
+
+static void
+convert_early_kprobes(void)
+{
+       struct kprobe *p;
+       struct hlist_node *tmp;
+
+       hlist_for_each_entry_safe(p, tmp, &early_kprobe_hlist, hlist)
+               convert_early_kprobe(p);
+};
+#else
+static int register_early_kprobe(struct kprobe *p) { return -ENOSYS; }
+static void convert_early_kprobes(void) {};
+#endif
-- 
1.8.4

--
To unsubscribe from this list: send the line "unsubscribe linux-kernel" in
the body of a message to majord...@vger.kernel.org
More majordomo info at  http://vger.kernel.org/majordomo-info.html
Please read the FAQ at  http://www.tux.org/lkml/

Reply via email to