On Thu, Oct 03, 2019 at 01:01:06PM +0200, Peter Zijlstra wrote:
> Also, I think text_poke_bp(INT3) is broken, although I don't think
> anybody actually does that. Still, let me fix that.

Something like so should allow text_poke_bp(INT3) to work as expected.

---
--- a/arch/x86/kernel/alternative.c
+++ b/arch/x86/kernel/alternative.c
@@ -999,6 +999,13 @@ int poke_int3_handler(struct pt_regs *re
        ip += tp->len;
 
        switch (tp->opcode) {
+       case INT3_INSN_OPCODE:
+               /*
+                * Someone poked an explicit INT3, they'll want to handle it,
+                * do not consume.
+                */
+               return 0;
+
        case CALL_INSN_OPCODE:
                int3_emulate_call(regs, (long)ip + tp->rel32);
                break;
@@ -1040,8 +1047,8 @@ NOKPROBE_SYMBOL(poke_int3_handler);
 void text_poke_bp_batch(struct text_poke_loc *tp, unsigned int nr_entries)
 {
        unsigned char int3 = INT3_INSN_OPCODE;
-       int patched_all_but_first = 0;
        unsigned int i;
+       int do_sync;
 
        lockdep_assert_held(&text_mutex);
 
@@ -1065,16 +1072,16 @@ void text_poke_bp_batch(struct text_poke
        /*
         * Second step: update all but the first byte of the patched range.
         */
-       for (i = 0; i < nr_entries; i++) {
+       for (do_sync = 0, i = 0; i < nr_entries; i++) {
                if (tp[i].len - sizeof(int3) > 0) {
                        text_poke((char *)tp[i].addr + sizeof(int3),
                                  (const char *)tp[i].text + sizeof(int3),
                                  tp[i].len - sizeof(int3));
-                       patched_all_but_first++;
+                       do_sync++;
                }
        }
 
-       if (patched_all_but_first) {
+       if (do_sync) {
                /*
                 * According to Intel, this core syncing is very likely
                 * not necessary and we'd be safe even without it. But
@@ -1087,10 +1094,17 @@ void text_poke_bp_batch(struct text_poke
         * Third step: replace the first byte (int3) by the first byte of
         * replacing opcode.
         */
-       for (i = 0; i < nr_entries; i++)
+       for (do_sync = 0, i = 0; i < nr_entries; i++) {
+               if (tp[i].text[0] == INT3_INSN_OPCODE)
+                       continue;
+
                text_poke(tp[i].addr, tp[i].text, sizeof(int3));
+               do_sync++;
+       }
+
+       if (do_sync)
+               on_each_cpu(do_sync_core, NULL, 1);
 
-       on_each_cpu(do_sync_core, NULL, 1);
        /*
         * sync_core() implies an smp_mb() and orders this store against
         * the writing of the new instruction.
@@ -1123,6 +1137,9 @@ void text_poke_loc_init(struct text_poke
        tp->opcode = insn.opcode.bytes[0];
 
        switch (tp->opcode) {
+       case INT3_INSN_OPCODE:
+               break;
+
        case CALL_INSN_OPCODE:
        case JMP32_INSN_OPCODE:
        case JMP8_INSN_OPCODE:

Reply via email to