On Tue, Nov 10, 2020 at 01:56:03AM +0100, Frederic Weisbecker wrote:

> [fweisbec: s/disp16/data16, integrate into text_get_insn(), elaborate
>  comment on the resulting insn, emulate on int3 trap, provide validation,
>  uninline __static_call_return0() for HAVE_STATIC_CALL]

> diff --git a/arch/x86/include/asm/text-patching.h 
> b/arch/x86/include/asm/text-patching.h
> index b7421780e4e9..1250f440d1be 100644
> --- a/arch/x86/include/asm/text-patching.h
> +++ b/arch/x86/include/asm/text-patching.h
> @@ -65,6 +65,9 @@ extern void text_poke_finish(void);
>  #define JMP8_INSN_SIZE               2
>  #define JMP8_INSN_OPCODE     0xEB
>  
> +#define XOR5RAX_INSN_SIZE    5
> +#define XOR5RAX_INSN_OPCODE  0x31
> +
>  #define DISP32_SIZE          4
>  
>  static __always_inline int text_opcode_size(u8 opcode)
> @@ -80,6 +83,7 @@ static __always_inline int text_opcode_size(u8 opcode)
>       __CASE(CALL);
>       __CASE(JMP32);
>       __CASE(JMP8);
> +     __CASE(XOR5RAX);
>       }
>  
>  #undef __CASE
> @@ -99,8 +103,21 @@ static __always_inline
>  void *text_gen_insn(u8 opcode, const void *addr, const void *dest)
>  {
>       static union text_poke_insn insn; /* per instance */
> -     int size = text_opcode_size(opcode);
> +     int size;
>  
> +     if (opcode == XOR5RAX_INSN_OPCODE) {
> +             /*
> +              * data16 data16 xorq %rax, %rax - a single 5 byte instruction 
> that clears %rax
> +              * The REX.W cancels the effect of any data16.
> +              */
> +             static union text_poke_insn xor5rax = {
> +                     .text = { 0x66, 0x66, 0x48, 0x31, 0xc0 },
> +             };
> +
> +             return &xor5rax.text;
> +     }
> +
> +     size = text_opcode_size(opcode);
>       insn.opcode = opcode;
>  
>       if (size > 1) {
> @@ -165,6 +182,13 @@ void int3_emulate_ret(struct pt_regs *regs)
>       unsigned long ip = int3_emulate_pop(regs);
>       int3_emulate_jmp(regs, ip);
>  }
> +
> +static __always_inline
> +void int3_emulate_xor5rax(struct pt_regs *regs)
> +{
> +     regs->ax = 0;
> +}
> +
>  #endif /* !CONFIG_UML_X86 */
>  
>  #endif /* _ASM_X86_TEXT_PATCHING_H */
> diff --git a/arch/x86/kernel/alternative.c b/arch/x86/kernel/alternative.c
> index 2400ad62f330..37592f576a10 100644
> --- a/arch/x86/kernel/alternative.c
> +++ b/arch/x86/kernel/alternative.c
> @@ -1125,6 +1125,10 @@ noinstr int poke_int3_handler(struct pt_regs *regs)
>               int3_emulate_jmp(regs, (long)ip + tp->rel32);
>               break;
>  
> +     case XOR5RAX_INSN_OPCODE:
> +             int3_emulate_xor5rax(regs);
> +             break;
> +
>       default:
>               BUG();
>       }
> @@ -1291,6 +1295,7 @@ static void text_poke_loc_init(struct text_poke_loc 
> *tp, void *addr,
>       switch (tp->opcode) {
>       case INT3_INSN_OPCODE:
>       case RET_INSN_OPCODE:
> +     case XOR5RAX_INSN_OPCODE:
>               break;
>  
>       case CALL_INSN_OPCODE:

Why did you add full emulation of this? The patch I send to you used the
text_poke_bp(.emulate) argument to have it emulate an actual call to the
out-of-line version of that function.

That should work fine and is a lot less code.

Reply via email to