LGTM. Happy to move this forward, once it receives an OK from one of you. --Philipp.
On Fri, 26 May 2023 at 02:53, Die Li <li...@eswincomputing.com> wrote: > > This patch allows less instructions to be used when TARGET_XTHEADCONDMOV is > enabled. > > Provide an example from the existing testcases. > > Testcase: > int ConEmv_imm_imm_reg(int x, int y){ > if (x == 1000) return 10; > return y; > } > > Cflags: > -O2 -march=rv64gc_xtheadcondmov -mabi=lp64d > > before patch: > ConEmv_imm_imm_reg: > addi a5,a0,-1000 > li a0,10 > th.mvnez a0,zero,a5 > th.mveqz a1,zero,a5 > or a0,a0,a1 > ret > > after patch: > ConEmv_imm_imm_reg: > addi a5,a0,-1000 > li a0,10 > th.mvnez a0,a1,a5 > ret > > Signed-off-by: Die Li <li...@eswincomputing.com> > > gcc/ChangeLog: > > * config/riscv/riscv.cc (riscv_expand_conditional_move_onesided): > Delete. > (riscv_expand_conditional_move): Reuse the TARGET_SFB_ALU expand > process for TARGET_XTHEADCONDMOV > > gcc/testsuite/ChangeLog: > > * gcc.target/riscv/xtheadcondmov-indirect-rv32.c: Update the output. > * gcc.target/riscv/xtheadcondmov-indirect-rv64.c: Likewise. > --- > gcc/config/riscv/riscv.cc | 44 +++-------------- > .../riscv/xtheadcondmov-indirect-rv32.c | 48 +++++++------------ > .../riscv/xtheadcondmov-indirect-rv64.c | 48 +++++++------------ > 3 files changed, 42 insertions(+), 98 deletions(-) > > diff --git a/gcc/config/riscv/riscv.cc b/gcc/config/riscv/riscv.cc > index 09fc9e5d95e..8b8ac9181ba 100644 > --- a/gcc/config/riscv/riscv.cc > +++ b/gcc/config/riscv/riscv.cc > @@ -3442,37 +3442,6 @@ riscv_expand_conditional_branch (rtx label, rtx_code > code, rtx op0, rtx op1) > emit_jump_insn (gen_condjump (condition, label)); > } > > -/* Helper to emit two one-sided conditional moves for the movecc. */ > - > -static void > -riscv_expand_conditional_move_onesided (rtx dest, rtx cons, rtx alt, > - rtx_code code, rtx op0, rtx op1) > -{ > - machine_mode mode = GET_MODE (dest); > - > - gcc_assert (GET_MODE_CLASS (mode) == MODE_INT); > - gcc_assert (reg_or_0_operand (cons, mode)); > - gcc_assert (reg_or_0_operand (alt, mode)); > - > - riscv_emit_int_compare (&code, &op0, &op1, true); > - rtx cond = gen_rtx_fmt_ee (code, mode, op0, op1); > - > - rtx tmp1 = gen_reg_rtx (mode); > - rtx tmp2 = gen_reg_rtx (mode); > - > - emit_insn (gen_rtx_SET (tmp1, gen_rtx_IF_THEN_ELSE (mode, cond, > - cons, const0_rtx))); > - > - /* We need to expand a sequence for both blocks and we do that such, > - that the second conditional move will use the inverted condition. > - We use temporaries that are or'd to the dest register. */ > - cond = gen_rtx_fmt_ee ((code == EQ) ? NE : EQ, mode, op0, op1); > - emit_insn (gen_rtx_SET (tmp2, gen_rtx_IF_THEN_ELSE (mode, cond, > - alt, const0_rtx))); > - > - emit_insn (gen_rtx_SET (dest, gen_rtx_IOR (mode, tmp1, tmp2))); > - } > - > /* Emit a cond move: If OP holds, move CONS to DEST; else move ALT to DEST. > Return 0 if expansion failed. */ > > @@ -3483,6 +3452,7 @@ riscv_expand_conditional_move (rtx dest, rtx op, rtx > cons, rtx alt) > rtx_code code = GET_CODE (op); > rtx op0 = XEXP (op, 0); > rtx op1 = XEXP (op, 1); > + bool need_eq_ne_p = false; > > if (TARGET_XTHEADCONDMOV > && GET_MODE_CLASS (mode) == MODE_INT > @@ -3492,14 +3462,12 @@ riscv_expand_conditional_move (rtx dest, rtx op, rtx > cons, rtx alt) > && GET_MODE (op0) == mode > && GET_MODE (op1) == mode > && (code == EQ || code == NE)) > + need_eq_ne_p = true; > + > + if (need_eq_ne_p || (TARGET_SFB_ALU > + && GET_MODE (op0) == word_mode)) > { > - riscv_expand_conditional_move_onesided (dest, cons, alt, code, op0, > op1); > - return true; > - } > - else if (TARGET_SFB_ALU > - && GET_MODE (op0) == word_mode) > - { > - riscv_emit_int_compare (&code, &op0, &op1); > + riscv_emit_int_compare (&code, &op0, &op1, need_eq_ne_p); > rtx cond = gen_rtx_fmt_ee (code, GET_MODE (op0), op0, op1); > > /* The expander allows (const_int 0) for CONS for the benefit of > diff --git a/gcc/testsuite/gcc.target/riscv/xtheadcondmov-indirect-rv32.c > b/gcc/testsuite/gcc.target/riscv/xtheadcondmov-indirect-rv32.c > index 9afdc2eabfd..e2b135f3d00 100644 > --- a/gcc/testsuite/gcc.target/riscv/xtheadcondmov-indirect-rv32.c > +++ b/gcc/testsuite/gcc.target/riscv/xtheadcondmov-indirect-rv32.c > @@ -1,15 +1,13 @@ > /* { dg-do compile } */ > /* { dg-options "-O2 -march=rv32gc_xtheadcondmov -mabi=ilp32 > -mriscv-attribute" } */ > -/* { dg-skip-if "" { *-*-* } { "-O0" "-Os" "-Og" } } */ > +/* { dg-skip-if "" { *-*-* } {"-O0" "-O1" "-Os" "-Og" "-O3" "-Oz" "-flto"} } > */ > /* { dg-final { check-function-bodies "**" "" } } */ > > /* > **ConEmv_imm_imm_reg: > ** addi a5,a0,-1000 > ** li a0,10 > -** th.mvnez a0,zero,a5 > -** th.mveqz a1,zero,a5 > -** or a0,a0,a1 > +** th.mvnez a0,a1,a5 > ** ret > */ > int ConEmv_imm_imm_reg(int x, int y){ > @@ -20,9 +18,8 @@ int ConEmv_imm_imm_reg(int x, int y){ > /* > **ConEmv_imm_reg_reg: > ** addi a5,a0,-1000 > -** th.mvnez a1,zero,a5 > -** th.mveqz a2,zero,a5 > -** or a0,a1,a2 > +** th.mveqz a2,a1,a5 > +** mv a0,a2 > ** ret > */ > int ConEmv_imm_reg_reg(int x, int y, int z){ > @@ -34,9 +31,7 @@ int ConEmv_imm_reg_reg(int x, int y, int z){ > **ConEmv_reg_imm_reg: > ** sub a1,a0,a1 > ** li a0,10 > -** th.mvnez a0,zero,a1 > -** th.mveqz a2,zero,a1 > -** or a0,a0,a2 > +** th.mvnez a0,a2,a1 > ** ret > */ > int ConEmv_reg_imm_reg(int x, int y, int z){ > @@ -47,9 +42,8 @@ int ConEmv_reg_imm_reg(int x, int y, int z){ > /* > **ConEmv_reg_reg_reg: > ** sub a1,a0,a1 > -** th.mvnez a2,zero,a1 > -** th.mveqz a3,zero,a1 > -** or a0,a2,a3 > +** th.mveqz a3,a2,a1 > +** mv a0,a3 > ** ret > */ > int ConEmv_reg_reg_reg(int x, int y, int z, int n){ > @@ -59,12 +53,10 @@ int ConEmv_reg_reg_reg(int x, int y, int z, int n){ > > /* > **ConNmv_imm_imm_reg: > -** li a5,9998336 > -** addi a4,a0,-1000 > -** addi a5,a5,1664 > -** th.mvnez a1,zero,a4 > -** th.mveqz a5,zero,a4 > -** or a0,a1,a5 > +** addi a5,a0,-1000 > +** li a0,9998336 > +** addi a0,a0,1664 > +** th.mveqz a0,a1,a5 > ** ret > */ > int ConNmv_imm_imm_reg(int x, int y){ > @@ -74,10 +66,9 @@ int ConNmv_imm_imm_reg(int x, int y){ > > /* > **ConNmv_imm_reg_reg: > -** addi a5,a0,-1000 > -** th.mveqz a1,zero,a5 > -** th.mvnez a2,zero,a5 > -** or a0,a1,a2 > +** addi a0,a0,-1000 > +** th.mvnez a2,a1,a0 > +** mv a0,a2 > ** ret > */ > int ConNmv_imm_reg_reg(int x, int y, int z){ > @@ -89,9 +80,7 @@ int ConNmv_imm_reg_reg(int x, int y, int z){ > **ConNmv_reg_imm_reg: > ** sub a1,a0,a1 > ** li a0,10 > -** th.mveqz a0,zero,a1 > -** th.mvnez a2,zero,a1 > -** or a0,a0,a2 > +** th.mveqz a0,a2,a1 > ** ret > */ > int ConNmv_reg_imm_reg(int x, int y, int z){ > @@ -101,10 +90,9 @@ int ConNmv_reg_imm_reg(int x, int y, int z){ > > /* > **ConNmv_reg_reg_reg: > -** sub a1,a0,a1 > -** th.mveqz a2,zero,a1 > -** th.mvnez a3,zero,a1 > -** or a0,a2,a3 > +** sub a0,a0,a1 > +** th.mvnez a3,a2,a0 > +** mv a0,a3 > ** ret > */ > int ConNmv_reg_reg_reg(int x, int y, int z, int n){ > diff --git a/gcc/testsuite/gcc.target/riscv/xtheadcondmov-indirect-rv64.c > b/gcc/testsuite/gcc.target/riscv/xtheadcondmov-indirect-rv64.c > index a1982fd90bd..99956f8496c 100644 > --- a/gcc/testsuite/gcc.target/riscv/xtheadcondmov-indirect-rv64.c > +++ b/gcc/testsuite/gcc.target/riscv/xtheadcondmov-indirect-rv64.c > @@ -1,15 +1,13 @@ > /* { dg-do compile } */ > /* { dg-options "-O2 -march=rv64gc_xtheadcondmov -mabi=lp64d > -mriscv-attribute" } */ > -/* { dg-skip-if "" { *-*-* } { "-O0" "-Os" "-Og" } } */ > +/* { dg-skip-if "" { *-*-* } {"-O0" "-O1" "-Os" "-Og" "-O3" "-Oz" "-flto"} } > */ > /* { dg-final { check-function-bodies "**" "" } } */ > > /* > **ConEmv_imm_imm_reg: > ** addi a5,a0,-1000 > ** li a0,10 > -** th.mvnez a0,zero,a5 > -** th.mveqz a1,zero,a5 > -** or a0,a0,a1 > +** th.mvnez a0,a1,a5 > ** ret > */ > int ConEmv_imm_imm_reg(int x, int y){ > @@ -19,10 +17,9 @@ int ConEmv_imm_imm_reg(int x, int y){ > > /* > **ConEmv_imm_reg_reg: > -** addi a5,a0,-1000 > -** th.mvnez a1,zero,a5 > -** th.mveqz a2,zero,a5 > -** or a0,a1,a2 > +** addi a0,a0,-1000 > +** th.mveqz a2,a1,a5 > +** mv a0,a2 > ** ret > */ > int ConEmv_imm_reg_reg(int x, int y, int z){ > @@ -34,9 +31,7 @@ int ConEmv_imm_reg_reg(int x, int y, int z){ > **ConEmv_reg_imm_reg: > ** sub a1,a0,a1 > ** li a0,10 > -** th.mvnez a0,zero,a1 > -** th.mveqz a2,zero,a1 > -** or a0,a0,a2 > +** th.mvnez a0,a2,a1 > ** ret > */ > int ConEmv_reg_imm_reg(int x, int y, int z){ > @@ -47,9 +42,8 @@ int ConEmv_reg_imm_reg(int x, int y, int z){ > /* > **ConEmv_reg_reg_reg: > ** sub a1,a0,a1 > -** th.mvnez a2,zero,a1 > -** th.mveqz a3,zero,a1 > -** or a0,a2,a3 > +** th.mveqz a3,a2,a1 > +** mv a0,a3 > ** ret > */ > int ConEmv_reg_reg_reg(int x, int y, int z, int n){ > @@ -59,12 +53,10 @@ int ConEmv_reg_reg_reg(int x, int y, int z, int n){ > > /* > **ConNmv_imm_imm_reg: > -** li a5,9998336 > -** addi a4,a0,-1000 > -** addi a5,a5,1664 > -** th.mvnez a1,zero,a4 > -** th.mveqz a5,zero,a4 > -** or a0,a1,a5 > +** addi a5,a0,-1000 > +** li a0,9998336 > +** addi a0,a0,1664 > +** th.mveqz a0,a1,a5 > ** ret > */ > int ConNmv_imm_imm_reg(int x, int y){ > @@ -75,9 +67,8 @@ int ConNmv_imm_imm_reg(int x, int y){ > /* > **ConNmv_imm_reg_reg: > ** addi a5,a0,-1000 > -** th.mveqz a1,zero,a5 > -** th.mvnez a2,zero,a5 > -** or a0,a1,a2 > +** th.mvnez a2,a1,a0 > +** mv a0,a2 > ** ret > */ > int ConNmv_imm_reg_reg(int x, int y, int z){ > @@ -89,9 +80,7 @@ int ConNmv_imm_reg_reg(int x, int y, int z){ > **ConNmv_reg_imm_reg: > ** sub a1,a0,a1 > ** li a0,10 > -** th.mveqz a0,zero,a1 > -** th.mvnez a2,zero,a1 > -** or a0,a0,a2 > +** th.mveqz a0,a2,a1 > ** ret > */ > int ConNmv_reg_imm_reg(int x, int y, int z){ > @@ -101,10 +90,9 @@ int ConNmv_reg_imm_reg(int x, int y, int z){ > > /* > **ConNmv_reg_reg_reg: > -** sub a1,a0,a1 > -** th.mveqz a2,zero,a1 > -** th.mvnez a3,zero,a1 > -** or a0,a2,a3 > +** sub a0,a0,a1 > +** th.mvnez a3,a2,a0 > +** mv a0,a3 > ** ret > */ > int ConNmv_reg_reg_reg(int x, int y, int z, int n){ > -- > 2.17.1 >