LGTM, thanks :)

On Thu, Jan 18, 2024 at 5:59 PM Juzhe-Zhong <juzhe.zh...@rivai.ai> wrote:
>
> While running various benchmarks, I notice we miss vi variant support for 
> integer comparison.
> That is, we can vectorize code into vadd.vi but we can't vectorize into 
> vmseq.vi.
>
> Consider this following case:
>
> void
> foo (int n, int **__restrict a)
> {
>   int b;
>   int c;
>   int d;
>   for (b = 0; b < n; b++)
>     for (long e = 8; e > 0; e--)
>       a[b][e] = a[b][e] == 15;
> }
>
> Before this patch:
>
>         vsetivli        zero,4,e32,m1,ta,ma
>         vmv.v.i v4,15
>         vmv.v.i v3,1
>         vmv.v.i v2,0
> .L3:
>         ld      a5,0(a1)
>         addi    a4,a5,4
>         addi    a5,a5,20
>         vle32.v v1,0(a5)
>         vle32.v v0,0(a4)
>         vmseq.vv        v0,v0,v4
>
> After this patch:
>
>         ld      a5,0(a1)
>         addi    a4,a5,4
>         addi    a5,a5,20
>         vle32.v v1,0(a5)
>         vle32.v v0,0(a4)
>         vmseq.vi        v0,v0,15
>
> It's the missing feature caused by our some mistakes, support vi variant for 
> vec_cmp like other patterns (add, sub, ..., etc).
>
> Tested with no regression, ok for trunk ?
>
> gcc/ChangeLog:
>
>         * config/riscv/autovec.md: Support vi variant.
>
> gcc/testsuite/ChangeLog:
>
>         * gcc.target/riscv/rvv/autovec/cmp/cmp_vi-1.c: New test.
>         * gcc.target/riscv/rvv/autovec/cmp/cmp_vi-2.c: New test.
>         * gcc.target/riscv/rvv/autovec/cmp/cmp_vi-3.c: New test.
>         * gcc.target/riscv/rvv/autovec/cmp/cmp_vi-4.c: New test.
>         * gcc.target/riscv/rvv/autovec/cmp/cmp_vi-5.c: New test.
>         * gcc.target/riscv/rvv/autovec/cmp/cmp_vi-6.c: New test.
>         * gcc.target/riscv/rvv/autovec/cmp/cmp_vi-7.c: New test.
>         * gcc.target/riscv/rvv/autovec/cmp/cmp_vi-8.c: New test.
>         * gcc.target/riscv/rvv/autovec/cmp/cmp_vi-9.c: New test.
>         * gcc.target/riscv/rvv/autovec/cmp/macro.h: New test.
>
> ---
>  gcc/config/riscv/autovec.md                   |  4 +--
>  .../riscv/rvv/autovec/cmp/cmp_vi-1.c          | 16 +++++++++++
>  .../riscv/rvv/autovec/cmp/cmp_vi-2.c          | 16 +++++++++++
>  .../riscv/rvv/autovec/cmp/cmp_vi-3.c          | 28 +++++++++++++++++++
>  .../riscv/rvv/autovec/cmp/cmp_vi-4.c          | 28 +++++++++++++++++++
>  .../riscv/rvv/autovec/cmp/cmp_vi-5.c          | 16 +++++++++++
>  .../riscv/rvv/autovec/cmp/cmp_vi-6.c          | 16 +++++++++++
>  .../riscv/rvv/autovec/cmp/cmp_vi-7.c          | 28 +++++++++++++++++++
>  .../riscv/rvv/autovec/cmp/cmp_vi-8.c          | 28 +++++++++++++++++++
>  .../riscv/rvv/autovec/cmp/cmp_vi-9.c          | 18 ++++++++++++
>  .../gcc.target/riscv/rvv/autovec/cmp/macro.h  | 11 ++++++++
>  11 files changed, 207 insertions(+), 2 deletions(-)
>  create mode 100644 gcc/testsuite/gcc.target/riscv/rvv/autovec/cmp/cmp_vi-1.c
>  create mode 100644 gcc/testsuite/gcc.target/riscv/rvv/autovec/cmp/cmp_vi-2.c
>  create mode 100644 gcc/testsuite/gcc.target/riscv/rvv/autovec/cmp/cmp_vi-3.c
>  create mode 100644 gcc/testsuite/gcc.target/riscv/rvv/autovec/cmp/cmp_vi-4.c
>  create mode 100644 gcc/testsuite/gcc.target/riscv/rvv/autovec/cmp/cmp_vi-5.c
>  create mode 100644 gcc/testsuite/gcc.target/riscv/rvv/autovec/cmp/cmp_vi-6.c
>  create mode 100644 gcc/testsuite/gcc.target/riscv/rvv/autovec/cmp/cmp_vi-7.c
>  create mode 100644 gcc/testsuite/gcc.target/riscv/rvv/autovec/cmp/cmp_vi-8.c
>  create mode 100644 gcc/testsuite/gcc.target/riscv/rvv/autovec/cmp/cmp_vi-9.c
>  create mode 100644 gcc/testsuite/gcc.target/riscv/rvv/autovec/cmp/macro.h
>
> diff --git a/gcc/config/riscv/autovec.md b/gcc/config/riscv/autovec.md
> index 706cd9717cb..5ec1c59bdd4 100644
> --- a/gcc/config/riscv/autovec.md
> +++ b/gcc/config/riscv/autovec.md
> @@ -664,7 +664,7 @@
>    [(set (match_operand:<VM> 0 "register_operand")
>         (match_operator:<VM> 1 "comparison_operator"
>           [(match_operand:V_VLSI 2 "register_operand")
> -          (match_operand:V_VLSI 3 "register_operand")]))]
> +          (match_operand:V_VLSI 3 "nonmemory_operand")]))]
>    "TARGET_VECTOR"
>    {
>      riscv_vector::expand_vec_cmp (operands[0], GET_CODE (operands[1]),
> @@ -677,7 +677,7 @@
>    [(set (match_operand:<VM> 0 "register_operand")
>         (match_operator:<VM> 1 "comparison_operator"
>           [(match_operand:V_VLSI 2 "register_operand")
> -          (match_operand:V_VLSI 3 "register_operand")]))]
> +          (match_operand:V_VLSI 3 "nonmemory_operand")]))]
>    "TARGET_VECTOR"
>    {
>      riscv_vector::expand_vec_cmp (operands[0], GET_CODE (operands[1]),
> diff --git a/gcc/testsuite/gcc.target/riscv/rvv/autovec/cmp/cmp_vi-1.c 
> b/gcc/testsuite/gcc.target/riscv/rvv/autovec/cmp/cmp_vi-1.c
> new file mode 100644
> index 00000000000..10c232f77bd
> --- /dev/null
> +++ b/gcc/testsuite/gcc.target/riscv/rvv/autovec/cmp/cmp_vi-1.c
> @@ -0,0 +1,16 @@
> +/* { dg-do compile } */
> +/* { dg-options "-march=rv64gcv -mabi=lp64d -O3" } */
> +
> +#include "macro.h"
> +
> +CMP_VI (ne_char, char, n, !=, 15)
> +CMP_VI (ne_short, short, n, !=, 15)
> +CMP_VI (ne_int, int, n, !=, 15)
> +CMP_VI (ne_long, long, n, !=, 15)
> +CMP_VI (ne_unsigned_char, unsigned char, n, !=, 15)
> +CMP_VI (ne_unsigned_short, unsigned short, n, !=, 15)
> +CMP_VI (ne_unsigned_int, unsigned int, n, !=, 15)
> +CMP_VI (ne_unsigned_long, unsigned long, n, !=, 15)
> +
> +/* { dg-final { scan-assembler-times {vmsne\.vi} 16 } } */
> +/* { dg-final { scan-assembler-not {vmsne\.vv} } } */
> diff --git a/gcc/testsuite/gcc.target/riscv/rvv/autovec/cmp/cmp_vi-2.c 
> b/gcc/testsuite/gcc.target/riscv/rvv/autovec/cmp/cmp_vi-2.c
> new file mode 100644
> index 00000000000..92bea596cd8
> --- /dev/null
> +++ b/gcc/testsuite/gcc.target/riscv/rvv/autovec/cmp/cmp_vi-2.c
> @@ -0,0 +1,16 @@
> +/* { dg-do compile } */
> +/* { dg-options "-march=rv64gcv -mabi=lp64d -O3" } */
> +
> +#include "macro.h"
> +
> +CMP_VI (ne_char, char, n, !=, -16)
> +CMP_VI (ne_short, short, n, !=, -16)
> +CMP_VI (ne_int, int, n, !=, -16)
> +CMP_VI (ne_long, long, n, !=, -16)
> +CMP_VI (ne_unsigned_char, unsigned char, n, !=, -16)
> +CMP_VI (ne_unsigned_short, unsigned short, n, !=, -16)
> +CMP_VI (ne_unsigned_int, unsigned int, n, !=, -16)
> +CMP_VI (ne_unsigned_long, unsigned long, n, !=, -16)
> +
> +/* { dg-final { scan-assembler-times {vmsne\.vi} 13 } } */
> +/* { dg-final { scan-assembler-not {vmsne\.vv} } } */
> diff --git a/gcc/testsuite/gcc.target/riscv/rvv/autovec/cmp/cmp_vi-3.c 
> b/gcc/testsuite/gcc.target/riscv/rvv/autovec/cmp/cmp_vi-3.c
> new file mode 100644
> index 00000000000..c9003279b0c
> --- /dev/null
> +++ b/gcc/testsuite/gcc.target/riscv/rvv/autovec/cmp/cmp_vi-3.c
> @@ -0,0 +1,28 @@
> +/* { dg-do compile } */
> +/* { dg-options "-march=rv64gcv -mabi=lp64d -O3 
> --param=riscv-autovec-lmul=dynamic -fdump-tree-optimized-details" } */
> +
> +#include "macro.h"
> +
> +CMP_VI (ne_char, char, 4, !=, 15)
> +CMP_VI (ne_short, short, 4, !=, 15)
> +CMP_VI (ne_int, int, 4, !=, 15)
> +CMP_VI (ne_long, long, 4, !=, 15)
> +CMP_VI (ne_unsigned_char, unsigned char, 4, !=, 15)
> +CMP_VI (ne_unsigned_short, unsigned short, 4, !=, 15)
> +CMP_VI (ne_unsigned_int, unsigned int, 4, !=, 15)
> +CMP_VI (ne_unsigned_long, unsigned long, 4, !=, 15)
> +
> +/* { dg-final { scan-assembler-times {vmsne\.vi} 32 } } */
> +/* { dg-final { scan-assembler-not {vmsne\.vv} } } */
> +/* { dg-final { scan-tree-dump-not "1,1" "optimized" } } */
> +/* { dg-final { scan-tree-dump-not "2,2" "optimized" } } */
> +/* { dg-final { scan-tree-dump-not "4,4" "optimized" } } */
> +/* { dg-final { scan-tree-dump-not "16,16" "optimized" } } */
> +/* { dg-final { scan-tree-dump-not "32,32" "optimized" } } */
> +/* { dg-final { scan-tree-dump-not "64,64" "optimized" } } */
> +/* { dg-final { scan-tree-dump-not "128,128" "optimized" } } */
> +/* { dg-final { scan-tree-dump-not "256,256" "optimized" } } */
> +/* { dg-final { scan-tree-dump-not "512,512" "optimized" } } */
> +/* { dg-final { scan-tree-dump-not "1024,1024" "optimized" } } */
> +/* { dg-final { scan-tree-dump-not "2048,2048" "optimized" } } */
> +/* { dg-final { scan-tree-dump-not "4096,4096" "optimized" } } */
> diff --git a/gcc/testsuite/gcc.target/riscv/rvv/autovec/cmp/cmp_vi-4.c 
> b/gcc/testsuite/gcc.target/riscv/rvv/autovec/cmp/cmp_vi-4.c
> new file mode 100644
> index 00000000000..544ff751522
> --- /dev/null
> +++ b/gcc/testsuite/gcc.target/riscv/rvv/autovec/cmp/cmp_vi-4.c
> @@ -0,0 +1,28 @@
> +/* { dg-do compile } */
> +/* { dg-options "-march=rv64gcv -mabi=lp64d -O3 
> --param=riscv-autovec-lmul=dynamic -fdump-tree-optimized-details" } */
> +
> +#include "macro.h"
> +
> +CMP_VI (ne_char, char, 4, !=, -16)
> +CMP_VI (ne_short, short, 4, !=, -16)
> +CMP_VI (ne_int, int, 4, !=, -16)
> +CMP_VI (ne_long, long, 4, !=, -16)
> +CMP_VI (ne_unsigned_char, unsigned char, 4, !=, -16)
> +CMP_VI (ne_unsigned_short, unsigned short, 4, !=, -16)
> +CMP_VI (ne_unsigned_int, unsigned int, 4, !=, -16)
> +CMP_VI (ne_unsigned_long, unsigned long, 4, !=, -16)
> +
> +/* { dg-final { scan-assembler-times {vmsne\.vi} 20 } } */
> +/* { dg-final { scan-assembler-not {vmsne\.vv} } } */
> +/* { dg-final { scan-tree-dump-not "1,1" "optimized" } } */
> +/* { dg-final { scan-tree-dump-not "2,2" "optimized" } } */
> +/* { dg-final { scan-tree-dump-not "4,4" "optimized" } } */
> +/* { dg-final { scan-tree-dump-not "16,16" "optimized" } } */
> +/* { dg-final { scan-tree-dump-not "32,32" "optimized" } } */
> +/* { dg-final { scan-tree-dump-not "64,64" "optimized" } } */
> +/* { dg-final { scan-tree-dump-not "128,128" "optimized" } } */
> +/* { dg-final { scan-tree-dump-not "256,256" "optimized" } } */
> +/* { dg-final { scan-tree-dump-not "512,512" "optimized" } } */
> +/* { dg-final { scan-tree-dump-not "1024,1024" "optimized" } } */
> +/* { dg-final { scan-tree-dump-not "2048,2048" "optimized" } } */
> +/* { dg-final { scan-tree-dump-not "4096,4096" "optimized" } } */
> diff --git a/gcc/testsuite/gcc.target/riscv/rvv/autovec/cmp/cmp_vi-5.c 
> b/gcc/testsuite/gcc.target/riscv/rvv/autovec/cmp/cmp_vi-5.c
> new file mode 100644
> index 00000000000..b7a5a4397c1
> --- /dev/null
> +++ b/gcc/testsuite/gcc.target/riscv/rvv/autovec/cmp/cmp_vi-5.c
> @@ -0,0 +1,16 @@
> +/* { dg-do compile } */
> +/* { dg-options "-march=rv64gcv -mabi=lp64d -O3" } */
> +
> +#include "macro.h"
> +
> +CMP_VI (eq_char, char, n, ==, 15)
> +CMP_VI (eq_short, short, n, ==, 15)
> +CMP_VI (eq_int, int, n, ==, 15)
> +CMP_VI (eq_long, long, n, ==, 15)
> +CMP_VI (eq_unsigned_char, unsigned char, n, ==, 15)
> +CMP_VI (eq_unsigned_short, unsigned short, n, ==, 15)
> +CMP_VI (eq_unsigned_int, unsigned int, n, ==, 15)
> +CMP_VI (eq_unsigned_long, unsigned long, n, ==, 15)
> +
> +/* { dg-final { scan-assembler-times {vmseq\.vi} 16 } } */
> +/* { dg-final { scan-assembler-not {vmseq\.vv} } } */
> diff --git a/gcc/testsuite/gcc.target/riscv/rvv/autovec/cmp/cmp_vi-6.c 
> b/gcc/testsuite/gcc.target/riscv/rvv/autovec/cmp/cmp_vi-6.c
> new file mode 100644
> index 00000000000..f297ac80bbd
> --- /dev/null
> +++ b/gcc/testsuite/gcc.target/riscv/rvv/autovec/cmp/cmp_vi-6.c
> @@ -0,0 +1,16 @@
> +/* { dg-do compile } */
> +/* { dg-options "-march=rv64gcv -mabi=lp64d -O3" } */
> +
> +#include "macro.h"
> +
> +CMP_VI (eq_char, char, n, ==, -16)
> +CMP_VI (eq_short, short, n, ==, -16)
> +CMP_VI (eq_int, int, n, ==, -16)
> +CMP_VI (eq_long, long, n, ==, -16)
> +CMP_VI (eq_unsigned_char, unsigned char, n, ==, -16)
> +CMP_VI (eq_unsigned_short, unsigned short, n, ==, -16)
> +CMP_VI (eq_unsigned_int, unsigned int, n, ==, -16)
> +CMP_VI (eq_unsigned_long, unsigned long, n, ==, -16)
> +
> +/* { dg-final { scan-assembler-times {vmseq\.vi} 13 } } */
> +/* { dg-final { scan-assembler-not {vmseq\.vv} } } */
> diff --git a/gcc/testsuite/gcc.target/riscv/rvv/autovec/cmp/cmp_vi-7.c 
> b/gcc/testsuite/gcc.target/riscv/rvv/autovec/cmp/cmp_vi-7.c
> new file mode 100644
> index 00000000000..63ded00947d
> --- /dev/null
> +++ b/gcc/testsuite/gcc.target/riscv/rvv/autovec/cmp/cmp_vi-7.c
> @@ -0,0 +1,28 @@
> +/* { dg-do compile } */
> +/* { dg-options "-march=rv64gcv -mabi=lp64d -O3 
> --param=riscv-autovec-lmul=dynamic -fdump-tree-optimized-details" } */
> +
> +#include "macro.h"
> +
> +CMP_VI (eq_char, char, 4, ==, 15)
> +CMP_VI (eq_short, short, 4, ==, 15)
> +CMP_VI (eq_int, int, 4, ==, 15)
> +CMP_VI (eq_long, long, 4, ==, 15)
> +CMP_VI (eq_unsigned_char, unsigned char, 4, ==, 15)
> +CMP_VI (eq_unsigned_short, unsigned short, 4, ==, 15)
> +CMP_VI (eq_unsigned_int, unsigned int, 4, ==, 15)
> +CMP_VI (eq_unsigned_long, unsigned long, 4, ==, 15)
> +
> +/* { dg-final { scan-assembler-times {vmseq\.vi} 32 } } */
> +/* { dg-final { scan-assembler-not {vmseq\.vv} } } */
> +/* { dg-final { scan-tree-dump-not "1,1" "optimized" } } */
> +/* { dg-final { scan-tree-dump-not "2,2" "optimized" } } */
> +/* { dg-final { scan-tree-dump-not "4,4" "optimized" } } */
> +/* { dg-final { scan-tree-dump-not "16,16" "optimized" } } */
> +/* { dg-final { scan-tree-dump-not "32,32" "optimized" } } */
> +/* { dg-final { scan-tree-dump-not "64,64" "optimized" } } */
> +/* { dg-final { scan-tree-dump-not "128,128" "optimized" } } */
> +/* { dg-final { scan-tree-dump-not "256,256" "optimized" } } */
> +/* { dg-final { scan-tree-dump-not "512,512" "optimized" } } */
> +/* { dg-final { scan-tree-dump-not "1024,1024" "optimized" } } */
> +/* { dg-final { scan-tree-dump-not "2048,2048" "optimized" } } */
> +/* { dg-final { scan-tree-dump-not "4096,4096" "optimized" } } */
> diff --git a/gcc/testsuite/gcc.target/riscv/rvv/autovec/cmp/cmp_vi-8.c 
> b/gcc/testsuite/gcc.target/riscv/rvv/autovec/cmp/cmp_vi-8.c
> new file mode 100644
> index 00000000000..f29b5f12c51
> --- /dev/null
> +++ b/gcc/testsuite/gcc.target/riscv/rvv/autovec/cmp/cmp_vi-8.c
> @@ -0,0 +1,28 @@
> +/* { dg-do compile } */
> +/* { dg-options "-march=rv64gcv -mabi=lp64d -O3 
> --param=riscv-autovec-lmul=dynamic -fdump-tree-optimized-details" } */
> +
> +#include "macro.h"
> +
> +CMP_VI (eq_char, char, 4, ==, -16)
> +CMP_VI (eq_short, short, 4, ==, -16)
> +CMP_VI (eq_int, int, 4, ==, -16)
> +CMP_VI (eq_long, long, 4, ==, -16)
> +CMP_VI (eq_unsigned_char, unsigned char, 4, ==, -16)
> +CMP_VI (eq_unsigned_short, unsigned short, 4, ==, -16)
> +CMP_VI (eq_unsigned_int, unsigned int, 4, ==, -16)
> +CMP_VI (eq_unsigned_long, unsigned long, 4, ==, -16)
> +
> +/* { dg-final { scan-assembler-times {vmseq\.vi} 20 } } */
> +/* { dg-final { scan-assembler-not {vmseq\.vv} } } */
> +/* { dg-final { scan-tree-dump-not "1,1" "optimized" } } */
> +/* { dg-final { scan-tree-dump-not "2,2" "optimized" } } */
> +/* { dg-final { scan-tree-dump-not "4,4" "optimized" } } */
> +/* { dg-final { scan-tree-dump-not "16,16" "optimized" } } */
> +/* { dg-final { scan-tree-dump-not "32,32" "optimized" } } */
> +/* { dg-final { scan-tree-dump-not "64,64" "optimized" } } */
> +/* { dg-final { scan-tree-dump-not "128,128" "optimized" } } */
> +/* { dg-final { scan-tree-dump-not "256,256" "optimized" } } */
> +/* { dg-final { scan-tree-dump-not "512,512" "optimized" } } */
> +/* { dg-final { scan-tree-dump-not "1024,1024" "optimized" } } */
> +/* { dg-final { scan-tree-dump-not "2048,2048" "optimized" } } */
> +/* { dg-final { scan-tree-dump-not "4096,4096" "optimized" } } */
> diff --git a/gcc/testsuite/gcc.target/riscv/rvv/autovec/cmp/cmp_vi-9.c 
> b/gcc/testsuite/gcc.target/riscv/rvv/autovec/cmp/cmp_vi-9.c
> new file mode 100644
> index 00000000000..bfc1a68a1e4
> --- /dev/null
> +++ b/gcc/testsuite/gcc.target/riscv/rvv/autovec/cmp/cmp_vi-9.c
> @@ -0,0 +1,18 @@
> +/* { dg-do compile } */
> +/* { dg-options "-march=rv64gcv -mabi=lp64d -O3" } */
> +
> +#include "macro.h"
> +
> +CMP_VI (le_char, char, n, <=, 15)
> +CMP_VI (le_short, short, n, <=, 15)
> +CMP_VI (le_int, int, n, <=, 15)
> +CMP_VI (le_long, long, n, <=, 15)
> +CMP_VI (le_unsigned_char, unsigned char, n, <=, 15)
> +CMP_VI (le_unsigned_short, unsigned short, n, <=, 15)
> +CMP_VI (le_unsigned_int, unsigned int, n, <=, 15)
> +CMP_VI (le_unsigned_long, unsigned long, n, <=, 15)
> +
> +/* { dg-final { scan-assembler-times {vmsle\.vi} 7 } } */
> +/* { dg-final { scan-assembler-times {vmsleu\.vi} 9 } } */
> +/* { dg-final { scan-assembler-not {vmsle\.vv} } } */
> +/* { dg-final { scan-assembler-not {vmsleu\.vv} } } */
> diff --git a/gcc/testsuite/gcc.target/riscv/rvv/autovec/cmp/macro.h 
> b/gcc/testsuite/gcc.target/riscv/rvv/autovec/cmp/macro.h
> new file mode 100644
> index 00000000000..3fe6ee89a99
> --- /dev/null
> +++ b/gcc/testsuite/gcc.target/riscv/rvv/autovec/cmp/macro.h
> @@ -0,0 +1,11 @@
> +#define CMP_VI(NAME, TYPE, NITERS, OP, IMM)                                  
>   \
> +  void NAME (int n, TYPE **__restrict a)                                     
>   \
> +  {                                                                          
>   \
> +    int b;                                                                   
>   \
> +    int c;                                                                   
>   \
> +    int d;                                                                   
>   \
> +    for (b = 0; b < NITERS; b++)                                             
>   \
> +      for (int e = 8; e > 0; e--)                                            
>   \
> +       a[b][e] = a[b][e] OP IMM;                                             
>  \
> +  }
> +
> --
> 2.36.3
>

Reply via email to