On Thu, Nov 13, 2025 at 2:22 PM liuhongt <[email protected]> wrote:
>
> For instruction sequence like
>         kmovb   %k0, %edx
>         kmovb   %k1, %ecx
>         orb     %cl, %dl
>         je      .L5
>
> if only CCZ is cared about, it can be optimized to
>
>         kortestb %k1, %k0
>         je      .L5
>
> Bootstrapped and regtested on x86_64-pc-linux-gnu{-m32}.
> Ready to push to trunk.
>
> gcc/ChangeLog:
>
>         * config/i386/i386.md (*ior<mode>_ccz_1): New define_insn.
>
> gcc/testsuite/ChangeLog:
>
>         * gcc.target/i386/kortest_ccz-1.c: New test.
> ---
>  gcc/config/i386/i386.md                       | 16 ++++++++++++++++
>  gcc/testsuite/gcc.target/i386/kortest_ccz-1.c | 13 +++++++++++++
>  2 files changed, 29 insertions(+)
>  create mode 100644 gcc/testsuite/gcc.target/i386/kortest_ccz-1.c
>
> diff --git a/gcc/config/i386/i386.md b/gcc/config/i386/i386.md
> index 3ea2439526b..ae26ef02c22 100644
> --- a/gcc/config/i386/i386.md
> +++ b/gcc/config/i386/i386.md
> @@ -14203,6 +14203,22 @@ (define_insn "*<code>si_2_zext_imm"
>     (set_attr "isa" "*,apx_ndd")
>     (set_attr "mode" "SI")])
>
> +;; It must be put before *<code><mode>_3, the one below.
> +(define_insn "*ior<mode>_ccz_1"
> +  [(set (reg:CCZ FLAGS_REG)
> +       (compare:CCZ
> +        (ior:SWI1248_AVX512BWDQ_64
> +         (match_operand:SWI1248_AVX512BWDQ_64 1 "nonimmediate_operand" 
> "%0,?k")
> +         (match_operand:SWI1248_AVX512BWDQ_64 2 "<general_operand>" "<g>, 
> k"))
> +        (const_int 0)))
> +   (clobber (match_scratch:SWI1248_AVX512BWDQ_64 0 "=<r>, k"))]
> +  "TARGET_AVX512F && !(MEM_P (operands[1]) && MEM_P (operands[2]))"
> +  "@
> +   or{<imodesuffix>}\t{%2, %0|%0, %2}
> +   kortest<mskmodesuffix>\t{%1, %2|%2, %1}"
> +  [(set_attr "type" "alu,msklog")
> +   (set_attr "mode" "<MODE>")])
> +
>  (define_insn "*<code><mode>_3"
>    [(set (reg FLAGS_REG)
>         (compare (any_or:SWI
> diff --git a/gcc/testsuite/gcc.target/i386/kortest_ccz-1.c 
> b/gcc/testsuite/gcc.target/i386/kortest_ccz-1.c
> new file mode 100644
> index 00000000000..0f8d4bf9f22
> --- /dev/null
> +++ b/gcc/testsuite/gcc.target/i386/kortest_ccz-1.c
> @@ -0,0 +1,13 @@
> +/* { dg-do compile } */
> +/* { dg-options "-march=x86-64-v4 -O3" } */
> +/* { dg-final { scan-assembler-not "kmov" } } */
> +/* { dg-final { scan-assembler "kortest" } } */
> +
> +int
> +foo (int *__restrict a, int* __restrict d, int b, int c, int n)
> +{
> +  for (int i = 0; i != 10000; i++)
> +    if (a[i] > b || d[i] > c)
There's a typo here; it should be | instead of ||.
> +      return 1;
> +  return 0;
> +}
> --
> 2.34.1
>


-- 
BR,
Hongtao

Reply via email to