Register the target specific builtins in `aarch64-simd-builtins.def' and implement their associated backend patterns in `aarch64-simd.md'.
gcc/ChangeLog: * config/aarch64/aarch64-simd-builtins.def (vec_ldap1_lane): New. (vec_stl1_lane): Likewise. * config/aarch64/aarch64-simd.md (aarch64_vec_stl1_lanes<mode>_lane<Vel>): New. (aarch64_vec_stl1_lane<mode>): Likewise. (aarch64_vec_ldap1_lanes<mode>_lane<Vel>): Likewise. (aarch64_vec_ldap1_lane<mode>): Likewise. --- gcc/config/aarch64/aarch64-simd-builtins.def | 7 +++ gcc/config/aarch64/aarch64-simd.md | 65 ++++++++++++++++++++ gcc/config/aarch64/aarch64.md | 2 + 3 files changed, 74 insertions(+) diff --git a/gcc/config/aarch64/aarch64-simd-builtins.def b/gcc/config/aarch64/aarch64-simd-builtins.def index e2b94ad8247..0ae6c4ad41a 100644 --- a/gcc/config/aarch64/aarch64-simd-builtins.def +++ b/gcc/config/aarch64/aarch64-simd-builtins.def @@ -43,6 +43,13 @@ help describe the attributes (for example, pure) for the intrinsic function. */ + BUILTIN_V12DIF (LOADSTRUCT_LANE, vec_ldap1_lane, 0, ALL) + BUILTIN_V12DIUP (LOADSTRUCT_LANE_U, vec_ldap1_lane, 0, ALL) + BUILTIN_V12DIUP (LOADSTRUCT_LANE_P, vec_ldap1_lane, 0, ALL) + BUILTIN_V12DIF (STORESTRUCT_LANE, vec_stl1_lane, 0, ALL) + BUILTIN_V12DIUP (STORESTRUCT_LANE_U, vec_stl1_lane, 0, ALL) + BUILTIN_V12DIUP (STORESTRUCT_LANE_P, vec_stl1_lane, 0, ALL) + BUILTIN_VDC (BINOP, combine, 0, AUTO_FP) BUILTIN_VD_I (BINOPU, combine, 0, NONE) BUILTIN_VDC_P (BINOPP, combine, 0, NONE) diff --git a/gcc/config/aarch64/aarch64-simd.md b/gcc/config/aarch64/aarch64-simd.md index 81ff5bad03d..79697336f61 100644 --- a/gcc/config/aarch64/aarch64-simd.md +++ b/gcc/config/aarch64/aarch64-simd.md @@ -7697,6 +7697,71 @@ DONE; }) +;; Patterns for rcpc3 vector lane loads and stores. + +(define_insn "aarch64_vec_stl1_lanes<mode>_lane<Vel>" + [(set (match_operand:BLK 0 "aarch64_simd_struct_operand" "=Q") + (unspec:BLK [(match_operand:V12DIF 1 "register_operand" "w") + (match_operand:SI 2 "immediate_operand" "i")] + UNSPEC_STL1_LANE))] + "TARGET_RCPC3" + { + operands[2] = aarch64_endian_lane_rtx (<MODE>mode, + INTVAL (operands[2])); + return "stl1\\t{%S1.<Vetype>}[%2], %0"; + } + [(set_attr "type" "neon_store2_one_lane")] +) + +(define_expand "aarch64_vec_stl1_lane<mode>" + [(match_operand:DI 0 "register_operand") + (match_operand:V12DIF 1 "register_operand") + (match_operand:SI 2 "immediate_operand")] + "TARGET_RCPC3" +{ + rtx mem = gen_rtx_MEM (BLKmode, operands[0]); + set_mem_size (mem, GET_MODE_SIZE (GET_MODE_INNER (<MODE>mode))); + + aarch64_simd_lane_bounds (operands[2], 0, + GET_MODE_NUNITS (<MODE>mode).to_constant (), NULL); + emit_insn (gen_aarch64_vec_stl1_lanes<mode>_lane<Vel> (mem, + operands[1], operands[2])); + DONE; +}) + +(define_insn "aarch64_vec_ldap1_lanes<mode>_lane<Vel>" + [(set (match_operand:V12DIF 0 "register_operand" "=w") + (unspec:V12DIF [ + (match_operand:BLK 1 "aarch64_simd_struct_operand" "Q") + (match_operand:V12DIF 2 "register_operand" "0") + (match_operand:SI 3 "immediate_operand" "i")] + UNSPEC_LDAP1_LANE))] + "TARGET_RCPC3" + { + operands[3] = aarch64_endian_lane_rtx (<MODE>mode, + INTVAL (operands[3])); + return "ldap1\\t{%S0.<Vetype>}[%3], %1"; + } + [(set_attr "type" "neon_load2_one_lane")] +) + +(define_expand "aarch64_vec_ldap1_lane<mode>" + [(match_operand:V12DIF 0 "register_operand") + (match_operand:DI 1 "register_operand") + (match_operand:V12DIF 2 "register_operand") + (match_operand:SI 3 "immediate_operand")] + "TARGET_RCPC3" +{ + rtx mem = gen_rtx_MEM (BLKmode, operands[1]); + set_mem_size (mem, GET_MODE_SIZE (GET_MODE_INNER (<MODE>mode))); + + aarch64_simd_lane_bounds (operands[3], 0, + GET_MODE_NUNITS (<MODE>mode).to_constant (), NULL); + emit_insn (gen_aarch64_vec_ldap1_lanes<mode>_lane<Vel> (operands[0], + mem, operands[2], operands[3])); + DONE; +}) + (define_insn_and_split "aarch64_rev_reglist<mode>" [(set (match_operand:VSTRUCT_QD 0 "register_operand" "=&w") (unspec:VSTRUCT_QD diff --git a/gcc/config/aarch64/aarch64.md b/gcc/config/aarch64/aarch64.md index 5bb8c772be8..fb6de3b1fbf 100644 --- a/gcc/config/aarch64/aarch64.md +++ b/gcc/config/aarch64/aarch64.md @@ -295,6 +295,8 @@ UNSPEC_LD1RO UNSPEC_SALT_ADDR UNSPECV_PATCHABLE_AREA + UNSPEC_LDAP1_LANE + UNSPEC_STL1_LANE ]) (define_c_enum "unspecv" [ -- 2.41.0