Re: [Qemu-devel] [PATCH 6/9] tcg/arm: Support INDEX_op_extract2_i32

2019-03-08 Thread Philippe Mathieu-Daudé
On 3/7/19 3:41 PM, Richard Henderson wrote:
> Signed-off-by: Richard Henderson 
> ---
>  tcg/arm/tcg-target.h |  2 +-
>  tcg/arm/tcg-target.inc.c | 25 +
>  2 files changed, 26 insertions(+), 1 deletion(-)
> 
> diff --git a/tcg/arm/tcg-target.h b/tcg/arm/tcg-target.h
> index 4ee6c98958..17e771374d 100644
> --- a/tcg/arm/tcg-target.h
> +++ b/tcg/arm/tcg-target.h
> @@ -116,7 +116,7 @@ extern bool use_idiv_instructions;
>  #define TCG_TARGET_HAS_deposit_i32  use_armv7_instructions
>  #define TCG_TARGET_HAS_extract_i32  use_armv7_instructions
>  #define TCG_TARGET_HAS_sextract_i32 use_armv7_instructions
> -#define TCG_TARGET_HAS_extract2_i32 0
> +#define TCG_TARGET_HAS_extract2_i32 1
>  #define TCG_TARGET_HAS_movcond_i32  1
>  #define TCG_TARGET_HAS_mulu2_i321
>  #define TCG_TARGET_HAS_muls2_i321
> diff --git a/tcg/arm/tcg-target.inc.c b/tcg/arm/tcg-target.inc.c
> index 2245a8aeb9..6873b0cf95 100644
> --- a/tcg/arm/tcg-target.inc.c
> +++ b/tcg/arm/tcg-target.inc.c
> @@ -2064,6 +2064,27 @@ static inline void tcg_out_op(TCGContext *s, TCGOpcode 
> opc,
>  case INDEX_op_sextract_i32:
>  tcg_out_sextract(s, COND_AL, args[0], args[1], args[2], args[3]);
>  break;
> +case INDEX_op_extract2_i32:
> +/* ??? These optimization vs zero should be generic.  */
> +/* ??? But we can't substitute 2 for 1 in the opcode stream yet.  */
> +if (const_args[1]) {
> +if (const_args[2]) {
> +tcg_out_movi(s, TCG_TYPE_REG, args[0], 0);
> +} else {
> +tcg_out_dat_reg(s, COND_AL, ARITH_MOV, args[0], 0,
> +args[2], SHIFT_IMM_LSL(32 - args[3]));
> +}
> +} else if (const_args[2]) {
> +tcg_out_dat_reg(s, COND_AL, ARITH_MOV, args[0], 0,
> +args[1], SHIFT_IMM_LSR(args[3]));
> +} else {
> +/* We can do extract2 in 2 insns, vs the 3 required otherwise.  
> */
> +tcg_out_dat_reg(s, COND_AL, ARITH_MOV, TCG_REG_TMP, 0,
> +args[2], SHIFT_IMM_LSL(32 - args[3]));
> +tcg_out_dat_reg(s, COND_AL, ARITH_ORR, args[0], TCG_REG_TMP,
> +args[1], SHIFT_IMM_LSR(args[3]));
> +}

Reviewed-by: Philippe Mathieu-Daudé 

> +break;
>  
>  case INDEX_op_div_i32:
>  tcg_out_sdiv(s, COND_AL, args[0], args[1], args[2]);
> @@ -2108,6 +2129,8 @@ static const TCGTargetOpDef 
> *tcg_target_op_def(TCGOpcode op)
>  = { .args_ct_str = { "s", "s", "s", "s" } };
>  static const TCGTargetOpDef br
>  = { .args_ct_str = { "r", "rIN" } };
> +static const TCGTargetOpDef ext2
> += { .args_ct_str = { "r", "rZ", "rZ" } };
>  static const TCGTargetOpDef dep
>  = { .args_ct_str = { "r", "0", "rZ" } };
>  static const TCGTargetOpDef movc
> @@ -2174,6 +2197,8 @@ static const TCGTargetOpDef 
> *tcg_target_op_def(TCGOpcode op)
>  return 
>  case INDEX_op_deposit_i32:
>  return 
> +case INDEX_op_extract2_i32:
> +return 
>  case INDEX_op_movcond_i32:
>  return 
>  case INDEX_op_add2_i32:
> 



[Qemu-devel] [PATCH 6/9] tcg/arm: Support INDEX_op_extract2_i32

2019-03-07 Thread Richard Henderson
Signed-off-by: Richard Henderson 
---
 tcg/arm/tcg-target.h |  2 +-
 tcg/arm/tcg-target.inc.c | 25 +
 2 files changed, 26 insertions(+), 1 deletion(-)

diff --git a/tcg/arm/tcg-target.h b/tcg/arm/tcg-target.h
index 4ee6c98958..17e771374d 100644
--- a/tcg/arm/tcg-target.h
+++ b/tcg/arm/tcg-target.h
@@ -116,7 +116,7 @@ extern bool use_idiv_instructions;
 #define TCG_TARGET_HAS_deposit_i32  use_armv7_instructions
 #define TCG_TARGET_HAS_extract_i32  use_armv7_instructions
 #define TCG_TARGET_HAS_sextract_i32 use_armv7_instructions
-#define TCG_TARGET_HAS_extract2_i32 0
+#define TCG_TARGET_HAS_extract2_i32 1
 #define TCG_TARGET_HAS_movcond_i32  1
 #define TCG_TARGET_HAS_mulu2_i321
 #define TCG_TARGET_HAS_muls2_i321
diff --git a/tcg/arm/tcg-target.inc.c b/tcg/arm/tcg-target.inc.c
index 2245a8aeb9..6873b0cf95 100644
--- a/tcg/arm/tcg-target.inc.c
+++ b/tcg/arm/tcg-target.inc.c
@@ -2064,6 +2064,27 @@ static inline void tcg_out_op(TCGContext *s, TCGOpcode 
opc,
 case INDEX_op_sextract_i32:
 tcg_out_sextract(s, COND_AL, args[0], args[1], args[2], args[3]);
 break;
+case INDEX_op_extract2_i32:
+/* ??? These optimization vs zero should be generic.  */
+/* ??? But we can't substitute 2 for 1 in the opcode stream yet.  */
+if (const_args[1]) {
+if (const_args[2]) {
+tcg_out_movi(s, TCG_TYPE_REG, args[0], 0);
+} else {
+tcg_out_dat_reg(s, COND_AL, ARITH_MOV, args[0], 0,
+args[2], SHIFT_IMM_LSL(32 - args[3]));
+}
+} else if (const_args[2]) {
+tcg_out_dat_reg(s, COND_AL, ARITH_MOV, args[0], 0,
+args[1], SHIFT_IMM_LSR(args[3]));
+} else {
+/* We can do extract2 in 2 insns, vs the 3 required otherwise.  */
+tcg_out_dat_reg(s, COND_AL, ARITH_MOV, TCG_REG_TMP, 0,
+args[2], SHIFT_IMM_LSL(32 - args[3]));
+tcg_out_dat_reg(s, COND_AL, ARITH_ORR, args[0], TCG_REG_TMP,
+args[1], SHIFT_IMM_LSR(args[3]));
+}
+break;
 
 case INDEX_op_div_i32:
 tcg_out_sdiv(s, COND_AL, args[0], args[1], args[2]);
@@ -2108,6 +2129,8 @@ static const TCGTargetOpDef *tcg_target_op_def(TCGOpcode 
op)
 = { .args_ct_str = { "s", "s", "s", "s" } };
 static const TCGTargetOpDef br
 = { .args_ct_str = { "r", "rIN" } };
+static const TCGTargetOpDef ext2
+= { .args_ct_str = { "r", "rZ", "rZ" } };
 static const TCGTargetOpDef dep
 = { .args_ct_str = { "r", "0", "rZ" } };
 static const TCGTargetOpDef movc
@@ -2174,6 +2197,8 @@ static const TCGTargetOpDef *tcg_target_op_def(TCGOpcode 
op)
 return 
 case INDEX_op_deposit_i32:
 return 
+case INDEX_op_extract2_i32:
+return 
 case INDEX_op_movcond_i32:
 return 
 case INDEX_op_add2_i32:
-- 
2.17.2