On 29 June 2012 21:38, Stefan Weil <s...@weilnetz.de> wrote:
> commit c4baa0503d9623f1ce891f525ccd140c598bc29a improved SSE table
> type safety which now raises compiler errors when latest QEMU was
> configured with --enable-debug.
>
> Fix this by splitting the SSE tables even further to separate
> helper functions with different signatures.
>
> Instead of crashing by calling address 0, the code now jumps to
> label illegal_op.
>
> Signed-off-by: Stefan Weil <s...@weilnetz.de>
> ---
>  target-i386/translate.c |   59 
> +++++++++++++++++++++++++++--------------------
>  1 file changed, 34 insertions(+), 25 deletions(-)
>
> diff --git a/target-i386/translate.c b/target-i386/translate.c
> index a902f4a..a00a6a1 100644
> --- a/target-i386/translate.c
> +++ b/target-i386/translate.c
> @@ -2947,25 +2947,34 @@ static const SSEFunc_0_pp sse_op_table2[3 * 8][2] = {
>      [16 + 7] = { NULL, gen_helper_pslldq_xmm },
>  };
>
> -static const SSEFunc_0_pi sse_op_table3a[4] = {
> +static const SSEFunc_0_pi sse_op_table3ai[] = {
>      gen_helper_cvtsi2ss,
> -    gen_helper_cvtsi2sd,
> -    X86_64_ONLY(gen_helper_cvtsq2ss),
> -    X86_64_ONLY(gen_helper_cvtsq2sd),
> +    gen_helper_cvtsi2sd
>  };
>
> -static const SSEFunc_i_p sse_op_table3b[4 * 2] = {
> +#ifdef TARGET_X86_64
> +static const SSEFunc_0_pl sse_op_table3aq[] = {
> +    gen_helper_cvtsq2ss,
> +    gen_helper_cvtsq2sd
> +};
> +#endif
> +
> +static const SSEFunc_i_p sse_op_table3bi[] = {
>      gen_helper_cvttss2si,
>      gen_helper_cvttsd2si,
> -    X86_64_ONLY(gen_helper_cvttss2sq),
> -    X86_64_ONLY(gen_helper_cvttsd2sq),
> -
>      gen_helper_cvtss2si,
> -    gen_helper_cvtsd2si,
> -    X86_64_ONLY(gen_helper_cvtss2sq),
> -    X86_64_ONLY(gen_helper_cvtsd2sq),
> +    gen_helper_cvtsd2si

As Andreas says, leaving in the trailing comma makes for nicer patches.

>  };
>
> +#ifdef TARGET_X86_64
> +static const SSEFunc_l_p sse_op_table3bq[] = {
> +    gen_helper_cvttss2sq,
> +    gen_helper_cvttsd2sq,
> +    gen_helper_cvtss2sq,
> +    gen_helper_cvtsd2sq
> +};
> +#endif

This patch removes all the uses of X86_64_ONLY macro so we could remove its
definition too.

> +
>  static const SSEFunc_0_pp sse_op_table4[8][4] = {
>      SSE_FOP(cmpeq),
>      SSE_FOP(cmplt),
> @@ -3097,10 +3106,6 @@ static void gen_sse(DisasContext *s, int b, 
> target_ulong pc_start, int rex_r)
>  {
>      int b1, op1_offset, op2_offset, is_xmm, val, ot;
>      int modrm, mod, rm, reg, reg_addr, offset_addr;
> -    SSEFunc_i_p sse_fn_i_p;
> -    SSEFunc_l_p sse_fn_l_p;
> -    SSEFunc_0_pi sse_fn_pi;
> -    SSEFunc_0_pl sse_fn_pl;
>      SSEFunc_0_pp sse_fn_pp;
>      SSEFunc_0_ppi sse_fn_ppi;
>      SSEFunc_0_ppt sse_fn_ppt;
> @@ -3563,14 +3568,16 @@ static void gen_sse(DisasContext *s, int b, 
> target_ulong pc_start, int rex_r)
>              op1_offset = offsetof(CPUX86State,xmm_regs[reg]);
>              tcg_gen_addi_ptr(cpu_ptr0, cpu_env, op1_offset);
>              if (ot == OT_LONG) {
> -                sse_fn_pi = sse_op_table3a[(s->dflag == 2) * 2 +
> -                                           ((b >> 8) - 2)];
> +                SSEFunc_0_pi sse_fn_pi = sse_op_table3ai[(b >> 8) - 2];

We could optionally do a later cleanup patch moving from "(b >> 8) - 2" to
"(b >> 8) & 1" which I think is more obviously not overrunning the array.

>                  tcg_gen_trunc_tl_i32(cpu_tmp2_i32, cpu_T[0]);
>                  sse_fn_pi(cpu_ptr0, cpu_tmp2_i32);
>              } else {
> -                sse_fn_pl = sse_op_table3a[(s->dflag == 2) * 2 +
> -                                           ((b >> 8) - 2)];
> +#ifdef TARGET_X86_64
> +                SSEFunc_0_pl sse_fn_pl = sse_op_table3aq[(b >> 8) - 2];
>                  sse_fn_pl(cpu_ptr0, cpu_T[0]);
> +#else
> +                goto illegal_op;
> +#endif
>              }
>              break;
>          case 0x02c: /* cvttps2pi */
> @@ -3624,16 +3631,18 @@ static void gen_sse(DisasContext *s, int b, 
> target_ulong pc_start, int rex_r)
>              }
>              tcg_gen_addi_ptr(cpu_ptr0, cpu_env, op2_offset);
>              if (ot == OT_LONG) {
> -                sse_fn_i_p = sse_op_table3b[(s->dflag == 2) * 2 +
> -                                            ((b >> 8) - 2) +
> -                                            (b & 1) * 4];
> +                SSEFunc_i_p sse_fn_i_p =
> +                    sse_op_table3bi[(b >> 8) - 2 + (b & 1) * 2];

((b >> 7) & 2) | (b & 1) plus rearranging the table to match would
IMHO be cleaner in the long run.

>                  sse_fn_i_p(cpu_tmp2_i32, cpu_ptr0);
>                  tcg_gen_extu_i32_tl(cpu_T[0], cpu_tmp2_i32);
>              } else {
> -                sse_fn_l_p = sse_op_table3b[(s->dflag == 2) * 2 +
> -                                            ((b >> 8) - 2) +
> -                                            (b & 1) * 4];
> +#ifdef TARGET_X86_64
> +                SSEFunc_l_p sse_fn_l_p =
> +                    sse_op_table3bq[(b >> 8) - 2 + (b & 1) * 2];
>                  sse_fn_l_p(cpu_T[0], cpu_ptr0);
> +#else
> +                goto illegal_op;
> +#endif
>              }
>              gen_op_mov_reg_T0(ot, reg);
>              break;
> --
> 1.7.10

However that is all nitpicking. I think we should apply this as is
since it fixes a build breakage; we can clean up later if we want.

Reviewed-by: Peter Maydell <peter.mayd...@linaro.org>

-- PMM

Reply via email to