Re: [Qemu-devel] [PATCH 3/3] target/arm: Implement ARMv8.3-JSConv

2019-02-04 Thread Richard Henderson
On 2/4/19 11:21 AM, Peter Maydell wrote:
> On Mon, 4 Feb 2019 at 10:17, Richard Henderson
>  wrote:
>>
>> On 2/4/19 8:00 AM, Laurent Desnogues wrote:
>>> The pseudo code asks for NaN inputs to return 0 since FPUnpack returns
>>> a value of 0 for NaN.
>>>
>>> The rest looks correct.
>>
>> So it does.  I apparently copied the INT_MAX thing from softfloat.c without
>> double-checking.
> 
> I'm a little surprised risu didn't catch that -- it's usually
> quite keen on checking NaN behaviour...

I'm not sure either...  Because of other issues, I regenerated the .bin file
and the nan case does trigger now.  I'm not sure what happened before.


r~



Re: [Qemu-devel] [PATCH 3/3] target/arm: Implement ARMv8.3-JSConv

2019-02-04 Thread Peter Maydell
On Mon, 4 Feb 2019 at 10:17, Richard Henderson
 wrote:
>
> On 2/4/19 8:00 AM, Laurent Desnogues wrote:
> > The pseudo code asks for NaN inputs to return 0 since FPUnpack returns
> > a value of 0 for NaN.
> >
> > The rest looks correct.
>
> So it does.  I apparently copied the INT_MAX thing from softfloat.c without
> double-checking.

I'm a little surprised risu didn't catch that -- it's usually
quite keen on checking NaN behaviour...

thanks
-- PMM



Re: [Qemu-devel] [PATCH 3/3] target/arm: Implement ARMv8.3-JSConv

2019-02-04 Thread Richard Henderson
On 2/4/19 8:00 AM, Laurent Desnogues wrote:
> Hello,
> 
> On Mon, Feb 4, 2019 at 6:38 AM Richard Henderson
>  wrote:
>>
>> Signed-off-by: Richard Henderson 
>> ---
>>  target/arm/cpu.h   | 10 +
>>  target/arm/helper.h|  2 +
>>  target/arm/cpu.c   |  1 +
>>  target/arm/cpu64.c |  2 +
>>  target/arm/op_helper.c | 91 ++
>>  target/arm/translate-a64.c | 26 +++
>>  target/arm/translate.c | 15 +++
>>  7 files changed, 147 insertions(+)
>>
>> diff --git a/target/arm/cpu.h b/target/arm/cpu.h
>> index a68bcc9fed..d2c2e2b0cf 100644
>> --- a/target/arm/cpu.h
>> +++ b/target/arm/cpu.h
>> @@ -3209,6 +3209,11 @@ static inline bool isar_feature_aa32_vcma(const 
>> ARMISARegisters *id)
>>  return FIELD_EX32(id->id_isar5, ID_ISAR5, VCMA) != 0;
>>  }
>>
>> +static inline bool isar_feature_aa32_jscvt(const ARMISARegisters *id)
>> +{
>> +return FIELD_EX32(id->id_isar6, ID_ISAR6, JSCVT) != 0;
>> +}
>> +
>>  static inline bool isar_feature_aa32_dp(const ARMISARegisters *id)
>>  {
>>  return FIELD_EX32(id->id_isar6, ID_ISAR6, DP) != 0;
>> @@ -3287,6 +3292,11 @@ static inline bool isar_feature_aa64_dp(const 
>> ARMISARegisters *id)
>>  return FIELD_EX64(id->id_aa64isar0, ID_AA64ISAR0, DP) != 0;
>>  }
>>
>> +static inline bool isar_feature_aa64_jscvt(const ARMISARegisters *id)
>> +{
>> +return FIELD_EX64(id->id_aa64isar1, ID_AA64ISAR1, JSCVT) != 0;
>> +}
>> +
>>  static inline bool isar_feature_aa64_fcma(const ARMISARegisters *id)
>>  {
>>  return FIELD_EX64(id->id_aa64isar1, ID_AA64ISAR1, FCMA) != 0;
>> diff --git a/target/arm/helper.h b/target/arm/helper.h
>> index 53a38188c6..6998f7e8d5 100644
>> --- a/target/arm/helper.h
>> +++ b/target/arm/helper.h
>> @@ -218,6 +218,8 @@ DEF_HELPER_FLAGS_2(rintd_exact, TCG_CALL_NO_RWG, f64, 
>> f64, ptr)
>>  DEF_HELPER_FLAGS_2(rints, TCG_CALL_NO_RWG, f32, f32, ptr)
>>  DEF_HELPER_FLAGS_2(rintd, TCG_CALL_NO_RWG, f64, f64, ptr)
>>
>> +DEF_HELPER_FLAGS_2(fjcvtzs, TCG_CALL_NO_RWG, i64, f64, ptr)
>> +
>>  /* neon_helper.c */
>>  DEF_HELPER_FLAGS_3(neon_qadd_u8, TCG_CALL_NO_RWG, i32, env, i32, i32)
>>  DEF_HELPER_FLAGS_3(neon_qadd_s8, TCG_CALL_NO_RWG, i32, env, i32, i32)
>> diff --git a/target/arm/cpu.c b/target/arm/cpu.c
>> index 3874dc9875..2eb2ce6c8c 100644
>> --- a/target/arm/cpu.c
>> +++ b/target/arm/cpu.c
>> @@ -1995,6 +1995,7 @@ static void arm_max_initfn(Object *obj)
>>  cpu->isar.id_isar5 = t;
>>
>>  t = cpu->isar.id_isar6;
>> +t = FIELD_DP32(t, ID_ISAR6, JSCVT, 1);
>>  t = FIELD_DP32(t, ID_ISAR6, DP, 1);
>>  cpu->isar.id_isar6 = t;
>>
>> diff --git a/target/arm/cpu64.c b/target/arm/cpu64.c
>> index 7107ec8d7e..43d8ff047c 100644
>> --- a/target/arm/cpu64.c
>> +++ b/target/arm/cpu64.c
>> @@ -311,6 +311,7 @@ static void aarch64_max_initfn(Object *obj)
>>  cpu->isar.id_aa64isar0 = t;
>>
>>  t = cpu->isar.id_aa64isar1;
>> +t = FIELD_DP64(t, ID_AA64ISAR1, JSCVT, 1);
>>  t = FIELD_DP64(t, ID_AA64ISAR1, FCMA, 1);
>>  t = FIELD_DP64(t, ID_AA64ISAR1, APA, 1); /* PAuth, architected only 
>> */
>>  t = FIELD_DP64(t, ID_AA64ISAR1, API, 0);
>> @@ -340,6 +341,7 @@ static void aarch64_max_initfn(Object *obj)
>>  cpu->isar.id_isar5 = u;
>>
>>  u = cpu->isar.id_isar6;
>> +u = FIELD_DP32(u, ID_ISAR6, JSCVT, 1);
>>  u = FIELD_DP32(u, ID_ISAR6, DP, 1);
>>  cpu->isar.id_isar6 = u;
>>
>> diff --git a/target/arm/op_helper.c b/target/arm/op_helper.c
>> index c998eadfaa..a7259a7194 100644
>> --- a/target/arm/op_helper.c
>> +++ b/target/arm/op_helper.c
>> @@ -24,6 +24,7 @@
>>  #include "internals.h"
>>  #include "exec/exec-all.h"
>>  #include "exec/cpu_ldst.h"
>> +#include "fpu/softfloat.h"
>>
>>  #define SIGNBIT (uint32_t)0x8000
>>  #define SIGNBIT64 ((uint64_t)1 << 63)
>> @@ -1376,3 +1377,93 @@ uint32_t HELPER(ror_cc)(CPUARMState *env, uint32_t x, 
>> uint32_t i)
>>  return ((uint32_t)x >> shift) | (x << (32 - shift));
>>  }
>>  }
>> +
>> +/*
>> + * Implement float64 to int32_t conversion without saturation;
>> + * the result is supplied modulo 2^32.
>> + */
>> +uint64_t HELPER(fjcvtzs)(float64 value, void *vstatus)
>> +{
>> +float_status *status = vstatus;
>> +uint32_t result, exp, sign;
>> +uint64_t frac;
>> +uint32_t inexact; /* !Z */
>> +
>> +sign = extract64(value, 63, 1);
>> +exp = extract64(value, 52, 11);
>> +frac = extract64(value, 0, 52);
>> +
>> +if (exp == 0) {
>> +/* While not inexact for IEEE FP, -0.0 is inexact for JavaScript.  
>> */
>> +inexact = sign;
>> +result = 0;
>> +if (frac != 0) {
>> +if (status->flush_inputs_to_zero) {
>> +float_raise(float_flag_input_denormal, status);
>> +} else {
>> +float_raise(float_flag_inexact, status);
>> +inexact = 1;
>> +}
>> +}
>> 

Re: [Qemu-devel] [PATCH 3/3] target/arm: Implement ARMv8.3-JSConv

2019-02-04 Thread Laurent Desnogues
Hello,

On Mon, Feb 4, 2019 at 6:38 AM Richard Henderson
 wrote:
>
> Signed-off-by: Richard Henderson 
> ---
>  target/arm/cpu.h   | 10 +
>  target/arm/helper.h|  2 +
>  target/arm/cpu.c   |  1 +
>  target/arm/cpu64.c |  2 +
>  target/arm/op_helper.c | 91 ++
>  target/arm/translate-a64.c | 26 +++
>  target/arm/translate.c | 15 +++
>  7 files changed, 147 insertions(+)
>
> diff --git a/target/arm/cpu.h b/target/arm/cpu.h
> index a68bcc9fed..d2c2e2b0cf 100644
> --- a/target/arm/cpu.h
> +++ b/target/arm/cpu.h
> @@ -3209,6 +3209,11 @@ static inline bool isar_feature_aa32_vcma(const 
> ARMISARegisters *id)
>  return FIELD_EX32(id->id_isar5, ID_ISAR5, VCMA) != 0;
>  }
>
> +static inline bool isar_feature_aa32_jscvt(const ARMISARegisters *id)
> +{
> +return FIELD_EX32(id->id_isar6, ID_ISAR6, JSCVT) != 0;
> +}
> +
>  static inline bool isar_feature_aa32_dp(const ARMISARegisters *id)
>  {
>  return FIELD_EX32(id->id_isar6, ID_ISAR6, DP) != 0;
> @@ -3287,6 +3292,11 @@ static inline bool isar_feature_aa64_dp(const 
> ARMISARegisters *id)
>  return FIELD_EX64(id->id_aa64isar0, ID_AA64ISAR0, DP) != 0;
>  }
>
> +static inline bool isar_feature_aa64_jscvt(const ARMISARegisters *id)
> +{
> +return FIELD_EX64(id->id_aa64isar1, ID_AA64ISAR1, JSCVT) != 0;
> +}
> +
>  static inline bool isar_feature_aa64_fcma(const ARMISARegisters *id)
>  {
>  return FIELD_EX64(id->id_aa64isar1, ID_AA64ISAR1, FCMA) != 0;
> diff --git a/target/arm/helper.h b/target/arm/helper.h
> index 53a38188c6..6998f7e8d5 100644
> --- a/target/arm/helper.h
> +++ b/target/arm/helper.h
> @@ -218,6 +218,8 @@ DEF_HELPER_FLAGS_2(rintd_exact, TCG_CALL_NO_RWG, f64, 
> f64, ptr)
>  DEF_HELPER_FLAGS_2(rints, TCG_CALL_NO_RWG, f32, f32, ptr)
>  DEF_HELPER_FLAGS_2(rintd, TCG_CALL_NO_RWG, f64, f64, ptr)
>
> +DEF_HELPER_FLAGS_2(fjcvtzs, TCG_CALL_NO_RWG, i64, f64, ptr)
> +
>  /* neon_helper.c */
>  DEF_HELPER_FLAGS_3(neon_qadd_u8, TCG_CALL_NO_RWG, i32, env, i32, i32)
>  DEF_HELPER_FLAGS_3(neon_qadd_s8, TCG_CALL_NO_RWG, i32, env, i32, i32)
> diff --git a/target/arm/cpu.c b/target/arm/cpu.c
> index 3874dc9875..2eb2ce6c8c 100644
> --- a/target/arm/cpu.c
> +++ b/target/arm/cpu.c
> @@ -1995,6 +1995,7 @@ static void arm_max_initfn(Object *obj)
>  cpu->isar.id_isar5 = t;
>
>  t = cpu->isar.id_isar6;
> +t = FIELD_DP32(t, ID_ISAR6, JSCVT, 1);
>  t = FIELD_DP32(t, ID_ISAR6, DP, 1);
>  cpu->isar.id_isar6 = t;
>
> diff --git a/target/arm/cpu64.c b/target/arm/cpu64.c
> index 7107ec8d7e..43d8ff047c 100644
> --- a/target/arm/cpu64.c
> +++ b/target/arm/cpu64.c
> @@ -311,6 +311,7 @@ static void aarch64_max_initfn(Object *obj)
>  cpu->isar.id_aa64isar0 = t;
>
>  t = cpu->isar.id_aa64isar1;
> +t = FIELD_DP64(t, ID_AA64ISAR1, JSCVT, 1);
>  t = FIELD_DP64(t, ID_AA64ISAR1, FCMA, 1);
>  t = FIELD_DP64(t, ID_AA64ISAR1, APA, 1); /* PAuth, architected only 
> */
>  t = FIELD_DP64(t, ID_AA64ISAR1, API, 0);
> @@ -340,6 +341,7 @@ static void aarch64_max_initfn(Object *obj)
>  cpu->isar.id_isar5 = u;
>
>  u = cpu->isar.id_isar6;
> +u = FIELD_DP32(u, ID_ISAR6, JSCVT, 1);
>  u = FIELD_DP32(u, ID_ISAR6, DP, 1);
>  cpu->isar.id_isar6 = u;
>
> diff --git a/target/arm/op_helper.c b/target/arm/op_helper.c
> index c998eadfaa..a7259a7194 100644
> --- a/target/arm/op_helper.c
> +++ b/target/arm/op_helper.c
> @@ -24,6 +24,7 @@
>  #include "internals.h"
>  #include "exec/exec-all.h"
>  #include "exec/cpu_ldst.h"
> +#include "fpu/softfloat.h"
>
>  #define SIGNBIT (uint32_t)0x8000
>  #define SIGNBIT64 ((uint64_t)1 << 63)
> @@ -1376,3 +1377,93 @@ uint32_t HELPER(ror_cc)(CPUARMState *env, uint32_t x, 
> uint32_t i)
>  return ((uint32_t)x >> shift) | (x << (32 - shift));
>  }
>  }
> +
> +/*
> + * Implement float64 to int32_t conversion without saturation;
> + * the result is supplied modulo 2^32.
> + */
> +uint64_t HELPER(fjcvtzs)(float64 value, void *vstatus)
> +{
> +float_status *status = vstatus;
> +uint32_t result, exp, sign;
> +uint64_t frac;
> +uint32_t inexact; /* !Z */
> +
> +sign = extract64(value, 63, 1);
> +exp = extract64(value, 52, 11);
> +frac = extract64(value, 0, 52);
> +
> +if (exp == 0) {
> +/* While not inexact for IEEE FP, -0.0 is inexact for JavaScript.  */
> +inexact = sign;
> +result = 0;
> +if (frac != 0) {
> +if (status->flush_inputs_to_zero) {
> +float_raise(float_flag_input_denormal, status);
> +} else {
> +float_raise(float_flag_inexact, status);
> +inexact = 1;
> +}
> +}
> +} else if (exp == 0x7ff) {
> +if (frac == 0) {
> +/* Infinity.  */
> +result = 0;
> +} else {
> +/* NaN */
> +result = 

[Qemu-devel] [PATCH 3/3] target/arm: Implement ARMv8.3-JSConv

2019-02-03 Thread Richard Henderson
Signed-off-by: Richard Henderson 
---
 target/arm/cpu.h   | 10 +
 target/arm/helper.h|  2 +
 target/arm/cpu.c   |  1 +
 target/arm/cpu64.c |  2 +
 target/arm/op_helper.c | 91 ++
 target/arm/translate-a64.c | 26 +++
 target/arm/translate.c | 15 +++
 7 files changed, 147 insertions(+)

diff --git a/target/arm/cpu.h b/target/arm/cpu.h
index a68bcc9fed..d2c2e2b0cf 100644
--- a/target/arm/cpu.h
+++ b/target/arm/cpu.h
@@ -3209,6 +3209,11 @@ static inline bool isar_feature_aa32_vcma(const 
ARMISARegisters *id)
 return FIELD_EX32(id->id_isar5, ID_ISAR5, VCMA) != 0;
 }
 
+static inline bool isar_feature_aa32_jscvt(const ARMISARegisters *id)
+{
+return FIELD_EX32(id->id_isar6, ID_ISAR6, JSCVT) != 0;
+}
+
 static inline bool isar_feature_aa32_dp(const ARMISARegisters *id)
 {
 return FIELD_EX32(id->id_isar6, ID_ISAR6, DP) != 0;
@@ -3287,6 +3292,11 @@ static inline bool isar_feature_aa64_dp(const 
ARMISARegisters *id)
 return FIELD_EX64(id->id_aa64isar0, ID_AA64ISAR0, DP) != 0;
 }
 
+static inline bool isar_feature_aa64_jscvt(const ARMISARegisters *id)
+{
+return FIELD_EX64(id->id_aa64isar1, ID_AA64ISAR1, JSCVT) != 0;
+}
+
 static inline bool isar_feature_aa64_fcma(const ARMISARegisters *id)
 {
 return FIELD_EX64(id->id_aa64isar1, ID_AA64ISAR1, FCMA) != 0;
diff --git a/target/arm/helper.h b/target/arm/helper.h
index 53a38188c6..6998f7e8d5 100644
--- a/target/arm/helper.h
+++ b/target/arm/helper.h
@@ -218,6 +218,8 @@ DEF_HELPER_FLAGS_2(rintd_exact, TCG_CALL_NO_RWG, f64, f64, 
ptr)
 DEF_HELPER_FLAGS_2(rints, TCG_CALL_NO_RWG, f32, f32, ptr)
 DEF_HELPER_FLAGS_2(rintd, TCG_CALL_NO_RWG, f64, f64, ptr)
 
+DEF_HELPER_FLAGS_2(fjcvtzs, TCG_CALL_NO_RWG, i64, f64, ptr)
+
 /* neon_helper.c */
 DEF_HELPER_FLAGS_3(neon_qadd_u8, TCG_CALL_NO_RWG, i32, env, i32, i32)
 DEF_HELPER_FLAGS_3(neon_qadd_s8, TCG_CALL_NO_RWG, i32, env, i32, i32)
diff --git a/target/arm/cpu.c b/target/arm/cpu.c
index 3874dc9875..2eb2ce6c8c 100644
--- a/target/arm/cpu.c
+++ b/target/arm/cpu.c
@@ -1995,6 +1995,7 @@ static void arm_max_initfn(Object *obj)
 cpu->isar.id_isar5 = t;
 
 t = cpu->isar.id_isar6;
+t = FIELD_DP32(t, ID_ISAR6, JSCVT, 1);
 t = FIELD_DP32(t, ID_ISAR6, DP, 1);
 cpu->isar.id_isar6 = t;
 
diff --git a/target/arm/cpu64.c b/target/arm/cpu64.c
index 7107ec8d7e..43d8ff047c 100644
--- a/target/arm/cpu64.c
+++ b/target/arm/cpu64.c
@@ -311,6 +311,7 @@ static void aarch64_max_initfn(Object *obj)
 cpu->isar.id_aa64isar0 = t;
 
 t = cpu->isar.id_aa64isar1;
+t = FIELD_DP64(t, ID_AA64ISAR1, JSCVT, 1);
 t = FIELD_DP64(t, ID_AA64ISAR1, FCMA, 1);
 t = FIELD_DP64(t, ID_AA64ISAR1, APA, 1); /* PAuth, architected only */
 t = FIELD_DP64(t, ID_AA64ISAR1, API, 0);
@@ -340,6 +341,7 @@ static void aarch64_max_initfn(Object *obj)
 cpu->isar.id_isar5 = u;
 
 u = cpu->isar.id_isar6;
+u = FIELD_DP32(u, ID_ISAR6, JSCVT, 1);
 u = FIELD_DP32(u, ID_ISAR6, DP, 1);
 cpu->isar.id_isar6 = u;
 
diff --git a/target/arm/op_helper.c b/target/arm/op_helper.c
index c998eadfaa..a7259a7194 100644
--- a/target/arm/op_helper.c
+++ b/target/arm/op_helper.c
@@ -24,6 +24,7 @@
 #include "internals.h"
 #include "exec/exec-all.h"
 #include "exec/cpu_ldst.h"
+#include "fpu/softfloat.h"
 
 #define SIGNBIT (uint32_t)0x8000
 #define SIGNBIT64 ((uint64_t)1 << 63)
@@ -1376,3 +1377,93 @@ uint32_t HELPER(ror_cc)(CPUARMState *env, uint32_t x, 
uint32_t i)
 return ((uint32_t)x >> shift) | (x << (32 - shift));
 }
 }
+
+/*
+ * Implement float64 to int32_t conversion without saturation;
+ * the result is supplied modulo 2^32.
+ */
+uint64_t HELPER(fjcvtzs)(float64 value, void *vstatus)
+{
+float_status *status = vstatus;
+uint32_t result, exp, sign;
+uint64_t frac;
+uint32_t inexact; /* !Z */
+
+sign = extract64(value, 63, 1);
+exp = extract64(value, 52, 11);
+frac = extract64(value, 0, 52);
+
+if (exp == 0) {
+/* While not inexact for IEEE FP, -0.0 is inexact for JavaScript.  */
+inexact = sign;
+result = 0;
+if (frac != 0) {
+if (status->flush_inputs_to_zero) {
+float_raise(float_flag_input_denormal, status);
+} else {
+float_raise(float_flag_inexact, status);
+inexact = 1;
+}
+}
+} else if (exp == 0x7ff) {
+if (frac == 0) {
+/* Infinity.  */
+result = 0;
+} else {
+/* NaN */
+result = INT32_MAX;
+}
+/* This operation raises Invalid for both NaN and overflow (Inf).  */
+float_raise(float_flag_invalid, status);
+inexact = 1;
+} else {
+int shift, true_exp;
+
+true_exp = exp - 1023;
+shift = 52 - true_exp;
+
+/* Restore implicit bit.  */
+