Performance improvement for SPEC06fp for the last few commits:

                             qemu-aarch64 SPEC06fp (test set) speedup over QEMU 
4c2c1015905
                                     Host: Intel(R) Core(TM) i7-6700K CPU @ 
4.00GHz
                                           error bars: 95% confidence interval

  6 
+-+---+-----+-----+-----+----+-----+-----+-----+-----+-----+-----+-----+-----+-----+----+-----+-----+-----+---+-+
  5 
+-+..........................+++..............................................................................+-+
  4 
+-+...........................@@=+..............................................................+addsub
       +-+
  3 
+-+........+++++.+++++........@@=+............+++++...............+++........................+++++++++++
      +-+
    |    +%@&+  |&&  %%@&+      +%%@= +%%&=++%%&= +%%&=              +++  +++++ 
      ++++++%%@=++%%&= +%%&=  ++++  |
  2 
+-+..+%@&++%%@&.+%%@&+$$%@=+#$%@=+#$%&=##$%&=*#$%&=.+%@&=...+==##%@&++%%@&+++++++$$%@=**$%@=*#$%&=*+f%&=##$@&=+-+
  1 
+-+**#$@&**#%@&**#%@&**$%@=**$%@=**$%&=*#$%&=*#$%&**#$@&**#$@&**#%@&**#%@&**#%@=**$%@=**$%@=*#$%&=+sqr&=*#$@&=+-+
  0 
+-+**#$@&**#%@&**#%@&**$%@=**$%@=**$%&=*#$%&=*#$%&**#$@&**#$@&**#%@&**#%@&**#%@=**$%@=**$%@=*#$%&=*+cm&=*#$@&=+-+
      
416.game433.434.435.436.cac437.leslie444.447.de450.so453.454.ca459.GemsF465.ton470.lb48482.sph+f32f64ean

                                       qemu-aarch64 NBench score; higher is 
better
                                     Host: Intel(R) Core(TM) i7-6700K CPU @ 
4.00GHz

  16 
+-+-------------------+---------------------+----------------------+---------------------+-------------------+-+
  14 
+-+..........................................+++++++***............+++..+++++................................+-+
  12 
+-+.........................................@@@@&&===+*............@@@&&&==**..................+before
       +-+
  10 
+-+.........................................@..@.&..=.*............@.@..&.=.*............@@@&&&==***ub
       +-+
   8 
+-+.....................................++++@..@.&..=.*............@.@..&.=.*............@+@..&+=
 +*ul       +-+
   6 
+-+...................@@@@&&===**..++###$$$%%..@.&..=.*..***###$$++@.@..&.=.*.......$$$%%%.@..&+=
 +*iv       +-+
   4 
+-+............###$$$%%..@.&..=.*..***.#..$.%..@.&..=.*..*+*..#+$%%%.@..&.=.*..***###+$++%.@..&+=
 +*ma       +-+
   2 
+-+.........****.#..$.%..@.&..=.*..*.*.#..$.%..@.&..=.*..*.*..#.$..%.@..&.=.*..*.*..#.$..%.@..&+=+s*rt
       +-+
   0 
+-+---------****##$$$%%@@@&&===**--***##$$$%%@@@&&===**--***###$$%%%@@&&&==**--***###$$%%%@@&&&==***mp-------+-+
                    FOURIER            NEURAL NET       LU DECOMPOSITION        
         gmean      +f32f64

Images in png: https://imgur.com/a/rkuZW

Signed-off-by: Emilio G. Cota <c...@braap.org>
---
 fpu/softfloat.c | 17 ++++++++++++++++-
 1 file changed, 16 insertions(+), 1 deletion(-)

diff --git a/fpu/softfloat.c b/fpu/softfloat.c
index 2b86d73..d0f1f65 100644
--- a/fpu/softfloat.c
+++ b/fpu/softfloat.c
@@ -3660,7 +3660,8 @@ float128 uint64_to_float128(uint64_t a, float_status 
*status)
 | Arithmetic.
 *----------------------------------------------------------------------------*/
 
-float64 float32_to_float64(float32 a, float_status *status)
+static float64 __attribute__((noinline))
+soft_float32_to_float64(float32 a, float_status *status)
 {
     flag aSign;
     int aExp;
@@ -3685,6 +3686,20 @@ float64 float32_to_float64(float32 a, float_status 
*status)
 
 }
 
+float64 float32_to_float64(float32 a, float_status *status)
+{
+    if (likely(float32_is_normal(a))) {
+        float f = *(float *)&a;
+        double r = f;
+
+        return *(float64 *)&r;
+    } else if (float32_is_zero(a)) {
+        return float64_set_sign(float64_zero, float32_is_neg(a));
+    } else {
+        return soft_float32_to_float64(a, status);
+    }
+}
+
 /*----------------------------------------------------------------------------
 | Returns the result of converting the single-precision floating-point value
 | `a' to the extended double-precision floating-point format.  The conversion
-- 
2.7.4


Reply via email to