target-ppc: VSX Stage 4: Add xssqrtsp

This patch adds the VSX Scalar Square Root Single Precision (xssqrtsp) instruction.

The existing VSX_SQRT() macro is modified to support rounding of the intermediate double-precision result to single-precision.

Signed-off-by: Tom Musta <tommusta@gmail.com>
Reviewed-by: Richard Henderson <rth@twiddle.net>
Signed-off-by: Alexander Graf <agraf@suse.de>

commit: cea4e57473efc2fad1d241e87984eba4e5d9690c [log] [tgz]
author: Tom Musta <tommusta@gmail.com> Wed Jan 15 08:10:37 2014 -0600
committer: Alexander Graf <agraf@suse.de> Wed Mar 05 03:06:35 2014 +0100
tree: 4c71a18b09ed18cfc57d7104e3158f893bac24a8
parent: 2c0c52ae620cf121a8b9084c7c1168d867564ee8 [diff] [blame]
diff --git a/target-ppc/fpu_helper.c b/target-ppc/fpu_helper.c
index ac52c23..fec9d1b 100644
--- a/target-ppc/fpu_helper.c
+++ b/target-ppc/fpu_helper.c

@@ -1969,7 +1969,7 @@
  *   fld   - vsr_t field (f32 or f64)
  *   sfprf - set FPRF
  */
-#define VSX_SQRT(op, nels, tp, fld, sfprf)                                   \
+#define VSX_SQRT(op, nels, tp, fld, sfprf, r2sp)                             \
 void helper_##op(CPUPPCState *env, uint32_t opcode)                          \
 {                                                                            \
     ppc_vsr_t xt, xb;                                                        \
@@ -1993,6 +1993,10 @@
             }                                                                \
         }                                                                    \
                                                                              \
+        if (r2sp) {                                                          \
+            xt.fld[i] = helper_frsp(env, xt.fld[i]);                         \
+        }                                                                    \
+                                                                             \
         if (sfprf) {                                                         \
             helper_compute_fprf(env, xt.fld[i], sfprf);                      \
         }                                                                    \
@@ -2002,9 +2006,10 @@
     helper_float_check_status(env);                                          \
 }
 
-VSX_SQRT(xssqrtdp, 1, float64, f64, 1)
-VSX_SQRT(xvsqrtdp, 2, float64, f64, 0)
-VSX_SQRT(xvsqrtsp, 4, float32, f32, 0)
+VSX_SQRT(xssqrtdp, 1, float64, f64, 1, 0)
+VSX_SQRT(xssqrtsp, 1, float64, f64, 1, 1)
+VSX_SQRT(xvsqrtdp, 2, float64, f64, 0, 0)
+VSX_SQRT(xvsqrtsp, 4, float32, f32, 0, 0)
 
 /* VSX_RSQRTE - VSX floating point reciprocal square root estimate
  *   op    - instruction mnemonic
commit	cea4e57473efc2fad1d241e87984eba4e5d9690c	[log] [tgz]
author	Tom Musta <tommusta@gmail.com>	Wed Jan 15 08:10:37 2014 -0600
committer	Alexander Graf <agraf@suse.de>	Wed Mar 05 03:06:35 2014 +0100
tree	4c71a18b09ed18cfc57d7104e3158f893bac24a8
parent	2c0c52ae620cf121a8b9084c7c1168d867564ee8 [diff] [blame]