ce426f
commit e5e0d9a4f632735cf3bb440eecb5caee5eea44c1
ce426f
Author: Ian Bolton <ian.bolton@arm.com>
ce426f
Date:   Thu Apr 24 07:15:33 2014 +0100
ce426f
ce426f
    [AArch64] Suppress unnecessary FPSR and FPCR writes.
ce426f
ce426f
diff --git a/ports/sysdeps/aarch64/fpu/fclrexcpt.c b/ports/sysdeps/aarch64/fpu/fclrexcpt.c
ce426f
index 531269f..b24f0ff 100644
ce426f
--- a/ports/sysdeps/aarch64/fpu/fclrexcpt.c
ce426f
+++ b/ports/sysdeps/aarch64/fpu/fclrexcpt.c
ce426f
@@ -23,13 +23,15 @@ int
ce426f
 feclearexcept (int excepts)
ce426f
 {
ce426f
   fpu_fpsr_t fpsr;
ce426f
+  fpu_fpsr_t fpsr_new;
ce426f
 
ce426f
   excepts &= FE_ALL_EXCEPT;
ce426f
 
ce426f
   _FPU_GETFPSR (fpsr);
ce426f
-  fpsr = (fpsr & ~FE_ALL_EXCEPT) | (fpsr & FE_ALL_EXCEPT & ~excepts);
ce426f
+  fpsr_new = (fpsr & ~FE_ALL_EXCEPT) | (fpsr & FE_ALL_EXCEPT & ~excepts);
ce426f
 
ce426f
-  _FPU_SETFPSR (fpsr);
ce426f
+  if (fpsr != fpsr_new)
ce426f
+    _FPU_SETFPSR (fpsr_new);
ce426f
 
ce426f
   return 0;
ce426f
 }
ce426f
diff --git a/ports/sysdeps/aarch64/fpu/fedisblxcpt.c b/ports/sysdeps/aarch64/fpu/fedisblxcpt.c
ce426f
index 719d52f..c43335c 100644
ce426f
--- a/ports/sysdeps/aarch64/fpu/fedisblxcpt.c
ce426f
+++ b/ports/sysdeps/aarch64/fpu/fedisblxcpt.c
ce426f
@@ -23,6 +23,7 @@ int
ce426f
 fedisableexcept (int excepts)
ce426f
 {
ce426f
   fpu_control_t fpcr;
ce426f
+  fpu_control_t fpcr_new;
ce426f
   int original_excepts;
ce426f
 
ce426f
   _FPU_GETCW (fpcr);
ce426f
@@ -31,9 +32,10 @@ fedisableexcept (int excepts)
ce426f
 
ce426f
   excepts &= FE_ALL_EXCEPT;
ce426f
 
ce426f
-  fpcr &= ~(excepts << FE_EXCEPT_SHIFT);
ce426f
+  fpcr_new = fpcr & ~(excepts << FE_EXCEPT_SHIFT);
ce426f
 
ce426f
-  _FPU_SETCW (fpcr);
ce426f
+  if (fpcr != fpcr_new)
ce426f
+    _FPU_SETCW (fpcr_new);
ce426f
 
ce426f
   return original_excepts;
ce426f
 }
ce426f
diff --git a/ports/sysdeps/aarch64/fpu/feenablxcpt.c b/ports/sysdeps/aarch64/fpu/feenablxcpt.c
ce426f
index 07a4bbb..70e413c 100644
ce426f
--- a/ports/sysdeps/aarch64/fpu/feenablxcpt.c
ce426f
+++ b/ports/sysdeps/aarch64/fpu/feenablxcpt.c
ce426f
@@ -23,6 +23,7 @@ int
ce426f
 feenableexcept (int excepts)
ce426f
 {
ce426f
   fpu_control_t fpcr;
ce426f
+  fpu_control_t fpcr_new;
ce426f
   int original_excepts;
ce426f
 
ce426f
   _FPU_GETCW (fpcr);
ce426f
@@ -31,9 +32,10 @@ feenableexcept (int excepts)
ce426f
 
ce426f
   excepts &= FE_ALL_EXCEPT;
ce426f
 
ce426f
-  fpcr |= (excepts << FE_EXCEPT_SHIFT);
ce426f
+  fpcr_new = fpcr | (excepts << FE_EXCEPT_SHIFT);
ce426f
 
ce426f
-  _FPU_SETCW (fpcr);
ce426f
+  if (fpcr != fpcr_new)
ce426f
+    _FPU_SETCW (fpcr_new);
ce426f
 
ce426f
   /* Trapping exceptions are optional in AArch64 the relevant enable
ce426f
      bits in FPCR are RES0 hence the absence of support can be
ce426f
diff --git a/ports/sysdeps/aarch64/fpu/feholdexcpt.c b/ports/sysdeps/aarch64/fpu/feholdexcpt.c
ce426f
index 0514ac1..973ba4a 100644
ce426f
--- a/ports/sysdeps/aarch64/fpu/feholdexcpt.c
ce426f
+++ b/ports/sysdeps/aarch64/fpu/feholdexcpt.c
ce426f
@@ -22,8 +22,10 @@
ce426f
 int
ce426f
 feholdexcept (fenv_t *envp)
ce426f
 {
ce426f
-  fpu_fpsr_t fpsr;
ce426f
   fpu_control_t fpcr;
ce426f
+  fpu_control_t fpcr_new;
ce426f
+  fpu_fpsr_t fpsr;
ce426f
+  fpu_fpsr_t fpsr_new;
ce426f
 
ce426f
   _FPU_GETCW (fpcr);
ce426f
   envp->__fpcr = fpcr;
ce426f
@@ -32,14 +34,16 @@ feholdexcept (fenv_t *envp)
ce426f
   envp->__fpsr = fpsr;
ce426f
 
ce426f
   /* Now set all exceptions to non-stop.  */
ce426f
-  fpcr &= ~(FE_ALL_EXCEPT << FE_EXCEPT_SHIFT);
ce426f
+  fpcr_new = fpcr & ~(FE_ALL_EXCEPT << FE_EXCEPT_SHIFT);
ce426f
 
ce426f
   /* And clear all exception flags.  */
ce426f
-  fpsr &= ~FE_ALL_EXCEPT;
ce426f
+  fpsr_new = fpsr & ~FE_ALL_EXCEPT;
ce426f
 
ce426f
-  _FPU_SETFPSR (fpsr);
ce426f
+  if (fpsr != fpsr_new)
ce426f
+    _FPU_SETFPSR (fpsr_new);
ce426f
 
ce426f
-  _FPU_SETCW (fpcr);
ce426f
+  if (fpcr != fpcr_new)
ce426f
+    _FPU_SETCW (fpcr_new);
ce426f
 
ce426f
   return 0;
ce426f
 }
ce426f
diff --git a/ports/sysdeps/aarch64/fpu/fesetenv.c b/ports/sysdeps/aarch64/fpu/fesetenv.c
ce426f
index a2434e3..30193e9 100644
ce426f
--- a/ports/sysdeps/aarch64/fpu/fesetenv.c
ce426f
+++ b/ports/sysdeps/aarch64/fpu/fesetenv.c
ce426f
@@ -23,34 +23,38 @@ int
ce426f
 fesetenv (const fenv_t *envp)
ce426f
 {
ce426f
   fpu_control_t fpcr;
ce426f
-  fpu_fpsr_t fpsr;
ce426f
+  fpu_control_t fpcr_new;
ce426f
   fpu_control_t updated_fpcr;
ce426f
+  fpu_fpsr_t fpsr;
ce426f
+  fpu_fpsr_t fpsr_new;
ce426f
 
ce426f
   _FPU_GETCW (fpcr);
ce426f
   _FPU_GETFPSR (fpsr);
ce426f
 
ce426f
-  fpcr &= _FPU_RESERVED;
ce426f
-  fpsr &= _FPU_FPSR_RESERVED;
ce426f
+  fpcr_new = fpcr & _FPU_RESERVED;
ce426f
+  fpsr_new = fpsr & _FPU_FPSR_RESERVED;
ce426f
 
ce426f
   if (envp == FE_DFL_ENV)
ce426f
     {
ce426f
-      fpcr |= _FPU_DEFAULT;
ce426f
-      fpsr |= _FPU_FPSR_DEFAULT;
ce426f
+      fpcr_new |= _FPU_DEFAULT;
ce426f
+      fpsr_new |= _FPU_FPSR_DEFAULT;
ce426f
     }
ce426f
   else if (envp == FE_NOMASK_ENV)
ce426f
     {
ce426f
-      fpcr |= _FPU_FPCR_IEEE;
ce426f
-      fpsr |= _FPU_FPSR_IEEE;
ce426f
+      fpcr_new |= _FPU_FPCR_IEEE;
ce426f
+      fpsr_new |= _FPU_FPSR_IEEE;
ce426f
     }
ce426f
   else
ce426f
     {
ce426f
-      fpcr |= envp->__fpcr & ~_FPU_RESERVED;
ce426f
-      fpsr |= envp->__fpsr & ~_FPU_FPSR_RESERVED;
ce426f
+      fpcr_new |= envp->__fpcr & ~_FPU_RESERVED;
ce426f
+      fpsr_new |= envp->__fpsr & ~_FPU_FPSR_RESERVED;
ce426f
     }
ce426f
 
ce426f
-  _FPU_SETFPSR (fpsr);
ce426f
+  if (fpsr != fpsr_new)
ce426f
+    _FPU_SETFPSR (fpsr_new);
ce426f
 
ce426f
-  _FPU_SETCW (fpcr);
ce426f
+  if (fpcr != fpcr_new)
ce426f
+    _FPU_SETCW (fpcr_new);
ce426f
 
ce426f
   /* Trapping exceptions are optional in AArch64 the relevant enable
ce426f
      bits in FPCR are RES0 hence the absence of support can be
ce426f
@@ -58,7 +62,7 @@ fesetenv (const fenv_t *envp)
ce426f
      value.  */
ce426f
 
ce426f
   _FPU_GETCW (updated_fpcr);
ce426f
-  if ((updated_fpcr & fpcr) != fpcr)
ce426f
+  if ((updated_fpcr & fpcr_new) != fpcr_new)
ce426f
     return 1;
ce426f
 
ce426f
   return 0;
ce426f
diff --git a/ports/sysdeps/aarch64/fpu/fesetround.c b/ports/sysdeps/aarch64/fpu/fesetround.c
ce426f
index 40a05f6..225096a 100644
ce426f
--- a/ports/sysdeps/aarch64/fpu/fesetround.c
ce426f
+++ b/ports/sysdeps/aarch64/fpu/fesetround.c
ce426f
@@ -23,6 +23,7 @@ int
ce426f
 fesetround (int round)
ce426f
 {
ce426f
   fpu_control_t fpcr;
ce426f
+  fpu_control_t fpcr_new;
ce426f
 
ce426f
   switch (round)
ce426f
     {
ce426f
@@ -31,9 +32,10 @@ fesetround (int round)
ce426f
     case FE_DOWNWARD:
ce426f
     case FE_TOWARDZERO:
ce426f
       _FPU_GETCW (fpcr);
ce426f
-      fpcr = (fpcr & ~FE_TOWARDZERO) | round;
ce426f
+      fpcr_new = (fpcr & ~FE_TOWARDZERO) | round;
ce426f
 
ce426f
-      _FPU_SETCW (fpcr);
ce426f
+      if (fpcr != fpcr_new)
ce426f
+	_FPU_SETCW (fpcr_new);
ce426f
       return 0;
ce426f
 
ce426f
     default:
ce426f
diff --git a/ports/sysdeps/aarch64/fpu/fsetexcptflg.c b/ports/sysdeps/aarch64/fpu/fsetexcptflg.c
ce426f
index 49cd1e4..60bb1c9 100644
ce426f
--- a/ports/sysdeps/aarch64/fpu/fsetexcptflg.c
ce426f
+++ b/ports/sysdeps/aarch64/fpu/fsetexcptflg.c
ce426f
@@ -24,16 +24,18 @@ int
ce426f
 fesetexceptflag (const fexcept_t *flagp, int excepts)
ce426f
 {
ce426f
   fpu_fpsr_t fpsr;
ce426f
+  fpu_fpsr_t fpsr_new;
ce426f
 
ce426f
   /* Get the current environment.  */
ce426f
   _FPU_GETFPSR (fpsr);
ce426f
 
ce426f
   /* Set the desired exception mask.  */
ce426f
-  fpsr &= ~(excepts & FE_ALL_EXCEPT);
ce426f
-  fpsr |= (*flagp & excepts & FE_ALL_EXCEPT);
ce426f
+  fpsr_new = fpsr & ~(excepts & FE_ALL_EXCEPT);
ce426f
+  fpsr_new |= (*flagp & excepts & FE_ALL_EXCEPT);
ce426f
 
ce426f
   /* Save state back to the FPU.  */
ce426f
-  _FPU_SETFPSR (fpsr);
ce426f
+  if (fpsr != fpsr_new)
ce426f
+    _FPU_SETFPSR (fpsr_new);
ce426f
 
ce426f
   return 0;
ce426f
 }