aboutsummaryrefslogtreecommitdiff
path: root/src/vectors-4-SSE.h
diff options
context:
space:
mode:
authorsvn_bwardell <svn_bwardell@105869f7-3296-0410-a4ea-f4349344b45a>2011-08-07 12:41:50 +0000
committersvn_bwardell <svn_bwardell@105869f7-3296-0410-a4ea-f4349344b45a>2011-08-07 12:41:50 +0000
commit96caf45931a90c080adc8073762d72aa2a80ac76 (patch)
tree48ccb4894a0bdd3dbf62826e8c0e05641d1f4236 /src/vectors-4-SSE.h
parent1d6878bcc13a1695043cb680f7ab83be28048419 (diff)
Fix definition of kifthen for architectures where blend instructions are not available.
git-svn-id: https://svn.cct.lsu.edu/repos/numrel/LSUThorns/Vectors/trunk@20 105869f7-3296-0410-a4ea-f4349344b45a
Diffstat (limited to 'src/vectors-4-SSE.h')
-rw-r--r--src/vectors-4-SSE.h15
1 files changed, 10 insertions, 5 deletions
diff --git a/src/vectors-4-SSE.h b/src/vectors-4-SSE.h
index 8319c49..7948032 100644
--- a/src/vectors-4-SSE.h
+++ b/src/vectors-4-SSE.h
@@ -303,6 +303,12 @@ static const union {
#ifdef __SSE4_1__
# define k4ifthen(x,y,z) (_mm_blendv_ps(y,z,x))
#else
+#include <math.h>
+#ifdef __cplusplus
+#define SGN(x) std::signbit(x)
+#else
+#define SGN(x) signbit(x)
+#endif
# define k4ifthen(x,y,z) \
({ \
CCTK_REAL4_VEC const xx=(x_); \
@@ -311,10 +317,9 @@ static const union {
CCTK_REAL4_VEC const y=yy; \
CCTK_REAL4_VEC const zz=(z_); \
CCTK_REAL4_VEC const z=zz; \
- CCTK_REAL4_VEC const c = _mm_and_ps(x,k4sign_mask); \
- vec4_set(vec4_elt0(not vec4_elt0(c) ? y : z), \
- vec4_elt1(not vec4_elt1(c) ? y : z), \
- vec4_elt2(not vec4_elt2(c) ? y : z), \
- vec4_elt3(not vec4_elt3(c) ? y : z)); \
+ vec4_set(SGN(vec4_elt0(x)) ? vec4_elt0(z) : vec4_elt0(y), \
+ SGN(vec4_elt1(x)) ? vec4_elt1(z) : vec4_elt1(y), \
+ SGN(vec4_elt2(x)) ? vec4_elt2(z) : vec4_elt2(y), \
+ SGN(vec4_elt3(x)) ? vec4_elt3(z) : vec4_elt3(y)); \
})
#endif