diff options
-rw-r--r-- | src/vectors-4-SSE.h | 8 | ||||
-rw-r--r-- | src/vectors-4-default.h | 2 | ||||
-rw-r--r-- | src/vectors-8-SSE2.h | 8 | ||||
-rw-r--r-- | src/vectors-8-default.h | 2 |
4 files changed, 16 insertions, 4 deletions
diff --git a/src/vectors-4-SSE.h b/src/vectors-4-SSE.h
index 7948032..4bda22b 100644
--- a/src/vectors-4-SSE.h
+++ b/src/vectors-4-SSE.h
@@ -17,7 +17,13 @@
-#define vec4_architecture "SSE"
+#ifdef __SSE4_1__
+#define vec4_architecture "SSE4.1 (32-bit precision)"
+#elif defined(__SSE4A__)
+#define vec4_architecture "SSE4A (32-bit precision)"
+#else
+#define vec4_architecture "SSE (32-bit precision)"
+#endif
 // Vector type corresponding to CCTK_REAL
 #define CCTK_REAL4_VEC __m128
diff --git a/src/vectors-4-default.h b/src/vectors-4-default.h
index 6f66ff9..f9fccd3 100644
--- a/src/vectors-4-default.h
+++ b/src/vectors-4-default.h
@@ -8,7 +8,7 @@
-#define vec4_architecture "scalar (no vectorisation)"
+#define vec4_architecture "scalar (no vectorisation, 32-bit precision)"
 // Use CCTK_REAL4
 #define CCTK_REAL4_VEC CCTK_REAL4
diff --git a/src/vectors-8-SSE2.h b/src/vectors-8-SSE2.h
index 3bd5753..e0b9600 100644
--- a/src/vectors-8-SSE2.h
+++ b/src/vectors-8-SSE2.h
@@ -17,7 +17,13 @@
-#define vec8_architecture "SSE2"
+#ifdef __SSE4_1__
+#define vec8_architecture "SSE4.1 (64-bit precision)"
+#elif defined(__SSE4A__)
+#define vec8_architecture "SSE4A (64-bit precision)"
+#else
+#define vec8_architecture "SSE2 (64-bit precision)"
+#endif
 // Vector type corresponding to CCTK_REAL
 #define CCTK_REAL8_VEC __m128d
diff --git a/src/vectors-8-default.h b/src/vectors-8-default.h
index cdce1ef..c45ebe6 100644
--- a/src/vectors-8-default.h
+++ b/src/vectors-8-default.h
@@ -8,7 +8,7 @@
-#define vec8_architecture "scalar (no vectorisation)"
+#define vec8_architecture "scalar (no vectorisation, 64-bit precision)"
 // Use CCTK_REAL8
 #define CCTK_REAL8_VEC CCTK_REAL8