about summary refs log tree commit diff
path: root/astro/boinc-setiathome-v7/files/patch-client__vector__analyzeFuncs_sse.cpp
diff options
context:
space:
mode:
Diffstat (limited to 'astro/boinc-setiathome-v7/files/patch-client__vector__analyzeFuncs_sse.cpp')
-rw-r--r-- astro/boinc-setiathome-v7/files/patch-client__vector__analyzeFuncs_sse.cpp 35
1 files changed, 0 insertions, 35 deletions
diff --git a/astro/boinc-setiathome-v7/files/patch-client__vector__analyzeFuncs_sse.cpp b/astro/boinc-setiathome-v7/files/patch-client__vector__analyzeFuncs_sse.cpp
deleted file mode 100644
index 162d1cb8509f..000000000000
--- a/astro/boinc-setiathome-v7/files/patch-client__vector__analyzeFuncs_sse.cpp
+++ /dev/null
@@ -1,35 +0,0 @@
---- client/vector/analyzeFuncs_sse.cpp.origin 2013-08-02 01:08:24.000000000 +0400
-+++ client/vector/analyzeFuncs_sse.cpp 2013-08-02 01:18:33.000000000 +0400
-@@ -191,7 +191,7 @@
- prefetcht0(out+3*yline);
- // TODO: figure out why the intrinsic version crashes for MinGW build
- // not critical, but shuffle-only _MM_TRANSPOSE4_PS is optimal on some
--#if defined(USE_INTRINSICS) && defined(_MM_TRANSPOSE4_PS) && !defined(__GNUC__)
-+#if defined(USE_INTRINSICS) && (defined(_MM_TRANSPOSE4_PS) && !defined(__GNUC__) || defined(__clang__))
- register float4 row0=*(__m128 *)in;
- register float4 row1=*(__m128 *)(in+xline);
- register float4 row2=*(__m128 *)(in+2*xline);
-@@ -273,7 +273,7 @@
-
- // TODO: figure out why the intrinsic version crashes for MinGW build
- // not critical, but the shuffle-only _MM_TRANSPOSE4_PS is optimal on some
--#if defined(USE_INTRINSICS) && defined(_MM_TRANSPOSE4_PS) && !defined(__GNUC__)
-+#if defined(USE_INTRINSICS) && (defined(_MM_TRANSPOSE4_PS) && !defined(__GNUC__) || defined(__clang__))
- register float4 row0=*(__m128 *)in;
- register float4 row1=*(__m128 *)(in+xline);
- register float4 row2=*(__m128 *)(in+2*xline);
-@@ -1592,8 +1592,14 @@
- return ( tMax );
- }
-
-+#ifdef __clang__
-+#define s_getU( aaaa, ptr ) \
-+ aaaa = _mm_loadl_pi(aaaa, (__m64 *)ptr); \
-+ aaaa = _mm_loadh_pi(aaaa, ((__m64 *)(ptr))+1 )
-+#else
- #define s_getU( aaaa, ptr ) \
- aaaa = _mm_loadh_pi( _mm_loadl_pi(aaaa, (__m64 *)ptr), ((__m64 *)(ptr))+1 )
-+#endif
-
- #define s_putU( ptr, aaaa ) \
- _mm_storel_pi((__m64 *)ptr, aaaa), _mm_storeh_pi( ((__m64 *)ptr)+1 , aaaa)