From 953441badfbe4b08873d430e6aa0f08b66296489 Mon Sep 17 00:00:00 2001 From: Jussi Pakkanen Date: Mon, 13 Feb 2017 22:08:24 +0200 Subject: [PATCH] Added SSE2 support. --- test cases/common/139 simd/meson.build | 25 ++++++++++++++---------- test cases/common/139 simd/simd_sse2.c | 25 ++++++++++++++++++++++++ test cases/common/139 simd/simdchecker.c | 6 ++++++ 3 files changed, 46 insertions(+), 10 deletions(-) create mode 100644 test cases/common/139 simd/simd_sse2.c diff --git a/test cases/common/139 simd/meson.build b/test cases/common/139 simd/meson.build index 5311460cc..d717dba7e 100644 --- a/test cases/common/139 simd/meson.build +++ b/test cases/common/139 simd/meson.build @@ -17,7 +17,6 @@ cdata = configuration_data() # and then have a target that uses the result in links_with. # The following headers need to be added. Also Thumb and Altivec. -# SSE2 # SSE3 # SSSE3 # SSE4.1 @@ -29,15 +28,21 @@ cdata = configuration_data() simdlibs = [] -if cc.has_argument('-mmmx') - cdata.set('HAVE_MMX', 1) - simdlibs += static_library('simd_mmx', 'simd_mmx.c', c_args : '-mmmx') -endif - -if cc.has_argument('-msse') - cdata.set('HAVE_SSE', 1) - simdlibs += static_library('simd_sse', 'simd_sse.c', c_args : '-msse') -endif +simdarr = [['-mmx', 'HAVE_MMX', 'simd_mmx', 'simd_mmx.c'], + ['-msse', 'HAVE_SSE', 'simd_sse', 'simd_sse.c'], + ['-msse2', 'HAVE_SSE2', 'simd_sse2', 'simd_sse2.c'], +] + +foreach ia : simdarr + arg = ia[0] + def = ia[1] + libname = ia[2] + filename = ia[3] + if cc.has_argument(arg) + cdata.set(def, 1) + simdlibs += static_library(libname, filename, c_args : arg) + endif +endforeach configure_file(output : 'simdconfig.h', configuration : cdata) diff --git a/test cases/common/139 simd/simd_sse2.c b/test cases/common/139 simd/simd_sse2.c new file mode 100644 index 000000000..52a7e4017 --- /dev/null +++ b/test cases/common/139 simd/simd_sse2.c @@ -0,0 +1,25 @@ +#include +#include + +#include +#include +#include + +int sse2_available() { + return __builtin_cpu_supports("sse2"); +} + +void increment_sse2(float arr[4]) { + double darr[4]; + __m128d val1 = _mm_set_pd(arr[0], arr[1]); + __m128d val2 = _mm_set_pd(arr[2], arr[3]); + __m128d one = _mm_set_pd1(1.0); + __m128d result = _mm_add_pd(val1, one); + _mm_store_pd(darr, result); + result = _mm_add_pd(val2, one); + _mm_store_pd(&darr[2], result); + arr[0] = (float)darr[1]; + arr[1] = (float)darr[0]; + arr[2] = (float)darr[3]; + arr[3] = (float)darr[2]; +} diff --git a/test cases/common/139 simd/simdchecker.c b/test cases/common/139 simd/simdchecker.c index b3c94f95c..ce28f054d 100644 --- a/test cases/common/139 simd/simdchecker.c +++ b/test cases/common/139 simd/simdchecker.c @@ -17,6 +17,12 @@ int main(int argc, char **argv) { /* Add here. The first matched one is used so put "better" instruction * sets at the top. */ +#if HAVE_SSE2 + if(fptr == NULL && sse2_available()) { + fptr = increment_sse2; + type = "SSE2"; + } +#endif #if HAVE_SSE if(fptr == NULL && sse_available()) { fptr = increment_sse;