From 89853488275b118f6f2ba7724eec30f4d37d67b9 Mon Sep 17 00:00:00 2001 From: Erik Schnetter Date: Fri, 30 Oct 2015 10:53:52 -0400 Subject: Improve optimization barriers --- vec_pseudo.h | 29 +---------------------------- 1 file changed, 1 insertion(+), 28 deletions(-) (limited to 'vec_pseudo.h') diff --git a/vec_pseudo.h b/vec_pseudo.h index c4cbbc1..fa2895c 100644 --- a/vec_pseudo.h +++ b/vec_pseudo.h @@ -472,35 +472,8 @@ template struct realpseudovec : floatprops { } #endif void barrier() { -#if defined __GNUC__ && !defined __clang__ && !defined __ICC -// GCC crashes when +X is used as constraint -#if defined __SSE2__ for (int d = 0; d < size; ++d) - __asm__("" : "+x"(v[d])); -#elif defined __PPC64__ // maybe also __PPC__ - for (int d = 0; d < size; ++d) - __asm__("" : "+f"(v[d])); -#elif defined __arm__ - for (int d = 0; d < size; ++d) - __asm__("" : "+w"(v[d])); -#else -#error "Floating point barrier undefined on this architecture" -#endif -#elif defined __clang__ - for (int d = 0; d < size; ++d) - __asm__("" : "+X"(v[d])); -#elif defined __ICC - for (int d = 0; d < size; ++d) { - real_t tmp = v[d]; - __asm__("" : "+X"(tmp)); - v[d] = tmp; - } -#elif defined __IBMCPP__ - for (int d = 0; d < size; ++d) - __asm__("" : "+f"(v[d])); -#else -#error "Floating point barrier undefined on this architecture" -#endif + v[d] = vecmathlib::barrier(v[d]); } typedef boolpseudovec boolvec_t; -- cgit v1.1