diff options
Diffstat (limited to 'libitm/config/x86/x86_avx.cc')
-rw-r--r-- | libitm/config/x86/x86_avx.cc | 78 |
1 files changed, 78 insertions, 0 deletions
diff --git a/libitm/config/x86/x86_avx.cc b/libitm/config/x86/x86_avx.cc
index 30420aa87f5..cd20fe25cdc 100644
--- a/libitm/config/x86/x86_avx.cc
+++ b/libitm/config/x86/x86_avx.cc
@@ -22,9 +22,85 @@
    see the files COPYING3 and COPYING.RUNTIME respectively. If not, see
    <http://www.gnu.org/licenses/>. */
 
+#include "config.h"
+
+// ??? This is pretty gross, but we're going to frob types of the functions.
+// Is this better or worse than just admitting we need to do this in pure
+// assembly?
+
+// When HAVE_AS_AVX is not defined (presumably by config.h), hide __AVX__
+// from the headers included below; the 32-byte vector type is then declared
+// by hand further down.
+#ifndef HAVE_AS_AVX
+#undef __AVX__
+#endif
+
 #include "libitm_i.h"
 #include "dispatch.h"
 
+extern "C" {
+
+#ifndef HAVE_AS_AVX
+// 32-byte float vector used as the M256 type while __AVX__ is hidden.
+typedef float _ITM_TYPE_M256 __attribute__((vector_size(32), may_alias));
+#endif
+
+// ??? Re-define the memcpy implementations so that we can frob the
+// interface to deal with possibly missing AVX instruction set support.
+
+// Helper macros used by ITM_READ_MEMCPY / ITM_WRITE_MEMCPY below:
+//   RETURN(X)   hand the loaded value X back to the caller
+//   STORE(X,Y)  capture the incoming value Y into the local X
+//   OUTPUT(T)   return type of the load function
+//   INPUT(T,X)  trailing value parameter of the store function
+// With HAVE_AS_AVX these are ordinary C++.  Without it the functions are
+// declared as returning void / taking no value parameter, and the value is
+// moved between memory and %ymm0 with hand-encoded instructions.
+#ifdef HAVE_AS_AVX
+#define RETURN(X) return X
+#define STORE(X,Y) X = Y
+#define OUTPUT(T) _ITM_TYPE_##T
+#define INPUT(T,X) , _ITM_TYPE_##T X
+#else
+/* Emit vmovaps (%rax),%ymm0.  The asm only reads X, so X is passed as a
+   memory input; this keeps the preceding store into X live.  */
+#define RETURN(X) \
+  asm volatile(".byte 0xc5,0xfc,0x28,0x00" : : "a"(&X), "m"(X))
+/* Emit vmovaps %ymm0,(%rax); vzeroupper.  The asm writes X, so X is a
+   memory output.  Y is intentionally unused: INPUT() declares no
+   parameter in this configuration.  */
+#define STORE(X,Y) \
+  asm volatile(".byte 0xc5,0xfc,0x29,0x00,0xc5,0xf8,0x77" : "=m"(X) : "a"(&X))
+#define OUTPUT(T) void
+#define INPUT(T,X)
+#endif
+
+// Load entry point _ITM_<LSMOD><T>: a local is filled from PTR through
+// memtransfer##M2 (sizeof(T) bytes) and then handed back with RETURN.
+#undef ITM_READ_MEMCPY
+#define ITM_READ_MEMCPY(T, LSMOD, TARGET, M2) \
+OUTPUT(T) ITM_REGPARM _ITM_##LSMOD##T (const _ITM_TYPE_##T *ptr) \
+{ \
+  _ITM_TYPE_##T v; \
+  TARGET memtransfer##M2(&v, ptr, sizeof(_ITM_TYPE_##T), false, \
+                         GTM::abi_dispatch::NONTXNAL, \
+                         GTM::abi_dispatch::LSMOD); \
+  RETURN(v); \
+}
+
+// Store entry point _ITM_<LSMOD><T>: STORE captures the incoming value in a
+// local, which memtransfer##M2 then transfers to PTR (sizeof(T) bytes).
+#undef ITM_WRITE_MEMCPY
+#define ITM_WRITE_MEMCPY(T, LSMOD, TARGET, M2) \
+void ITM_REGPARM _ITM_##LSMOD##T (_ITM_TYPE_##T *ptr INPUT(T,in)) \
+{ \
+  _ITM_TYPE_##T v; \
+  STORE(v, in); \
+  TARGET memtransfer##M2(ptr, &v, sizeof(_ITM_TYPE_##T), false, \
+                         GTM::abi_dispatch::LSMOD, \
+                         GTM::abi_dispatch::NONTXNAL); \
+}
+
 // ??? Use memcpy for now, until we have figured out how to best instantiate
 // these loads/stores.
 CREATE_DISPATCH_FUNCTIONS_T_MEMCPY(M256, GTM::abi_disp()->, )
@@ -34,3 +110,5 @@ _ITM_LM256 (const _ITM_TYPE_M256 *ptr)
 {
   GTM::GTM_LB (ptr, sizeof (*ptr));
 }
+
+}
|