author     Jeffrey Walton <noloader@gmail.com>    2018-11-19 02:28:29 -0500
committer  Jeffrey Walton <noloader@gmail.com>    2018-11-19 02:28:29 -0500
commit     3129ad4d705f88d5ddf72ef9975dac8d08fa7fe9 (patch)
tree       20d1b90a217ba97797c63fdc9ca730b59ae0875f /gcm_simd.cpp
parent     c9f1a26024d6e099f4c7e57e9ca8391a780dbe1a (diff)
Fix LLVM Clang compile on PowerPC
Diffstat (limited to 'gcm_simd.cpp')
-rw-r--r--    gcm_simd.cpp    21
1 file changed, 16 insertions(+), 5 deletions(-)
diff --git a/gcm_simd.cpp b/gcm_simd.cpp
index b701f398..78e842b5 100644
--- a/gcm_simd.cpp
+++ b/gcm_simd.cpp
@@ -64,7 +64,7 @@ extern const char GCM_SIMD_FNAME[] = __FILE__;
ANONYMOUS_NAMESPACE_BEGIN
-// ************************* Miscellaneous ************************* //
+// *************************** ARM NEON *************************** //
#if CRYPTOPP_ARM_PMULL_AVAILABLE
#if defined(__GNUC__)
@@ -168,7 +168,10 @@ inline uint64x2_t VEXT_U8(uint64x2_t a, uint64x2_t b)
#endif // Microsoft and compatibles
#endif // CRYPTOPP_ARM_PMULL_AVAILABLE
+// ************************** Power 8 Crypto ************************** //
+
#if CRYPTOPP_POWER8_VMULL_AVAILABLE
+
using CryptoPP::uint32x4_p;
using CryptoPP::uint64x2_p;
using CryptoPP::VecGetLow;
@@ -201,8 +204,10 @@ inline uint64x2_p VMULL2LE(const uint64x2_p& val)
// _mm_clmulepi64_si128(a, b, 0x00)
inline uint64x2_p VMULL_00LE(const uint64x2_p& a, const uint64x2_p& b)
{
-#if defined(__xlc__) || defined(__xlC__) || defined(__clang__)
+#if defined(__ibmxl__) || (defined(_AIX) && defined(__xlC__))
return VMULL2LE(__vpmsumd (VecGetHigh(a), VecGetHigh(b)));
+#elif defined(__clang__)
+ return VMULL2LE(__builtin_altivec_crypto_vpmsumd (VecGetHigh(a), VecGetHigh(b)));
#else
return VMULL2LE(__builtin_crypto_vpmsumd (VecGetHigh(a), VecGetHigh(b)));
#endif
@@ -214,8 +219,10 @@ inline uint64x2_p VMULL_01LE(const uint64x2_p& a, const uint64x2_p& b)
// Small speedup. VecGetHigh(b) ensures the high dword of 'b' is 0.
// The 0 used in the vmull yields 0 for the high product, so the high
// dword of 'a' is "don't care".
-#if defined(__xlc__) || defined(__xlC__) || defined(__clang__)
+#if defined(__ibmxl__) || (defined(_AIX) && defined(__xlC__))
return VMULL2LE(__vpmsumd (a, VecGetHigh(b)));
+#elif defined(__clang__)
+ return VMULL2LE(__builtin_altivec_crypto_vpmsumd (a, VecGetHigh(b)));
#else
return VMULL2LE(__builtin_crypto_vpmsumd (a, VecGetHigh(b)));
#endif
@@ -227,8 +234,10 @@ inline uint64x2_p VMULL_10LE(const uint64x2_p& a, const uint64x2_p& b)
// Small speedup. VecGetHigh(a) ensures the high dword of 'a' is 0.
// The 0 used in the vmull yields 0 for the high product, so the high
// dword of 'b' is "don't care".
-#if defined(__xlc__) || defined(__xlC__) || defined(__clang__)
+#if defined(__ibmxl__) || (defined(_AIX) && defined(__xlC__))
return VMULL2LE(__vpmsumd (VecGetHigh(a), b));
+#elif defined(__clang__)
+ return VMULL2LE(__builtin_altivec_crypto_vpmsumd (VecGetHigh(a), b));
#else
return VMULL2LE(__builtin_crypto_vpmsumd (VecGetHigh(a), b));
#endif
@@ -240,8 +249,10 @@ inline uint64x2_p VMULL_11LE(const uint64x2_p& a, const uint64x2_p& b)
// Small speedup. VecGetLow(a) ensures the high dword of 'a' is 0.
// The 0 used in the vmull yields 0 for the high product, so the high
// dword of 'b' is "don't care".
-#if defined(__xlc__) || defined(__xlC__) || defined(__clang__)
+#if defined(__ibmxl__) || (defined(_AIX) && defined(__xlC__))
return VMULL2LE(__vpmsumd (VecGetLow(a), b));
+#elif defined(__clang__)
+ return VMULL2LE(__builtin_altivec_crypto_vpmsumd (VecGetLow(a), b));
#else
return VMULL2LE(__builtin_crypto_vpmsumd (VecGetLow(a), b));
#endif
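
For context, the sketch below illustrates, outside of gcm_simd.cpp, the compiler dispatch this patch introduces for the POWER8 vpmsumd carry-less multiply: __vpmsumd on IBM XL C/C++, __builtin_altivec_crypto_vpmsumd on LLVM Clang, and __builtin_crypto_vpmsumd on GCC. It is a minimal, hypothetical example; the name PMULL_00 and the simplified signature are not part of the patch, and the real functions additionally apply the VMULL2LE little-endian correction and the VecGetLow/VecGetHigh dword selection shown in the diff.

// Minimal standalone sketch (not from the patch) of the compiler dispatch
// for the POWER8 carry-less multiply intrinsic. Build with -mcpu=power8
// (GCC/Clang) or -qarch=pwr8 (IBM XL).
#include <altivec.h>

typedef __vector unsigned long long uint64x2_p;

inline uint64x2_p PMULL_00(const uint64x2_p a, const uint64x2_p b)
{
#if defined(__ibmxl__) || (defined(_AIX) && defined(__xlC__))
    // IBM XL C/C++ (modern xlclang-based, or legacy xlC on AIX) exposes __vpmsumd.
    return __vpmsumd(a, b);
#elif defined(__clang__)
    // LLVM Clang does not provide GCC's __builtin_crypto_vpmsumd; it offers the
    // Altivec-prefixed builtin instead, which is what this patch switches to.
    return __builtin_altivec_crypto_vpmsumd(a, b);
#else
    // GCC provides __builtin_crypto_vpmsumd when targeting POWER8.
    return __builtin_crypto_vpmsumd(a, b);
#endif
}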