diff options
Diffstat (limited to 'testsuite/tests/codeGen/should_run/simd004.hs')
-rw-r--r-- | testsuite/tests/codeGen/should_run/simd004.hs | 95 |
1 files changed, 95 insertions, 0 deletions
diff --git a/testsuite/tests/codeGen/should_run/simd004.hs b/testsuite/tests/codeGen/should_run/simd004.hs new file mode 100644 index 0000000000..5216822ec4 --- /dev/null +++ b/testsuite/tests/codeGen/should_run/simd004.hs @@ -0,0 +1,95 @@ +{-# OPTIONS_GHC -O2 #-} +{-# OPTIONS_GHC -mavx #-} +{-# OPTIONS_GHC -msse4 #-} +{-# LANGUAGE MagicHash #-} +{-# LANGUAGE UnboxedTuples #-} +-- !!! test if enabling -O2 produces wrong results while +-- packing , broadcasting, unpacking vectors and for +-- arithmetic operations as well for avx instructions + +import GHC.Exts + +data FloatX4 = FX4# FloatX4# + +instance Show FloatX4 where + show (FX4# f) = case (unpackFloatX4# f) of + (# a, b, c, d #) -> show ((F# a), (F# b), (F# c), (F# d)) + + +instance Eq FloatX4 where + (FX4# a) == (FX4# b) + = case (unpackFloatX4# a) of + (# a1, a2, a3, a4 #) -> + case (unpackFloatX4# b) of + (# b1, b2, b3, b4 #) -> (F# a1) == (F# b1) && + (F# a2) == (F# b2) && + (F# a3) == (F# b3) && + (F# a4) == (F# b4) + +data DoubleX2 = DX2# DoubleX2# + +instance Show DoubleX2 where + show (DX2# d) = case (unpackDoubleX2# d) of + (# a, b #) -> show ((D# a), (D# b)) + + +instance Eq DoubleX2 where + (DX2# a) == (DX2# b) + = case (unpackDoubleX2# a) of + (# a1, a2 #) -> + case (unpackDoubleX2# b) of + (# b1, b2 #) -> (D# a1) == (D# b1) && + (D# a2) == (D# b2) + + +main :: IO () +main = do + + -- !!! test broadcasting, packing and unpacking for vector types + -- FloatX4# + case unpackFloatX4# (broadcastFloatX4# 1.5#) of + (# a, b, c, d #) -> print (F# a, F# b, F# c, F# d) + case unpackFloatX4# (packFloatX4# (# 4.5#,7.8#, 2.3#, 6.5# #)) of + (# a, b, c, d #) -> print (F# a, F# b, F# c, F# d) + + -- DoubleX2# + case unpackDoubleX2# (broadcastDoubleX2# 6.5##) of + (# a, b #) -> print (D# a, D# b) + case unpackDoubleX2# (packDoubleX2# (# 8.9##,7.2## #)) of + (# a, b #) -> print (D# a, D# b) + + + -- !!! test the lifting of unlifted vector types and + -- defining various typeclass instances for the lifted types + + print (FX4# (broadcastFloatX4# 1.5#)) + print $ (FX4# (broadcastFloatX4# 1.5#)) == (FX4# (broadcastFloatX4# 2.5#)) + print $ (FX4# (broadcastFloatX4# 3.5#)) == (FX4# (broadcastFloatX4# 3.5#)) + + print (DX2# (broadcastDoubleX2# 2.5##)) + print $ (DX2# + (broadcastDoubleX2# 1.5##)) == (DX2# (broadcastDoubleX2# 2.5##)) + print $ (DX2# + (broadcastDoubleX2# 3.5##)) == (DX2# (broadcastDoubleX2# 3.5##)) + + + -- !!! test arithmetic vector operations + print (FX4# (plusFloatX4# (packFloatX4# (# 4.5#,7.8#, 2.3#, 6.5# #)) + (packFloatX4# (# 8.2#,6.3#, 4.7#, 9.2# #)))) + print (FX4# (minusFloatX4# (packFloatX4# (# 4.5#,7.8#, 2.3#, 6.5# #)) + (packFloatX4# (# 8.2#,6.3#, 4.7#, 9.2# #)))) + print (FX4# (timesFloatX4# (packFloatX4# (# 4.5#,7.8#, 2.3#, 6.5# #)) + (packFloatX4# (# 8.2#,6.3#, 4.7#, 9.2# #)))) + print (FX4# (divideFloatX4# (packFloatX4# (# 4.5#,7.8#, 2.3#, 6.5# #)) + (packFloatX4# (# 8.2#,6.3#, 4.7#, 9.2# #)))) + print (FX4# (negateFloatX4# (packFloatX4# (# 4.5#,7.8#, 2.3#, 6.5# #)))) + + print (DX2# (plusDoubleX2# (broadcastDoubleX2# 1.3##) + (broadcastDoubleX2# 2.2##))) + print (DX2# (minusDoubleX2# (broadcastDoubleX2# 3.5##) + (broadcastDoubleX2# 2.2##))) + print (DX2# (timesDoubleX2# (broadcastDoubleX2# 2.4##) + (broadcastDoubleX2# 2.2##))) + print (DX2# (divideDoubleX2# (broadcastDoubleX2# 9.2##) + (broadcastDoubleX2# 4.0##))) + print (DX2# (negateDoubleX2# (broadcastDoubleX2# 3.5##))) |