#include "MachDeps.h"
module Data.Primitive.SIMD.Word64X4 (Word64X4) where
import Data.Primitive.SIMD.Class
import GHC.Word
import GHC.Types
import GHC.Prim
import GHC.Ptr
import GHC.ST
import Foreign.Storable
import Control.Monad.Primitive
import Data.Primitive.Types
import Data.Primitive.ByteArray
import Data.Primitive.Addr
import Data.Monoid
import Data.Typeable
import qualified Data.Vector.Primitive as PV
import qualified Data.Vector.Primitive.Mutable as PMV
import Data.Vector.Unboxed (Unbox)
import qualified Data.Vector.Unboxed as UV
import Data.Vector.Generic (Vector(..))
import Data.Vector.Generic.Mutable (MVector(..))
-- Unboxed type carried inside a 'Word64' (the argument of 'W64#') as used by
-- this module: 'Word#' when WORD_SIZE_IN_BITS is 64, 'Word64#' when it is 32.
-- Any other word size aborts preprocessing with an error.
#if WORD_SIZE_IN_BITS == 64
type RealWord64# = Word#
#elif WORD_SIZE_IN_BITS == 32
type RealWord64# = Word64#
#else
#error "WORD_SIZE_IN_BITS is neither 64 or 32"
#endif
-- | A vector of four 'Word64' lanes, stored as two 'Word64X2#' halves.
-- The first field holds lanes 0 and 1, the second field lanes 2 and 3
-- (see 'packWord64X4' / 'unpackWord64X4').
data Word64X4 = Word64X4 Word64X2# Word64X2# deriving Typeable
-- | Boxed front end for 'abs#': unwrap the 'Word64', apply 'abs#' to the raw
-- word and wrap the result again.
abs' :: Word64 -> Word64
abs' w = case w of
    W64# raw -> W64# (abs# raw)
-- | 'abs' from the 'Num' instance of 'Word64', lifted to the raw unboxed
-- representation: box the argument, apply 'abs', unbox the result.
abs# :: RealWord64# -> RealWord64#
abs# raw =
    let !(W64# result) = abs (W64# raw)
    in  result
-- | Boxed front end for 'signum#': unwrap the 'Word64', apply 'signum#' to
-- the raw word and wrap the result again.
signum' :: Word64 -> Word64
signum' w = case w of
    W64# raw -> W64# (signum# raw)
-- | 'signum' from the 'Num' instance of 'Word64', lifted to the raw unboxed
-- representation: box the argument, apply 'signum', unbox the result.
signum# :: RealWord64# -> RealWord64#
signum# raw =
    let !(W64# result) = signum (W64# raw)
    in  result
-- | Two vectors are equal exactly when all four lanes are equal.
-- Implemented by comparing the unpacked 4-tuples, whose 'Eq' instance
-- checks the components left to right.
instance Eq Word64X4 where
    a == b = unpackWord64X4 a == unpackWord64X4 b
-- | Lexicographic ordering over the lanes: the first lane is the most
-- significant, later lanes only break ties. Implemented through the 'Ord'
-- instance of the unpacked 4-tuples.
instance Ord Word64X4 where
    compare a b = compare (unpackWord64X4 a) (unpackWord64X4 b)
-- | Renders a vector as @Word64X4 (x1, x2, x3, x4)@.
-- The precedence argument is ignored, so no surrounding parentheses are
-- ever added.
instance Show Word64X4 where
    showsPrec _ v rest = case unpackWord64X4 v of
        (x1, x2, x3, x4) ->
            ( showString "Word64X4 ("
            . shows x1 . showString ", "
            . shows x2 . showString ", "
            . shows x3 . showString ", "
            . shows x4 . showString ")"
            ) rest
-- | Lane-wise arithmetic on the four 'Word64' lanes.
--
-- '+', '-' and '*' use the dedicated vector operations; 'negate', 'abs' and
-- 'signum' are applied to each lane through 'mapVector'.
instance Num Word64X4 where
    (+)         = plusWord64X4
    -- The subtraction operator name was missing here (the binding read
    -- @() = minusWord64X4@), leaving '-' undefined for this instance.
    (-)         = minusWord64X4
    (*)         = timesWord64X4
    negate      = mapVector negate
    abs         = mapVector abs'
    signum      = mapVector signum'
    -- The integer is converted to one element and copied into every lane.
    fromInteger = broadcastVector . fromInteger
-- | The bounds are the vectors whose every lane holds the corresponding
-- 'Word64' bound.
instance Bounded Word64X4 where
    maxBound = broadcastWord64X4 (maxBound :: Word64)
    minBound = broadcastWord64X4 (minBound :: Word64)
-- | Raw-memory access through 'Ptr'.
--
-- The size is the lane count times the lane size, and the alignment is set
-- to that same value. 'peek' and 'poke' delegate to the 'Addr'-based
-- accessors at element offset 0.
instance Storable Word64X4 where
    sizeOf v      = elementSize v * vectorSize v
    alignment v   = sizeOf v
    peek ptr      = case ptr of
        Ptr a -> readOffAddr (Addr a) 0
    poke (Ptr a) v = writeOffAddr (Addr a) 0 v
-- | Generic SIMD interface, wired to the monomorphic @...Word64X4@ functions
-- defined in this module.
instance SIMDVector Word64X4 where
    type Elem Word64X4      = Word64
    type ElemTuple Word64X4 = (Word64, Word64, Word64, Word64)

    -- Shape: four lanes with an element size of 8.
    vectorSize  _ = 4
    elementSize _ = 8

    -- Construction.
    nullVector         = broadcastWord64X4 0
    broadcastVector    = broadcastWord64X4
    packVector         = packWord64X4
    unsafeInsertVector = unsafeInsertWord64X4

    -- Deconstruction and traversal.
    unpackVector = unpackWord64X4
    mapVector    = mapWord64X4
    zipVector    = zipWord64X4
    foldVector   = foldWord64X4
    sumVector    = sumWord64X4
-- | Integral vector operations: quotient and remainder, both forwarded to
-- the monomorphic functions of this module.
instance SIMDIntVector Word64X4 where
    quotVector a b = quotWord64X4 a b
    remVector a b  = remWord64X4 a b
-- | Primitive array / address access for 'Word64X4'.
--
-- Every method re-boxes its raw arguments and forwards to the matching
-- @...Word64X4...@ accessor (or to the generic @set...@ helper). Monadic
-- accessors are run in 'ST': the state-passing function is taken out of the
-- 'ST' constructor and applied to the incoming state token.
instance Prim Word64X4 where
    sizeOf# v = case sizeOf v of
        I# n -> n
    alignment# v = case alignment v of
        I# n -> n

    indexByteArray# ba i = indexWord64X4Array (ByteArray ba) (I# i)
    readByteArray# mba i s =
        case readWord64X4Array (MutableByteArray mba) (I# i) of
            ST run -> run s
    writeByteArray# mba i v s =
        case writeWord64X4Array (MutableByteArray mba) (I# i) v of
            -- Only the new state token is needed; the unit result is dropped.
            ST run -> case run s of
                (# s', _ #) -> s'
    setByteArray# mba off n v s =
        case setByteArrayGeneric (MutableByteArray mba) (I# off) (I# n) v of
            ST run -> case run s of
                (# s', _ #) -> s'

    indexOffAddr# addr i = indexWord64X4OffAddr (Addr addr) (I# i)
    readOffAddr# addr i s =
        case readWord64X4OffAddr (Addr addr) (I# i) of
            ST run -> run s
    writeOffAddr# addr i v s =
        case writeWord64X4OffAddr (Addr addr) (I# i) v of
            ST run -> case run s of
                (# s', _ #) -> s'
    setOffAddr# addr off n v s =
        case setOffAddrGeneric (Addr addr) (I# off) (I# n) v of
            ST run -> case run s of
                (# s', _ #) -> s'
-- | Unboxed immutable vectors of 'Word64X4' are newtype wrappers around
-- primitive vectors of the same element type.
newtype instance UV.Vector Word64X4 = V_Word64X4 (PV.Vector Word64X4)
-- | Unboxed mutable vectors of 'Word64X4' are newtype wrappers around
-- mutable primitive vectors of the same element type.
newtype instance UV.MVector s Word64X4 = MV_Word64X4 (PMV.MVector s Word64X4)
-- | Immutable generic-vector operations: each method unwraps the newtype,
-- calls the corresponding primitive-vector operation and re-wraps the result
-- where one is produced.
instance Vector UV.Vector Word64X4 where
    basicUnsafeFreeze (MV_Word64X4 mv) = fmap V_Word64X4 (PV.unsafeFreeze mv)
    basicUnsafeThaw (V_Word64X4 v)     = fmap MV_Word64X4 (PV.unsafeThaw v)
    basicLength (V_Word64X4 v)         = PV.length v
    basicUnsafeSlice start len (V_Word64X4 v) =
        V_Word64X4 $ PV.unsafeSlice start len v
    basicUnsafeIndexM (V_Word64X4 v) i = PV.unsafeIndexM v i
    basicUnsafeCopy (MV_Word64X4 dst) (V_Word64X4 src) = PV.unsafeCopy dst src
    -- Forcing an element is plain 'seq'; the vector argument is ignored.
    elemseq _ x rest = x `seq` rest
-- | Mutable generic-vector operations: each method unwraps the newtype and
-- calls the corresponding mutable primitive-vector operation.
-- 'basicInitialize' is only defined when building against vector >= 0.11.
instance MVector UV.MVector Word64X4 where
    basicLength (MV_Word64X4 mv) = PMV.length mv
    basicUnsafeSlice start len (MV_Word64X4 mv) =
        MV_Word64X4 $ PMV.unsafeSlice start len mv
    basicOverlaps (MV_Word64X4 lhs) (MV_Word64X4 rhs) = PMV.overlaps lhs rhs
    basicUnsafeNew len = fmap MV_Word64X4 (PMV.unsafeNew len)
#if MIN_VERSION_vector(0,11,0)
    basicInitialize (MV_Word64X4 mv) = basicInitialize mv
#endif
    basicUnsafeRead (MV_Word64X4 mv) i    = PMV.unsafeRead mv i
    basicUnsafeWrite (MV_Word64X4 mv) i x = PMV.unsafeWrite mv i x
-- | 'Word64X4' can be stored in unboxed vectors; the instance has no methods
-- of its own.
instance Unbox Word64X4
-- | Build a vector whose four lanes all hold the given value. The two-lane
-- broadcast is computed once and used for both halves.
broadcastWord64X4 :: Word64 -> Word64X4
broadcastWord64X4 (W64# x) =
    let half = broadcastWord64X2# x
    in  Word64X4 half half
-- | Pack a 4-tuple into a vector: the first two components form the first
-- half, the last two components the second half.
packWord64X4 :: (Word64, Word64, Word64, Word64) -> Word64X4
packWord64X4 lanes = case lanes of
    (W64# a, W64# b, W64# c, W64# d) ->
        Word64X4 (packWord64X2# (# a, b #))
                 (packWord64X2# (# c, d #))
-- | Unpack a vector into a 4-tuple: lanes of the first half come first,
-- followed by the lanes of the second half.
unpackWord64X4 :: Word64X4 -> (Word64, Word64, Word64, Word64)
unpackWord64X4 (Word64X4 lo hi) =
    let !(# a, b #) = unpackWord64X2# lo
        !(# c, d #) = unpackWord64X2# hi
    in  (W64# a, W64# b, W64# c, W64# d)
-- | Replace one lane of the vector with the given value.
--
-- Indices below 2 address the first half directly; all other indices are
-- rebased by 2 and address the second half. No bounds check is performed
-- here.
unsafeInsertWord64X4 :: Word64X4 -> Word64 -> Int -> Word64X4
unsafeInsertWord64X4 (Word64X4 lo hi) (W64# y) idx@(I# i)
    | idx >= 2  = Word64X4 lo (insertWord64X2# hi y (i -# 2#))
    | otherwise = Word64X4 (insertWord64X2# lo y i) hi
-- | Apply a function to every lane. The boxed function is adapted to the
-- raw representation and handed to 'mapWord64X4#'.
mapWord64X4 :: (Word64 -> Word64) -> Word64X4 -> Word64X4
mapWord64X4 f = mapWord64X4# onRaw
  where
    -- Box the raw word, run the user function, unbox the result.
    onRaw raw = case f (W64# raw) of
        W64# out -> out
-- | Apply a function on raw words to every lane, processing each two-lane
-- half by unpacking it, mapping both lanes and packing the results again.
mapWord64X4# :: (RealWord64# -> RealWord64#) -> Word64X4 -> Word64X4
mapWord64X4# f = \ (Word64X4 lo hi) -> Word64X4 (onHalf lo) (onHalf hi)
  where
    onHalf half = case unpackWord64X2# half of
        (# a, b #) -> packWord64X2# (# f a, f b #)
-- | Combine two vectors lane by lane with the given function.
zipWord64X4 :: (Word64 -> Word64 -> Word64) -> Word64X4 -> Word64X4 -> Word64X4
zipWord64X4 f = \ v1 v2 ->
    -- Both vectors are unpacked strictly, first operand first.
    let !(x1, x2, x3, x4) = unpackWord64X4 v1
        !(y1, y2, y3, y4) = unpackWord64X4 v2
    in  packWord64X4 (f x1 y1, f x2 y2, f x3 y3, f x4 y4)
-- | Left-associated reduction of the four lanes with the given function:
-- @((x1 `op` x2) `op` x3) `op` x4@. Both arguments are forced before every
-- application.
foldWord64X4 :: (Word64 -> Word64 -> Word64) -> Word64X4 -> Word64
foldWord64X4 op = \ v -> case unpackWord64X4 v of
    (x1, x2, x3, x4) -> step (step (step x1 x2) x3) x4
  where
    step !acc !x = op acc x
-- | Sum of all four lanes: the two halves are added as vectors first, then
-- the two lanes of that result are added as scalars.
sumWord64X4 :: Word64X4 -> Word64
sumWord64X4 (Word64X4 lo hi) =
    let !(# a, b #) = unpackWord64X2# (plusWord64X2# lo hi)
    in  W64# a + W64# b
-- | Lane-wise addition, performed independently on each half.
plusWord64X4 :: Word64X4 -> Word64X4 -> Word64X4
plusWord64X4 (Word64X4 aLo aHi) (Word64X4 bLo bHi) =
    Word64X4 (plusWord64X2# aLo bLo)
             (plusWord64X2# aHi bHi)
-- | Lane-wise subtraction (first operand minus second), performed
-- independently on each half.
minusWord64X4 :: Word64X4 -> Word64X4 -> Word64X4
minusWord64X4 (Word64X4 aLo aHi) (Word64X4 bLo bHi) =
    Word64X4 (minusWord64X2# aLo bLo)
             (minusWord64X2# aHi bHi)
-- | Lane-wise multiplication, performed independently on each half.
timesWord64X4 :: Word64X4 -> Word64X4 -> Word64X4
timesWord64X4 (Word64X4 aLo aHi) (Word64X4 bLo bHi) =
    Word64X4 (timesWord64X2# aLo bLo)
             (timesWord64X2# aHi bHi)
-- | Lane-wise quotient (first operand divided by second), performed
-- independently on each half.
quotWord64X4 :: Word64X4 -> Word64X4 -> Word64X4
quotWord64X4 (Word64X4 aLo aHi) (Word64X4 bLo bHi) =
    Word64X4 (quotWord64X2# aLo bLo)
             (quotWord64X2# aHi bHi)
-- | Lane-wise remainder (first operand modulo second), performed
-- independently on each half.
remWord64X4 :: Word64X4 -> Word64X4 -> Word64X4
remWord64X4 (Word64X4 aLo aHi) (Word64X4 bLo bHi) =
    Word64X4 (remWord64X2# aLo bLo)
             (remWord64X2# aHi bHi)
-- | Read the vector at the given element index from an immutable byte array.
-- Element @i@ occupies the two consecutive 'Word64X2#' slots @2*i@ and
-- @2*i + 1@.
indexWord64X4Array :: ByteArray -> Int -> Word64X4
indexWord64X4Array (ByteArray a) (I# i) =
    let base = i *# 2#
    in  Word64X4 (indexWord64X2Array# a base)
                 (indexWord64X2Array# a (base +# 1#))
-- | Read the vector at the given element index from a mutable byte array.
-- Element @i@ occupies the two consecutive 'Word64X2#' slots @2*i@ and
-- @2*i + 1@; the first half is read before the second.
readWord64X4Array :: PrimMonad m => MutableByteArray (PrimState m) -> Int -> m Word64X4
readWord64X4Array (MutableByteArray a) (I# i) = primitive (\ s0 ->
    let base = i *# 2#
    in  case readWord64X2Array# a base s0 of
            (# s1, lo #) -> case readWord64X2Array# a (base +# 1#) s1 of
                (# s2, hi #) -> (# s2, Word64X4 lo hi #))
-- | Write a vector at the given element index of a mutable byte array.
-- The first half goes to 'Word64X2#' slot @2*i@, then the second half to
-- slot @2*i + 1@.
writeWord64X4Array :: PrimMonad m => MutableByteArray (PrimState m) -> Int -> Word64X4 -> m ()
writeWord64X4Array (MutableByteArray a) (I# i) (Word64X4 lo hi) =
    let base = i *# 2#
    in  do
            primitive_ (writeWord64X2Array# a base lo)
            primitive_ (writeWord64X2Array# a (base +# 1#) hi)
-- | Read the vector at the given element index relative to an address.
-- Element @i@ starts @32*i@ bytes past the address; its second half starts
-- 16 bytes after its first.
indexWord64X4OffAddr :: Addr -> Int -> Word64X4
indexWord64X4OffAddr (Addr a) (I# i) =
    let base = plusAddr# a (i *# 32#)
    in  Word64X4 (indexWord64X2OffAddr# base 0#)
                 (indexWord64X2OffAddr# (plusAddr# base 16#) 0#)
-- | Monadic read of the vector at the given element index relative to an
-- address. Element @i@ starts @32*i@ bytes past the address; the first half
-- is read from there, then the second half from 16 bytes further on.
readWord64X4OffAddr :: PrimMonad m => Addr -> Int -> m Word64X4
readWord64X4OffAddr (Addr a) (I# i) = primitive (\ s0 ->
    let base = plusAddr# a (i *# 32#)
    in  case readWord64X2OffAddr# base 0# s0 of
            (# s1, lo #) -> case readWord64X2OffAddr# (plusAddr# base 16#) 0# s1 of
                (# s2, hi #) -> (# s2, Word64X4 lo hi #))
-- | Write a vector at the given element index relative to an address.
-- Element @i@ starts @32*i@ bytes past the address; the first half is
-- written there, then the second half 16 bytes further on.
writeWord64X4OffAddr :: PrimMonad m => Addr -> Int -> Word64X4 -> m ()
writeWord64X4OffAddr (Addr a) (I# i) (Word64X4 lo hi) =
    let base = plusAddr# a (i *# 32#)
    in  do
            primitive_ (writeWord64X2OffAddr# base 0# lo)
            primitive_ (writeWord64X2OffAddr# (plusAddr# base 16#) 0# hi)