module Data.Primitive.SIMD.Int16X32 (Int16X32) where
import Data.Primitive.SIMD.Class
import GHC.Int
import GHC.Types
import GHC.Prim
import GHC.Ptr
import GHC.ST
import Foreign.Storable
import Control.Monad.Primitive
import Data.Primitive.Types
import Data.Primitive.ByteArray
import Data.Primitive.Addr
import Data.Monoid
import Data.Typeable
import qualified Data.Vector.Primitive as PV
import qualified Data.Vector.Primitive.Mutable as PMV
import Data.Vector.Unboxed (Unbox)
import qualified Data.Vector.Unboxed as UV
import Data.Vector.Generic (Vector(..))
import Data.Vector.Generic.Mutable (MVector(..))
data Int16X32 = Int16X32 Int16X8# Int16X8# Int16X8# Int16X8# deriving Typeable
abs' :: Int16 -> Int16
abs' (I16# x) = I16# (abs# x)
abs# :: Int# -> Int#
abs# x = case abs (I16# x) of
I16# y -> y
signum' :: Int16 -> Int16
signum' (I16# x) = I16# (signum# x)
signum# :: Int# -> Int#
signum# x = case signum (I16# x) of
I16# y -> y
instance Eq Int16X32 where
a == b = case unpackInt16X32 a of
(x1, x2, x3, x4, x5, x6, x7, x8, x9, x10, x11, x12, x13, x14, x15, x16, x17, x18, x19, x20, x21, x22, x23, x24, x25, x26, x27, x28, x29, x30, x31, x32) -> case unpackInt16X32 b of
(y1, y2, y3, y4, y5, y6, y7, y8, y9, y10, y11, y12, y13, y14, y15, y16, y17, y18, y19, y20, y21, y22, y23, y24, y25, y26, y27, y28, y29, y30, y31, y32) -> x1 == y1 && x2 == y2 && x3 == y3 && x4 == y4 && x5 == y5 && x6 == y6 && x7 == y7 && x8 == y8 && x9 == y9 && x10 == y10 && x11 == y11 && x12 == y12 && x13 == y13 && x14 == y14 && x15 == y15 && x16 == y16 && x17 == y17 && x18 == y18 && x19 == y19 && x20 == y20 && x21 == y21 && x22 == y22 && x23 == y23 && x24 == y24 && x25 == y25 && x26 == y26 && x27 == y27 && x28 == y28 && x29 == y29 && x30 == y30 && x31 == y31 && x32 == y32
instance Ord Int16X32 where
a `compare` b = case unpackInt16X32 a of
(x1, x2, x3, x4, x5, x6, x7, x8, x9, x10, x11, x12, x13, x14, x15, x16, x17, x18, x19, x20, x21, x22, x23, x24, x25, x26, x27, x28, x29, x30, x31, x32) -> case unpackInt16X32 b of
(y1, y2, y3, y4, y5, y6, y7, y8, y9, y10, y11, y12, y13, y14, y15, y16, y17, y18, y19, y20, y21, y22, y23, y24, y25, y26, y27, y28, y29, y30, y31, y32) -> x1 `compare` y1 <> x2 `compare` y2 <> x3 `compare` y3 <> x4 `compare` y4 <> x5 `compare` y5 <> x6 `compare` y6 <> x7 `compare` y7 <> x8 `compare` y8 <> x9 `compare` y9 <> x10 `compare` y10 <> x11 `compare` y11 <> x12 `compare` y12 <> x13 `compare` y13 <> x14 `compare` y14 <> x15 `compare` y15 <> x16 `compare` y16 <> x17 `compare` y17 <> x18 `compare` y18 <> x19 `compare` y19 <> x20 `compare` y20 <> x21 `compare` y21 <> x22 `compare` y22 <> x23 `compare` y23 <> x24 `compare` y24 <> x25 `compare` y25 <> x26 `compare` y26 <> x27 `compare` y27 <> x28 `compare` y28 <> x29 `compare` y29 <> x30 `compare` y30 <> x31 `compare` y31 <> x32 `compare` y32
instance Show Int16X32 where
showsPrec _ a s = case unpackInt16X32 a of
(x1, x2, x3, x4, x5, x6, x7, x8, x9, x10, x11, x12, x13, x14, x15, x16, x17, x18, x19, x20, x21, x22, x23, x24, x25, x26, x27, x28, x29, x30, x31, x32) -> "Int16X32 (" ++ shows x1 (", " ++ shows x2 (", " ++ shows x3 (", " ++ shows x4 (", " ++ shows x5 (", " ++ shows x6 (", " ++ shows x7 (", " ++ shows x8 (", " ++ shows x9 (", " ++ shows x10 (", " ++ shows x11 (", " ++ shows x12 (", " ++ shows x13 (", " ++ shows x14 (", " ++ shows x15 (", " ++ shows x16 (", " ++ shows x17 (", " ++ shows x18 (", " ++ shows x19 (", " ++ shows x20 (", " ++ shows x21 (", " ++ shows x22 (", " ++ shows x23 (", " ++ shows x24 (", " ++ shows x25 (", " ++ shows x26 (", " ++ shows x27 (", " ++ shows x28 (", " ++ shows x29 (", " ++ shows x30 (", " ++ shows x31 (", " ++ shows x32 (")" ++ s))))))))))))))))))))))))))))))))
instance Num Int16X32 where
(+) = plusInt16X32
() = minusInt16X32
(*) = timesInt16X32
negate = negateInt16X32
abs = mapVector abs'
signum = mapVector signum'
fromInteger = broadcastVector . fromInteger
instance Bounded Int16X32 where
minBound = broadcastVector minBound
maxBound = broadcastVector maxBound
instance Storable Int16X32 where
sizeOf x = vectorSize x * elementSize x
alignment = sizeOf
peek (Ptr a) = readOffAddr (Addr a) 0
poke (Ptr a) = writeOffAddr (Addr a) 0
instance SIMDVector Int16X32 where
type Elem Int16X32 = Int16
type ElemTuple Int16X32 = (Int16, Int16, Int16, Int16, Int16, Int16, Int16, Int16, Int16, Int16, Int16, Int16, Int16, Int16, Int16, Int16, Int16, Int16, Int16, Int16, Int16, Int16, Int16, Int16, Int16, Int16, Int16, Int16, Int16, Int16, Int16, Int16)
nullVector = broadcastVector 0
vectorSize _ = 32
elementSize _ = 2
broadcastVector = broadcastInt16X32
unsafeInsertVector = unsafeInsertInt16X32
packVector = packInt16X32
unpackVector = unpackInt16X32
mapVector = mapInt16X32
zipVector = zipInt16X32
foldVector = foldInt16X32
sumVector = sumInt16X32
instance SIMDIntVector Int16X32 where
quotVector = quotInt16X32
remVector = remInt16X32
instance Prim Int16X32 where
sizeOf# a = let !(I# x) = sizeOf a in x
alignment# a = let !(I# x) = alignment a in x
indexByteArray# ba i = indexInt16X32Array (ByteArray ba) (I# i)
readByteArray# mba i s = let (ST r) = readInt16X32Array (MutableByteArray mba) (I# i) in r s
writeByteArray# mba i v s = let (ST r) = writeInt16X32Array (MutableByteArray mba) (I# i) v in case r s of { (# s', _ #) -> s' }
setByteArray# mba off n v s = let (ST r) = setByteArrayGeneric (MutableByteArray mba) (I# off) (I# n) v in case r s of { (# s', _ #) -> s' }
indexOffAddr# addr i = indexInt16X32OffAddr (Addr addr) (I# i)
readOffAddr# addr i s = let (ST r) = readInt16X32OffAddr (Addr addr) (I# i) in r s
writeOffAddr# addr i v s = let (ST r) = writeInt16X32OffAddr (Addr addr) (I# i) v in case r s of { (# s', _ #) -> s' }
setOffAddr# addr off n v s = let (ST r) = setOffAddrGeneric (Addr addr) (I# off) (I# n) v in case r s of { (# s', _ #) -> s' }
newtype instance UV.Vector Int16X32 = V_Int16X32 (PV.Vector Int16X32)
newtype instance UV.MVector s Int16X32 = MV_Int16X32 (PMV.MVector s Int16X32)
instance Vector UV.Vector Int16X32 where
basicUnsafeFreeze (MV_Int16X32 v) = V_Int16X32 <$> PV.unsafeFreeze v
basicUnsafeThaw (V_Int16X32 v) = MV_Int16X32 <$> PV.unsafeThaw v
basicLength (V_Int16X32 v) = PV.length v
basicUnsafeSlice start len (V_Int16X32 v) = V_Int16X32(PV.unsafeSlice start len v)
basicUnsafeIndexM (V_Int16X32 v) = PV.unsafeIndexM v
basicUnsafeCopy (MV_Int16X32 m) (V_Int16X32 v) = PV.unsafeCopy m v
elemseq _ = seq
instance MVector UV.MVector Int16X32 where
basicLength (MV_Int16X32 v) = PMV.length v
basicUnsafeSlice start len (MV_Int16X32 v) = MV_Int16X32(PMV.unsafeSlice start len v)
basicOverlaps (MV_Int16X32 v) (MV_Int16X32 w) = PMV.overlaps v w
basicUnsafeNew len = MV_Int16X32 <$> PMV.unsafeNew len
#if MIN_VERSION_vector(0,11,0)
basicInitialize (MV_Int16X32 v) = basicInitialize v
#endif
basicUnsafeRead (MV_Int16X32 v) = PMV.unsafeRead v
basicUnsafeWrite (MV_Int16X32 v) = PMV.unsafeWrite v
instance Unbox Int16X32
broadcastInt16X32 :: Int16 -> Int16X32
broadcastInt16X32 (I16# x) = case broadcastInt16X8# x of
v -> Int16X32 v v v v
packInt16X32 :: (Int16, Int16, Int16, Int16, Int16, Int16, Int16, Int16, Int16, Int16, Int16, Int16, Int16, Int16, Int16, Int16, Int16, Int16, Int16, Int16, Int16, Int16, Int16, Int16, Int16, Int16, Int16, Int16, Int16, Int16, Int16, Int16) -> Int16X32
packInt16X32 (I16# x1, I16# x2, I16# x3, I16# x4, I16# x5, I16# x6, I16# x7, I16# x8, I16# x9, I16# x10, I16# x11, I16# x12, I16# x13, I16# x14, I16# x15, I16# x16, I16# x17, I16# x18, I16# x19, I16# x20, I16# x21, I16# x22, I16# x23, I16# x24, I16# x25, I16# x26, I16# x27, I16# x28, I16# x29, I16# x30, I16# x31, I16# x32) = Int16X32 (packInt16X8# (# x1, x2, x3, x4, x5, x6, x7, x8 #)) (packInt16X8# (# x9, x10, x11, x12, x13, x14, x15, x16 #)) (packInt16X8# (# x17, x18, x19, x20, x21, x22, x23, x24 #)) (packInt16X8# (# x25, x26, x27, x28, x29, x30, x31, x32 #))
unpackInt16X32 :: Int16X32 -> (Int16, Int16, Int16, Int16, Int16, Int16, Int16, Int16, Int16, Int16, Int16, Int16, Int16, Int16, Int16, Int16, Int16, Int16, Int16, Int16, Int16, Int16, Int16, Int16, Int16, Int16, Int16, Int16, Int16, Int16, Int16, Int16)
unpackInt16X32 (Int16X32 m1 m2 m3 m4) = case unpackInt16X8# m1 of
(# x1, x2, x3, x4, x5, x6, x7, x8 #) -> case unpackInt16X8# m2 of
(# x9, x10, x11, x12, x13, x14, x15, x16 #) -> case unpackInt16X8# m3 of
(# x17, x18, x19, x20, x21, x22, x23, x24 #) -> case unpackInt16X8# m4 of
(# x25, x26, x27, x28, x29, x30, x31, x32 #) -> (I16# x1, I16# x2, I16# x3, I16# x4, I16# x5, I16# x6, I16# x7, I16# x8, I16# x9, I16# x10, I16# x11, I16# x12, I16# x13, I16# x14, I16# x15, I16# x16, I16# x17, I16# x18, I16# x19, I16# x20, I16# x21, I16# x22, I16# x23, I16# x24, I16# x25, I16# x26, I16# x27, I16# x28, I16# x29, I16# x30, I16# x31, I16# x32)
unsafeInsertInt16X32 :: Int16X32 -> Int16 -> Int -> Int16X32
unsafeInsertInt16X32 (Int16X32 m1 m2 m3 m4) (I16# y) _i@(I# ip) | _i < 8 = Int16X32 (insertInt16X8# m1 y (ip -# 0#)) m2 m3 m4
| _i < 16 = Int16X32 m1 (insertInt16X8# m2 y (ip -# 8#)) m3 m4
| _i < 24 = Int16X32 m1 m2 (insertInt16X8# m3 y (ip -# 16#)) m4
| otherwise = Int16X32 m1 m2 m3 (insertInt16X8# m4 y (ip -# 24#))
mapInt16X32 :: (Int16 -> Int16) -> Int16X32 -> Int16X32
mapInt16X32 f = mapInt16X32# (\ x -> case f (I16# x) of { I16# y -> y})
mapInt16X32# :: (Int# -> Int#) -> Int16X32 -> Int16X32
mapInt16X32# f = \ v -> case unpackInt16X32 v of
(I16# x1, I16# x2, I16# x3, I16# x4, I16# x5, I16# x6, I16# x7, I16# x8, I16# x9, I16# x10, I16# x11, I16# x12, I16# x13, I16# x14, I16# x15, I16# x16, I16# x17, I16# x18, I16# x19, I16# x20, I16# x21, I16# x22, I16# x23, I16# x24, I16# x25, I16# x26, I16# x27, I16# x28, I16# x29, I16# x30, I16# x31, I16# x32) -> packInt16X32 (I16# (f x1), I16# (f x2), I16# (f x3), I16# (f x4), I16# (f x5), I16# (f x6), I16# (f x7), I16# (f x8), I16# (f x9), I16# (f x10), I16# (f x11), I16# (f x12), I16# (f x13), I16# (f x14), I16# (f x15), I16# (f x16), I16# (f x17), I16# (f x18), I16# (f x19), I16# (f x20), I16# (f x21), I16# (f x22), I16# (f x23), I16# (f x24), I16# (f x25), I16# (f x26), I16# (f x27), I16# (f x28), I16# (f x29), I16# (f x30), I16# (f x31), I16# (f x32))
zipInt16X32 :: (Int16 -> Int16 -> Int16) -> Int16X32 -> Int16X32 -> Int16X32
zipInt16X32 f = \ v1 v2 -> case unpackInt16X32 v1 of
(x1, x2, x3, x4, x5, x6, x7, x8, x9, x10, x11, x12, x13, x14, x15, x16, x17, x18, x19, x20, x21, x22, x23, x24, x25, x26, x27, x28, x29, x30, x31, x32) -> case unpackInt16X32 v2 of
(y1, y2, y3, y4, y5, y6, y7, y8, y9, y10, y11, y12, y13, y14, y15, y16, y17, y18, y19, y20, y21, y22, y23, y24, y25, y26, y27, y28, y29, y30, y31, y32) -> packInt16X32 (f x1 y1, f x2 y2, f x3 y3, f x4 y4, f x5 y5, f x6 y6, f x7 y7, f x8 y8, f x9 y9, f x10 y10, f x11 y11, f x12 y12, f x13 y13, f x14 y14, f x15 y15, f x16 y16, f x17 y17, f x18 y18, f x19 y19, f x20 y20, f x21 y21, f x22 y22, f x23 y23, f x24 y24, f x25 y25, f x26 y26, f x27 y27, f x28 y28, f x29 y29, f x30 y30, f x31 y31, f x32 y32)
foldInt16X32 :: (Int16 -> Int16 -> Int16) -> Int16X32 -> Int16
foldInt16X32 f' = \ v -> case unpackInt16X32 v of
(x1, x2, x3, x4, x5, x6, x7, x8, x9, x10, x11, x12, x13, x14, x15, x16, x17, x18, x19, x20, x21, x22, x23, x24, x25, x26, x27, x28, x29, x30, x31, x32) -> x1 `f` x2 `f` x3 `f` x4 `f` x5 `f` x6 `f` x7 `f` x8 `f` x9 `f` x10 `f` x11 `f` x12 `f` x13 `f` x14 `f` x15 `f` x16 `f` x17 `f` x18 `f` x19 `f` x20 `f` x21 `f` x22 `f` x23 `f` x24 `f` x25 `f` x26 `f` x27 `f` x28 `f` x29 `f` x30 `f` x31 `f` x32
where f !x !y = f' x y
sumInt16X32 :: Int16X32 -> Int16
sumInt16X32 (Int16X32 x1 x2 x3 x4) = case unpackInt16X8# (plusInt16X8# x1 (plusInt16X8# x2 (plusInt16X8# x3 x4))) of
(# y1, y2, y3, y4, y5, y6, y7, y8 #) -> I16# y1 + I16# y2 + I16# y3 + I16# y4 + I16# y5 + I16# y6 + I16# y7 + I16# y8
plusInt16X32 :: Int16X32 -> Int16X32 -> Int16X32
plusInt16X32 (Int16X32 m1_1 m2_1 m3_1 m4_1) (Int16X32 m1_2 m2_2 m3_2 m4_2) = Int16X32 (plusInt16X8# m1_1 m1_2) (plusInt16X8# m2_1 m2_2) (plusInt16X8# m3_1 m3_2) (plusInt16X8# m4_1 m4_2)
minusInt16X32 :: Int16X32 -> Int16X32 -> Int16X32
minusInt16X32 (Int16X32 m1_1 m2_1 m3_1 m4_1) (Int16X32 m1_2 m2_2 m3_2 m4_2) = Int16X32 (minusInt16X8# m1_1 m1_2) (minusInt16X8# m2_1 m2_2) (minusInt16X8# m3_1 m3_2) (minusInt16X8# m4_1 m4_2)
timesInt16X32 :: Int16X32 -> Int16X32 -> Int16X32
timesInt16X32 (Int16X32 m1_1 m2_1 m3_1 m4_1) (Int16X32 m1_2 m2_2 m3_2 m4_2) = Int16X32 (timesInt16X8# m1_1 m1_2) (timesInt16X8# m2_1 m2_2) (timesInt16X8# m3_1 m3_2) (timesInt16X8# m4_1 m4_2)
quotInt16X32 :: Int16X32 -> Int16X32 -> Int16X32
quotInt16X32 (Int16X32 m1_1 m2_1 m3_1 m4_1) (Int16X32 m1_2 m2_2 m3_2 m4_2) = Int16X32 (quotInt16X8# m1_1 m1_2) (quotInt16X8# m2_1 m2_2) (quotInt16X8# m3_1 m3_2) (quotInt16X8# m4_1 m4_2)
remInt16X32 :: Int16X32 -> Int16X32 -> Int16X32
remInt16X32 (Int16X32 m1_1 m2_1 m3_1 m4_1) (Int16X32 m1_2 m2_2 m3_2 m4_2) = Int16X32 (remInt16X8# m1_1 m1_2) (remInt16X8# m2_1 m2_2) (remInt16X8# m3_1 m3_2) (remInt16X8# m4_1 m4_2)
negateInt16X32 :: Int16X32 -> Int16X32
negateInt16X32 (Int16X32 m1_1 m2_1 m3_1 m4_1) = Int16X32 (negateInt16X8# m1_1) (negateInt16X8# m2_1) (negateInt16X8# m3_1) (negateInt16X8# m4_1)
indexInt16X32Array :: ByteArray -> Int -> Int16X32
indexInt16X32Array (ByteArray a) (I# i) = Int16X32 (indexInt16X8Array# a ((i *# 4#) +# 0#)) (indexInt16X8Array# a ((i *# 4#) +# 1#)) (indexInt16X8Array# a ((i *# 4#) +# 2#)) (indexInt16X8Array# a ((i *# 4#) +# 3#))
readInt16X32Array :: PrimMonad m => MutableByteArray (PrimState m) -> Int -> m Int16X32
readInt16X32Array (MutableByteArray a) (I# i) = primitive (\ s0 -> case readInt16X8Array# a ((i *# 4#) +# 0#) s0 of
(# s1, m1 #) -> case readInt16X8Array# a ((i *# 4#) +# 1#) s1 of
(# s2, m2 #) -> case readInt16X8Array# a ((i *# 4#) +# 2#) s2 of
(# s3, m3 #) -> case readInt16X8Array# a ((i *# 4#) +# 3#) s3 of
(# s4, m4 #) -> (# s4, Int16X32 m1 m2 m3 m4 #))
writeInt16X32Array :: PrimMonad m => MutableByteArray (PrimState m) -> Int -> Int16X32 -> m ()
writeInt16X32Array (MutableByteArray a) (I# i) (Int16X32 m1 m2 m3 m4) = primitive_ (writeInt16X8Array# a ((i *# 4#) +# 0#) m1) >> primitive_ (writeInt16X8Array# a ((i *# 4#) +# 1#) m2) >> primitive_ (writeInt16X8Array# a ((i *# 4#) +# 2#) m3) >> primitive_ (writeInt16X8Array# a ((i *# 4#) +# 3#) m4)
indexInt16X32OffAddr :: Addr -> Int -> Int16X32
indexInt16X32OffAddr (Addr a) (I# i) = Int16X32 (indexInt16X8OffAddr# (plusAddr# a ((i *# 64#) +# 0#)) 0#) (indexInt16X8OffAddr# (plusAddr# a ((i *# 64#) +# 16#)) 0#) (indexInt16X8OffAddr# (plusAddr# a ((i *# 64#) +# 32#)) 0#) (indexInt16X8OffAddr# (plusAddr# a ((i *# 64#) +# 48#)) 0#)
readInt16X32OffAddr :: PrimMonad m => Addr -> Int -> m Int16X32
readInt16X32OffAddr (Addr a) (I# i) = primitive (\ s0 -> case (\ addr i' -> readInt16X8OffAddr# (plusAddr# addr i') 0#) a ((i *# 64#) +# 0#) s0 of
(# s1, m1 #) -> case (\ addr i' -> readInt16X8OffAddr# (plusAddr# addr i') 0#) a ((i *# 64#) +# 16#) s1 of
(# s2, m2 #) -> case (\ addr i' -> readInt16X8OffAddr# (plusAddr# addr i') 0#) a ((i *# 64#) +# 32#) s2 of
(# s3, m3 #) -> case (\ addr i' -> readInt16X8OffAddr# (plusAddr# addr i') 0#) a ((i *# 64#) +# 48#) s3 of
(# s4, m4 #) -> (# s4, Int16X32 m1 m2 m3 m4 #))
writeInt16X32OffAddr :: PrimMonad m => Addr -> Int -> Int16X32 -> m ()
writeInt16X32OffAddr (Addr a) (I# i) (Int16X32 m1 m2 m3 m4) = primitive_ (writeInt16X8OffAddr# (plusAddr# a ((i *# 64#) +# 0#)) 0# m1) >> primitive_ (writeInt16X8OffAddr# (plusAddr# a ((i *# 64#) +# 16#)) 0# m2) >> primitive_ (writeInt16X8OffAddr# (plusAddr# a ((i *# 64#) +# 32#)) 0# m3) >> primitive_ (writeInt16X8OffAddr# (plusAddr# a ((i *# 64#) +# 48#)) 0# m4)