{-# LANGUAGE UnboxedTuples         #-}
{-# LANGUAGE MagicHash             #-}
{-# LANGUAGE TypeFamilies          #-}
{-# LANGUAGE DeriveDataTypeable    #-}
{-# LANGUAGE BangPatterns          #-}
{-# LANGUAGE MultiParamTypeClasses #-}
{-# LANGUAGE CPP                   #-}

#include "MachDeps.h"

module Data.Primitive.SIMD.Word64X4 (Word64X4) where

-- This code was AUTOMATICALLY generated, DO NOT EDIT!

import Data.Primitive.SIMD.Class

import GHC.Word
import GHC.Types
import GHC.Prim
import GHC.Ptr
import GHC.ST

import Foreign.Storable

import Control.Monad.Primitive

import Data.Primitive.Types
import Data.Primitive.ByteArray
import Data.Primitive.Addr
import Data.Monoid
import Data.Typeable

import qualified Data.Vector.Primitive as PV
import qualified Data.Vector.Primitive.Mutable as PMV
import Data.Vector.Unboxed (Unbox)
import qualified Data.Vector.Unboxed as UV
import Data.Vector.Generic (Vector(..))
import Data.Vector.Generic.Mutable (MVector(..))

#if WORD_SIZE_IN_BITS == 64
type RealWord64# = Word#
#elif WORD_SIZE_IN_BITS == 32
type RealWord64# = Word64#
#else
#error "WORD_SIZE_IN_BITS is neither 64 or 32"
#endif

-- ** Word64X4
data Word64X4 = Word64X4 Word64X2# Word64X2# deriving Typeable

abs' :: Word64 -> Word64
abs' (W64# x) = W64# (abs# x)

{-# INLINE abs# #-}
abs# :: RealWord64# -> RealWord64#
abs# x = case abs (W64# x) of
    W64# y -> y

signum' :: Word64 -> Word64
signum' (W64# x) = W64# (signum# x)

{-# NOINLINE signum# #-}
signum# :: RealWord64# -> RealWord64#
signum# x = case signum (W64# x) of
    W64# y -> y

instance Eq Word64X4 where
    a == b = case unpackWord64X4 a of
        (x1, x2, x3, x4) -> case unpackWord64X4 b of
            (y1, y2, y3, y4) -> x1 == y1 && x2 == y2 && x3 == y3 && x4 == y4

instance Ord Word64X4 where
    a `compare` b = case unpackWord64X4 a of
        (x1, x2, x3, x4) -> case unpackWord64X4 b of
            (y1, y2, y3, y4) -> x1 `compare` y1 <> x2 `compare` y2 <> x3 `compare` y3 <> x4 `compare` y4

instance Show Word64X4 where
    showsPrec _ a s = case unpackWord64X4 a of
        (x1, x2, x3, x4) -> "Word64X4 (" ++ shows x1 (", " ++ shows x2 (", " ++ shows x3 (", " ++ shows x4 (")" ++ s))))

instance Num Word64X4 where
    (+) = plusWord64X4
    (-) = minusWord64X4
    (*) = timesWord64X4
    negate = mapVector negate
    abs    = mapVector abs'
    signum = mapVector signum'
    fromInteger = broadcastVector . fromInteger

instance Bounded Word64X4 where
    minBound = broadcastVector minBound
    maxBound = broadcastVector maxBound

instance Storable Word64X4 where
    sizeOf x     = vectorSize x * elementSize x
    alignment    = sizeOf
    peek (Ptr a) = readOffAddr (Addr a) 0
    poke (Ptr a) = writeOffAddr (Addr a) 0

instance SIMDVector Word64X4 where
    type Elem Word64X4 = Word64
    type ElemTuple Word64X4 = (Word64, Word64, Word64, Word64)
    nullVector         = broadcastVector 0
    vectorSize  _      = 4
    elementSize _      = 8
    broadcastVector    = broadcastWord64X4
    unsafeInsertVector = unsafeInsertWord64X4
    packVector         = packWord64X4
    unpackVector       = unpackWord64X4
    mapVector          = mapWord64X4
    zipVector          = zipWord64X4
    foldVector         = foldWord64X4
    sumVector          = sumWord64X4

instance SIMDIntVector Word64X4 where
    quotVector = quotWord64X4
    remVector  = remWord64X4

instance Prim Word64X4 where
    sizeOf# a                   = let !(I# x) = sizeOf a in x
    alignment# a                = let !(I# x) = alignment a in x
    indexByteArray# ba i        = indexWord64X4Array (ByteArray ba) (I# i)
    readByteArray# mba i s      = let (ST r) = readWord64X4Array (MutableByteArray mba) (I# i) in r s
    writeByteArray# mba i v s   = let (ST r) = writeWord64X4Array (MutableByteArray mba) (I# i) v in case r s of { (# s', _ #) -> s' }
    setByteArray# mba off n v s = let (ST r) = setByteArrayGeneric (MutableByteArray mba) (I# off) (I# n) v in case r s of { (# s', _ #) -> s' }
    indexOffAddr# addr i        = indexWord64X4OffAddr (Addr addr) (I# i)
    readOffAddr# addr i s       = let (ST r) = readWord64X4OffAddr (Addr addr) (I# i) in r s
    writeOffAddr# addr i v s    = let (ST r) = writeWord64X4OffAddr (Addr addr) (I# i) v in case r s of { (# s', _ #) -> s' }
    setOffAddr# addr off n v s  = let (ST r) = setOffAddrGeneric (Addr addr) (I# off) (I# n) v in case r s of { (# s', _ #) -> s' }

newtype instance UV.Vector Word64X4 = V_Word64X4 (PV.Vector Word64X4)
newtype instance UV.MVector s Word64X4 = MV_Word64X4 (PMV.MVector s Word64X4)

instance Vector UV.Vector Word64X4 where
    basicUnsafeFreeze (MV_Word64X4 v) = V_Word64X4 <$> PV.unsafeFreeze v
    basicUnsafeThaw (V_Word64X4 v) = MV_Word64X4 <$> PV.unsafeThaw v
    basicLength (V_Word64X4 v) = PV.length v
    basicUnsafeSlice start len (V_Word64X4 v) = V_Word64X4(PV.unsafeSlice start len v)
    basicUnsafeIndexM (V_Word64X4 v) = PV.unsafeIndexM v
    basicUnsafeCopy (MV_Word64X4 m) (V_Word64X4 v) = PV.unsafeCopy m v
    elemseq _ = seq
    {-# INLINE basicUnsafeFreeze #-}
    {-# INLINE basicUnsafeThaw #-}
    {-# INLINE basicLength #-}
    {-# INLINE basicUnsafeSlice #-}
    {-# INLINE basicUnsafeIndexM #-}
    {-# INLINE basicUnsafeCopy #-}
    {-# INLINE elemseq #-}

instance MVector UV.MVector Word64X4 where
    basicLength (MV_Word64X4 v) = PMV.length v
    basicUnsafeSlice start len (MV_Word64X4 v) = MV_Word64X4(PMV.unsafeSlice start len v)
    basicOverlaps (MV_Word64X4 v) (MV_Word64X4 w) = PMV.overlaps v w
    basicUnsafeNew len = MV_Word64X4 <$> PMV.unsafeNew len
#if MIN_VERSION_vector(0,11,0)
    basicInitialize (MV_Word64X4 v) = basicInitialize v
#endif
    basicUnsafeRead (MV_Word64X4 v) = PMV.unsafeRead v
    basicUnsafeWrite (MV_Word64X4 v) = PMV.unsafeWrite v
    {-# INLINE basicLength #-}
    {-# INLINE basicUnsafeSlice #-}
    {-# INLINE basicOverlaps #-}
    {-# INLINE basicUnsafeNew #-}
    {-# INLINE basicUnsafeRead #-}
    {-# INLINE basicUnsafeWrite #-}

instance Unbox Word64X4

{-# INLINE broadcastWord64X4 #-}
-- | Broadcast a scalar to all elements of a vector.
broadcastWord64X4 :: Word64 -> Word64X4
broadcastWord64X4 (W64# x) = case broadcastWord64X2# x of
    v -> Word64X4 v v

{-# INLINE packWord64X4 #-}
-- | Pack the elements of a tuple into a vector.
packWord64X4 :: (Word64, Word64, Word64, Word64) -> Word64X4
packWord64X4 (W64# x1, W64# x2, W64# x3, W64# x4) = Word64X4 (packWord64X2# (# x1, x2 #)) (packWord64X2# (# x3, x4 #))

{-# INLINE unpackWord64X4 #-}
-- | Unpack the elements of a vector into a tuple.
unpackWord64X4 :: Word64X4 -> (Word64, Word64, Word64, Word64)
unpackWord64X4 (Word64X4 m1 m2) = case unpackWord64X2# m1 of
    (# x1, x2 #) -> case unpackWord64X2# m2 of
        (# x3, x4 #) -> (W64# x1, W64# x2, W64# x3, W64# x4)

{-# INLINE unsafeInsertWord64X4 #-}
-- | Insert a scalar at the given position (starting from 0) in a vector. If the index is outside of the range, the behavior is undefined.
unsafeInsertWord64X4 :: Word64X4 -> Word64 -> Int -> Word64X4
unsafeInsertWord64X4 (Word64X4 m1 m2) (W64# y) _i@(I# ip) | _i < 2 = Word64X4 (insertWord64X2# m1 y (ip -# 0#)) m2
                                                          | otherwise = Word64X4 m1 (insertWord64X2# m2 y (ip -# 2#))

{-# INLINE mapWord64X4 #-}
-- | Apply a function to each element of a vector (unpacks and repacks the vector)
mapWord64X4 :: (Word64 -> Word64) -> Word64X4 -> Word64X4
mapWord64X4 f = mapWord64X4# (\ x -> case f (W64# x) of { W64# y -> y})

{-# INLINE[0] mapWord64X4# #-}
-- | Unboxed helper function.
mapWord64X4# :: (RealWord64# -> RealWord64#) -> Word64X4 -> Word64X4
mapWord64X4# f = \ v -> case unpackWord64X4 v of
    (W64# x1, W64# x2, W64# x3, W64# x4) -> packWord64X4 (W64# (f x1), W64# (f x2), W64# (f x3), W64# (f x4))

{-# INLINE zipWord64X4 #-}
-- | Zip two vectors together using a combining function (unpacks and repacks the vectors)
zipWord64X4 :: (Word64 -> Word64 -> Word64) -> Word64X4 -> Word64X4 -> Word64X4
zipWord64X4 f = \ v1 v2 -> case unpackWord64X4 v1 of
    (x1, x2, x3, x4) -> case unpackWord64X4 v2 of
        (y1, y2, y3, y4) -> packWord64X4 (f x1 y1, f x2 y2, f x3 y3, f x4 y4)

{-# INLINE foldWord64X4 #-}
-- | Fold the elements of a vector to a single value
foldWord64X4 :: (Word64 -> Word64 -> Word64) -> Word64X4 -> Word64
foldWord64X4 f' = \ v -> case unpackWord64X4 v of
    (x1, x2, x3, x4) -> x1 `f` x2 `f` x3 `f` x4
    where f !x !y = f' x y

{-# INLINE sumWord64X4 #-}
-- | Sum up the elements of a vector to a single value.
sumWord64X4 :: Word64X4 -> Word64
sumWord64X4 (Word64X4 x1 x2) = case unpackWord64X2# (plusWord64X2# x1 x2) of
    (# y1, y2 #) -> W64# y1 + W64# y2

{-# INLINE plusWord64X4 #-}
-- | Add two vectors element-wise.
plusWord64X4 :: Word64X4 -> Word64X4 -> Word64X4
plusWord64X4 (Word64X4 m1_1 m2_1) (Word64X4 m1_2 m2_2) = Word64X4 (plusWord64X2# m1_1 m1_2) (plusWord64X2# m2_1 m2_2)

{-# INLINE minusWord64X4 #-}
-- | Subtract two vectors element-wise.
minusWord64X4 :: Word64X4 -> Word64X4 -> Word64X4
minusWord64X4 (Word64X4 m1_1 m2_1) (Word64X4 m1_2 m2_2) = Word64X4 (minusWord64X2# m1_1 m1_2) (minusWord64X2# m2_1 m2_2)

{-# INLINE timesWord64X4 #-}
-- | Multiply two vectors element-wise.
timesWord64X4 :: Word64X4 -> Word64X4 -> Word64X4
timesWord64X4 (Word64X4 m1_1 m2_1) (Word64X4 m1_2 m2_2) = Word64X4 (timesWord64X2# m1_1 m1_2) (timesWord64X2# m2_1 m2_2)

{-# INLINE quotWord64X4 #-}
-- | Rounds towards zero element-wise.
quotWord64X4 :: Word64X4 -> Word64X4 -> Word64X4
quotWord64X4 (Word64X4 m1_1 m2_1) (Word64X4 m1_2 m2_2) = Word64X4 (quotWord64X2# m1_1 m1_2) (quotWord64X2# m2_1 m2_2)

{-# INLINE remWord64X4 #-}
-- | Satisfies (quot x y) * y + (rem x y) == x.
remWord64X4 :: Word64X4 -> Word64X4 -> Word64X4
remWord64X4 (Word64X4 m1_1 m2_1) (Word64X4 m1_2 m2_2) = Word64X4 (remWord64X2# m1_1 m1_2) (remWord64X2# m2_1 m2_2)

{-# INLINE indexWord64X4Array #-}
-- | Read a vector from specified index of the immutable array.
indexWord64X4Array :: ByteArray -> Int -> Word64X4
indexWord64X4Array (ByteArray a) (I# i) = Word64X4 (indexWord64X2Array# a ((i *# 2#) +# 0#)) (indexWord64X2Array# a ((i *# 2#) +# 1#))

{-# INLINE readWord64X4Array #-}
-- | Read a vector from specified index of the mutable array.
readWord64X4Array :: PrimMonad m => MutableByteArray (PrimState m) -> Int -> m Word64X4
readWord64X4Array (MutableByteArray a) (I# i) = primitive (\ s0 -> case readWord64X2Array# a ((i *# 2#) +# 0#) s0 of
    (# s1, m1 #) -> case readWord64X2Array# a ((i *# 2#) +# 1#) s1 of
        (# s2, m2 #) -> (# s2, Word64X4 m1 m2 #))

{-# INLINE writeWord64X4Array #-}
-- | Write a vector to specified index of mutable array.
writeWord64X4Array :: PrimMonad m => MutableByteArray (PrimState m) -> Int -> Word64X4 -> m ()
writeWord64X4Array (MutableByteArray a) (I# i) (Word64X4 m1 m2) = primitive_ (writeWord64X2Array# a ((i *# 2#) +# 0#) m1) >> primitive_ (writeWord64X2Array# a ((i *# 2#) +# 1#) m2)

{-# INLINE indexWord64X4OffAddr #-}
-- | Reads vector from the specified index of the address.
indexWord64X4OffAddr :: Addr -> Int -> Word64X4
indexWord64X4OffAddr (Addr a) (I# i) = Word64X4 (indexWord64X2OffAddr# (plusAddr# a ((i *# 32#) +# 0#)) 0#) (indexWord64X2OffAddr# (plusAddr# a ((i *# 32#) +# 16#)) 0#)

{-# INLINE readWord64X4OffAddr #-}
-- | Reads vector from the specified index of the address.
readWord64X4OffAddr :: PrimMonad m => Addr -> Int -> m Word64X4
readWord64X4OffAddr (Addr a) (I# i) = primitive (\ s0 -> case (\ addr i' -> readWord64X2OffAddr# (plusAddr# addr i') 0#) a ((i *# 32#) +# 0#) s0 of
    (# s1, m1 #) -> case (\ addr i' -> readWord64X2OffAddr# (plusAddr# addr i') 0#) a ((i *# 32#) +# 16#) s1 of
        (# s2, m2 #) -> (# s2, Word64X4 m1 m2 #))

{-# INLINE writeWord64X4OffAddr #-}
-- | Write vector to the specified index of the address.
writeWord64X4OffAddr :: PrimMonad m => Addr -> Int -> Word64X4 -> m ()
writeWord64X4OffAddr (Addr a) (I# i) (Word64X4 m1 m2) = primitive_ (writeWord64X2OffAddr# (plusAddr# a ((i *# 32#) +# 0#)) 0# m1) >> primitive_ (writeWord64X2OffAddr# (plusAddr# a ((i *# 32#) +# 16#)) 0# m2)