module CodeGen.X86.CodeGen where
import Numeric
import Data.Monoid
import qualified Data.Vector as V
import Data.Bits
import Data.Int
import Data.Word
import Control.Arrow
import Control.Monad.Reader
import Control.Monad.Writer
import Control.Monad.State
import Debug.Trace
import CodeGen.X86.Asm
takes [] _ = []
takes (i: is) xs = take i xs: takes is (drop i xs)
iff b a = if b then a else mempty
indicator :: Integral a => Bool -> a
indicator False = 0x0
indicator True = 0x1
pattern FJust a = First (Just a)
pattern FNothing = First Nothing
pattern Integral xs <- (toIntegralSized -> Just xs)
data SReg where
SReg :: IsSize s => Reg s -> SReg
phisicalReg :: SReg -> Reg S64
phisicalReg (SReg (HighReg x)) = NormalReg x
phisicalReg (SReg (NormalReg x)) = NormalReg x
isHigh (SReg HighReg{}) = True
isHigh _ = False
regs :: forall s k . IsSize s => Operand s k -> [SReg]
regs = \case
MemOp (Addr r _ i) -> foldMap (pure . SReg) r ++ foldMap (pure . SReg . snd) i
RegOp r -> [SReg r]
_ -> mempty
isRex (SReg x@(NormalReg r)) = r .&. 0x8 /= 0 || size x == S8 && r `shiftR` 2 == 1
isRex _ = False
noHighRex r = not $ any isHigh r && any isRex r
convertImm :: Bool -> Size -> Operand s k -> First ((Bool, Size), Bytes)
convertImm a b c = (,) (a, b) <$> g a b c
where
g :: Bool -> Size -> Operand s k -> First Bytes
g False S64 (ImmOp w) = toBytes <$> (f w :: First Word64)
g False S32 (ImmOp w) = toBytes <$> (f w :: First Word32)
g False S16 (ImmOp w) = toBytes <$> (f w :: First Word16)
g False S8 (ImmOp w) = toBytes <$> (f w :: First Word8)
g True S64 (ImmOp w) = toBytes <$> (f w :: First Int64)
g True S32 (ImmOp w) = toBytes <$> (f w :: First Int32)
g True S16 (ImmOp w) = toBytes <$> (f w :: First Int16)
g True S8 (ImmOp w) = toBytes <$> (f w :: First Int8)
g _ _ _ = FNothing
f = First . toIntegralSized
mkImmS = convertImm True
mkImm = convertImm False
mkImmNo64 s = mkImmS (no64 s)
no64 S64 = S32
no64 s = s
newtype CodeBuilder = CodeBuilder {buildCode :: CodeBuilderState -> ([Either Int (Int, Word8)], CodeBuilderState)}
type CodeBuilderState = (Int, [Either [(Size, Int, Int)] Int])
instance Monoid CodeBuilder where
mempty = CodeBuilder $ (,) mempty
f `mappend` g = CodeBuilder $ \(buildCode f -> (a, buildCode g -> (b, st))) -> (a ++ b, st)
codeByte :: Word8 -> CodeBuilder
codeByte c = CodeBuilder $ \(n, labs) -> ([Right (n, c)], (n + 1, labs))
mkRef :: Size -> Int -> Int -> CodeBuilder
mkRef s sc bs = CodeBuilder f
where
f (n, labs) | bs >= length labs = trace "warning: missing scope" (mempty, (n + sizeLen s, labs))
f (n, labs) = case labs !! bs of
Right i -> (Right <$> zip [n..] z, (n + sizeLen s, labs))
where
vx = i n sc
z = getBytes $ case s of
S8 -> toBytes (fromIntegral vx :: Int8)
S32 -> toBytes (fromIntegral vx :: Int32)
Left cs -> (mempty, (n + sizeLen s, labs'))
where
labs' = take bs labs ++ Left ((s, n, n sc): cs): drop (bs + 1) labs
instance Show Code where
show c = unlines $ zipWith3 showLine is (takes (zipWith () (tail is ++ [s]) is) bs) ss
where
ss = snd . runWriter . flip evalStateT 0 . flip runReaderT [] . showCode $ c
(x, s) = second fst $ buildCode (mkCodeBuilder c) (0, replicate 10 $ Left [])
bs = V.toList $ V.replicate s 0 V.// [p | Right p <- x]
is = [i | Left i <- x]
showLine addr [] s = s
showLine addr bs s = [showNibble i addr | i <- [5,4..0]] ++ " " ++ pad (2 * maxbytes) (concatMap showByte bs) ++ " " ++ s
pad i xs = xs ++ replicate (i length xs) ' '
maxbytes = 12
codeBytes c = Bytes $ V.toList $ V.replicate s 0 V.// [p | Right p <- x]
where
(x, s) = buildTheCode c
buildTheCode x = second fst $ buildCode (mkCodeBuilder x) (0, [])
mkCodeBuilder :: Code -> CodeBuilder
mkCodeBuilder = \case
EmptyCode -> mempty
AppendCode a b -> mkCodeBuilder a <> mkCodeBuilder b
Up a -> CodeBuilder $ \(n, x: xs) -> second (second (x:)) $ buildCode (mkCodeBuilder a) (n, xs)
Scope x -> CodeBuilder begin <> mkCodeBuilder x <> CodeBuilder end
where
begin (n, labs) = (mempty, (n, Left []: labs))
end (n, Right _: labs) = (mempty, (n, labs))
end (n, _: labs) = trace "warning: missing label" (mempty, (n, labs))
x -> CodeBuilder $ \st@(addr, _) -> first (Left addr:) $ buildCode (mkCodeBuilder' x) st
mkCodeBuilder' :: Code -> CodeBuilder
mkCodeBuilder' = \case
Add a b -> op2 0x0 a b
Or a b -> op2 0x1 a b
Adc a b -> op2 0x2 a b
Sbb a b -> op2 0x3 a b
And a b -> op2 0x4 a b
Sub a b -> op2 0x5 a b
Xor a b -> op2 0x6 a b
Cmp a b -> op2 0x7 a b
Rol a b -> shiftOp 0x0 a b
Ror a b -> shiftOp 0x1 a b
Rcl a b -> shiftOp 0x2 a b
Rcr a b -> shiftOp 0x3 a b
Shl a b -> shiftOp 0x4 a b
Shr a b -> shiftOp 0x5 a b
Sar a b -> shiftOp 0x7 a b
Xchg x@RegA r -> xchg_a r
Xchg r x@RegA -> xchg_a r
Xchg dest src -> op2' 0x43 dest' src
where
(dest', src') = if isMemOp src then (src, dest) else (dest, src)
Test dest (mkImmNo64 (size dest) -> FJust (_, im)) -> case dest of
RegA -> regprefix'' dest 0x54 mempty im
_ -> regprefix'' dest 0x7b (reg8 0x0 dest) im
Test dest (noImm "" -> src) -> op2' 0x42 dest' src'
where
(dest', src') = if isMemOp src then (src, dest) else (dest, src)
Mov dest@(RegOp r) ((if size dest == S64 then mkImm S32 <> mkImmS S32 <> mkImmS S64 else mkImmS (size dest)) -> FJust ((se, si), im))
| (se, si, size dest) /= (True, S32, S64) -> regprefix si dest (oneReg (0x16 .|. indicator (size dest /= S8)) r) im
| otherwise -> regprefix'' dest 0x63 (reg8 0x0 dest) im
Mov dest@(size -> s) (mkImmNo64 s -> FJust (_, im)) -> regprefix'' dest 0x63 (reg8 0x0 dest) im
Mov dest src -> op2' 0x44 dest $ noImm (show (dest, src)) src
Lea dest@(RegOp r) src | size dest /= S8 -> regprefix2 (resizeOperand' dest src) dest 0x46 $ reg8 (reg8_ r) src
where
resizeOperand' :: IsSize s1 => Operand s1 x -> Operand s2 RW -> Operand s1 RW
resizeOperand' _ = resizeOperand
Not a -> op1 0x7b 0x2 a
Neg a -> op1 0x7b 0x3 a
Inc a -> op1 0x7f 0x0 a
Dec a -> op1 0x7f 0x1 a
Call a -> op1' 0xff 0x2 a
Pop dest@(RegOp r) -> regprefix S32 dest (oneReg 0x0b r) mempty
Pop dest -> regprefix S32 dest (codeByte 0x8f <> reg8 0x0 dest) mempty
Push (mkImmS S8 -> FJust (_, im)) -> codeByte 0x6a <> bytesToCode im
Push (mkImmS S32 -> FJust (_, im)) -> codeByte 0x68 <> bytesToCode im
Push dest@(RegOp r) -> regprefix S32 dest (oneReg 0x0a r) mempty
Push dest -> regprefix S32 dest (codeByte 0xff <> reg8 0x6 dest) mempty
Ret -> codeByte 0xc3
Nop -> codeByte 0x90
PushF -> codeByte 0x9c
PopF -> codeByte 0x9d
Cmc -> codeByte 0xf5
Clc -> codeByte 0xf8
Stc -> codeByte 0xf9
Cli -> codeByte 0xfa
Sti -> codeByte 0xfb
Cld -> codeByte 0xfc
Std -> codeByte 0xfd
J (Condition c) -> codeByte (0x70 .|. c) <> mkRef S8 1 0
Jmp -> codeByte 0xeb <> mkRef S8 1 0
Label -> CodeBuilder lab
where
lab (n, labs) = (Right <$> concatMap g corr, (n, labs'))
where
(corr, labs') = replL (Right n) labs
g (size, p, v) = zip [p..] $ getBytes $ case (size, v + n) of
(S8, Integral v) -> toBytes (v :: Int8)
(S32, Integral v) -> toBytes (v :: Int32)
replL x (Left z: zs) = (z, x: zs)
replL x (z: zs) = second (z:) $ replL x zs
Data cs -> CodeBuilder $ \(n, labs) -> (Right <$> zip [n..] (getBytes cs), (n + bytesCount cs, labs))
Align s -> CodeBuilder $ \(n, labs) -> let
j = fromIntegral $ (fromIntegral n 1 :: Int64) .|. f s + 1
in (Right <$> zip [n..] (replicate j 0x90), (n + j, labs))
where
f s = sizeLen s 1
where
xchg_a dest@(RegOp r) | size dest /= S8 = regprefix (size dest) dest (oneReg 0x12 r) mempty
xchg_a dest = regprefix'' dest 0x43 (reg8 0x0 dest) mempty
bytesToCode = mkCodeBuilder' . Data
toCode = bytesToCode . toBytes
sizePrefix_ rs s r x c im
| noHighRex rs = pre <> c <> displacement r <> bytesToCode im
| otherwise = error "cannot use high register in rex instruction"
where
pre = case s of
S8 -> mem32pre r <> iff (any isRex rs || x /= 0) (prefix40_ x)
S16 -> codeByte 0x66 <> mem32pre r <> prefix40 x
S32 -> mem32pre r <> prefix40 x
S64 -> mem32pre r <> prefix40 (0x8 .|. x)
mem32pre :: Operand s k -> CodeBuilder
mem32pre (MemOp r@Addr{}) | size r == S32 = codeByte 0x67
mem32pre _ = mempty
prefix40 x = iff (x /= 0) $ prefix40_ x
prefix40_ x = codeByte $ 0x40 .|. x
displacement :: Operand s a -> CodeBuilder
displacement RegOp{} = mempty
displacement (IPMemOp (Immediate d)) = toCode d
displacement (IPMemOp (LabelRelAddr d)) = mkRef S32 (4 + fromIntegral (bytesCount im)) d
displacement (MemOp (Addr b d i)) = mkSIB b i <> dispVal b d
where
mkSIB _ (IndexReg s (NormalReg 0x4)) = error "sp cannot be used as index"
mkSIB _ (IndexReg s i) = f s $ reg8_ i
mkSIB Nothing _ = f s1 0x4
mkSIB (Just (reg8_ -> 0x4)) _ = f s1 0x4
mkSIB _ _ = mempty
f (Scale s) i = codeByte $ s `shiftL` 6 .|. i `shiftL` 3 .|. maybe 0x5 reg8_ b
dispVal Just{} (Disp (Integral (d :: Int8))) = toCode d
dispVal _ (Disp d) = toCode d
dispVal Nothing _ = toCode (0 :: Int32)
dispVal (Just (reg8_ -> 0x5)) _ = codeByte 0
dispVal _ _ = mempty
reg8_ (NormalReg r) = r .&. 0x7
reg8_ (HighReg r) = r .|. 0x4
regprefix s r c im = sizePrefix_ (regs r) s r (extbits r) c im
regprefix2 r r' p c = sizePrefix_ (regs r <> regs r') (size r) r (extbits r' `shiftL` 2 .|. extbits r) (extension r p <> c) mempty
regprefix'' r p c = regprefix (size r) r $ extension r p <> c
extension x p = codeByte $ p `shiftL` 1 .|. indicator (size x /= S8)
extbits :: Operand s a -> Word8
extbits = \case
MemOp (Addr b _ i) -> maybe 0 indexReg b .|. maybe 0 ((`shiftL` 1) . indexReg . snd) i
RegOp r -> indexReg r
IPMemOp{} -> 0
where
indexReg (NormalReg r) = r `shiftR` 3 .&. 1
indexReg _ = 0
reg8 :: Word8 -> Operand s a -> CodeBuilder
reg8 w x = codeByte $ operMode x `shiftL` 6 .|. w `shiftL` 3 .|. rc x
where
operMode :: Operand s a -> Word8
operMode (MemOp (Addr (Just (reg8_ -> 0x5)) NoDisp _)) = 0x1
operMode (MemOp (Addr Nothing _ _)) = 0x0
operMode (MemOp (Addr _ NoDisp _)) = 0x0
operMode (MemOp (Addr _ (Disp (Integral (_ :: Int8))) _)) = 0x1
operMode (MemOp (Addr _ Disp{} _)) = 0x2
operMode IPMemOp{} = 0x0
operMode RegOp{} = 0x3
rc :: Operand s a -> Word8
rc (MemOp (Addr (Just r) _ NoIndex)) = reg8_ r
rc MemOp{} = 0x04
rc IPMemOp{} = 0x05
rc (RegOp r) = reg8_ r
notA8 dest@RegA = False
notA8 dest = size dest == S8
op2 :: IsSize s => Word8 -> Operand s RW -> Operand s k -> CodeBuilder
op2 op dest@(notA8 -> True) (mkImmS S8 -> FJust (_, im))
= regprefix'' dest 0x40 (reg8 op dest) im
op2 op dest@RegA (mkImmNo64 (size dest) -> FJust (_, im))
= regprefix'' dest (op `shiftL` 2 .|. 0x2) mempty im
op2 op dest (mkImmS S8 <> mkImmNo64 (size dest) -> FJust ((_, k), im))
= regprefix'' dest (0x40 .|. indicator (k == S8)) (reg8 op dest) im
op2 op dest src = op2' (op `shiftL` 2) dest $ noImm "1" src
noImm :: String -> Operand s k -> Operand s RW
noImm _ (RegOp r) = RegOp r
noImm _ (MemOp a) = MemOp a
noImm _ (IPMemOp a) = IPMemOp a
noImm er _ = error $ "immediate value of this size is not supported: " ++ er
op2' :: IsSize s => Word8 -> Operand s RW -> Operand s RW -> CodeBuilder
op2' op dest src@RegOp{} = op2g op dest src
op2' op dest@RegOp{} src = op2g (op .|. 0x1) src dest
op2g op dest src@(RegOp r) = regprefix2 dest src op $ reg8 (reg8_ r) dest
op1_ r1 r2 dest im = regprefix'' dest r1 (reg8 r2 dest) im
op1 a b c = op1_ a b c mempty
op1' :: Word8 -> Word8 -> Operand S64 RW -> CodeBuilder
op1' r1 r2 dest = regprefix S32 dest (codeByte r1 <> reg8 r2 dest) mempty
shiftOp :: IsSize s => Word8 -> Operand s RW -> Operand S8 k -> CodeBuilder
shiftOp c dest (ImmOp 1) = op1 0x68 c dest
shiftOp c dest (mkImm S8 -> FJust (_, i)) = op1_ 0x60 c dest i
shiftOp c dest RegCl = op1 0x69 c dest
shiftOp _ _ _ = error "invalid shift operands"
oneReg x r = codeByte $ x `shiftL` 3 .|. reg8_ r