-- -*- haskell -*-
--
-- Lexical syntax for illiterate Haskell 98.
--
-- (c) Simon Marlow 2003, with the caveat that much of this is
-- translated directly from the syntax in the Haskell 98 report.
--
-- This is an Alex specification. It produces a flat stream of 'Token's used
-- for syntax highlighting; it does not attempt to validate the program.
--

{
{-# OPTIONS -w #-}
module Yi.Lexer.Haskell ( initState, alexScanToken, tokenToStyle,
                          startsLayout, isComment, Token(..),
                          CommentType(..), ReservedType(..) ) where
import Yi.Lexer.Alex
import Yi.Style
}

-- Character classes -------------------------------------------------------

$whitechar = [\ \t\n\r\f\v]
$special   = [\(\)\,\;\[\]\`\{\}]

$ascdigit  = 0-9
$unidigit  = [] -- TODO
$digit     = [$ascdigit $unidigit]

$ascsymbol = [\!\#\$\%\&\*\+\.\/\<\=\>\?\@\\\^\|\-\~]
$unisymbol = [] -- TODO
$symbol    = [$ascsymbol $unisymbol] # [$special \_\:\"\']

$large     = [A-Z \xc0-\xd6 \xd8-\xde]
$small     = [a-z \xdf-\xf6 \xf8-\xff \_]
$alpha     = [$small $large]

$graphic   = [$small $large $symbol $digit $special \:\"\']

$octit     = 0-7
$hexit     = [0-9 A-F a-f]
$idchar    = [$alpha $digit \']
$symchar   = [$symbol \:]
$nl        = [\n\r]

-- Keywords and reserved operators -----------------------------------------

-- "where" and "deriving" are deliberately absent here: they have dedicated
-- rules below so that they get their own ReservedType.
@reservedid =
        as|case|class|data|default|else|hiding|if|
        import|in|infix|infixl|infixr|instance|module|newtype|
        qualified|then|type|forall|foreign|export|dynamic|
        safe|threadsafe|unsafe|stdcall|ccall|dotnet

-- Keywords that open a layout block (see startsLayout).
@layoutReservedId =
        of|let|do|mdo

@reservedop =
        ".." | ":" | "::" | "=" | \\ | "|" | "<-" | "->" | "@" | "~" | "=>"

-- Identifiers and operators -----------------------------------------------

@varid  = $small $idchar*
@conid  = $large $idchar*
@varsym = $symbol $symchar*
@consym = \: $symchar*

-- Numeric literals --------------------------------------------------------

@decimal     = $digit+
@octal       = $octit+
@hexadecimal = $hexit+
-- The sign of an exponent is optional in Haskell 98, so that both 1e10 and
-- 1e+10 are single numeric literals.
@exponent    = [eE] [\-\+]? @decimal

-- Character and string literals -------------------------------------------

$cntrl   = [$large \@\[\\\]\^\_]
@ascii   = \^ $cntrl | NUL | SOH | STX | ETX | EOT | ENQ | ACK
         | BEL | BS | HT | LF | VT | FF | CR | SO | SI | DLE
         | DC1 | DC2 | DC3 | DC4 | NAK | SYN | ETB | CAN | EM
         | SUB | ESC | FS | GS | RS | US | SP | DEL
$charesc = [abfnrtv\\\"\'\&]
@escape  = \\ ($charesc | @ascii | @decimal | o @octal | x @hexadecimal)
@gap     = \\ $whitechar+ \\
@string  = $graphic # [\"\\] | " " | @escape | @gap

haskell :-

<0> $white+                                     ;

-- Rules active inside a (possibly nested) block comment. The start code
-- name must be nestcomm because stateToInit below refers to it.
-- NOTE(review): m and c are not defined in this file; presumably m updates
-- the lexer state with the given function and c leaves it unchanged.
<nestcomm> {
  "{-"                                          { m (subtract 1) (Comment Open) }
  "-}"                                          { m (+1) (Comment Close) }
  $white+                                       ; -- whitespace
  [^\-\{]+                                      { c $ Comment Text } -- rule to generate comments larger than 1 char
  .                                             { c $ Comment Text }
}

<0> {
-- The first rule matches operators that begin with --, eg --++-- is a valid
-- operator and *not* a comment.
-- Note that we have to disallow '-' as a symbol char for the first one
-- of these because we may have -------- which would still just be the
-- start of a comment.
  "--"\-* [$symbol # \-] $symchar*              { c Operator }

-- The next rule allows for the start of a comment: basically it is --
-- followed by anything which isn't a symbol character
-- (OR more '-'s). So for example "-----:" is still the start of a comment.
  "--"~[$symbol # \-][^$nl]*                    { c $ Comment Line }

-- Finally, because the above rule had to add in a non-symbol character,
-- it's also possible that we have just finished a line;
-- people sometimes do this, for example, when breaking up paragraphs
-- in a long comment.
  "--"$nl                                       { c $ Comment Line }

  "{-"                                          { m (subtract 1) $ Comment Open }

-- $special matches exactly one character, so the match is non-empty and
-- head cannot fail here.
  $special                                      { \str st -> (st, Special (snd $ head str)) }

-- Keyword rules come before @varid: for equally long matches Alex picks the
-- earliest rule, so keywords win over plain identifiers.
  "deriving"                                    { c (Reserved Deriving) }
  @reservedid                                   { c (Reserved Other) }
  "where"                                       { c (Reserved Where) }
  @layoutReservedId                             { c (Reserved OtherLayout) }

  `@varid`                                      { c Operator }
  @varid                                        { c VarIdent }
  @conid                                        { c ConsIdent }

  @reservedop                                   { c Operator }
  @varsym                                       { c Operator }
  @consym                                       { c ConsOperator }

  @decimal
    | 0[oO] @octal
    | 0[xX] @hexadecimal                        { c Number }

  @decimal \. @decimal @exponent?
    | @decimal @exponent                        { c Number }

  \' ($graphic # [\'\\] | " " | @escape) \'     { c CharTok }
  \" @string* \"                                { c StringTok }

-- Catch-all so that the lexer never gets stuck on an unexpected character.
  .                                             { c Operator }
}

{

-- | Lexer state carried between tokens. A negative value selects the
-- nested-comment rules (see stateToInit); opening a block comment
-- subtracts one and closing one adds one.
type HlState = Int

-- | Which part of a comment a 'Comment' token represents.
data CommentType = Open | Close | Text | Line
    deriving (Eq, Show)

-- | Finer classification of reserved words.
data ReservedType = Where | OtherLayout | Deriving | Other
    deriving (Eq, Show)

-- | Tokens produced by this lexer.
data Token = Number | CharTok | StringTok | VarIdent | ConsIdent
           | Reserved !ReservedType | ReservedOp | Special Char
           | ConsOperator | Operator
           | Comment !CommentType
    deriving (Eq, Show)

-- | Map a token to the style used to display it.
tokenToStyle :: Token -> Style
tokenToStyle tok = case tok of
  Number       -> defaultStyle
  CharTok      -> stringStyle
  StringTok    -> stringStyle
  VarIdent     -> defaultStyle
  ConsIdent    -> upperIdStyle
  ReservedOp   -> operatorStyle
  Reserved _   -> keywordStyle
  Special _    -> defaultStyle
  ConsOperator -> upperIdStyle
  Operator     -> operatorStyle
  Comment _    -> commentStyle

-- | True for the reserved words classified as 'OtherLayout' or 'Where'.
startsLayout :: Token -> Bool
startsLayout (Reserved OtherLayout) = True
startsLayout (Reserved Where) = True
startsLayout _ = False

-- | True for every kind of comment token.
isComment :: Token -> Bool
isComment (Comment _) = True
isComment _ = False

-- Select the Alex start code for a lexer state: any negative state uses
-- the nestcomm rules, everything else uses the default rules.
stateToInit x | x < 0     = nestcomm
              | otherwise = 0

-- | State at the beginning of a buffer: outside of any comment.
initState :: HlState
initState = 0

#include "alex.hsinc"
}