{- This module was generated from data in the Kate syntax highlighting file xml.xml, version 2.03,
   by Wilbert Berendsen (wilbert@kde.nl) -}

module Text.Highlighting.Kate.Syntax.Xml
  ( highlight
  , parseExpression
  , syntaxName
  , syntaxExtensions
  ) where

import Text.Highlighting.Kate.Definitions
import Text.Highlighting.Kate.Common
import qualified Text.Highlighting.Kate.Syntax.Alert
import Text.ParserCombinators.Parsec
import Control.Monad (when)
import Data.Map (fromList)
import Data.Maybe (fromMaybe, maybeToList)

-- | Name of the language handled by this syntax definition.
syntaxName :: String
syntaxName = "XML"

-- | Semicolon-separated filename patterns associated with this language.
syntaxExtensions :: String
syntaxExtensions = "*.docbook;*.xml;*.rc;*.daml;*.rdf;*.rss;*.xspf;*.xsd;*.svg;*.ui;*.kcfg;*.qrc;*.wsdl"

-- | Highlight @input@ with this syntax definition.
--
-- Runs 'parseSource' from 'startingState'.  A parse failure is returned as
-- @Left@ carrying the 'show'n parser error; success yields the highlighted
-- source lines in @Right@.
highlight :: String -> Either String [SourceLine]
highlight input =
  either (Left . show) Right $
    runParser parseSource startingState "source" input

-- | Parse an expression using appropriate local context.
--
-- The language recorded in the parser state is set to @"XML"@ while the rules
-- run and is put back to its previous value afterwards.  If 'currentContext'
-- fails, the @"Start"@ context is pushed and 'currentContext' is retried.
parseExpression :: GenParser Char SyntaxState LabeledSource
parseExpression = do
  st <- getState
  let oldLang = synStLanguage st
  setState $ st { synStLanguage = "XML" }
  context <- currentContext <|> (pushContext "Start" >> currentContext)
  result <- parseRules context
  -- Restore only the language field; the rules may have changed other state.
  updateState $ \s -> s { synStLanguage = oldLang }
  return result

-- | Parse the whole input, one source line at a time, until end of input.
--
-- The first line is peeked with 'lookAhead' and stored in
-- 'synStCurrentLine' before any line is consumed.
parseSource :: GenParser Char SyntaxState [SourceLine]
parseSource = do
  lineContents <- lookAhead wholeLine
  updateState $ \s -> s { synStCurrentLine = lineContents }
  result <- manyTill parseSourceLine eof
  return $ map normalizeHighlighting result

-- | Initial parser state: language @"XML"@ with @"Start"@ as its only context.
startingState :: SyntaxState
startingState = SyntaxState
  { synStContexts = fromList [("XML", ["Start"])]
  , synStLanguage = "XML"
  , synStCurrentLine = ""
  , synStCharsParsedInLine = 0
  , synStPrevChar = '\n'
  , synStCaseSensitive = True
  , synStKeywordCaseSensitive = True
  , synStCaptures = []
  }

-- | Parse highlighted tokens up to (and including) the end of the line.
parseSourceLine = manyTill parseExpressionInternal pEndLine

-- | Recognise the end of a line (a newline or end of input, checked with
-- 'lookAhead') and hand over to 'pHandleEndLine'.
--
-- Every context of this syntax had the same (empty) line-end action, so the
-- per-context dispatch has been collapsed.  'currentContext' is still run so
-- that a failure from it still fails this parser, exactly as before.
pEndLine = do
  lookAhead $ newline <|> (eof >> return '\n')
  _ <- currentContext
  pHandleEndLine

-- | Label the matched text @txt@ with attribute @attr@.
--
-- Fails with @"Parser matched no text"@ when @txt@ is empty.  Otherwise the
-- state's count of characters parsed in the line is advanced by the length of
-- @txt@, its previous-character field is set to the last character of @txt@,
-- and the result pairs @txt@ with @attr@ plus the short style code found for
-- @attr@ in 'styles', if any.
withAttribute attr txt = do
  when (null txt) $ fail "Parser matched no text"
  let labs = attr : maybeToList (lookup attr styles)
  -- 'last' is safe here: the guard above has already rejected empty text.
  updateState $ \s -> s
    { synStCharsParsedInLine = synStCharsParsedInLine s + length txt
    , synStPrevChar = last txt
    }
  return (labs, txt)

-- | Attribute name to short style code, as looked up by 'withAttribute'.
styles =
  [ ("Comment", "co")
  , ("CDATA", "bn")
  , ("Processing Instruction", "kw")
  , ("Doctype", "dt")
  , ("Element", "kw")
  , ("Attribute", "ot")
  , ("Value", "st")
  , ("EntityRef", "dv")
  , ("PEntityRef", "dv")
  , ("Error", "er")
  ]

-- | Apply the rules of the current context; if none of them matches, fall back
-- to 'pDefault' labelled with the context's entry in 'defaultAttributes'
-- (or with the empty attribute name when the context has no entry).
parseExpressionInternal = do
  context <- currentContext
  parseRules context
    <|> (pDefault >>= withAttribute (fromMaybe "" $ lookup context defaultAttributes))

-- NOTE(review): everything below is reproduced verbatim and has NOT been
-- reformatted.  The text appears corrupted: the first regex literal ("))+")
-- does not look like a well-formed pattern, the second literal is never
-- closed, the start of the "Comment" rules seems to be missing, and an empty
-- string is matched where a comment terminator would be expected.  In the
-- "CDATA" rules the second `pString False "]]>"` alternative appears
-- unreachable because an identical alternative precedes it.  The last
-- `parseRules` equation continues past this section.  TODO: restore this part
-- from the generator output before touching it.
regex_'3c'21DOCTYPE'5cs'2b = compileRegex "))+" regex_'3c'21'28ELEMENT'7cENTITY'7cATTLIST'7cNOTATION'29'5cb = compileRegex ">= withAttribute "Normal Text")) <|> ((pString False "" >>= withAttribute "Comment") >>~ (popContext)) <|> ((pRegExpr regex_'2d'28'2d'28'3f'21'2d'3e'29'29'2b >>= withAttribute "Error")) <|> ((Text.Highlighting.Kate.Syntax.Alert.parseExpression)) <|> ((pDetectIdentifier >>= withAttribute "Comment"))) return (attr, result) parseRules "CDATA" = do (attr, result) <- (((pDetectSpaces >>= withAttribute "Other Text")) <|> ((pDetectIdentifier >>= withAttribute "Other Text")) <|> ((pString False "]]>" >>= withAttribute "CDATA") >>~ (popContext)) <|> ((pString False "]]>" >>= withAttribute "EntityRef"))) return (attr, result) parseRules "PI" = do (attr, result) <- ((pDetect2Chars False '?' '>' >>= withAttribute "Processing Instruction") >>~ (popContext)) return (attr, result) parseRules "Doctype" = do (attr, result) <- (((pDetectChar False '>' >>= withAttribute "Doctype") >>~ (popContext)) <|> ((pDetectChar False '[' >>= withAttribute "Doctype") >>~ pushContext "Doctype Internal Subset")) return (attr, result) parseRules "Doctype Internal Subset" = do (attr, result) <- (((pDetectChar False ']' >>= withAttribute "Doctype") >>~ (popContext)) <|> ((pRegExpr regex_'3c'21'28ELEMENT'7cENTITY'7cATTLIST'7cNOTATION'29'5cb >>= withAttribute "Doctype") >>~ pushContext "Doctype Markupdecl") <|> ((pString False "