{- Copyright 2008-2009 Mario Blazevic This file is part of the Streaming Component Combinators (SCC) project. The SCC project is free software: you can redistribute it and/or modify it under the terms of the GNU General Public License as published by the Free Software Foundation, either version 3 of the License, or (at your option) any later version. SCC is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for more details. You should have received a copy of the GNU General Public License along with SCC. If not, see . -} {-# LANGUAGE ScopedTypeVariables, Rank2Types, GADTs, FlexibleContexts #-} module Main where import Prelude hiding (appendFile, interact, last, sequence) import Data.List (intersperse, partition) import Data.Char (isAlphaNum) import Data.Maybe (fromJust) import Control.Concurrent (forkIO) import Control.Exception (evaluate) import Control.Monad (liftM, when) import Control.Monad.Trans (lift) import qualified Text.Parsec as Parsec import qualified Text.Parsec.String as Parsec import Text.Parsec hiding (count, parse) import Text.Parsec.String hiding (Parser) import Text.Parsec.Language (emptyDef) import Text.Parsec.Token import System.Console.GetOpt import System.Console.Readline import System.Environment (getArgs) import System.IO (BufferMode (NoBuffering), hFlush, hIsWritable, hPutStrLn, hReady, hSetBuffering, stderr, stdout) import qualified System.Process as Process import Control.Concurrent.MVar import Debug.Trace (trace) import System.IO (Handle, IOMode (ReadMode, WriteMode, AppendMode), openFile, hClose, hGetChar, hGetContents, hPutChar, hFlush, hIsEOF, hClose, putChar, isEOF, stdout) import Control.Concurrent.Configuration (Component, atomic, showComponentTree, usingThreads, with) import Control.Concurrent.Coroutine import Control.Concurrent.SCC.Streams import Control.Concurrent.SCC.Types import Control.Concurrent.SCC.Components hiding ((&&), (||)) import Control.Concurrent.SCC.Combinators (JoinableComponentPair) import qualified Control.Concurrent.SCC.Components as Combinators import qualified Control.Concurrent.SCC.XML as XML data Expression where -- Compiled expressions Compiled :: TypeTag x -> Component x -> Expression -- Generic expressions NativeCommand :: String -> Expression TypeError :: TypeTag x -> TypeTag y -> Expression -> Expression Join :: Expression -> Expression -> Expression Sequence :: Expression -> Expression -> Expression Pipe :: Expression -> Expression -> Expression If :: Expression -> Expression -> Expression -> Expression ForEach :: Expression -> Expression -> Expression -> Expression -- Void expressions, i.e. commands Exit :: Expression -- ProducerComponent constructs FromList :: String -> Expression FileProducer :: String -> Expression StdInProducer :: Expression -- ConsumerComponent constructs FileConsumer :: String -> Expression FileAppend :: String -> Expression Suppress :: Expression ErrorConsumer :: String -> Expression -- TransducerComponent constructs Select :: Expression -> Expression While :: Expression -> Expression -> Expression ExecuteTransducer :: Expression IdentityTransducer :: Expression Count :: Expression Concatenate :: Expression Group :: Expression Unparse :: Expression Uppercase :: Expression ShowTransducer :: Expression -- SplitterComponent constructs EverythingSplitter :: Expression NothingSplitter :: Expression WhitespaceSplitter :: Expression LineSplitter :: Expression LetterSplitter :: Expression DigitSplitter :: Expression MarkedSplitter :: Expression OneSplitter :: Expression SubstringSplitter :: String -> Expression And :: Expression -> Expression -> Expression Or :: Expression -> Expression -> Expression ZipWithAnd :: Expression -> Expression -> Expression ZipWithOr :: Expression -> Expression -> Expression Not :: Expression -> Expression FollowedBy :: Expression -> Expression -> Expression Nested :: Expression -> Expression -> Expression Having :: Expression -> Expression -> Expression HavingOnly :: Expression -> Expression -> Expression Between :: Expression -> Expression -> Expression First :: Expression -> Expression Last :: Expression -> Expression Prefix :: Expression -> Expression Suffix :: Expression -> Expression Prepend :: Expression -> Expression Append :: Expression -> Expression Substitute :: Expression -> Expression StartOf :: Expression -> Expression EndOf :: Expression -> Expression -- XML PrimitiveComponents XMLTokenParser :: Expression XMLAttribute :: Expression XMLAttributeName :: Expression XMLAttributeValue :: Expression XMLElement :: Expression XMLElementContent :: Expression XMLElementName :: Expression XMLElementHavingTag :: Expression -> Expression XMLHavingText :: Expression -> Expression -> Expression XMLHavingOnlyText :: Expression -> Expression -> Expression instance Show Expression where showsPrec _ (Compiled tag c) rest = "compiled " ++ shows tag rest showsPrec _ (NativeCommand cmd) rest = "native \"" ++ cmd ++ "\"" ++ rest showsPrec p (Pipe left right) rest | p < 3 = showsPrec 3 left (" | " ++ showsPrec 2 right rest) showsPrec _ (If s t f) rest = "if " ++ showsPrec 0 s (" then " ++ showsPrec 0 t (" else " ++ showsPrec 0 f (" end if" ++ rest))) showsPrec _ (ForEach s t f) rest = "foreach " ++ showsPrec 0 s (" then " ++ showsPrec 0 t (" else " ++ showsPrec 0 f (" end foreach" ++ rest))) showsPrec _ Exit rest = "Exit" ++ rest showsPrec _ (FileProducer f) rest = "FileProducer \"" ++ f ++ "\"" ++ rest showsPrec _ (FromList str) rest = "echo \"" ++ str ++ "\"" ++ rest showsPrec 0 (Sequence p1 p2) rest = showsPrec 2 p1 (";\n" ++ showsPrec 0 p2 rest) showsPrec 1 (Sequence p1 p2) rest = showsPrec 2 p1 ("; " ++ showsPrec 1 p2 rest) showsPrec p e@Sequence{} rest = "(" ++ showsPrec 1 e (')' : rest) showsPrec 0 (Join p1 p2) rest = showsPrec 2 p1 (" &\n" ++ showsPrec 0 p2 rest) showsPrec 1 (Join p1 p2) rest = showsPrec 2 p1 (" & " ++ showsPrec 1 p2 rest) showsPrec p e@Join{} rest = "(" ++ showsPrec 1 e (')' : rest) showsPrec _ (FileConsumer f) rest = "> \"" ++ f ++ "\"" ++ rest showsPrec _ (FileAppend f) rest = ">> \"" ++ f ++ "\"" ++ rest showsPrec _ (Suppress) rest = "suppress" ++ rest showsPrec _ (ErrorConsumer e) rest = "error \"" ++ e ++ "\"" ++ rest showsPrec p (Select s) rest | p < 4 = "select " ++ showsPrec 4 s rest showsPrec _ (While s t) rest = "while " ++ showsPrec 0 s (" do " ++ showsPrec 0 t (" end while" ++ rest)) showsPrec p (And s1 s2) rest | p < 4 = showsPrec 4 s1 (" >& " ++ showsPrec 4 s2 rest) showsPrec p (Or s1 s2) rest | p < 4 = showsPrec 4 s1 (" >| " ++ showsPrec 4 s2 rest) showsPrec p (ZipWithAnd s1 s2) rest | p < 4 = showsPrec 4 s1 (" && " ++ showsPrec 4 s2 rest) showsPrec p (ZipWithOr s1 s2) rest | p < 4 = showsPrec 4 s1 (" || " ++ showsPrec 4 s2 rest) showsPrec p (FollowedBy s1 s2) rest | p < 4 = showsPrec 4 s1 (", " ++ showsPrec 4 s2 rest) showsPrec p (Not s) rest | p < 4 = ">! " ++ showsPrec 4 s rest showsPrec p (Nested s1 s2) rest | p < 4 = showsPrec 4 s1 (" nested in " ++ showsPrec 4 s2 rest) showsPrec p (Having s1 s2) rest | p < 4 = showsPrec 4 s1 (" having " ++ showsPrec 4 s2 rest) showsPrec p (HavingOnly s1 s2) rest | p < 4 = showsPrec 4 s1 (" having-only " ++ showsPrec 4 s2 rest) showsPrec p (Between s1 s2) rest | p < 4 = showsPrec 4 s1 (" ... " ++ showsPrec 4 s2 rest) showsPrec p (First s) rest | p < 4 = "first " ++ showsPrec 4 s rest showsPrec p (Last s) rest | p < 4 = "last " ++ showsPrec 4 s rest showsPrec p (Prefix s) rest | p < 4 = "prefix " ++ showsPrec 4 s rest showsPrec p (Suffix s) rest | p < 4 = "suffix " ++ showsPrec 4 s rest showsPrec p (Prepend s) rest | p < 4 = "prepend " ++ showsPrec 4 s rest showsPrec p (Append s) rest | p < 4 = "append " ++ showsPrec 4 s rest showsPrec p (Substitute s) rest | p < 4 = "substitute " ++ showsPrec 4 s rest showsPrec p (StartOf s) rest | p < 4 = "start-of " ++ showsPrec 4 s rest showsPrec p (EndOf s) rest | p < 4 = "end-of " ++ showsPrec 4 s rest showsPrec _ ExecuteTransducer rest = "execute" ++ rest showsPrec _ IdentityTransducer rest = "id" ++ rest showsPrec _ Count rest = "count" ++ rest showsPrec _ Concatenate rest = "concatenate" ++ rest showsPrec _ Group rest = "group" ++ rest showsPrec _ Unparse rest = "unparse" ++ rest showsPrec _ Uppercase rest = "uppercase" ++ rest showsPrec _ ShowTransducer rest = "show" ++ rest showsPrec _ EverythingSplitter rest = "everything" ++ rest showsPrec _ NothingSplitter rest = "nothing" ++ rest showsPrec _ WhitespaceSplitter rest = "whitespace" ++ rest showsPrec _ LineSplitter rest = "line" ++ rest showsPrec _ LetterSplitter rest = "letters" ++ rest showsPrec _ DigitSplitter rest = "digits" ++ rest showsPrec _ MarkedSplitter rest = "marked" ++ rest showsPrec _ OneSplitter rest = "one" ++ rest showsPrec _ (SubstringSplitter s) rest = "substring " ++ shows s (' ' : rest) showsPrec _ XMLTokenParser rest = "XML.parse" ++ rest showsPrec _ XMLElement rest = "XML.element" ++ rest showsPrec _ XMLAttribute rest = "XML.attribute" ++ rest showsPrec _ XMLAttributeName rest = "XML.attribute-name" ++ rest showsPrec _ XMLAttributeValue rest = "XML.attribute-value" ++ rest showsPrec _ XMLElementContent rest = "XML.element-content" ++ rest showsPrec _ XMLElementName rest = "XML.element-name" ++ rest showsPrec p (XMLElementHavingTag s) rest = "XML.element-having-tag " ++ showsPrec 4 s (' ' : rest) showsPrec p (XMLHavingText s1 s2) rest = showsPrec 4 s1 (" XML.having-text " ++ showsPrec 4 s2 rest) showsPrec p (XMLHavingOnlyText s1 s2) rest = showsPrec 4 s1 (" XML.having-only-text " ++ showsPrec 4 s2 rest) showsPrec _ (TypeError tag1 tag2 e) rest = ("Type error: expecting " ++ show tag2 ++ ", received " ++ show tag1 ++ "\nin expression " ++ showsPrec 9 e rest) showsPrec p e rest | p > 0 = "(" ++ showsPrec 0 e (')' : rest) data TypeTag x where -- Data type tags AnyTag :: TypeTag () UnitTag :: TypeTag () ShowableTag :: Show x => TypeTag x CharTag :: TypeTag Char IntTag :: TypeTag Integer XMLTokenTag :: TypeTag XML.Token EitherTag :: TypeTag x -> TypeTag y -> TypeTag (Either x y) ListTag :: TypeTag x -> TypeTag [x] MaybeTag :: TypeTag x -> TypeTag (Maybe x) PairTag :: TypeTag x -> TypeTag y -> TypeTag (x, y) MarkupTag :: TypeTag x -> TypeTag y -> TypeTag (Markup x y) -- Streaming component type tags ComponentTag :: TypeTag x -> TypeTag (Component x) CommandTag :: TypeTag (Performer IO ()) ConsumerTag :: TypeTag x -> TypeTag (Consumer IO x ()) ProducerTag :: TypeTag x -> TypeTag (Producer IO x ()) SplitterTag :: forall x b. TypeTag x -> TypeTag b -> TypeTag (Splitter IO x b) TransducerTag :: TypeTag x -> TypeTag y -> TypeTag (Transducer IO x y) GenericInputTag :: (TypeTag x -> TypeTag y) -> TypeTag y instance Show (TypeTag x) where show AnyTag = "Any" show UnitTag = "()" show CharTag = "Char" show IntTag = "Int" show XMLTokenTag = "XML.Token" show (ListTag x) = '[' : shows x "]" show (MaybeTag x) = "Maybe " ++ show x show (EitherTag x y) = "Either " ++ shows x (" " ++ show y) show (MarkupTag x y) = "Markup " ++ shows x (" " ++ show y) show (PairTag x y) = "(" ++ shows x (", " ++ shows y ")") show (ComponentTag c) = show c show CommandTag = "Command" show (ConsumerTag x) = "Consumer " ++ show x show (ProducerTag x) = "Producer " ++ show x show (SplitterTag x b) = "Splitter " ++ shows x (" " ++ show b) show (TransducerTag x y) = "Transducer " ++ shows x (" -> " ++ show y) show GenericInputTag{} = "Generic" -- Weirich's higher-order type-safe cast data CConsumer c x = CConsumer (c (Consumer IO x ())) data CProducer c x = CProducer (c (Producer IO x ())) data CComponent c x = CComponent (c (Component x)) data CList c a = CList (c [a]) data CMaybe c a = CMaybe (c (Maybe a)) data CFlip c b a = CFlip (c a b) data CEL c a d = CEL (c (Either d a)) data CER c a d = CER (c (Either a d)) data CML c a d = CML (c (Markup d a)) data CMR c a d = CMR (c (Markup a d)) data CL c a d = CL (c (d,a)) data CR c a d = CR (c (a,d)) data CTL c a d = CTL (c (Transducer IO d a)) data CTR c a d = CTR (c (Transducer IO a d)) data CSL c a d = CSL (c (Splitter IO d a)) data CSR c a d = CSR (c (Splitter IO a d)) typecast :: forall a b c. TypeTag a -> TypeTag b -> c a -> Maybe (c b) typecast UnitTag UnitTag x = Just x typecast CharTag CharTag x = Just x typecast IntTag IntTag x = Just x typecast XMLTokenTag XMLTokenTag x = Just x typecast (ListTag a) (ListTag b) x = fmap (\(CList y)-> y) (typecast a b (CList x)) typecast (MaybeTag a) (MaybeTag b) x = fmap (\(CMaybe y)-> y) (typecast a b (CMaybe x)) typecast (EitherTag (ra::TypeTag a0) (rb::TypeTag b0)) (EitherTag (ra'::TypeTag a0') (rb'::TypeTag b0')) x = let g = (typecast ra ra' :: (CEL c b0) a0 -> Maybe ((CEL c b0) a0')) h = (typecast rb rb' :: (CER c a0') b0 -> Maybe ((CER c a0') b0')) in case g (CEL x) of Just (CEL x') -> case h (CER x') of Just (CER y') -> Just y' Nothing -> Nothing typecast (MarkupTag (ra::TypeTag a0) (rb::TypeTag b0)) (MarkupTag (ra'::TypeTag a0') (rb'::TypeTag b0')) x = let g = (typecast ra ra' :: (CML c b0) a0 -> Maybe ((CML c b0) a0')) h = (typecast rb rb' :: (CMR c a0') b0 -> Maybe ((CMR c a0') b0')) in case g (CML x) of Just (CML x') -> case h (CMR x') of Just (CMR y') -> Just y' Nothing -> Nothing typecast (PairTag (ra::TypeTag a0) (rb::TypeTag b0)) (PairTag (ra'::TypeTag a0') (rb'::TypeTag b0')) x = let g = (typecast ra ra' :: (CL c b0) a0 -> Maybe ((CL c b0) a0')) h = (typecast rb rb' :: (CR c a0') b0 -> Maybe ((CR c a0') b0')) in case g (CL x) of Just (CL x') -> case h (CR x') of Just (CR y') -> Just y' Nothing -> Nothing typecast (ComponentTag a) (ComponentTag b) x = fmap (\(CComponent y)-> y) (typecast a b (CComponent x)) typecast CommandTag CommandTag x = Just x typecast (ConsumerTag a) (ConsumerTag b) x = fmap (\(CConsumer y)-> y) (typecast a b (CConsumer x)) typecast (ProducerTag a) (ProducerTag b) x = fmap (\(CProducer y)-> y) (typecast a b (CProducer x)) typecast (TransducerTag (ra::TypeTag a0) (rb::TypeTag b0)) (TransducerTag (ra'::TypeTag a0') (rb'::TypeTag b0')) x = let g = (typecast ra ra' :: (CTL c b0) a0 -> Maybe ((CTL c b0) a0')) h = (typecast rb rb' :: (CTR c a0') b0 -> Maybe ((CTR c a0') b0')) in case g (CTL x) of Nothing -> Nothing Just (CTL x') -> case h (CTR x') of Nothing -> Nothing Just (CTR y') -> Just y' typecast (SplitterTag (ra::TypeTag a0) (rb::TypeTag b0)) (SplitterTag (ra'::TypeTag a0') (rb'::TypeTag b0')) x = let g = (typecast ra ra' :: (CSL c b0) a0 -> Maybe ((CSL c b0) a0')) h = (typecast rb rb' :: (CSR c a0') b0 -> Maybe ((CSR c a0') b0')) in case g (CSL x) of Just (CSL x') -> case h (CSR x') of Just (CSR y') -> Just y' Nothing -> Nothing typecast _ _ _ = Nothing trycast :: forall a b. TypeTag a -> TypeTag b -> a -> Expression -> (b -> Expression) -> Expression trycast tag1 tag2 x e constructor = case typecast tag1 tag2 (Just x) of Just (Just y) -> constructor y Nothing -> TypeError tag1 tag2 e tryComponentCast :: forall a b. TypeTag a -> TypeTag b -> Component a -> Expression -> (Component b -> Expression) -> Expression tryComponentCast tag1 tag2 = trycast (ComponentTag tag1) (ComponentTag tag2) data Flag = Command | Help | Interactive | PrettyPrint | ScriptFile String | StandardInput | Threads String deriving Eq data InputSource = UnspecifiedSource | CommandLineSource | InteractiveSource | ScriptFileSource String | StandardInputSource data Flags = Flags {helpFlag :: Bool, inputSourceFlag :: InputSource, prettyPrintFlag :: Bool, threadCount :: Maybe Int} flagList = [Option "c" ["command"] (NoArg Command) "Execute a single command", Option "p" ["prettyprint"] (NoArg PrettyPrint) "Pretty print the input expression instead of executing it", Option "h" ["help"] (NoArg Help) "Show help", Option "f" ["file"] (ReqArg ScriptFile "file") "Execute commands from a script file", Option "i" ["interactive"] (NoArg Interactive) "Execute commands interactively", Option "s" ["stdin"] (NoArg StandardInput) "Execute commands from the standard input", Option "t" ["threads"] (ReqArg Threads "threads") "Specify number of threads to use"] usageSyntax = "Usage: shsh (-c | -f | -i | -s) " main = do args <- getArgs let (specifiedOptions, arguments, errors) = getOpt Permute flagList args emptyOptions = Flags {helpFlag = False, inputSourceFlag = UnspecifiedSource, prettyPrintFlag = False, threadCount = Nothing} options = foldr extractOption emptyOptions specifiedOptions extractOption Command options@Flags{inputSourceFlag= UnspecifiedSource} = options{inputSourceFlag= CommandLineSource} extractOption Help options = options{helpFlag= True} extractOption Interactive options@Flags{inputSourceFlag= UnspecifiedSource} = options{inputSourceFlag= InteractiveSource} extractOption StandardInput options@Flags{inputSourceFlag= UnspecifiedSource} = options{inputSourceFlag= StandardInputSource} extractOption PrettyPrint options = options{prettyPrintFlag= True} extractOption (ScriptFile name) options@Flags{inputSourceFlag= UnspecifiedSource} = options{inputSourceFlag= ScriptFileSource name} extractOption (Threads count) options@Flags{threadCount= Nothing} = options{threadCount= Just (read count)} if not (null errors) || helpFlag options then showHelp else case inputSourceFlag options of CommandLineSource -> interpret options (concat (intersperse " " arguments)) >> return () InteractiveSource -> interact options ScriptFileSource name -> readFile name >>= interpret options >> return () StandardInputSource -> getContents >>= interpret options >> return () UnspecifiedSource -> interact options prettyprint options expression = print expression >> case compile UnitTag expression of Compiled tag component -> putStrLn "::" >> print tag >> putStrLn (showComponentTree $ adjust options component) e@TypeError{} -> print e showHelp = putStrLn (usageInfo usageSyntax flagList) interact options = do Just command <- readline "> " addHistory command finish <- interpret options command when (not finish) (interact options) interpret options command = case parseExpression command of Left position -> hPutStrLn stderr ("Error at " ++ show position) >> return False Right (Exit, "", _) -> return True Right (expression, "", _) -> (if (prettyPrintFlag options) then prettyprint options expression else case compile UnitTag expression of e@Compiled{} -> execute options e e@TypeError{} -> print e) >> return False Right (expression, rest, _) -> hPutStrLn stderr ("Cannot parse \"" ++ rest ++ "\"\nafter " ++ show expression) >> return False execute :: Flags -> Expression -> IO () execute options (Compiled CommandTag command) = perform $ with $ adjust options command execute options (Compiled (ProducerTag CharTag) producer) = liftM fst (runCoroutine (pipe (produce $ with $ adjust options producer) (consume $ with toStdOut))) >> hFlush stdout execute options (Compiled tag _) = hPutStrLn stderr ("Expecting a command or a ProducerComponent Char, received a " ++ show tag) adjust Flags{threadCount= Just threads} component = usingThreads component threads adjust _ component = component compile :: TypeTag x -> Expression -> Expression compile inputTag e@Compiled{} = e compile inputTag e@TypeError{} = e compile inputTag (Pipe left right) = case compile inputTag left of Compiled tag@(ProducerTag tag1) p -> case compile tag1 right of Compiled (ConsumerTag tag2) c -> tryComponentCast tag (ProducerTag tag2) p left $ \p'-> Compiled CommandTag (p' >-> c) Compiled (TransducerTag tag2 tag3) t -> tryComponentCast tag (ProducerTag tag2) p left $ \p'-> Compiled (ProducerTag tag3) (p' >-> t) e@TypeError{} -> e Compiled (TransducerTag tag1 tag2) t -> case compile tag2 right of Compiled tag3@ConsumerTag{} c -> tryComponentCast tag3 (ConsumerTag tag2) c right $ \c'-> Compiled (ConsumerTag tag1) (t >-> c') Compiled tag@(TransducerTag tag3 tag4) t2 -> tryComponentCast tag (TransducerTag tag2 tag4) t2 right $ \t2'-> Compiled (TransducerTag tag1 tag4) (t >-> t2') e@TypeError{} -> e Compiled tag _ -> TypeError tag (TransducerTag tag2 AnyTag) right Compiled tag _ -> TypeError tag (ProducerTag AnyTag) left e@TypeError{} -> e compile UnitTag (NativeCommand command) = Compiled (ProducerTag CharTag) $ atomic command ioCost $ Producer $ \sink-> do (Nothing, Just stdout, Nothing, pid) <- lift (Process.createProcess (Process.shell command){Process.std_out= Process.CreatePipe}) produce (with $ fromHandle stdout True) sink compile UnitTag (FileProducer path) = Compiled (ProducerTag CharTag) (fromFile path) compile UnitTag StdInProducer = Compiled (ProducerTag CharTag) fromStdIn compile inputTag (FromList string) = Compiled (ProducerTag CharTag) (atomic "putList" 1 $ Producer $ \sink-> putList string sink >> return ()) compile inputTag (FileConsumer path) = Compiled (ConsumerTag CharTag) (toFile path) compile inputTag (FileAppend path) = Compiled (ConsumerTag CharTag) (appendFile path) compile inputTag Suppress = Compiled (ConsumerTag inputTag) suppress compile inputTag (ErrorConsumer message) = Compiled (ConsumerTag inputTag) (erroneous message) compile inputTag (Sequence e1 e2) = compileJoin sequence inputTag e1 e2 compile inputTag (Join e1 e2) = compileJoin join inputTag e1 e2 compile inputTag (ForEach splitter true false) = combineSplitterAndBranches foreach inputTag splitter true false compile inputTag (If splitter true false) = combineSplitterAndBranches ifs inputTag splitter true false compile inputTag (NativeCommand command) = Compiled (TransducerTag CharTag CharTag) (atomic command ioCost $ Transducer f) where f source sink = do (Just stdin, Just stdout, Nothing, pid) <- lift (Process.createProcess (Process.shell command){Process.std_in= Process.CreatePipe, Process.std_out= Process.CreatePipe}) lift (hSetBuffering stdin NoBuffering >> hSetBuffering stdout NoBuffering) interleave source stdin pid stdout sink return [] interleave :: forall a1 a2 d. (AncestorFunctor a1 d, AncestorFunctor a2 d) => Source IO a1 Char -> Handle -> Process.ProcessHandle -> Handle -> Sink IO a2 Char -> Coroutine d IO () interleave source stdin pid stdout sink = interleave1 where interleave1 = get source >>= maybe (lift (hClose stdin) >> interleaveEnd) (\x-> lift (Process.getProcessExitCode pid) >>= maybe (lift (hPutChar stdin x) >> interleave2) (const interleave2)) interleave2 = canPut sink >>= flip when (lift (hReady stdout) >>= flip when (lift (hGetChar stdout) >>= put sink >> return ()) >> interleave1) interleaveEnd = canPut sink >>= flip when (lift (hIsEOF stdout) >>= cond (lift $ hClose stdout) (lift (hGetChar stdout) >>= put sink >> interleaveEnd)) compile inputTag (Select e) = case compile inputTag e of Compiled (SplitterTag tag _) s -> Compiled (TransducerTag tag tag) (select s) Compiled tag _ -> TypeError tag (SplitterTag inputTag AnyTag) e e'@TypeError{} -> e' compile inputTag (While condition body) = case (compile inputTag condition, compile inputTag body) of (Compiled (SplitterTag tag1 _) s, Compiled tag2@TransducerTag{} t) -> let tag2' = TransducerTag tag1 tag1 in tryComponentCast tag2 tag2' t body (\t'-> Compiled tag2' (while t' s)) compile inputTag (FollowedBy left right) = combineSplitters followedBy inputTag PairTag left right compile inputTag (And left right) = combineSplitters (>&) inputTag PairTag left right compile inputTag (Or left right) = combineSplitters (>|) inputTag EitherTag left right compile inputTag (ZipWithAnd left right) = combineSplitters (Combinators.&&) inputTag PairTag left right compile inputTag (ZipWithOr left right) = combineSplitters (Combinators.||) inputTag EitherTag left right compile inputTag (Nested left right) = combineSplittersOfSameType nestedIn inputTag left right compile inputTag (Having left right) = combineSplittersOfSameType having inputTag left right compile inputTag (HavingOnly left right) = combineSplittersOfSameType havingOnly inputTag left right compile inputTag (Between left right) = combineSplittersOfSameType (...) inputTag left right compile inputTag (Not splitter) = wrapSplitter snot inputTag splitter compile inputTag (First splitter) = wrapSplitter first inputTag splitter compile inputTag (Last splitter) = wrapSplitter last inputTag splitter compile inputTag (Prefix splitter) = wrapSplitter prefix inputTag splitter compile inputTag (Suffix splitter) = wrapSplitter suffix inputTag splitter compile inputTag (StartOf splitter) = wrapSplitter' startOf inputTag MaybeTag splitter compile inputTag (EndOf splitter) = wrapSplitter' endOf inputTag MaybeTag splitter compile inputTag (Prepend prefix) = wrapProducerIntoTransducer prepend inputTag prefix compile inputTag (Append suffix) = wrapProducerIntoTransducer append inputTag suffix compile inputTag (Substitute replacement) = wrapGenericProducerIntoTransducer substitute inputTag replacement compile inputTag ExecuteTransducer = Compiled (TransducerTag CharTag CharTag) (atomic "execute" ioCost $ Transducer execute) where execute :: forall a1 a2 d. OpenTransducer IO a1 a2 d Char Char execute source sink = do let (source' :: Source IO d Char) = liftSource source ((), command) <- pipe (pour source') getList (Nothing, Just stdout, Nothing, pid) <- lift (Process.createProcess (Process.shell command){Process.std_out= Process.CreatePipe}) produce (with $ fromHandle stdout True) sink return [] compile inputTag IdentityTransducer = Compiled (TransducerTag inputTag inputTag) asis compile inputTag Count = Compiled (TransducerTag inputTag IntTag) count compile inputTag@(ListTag itemTag) Concatenate = Compiled (TransducerTag inputTag itemTag) concatenate compile inputTag Concatenate = TypeError inputTag (ListTag AnyTag) Concatenate compile inputTag Group = Compiled (TransducerTag inputTag (ListTag inputTag)) group compile t@(MarkupTag t1 t2) Unparse = Compiled (TransducerTag t t2) unparse compile inputTag Unparse = TypeError (TransducerTag (MarkupTag AnyTag AnyTag) AnyTag) (TransducerTag inputTag AnyTag) Unparse compile CharTag Uppercase = Compiled (TransducerTag CharTag CharTag) uppercase compile inputTag Uppercase = TypeError (TransducerTag CharTag CharTag) (TransducerTag inputTag AnyTag) Uppercase compile inputTag@CharTag ShowTransducer = Compiled (TransducerTag inputTag (ListTag CharTag)) toString compile inputTag@IntTag ShowTransducer = Compiled (TransducerTag inputTag (ListTag CharTag)) toString compile inputTag@(MarkupTag XMLTokenTag CharTag) ShowTransducer = Compiled (TransducerTag inputTag (ListTag CharTag)) toString compile inputTag ShowTransducer = TypeError (TransducerTag IntTag (ListTag CharTag)) (TransducerTag inputTag AnyTag) ShowTransducer {- compile inputTag ShowTransducer = let targetType = TransducerTag ShowableTag (ListTag CharTag) actualType = TransducerTag inputTag (ListTag CharTag) in trycast targetType actualType toString ShowTransducer (Compiled actualType) -} compile inputTag EverythingSplitter = Compiled (SplitterTag inputTag UnitTag) everything compile inputTag NothingSplitter = Compiled (SplitterTag inputTag UnitTag) nothing compile inputTag WhitespaceSplitter = Compiled (SplitterTag CharTag UnitTag) whitespace compile inputTag LineSplitter = Compiled (SplitterTag CharTag UnitTag) line compile inputTag LetterSplitter = Compiled (SplitterTag CharTag UnitTag) letters compile inputTag DigitSplitter = Compiled (SplitterTag CharTag UnitTag) digits compile inputTag MarkedSplitter = Compiled (SplitterTag (MarkupTag AnyTag AnyTag) UnitTag) marked compile inputTag OneSplitter = Compiled (SplitterTag inputTag UnitTag) one compile CharTag (SubstringSplitter part) = Compiled (SplitterTag CharTag UnitTag) (substring part) compile inputTag e@SubstringSplitter{} = TypeError (SplitterTag CharTag UnitTag) (SplitterTag inputTag UnitTag) e compile CharTag XMLTokenParser = Compiled (TransducerTag CharTag (MarkupTag XMLTokenTag CharTag)) xmlParseTokens compile t@(MarkupTag XMLTokenTag CharTag) XMLElement = Compiled (SplitterTag t UnitTag) xmlElement compile t@(MarkupTag XMLTokenTag CharTag) XMLAttribute = Compiled (SplitterTag t UnitTag) xmlAttribute compile t@(MarkupTag XMLTokenTag CharTag) XMLAttributeName = Compiled (SplitterTag t UnitTag) xmlAttributeName compile t@(MarkupTag XMLTokenTag CharTag) XMLAttributeValue = Compiled (SplitterTag t UnitTag) xmlAttributeValue compile t@(MarkupTag XMLTokenTag CharTag) XMLElementContent = Compiled (SplitterTag t UnitTag) xmlElementContent compile t@(MarkupTag XMLTokenTag CharTag) XMLElementName = Compiled (SplitterTag t UnitTag) xmlElementName compile t@(MarkupTag XMLTokenTag CharTag) (XMLElementHavingTag s) = wrapConcreteSplitter xmlElementHavingTag t s compile t@(MarkupTag XMLTokenTag CharTag) (XMLHavingText left right) = combineSplittersOfDifferentTypes xmlHavingText t CharTag left right compile t@(MarkupTag XMLTokenTag CharTag) (XMLHavingOnlyText left right) = combineSplittersOfDifferentTypes xmlHavingOnlyText t CharTag left right compile inputTag expression = error ("Cannot compile " ++ show expression ++ " with input " ++ show inputTag) compileJoin :: forall t. (forall t1 t2 t3 m x y c1 c2 c3. JoinableComponentPair t1 t2 t3 m x y c1 c2 c3 => Component c1 -> Component c2 -> Component c3) -> TypeTag t -> Expression -> Expression -> Expression compileJoin combinator inputTag e1 e2 = case (compile inputTag e1, compile inputTag e2) of (Compiled CommandTag c1, Compiled CommandTag c2) -> Compiled CommandTag (combinator c1 c2) (Compiled tag1@ProducerTag{} p1, Compiled tag2@ProducerTag{} p2) -> tryComponentCast tag2 tag1 p2 e2 (\p2'-> Compiled tag1 (combinator p1 p2')) (Compiled tag1@ConsumerTag{} c1, Compiled tag2@ConsumerTag{} c2) -> tryComponentCast tag2 tag1 c2 e2 (\c2'-> Compiled tag1 (combinator c1 c2')) (Compiled tag1@TransducerTag{} t1, Compiled tag2@TransducerTag{} t2) -> tryComponentCast tag2 tag1 t2 e2 (\t2'-> Compiled tag1 (combinator t1 t2')) (Compiled CommandTag c, Compiled tag@ProducerTag{} p) -> Compiled tag (combinator c p) (Compiled tag@ProducerTag{} p, Compiled CommandTag c) -> Compiled tag (combinator p c) (Compiled CommandTag c1, Compiled tag@ConsumerTag{} c2) -> Compiled tag (combinator c1 c2) (Compiled tag@ConsumerTag{} c1, Compiled CommandTag c2) -> Compiled tag (combinator c1 c2) (Compiled CommandTag c, Compiled tag@TransducerTag{} t) -> Compiled tag (combinator c t) (Compiled tag@TransducerTag{} t, Compiled CommandTag c) -> Compiled tag (combinator t c) (Compiled (ProducerTag tag1) p, Compiled (ConsumerTag tag2) c) -> Compiled (TransducerTag tag2 tag1) (combinator p c) (Compiled (ConsumerTag tag1) p, Compiled (ProducerTag tag2) c) -> Compiled (TransducerTag tag1 tag2) (combinator p c) (Compiled (ProducerTag tag1) p, Compiled tag@(TransducerTag tag2 tag3) t) -> let tag' = TransducerTag tag2 tag1 in tryComponentCast tag tag' t e2 (\t'-> Compiled tag' (combinator p t')) (Compiled tag@(TransducerTag tag1 tag2) t, Compiled tag3@ProducerTag{} p) -> let tag' = TransducerTag tag2 tag1 in tryComponentCast tag3 (ProducerTag tag2) p e2 (\p'-> Compiled tag (combinator t p')) (Compiled (ConsumerTag tag1) c, Compiled tag@(TransducerTag tag2 tag3) t) -> let tag' = TransducerTag tag1 tag3 in tryComponentCast tag tag' t e2 (\t'-> Compiled tag' (combinator c t')) (Compiled tag@(TransducerTag tag1 tag2) t, Compiled tag3@ConsumerTag{} c) -> let tag' = TransducerTag tag2 tag1 in tryComponentCast tag3 (ConsumerTag tag1) c e2 (\c'-> Compiled tag (combinator t c')) (e@TypeError{}, _) -> e (_, e@TypeError{}) -> e (Compiled tag@SplitterTag{} _, _) -> TypeError tag (ProducerTag AnyTag) e1 (_, Compiled tag@SplitterTag{} _) -> TypeError tag (ProducerTag AnyTag) e2 wrapSplitter :: forall x. (forall x b. SplitterComponent IO x b -> SplitterComponent IO x b) -> TypeTag x -> Expression -> Expression wrapSplitter combinator inputTag expression = case compile inputTag expression of Compiled tag@(SplitterTag tx tb) splitter -> Compiled (SplitterTag tx tb) (combinator splitter) Compiled tag _ -> TypeError tag (SplitterTag inputTag AnyTag) expression e@TypeError{} -> e wrapConcreteSplitter :: forall x. (forall b. SplitterComponent IO x b -> SplitterComponent IO x b) -> TypeTag x -> Expression -> Expression wrapConcreteSplitter combinator inputTag expression = case compile inputTag expression of Compiled tag@(SplitterTag tx tb) splitter -> tryComponentCast tag (SplitterTag inputTag tb) splitter expression $ \s'-> Compiled (SplitterTag inputTag tb) (combinator s') Compiled tag _ -> TypeError tag (SplitterTag inputTag AnyTag) expression e@TypeError{} -> e wrapConcreteSplitter' :: forall x y. (forall b. SplitterComponent IO x b -> SplitterComponent IO y ()) -> TypeTag x -> TypeTag y -> Expression -> Expression wrapConcreteSplitter' combinator inputTag outputTag expression = case compile inputTag expression of Compiled tag@(SplitterTag tx tb) splitter -> tryComponentCast tag (SplitterTag inputTag tb) splitter expression $ \s'-> Compiled (SplitterTag outputTag UnitTag) (combinator s') Compiled tag _ -> TypeError tag (SplitterTag inputTag AnyTag) expression e@TypeError{} -> e wrapSplitter' :: forall x c. (forall x b. SplitterComponent IO x b -> SplitterComponent IO x (c b)) -> TypeTag x -> (forall b. TypeTag b -> TypeTag (c b)) -> Expression -> Expression wrapSplitter' combinator inputTag constructor expression = case compile inputTag expression of Compiled tag@(SplitterTag tx tb) splitter -> Compiled (SplitterTag tx (constructor tb)) (combinator splitter) Compiled tag _ -> TypeError tag (SplitterTag inputTag AnyTag) expression e@TypeError{} -> e wrapProducerIntoTransducer :: forall x. (ProducerComponent IO x () -> TransducerComponent IO x x) -> TypeTag x -> Expression -> Expression wrapProducerIntoTransducer combinator inputTag expression = case compile inputTag expression of Compiled tag@ProducerTag{} p -> tryComponentCast tag (ProducerTag inputTag) p expression $ \p'-> Compiled (TransducerTag inputTag inputTag) (combinator p') Compiled tag _ -> TypeError tag (ProducerTag inputTag) expression e@TypeError{} -> e wrapGenericProducerIntoTransducer :: forall x. (forall y r. ProducerComponent IO y r -> TransducerComponent IO x y) -> TypeTag x -> Expression -> Expression wrapGenericProducerIntoTransducer combinator inputTag expression = case compile inputTag expression of Compiled (ProducerTag outTag) p -> Compiled (TransducerTag inputTag outTag) (combinator p) Compiled tag _ -> TypeError tag (ProducerTag inputTag) expression e@TypeError{} -> e combineSplitters :: forall x c. (forall x b1 b2. SplitterComponent IO x b1 -> SplitterComponent IO x b2 -> SplitterComponent IO x (c b1 b2)) -> TypeTag x -> (forall b1 b2. TypeTag b1 -> TypeTag b2 -> TypeTag (c b1 b2)) -> Expression -> Expression -> Expression combineSplitters combinator inputTag constructor left right = case (compile inputTag left, compile inputTag right) of (Compiled tag1@(SplitterTag x1 b1) s1, Compiled tag2@(SplitterTag x2 b2) s2) -> tryComponentCast tag2 (SplitterTag x1 b2) s2 right $ \s2'-> Compiled (SplitterTag x1 (constructor b1 b2)) (combinator s1 s2') (e@TypeError{}, _) -> e (_, e@TypeError{}) -> e (Compiled tag1 _, Compiled tag2@SplitterTag{} _) -> TypeError tag1 tag2 left (Compiled tag1@SplitterTag{} _, Compiled tag2 _) -> TypeError tag2 tag1 right combineSplittersOfSameType :: forall x. (forall x b. SplitterComponent IO x b -> SplitterComponent IO x b -> SplitterComponent IO x b) -> TypeTag x -> Expression -> Expression -> Expression combineSplittersOfSameType combinator inputTag left right = case (compile inputTag left, compile inputTag right) of (Compiled tag1@SplitterTag{} s1, Compiled tag2@SplitterTag{} s2) -> tryComponentCast tag2 tag1 s2 right (\s2'-> Compiled tag1 (combinator s1 s2')) (e@TypeError{}, _) -> e (_, e@TypeError{}) -> e (Compiled tag1 _, Compiled tag2@SplitterTag{} _) -> TypeError tag1 tag2 left (Compiled tag1@SplitterTag{} _, Compiled tag2 _) -> TypeError tag2 tag1 right combineSplittersOfDifferentTypes :: forall x1 x2. (forall b1 b2. SplitterComponent IO x1 b1 -> SplitterComponent IO x2 b2 -> SplitterComponent IO x1 b1) -> TypeTag x1 -> TypeTag x2 -> Expression -> Expression -> Expression combineSplittersOfDifferentTypes combinator tag1 tag2 left right = case (compile tag1 left, compile tag2 right) of (Compiled tag1'@(SplitterTag _ b1) s1, Compiled tag2'@(SplitterTag _ b2) s2) -> tryComponentCast tag1' (SplitterTag tag1 b1) s1 left $ \s1'-> tryComponentCast tag2' (SplitterTag tag2 b2) s2 right $ \s2'-> Compiled (SplitterTag tag1 b1) (combinator s1' s2') (e@TypeError{}, _) -> e (_, e@TypeError{}) -> e (Compiled tag1 _, Compiled tag2@SplitterTag{} _) -> TypeError tag1 tag2 left (Compiled tag1@SplitterTag{} _, Compiled tag2 _) -> TypeError tag2 tag1 right combineTransducersOfSameType :: forall x. (forall x y. TransducerComponent IO x y -> TransducerComponent IO x y -> TransducerComponent IO x y) -> TypeTag x -> Expression -> Expression -> Expression combineTransducersOfSameType combinator inputTag left right = case (compile inputTag left, compile inputTag right) of (Compiled tag1@TransducerTag{} t1, Compiled tag2@TransducerTag{} t2) -> tryComponentCast tag2 tag1 t2 right (\t2'-> Compiled tag1 (combinator t1 t2')) combineSplitterAndBranches :: forall x. (forall x b cc. Branching cc IO x [x] => SplitterComponent IO x b -> Component cc -> Component cc -> Component cc) -> TypeTag x -> Expression -> Expression -> Expression -> Expression combineSplitterAndBranches combinator inputTag splitter true false = case (compile inputTag splitter, compile inputTag true, compile inputTag false) of (Compiled (SplitterTag tag1 _) s, Compiled tag2@ConsumerTag{} t, Compiled tag3@ConsumerTag{} f) -> tryComponentCast tag2 (ConsumerTag tag1) t true $ \t'-> tryComponentCast tag3 (ConsumerTag tag1) f false $ \f'-> Compiled (ConsumerTag tag1) (combinator s t' f') (Compiled tag1@SplitterTag{} s, Compiled tag2@SplitterTag{} t, Compiled tag3@SplitterTag{} f) -> tryComponentCast tag2 tag1 t true $ \t'-> tryComponentCast tag3 tag1 f false $ \f'-> Compiled tag1 (combinator s t' f') (Compiled (SplitterTag tag1 _) s, Compiled tag2@(TransducerTag tag2a tag2b) t, Compiled tag3@TransducerTag{} f) -> let tag2' = TransducerTag tag1 tag2b in tryComponentCast tag2 tag2' t true $ \t'-> tryComponentCast tag3 tag2' f false $ \f'-> Compiled tag2' (combinator s t' f') (Compiled (SplitterTag tag1 _) s, Compiled tag2@(TransducerTag tag2a tag2b) t, Compiled tag3@ConsumerTag{} f) -> let tag2' = TransducerTag tag1 tag2b in tryComponentCast tag2 tag2' t true $ \t'-> tryComponentCast tag3 (ConsumerTag tag1) f false $ \f'-> Compiled tag2' (combinator s t' (consumeBy f')) (Compiled (SplitterTag tag1 _) s, Compiled tag2@ConsumerTag{} t, Compiled tag3@(TransducerTag tag3a tag3b) f) -> let tag3' = TransducerTag tag1 tag3b in tryComponentCast tag2 (ConsumerTag tag1) t true $ \t'-> tryComponentCast tag3 tag3' f false $ \f'-> Compiled tag3' (combinator s (consumeBy t') f') (Compiled (SplitterTag tag1 _) s, Compiled tag2@(TransducerTag tag2a tag2b) t, Compiled tag3@ProducerTag{} f) -> let tag2' = TransducerTag tag1 tag2b in tryComponentCast tag2 tag2' t true $ \t'-> tryComponentCast tag3 (ProducerTag tag2b) f false $ \f'-> Compiled tag2' (combinator s t' (substitute f')) (Compiled (SplitterTag tag1 _) s, Compiled tag2@ProducerTag{} t, Compiled tag3@(TransducerTag tag3a tag3b) f) -> let tag3' = TransducerTag tag1 tag3b in tryComponentCast tag2 (ProducerTag tag3b) t true $ \t'-> tryComponentCast tag3 tag3' f false $ \f'-> Compiled tag3' (combinator s (substitute t') f') (Compiled (SplitterTag tag1 _) s, Compiled tag2@(ConsumerTag tag2a) t, Compiled tag3@(ProducerTag tag3a) f) -> tryComponentCast tag2 (ConsumerTag tag1) t true $ \t'-> Compiled (TransducerTag tag1 tag3a) (combinator s (consumeBy t') (substitute f)) (Compiled (SplitterTag tag1 _) s, Compiled tag2@(ProducerTag tag2a) t, Compiled tag3@(ConsumerTag tag3a) f) -> tryComponentCast tag3 (ConsumerTag tag1) f true $ \f'-> Compiled (TransducerTag tag1 tag2a) (combinator s (substitute t) (consumeBy f')) (e@TypeError{}, _, _) -> e (_, e@TypeError{}, _) -> e (_, _, e@TypeError{}) -> e (Compiled SplitterTag{} _, Compiled tag _, _) -> TypeError tag (TransducerTag inputTag AnyTag) true (Compiled SplitterTag{} _, _, Compiled tag _) -> TypeError tag (TransducerTag inputTag AnyTag) false (Compiled tag _, _, _) -> TypeError tag (SplitterTag inputTag AnyTag) splitter parseExpression :: String -> Either Int (Expression, [Char], Int) parseExpression s = case Parsec.parse partialExpressionParser "" s of Left error -> Left (sourceLine (errorPos error)) Right result -> Right result lexer = (makeTokenParser language) {stringLiteral= stringLexemeParser} language = emptyDef{commentLine= "#", identLetter= satisfy (\char-> isAlphaNum char || char == '-' || char == '_'), reservedOpNames= ["...", ">!", ">", ">&", ">,", ">>", ">|", "|", "||", ";", "&"], reservedNames= ["append", "concatenate", "count", "digits", "do", "else", "end", "error", "exit", "everything", "first", "foreach", "group", "having", "having-only", "id", "if", "in", "last", "letters", "line", "marked", "nested", "nothing", "prefix", "prepend", "select", "show", "stdin", "substitute", "substring", "suffix", "suppress", "then", "unparse", "uppercase", "while", "whitespace", "XML.parse-tags", "XML.serialize-tags", "XML.element", "XML.element-content", "XML.element-having-tag", "XML.element-name", "XML.having-text"]} reservedTokens = reservedOpNames language ++ reservedNames language partialExpressionParser :: Parsec.Parser (Expression, [Char], Int) partialExpressionParser = do whiteSpace lexer t <- expressionParser whiteSpace lexer rest <- getInput pos <- getPosition return (t, rest, sourceLine pos - 1) expressionParser :: Parsec.Parser Expression expressionParser = do head <- stepParser whiteSpace lexer (do tail <- many1 (try (symbol lexer ";" >> stepParser)) return (foldr1 Sequence (head:tail)) <|> do tail <- many1 (try (symbol lexer "&" >> stepParser)) return (foldr1 Join (head:tail)) <|> return head ) stepParser :: Parsec.Parser Expression stepParser = do head <- termParser whiteSpace lexer tail <- many (try (char '|' >> whiteSpace lexer >> termParser)) return (foldr1 Pipe (head:tail)) termParser :: Parsec.Parser Expression termParser = do first <- prefixTermParser whiteSpace lexer option first (liftM (foldr1 FollowedBy . (first :)) (many1 $ try (symbol lexer ">," >> prefixTermParser)) <|> liftM (foldr1 Or . (first :)) (many1 $ try (symbol lexer ">|" >> prefixTermParser)) <|> liftM (foldr1 And . (first :)) (many1 $ try (symbol lexer ">&" >> prefixTermParser)) <|> liftM (foldr1 ZipWithOr . (first :)) (many1 $ try (symbol lexer "||" >> prefixTermParser)) <|> liftM (foldr1 ZipWithAnd . (first :)) (many1 $ try (symbol lexer "&&" >> prefixTermParser)) <|> liftM (Between first) (try (symbol lexer "..." >> prefixTermParser)) <|> liftM (Having first) (try (symbol lexer "having" >> prefixTermParser)) <|> liftM (HavingOnly first) (try (symbol lexer "having-only" >> prefixTermParser)) <|> liftM (XMLHavingOnlyText first) (try (symbol lexer "XML.having-only-text" >> prefixTermParser)) <|> liftM (XMLHavingText first) (try (symbol lexer "XML.having-text" >> prefixTermParser)) ) prefixTermParser :: Parsec.Parser Expression prefixTermParser = try (symbol lexer ">!" >> liftM Not prefixTermParser) <|> try (symbol lexer "prefix" >> liftM Prefix prefixTermParser) <|> try (symbol lexer "suffix" >> liftM Suffix prefixTermParser) <|> try (symbol lexer "prepend" >> liftM Prepend prefixTermParser) <|> try (symbol lexer "append" >> liftM Append prefixTermParser) <|> try (symbol lexer "substitute" >> liftM Substitute prefixTermParser) <|> try (symbol lexer "first" >> liftM First prefixTermParser) <|> try (symbol lexer "last" >> liftM Last prefixTermParser) <|> try (symbol lexer "start-of" >> liftM StartOf prefixTermParser) <|> try (symbol lexer "end-of" >> liftM EndOf prefixTermParser) <|> try (symbol lexer "select" >> liftM Select prefixTermParser) <|> try (symbol lexer "XML.element-having-tag" >> liftM XMLElementHavingTag prefixTermParser) <|> primaryParser primaryParser :: Parsec.Parser Expression primaryParser = try (do char '(' whiteSpace lexer expression <- expressionParser whiteSpace lexer char ')' return expression) <|> try (symbol lexer "exit" >> return Exit) <|> try (nativeSourceParser "cat") <|> try (nativeSourceParser "ls") <|> try (do symbol lexer "echo" string <- nativeCommand True return (FromList string)) <|> try (symbol lexer "stdin" >> return StdInProducer) <|> try (do symbol lexer ">>" file <- parameterParser True return (FileAppend file)) <|> try (do symbol lexer ">" file <- parameterParser True return (FileConsumer file)) <|> try (symbol lexer "suppress" >> return Suppress) <|> try (do symbol lexer "error" message <- (try (parameterParser True) <|> return "Error sink reached!") return (ErrorConsumer message)) <|> try (symbol lexer "concatenate" >> return Concatenate) <|> try (symbol lexer "count" >> return Count) <|> try (symbol lexer "digits" >> return DigitSplitter) <|> try (symbol lexer "everything" >> return EverythingSplitter) <|> try (symbol lexer "execute" >> return ExecuteTransducer) <|> try (symbol lexer "group" >> return Group) <|> try (symbol lexer "id" >> return IdentityTransducer) <|> try (symbol lexer "letters" >> return LetterSplitter) <|> try (symbol lexer "line" >> return LineSplitter) <|> try (symbol lexer "marked" >> return MarkedSplitter) <|> try (symbol lexer "nothing" >> return NothingSplitter) <|> try (symbol lexer "one" >> return OneSplitter) <|> try (symbol lexer "show" >> return ShowTransducer) <|> try (symbol lexer "uppercase" >> return Uppercase) <|> try (symbol lexer "unparse" >> return Unparse) <|> try (symbol lexer "whitespace" >> return WhitespaceSplitter) <|> try (symbol lexer "XML.attribute-name" >> return XMLAttributeName) <|> try (symbol lexer "XML.attribute-value" >> return XMLAttributeValue) <|> try (symbol lexer "XML.attribute" >> return XMLAttribute) <|> try (symbol lexer "XML.element-content" >> return XMLElementContent) <|> try (symbol lexer "XML.element-name" >> return XMLElementName) <|> try (symbol lexer "XML.element" >> return XMLElement) <|> try (symbol lexer "XML.parse" >> return XMLTokenParser) <|> try (do symbol lexer "substring" part <- parameterParser True return (SubstringSplitter part)) <|> try (do symbol lexer "if" splitter <- expressionParser whiteSpace lexer symbol lexer "then" true <- expressionParser false <- (try (symbol lexer "else" >> expressionParser) <|> return Suppress) symbol lexer "end" option "" (symbol lexer "if") return (If splitter true false)) <|> try (do symbol lexer "nested" core <- expressionParser whiteSpace lexer symbol lexer "in" shell <- expressionParser whiteSpace lexer symbol lexer "end" option "" (symbol lexer "nested") return (Nested core shell)) <|> try (do symbol lexer "while" test <- expressionParser whiteSpace lexer symbol lexer "do" body <- expressionParser whiteSpace lexer symbol lexer "end" option "" (symbol lexer "while") return (While test body)) <|> try (do symbol lexer "foreach" splitter <- expressionParser whiteSpace lexer symbol lexer "then" trueBranch <- expressionParser whiteSpace lexer falseBranch <- (try (symbol lexer "else" >> expressionParser) <|> return IdentityTransducer) whiteSpace lexer symbol lexer "end" option "" (symbol lexer "foreach") return (ForEach splitter trueBranch falseBranch)) <|> liftM NativeCommand (nativeCommand False) nativeSourceParser :: String -> Parsec.Parser Expression nativeSourceParser command = do symbol lexer command params <- nativeCommand False return (NativeCommand (command ++ " " ++ params)) nativeCommand :: Bool -> Parsec.Parser String nativeCommand normalize = do parts <- try (lexeme lexer (parameterParser normalize) `manyTill` ((eof >> return "") <|> lookAhead (choice (map (try . symbol lexer) reservedTokens)))) return (concat (intersperse " " parts)) where manyTill :: GenParser tok st a -> GenParser tok st end -> GenParser tok st [a] manyTill p end = scan where scan = do{ end; return [] } <|> do{ x <- p; xs <- scan; return (x:xs) } <|> return [] parameterParser :: Bool -> Parsec.Parser String parameterParser normalize = do chars <- many (noneOf " \t\n'\"`\\()[]{}<>|&;") (do try (string "\\n") rest <- option "" (parameterParser normalize) return (chars ++ '\n' : rest) <|> do try (string "\\t") rest <- option "" (parameterParser normalize) return (chars ++ '\t' : rest) <|> do next <- escape rest <- option "" (parameterParser normalize) return (chars ++ next : rest) <|> do quote <- oneOf "'\"`" string <- many (try (noneOf (quote : "\\")) <|> escape) char quote rest <- option "" (parameterParser normalize) return (chars ++ (if normalize then string else quote : (string ++ [quote])) ++ rest) <|> do try (char '(') whiteSpace lexer inside <- nativeCommand normalize char ')' rest <- option "" (parameterParser normalize) return (chars ++ '(' : inside ++ ')' : rest) <|> do try (char '[') whiteSpace lexer inside <- nativeCommand normalize char ']' rest <- parameterParser normalize return (chars ++ '[' : inside ++ ']' : rest) <|> do try (char '{') whiteSpace lexer inside <- nativeCommand normalize char '}' rest <- option "" (parameterParser normalize) return (chars ++ '{' : inside ++ '}' : rest) <|> do when (null chars) parserZero return chars) escape :: Parsec.Parser Char escape = do char '\\' escaped <- anyChar return (case escaped of 'n' -> '\n' 'r' -> '\r' 't' -> '\t' _ -> escaped) stringLexemeParser :: Parsec.Parser String stringLexemeParser = do terminator <- oneOf "'\"`" content <- many (try (noneOf ['\\', terminator] <|> (string "\\t" >> return '\t') <|> (string "\\n" >> return '\n') <|> (char '\\' >> anyChar))) char terminator return (terminator : (content ++ [terminator]))