{-# LANGUAGE BangPatterns, CPP, FlexibleContexts, InstanceSigs, RankNTypes, ScopedTypeVariables, TypeFamilies, UndecidableInstances #-} -- | Continuation-passing parser for Parsing Expression Grammars that keeps track of the parsed prefix length module Text.Grampa.PEG.Continued.Measured (Parser(..), Result(..), alt) where import Control.Applicative (Applicative(..), Alternative(..), liftA2) import Control.Monad (Monad(..), MonadPlus(..)) #if MIN_VERSION_base(4,13,0) import Control.Monad (MonadFail(fail)) #endif import Data.Functor.Compose (Compose(..)) import Data.Kind (Type) import Data.Semigroup (Semigroup(..)) import Data.Monoid (Monoid(mappend, mempty)) import Data.Monoid.Factorial(FactorialMonoid) import Data.Monoid.Textual(TextualMonoid) import Data.String (fromString) import Debug.Trace (trace) import Witherable (Filterable(mapMaybe)) import Data.Semigroup.Cancellative (LeftReductive(stripPrefix)) import qualified Data.Monoid.Factorial as Factorial import qualified Data.Monoid.Null as Null import qualified Data.Monoid.Textual as Textual import qualified Rank2 import qualified Text.Parser.Char as Char import Text.Parser.Char (CharParsing) import Text.Parser.Combinators (Parsing(..)) import Text.Parser.LookAhead (LookAheadParsing(..)) import Text.Parser.Input.Position (fromEnd) import Text.Grampa.Class (CommittedParsing(..), DeterministicParsing(..), InputParsing(..), InputCharParsing(..), ConsumedInputParsing(..), MultiParsing(..), ParseResults, ParseFailure(..), FailureDescription(..), Pos) import Text.Grampa.Internal (TraceableParsing(..), emptyFailure, erroneous, expected, expectedInput, replaceExpected) import Text.Grampa.PEG.Continued (Result(..)) -- | Parser type for Parsing Expression Grammars that uses a continuation-passing algorithm and keeps track of the -- parsed prefix length, fast for grammars in LL(1) class but with potentially exponential performance for longer -- ambiguous prefixes. newtype Parser (g :: (Type -> Type) -> Type) s r = Parser{applyParser :: forall x. s -> (r -> Int -> s -> x) -> (ParseFailure Pos s -> x) -> x} instance Functor (Parser g s) where fmap f (Parser p) = Parser (\input success-> p input (success . f)) {-# INLINABLE fmap #-} instance Applicative (Parser g s) where pure a = Parser (\input success _-> success a 0 input) (<*>) :: forall a b. Parser g s (a -> b) -> Parser g s a -> Parser g s b Parser p <*> Parser q = Parser r where r :: forall x. s -> (b -> Int -> s -> x) -> (ParseFailure Pos s -> x) -> x r rest success failure = p rest (\f len rest'-> q rest' (\a len'-> success (f a) $! len + len') failure) failure {-# INLINABLE (<*>) #-} instance (FactorialMonoid s, Ord s) => Alternative (Parser g s) where empty = Parser (\rest _ failure-> failure $ emptyFailure $ fromEnd $ Factorial.length rest) (<|>) = alt -- | A named and unconstrained version of the '<|>' operator alt :: forall g s a. Ord s => Parser g s a -> Parser g s a -> Parser g s a Parser p `alt` Parser q = Parser r where r :: forall x. s -> (a -> Int -> s -> x) -> (ParseFailure Pos s -> x) -> x r rest success failure = p rest success (\f1-> q rest success $ \f2 -> failure (f1 <> f2)) instance Factorial.FactorialMonoid s => Filterable (Parser g s) where mapMaybe :: forall a b. (a -> Maybe b) -> Parser g s a -> Parser g s b mapMaybe f (Parser p) = Parser q where q :: forall x. s -> (b -> Int -> s -> x) -> (ParseFailure Pos s -> x) -> x q rest success failure = p rest (maybe filterFailure success . f) failure where filterFailure _ _ = failure (expected (fromEnd $ Factorial.length rest) "filter") {-# INLINABLE mapMaybe #-} #if MIN_VERSION_base(4,13,0) instance Monad (Parser g s) where #else instance Factorial.FactorialMonoid s => Monad (Parser g s) where #endif return = pure (>>=) :: forall a b. Parser g s a -> (a -> Parser g s b) -> Parser g s b Parser p >>= f = Parser r where r :: forall x. s -> (b -> Int -> s -> x) -> (ParseFailure Pos s -> x) -> x r rest success failure = p rest (\a len rest'-> applyParser (f a) rest' (\b len'-> success b $! len + len') failure) failure #if MIN_VERSION_base(4,13,0) instance FactorialMonoid s => MonadFail (Parser g s) where #endif fail msg = Parser (\rest _ failure-> failure $ expected (fromEnd $ Factorial.length rest) msg) instance (FactorialMonoid s, Ord s) => MonadPlus (Parser g s) where mzero = empty mplus = (<|>) instance Semigroup x => Semigroup (Parser g s x) where (<>) = liftA2 (<>) instance Monoid x => Monoid (Parser g s x) where mempty = pure mempty mappend = (<>) instance (FactorialMonoid s, Ord s) => Parsing (Parser g s) where try :: forall a. Parser g s a -> Parser g s a try (Parser p) = Parser q where q :: forall x. s -> (a -> Int -> s -> x) -> (ParseFailure Pos s -> x) -> x q input success failure = p input success (const $ failure $ emptyFailure $ fromEnd $ Factorial.length input) () :: forall a. Parser g s a -> String -> Parser g s a Parser p msg = Parser q where q :: forall x. s -> (a -> Int -> s -> x) -> (ParseFailure Pos s -> x) -> x q input success failure = p input success (failure . replaceExpected (fromEnd $ Factorial.length input) msg) eof = Parser p where p rest success failure | Null.null rest = success () 0 rest | otherwise = failure (expected (fromEnd $ Factorial.length rest) "end of input") unexpected msg = Parser (\t _ failure -> failure $ erroneous (fromEnd $ Factorial.length t) msg) notFollowedBy (Parser p) = Parser q where q :: forall x. s -> (() -> Int -> s -> x) -> (ParseFailure Pos s -> x) -> x q input success failure = p input success' failure' where success' _ _ _ = failure (expected (fromEnd $ Factorial.length input) "notFollowedBy") failure' _ = success () 0 input instance (FactorialMonoid s, Ord s) => CommittedParsing (Parser g s) where type CommittedResults (Parser g s) = ParseResults s commit :: forall a. Parser g s a -> Parser g s (ParseResults s a) commit (Parser p) = Parser q where q :: forall x. s -> (ParseResults s a -> Int -> s -> x) -> (ParseFailure Pos s -> x) -> x q input success _failure = p input (success . Right) failure' where failure' f = success (Left f) 0 input admit :: forall a. Parser g s (ParseResults s a) -> Parser g s a admit (Parser p) = Parser q where q :: forall x. s -> (a -> Int -> s -> x) -> (ParseFailure Pos s -> x) -> x q input success failure = p input success' failure where success' (Left f) _len _rest = failure f success' (Right a) len rest = success a len rest -- | Every PEG parser is deterministic all the time. instance (FactorialMonoid s, Ord s) => DeterministicParsing (Parser g s) where (<<|>) = alt takeSome = some takeMany = many skipAll = skipMany instance (FactorialMonoid s, Ord s) => LookAheadParsing (Parser g s) where lookAhead :: forall a. Parser g s a -> Parser g s a lookAhead (Parser p) = Parser q where q :: forall x. s -> (a -> Int -> s -> x) -> (ParseFailure Pos s -> x) -> x q input success failure = p input success' failure' where success' a _ _ = success a 0 input failure' f = failure f instance (Ord s, Show s, TextualMonoid s) => CharParsing (Parser g s) where satisfy predicate = Parser p where p :: forall x. s -> (Char -> Int -> s -> x) -> (ParseFailure Pos s -> x) -> x p rest success failure = case Textual.splitCharacterPrefix rest of Just (first, suffix) | predicate first -> success first 1 suffix _ -> failure (expected (fromEnd $ Factorial.length rest) "Char.satisfy") string s = Textual.toString (error "unexpected non-character") <$> string (fromString s) text t = (fromString . Textual.toString (error "unexpected non-character")) <$> string (Textual.fromText t) instance (LeftReductive s, FactorialMonoid s, Ord s) => InputParsing (Parser g s) where type ParserInput (Parser g s) = s getInput = Parser p where p rest success _ = success rest 0 rest anyToken = Parser p where p rest success failure = case Factorial.splitPrimePrefix rest of Just (first, suffix) -> success first 1 suffix _ -> failure (expected (fromEnd $ Factorial.length rest) "anyToken") satisfy predicate = Parser p where p :: forall x. s -> (s -> Int -> s -> x) -> (ParseFailure Pos s -> x) -> x p rest success failure = case Factorial.splitPrimePrefix rest of Just (first, suffix) | predicate first -> success first 1 suffix _ -> failure (expected (fromEnd $ Factorial.length rest) "satisfy") notSatisfy predicate = Parser p where p :: forall x. s -> (() -> Int -> s -> x) -> (ParseFailure Pos s -> x) -> x p rest success failure = case Factorial.splitPrimePrefix rest of Just (first, _) | predicate first -> failure (expected (fromEnd $ Factorial.length rest) "notSatisfy") _ -> success () 0 rest scan :: forall state. state -> (state -> s -> Maybe state) -> Parser g s s scan s0 f = Parser (p s0) where p :: forall x. state -> s -> (s -> Int -> s -> x) -> (ParseFailure Pos s -> x) -> x p s rest success _ = success prefix len suffix where (prefix, suffix, _) = Factorial.spanMaybe' s f rest !len = Factorial.length prefix take n = Parser p where p :: forall x. s -> (s -> Int -> s -> x) -> (ParseFailure Pos s -> x) -> x p rest success _ | (prefix, suffix) <- Factorial.splitAt n rest, len <- Factorial.length prefix, len == n = success prefix len suffix p rest _ failure = failure (expected (fromEnd $ Factorial.length rest) $ "take" ++ show n) takeWhile predicate = Parser p where p :: forall x. s -> (s -> Int -> s -> x) -> (ParseFailure Pos s -> x) -> x p rest success _ | (prefix, suffix) <- Factorial.span predicate rest, !len <- Factorial.length prefix = success prefix len suffix takeWhile1 predicate = Parser p where p :: forall x. s -> (s -> Int -> s -> x) -> (ParseFailure Pos s -> x) -> x p rest success failure | (prefix, suffix) <- Factorial.span predicate rest, !len <- Factorial.length prefix = if len == 0 then failure (expected (fromEnd $ Factorial.length rest) "takeWhile1") else success prefix len suffix string s = Parser p where p :: forall x. s -> (s -> Int -> s -> x) -> (ParseFailure Pos s -> x) -> x p s' success failure | Just suffix <- stripPrefix s s', !len <- Factorial.length s = success s len suffix | otherwise = failure (expectedInput (fromEnd $ Factorial.length s') s) {-# INLINABLE string #-} instance (LeftReductive s, FactorialMonoid s, Ord s) => ConsumedInputParsing (Parser g s) where match :: forall a. Parser g s a -> Parser g s (s, a) match (Parser p) = Parser q where q :: forall x. s -> ((s, a) -> Int -> s -> x) -> (ParseFailure Pos s -> x) -> x q rest success failure = p rest success' failure where success' r !len suffix = success (Factorial.take len rest, r) len suffix instance (InputParsing (Parser g s), FactorialMonoid s) => TraceableParsing (Parser g s) where traceInput :: forall a. (s -> String) -> Parser g s a -> Parser g s a traceInput description (Parser p) = Parser q where q :: forall x. s -> (a -> Int -> s -> x) -> (ParseFailure Pos s -> x) -> x q rest success failure = traceWith "Parsing " (p rest success' failure') where traceWith prefix = trace (prefix <> description rest) failure' f = traceWith "Failed " (failure f) success' r !len suffix = trace ("Parsed " <> description (Factorial.take len rest)) (success r len suffix) instance (Ord s, Show s, TextualMonoid s) => InputCharParsing (Parser g s) where satisfyCharInput predicate = Parser p where p :: forall x. s -> (s -> Int -> s -> x) -> (ParseFailure Pos s -> x) -> x p rest success failure = case Textual.splitCharacterPrefix rest of Just (first, suffix) | predicate first -> success (Factorial.primePrefix rest) 1 suffix _ -> failure (expected (fromEnd $ Factorial.length rest) "satisfyCharInput") notSatisfyChar predicate = Parser p where p :: forall x. s -> (() -> Int -> s -> x) -> (ParseFailure Pos s -> x) -> x p rest success failure = case Textual.characterPrefix rest of Just first | predicate first -> failure (expected (fromEnd $ Factorial.length rest) "notSatisfyChar") _ -> success () 0 rest scanChars :: forall state. state -> (state -> Char -> Maybe state) -> Parser g s s scanChars s0 f = Parser (p s0) where p :: forall x. state -> s -> (s -> Int -> s -> x) -> (ParseFailure Pos s -> x) -> x p s rest success _ = success prefix len suffix where (prefix, suffix, _) = Textual.spanMaybe_' s f rest !len = Factorial.length prefix takeCharsWhile predicate = Parser p where p :: forall x. s -> (s -> Int -> s -> x) -> (ParseFailure Pos s -> x) -> x p rest success _ | (prefix, suffix) <- Textual.span_ False predicate rest, !len <- Factorial.length prefix = success prefix len suffix takeCharsWhile1 predicate = Parser p where p :: forall x. s -> (s -> Int -> s -> x) -> (ParseFailure Pos s -> x) -> x p rest success failure | Null.null prefix = failure (expected (fromEnd $ Factorial.length rest) "takeCharsWhile1") | otherwise = success prefix len suffix where (prefix, suffix) = Textual.span_ False predicate rest !len = Factorial.length prefix -- | Continuation-passing PEG parser that keeps track of the parsed prefix length -- -- @ -- 'parseComplete' :: ("Rank2".'Rank2.Functor' g, 'FactorialMonoid' s) => -- g (Continued.'Parser' g s) -> s -> g ('ParseResults' s) -- @ instance (LeftReductive s, FactorialMonoid s, Ord s) => MultiParsing (Parser g s) where type ResultFunctor (Parser g s) = ParseResults s -- | Returns an input prefix parse paired with the remaining input suffix. parsePrefix g input = Rank2.fmap (Compose . (\p-> applyParser p input (\a _ rest-> Right (rest, a)) Left)) g parseComplete g input = Rank2.fmap (\p-> applyParser p input (const . const . Right) Left) (Rank2.fmap (<* eof) g)