{-# LANGUAGE ExistentialQuantification, RankNTypes #-} {-# LANGUAGE ViewPatterns #-} {-# LANGUAGE CPP #-} -- | -- -- This module builds on module "Control.Foldl", adding stateful transducers -- and grouping operations. module Control.Foldl.Transduce ( -- * Transducer types Transduction , Transduction' , Transducer(..) , TransductionM , TransductionM' , TransducerM(..) -- * Applying transducers , transduce , transduce' , transduceM , transduceM' -- * Working with groups , groups , groups' , groupsM , groupsM' , folds , folds' , foldsM , foldsM' -- * Transducers , surround , surroundIO -- * Splitters , chunksOf -- * Transducer utilities , _generalize , _simplify , foldify , foldifyM , hoistTransducer , hoistFold -- * Re-exports -- $reexports , module Data.Functor.Extend , module Control.Foldl ) where import Data.Bifunctor import Data.Monoid import Data.Functor.Identity import Data.Functor.Extend import Data.Foldable (Foldable,foldlM,foldl',toList) import Control.Applicative import Control.Monad import Control.Monad.IO.Class import Control.Comonad import Control.Foldl (Fold(..),FoldM(..)) import qualified Control.Foldl as L import Control.Foldl.Transduce.Internal (Pair(..),Trio(..),fstOf3) {- $setup >>> import qualified Control.Foldl as L >>> import Control.Foldl.Transduce >>> import Control.Applicative -} ------------------------------------------------------------------------------ #if !(MIN_VERSION_foldl(1,1,2)) instance Comonad (Fold a) where extract (Fold _ begin done) = done begin {-# INLINABLE extract #-} duplicate (Fold step begin done) = Fold step begin (\x -> Fold step x done) {-# INLINABLE duplicate #-} #endif instance Extend (Fold a) where duplicated f = duplicate f {-# INLINABLE duplicated #-} instance Monad m => Extend (FoldM m a) where duplicated (FoldM step begin done) = FoldM step begin (\x -> return $! FoldM step (return x) done) {-# INLINABLE duplicated #-} ------------------------------------------------------------------------------ {-| A (possibly stateful) transformation on the inputs of a 'Fold'. Functions constructed with combinators like 'L.premap' or 'L.handles' from "Control.Foldl" also typecheck as a 'Transduction'. -} type Transduction a b = forall x. Fold b x -> Fold a x {-| A more general from of 'Transduction' that adds new information to the return value of the 'Fold'. -} type Transduction' a b r = forall x. Fold b x -> Fold a (r,x) {-| A stateful process that transforms a stream of inputs into a stream of outputs, and may optionally demarcate groups in the stream of outputs. Composed of a step function, an initial state, and a extraction function. The step function returns a triplet of: * The new internal state. * Outputs that continues the last segment detected in the previous step. * A list of lists containing outputs for segments detected in the current step. If the list is empty, that means no splitting has taken place in the current step. 'Transducer's that do not perform grouping never return anything other than @[]@ here. In effect, they treat the whole stream as a single group. The extraction function returns the 'Transducer's own result value, as well as any pending outputs. -} data Transducer i o r = forall x. Transducer (x -> i -> (x,[o],[[o]])) x (x -> (r,[o])) instance Functor (Transducer i o) where fmap f (Transducer step begin done) = Transducer step begin (first f . done) instance Bifunctor (Transducer i) where first f (Transducer step begin done) = Transducer (fmap (\(x,xs,xss) -> (x,map f xs, map (map f) xss)) . step) begin (fmap (fmap f) . done) second f w = fmap f w {-| Like 'Transduction', but works on monadic 'Fold's. -} type TransductionM m a b = forall x. Monad m => FoldM m b x -> FoldM m a x {-| Like 'Transduction'', but works on monadic 'Fold's. -} type TransductionM' m a b r = forall x. FoldM m b x -> FoldM m a (r,x) {-| Like 'Transducer', but monadic. -} data TransducerM m i o r = forall x. TransducerM (x -> i -> m (x,[o],[[o]])) (m x) (x -> m (r,[o])) instance Monad m => Functor (TransducerM m i o) where fmap f (TransducerM step begin done) = TransducerM step begin done' where done' x = do (r,os) <- done x let r' = f r return $! (r' `seq` (r', os)) instance (Functor m, Monad m) => Bifunctor (TransducerM m i) where first f (TransducerM step begin done) = TransducerM (fmap (fmap (\(x,xs,xss) -> (x,map f xs, map (map f) xss))) . step) begin (fmap (fmap (fmap f)) . done) second f w = fmap f w {-| Apply a 'Transducer' to a 'Fold', discarding the return value of the 'Transducer'. >>> L.fold (transduce (Transducer (\_ i -> ((),[i],[])) () (\_ -> ('r',[]))) L.list) [1..7] [1,2,3,4,5,6,7] -} transduce :: Transducer i o r -> Transduction i o transduce t = fmap snd . (transduce' t) {-| Generalized version of 'transduce' that preserves the return value of the 'Transducer'. >>> L.fold (transduce' (Transducer (\_ i -> ((),[i],[])) () (\_ -> ('r',[]))) L.list) [1..7] ('r',[1,2,3,4,5,6,7]) -} transduce' :: Transducer i o x -> Transduction' i o x transduce' (Transducer wstep wstate wdone) (Fold fstep fstate fdone) = Fold step (Pair wstate fstate) done where step (Pair ws fs) i = let (ws',os,oss) = wstep ws i in Pair ws' (foldl' fstep fs (os ++ mconcat oss)) done (Pair ws fs) = let (wr,os) = wdone ws in (,) wr (fdone (foldl' fstep fs os)) {-| Like 'transduce', but works on monadic 'Fold's. -} transduceM :: Monad m => TransducerM m i o r -> TransductionM m i o transduceM t = fmap snd . (transduceM' t) {-| Like 'transduce'', but works on monadic 'Fold's. -} transduceM' :: Monad m => TransducerM m i o x -> TransductionM' m i o x transduceM' (TransducerM wstep wstate wdone) (FoldM fstep fstate fdone) = FoldM step (liftM2 Pair wstate fstate) done where step (Pair ws fs) i = do (ws',os,oss) <- wstep ws i fs' <- foldlM fstep fs (os ++ mconcat oss) return $! Pair ws' fs' done (Pair ws fs) = do (wr,os) <- wdone ws fr <- fdone =<< foldlM fstep fs os return $! (,) wr fr ------------------------------------------------------------------------------ data SurroundState = PrefixAdded | PrefixPending {-| Adds a prefix and a suffix to the stream arriving into a 'Fold'. >>> L.fold (transduce (surround "prefix" "suffix") L.list) "middle" "prefixmiddlesuffix" -} surround :: (Foldable p, Foldable s) => p a -> s a -> Transducer a a () surround (toList -> ps) (toList -> ss) = Transducer step PrefixPending done where step PrefixPending a = (PrefixAdded, ps ++ [a],[]) step PrefixAdded a = (PrefixAdded, [a],[]) done PrefixPending = ((), ps ++ ss) done PrefixAdded = ((), ss) {-| Like 'surround', but the prefix and suffix are obtained using a 'IO' action. >>> L.foldM (transduceM (surroundIO (return "prefix") (return "suffix")) (L.generalize L.list)) "middle" "prefixmiddlesuffix" -} surroundIO :: (Foldable p, Foldable s, Functor m, MonadIO m) => m (p a) -> m (s a) -> TransducerM m a a () surroundIO prefixa suffixa = TransducerM step (return PrefixPending) done where step PrefixPending a = do ps <- fmap toList prefixa return (PrefixAdded, ps ++ [a],[]) step PrefixAdded a = return (PrefixAdded, [a],[]) done PrefixPending = do ps <- fmap toList prefixa ss <- fmap toList suffixa return ((), toList ps ++ toList ss) done PrefixAdded = do ss <- fmap toList suffixa return ((), toList ss) ------------------------------------------------------------------------------ {-| Generalize a 'Transducer' to a 'TransducerM'. -} _generalize :: Monad m => Transducer i o r -> TransducerM m i o r _generalize (Transducer step begin done) = TransducerM step' begin' done' where step' x a = return (step x a) begin' = return begin done' x = return (done x) {-| Simplify a pure 'TransducerM' to a 'Transducer'. -} _simplify :: TransducerM Identity i o r -> Transducer i o r _simplify (TransducerM step begin done) = Transducer step' begin' done' where step' x a = runIdentity (step x a) begin' = runIdentity begin done' x = runIdentity (done x) {-| Transforms a 'Transducer' into a 'Fold' by forgetting about the data sent downstream. -} foldify :: Transducer i o r -> Fold i r foldify (Transducer step begin done) = Fold (\x i -> fstOf3 (step x i)) begin (\x -> fst (done x)) {-| Monadic version of 'foldify'. -} foldifyM :: Functor m => TransducerM m i o r -> FoldM m i r foldifyM (TransducerM step begin done) = FoldM (\x i -> fmap fstOf3 (step x i)) begin (\x -> fmap fst (done x)) {-| Transforms a 'Fold' into a 'Transducer' that sends the return value of the 'Fold' downstream when upstream closes. -} chokepoint :: Fold i b -> Transducer i b () chokepoint (Fold fstep fstate fdone) = (Transducer wstep fstate wdone) where wstep = \fstate' i -> (fstep fstate' i,[],[]) wdone = \fstate' -> ((),[fdone fstate']) chokepointM :: Applicative m => FoldM m i b -> TransducerM m i b () chokepointM (FoldM fstep fstate fdone) = (TransducerM wstep fstate wdone) where wstep = \fstate' i -> fmap (\s -> (s,[],[])) (fstep fstate' i) wdone = \fstate' -> fmap (\r -> ((),[r])) (fdone fstate') {-| Changes the base monad used by a 'TransducerM'. -} hoistTransducer :: Monad m => (forall a. m a -> n a) -> TransducerM m i o r -> TransducerM n i o r hoistTransducer g (TransducerM step begin done) = TransducerM (\s i -> g (step s i)) (g begin) (g . done) {-| Changes the base monad used by a 'FoldM'. -} hoistFold :: Monad m => (forall a. m a -> n a) -> FoldM m i r -> FoldM n i r hoistFold g (FoldM step begin done) = FoldM (\s i -> g (step s i)) (g begin) (g . done) ------------------------------------------------------------------------------ {-| Repeatedly applies a 'Transduction' to process each of the groups demarcated by a 'Transducer', returning a 'Fold' what works over the undivided stream of inputs. The return value of the 'Transducer' is discarded. >>> L.fold (groups (chunksOf 2) (transduce (surround "<" ">")) L.list) "aabbccdd" "
" -} groups :: Transducer i i' r -> Transduction i' b -> Transduction i b groups splitter transduction oldfold = let transduction' = fmap ((,) ()) . transduction newfold = groups' splitter L.mconcat transduction' oldfold in fmap snd newfold {-| Generalized version of 'groups' that preserves the return value of the 'Transducer'. A summary value for each group is also calculated. They are aggregated for the whole stream, with the help of an auxiliary 'Fold'. >>> L.fold (groups' (chunksOf 2) L.list (\f -> transduce (surround "<" ">") (liftA2 (,) L.list f)) L.list) "aabbccdd" (((),["","","","
"]),"
") -} groups' :: Transducer i i' s -> Fold u v -- ^ auxiliary 'Fold' that aggregates the @u@ values produced for each group -> Transduction' i' a u -- ^ repeatedly applied for processing each group -> Transduction' i a (s,v) groups' (Transducer sstep sbegin sdone) summarizer t f = Fold step (Trio sbegin summarizer (t (duplicated f))) done where step (Trio ss summarizer' fs) i = let (ss', oldSplit, newSplits) = sstep ss i (summarizer'',fs') = foldl' (\(summarizer_,fs_) split_ -> let (u, renewed) = reset fs_ in (L.fold (duplicated summarizer_) [u], step' renewed split_)) (summarizer', step' fs oldSplit) newSplits in Trio ss' summarizer'' fs' step' = L.fold . duplicated reset (Fold _ fstate fdone) = let (u,x) = fdone fstate in (u,t (duplicated x)) done (Trio ss summarizer' (Fold fstep fstate fdone)) = let (s,xss) = sdone ss (u,extract -> x) = fdone (foldl' fstep fstate xss) in ((s,L.fold summarizer' [u]),x) {-| Monadic version of 'groups'. -} groupsM :: Monad m => TransducerM m i i' s -> TransductionM m i' b -> TransductionM m i b groupsM splitter transduction oldfold = let transduction' = fmap ((,) ()) . transduction newfold = groupsM' splitter (L.generalize L.mconcat) transduction' oldfold in fmap snd newfold {-| Monadic version of 'groups''. -} groupsM' :: Monad m => TransducerM m i i' s -> FoldM m u v -> TransductionM' m i' a u -> TransductionM' m i a (s,v) groupsM' (TransducerM sstep sbegin sdone) summarizer t f = FoldM step (sbegin >>= \zzz -> return (Trio zzz summarizer (t (duplicated f)))) done where step (Trio ss summarizer' fs) i = do (ss', oldSplit, newSplits) <- sstep ss i fs' <- step' fs oldSplit (summarizer'',fs'') <- foldlM step'' (summarizer',fs') newSplits return $! Trio ss' summarizer'' fs'' step' = L.foldM . duplicated step'' = \(summarizer_, fs) is -> do (u,fs') <- reset fs u' <- L.foldM (duplicated summarizer_) [u] fs'' <- step' fs' is return $! (u',fs'') reset (FoldM _ fstate fdone) = do (u,x) <- fdone =<< fstate return (u, t . duplicated $ x) done (Trio ss summarizer' (FoldM fstep fstate fdone)) = do (s,xss) <- sdone ss (u,finalf) <- fdone =<< flip (foldlM fstep) xss =<< fstate v <- L.foldM summarizer' [u] r <- L.foldM finalf [] return ((s,v),r) {-| Summarizes each of the groups demarcated by the 'Transducer' using a 'Fold'. The result value of the 'Transducer' is discarded. -} folds :: Transducer i i' r -> Fold i' b -> Transduction i b folds splitter f = groups splitter (transduce (chokepoint f)) {-| Like 'folds', but preserves the return value of the 'Transducer'. -} folds' :: Transducer i i' s -> Fold i' b -> Transduction' i b s folds' splitter innerfold somefold = fmap (bimap fst id) (groups' splitter L.mconcat innertrans somefold) where innertrans = fmap ((,) ()) . transduce (chokepoint innerfold) {-| Monadic version of 'folds'. -} foldsM :: (Applicative m,Monad m) => TransducerM m i i' r -> FoldM m i' b -> TransductionM m i b foldsM splitter f = groupsM splitter (transduceM (chokepointM f)) {-| Monadic version of 'folds''. -} foldsM' :: (Applicative m,Monad m) => TransducerM m i i' s -> FoldM m i' b -> TransductionM' m i b s foldsM' splitter innerfold somefold = fmap (bimap fst id) (groupsM' splitter (L.generalize L.mconcat) innertrans somefold) where innertrans = fmap ((,) ()) . transduceM (chokepointM innerfold) ------------------------------------------------------------------------------ {-| Splits a stream into chunks of fixed size. >>> L.fold (folds (chunksOf 2) L.list L.list) [1..7] [[1,2],[3,4],[5,6],[7]] >>> L.fold (groups (chunksOf 2) (transduce (surround [] [0])) L.list) [1..7] [1,2,0,3,4,0,5,6,0,7,0] -} chunksOf :: Int -> Transducer a a () chunksOf 0 = Transducer (\_ _ -> ((),[],repeat [])) () (error "never happens") chunksOf groupSize = Transducer step groupSize done where step 0 a = (pred groupSize, [], [[a]]) step i a = (pred i, [a], []) done _ = ((),[]) ------------------------------------------------------------------------------ {- $reexports -}