{-# LANGUAGE CPP #-}
{-# LANGUAGE FlexibleContexts #-}
{-# LANGUAGE FlexibleInstances #-}
{-# LANGUAGE GeneralizedNewtypeDeriving #-}
{-# LANGUAGE LambdaCase #-}
{-# LANGUAGE MultiParamTypeClasses #-}
{-# LANGUAGE RankNTypes #-}
{-# LANGUAGE ScopedTypeVariables #-}
{-# LANGUAGE TypeFamilies #-}
{-# LANGUAGE UndecidableInstances #-}
module Text.Megaparsec.Internal
(
Hints (..),
Reply (..),
Consumption (..),
Result (..),
ParsecT (..),
toHints,
withHints,
accHints,
refreshLastHint,
runParsecT,
withParsecT,
)
where
import Control.Applicative
import Control.Monad
import Control.Monad.Cont.Class
import Control.Monad.Error.Class
import qualified Control.Monad.Fail as Fail
import Control.Monad.Fix
import Control.Monad.IO.Class
import Control.Monad.Reader.Class
import Control.Monad.State.Class
import Control.Monad.Trans
import Data.List.NonEmpty (NonEmpty (..))
import qualified Data.List.NonEmpty as NE
import Data.Proxy
import Data.Semigroup
import Data.Set (Set)
import qualified Data.Set as E
import Data.String (IsString (..))
import Text.Megaparsec.Class
import Text.Megaparsec.Error
import Text.Megaparsec.State
import Text.Megaparsec.Stream
newtype Hints t = Hints [Set (ErrorItem t)]
deriving (Semigroup, Monoid)
data Reply e s a = Reply (State s e) Consumption (Result s e a)
data Consumption
=
Consumed
|
Virgin
data Result s e a
=
OK a
|
Error (ParseError s e)
newtype ParsecT e s m a = ParsecT
{ unParser ::
forall b.
State s e ->
(a -> State s e -> Hints (Token s) -> m b) ->
(ParseError s e -> State s e -> m b) ->
(a -> State s e -> Hints (Token s) -> m b) ->
(ParseError s e -> State s e -> m b) ->
m b
}
instance (Stream s, Semigroup a) => Semigroup (ParsecT e s m a) where
(<>) = liftA2 (<>)
{-# INLINE (<>) #-}
sconcat = fmap sconcat . sequence
{-# INLINE sconcat #-}
instance (Stream s, Monoid a) => Monoid (ParsecT e s m a) where
mempty = pure mempty
{-# INLINE mempty #-}
mappend = (<>)
{-# INLINE mappend #-}
mconcat = fmap mconcat . sequence
{-# INLINE mconcat #-}
instance
(a ~ Tokens s, IsString a, Eq a, Stream s, Ord e) =>
IsString (ParsecT e s m a)
where
fromString s = tokens (==) (fromString s)
instance Functor (ParsecT e s m) where
fmap = pMap
pMap :: (a -> b) -> ParsecT e s m a -> ParsecT e s m b
pMap f p = ParsecT $ \s cok cerr eok eerr ->
unParser p s (cok . f) cerr (eok . f) eerr
{-# INLINE pMap #-}
instance Stream s => Applicative (ParsecT e s m) where
pure = pPure
(<*>) = pAp
p1 *> p2 = p1 `pBind` const p2
p1 <* p2 = do x1 <- p1; void p2; return x1
pPure :: a -> ParsecT e s m a
pPure x = ParsecT $ \s _ _ eok _ -> eok x s mempty
{-# INLINE pPure #-}
pAp ::
Stream s =>
ParsecT e s m (a -> b) ->
ParsecT e s m a ->
ParsecT e s m b
pAp m k = ParsecT $ \s cok cerr eok eerr ->
let mcok x s' hs =
unParser
k
s'
(cok . x)
cerr
(accHints hs (cok . x))
(withHints hs cerr)
meok x s' hs =
unParser
k
s'
(cok . x)
cerr
(accHints hs (eok . x))
(withHints hs eerr)
in unParser m s mcok cerr meok eerr
{-# INLINE pAp #-}
instance (Ord e, Stream s) => Alternative (ParsecT e s m) where
empty = mzero
(<|>) = mplus
instance Stream s => Monad (ParsecT e s m) where
return = pure
(>>=) = pBind
#if !(MIN_VERSION_base(4,13,0))
fail = Fail.fail
#endif
pBind ::
Stream s =>
ParsecT e s m a ->
(a -> ParsecT e s m b) ->
ParsecT e s m b
pBind m k = ParsecT $ \s cok cerr eok eerr ->
let mcok x s' hs =
unParser
(k x)
s'
cok
cerr
(accHints hs cok)
(withHints hs cerr)
meok x s' hs =
unParser
(k x)
s'
cok
cerr
(accHints hs eok)
(withHints hs eerr)
in unParser m s mcok cerr meok eerr
{-# INLINE pBind #-}
instance Stream s => Fail.MonadFail (ParsecT e s m) where
fail = pFail
pFail :: String -> ParsecT e s m a
pFail msg = ParsecT $ \s@(State _ o _ _) _ _ _ eerr ->
let d = E.singleton (ErrorFail msg)
in eerr (FancyError o d) s
{-# INLINE pFail #-}
instance (Stream s, MonadIO m) => MonadIO (ParsecT e s m) where
liftIO = lift . liftIO
instance (Stream s, MonadReader r m) => MonadReader r (ParsecT e s m) where
ask = lift ask
local f p = mkPT $ \s -> local f (runParsecT p s)
instance (Stream s, MonadState st m) => MonadState st (ParsecT e s m) where
get = lift get
put = lift . put
instance (Stream s, MonadCont m) => MonadCont (ParsecT e s m) where
callCC f = mkPT $ \s ->
callCC $ \c ->
runParsecT (f (\a -> mkPT $ \s' -> c (pack s' a))) s
where
pack s a = Reply s Virgin (OK a)
instance (Stream s, MonadError e' m) => MonadError e' (ParsecT e s m) where
throwError = lift . throwError
p `catchError` h = mkPT $ \s ->
runParsecT p s `catchError` \e ->
runParsecT (h e) s
mkPT :: Monad m => (State s e -> m (Reply e s a)) -> ParsecT e s m a
mkPT k = ParsecT $ \s cok cerr eok eerr -> do
(Reply s' consumption result) <- k s
case consumption of
Consumed ->
case result of
OK x -> cok x s' mempty
Error e -> cerr e s'
Virgin ->
case result of
OK x -> eok x s' mempty
Error e -> eerr e s'
instance (Ord e, Stream s) => MonadPlus (ParsecT e s m) where
mzero = pZero
mplus = pPlus
pZero :: ParsecT e s m a
pZero = ParsecT $ \s@(State _ o _ _) _ _ _ eerr ->
eerr (TrivialError o Nothing E.empty) s
{-# INLINE pZero #-}
pPlus ::
(Ord e, Stream s) =>
ParsecT e s m a ->
ParsecT e s m a ->
ParsecT e s m a
pPlus m n = ParsecT $ \s cok cerr eok eerr ->
let meerr err ms =
let ncerr err' s' = cerr (err' <> err) (longestMatch ms s')
neok x s' hs = eok x s' (toHints (stateOffset s') err <> hs)
neerr err' s' = eerr (err' <> err) (longestMatch ms s')
in unParser n s cok ncerr neok neerr
in unParser m s cok cerr eok meerr
{-# INLINE pPlus #-}
longestMatch :: State s e -> State s e -> State s e
longestMatch s1@(State _ o1 _ _) s2@(State _ o2 _ _) =
case o1 `compare` o2 of
LT -> s2
EQ -> s2
GT -> s1
{-# INLINE longestMatch #-}
instance (Stream s, MonadFix m) => MonadFix (ParsecT e s m) where
mfix f = mkPT $ \s -> mfix $ \(~(Reply _ _ result)) -> do
let a = case result of
OK a' -> a'
Error _ -> error "mfix ParsecT"
runParsecT (f a) s
instance MonadTrans (ParsecT e s) where
lift amb = ParsecT $ \s _ _ eok _ ->
amb >>= \a -> eok a s mempty
instance (Ord e, Stream s) => MonadParsec e s (ParsecT e s m) where
parseError = pParseError
label = pLabel
try = pTry
lookAhead = pLookAhead
notFollowedBy = pNotFollowedBy
withRecovery = pWithRecovery
observing = pObserving
eof = pEof
token = pToken
tokens = pTokens
takeWhileP = pTakeWhileP
takeWhile1P = pTakeWhile1P
takeP = pTakeP
getParserState = pGetParserState
updateParserState = pUpdateParserState
pParseError ::
ParseError s e ->
ParsecT e s m a
pParseError e = ParsecT $ \s _ _ _ eerr -> eerr e s
{-# INLINE pParseError #-}
pLabel :: String -> ParsecT e s m a -> ParsecT e s m a
pLabel l p = ParsecT $ \s cok cerr eok eerr ->
let el = Label <$> NE.nonEmpty l
cok' x s' hs =
case el of
Nothing -> cok x s' (refreshLastHint hs Nothing)
Just _ -> cok x s' hs
eok' x s' hs = eok x s' (refreshLastHint hs el)
eerr' err = eerr $
case err of
(TrivialError pos us _) ->
TrivialError pos us (maybe E.empty E.singleton el)
_ -> err
in unParser p s cok' cerr eok' eerr'
{-# INLINE pLabel #-}
pTry :: ParsecT e s m a -> ParsecT e s m a
pTry p = ParsecT $ \s cok _ eok eerr ->
let eerr' err _ = eerr err s
in unParser p s cok eerr' eok eerr'
{-# INLINE pTry #-}
pLookAhead :: ParsecT e s m a -> ParsecT e s m a
pLookAhead p = ParsecT $ \s _ cerr eok eerr ->
let eok' a _ _ = eok a s mempty
in unParser p s eok' cerr eok' eerr
{-# INLINE pLookAhead #-}
pNotFollowedBy :: Stream s => ParsecT e s m a -> ParsecT e s m ()
pNotFollowedBy p = ParsecT $ \s@(State input o _ _) _ _ eok eerr ->
let what = maybe EndOfInput (Tokens . nes . fst) (take1_ input)
unexpect u = TrivialError o (pure u) E.empty
cok' _ _ _ = eerr (unexpect what) s
cerr' _ _ = eok () s mempty
eok' _ _ _ = eerr (unexpect what) s
eerr' _ _ = eok () s mempty
in unParser p s cok' cerr' eok' eerr'
{-# INLINE pNotFollowedBy #-}
pWithRecovery ::
Stream s =>
(ParseError s e -> ParsecT e s m a) ->
ParsecT e s m a ->
ParsecT e s m a
pWithRecovery r p = ParsecT $ \s cok cerr eok eerr ->
let mcerr err ms =
let rcok x s' _ = cok x s' mempty
rcerr _ _ = cerr err ms
reok x s' _ = eok x s' (toHints (stateOffset s') err)
reerr _ _ = cerr err ms
in unParser (r err) ms rcok rcerr reok reerr
meerr err ms =
let rcok x s' _ = cok x s' (toHints (stateOffset s') err)
rcerr _ _ = eerr err ms
reok x s' _ = eok x s' (toHints (stateOffset s') err)
reerr _ _ = eerr err ms
in unParser (r err) ms rcok rcerr reok reerr
in unParser p s cok mcerr eok meerr
{-# INLINE pWithRecovery #-}
pObserving ::
Stream s =>
ParsecT e s m a ->
ParsecT e s m (Either (ParseError s e) a)
pObserving p = ParsecT $ \s cok _ eok _ ->
let cerr' err s' = cok (Left err) s' mempty
eerr' err s' = eok (Left err) s' (toHints (stateOffset s') err)
in unParser p s (cok . Right) cerr' (eok . Right) eerr'
{-# INLINE pObserving #-}
pEof :: forall e s m. Stream s => ParsecT e s m ()
pEof = ParsecT $ \s@(State input o pst de) _ _ eok eerr ->
case take1_ input of
Nothing -> eok () s mempty
Just (x, _) ->
let us = (pure . Tokens . nes) x
ps = E.singleton EndOfInput
in eerr
(TrivialError o us ps)
(State input o pst de)
{-# INLINE pEof #-}
pToken ::
forall e s m a.
Stream s =>
(Token s -> Maybe a) ->
Set (ErrorItem (Token s)) ->
ParsecT e s m a
pToken test ps = ParsecT $ \s@(State input o pst de) cok _ _ eerr ->
case take1_ input of
Nothing ->
let us = pure EndOfInput
in eerr (TrivialError o us ps) s
Just (c, cs) ->
case test c of
Nothing ->
let us = (Just . Tokens . nes) c
in eerr
(TrivialError o us ps)
(State input o pst de)
Just x ->
cok x (State cs (o + 1) pst de) mempty
{-# INLINE pToken #-}
pTokens ::
forall e s m.
Stream s =>
(Tokens s -> Tokens s -> Bool) ->
Tokens s ->
ParsecT e s m (Tokens s)
pTokens f tts = ParsecT $ \s@(State input o pst de) cok _ eok eerr ->
let pxy = Proxy :: Proxy s
unexpect pos' u =
let us = pure u
ps = (E.singleton . Tokens . NE.fromList . chunkToTokens pxy) tts
in TrivialError pos' us ps
len = chunkLength pxy tts
in case takeN_ len input of
Nothing ->
eerr (unexpect o EndOfInput) s
Just (tts', input') ->
if f tts tts'
then
let st = State input' (o + len) pst de
in if chunkEmpty pxy tts
then eok tts' st mempty
else cok tts' st mempty
else
let ps = (Tokens . NE.fromList . chunkToTokens pxy) tts'
in eerr (unexpect o ps) (State input o pst de)
{-# INLINE pTokens #-}
pTakeWhileP ::
forall e s m.
Stream s =>
Maybe String ->
(Token s -> Bool) ->
ParsecT e s m (Tokens s)
pTakeWhileP ml f = ParsecT $ \(State input o pst de) cok _ eok _ ->
let pxy = Proxy :: Proxy s
(ts, input') = takeWhile_ f input
len = chunkLength pxy ts
hs =
case ml >>= NE.nonEmpty of
Nothing -> mempty
Just l -> (Hints . pure . E.singleton . Label) l
in if chunkEmpty pxy ts
then eok ts (State input' (o + len) pst de) hs
else cok ts (State input' (o + len) pst de) hs
{-# INLINE pTakeWhileP #-}
pTakeWhile1P ::
forall e s m.
Stream s =>
Maybe String ->
(Token s -> Bool) ->
ParsecT e s m (Tokens s)
pTakeWhile1P ml f = ParsecT $ \(State input o pst de) cok _ _ eerr ->
let pxy = Proxy :: Proxy s
(ts, input') = takeWhile_ f input
len = chunkLength pxy ts
el = Label <$> (ml >>= NE.nonEmpty)
hs =
case el of
Nothing -> mempty
Just l -> (Hints . pure . E.singleton) l
in if chunkEmpty pxy ts
then
let us = pure $
case take1_ input of
Nothing -> EndOfInput
Just (t, _) -> Tokens (nes t)
ps = maybe E.empty E.singleton el
in eerr
(TrivialError o us ps)
(State input o pst de)
else cok ts (State input' (o + len) pst de) hs
{-# INLINE pTakeWhile1P #-}
pTakeP ::
forall e s m.
Stream s =>
Maybe String ->
Int ->
ParsecT e s m (Tokens s)
pTakeP ml n = ParsecT $ \s@(State input o pst de) cok _ _ eerr ->
let pxy = Proxy :: Proxy s
el = Label <$> (ml >>= NE.nonEmpty)
ps = maybe E.empty E.singleton el
in case takeN_ n input of
Nothing ->
eerr (TrivialError o (pure EndOfInput) ps) s
Just (ts, input') ->
let len = chunkLength pxy ts
in if len /= n
then
eerr
(TrivialError (o + len) (pure EndOfInput) ps)
(State input o pst de)
else cok ts (State input' (o + len) pst de) mempty
{-# INLINE pTakeP #-}
pGetParserState :: ParsecT e s m (State s e)
pGetParserState = ParsecT $ \s _ _ eok _ -> eok s s mempty
{-# INLINE pGetParserState #-}
pUpdateParserState :: (State s e -> State s e) -> ParsecT e s m ()
pUpdateParserState f = ParsecT $ \s _ _ eok _ -> eok () (f s) mempty
{-# INLINE pUpdateParserState #-}
nes :: a -> NonEmpty a
nes x = x :| []
{-# INLINE nes #-}
toHints ::
Stream s =>
Int ->
ParseError s e ->
Hints (Token s)
toHints streamPos = \case
TrivialError errOffset _ ps ->
if streamPos == errOffset
then Hints (if E.null ps then [] else [ps])
else mempty
FancyError _ _ -> mempty
{-# INLINE toHints #-}
withHints ::
Stream s =>
Hints (Token s) ->
(ParseError s e -> State s e -> m b) ->
ParseError s e ->
State s e ->
m b
withHints (Hints ps') c e =
case e of
TrivialError pos us ps -> c (TrivialError pos us (E.unions (ps : ps')))
_ -> c e
{-# INLINE withHints #-}
accHints ::
Hints t ->
(a -> State s e -> Hints t -> m b) ->
(a -> State s e -> Hints t -> m b)
accHints hs1 c x s hs2 = c x s (hs1 <> hs2)
{-# INLINE accHints #-}
refreshLastHint :: Hints t -> Maybe (ErrorItem t) -> Hints t
refreshLastHint (Hints []) _ = Hints []
refreshLastHint (Hints (_ : xs)) Nothing = Hints xs
refreshLastHint (Hints (_ : xs)) (Just m) = Hints (E.singleton m : xs)
{-# INLINE refreshLastHint #-}
runParsecT ::
Monad m =>
ParsecT e s m a ->
State s e ->
m (Reply e s a)
runParsecT p s = unParser p s cok cerr eok eerr
where
cok a s' _ = return $ Reply s' Consumed (OK a)
cerr err s' = return $ Reply s' Consumed (Error err)
eok a s' _ = return $ Reply s' Virgin (OK a)
eerr err s' = return $ Reply s' Virgin (Error err)
withParsecT ::
forall e e' s m a.
(Monad m, Ord e') =>
(e -> e') ->
ParsecT e s m a ->
ParsecT e' s m a
withParsecT f p =
ParsecT $ \s cok cerr eok eerr ->
let s' =
s
{ stateParseErrors = []
}
adjustState :: State s e -> State s e'
adjustState st =
st
{ stateParseErrors =
(mapParseError f <$> stateParseErrors st)
++ stateParseErrors s
}
cok' x st hs = cok x (adjustState st) hs
cerr' e st = cerr (mapParseError f e) (adjustState st)
eok' x st hs = eok x (adjustState st) hs
eerr' e st = eerr (mapParseError f e) (adjustState st)
in unParser p s' cok' cerr' eok' eerr'
where
{-# INLINE withParsecT #-}