megaparsec/Text/Megaparsec.hs

{-# LANGUAGE FlexibleContexts #-}
{-# LANGUAGE FlexibleInstances #-}
{-# LANGUAGE MultiParamTypeClasses #-}
{-# LANGUAGE RankNTypes #-}
{-# LANGUAGE Safe #-}
{-# LANGUAGE ScopedTypeVariables #-}
{-# LANGUAGE TypeFamilies #-}
{-# LANGUAGE UndecidableInstances #-}

-- |
-- Module      :  Text.Megaparsec
-- Copyright   :  © 2015–present Megaparsec contributors
--                © 2007 Paolo Martini
--                © 1999–2001 Daan Leijen
-- License     :  FreeBSD
--
-- Maintainer  :  Mark Karpov <markkarpov92@gmail.com>
-- Stability   :  experimental
-- Portability :  portable
--
-- This module includes everything you need to get started writing a parser.
-- If you are new to Megaparsec and don't know where to begin, take a look
-- at the tutorial <https://markkarpov.com/tutorial/megaparsec.html>.
--
-- In addition to the "Text.Megaparsec" module, which exports and re-exports
-- almost everything that you may need, we advise importing
-- "Text.Megaparsec.Char" if you plan to work with a stream of 'Char' tokens
-- or "Text.Megaparsec.Byte" if you intend to parse binary data.
--
-- It is common to start working with the library by defining a type synonym
-- like this:
--
-- > type Parser = Parsec Void Text
-- >                      ^    ^
-- >                      |    |
-- > Custom error component    Input stream type
--
-- Then you can write type signatures like @Parser 'Int'@—for a parser that
-- returns an 'Int' for example.
--
-- Similarly (since it's known to cause confusion), you should use the
-- 'ParseErrorBundle' type parametrized like this:
--
-- > ParseErrorBundle Text Void
-- >                  ^    ^
-- >                  |    |
-- >  Input stream type    Custom error component (the same you used in Parser)
--
-- Megaparsec uses some type-level machinery to provide flexibility without
-- compromising on type safety. Thus type signatures are sometimes necessary
-- to avoid ambiguous types. If you're seeing an error message that reads
-- like “Type variable @e0@ is ambiguous …”, you need to give an explicit
-- signature to your parser to resolve the ambiguity. It's a good idea to
-- provide type signatures for all top-level definitions.
module Text.Megaparsec
  ( -- * Re-exports
    -- $reexports
    module Text.Megaparsec.Pos,
    module Text.Megaparsec.Error,
    module Text.Megaparsec.Stream,
    module Control.Monad.Combinators,

    -- * Data types
    State (..),
    PosState (..),
    Parsec,
    ParsecT,

    -- * Running parser
    parse,
    parseMaybe,
    parseTest,
    runParser,
    runParser',
    runParserT,
    runParserT',

    -- * Primitive combinators
    MonadParsec (..),

    -- * Signaling parse errors
    -- $parse-errors
    failure,
    fancyFailure,
    unexpected,
    customFailure,
    region,
    registerParseError,
    registerFailure,
    registerFancyFailure,

    -- * Derivatives of primitive combinators
    single,
    satisfy,
    anySingle,
    anySingleBut,
    oneOf,
    noneOf,
    chunk,
    (<?>),
    match,
    takeRest,
    atEnd,

    -- * Parser state combinators
    getInput,
    setInput,
    getSourcePos,
    getOffset,
    setOffset,
    setParserState,
  )
where

import Control.Monad.Combinators
import Control.Monad.Identity
import Data.List.NonEmpty (NonEmpty (..))
import qualified Data.List.NonEmpty as NE
import Data.Maybe (fromJust)
import Data.Set (Set)
import qualified Data.Set as E
import Text.Megaparsec.Class
import Text.Megaparsec.Error
import Text.Megaparsec.Internal
import Text.Megaparsec.Pos
import Text.Megaparsec.State
import Text.Megaparsec.Stream

-- $reexports
--
-- Note that we re-export monadic combinators from
-- "Control.Monad.Combinators" because these are more efficient than
-- 'Applicative'-based ones. Thus 'many' and 'some' may clash with the
-- functions from "Control.Applicative". You need to hide the functions like
-- this:
--
-- > import Control.Applicative hiding (many, some)
--
-- Also note that you can import "Control.Monad.Combinators.NonEmpty" if you
-- wish that combinators like 'some' return 'NonEmpty' lists. The module
-- lives in the @parser-combinators@ package (you need at least version
-- /0.4.0/).
--
-- The "Control.Monad.Combinators.NonEmpty" module is intended to be
-- imported qualified:
--
-- > import qualified Control.Monad.Combinators.NonEmpty as NE
--
-- Other modules of interest are:
--
--     * "Control.Monad.Combinators.Expr" for parsing of expressions.
--     * "Control.Applicative.Permutations" for parsing of permutation
--       phrases.

----------------------------------------------------------------------------
-- Data types

-- | 'Parsec' is a non-transformer variant of the more general 'ParsecT'
-- monad transformer: it is 'ParsecT' with 'Identity' as the underlying
-- monad. The parameter @e@ is the custom error component and @s@ is the
-- input stream type.
type Parsec e s = ParsecT e s Identity

----------------------------------------------------------------------------
-- Running a parser

-- | @'parse' p file input@ runs the parser @p@ over 'Identity' (use
-- 'runParserT' when working with the 'ParsecT' monad transformer). It is
-- merely another name for 'runParser'. The result is either a
-- 'ParseErrorBundle' ('Left') or a value of type @a@ ('Right').
-- 'errorBundlePretty' renders a 'ParseErrorBundle' as the string
-- representation of the error message. See "Text.Megaparsec.Error" if you
-- need to do more advanced error analysis.
--
-- > main = case parse numbers "" "11,2,43" of
-- >          Left bundle -> putStr (errorBundlePretty bundle)
-- >          Right xs -> print (sum xs)
-- >
-- > numbers = decimal `sepBy` char ','
parse ::
  -- | Parser to run
  Parsec e s a ->
  -- | Name of source file
  String ->
  -- | Input for parser
  s ->
  Either (ParseErrorBundle s e) a
parse p name input = runParser p name input

-- | @'parseMaybe' p input@ runs the parser @p@ on @input@, wrapping a
-- successful result in 'Just' and collapsing any failure to 'Nothing'. The
-- parser is followed by 'eof', so it fails unless the whole input is
-- consumed.
--
-- This is meant for lightweight parsing where error messages (and thus
-- file names) do not matter and the entire input should be consumed, e.g.
-- parsing a single number according to a specification of its format.
parseMaybe :: (Ord e, Stream s) => Parsec e s a -> s -> Maybe a
parseMaybe p input =
  -- The source name is irrelevant because the error bundle is discarded.
  either (const Nothing) Just (parse (p <* eof) "" input)

-- | The expression @'parseTest' p input@ applies the parser @p@ to
-- @input@ and writes the outcome to stdout: the pretty-printed error
-- bundle on failure, or the 'show'n result on success. Useful for testing.
parseTest ::
  ( ShowErrorComponent e,
    Show a,
    VisualStream s,
    TraversableStream s
  ) =>
  -- | Parser to run
  Parsec e s a ->
  -- | Input for parser
  s ->
  IO ()
parseTest p input =
  either (putStr . errorBundlePretty) print (parse p "" input)

-- | @'runParser' p file input@ runs the parser @p@ on the input stream of
-- tokens @input@, obtained from source @file@. The @file@ is only used in
-- error messages and may be the empty string. The result is either a
-- 'ParseErrorBundle' ('Left') or a value of type @a@ ('Right').
--
-- > parseFromFile p file = runParser p file <$> readFile file
runParser ::
  -- | Parser to run
  Parsec e s a ->
  -- | Name of source file
  String ->
  -- | Input for parser
  s ->
  Either (ParseErrorBundle s e) a
runParser p name input = outcome
  where
    -- The final parser state is of no interest here, only the result.
    (_, outcome) = runParser' p (initialState name input)

-- | Like 'runParser', except that it takes the initial parser state as an
-- argument and returns the final parser state next to the result. This
-- makes it possible e.g. to specify an arbitrary textual position at the
-- beginning of parsing. This is the most general way to run a parser over
-- the 'Identity' monad.
--
-- @since 4.2.0
runParser' ::
  -- | Parser to run
  Parsec e s a ->
  -- | Initial state
  State s e ->
  (State s e, Either (ParseErrorBundle s e) a)
runParser' p st = runIdentity (runParserT' p st)

-- | @'runParserT' p file input@ runs the parser @p@ on the input list of
-- tokens @input@, obtained from source @file@. The @file@ is only used in
-- error messages and may be the empty string. The result is a computation
-- in the underlying monad @m@ that yields either a 'ParseErrorBundle'
-- ('Left') or a value of type @a@ ('Right').
runParserT ::
  Monad m =>
  -- | Parser to run
  ParsecT e s m a ->
  -- | Name of source file
  String ->
  -- | Input for parser
  s ->
  m (Either (ParseErrorBundle s e) a)
runParserT p name input = fmap snd (runParserT' p startState)
  where
    startState = initialState name input

-- | Like 'runParserT', but in the same way as 'runParser'' it accepts the
-- initial parser state and returns the final one. This is thus the most
-- general way to run a parser.
--
-- The run counts as successful only if the parser itself succeeded /and/
-- no delayed parse errors are left in the final state. Otherwise all
-- collected errors are returned in a bundle, sorted by their offsets.
--
-- @since 4.2.0
runParserT' ::
  Monad m =>
  -- | Parser to run
  ParsecT e s m a ->
  -- | Initial state
  State s e ->
  m (State s e, Either (ParseErrorBundle s e) a)
runParserT' p st0 = do
  Reply st1 _ outcome <- runParsecT p st0
  let delayed = stateParseErrors st1
      -- The bundle carries the positional state from /before/ the run.
      bundle errs =
        ParseErrorBundle
          { bundleErrors = NE.sortWith errorOffset errs,
            bundlePosState = statePosState st0
          }
      failed errs = (st1, Left (bundle errs))
  return $ case outcome of
    OK x -> maybe (st1, Right x) failed (NE.nonEmpty delayed)
    Error err -> failed (err :| delayed)

-- | Build the initial parser state from the name of the source file and
-- the input: offsets start at 0, the source position is the initial
-- position in the named file, the tab width is the default one, and no
-- delayed parse errors are registered.
initialState :: String -> s -> State s e
initialState name input =
  State
    { stateInput = input,
      stateOffset = 0,
      statePosState = startPosState,
      stateParseErrors = []
    }
  where
    startPosState =
      PosState
        { pstateInput = input,
          pstateOffset = 0,
          pstateSourcePos = initialPos name,
          pstateTabWidth = defaultTabWidth,
          pstateLinePrefix = ""
        }

----------------------------------------------------------------------------
-- Signaling parse errors

-- $parse-errors
--
-- The most general function to fail and end parsing is 'parseError'. The
-- functions in this section are built on top of it. The section also
-- includes functions starting with the @register@ prefix which allow users
-- to register “delayed” 'ParseError's.

-- | Stop parsing and report a trivial 'ParseError' located at the current
-- offset.
--
-- @since 6.0.0
failure ::
  MonadParsec e s m =>
  -- | Unexpected item (if any)
  Maybe (ErrorItem (Token s)) ->
  -- | Expected items
  Set (ErrorItem (Token s)) ->
  m a
failure us ps =
  getOffset >>= \o -> parseError (TrivialError o us ps)
{-# INLINE failure #-}

-- | Stop parsing and report a fancy 'ParseError' located at the current
-- offset. To report a single custom parse error, see
-- 'Text.Megaparsec.customFailure'.
--
-- @since 6.0.0
fancyFailure ::
  MonadParsec e s m =>
  -- | Fancy error components
  Set (ErrorFancy e) ->
  m a
fancyFailure xs =
  getOffset >>= \o -> parseError (FancyError o xs)
{-# INLINE fancyFailure #-}

-- | The parser @'unexpected' item@ fails, without consuming any input,
-- with an error message saying that @item@ was unexpected. No expected
-- items are reported.
--
-- > unexpected item = failure (Just item) Set.empty
unexpected :: MonadParsec e s m => ErrorItem (Token s) -> m a
unexpected item = failure found nothingExpected
  where
    found = Just item
    nothingExpected = E.empty
{-# INLINE unexpected #-}

-- | Report a custom parse error: the given value is wrapped in
-- 'ErrorCustom' and reported as the only component of a fancy error. For a
-- more general version, see 'fancyFailure'.
--
-- > customFailure = fancyFailure . Set.singleton . ErrorCustom
--
-- @since 6.3.0
customFailure :: MonadParsec e s m => e -> m a
customFailure err = fancyFailure (E.singleton (ErrorCustom err))
{-# INLINE customFailure #-}

-- | Specify how to process 'ParseError's that happen inside of this
-- wrapper. The processing function is applied both to the normal error
-- that ends the inner parser (if any) and to the delayed errors registered
-- while it was running.
--
-- As a side-effect of the implementation the inner computation starts with
-- an empty collection of delayed errors; the errors registered before
-- entering 'region' are “restored” (unmodified) on the way out.
--
-- @since 5.3.0
region ::
  MonadParsec e s m =>
  -- | How to process 'ParseError's
  (ParseError s e -> ParseError s e) ->
  -- | The “region” that the processing applies to
  m a ->
  m a
region f m = do
  -- Set aside the delayed errors registered so far, so that only the ones
  -- produced by 'm' get transformed.
  outer <- fmap stateParseErrors getParserState
  updateParserState (\st -> st {stateParseErrors = []})
  outcome <- observing m
  -- Transform the inner delayed errors and put the outer ones back.
  updateParserState
    (\st -> st {stateParseErrors = map f (stateParseErrors st) ++ outer})
  either (parseError . f) return outcome
{-# INLINEABLE region #-}

-- | Register a 'ParseError' for later reporting. This action does not end
-- parsing; its only effect is to add the given 'ParseError' to the
-- collection of “delayed” 'ParseError's, which is taken into consideration
-- at the end of parsing. The parser succeeds only if this collection is
-- empty. This is the main way to report several parse errors at once.
--
-- @since 8.0.0
registerParseError :: MonadParsec e s m => ParseError s e -> m ()
registerParseError err = updateParserState remember
  where
    -- Newly registered errors go to the front of the collection.
    remember st = st {stateParseErrors = err : stateParseErrors st}
{-# INLINE registerParseError #-}

-- | Like 'failure', but for delayed 'ParseError's: a trivial error located
-- at the current offset is registered and parsing continues.
--
-- @since 8.0.0
registerFailure ::
  MonadParsec e s m =>
  -- | Unexpected item (if any)
  Maybe (ErrorItem (Token s)) ->
  -- | Expected items
  Set (ErrorItem (Token s)) ->
  m ()
registerFailure us ps =
  getOffset >>= \o -> registerParseError (TrivialError o us ps)
{-# INLINE registerFailure #-}

-- | Like 'fancyFailure', but for delayed 'ParseError's: a fancy error
-- located at the current offset is registered and parsing continues.
--
-- @since 8.0.0
registerFancyFailure ::
  MonadParsec e s m =>
  -- | Fancy error components
  Set (ErrorFancy e) ->
  m ()
registerFancyFailure xs =
  getOffset >>= \o -> registerParseError (FancyError o xs)
{-# INLINE registerFancyFailure #-}

----------------------------------------------------------------------------
-- Derivatives of primitive combinators

-- | @'single' t@ matches exactly the token @t@ and nothing else. On
-- failure, @t@ is reported as the expected item.
--
-- > semicolon = single ';'
--
-- See also: 'token', 'anySingle', 'Text.Megaparsec.Byte.char',
-- 'Text.Megaparsec.Char.char'.
--
-- @since 7.0.0
single ::
  MonadParsec e s m =>
  -- | Token to match
  Token s ->
  m (Token s)
single t = token accept (E.singleton (Tokens (t :| [])))
  where
    accept x
      | x == t = Just x
      | otherwise = Nothing
{-# INLINE single #-}

-- | The parser @'satisfy' f@ succeeds for any token for which the supplied
-- predicate @f@ returns 'True', and returns that token. No expected items
-- are attached to the error on failure.
--
-- > digitChar = satisfy isDigit <?> "digit"
-- > oneOf cs  = satisfy (`elem` cs)
--
-- __Performance note__: when you need to parse a single token, it is often
-- a good idea to use 'satisfy' with the right predicate function instead of
-- creating a complex parser using the combinators.
--
-- See also: 'anySingle', 'anySingleBut', 'oneOf', 'noneOf'.
--
-- @since 7.0.0
satisfy ::
  MonadParsec e s m =>
  -- | Predicate to apply
  (Token s -> Bool) ->
  m (Token s)
satisfy f = token keep E.empty
  where
    keep x
      | f x = Just x
      | otherwise = Nothing
{-# INLINE satisfy #-}

-- | Parse and return a single token, whatever it is. It's a good idea to
-- attach a 'label' to this parser.
--
-- > anySingle = satisfy (const True)
--
-- See also: 'satisfy', 'anySingleBut'.
--
-- @since 7.0.0
anySingle :: MonadParsec e s m => m (Token s)
anySingle = satisfy (\_ -> True)
{-# INLINE anySingle #-}

-- | Match any token except the given one. It's a good idea to attach a
-- 'label' to this parser.
--
-- > anySingleBut t = satisfy (/= t)
--
-- See also: 'single', 'anySingle', 'satisfy'.
--
-- @since 7.0.0
anySingleBut ::
  MonadParsec e s m =>
  -- | Token we should not match
  Token s ->
  m (Token s)
anySingleBut t = satisfy differs
  where
    differs x = x /= t
{-# INLINE anySingleBut #-}

-- | @'oneOf' ts@ succeeds if the current token is in the supplied
-- collection of tokens @ts@. Returns the parsed token. Note that this
-- parser cannot automatically generate the “expected” component of the
-- error message, so usually you should label it manually with 'label' or
-- ('<?>').
--
-- > oneOf cs = satisfy (`elem` cs)
--
-- See also: 'satisfy'.
--
-- > digit = oneOf ['0'..'9'] <?> "digit"
--
-- __Performance note__: prefer 'satisfy' when you can because it's faster
-- when you have only a couple of tokens to compare to:
--
-- > quoteFast = satisfy (\x -> x == '\'' || x == '\"')
-- > quoteSlow = oneOf "'\""
--
-- @since 7.0.0
oneOf ::
  (Foldable f, MonadParsec e s m) =>
  -- | Collection of matching tokens
  f (Token s) ->
  m (Token s)
oneOf cs = satisfy listed
  where
    listed x = x `elem` cs
{-# INLINE oneOf #-}

-- | As the dual of 'oneOf', @'noneOf' ts@ succeeds if the current token is
-- /not/ in the supplied collection of tokens @ts@. Returns the parsed
-- token. Note that this parser cannot automatically generate the
-- “expected” component of the error message, so usually you should label
-- it manually with 'label' or ('<?>').
--
-- > noneOf cs = satisfy (`notElem` cs)
--
-- See also: 'satisfy'.
--
-- __Performance note__: prefer 'satisfy' and 'anySingleBut' when you can
-- because it's faster.
--
-- @since 7.0.0
noneOf ::
  (Foldable f, MonadParsec e s m) =>
  -- | Collection of tokens we should not match
  f (Token s) ->
  m (Token s)
noneOf cs = satisfy unlisted
  where
    unlisted x = x `notElem` cs
{-# INLINE noneOf #-}

-- | @'chunk' chk@ matches exactly the chunk @chk@, comparing chunks for
-- equality.
--
-- > divOrMod = chunk "div" <|> chunk "mod"
--
-- See also: 'tokens', 'Text.Megaparsec.Char.string',
-- 'Text.Megaparsec.Byte.string'.
--
-- @since 7.0.0
chunk ::
  MonadParsec e s m =>
  -- | Chunk to match
  Tokens s ->
  m (Tokens s)
chunk = tokens (\actual wanted -> actual == wanted)
{-# INLINE chunk #-}

-- | An operator form of 'label': @p '<?>' name@ is the same as
-- @'label' name p@.
infix 0 <?>

(<?>) :: MonadParsec e s m => m a -> String -> m a
parser <?> name = label name parser
{-# INLINE (<?>) #-}

-- | Return both the result of a parse and the chunk of input that was
-- consumed during parsing. The number of consumed tokens is derived from
-- the change of the 'stateOffset' value across the argument parser. If you
-- mess with the offset manually in the argument parser, prepare for
-- troubles.
--
-- @since 5.3.0
match :: MonadParsec e s m => m a -> m (Tokens s, a)
match p = do
  before <- getOffset
  input <- getInput
  result <- p
  after <- getOffset
  -- NOTE The 'fromJust' call here should never fail because if the stream
  -- is empty before 'p' (the only case when 'takeN_' can return 'Nothing'
  -- as per its invariants), (after - before) won't be greater than 0, and
  -- in that case 'Just' is guaranteed to be returned as per another
  -- invariant of 'takeN_'.
  let consumed = fst (fromJust (takeN_ (after - before) input))
  return (consumed, result)
{-# INLINEABLE match #-}

-- | Consume all remaining input and return it as a chunk. This parser
-- never fails, but the returned chunk may be empty.
--
-- > takeRest = takeWhileP Nothing (const True)
--
-- @since 6.0.0
takeRest :: MonadParsec e s m => m (Tokens s)
takeRest = takeWhileP Nothing (\_ -> True)
{-# INLINE takeRest #-}

-- | Return 'True' when the end of input has been reached and 'False'
-- otherwise.
--
-- > atEnd = option False (True <$ hidden eof)
--
-- @since 6.0.0
atEnd :: MonadParsec e s m => m Bool
atEnd = option False reachedEnd
  where
    -- 'hidden' keeps “end of input” out of the expected items.
    reachedEnd = True <$ hidden eof
{-# INLINE atEnd #-}

----------------------------------------------------------------------------
-- Parser state combinators

-- | Return the current input, i.e. the 'stateInput' field of the parser
-- state.
getInput :: MonadParsec e s m => m s
getInput = fmap stateInput getParserState
{-# INLINE getInput #-}

-- | @'setInput' input@ continues parsing with @input@. Only the input
-- stream is replaced; the other components of the parser state are left
-- as they are.
setInput :: MonadParsec e s m => s -> m ()
setInput s = updateParserState (\st -> st {stateInput = s})
{-# INLINE setInput #-}

-- | Return the current source position. This function /is not cheap/, do
-- not call it e.g. on matching of every token, that's a bad idea. Still you
-- can use it to get 'SourcePos' to attach to things that you parse.
--
-- The positional state advanced to the current offset is stored back into
-- the parser state. The function works under the assumption that we move
-- in the input stream only forwards and never backwards, which is always
-- true unless the user abuses the library.
--
-- @since 7.0.0
getSourcePos :: (TraversableStream s, MonadParsec e s m) => m SourcePos
getSourcePos = do
  st <- getParserState
  let advanced = reachOffsetNoLine (stateOffset st) (statePosState st)
  -- Save the advanced positional state in the parser state.
  updateParserState (const st {statePosState = advanced})
  return (pstateSourcePos advanced)
{-# INLINE getSourcePos #-}

-- | Get the number of tokens processed so far, i.e. the 'stateOffset'
-- field of the parser state.
--
-- See also: 'setOffset'.
--
-- @since 7.0.0
getOffset :: MonadParsec e s m => m Int
getOffset = fmap stateOffset getParserState
{-# INLINE getOffset #-}

-- | Set the number of tokens processed so far. Only the offset is
-- replaced; the other components of the parser state are left as they are.
--
-- See also: 'getOffset'.
--
-- @since 7.0.0
setOffset :: MonadParsec e s m => Int -> m ()
setOffset o = updateParserState (\st -> st {stateOffset = o})
{-# INLINE setOffset #-}

-- | @'setParserState' st@ replaces the whole parser state with @st@,
-- discarding the previous one.
--
-- See also: 'getParserState', 'updateParserState'.
setParserState :: MonadParsec e s m => State s e -> m ()
setParserState st = updateParserState (\_ -> st)
{-# INLINE setParserState #-}
-												Format the source code with Ormolu

											
										
										
											2020-04-23 22:28:20 +03:00
+								{-# LANGUAGE FlexibleContexts #-}
 								{-# LANGUAGE FlexibleInstances #-}
 								{-# LANGUAGE MultiParamTypeClasses #-}
 								{-# LANGUAGE RankNTypes #-}
-												Add Safe Haskell support

Remove dependence on GeneralizedNewtypeDeriving and add Safe Haskell
extensions to every file.

											
										
										
											2020-10-12 23:24:28 +03:00
+								{-# LANGUAGE Safe #-}
-												Format the source code with Ormolu

											
										
										
											2020-04-23 22:28:20 +03:00
+								{-# LANGUAGE ScopedTypeVariables #-}
 								{-# LANGUAGE TypeFamilies #-}
 								{-# LANGUAGE UndecidableInstances #-}
-												refactoring, phase 1

											
										
										
											2015-07-28 16:32:19 +03:00
+								-- |
-												renamed ‘MegaParsec’ → ‘Megaparsec’, close #10

											
										
										
											2015-08-01 19:24:45 +03:00
+								-- Module      :  Text.Megaparsec
-												Use the word “present” instead of current year in copyright notes

[skip ci]

											
										
										
											2019-07-02 22:41:24 +03:00
+								-- Copyright   :  © 2015–present Megaparsec contributors
-												cosmetic changes in copyright (headers)

											
										
										
											2015-07-30 19:20:37 +03:00
+								--                © 2007 Paolo Martini
 								--                © 1999–2001 Daan Leijen
-												after some consulting, it should be “FreeBSD”

What Parsec used is called “FreeBSD” or “BSD 2 clause”. Addition of the
third clause may require contacting all the authors. To hell with it,
let it be “FreeBSD” (which is anyway better than “BSD-like”), I'm a
hacker, not a lawyer (tm).

											
										
										
											2015-10-30 14:26:45 +03:00
+								-- License     :  FreeBSD
-												refactoring, phase 1

											
										
										
											2015-07-28 16:32:19 +03:00
+								--
-												Update my email address

[skip ci]

											
										
										
											2017-05-24 15:30:10 +03:00
+								-- Maintainer  :  Mark Karpov <markkarpov92@gmail.com>
-												refactoring, phase 2

											
										
										
											2015-07-29 11:38:32 +03:00
+								-- Stability   :  experimental
-												refactoring, phase 1

											
										
										
											2015-07-28 16:32:19 +03:00
+								-- Portability :  portable
 								--
 								-- This module includes everything you need to get started writing a parser.
-												Various corrections in ‘README.md’ and docs

											
										
										
											2016-05-14 12:59:18 +03:00
+								-- If you are new to Megaparsec and don't know where to begin, take a look
-												Update the links to the tutorial

											
										
										
											2019-11-23 01:16:51 +03:00
+								-- at the tutorial <https://markkarpov.com/tutorial/megaparsec.html>.
-												refactoring, phase 1

											
										
										
											2015-07-28 16:32:19 +03:00
+								--
-												Reorganize modules (#217)



											
										
										
											2017-06-14 22:12:18 +03:00
+								-- In addition to the "Text.Megaparsec" module, which exports and re-exports
-												Improve the writing

											
										
										
											2021-04-25 16:49:13 +03:00
+								-- almost everything that you may need, we advise to import
-												Char and byte modules (#230)


											
										
										
											2017-07-03 14:34:00 +03:00
+								-- "Text.Megaparsec.Char" if you plan to work with a stream of 'Char' tokens
-												Rename ‘Text.Megaparsec.Lexer’ to ‘Text.Megaparsec.Char.Lexer’

Also numerous documentation improvements and some inlineable pragmas.

											
										
										
											2017-07-04 13:12:35 +03:00
+								-- or "Text.Megaparsec.Byte" if you intend to parse binary data.
-												extends description of ‘Text.Megaparsec’ module

											
										
										
											2015-08-03 21:15:16 +03:00
+								--
-												Drop per-stream type modules (#215)


											
										
										
											2017-06-13 19:14:31 +03:00
+								-- It is common to start working with the library by defining a type synonym
 								-- like this:
-												extends description of ‘Text.Megaparsec’ module

											
										
										
											2015-08-03 21:15:16 +03:00
+								--
-												Separate trivial and fancy parse errors (#223)



											
										
										
											2017-06-29 08:13:22 +03:00
+								-- > type Parser = Parsec Void Text
 								-- >                      ^    ^
 								-- >                      |    |
-												Use offset in parse errors (#313)

The change allows to speed-up parsers in most cases and re-use the fact that
we're traversing input stream on pretty-printing ‘ParseError’s anyway.
											
										
										
											2018-08-20 19:35:10 +03:00
+								-- > Custom error component    Input stream type
-												extends description of ‘Text.Megaparsec’ module

											
										
										
											2015-08-03 21:15:16 +03:00
+								--
-												Use offset in parse errors (#313)

The change allows to speed-up parsers in most cases and re-use the fact that
we're traversing input stream on pretty-printing ‘ParseError’s anyway.
											
										
										
											2018-08-20 19:35:10 +03:00
+								-- Then you can write type signatures like @Parser 'Int'@—for a parser that
-												Drop per-stream type modules (#215)


											
										
										
											2017-06-13 19:14:31 +03:00
+								-- returns an 'Int' for example.
-												Mention ambiguous type variables and type signatures

Close #157.

											
										
										
											2016-12-26 13:41:30 +03:00
+								--
-												Add a note about the ‘ParseError’ type

											
										
										
											2017-07-28 07:28:16 +03:00
+								-- Similarly (since it's known to cause confusion), you should use
-												Use offset in parse errors (#313)

The change allows to speed-up parsers in most cases and re-use the fact that
we're traversing input stream on pretty-printing ‘ParseError’s anyway.
											
										
										
											2018-08-20 19:35:10 +03:00
+								-- 'ParseErrorBundle' type parametrized like this:
-												Add a note about the ‘ParseError’ type

											
										
										
											2017-07-28 07:28:16 +03:00
+								--
-												Use offset in parse errors (#313)

The change allows to speed-up parsers in most cases and re-use the fact that
we're traversing input stream on pretty-printing ‘ParseError’s anyway.
											
										
										
											2018-08-20 19:35:10 +03:00
+								-- > ParseErrorBundle Text Void
 								-- >                  ^    ^
 								-- >                  |    |
 								-- >  Input stream type    Custom error component (the same you used in Parser)
-												Add a note about the ‘ParseError’ type

											
										
										
											2017-07-28 07:28:16 +03:00
+								--
-												Rename ‘Text.Megaparsec.Lexer’ to ‘Text.Megaparsec.Char.Lexer’

Also numerous documentation improvements and some inlineable pragmas.

											
										
										
											2017-07-04 13:12:35 +03:00
+								-- Megaparsec uses some type-level machinery to provide flexibility without
 								-- compromising on type safety. Thus type signatures are sometimes necessary
-												Numerous documentation corrections

											
										
										
											2018-11-07 08:21:00 +03:00
+								-- to avoid ambiguous types. If you're seeing an error message that reads
-												Rename ‘Text.Megaparsec.Lexer’ to ‘Text.Megaparsec.Char.Lexer’

Also numerous documentation improvements and some inlineable pragmas.

											
										
										
											2017-07-04 13:12:35 +03:00
+								-- like “Type variable @e0@ is ambiguous …”, you need to give an explicit
 								-- signature to your parser to resolve the ambiguity. It's a good idea to
 								-- provide type signatures for all top-level definitions.
-												renamed ‘MegaParsec’ → ‘Megaparsec’, close #10

											
										
										
											2015-08-01 19:24:45 +03:00
+								module Text.Megaparsec
-												Reorganize modules (#217)



											
										
										
											2017-06-14 22:12:18 +03:00
+								  ( -- * Re-exports
-												Add a note about ‘Control.Applicative.Combinators.NonEmpty’

											
										
										
											2017-07-30 19:14:08 +03:00
+								    -- $reexports
-												Format the source code with Ormolu

											
										
										
											2020-04-23 22:28:20 +03:00
+								    module Text.Megaparsec.Pos,
 								    module Text.Megaparsec.Error,
 								    module Text.Megaparsec.Stream,
 								    module Control.Monad.Combinators,
-												Reorganize modules (#217)



											
										
										
											2017-06-14 22:12:18 +03:00
+								    -- * Data types
-												Format the source code with Ormolu

											
										
										
											2020-04-23 22:28:20 +03:00
+								    State (..),
 								    PosState (..),
 								    Parsec,
 								    ParsecT,
-												Reorganize modules (#217)



											
										
										
											2017-06-14 22:12:18 +03:00
+								    -- * Running parser
-												Format the source code with Ormolu

											
										
										
											2020-04-23 22:28:20 +03:00
+								    parse,
 								    parseMaybe,
 								    parseTest,
 								    runParser,
 								    runParser',
 								    runParserT,
 								    runParserT',
-												Reorganize modules (#217)



											
										
										
											2017-06-14 22:12:18 +03:00
+								    -- * Primitive combinators
-												Format the source code with Ormolu

											
										
										
											2020-04-23 22:28:20 +03:00
+								    MonadParsec (..),
-												Allow registration of delayed parse errors

Megaparsec now supports registration of “delayed” parse errors. On lower
level we added a new field called ‘stateParseErrors’ to the ‘State’ record.
The type also had to change from ‘State s’ to ‘State s e’. This field
contains the list of registered ‘ParseErrors’ that do not end parsing
immediately but still will cause failure in the end if the list is not
empty. Users are expected to register parse errors using the three
functions: ‘registerParseError’, ‘registerFailure’, and
‘registerFancyFailure’. These functions are analogous to those without the
‘register’ prefix, except that they have “delayed” effect.

											
										
										
											2019-11-06 01:24:04 +03:00
+								    -- * Signaling parse errors
 								    -- $parse-errors
-												Format the source code with Ormolu

											
										
										
											2020-04-23 22:28:20 +03:00
+								    failure,
 								    fancyFailure,
 								    unexpected,
 								    customFailure,
 								    region,
 								    registerParseError,
 								    registerFailure,
 								    registerFancyFailure,
-												Reorganize modules (#217)



											
										
										
											2017-06-14 22:12:18 +03:00
+								    -- * Derivatives of primitive combinators
-												Format the source code with Ormolu

											
										
										
											2020-04-23 22:28:20 +03:00
+								    single,
 								    satisfy,
 								    anySingle,
 								    anySingleBut,
 								    oneOf,
 								    noneOf,
 								    chunk,
 								    (<?>),
 								    match,
 								    takeRest,
 								    atEnd,
-												Reorganize modules (#217)



											
										
										
											2017-06-14 22:12:18 +03:00
+								    -- * Parser state combinators
-												Format the source code with Ormolu

											
										
										
											2020-04-23 22:28:20 +03:00
+								    getInput,
 								    setInput,
 								    getSourcePos,
 								    getOffset,
 								    setOffset,
 								    setParserState,
 								  )
-												refactoring, phase 1

											
										
										
											2015-07-28 16:32:19 +03:00
+								where
-												Initial import

											
										
										
											2008-01-13 20:53:15 +03:00
-												Use parser combinators 0.4.0 (#269)


											
										
										
											2017-12-31 12:01:16 +03:00
+								import Control.Monad.Combinators
-												Reorganize modules (#217)



											
										
										
											2017-06-14 22:12:18 +03:00
+								import Control.Monad.Identity
 								import Data.List.NonEmpty (NonEmpty (..))
-												Format the source code with Ormolu

											
										
										
											2020-04-23 22:28:20 +03:00
+								import qualified Data.List.NonEmpty as NE
-												Extending stream (#229)


											
										
										
											2017-07-02 19:56:01 +03:00
+								import Data.Maybe (fromJust)
-												Re-organize error reporting functions

The methods ‘failure’ and ‘fancyFailure’ of ‘MonadParsec’ are now ordinary
functions and live in ‘Text.Megaparsec’. They are defined in terms of the
new ‘parseError’ method of ‘MonadParsec’. This method allows us to signal
parse errors at a given offset without manipulating parser state manually.

											
										
										
											2019-11-05 14:09:05 +03:00
+								import Data.Set (Set)
-												Format the source code with Ormolu

											
										
										
											2020-04-23 22:28:20 +03:00
+								import qualified Data.Set as E
-												Add ‘Text.Megaparsec.Internal’ (#288)

											
										
										
											2018-03-27 17:40:20 +03:00
+								import Text.Megaparsec.Class
-												Speed-up numeric parsers (#232)


											
										
										
											2017-07-09 20:12:23 +03:00
+								import Text.Megaparsec.Error
-												Add ‘Text.Megaparsec.Internal’ (#288)

											
										
										
											2018-03-27 17:40:20 +03:00
+								import Text.Megaparsec.Internal
-												Speed-up numeric parsers (#232)


											
										
										
											2017-07-09 20:12:23 +03:00
+								import Text.Megaparsec.Pos
-												Add ‘Text.Megaparsec.Internal’ (#288)

											
										
										
											2018-03-27 17:40:20 +03:00
+								import Text.Megaparsec.State
-												Speed-up numeric parsers (#232)


											
										
										
											2017-07-09 20:12:23 +03:00
+								import Text.Megaparsec.Stream
-												re-export ‘(<|>)’, ‘many’, ‘some’, and ‘optional’, fixes #9

These functions are now re-exported from ‘Control.Applicative’
module. ‘many’ and ‘some’ are now part of ‘Alternative’ instance of
‘ParsecT’.

Note that these functions are re-exported only in ‘Text.MegaParsec’
module, but not in ‘Text.MegaParsec.Prim’ to avoid duplication of
floating doc-strings. Others internal modules now just casually import
‘Control.Applicative’ for their needs.

Note that ‘many1’ was renamed to ‘some’, the same is done for other
parsers that had ‘many1’ part in their names (for consistency).

											
										
										
											2015-08-01 17:39:20 +03:00
-												Add a note about ‘Control.Applicative.Combinators.NonEmpty’

											
										
										
											2017-07-30 19:14:08 +03:00
+								-- $reexports
 								--
-												Add a note about monadic vs applicative combinators

											
										
										
											2018-03-27 18:19:55 +03:00
+								-- Note that we re-export monadic combinators from
 								-- "Control.Monad.Combinators" because these are more efficient than
 								-- 'Applicative'-based ones. Thus 'many' and 'some' may clash with the
 								-- functions from "Control.Applicative". You need to hide the functions like
 								-- this:
 								--
 								-- > import Control.Applicative hiding (many, some)
 								--
-												Promote ‘Control.Monad.Combinators.NonEmpty’ in the docs

[skip ci]

											
										
										
											2017-12-31 12:05:27 +03:00
+								-- Also note that you can import "Control.Monad.Combinators.NonEmpty" if you
 								-- wish that combinators like 'some' return 'NonEmpty' lists. The module
 								-- lives in the @parser-combinators@ package (you need at least version
 								-- /0.4.0/).
-												Add a note about ‘Control.Applicative.Combinators.NonEmpty’

											
										
										
											2017-07-30 19:14:08 +03:00
+								--
 								-- This module is intended to be imported qualified:
 								--
-												Promote ‘Control.Monad.Combinators.NonEmpty’ in the docs

[skip ci]

											
										
										
											2017-12-31 12:05:27 +03:00
+								-- > import qualified Control.Monad.Combinators.NonEmpty as NE
-												Use offset in parse errors (#313)

The change allows to speed-up parsers in most cases and re-use the fact that
we're traversing input stream on pretty-printing ‘ParseError’s anyway.
											
										
										
											2018-08-20 19:35:10 +03:00
+								--
 								-- Other modules of interest are:
 								--
 								--     * "Control.Monad.Combinators.Expr" for parsing of expressions.
 								--     * "Control.Applicative.Permutations" for parsing of permutation
 								--       phrases.
-												Add a note about ‘Control.Applicative.Combinators.NonEmpty’

											
										
										
											2017-07-30 19:14:08 +03:00
-												Reorganize modules (#217)



											
										
										
											2017-06-14 22:12:18 +03:00
+								----------------------------------------------------------------------------
 								-- Data types
-												Documentation corrections and improvements

											
										
										
											2017-07-25 12:43:24 +03:00
+								-- | 'Parsec' is a non-transformer variant of the more general 'ParsecT'
-												Reorganize modules (#217)



											
										
										
											2017-06-14 22:12:18 +03:00
+								-- monad transformer.
 								--
 								-- The synonym fixes the underlying monad of 'ParsecT' to 'Identity'.
 								type Parsec e s = ParsecT e s Identity
 								----------------------------------------------------------------------------
 								-- Running a parser
-												Misc improvements in the docs

											
										
										
											2018-09-04 22:24:28 +03:00
-- | @'parse' p file input@ runs the parser @p@ over 'Identity' on @input@.
-- The result is either a 'ParseErrorBundle' ('Left') or a value of type @a@
-- ('Right').
--
-- 'parse' is merely another name for 'runParser'; see 'runParserT' if you
-- are working with the 'ParsecT' monad transformer. Use 'errorBundlePretty'
-- to turn a 'ParseErrorBundle' into the string representation of the error
-- message, and see "Text.Megaparsec.Error" for more advanced error
-- analysis.
--
-- > main = case parse numbers "" "11,2,43" of
-- >          Left bundle -> putStr (errorBundlePretty bundle)
-- >          Right xs -> print (sum xs)
-- >
-- > numbers = decimal `sepBy` char ','
parse ::
  -- | Parser to run
  Parsec e s a ->
  -- | Name of source file
  String ->
  -- | Input for parser
  s ->
  Either (ParseErrorBundle s e) a
parse p name input = runParser p name input
-												Rename ‘Text.Megaparsec.Lexer’ to ‘Text.Megaparsec.Char.Lexer’

Also numerous documentation improvements and some inlineable pragmas.

											
										
										
											2017-07-04 13:12:35 +03:00
-- | @'parseMaybe' p input@ runs the parser @p@ on @input@, yielding the
-- result wrapped in 'Just' on success and 'Nothing' on failure. 'eof' is
-- parsed after @p@, so a parser that leaves some of the input unconsumed
-- fails.
--
-- This function is meant for lightweight parsing where error messages (and
-- thus file names) do not matter and the entire input should be consumed,
-- for example when parsing a single number according to a specification of
-- its format.
parseMaybe :: (Ord e, Stream s) => Parsec e s a -> s -> Maybe a
parseMaybe p s =
  -- The error bundle is discarded; only success or failure is reported.
  either (const Nothing) Just (parse (p <* eof) "" s)
-												Improve the writing

											
										
										
											2021-04-25 16:49:13 +03:00
-- | @'parseTest' p input@ applies the parser @p@ to @input@ and prints the
-- outcome to stdout: the pretty-printed error bundle on failure, or the
-- 'show'n result on success. Useful for testing.
parseTest ::
  ( ShowErrorComponent e,
    Show a,
    VisualStream s,
    TraversableStream s
  ) =>
  -- | Parser to run
  Parsec e s a ->
  -- | Input for parser
  s ->
  IO ()
parseTest p input =
  either (putStr . errorBundlePretty) print (parse p "" input)
-												Rename ‘Text.Megaparsec.Lexer’ to ‘Text.Megaparsec.Char.Lexer’

Also numerous documentation improvements and some inlineable pragmas.

											
										
										
											2017-07-04 13:12:35 +03:00
-- | @'runParser' p file input@ runs the parser @p@ on the input stream of
-- tokens @input@, obtained from the source @file@. The @file@ name appears
-- only in error messages and may be the empty string. The result is either
-- a 'ParseErrorBundle' ('Left') or a value of type @a@ ('Right').
--
-- > parseFromFile p file = runParser p file <$> readFile file
runParser ::
  -- | Parser to run
  Parsec e s a ->
  -- | Name of source file
  String ->
  -- | Input for parser
  s ->
  Either (ParseErrorBundle s e) a
runParser p name s = result
  where
    -- The final parser state is not needed here, only the outcome.
    (_, result) = runParser' p (initialState name s)
 								-- | The function is similar to 'runParser' with the difference that it
-												Improve the writing

											
										
										
											2021-04-25 16:49:13 +03:00
+								-- accepts and returns the parser state. This allows us e.g. to specify
 								-- arbitrary textual position at the beginning of parsing. This is the most
 								-- general way to run a parser over the 'Identity' monad.
-												Reorganize modules (#217)



											
										
										
											2017-06-14 22:12:18 +03:00
+								--
 								-- @since 4.2.0
-												Format the source code with Ormolu

											
										
										
											2020-04-23 22:28:20 +03:00
runParser' ::
  -- | Parser to run
  Parsec e s a ->
  -- | Initial state
  State s e ->
  (State s e, Either (ParseErrorBundle s e) a)
runParser' p s =
  -- Run the transformer version and unwrap the 'Identity' layer.
  runIdentity (runParserT' p s)
-												Rename ‘Text.Megaparsec.Lexer’ to ‘Text.Megaparsec.Char.Lexer’

Also numerous documentation improvements and some inlineable pragmas.

											
										
										
											2017-07-04 13:12:35 +03:00
-- | @'runParserT' p file input@ runs the parser @p@ on the input stream of
-- tokens @input@, obtained from the source @file@. The @file@ name appears
-- only in error messages and may be the empty string. The result is a
-- computation in the underlying monad @m@ that yields either a
-- 'ParseErrorBundle' ('Left') or a value of type @a@ ('Right').
runParserT ::
  Monad m =>
  -- | Parser to run
  ParsecT e s m a ->
  -- | Name of source file
  String ->
  -- | Input for parser
  s ->
  m (Either (ParseErrorBundle s e) a)
runParserT p name s = fmap snd (runParserT' p start)
  where
    -- Fresh state for the given source name and input.
    start = initialState name s
-												Reorganize modules (#217)



											
										
										
											2017-06-14 22:12:18 +03:00
 								-- | This function is similar to 'runParserT', but like 'runParser'' it
 								-- accepts and returns parser state. This is thus the most general way to
 								-- run a parser.
 								--
 								-- @since 4.2.0
-												Format the source code with Ormolu

											
										
										
											2020-04-23 22:28:20 +03:00
runParserT' ::
  Monad m =>
  -- | Parser to run
  ParsecT e s m a ->
  -- | Initial state
  State s e ->
  m (State s e, Either (ParseErrorBundle s e) a)
runParserT' p s = do
  Reply s' _ result <- runParsecT p s
  let -- Delayed errors registered during the run.
      delayed = stateParseErrors s'
      -- Errors are sorted by offset; the position state of the /initial/
      -- parser state is the one stored in the bundle.
      bundle errs =
        ParseErrorBundle
          { bundleErrors = NE.sortWith errorOffset errs,
            bundlePosState = statePosState s
          }
      failWith errs = (s', Left (bundle errs))
  return $ case result of
    -- A hard failure is reported together with all delayed errors.
    Error e -> failWith (e :| delayed)
    -- Success only counts when no delayed errors have been registered.
    OK x -> maybe (s', Right x) failWith (NE.nonEmpty delayed)
-												Reorganize modules (#217)



											
										
										
											2017-06-14 22:12:18 +03:00
-												Improve the writing

											
										
										
											2021-04-25 16:49:13 +03:00
-- | Construct the initial parser state from the name of the source file and
-- the input. Both offsets start at 0, the source position is 'initialPos'
-- of the given name, the tab width is 'defaultTabWidth', and no delayed
-- parse errors are registered.
initialState :: String -> s -> State s e
initialState name s =
  State
    { stateInput = s,
      stateOffset = 0,
      statePosState = posState,
      stateParseErrors = []
    }
  where
    -- Position-tracking state; it starts from the same input as the parser.
    posState =
      PosState
        { pstateInput = s,
          pstateOffset = 0,
          pstateSourcePos = initialPos name,
          pstateTabWidth = defaultTabWidth,
          pstateLinePrefix = ""
        }
-												Reorganize modules (#217)



											
										
										
											2017-06-14 22:12:18 +03:00
-												Allow registration of delayed parse errors

Megaparsec now supports registration of “delayed” parse errors. On lower
level we added a new field called ‘stateParseErrors’ to the ‘State’ record.
The type also had to change from ‘State s’ to ‘State s e’. This field
contains the list of registered ‘ParseErrors’ that do not end parsing
immediately but still will cause failure in the end if the list is not
empty. Users are expected to register parse errors using the three
functions: ‘registerParseError’, ‘registerFailure’, and
‘registerFancyFailure’. These functions are analogous to those without the
‘register’ prefix, except that they have “delayed” effect.

											
										
										
											2019-11-06 01:24:04 +03:00
+								----------------------------------------------------------------------------
 								-- Signaling parse errors
 								-- $parse-errors
 								--
 								-- The most general function to fail and end parsing is 'parseError'. The
 								-- functions in this section are built on top of it. The section also
 								-- includes functions starting with the @register@ prefix, which allow
 								-- users to register “delayed” 'ParseError's.
 								-- | Stop parsing and report a trivial 'ParseError'.
 								--
 								-- @since 6.0.0
-												Format the source code with Ormolu

											
										
										
											2020-04-23 22:28:20 +03:00
failure ::
  MonadParsec e s m =>
  -- | Unexpected item (if any)
  Maybe (ErrorItem (Token s)) ->
  -- | Expected items
  Set (ErrorItem (Token s)) ->
  m a
failure us ps =
  -- The error is reported at the current offset.
  getOffset >>= \o -> parseError (TrivialError o us ps)
{-# INLINE failure #-}
 								-- | Stop parsing and report a fancy 'ParseError'. To report a single custom
 								-- parse error, see 'Text.Megaparsec.customFailure'.
 								--
 								-- @since 6.0.0
-												Format the source code with Ormolu

											
										
										
											2020-04-23 22:28:20 +03:00
fancyFailure ::
  MonadParsec e s m =>
  -- | Fancy error components
  Set (ErrorFancy e) ->
  m a
fancyFailure xs =
  -- The error is reported at the current offset.
  getOffset >>= \o -> parseError (FancyError o xs)
{-# INLINE fancyFailure #-}
 								-- | @'unexpected' item@ is a parser that fails without consuming any input,
 								-- producing an error message about the unexpected item @item@. The set of
 								-- expected items is left empty.
 								--
 								-- > unexpected item = failure (Just item) Set.empty
 								unexpected :: MonadParsec e s m => ErrorItem (Token s) -> m a
 								unexpected item = failure found E.empty
 								  where
 								    found = Just item
 								{-# INLINE unexpected #-}
 								-- | Fail with a single custom parse error. 'fancyFailure' is the more
 								-- general version that accepts a whole set of fancy error components.
 								--
 								-- > customFailure = fancyFailure . Set.singleton . ErrorCustom
 								--
 								-- @since 6.3.0
 								customFailure :: MonadParsec e s m => e -> m a
 								customFailure e = fancyFailure (E.singleton (ErrorCustom e))
 								{-# INLINE customFailure #-}
 								-- | Specify how to process 'ParseError's that happen inside of this
 								-- wrapper. This applies to both normal and delayed 'ParseError's.
 								--
 								-- As a side-effect of the implementation the inner computation will start
-												Fix a typo

											
										
										
											2022-10-21 21:26:14 +03:00
+								-- with an empty collection of delayed errors and they will be updated and
-												Allow registration of delayed parse errors

Megaparsec now supports registration of “delayed” parse errors. On lower
level we added a new field called ‘stateParseErrors’ to the ‘State’ record.
The type also had to change from ‘State s’ to ‘State s e’. This field
contains the list of registered ‘ParseErrors’ that do not end parsing
immediately but still will cause failure in the end if the list is not
empty. Users are expected to register parse errors using the three
functions: ‘registerParseError’, ‘registerFailure’, and
‘registerFancyFailure’. These functions are analogous to those without the
‘register’ prefix, except that they have “delayed” effect.

											
										
										
											2019-11-06 01:24:04 +03:00
+								-- “restored” on the way out of 'region'.
 								--
 								-- @since 5.3.0
-												Format the source code with Ormolu

											
										
										
											2020-04-23 22:28:20 +03:00
region ::
  MonadParsec e s m =>
  -- | How to process 'ParseError's
  (ParseError s e -> ParseError s e) ->
  -- | The “region” that the processing applies to
  m a ->
  m a
region f m = do
  -- Set aside the delayed errors registered so far and let the inner
  -- computation start with an empty collection.
  outer <- stateParseErrors <$> getParserState
  updateParserState (\st -> st {stateParseErrors = []})
  outcome <- observing m
  -- Only the delayed errors registered inside the region are transformed;
  -- the ones set aside earlier are appended back unchanged.
  updateParserState $ \st ->
    st {stateParseErrors = map f (stateParseErrors st) ++ outer}
  -- A hard failure of the inner computation is transformed and re-thrown.
  either (parseError . f) return outcome
{-# INLINEABLE region #-}
 								-- | Register a 'ParseError' for later reporting. This action does not end
 								-- parsing; its only effect is to add the given 'ParseError' to the
 								-- collection of “delayed” 'ParseError's, which is taken into consideration
 								-- at the end of parsing. The parser succeeds only if this collection is
 								-- empty. This is the main way to report several parse errors at once.
 								--
 								-- @since 8.0.0
 								registerParseError :: MonadParsec e s m => ParseError s e -> m ()
 								registerParseError e = updateParserState addDelayed
 								  where
 								    -- The newly registered error goes to the front of the collection.
 								    addDelayed st = st {stateParseErrors = e : stateParseErrors st}
 								{-# INLINE registerParseError #-}
 								-- | Like 'failure', but for delayed 'ParseError's.
 								--
 								-- @since 8.0.0
-												Format the source code with Ormolu

											
										
										
											2020-04-23 22:28:20 +03:00
+								registerFailure ::
 								  MonadParsec e s m =>
 								  -- | Unexpected item (if any)
 								  Maybe (ErrorItem (Token s)) ->
 								  -- | Expected items
 								  Set (ErrorItem (Token s)) ->
 								  m ()
-												Allow registration of delayed parse errors

Megaparsec now supports registration of “delayed” parse errors. On lower
level we added a new field called ‘stateParseErrors’ to the ‘State’ record.
The type also had to change from ‘State s’ to ‘State s e’. This field
contains the list of registered ‘ParseErrors’ that do not end parsing
immediately but still will cause failure in the end if the list is not
empty. Users are expected to register parse errors using the three
functions: ‘registerParseError’, ‘registerFailure’, and
‘registerFancyFailure’. These functions are analogous to those without the
‘register’ prefix, except that they have “delayed” effect.

											
										
										
											2019-11-06 01:24:04 +03:00
+								registerFailure us ps =
 								  -- The delayed error is stamped with the offset at the time of the call.
 								  getOffset >>= \offset ->
 								    registerParseError (TrivialError offset us ps)
 								{-# INLINE registerFailure #-}
 								-- | Like 'fancyFailure', but for delayed 'ParseError's.
 								--
 								-- @since 8.0.0
-												Format the source code with Ormolu

											
										
										
											2020-04-23 22:28:20 +03:00
+								registerFancyFailure ::
 								  MonadParsec e s m =>
 								  -- | Fancy error components
 								  Set (ErrorFancy e) ->
 								  m ()
-												Allow registration of delayed parse errors

Megaparsec now supports registration of “delayed” parse errors. On lower
level we added a new field called ‘stateParseErrors’ to the ‘State’ record.
The type also had to change from ‘State s’ to ‘State s e’. This field
contains the list of registered ‘ParseErrors’ that do not end parsing
immediately but still will cause failure in the end if the list is not
empty. Users are expected to register parse errors using the three
functions: ‘registerParseError’, ‘registerFailure’, and
‘registerFancyFailure’. These functions are analogous to those without the
‘register’ prefix, except that they have “delayed” effect.

											
										
										
											2019-11-06 01:24:04 +03:00
+								registerFancyFailure xs =
 								  -- The delayed error is stamped with the offset at the time of the call.
 								  getOffset >>= \offset ->
 								    registerParseError (FancyError offset xs)
 								{-# INLINE registerFancyFailure #-}
-												Reorganize modules (#217)



											
										
										
											2017-06-14 22:12:18 +03:00
+								----------------------------------------------------------------------------
 								-- Derivatives of primitive combinators
-												Move general-enough combinators to ‘Text.Megaparsec’ (#267)


											
										
										
											2018-01-08 18:39:39 +03:00
+								-- | @'single' t@ only matches the single token @t@.
 								--
 								-- > semicolon = single ';'
 								--
 								-- See also: 'token', 'anySingle', 'Text.Megaparsec.Byte.char',
 								-- 'Text.Megaparsec.Char.char'.
 								--
 								-- @since 7.0.0
-												Format the source code with Ormolu

											
										
										
											2020-04-23 22:28:20 +03:00
+								single ::
 								  MonadParsec e s m =>
 								  -- | Token to match
 								  Token s ->
 								  m (Token s)
-												Move general-enough combinators to ‘Text.Megaparsec’ (#267)


											
										
										
											2018-01-08 18:39:39 +03:00
+								single t = token testToken expected
 								  where
 								    testToken x = if x == t then Just x else Nothing
-												Format the source code with Ormolu

											
										
										
											2020-04-23 22:28:20 +03:00
+								    expected = E.singleton (Tokens (t :| []))
-												Move general-enough combinators to ‘Text.Megaparsec’ (#267)


											
										
										
											2018-01-08 18:39:39 +03:00
+								{-# INLINE single #-}
 								-- | The parser @'satisfy' f@ succeeds for any token for which the supplied
-												Numerous documentation corrections

											
										
										
											2018-11-07 08:21:00 +03:00
+								-- function @f@ returns 'True'.
-												Move general-enough combinators to ‘Text.Megaparsec’ (#267)


											
										
										
											2018-01-08 18:39:39 +03:00
+								--
 								-- > digitChar = satisfy isDigit <?> "digit"
 								-- > oneOf cs  = satisfy (`elem` cs)
 								--
-												Add a performance note to the dos of ‘satisfy’

Close #434.

											
										
										
											2020-12-14 14:08:57 +03:00
+								-- __Performance note__: when you need to parse a single token, it is often
 								-- a good idea to use 'satisfy' with the right predicate function instead of
 								-- creating a complex parser using the combinators.
 								--
-												Move general-enough combinators to ‘Text.Megaparsec’ (#267)


											
										
										
											2018-01-08 18:39:39 +03:00
+								-- See also: 'anySingle', 'anySingleBut', 'oneOf', 'noneOf'.
 								--
 								-- @since 7.0.0
-												Format the source code with Ormolu

											
										
										
											2020-04-23 22:28:20 +03:00
+								satisfy ::
 								  MonadParsec e s m =>
 								  -- | Predicate to apply
 								  (Token s -> Bool) ->
 								  m (Token s)
-												Move general-enough combinators to ‘Text.Megaparsec’ (#267)


											
										
										
											2018-01-08 18:39:39 +03:00
+								satisfy f = token accept E.empty
 								  where
 								    -- Keep the token only when the predicate holds for it.
 								    accept tok
 								      | f tok = Just tok
 								      | otherwise = Nothing
 								{-# INLINE satisfy #-}
 								-- | Parse and return a single token. It's a good idea to attach a 'label'
-												Numerous documentation corrections

											
										
										
											2018-11-07 08:21:00 +03:00
+								-- to this parser.
-												Move general-enough combinators to ‘Text.Megaparsec’ (#267)


											
										
										
											2018-01-08 18:39:39 +03:00
+								--
 								-- > anySingle = satisfy (const True)
 								--
 								-- See also: 'satisfy', 'anySingleBut'.
 								--
 								-- @since 7.0.0
 								anySingle :: MonadParsec e s m => m (Token s)
 								anySingle = satisfy (\_ -> True)
 								{-# INLINE anySingle #-}
 								-- | Match any token but the given one. It's a good idea to attach a 'label'
-												Numerous documentation corrections

											
										
										
											2018-11-07 08:21:00 +03:00
+								-- to this parser.
-												Move general-enough combinators to ‘Text.Megaparsec’ (#267)


											
										
										
											2018-01-08 18:39:39 +03:00
+								--
 								-- > anySingleBut t = satisfy (/= t)
 								--
 								-- See also: 'single', 'anySingle', 'satisfy'.
 								--
 								-- @since 7.0.0
-												Format the source code with Ormolu

											
										
										
											2020-04-23 22:28:20 +03:00
+								anySingleBut ::
 								  MonadParsec e s m =>
 								  -- | Token we should not match
 								  Token s ->
 								  m (Token s)
-												Move general-enough combinators to ‘Text.Megaparsec’ (#267)


											
										
										
											2018-01-08 18:39:39 +03:00
+								anySingleBut t = satisfy (/= t)
 								{-# INLINE anySingleBut #-}
 								-- | @'oneOf' ts@ succeeds if the current token is in the supplied
 								-- collection of tokens @ts@. Returns the parsed token. Note that this
 								-- parser cannot automatically generate the “expected” component of the
 								-- error message, so usually you should label it manually with 'label' or ('<?>').
 								--
 								-- > oneOf cs = satisfy (`elem` cs)
 								--
 								-- See also: 'satisfy'.
 								--
 								-- > digit = oneOf ['0'..'9'] <?> "digit"
 								--
 								-- __Performance note__: prefer 'satisfy' when you can because it's faster
 								-- when you have only a couple of tokens to compare to:
 								--
 								-- > quoteFast = satisfy (\x -> x == '\'' || x == '\"')
 								-- > quoteSlow = oneOf "'\""
 								--
 								-- @since 7.0.0
-												Format the source code with Ormolu

											
										
										
											2020-04-23 22:28:20 +03:00
+								oneOf ::
 								  (Foldable f, MonadParsec e s m) =>
 								  -- | Collection of matching tokens
 								  f (Token s) ->
 								  m (Token s)
-												Move general-enough combinators to ‘Text.Megaparsec’ (#267)


											
										
										
											2018-01-08 18:39:39 +03:00
+								oneOf cs = satisfy (`elem` cs)
 								{-# INLINE oneOf #-}
 								-- | As the dual of 'oneOf', @'noneOf' ts@ succeeds if the current token is
 								-- /not/ in the supplied collection of tokens @ts@. Returns the parsed token.
 								-- Note that this parser cannot automatically generate the “expected”
 								-- component of the error message, so usually you should label it manually
 								-- with 'label' or ('<?>').
 								--
 								-- > noneOf cs = satisfy (`notElem` cs)
 								--
 								-- See also: 'satisfy'.
 								--
-												Numerous documentation corrections

											
										
										
											2018-11-07 08:21:00 +03:00
+								-- __Performance note__: prefer 'satisfy' and 'anySingleBut' when you can
-												Move general-enough combinators to ‘Text.Megaparsec’ (#267)


											
										
										
											2018-01-08 18:39:39 +03:00
+								-- because it's faster.
 								--
 								-- @since 7.0.0
-												Format the source code with Ormolu

											
										
										
											2020-04-23 22:28:20 +03:00
+								noneOf ::
 								  (Foldable f, MonadParsec e s m) =>
 								  -- | Collection of tokens we should not match
 								  f (Token s) ->
 								  m (Token s)
-												Move general-enough combinators to ‘Text.Megaparsec’ (#267)


											
										
										
											2018-01-08 18:39:39 +03:00
+								noneOf cs = satisfy (`notElem` cs)
 								{-# INLINE noneOf #-}
 								-- | @'chunk' chk@ only matches the chunk @chk@.
 								--
 								-- > divOrMod = chunk "div" <|> chunk "mod"
 								--
 								-- See also: 'tokens', 'Text.Megaparsec.Char.string',
 								-- 'Text.Megaparsec.Byte.string'.
 								--
 								-- @since 7.0.0
-												Format the source code with Ormolu

											
										
										
											2020-04-23 22:28:20 +03:00
+								chunk ::
 								  MonadParsec e s m =>
 								  -- | Chunk to match
 								  Tokens s ->
 								  m (Tokens s)
-												Move general-enough combinators to ‘Text.Megaparsec’ (#267)


											
										
										
											2018-01-08 18:39:39 +03:00
+								chunk = tokens (==)
 								{-# INLINE chunk #-}
-												Reorganize modules (#217)



											
										
										
											2017-06-14 22:12:18 +03:00
+								-- | Operator form of 'label': @p '<?>' name@ is the same as @'label' name p@.
 								infix 0 <?>
 								(<?>) :: MonadParsec e s m => m a -> String -> m a
 								(<?>) = \parser name -> label name parser
-												Extending stream (#229)


											
										
										
											2017-07-02 19:56:01 +03:00
+								{-# INLINE (<?>) #-}
-												Reorganize modules (#217)



											
										
										
											2017-06-14 22:12:18 +03:00
-												Documentation corrections and improvements

											
										
										
											2017-07-25 12:43:24 +03:00
+								-- | Return both the result of a parse and a chunk of input that was
-												Misc improvements in the docs

											
										
										
											2018-09-04 22:24:28 +03:00
+								-- consumed during parsing. This relies on the change of the 'stateOffset'
 								-- value to evaluate how many tokens were consumed. If you mess with it
 								-- manually in the argument parser, prepare for troubles.
-												re-export ‘(<|>)’, ‘many’, ‘some’, and ‘optional’, fixes #9

These functions are now re-exported from ‘Control.Applicative’
module. ‘many’ and ‘some’ are now part of ‘Alternative’ instance of
‘ParsecT’.

Note that these functions are re-exported only in ‘Text.MegaParsec’
module, but not in ‘Text.MegaParsec.Prim’ to avoid duplication of
floating doc-strings. Others internal modules now just casually import
‘Control.Applicative’ for their needs.

Note that ‘many1’ was renamed to ‘some’, the same is done for other
parsers that had ‘many1’ part in their names (for consistency).

											
										
										
											2015-08-01 17:39:20 +03:00
+								--
-												Reorganize modules (#217)



											
										
										
											2017-06-14 22:12:18 +03:00
+								-- @since 5.3.0
-												Extending stream (#229)


											
										
										
											2017-07-02 19:56:01 +03:00
+								match :: MonadParsec e s m => m a -> m (Tokens s, a)
-												Reorganize modules (#217)



											
										
										
											2017-06-14 22:12:18 +03:00
+								match p = do
-												Format the source code with Ormolu

											
										
										
											2020-04-23 22:28:20 +03:00
+								  o <- getOffset
 								  s <- getInput
 								  r <- p
-												Use offset in parse errors (#313)

The change allows to speed-up parsers in most cases and re-use the fact that
we're traversing input stream on pretty-printing ‘ParseError’s anyway.
											
										
										
											2018-08-20 19:35:10 +03:00
+								  o' <- getOffset
-												Extending stream (#229)


											
										
										
											2017-07-02 19:56:01 +03:00
+								  -- NOTE The 'fromJust' call here should never fail because if the stream
 								  -- is empty before 'p' (the only case when 'takeN_' can return 'Nothing'
 								  -- as per its invariants), (o' - o) won't be greater than 0, and in that
 								  -- case 'Just' is guaranteed to be returned as per another invariant of
 								  -- 'takeN_'.
-												Use offset in parse errors (#313)

The change allows to speed-up parsers in most cases and re-use the fact that
we're traversing input stream on pretty-printing ‘ParseError’s anyway.
											
										
										
											2018-08-20 19:35:10 +03:00
+								  return ((fst . fromJust) (takeN_ (o' - o) s), r)
-												Extending stream (#229)


											
										
										
											2017-07-02 19:56:01 +03:00
+								{-# INLINEABLE match #-}
-												Reorganize modules (#217)



											
										
										
											2017-06-14 22:12:18 +03:00
-												Add ‘takeP’, ‘takeRest’, and ‘atEnd’

											
										
										
											2017-07-03 15:34:53 +03:00
+								-- | Consume the rest of the input and return it as a chunk. This parser
-												Misc improvements in the docs

											
										
										
											2018-09-04 22:24:28 +03:00
+								-- never fails, but may return the empty chunk.
-												Add ‘takeP’, ‘takeRest’, and ‘atEnd’

											
										
										
											2017-07-03 15:34:53 +03:00
+								--
 								-- > takeRest = takeWhileP Nothing (const True)
-												Char and byte modules (#230)


											
										
										
											2017-07-03 14:34:00 +03:00
+								--
 								-- @since 6.0.0
-												Add ‘takeP’, ‘takeRest’, and ‘atEnd’

											
										
										
											2017-07-03 15:34:53 +03:00
+								takeRest :: MonadParsec e s m => m (Tokens s)
 								takeRest = takeWhileP Nothing (\_ -> True)
 								{-# INLINE takeRest #-}
-												Extending stream (#229)


											
										
										
											2017-07-02 19:56:01 +03:00
-												Add ‘takeP’, ‘takeRest’, and ‘atEnd’

											
										
										
											2017-07-03 15:34:53 +03:00
+								-- | Return 'True' when end of input has been reached.
-												Char and byte modules (#230)


											
										
										
											2017-07-03 14:34:00 +03:00
+								--
-												Move general-enough combinators to ‘Text.Megaparsec’ (#267)


											
										
										
											2018-01-08 18:39:39 +03:00
+								-- > atEnd = option False (True <$ hidden eof)
 								--
-												Char and byte modules (#230)


											
										
										
											2017-07-03 14:34:00 +03:00
+								-- @since 6.0.0
-												Add ‘takeP’, ‘takeRest’, and ‘atEnd’

											
										
										
											2017-07-03 15:34:53 +03:00
+								atEnd :: MonadParsec e s m => m Bool
-												Make ‘atEnd’ not produce hints (#264)


											
										
										
											2017-12-17 09:03:56 +03:00
+								atEnd = option False (True <$ hidden eof)
-												Add ‘takeP’, ‘takeRest’, and ‘atEnd’

											
										
										
											2017-07-03 15:34:53 +03:00
+								{-# INLINE atEnd #-}
-												Reorganize modules (#217)



											
										
										
											2017-06-14 22:12:18 +03:00
 								----------------------------------------------------------------------------
 								-- Parser state combinators
 								-- | Return the current input, i.e. the 'stateInput' field of the parser
 								-- state.
 								getInput :: MonadParsec e s m => m s
 								getInput = fmap stateInput getParserState
-												Inline more

											
										
										
											2018-05-01 10:23:52 +03:00
+								{-# INLINE getInput #-}
-												re-export ‘(<|>)’, ‘many’, ‘some’, and ‘optional’, fixes #9

These functions are now re-exported from ‘Control.Applicative’
module. ‘many’ and ‘some’ are now part of ‘Alternative’ instance of
‘ParsecT’.

Note that these functions are re-exported only in ‘Text.MegaParsec’
module, but not in ‘Text.MegaParsec.Prim’ to avoid duplication of
floating doc-strings. Others internal modules now just casually import
‘Control.Applicative’ for their needs.

Note that ‘many1’ was renamed to ‘some’, the same is done for other
parsers that had ‘many1’ part in their names (for consistency).

											
										
										
											2015-08-01 17:39:20 +03:00
-												Move general-enough combinators to ‘Text.Megaparsec’ (#267)


											
										
										
											2018-01-08 18:39:39 +03:00
+								-- | @'setInput' input@ continues parsing with @input@.
-												Reorganize modules (#217)



											
										
										
											2017-06-14 22:12:18 +03:00
+								setInput :: MonadParsec e s m => s -> m ()
-												Allow registration of delayed parse errors

Megaparsec now supports registration of “delayed” parse errors. On lower
level we added a new field called ‘stateParseErrors’ to the ‘State’ record.
The type also had to change from ‘State s’ to ‘State s e’. This field
contains the list of registered ‘ParseErrors’ that do not end parsing
immediately but still will cause failure in the end if the list is not
empty. Users are expected to register parse errors using the three
functions: ‘registerParseError’, ‘registerFailure’, and
‘registerFancyFailure’. These functions are analogous to those without the
‘register’ prefix, except that they have “delayed” effect.

											
										
										
											2019-11-06 01:24:04 +03:00
+								setInput s = updateParserState (\st -> st {stateInput = s})
-												Inline more

											
										
										
											2018-05-01 10:23:52 +03:00
+								{-# INLINE setInput #-}
-												Reorganize modules (#217)



											
										
										
											2017-06-14 22:12:18 +03:00
-												Use offset in parse errors (#313)

The change allows to speed-up parsers in most cases and re-use the fact that
we're traversing input stream on pretty-printing ‘ParseError’s anyway.
											
										
										
											2018-08-20 19:35:10 +03:00
+								-- | Return the current source position. This function /is not cheap/: do
 								-- not call it, for example, on every matched token. You can still use it
 								-- to get a 'SourcePos' to attach to things that you parse.
-												Move general-enough combinators to ‘Text.Megaparsec’ (#267)


											
										
										
											2018-01-08 18:39:39 +03:00
+								--
-												Numerous documentation corrections

											
										
										
											2018-11-07 08:21:00 +03:00
+								-- The function works under the assumption that we move in the input stream
 								-- only forwards and never backwards, which is always true unless the user
 								-- abuses the library.
-												re-export ‘(<|>)’, ‘many’, ‘some’, and ‘optional’, fixes #9

These functions are now re-exported from ‘Control.Applicative’
module. ‘many’ and ‘some’ are now part of ‘Alternative’ instance of
‘ParsecT’.

Note that these functions are re-exported only in ‘Text.MegaParsec’
module, but not in ‘Text.MegaParsec.Prim’ to avoid duplication of
floating doc-strings. Others internal modules now just casually import
‘Control.Applicative’ for their needs.

Note that ‘many1’ was renamed to ‘some’, the same is done for other
parsers that had ‘many1’ part in their names (for consistency).

											
										
										
											2015-08-01 17:39:20 +03:00
+								--
-												Use offset in parse errors (#313)

The change allows to speed-up parsers in most cases and re-use the fact that
we're traversing input stream on pretty-printing ‘ParseError’s anyway.
											
										
										
											2018-08-20 19:35:10 +03:00
+								-- @since 7.0.0
-												Decouple the error reporting-related methods from ‘Stream’

Split the ‘Stream’ type class. The methods ‘showTokens’ and ‘tokensLength’
have been put into a separate type class ‘VisualStream’, while ‘reachOffset’
and ‘reachOffsetNoLine’ are now in ‘TraversableStream’. This should make
defining ‘Stream’ instances for custom streams easier.

Defined ‘Stream’ instances for lists and ‘Seq’s.

											
										
										
											2020-06-26 14:55:55 +03:00
+								getSourcePos :: (TraversableStream s, MonadParsec e s m) => m SourcePos
-												Use offset in parse errors (#313)

The change allows to speed-up parsers in most cases and re-use the fact that
we're traversing input stream on pretty-printing ‘ParseError’s anyway.
											
										
										
											2018-08-20 19:35:10 +03:00
+								getSourcePos = do
 								  st <- getParserState
-												Simplify type signatures of ‘reachOffset’ and ‘reachOffsetNoLine’

Changed type signatures of ‘reachOffset’ and ‘reachOffsetNoLine’ methods of
the ‘Stream’ type class. Instead of three-tuple ‘reachOffset’ now returns
two-tuple because ‘SourcePos’ is already contained in the returned
‘PosState’ record.

											
										
										
											2019-07-13 18:11:49 +03:00
+								  let pst = reachOffsetNoLine (stateOffset st) (statePosState st)
-												Format the source code with Ormolu

											
										
										
											2020-04-23 22:28:20 +03:00
+								  setParserState st {statePosState = pst}
-												Simplify type signatures of ‘reachOffset’ and ‘reachOffsetNoLine’

Changed type signatures of ‘reachOffset’ and ‘reachOffsetNoLine’ methods of
the ‘Stream’ type class. Instead of three-tuple ‘reachOffset’ now returns
two-tuple because ‘SourcePos’ is already contained in the returned
‘PosState’ record.

											
										
										
											2019-07-13 18:11:49 +03:00
+								  return (pstateSourcePos pst)
-												Use offset in parse errors (#313)

The change allows to speed-up parsers in most cases and re-use the fact that
we're traversing input stream on pretty-printing ‘ParseError’s anyway.
											
										
										
											2018-08-20 19:35:10 +03:00
+								{-# INLINE getSourcePos #-}
-												Reorganize modules (#217)



											
										
										
											2017-06-14 22:12:18 +03:00
 								-- | Get the number of tokens processed so far.
 								--
-												Use offset in parse errors (#313)

The change allows to speed-up parsers in most cases and re-use the fact that
we're traversing input stream on pretty-printing ‘ParseError’s anyway.
											
										
										
											2018-08-20 19:35:10 +03:00
+								-- See also: 'setOffset'.
-												Move general-enough combinators to ‘Text.Megaparsec’ (#267)


											
										
										
											2018-01-08 18:39:39 +03:00
+								--
-												Use offset in parse errors (#313)

The change allows to speed-up parsers in most cases and re-use the fact that
we're traversing input stream on pretty-printing ‘ParseError’s anyway.
											
										
										
											2018-08-20 19:35:10 +03:00
+								-- @since 7.0.0
 								getOffset :: MonadParsec e s m => m Int
 								getOffset = fmap stateOffset getParserState
 								{-# INLINE getOffset #-}
-												Reorganize modules (#217)



											
										
										
											2017-06-14 22:12:18 +03:00
 								-- | Set the number of tokens processed so far.
-												re-export ‘(<|>)’, ‘many’, ‘some’, and ‘optional’, fixes #9

These functions are now re-exported from ‘Control.Applicative’
module. ‘many’ and ‘some’ are now part of ‘Alternative’ instance of
‘ParsecT’.

Note that these functions are re-exported only in ‘Text.MegaParsec’
module, but not in ‘Text.MegaParsec.Prim’ to avoid duplication of
floating doc-strings. Others internal modules now just casually import
‘Control.Applicative’ for their needs.

Note that ‘many1’ was renamed to ‘some’, the same is done for other
parsers that had ‘many1’ part in their names (for consistency).

											
										
										
											2015-08-01 17:39:20 +03:00
+								--
-												Use offset in parse errors (#313)

The change allows to speed-up parsers in most cases and re-use the fact that
we're traversing input stream on pretty-printing ‘ParseError’s anyway.
											
										
										
											2018-08-20 19:35:10 +03:00
+								-- See also: 'getOffset'.
-												Move general-enough combinators to ‘Text.Megaparsec’ (#267)


											
										
										
											2018-01-08 18:39:39 +03:00
+								--
-												Use offset in parse errors (#313)

The change allows to speed-up parsers in most cases and re-use the fact that
we're traversing input stream on pretty-printing ‘ParseError’s anyway.
											
										
										
											2018-08-20 19:35:10 +03:00
+								-- @since 7.0.0
 								setOffset :: MonadParsec e s m => Int -> m ()
-												Allow registration of delayed parse errors

Megaparsec now supports registration of “delayed” parse errors. On lower
level we added a new field called ‘stateParseErrors’ to the ‘State’ record.
The type also had to change from ‘State s’ to ‘State s e’. This field
contains the list of registered ‘ParseErrors’ that do not end parsing
immediately but still will cause failure in the end if the list is not
empty. Users are expected to register parse errors using the three
functions: ‘registerParseError’, ‘registerFailure’, and
‘registerFancyFailure’. These functions are analogous to those without the
‘register’ prefix, except that they have “delayed” effect.

											
										
										
											2019-11-06 01:24:04 +03:00
+								setOffset o = updateParserState $ \st ->
 								  st {stateOffset = o}
-												Use offset in parse errors (#313)

The change allows to speed-up parsers in most cases and re-use the fact that
we're traversing input stream on pretty-printing ‘ParseError’s anyway.
											
										
										
											2018-08-20 19:35:10 +03:00
+								{-# INLINE setOffset #-}
-												Reorganize modules (#217)



											
										
										
											2017-06-14 22:12:18 +03:00
-												Rename ‘Text.Megaparsec.Lexer’ to ‘Text.Megaparsec.Char.Lexer’

Also numerous documentation improvements and some inlineable pragmas.

											
										
										
											2017-07-04 13:12:35 +03:00
+								-- | @'setParserState' st@ sets the parser state to @st@.
-												Move general-enough combinators to ‘Text.Megaparsec’ (#267)


											
										
										
											2018-01-08 18:39:39 +03:00
+								--
 								-- See also: 'getParserState', 'updateParserState'.
-												Allow registration of delayed parse errors

Megaparsec now supports registration of “delayed” parse errors. On lower
level we added a new field called ‘stateParseErrors’ to the ‘State’ record.
The type also had to change from ‘State s’ to ‘State s e’. This field
contains the list of registered ‘ParseErrors’ that do not end parsing
immediately but still will cause failure in the end if the list is not
empty. Users are expected to register parse errors using the three
functions: ‘registerParseError’, ‘registerFailure’, and
‘registerFancyFailure’. These functions are analogous to those without the
‘register’ prefix, except that they have “delayed” effect.

											
										
										
											2019-11-06 01:24:04 +03:00
+								setParserState :: MonadParsec e s m => State s e -> m ()
-												Reorganize modules (#217)



											
										
										
											2017-06-14 22:12:18 +03:00
+								setParserState st = updateParserState (const st)
-												Inline more

											
										
										
											2018-05-01 10:23:52 +03:00
+								{-# INLINE setParserState #-}