mirror of
https://github.com/mrkkrp/megaparsec.git
synced 2024-12-18 22:01:41 +03:00
152 lines
5.1 KiB
Haskell
152 lines
5.1 KiB
Haskell
-----------------------------------------------------------------------------
|
|
-- |
|
|
-- Module : Text.Parsec.Char
|
|
-- Copyright : (c) Daan Leijen 1999-2001, (c) Paolo Martini 2007
|
|
-- License : BSD-style (see the LICENSE file)
|
|
--
|
|
-- Maintainer : derek.a.elkins@gmail.com
|
|
-- Stability : provisional
|
|
-- Portability : portable
|
|
--
|
|
-- Commonly used character parsers.
|
|
--
|
|
-----------------------------------------------------------------------------
|
|
|
|
{-# LANGUAGE FlexibleContexts #-}
|
|
|
|
module Text.Parsec.Char where
|
|
|
|
import Data.Char
|
|
import Text.Parsec.Pos
|
|
import Text.Parsec.Prim
|
|
import Control.Applicative ((*>))
|
|
|
|
-- | @oneOf cs@ accepts the current character when it occurs in the list
-- of characters @cs@, and returns that character. Built on 'satisfy'.
--
-- > vowel = oneOf "aeiou"
oneOf :: (Stream s m Char) => [Char] -> ParsecT s u m Char
oneOf cs = satisfy (`elem` cs)
|
|
|
|
-- | The dual of 'oneOf': @noneOf cs@ succeeds if the current character
-- is /not/ in the supplied list of characters @cs@. Returns the parsed
-- character.
--
-- Note that every character outside @cs@ is accepted, not only letters.
--
-- > nonVowel = noneOf "aeiou"
noneOf :: (Stream s m Char) => [Char] -> ParsecT s u m Char
noneOf cs = satisfy (`notElem` cs)
|
|
|
|
-- | Skips /zero/ or more white space characters, i.e. applies 'space'
-- repeatedly via 'skipMany' and discards the results.
spaces :: (Stream s m Char) => ParsecT s u m ()
spaces = skipMany space <?> "white space"
|
|
|
|
-- | Parses a single white space character, that is, any character for
-- which 'isSpace' holds. Returns the parsed character.
space :: (Stream s m Char) => ParsecT s u m Char
space = satisfy isSpace <?> "space"
|
|
|
|
-- | Parses a line feed character (\'\\n\') and returns it.
newline :: (Stream s m Char) => ParsecT s u m Char
newline = char '\n' <?> "lf new-line"
|
|
|
|
-- | Parses a carriage return character (\'\\r\') immediately followed by
-- a line feed character (\'\\n\'). The carriage return is discarded and
-- the line feed (\'\\n\') is returned.
crlf :: (Stream s m Char) => ParsecT s u m Char
crlf = (char '\r' *> char '\n') <?> "crlf new-line"
|
|
|
|
-- | Parses an end-of-line sequence: either LF (see 'newline') or CRLF
-- (see 'crlf'), tried in that order. Returns a newline character
-- (\'\\n\') in both cases.
--
-- > endOfLine = newline <|> crlf
endOfLine :: (Stream s m Char) => ParsecT s u m Char
endOfLine = (newline <|> crlf) <?> "new-line"
|
|
|
|
-- | Parses a horizontal tab character (\'\\t\') and returns it.
tab :: (Stream s m Char) => ParsecT s u m Char
tab = char '\t' <?> "tab"
|
|
|
|
-- | Parses an upper case letter, i.e. any character for which 'isUpper'
-- holds (this is not restricted to ASCII \'A\'..\'Z\'). Returns the
-- parsed character.
upper :: (Stream s m Char) => ParsecT s u m Char
upper = satisfy isUpper <?> "uppercase letter"
|
|
|
|
-- | Parses a lower case letter, i.e. any character for which 'isLower'
-- holds (this is not restricted to ASCII \'a\'..\'z\'). Returns the
-- parsed character.
lower :: (Stream s m Char) => ParsecT s u m Char
lower = satisfy isLower <?> "lowercase letter"
|
|
|
|
-- | Parses a letter or a digit, i.e. any character for which
-- 'isAlphaNum' holds. Returns the parsed character.
alphaNum :: (Stream s m Char) => ParsecT s u m Char
alphaNum = satisfy isAlphaNum <?> "letter or digit"
|
|
|
|
-- | Parses an alphabetic character, upper or lower case, as decided by
-- 'isAlpha'. Returns the parsed character.
letter :: (Stream s m Char) => ParsecT s u m Char
letter = satisfy isAlpha <?> "letter"
|
|
|
|
-- | Parses a single digit, as decided by 'isDigit'. Returns the parsed
-- character.
digit :: (Stream s m Char) => ParsecT s u m Char
digit = satisfy isDigit <?> "digit"
|
|
|
|
-- | Parses a hexadecimal digit: a digit, or a letter in the range
-- \'a\'..\'f\' or \'A\'..\'F\', as decided by 'isHexDigit'. Returns the
-- parsed character.
hexDigit :: (Stream s m Char) => ParsecT s u m Char
hexDigit = satisfy isHexDigit <?> "hexadecimal digit"
|
|
|
|
-- | Parses an octal digit, a character in the range \'0\'..\'7\', as
-- decided by 'isOctDigit'. Returns the parsed character.
octDigit :: (Stream s m Char) => ParsecT s u m Char
octDigit = satisfy isOctDigit <?> "octal digit"
|
|
|
|
-- | @char c@ accepts exactly the character @c@ and returns it. The
-- parser is labelled with @show [c]@, i.e. the character rendered as a
-- one-character string literal.
--
-- > semiColon = char ';'
char :: (Stream s m Char) => Char -> ParsecT s u m Char
char c = satisfy (== c) <?> show [c]
|
|
|
|
-- | Accepts whatever the next character is and returns it; the
-- predicate handed to 'satisfy' is constantly 'True'.
anyChar :: (Stream s m Char) => ParsecT s u m Char
anyChar = satisfy (\_ -> True)
|
|
|
|
-- | The parser @satisfy f@ succeeds for any character for which the
-- supplied function @f@ returns 'True'. Returns the character that is
-- actually parsed.
--
-- > digit    = satisfy isDigit
-- > oneOf cs = satisfy (\c -> c `elem` cs)
satisfy :: (Stream s m Char) => (Char -> Bool) -> ParsecT s u m Char
satisfy f = tokenPrim showTok nextPos testTok
  where
    -- Render a token as a one-character string literal.
    showTok c = show [c]
    -- Advance the source position past the character; the remaining
    -- input is not needed for that.
    nextPos pos c _rest = updatePosChar pos c
    -- Keep the character only when the predicate accepts it.
    testTok c
      | f c = Just c
      | otherwise = Nothing
|
|
|
|
-- | @string s@ matches the exact sequence of characters @s@ by
-- delegating to 'tokens', with 'show' used to render the string and
-- 'updatePosString' to advance the source position. Returns the parsed
-- string (i.e. @s@).
--
-- > divOrMod = string "div"
-- >        <|> string "mod"
string :: (Stream s m Char) => String -> ParsecT s u m String
string = tokens show updatePosString
|