mirror of
https://github.com/idris-lang/Idris2.git
synced 2024-12-18 00:31:57 +03:00
f47d9cfef2
Signed-off-by: Alex Humphreys <alex.humphreys@here.com>
235 lines
7.2 KiB
Idris
235 lines
7.2 KiB
Idris
||| A simple parser combinator library for strings. Inspired by attoparsec zepto.
|
|
module Data.String.Parser
|
|
import Control.Monad.Identity
|
|
import Control.Monad.Trans
|
|
|
|
import Data.Strings
|
|
import Data.Fin
|
|
import Data.List
|
|
|
|
%default partial
|
|
|
|
||| The input state, pos is position in the string and maxPos is the length of the input string.
|
|
public export
|
|
record State where
|
|
constructor S
|
|
input : String
|
|
pos : Int
|
|
maxPos : Int
|
|
|
|
Show State where
|
|
show s = "(" ++ show s.input ++", " ++ show s.pos ++ ", " ++ show s.maxPos ++")"
|
|
|
|
||| Result of applying a parser
|
|
public export
|
|
data Result a = Fail Int String | OK a State
|
|
|
|
|
|
public export
|
|
record ParseT (m : Type -> Type) (a : Type) where
|
|
constructor P
|
|
runParser : State -> m (Result a)
|
|
|
|
public export
|
|
Parser : Type -> Type
|
|
Parser a = ParseT Identity a
|
|
|
|
public export
|
|
implementation Monad m => Functor (ParseT m) where
|
|
map f p = P $ \state =>
|
|
do res <- p.runParser state
|
|
case res of
|
|
OK r state' => pure (OK (f r) state')
|
|
Fail i err => pure (Fail i err)
|
|
|
|
public export
|
|
Monad m => Applicative (ParseT m) where
|
|
pure x = P $ \s => pure (OK x s)
|
|
f <*> x = P $ \s => case !(x.runParser s) of
|
|
OK r s' => case !(f.runParser s') of
|
|
OK f' fs => pure (OK (f' r) fs)
|
|
Fail i err => pure (Fail i err)
|
|
Fail i err => pure (Fail i err)
|
|
|
|
public export
|
|
Monad m => Monad (ParseT m) where
|
|
m >>= k = P $ \state =>
|
|
do res <- m.runParser state
|
|
case res of
|
|
OK a state' => (k a).runParser state'
|
|
Fail i err => pure (Fail i err)
|
|
|
|
public export
|
|
Monad m => Alternative (ParseT m) where
|
|
empty = P $ \s => pure $ Fail (s.pos) "no alternative left"
|
|
a <|> b = P $ \s => case !(a.runParser s) of
|
|
OK r s' => pure $ OK r s'
|
|
Fail _ _ => b.runParser s
|
|
|
|
public export
|
|
MonadTrans ParseT where
|
|
lift x = P $ \s => do res <-x
|
|
pure $ OK res s
|
|
|
|
||| Run a parser in a monad
|
|
||| Returns a tuple of the result and final position on success.
|
|
||| Returns an error message on failure.
|
|
export
|
|
parseT : Monad m => ParseT m a -> String -> m (Either String (a, Int))
|
|
parseT p str = do res <- p.runParser (S str 0 (strLength str))
|
|
case res of
|
|
OK r s => pure $ Right (r, s.pos)
|
|
Fail i err => pure $ Left $ fastAppend ["Parse failed at position ", show i, ": ", err]
|
|
|
|
||| Run a parser in a pure function
|
|
||| Returns a tuple of the result and final position on success.
|
|
||| Returns an error message on failure.
|
|
export
|
|
parse : Parser a -> String -> Either String (a, Int)
|
|
parse p str = runIdentity $ parseT p str
|
|
|
|
||| Combinator that replaces the error message on failure.
|
|
||| This allows combinators to output relevant errors
|
|
export
|
|
(<?>) : Monad m => ParseT m a -> String -> ParseT m a
|
|
(<?>) p msg = P $ \s => case !(p.runParser s) of
|
|
OK r s' => pure $ OK r s'
|
|
Fail i _ => pure $ Fail i msg
|
|
|
|
infixl 0 <?>
|
|
|
|
||| Succeeds if the next char satisfies the predicate `f`
|
|
export
|
|
satisfy : Monad m => (Char -> Bool) -> ParseT m Char
|
|
satisfy f = P $ \s => do if s.pos < s.maxPos
|
|
then do
|
|
let ch = strIndex s.input s.pos
|
|
if f ch
|
|
then pure $ OK ch (S s.input (s.pos + 1) s.maxPos)
|
|
else pure $ Fail (s.pos) "satisfy"
|
|
else pure $ Fail (s.pos) "satisfy"
|
|
|
|
||| Succeeds if the string `str` follows.
|
|
export
|
|
string : Monad m => String -> ParseT m ()
|
|
string str = P $ \s => do let len = strLength str
|
|
if s.pos+len <= s.maxPos
|
|
then do let head = strSubstr s.pos len s.input
|
|
if head == str
|
|
then pure $ OK () (S s.input (s.pos + len) s.maxPos)
|
|
else pure $ Fail (s.pos) ("string " ++ show str)
|
|
else pure $ Fail (s.pos) ("string " ++ show str)
|
|
|
|
||| Succeeds if the next char is `c`
|
|
export
|
|
char : Monad m => Char -> ParseT m ()
|
|
char c = do _ <- satisfy (== c)
|
|
pure ()
|
|
|
|
mutual
|
|
||| Succeeds if `p` succeeds, will continue to match `p` until it fails
|
|
||| and accumulate the results in a list
|
|
export
|
|
some : Monad m => ParseT m a -> ParseT m (List a)
|
|
some p = pure (!p :: !(many p))
|
|
|
|
||| Always succeeds, will accumulate the results of `p` in a list until it fails.
|
|
export
|
|
many : Monad m => ParseT m a -> ParseT m (List a)
|
|
many p = some p <|> pure []
|
|
|
|
||| Always succeeds, applies the predicate `f` on chars until it fails and creates a string
|
|
||| from the results.
|
|
export
|
|
takeWhile : Monad m => (Char -> Bool) -> ParseT m String
|
|
takeWhile f = do ls <- many (satisfy f)
|
|
pure $ pack ls
|
|
|
|
||| Returns the result of the parser `p` or `def` if it fails.
|
|
export
|
|
option : Monad m => a -> ParseT m a -> ParseT m a
|
|
option def p = p <|> pure def
|
|
|
|
||| Returns a Maybe that contains the result of `p` if it succeeds or `Nothing` if it fails.
|
|
export
|
|
optional : Monad m => ParseT m a -> ParseT m (Maybe a)
|
|
optional p = (p >>= \res => pure $ Just res) <|> pure Nothing
|
|
|
|
||| Discards the result of a parser
|
|
export
|
|
skip : Parser a -> Parser ()
|
|
skip = ignore
|
|
|
|
||| Parses a space character
|
|
export
|
|
space : Parser Char
|
|
space = satisfy isSpace
|
|
|
|
||| Parses one or more space characters
|
|
export
|
|
spaces : Parser ()
|
|
spaces = skip (many space) <?> "white space"
|
|
|
|
||| Discards whitespace after a matching parser
|
|
export
|
|
lexeme : Parser a -> Parser a
|
|
lexeme p = p <* spaces
|
|
|
|
||| Matches a specific string, then skips following whitespace
|
|
export
|
|
token : String -> Parser ()
|
|
token s = lexeme (skip (string s)) <?> "token " ++ show s
|
|
|
|
||| Fail with some error message
|
|
export
|
|
fail : Monad m => String -> ParseT m a
|
|
fail x = P $ \s => do pure $ Fail s.pos x
|
|
|
|
||| Matches a single digit
|
|
export
|
|
digit : Parser (Fin 10)
|
|
digit = do x <- satisfy isDigit
|
|
case lookup x digits of
|
|
Nothing => P $ \s => do pure $ Fail s.pos "not a digit"
|
|
Just y => P $ \s => Id (OK y s)
|
|
where
|
|
digits : List (Char, Fin 10)
|
|
digits = [ ('0', 0)
|
|
, ('1', 1)
|
|
, ('2', 2)
|
|
, ('3', 3)
|
|
, ('4', 4)
|
|
, ('5', 5)
|
|
, ('6', 6)
|
|
, ('7', 7)
|
|
, ('8', 8)
|
|
, ('9', 9)
|
|
]
|
|
|
|
fromDigits : Num a => ((Fin 10) -> a) -> List (Fin 10) -> a
|
|
fromDigits f xs = foldl (addDigit) 0 xs
|
|
where
|
|
addDigit : a -> (Fin 10) -> a
|
|
addDigit num d = 10*num + (f d)
|
|
|
|
intFromDigits : List (Fin 10) -> Integer
|
|
intFromDigits = fromDigits finToInteger
|
|
|
|
natFromDigits : List (Fin 10) -> Nat
|
|
natFromDigits = fromDigits finToNat
|
|
|
|
||| Matches a natural number
|
|
export
|
|
natural : Parser Nat
|
|
natural = do x <- some digit
|
|
pure (natFromDigits x)
|
|
|
|
||| Matches an integer, eg. "12", "-4"
|
|
export
|
|
integer : Parser Integer
|
|
integer = do minus <- optional (char '-')
|
|
x <- some digit
|
|
case minus of
|
|
Nothing => pure (intFromDigits x)
|
|
(Just y) => pure ((intFromDigits x)*(-1))
|