{-# OPTIONS_GHC -Wno-incomplete-patterns #-} {-# LANGUAGE PatternSynonyms, ViewPatterns #-} {-| Module : Parsley.Combinator Description : The parsing combinators License : BSD-3-Clause Maintainer : Jamie Willis Stability : stable This module contains the classic parser combinator operations specific to parsers themselves. This means any combinators that deal with input consumption at a primitive level. @since 0.1.0.0 -} module Parsley.Combinator ( satisfy, char, item, string, token, oneOf, noneOf, eof, more, someTill, try, lookAhead, notFollowedBy, line, col, pos ) where import Prelude hiding (traverse, (*>)) import Data.List (sort) import Parsley.Alternative (manyTill) import Parsley.Applicative (($>), void, traverse, (<:>), (*>), (<~>)) import Parsley.Defunctionalized (Defunc(LIFTED, EQ_H, CONST, LAM_S), pattern APP_H, pattern COMPOSE_H) import Parsley.Internal (Code, Quapplicative(..), Parser) import Parsley.ParserOps (satisfy) import qualified Parsley.Internal as Internal (try, lookAhead, notFollowedBy, line, col) {-| This combinator will attempt to parse a given parser. If it succeeds, the result is returned without having consumed any input. If it fails, however, any consumed input remains consumed. @since 0.1.0.0 -} lookAhead :: Parser a -> Parser a lookAhead = Internal.lookAhead {-| This combinator will ensure that a given parser fails. If the parser does fail, a @()@ is returned and no input is consumed. If the parser succeeded, then this combinator will fail, however it will not consume any input. @since 0.1.0.0 -} notFollowedBy :: Parser a -> Parser () notFollowedBy = Internal.notFollowedBy {-| This combinator allows a parser to backtrack on failure, which is to say that it will not have consumed any input if it were to fail. This is important since @parsec@ semantics demand that the second branch of @(`Parsley.Alternative.<|>`)@ can only be taken if the first did not consume input on failure. Excessive use of `try` will reduce the efficiency of the parser and effect the generated error messages. It should only be used in one of two circumstances: * When two branches of a parser share a common leading prefix (in which case, it is often better to try and factor this out). * When a parser needs to be executed atomically (for example, tokens). @since 0.1.0.0 -} try :: Parser a -> Parser a try = Internal.try {-| This combinator will attempt match a given string. If the parser fails midway through, this combinator will fail having consumed input. On success, the string itself is returned and input will be consumed. @since 0.1.0.0 -} string :: String -> Parser String string = traverse char {-| This combinator will attempt to match any one of the provided list of characters. If one of those characters is found, it will be returned and the input consumed. If not, the combinator will fail having consumed no input. @since 0.1.0.0 -} oneOf :: [Char] -> Parser Char oneOf = satisfy . elem' {-| This combinator will attempt to not match any one of the provided list of characters. If one of those characters is found, the combinator will fail having consumed no input. If not, it will return the character that was not an element of the provided list. @since 0.1.0.0 -} noneOf :: [Char] -> Parser Char noneOf = satisfy . COMPOSE_H (makeQ not [||not||]) . elem' elem' :: [Char] -> Defunc (Char -> Bool) elem' cs = LAM_S (\c -> makeQ (elem (_val c) cs) (ofChars cs (_code c))) ofChars :: [Char] -> Code Char -> Code Bool ofChars [] _ = [||False||] ofChars cs qc = foldr1 (\p q -> [|| $$p || $$q ||]) (map (makePred qc) (ranges cs)) makePred :: Code Char -> (Char, Char) -> Code Bool makePred qc (c, c') | c == c' = [|| c == $$qc ||] | otherwise = [|| c <= $$qc && $$qc <= c' ||] ranges :: [Char] -> [(Char, Char)] ranges (sort -> c:cs) = go c (fromEnum c) cs where go :: Char -> Int -> [Char] -> [(Char, Char)] go lower prev [] = [(lower, toEnum prev)] go lower prev (c:cs) | i <- fromEnum c, i == prev + 1 = go lower i cs | otherwise = (lower, toEnum prev) : go c (fromEnum c) cs {-| Like `string`, excepts parses the given string atomically using `try`. Never consumes input on failure. @since 0.1.0.0 -} token :: String -> Parser String token = try . string {-| This parser succeeds only if there is no input left to consume, and fails without consuming input otherwise. @since 0.1.0.0 -} eof :: Parser () eof = notFollowedBy item {-| This parser succeeds if there is still input left to consume, and fails otherwise. @since 0.1.0.0 -} more :: Parser () more = lookAhead (void item) -- Parsing Primitives {-| This combinator will attempt to match a given character. If that character is the next input token, the parser succeeds and the character is returned. Otherwise, the combinator will fail having not consumed any input. @since 0.1.0.0 -} char :: Char -> Parser Char char c = satisfy (EQ_H (LIFTED c)) $> LIFTED c {-| Reads any single character. This combinator will only fail if there is no more input remaining. The parsed character is returned. @since 0.1.0.0 -} item :: Parser Char item = satisfy (APP_H CONST (LIFTED True)) -- Composite Combinators {-| The combinator @someTill p end@ will try and parse @p@ as many times as possible (but at least once) so long as @end@ cannot be successfully parsed. It will return the results from the successful parses of @p@. @since 0.1.0.0 -} someTill :: Parser a -> Parser b -> Parser [a] someTill p end = notFollowedBy end *> (p <:> manyTill p end) {-| The `line` combinator returns the current line number at this point in the parse. Line numbers start from 1. @since 1.0.1.0 -} line :: Parser Int line = Internal.line {-| The `col` combinator returns the current column number at this point in the parse. Column numbers start from 1. @since 1.0.1.0 -} col :: Parser Int col = Internal.col {-| The `pos` combinator returns the current line and column number at this point in the parse. @since 1.0.1.0 -} pos :: Parser (Int, Int) pos = line <~> col