{-# LANGUAGE PatternSynonyms #-}
{-# LANGUAGE OverloadedStrings #-}
{-# LANGUAGE StandaloneDeriving #-}
{-# LANGUAGE DeriveLift #-}
{-# LANGUAGE GADTs #-}
{-# LANGUAGE KindSignatures #-}
{-# LANGUAGE DataKinds #-}
module PyF.Internal.PythonSyntax
( parsePythonFormatString
, parseGenericFormatString
, Item(..)
, FormatMode(..)
, Padding(..)
, Precision(..)
, TypeFormat(..)
, AlternateForm(..)
, pattern DefaultFormatMode
, Parser
)
where
import Language.Haskell.TH.Syntax
import Text.Megaparsec
import qualified Text.Megaparsec.Char.Lexer as L
import Text.Megaparsec.Char
import Data.Void (Void)
import qualified Data.Char
import Data.Maybe (fromMaybe)
import qualified Data.Set as Set
import qualified Language.Haskell.Meta.Syntax.Translate as SyntaxTranslate
import qualified Language.Haskell.Exts.Parser as ParseExp
import qualified Language.Haskell.Exts.Extension as ParseExtension
import qualified Language.Haskell.Exts.SrcLoc as SrcLoc
import PyF.Formatters
type Parser t = Parsec Void String t
data Item = Raw String
| Replacement Exp (Maybe FormatMode)
deriving (Show)
parsePythonFormatString :: [ParseExtension.Extension] -> Parser [Item]
parsePythonFormatString exts = parseGenericFormatString exts ('{', '}')
parseGenericFormatString :: [ParseExtension.Extension] -> (Char, Char) -> Parser [Item]
parseGenericFormatString exts delimiters = many (rawString delimiters <|> escapedParenthesis delimiters <|> replacementField exts delimiters) <* eof
rawString :: (Char, Char) -> Parser Item
rawString (openingChar,closingChar) = do
chars <- some (noneOf ([openingChar, closingChar]))
case escapeChars chars of
Left remaining -> do
offset <- getOffset
setOffset (offset - length remaining)
fancyFailure (Set.singleton (ErrorFail "lexical error in literal section"))
Right escaped -> return (Raw escaped)
escapedParenthesis :: (Char, Char) -> Parser Item
escapedParenthesis (openingChar, closingChar) = Raw <$> (parseRaw openingChar <|> parseRaw closingChar)
where parseRaw c = c:[] <$ string (replicate 2 c)
escapeChars :: String -> Either String String
escapeChars "" = Right ""
escapeChars ('\\':'\n':xs) = escapeChars xs
escapeChars ('\\':'\\':xs) = ('\\' :) <$> escapeChars xs
escapeChars s = case Data.Char.readLitChar s of
((c, xs):_) -> (c :) <$> escapeChars xs
_ -> Left s
replacementField :: [ParseExtension.Extension] -> (Char, Char) -> Parser Item
replacementField exts (charOpening, charClosing) = do
_ <- char charOpening
expr <- evalExpr exts (many (noneOf (charClosing:":" :: [Char])))
fmt <- optional $ do
_ <- char ':'
format_spec
_ <- char charClosing
pure (Replacement expr fmt)
pattern DefaultFormatMode :: FormatMode
pattern DefaultFormatMode = FormatMode PaddingDefault (DefaultF PrecisionDefault Minus) Nothing
data FormatMode = FormatMode Padding TypeFormat (Maybe Char)
deriving (Show)
data Padding = PaddingDefault
| Padding Integer (Maybe (Maybe Char, AnyAlign))
deriving (Show)
data Precision = PrecisionDefault
| Precision Integer
deriving (Show)
data TypeFlag = Flagb | Flagc | Flagd | Flage | FlagE | Flagf | FlagF | Flagg | FlagG | Flagn | Flago | Flags | Flagx | FlagX | FlagPercent
deriving (Show)
data TypeFormat =
DefaultF Precision SignMode
| BinaryF AlternateForm SignMode
| CharacterF
| DecimalF SignMode
| ExponentialF Precision AlternateForm SignMode
| ExponentialCapsF Precision AlternateForm SignMode
| FixedF Precision AlternateForm SignMode
| FixedCapsF Precision AlternateForm SignMode
| GeneralF Precision AlternateForm SignMode
| GeneralCapsF Precision AlternateForm SignMode
| OctalF AlternateForm SignMode
| StringF Precision
| HexF AlternateForm SignMode
| HexCapsF AlternateForm SignMode
| PercentF Precision AlternateForm SignMode
deriving (Show)
data AlternateForm = AlternateForm | NormalForm
deriving (Show)
lastCharFailed :: String -> Parser t
lastCharFailed err = do
offset <- getOffset
setOffset (offset - 1)
fancyFailure (Set.singleton (ErrorFail err))
evalExpr :: [ParseExtension.Extension] -> Parser String -> Parser Exp
evalExpr exts exprParser = do
offset <- getOffset
s <- exprParser
let parseMode = ParseExp.defaultParseMode { ParseExp.extensions = exts }
case SyntaxTranslate.toExp <$> ParseExp.parseExpWithMode parseMode s of
ParseExp.ParseOk expr -> pure expr
ParseExp.ParseFailed (SrcLoc.SrcLoc _name' line col) err -> do
let
linesBefore = take (line - 1) (lines s)
currentOffset = length (unlines linesBefore) + col - 1
setOffset (offset + currentOffset)
fancyFailure (Set.singleton (ErrorFail err))
overrideAlignmentIfZero :: Bool -> Maybe (Maybe Char, AnyAlign) -> Maybe (Maybe Char, AnyAlign)
overrideAlignmentIfZero True Nothing = Just (Just '0', AnyAlign AlignInside)
overrideAlignmentIfZero True (Just (Nothing, al)) = Just (Just '0', al)
overrideAlignmentIfZero _ v = v
format_spec :: Parser FormatMode
format_spec = do
al' <- optional alignment
s <- optional sign
alternateForm <- option NormalForm (AlternateForm <$ char '#')
hasZero <- option False (True <$ char '0')
let al = overrideAlignmentIfZero hasZero al'
w <- optional width
grouping <- optional grouping_option
prec <- option PrecisionDefault (char '.' *> (Precision <$> precision))
t <- optional type_
let padding = case w of
Just p -> Padding p al
Nothing -> PaddingDefault
case t of
Nothing -> pure (FormatMode padding (DefaultF prec (fromMaybe Minus s)) grouping)
Just flag -> case evalFlag flag padding grouping prec alternateForm s of
Right fmt -> pure (FormatMode padding fmt grouping)
Left typeError -> do
lastCharFailed typeError
evalFlag :: TypeFlag -> Padding -> Maybe Char -> Precision -> AlternateForm -> Maybe SignMode -> Either String TypeFormat
evalFlag Flagb _pad _grouping prec alt s = failIfPrec prec (BinaryF alt (defSign s))
evalFlag Flagc _pad _grouping prec alt s = failIfS s =<< failIfPrec prec =<< failIfAlt alt CharacterF
evalFlag Flagd _pad _grouping prec alt s = failIfPrec prec =<< failIfAlt alt (DecimalF (defSign s))
evalFlag Flage _pad _grouping prec alt s = pure $ExponentialF prec alt (defSign s)
evalFlag FlagE _pad _grouping prec alt s = pure $ ExponentialCapsF prec alt (defSign s)
evalFlag Flagf _pad _grouping prec alt s = pure $ FixedF prec alt (defSign s)
evalFlag FlagF _pad _grouping prec alt s = pure $ FixedCapsF prec alt (defSign s)
evalFlag Flagg _pad _grouping prec alt s = pure $ GeneralF prec alt (defSign s)
evalFlag FlagG _pad _grouping prec alt s = pure $ GeneralCapsF prec alt (defSign s)
evalFlag Flagn _pad _grouping _prec _alt _s = Left ("Type 'n' not handled (yet). " ++ errgGn)
evalFlag Flago _pad _grouping prec alt s = failIfPrec prec $ OctalF alt (defSign s)
evalFlag Flags pad grouping prec alt s = failIfGrouping grouping =<< failIfInsidePadding pad =<< failIfS s =<< (failIfAlt alt $ StringF prec)
evalFlag Flagx _pad _grouping prec alt s = failIfPrec prec $ HexF alt (defSign s)
evalFlag FlagX _pad _grouping prec alt s = failIfPrec prec $ HexCapsF alt (defSign s)
evalFlag FlagPercent _pad _grouping prec alt s = pure $ PercentF prec alt (defSign s)
defSign :: Maybe SignMode -> SignMode
defSign Nothing = Minus
defSign (Just s) = s
failIfGrouping :: Maybe Char -> TypeFormat -> Either String TypeFormat
failIfGrouping (Just _) _t = Left "String type is incompatible with grouping (_ or ,)."
failIfGrouping Nothing t = Right t
failIfInsidePadding :: Padding -> TypeFormat -> Either String TypeFormat
failIfInsidePadding (Padding _ (Just (_, AnyAlign AlignInside))) _t = Left "String type is incompatible with inside padding (=)."
failIfInsidePadding _ t = Right t
errgGn :: String
errgGn = "Use one of {'b', 'c', 'd', 'e', 'E', 'f', 'F', 'g', 'G', 'n', 'o', 's', 'x', 'X', '%'}."
failIfPrec :: Precision -> TypeFormat -> Either String TypeFormat
failIfPrec PrecisionDefault i = Right i
failIfPrec (Precision i) _ = Left ("Type incompatible with precision (." ++ show i ++ "), use any of {'e', 'E', 'f', 'F', 'g', 'G', 'n', 's', '%'} or remove the precision field.")
failIfAlt :: AlternateForm -> TypeFormat -> Either String TypeFormat
failIfAlt NormalForm i = Right i
failIfAlt _ _ = Left "Type incompatible with alternative form (#), use any of {'e', 'E', 'f', 'F', 'g', 'G', 'n', 'o', 'x', 'X', '%'} or remove the alternative field."
failIfS :: Maybe SignMode -> TypeFormat -> Either String TypeFormat
failIfS Nothing i = Right i
failIfS (Just s) _ = Left ("Type incompatible with sign field (" ++ [toSignMode s] ++ "), use any of {'b', 'd', 'e', 'E', 'f', 'F', 'g', 'G', 'n', 'o', 'x', 'X', '%'} or remove the sign field.")
toSignMode :: SignMode -> Char
toSignMode Plus = '+'
toSignMode Minus = '-'
toSignMode Space = ' '
alignment :: Parser (Maybe Char, AnyAlign)
alignment = choice [
try $ do
c <- fill
mode <- align
pure (Just c, mode)
, do
mode <- align
pure (Nothing, mode)
]
fill :: Parser Char
fill = anySingle
align :: Parser AnyAlign
align = choice [
AnyAlign AlignLeft <$ char '<',
AnyAlign AlignRight <$ char '>',
AnyAlign AlignCenter <$ char '^',
AnyAlign AlignInside <$ char '='
]
sign :: Parser SignMode
sign = choice
[Plus <$ char '+',
Minus <$ char '-',
Space <$ char ' '
]
width :: Parser Integer
width = integer
integer :: Parser Integer
integer = L.decimal
grouping_option :: Parser Char
grouping_option = oneOf ("_," :: [Char])
precision :: Parser Integer
precision = integer
type_ :: Parser TypeFlag
type_ = choice [
Flagb <$ char 'b',
Flagc <$ char 'c',
Flagd <$ char 'd',
Flage <$ char 'e',
FlagE <$ char 'E',
Flagf <$ char 'f',
FlagF <$ char 'F',
Flagg <$ char 'g',
FlagG <$ char 'G',
Flagn <$ char 'n',
Flago <$ char 'o',
Flags <$ char 's',
Flagx <$ char 'x',
FlagX <$ char 'X',
FlagPercent <$ char '%'
]
deriving instance Lift Precision
deriving instance Lift Padding