{-# LANGUAGE LambdaCase #-} -- | -- Module : Parser.Text -- Copyright : (c) 2020 Composewell Technologies and Contributors -- (c) 2016-2017 Harendra Kumar -- (c) 2014-2015 Antonio Nikishaev -- License : Apache-2.0 -- Maintainer : streamly@composewell.com -- Stability : experimental -- The original Unicode database parser was taken from -- https://github.com/composewell/unicode-transforms but was completely -- rewritten from scratch to parse from UCD text files instead of XML, only -- some types remain the same. That code in turn was originally taken from -- https://github.com/llelf/prose (Antonio Nikishaev) and heavily modified by -- Harendra Kumar. -- module Parser.Text (genModules) where import Control.Exception (catch, IOException) import Control.Monad (void) import Control.Monad.IO.Class (MonadIO(liftIO)) import Data.Bits (Bits(..)) import Data.Word (Word8) import Data.Char (chr, ord, isSpace) import Data.Functor ((<&>)) import Data.Function ((&)) import Data.List (unfoldr, intersperse) import Data.Maybe (fromMaybe) import Streamly.Data.Fold (Fold) import Streamly.Prelude (IsStream, SerialT) import System.Directory (createDirectoryIfMissing) import System.Environment (getEnv) import qualified Data.Set as Set import qualified Streamly.Prelude as Stream import qualified Streamly.Data.Fold as Fold import qualified Streamly.Internal.Data.Fold as Fold import qualified Streamly.Data.Unfold as Unfold import qualified Streamly.FileSystem.Handle as Handle import qualified System.IO as Sys import qualified Streamly.Unicode.Stream as Unicode import Prelude hiding (pred) ------------------------------------------------------------------------------- -- Types ------------------------------------------------------------------------------- data GeneralCategory = Lu|Ll|Lt| --LC Lm|Lo| --L Mn|Mc|Me| --M Nd|Nl|No| --N Pc|Pd|Ps|Pe|Pi|Pf|Po| --P Sm|Sc|Sk|So| --S Zs|Zl|Zp| --Z Cc|Cf|Cs|Co|Cn --C deriving (Show, Bounded, Enum, Read) data DecompType = DTCanonical | DTCompat | DTFont | DTNoBreak | DTInitial | DTMedial | DTFinal | DTIsolated | DTCircle | DTSuper | DTSub | DTVertical | DTWide | DTNarrow | DTSmall | DTSquare | DTFraction deriving (Show, Eq) data Decomp = DCSelf | DC [Char] deriving (Show, Eq) data DType = Canonical | Kompat data DetailedChar = DetailedChar { _char :: Char , _name :: String , _generalCategory :: GeneralCategory , _combiningClass :: Int , _decompositionType :: Maybe DecompType , _decomposition :: Decomp , _simpleUppercaseMapping :: Maybe Char , _simpleLowercaseMapping :: Maybe Char , _simpleTitlecaseMapping :: Maybe Char } deriving (Show) ------------------------------------------------------------------------------- -- Helpers ------------------------------------------------------------------------------- apacheLicense :: String -> String apacheLicense modName = unlines [ "-- |" , "-- Module : " ++ modName , "-- Copyright : (c) 2020 Composewell Technologies and Contributors" , "-- License : Apache-2.0" , "-- Maintainer : streamly@composewell.com" , "-- Stability : experimental" ] readCodePoint :: String -> Char readCodePoint = chr . read . ("0x"++) readCodePointM :: String -> Maybe Char readCodePointM "" = Nothing readCodePointM u = Just (readCodePoint u) genSignature :: String -> String genSignature = (<> " :: Char -> Bool") -- | Check that var is between minimum and maximum of orderList genRangeCheck :: String -> [Int] -> String genRangeCheck var ordList = var <> " >= " <> show (minimum ordList) <> " && " <> var <> " <= " <> show (maximum ordList) genBitmap :: String -> [Int] -> String genBitmap funcName ordList = unlines [ "{-# INLINE " ++ funcName ++ " #-}" , genSignature funcName , funcName <> " = \\c -> let n = ord c in " ++ genRangeCheck "n" ordList ++ " && lookupBit64 bitmap# n" , " where" , " bitmap# = " ++ show (bitMapToAddrLiteral (positionsToBitMap ordList)) ++ "#" ] positionsToBitMap :: [Int] -> [Bool] positionsToBitMap = go 0 where go _ [] = [] go i xxs@(x:xs) | i < x = False : go (i + 1) xxs | otherwise = True : go (i + 1) xs bitMapToAddrLiteral :: [Bool] -> String bitMapToAddrLiteral = map (chr . toByte . padTo8) . unfoldr go where go :: [a] -> Maybe ([a], [a]) go [] = Nothing go xs = Just $ splitAt 8 xs padTo8 :: [Bool] -> [Bool] padTo8 xs | length xs >= 8 = xs | otherwise = xs ++ replicate (8 - length xs) False toByte :: [Bool] -> Int toByte xs = sum $ map (\i -> if xs !! i then 1 `shiftL` i else 0) [0..7] genEnumBitmap :: forall a. (Bounded a, Enum a, Show a) => String -> [a] -> String genEnumBitmap funcName as = unlines [ "{-# INLINE " ++ funcName ++ " #-}" , funcName <> " :: Char -> Int" , funcName <> " c = let n = ord c in if n >= " <> show (length as) <> " then " <> show (fromEnum Cn) <> " else lookupIntN bitmap# n" , " where" , " bitmap# = " <> show (enumMapToAddrLiteral as) <> "#" ] {-| Encode a list of values as a byte map, using their 'Enum' instance. __Note:__ 'Enum' instance must respect the following: * @fromEnum minBound >= 0x00@ * @fromEnum maxBound <= 0xff@ -} enumMapToAddrLiteral :: forall a. (Bounded a, Enum a, Show a) => [a] -> String enumMapToAddrLiteral = fmap go where go :: a -> Char go = chr . fromIntegral . toWord8 toWord8 :: a -> Word8 toWord8 a = let w = fromEnum a in if 0 <= w && w <= 0xff then fromIntegral w else error $ "Cannot convert to Word8: " <> show a -- This bit of code is duplicated but this duplication allows us to reduce 2 -- dependencies on the executable. jamoLCount :: Int jamoLCount = 19 jamoVCount :: Int jamoVCount = 21 jamoTCount :: Int jamoTCount = 28 hangulFirst :: Int hangulFirst = 0xac00 hangulLast :: Int hangulLast = hangulFirst + jamoLCount * jamoVCount * jamoTCount - 1 isHangul :: Char -> Bool isHangul c = n >= hangulFirst && n <= hangulLast where n = ord c ------------------------------------------------------------------------------- -- Parsers ------------------------------------------------------------------------------- ------------------------------------------------------------------------------- -- Parsing UnicodeData.txt ------------------------------------------------------------------------------- genGeneralCategoryModule :: Monad m => String -> Fold m DetailedChar String genGeneralCategoryModule moduleName = done <$> Fold.foldl' step initial where -- (categories, expected char) initial = ([], '\0') step (acc, p) a = if p < _char a -- Fill missing char entry with default category Cn -- See: https://www.unicode.org/reports/tr44/#Default_Values_Table then step (Cn : acc, succ p) a -- Regular entry else (_generalCategory a : acc, succ (_char a)) done (acc, _) = unlines [ apacheLicense moduleName , "module " <> moduleName , "(generalCategory)" , "where" , "" , "import Data.Char (ord)" , "import Unicode.Internal.Bits (lookupIntN)" , "" , genEnumBitmap "generalCategory" (reverse acc) ] readDecomp :: String -> (Maybe DecompType, Decomp) readDecomp s = if null wrds then (Nothing, DCSelf) else decmps wrds where decmps [] = error "Unreachable flow point" decmps y@(x:xs) = case dtmap x of DTCanonical -> (,) (Just DTCanonical) (readCP y) other -> (,) (Just other) (readCP xs) wrds = words s readCP ws = DC $ map readCodePoint ws dtmap "" = DTCompat dtmap "" = DTCircle dtmap "" = DTFinal dtmap "" = DTFont dtmap "" = DTFraction dtmap "" = DTInitial dtmap "" = DTIsolated dtmap "" = DTMedial dtmap "" = DTNarrow dtmap "" = DTNoBreak dtmap "" = DTSmall dtmap "" = DTSquare dtmap "" = DTSub dtmap "" = DTSuper dtmap "" = DTVertical dtmap "" = DTWide dtmap _ = DTCanonical filterNonHangul :: Monad m => Fold m DetailedChar a -> Fold m DetailedChar a filterNonHangul = Fold.filter (not . isHangul . _char) filterDecomposableType :: Monad m => DType -> Fold m DetailedChar a -> Fold m DetailedChar a filterDecomposableType dtype = Fold.filter ((/= DCSelf) . _decomposition) . Fold.filter (predicate . _decompositionType) where predicate = case dtype of Canonical -> (== Just DTCanonical) Kompat -> const True genDecomposableModule :: Monad m => String -> DType -> Fold m DetailedChar String genDecomposableModule moduleName dtype = filterNonHangul $ filterDecomposableType dtype $ done <$> Fold.foldl' step initial where initial = [] step st a = ord (_char a) : st done st = unlines [ apacheLicense moduleName , "module " <> moduleName , "(isDecomposable)" , "where" , "" , "import Data.Char (ord)" , "import Unicode.Internal.Bits (lookupBit64)" , "" , genBitmap "isDecomposable" (reverse st) ] genCombiningClassModule :: Monad m => String -> Fold m DetailedChar String genCombiningClassModule moduleName = Fold.filter (\dc -> _combiningClass dc /= 0) $ done <$> Fold.foldl' step initial where initial = ([], []) step (st1, st2) a = (genCombiningClassDef a : st1, ord (_char a) : st2) done (st1, st2) = unlines [ apacheLicense moduleName , "module " <> moduleName , "(combiningClass, isCombining)" , "where" , "" , "import Data.Char (ord)" , "import Unicode.Internal.Bits (lookupBit64)" , "" , "combiningClass :: Char -> Int" , unlines (reverse st1) , "combiningClass _ = 0\n" , "" , genBitmap "isCombining" (reverse st2) ] genCombiningClassDef dc = "combiningClass " <> show (_char dc) <> " = " <> show (_combiningClass dc) genDecomposeDefModule :: Monad m => String -> [String] -> [String] -> DType -> (Int -> Bool) -> Fold m DetailedChar String genDecomposeDefModule moduleName before after dtype pred = Fold.filter (pred . ord . _char) $ filterNonHangul $ filterDecomposableType dtype $ done <$> Fold.foldl' step initial where decomposeChar c DCSelf = [c] decomposeChar _c (DC ds) = ds genHeader = [ apacheLicense moduleName , "{-# OPTIONS_GHC -fno-warn-incomplete-patterns #-}" , "module " <> moduleName , "(decompose)" , "where" , "" ] genSign = [ "-- Note: this is a partial function we do not expect to call" , "-- this if isDecomposable returns false." , "{-# NOINLINE decompose #-}" , "decompose :: Char -> [Char]" ] initial = [] step st dc = genDecomposeDef dc : st done st = let body = mconcat [genHeader, before, genSign, reverse st, after] in unlines body genDecomposeDef dc = "decompose " <> show (_char dc) <> " = " <> show (decomposeChar (_char dc) (_decomposition dc)) genCompositionsModule :: Monad m => String -> [Int] -> [Int] -> Fold m DetailedChar String genCompositionsModule moduleName compExclu non0CC = Fold.filter (not . flip elem compExclu . ord . _char) $ filterNonHangul $ Fold.filter (isDecompositionLen2 . _decomposition) $ filterDecomposableType Canonical $ done <$> Fold.foldl' step initial where isDecompositionLen2 DCSelf = False isDecompositionLen2 (DC ds) = length ds == 2 genComposePairDef name dc = name <> " " <> show (head d01) <> " " <> show (d01 !! 1) <> " = Just " <> show (_char dc) where d01 = decompPair dc decompPair dc = case _decomposition dc of DCSelf -> error "toCompFormat: DCSelf" (DC ds) -> if length ds == 2 then ds else error "toCompFormat: length /= 2" initial = ([], [], []) step (dec, sp, ss) dc = (dec1, sp1, ss1) where d01 = decompPair dc d1Ord = ord $ d01 !! 1 dec1 = genComposePairDef "compose" dc : dec sp1 = if d1Ord `notElem` non0CC then genComposePairDef "composeStarters" dc : sp else sp ss1 = if d1Ord `notElem` non0CC then d1Ord : ss else ss header = [ apacheLicense moduleName , "{-# OPTIONS_GHC -fno-warn-incomplete-patterns #-}" , "module " <> moduleName , "(compose, composeStarters, isSecondStarter)" , "where" , "" , "import Data.Char (ord)" , "import Unicode.Internal.Bits (lookupBit64)" , "" ] composePair decomps = [ "{-# NOINLINE compose #-}" , "compose :: Char -> Char -> Maybe Char" , unlines decomps , "compose _ _ = " <> "Nothing" <> "\n" , "" ] composeStarterPair starterPairs = [ "composeStarters :: Char -> Char -> Maybe Char" , unlines starterPairs , "composeStarters _ _ = " <> "Nothing" <> "\n" , "" ] isSecondStarter secondStarters = [genBitmap "isSecondStarter" secondStarters] done (dec, sp, ss) = unlines $ header ++ composePair (reverse dec) ++ composeStarterPair (reverse sp) ++ isSecondStarter (Set.toList (Set.fromList ss)) genSimpleCaseMappingModule :: Monad m => String -> String -> (DetailedChar -> Maybe Char) -> Fold m DetailedChar String genSimpleCaseMappingModule moduleName funcName field = done <$> Fold.foldl' step initial where genHeader = [ apacheLicense moduleName , "module " <> moduleName , "(" ++ funcName ++ ")" , "where" , "" ] genSign = [ "{-# NOINLINE " ++ funcName ++ " #-}" , funcName ++ " :: Char -> Char" ] initial = [] step ds dc = case genUpper dc of Nothing -> ds Just d -> d : ds after = [funcName ++ " c = c"] done st = let body = mconcat [genHeader, genSign, reverse st, after] in unlines body genUpper dc = field dc <&> \c -> mconcat [ funcName , " " , show (_char dc) , " = " , show c ] genCorePropertiesModule :: Monad m => String -> (String -> Bool) -> Fold m (String, [Int]) String genCorePropertiesModule moduleName isProp = Fold.filter (\(name, _) -> isProp name) $ done <$> Fold.foldl' step initial where prop2FuncName x = "is" ++ x initial = ([], []) step (props, bitmaps) (name, bits) = (name : props, genBitmap (prop2FuncName name) bits : bitmaps) done (props, bitmaps) = unlines $ header props ++ bitmaps header exports = [ apacheLicense moduleName , "module " <> moduleName , "(" ++ unwords (intersperse "," (map prop2FuncName exports)) ++ ")" , "where" , "" , "import Data.Char (ord)" , "import Unicode.Internal.Bits (lookupBit64)" ] ------------------------------------------------------------------------------- -- Parsing property files ------------------------------------------------------------------------------- trim :: String -> String trim = takeWhile (not . isSpace) . dropWhile isSpace type PropertyLine = (String, [Int]) emptyPropertyLine :: PropertyLine emptyPropertyLine = ("", []) combinePropertyLines :: PropertyLine -> PropertyLine -> PropertyLine combinePropertyLines t1@(n1, o1) t2@(n2, o2) | n1 == "" = t2 | n2 == "" = t1 | n1 == n2 = (n1, o1 ++ o2) | otherwise = error $ "Cannot group " ++ n1 ++ " with " ++ n2 parsePropertyLine :: String -> PropertyLine parsePropertyLine ln | null ln = emptyPropertyLine | head ln == '#' = emptyPropertyLine | otherwise = parseLineJ ln where parseLineJ :: String -> (String, [Int]) parseLineJ line = let (rangeLn, line1) = span (/= ';') line propLn = takeWhile (/= '#') (tail line1) in (trim propLn, parseRange (trim rangeLn)) parseRange :: String -> [Int] parseRange rng = if '.' `elem` rng then let low = read $ "0x" ++ takeWhile (/= '.') rng high = read $ "0x" ++ reverse (takeWhile (/= '.') (reverse rng)) in [low .. high] else [read $ "0x" ++ rng] isDivider :: String -> Bool isDivider x = x == "# ================================================" parsePropertyLines :: (IsStream t, Monad m) => t m String -> t m PropertyLine parsePropertyLines = Stream.splitOn isDivider $ Fold.lmap parsePropertyLine $ Fold.foldl' combinePropertyLines emptyPropertyLine -- | A range entry in @UnicodeData.txt@. data UnicodeDataRange = SingleCode !DetailedChar -- ^ Regular entry for one code point | FirstCode !String !DetailedChar -- ^ A partial range for entry with a name as: @\@ | CompleteRange !String !DetailedChar !DetailedChar -- ^ A complete range, requiring 2 continuous entries with respective names: -- -- * @\@ -- * @\@ {-| Parse UnicodeData.txt lines Parse ranges according to https://www.unicode.org/reports/tr44/#Code_Point_Ranges. __Note:__ this does /not/ fill missing char entries, i.e. entries with no explicit entry nor within a range. -} parseUnicodeDataLines :: forall t m. (IsStream t, Monad m) => t m String -> t m DetailedChar parseUnicodeDataLines = Stream.unfoldMany (Unfold.unfoldr unitToRange) . Stream.foldMany ( Fold.lmap parseDetailedChar $ Fold.mkFold_ step initial ) where step :: Maybe UnicodeDataRange -> DetailedChar -> Fold.Step (Maybe UnicodeDataRange) (Maybe UnicodeDataRange) step Nothing dc = case span (/= ',') (_name dc) of (range, ", First>") -> Fold.Partial (Just (FirstCode range dc)) _ -> Fold.Done (Just (SingleCode dc)) step (Just (FirstCode range1 dc1)) dc2 = case span (/= ',') (_name dc2) of (range2, ", Last>") -> if range1 == range2 && _char dc1 < _char dc2 then Fold.Done (Just (CompleteRange range1 dc1 dc2)) else error $ "Cannot create range: incompatible ranges" <> show (dc1, dc2) _ -> error $ "Cannot create range: missing entry correspong to: " <> show range1 step _ _ = error "impossible case" initial :: Fold.Step (Maybe UnicodeDataRange) (Maybe UnicodeDataRange) initial = Fold.Partial Nothing unitToRange :: Maybe UnicodeDataRange -> Maybe (DetailedChar, Maybe UnicodeDataRange) unitToRange = fmap $ \case SingleCode dc -> (dc, Nothing) FirstCode _ dc -> error $ "Incomplete range: " <> show dc CompleteRange range dc1 dc2 -> if _char dc1 < _char dc2 -- [TODO] Create the proper name then (dc1{_name="TODO"}, Just (CompleteRange range dc1{_char=succ (_char dc1)} dc2)) else (dc2{_name="TODO"}, Nothing) -- | Parse a single entry of @UnicodeData.txt@ parseDetailedChar :: String -> DetailedChar parseDetailedChar line = DetailedChar { _char = readCodePoint char , _name = name , _generalCategory = read gc , _combiningClass = read combining , _decompositionType = dctype , _decomposition = dcval , _simpleUppercaseMapping = readCodePointM sUpper , _simpleLowercaseMapping = readCodePointM sLower , _simpleTitlecaseMapping = readCodePointM sTitle } where (char, line1) = span (/= ';') line (name, line2) = span (/= ';') (tail line1) (gc, line3) = span (/= ';') (tail line2) (combining, line4) = span (/= ';') (tail line3) (_bidi, line5) = span (/= ';') (tail line4) (decomposition, line6) = span (/= ';') (tail line5) (dctype, dcval) = readDecomp decomposition (_decimal, line7) = span (/= ';') (tail line6) (_digit, line8) = span (/= ';') (tail line7) (_numeric, line9) = span (/= ';') (tail line8) (_bidiM, line10) = span (/= ';') (tail line9) (_uni1Name, line11) = span (/= ';') (tail line10) (_iso, line12) = span (/= ';') (tail line11) (sUpper, line13) = span (/= ';') (tail line12) (sLower, line14) = span (/= ';') (tail line13) sTitle = tail line14 ------------------------------------------------------------------------------- -- Generation ------------------------------------------------------------------------------- readLinesFromFile :: String -> SerialT IO String readLinesFromFile file = withFile file Sys.ReadMode $ \h -> Stream.unfold Handle.read h & Unicode.decodeUtf8 & unicodeLines Fold.toList where unicodeLines = Stream.splitOnSuffix (== '\n') withFile file_ mode = Stream.bracket (liftIO $ Sys.openFile file_ mode) (liftIO . Sys.hClose) moduleToFileName :: String -> String moduleToFileName = map (\x -> if x == '.' then '/' else x) dirFromFileName :: String -> String dirFromFileName = reverse . dropWhile (/= '/') . reverse -- ModuleRecipe is a tuple of the module name and a function that generates the -- module using the module name type ModuleRecipe a = (String, String -> Fold IO a String) -- GeneratorRecipe is a list of ModuleRecipe type GeneratorRecipe a = [ModuleRecipe a] fileEmitter :: String -> String -> ModuleRecipe a -> Fold IO a () fileEmitter file outdir (modName, fldGen) = Fold.rmapM action $ fldGen modName where pretext version = mconcat [ "-- autogenerated from https://www.unicode.org/Public/" , version , "/ucd/" , file ,"\n" ] outfile = outdir <> moduleToFileName modName <> ".hs" outfiledir = dirFromFileName outfile action c = do version <- catch (getEnv "UNICODE_VERSION") (\(_ :: IOException) -> return "") createDirectoryIfMissing True outfiledir writeFile outfile (pretext version ++ c) runGenerator :: String -> String -> (SerialT IO String -> SerialT IO a) -> String -> GeneratorRecipe a -> IO () runGenerator indir file transformLines outdir recipes = readLinesFromFile (indir <> file) & transformLines & Stream.fold combinedFld where generatedFolds = map (fileEmitter file outdir) recipes combinedFld = void $ Fold.distribute generatedFolds genModules :: String -> String -> [String] -> IO () genModules indir outdir props = do compExclu <- readLinesFromFile (indir <> "DerivedNormalizationProps.txt") & parsePropertyLines & Stream.find (\(name, _) -> name == "Full_Composition_Exclusion") & fmap (snd . fromMaybe ("", [])) non0CC <- readLinesFromFile (indir <> "extracted/DerivedCombiningClass.txt") & parsePropertyLines & Stream.filter (\(name, _) -> name /= "0") & Stream.map snd & Stream.fold (Fold.foldl' (++) []) runGenerator indir "UnicodeData.txt" parseUnicodeDataLines outdir [ compositions compExclu non0CC , combiningClass , decomposable , decomposableK , decompositions , decompositionsK2 , decompositionsK , generalCategory , simpleUpperCaseMapping , simpleLowerCaseMapping , simpleTitleCaseMapping ] runGenerator indir "PropList.txt" parsePropertyLines outdir [ propList ] runGenerator indir "DerivedCoreProperties.txt" parsePropertyLines outdir [ derivedCoreProperties ] where propList = ("Unicode.Internal.Char.PropList" , (`genCorePropertiesModule` (`elem` props))) derivedCoreProperties = ("Unicode.Internal.Char.DerivedCoreProperties" , (`genCorePropertiesModule` (`elem` props))) compositions exc non0 = ( "Unicode.Internal.Char.UnicodeData.Compositions" , \m -> genCompositionsModule m exc non0) combiningClass = ( "Unicode.Internal.Char.UnicodeData.CombiningClass" , genCombiningClassModule) decomposable = ( "Unicode.Internal.Char.UnicodeData.Decomposable" , (`genDecomposableModule` Canonical)) decomposableK = ( "Unicode.Internal.Char.UnicodeData.DecomposableK" , (`genDecomposableModule` Kompat)) decompositions = ( "Unicode.Internal.Char.UnicodeData.Decompositions" , \m -> genDecomposeDefModule m [] [] Canonical (const True)) decompositionsK2 = ( "Unicode.Internal.Char.UnicodeData.DecompositionsK2" , \m -> genDecomposeDefModule m [] [] Kompat (>= 60000)) decompositionsK = let pre = ["import qualified " <> fst decompositionsK2 <> " as DK2", ""] post = ["decompose c = DK2.decompose c"] in ( "Unicode.Internal.Char.UnicodeData.DecompositionsK" , \m -> genDecomposeDefModule m pre post Kompat (< 60000)) generalCategory = ( "Unicode.Internal.Char.UnicodeData.GeneralCategory" , genGeneralCategoryModule) simpleUpperCaseMapping = ( "Unicode.Internal.Char.UnicodeData.SimpleUpperCaseMapping" , \m -> genSimpleCaseMappingModule m "toSimpleUpperCase" _simpleUppercaseMapping) simpleLowerCaseMapping = ( "Unicode.Internal.Char.UnicodeData.SimpleLowerCaseMapping" , \m -> genSimpleCaseMappingModule m "toSimpleLowerCase" _simpleLowercaseMapping) simpleTitleCaseMapping = ( "Unicode.Internal.Char.UnicodeData.SimpleTitleCaseMapping" , \m -> genSimpleCaseMappingModule m "toSimpleTitleCase" _simpleTitlecaseMapping)