{-# LANGUAGE LambdaCase #-}
module Unicode.Char.General
(
GeneralCategory(..)
, generalCategoryAbbr
, generalCategory
, isAlphabetic
, isAlphaNum
, isControl
, isMark
, isPrint
, isPunctuation
, isSeparator
, isSymbol
, isWhiteSpace
, isLetter
, isSpace
, isAscii
, isLatin1
, isAsciiUpper
, isAsciiLower
, isJamo
, jamoNCount
, jamoLFirst
, jamoLCount
, jamoLIndex
, jamoLLast
, jamoVFirst
, jamoVCount
, jamoVIndex
, jamoVLast
, jamoTFirst
, jamoTCount
, jamoTIndex
, jamoTLast
, hangulFirst
, hangulLast
, isHangul
, isHangulLV
)
where
import Control.Exception (assert)
import Data.Char (isAscii, isLatin1, isAsciiUpper, isAsciiLower, ord)
import Data.Ix (Ix)
import Unicode.Internal.Division (quotRem28)
import qualified Unicode.Internal.Char.DerivedCoreProperties as P
import qualified Unicode.Internal.Char.PropList as P
import qualified Unicode.Internal.Char.UnicodeData.GeneralCategory as UC
-- | Unicode General Category of a character.
--
-- The constructor order is significant: 'generalCategory' turns an integer
-- code into a constructor with 'toEnum', and the derived 'Ord', 'Enum',
-- 'Bounded' and 'Ix' instances all follow declaration order. Do not reorder
-- or insert constructors without updating the code tables accordingly.
--
-- The two-letter code noted on each constructor is the abbreviation
-- returned by 'generalCategoryAbbr'.
data GeneralCategory
    = UppercaseLetter       -- ^ @Lu@
    | LowercaseLetter       -- ^ @Ll@
    | TitlecaseLetter       -- ^ @Lt@
    | ModifierLetter        -- ^ @Lm@
    | OtherLetter           -- ^ @Lo@
    | NonSpacingMark        -- ^ @Mn@
    | SpacingCombiningMark  -- ^ @Mc@
    | EnclosingMark         -- ^ @Me@
    | DecimalNumber         -- ^ @Nd@
    | LetterNumber          -- ^ @Nl@
    | OtherNumber           -- ^ @No@
    | ConnectorPunctuation  -- ^ @Pc@
    | DashPunctuation       -- ^ @Pd@
    | OpenPunctuation       -- ^ @Ps@
    | ClosePunctuation      -- ^ @Pe@
    | InitialQuote          -- ^ @Pi@
    | FinalQuote            -- ^ @Pf@
    | OtherPunctuation      -- ^ @Po@
    | MathSymbol            -- ^ @Sm@
    | CurrencySymbol        -- ^ @Sc@
    | ModifierSymbol        -- ^ @Sk@
    | OtherSymbol           -- ^ @So@
    | Space                 -- ^ @Zs@
    | LineSeparator         -- ^ @Zl@
    | ParagraphSeparator    -- ^ @Zp@
    | Control               -- ^ @Cc@
    | Format                -- ^ @Cf@
    | Surrogate             -- ^ @Cs@
    | PrivateUse            -- ^ @Co@
    | NotAssigned           -- ^ @Cn@
    deriving (Show, Eq, Ord, Enum, Bounded, Ix)
-- | Two-letter abbreviation of a 'GeneralCategory', e.g. @"Lu"@ for
-- 'UppercaseLetter' and @"Cn"@ for 'NotAssigned'.
--
-- The match is exhaustive over all constructors, so the function is total.
generalCategoryAbbr :: GeneralCategory -> String
generalCategoryAbbr = \case
    UppercaseLetter      -> "Lu"
    LowercaseLetter      -> "Ll"
    TitlecaseLetter      -> "Lt"
    ModifierLetter       -> "Lm"
    OtherLetter          -> "Lo"
    NonSpacingMark       -> "Mn"
    SpacingCombiningMark -> "Mc"
    EnclosingMark        -> "Me"
    DecimalNumber        -> "Nd"
    LetterNumber         -> "Nl"
    OtherNumber          -> "No"
    ConnectorPunctuation -> "Pc"
    DashPunctuation      -> "Pd"
    OpenPunctuation      -> "Ps"
    ClosePunctuation     -> "Pe"
    InitialQuote         -> "Pi"
    FinalQuote           -> "Pf"
    OtherPunctuation     -> "Po"
    MathSymbol           -> "Sm"
    CurrencySymbol       -> "Sc"
    ModifierSymbol       -> "Sk"
    OtherSymbol          -> "So"
    Space                -> "Zs"
    LineSeparator        -> "Zl"
    ParagraphSeparator   -> "Zp"
    Control              -> "Cc"
    Format               -> "Cf"
    Surrogate            -> "Cs"
    PrivateUse           -> "Co"
    NotAssigned          -> "Cn"
-- | The 'GeneralCategory' of a character.
--
-- The integer code produced by @UC.generalCategory@ is mapped to a
-- constructor with 'toEnum', so the generated table's codes must agree with
-- the declaration order of 'GeneralCategory'.
{-# INLINE generalCategory #-}
generalCategory :: Char -> GeneralCategory
generalCategory = toEnum . UC.generalCategory
-- | Whether a character has the @Alphabetic@ property, as reported by the
-- @isAlphabetic@ lookup imported under the @P@ alias.
--
-- Note that this is a property lookup, not a 'GeneralCategory' test, so it
-- need not agree with 'isAlphaNum'.
{-# INLINE isAlphabetic #-}
isAlphabetic :: Char -> Bool
isAlphabetic = P.isAlphabetic
-- | 'True' for characters whose 'GeneralCategory' is a letter
-- ('UppercaseLetter', 'LowercaseLetter', 'TitlecaseLetter',
-- 'ModifierLetter', 'OtherLetter') or a number ('DecimalNumber',
-- 'LetterNumber', 'OtherNumber'); 'False' otherwise.
isAlphaNum :: Char -> Bool
isAlphaNum c = case generalCategory c of
    UppercaseLetter -> True
    LowercaseLetter -> True
    TitlecaseLetter -> True
    ModifierLetter  -> True
    OtherLetter     -> True
    DecimalNumber   -> True
    LetterNumber    -> True
    OtherNumber     -> True
    _               -> False
-- | 'True' exactly when the character's 'GeneralCategory' is 'Control'.
isControl :: Char -> Bool
isControl c = case generalCategory c of
    Control -> True
    _       -> False
-- | 'True' for characters whose 'GeneralCategory' is one of the mark
-- categories: 'NonSpacingMark', 'SpacingCombiningMark' or 'EnclosingMark'.
isMark :: Char -> Bool
isMark c = case generalCategory c of
    NonSpacingMark       -> True
    SpacingCombiningMark -> True
    EnclosingMark        -> True
    _                    -> False
-- | 'True' for every character except those whose 'GeneralCategory' is
-- 'LineSeparator', 'ParagraphSeparator', 'Control', 'Format', 'Surrogate',
-- 'PrivateUse' or 'NotAssigned'.
--
-- The non-printable categories are listed explicitly and everything else
-- (including 'Space') is treated as printable.
isPrint :: Char -> Bool
isPrint c = case generalCategory c of
    LineSeparator      -> False
    ParagraphSeparator -> False
    Control            -> False
    Format             -> False
    Surrogate          -> False
    PrivateUse         -> False
    NotAssigned        -> False
    _                  -> True
-- | 'True' for characters whose 'GeneralCategory' is one of the punctuation
-- categories: 'ConnectorPunctuation', 'DashPunctuation', 'OpenPunctuation',
-- 'ClosePunctuation', 'InitialQuote', 'FinalQuote' or 'OtherPunctuation'.
isPunctuation :: Char -> Bool
isPunctuation c = case generalCategory c of
    ConnectorPunctuation -> True
    DashPunctuation      -> True
    OpenPunctuation      -> True
    ClosePunctuation     -> True
    InitialQuote         -> True
    FinalQuote           -> True
    OtherPunctuation     -> True
    _                    -> False
-- | Whether a character has the @White_Space@ property, as reported by the
-- @isWhite_Space@ lookup imported under the @P@ alias.
--
-- This is a property lookup rather than a 'GeneralCategory' test, so it is
-- not the same predicate as 'isSeparator'.
{-# INLINE isWhiteSpace #-}
isWhiteSpace :: Char -> Bool
isWhiteSpace = P.isWhite_Space
-- | 'True' for characters whose 'GeneralCategory' is one of the separator
-- categories: 'Space', 'LineSeparator' or 'ParagraphSeparator'.
isSeparator :: Char -> Bool
isSeparator c = case generalCategory c of
    Space              -> True
    LineSeparator      -> True
    ParagraphSeparator -> True
    _                  -> False
-- | 'True' for characters whose 'GeneralCategory' is one of the symbol
-- categories: 'MathSymbol', 'CurrencySymbol', 'ModifierSymbol' or
-- 'OtherSymbol'.
isSymbol :: Char -> Bool
isSymbol c = case generalCategory c of
    MathSymbol     -> True
    CurrencySymbol -> True
    ModifierSymbol -> True
    OtherSymbol    -> True
    _              -> False
-- | Deprecated synonym: identical to 'isAlphabetic' (both are defined as
-- @P.isAlphabetic@). Kept only for backward compatibility; see the
-- deprecation message for the recommended replacements.
{-# INLINE isLetter #-}
{-# DEPRECATED isLetter "Use isAlphabetic instead. Note that the behavior of this function does not match base:Data.Char.isLetter. See Unicode.Char.General.Compat for behavior compatible with base:Data.Char." #-}
isLetter :: Char -> Bool
isLetter = P.isAlphabetic
-- | Deprecated synonym: identical to 'isWhiteSpace' (both are defined as
-- @P.isWhite_Space@). Kept only for backward compatibility; see the
-- deprecation message for the recommended replacements.
{-# INLINE isSpace #-}
{-# DEPRECATED isSpace "Use isWhiteSpace instead. Note that the behavior of this function does not match base:Data.Char.isSpace. See Unicode.Char.General.Compat for behavior compatible with base:Data.Char." #-}
isSpace :: Char -> Bool
isSpace = P.isWhite_Space
-- | Code-point range of the Jamo @L@ block used by 'jamoLIndex':
-- first code point, number of code points, and last code point
-- (inclusive, derived from the other two).
jamoLFirst, jamoLCount, jamoLLast :: Int
jamoLFirst = 0x1100
jamoLCount = 19
jamoLLast = jamoLFirst + jamoLCount - 1
-- | Code-point range of the Jamo @V@ block used by 'jamoVIndex':
-- first code point, number of code points, and last code point
-- (inclusive, derived from the other two).
jamoVFirst, jamoVCount, jamoVLast :: Int
jamoVFirst = 0x1161
jamoVCount = 21
jamoVLast = jamoVFirst + jamoVCount - 1
-- | Base code point and size of the Jamo @T@ index space.
--
-- 'jamoTFirst' is the base from which 'jamoTIndex' computes its offset;
-- offset 0 (i.e. 'jamoTFirst' itself) is rejected by 'jamoTIndex', so the
-- first accepted code point is @jamoTFirst + 1@. 'isHangulLV' asserts that
-- 'jamoTCount' is 28.
jamoTFirst, jamoTCount :: Int
jamoTFirst = 0x11a7
jamoTCount = 28

-- | Last code point (inclusive) of the Jamo @T@ range, derived from
-- 'jamoTFirst' and 'jamoTCount'. Also the upper bound used by 'isJamo'.
jamoTLast :: Int
jamoTLast = jamoTFirst + jamoTCount - 1
-- | The constant 588, which equals @21 * 28@, i.e. the product of the values
-- of 'jamoVCount' and 'jamoTCount'. It is kept as a literal here rather
-- than computed.
jamoNCount :: Int
jamoNCount = 588
-- | Inclusive code-point bounds of the range tested by 'isHangul'.
--
-- 'hangulLast' is derived: the range holds
-- @jamoLCount * jamoVCount * jamoTCount@ code points starting at
-- 'hangulFirst'.
hangulFirst, hangulLast :: Int
hangulFirst = 0xac00
hangulLast = hangulFirst + jamoLCount * jamoVCount * jamoTCount - 1
-- | 'True' when the character's code point lies in the inclusive range
-- @['hangulFirst' .. 'hangulLast']@.
isHangul :: Char -> Bool
isHangul c = n >= hangulFirst && n <= hangulLast
  where
    n :: Int
    n = ord c
-- | 'True' when the offset of the character from 'hangulFirst' has a zero
-- remainder according to 'quotRem28'.
--
-- This function does not itself check that the character is in the Hangul
-- range. NOTE(review): callers presumably establish that with 'isHangul'
-- first; the result for other characters depends on how 'quotRem28' treats
-- out-of-range or negative offsets — confirm against its definition.
--
-- The 'assert' ties the hard-coded divisor in 'quotRem28' to 'jamoTCount':
-- if that constant ever changes, builds with assertions enabled will fail
-- here instead of silently computing the wrong remainder.
isHangulLV :: Char -> Bool
isHangulLV c =
    assert (jamoTCount == 28)
        (snd (quotRem28 (ord c - hangulFirst)) == 0)
-- | 'True' when the character's code point lies in the inclusive range
-- @['jamoLFirst' .. 'jamoTLast']@, i.e. the single contiguous span that
-- covers the @L@, @V@ and @T@ ranges defined in this module.
isJamo :: Char -> Bool
isJamo c = n >= jamoLFirst && n <= jamoTLast
  where
    n :: Int
    n = ord c
-- | Zero-based offset of a character within the Jamo @L@ range.
--
-- Returns @'Just' i@ with @0 <= i < 'jamoLCount'@ when the character lies in
-- @['jamoLFirst' .. 'jamoLLast']@, and 'Nothing' otherwise.
jamoLIndex :: Char -> Maybe Int
jamoLIndex c
    | index >= 0 && index < jamoLCount = Just index
    | otherwise = Nothing
  where
    index :: Int
    index = ord c - jamoLFirst
-- | Zero-based offset of a character within the Jamo @V@ range.
--
-- Returns @'Just' i@ with @0 <= i < 'jamoVCount'@ when the character lies in
-- @['jamoVFirst' .. 'jamoVLast']@, and 'Nothing' otherwise.
jamoVIndex :: Char -> Maybe Int
jamoVIndex c
    | index >= 0 && index < jamoVCount = Just index
    | otherwise = Nothing
  where
    index :: Int
    index = ord c - jamoVFirst
-- | Offset of a character from 'jamoTFirst' within the Jamo @T@ range.
--
-- Returns @'Just' i@ with @0 < i < 'jamoTCount'@, and 'Nothing' otherwise.
-- Unlike 'jamoLIndex' and 'jamoVIndex', the lower bound is strict: offset 0
-- ('jamoTFirst' itself) is deliberately rejected, so the smallest index
-- returned is 1.
jamoTIndex :: Char -> Maybe Int
jamoTIndex c
    | index > 0 && index < jamoTCount = Just index
    | otherwise = Nothing
  where
    index :: Int
    index = ord c - jamoTFirst