unicode-data-parser-0.1.0.1: Parsers for Unicode Character Database (UCD) files
Copyright: (c) 2024 Pierre Le Marre
Maintainer: dev@wismill.eu
Stability: experimental
Safe Haskell: None
Language: GHC2021

UCD.Parser.UnicodeData

Description

Parser for UnicodeData.txt.

Since: 0.1.0

Synopsis

Documentation

data GeneralCategory Source #

Constructors

Lu

Letter, Uppercase

Ll

Letter, Lowercase

Lt

Letter, Titlecase

Lm

Letter, Modifier

Lo

Letter, Other

Mn

Mark, Non-Spacing

Mc

Mark, Spacing Combining

Me

Mark, Enclosing

Nd

Number, Decimal

Nl

Number, Letter

No

Number, Other

Pc

Punctuation, Connector

Pd

Punctuation, Dash

Ps

Punctuation, Open

Pe

Punctuation, Close

Pi

Punctuation, Initial quote

Pf

Punctuation, Final quote

Po

Punctuation, Other

Sm

Symbol, Math

Sc

Symbol, Currency

Sk

Symbol, Modifier

So

Symbol, Other

Zs

Separator, Space

Zl

Separator, Line

Zp

Separator, Paragraph

Cc

Other, Control

Cf

Other, Format

Cs

Other, Surrogate

Co

Other, Private Use

Cn

Other, Not Assigned

data Decomposition Source #

Unicode decomposition of a code point

Since: 0.1.0

Constructors

Self 
Decomposition !DecompositionType ![Char] 

Instances

Instances details
Show Decomposition Source # 
Instance details

Defined in UCD.Parser.UnicodeData

Methods

showsPrec :: Int -> Decomposition -> ShowS

show :: Decomposition -> String

showList :: [Decomposition] -> ShowS

Eq Decomposition Source # 
Instance details

Defined in UCD.Parser.UnicodeData

data Entry Source #

An entry in UnicodeData.txt.

Since: 0.1.0

Constructors

Entry 

Fields

Instances

Instances details
Show Entry Source # 
Instance details

Defined in UCD.Parser.UnicodeData

Methods

showsPrec :: Int -> Entry -> ShowS

show :: Entry -> String

showList :: [Entry] -> ShowS

Eq Entry Source # 
Instance details

Defined in UCD.Parser.UnicodeData

Methods

(==) :: Entry -> Entry -> Bool

(/=) :: Entry -> Entry -> Bool

data NumericValue Source #

Numeric value of a code point, if relevant

Since: 0.1.0

Constructors

NotNumeric 
Digit !Word8 
Integer !Integer 
Rational !Rational 

Instances

Instances details
Show NumericValue Source # 
Instance details

Defined in UCD.Parser.UnicodeData

Methods

showsPrec :: Int -> NumericValue -> ShowS

show :: NumericValue -> String

showList :: [NumericValue] -> ShowS

Eq NumericValue Source # 
Instance details

Defined in UCD.Parser.UnicodeData

Methods

(==) :: NumericValue -> NumericValue -> Bool

(/=) :: NumericValue -> NumericValue -> Bool

data CharDetails Source #

Core characteristics of a Unicode code point

Since: 0.1.0

Instances

Instances details
Show CharDetails Source # 
Instance details

Defined in UCD.Parser.UnicodeData

Methods

showsPrec :: Int -> CharDetails -> ShowS

show :: CharDetails -> String

showList :: [CharDetails] -> ShowS

Eq CharDetails Source # 
Instance details

Defined in UCD.Parser.UnicodeData

Methods

(==) :: CharDetails -> CharDetails -> Bool

(/=) :: CharDetails -> CharDetails -> Bool

parse :: ByteString -> [Entry] Source #

Parser for the UnicodeData.txt file.

Since: 0.1.0