punkt-0.1.0: Multilingual unsupervised sentence tokenization with Punkt.

Safe Haskell: None
Language: Haskell2010

NLP.Punkt

Documentation

data Entity a [Source]

Constructors

Word a Bool 
Punct a 
ParaStart 
Ellipsis 
Dash 

Instances

Eq a => Eq (Entity a) 
Show a => Show (Entity a) 

data Token [Source]

Constructors

Token 

Fields

offset :: Int
 
toklen :: Int
 
entity :: Entity Text
 
sentend :: Bool
 
abbrev :: Bool
 

Instances