algebraic-graphs-io-0.1.5.1: I/O utilities and datasets for algebraic-graphs
Safe HaskellNone
LanguageHaskell2010

Algebra.Graph.IO.Datasets.LINQS.Citeseer

Description

Citeseer document classification dataset, from:

Qing Lu and Lise Getoor. "Link-based classification." ICML, 2003.

https://linqs.soe.ucsc.edu/data

Synopsis

Documentation

citeseerGraph :: IO (Graph ContentRow) Source #

Reconstruct the citation graph

NB: relies on the user having first stashed the dataset to local disk (see stash).

stash :: IO () Source #

Download, parse, serialize and save the dataset to local storage.

Two binary files will be created under the ./assets/citeseer/ directory.

data ContentRow Source #

Dataset row of the .content file

Constructors

CRow 

Fields

crId :: String
crFeatures :: Seq Int16
crClass :: DocClass

Instances

Instances details
Eq ContentRow Source # 
Instance details

Defined in Algebra.Graph.IO.Datasets.LINQS.Citeseer

Show ContentRow Source # 
Instance details

Defined in Algebra.Graph.IO.Datasets.LINQS.Citeseer

Generic ContentRow Source # 
Instance details

Defined in Algebra.Graph.IO.Datasets.LINQS.Citeseer

Associated Types

type Rep ContentRow :: Type -> Type #

Binary ContentRow Source # 
Instance details

Defined in Algebra.Graph.IO.Datasets.LINQS.Citeseer

type Rep ContentRow Source # 
Instance details

Defined in Algebra.Graph.IO.Datasets.LINQS.Citeseer

type Rep ContentRow = D1 ('MetaData "ContentRow" "Algebra.Graph.IO.Datasets.LINQS.Citeseer" "algebraic-graphs-io-0.1.5.1-5xxZnEUve6JKB9uqS79GZK" 'False) (C1 ('MetaCons "CRow" 'PrefixI 'True) (S1 ('MetaSel ('Just "crId") 'NoSourceUnpackedness 'NoSourceStrictness 'DecidedLazy) (Rec0 String) :*: (S1 ('MetaSel ('Just "crFeatures") 'NoSourceUnpackedness 'NoSourceStrictness 'DecidedLazy) (Rec0 (Seq Int16)) :*: S1 ('MetaSel ('Just "crClass") 'NoSourceUnpackedness 'NoSourceStrictness 'DecidedLazy) (Rec0 DocClass))))

data DocClass Source #

Document classes of the Citeseer dataset.

Constructors

Agents 
AI 
DB 
IR 
ML 
HCI 

Instances

Instances details
Eq DocClass Source # 
Instance details

Defined in Algebra.Graph.IO.Datasets.LINQS.Citeseer

Show DocClass Source # 
Instance details

Defined in Algebra.Graph.IO.Datasets.LINQS.Citeseer

Generic DocClass Source # 
Instance details

Defined in Algebra.Graph.IO.Datasets.LINQS.Citeseer

Associated Types

type Rep DocClass :: Type -> Type #

Methods

from :: DocClass -> Rep DocClass x #

to :: Rep DocClass x -> DocClass #

Binary DocClass Source # 
Instance details

Defined in Algebra.Graph.IO.Datasets.LINQS.Citeseer

Methods

put :: DocClass -> Put #

get :: Get DocClass #

putList :: [DocClass] -> Put #

type Rep DocClass Source # 
Instance details

Defined in Algebra.Graph.IO.Datasets.LINQS.Citeseer

type Rep DocClass = D1 ('MetaData "DocClass" "Algebra.Graph.IO.Datasets.LINQS.Citeseer" "algebraic-graphs-io-0.1.5.1-5xxZnEUve6JKB9uqS79GZK" 'False) ((C1 ('MetaCons "Agents" 'PrefixI 'False) (U1 :: Type -> Type) :+: (C1 ('MetaCons "AI" 'PrefixI 'False) (U1 :: Type -> Type) :+: C1 ('MetaCons "DB" 'PrefixI 'False) (U1 :: Type -> Type))) :+: (C1 ('MetaCons "IR" 'PrefixI 'False) (U1 :: Type -> Type) :+: (C1 ('MetaCons "ML" 'PrefixI 'False) (U1 :: Type -> Type) :+: C1 ('MetaCons "HCI" 'PrefixI 'False) (U1 :: Type -> Type))))