-- | Scraper for a names listing published under the Buenos Aires city
-- government site (see the URL in 'fromWeb').
--
-- The only export is 'scrap', which runs the HXT arrow pipeline and returns
-- the extracted strings.
module Web.NombreGenerator.Scrapper.BsAs (scrap) where

import Text.XML.HXT.Core
import Text.HandsomeSoup

-- | Document source that fetches the listing over HTTP.
--
-- Not wired into 'getDoc' at the moment (its use there is commented out).
fromWeb :: IOSLA (XIOState ()) XmlTree XmlTree
fromWeb = fromUrl "http://www.buenosaires.gob.ar/areas/registrocivil/nombres/busqueda/imprimir.php?sexo=ambos"

-- | Document source that reads the local file @Nombres.html@.
--
-- The document is parsed as HTML with ISO Latin-1 input encoding; namespace
-- checking, MIME-type based parser selection and warnings are switched off.
fromFile :: IOSLA (XIOState ()) XmlTree XmlTree
fromFile =
  readDocument
    [ withParseHTML yes
    , withInputEncoding isoLatin1
    , withCheckNamespaces no
    , withParseByMimeType no
    , withWarnings no
    ]
    "Nombres.html"

-- | Obtain the document to scrape, emitting a level-0 trace message before
-- and after loading it.
getDoc :: IOSLA (XIOState ()) XmlTree XmlTree
getDoc =
  traceMsg 0 "Downloading..." >>>
  -- fromWeb >>>   (disabled; presumably meant as an alternative to 'fromFile')
  fromFile >>>
  traceMsg 0 "Parsing..."

-- | Run the scraper and return one string per table row that had cell text.
scrap :: IO [String]
scrap = runX findNames

-- | Arrow yielding, for every row matched by the CSS selector
-- @.contenido tbody tr@, the first text node found among that row's @td@
-- cells.
--
-- Rows that contain no @td@ text at all (e.g. rows built only from other
-- elements) are skipped.  The previous implementation applied 'head' to the
-- per-row list and therefore crashed the whole run on such a row.
findNames :: IOSLA (XIOState ()) XmlTree String
findNames =
  getDoc
    >>> css ".contenido tbody tr"
    -- 'listA' gathers all cell texts of one row into a single list result;
    -- 'concatMap (take 1)' keeps its first element, or nothing when the
    -- list is empty (total replacement for @map head@).
    >>> (listA cellTexts >>. concatMap (take 1))
  where
    -- Text nodes that are direct children of the row's @td@ children.
    cellTexts = getChildren >>> hasName "td" /> getText