diff options
author | Joris | 2018-06-17 23:24:47 +0200 |
---|---|---|
committer | Joris | 2018-06-18 11:13:55 +0200 |
commit | 0a4d3c8f12dc5797a919a00b6bcaf759947687cc (patch) | |
tree | bcb89781e22c2314bf0c064ebb37cb7f8a362f5c /src/parser/haskell/Parser/OuestFranceParser.hs | |
parent | e2a5c7c5c596d057b6fa9c08a8204ce1429cfdc4 (diff) | |
download | ad-listener-0a4d3c8f12dc5797a919a00b6bcaf759947687cc.tar.gz ad-listener-0a4d3c8f12dc5797a919a00b6bcaf759947687cc.tar.bz2 ad-listener-0a4d3c8f12dc5797a919a00b6bcaf759947687cc.zip |
Add ouest france parser
Diffstat (limited to 'src/parser/haskell/Parser/OuestFranceParser.hs')
-rw-r--r-- | src/parser/haskell/Parser/OuestFranceParser.hs | 27 |
1 files changed, 27 insertions, 0 deletions
-- File: src/parser/haskell/Parser/OuestFranceParser.hs
-- (added as a new file by this commit: mode 100644, index 0000000..a7b6360)

-- | Extracts 'Ad' values from the HTML of a Ouest-France Immo listing page.
module Parser.OuestFranceParser
  ( parse
  ) where

import Data.Maybe (mapMaybe)
import Data.Text (Text)
import qualified Data.Text as T

import Text.HTML.TagSoup

import Model.Ad (Ad (Ad))

import Parser.Utils

-- | Parse the HTML of a listing page into the ads it contains.
--
-- Only the tags that 'getTagsBetween' yields for the @listAnnonces@ and
-- @interactions@ markers are considered (presumably the slice of the page
-- between those two @div@s; see "Parser.Utils"). That slice is cut into one
-- partition per @\<a\>@ tag, and every partition that 'parseAd' rejects is
-- dropped, so a page without usable ads gives @[]@.
parse :: Text -> [Ad]
parse page = mapMaybe parseAd adChunks
  where
    listing =
      getTagsBetween
        "<div id=listAnnonces>"
        "<div id=interactions>"
        (parseTags page)
    -- 'partitions' starts a new chunk at each tag matching the predicate.
    adChunks = partitions (~== "<a>") listing

-- | Build an 'Ad' from the tags of one partition.
--
-- The title (@annTitre@), the town (@annVille@) and the link's @href@ are
-- mandatory: if any of these lookups yields 'Nothing', the result is
-- 'Nothing'. The price (@annPrix@) lookup is not unwrapped; its result is
-- handed to 'Ad' as is, so a missing price does not reject the ad.
parseAd :: [Tag Text] -> Maybe Ad
parseAd tags = do
  name <- getTagTextAfter "<span class=annTitre>" tags
  location <- getTagTextAfter "<span class=annVille>" tags
  href <- getTagAttribute "<a>" (T.pack "href") tags
  let price = getTagTextAfter "<span class=annPrix>" tags
  pure (Ad name location price (absoluteUrl href))

-- | Root that relative listing links are resolved against.
baseUrl :: Text
baseUrl = T.pack "https://www.ouestfrance-immo.com/"

-- | Turn an @href@ value into a full URL.
--
-- An @href@ that already starts with @http://@ or @https://@ is returned
-- unchanged. Anything else is appended to 'baseUrl' after removing leading
-- slashes, because 'baseUrl' already ends with one; this avoids producing
-- @...com//path@ for root-relative links. An @href@ without a leading slash
-- gives the same result as plain concatenation.
absoluteUrl :: Text -> Text
absoluteUrl href
  | isAbsolute = href
  | otherwise = T.append baseUrl (T.dropWhile (== '/') href)
  where
    isAbsolute =
      any (`T.isPrefixOf` href) [T.pack "http://", T.pack "https://"]