aboutsummaryrefslogtreecommitdiff
path: root/src/Parser/Utils.hs
blob: d72a1ceada0378d9bfd5b79165efbf8d133a0a25 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
module Parser.Utils
  ( getTagsBefore
  , getTagsAfter
  , getTagsBetween
  , getTagAttributes
  , getTagAttribute
  , getTagTextAfter
  ) where

import Data.List (find, findIndex)
import Data.Maybe (catMaybes, listToMaybe, mapMaybe)
import Data.Text (Text)
import qualified Data.Text as T

import Text.HTML.TagSoup

-- | Keep the leading tags of a stream, stopping just before the first tag
-- that matches @selector@ (as decided by TagSoup's '~==').
--
-- The matching tag itself is not included. If no tag matches, the whole
-- input is returned.
getTagsBefore :: String -> [Tag Text] -> [Tag Text]
getTagsBefore selector = fst . break (~== selector)

-- | Return every tag that follows the first tag matching @selector@
-- (as decided by TagSoup's '~/=' / '~==').
--
-- The matching tag itself is dropped. If no tag matches, the result is
-- the empty list.
getTagsAfter :: String -> [Tag Text] -> [Tag Text]
getTagsAfter selector tags =
  case dropWhile (~/= selector) tags of
    [] -> []
    _matched : rest -> rest

-- | Extract the tags lying strictly between two markers.
--
-- Everything up to and including the first tag matching @begin@ is
-- discarded ('getTagsAfter'); of what remains, only the tags preceding the
-- first match of @end@ are kept ('getTagsBefore'). Neither marker tag is
-- part of the result.
getTagsBetween :: String -> String -> [Tag Text] -> [Tag Text]
getTagsBetween begin end tags = getTagsBefore end afterBegin
  where
    afterBegin = getTagsAfter begin tags

-- | Collect the values of @attribute@ from every tag matching @selector@
-- (as decided by TagSoup's '~==').
--
-- Matching tags that do not carry the attribute contribute nothing, so the
-- result may be shorter than the number of matching tags. Values appear in
-- the same order as their tags in the input.
getTagAttributes :: String -> Text -> [Tag Text] -> [Text]
getTagAttributes selector attribute =
  -- 'mapMaybe' does the map-then-discard-Nothing step in a single pass.
  mapMaybe (maybeTagAttribute attribute)
  . filter (~== selector)

-- | Look up a single attribute value: the first one produced by
-- 'getTagAttributes' for the given @selector@ and @attribute@.
--
-- Yields 'Nothing' when no matching tag carries the attribute. Note that
-- this is the first matching tag /that has the attribute/, which need not
-- be the first matching tag overall.
getTagAttribute :: String -> Text -> [Tag Text] -> Maybe Text
getTagAttribute selector attribute tags =
  case getTagAttributes selector attribute tags of
    value : _ -> Just value
    [] -> Nothing

-- | Fetch the text carried by the tag immediately following the first tag
-- that matches @selector@ (as decided by TagSoup's '~==').
--
-- The text is stripped of surrounding whitespace with 'T.strip'. The
-- result is 'Nothing' when no tag matches, when the match is the last tag
-- in the list, or when 'maybeTagText' yields nothing for the following tag.
getTagTextAfter :: String -> [Tag Text] -> Maybe Text
getTagTextAfter selector tags = do
  position <- findIndex (~== selector) tags
  -- Only the tag directly after the match is inspected.
  follower <- safeGetAt (position + 1) tags
  T.strip <$> maybeTagText follower

-- | Read the value of the attribute called @name@ from a single tag.
--
-- Only 'TagOpen' tags are inspected; any other kind of tag yields
-- 'Nothing'. If the attribute name occurs more than once on the tag, the
-- value of the first occurrence is returned.
maybeTagAttribute :: Text -> Tag Text -> Maybe Text
maybeTagAttribute name (TagOpen _ attributes) = lookup name attributes
maybeTagAttribute _ _ = Nothing

-- | Total, zero-based list indexing.
--
-- Returns the element at position @index@, or 'Nothing' when the index is
-- negative or lies past the end of the list.
safeGetAt :: Int -> [a] -> Maybe a
safeGetAt index xs
  -- 'drop' treats a negative count as 0, which would silently hand back
  -- the head of the list; reject negative indices explicitly instead.
  | index < 0 = Nothing
  | otherwise = listToMaybe (drop index xs)