summaryrefslogtreecommitdiff
path: root/parser/artoftea.fnl
blob: c8f25ee995ca8a650404d11feeaedd407182a0ec (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
;; PEG library handle: use `lpeg` when it can be required, otherwise fall
;; back to `lpeglj`.
(local peg
  (let [(loaded? lpeg-module) (pcall require :lpeg)]
    (if loaded?
        lpeg-module
        (require :lpeglj))))
(local parser (require :parser.parser))
(local number (require :lib.number))
(local fetcher (require :fetcher))

(fn format-url [path page]
  "Build the listing URL for category `path`.
The `?page=N` query is appended only when `page` is greater than 1."
  (let [query (if (> page 1)
                  (.. "?page=" page)
                  "")]
    (.. "https://artoftea.ru/" path query)))

;; Grammar for one product card on a listing page.
;; Named group captures: url, image, title, price, and -- when a selected
;; <option> is matched -- prefix, amount and weight.
;; NOTE(review): the exact matching rules of parser.tag / parser.anywhere /
;; parser.till (including what a "*" attribute value means) are defined in
;; parser.parser and are not visible here -- confirm there.
(local product-peg
  (let [quoted (fn [capture-name]
                 ;; text up to the next double quote, captured under a name
                 (peg.Cg (parser.till "\"") capture-name))
        image-block
        (parser.tag :div {:class "product-thumb__image"}
         (parser.tag :a {:href (quoted :url) :title "*"}
          (* (parser.anywhere (* "src=\"" (quoted :image) "\""))
             (parser.till "</a>"))))
        name-link
        (parser.tag :a {:class "product-thumb__name" :href "*"}
         (peg.Cg (parser.till "</a>") :title))
        ;; selected option without discount: amount comes from data-price
        regular-option
        (parser.tag :option {:data-price-prefix (quoted :prefix)
                             :data-price (quoted :amount)
                             :value "*" :selected "selected"}
         (peg.Cg (parser.till "</option>") :weight))
        ;; selected option with discount: amount comes from data-special
        discounted-option
        (parser.tag :option {:data-price-prefix (quoted :prefix)
                             :data-price "*"
                             :data-special (quoted :amount)
                             :value "*" :selected "selected"}
         (peg.Cg (parser.till "</option>") :weight))
        price-span
        (parser.tag :span {:data-price (quoted :price)
                           :class "*"}
         (parser.till "</span>"))
        cart-button (parser.tag :span {} "В корзину")]
    (* (parser.anywhere image-block)
       (parser.anywhere name-link)
       (parser.anywhere
        (+ (* (+ regular-option discounted-option)
              (parser.anywhere price-span))
           ;; without options
           price-span))
       (parser.anywhere cart-button))))

(fn normalize [product]
  "Turn the raw captures of one product card into the record returned for
the \"artoftea\" site.

The final price depends on `product.prefix`:
  \"*\" -> price multiplied by the option amount,
  \"=\" -> the option amount itself,
  anything else -> the base price.
When no option amount was captured, 1 is used in its place.
`:price-per` is price divided by weight, rounded up to one decimal place,
and is only present when both values exist and weight is positive."
  (let [title product.title
        year (parser.guess-year title)
        ;; prefer the option text (unit \"г\"), then fall back to the title
        weight (or (parser.guess-weight product.weight ["г"])
                   (parser.guess-weight title))
        option-amount (if product.amount
                          (number.string->number product.amount)
                          1)
        base-price (number.string->number product.price)
        total (if (= product.prefix "*") (* base-price option-amount)
                  (= product.prefix "=") option-amount
                  base-price)]
    {:site "artoftea"
     :title title
     :url product.url
     :description product.description
     :image product.image
     :year year
     :price total
     :weight weight
     :volume (parser.guess-volume title)
     :price-per (when (and total weight (> weight 0))
                  (/ (math.ceil (* (/ total weight) 10)) 10))}))

(fn products []
  "Hand the shop's category list to `fetcher.from-html` together with the
URL builder, the product grammar and the normalizer, and return its result.

Each entry is a category `:path` (passed to `format-url`) with optional
`:tags`. Every path appears once: a repeated entry would make the same
category be requested a second time.
NOTE(review): how `fetcher.from-html` uses `:tags` and paginates is not
visible in this file -- confirm in the fetcher module."
  (fetcher.from-html
    [{:path "redtea" :tags ["Красный чай"]}
     {:path "greentea" :tags ["Зеленый чай"]}
     {:path "puer/shu-puer" :tags ["Шу пуэр"]}
     {:path "puer/sheng-puer" :tags ["Шен пуэр"]}
     {:path "rassypnoi-puer"}
     {:path "oolong" :tags ["Улун"]}
     {:path "whitetea" :tags ["Белый чай"]}
     {:path "yellowtea" :tags ["Желтый чай"]}
     {:path "xej-cha-chernyj-chaj" :tags ["Хэй ча"]}
     {:path "posuda/gaiwans" :tags ["Посуда" "Гайвань"]}
     {:path "posuda/cups" :tags ["Посуда" "Пиала"]}
     {:path "posuda/chahai" :tags ["Посуда" "Чахай"]}
     {:path "posuda/chainiki-steklo-farfor" :tags ["Посуда" "Стекло"]}
     {:path "posuda/chainiki-isinskaya-glina" :tags ["Посуда" "Чайник" "Исин"]}
     {:path "posuda/chayniki-iz-keramiki-farfora" :tags ["Посуда" "Чайник" "Керамика"]}
     {:path "posuda/farfor-iz-tszindechzhen" :tags ["Посуда" "Цзиндэчжэнь"]}
     {:path "posuda/keramika-iz-tszyanshuy" :tags ["Посуда" "Чайник" "Цзяньшуй"]}
     {:path "posuda/keramika-iz-chaochzhou" :tags ["Посуда" "Чайник" "Чаочжоу"]}
     {:path "posuda/posuda-iz-tsinchzhou" :tags ["Посуда" "Чайник" "Гуанси"]}
     {:path "posuda/termosy-zavarochnyye-butylki" :tags ["Посуда" "Термос"]}
     {:path "posuda/sama-kamjove" :tags ["Посуда" "Типот"]}
     {:path "posuda/steklo" :tags ["Посуда" "Стекло"]}
     {:path "posuda/nabory" :tags ["Посуда" "Набор"]}
     {:path "posuda/ekskljuzivnaja-posuda" :tags ["Посуда" "Набор"]}
     {:path "accesories/chaban" :tags ["Чабань"]}
     {:path "accesories/instrumenty" :tags ["Инструмент"]}
     {:path "accesories/tea-toys" :tags ["Фигурка"]}
     {:path "accesories/chahe-strainers" :tags ["Сито"]}
     {:path "accesories/miscellaneous" :tags ["Аксессуар"]}
     {:path "accesories/firmenny-stil" :tags ["Мерч"]}
     {:path "accesories/stikery" :tags ["Мерч"]}
     {:path "upakovka" :tags ["Упаковка"]}
     {:path "eksklyuzivny-chay"}
     {:path "taiwan-tea" :tags ["Тайвань"]}]
    format-url
    product-peg
    normalize))

;; Module value: the `products` function plus the shop's display title and
;; base URL.
{:products products :title "Art of tea" :url "https://artoftea.ru"}