summaryrefslogtreecommitdiff
path: root/parser/chaibez.fnl
blob: d42a4ae754dfec14ab3110c02248beb54315c007 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
(local peg
 (if (pick-values 1 (pcall require :lpeg))
   (require :lpeg)
   (require :lpeglj)))
(local parser (require :parser.parser))
(local number (require :lib.number))
(local fetcher (require :fetcher))

(fn format-url [path page]
  "Build the listing URL for category `path`.
  Pages greater than 1 get a `?page=N` query string appended; otherwise the
  bare category URL is returned."
  (let [query (if (> page 1)
                  (.. "?page=" page)
                  "")]
    (.. "https://chaibez.ru/" path "/" query)))

;; Pattern describing a single product card on a listing page.
;; It is a sequence (`*`) of four parts, each wrapped in `parser.anywhere`:
;; image block, caption block, price block and the add-to-cart button.
;; Named groups created with `peg.Cg` here: url, image, title, prefix,
;; amount, weight, price.
;; NOTE(review): `parser.anywhere`, `parser.tag` and `parser.till` are defined
;; in parser.parser and not visible here; presumably `anywhere` skips ahead to
;; the first match and an attribute value of "*" matches any value -- confirm.
(local product-peg
  (*
   ;; Part 1: <div class="image"> holding a link; captures the link target
   ;; (:url) and the value of the first `src="..."` inside it (:image).
   (parser.anywhere
    (parser.tag :div {:class "image"}
     (parser.tag :a {:href (peg.Cg (parser.till "\"") :url) :class "*"}
      (*
       (parser.anywhere (* "src=\"" (peg.Cg (parser.till "\"") :image) "\""))
       (parser.till "</a>")))))
   ;; Part 2: caption block with an <h4> heading link; captures the link text
   ;; as :title.
   ;; NOTE(review): :url is captured a second time here; presumably the later
   ;; capture overrides the one from the image link -- confirm.
   (parser.anywhere
    (*
      "<div class=\"caption\">"
      parser.pegs.spaces
      (parser.tag :h4 {}
       (*
        (parser.tag :a {:href (peg.Cg (parser.till "\"") :url)}
         (peg.Cg (parser.till "</a>") :title))
        (parser.till "</h4>")))))
   ;; Part 3: price information. Same shop engine as the artoftea parser.
   ;; Ordered choice (`+`): first try "selected option followed by a price
   ;; span", otherwise fall back to a price span alone.
   (parser.anywhere
    (+
     (*
      (+
        ;; Selected option without a discount: :amount comes from data-price.
        ;; NOTE(review): this alternative is tried first; confirm it cannot
        ;; also match an option that carries data-special.
        (parser.tag :option {:data-price-prefix (peg.Cg (parser.till "\"") :prefix)
                             :data-price (peg.Cg (parser.till "\"") :amount)
                             :value "*" :selected "selected"}
         (peg.Cg (parser.till "</option>") :weight))
        ;; Selected option with a discount: data-price is ignored and :amount
        ;; comes from data-special instead.
        (parser.tag :option {:data-price-prefix (peg.Cg (parser.till "\"") :prefix)
                             :data-price "*"
                             :data-special (peg.Cg (parser.till "\"") :amount)
                             :value "*" :selected "selected"}
         (peg.Cg (parser.till "</option>") :weight)))
      ;; The price span following the option supplies :price.
      (parser.anywhere
       (parser.tag :span {:data-price (peg.Cg (parser.till "\"") :price)
                          :class "*"}
        (parser.till "</span>"))))
     ;; Product without options: only :price is captured (no :prefix, :amount
     ;; or :weight).
     (parser.tag :span {:data-price (peg.Cg (parser.till "\"") :price)
                        :class "*"}
      (parser.till "</span>"))))
   ;; Part 4: the card must contain a span with the text "В корзину"
   ;; ("Add to cart"); presumably this excludes products that cannot be
   ;; ordered -- confirm.
   (parser.anywhere (parser.tag :span {:class "*"} "В корзину"))))

(fn normalize [product]
  "Convert a raw capture table into a catalogue entry.

  Reads `title`, `url`, `description`, `image`, `weight`, `amount`, `price`
  and `prefix` from `product` (all optional except `title` and `price`).
  Returns a table with the keys `site`, `title`, `url`, `description`,
  `image`, `year`, `price`, `weight`, `volume` and `price-per`.
  `price` and `price-per` are nil when the price cannot be determined."
  (local year (parser.guess-year product.title))
  ;; Prefer the weight found in the selected option text; fall back to the
  ;; product title when the option yields nothing.
  (local weight (or (parser.guess-weight product.weight ["г"])
                    (parser.guess-weight product.title)))
  ;; Without a captured option amount use 1, the neutral multiplier.
  (local amount (if product.amount
                  (number.string->number product.amount)
                  1))
  (local price (number.string->number product.price))
  ;; The option prefix decides how the option amount combines with the price:
  ;; "*" multiplies, "=" replaces, anything else keeps the listed price.
  (local final-price (if (= product.prefix "*")
                          ;; Guard the multiplication: an unparsable price or
                          ;; amount must yield nil instead of raising, which
                          ;; is what the price-per check below expects.
                          (and price amount (* price amount))
                         (= product.prefix "=")
                          amount
                         price))

  {:site "chaibez"
   :title product.title
   :url product.url
   :description product.description
   :image product.image
   :year year
   :price final-price
   :weight weight
   :volume (parser.guess-volume product.title)
   ;; Price per unit of weight, rounded up to one decimal place; only computed
   ;; for a known price and a positive weight.
   :price-per (when (and final-price weight (< 0 weight))
                (/ (math.ceil (* (/ final-price weight) 10)) 10))})

 (fn products []
   "Fetch every catalogue category of the shop.
   Passes the category list (URL path plus tags) to `fetcher.from-html`
   together with the URL builder, the product pattern and the normalizer,
   and returns whatever that call returns."
   (let [categories
         [;; teas
          {:path "red_tea" :tags ["Красный чай"]}
          {:path "green_tea" :tags ["Зеленый чай"]}
          {:path "puer/shu_puer" :tags ["Шу пуэр"]}
          {:path "puer/rassypnoj-puer" :tags ["Шу пуэр"]}
          {:path "puer/shen_puer" :tags ["Шен пуэр"]}
          {:path "ulun/svetliy-ulun" :tags ["Улун"]}
          {:path "ulun/temniy-ulun" :tags ["Улун" "Уишань"]}
          {:path "ulun/ulun-guandun" :tags ["Улун" "Гуандун"]}
          {:path "ulun/gaba" :tags ["Улун" "Габа"]}
          {:path "ulun/taivan-ulun" :tags ["Улун" "Тайвань"]}
          {:path "white_tea" :tags ["Белый чай"]}
          {:path "yellow-tea" :tags ["Желтый чай"]}
          {:path "xej-cha-chernyj-chaj" :tags ["Хэй ча"]}
          ;; teaware
          {:path "posuda/gajvani" :tags ["Посуда" "Гайвань"]}
          {:path "posuda/kolba-station" :tags ["Посуда" "Стекло"]}
          {:path "posuda/chahai" :tags ["Посуда" "Чахай"]}
          {:path "posuda/isinskie-chajniki" :tags ["Посуда" "Чайник" "Исин"]}
          {:path "posuda/pials" :tags ["Посуда" "Пиала"]}
          {:path "posuda/chajniki-s-knopkoi" :tags ["Посуда" "Типот"]}
          ;; accessories
          {:path "aksessuary/chabani-chajnye-dosk" :tags ["Чабань"]}
          {:path "aksessuary/figurki" :tags ["Фигурка"]}
          {:path "aksessuary/instrumenty-kistochki-shhipcy-shilo" :tags ["Инструмент"]}
          {:path "aksessuary/chaxe-sitechki" :tags ["Сито"]}
          {:path "aksessuary/cases" :tags ["Чехол"]}
          ;; herbal tea
          {:path "trav_tea" :tags ["Травяной чай"]}]]
     (fetcher.from-html categories format-url product-peg normalize)))

;; Module value: the shop's display title, its home page URL and the
;; `products` entry point.
{:title "Чай без церемоний"
 :url "https://chaibez.ru"
 :products products}