blob: c8f25ee995ca8a650404d11feeaedd407182a0ec (
plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
|
;; PEG library used to build the grammar below: `lpeg` when it can be required,
;; otherwise the `lpeglj` module is required instead.
(local peg
  (let [(ok? lpeg) (pcall require :lpeg)]
    (if ok?
        lpeg
        (require :lpeglj))))
(local parser (require :parser.parser))
(local number (require :lib.number))
(local fetcher (require :fetcher))
;; Build the listing URL for the category `path`.
;; Page numbers greater than 1 are appended as a `?page=N` query string;
;; any other page number yields the bare category URL.
(fn format-url [path page]
  (let [base (.. "https://artoftea.ru/" path)]
    (if (> page 1)
        (.. base "?page=" page)
        base)))
;; Grammar describing one product card of a listing page.
;;
;; Named captures it can produce:
;;   url, image, title       - always
;;   prefix, amount, weight  - only when a selected <option> is matched
;;   price                   - from the <span data-price="..."> element
;;
;; The four parts are sequenced with `*`; alternatives are combined with `+`
;; and are written in the order: option without discount, option with
;; discount, card without options.
;; NOTE(review): the matching rules of parser.tag / parser.anywhere /
;; parser.till, and the meaning of the "*" attribute value, are defined in
;; parser.parser and are not visible here - confirm them there.
(local product-peg
  (let [;; Text up to the next double quote, captured under `capture-name`.
        quoted (fn [capture-name]
                 (peg.Cg (parser.till "\"") capture-name))
        ;; Text of the <option> element, captured as `weight`.
        option-label (fn []
                       (peg.Cg (parser.till "</option>") :weight))
        ;; <span data-price="..."> element; its attribute is captured as `price`.
        price-span (fn []
                     (parser.tag :span {:data-price (quoted :price)
                                        :class "*"}
                                 (parser.till "</span>")))
        ;; Product link and thumbnail image.
        thumbnail (parser.anywhere
                    (parser.tag :div {:class "product-thumb__image"}
                                (parser.tag :a {:href (quoted :url) :title "*"}
                                            (* (parser.anywhere
                                                 (* "src=\"" (quoted :image) "\""))
                                               (parser.till "</a>")))))
        ;; Product name link; its content is captured as `title`.
        name-link (parser.anywhere
                    (parser.tag :a {:class "product-thumb__name" :href "*"}
                                (peg.Cg (parser.till "</a>") :title)))
        ;; without discount
        regular-option (parser.tag :option {:data-price-prefix (quoted :prefix)
                                            :data-price (quoted :amount)
                                            :value "*" :selected "selected"}
                                   (option-label))
        ;; with discount
        discounted-option (parser.tag :option {:data-price-prefix (quoted :prefix)
                                               :data-price "*"
                                               :data-special (quoted :amount)
                                               :value "*" :selected "selected"}
                                      (option-label))
        ;; A selected option followed, somewhere later, by the price span.
        with-options (* (+ regular-option discounted-option)
                        (parser.anywhere (price-span)))
        ;; without options: the price span alone is the fallback alternative
        pricing (parser.anywhere (+ with-options (price-span)))
        ;; "add to cart" button that closes the card.
        cart-button (parser.anywhere (parser.tag :span {} "В корзину"))]
    (* thumbnail name-link pricing cart-button)))
;; Convert the raw capture table matched by product-peg into a product record.
;;
;; `product` fields read here: title, url, description, image, weight, amount,
;; price, prefix.
;;
;; The final price depends on `product.prefix`:
;;   "*" - price multiplied by amount
;;   "=" - amount is used as the price
;;   anything else (including nil) - price unchanged
;; `amount` defaults to 1 when the capture is absent.
;;
;; `:price-per` is the final price divided by the weight, rounded up to one
;; decimal place; it is nil when either value is missing or the weight is not
;; greater than zero.
(fn normalize [product]
  (let [title product.title
        year (parser.guess-year title)
        ;; Prefer the weight from the option label, fall back to the title.
        item-weight (or (parser.guess-weight product.weight ["г"])
                        (parser.guess-weight title))
        option-amount (if (not product.amount)
                          1
                          (number.string->number product.amount))
        base-price (number.string->number product.price)
        prefix product.prefix
        total (if (= prefix "=") option-amount
                  (= prefix "*") (* base-price option-amount)
                  base-price)]
    {:site "artoftea"
     :title title
     :url product.url
     ;; product-peg in this file defines no `description` capture.
     :description product.description
     :image product.image
     :year year
     :price total
     :weight item-weight
     :volume (parser.guess-volume title)
     :price-per (when (and total item-weight (> item-weight 0))
                  (/ (math.ceil (* (/ total item-weight) 10)) 10))}))
;; Scrape the artoftea.ru catalogue.
;;
;; Hands the category list below, together with format-url, product-peg and
;; normalize, to fetcher.from-html and returns whatever that call returns.
;; Each category is a table with a `:path` (appended to the site URL by
;; format-url) and an optional `:tags` list; "rassypnoi-puer" and
;; "eksklyuzivny-chay" carry no tags.
;; NOTE(review): how the fetcher uses `:tags` and how it paginates is defined in
;; the fetcher module - confirm there.
;;
;; Every path appears exactly once: the original list contained
;; "accesories/tea-toys" twice, which made that category be requested twice.
;; The "accesories" spelling is kept as-is - presumably it is the site's own
;; URL slug; verify before "correcting" it.
(fn products []
  (let [categories
        [;; tea
         {:path "redtea" :tags ["Красный чай"]}
         {:path "greentea" :tags ["Зеленый чай"]}
         {:path "puer/shu-puer" :tags ["Шу пуэр"]}
         {:path "puer/sheng-puer" :tags ["Шен пуэр"]}
         {:path "rassypnoi-puer"}
         {:path "oolong" :tags ["Улун"]}
         {:path "whitetea" :tags ["Белый чай"]}
         {:path "yellowtea" :tags ["Желтый чай"]}
         {:path "xej-cha-chernyj-chaj" :tags ["Хэй ча"]}
         ;; teaware
         {:path "posuda/gaiwans" :tags ["Посуда" "Гайвань"]}
         {:path "posuda/cups" :tags ["Посуда" "Пиала"]}
         {:path "posuda/chahai" :tags ["Посуда" "Чахай"]}
         {:path "posuda/chainiki-steklo-farfor" :tags ["Посуда" "Стекло"]}
         {:path "posuda/chainiki-isinskaya-glina" :tags ["Посуда" "Чайник" "Исин"]}
         {:path "posuda/chayniki-iz-keramiki-farfora" :tags ["Посуда" "Чайник" "Керамика"]}
         {:path "posuda/farfor-iz-tszindechzhen" :tags ["Посуда" "Цзиндэчжэнь"]}
         {:path "posuda/keramika-iz-tszyanshuy" :tags ["Посуда" "Чайник" "Цзяньшуй"]}
         {:path "posuda/keramika-iz-chaochzhou" :tags ["Посуда" "Чайник" "Чаочжоу"]}
         {:path "posuda/posuda-iz-tsinchzhou" :tags ["Посуда" "Чайник" "Гуанси"]}
         {:path "posuda/termosy-zavarochnyye-butylki" :tags ["Посуда" "Термос"]}
         {:path "posuda/sama-kamjove" :tags ["Посуда" "Типот"]}
         {:path "posuda/steklo" :tags ["Посуда" "Стекло"]}
         {:path "posuda/nabory" :tags ["Посуда" "Набор"]}
         {:path "posuda/ekskljuzivnaja-posuda" :tags ["Посуда" "Набор"]}
         ;; accessories
         {:path "accesories/chaban" :tags ["Чабань"]}
         {:path "accesories/instrumenty" :tags ["Инструмент"]}
         {:path "accesories/tea-toys" :tags ["Фигурка"]}
         {:path "accesories/chahe-strainers" :tags ["Сито"]}
         {:path "accesories/miscellaneous" :tags ["Аксессуар"]}
         {:path "accesories/firmenny-stil" :tags ["Мерч"]}
         {:path "accesories/stikery" :tags ["Мерч"]}
         ;; other
         {:path "upakovka" :tags ["Упаковка"]}
         {:path "eksklyuzivny-chay"}
         {:path "taiwan-tea" :tags ["Тайвань"]}]]
    (fetcher.from-html categories format-url product-peg normalize)))
;; Module value: the `products` scraper function together with the shop's
;; title and home page URL.
{:products products
 :title "Art of tea"
 :url "https://artoftea.ru"}
|