diff options
| author | unwox <me@unwox.com> | 2025-01-29 22:00:44 +0600 |
|---|---|---|
| committer | unwox <me@unwox.com> | 2025-01-29 23:18:00 +0600 |
| commit | 4e4880fd6631f46138fabee5e20ddc22c84ac6bd (patch) | |
| tree | c1d67535e7cf95741b3dc96280b764f9f4ec5bb6 /parser | |
| parent | 5c2dfda03f0ce765b4dacd0c39cc8a0602eea917 (diff) | |
add suhexuan parser
Diffstat (limited to 'parser')
| -rw-r--r-- | parser/parser.fnl | 6 | ||||
| -rw-r--r-- | parser/suhexuan.fnl | 62 |
2 files changed, 66 insertions, 2 deletions
diff --git a/parser/parser.fnl b/parser/parser.fnl index e97351f..b2ff20c 100644 --- a/parser/parser.fnl +++ b/parser/parser.fnl @@ -147,7 +147,8 @@ (if extra-metrics (table.unpack extra-metrics) ""))) - (+ (peg.P " ") "\t" "." "\n" -1))))))] + (maybe ".") + (+ (peg.P " ") "\t" "." "\n" "<" -1))))))] (let [result (peg:match text)] (if result (let [[number metric] result] @@ -162,7 +163,8 @@ (* (peg.C pegs.number) (maybe " ") (+ (* (peg.C (+ (peg.P "мл") "л")) - (+ (peg.P " ") "\t" "." "\n" -1))))))] + (maybe ".") + (+ (peg.P " ") "\t" "." "\n" "<" -1))))))] (let [result (peg:match text)] (if result (let [[number metric] result] diff --git a/parser/suhexuan.fnl b/parser/suhexuan.fnl new file mode 100644 index 0000000..8592294 --- /dev/null +++ b/parser/suhexuan.fnl @@ -0,0 +1,62 @@ +(import-macros {: map} :lib.macro) + +(local parser (require :parser.parser)) +(local array (require :lib.array)) +(local http (require :lib.http)) +(local number (require :lib.number)) +(local fetcher (require :fetcher)) +(local json (require :vendor.json)) + +(fn format-url [path page] + (.. "https://store.tildaapi.com/api/getproductslist/" + "?storepartuid=" path + "&slice=" page + "&recid=644733406" + "&c=1738164538594" + "&getparts=true" + "&getoptions=true" + "&size=36")) + +(fn destruct-response [response] + {:items (. (json.decode response) :products)}) + +(fn normalize [product] + (local gallery (json.decode product.gallery)) + (local weight (parser.guess-weight product.title ["г"])) + (local price (number.string->number product.price)) + + {:site "suhexuan" + :url product.url + :title product.title + :description product.text + ;; FIXME: parse all editions into different products + :image (if (< 0 (# gallery)) + (. gallery 1 :img) + "") + :weight weight + :volume (or (parser.guess-volume product.text) + (parser.guess-volume product.title)) + :price price + :price-per (if (and price weight (< 0 weight)) + (/ (math.ceil (* (/ price weight) 10)) 10) + nil) + :characteristics product.characteristics}) + +(fn products [] + (fetcher.from-json + [{:path "896764703561" :tags ["Посуда"]} + {:path "343222834961" :tags ["Разное"]} + {:path "167733677091&filters[charact:6272182]=Зеленый" :tags ["Зеленый чай"]} + {:path "167733677091&filters[charact:6272182]=Белый" :tags ["Белый чай"]} + {:path "167733677091&filters[charact:6272182]=Желтый" :tags ["Желтый чай"]} + {:path "167733677091&filters[charact:6272182]=Красный" :tags ["Красный чай"]} + {:path "167733677091&filters[charact:6272182]=Черный" :tags ["Хэй ча"]} + {:path "167733677091&filters[charact:6272182]=Шу+пуэр" :tags ["Шу пуэр"]} + {:path "167733677091&filters[charact:6272182]=Шэн+пуэр" :tags ["Шэн пуэр"]} + {:path "167733677091&filters[charact:6272182]=С+ароматами" :tags []} + {:path "167733677091&filters[charact:6272182]=Улун" :tags ["Улун"]}] + format-url + destruct-response + normalize)) + +{:products products :title "СуХэСюань" :url "https://suhexuan.ru"} |
