Fix the HTML cover scraping (lovelybooks changed the HTML again)

This commit is contained in:
Aaron Fischer 2018-07-13 23:31:00 +02:00
parent 641fcb8712
commit 695afe17db

View file

@ -27,13 +27,16 @@
[me.raynes.fs :as fs]))
;; NOTE(review): this span is a diff hunk shown without +/- markers, so two
;; versions of imgurl->bytes appear interleaved below and the text is not a
;; single evaluable form as displayed. Which lines are "old" and which are
;; "new" is inferred from the paren structure -- confirm against the real diff.
;;
;; Purpose (both versions): build a java.net.URL from `lovelybooks-url`, parse
;; the page with html/html-resource, select the first matching cover <img>
;; node, download the image with http-client/get as a byte array and return
;; the :body of that response.
(defn imgurl->bytes [lovelybooks-url]
;; Presumably the removed opening: the URL is threaded straight through `->`.
(-> (java.net.URL. lovelybooks-url)
;; Presumably the added opening: the threaded pipeline now only produces the
;; candidate image URLs, bound to `urls` inside a `let`.
(let [urls (-> (java.net.URL. lovelybooks-url)
html/html-resource
;; Presumably the removed selector (div.bookcoverXXL > div > img).
(html/select [:div.bookcoverXXL :> :div :> :img])
;; Presumably the added selector (div.cover-wrapper > div.cover > img.BookCover).
(html/select [:div.cover-wrapper :> :div.cover :> :img.BookCover])
first
;; Presumably the removed tail: read the `src` attribute, fetch it as a byte
;; array and return the response body.
(get-in [:attrs :src])
(http-client/get {:as :byte-array})
:body))
;; Presumably the added tail: read the `srcset` attribute and split it on
;; single spaces into tokens.
(get-in [:attrs :srcset])
(str/split #" "))
;; Keep only tokens that match http....jpg in full (re-matches must match the
;; whole string) and take the last such token as the image to download.
;; NOTE(review): if no token matches, url-to-fetch is nil -- confirm how
;; http-client/get behaves in that case.
url-to-fetch (last (filter #(re-matches #"http.+\.jpg" %) urls))
stream (http-client/get url-to-fetch {:as :byte-array})]
(:body stream)))
(defn encode-url-part
  "Encodes the string `part` with java.net.URLEncoder using the UTF-8 charset.
  URLEncoder applies application/x-www-form-urlencoded rules, so a space
  becomes `+` and reserved or non-ASCII characters become %XX escapes."
  [part]
  ;; Explicit `.` interop form of the static call URLEncoder/encode.
  (. java.net.URLEncoder (encode part "UTF-8")))