[slickpic] add album extractor (#249)

5 years ago · 2184e3a86b
parent c23bf263fe
commit 2184e3a86b
4 changed files with 122 additions and 0 deletions
--- a/docs/supportedsites.rst
+++ b/docs/supportedsites.rst
@@ -94,6 +94,7 @@ Sen Manga            https://raw.senmanga.com/           Chapters
 Sense-Scans          http://sensescans.com/reader/       Chapters, Manga
 Sex.com              https://www.sex.com/                Boards, Pins, Search Results
 Simply Hentai        https://www.simply-hentai.com/      Galleries, individual Images, Videos
+SlickPic             https://www.slickpic.com/           Albums
 SlideShare           https://www.slideshare.net/         Presentations
 SmugMug              https://www.smugmug.com/            |smugmug-C|                                        Optional (OAuth)
 The /b/ Archive      https://thebarchive.com/            Threads
--- a/gallery_dl/extractor/__init__.py
+++ b/gallery_dl/extractor/__init__.py
@@ -85,6 +85,7 @@ modules = [
    "senmanga",
    "sexcom",
    "simplyhentai",
+    "slickpic",
    "slideshare",
    "smugmug",
    "tsumino",
--- a/gallery_dl/extractor/slickpic.py
+++ b/gallery_dl/extractor/slickpic.py
@@ -0,0 +1,119 @@
+# -*- coding: utf-8 -*-
+
+# Copyright 2019 Mike Fährmann
+#
+# This program is free software; you can redistribute it and/or modify
+# it under the terms of the GNU General Public License version 2 as
+# published by the Free Software Foundation.
+
+"""Extractors for https://www.slickpic.com/"""
+
+from .common import Extractor, Message
+from .. import text
+import time
+
+
+# Common URL prefix for all slickpic patterns: an optional http(s) scheme
+# followed by a "<name>.slickpic.com" host. Group 1 captures "<name>".
+BASE_PATTERN = r"(?:https?://)?([^.]+)\.slickpic\.com"
+
+
+class SlickpicExtractor(Extractor):
+    """Base class for slickpic extractors
+
+    Stores the first capture group of the URL match as 'user' and
+    derives the per-user site root from it.
+    """
+    category = "slickpic"
+
+    def __init__(self, match):
+        Extractor.__init__(self, match)
+
+        # group 1 is the subdomain part when the match comes from a
+        # pattern built on BASE_PATTERN
+        user = match.group(1)
+
+        self.user = user
+        self.root = "https://{}.slickpic.com".format(user)
+
+
+class SlickpicAlbumExtractor(SlickpicExtractor):
+    """Extractor for albums on slickpic.com"""
+    subcategory = "album"
+    directory_fmt = ("{category}", "{user[name]}",
+                     "{album[id]} {album[title]}")
+    filename_fmt = "{num:>03}_{id}{title:?_//}.{extension}"
+    archive_fmt = "{id}"
+    pattern = BASE_PATTERN + r"/albums/([^/?&#]+)"
+    test = (
+        ("https://mattcrandall.slickpic.com/albums/LamborghiniMurcielago/", {
+            "url": "58bd94ebc80fd906e9879826970b408d54c6da07",
+            "keyword": "54a9d6f9e42ae43c644aa9316186fb9d9955fe53",
+        }),
+        ("https://mattcrandall.slickpic.com/albums/LamborghiniMurcielago/", {
+            "range": "34",
+            "content": "cec6630e659dc72db1ee1a9a6f3b525189261988",
+        }),
+    )
+
+    def __init__(self, match):
+        SlickpicExtractor.__init__(self, match)
+        # group 2 of 'pattern': the path segment following "/albums/"
+        self.album = match.group(2)
+
+    def items(self):
+        """Yield version, directory and one URL message per album image"""
+        data = self.metadata()
+        imgs = self.images(data)
+
+        # NOTE(review): metadata() already passes the page title through
+        # text.unescape(), so the unescape() calls below are a second pass.
+        # They are kept as-is; confirm whether the site double-escapes
+        # its titles before removing them.
+        data = {
+            "album": {
+                "id"   : text.parse_int(data["aid"]),
+                "title": text.unescape(data["title"]),
+            },
+            "user": {
+                "id"  : text.parse_int(data["uid"]),
+                "name": text.unescape(data["user"]),
+                "nick": self.user
+            },
+            "count": len(imgs),
+        }
+
+        yield Message.Version, 1
+        yield Message.Directory, data
+        for num, img in enumerate(imgs, 1):
+            # download URL: resize base URL + "/o/" + file name
+            url = img["url_rsz"] + "/o/" + img["fname"]
+            img = text.nameext_from_url(img["fname"], {
+                "url"        : url,
+                "num"        : num,
+                "id"         : text.parse_int(img["id"]),
+                "width"      : text.parse_int(img["width"]),
+                "height"     : text.parse_int(img["height"]),
+                "title"      : img["title"],
+                "description": img["descr"],
+            })
+            # attach the shared album/user metadata to every image
+            img.update(data)
+            yield Message.Url, url, img
+
+    def metadata(self):
+        """Collect album metadata and request tokens from the album page
+
+        Returns a dict with the keys "title", "user", "tk", "shd",
+        "aid" and "uid", as consumed by items() and images().
+        """
+        url = "{}/albums/{}/?wallpaper".format(self.root, self.album)
+        extr = text.extract_from(self.request(url).text)
+
+        # The page title is expected to read "<album title> by <user>".
+        # Split on the LAST " by " so album titles containing that text
+        # stay intact.
+        page_title = text.unescape(extr("<title>", "</title>"))
+        title, sep, user = page_title.rpartition(" by ")
+        if not sep:
+            # Without a separator rpartition() returns ("", "", page_title),
+            # which would yield an empty album title and a bogus user
+            # name. Keep the page title as album title and fall back to
+            # the name taken from the URL.
+            title, user = page_title, self.user
+
+        # The extr() calls are kept in their original order
+        # (presumably the extractor scans forward through the page).
+        return {
+            "title": title,
+            "user" : user,
+            "tk"   : extr('tk = "', '"'),
+            "shd"  : extr('shd = "', '"'),
+            "aid"  : extr('data-aid="', '"'),
+            "uid"  : extr('data-uid="', '"'),
+        }
+
+    def images(self, data):
+        """Request the image list of the album
+
+        'data' is the dict produced by metadata(). Returns the "list"
+        entry of the JSON response from the photo-list endpoint.
+        """
+        url = self.root + "/xhr/photo/get/list"
+        payload = {
+            "tm"    : time.time(),
+            "tk"    : data["tk"],
+            "shd"   : data["shd"],
+            "aid"   : data["aid"],
+            "uid"   : data["uid"],
+            "col"   : "0",
+            "sys"   : self.album,
+            "vw"    : "1280",
+            "vh"    : "1024",
+            "skey"  : "",
+            "viewer": "false",
+            "pub"   : "1",
+            "sng"   : "0",
+            "whq"   : "1",
+        }
+        return self.request(url, method="POST", data=payload).json()["list"]
--- a/scripts/supportedsites.py
+++ b/scripts/supportedsites.py
@@ -64,6 +64,7 @@ CATEGORY_MAP = {
    "sensescans"     : "Sense-Scans",
    "sexcom"         : "Sex.com",
    "simplyhentai"   : "Simply Hentai",
+    "slickpic"       : "SlickPic",
    "slideshare"     : "SlideShare",
    "smugmug"        : "SmugMug",
    "thebarchive"    : "The /b/ Archive",