[wallpapercave] add extractor for images (#2205)

3 years ago · b17e2dcf93
parent c661737f36
commit b17e2dcf93
4 changed files with 41 additions and 0 deletions
--- a/docs/supportedsites.md
+++ b/docs/supportedsites.md
@@ -787,6 +787,12 @@ Consider all sites to be NSFW unless otherwise known.
    <td>Collections, individual Images, Search Results</td>
    <td><a href="configuration.rst#extractorwallhavenapi-key">API Key</a></td>
 </tr>
+<tr>
+    <td>Wallpaper Cave</td>
+    <td>https://wallpapercave.com/</td>
+    <td>individual Images, Search Results</td>
+    <td></td>
+</tr>
 <tr>
    <td>Warosu</td>
    <td>https://warosu.org/</td>
--- a/gallery_dl/extractor/__init__.py
+++ b/gallery_dl/extractor/__init__.py
@@ -132,6 +132,7 @@ modules = [
    "vk",
    "vsco",
    "wallhaven",
+    "wallpapercave",
    "warosu",
    "weasyl",
    "webtoons",
--- a/gallery_dl/extractor/wallpapercave.py
+++ b/gallery_dl/extractor/wallpapercave.py
@@ -0,0 +1,30 @@
+# -*- coding: utf-8 -*-
+
+# Copyright 2021 David Hoppenbrouwers
+#
+# This program is free software; you can redistribute it and/or modify
+# it under the terms of the GNU General Public License version 2 as
+# published by the Free Software Foundation.
+
+"""Extractors for https://wallpapercave.com/"""
+
+from .common import Extractor, Message
+from .. import text
+
+
+class WallpapercaveImageExtractor(Extractor):
+    """Extractor for images on wallpapercave.com"""
+    category = "wallpapercave"
+    subcategory = "image"
+    root = "https://wallpapercave.com"
+    pattern = r"(?:https?://)?(?:www\.)?wallpapercave\.com"
+    test = ("https://wallpapercave.com/w/wp10270355", {
+        "content": "58b088aaa1cf1a60e347015019eb0c5a22b263a6",
+    })
+
+    def items(self):
+        page = self.request(text.ensure_http_scheme(self.url)).text
+        for path in text.extract_iter(page, 'class="download" href="', '"'):
+            image = text.nameext_from_url(path)
+            yield Message.Directory, image
+            yield Message.Url, self.root + path, image
--- a/scripts/supportedsites.py
+++ b/scripts/supportedsites.py
@@ -111,6 +111,7 @@ CATEGORY_MAP = {
    "vk"             : "VK",
    "vsco"           : "VSCO",
    "wakarimasen"    : "Wakarimasen Archive",
+    "wallpapercave"  : "Wallpaper Cave",
    "webtoons"       : "Webtoon",
    "wikiart"        : "WikiArt.org",
    "xhamster"       : "xHamster",
@@ -203,6 +204,9 @@ SUBCATEGORY_MAP = {
    "wallhaven": {
        "collections": "",
    },
+    "wallpapercave": {
+        "image": "individual Images, Search Results",
+    },
    "weasyl": {
        "journals"   : "",
        "submissions": "",