gallery-dl/gallery_dl/extractor/pixiv.py

# -*- coding: utf-8 -*-

# Copyright 2014-2023 Mike Fährmann
#
# This program is free software; you can redistribute it and/or modify
# it under the terms of the GNU General Public License version 2 as
# published by the Free Software Foundation.

"""Extractors for https://www.pixiv.net/"""

from .common import Extractor, Message
from .. import text, util, exception
from ..cache import cache, memcache
from datetime import datetime, timedelta
import itertools
import hashlib


class PixivExtractor(Extractor):
    """Base class for pixiv extractors

    Subclasses supply the posts to process by overriding works() and may
    contribute job-wide metadata by overriding metadata(). items() then
    converts every work into one Directory message followed by one Url
    message per downloadable file.
    """
    category = "pixiv"
    root = "https://www.pixiv.net"
    directory_fmt = ("{category}", "{user[id]} {user[account]}")
    filename_fmt = "{id}_p{num}.{extension}"
    archive_fmt = "{id}{suffix}.{extension}"
    cookiedomain = None

    def __init__(self, match):
        """Set up the API client and read the 'ugoira'/'max-posts' options"""
        Extractor.__init__(self, match)
        self.api = PixivAppAPI(self)
        self.load_ugoira = self.config("ugoira", True)
        self.max_posts = self.config("max-posts", 0)

    def items(self):
        """Yield Directory and Url messages for every work from works()"""
        # The 'tags' option selects how the list of tag objects is
        # flattened; "original" leaves the API objects untouched.
        tags = self.config("tags", "japanese")
        if tags == "original":
            transform_tags = None
        elif tags == "translated":
            def transform_tags(work):
                # dict.fromkeys() removes duplicates while keeping order
                work["tags"] = list(dict.fromkeys(
                    tag["translated_name"] or tag["name"]
                    for tag in work["tags"]))
        else:
            def transform_tags(work):
                work["tags"] = [tag["name"] for tag in work["tags"]]

        ratings = {0: "General", 1: "R-18", 2: "R-18G"}
        meta_user = self.config("metadata")
        meta_bookmark = self.config("metadata-bookmark")
        metadata = self.metadata()

        works = self.works()
        if self.max_posts:
            works = itertools.islice(works, self.max_posts)
        for work in works:
            # skip works without a usable user ID
            if not work["user"]["id"]:
                continue

            # keep the URL containers for later, but remove them
            # from the metadata dict that gets passed on
            meta_single_page = work["meta_single_page"]
            meta_pages = work["meta_pages"]
            del work["meta_single_page"]
            del work["image_urls"]
            del work["meta_pages"]

            if meta_user:
                work.update(self.api.user_detail(work["user"]["id"]))
            if meta_bookmark and work["is_bookmarked"]:
                detail = self.api.illust_bookmark_detail(work["id"])
                work["tags_bookmark"] = [tag["name"] for tag in detail["tags"]
                                         if tag["is_registered"]]
            if transform_tags:
                transform_tags(work)
            work["num"] = 0
            work["date"] = text.parse_datetime(work["create_date"])
            work["rating"] = ratings.get(work["x_restrict"])
            work["suffix"] = ""
            work.update(metadata)

            yield Message.Directory, work

            if work["type"] == "ugoira":
                if not self.load_ugoira:
                    continue

                try:
                    ugoira = self.api.ugoira_metadata(work["id"])
                except exception.StopExtraction as exc:
                    self.log.warning(
                        "Unable to retrieve Ugoira metatdata (%s - %s)",
                        work.get("id"), exc.message)
                    continue

                # request the 1920x1080 archive instead of the 600x600 one
                url = ugoira["zip_urls"]["medium"].replace(
                    "_ugoira600x600", "_ugoira1920x1080")
                work["frames"] = ugoira["frames"]
                work["date_url"] = self._date_from_url(url)
                work["_http_adjust_extension"] = False
                yield Message.Url, url, text.nameext_from_url(url, work)

            elif work["page_count"] == 1:
                url = meta_single_page["original_image_url"]
                work["date_url"] = self._date_from_url(url)
                yield Message.Url, url, text.nameext_from_url(url, work)

            else:
                # 'num' is updated in place for every page of the work
                for work["num"], img in enumerate(meta_pages):
                    url = img["image_urls"]["original"]
                    work["date_url"] = self._date_from_url(url)
                    work["suffix"] = "_p{:02}".format(work["num"])
                    yield Message.Url, url, text.nameext_from_url(url, work)

    @staticmethod
    def _date_from_url(url, offset=timedelta(hours=9)):
        """Return the timestamp embedded in 'url' minus 'offset'

        The URL must consist of exactly 12 '/'-separated components with
        year, month, day, hour, minute, and second at indices 5 to 10.
        Returns None when the URL does not have this form.
        """
        try:
            _, _, _, _, _, y, m, d, H, M, S, _ = url.split("/")
            return datetime(
                int(y), int(m), int(d), int(H), int(M), int(S)) - offset
        except Exception:
            # deliberate best-effort: any malformed URL yields None
            return None

    @staticmethod
    def _make_work(kind, url, user):
        """Build a minimal single-page 'work' object for a plain image URL

        'kind' is used as ID, title, and type of the returned work.
        'create_date' is assembled from URL components 5 to 10 or set to
        None when the URL has too few components.
        """
        p = url.split("/")
        # p[10] is the highest index used, so 11 components are needed
        if len(p) > 10:
            create_date = "{}-{}-{}T{}:{}:{}+09:00".format(
                p[5], p[6], p[7], p[8], p[9], p[10])
        else:
            create_date = None

        return {
            "create_date"     : create_date,
            "height"          : 0,
            "id"              : kind,
            "image_urls"      : None,
            "meta_pages"      : (),
            "meta_single_page": {"original_image_url": url},
            "page_count"      : 1,
            "sanity_level"    : 0,
            "tags"            : (),
            "title"           : kind,
            "type"            : kind,
            "user"            : user,
            "width"           : 0,
            "x_restrict"      : 0,
        }

    def works(self):
        """Return an iterable containing all relevant 'work' objects"""

    def metadata(self):
        """Collect metadata for extractor job"""
        return {}


class PixivUserExtractor(PixivExtractor):
    """Extractor for a pixiv user profile

    Does not download anything itself; it hands the profile's sub-pages
    over to the specialized extractors.
    """
    subcategory = "user"
    pattern = (r"(?:https?://)?(?:www\.|touch\.)?pixiv\.net/(?:"
               r"(?:en/)?u(?:sers)?/|member\.php\?id=|(?:mypage\.php)?#id="
               r")(\d+)(?:$|[?#])")
    test = (
        "https://www.pixiv.net/en/users/173530",
        "https://www.pixiv.net/u/173530",
        "https://www.pixiv.net/member.php?id=173530",
        "https://www.pixiv.net/mypage.php#id=173530",
        "https://www.pixiv.net/#id=173530",
    )

    def __init__(self, match):
        super().__init__(match)
        self.user_id = match.group(1)

    def items(self):
        """Dispatch to the per-section extractors of this user"""
        prefix = "{}/users/{}/".format(self.root, self.user_id)
        extractors = (
            (PixivAvatarExtractor    , prefix + "avatar"),
            (PixivBackgroundExtractor, prefix + "background"),
            (PixivArtworksExtractor  , prefix + "artworks"),
            (PixivFavoriteExtractor  , prefix + "bookmarks/artworks"),
            (PixivNovelUserExtractor , prefix + "novels"),
        )
        default = ("artworks",)
        return self._dispatch_extractors(extractors, default)


class PixivArtworksExtractor(PixivExtractor):
    """Extractor for artworks of a pixiv user, optionally filtered by tag"""
    subcategory = "artworks"
    pattern = (r"(?:https?://)?(?:www\.|touch\.)?pixiv\.net/(?:"
               r"(?:en/)?users/(\d+)/(?:artworks|illustrations|manga)"
               r"(?:/([^/?#]+))?/?(?:$|[?#])"
               r"|member_illust\.php\?id=(\d+)(?:&([^#]+))?)")
    test = (
        ("https://www.pixiv.net/en/users/173530/artworks", {
            "url": "852c31ad83b6840bacbce824d85f2a997889efb7",
        }),
        # illusts with specific tag
        (("https://www.pixiv.net/en/users/173530/artworks"
          "/%E6%89%8B%E3%81%B6%E3%82%8D"), {
            "url": "25b1cd81153a8ff82eec440dd9f20a4a22079658",
        }),
        (("https://www.pixiv.net/member_illust.php?id=173530"
          "&tag=%E6%89%8B%E3%81%B6%E3%82%8D"), {
            "url": "25b1cd81153a8ff82eec440dd9f20a4a22079658",
        }),
        # deleted account
        ("http://www.pixiv.net/member_illust.php?id=173531", {
            "options": (("metadata", True),),
            "exception": exception.NotFoundError,
        }),
        "https://www.pixiv.net/en/users/173530/manga",
        "https://www.pixiv.net/en/users/173530/illustrations",
        "https://www.pixiv.net/member_illust.php?id=173530",
        "https://touch.pixiv.net/member_illust.php?id=173530",
    )

    def __init__(self, match):
        super().__init__(match)
        # groups 1/2 belong to the '/users/...' form of the URL,
        # groups 3/4 to the legacy 'member_illust.php' form
        path_user, path_tag, legacy_user, legacy_query = match.groups()

        if path_tag:
            path_tag = text.unquote(path_tag)
        elif legacy_query:
            legacy_query = text.parse_query(legacy_query).get("tag")

        self.user_id = path_user or legacy_user
        self.tag = path_tag or legacy_query

    def metadata(self):
        """Request the user's details when 'metadata' is enabled"""
        if self.config("metadata"):
            # the result is discarded; only the request itself matters here
            self.api.user_detail(self.user_id)
        return {}

    def works(self):
        """Return the user's illusts, restricted to self.tag if it is set"""
        illusts = self.api.user_illusts(self.user_id)
        if not self.tag:
            return illusts

        wanted = self.tag.lower()
        return (
            illust for illust in illusts
            if wanted in [entry["name"].lower() for entry in illust["tags"]]
        )


class PixivAvatarExtractor(PixivExtractor):
    """Extractor for the avatar image of a pixiv user"""
    subcategory = "avatar"
    filename_fmt = "avatar{date:?_//%Y-%m-%d}.{extension}"
    archive_fmt = "avatar_{user[id]}_{date}"
    pattern = (r"(?:https?://)?(?:www\.)?pixiv\.net"
               r"/(?:en/)?users/(\d+)/avatar")
    test = ("https://www.pixiv.net/en/users/173530/avatar", {
        "content": "4e57544480cc2036ea9608103e8f024fa737fe66",
    })

    def __init__(self, match):
        super().__init__(match)
        self.user_id = match.group(1)

    def works(self):
        """Return a single synthetic work pointing at the avatar image"""
        user = self.api.user_detail(self.user_id)["user"]
        medium = user["profile_image_urls"]["medium"]
        # drop the '_170' marker from the medium-sized image URL
        avatar = self._make_work("avatar", medium.replace("_170.", "."), user)
        return (avatar,)


class PixivBackgroundExtractor(PixivExtractor):
    """Extractor for the background banner of a pixiv user"""
    subcategory = "background"
    filename_fmt = "background{date:?_//%Y-%m-%d}.{extension}"
    archive_fmt = "background_{user[id]}_{date}"
    pattern = (r"(?:https?://)?(?:www\.)?pixiv\.net"
               r"/(?:en/)?users/(\d+)/background")
    test = ("https://www.pixiv.net/en/users/194921/background", {
        "pattern": r"https://i\.pximg\.net/background/img/2021/01/30/16/12/02"
                   r"/194921_af1f71e557a42f499213d4b9eaccc0f8\.jpg",
    })

    def __init__(self, match):
        super().__init__(match)
        self.user_id = match.group(1)

    def works(self):
        """Return a synthetic work for the banner, or () if there is none"""
        detail = self.api.user_detail(self.user_id)
        banner = detail["profile"]["background_image_url"]
        if not banner:
            return ()

        if "/c/" in banner:
            # remove the two path components at index 3 and 4
            segments = banner.split("/")
            banner = "/".join(segments[:3] + segments[5:])
        banner = banner.replace("_master1200.", ".")

        work = self._make_work("background", banner, detail["user"])
        if banner.endswith(".jpg"):
            # alternative extensions to try for the same file name
            stem = banner[:-4]
            work["_fallback"] = (stem + ".png", stem + ".gif")
        return (work,)


class PixivMeExtractor(PixivExtractor):
    """Extractor for pixiv.me short URLs"""
    subcategory = "me"
    pattern = r"(?:https?://)?pixiv\.me/([^/?#]+)"
    test = (
        ("https://pixiv.me/del_shannon", {
            "url": "29c295ce75150177e6b0a09089a949804c708fbf",
        }),
        ("https://pixiv.me/del_shanno", {
            "exception": exception.NotFoundError,
        }),
    )

    def __init__(self, match):
        super().__init__(match)
        self.account = match.group(1)

    def items(self):
        """Queue the URL found in the 'Location' header of the short link"""
        # HEAD request without following redirects: only the
        # redirect target from the response headers is needed
        response = self.request(
            "https://pixiv.me/" + self.account,
            method="HEAD", allow_redirects=False, notfound="user")
        target = response.headers["Location"]
        yield Message.Queue, target, {"_extractor": PixivUserExtractor}


class PixivWorkExtractor(PixivExtractor):
    """Extractor for a single pixiv work/illustration"""
    subcategory = "work"
    pattern = (r"(?:https?://)?(?:(?:www\.|touch\.)?pixiv\.net"
               r"/(?:(?:en/)?artworks/"
               r"|member_illust\.php\?(?:[^&]+&)*illust_id=)(\d+)"
               r"|(?:i(?:\d+\.pixiv|\.pximg)\.net"
               r"/(?:(?:.*/)?img-[^/]+/img/\d{4}(?:/\d\d){5}|img\d+/img/[^/]+)"
               r"|img\d*\.pixiv\.net/img/[^/]+|(?:www\.)?pixiv\.net/i)/(\d+))")
    test = (
        ("https://www.pixiv.net/artworks/966412", {
            "url": "90c1715b07b0d1aad300bce256a0bc71f42540ba",
            "content": "69a8edfb717400d1c2e146ab2b30d2c235440c5a",
            "keyword": {
                "date"    : "dt:2008-06-12 15:29:13",
                "date_url": "dt:2008-06-12 15:29:13",
            },
        }),
        (("http://www.pixiv.net/member_illust.php"
          "?mode=medium&illust_id=966411"), {
            "exception": exception.NotFoundError,
        }),
        # ugoira
        (("https://www.pixiv.net/member_illust.php"
          "?mode=medium&illust_id=66806629"), {
            "url": "7267695a985c4db8759bebcf8d21dbdd2d2317ef",
            "keyword": {
                "frames"  : list,
                "date"    : "dt:2018-01-14 15:06:08",
                "date_url": "dt:2018-01-15 04:24:48",
            },
        }),
        # related works (#1237)
        ("https://www.pixiv.net/artworks/966412", {
            "options": (("related", True),),
            "range": "1-10",
            "count": ">= 10",
        }),
        "https://www.pixiv.net/en/artworks/966412",
        "http://www.pixiv.net/member_illust.php?mode=medium&illust_id=96641",
        ("http://i1.pixiv.net/c/600x600/img-master"
         "/img/2008/06/13/00/29/13/966412_p0_master1200.jpg"),
        ("https://i.pximg.net/img-original"
         "/img/2017/04/25/07/33/29/62568267_p0.png"),
        "https://www.pixiv.net/i/966412",
        "http://img.pixiv.net/img/soundcross/42626136.jpg",
        "http://i2.pixiv.net/img76/img/snailrin/42672235.jpg",
    )

    def __init__(self, match):
        super().__init__(match)
        # group 1: ID from a page URL, group 2: ID from an image URL
        self.illust_id = match.group(1) or match.group(2)

    def works(self):
        """Return the work itself, plus related works if 'related' is set"""
        detail = self.api.illust_detail(self.illust_id)
        if not self.config("related", False):
            return (detail,)
        return itertools.chain(
            (detail,), self.api.illust_related(self.illust_id))


class PixivFavoriteExtractor(PixivExtractor):
    """Extractor for all favorites/bookmarks of a pixiv-user

    Also handles lists of followed users, in which case items() is
    replaced by _items_following().
    """
    subcategory = "favorite"
    directory_fmt = ("{category}", "bookmarks",
                     "{user_bookmark[id]} {user_bookmark[account]}")
    archive_fmt = "f_{user_bookmark[id]}_{id}{num}.{extension}"
    pattern = (r"(?:https?://)?(?:www\.|touch\.)?pixiv\.net/(?:(?:en/)?"
               r"users/(\d+)/(bookmarks/artworks|following)(?:/([^/?#]+))?"
               r"|bookmark\.php)(?:\?([^#]*))?")
    test = (
        ("https://www.pixiv.net/en/users/173530/bookmarks/artworks", {
            "url": "85a3104eaaaf003c7b3947117ca2f1f0b1cfc949",
        }),
        ("https://www.pixiv.net/bookmark.php?id=173530", {
            "url": "85a3104eaaaf003c7b3947117ca2f1f0b1cfc949",
        }),
        # bookmarks with specific tag
        (("https://www.pixiv.net/en/users/3137110"
          "/bookmarks/artworks/%E3%81%AF%E3%82%93%E3%82%82%E3%82%93"), {
            "url": "379b28275f786d946e01f721e54afe346c148a8c",
        }),
        # bookmarks with specific tag (legacy url)
        (("https://www.pixiv.net/bookmark.php?id=3137110"
          "&tag=%E3%81%AF%E3%82%93%E3%82%82%E3%82%93&p=1"), {
            "url": "379b28275f786d946e01f721e54afe346c148a8c",
        }),
        # own bookmarks
        ("https://www.pixiv.net/bookmark.php", {
            "url": "90c1715b07b0d1aad300bce256a0bc71f42540ba",
            "keyword": {"tags_bookmark": ["47", "hitman"]},
            "options": (("metadata-bookmark", True),),
        }),
        # own bookmarks with tag (#596)
        ("https://www.pixiv.net/bookmark.php?tag=foobar", {
            "count": 0,
        }),
        # followed users (#515)
        ("https://www.pixiv.net/en/users/173530/following", {
            "pattern": PixivUserExtractor.pattern,
            "count": ">= 12",
        }),
        # followed users (legacy url) (#515)
        ("https://www.pixiv.net/bookmark.php?id=173530&type=user", {
            "pattern": PixivUserExtractor.pattern,
            "count": ">= 12",
        }),
        # touch URLs
        "https://touch.pixiv.net/bookmark.php?id=173530",
        "https://touch.pixiv.net/bookmark.php",
    )

    def __init__(self, match):
        user_id, kind, self.tag, querystr = match.groups()
        params = text.parse_query(querystr)

        # legacy URLs carry the user ID as 'id' query parameter;
        # without any ID the subcategory becomes 'bookmark'
        user_id = user_id or params.get("id")
        if not user_id:
            self.subcategory = "bookmark"

        if kind == "following" or params.get("type") == "user":
            self.subcategory = "following"
            self.items = self._items_following

        # base initialization happens only after 'subcategory'
        # has received its final value
        PixivExtractor.__init__(self, match)
        self.query = params
        self.user_id = user_id

    def works(self):
        """Return the bookmarked illusts for the selected tag/visibility"""
        params = self.query

        # a 'tag' query parameter takes precedence over a tag in the path
        if "tag" in params:
            tag = text.unquote(params["tag"])
        else:
            tag = text.unquote(self.tag) if self.tag else None

        restrict = "private" if params.get("rest") == "hide" else "public"
        return self.api.user_bookmarks_illust(self.user_id, tag, restrict)

    def metadata(self):
        """Resolve the bookmark owner and expose it as 'user_bookmark'"""
        api = self.api
        if self.user_id:
            owner = api.user_detail(self.user_id)["user"]
        else:
            # no explicit user ID: use the logged-in account
            api.login()
            owner = api.user

        self.user_id = owner["id"]
        return {"user_bookmark": owner}

    def _items_following(self):
        """Yield a Queue message for every user followed by self.user_id"""
        restrict = "private" if self.query.get("rest") == "hide" else "public"

        for preview in self.api.user_following(self.user_id, restrict):
            followed = preview["user"]
            followed["_extractor"] = PixivUserExtractor
            profile = "https://www.pixiv.net/users/{}".format(followed["id"])
            yield Message.Queue, profile, followed


class PixivRankingExtractor(PixivExtractor):
    """Extractor for pixiv ranking pages"""
    subcategory = "ranking"
    archive_fmt = "r_{ranking[mode]}_{ranking[date]}_{id}{num}.{extension}"
    directory_fmt = ("{category}", "rankings",
                     "{ranking[mode]}", "{ranking[date]}")
    pattern = (r"(?:https?://)?(?:www\.|touch\.)?pixiv\.net"
               r"/ranking\.php(?:\?([^#]*))?")
    test = (
        "https://www.pixiv.net/ranking.php?mode=daily&date=20170818",
        "https://www.pixiv.net/ranking.php",
        "https://touch.pixiv.net/ranking.php",
        ("https://www.pixiv.net/ranking.php?mode=unknown", {
            "exception": exception.StopExtraction,
        }),
    )

    def __init__(self, match):
        super().__init__(match)
        self.query = match.group(1)
        # both are filled in by metadata()
        self.mode = self.date = None

    def works(self):
        """Return the ranked illusts for the mode/date set by metadata()"""
        return self.api.illust_ranking(self.mode, self.date)

    def metadata(self):
        """Derive ranking mode and date from the URL's query string

        Raises StopExtraction for an unknown 'mode' value. A missing or
        malformed 'date' falls back to the previous day (UTC).
        """
        params = text.parse_query(self.query)

        # website mode names -> names passed to the API
        api_modes = {
            "daily": "day",
            "daily_r18": "day_r18",
            "daily_ai": "day_ai",
            "daily_r18_ai": "day_r18_ai",
            "weekly": "week",
            "weekly_r18": "week_r18",
            "monthly": "month",
            "male": "day_male",
            "male_r18": "day_male_r18",
            "female": "day_female",
            "female_r18": "day_female_r18",
            "original": "week_original",
            "rookie": "week_rookie",
            "r18g": "week_r18g",
        }
        requested = params.get("mode", "daily").lower()
        try:
            mode = api_modes[requested]
        except KeyError:
            raise exception.StopExtraction("Invalid mode '%s'", requested)
        self.mode = mode

        date = params.get("date")
        if date:
            if len(date) == 8 and date.isdecimal():
                # YYYYMMDD -> YYYY-MM-DD
                date = "-".join((date[:4], date[4:6], date[6:]))
            else:
                self.log.warning("invalid date '%s'", date)
                date = None
        if not date:
            yesterday = datetime.utcnow() - timedelta(days=1)
            date = yesterday.strftime("%Y-%m-%d")
        self.date = date

        return {"ranking": {
            "mode": mode,
            "date": date,
        }}


class PixivSearchExtractor(PixivExtractor):
    """Extractor for pixiv search results"""
    subcategory = "search"
    archive_fmt = "s_{search[word]}_{id}{num}.{extension}"
    directory_fmt = ("{category}", "search", "{search[word]}")
    pattern = (r"(?:https?://)?(?:www\.|touch\.)?pixiv\.net"
               r"/(?:(?:en/)?tags/([^/?#]+)(?:/[^/?#]+)?/?"
               r"|search\.php)(?:\?([^#]+))?")
    test = (
        ("https://www.pixiv.net/en/tags/Original", {
            "range": "1-10",
            "count": 10,
        }),
        ("https://pixiv.net/en/tags/foo/artworks?order=week&s_mode=s_tag", {
            "exception": exception.StopExtraction,
        }),
        ("https://pixiv.net/en/tags/foo/artworks?order=date&s_mode=tag", {
            "exception": exception.StopExtraction,
        }),
        ("https://www.pixiv.net/search.php?s_mode=s_tag&name=Original", {
            "exception": exception.StopExtraction,
        }),
        "https://www.pixiv.net/en/tags/foo/artworks?order=date&s_mode=s_tag",
        "https://www.pixiv.net/search.php?s_mode=s_tag&word=Original",
        "https://touch.pixiv.net/search.php?word=Original",
    )

    def __init__(self, match):
        super().__init__(match)
        self.word, self.query = match.groups()
        # both are filled in by metadata()
        self.sort = self.target = None

    def works(self):
        """Return search results for the parameters set by metadata()"""
        return self.api.search_illust(
            self.word, self.sort, self.target,
            date_start=self.date_start, date_end=self.date_end)

    def metadata(self):
        """Parse search term, order, mode, and date range from the URL

        Raises StopExtraction when the search term is missing or when
        'order' / 's_mode' have an unsupported value.
        """
        params = text.parse_query(self.query)

        if self.word:
            self.word = text.unquote(self.word)
        else:
            # 'search.php' URLs carry the term as query parameter
            try:
                self.word = params["word"]
            except KeyError:
                raise exception.StopExtraction("Missing search term")

        # website 'order' values -> sort names passed to the API
        sort_names = {
            "date": "date_asc",
            "date_d": "date_desc",
            "popular_d": "popular_desc",
            "popular_male_d": "popular_male_desc",
            "popular_female_d": "popular_female_desc",
        }
        order = params.get("order", "date_d")
        try:
            self.sort = sort_names[order]
        except KeyError:
            raise exception.StopExtraction("Invalid search order '%s'", order)

        # website 's_mode' values -> search targets passed to the API
        target_names = {
            "s_tag": "partial_match_for_tags",
            "s_tag_full": "exact_match_for_tags",
            "s_tc": "title_and_caption",
        }
        s_mode = params.get("s_mode", "s_tag_full")
        try:
            self.target = target_names[s_mode]
        except KeyError:
            raise exception.StopExtraction("Invalid search mode '%s'", s_mode)

        self.date_start = params.get("scd")
        self.date_end = params.get("ecd")

        search = {
            "word": self.word,
            "sort": self.sort,
            "target": self.target,
            "date_start": self.date_start,
            "date_end": self.date_end,
        }
        return {"search": search}


class PixivFollowExtractor(PixivExtractor):
    """Extractor for new illustrations from your followed artists"""
    subcategory = "follow"
    archive_fmt = "F_{user_follow[id]}_{id}{num}.{extension}"
    directory_fmt = ("{category}", "following")
    pattern = (r"(?:https?://)?(?:www\.|touch\.)?pixiv\.net"
               r"/bookmark_new_illust\.php")
    test = (
        "https://www.pixiv.net/bookmark_new_illust.php",
        "https://touch.pixiv.net/bookmark_new_illust.php",
    )

    def works(self):
        """Return the illusts provided by the API's follow feed"""
        return self.api.illust_follow()

    def metadata(self):
        """Log in and expose the API's user object as 'user_follow'"""
        api = self.api
        api.login()
        return {"user_follow": api.user}


class PixivPixivisionExtractor(PixivExtractor):
    """Extractor for illustrations from a pixivision article"""
    subcategory = "pixivision"
    directory_fmt = ("{category}", "pixivision",
                     "{pixivision_id} {pixivision_title}")
    archive_fmt = "V{pixivision_id}_{id}{suffix}.{extension}"
    pattern = r"(?:https?://)?(?:www\.)?pixivision\.net/(?:en/)?a/(\d+)"
    test = (
        "https://www.pixivision.net/en/a/2791",
        ("https://pixivision.net/a/2791", {
            "count": 7,
            "keyword": {
                "pixivision_id": "2791",
                "pixivision_title": "What's your favorite music? Editor’s "
                                    "picks featuring: “CD Covers”!",
            },
        }),
    )

    def __init__(self, match):
        super().__init__(match)
        self.pixivision_id = match.group(1)

    def works(self):
        """Return details for every artwork linked from the article page

        Relies on self.page, which is stored by metadata().
        """
        links = text.extract_iter(
            self.page, '<a href="https://www.pixiv.net/en/artworks/', '"')
        unique_links = util.unique_sequence(links)
        return (
            # cut off anything after a '?' in the extracted link
            self.api.illust_detail(link.partition("?")[0])
            for link in unique_links
        )

    def metadata(self):
        """Download the article page and return its ID and title"""
        article_url = "https://www.pixivision.net/en/a/" + self.pixivision_id
        response = self.request(
            article_url, headers={"User-Agent": "Mozilla/5.0"})
        self.page = response.text

        raw_title = text.extr(self.page, '<title>', '<')
        return {
            "pixivision_id"   : self.pixivision_id,
            "pixivision_title": text.unescape(raw_title),
        }


class PixivSeriesExtractor(PixivExtractor):
    """Extractor for illustrations from a Pixiv series"""
    subcategory = "series"
    directory_fmt = ("{category}", "{user[id]} {user[account]}",
                     "{series[id]} {series[title]}")
    filename_fmt = "{num_series:>03}_{id}_p{num}.{extension}"
    pattern = (r"(?:https?://)?(?:www\.)?pixiv\.net"
               r"/user/(\d+)/series/(\d+)")
    test = ("https://www.pixiv.net/user/10509347/series/21859", {
        "range": "1-10",
        "count": 10,
        "keyword": {
            "num_series": int,
            "series": {
                "canonical": "https://www.pixiv.net/user/10509347"
                             "/series/21859",
                "description": str,
                "ogp": dict,
                "title": "先輩がうざい後輩の話",
                "total": int,
                "twitter": dict,
            },
        },
    })

    def __init__(self, match):
        super().__init__(match)
        self.user_id, self.series_id = match.groups()

    def works(self):
        """Yield the works of a series, one result page at a time

        Every yielded work gets 'num_series' (its order within the
        series) and 'series' (metadata taken from the current page).
        """
        endpoint = self.root + "/ajax/series/" + self.series_id
        referer = "{}/user/{}/series/{}".format(
            self.root, self.user_id, self.series_id)
        headers = {
            "Accept": "application/json",
            "Referer": referer,
            "Alt-Used": "www.pixiv.net",
        }
        params = {"p": 1}

        while True:
            response = self.request(endpoint, params=params, headers=headers)
            body = response.json()["body"]
            page = body["page"]

            series = body["extraData"]["meta"]
            series["id"] = self.series_id
            series["total"] = page["total"]
            # keep only the part of the title between double quotes
            series["title"] = text.extr(series["title"], '"', '"')

            entries = page["series"]
            for entry in entries:
                work = self.api.illust_detail(entry["workId"])
                work["num_series"] = entry["order"]
                work["series"] = series
                yield work

            # fewer than 10 entries on a page ends the pagination
            if len(entries) < 10:
                return
            params["p"] += 1


class PixivNovelExtractor(PixivExtractor):
    """Extractor for pixiv novels

    Subclasses select the novels to process by overriding novels().
    """
    subcategory = "novel"
    request_interval = 1.0
    pattern = (r"(?:https?://)?(?:www\.|touch\.)?pixiv\.net"
               r"/n(?:ovel/show\.php\?id=|/)(\d+)")
    test = (
        ("https://www.pixiv.net/novel/show.php?id=19612040", {
            "count": 1,
            "content": "c6f22167f9df7aeaf63b51933b4c8ef6fc5e6a1e",
            "keyword": {
                "caption": r"re:「無能な名無し」と呼ばれ虐げられて育った鈴\(すず\)は、",
                "comment_access_control": 0,
                "create_date": "2023-04-02T15:18:58+09:00",
                "date": "dt:2023-04-02 06:18:58",
                "id": 19612040,
                "is_bookmarked": False,
                "is_muted": False,
                "is_mypixiv_only": False,
                "is_original": True,
                "is_x_restricted": False,
                "novel_ai_type": 1,
                "page_count": 1,
                "rating": "General",
                "restrict": 0,
                "series": {
                    "id": 10278364,
                    "title": "龍の贄嫁〜虐げられた少女は運命の番として愛される〜"
                },
                "tags": ["和風ファンタジー", "溺愛", "神様", "ヤンデレ", "執着",
                         "異能", "ざまぁ", "学園", "神嫁"],
                "text_length": 5977,
                "title": "異母妹から「無能な名無し」と虐げられていた私、"
                         "どうやら異母妹に霊力を搾取されていたようです（１）",
                "user": {
                    "account": "yukinaga_chifuyu",
                    "id": 77055466,
                },
                "visible": True,
                "x_restrict": 0,
            },
        }),
        "https://www.pixiv.net/n/19612040",
    )

    def __init__(self, match):
        super().__init__(match)
        self.novel_id = match.group(1)

    def items(self):
        """Yield a Directory and a 'text:' Url message for every novel"""
        # pick the tag conversion according to the 'tags' option;
        # "original" keeps the tag objects as they are
        tag_mode = self.config("tags", "japanese")
        if tag_mode == "original":
            convert_tags = None
        elif tag_mode == "translated":
            def convert_tags(entry):
                names = (
                    tag["translated_name"] or tag["name"]
                    for tag in entry["tags"])
                # dict.fromkeys() removes duplicates while keeping order
                entry["tags"] = list(dict.fromkeys(names))
        else:
            def convert_tags(entry):
                entry["tags"] = [tag["name"] for tag in entry["tags"]]

        ratings = {0: "General", 1: "R-18", 2: "R-18G"}
        with_user = self.config("metadata")
        with_bookmark = self.config("metadata-bookmark")
        api = self.api

        novels = self.novels()
        if self.max_posts:
            novels = itertools.islice(novels, self.max_posts)

        for novel in novels:
            if with_user:
                novel.update(api.user_detail(novel["user"]["id"]))
            if with_bookmark and novel["is_bookmarked"]:
                detail = api.novel_bookmark_detail(novel["id"])
                novel["tags_bookmark"] = [
                    tag["name"] for tag in detail["tags"]
                    if tag["is_registered"]
                ]
            if convert_tags:
                convert_tags(novel)
            novel["num"] = 0
            novel["date"] = text.parse_datetime(novel["create_date"])
            novel["rating"] = ratings.get(novel["x_restrict"])
            novel["suffix"] = ""

            yield Message.Directory, novel

            # the novel's content is passed along inline as 'text:' URL
            novel["extension"] = "txt"
            body = api.novel_text(novel["id"])["novel_text"]
            yield Message.Url, "text:" + body, novel

    def novels(self):
        """Return an iterable with the single novel given by the URL"""
        return (self.api.novel_detail(self.novel_id),)


class PixivNovelUserExtractor(PixivNovelExtractor):
    """Extractor for all novels of a pixiv user"""
    subcategory = "novel-user"
    pattern = (r"(?:https?://)?(?:www\.|touch\.)?pixiv\.net"
               r"/(?:en/)?users/(\d+)/novels")
    test = (
        "https://www.pixiv.net/en/users/77055466/novels",
        {
            "pattern": "^text:",
            "range": "1-5",
            "count": 5,
        },
    )

    def novels(self):
        """Return the user's novels"""
        # 'novel_id' holds the first pattern group, i.e. the user ID here
        user_id = self.novel_id
        return self.api.user_novels(user_id)


class PixivNovelSeriesExtractor(PixivNovelExtractor):
    """Extractor for all novels of a pixiv novel series"""
    subcategory = "novel-series"
    pattern = (r"(?:https?://)?(?:www\.|touch\.)?pixiv\.net"
               r"/novel/series/(\d+)")
    test = (
        "https://www.pixiv.net/novel/series/10278364",
        {
            "count": 4,
            "content": "b06abed001b3f6ccfb1579699e9a238b46d38ea2",
        },
    )

    def novels(self):
        """Return the novels belonging to the series"""
        # 'novel_id' holds the first pattern group, i.e. the series ID here
        series_id = self.novel_id
        return self.api.novel_series(series_id)


class PixivSketchExtractor(Extractor):
    """Extractor for user pages on sketch.pixiv.net"""
    category = "pixiv"
    subcategory = "sketch"
    directory_fmt = ("{category}", "sketch", "{user[unique_name]}")
    filename_fmt = "{post_id} {id}.{extension}"
    archive_fmt = "S{user[id]}_{id}"
    root = "https://sketch.pixiv.net"
    cookiedomain = ".pixiv.net"
    pattern = r"(?:https?://)?sketch\.pixiv\.net/@([^/?#]+)"
    test = ("https://sketch.pixiv.net/@nicoby", {
        "pattern": r"https://img\-sketch\.pixiv\.net/uploads/medium"
                   r"/file/\d+/\d+\.(jpg|png)",
        "count": ">= 35",
    })

    def __init__(self, match):
        """Store the username captured by 'pattern'"""
        Extractor.__init__(self, match)
        self.username = match.group(1)

    def items(self):
        """Yield one Directory message per post and one Url per photo"""
        date_format = "%Y-%m-%dT%H:%M:%S.%f%z"
        profile_url = "{}/@{}".format(self.root, self.username)
        file_headers = {"Referer": profile_url}

        for post in self.posts():
            # keep a reference to the media list before it gets removed
            # from the post's metadata below
            photos = post["media"]
            post["post_id"] = post["id"]
            post["date"] = text.parse_datetime(
                post["created_at"], date_format)
            util.delete_items(post, ("id", "media", "_links"))

            yield Message.Directory, post

            # attached only after the Directory message has been emitted
            post["_http_headers"] = file_headers

            for photo in photos:
                # the same 'post' dict is reused for every file; its
                # per-photo fields are overwritten on each iteration
                source = photo["photo"]["original"]
                post["id"] = photo["id"]
                post["width"] = source["width"]
                post["height"] = source["height"]

                file_url = source["url"]
                text.nameext_from_url(file_url, post)
                yield Message.Url, file_url, post

    def posts(self):
        """Yield all public wall posts of the user, following 'next' links"""
        request_headers = {
            "Accept": "application/vnd.sketch-v4+json",
            "X-Requested-With": "{}/@{}".format(self.root, self.username),
            "Referer": self.root + "/",
        }
        page_url = "{}/api/walls/@{}/posts/public.json".format(
            self.root, self.username)

        while True:
            page = self.request(page_url, headers=request_headers).json()
            yield from page["data"]["items"]

            # a missing or empty 'next' link marks the last page
            next_link = page["_links"].get("next")
            if not next_link:
                break
            page_url = self.root + next_link["href"]


class PixivAppAPI:
    """Minimal interface for the Pixiv App API for mobile devices

    For a more complete implementation or documentation, see
    - https://github.com/upbit/pixivpy
    - https://gist.github.com/ZipFile/3ba99b47162c23f8aea5d5942bb557b1
    """
    CLIENT_ID = "MOBrBDS8blbauoSck0ZfDbtuzpyT"
    CLIENT_SECRET = "lsACyCD94FhDUtGTXi3QzcFE2uU1hqtDaKeqrdwj"
    HASH_SECRET = ("28c1fdd170a5204386cb1313c7077b34"
                   "f83e4aaf4aa829ce78c231e05b0bae2c")

    def __init__(self, extractor):
        """Attach to 'extractor' and set up session headers and tokens"""
        self.extractor = extractor
        self.log = extractor.log
        self.username = extractor._get_auth_info()[0]
        self.user = None

        # all requests sent through the extractor's session
        # carry the iOS app's identification headers
        app_headers = {
            "App-OS": "ios",
            "App-OS-Version": "13.1.2",
            "App-Version": "7.7.6",
            "User-Agent": "PixivIOSApp/7.7.6 (iOS 13.1.2; iPhone11,8)",
            "Referer": "https://app-api.pixiv.net/",
        }
        extractor.session.headers.update(app_headers)

        # OAuth client credentials can be overridden via config options
        self.client_id = extractor.config("client-id", self.CLIENT_ID)
        self.client_secret = extractor.config(
            "client-secret", self.CLIENT_SECRET)

        # no configured token, or the literal value "cache",
        # means: use whatever is stored in the token cache
        configured = extractor.config("refresh-token")
        if configured is None or configured == "cache":
            self.refresh_token = _refresh_token_cache(self.username)
        else:
            self.refresh_token = configured

    def login(self):
        """Obtain an access token and install it as Authorization header"""
        user, authorization = self._login_impl(self.username)
        self.user = user
        self.extractor.session.headers["Authorization"] = authorization

    # NOTE(review): presumably caches the result per 'username' (argument
    # index 1) for 3600 seconds -- confirm against the 'cache' decorator
    @cache(maxage=3600, keyarg=1)
    def _login_impl(self, username):
        """Exchange the refresh token for a (user, authorization) tuple

        Raises AuthenticationError when no refresh token is available
        or when the token endpoint answers with a status code >= 400.
        """
        if not self.refresh_token:
            raise exception.AuthenticationError(
                "'refresh-token' required.\n"
                "Run `gallery-dl oauth:pixiv` to get one.")

        self.log.info("Refreshing access token")
        form = {
            "client_id": self.client_id,
            "client_secret": self.client_secret,
            "grant_type": "refresh_token",
            "refresh_token": self.refresh_token,
            "get_secure_url": "1",
        }

        # the request is signed with an MD5 digest
        # of the client time followed by HASH_SECRET
        client_time = datetime.utcnow().strftime("%Y-%m-%dT%H:%M:%S+00:00")
        signature = hashlib.md5((client_time + self.HASH_SECRET).encode())
        headers = {
            "X-Client-Time": client_time,
            "X-Client-Hash": signature.hexdigest(),
        }

        response = self.extractor.request(
            "https://oauth.secure.pixiv.net/auth/token",
            method="POST", headers=headers, data=form, fatal=False)
        if response.status_code >= 400:
            self.log.debug(response.text)
            raise exception.AuthenticationError("Invalid refresh token")

        result = response.json()["response"]
        return result["user"], "Bearer " + result["access_token"]

    def illust_detail(self, illust_id):
        """Return the 'illust' object of a single illustration"""
        response = self._call("/v1/illust/detail", {"illust_id": illust_id})
        return response["illust"]

    def illust_bookmark_detail(self, illust_id):
        """Return the 'bookmark_detail' object of an illustration"""
        response = self._call(
            "/v2/illust/bookmark/detail", {"illust_id": illust_id})
        return response["bookmark_detail"]

    def illust_follow(self, restrict="all"):
        """Return a generator over results of '/v2/illust/follow'"""
        return self._pagination("/v2/illust/follow", {"restrict": restrict})

    def illust_ranking(self, mode="day", date=None):
        """Return a generator over results of '/v1/illust/ranking'"""
        return self._pagination(
            "/v1/illust/ranking", {"mode": mode, "date": date})

    def illust_related(self, illust_id):
        """Return a generator over results of '/v2/illust/related'"""
        return self._pagination(
            "/v2/illust/related", {"illust_id": illust_id})

    def novel_bookmark_detail(self, novel_id):
        """Return the 'bookmark_detail' object of a novel"""
        response = self._call(
            "/v2/novel/bookmark/detail", {"novel_id": novel_id})
        return response["bookmark_detail"]

    def novel_detail(self, novel_id):
        """Return the 'novel' object of a single novel"""
        response = self._call("/v2/novel/detail", {"novel_id": novel_id})
        return response["novel"]

    def novel_series(self, series_id):
        """Return a generator over the 'novels' of a novel series"""
        return self._pagination(
            "/v1/novel/series", {"series_id": series_id}, "novels")

    def novel_text(self, novel_id):
        """Return the complete '/v1/novel/text' response for a novel"""
        return self._call("/v1/novel/text", {"novel_id": novel_id})

    def search_illust(self, word, sort=None, target=None, duration=None,
                      date_start=None, date_end=None):
        """Return a generator over results of '/v1/search/illust'"""
        query = {
            "word": word,
            "search_target": target,
            "sort": sort,
            "duration": duration,
            "start_date": date_start,
            "end_date": date_end,
        }
        return self._pagination("/v1/search/illust", query)

    def user_bookmarks_illust(self, user_id, tag=None, restrict="public"):
        """Return illusts bookmarked by a user"""
        query = {"user_id": user_id, "tag": tag, "restrict": restrict}
        return self._pagination("/v1/user/bookmarks/illust", query)

    def user_bookmark_tags_illust(self, user_id, restrict="public"):
        """Return bookmark tags defined by a user"""
        query = {"user_id": user_id, "restrict": restrict}
        return self._pagination(
            "/v1/user/bookmark-tags/illust", query, "bookmark_tags")

    # NOTE(review): presumably memoizes results per 'user_id'
    # (argument index 1) -- confirm against the 'memcache' decorator
    @memcache(keyarg=1)
    def user_detail(self, user_id):
        """Return the complete '/v1/user/detail' response for a user"""
        return self._call("/v1/user/detail", {"user_id": user_id})

    def user_following(self, user_id, restrict="public"):
        """Return a generator over the 'user_previews' a user follows"""
        query = {"user_id": user_id, "restrict": restrict}
        return self._pagination("/v1/user/following", query, "user_previews")

    def user_illusts(self, user_id):
        """Return a generator over results of '/v1/user/illusts'"""
        return self._pagination("/v1/user/illusts", {"user_id": user_id})

    def user_novels(self, user_id):
        """Return a generator over the 'novels' of a user"""
        return self._pagination(
            "/v1/user/novels", {"user_id": user_id}, "novels")

    def ugoira_metadata(self, illust_id):
        """Return the 'ugoira_metadata' object of an illustration"""
        response = self._call(
            "/v1/ugoira/metadata", {"illust_id": illust_id})
        return response["ugoira_metadata"]

    def _call(self, endpoint, params=None):
        """Send a GET request to 'endpoint' and return its decoded JSON

        Calls login() before every attempt. A response containing an
        "error" entry raises NotFoundError for status code 404, triggers
        a 300 second wait and a retry when its message mentions a rate
        limit, and raises StopExtraction in all other cases.
        """
        url = "https://app-api.pixiv.net" + endpoint

        while True:
            self.login()
            response = self.extractor.request(url, params=params, fatal=False)
            payload = response.json()

            if "error" not in payload:
                return payload

            self.log.debug(payload)

            if response.status_code == 404:
                raise exception.NotFoundError()

            error = payload["error"]
            message = error.get("message") or ""
            if "rate limit" not in message.lower():
                raise exception.StopExtraction(
                    "API request failed: %s", error)

            # rate limited: wait, then repeat the same request
            self.extractor.wait(seconds=300)

    def _pagination(self, endpoint, params, key="illusts"):
        """Yield the items under 'key' from every page of 'endpoint'"""
        while True:
            page = self._call(endpoint, params)
            yield from page[key]

            next_url = page["next_url"]
            if not next_url:
                return
            # the query string of 'next_url' becomes
            # the parameter set for the following request
            params = text.parse_query(next_url.rpartition("?")[2])


# Lookup of a stored refresh token, keyed by argument 0 ('username').
# 'maxage' evaluates to ten years' worth of seconds (10*365*24*3600);
# NOTE(review): the unit and exact caching behavior depend on the 'cache'
# decorator, which is defined outside this file -- confirm there.
@cache(maxage=10*365*24*3600, keyarg=0)
def _refresh_token_cache(username):
    """Return None as the value for a username without a stored token

    The body itself never produces a token. PixivAppAPI.__init__ calls
    this function when the 'refresh-token' option is unset or "cache".

    NOTE(review): actual tokens are presumably written into the cache
    from elsewhere (e.g. by the `gallery-dl oauth:pixiv` flow) -- verify.
    """
    return None
-												[pixiv] update to new extractor interface

											
										
										
											10 years ago
+								# -*- coding: utf-8 -*-
-												[pixiv] implement 'metadata-bookmark' option (#3417)

											
										
										
											2 years ago
+								# Copyright 2014-2023 Mike Fährmann
-												[pixiv] update to new extractor interface

											
										
										
											10 years ago
+								#
 								# This program is free software; you can redistribute it and/or modify
 								# it under the terms of the GNU General Public License version 2 as
 								# published by the Free Software Foundation.
-												[pixiv] add extractor for 'pixivision' articles (#1672)

											
										
										
											3 years ago
+								"""Extractors for https://www.pixiv.net/"""
-												[pixiv] update to new extractor interface

											
										
										
											10 years ago
-												remove SequentialExtractor class

											
										
										
											9 years ago
+								from .common import Extractor, Message
-												[pixiv] add extractor for 'pixivision' articles (#1672)

											
										
										
											3 years ago
+								from .. import text, util, exception
-												[pixiv] update API interface

- start all endpoints with '/'
- use extractor.wait() for rate limit
- retry with while loop instead of recursion
- in case of error, write entire response to debug log

											
										
										
											2 years ago
+								from ..cache import cache, memcache
-												[pixiv] use App API

Transitioning to the App API breaks favorites archive IDs (there is
no longer any bookmark ID information), but the favorites API endpoint
of the public API was gone anyways ...

											
										
										
											6 years ago
+								from datetime import datetime, timedelta
-												[pixiv] implement 'avatar' option (#595, #623)

											
										
										
											5 years ago
+								import itertools
-												[pixiv] fix authentication

											
										
										
											5 years ago
+								import hashlib
-												initial commit

											
										
										
											10 years ago
-												code adjustments according to pep8 nr2

											
										
										
											8 years ago
-												[pixiv] rewrite

- same functionality, better(?) code quality, easier to extend

- added test for the user-tag functionality

- removed the 'artist-id', 'artist-name' and 'artist-nick'
  keywords, which can be replaced with 'user[id]', 'user[name]'
  and 'user[account]' respectively

											
										
										
											7 years ago
+								class PixivExtractor(Extractor):
 								    """Base class for pixiv extractors"""
-												update all other extractors

											
										
										
											9 years ago
+								    category = "pixiv"
-												[pixiv] implement 'include' option

- split 'user' extractor and its 'avatar' and 'background' options into
  separate extractors ('artworks', 'avatar', 'background')
- avatars can now be downloaded with
  https://www.pixiv.net/en/users/ID/avatar
  as URL and will use a proper archive key; similar for backgrounds
- options for the 'user' subcategory must be moved to 'artworks' to have
  the same effect as before

											
										
										
											2 years ago
+								    root = "https://www.pixiv.net"
-												simplify extractor constants

- single strings for URL patterns
- tuples instead of lists for 'directory_fmt' and 'test'
- single-tuple tests where applicable

											
										
										
											6 years ago
+								    directory_fmt = ("{category}", "{user[id]} {user[account]}")
-												[pixiv] simplify default filename format

(#366)

											
										
										
											5 years ago
+								    filename_fmt = "{id}_p{num}.{extension}"
-												[pixiv] update metadata entries (#366)

- change 'num' to a simple enumerating integer
- change default filename format
- provide content of the old 'num' field as 'suffix'
- add 'filename' for ugoira

											
										
										
											5 years ago
+								    archive_fmt = "{id}{suffix}.{extension}"
-												let extractors opt-out of cookie option usage

useful to avoid sending unnecessary cookies when all authentication
is done through OAuth tokens

											
										
										
											5 years ago
+								    cookiedomain = None
-												initial commit

											
										
										
											10 years ago
-												propagate 'match' to base extractor constructor

											
										
										
											6 years ago
+								    def __init__(self, match):
 								        Extractor.__init__(self, match)
-												[pixiv] use App API

Transitioning to the App API breaks favorites archive IDs (there is
no longer any bookmark ID information), but the favorites API endpoint
of the public API was gone anyways ...

											
										
										
											6 years ago
+								        self.api = PixivAppAPI(self)
-												implement and use extractor.config() method

											
										
										
											8 years ago
+								        self.load_ugoira = self.config("ugoira", True)
-												[pixiv] implement 'max-posts' option (#1558)

* implement max-rank for pixiv

* rename to max-posts and make more generic
											
										
										
											3 years ago
+								        self.max_posts = self.config("max-posts", 0)
-												initial commit

											
										
										
											10 years ago
-												[pixiv] update to new extractor interface

											
										
										
											10 years ago
+								    def items(self):
-												[pixiv] change 'translated-tags' option (#1507)

- rename to 'tags'
- use string-values: "japanese", "translated", "noop"
- remove duplicate entries for "translated" tags

											
										
										
											3 years ago
+								        tags = self.config("tags", "japanese")
-												[pixiv] rename "noop" value for 'tags' option to "original"

(#1507)

											
										
										
											3 years ago
+								        if tags == "original":
-												[pixiv] change 'translated-tags' option (#1507)

- rename to 'tags'
- use string-values: "japanese", "translated", "noop"
- remove duplicate entries for "translated" tags

											
										
										
											3 years ago
+								            transform_tags = None
 								        elif tags == "translated":
 								            def transform_tags(work):
-												[pixiv] preserve 'tags' order (#3266)

for '"tags": "translated"'

As it turns out, set() does *not* preserve insertion order.

											
										
										
											2 years ago
+								                work["tags"] = list(dict.fromkeys(
-												[pixiv] change 'translated-tags' option (#1507)

- rename to 'tags'
- use string-values: "japanese", "translated", "noop"
- remove duplicate entries for "translated" tags

											
										
										
											3 years ago
+								                    tag["translated_name"] or tag["name"]
 								                    for tag in work["tags"]))
 								        else:
 								            def transform_tags(work):
 								                work["tags"] = [tag["name"] for tag in work["tags"]]
-												[pixiv] add 'rating' metadata field (#595)

A human-friendlier representation of 'x_restrict'

											
										
										
											5 years ago
+								        ratings = {0: "General", 1: "R-18", 2: "R-18G"}
-												[pixiv] implement 'metadata-bookmark' option (#3417)

											
										
										
											2 years ago
+								        meta_user = self.config("metadata")
 								        meta_bookmark = self.config("metadata-bookmark")
-												[pixiv] reduce calls to '/user/detail'

											
										
										
											5 years ago
+								        metadata = self.metadata()
-												[pixiv] transition to pixiv public api

											
										
										
											9 years ago
-												[pixiv] implement 'max-posts' option (#1558)

* implement max-rank for pixiv

* rename to max-posts and make more generic
											
										
										
											3 years ago
+								        works = self.works()
 								        if self.max_posts:
 								            works = itertools.islice(works, self.max_posts)
 								        for work in works:
-												[pixiv] use App API

Transitioning to the App API breaks favorites archive IDs (there is
no longer any bookmark ID information), but the favorites API endpoint
of the public API was gone anyways ...

											
										
										
											6 years ago
+								            if not work["user"]["id"]:
 								                continue
 								            meta_single_page = work["meta_single_page"]
 								            meta_pages = work["meta_pages"]
 								            del work["meta_single_page"]
 								            del work["image_urls"]
 								            del work["meta_pages"]
-												[pixiv] change 'translated-tags' option (#1507)

- rename to 'tags'
- use string-values: "japanese", "translated", "noop"
- remove duplicate entries for "translated" tags

											
										
										
											3 years ago
-												[pixiv] implement 'metadata-bookmark' option (#3417)

											
										
										
											2 years ago
+								            if meta_user:
-												[pixiv] extend 'metadata' option (#3057)

make it usable for all 'pixiv' extractors

											
										
										
											2 years ago
+								                work.update(self.api.user_detail(work["user"]["id"]))
-												[pixiv] implement 'metadata-bookmark' option (#3417)

											
										
										
											2 years ago
+								            if meta_bookmark and work["is_bookmarked"]:
 								                detail = self.api.illust_bookmark_detail(work["id"])
 								                work["tags_bookmark"] = [tag["name"] for tag in detail["tags"]
 								                                         if tag["is_registered"]]
-												[pixiv] change 'translated-tags' option (#1507)

- rename to 'tags'
- use string-values: "japanese", "translated", "noop"
- remove duplicate entries for "translated" tags

											
										
										
											3 years ago
+								            if transform_tags:
 								                transform_tags(work)
-												[pixiv] update metadata entries (#366)

- change 'num' to a simple enumerating integer
- change default filename format
- provide content of the old 'num' field as 'suffix'
- add 'filename' for ugoira

											
										
										
											5 years ago
+								            work["num"] = 0
-												apply workaround from 4736912 in parse_datetime() itself

											
										
										
											5 years ago
+								            work["date"] = text.parse_datetime(work["create_date"])
-												[pixiv] add 'rating' metadata field (#595)

A human-friendlier representation of 'x_restrict'

											
										
										
											5 years ago
+								            work["rating"] = ratings.get(work["x_restrict"])
-												[pixiv] update metadata entries (#366)

- change 'num' to a simple enumerating integer
- change default filename format
- provide content of the old 'num' field as 'suffix'
- add 'filename' for ugoira

											
										
										
											5 years ago
+								            work["suffix"] = ""
-												[pixiv] use App API

Transitioning to the App API breaks favorites archive IDs (there is
no longer any bookmark ID information), but the favorites API endpoint
of the public API was gone anyways ...

											
										
										
											6 years ago
+								            work.update(metadata)
-												[pixiv] rewrite

- same functionality, better(?) code quality, easier to extend

- added test for the user-tag functionality

- removed the 'artist-id', 'artist-name' and 'artist-nick'
  keywords, which can be replaced with 'user[id]', 'user[name]'
  and 'user[account]' respectively

											
										
										
											7 years ago
-												[pixiv] create directory for each "work" item (#136)

											
										
										
											6 years ago
+								            yield Message.Directory, work
-												[pixiv] transition to pixiv public api

											
										
										
											9 years ago
+								            if work["type"] == "ugoira":
-												[pixiv] add option to skip ugoiras

											
										
										
											8 years ago
+								                if not self.load_ugoira:
 								                    continue
-												[pixiv] make retrieving ugoira metadata non-fatal (#2562)

											
										
										
											2 years ago
 								                try:
 								                    ugoira = self.api.ugoira_metadata(work["id"])
 								                except exception.StopExtraction as exc:
 								                    self.log.warning(
 								                        "Unable to retrieve Ugoira metatdata (%s - %s)",
 								                        work.get("id"), exc.message)
 								                    continue
-												[pixiv] use App API

Transitioning to the App API breaks favorites archive IDs (there is
no longer any bookmark ID information), but the favorites API endpoint
of the public API was gone anyways ...

											
										
										
											6 years ago
 								                url = ugoira["zip_urls"]["medium"].replace(
 								                    "_ugoira600x600", "_ugoira1920x1080")
-												[pixiv] rework ugoira handling

Frame information now gets attached to the ZIP file's keyword dict
instead of being written to a separate text file.

											
										
										
											6 years ago
+								                work["frames"] = ugoira["frames"]
-												[pixiv] extract 'date_url' metadata (#3405)

i.e. the datetime encoded in each file URL.

https://i.pximg.net/img-master/img/2022/12/01/13/44/55/12345678_p0.jpg
->
2022-12-01 13:44:55 +09:00
->
2022-12-01 04:44:55

											
										
										
											2 years ago
+								                work["date_url"] = self._date_from_url(url)
-												[downloader:http] disable filename extension changes for ugoira

(#1507)

											
										
										
											3 years ago
+								                work["_http_adjust_extension"] = False
-												[pixiv] update metadata entries (#366)

- change 'num' to a simple enumerating integer
- change default filename format
- provide content of the old 'num' field as 'suffix'
- add 'filename' for ugoira

											
										
										
											5 years ago
+								                yield Message.Url, url, text.nameext_from_url(url, work)
-												[pixiv] use App API

Transitioning to the App API breaks favorites archive IDs (there is
no longer any bookmark ID information), but the favorites API endpoint
of the public API was gone anyways ...

											
										
										
											6 years ago
-												[pixiv] transition to pixiv public api

											
										
										
											9 years ago
+								            elif work["page_count"] == 1:
-												[pixiv] use App API

Transitioning to the App API breaks favorites archive IDs (there is
no longer any bookmark ID information), but the favorites API endpoint
of the public API was gone anyways ...

											
										
										
											6 years ago
+								                url = meta_single_page["original_image_url"]
-												[pixiv] extract 'date_url' metadata (#3405)

i.e. the datetime encoded in each file URL.

https://i.pximg.net/img-master/img/2022/12/01/13/44/55/12345678_p0.jpg
->
2022-12-01 13:44:55 +09:00
->
2022-12-01 04:44:55

											
										
										
											2 years ago
+								                work["date_url"] = self._date_from_url(url)
-												[pixiv] provide 'filename' and change default filename format

to '{filename}.{extension}' (closes #366)

											
										
										
											5 years ago
+								                yield Message.Url, url, text.nameext_from_url(url, work)
-												initial commit

											
										
										
											10 years ago
 								            else:
-												[pixiv] update metadata entries (#366)

- change 'num' to a simple enumerating integer
- change default filename format
- provide content of the old 'num' field as 'suffix'
- add 'filename' for ugoira

											
										
										
											5 years ago
+								                for work["num"], img in enumerate(meta_pages):
-												[pixiv] use App API

Transitioning to the App API breaks favorites archive IDs (there is
no longer any bookmark ID information), but the favorites API endpoint
of the public API was gone anyways ...

											
										
										
											6 years ago
+								                    url = img["image_urls"]["original"]
-												[pixiv] extract 'date_url' metadata (#3405)

i.e. the datetime encoded in each file URL.

https://i.pximg.net/img-master/img/2022/12/01/13/44/55/12345678_p0.jpg
->
2022-12-01 13:44:55 +09:00
->
2022-12-01 04:44:55

											
										
										
											2 years ago
+								                    work["date_url"] = self._date_from_url(url)
-												[pixiv] update metadata entries (#366)

- change 'num' to a simple enumerating integer
- change default filename format
- provide content of the old 'num' field as 'suffix'
- add 'filename' for ugoira

											
										
										
											5 years ago
+								                    work["suffix"] = "_p{:02}".format(work["num"])
-												[pixiv] provide 'filename' and change default filename format

to '{filename}.{extension}' (closes #366)

											
										
										
											5 years ago
+								                    yield Message.Url, url, text.nameext_from_url(url, work)
-												[pixiv] transition to pixiv public api

											
										
										
											9 years ago
-												[pixiv] extract 'date_url' metadata (#3405)

i.e. the datetime encoded in each file URL.

https://i.pximg.net/img-master/img/2022/12/01/13/44/55/12345678_p0.jpg
->
2022-12-01 13:44:55 +09:00
->
2022-12-01 04:44:55

											
										
										
											2 years ago
+								    @staticmethod
 								    def _date_from_url(url, offset=timedelta(hours=9)):
 								        try:
 								            _, _, _, _, _, y, m, d, H, M, S, _ = url.split("/")
 								            return datetime(
 								                int(y), int(m), int(d), int(H), int(M), int(S)) - offset
 								        except Exception:
 								            return None
-												[pixiv] implement 'include' option

- split 'user' extractor and its 'avatar' and 'background' options into
  separate extractors ('artworks', 'avatar', 'background')
- avatars can now be downloaded with
  https://www.pixiv.net/en/users/ID/avatar
  as URL and will use a proper archive key; similar for backgrounds
- options for the 'user' subcategory must be moved to 'artworks' to have
  the same effect as before

											
										
										
											2 years ago
+								    @staticmethod
 								    def _make_work(kind, url, user):
-												[pixiv] updates to avatar/background extractors (#2495)

- add 'date' metadata to avatar/background files when available
  and use that in default filenames / archive ids
- remove deprecation warnings as their option names clash with
  subcategory names

											
										
										
											2 years ago
+								        p = url.split("/")
-												[pixiv] implement 'include' option

- split 'user' extractor and its 'avatar' and 'background' options into
  separate extractors ('artworks', 'avatar', 'background')
- avatars can now be downloaded with
  https://www.pixiv.net/en/users/ID/avatar
  as URL and will use a proper archive key; similar for backgrounds
- options for the 'user' subcategory must be moved to 'artworks' to have
  the same effect as before

											
										
										
											2 years ago
+								        return {
-												[pixiv] updates to avatar/background extractors (#2495)

- add 'date' metadata to avatar/background files when available
  and use that in default filenames / archive ids
- remove deprecation warnings as their option names clash with
  subcategory names

											
										
										
											2 years ago
+								            "create_date"     : "{}-{}-{}T{}:{}:{}+09:00".format(
 								                p[5], p[6], p[7], p[8], p[9], p[10]) if len(p) > 9 else None,
-												[pixiv] implement 'include' option

- split 'user' extractor and its 'avatar' and 'background' options into
  separate extractors ('artworks', 'avatar', 'background')
- avatars can now be downloaded with
  https://www.pixiv.net/en/users/ID/avatar
  as URL and will use a proper archive key; similar for backgrounds
- options for the 'user' subcategory must be moved to 'artworks' to have
  the same effect as before

											
										
										
											2 years ago
+								            "height"          : 0,
 								            "id"              : kind,
 								            "image_urls"      : None,
 								            "meta_pages"      : (),
 								            "meta_single_page": {"original_image_url": url},
 								            "page_count"      : 1,
 								            "sanity_level"    : 0,
 								            "tags"            : (),
 								            "title"           : kind,
 								            "type"            : kind,
 								            "user"            : user,
 								            "width"           : 0,
 								            "x_restrict"      : 0,
 								        }
-												[pixiv] rewrite

- same functionality, better(?) code quality, easier to extend

- added test for the user-tag functionality

- removed the 'artist-id', 'artist-name' and 'artist-nick'
  keywords, which can be replaced with 'user[id]', 'user[name]'
  and 'user[account]' respectively

											
										
										
											7 years ago
+								    def works(self):
-												[pixiv] implement 'include' option

- split 'user' extractor and its 'avatar' and 'background' options into
  separate extractors ('artworks', 'avatar', 'background')
- avatars can now be downloaded with
  https://www.pixiv.net/en/users/ID/avatar
  as URL and will use a proper archive key; similar for backgrounds
- options for the 'user' subcategory must be moved to 'artworks' to have
  the same effect as before

											
										
										
											2 years ago
+								        """Return an iterable containing all relevant 'work' objects"""
-												initial commit

											
										
										
											10 years ago
-												[pixiv] reduce calls to '/user/detail'

											
										
										
											5 years ago
+								    def metadata(self):
-												[pixiv] implement 'include' option

- split 'user' extractor and its 'avatar' and 'background' options into
  separate extractors ('artworks', 'avatar', 'background')
- avatars can now be downloaded with
  https://www.pixiv.net/en/users/ID/avatar
  as URL and will use a proper archive key; similar for backgrounds
- options for the 'user' subcategory must be moved to 'artworks' to have
  the same effect as before

											
										
										
											2 years ago
+								        """Collect metadata for extractor job"""
-												[pixiv] reduce calls to '/user/detail'

											
										
										
											5 years ago
+								        return {}
-												[pixiv] rewrite

- same functionality, better(?) code quality, easier to extend

- added test for the user-tag functionality

- removed the 'artist-id', 'artist-name' and 'artist-nick'
  keywords, which can be replaced with 'user[id]', 'user[name]'
  and 'user[account]' respectively

											
										
										
											7 years ago
 								class PixivUserExtractor(PixivExtractor):
-												[pixiv] implement 'include' option

- split 'user' extractor and its 'avatar' and 'background' options into
  separate extractors ('artworks', 'avatar', 'background')
- avatars can now be downloaded with
  https://www.pixiv.net/en/users/ID/avatar
  as URL and will use a proper archive key; similar for backgrounds
- options for the 'user' subcategory must be moved to 'artworks' to have
  the same effect as before

											
										
										
											2 years ago
+								    """Extractor for a pixiv user profile"""
-												[pixiv] rewrite

- same functionality, better(?) code quality, easier to extend

- added test for the user-tag functionality

- removed the 'artist-id', 'artist-name' and 'artist-nick'
  keywords, which can be replaced with 'user[id]', 'user[name]'
  and 'user[account]' respectively

											
										
										
											7 years ago
+								    subcategory = "user"
-												[pixiv] update URL patterns (fixes #568)

Pixiv now uses new URLs for
- user profiles and illustration listings:
  - https://www.pixiv.net/en/users/<ID>
  - https://www.pixiv.net/en/users/<ID>/artworks
- bookmarks:
  - https://www.pixiv.net/en/users/<ID>/bookmarks/artworks

											
										
										
											5 years ago
+								    pattern = (r"(?:https?://)?(?:www\.|touch\.)?pixiv\.net/(?:"
-												[pixiv] implement 'include' option

- split 'user' extractor and its 'avatar' and 'background' options into
  separate extractors ('artworks', 'avatar', 'background')
- avatars can now be downloaded with
  https://www.pixiv.net/en/users/ID/avatar
  as URL and will use a proper archive key; similar for backgrounds
- options for the 'user' subcategory must be moved to 'artworks' to have
  the same effect as before

											
										
										
											2 years ago
+								               r"(?:en/)?u(?:sers)?/|member\.php\?id=|(?:mypage\.php)?#id="
 								               r")(\d+)(?:$|[?#])")
 								    test = (
 								        ("https://www.pixiv.net/en/users/173530"),
 								        ("https://www.pixiv.net/u/173530"),
 								        ("https://www.pixiv.net/member.php?id=173530"),
 								        ("https://www.pixiv.net/mypage.php#id=173530"),
 								        ("https://www.pixiv.net/#id=173530"),
 								    )
 								    def __init__(self, match):
 								        # 'match' is the result of matching this class's 'pattern';
 								        # it is forwarded unchanged to the base extractor constructor
 								        PixivExtractor.__init__(self, match)
 								        # the only capture group of 'pattern', (\d+), is the user ID
 								        self.user_id = match.group(1)
 								    def items(self):
 								        base = "{}/users/{}/".format(self.root, self.user_id)
 								        return self._dispatch_extractors((
 								            (PixivAvatarExtractor    , base + "avatar"),
 								            (PixivBackgroundExtractor, base + "background"),
 								            (PixivArtworksExtractor  , base + "artworks"),
 								            (PixivFavoriteExtractor  , base + "bookmarks/artworks"),
-												[pixiv] initial 'novel' support (#1241, #4044)

supported URLs are
- https://www.pixiv.net/novel/show.php?id=<ID>
- https://www.pixiv.net/novel/series/<ID>
- https://www.pixiv.net/en/users/<ID>/novels

											
										
										
											1 year ago
+								            (PixivNovelUserExtractor , base + "novels"),
-												[pixiv] updates to avatar/background extractors (#2495)

- add 'date' metadata to avatar/background files when available
  and use that in default filenames / archive ids
- remove deprecation warnings as their option names clash with
  subcategory names

											
										
										
											2 years ago
+								        ), ("artworks",))
-												[pixiv] implement 'include' option

- split 'user' extractor and its 'avatar' and 'background' options into
  separate extractors ('artworks', 'avatar', 'background')
- avatars can now be downloaded with
  https://www.pixiv.net/en/users/ID/avatar
  as URL and will use a proper archive key; similar for backgrounds
- options for the 'user' subcategory must be moved to 'artworks' to have
  the same effect as before

											
										
										
											2 years ago
 								class PixivArtworksExtractor(PixivExtractor):
 								    """Extractor for artworks of a pixiv user"""
 								    subcategory = "artworks"
 								    pattern = (r"(?:https?://)?(?:www\.|touch\.)?pixiv\.net/(?:"
 								               r"(?:en/)?users/(\d+)/(?:artworks|illustrations|manga)"
 								               r"(?:/([^/?#]+))?/?(?:$|[?#])"
 								               r"|member_illust\.php\?id=(\d+)(?:&([^#]+))?)")
-												simplify extractor constants

- single strings for URL patterns
- tuples instead of lists for 'directory_fmt' and 'test'
- single-tuple tests where applicable

											
										
										
											6 years ago
+								    test = (
-												[pixiv] update URL patterns (fixes #568)

Pixiv now uses new URLs for
- user profiles and illustration listings:
  - https://www.pixiv.net/en/users/<ID>
  - https://www.pixiv.net/en/users/<ID>/artworks
- bookmarks:
  - https://www.pixiv.net/en/users/<ID>/bookmarks/artworks

											
										
										
											5 years ago
+								        ("https://www.pixiv.net/en/users/173530/artworks", {
-												[pixiv] rewrite

- same functionality, better(?) code quality, easier to extend

- added test for the user-tag functionality

- removed the 'artist-id', 'artist-name' and 'artist-nick'
  keywords, which can be replaced with 'user[id]', 'user[name]'
  and 'user[account]' respectively

											
										
										
											7 years ago
+								            "url": "852c31ad83b6840bacbce824d85f2a997889efb7",
 								        }),
-												[pixiv] improve bookmark extraction

- combine 'favorite' and 'bookmark' extractors
  - it is now one extractor class, but its subcategory still
    distinguishes between your own bookmarks ('bookmark') and other
    user's bookmarks ('favorite') like before
- allow filtering by bookmark tags and public/private bookmarks
- fix pagination for bookmark results

											
										
										
											6 years ago
+								        # illusts with specific tag
-												[pixiv] update URL patterns (fixes #568)

Pixiv now uses new URLs for
- user profiles and illustration listings:
  - https://www.pixiv.net/en/users/<ID>
  - https://www.pixiv.net/en/users/<ID>/artworks
- bookmarks:
  - https://www.pixiv.net/en/users/<ID>/bookmarks/artworks

											
										
										
											5 years ago
+								        (("https://www.pixiv.net/en/users/173530/artworks"
 								          "/%E6%89%8B%E3%81%B6%E3%82%8D"), {
 								            "url": "25b1cd81153a8ff82eec440dd9f20a4a22079658",
 								        }),
-												[pixiv] unquote tags

											
										
										
											7 years ago
+								        (("https://www.pixiv.net/member_illust.php?id=173530"
 								          "&tag=%E6%89%8B%E3%81%B6%E3%82%8D"), {
 								            "url": "25b1cd81153a8ff82eec440dd9f20a4a22079658",
-												[pixiv] rewrite

- same functionality, better(?) code quality, easier to extend

- added test for the user-tag functionality

- removed the 'artist-id', 'artist-name' and 'artist-nick'
  keywords, which can be replaced with 'user[id]', 'user[name]'
  and 'user[account]' respectively

											
										
										
											7 years ago
+								        }),
-												[pixiv] implement 'avatar' option (#595, #623)

											
										
										
											5 years ago
+								        # deleted account
-												[pixiv] rewrite

- same functionality, better(?) code quality, easier to extend

- added test for the user-tag functionality

- removed the 'artist-id', 'artist-name' and 'artist-nick'
  keywords, which can be replaced with 'user[id]', 'user[name]'
  and 'user[account]' respectively

											
										
										
											7 years ago
+								        ("http://www.pixiv.net/member_illust.php?id=173531", {
-												[pixiv] add 'metadata' option (#1551)

											
										
										
											3 years ago
+								            "options": (("metadata", True),),
 								            "exception": exception.NotFoundError,
-												[pixiv] rewrite

- same functionality, better(?) code quality, easier to extend

- added test for the user-tag functionality

- removed the 'artist-id', 'artist-name' and 'artist-nick'
  keywords, which can be replaced with 'user[id]', 'user[name]'
  and 'user[account]' respectively

											
										
										
											7 years ago
+								        }),
-												[pixiv] update URL patterns (fixes #568)

Pixiv now uses new URLs for
- user profiles and illustration listings:
  - https://www.pixiv.net/en/users/<ID>
  - https://www.pixiv.net/en/users/<ID>/artworks
- bookmarks:
  - https://www.pixiv.net/en/users/<ID>/bookmarks/artworks

											
										
										
											5 years ago
+								        ("https://www.pixiv.net/en/users/173530/manga"),
 								        ("https://www.pixiv.net/en/users/173530/illustrations"),
 								        ("https://www.pixiv.net/member_illust.php?id=173530"),
-												simplify extractor constants

- single strings for URL patterns
- tuples instead of lists for 'directory_fmt' and 'test'
- single-tuple tests where applicable

											
										
										
											6 years ago
+								        ("https://touch.pixiv.net/member_illust.php?id=173530"),
 								    )
-												[pixiv] update to new extractor interface

											
										
										
											10 years ago
-												[pixiv] rewrite

- same functionality, better(?) code quality, easier to extend

- added test for the user-tag functionality

- removed the 'artist-id', 'artist-name' and 'artist-nick'
  keywords, which can be replaced with 'user[id]', 'user[name]'
  and 'user[account]' respectively

											
										
										
											7 years ago
+								    def __init__(self, match):
-												propagate 'match' to base extractor constructor

											
										
										
											6 years ago
+								        PixivExtractor.__init__(self, match)
-												[pixiv] implement 'include' option

- split 'user' extractor and its 'avatar' and 'background' options into
  separate extractors ('artworks', 'avatar', 'background')
- avatars can now be downloaded with
  https://www.pixiv.net/en/users/ID/avatar
  as URL and will use a proper archive key; similar for backgrounds
- options for the 'user' subcategory must be moved to 'artworks' to have
  the same effect as before

											
										
										
											2 years ago
+								        u1, t1, u2, t2 = match.groups()
-												[pixiv] update URL patterns (fixes #568)

Pixiv now uses new URLs for
- user profiles and illustration listings:
  - https://www.pixiv.net/en/users/<ID>
  - https://www.pixiv.net/en/users/<ID>/artworks
- bookmarks:
  - https://www.pixiv.net/en/users/<ID>/bookmarks/artworks

											
										
										
											5 years ago
+								        if t1:
 								            t1 = text.unquote(t1)
 								        elif t2:
 								            t2 = text.parse_query(t2).get("tag")
-												[pixiv] implement 'include' option

- split 'user' extractor and its 'avatar' and 'background' options into
  separate extractors ('artworks', 'avatar', 'background')
- avatars can now be downloaded with
  https://www.pixiv.net/en/users/ID/avatar
  as URL and will use a proper archive key; similar for backgrounds
- options for the 'user' subcategory must be moved to 'artworks' to have
  the same effect as before

											
										
										
											2 years ago
+								        self.user_id = u1 or u2
-												[pixiv] update URL patterns (fixes #568)

Pixiv now uses new URLs for
- user profiles and illustration listings:
  - https://www.pixiv.net/en/users/<ID>
  - https://www.pixiv.net/en/users/<ID>/artworks
- bookmarks:
  - https://www.pixiv.net/en/users/<ID>/bookmarks/artworks

											
										
										
											5 years ago
+								        self.tag = t1 or t2
-												[pixiv] rewrite

- same functionality, better(?) code quality, easier to extend

- added test for the user-tag functionality

- removed the 'artist-id', 'artist-name' and 'artist-nick'
  keywords, which can be replaced with 'user[id]', 'user[name]'
  and 'user[account]' respectively

											
										
										
											7 years ago
-												[pixiv] add 'metadata' option (#1551)

											
										
										
											3 years ago
+								    def metadata(self):
 								        if self.config("metadata"):
-												[pixiv] extend 'metadata' option (#3057)

make it usable for all 'pixiv' extractors

											
										
										
											2 years ago
+								            self.api.user_detail(self.user_id)
-												[pixiv] add 'metadata' option (#1551)

											
										
										
											3 years ago
+								        return {}
-												[pixiv] rewrite

- same functionality, better(?) code quality, easier to extend

- added test for the user-tag functionality

- removed the 'artist-id', 'artist-name' and 'artist-nick'
  keywords, which can be replaced with 'user[id]', 'user[name]'
  and 'user[account]' respectively

											
										
										
											7 years ago
+								    def works(self):
-												[pixiv] respect more query parameters for user URLs

The API endpoint responsible for user illustrations does not
provide sufficient filter capabilities* to match the actual
website, so we are spinning our own filters.

Respected parameters are
    'type': illust, manga, ugoira
    'tag' : any image tag (this was already supported)
    'p'   : the page to start on

*
- API can filter for illustrations and manga, but not for ugoira.
- 'offset' is applied before filtering
- no 'tag' filter

											
										
										
											6 years ago
+								        works = self.api.user_illusts(self.user_id)
-												[pixiv] update URL patterns (fixes #568)

Pixiv now uses new URLs for
- user profiles and illustration listings:
  - https://www.pixiv.net/en/users/<ID>
  - https://www.pixiv.net/en/users/<ID>/artworks
- bookmarks:
  - https://www.pixiv.net/en/users/<ID>/bookmarks/artworks

											
										
										
											5 years ago
+								        if self.tag:
 								            tag = self.tag.lower()
-												[pixiv] remove 'type' and 'page' query parameter handling

The "new and improved" /member_illust.php and /bookmark.php listings
don't quite work with how things were.

											
										
										
											6 years ago
+								            works = (
 								                work for work in works
 								                if tag in [t["name"].lower() for t in work["tags"]]
 								            )
-												[pixiv] respect more query parameters for user URLs

The API endpoint responsible for user illustrations does not
provide sufficient filter capabilities* to match the actual
website, so we are spinning our own filters.

Respected parameters are
    'type': illust, manga, ugoira
    'tag' : any image tag (this was already supported)
    'p'   : the page to start on

*
- API can filter for illustrations and manga, but not for ugoira.
- 'offset' is applied before filtering
- no 'tag' filter

											
										
										
											6 years ago
 								        return works
-												[pixiv] support pixiv.me URLs (#23)

											
										
										
											7 years ago
-												[pixiv] implement 'include' option

- split 'user' extractor and its 'avatar' and 'background' options into
  separate extractors ('artworks', 'avatar', 'background')
- avatars can now be downloaded with
  https://www.pixiv.net/en/users/ID/avatar
  as URL and will use a proper archive key; similar for backgrounds
- options for the 'user' subcategory must be moved to 'artworks' to have
  the same effect as before

											
										
										
											2 years ago
 								class PixivAvatarExtractor(PixivExtractor):
 								    """Extractor for pixiv avatars"""
 								    subcategory = "avatar"
-												[pixiv] updates to avatar/background extractors (#2495)

- add 'date' metadata to avatar/background files when available
  and use that in default filenames / archive ids
- remove deprecation warnings as their option names clash with
  subcategory names

											
										
										
											2 years ago
+								    filename_fmt = "avatar{date:?_//%Y-%m-%d}.{extension}"
 								    archive_fmt = "avatar_{user[id]}_{date}"
-												[pixiv] implement 'include' option

- split 'user' extractor and its 'avatar' and 'background' options into
  separate extractors ('artworks', 'avatar', 'background')
- avatars can now be downloaded with
  https://www.pixiv.net/en/users/ID/avatar
  as URL and will use a proper archive key; similar for backgrounds
- options for the 'user' subcategory must be moved to 'artworks' to have
  the same effect as before

											
										
										
											2 years ago
+								    pattern = (r"(?:https?://)?(?:www\.)?pixiv\.net"
 								               r"/(?:en/)?users/(\d+)/avatar")
 								    test = ("https://www.pixiv.net/en/users/173530/avatar", {
 								        "content": "4e57544480cc2036ea9608103e8f024fa737fe66",
 								    })
 								    def __init__(self, match):
 								        # 'match' is the result of matching this class's 'pattern';
 								        # it is forwarded unchanged to the base extractor constructor
 								        PixivExtractor.__init__(self, match)
 								        # capture group 1 is the (\d+) between 'users/' and '/avatar'
 								        self.user_id = match.group(1)
 								    def works(self):
 								        """Return a 1-tuple holding a pseudo-'work' for the user's avatar"""
 								        profile = self.api.user_detail(self.user_id)["user"]
 								        medium_url = profile["profile_image_urls"]["medium"]
 								        # remove the '_170' marker in front of the file extension
 								        # (presumably selects the full-size image -- TODO confirm)
 								        avatar_url = medium_url.replace("_170.", ".")
 								        avatar = self._make_work("avatar", avatar_url, profile)
 								        return (avatar,)
 								class PixivBackgroundExtractor(PixivExtractor):
 								    """Extractor for pixiv background banners"""
 								    subcategory = "background"
-												[pixiv] fix default filenames for backgrounds

											
										
										
											2 years ago
+								    filename_fmt = "background{date:?_//%Y-%m-%d}.{extension}"
-												[pixiv] updates to avatar/background extractors (#2495)

- add 'date' metadata to avatar/background files when available
  and use that in default filenames / archive ids
- remove deprecation warnings as their option names clash with
  subcategory names

											
										
										
											2 years ago
+								    archive_fmt = "background_{user[id]}_{date}"
-												[pixiv] implement 'include' option

- split 'user' extractor and its 'avatar' and 'background' options into
  separate extractors ('artworks', 'avatar', 'background')
- avatars can now be downloaded with
  https://www.pixiv.net/en/users/ID/avatar
  as URL and will use a proper archive key; similar for backgrounds
- options for the 'user' subcategory must be moved to 'artworks' to have
  the same effect as before

											
										
										
											2 years ago
+								    pattern = (r"(?:https?://)?(?:www\.)?pixiv\.net"
 								               r"/(?:en/)?users/(\d+)/background")
 								    test = ("https://www.pixiv.net/en/users/194921/background", {
 								        "pattern": r"https://i\.pximg\.net/background/img/2021/01/30/16/12/02"
 								                   r"/194921_af1f71e557a42f499213d4b9eaccc0f8\.jpg",
 								    })
 								    def __init__(self, match):
 								        # 'match' is the result of matching this class's 'pattern';
 								        # it is forwarded unchanged to the base extractor constructor
 								        PixivExtractor.__init__(self, match)
 								        # capture group 1 is the (\d+) between 'users/' and '/background'
 								        self.user_id = match.group(1)
 								    def works(self):
 								        detail = self.api.user_detail(self.user_id)
 								        url = detail["profile"]["background_image_url"]
 								        if not url:
 								            return ()
 								        if "/c/" in url:
 								            parts = url.split("/")
 								            del parts[3:5]
 								            url = "/".join(parts)
 								        url = url.replace("_master1200.", ".")
 								        work = self._make_work("background", url, detail["user"])
 								        if url.endswith(".jpg"):
-												[pixiv] include '.gif' in background fallback URLs (#2495)

											
										
										
											2 years ago
+								            url = url[:-4]
 								            work["_fallback"] = (url + ".png", url + ".gif")
-												[pixiv] implement 'include' option

- split 'user' extractor and its 'avatar' and 'background' options into
  separate extractors ('artworks', 'avatar', 'background')
- avatars can now be downloaded with
  https://www.pixiv.net/en/users/ID/avatar
  as URL and will use a proper archive key; similar for backgrounds
- options for the 'user' subcategory must be moved to 'artworks' to have
  the same effect as before

											
										
										
											2 years ago
+								        return (work,)
-												[pixiv] implement 'background' option (#623, #1124, #2495)

											
										
										
											2 years ago
-												[pixiv] rewrite

- same functionality, better(?) code quality, easier to extend

- added test for the user-tag functionality

- removed the 'artist-id', 'artist-name' and 'artist-nick'
  keywords, which can be replaced with 'user[id]', 'user[name]'
  and 'user[account]' respectively

											
										
										
											7 years ago
-												[pixiv] support pixiv.me URLs (#23)

											
										
										
											7 years ago
+								class PixivMeExtractor(PixivExtractor):
 								    """Extractor for pixiv.me URLs"""
 								    subcategory = "me"
-												remove '&' from URL patterns

'/?&#' -> '/?#' and '?&#' -> '?#'

According to https://www.ietf.org/rfc/rfc3986.txt, URLs are
"organized hierarchically" by using "the slash ("/"), question
mark ("?"), and number sign ("#") characters to delimit components"

											
										
										
											4 years ago
+								    pattern = r"(?:https?://)?pixiv\.me/([^/?#]+)"
-												simplify extractor constants

- single strings for URL patterns
- tuples instead of lists for 'directory_fmt' and 'test'
- single-tuple tests where applicable

											
										
										
											6 years ago
+								    test = (
-												[pixiv] support pixiv.me URLs (#23)

											
										
										
											7 years ago
+								        ("https://pixiv.me/del_shannon", {
-												[pixiv] update URL patterns (fixes #568)

Pixiv now uses new URLs for
- user profiles and illustration listings:
  - https://www.pixiv.net/en/users/<ID>
  - https://www.pixiv.net/en/users/<ID>/artworks
- bookmarks:
  - https://www.pixiv.net/en/users/<ID>/bookmarks/artworks

											
										
										
											5 years ago
+								            "url": "29c295ce75150177e6b0a09089a949804c708fbf",
-												[pixiv] support pixiv.me URLs (#23)

											
										
										
											7 years ago
+								        }),
 								        ("https://pixiv.me/del_shanno", {
 								            "exception": exception.NotFoundError,
 								        }),
-												simplify extractor constants

- single strings for URL patterns
- tuples instead of lists for 'directory_fmt' and 'test'
- single-tuple tests where applicable

											
										
										
											6 years ago
+								    )
-												[pixiv] support pixiv.me URLs (#23)

											
										
										
											7 years ago
 								    def __init__(self, match):
-												propagate 'match' to base extractor constructor

											
										
										
											6 years ago
+								        PixivExtractor.__init__(self, match)
-												[pixiv] support pixiv.me URLs (#23)

											
										
										
											7 years ago
+								        self.account = match.group(1)
 								    def items(self):
-												use 'extractor.request()' for more HTTP requests

											
										
										
											6 years ago
+								        url = "https://pixiv.me/" + self.account
-												add '_extractor' information to redirect results

											
										
										
											5 years ago
+								        data = {"_extractor": PixivUserExtractor}
-												use 'extractor.request()' for more HTTP requests

											
										
										
											6 years ago
+								        response = self.request(
-												replace extractor.request() 'expect' argument

with
- 'fatal': allow 4xx status codes
- 'notfound': raise NotFoundError on 404

											
										
										
											5 years ago
+								            url, method="HEAD", allow_redirects=False, notfound="user")
-												add '_extractor' information to redirect results

											
										
										
											5 years ago
+								        yield Message.Queue, response.headers["Location"], data
-												[pixiv] support pixiv.me URLs (#23)

											
										
										
											7 years ago
-												[pixiv] rewrite

- same functionality, better(?) code quality, easier to extend

- added test for the user-tag functionality

- removed the 'artist-id', 'artist-name' and 'artist-nick'
  keywords, which can be replaced with 'user[id]', 'user[name]'
  and 'user[account]' respectively

											
										
										
											7 years ago
+								class PixivWorkExtractor(PixivExtractor):
-												consistent extractor naming scheme + docstrings

											
										
										
											8 years ago
+								    """Extractor for a single pixiv work/illustration"""
-												add subcategories to extractors

											
										
										
											9 years ago
+								    subcategory = "work"
-												simplify extractor constants

- single strings for URL patterns
- tuples instead of lists for 'directory_fmt' and 'test'
- single-tuple tests where applicable

											
										
										
											6 years ago
+								    pattern = (r"(?:https?://)?(?:(?:www\.|touch\.)?pixiv\.net"
-												[pixiv] match '/artworks/' URLs

											
										
										
											5 years ago
+								               r"/(?:(?:en/)?artworks/"
 								               r"|member_illust\.php\?(?:[^&]+&)*illust_id=)(\d+)"
-												rewrite URL patterns to use only 1 per extractor

											
										
										
											6 years ago
+								               r"|(?:i(?:\d+\.pixiv|\.pximg)\.net"
 								               r"/(?:(?:.*/)?img-[^/]+/img/\d{4}(?:/\d\d){5}|img\d+/img/[^/]+)"
-												simplify extractor constants

- single strings for URL patterns
- tuples instead of lists for 'directory_fmt' and 'test'
- single-tuple tests where applicable

											
										
										
											6 years ago
+								               r"|img\d*\.pixiv\.net/img/[^/]+|(?:www\.)?pixiv\.net/i)/(\d+))")
 								    test = (
-												[pixiv] match '/artworks/' URLs

											
										
										
											5 years ago
+								        ("https://www.pixiv.net/artworks/966412", {
-												update unit test results

											
										
										
											8 years ago
+								            "url": "90c1715b07b0d1aad300bce256a0bc71f42540ba",
-												[pixiv] match direct-links to images

											
										
										
											8 years ago
+								            "content": "69a8edfb717400d1c2e146ab2b30d2c235440c5a",
-												[pixiv] extract 'date_url' metadata (#3405)

i.e. the datetime encoded in each file URL.

https://i.pximg.net/img-master/img/2022/12/01/13/44/55/12345678_p0.jpg
->
2022-12-01 13:44:55 +09:00
->
2022-12-01 04:44:55

											
										
										
											2 years ago
+								            "keyword": {
 								                "date"    : "dt:2008-06-12 15:29:13",
 								                "date_url": "dt:2008-06-12 15:29:13",
 								            },
-												[pixiv] match direct-links to images

											
										
										
											8 years ago
+								        }),
-												code adjustments according to pep8 nr2

											
										
										
											8 years ago
+								        (("http://www.pixiv.net/member_illust.php"
 								          "?mode=medium&illust_id=966411"), {
-												add a few tests expecting exceptions

											
										
										
											8 years ago
+								            "exception": exception.NotFoundError,
 								        }),
-												[pixiv] fix ugoira extraction (closes #78)

											
										
										
											7 years ago
+								        # ugoira
 								        (("https://www.pixiv.net/member_illust.php"
 								          "?mode=medium&illust_id=66806629"), {
-												[pixiv] fix ugoira test

											
										
										
											6 years ago
+								            "url": "7267695a985c4db8759bebcf8d21dbdd2d2317ef",
-												[pixiv] extract 'date_url' metadata (#3405)

i.e. the datetime encoded in each file URL.

https://i.pximg.net/img-master/img/2022/12/01/13/44/55/12345678_p0.jpg
->
2022-12-01 13:44:55 +09:00
->
2022-12-01 04:44:55

											
										
										
											2 years ago
+								            "keyword": {
 								                "frames"  : list,
 								                "date"    : "dt:2018-01-14 15:06:08",
 								                "date_url": "dt:2018-01-15 04:24:48",
 								            },
-												[pixiv] fix ugoira extraction (closes #78)

											
										
										
											7 years ago
+								        }),
-												[pixiv] add 'related' option (#1237)

											
										
										
											4 years ago
+								        # related works (#1237)
 								        ("https://www.pixiv.net/artworks/966412", {
 								            "options": (("related", True),),
-												update extractor test results

											
										
										
											4 years ago
+								            "range": "1-10",
-												[pixiv] add 'related' option (#1237)

											
										
										
											4 years ago
+								            "count": ">= 10",
 								        }),
-												[pixiv] match '/artworks/' URLs

											
										
										
											5 years ago
+								        ("https://www.pixiv.net/en/artworks/966412"),
 								        ("http://www.pixiv.net/member_illust.php?mode=medium&illust_id=96641"),
-												simplify extractor constants

- single strings for URL patterns
- tuples instead of lists for 'directory_fmt' and 'test'
- single-tuple tests where applicable

											
										
										
											6 years ago
+								        ("http://i1.pixiv.net/c/600x600/img-master"
 								         "/img/2008/06/13/00/29/13/966412_p0_master1200.jpg"),
 								        ("https://i.pximg.net/img-original"
 								         "/img/2017/04/25/07/33/29/62568267_p0.png"),
 								        ("https://www.pixiv.net/i/966412"),
 								        ("http://img.pixiv.net/img/soundcross/42626136.jpg"),
 								        ("http://i2.pixiv.net/img76/img/snailrin/42672235.jpg"),
 								    )
-												[pixiv] add single work/illust extractor

											
										
										
											9 years ago
 								    def __init__(self, match):
-												propagate 'match' to base extractor constructor

											
										
										
											6 years ago
+								        PixivExtractor.__init__(self, match)
-												rewrite URL patterns to use only 1 per extractor

											
										
										
											6 years ago
+								        self.illust_id = match.group(1) or match.group(2)
-												[pixiv] add single work/illust extractor

											
										
										
											9 years ago
-												[pixiv] rewrite

- same functionality, better(?) code quality, easier to extend

- added test for the user-tag functionality

- removed the 'artist-id', 'artist-name' and 'artist-nick'
  keywords, which can be replaced with 'user[id]', 'user[name]'
  and 'user[account]' respectively

											
										
										
											7 years ago
+								    def works(self):
-												[pixiv] add 'related' option (#1237)

											
										
										
											4 years ago
+								        works = (self.api.illust_detail(self.illust_id),)
 								        if self.config("related", False):
 								            related = self.api.illust_related(self.illust_id)
 								            works = itertools.chain(works, related)
 								        return works
-												[pixiv] add single work/illust extractor

											
										
										
											9 years ago
-												[pixiv] rewrite

- same functionality, better(?) code quality, easier to extend

- added test for the user-tag functionality

- removed the 'artist-id', 'artist-name' and 'artist-nick'
  keywords, which can be replaced with 'user[id]', 'user[name]'
  and 'user[account]' respectively

											
										
										
											7 years ago
class PixivFavoriteExtractor(PixivExtractor):
    """Extractor for all favorites/bookmarks of a pixiv-user"""
    subcategory = "favorite"
    directory_fmt = ("{category}", "bookmarks",
                     "{user_bookmark[id]} {user_bookmark[account]}")
    archive_fmt = "f_{user_bookmark[id]}_{id}{num}.{extension}"
    # capture groups: user ID, listing kind, tag (path segment), query string
    pattern = (r"(?:https?://)?(?:www\.|touch\.)?pixiv\.net/(?:(?:en/)?"
               r"users/(\d+)/(bookmarks/artworks|following)(?:/([^/?#]+))?"
               r"|bookmark\.php)(?:\?([^#]*))?")
    test = (
        ("https://www.pixiv.net/en/users/173530/bookmarks/artworks", {
            "url": "85a3104eaaaf003c7b3947117ca2f1f0b1cfc949",
        }),
        ("https://www.pixiv.net/bookmark.php?id=173530", {
            "url": "85a3104eaaaf003c7b3947117ca2f1f0b1cfc949",
        }),
        # bookmarks with specific tag
        (("https://www.pixiv.net/en/users/3137110"
          "/bookmarks/artworks/%E3%81%AF%E3%82%93%E3%82%82%E3%82%93"), {
            "url": "379b28275f786d946e01f721e54afe346c148a8c",
        }),
        # bookmarks with specific tag (legacy url)
        (("https://www.pixiv.net/bookmark.php?id=3137110"
          "&tag=%E3%81%AF%E3%82%93%E3%82%82%E3%82%93&p=1"), {
            "url": "379b28275f786d946e01f721e54afe346c148a8c",
        }),
        # own bookmarks
        ("https://www.pixiv.net/bookmark.php", {
            "url": "90c1715b07b0d1aad300bce256a0bc71f42540ba",
            "keyword": {"tags_bookmark": ["47", "hitman"]},
            "options": (("metadata-bookmark", True),),
        }),
        # own bookmarks with tag (#596)
        ("https://www.pixiv.net/bookmark.php?tag=foobar", {
            "count": 0,
        }),
        # followed users (#515)
        ("https://www.pixiv.net/en/users/173530/following", {
            "pattern": PixivUserExtractor.pattern,
            "count": ">= 12",
        }),
        # followed users (legacy url) (#515)
        ("https://www.pixiv.net/bookmark.php?id=173530&type=user", {
            "pattern": PixivUserExtractor.pattern,
            "count": ">= 12",
        }),
        # touch URLs
        ("https://touch.pixiv.net/bookmark.php?id=173530"),
        ("https://touch.pixiv.net/bookmark.php"),
    )

    def __init__(self, match):
        """Parse user ID, listing kind, tag and query string from 'match'"""
        user_id, listing, self.tag, raw_query = match.groups()
        params = text.parse_query(raw_query)

        # 'bookmark.php' URLs carry the user ID as 'id' query parameter
        user_id = user_id or params.get("id")
        if not user_id:
            # no user ID in path or query: use the 'bookmark' subcategory
            self.subcategory = "bookmark"

        if listing == "following" or params.get("type") == "user":
            # list followed users instead of bookmarked works
            self.subcategory = "following"
            self.items = self._items_following

        PixivExtractor.__init__(self, match)
        self.query = params
        self.user_id = user_id

    def works(self):
        """Return bookmarked works, filtered by tag and visibility"""
        params = self.query

        # a 'tag' query parameter takes precedence over a tag from the path
        if "tag" in params:
            raw_tag = params["tag"]
        else:
            raw_tag = self.tag or None
        tag = None if raw_tag is None else text.unquote(raw_tag)

        # 'rest=hide' selects private bookmarks
        restrict = "private" if params.get("rest") == "hide" else "public"

        return self.api.user_bookmarks_illust(self.user_id, tag, restrict)

    def metadata(self):
        """Return the 'user_bookmark' metadata and update 'user_id'"""
        api = self.api
        if not self.user_id:
            # no explicit user: log in and use the user data held by the API
            api.login()
            owner = api.user
        else:
            owner = api.user_detail(self.user_id)["user"]
        self.user_id = owner["id"]
        return {"user_bookmark": owner}

    def _items_following(self):
        """Yield a Queue message for each user returned by user_following()"""
        hidden = self.query.get("rest") == "hide"
        restrict = "private" if hidden else "public"

        build_url = "https://www.pixiv.net/users/{}".format
        for entry in self.api.user_following(self.user_id, restrict):
            followed = entry["user"]
            # tell the consumer which extractor handles the queued URL
            followed["_extractor"] = PixivUserExtractor
            yield Message.Queue, build_url(followed["id"]), followed
-												code adjustments according to pep8 nr2

											
										
										
											8 years ago
-												[pixiv] add extractor for ranking lists

											
										
										
											7 years ago
class PixivRankingExtractor(PixivExtractor):
    """Extractor for pixiv ranking pages"""
    subcategory = "ranking"
    archive_fmt = "r_{ranking[mode]}_{ranking[date]}_{id}{num}.{extension}"
    directory_fmt = ("{category}", "rankings",
                     "{ranking[mode]}", "{ranking[date]}")
    pattern = (r"(?:https?://)?(?:www\.|touch\.)?pixiv\.net"
               r"/ranking\.php(?:\?([^#]*))?")
    test = (
        ("https://www.pixiv.net/ranking.php?mode=daily&date=20170818"),
        ("https://www.pixiv.net/ranking.php"),
        ("https://touch.pixiv.net/ranking.php"),
        ("https://www.pixiv.net/ranking.php?mode=unknown", {
            "exception": exception.StopExtraction,
        }),
    )

    def __init__(self, match):
        """Store the raw query string; it gets parsed in metadata()"""
        PixivExtractor.__init__(self, match)
        self.query = match.group(1)
        self.mode = None
        self.date = None

    def works(self):
        """Return the ranking entries for the current 'mode' and 'date'"""
        mode, date = self.mode, self.date
        return self.api.illust_ranking(mode, date)

    def metadata(self):
        """Parse 'mode' and 'date' from the query and return ranking metadata

        Raises StopExtraction for an unknown 'mode'. A malformed 'date'
        only triggers a warning and is replaced by yesterday's UTC date,
        which is also used when no date is given at all.
        """
        params = text.parse_query(self.query)

        # translate the website's 'mode' value into its API counterpart
        requested = params.get("mode", "daily").lower()
        api_modes = {
            "daily": "day",
            "daily_r18": "day_r18",
            "daily_ai": "day_ai",
            "daily_r18_ai": "day_r18_ai",
            "weekly": "week",
            "weekly_r18": "week_r18",
            "monthly": "month",
            "male": "day_male",
            "male_r18": "day_male_r18",
            "female": "day_female",
            "female_r18": "day_female_r18",
            "original": "week_original",
            "rookie": "week_rookie",
            "r18g": "week_r18g",
        }
        try:
            mode = api_modes[requested]
        except KeyError:
            raise exception.StopExtraction("Invalid mode '%s'", requested)
        self.mode = mode

        # convert 'YYYYMMDD' into 'YYYY-MM-DD'
        date = None
        raw_date = params.get("date")
        if raw_date:
            if len(raw_date) == 8 and raw_date.isdecimal():
                date = "-".join(
                    (raw_date[:4], raw_date[4:6], raw_date[6:]))
            else:
                self.log.warning("invalid date '%s'", raw_date)
        if not date:
            yesterday = datetime.utcnow() - timedelta(days=1)
            date = yesterday.strftime("%Y-%m-%d")
        self.date = date

        ranking = {
            "mode": mode,
            "date": self.date,
        }
        return {"ranking": ranking}
-												[pixiv] implement AppAPI wrapper

											
										
										
											6 years ago
-												[pixiv] add extractor for search results

											
										
										
											6 years ago
+								class PixivSearchExtractor(PixivExtractor):
 								    """Extractor for pixiv search results"""
 								    subcategory = "search"
 								    archive_fmt = "s_{search[word]}_{id}{num}.{extension}"
-												simplify extractor constants

- single strings for URL patterns
- tuples instead of lists for 'directory_fmt' and 'test'
- single-tuple tests where applicable

											
										
										
											6 years ago
+								    directory_fmt = ("{category}", "search", "{search[word]}")
 								    pattern = (r"(?:https?://)?(?:www\.|touch\.)?pixiv\.net"
-												remove '&' from URL patterns

'/?&#' -> '/?#' and '?&#' -> '?#'

According to https://www.ietf.org/rfc/rfc3986.txt, URLs are
"organized hierarchically" by using "the slash ("/"), question
mark ("?"), and number sign ("#") characters to delimit components"

											
										
										
											4 years ago
+								               r"/(?:(?:en/)?tags/([^/?#]+)(?:/[^/?#]+)?/?"
-												[pixiv] match new search URLs (closes #507)

											
										
										
											5 years ago
+								               r"|search\.php)(?:\?([^#]+))?")
-												simplify extractor constants

- single strings for URL patterns
- tuples instead of lists for 'directory_fmt' and 'test'
- single-tuple tests where applicable

											
										
										
											6 years ago
+								    test = (
-												[pixiv] match new search URLs (closes #507)

											
										
										
											5 years ago
+								        ("https://www.pixiv.net/en/tags/Original", {
 								            "range": "1-10",
 								            "count": 10,
 								        }),
-												[pixiv] stop with error for invalid search/ranking parameters

instead of falling back to defaults

											
										
										
											2 years ago
+								        ("https://pixiv.net/en/tags/foo/artworks?order=week&s_mode=s_tag", {
 								            "exception": exception.StopExtraction,
 								        }),
 								        ("https://pixiv.net/en/tags/foo/artworks?order=date&s_mode=tag", {
 								            "exception": exception.StopExtraction,
 								        }),
 								        ("https://www.pixiv.net/search.php?s_mode=s_tag&name=Original", {
 								            "exception": exception.StopExtraction,
 								        }),
-												[pixiv] match new search URLs (closes #507)

											
										
										
											5 years ago
+								        ("https://www.pixiv.net/en/tags/foo/artworks?order=date&s_mode=s_tag"),
-												simplify extractor constants

- single strings for URL patterns
- tuples instead of lists for 'directory_fmt' and 'test'
- single-tuple tests where applicable

											
										
										
											6 years ago
+								        ("https://www.pixiv.net/search.php?s_mode=s_tag&word=Original"),
 								        ("https://touch.pixiv.net/search.php?word=Original"),
 								    )
-												[pixiv] add extractor for search results

											
										
										
											6 years ago
 								    def __init__(self, match):
-												propagate 'match' to base extractor constructor

											
										
										
											6 years ago
+								        PixivExtractor.__init__(self, match)
-												[pixiv] match new search URLs (closes #507)

											
										
										
											5 years ago
+								        self.word, self.query = match.groups()
 								        self.sort = self.target = None
-												[pixiv] move query parsing out of constructor

better exception handling, among other things

											
										
										
											6 years ago
 								    def works(self):
-												[pixiv] allow setting a date range for search results (#2133)

with the 'scd' and 'ecd' query parameters

											
										
										
											3 years ago
+								        return self.api.search_illust(
 								            self.word, self.sort, self.target,
 								            date_start=self.date_start, date_end=self.date_end)
-												[pixiv] add extractor for search results

											
										
										
											6 years ago
-												[pixiv] reduce calls to '/user/detail'

											
										
										
											5 years ago
+								    def metadata(self):
-												[pixiv] move query parsing out of constructor

better exception handling, among other things

											
										
										
											6 years ago
+								        query = text.parse_query(self.query)
-												[pixiv] add extractor for search results

											
										
										
											6 years ago
-												[pixiv] match new search URLs (closes #507)

											
										
										
											5 years ago
+								        if self.word:
 								            self.word = text.unquote(self.word)
 								        else:
-												[pixiv] stop with error for invalid search/ranking parameters

instead of falling back to defaults

											
										
										
											2 years ago
+								            try:
 								                self.word = query["word"]
 								            except KeyError:
-												[pixiv] match new search URLs (closes #507)

											
										
										
											5 years ago
+								                raise exception.StopExtraction("Missing search term")
-												[pixiv] add extractor for search results

											
										
										
											6 years ago
 								        sort = query.get("order", "date_d")
 								        sort_map = {
 								            "date": "date_asc",
 								            "date_d": "date_desc",
-												[pixiv] allow sorting by popularity (requires pixiv premium)

											
										
										
											1 year ago
+								            "popular_d": "popular_desc",
 								            "popular_male_d": "popular_male_desc",
 								            "popular_female_d": "popular_female_desc",
-												[pixiv] add extractor for search results

											
										
										
											6 years ago
+								        }
-												[pixiv] stop with error for invalid search/ranking parameters

instead of falling back to defaults

											
										
										
											2 years ago
+								        try:
 								            self.sort = sort = sort_map[sort]
 								        except KeyError:
 								            raise exception.StopExtraction("Invalid search order '%s'", sort)
-												[pixiv] add extractor for search results

											
										
										
											6 years ago
-												[pixiv] use 'exact_match_for_tags' as default search mode (#3092)

											
										
										
											2 years ago
+								        target = query.get("s_mode", "s_tag_full")
-												[pixiv] add extractor for search results

											
										
										
											6 years ago
+								        target_map = {
 								            "s_tag": "partial_match_for_tags",
 								            "s_tag_full": "exact_match_for_tags",
 								            "s_tc": "title_and_caption",
 								        }
-												[pixiv] stop with error for invalid search/ranking parameters

instead of falling back to defaults

											
										
										
											2 years ago
+								        try:
 								            self.target = target = target_map[target]
 								        except KeyError:
 								            raise exception.StopExtraction("Invalid search mode '%s'", target)
-												[pixiv] add extractor for search results

											
										
										
											6 years ago
-												[pixiv] allow setting a date range for search results (#2133)

with the 'scd' and 'ecd' query parameters

											
										
										
											3 years ago
+								        self.date_start = query.get("scd")
 								        self.date_end = query.get("ecd")
-												[pixiv] move query parsing out of constructor

better exception handling, among other things

											
										
										
											6 years ago
+								        return {"search": {
-												[pixiv] add extractor for search results

											
										
										
											6 years ago
+								            "word": self.word,
 								            "sort": self.sort,
 								            "target": self.target,
-												[pixiv] allow setting a date range for search results (#2133)

with the 'scd' and 'ecd' query parameters

											
										
										
											3 years ago
+								            "date_start": self.date_start,
 								            "date_end": self.date_end,
-												[pixiv] move query parsing out of constructor

better exception handling, among other things

											
										
										
											6 years ago
+								        }}
-												[pixiv] add extractor for search results

											
										
										
											6 years ago
-												[pixiv] add extractor for illusts from followed users

											
										
										
											6 years ago
+								class PixivFollowExtractor(PixivExtractor):
 								    """Extractor for new illustrations from your followed artists"""
 								    subcategory = "follow"
 								    archive_fmt = "F_{user_follow[id]}_{id}{num}.{extension}"
-												simplify extractor constants

- single strings for URL patterns
- tuples instead of lists for 'directory_fmt' and 'test'
- single-tuple tests where applicable

											
										
										
											6 years ago
+								    directory_fmt = ("{category}", "following")
 								    pattern = (r"(?:https?://)?(?:www\.|touch\.)?pixiv\.net"
 								               r"/bookmark_new_illust\.php")
 								    test = (
 								        ("https://www.pixiv.net/bookmark_new_illust.php"),
 								        ("https://touch.pixiv.net/bookmark_new_illust.php"),
 								    )
-												[pixiv] add extractor for illusts from followed users

											
										
										
											6 years ago
 								    def works(self):
 								        """Return new works from followed artists via the App API"""
 								        api = self.api
 								        return api.illust_follow()
-												[pixiv] reduce calls to '/user/detail'

											
										
										
											5 years ago
+								    def metadata(self):
-												[pixiv] add extractor for illusts from followed users

											
										
										
											6 years ago
+								        self.api.login()
 								        return {"user_follow": self.api.user}
-												[pixiv] add extractor for 'pixivision' articles (#1672)

											
										
										
											3 years ago
+								class PixivPixivisionExtractor(PixivExtractor):
 								    """Extractor for illustrations from a pixivision article"""
 								    subcategory = "pixivision"
 								    directory_fmt = ("{category}", "pixivision",
 								                     "{pixivision_id} {pixivision_title}")
 								    archive_fmt = "V{pixivision_id}_{id}{suffix}.{extension}"
 								    pattern = r"(?:https?://)?(?:www\.)?pixivision\.net/(?:en/)?a/(\d+)"
 								    test = (
 								        ("https://www.pixivision.net/en/a/2791"),
 								        ("https://pixivision.net/a/2791", {
 								            "count": 7,
 								            "keyword": {
 								                "pixivision_id": "2791",
 								                "pixivision_title": "What's your favorite music? Editor’s "
 								                                    "picks featuring: “CD Covers”!",
 								            },
 								        }),
 								    )
 								    def __init__(self, match):
 								        """Initialize the base extractor and remember the article ID"""
 								        PixivExtractor.__init__(self, match)
 								        # first capture group of 'pattern': the numeric article ID
 								        article_id = match.group(1)
 								        self.pixivision_id = article_id
 								    def works(self):
 								        return (
-												[pixiv] fix 'pixivision' extraction

											
										
										
											1 year ago
+								            self.api.illust_detail(illust_id.partition("?")[0])
-												[pixiv] add extractor for 'pixivision' articles (#1672)

											
										
										
											3 years ago
+								            for illust_id in util.unique_sequence(text.extract_iter(
 								                self.page, '<a href="https://www.pixiv.net/en/artworks/', '"'))
 								        )
 								    def metadata(self):
 								        url = "https://www.pixivision.net/en/a/" + self.pixivision_id
 								        headers = {"User-Agent": "Mozilla/5.0"}
 								        self.page = self.request(url, headers=headers).text
-												replace 'text.extract()' with 'text.extr()' where possible

											
										
										
											2 years ago
+								        title = text.extr(self.page, '<title>', '<')
-												[pixiv] add extractor for 'pixivision' articles (#1672)

											
										
										
											3 years ago
+								        return {
 								            "pixivision_id"   : self.pixivision_id,
 								            "pixivision_title": text.unescape(title),
 								        }
-												[pixiv] add 'series' extractor (#2964)

											
										
										
											2 years ago
+								class PixivSeriesExtractor(PixivExtractor):
 								    """Extractor for illustrations from a Pixiv series"""
 								    subcategory = "series"
 								    directory_fmt = ("{category}", "{user[id]} {user[account]}",
 								                     "{series[id]} {series[title]}")
 								    filename_fmt = "{num_series:>03}_{id}_p{num}.{extension}"
 								    pattern = (r"(?:https?://)?(?:www\.)?pixiv\.net"
 								               r"/user/(\d+)/series/(\d+)")
 								    test = ("https://www.pixiv.net/user/10509347/series/21859", {
 								        "range": "1-10",
 								        "count": 10,
 								        "keyword": {
 								            "num_series": int,
 								            "series": {
 								                "canonical": "https://www.pixiv.net/user/10509347"
 								                             "/series/21859",
 								                "description": str,
 								                "ogp": dict,
 								                "title": "先輩がうざい後輩の話",
 								                "total": int,
 								                "twitter": dict,
 								            },
 								        },
 								    })
 								    def __init__(self, match):
 								        """Initialize the base extractor and store user and series ID"""
 								        PixivExtractor.__init__(self, match)
 								        # 'pattern' captures exactly two groups: /user/<id>/series/<id>
 								        user_id, series_id = match.groups()
 								        self.user_id = user_id
 								        self.series_id = series_id
 								    def works(self):
 								        url = self.root + "/ajax/series/" + self.series_id
 								        params = {"p": 1}
 								        headers = {
 								            "Accept": "application/json",
 								            "Referer": "{}/user/{}/series/{}".format(
 								                self.root, self.user_id, self.series_id),
 								            "Alt-Used": "www.pixiv.net",
 								        }
 								        while True:
 								            data = self.request(url, params=params, headers=headers).json()
 								            body = data["body"]
 								            page = body["page"]
 								            series = body["extraData"]["meta"]
 								            series["id"] = self.series_id
 								            series["total"] = page["total"]
-												replace 'text.extract()' with 'text.extr()' where possible

											
										
										
											2 years ago
+								            series["title"] = text.extr(series["title"], '"', '"')
-												[pixiv] add 'series' extractor (#2964)

											
										
										
											2 years ago
 								            for info in page["series"]:
 								                work = self.api.illust_detail(info["workId"])
 								                work["num_series"] = info["order"]
 								                work["series"] = series
 								                yield work
 								            if len(page["series"]) < 10:
 								                return
 								            params["p"] += 1
-												[pixiv] initial 'novel' support (#1241, #4044)

supported URLs are
- https://www.pixiv.net/novel/show.php?id=<ID>
- https://www.pixiv.net/novel/series/<ID>
- https://www.pixiv.net/en/users/<ID>/novels

											
										
										
											1 year ago
+								class PixivNovelExtractor(PixivExtractor):
 								    """Extractor for pixiv novels"""
 								    subcategory = "novel"
 								    request_interval = 1.0
 								    pattern = (r"(?:https?://)?(?:www\.|touch\.)?pixiv\.net"
-												[pixiv] support short novel URLs

https://www.pixiv.net/n/<ID>

											
										
										
											1 year ago
+								               r"/n(?:ovel/show\.php\?id=|/)(\d+)")
 								    test = (
 								        ("https://www.pixiv.net/novel/show.php?id=19612040", {
 								            "count": 1,
 								            "content": "c6f22167f9df7aeaf63b51933b4c8ef6fc5e6a1e",
 								            "keyword": {
 								                "caption": r"re:「無能な名無し」と呼ばれ虐げられて育った鈴\(すず\)は、",
 								                "comment_access_control": 0,
 								                "create_date": "2023-04-02T15:18:58+09:00",
 								                "date": "dt:2023-04-02 06:18:58",
 								                "id": 19612040,
 								                "is_bookmarked": False,
 								                "is_muted": False,
 								                "is_mypixiv_only": False,
 								                "is_original": True,
 								                "is_x_restricted": False,
 								                "novel_ai_type": 1,
 								                "page_count": 1,
 								                "rating": "General",
 								                "restrict": 0,
 								                "series": {
 								                    "id": 10278364,
 								                    "title": "龍の贄嫁〜虐げられた少女は運命の番として愛される〜"
 								                },
 								                "tags": ["和風ファンタジー", "溺愛", "神様", "ヤンデレ", "執着",
 								                         "異能", "ざまぁ", "学園", "神嫁"],
 								                "text_length": 5977,
 								                "title": "異母妹から「無能な名無し」と虐げられていた私、"
 								                         "どうやら異母妹に霊力を搾取されていたようです（１）",
 								                "user": {
 								                    "account": "yukinaga_chifuyu",
 								                    "id": 77055466,
 								                },
 								                "visible": True,
 								                "x_restrict": 0,
-												[pixiv] initial 'novel' support (#1241, #4044)

supported URLs are
- https://www.pixiv.net/novel/show.php?id=<ID>
- https://www.pixiv.net/novel/series/<ID>
- https://www.pixiv.net/en/users/<ID>/novels

											
										
										
											1 year ago
+								            },
-												[pixiv] support short novel URLs

https://www.pixiv.net/n/<ID>

											
										
										
											1 year ago
+								        }),
 								        ("https://www.pixiv.net/n/19612040"),
 								    )
-												[pixiv] initial 'novel' support (#1241, #4044)

supported URLs are
- https://www.pixiv.net/novel/show.php?id=<ID>
- https://www.pixiv.net/novel/series/<ID>
- https://www.pixiv.net/en/users/<ID>/novels

											
										
										
											1 year ago
 								    def __init__(self, match):
 								        """Initialize the base extractor and store the matched ID"""
 								        PixivExtractor.__init__(self, match)
 								        # first capture group of 'pattern'
 								        matched_id = match.group(1)
 								        self.novel_id = matched_id
 								    def items(self):
 								        """Yield a Directory and a 'text:' Url message for every novel"""
 								        tag_mode = self.config("tags", "japanese")
 								        if tag_mode == "original":
 								            # leave the tag objects exactly as the API returned them
 								            convert_tags = None
 								        elif tag_mode == "translated":
 								            def convert_tags(novel):
 								                # prefer the translated name; dict keys drop duplicates
 								                # while keeping first-seen order
 								                names = {}
 								                for tag in novel["tags"]:
 								                    names[tag["translated_name"] or tag["name"]] = None
 								                novel["tags"] = list(names)
 								        else:
 								            def convert_tags(novel):
 								                novel["tags"] = [tag["name"] for tag in novel["tags"]]
 								        rating_names = {0: "General", 1: "R-18", 2: "R-18G"}
 								        with_user = self.config("metadata")
 								        with_bookmark = self.config("metadata-bookmark")
 								        results = self.novels()
 								        if self.max_posts:
 								            # 'max-posts' caps the number of processed novels
 								            results = itertools.islice(results, self.max_posts)
 								        for novel in results:
 								            if with_user:
 								                novel.update(self.api.user_detail(novel["user"]["id"]))
 								            if with_bookmark and novel["is_bookmarked"]:
 								                bookmark = self.api.novel_bookmark_detail(novel["id"])
 								                novel["tags_bookmark"] = [
 								                    tag["name"]
 								                    for tag in bookmark["tags"]
 								                    if tag["is_registered"]
 								                ]
 								            if convert_tags:
 								                convert_tags(novel)
 								            novel["num"] = 0
 								            novel["date"] = text.parse_datetime(novel["create_date"])
 								            novel["rating"] = rating_names.get(novel["x_restrict"])
 								            novel["suffix"] = ""
 								            yield Message.Directory, novel
 								            # 'extension' is only set once the Directory message is out
 								            novel["extension"] = "txt"
 								            novel_text = self.api.novel_text(novel["id"])["novel_text"]
 								            yield Message.Url, "text:" + novel_text, novel
 								    def novels(self):
 								        """Return a 1-tuple with the details of the requested novel"""
 								        detail = self.api.novel_detail(self.novel_id)
 								        return (detail,)
 								class PixivNovelUserExtractor(PixivNovelExtractor):
 								    """Extractor for pixiv users' novels"""
 								    subcategory = "novel-user"
 								    # capture group 1 is the numeric user ID
 								    pattern = (
 								        r"(?:https?://)?(?:www\.|touch\.)?"
 								        r"pixiv\.net/(?:en/)?users/(\d+)/novels"
 								    )
 								    test = (
 								        "https://www.pixiv.net/en/users/77055466/novels",
 								        {"pattern": "^text:", "range": "1-5", "count": 5},
 								    )
 								    def novels(self):
 								        """Return the novels of the user matched by 'pattern'"""
 								        # the inherited constructor stores capture group 1 as
 								        # 'novel_id'; for this extractor that value is a user ID
 								        user_id = self.novel_id
 								        return self.api.user_novels(user_id)
 								class PixivNovelSeriesExtractor(PixivNovelExtractor):
 								    """Extractor for pixiv novel series"""
 								    subcategory = "novel-series"
 								    # capture group 1 is the numeric series ID
 								    pattern = (
 								        r"(?:https?://)?(?:www\.|touch\.)?"
 								        r"pixiv\.net/novel/series/(\d+)"
 								    )
 								    test = (
 								        "https://www.pixiv.net/novel/series/10278364",
 								        {
 								            "count": 4,
 								            "content": "b06abed001b3f6ccfb1579699e9a238b46d38ea2",
 								        },
 								    )
 								    def novels(self):
 								        """Return the novels of the series matched by 'pattern'"""
 								        # the inherited constructor stores capture group 1 as
 								        # 'novel_id'; for this extractor that value is a series ID
 								        series_id = self.novel_id
 								        return self.api.novel_series(series_id)
-												[pixiv] add 'sketch' extractor (#1497)

											
										
										
											3 years ago
+								class PixivSketchExtractor(Extractor):
 								    """Extractor for user pages on sketch.pixiv.net"""
 								    category = "pixiv"
 								    subcategory = "sketch"
 								    directory_fmt = ("{category}", "sketch", "{user[unique_name]}")
 								    filename_fmt = "{post_id} {id}.{extension}"
 								    archive_fmt = "S{user[id]}_{id}"
 								    root = "https://sketch.pixiv.net"
 								    cookiedomain = ".pixiv.net"
 								    pattern = r"(?:https?://)?sketch\.pixiv\.net/@([^/?#]+)"
 								    test = ("https://sketch.pixiv.net/@nicoby", {
 								        "pattern": r"https://img\-sketch\.pixiv\.net/uploads/medium"
 								                   r"/file/\d+/\d+\.(jpg|png)",
 								        "count": ">= 35",
 								    })
 								    def __init__(self, match):
 								        """Initialize the base extractor and store the matched user name"""
 								        Extractor.__init__(self, match)
 								        # first capture group of 'pattern': the part after '@'
 								        name = match.group(1)
 								        self.username = name
 								    def items(self):
 								        """Yield a Directory message per post and a Url message per photo"""
 								        referer = "{}/@{}".format(self.root, self.username)
 								        http_headers = {"Referer": referer}
 								        for post in self.posts():
 								            photos = post["media"]
 								            post["post_id"] = post["id"]
 								            created = post["created_at"]
 								            post["date"] = text.parse_datetime(
 								                created, "%Y-%m-%dT%H:%M:%S.%f%z")
 								            # 'id' is re-assigned per photo below; presumably
 								            # delete_items() removes the listed keys - TODO confirm
 								            util.delete_items(post, ("id", "media", "_links"))
 								            yield Message.Directory, post
 								            # the same headers dict is shared by all posts
 								            post["_http_headers"] = http_headers
 								            for photo in photos:
 								                source = photo["photo"]["original"]
 								                post["id"] = photo["id"]
 								                post["width"] = source["width"]
 								                post["height"] = source["height"]
 								                file_url = source["url"]
 								                text.nameext_from_url(file_url, post)
 								                yield Message.Url, file_url, post
 								    def posts(self):
 								        """Yield all public wall posts of the user, page after page"""
 								        endpoint = "{}/api/walls/@{}/posts/public.json".format(
 								            self.root, self.username)
 								        request_headers = {
 								            "Accept": "application/vnd.sketch-v4+json",
 								            "X-Requested-With": "{}/@{}".format(self.root, self.username),
 								            "Referer": self.root + "/",
 								        }
 								        while endpoint:
 								            payload = self.request(
 								                endpoint, headers=request_headers).json()
 								            yield from payload["data"]["items"]
 								            # a missing or empty 'next' entry marks the last page
 								            link = payload["_links"].get("next")
 								            endpoint = (self.root + link["href"]) if link else None
-												[pixiv] implement AppAPI wrapper

											
										
										
											6 years ago
+								class PixivAppAPI():
-												[pixiv] use App API

Transitioning to the App API breaks favorites archive IDs (there is
no longer any bookmark ID information), but the favorites API endpoint
of the public API was gone anyways ...

											
										
										
											6 years ago
+								    """Minimal interface for the Pixiv App API for mobile devices
-												[pixiv] implement AppAPI wrapper

											
										
										
											6 years ago
-												[pixiv] use App API

Transitioning to the App API breaks favorites archive IDs (there is
no longer any bookmark ID information), but the favorites API endpoint
of the public API was gone anyways ...

											
										
										
											6 years ago
+								    For a more complete implementation or documentation, see
-												[pixiv] implement AppAPI wrapper

											
										
										
											6 years ago
+								    - https://github.com/upbit/pixivpy
-												[pixiv] use App API

Transitioning to the App API breaks favorites archive IDs (there is
no longer any bookmark ID information), but the favorites API endpoint
of the public API was gone anyways ...

											
										
										
											6 years ago
+								    - https://gist.github.com/ZipFile/3ba99b47162c23f8aea5d5942bb557b1
-												[pixiv] implement AppAPI wrapper

											
										
										
											6 years ago
+								    """
 								    CLIENT_ID = "MOBrBDS8blbauoSck0ZfDbtuzpyT"
 								    CLIENT_SECRET = "lsACyCD94FhDUtGTXi3QzcFE2uU1hqtDaKeqrdwj"
-												[pixiv] fix authentication

											
										
										
											5 years ago
+								    HASH_SECRET = ("28c1fdd170a5204386cb1313c7077b34"
 								                   "f83e4aaf4aa829ce78c231e05b0bae2c")
-												[pixiv] implement AppAPI wrapper

											
										
										
											6 years ago
 								    def __init__(self, extractor):
-												use extractor.request for all other API calls

- deviantart
- pawoo
- pixiv
- reddit

											
										
										
											6 years ago
+								        self.extractor = extractor
-												[pixiv] implement AppAPI wrapper

											
										
										
											6 years ago
+								        self.log = extractor.log
-												[pixiv] update (#1304)

- remove login with username & password
- require a refresh token
- add 'oauth:pixiv' functionality

See also:
- https://github.com/upbit/pixivpy/issues/158
- https://gist.github.com/ZipFile/c9ebedb224406f4f11845ab700124362

											
										
										
											4 years ago
+								        self.username = extractor._get_auth_info()[0]
-												[pixiv] add extractor for illusts from followed users

											
										
										
											6 years ago
+								        self.user = None
-												[pixiv] implement AppAPI wrapper

											
										
										
											6 years ago
-												[pixiv] update (#1304)

- remove login with username & password
- require a refresh token
- add 'oauth:pixiv' functionality

See also:
- https://github.com/upbit/pixivpy/issues/158
- https://gist.github.com/ZipFile/c9ebedb224406f4f11845ab700124362

											
										
										
											4 years ago
+								        extractor.session.headers.update({
 								            "App-OS"        : "ios",
 								            "App-OS-Version": "13.1.2",
 								            "App-Version"   : "7.7.6",
 								            "User-Agent"    : "PixivIOSApp/7.7.6 (iOS 13.1.2; iPhone11,8)",
 								            "Referer"       : "https://app-api.pixiv.net/",
 								        })
-												[pixiv] implement AppAPI wrapper

											
										
										
											6 years ago
+								        self.client_id = extractor.config(
 								            "client-id", self.CLIENT_ID)
 								        self.client_secret = extractor.config(
 								            "client-secret", self.CLIENT_SECRET)
-												[pixiv] update (#1304)

- remove login with username & password
- require a refresh token
- add 'oauth:pixiv' functionality

See also:
- https://github.com/upbit/pixivpy/issues/158
- https://gist.github.com/ZipFile/c9ebedb224406f4f11845ab700124362

											
										
										
											4 years ago
 								        token = extractor.config("refresh-token")
 								        if token is None or token == "cache":
 								            token = _refresh_token_cache(self.username)
 								        self.refresh_token = token
-												[pixiv] implement AppAPI wrapper

											
										
										
											6 years ago
-												[pixiv] use App API

Transitioning to the App API breaks favorites archive IDs (there is
no longer any bookmark ID information), but the favorites API endpoint
of the public API was gone anyways ...

											
										
										
											6 years ago
+								    def login(self):
 								        """Login and gain an access token"""
-												[pixiv] update (#1304)

- remove login with username & password
- require a refresh token
- add 'oauth:pixiv' functionality

See also:
- https://github.com/upbit/pixivpy/issues/158
- https://gist.github.com/ZipFile/c9ebedb224406f4f11845ab700124362

											
										
										
											4 years ago
+								        self.user, auth = self._login_impl(self.username)
-												use extractor.request for all other API calls

- deviantart
- pawoo
- pixiv
- reddit

											
										
										
											6 years ago
+								        self.extractor.session.headers["Authorization"] = auth
-												[pixiv] implement AppAPI wrapper

											
										
										
											6 years ago
-												adjust cache maxage values

											
										
										
											6 years ago
+								    @cache(maxage=3600, keyarg=1)
-												[pixiv] update (#1304)

- remove login with username & password
- require a refresh token
- add 'oauth:pixiv' functionality

See also:
- https://github.com/upbit/pixivpy/issues/158
- https://gist.github.com/ZipFile/c9ebedb224406f4f11845ab700124362

											
										
										
											4 years ago
+								    def _login_impl(self, username):
 								        if not self.refresh_token:
-												raise error when required username or password are missing

do not try to login as 'None' (#1192)

											
										
										
											4 years ago
+								            raise exception.AuthenticationError(
-												[pixiv] update (#1304)

- remove login with username & password
- require a refresh token
- add 'oauth:pixiv' functionality

See also:
- https://github.com/upbit/pixivpy/issues/158
- https://gist.github.com/ZipFile/c9ebedb224406f4f11845ab700124362

											
										
										
											4 years ago
+								                "'refresh-token' required.\n"
 								                "Run `gallery-dl oauth:pixiv` to get one.")
-												raise error when required username or password are missing

do not try to login as 'None' (#1192)

											
										
										
											4 years ago
-												[pixiv] update (#1304)

- remove login with username & password
- require a refresh token
- add 'oauth:pixiv' functionality

See also:
- https://github.com/upbit/pixivpy/issues/158
- https://gist.github.com/ZipFile/c9ebedb224406f4f11845ab700124362

											
										
										
											4 years ago
+								        self.log.info("Refreshing access token")
-												[pixiv] implement AppAPI wrapper

											
										
										
											6 years ago
+								        url = "https://oauth.secure.pixiv.net/auth/token"
 								        data = {
-												[pixiv] update (#1304)

- remove login with username & password
- require a refresh token
- add 'oauth:pixiv' functionality

See also:
- https://github.com/upbit/pixivpy/issues/158
- https://gist.github.com/ZipFile/c9ebedb224406f4f11845ab700124362

											
										
										
											4 years ago
+								            "client_id"     : self.client_id,
 								            "client_secret" : self.client_secret,
 								            "grant_type"    : "refresh_token",
 								            "refresh_token" : self.refresh_token,
 								            "get_secure_url": "1",
-												[pixiv] implement AppAPI wrapper

											
										
										
											6 years ago
+								        }
-												[pixiv] fix authentication

											
										
										
											5 years ago
+								        time = datetime.utcnow().strftime("%Y-%m-%dT%H:%M:%S+00:00")
 								        headers = {
 								            "X-Client-Time": time,
 								            "X-Client-Hash": hashlib.md5(
 								                (time + self.HASH_SECRET).encode()).hexdigest(),
 								        }
-												use extractor.request for all other API calls

- deviantart
- pawoo
- pixiv
- reddit

											
										
										
											6 years ago
+								        response = self.extractor.request(
-												[pixiv] fix authentication

											
										
										
											5 years ago
+								            url, method="POST", headers=headers, data=data, fatal=False)
-												[pixiv] implement AppAPI wrapper

											
										
										
											6 years ago
+								        if response.status_code >= 400:
-												[pixiv] output debug message on failed login attempt

(#1192)

											
										
										
											4 years ago
+								            self.log.debug(response.text)
-												[pixiv] update (#1304)

- remove login with username & password
- require a refresh token
- add 'oauth:pixiv' functionality

See also:
- https://github.com/upbit/pixivpy/issues/158
- https://gist.github.com/ZipFile/c9ebedb224406f4f11845ab700124362

											
										
										
											4 years ago
+								            raise exception.AuthenticationError("Invalid refresh token")
-												[pixiv] implement AppAPI wrapper

											
										
										
											6 years ago
 								        data = response.json()["response"]
 								        return data["user"], "Bearer " + data["access_token"]
-												[pixiv] use App API

Transitioning to the App API breaks favorites archive IDs (there is
no longer any bookmark ID information), but the favorites API endpoint
of the public API was gone anyways ...

											
										
										
											6 years ago
+								    def illust_detail(self, illust_id):
 								        params = {"illust_id": illust_id}
-												[pixiv] update API interface

- start all endpoints with '/'
- use extractor.wait() for rate limit
- retry with while loop instead of recursion
- in case of error, write entire response to debug log

											
										
										
											2 years ago
+								        return self._call("/v1/illust/detail", params)["illust"]
-												[pixiv] use App API

Transitioning to the App API breaks favorites archive IDs (there is
no longer any bookmark ID information), but the favorites API endpoint
of the public API was gone anyways ...

											
										
										
											6 years ago
-												[pixiv] implement 'metadata-bookmark' option (#3417)

											
										
										
											2 years ago
+								    def illust_bookmark_detail(self, illust_id):
 								        params = {"illust_id": illust_id}
 								        return self._call(
 								            "/v2/illust/bookmark/detail", params)["bookmark_detail"]
-												[pixiv] add extractor for illusts from followed users

											
										
										
											6 years ago
+								    def illust_follow(self, restrict="all"):
 								        params = {"restrict": restrict}
-												[pixiv] update API interface

- start all endpoints with '/'
- use extractor.wait() for rate limit
- retry with while loop instead of recursion
- in case of error, write entire response to debug log

											
										
										
											2 years ago
+								        return self._pagination("/v2/illust/follow", params)
-												[pixiv] add extractor for illusts from followed users

											
										
										
											6 years ago
-												[pixiv] use App API

Transitioning to the App API breaks favorites archive IDs (there is
no longer any bookmark ID information), but the favorites API endpoint
of the public API was gone anyways ...

											
										
										
											6 years ago
+								    def illust_ranking(self, mode="day", date=None):
 								        params = {"mode": mode, "date": date}
-												[pixiv] update API interface

- start all endpoints with '/'
- use extractor.wait() for rate limit
- retry with while loop instead of recursion
- in case of error, write entire response to debug log

											
										
										
											2 years ago
+								        return self._pagination("/v1/illust/ranking", params)
-												[pixiv] use App API

Transitioning to the App API breaks favorites archive IDs (there is
no longer any bookmark ID information), but the favorites API endpoint
of the public API was gone anyways ...

											
										
										
											6 years ago
-												[pixiv] add 'related' option (#1237)

											
										
										
											4 years ago
+								    def illust_related(self, illust_id):
 								        params = {"illust_id": illust_id}
-												[pixiv] update API interface

- start all endpoints with '/'
- use extractor.wait() for rate limit
- retry with while loop instead of recursion
- in case of error, write entire response to debug log

											
										
										
											2 years ago
+								        return self._pagination("/v2/illust/related", params)
-												[pixiv] add 'related' option (#1237)

											
										
										
											4 years ago
-												[pixiv] initial 'novel' support (#1241, #4044)

supported URLs are
- https://www.pixiv.net/novel/show.php?id=<ID>
- https://www.pixiv.net/novel/series/<ID>
- https://www.pixiv.net/en/users/<ID>/novels

											
										
										
											1 year ago
+								    def novel_bookmark_detail(self, novel_id):
 								        """Return the 'bookmark_detail' entry for a novel ID"""
 								        params = {"novel_id": novel_id}
 								        # single request; only the "bookmark_detail" value is returned
 								        return self._call(
 								            "/v2/novel/bookmark/detail", params)["bookmark_detail"]
 								    def novel_detail(self, novel_id):
 								        """Return the 'novel' entry of '/v2/novel/detail' for a novel ID"""
 								        params = {"novel_id": novel_id}
 								        return self._call("/v2/novel/detail", params)["novel"]
 								    def novel_series(self, series_id):
 								        """Return an iterator over the 'novels' entries of a series"""
 								        params = {"series_id": series_id}
 								        # "novels" is the result key read from each '/v1/novel/series' page
 								        return self._pagination("/v1/novel/series", params, "novels")
 								    def novel_text(self, novel_id):
 								        """Return the '/v1/novel/text' API response for a novel ID"""
 								        params = {"novel_id": novel_id}
 								        # the whole response object is returned, not a single key of it
 								        return self._call("/v1/novel/text", params)
-												[pixiv] allow setting a date range for search results (#2133)

with the 'scd' and 'ecd' query parameters

											
										
										
											3 years ago
+								    def search_illust(self, word, sort=None, target=None, duration=None,
 								                      date_start=None, date_end=None):
-												[pixiv] add extractor for search results

											
										
										
											6 years ago
+								        params = {"word": word, "search_target": target,
-												[pixiv] allow setting a date range for search results (#2133)

with the 'scd' and 'ecd' query parameters

											
										
										
											3 years ago
+								                  "sort": sort, "duration": duration,
 								                  "start_date": date_start, "end_date": date_end}
-												[pixiv] update API interface

- start all endpoints with '/'
- use extractor.wait() for rate limit
- retry with while loop instead of recursion
- in case of error, write entire response to debug log

											
										
										
											2 years ago
+								        return self._pagination("/v1/search/illust", params)
-												[pixiv] add extractor for search results

											
										
										
											6 years ago
-												[pixiv] improve bookmark extraction

- combine 'favorite' and 'bookmark' extractors
  - it is now one extractor class, but its subcategory still
    distinguishes between your own bookmarks ('bookmark') and other
    user's bookmarks ('favorite') like before
- allow filtering by bookmark tags and public/private bookmarks
- fix pagination for bookmark results

											
										
										
											6 years ago
+								    def user_bookmarks_illust(self, user_id, tag=None, restrict="public"):
-												[pixiv] implement 'metadata-bookmark' option (#3417)

											
										
										
											2 years ago
+								        """Return illusts bookmarked by a user"""
-												[pixiv] improve bookmark extraction

- combine 'favorite' and 'bookmark' extractors
  - it is now one extractor class, but its subcategory still
    distinguishes between your own bookmarks ('bookmark') and other
    user's bookmarks ('favorite') like before
- allow filtering by bookmark tags and public/private bookmarks
- fix pagination for bookmark results

											
										
										
											6 years ago
+								        params = {"user_id": user_id, "tag": tag, "restrict": restrict}
-												[pixiv] update API interface

- start all endpoints with '/'
- use extractor.wait() for rate limit
- retry with while loop instead of recursion
- in case of error, write entire response to debug log

											
										
										
											2 years ago
+								        return self._pagination("/v1/user/bookmarks/illust", params)
-												[pixiv] use App API

Transitioning to the App API breaks favorites archive IDs (there is
no longer any bookmark ID information), but the favorites API endpoint
of the public API was gone anyways ...

											
										
										
											6 years ago
-												[pixiv] implement 'metadata-bookmark' option (#3417)

											
										
										
											2 years ago
+								    def user_bookmark_tags_illust(self, user_id, restrict="public"):
 								        """Return bookmark tags defined by a user"""
 								        params = {"user_id": user_id, "restrict": restrict}
 								        # "bookmark_tags" is the result key read from each response page
 								        return self._pagination(
 								            "/v1/user/bookmark-tags/illust", params, "bookmark_tags")
-												[pixiv] implement 'include' option

- split 'user' extractor and its 'avatar' and 'background' options into
  separate extractors ('artworks', 'avatar', 'background')
- avatars can now be downloaded with
  https://www.pixiv.net/en/users/ID/avatar
  as URL and will use a proper archive key; similar for backgrounds
- options for the 'user' subcategory must be moved to 'artworks' to have
  the same effect as before

											
										
										
											2 years ago
+								    @memcache(keyarg=1)
-												[pixiv] use App API

Transitioning to the App API breaks favorites archive IDs (there is
no longer any bookmark ID information), but the favorites API endpoint
of the public API was gone anyways ...

											
										
										
											6 years ago
+								    def user_detail(self, user_id):
 								        params = {"user_id": user_id}
-												[pixiv] update API interface

- start all endpoints with '/'
- use extractor.wait() for rate limit
- retry with while loop instead of recursion
- in case of error, write entire response to debug log

											
										
										
											2 years ago
+								        return self._call("/v1/user/detail", params)
-												[pixiv] use App API

Transitioning to the App API breaks favorites archive IDs (there is
no longer any bookmark ID information), but the favorites API endpoint
of the public API was gone anyways ...

											
										
										
											6 years ago
-												[pixiv] support fetching privately followed users (fixes #1628)

											
										
										
											3 years ago
+								    def user_following(self, user_id, restrict="public"):
 								        params = {"user_id": user_id, "restrict": restrict}
-												[pixiv] update API interface

- start all endpoints with '/'
- use extractor.wait() for rate limit
- retry with while loop instead of recursion
- in case of error, write entire response to debug log

											
										
										
											2 years ago
+								        return self._pagination("/v1/user/following", params, "user_previews")
-												[pixiv] support listing followed users (#515)

											
										
										
											5 years ago
-												[pixiv] respect more query parameters for user URLs

The API endpoint responsible for user illustrations does not
provide sufficient filter capabilities* to match the actual
website, so we are spinning our own filters.

Respected parameters are
    'type': illust, manga, ugoira
    'tag' : any image tag (this was already supported)
    'p'   : the page to start on

*
- API can filter for illustrations and manga, but not for ugoira.
- 'offset' is applied before filtering
- no 'tag' filter

											
										
										
											6 years ago
+								    def user_illusts(self, user_id):
 								        params = {"user_id": user_id}
-												[pixiv] update API interface

- start all endpoints with '/'
- use extractor.wait() for rate limit
- retry with while loop instead of recursion
- in case of error, write entire response to debug log

											
										
										
											2 years ago
+								        return self._pagination("/v1/user/illusts", params)
-												[pixiv] use App API

Transitioning to the App API breaks favorites archive IDs (there is
no longer any bookmark ID information), but the favorites API endpoint
of the public API was gone anyways ...

											
										
										
											6 years ago
-												[pixiv] initial 'novel' support (#1241, #4044)

supported URLs are
- https://www.pixiv.net/novel/show.php?id=<ID>
- https://www.pixiv.net/novel/series/<ID>
- https://www.pixiv.net/en/users/<ID>/novels

											
										
										
											1 year ago
+								    def user_novels(self, user_id):
 								        """Return an iterator over the 'novels' entries of a user"""
 								        params = {"user_id": user_id}
 								        # "novels" is the result key read from each '/v1/user/novels' page
 								        return self._pagination("/v1/user/novels", params, "novels")
-												[pixiv] use App API

Transitioning to the App API breaks favorites archive IDs (there is
no longer any bookmark ID information), but the favorites API endpoint
of the public API was gone anyways ...

											
										
										
											6 years ago
+								    def ugoira_metadata(self, illust_id):
 								        params = {"illust_id": illust_id}
-												[pixiv] update API interface

- start all endpoints with '/'
- use extractor.wait() for rate limit
- retry with while loop instead of recursion
- in case of error, write entire response to debug log

											
										
										
											2 years ago
+								        return self._call("/v1/ugoira/metadata", params)["ugoira_metadata"]
-												[pixiv] use App API

Transitioning to the App API breaks favorites archive IDs (there is
no longer any bookmark ID information), but the favorites API endpoint
of the public API was gone anyways ...

											
										
										
											6 years ago
-												[pixiv] implement AppAPI wrapper

											
										
										
											6 years ago
+								    def _call(self, endpoint, params=None):
-												[pixiv] update API interface

- start all endpoints with '/'
- use extractor.wait() for rate limit
- retry with while loop instead of recursion
- in case of error, write entire response to debug log

											
										
										
											2 years ago
+								        url = "https://app-api.pixiv.net" + endpoint
-												[pixiv] implement AppAPI wrapper

											
										
										
											6 years ago
-												[pixiv] update API interface

- start all endpoints with '/'
- use extractor.wait() for rate limit
- retry with while loop instead of recursion
- in case of error, write entire response to debug log

											
										
										
											2 years ago
+								        while True:
 								            self.login()
 								            response = self.extractor.request(url, params=params, fatal=False)
 								            data = response.json()
 								            if "error" not in data:
 								                return data
 								            self.log.debug(data)
-												[pixiv] implement AppAPI wrapper

											
										
										
											6 years ago
-												[pixiv] wait and retry after rate limit error (closes #535)

											
										
										
											5 years ago
+								            if response.status_code == 404:
 								                raise exception.NotFoundError()
 								            error = data["error"]
 								            if "rate limit" in (error.get("message") or "").lower():
-												[pixiv] update API interface

- start all endpoints with '/'
- use extractor.wait() for rate limit
- retry with while loop instead of recursion
- in case of error, write entire response to debug log

											
										
										
											2 years ago
+								                self.extractor.wait(seconds=300)
 								                continue
-												[pixiv] wait and retry after rate limit error (closes #535)

											
										
										
											5 years ago
-												[pixiv] update API interface

- start all endpoints with '/'
- use extractor.wait() for rate limit
- retry with while loop instead of recursion
- in case of error, write entire response to debug log

											
										
										
											2 years ago
+								            raise exception.StopExtraction("API request failed: %s", error)
-												[pixiv] implement AppAPI wrapper

											
										
										
											6 years ago
-												[pixiv] support listing followed users (#515)

											
										
										
											5 years ago
+								    def _pagination(self, endpoint, params, key="illusts"):
-												[pixiv] implement AppAPI wrapper

											
										
										
											6 years ago
+								        while True:
 								            data = self._call(endpoint, params)
-												[pixiv] support listing followed users (#515)

											
										
										
											5 years ago
+								            yield from data[key]
-												[pixiv] implement AppAPI wrapper

											
										
										
											6 years ago
 								            if not data["next_url"]:
 								                return
-												[pixiv] improve bookmark extraction

- combine 'favorite' and 'bookmark' extractors
  - it is now one extractor class, but its subcategory still
    distinguishes between your own bookmarks ('bookmark') and other
    user's bookmarks ('favorite') like before
- allow filtering by bookmark tags and public/private bookmarks
- fix pagination for bookmark results

											
										
										
											6 years ago
+								            query = data["next_url"].rpartition("?")[2]
 								            params = text.parse_query(query)
-												[pixiv] use refresh_token based authentication

The first login will still use username and password, but everything
afterwards will use the refresh_token obtained from that.

This will prevent pixiv from sending a "New login to pixiv" email every
time a new access_token is requested.

											
										
										
											6 years ago
-												adjust cache maxage values

											
										
										
											6 years ago
+								@cache(maxage=10*365*24*3600, keyarg=0)
-												[pixiv] use refresh_token based authentication

The first login will still use username and password, but everything
afterwards will use the refresh_token obtained from that.

This will prevent pixiv from sending a "New login to pixiv" email every
time a new access_token is requested.

											
										
										
											6 years ago
+								def _refresh_token_cache(username):
 								    """Return None; the function body itself stores nothing"""
 								    # NOTE(review): presumably the @cache decorator on this function
 								    # supplies a previously stored value for 'username' and this None
 								    # is only the result on a cache miss -- confirm against ..cache
 								    return None