gallery-dl/gallery_dl/extractor/gelbooru.py

# -*- coding: utf-8 -*-

# Copyright 2014-2023 Mike Fährmann
#
# This program is free software; you can redistribute it and/or modify
# it under the terms of the GNU General Public License version 2 as
# published by the Free Software Foundation.

"""Extractors for https://gelbooru.com/"""

from .common import Extractor, Message
from . import gelbooru_v02
from .. import text, exception
import binascii

BASE_PATTERN = r"(?:https?://)?(?:www\.)?gelbooru\.com/(?:index\.php)?\?"


class GelbooruBase():
    """Base class for gelbooru extractors"""
    category = "gelbooru"
    basecategory = "booru"
    root = "https://gelbooru.com"
    # number of results to skip; increased by _skip_offset()
    offset = 0

    def _api_request(self, params, key="post", log=False):
        """Send a request to the JSON API and return its results

        'params' is modified in place: "s" defaults to "post" and this
        extractor's 'api_key' and 'user_id' values are added.

        With a false 'key', the decoded JSON response is returned as is.
        Otherwise the value stored under 'key' is returned as a list:
        a single non-list value gets wrapped into a one-element list and
        a missing 'key' yields an empty list (plus an error message when
        'log' is true).
        """
        if "s" not in params:
            params["s"] = "post"
        params["api_key"] = self.api_key
        params["user_id"] = self.user_id

        url = self.root + "/index.php?page=dapi&q=index&json=1"
        data = self.request(url, params=params).json()

        if not key:
            return data

        try:
            posts = data[key]
        except KeyError:
            if log:
                self.log.error("Incomplete API response (missing '%s')", key)
                self.log.debug("%s", data)
            return []

        if not isinstance(posts, list):
            # always hand out a real list, so that callers can use
            # list-only operations such as reverse() on the result
            return [posts]
        return posts

    def _pagination(self, params):
        """Yield all API results for the search described by 'params'

        By default, each following page is requested by appending an
        'id:<ID' meta tag ('id:>ID' for 'sort:id:asc') built from the
        last post of the previous page. Searches with any other 'sort:'
        tag are paginated by incrementing 'pid' instead.
        """
        params["pid"] = self.page_start
        params["limit"] = self.per_page
        # a page with fewer than half the requested results ends pagination
        limit = self.per_page // 2
        pid = False

        # a missing "tags" parameter is treated like an empty search
        tags = params.get("tags", "").split()
        op = "<"
        has_id = False

        for tag in tags:
            if tag.startswith("sort:"):
                if tag == "sort:id:asc":
                    op = ">"
                elif tag == "sort:id" or tag.startswith("sort:id:"):
                    op = "<"
                else:
                    # results are not ordered by ID
                    pid = True
            elif tag.startswith("id:"):
                has_id = True

        if not pid:
            if has_id:
                # drop existing 'id:<...' / 'id:>...' tags that would
                # clash with the one added for pagination
                prefix = "id:" + op
                tags = [t for t in tags if not t.startswith(prefix)]
            # tag-string prefix; the last seen post ID gets appended below
            tags = "{} id:{}".format(" ".join(tags), op)

        while True:
            posts = self._api_request(params)

            yield from posts

            if not posts or len(posts) < limit:
                return

            if pid:
                params["pid"] += 1
            else:
                if "pid" in params:
                    del params["pid"]
                params["tags"] = tags + str(posts[-1]["id"])

    def _pagination_html(self, params):
        """Yield API results for all post IDs found on HTML listing pages

        'pid' starts at 'self.offset' and is advanced by 'per_page'
        until a page contains fewer than 'per_page' post IDs.
        """
        url = self.root + "/index.php"
        params["pid"] = self.offset

        # request parameters reused for every single-post API request
        data = {}
        while True:
            num_ids = 0
            page = self.request(url, params=params).text

            for post_id in text.extract_iter(page, '" id="p', '"'):
                data["id"] = post_id
                num_ids += 1
                yield from self._api_request(data)

            if num_ids < self.per_page:
                return
            params["pid"] += self.per_page

    @staticmethod
    def _file_url(post):
        """Return the download URL for 'post'

        URLs ending in '.webm' or '.mp4' are replaced by a '.webm' URL
        on 'img3.gelbooru.com' built from the post's MD5 hash, and
        alternative URLs are stored in post["_fallback"].
        """
        url = post["file_url"]
        if url.endswith((".webm", ".mp4")):
            md5 = post["md5"]
            path = "/images/{}/{}/{}.webm".format(md5[0:2], md5[2:4], md5)
            post["_fallback"] = GelbooruBase._video_fallback(path)
            url = "https://img3.gelbooru.com" + path
        return url

    @staticmethod
    def _video_fallback(path):
        """Yield alternative URLs for the video file at 'path'"""
        yield "https://img2.gelbooru.com" + path
        yield "https://img1.gelbooru.com" + path

    def _notes(self, post, page):
        """Collect the notes found in 'page' and store them in post["notes"]

        Nothing is stored when 'page' has no non-empty 'notes' section.
        """
        notes_data = text.extr(page, '<section id="notes"', '</section>')
        if not notes_data:
            return

        post["notes"] = notes = []
        extr = text.extract
        for note in text.extract_iter(notes_data, '<article', '</article>'):
            notes.append({
                "width" : int(extr(note, 'data-width="', '"')[0]),
                "height": int(extr(note, 'data-height="', '"')[0]),
                "x"     : int(extr(note, 'data-x="', '"')[0]),
                "y"     : int(extr(note, 'data-y="', '"')[0]),
                "body"  : extr(note, 'data-body="', '"')[0],
            })

    def _skip_offset(self, num):
        """Increase 'self.offset' by 'num' and return 'num'"""
        self.offset += num
        return num


class GelbooruTagExtractor(GelbooruBase,
                           gelbooru_v02.GelbooruV02TagExtractor):
    """Extractor for images from gelbooru.com based on search-tags"""
    # matches post listing URLs; the single capture group is the raw
    # value of the 'tags' query parameter, which is allowed to be empty
    pattern = BASE_PATTERN + r"page=post&s=list&tags=([^&#]*)"
    # sample URL in the form accepted by 'pattern'
    example = "https://gelbooru.com/index.php?page=post&s=list&tags=TAG"


class GelbooruPoolExtractor(GelbooruBase,
                            gelbooru_v02.GelbooruV02PoolExtractor):
    """Extractor for gelbooru pools"""
    per_page = 45
    pattern = BASE_PATTERN + r"page=pool&s=show&id=(\d+)"
    example = "https://gelbooru.com/index.php?page=pool&s=show&id=12345"

    skip = GelbooruBase._skip_offset

    def metadata(self):
        """Request the pool's page and return its ID and name

        Raises NotFoundError when the page contains no pool name.
        """
        # stored on the instance, since posts() reuses the same query
        self._params = query = {
            "page": "pool",
            "s"   : "show",
            "id"  : self.pool_id,
        }
        page = self.request(self.root + "/index.php", params=query).text

        pool_name = text.extr(page, "<h3>Now Viewing: ", "</h3>")
        if not pool_name:
            raise exception.NotFoundError("pool")

        return {
            "pool": text.parse_int(self.pool_id),
            "pool_name": text.unescape(pool_name),
        }

    def posts(self):
        """Return the pool's posts, collected from its HTML pages"""
        return self._pagination_html(self._params)


class GelbooruFavoriteExtractor(GelbooruBase,
                                gelbooru_v02.GelbooruV02FavoriteExtractor):
    """Extractor for gelbooru favorites"""
    per_page = 100
    pattern = BASE_PATTERN + r"page=favorites&s=view&id=(\d+)"
    example = "https://gelbooru.com/index.php?page=favorites&s=view&id=12345"

    skip = GelbooruBase._skip_offset

    def posts(self):
        """Return a generator over the posts of a user's favorites

        A first API request with a limit of 2 provides the total number
        of favorites and shows in which order the API returns them.
        Depending on that order and the 'order-posts' option, the
        favorite pages are then traversed forwards or backwards.
        """
        # get number of favorites
        params = {
            "s"    : "favorite",
            "id"   : self.favorite_id,
            "limit": "2",
        }
        data = self._api_request(params, None, True)

        count = data["@attributes"]["count"]
        self.log.debug("API reports %s favorite entries", count)

        # the "favorite" key can be missing from a response; fall back
        # to an empty sequence and let the LookupError handler below
        # select the default order
        favs = data.get("favorite") or ()
        try:
            order = 1 if favs[0]["id"] < favs[1]["id"] else -1
        except LookupError as exc:
            self.log.debug(
                "Error when determining API favorite order (%s: %s)",
                exc.__class__.__name__, exc)
            order = -1
        else:
            self.log.debug("API yields favorites in %sscending order",
                           "a" if order > 0 else "de")

        # option values starting with "r" or "a" flip the result order
        order_favs = self.config("order-posts")
        if order_favs and order_favs[0] in ("r", "a"):
            self.log.debug("Returning them in reverse")
            order = -order

        if order < 0:
            return self._pagination(params, count)
        return self._pagination_reverse(params, count)

    def _posts_from_favorites(self, favs):
        """Yield the post of each entry in 'favs' with 'date_favorited' set"""
        for fav in favs:
            for post in self._api_request({"id": fav["favorite"]}):
                post["date_favorited"] = text.parse_timestamp(fav["added"])
                yield post

    def _pagination(self, params, count):
        """Yield favorited posts from the first to the last API page

        'self.offset' entries are skipped by starting at a later page
        and dropping leading entries from it. 'count' is not used here;
        it is accepted to mirror _pagination_reverse().
        """
        # divmod() of a zero offset results in (0, 0) as well
        pnum, skip = divmod(self.offset, self.per_page)

        params["pid"] = pnum
        params["limit"] = self.per_page

        while True:
            favs = self._api_request(params, "favorite")

            if not favs:
                return

            if skip:
                favs = favs[skip:]
                skip = 0

            yield from self._posts_from_favorites(favs)

            params["pid"] += 1

    def _pagination_reverse(self, params, count):
        """Yield favorited posts from the last to the first API page

        Entries of each page are returned in reverse as well.
        'self.offset' entries are skipped, counted from the end of
        the 'count' available favorites.
        """
        # 'pnum' is the last page, 'last' the index of its final entry
        pnum, last = divmod(count-1, self.per_page)
        if self.offset > last:
            # page number change
            self.offset -= last
            diff, self.offset = divmod(self.offset-1, self.per_page)
            pnum -= diff + 1
        skip = self.offset

        params["pid"] = pnum
        params["limit"] = self.per_page

        # a negative page number (no favorites at all or an offset
        # beyond the first entry) means there is nothing to request
        while params["pid"] >= 0:
            # reversed copy; also works if the result is not a list
            favs = list(reversed(self._api_request(params, "favorite")))

            if skip:
                favs = favs[skip:]
                skip = 0

            yield from self._posts_from_favorites(favs)

            params["pid"] -= 1


class GelbooruPostExtractor(GelbooruBase,
                            gelbooru_v02.GelbooruV02PostExtractor):
    """Extractor for single images from gelbooru.com"""
    # The two lookaheads require 'page=post' and 's=view' to be present
    # somewhere in the query string (before any '#'), independent of the
    # order of parameters; the capture group is the numeric 'id' value.
    pattern = (BASE_PATTERN +
               r"(?=(?:[^#]+&)?page=post(?:&|#|$))"
               r"(?=(?:[^#]+&)?s=view(?:&|#|$))"
               r"(?:[^#]+&)?id=(\d+)")
    # sample URL in the form accepted by 'pattern'
    example = "https://gelbooru.com/index.php?page=post&s=view&id=12345"


class GelbooruRedirectExtractor(GelbooruBase, Extractor):
    # Handles '/redirect.php?s=...' URLs, whose 's' parameter holds the
    # base64-encoded target URL.
    subcategory = "redirect"
    pattern = (r"(?:https?://)?(?:www\.)?gelbooru\.com"
               r"/redirect\.php\?s=([^&#]+)")
    example = "https://gelbooru.com/redirect.php?s=BASE64"

    def __init__(self, match):
        """Store the base64 value captured by 'pattern'"""
        Extractor.__init__(self, match)
        self.url_base64 = match.group(1)

    def items(self):
        """Decode the target URL and queue it for GelbooruPostExtractor"""
        decoded = binascii.a2b_base64(self.url_base64).decode()
        target = text.ensure_http_scheme(decoded)
        yield Message.Queue, target, {"_extractor": GelbooruPostExtractor}
[gelbooru] update to new extractor interface 10 years ago			`# -- coding: utf-8 --`
initial commit 10 years ago
fix 'keywords' in extractor tests (#3491) 2 years ago			`# Copyright 2014-2023 Mike Fährmann`
[gelbooru] update to new extractor interface 10 years ago			`#`
			`# This program is free software; you can redistribute it and/or modify`
			`# it under the terms of the GNU General Public License version 2 as`
			`# published by the Free Software Foundation.`

[booru] add generalized extractors for *booru sites similar to cc15fbe7 4 years ago			`"""Extractors for https://gelbooru.com/"""`
[gelbooru] update to new extractor interface 10 years ago
[gelbooru] add extractor for '/redirect.php' URLs (#1530) 3 years ago			`from .common import Extractor, Message`
move extractors from booru.py into their own gelbooru_v02 module 4 years ago			`from . import gelbooru_v02`
[gelbooru] implement 'pool' pagination (#2853) 2 years ago			`from .. import text, exception`
[gelbooru] add extractor for '/redirect.php' URLs (#1530) 3 years ago			`import binascii`
[gelbooru] update to new extractor interface 10 years ago
[gelbooru] add 'favorite' extractor (#3704) requires logged in cookies to work 2 years ago			`BASE_PATTERN = r"(?:https?://)?(?:www\.)?gelbooru\.com/(?:index\.php)?\?"`

code adjustments according to pep8 nr2 8 years ago
[booru] add generalized extractors for *booru sites similar to cc15fbe7 4 years ago			`class GelbooruBase():`
[gelbooru] update to new format 9 years ago			`"""Base class for gelbooru extractors"""`
			`category = "gelbooru"`
move extractors from booru.py into their own gelbooru_v02 module 4 years ago			`basecategory = "booru"`
[booru] add generalized extractors for *booru sites similar to cc15fbe7 4 years ago			`root = "https://gelbooru.com"`
[gelbooru] fix and improve --range for pools 2 years ago			`offset = 0`
[gelbooru] inherit from BooruExtractor class Breaks pool functionality when using API calls (for now), but reduces code clutter and enables the `tags` option. 6 years ago
[gelbooru] only log "Incomplete API response" for favorites (#5045) 8 months ago			`def _api_request(self, params, key="post", log=False):`
[gelbooru] extract favorites without needing cookies (#3704) TODO: fix --range 2 years ago			`if "s" not in params:`
			`params["s"] = "post"`
[gelbooru] add support for `api_key` and `user_id` (#2767) 2 years ago			`params["api_key"] = self.api_key`
			`params["user_id"] = self.user_id`

[gelbooru] extract favorites without needing cookies (#3704) TODO: fix --range 2 years ago			`url = self.root + "/index.php?page=dapi&q=index&json=1"`
[gelbooru] handle changed API response format (#2157) 3 years ago			`data = self.request(url, params=params).json()`
[gelbooru] add support for `api_key` and `user_id` (#2767) 2 years ago
[gelbooru] detect returned favorites order (#5220) 6 months ago			`if not key:`
			`return data`

[gelbooru] display error for invalid API responses (#4903) 9 months ago			`try:`
			`posts = data[key]`
			`except KeyError:`
[gelbooru] only log "Incomplete API response" for favorites (#5045) 8 months ago			`if log:`
			`self.log.error("Incomplete API response (missing '%s')", key)`
			`self.log.debug("%s", data)`
[gelbooru] display error for invalid API responses (#4903) 9 months ago			`return []`
[gelbooru] add support for `api_key` and `user_id` (#2767) 2 years ago
[gelbooru] handle changed API response format (#2157) 3 years ago			`if not isinstance(posts, list):`
			`return (posts,)`
			`return posts`

			`def _pagination(self, params):`
			`params["pid"] = self.page_start`
			`params["limit"] = self.per_page`
[gelbooru] improve and fix pagination (#2230, #2232) Use 'id:<POSTID' as a tag instead of going through pages with 'pid'. Something similar was already implemented in 93cef784, but that got broken again in 3085aac4. 3 years ago			`limit = self.per_page // 2`
[gelbooru] improve pagination logic for meta tags (#5478) similar to 494acabd38fefdc8c1b482b584695aaa788f9112 5 months ago			`pid = False`

			`if "tags" in params:`
			`tags = params["tags"].split()`
			`op = "<"`
			`id = False`

			`for tag in tags:`
			`if tag.startswith("sort:"):`
			`if tag == "sort:id:asc":`
			`op = ">"`
			`elif tag == "sort:id" or tag.startswith("sort:id:"):`
			`op = "<"`
			`else:`
			`pid = True`
			`elif tag.startswith("id:"):`
			`id = True`

			`if not pid:`
			`if id:`
			`tag = "id:" + op`
			`tags = [t for t in tags if not t.startswith(tag)]`
			`tags = "{} id:{}".format(" ".join(tags), op)`
[gelbooru] handle changed API response format (#2157) 3 years ago
			`while True:`
[gelbooru] improve and fix pagination (#2230, #2232) Use 'id:<POSTID' as a tag instead of going through pages with 'pid'. Something similar was already implemented in 93cef784, but that got broken again in 3085aac4. 3 years ago			`posts = self._api_request(params)`

[gelbooru] improve pagination logic for meta tags (#5478) similar to 494acabd38fefdc8c1b482b584695aaa788f9112 5 months ago			`yield from posts`
[gelbooru] handle changed API response format (#2157) 3 years ago
[gelbooru] improve and fix pagination (#2230, #2232) Use 'id:<POSTID' as a tag instead of going through pages with 'pid'. Something similar was already implemented in 93cef784, but that got broken again in 3085aac4. 3 years ago			`if len(posts) < limit:`
[gelbooru] handle changed API response format (#2157) 3 years ago			`return`
[gelbooru] improve and fix pagination (#2230, #2232) Use 'id:<POSTID' as a tag instead of going through pages with 'pid'. Something similar was already implemented in 93cef784, but that got broken again in 3085aac4. 3 years ago
[gelbooru] improve pagination logic for meta tags (#5478) similar to 494acabd38fefdc8c1b482b584695aaa788f9112 5 months ago			`if pid:`
			`params["pid"] += 1`
			`else:`
			`if "pid" in params:`
			`del params["pid"]`
			`params["tags"] = tags + str(posts[-1]["id"])`
[gelbooru] handle changed API response format (#2157) 3 years ago
[gelbooru] add 'favorite' extractor (#3704) requires logged in cookies to work 2 years ago			`def _pagination_html(self, params):`
			`url = self.root + "/index.php"`
[gelbooru] fix and improve --range for pools 2 years ago			`params["pid"] = self.offset`
[gelbooru] add 'favorite' extractor (#3704) requires logged in cookies to work 2 years ago
			`data = {}`
			`while True:`
			`num_ids = 0`
			`page = self.request(url, params=params).text`

			`for data["id"] in text.extract_iter(page, '" id="p', '"'):`
			`num_ids += 1`
			`yield from self._api_request(data)`

			`if num_ids < self.per_page:`
			`return`
			`params["pid"] += self.per_page`

[booru] split '_prepare_post()' 4 years ago			`@staticmethod`
			`def _file_url(post):`
			`url = post["file_url"]`
[gelbooru] improve video file detection (fixes #2188) not all files from 'https://video-cdnN.gelbooru.com' are videos 3 years ago			`if url.endswith((".webm", ".mp4")):`
[booru] add generalized extractors for *booru sites similar to cc15fbe7 4 years ago			`md5 = post["md5"]`
[gelbooru] update video server (fixes #1368) from 'https://img2.gelbooru.com' to 'https://img3.gelbooru.com' and provide fallback URLs 4 years ago			`path = "/images/{}/{}/{}.webm".format(md5[0:2], md5[2:4], md5)`
			`post["_fallback"] = GelbooruBase._video_fallback(path)`
			`url = "https://img3.gelbooru.com" + path`
[gelbooru] rewrite mp4 video URLs (fixes #1048) 4 years ago			`return url`

[gelbooru] update video server (fixes #1368) from 'https://img2.gelbooru.com' to 'https://img3.gelbooru.com' and provide fallback URLs 4 years ago			`@staticmethod`
			`def _video_fallback(path):`
			`yield "https://img2.gelbooru.com" + path`
			`yield "https://img1.gelbooru.com" + path`

[booru] refactor 'tags' and 'notes' extraction - move HTML request for post pages into its own function - move gelbooru_v02.py notes extraction to gelbooru.py since it only works there - clean up some code 2 years ago			`def _notes(self, post, page):`
replace 'text.extract()' with 'text.extr()' where possible 2 years ago			`notes_data = text.extr(page, '<section id="notes"', '</section>')`
[booru] refactor 'tags' and 'notes' extraction - move HTML request for post pages into its own function - move gelbooru_v02.py notes extraction to gelbooru.py since it only works there - clean up some code 2 years ago			`if not notes_data:`
			`return`

			`post["notes"] = notes = []`
			`extr = text.extract`
			`for note in text.extract_iter(notes_data, '<article', '</article>'):`
			`notes.append({`
			`"width" : int(extr(note, 'data-width="', '"')[0]),`
			`"height": int(extr(note, 'data-height="', '"')[0]),`
			`"x" : int(extr(note, 'data-x="', '"')[0]),`
			`"y" : int(extr(note, 'data-y="', '"')[0]),`
			`"body" : extr(note, 'data-body="', '"')[0],`
			`})`

[gelbooru] fix and improve --range for pools 2 years ago			`def _skip_offset(self, num):`
			`self.offset += num`
			`return num`

[gelbooru] use manual extraction ... to compensate for their disabled API. (https://gelbooru.com/index.php?page=forum&s=view&id=3875) This also adds an extractor for image-pools. 7 years ago
move extractors from booru.py into their own gelbooru_v02 module 4 years ago			`class GelbooruTagExtractor(GelbooruBase,`
			`gelbooru_v02.GelbooruV02TagExtractor):`
consistent extractor naming scheme + docstrings 8 years ago			`"""Extractor for images from gelbooru.com based on search-tags"""`
[gelbooru] support 'all' and empty tag (#5076) 8 months ago			`pattern = BASE_PATTERN + r"page=post&s=list&tags=([^&#]*)"`
remove test results in extractor modules and add generic example URLs 1 year ago			`example = "https://gelbooru.com/index.php?page=post&s=list&tags=TAG"`
[gelbooru] update to new format 9 years ago

move extractors from booru.py into their own gelbooru_v02 module 4 years ago			`class GelbooruPoolExtractor(GelbooruBase,`
			`gelbooru_v02.GelbooruV02PoolExtractor):`
[gelbooru] implement 'pool' pagination (#2853) 2 years ago			`"""Extractor for gelbooru pools"""`
			`per_page = 45`
[gelbooru] add 'favorite' extractor (#3704) requires logged in cookies to work 2 years ago			`pattern = BASE_PATTERN + r"page=pool&s=show&id=(\d+)"`
remove test results in extractor modules and add generic example URLs 1 year ago			`example = "https://gelbooru.com/index.php?page=pool&s=show&id=12345"`
[gelbooru] use manual extraction ... to compensate for their disabled API. (https://gelbooru.com/index.php?page=forum&s=view&id=3875) This also adds an extractor for image-pools. 7 years ago
[gelbooru] fix and improve --range for pools 2 years ago			`skip = GelbooruBase._skip_offset`

[booru] add generalized extractors for *booru sites similar to cc15fbe7 4 years ago			`def metadata(self):`
[gelbooru] implement 'pool' pagination (#2853) 2 years ago			`url = self.root + "/index.php"`
			`self._params = {`
			`"page": "pool",`
			`"s" : "show",`
			`"id" : self.pool_id,`
			`}`
[gelbooru] add 'favorite' extractor (#3704) requires logged in cookies to work 2 years ago			`page = self.request(url, params=self._params).text`
[booru] add generalized extractors for *booru sites similar to cc15fbe7 4 years ago
[gelbooru] add 'favorite' extractor (#3704) requires logged in cookies to work 2 years ago			`name, pos = text.extract(page, "<h3>Now Viewing: ", "</h3>")`
[booru] add generalized extractors for *booru sites similar to cc15fbe7 4 years ago			`if not name:`
			`raise exception.NotFoundError("pool")`

			`return {`
			`"pool": text.parse_int(self.pool_id),`
			`"pool_name": text.unescape(name),`
			`}`

[gelbooru] handle changed API response format (#2157) 3 years ago			`def posts(self):`
[gelbooru] add 'favorite' extractor (#3704) requires logged in cookies to work 2 years ago			`return self._pagination_html(self._params)`
[gelbooru] implement 'pool' pagination (#2853) 2 years ago

[gelbooru] add 'favorite' extractor (#3704) requires logged in cookies to work 2 years ago			`class GelbooruFavoriteExtractor(GelbooruBase,`
			`gelbooru_v02.GelbooruV02FavoriteExtractor):`
[gelbooru] warn about missing cookies for favorites (#3704) and add docstring so it shows up in --list-extractors 2 years ago			`"""Extractor for gelbooru favorites"""`
[gelbooru] extract favorites without needing cookies (#3704) TODO: fix --range 2 years ago			`per_page = 100`
[gelbooru] add 'favorite' extractor (#3704) requires logged in cookies to work 2 years ago			`pattern = BASE_PATTERN + r"page=favorites&s=view&id=(\d+)"`
remove test results in extractor modules and add generic example URLs 1 year ago			`example = "https://gelbooru.com/index.php?page=favorites&s=view&id=12345"`
[gelbooru] extract favorites without needing cookies (#3704) TODO: fix --range 2 years ago
[gelbooru] fix --range for favorites (#3704) 2 years ago			`skip = GelbooruBase._skip_offset`

[gelbooru] extract favorites without needing cookies (#3704) TODO: fix --range 2 years ago			`def posts(self):`
			`# get number of favorites`
			`params = {`
			`"s" : "favorite",`
			`"id" : self.favorite_id,`
[gelbooru] detect returned favorites order (#5220) 6 months ago			`"limit": "2",`
[gelbooru] extract favorites without needing cookies (#3704) TODO: fix --range 2 years ago			`}`
[gelbooru] detect returned favorites order (#5220) 6 months ago			`data = self._api_request(params, None, True)`

			`count = data["@attributes"]["count"]`
[gelbooru] add 'order-posts' option for favorites (#5220) 6 months ago			`self.log.debug("API reports %s favorite entries", count)`
[gelbooru] detect returned favorites order (#5220) 6 months ago
			`favs = data["favorite"]`
			`try:`
			`order = 1 if favs[0]["id"] < favs[1]["id"] else -1`
[gelbooru] add 'order-posts' option for favorites (#5220) 6 months ago			`except LookupError as exc:`
			`self.log.debug(`
			`"Error when determining API favorite order (%s: %s)",`
			`exc.__class__.__name__, exc)`
			`order = -1`
			`else:`
			`self.log.debug("API yields favorites in %sscending order",`
			`"a" if order > 0 else "de")`
[gelbooru] detect returned favorites order (#5220) 6 months ago
[gelbooru] add 'order-posts' option for favorites (#5220) 6 months ago			`order_favs = self.config("order-posts")`
			`if order_favs and order_favs[0] in ("r", "a"):`
[gelbooru] detect returned favorites order (#5220) 6 months ago			`self.log.debug("Returning them in reverse")`
[gelbooru] add 'order-posts' option for favorites (#5220) 6 months ago			`order = -order`
[gelbooru] detect returned favorites order (#5220) 6 months ago
[gelbooru] add 'order-posts' option for favorites (#5220) 6 months ago			`if order < 0:`
			`return self._pagination(params, count)`
			`return self._pagination_reverse(params, count)`
[gelbooru] detect returned favorites order (#5220) 6 months ago
			`def _pagination(self, params, count):`
			`if self.offset:`
			`pnum, skip = divmod(self.offset, self.per_page)`
			`else:`
			`pnum = skip = 0`

			`params["pid"] = pnum`
			`params["limit"] = self.per_page`

			`while True:`
[gelbooru] add 'order-posts' option for favorites (#5220) 6 months ago			`favs = self._api_request(params, "favorite")`
[gelbooru] detect returned favorites order (#5220) 6 months ago
			`if not favs:`
			`return`

			`if skip:`
			`favs = favs[skip:]`
			`skip = 0`

			`for fav in favs:`
[gelbooru] add 'date_favorited' metadata field 6 months ago			`for post in self._api_request({"id": fav["favorite"]}):`
			`post["date_favorited"] = text.parse_timestamp(fav["added"])`
			`yield post`
[gelbooru] detect returned favorites order (#5220) 6 months ago
			`params["pid"] += 1`
[gelbooru] fix --range for favorites (#3704) 2 years ago
[gelbooru] detect returned favorites order (#5220) 6 months ago			`def _pagination_reverse(self, params, count):`
[gelbooru] fix 'favorite' extractor (#4903) lots of +1/-1 and </<= mistakes 9 months ago			`pnum, last = divmod(count-1, self.per_page)`
			`if self.offset > last:`
			`# page number change`
[gelbooru] fix --range for favorites (#3704) 2 years ago			`self.offset -= last`
[gelbooru] fix 'favorite' extractor (#4903) lots of +1/-1 and </<= mistakes 9 months ago			`diff, self.offset = divmod(self.offset-1, self.per_page)`
[gelbooru] fix --range for favorites (#3704) 2 years ago			`pnum -= diff + 1`
			`skip = self.offset`

			`params["pid"] = pnum`
[gelbooru] extract favorites without needing cookies (#3704) TODO: fix --range 2 years ago			`params["limit"] = self.per_page`

			`while True:`
[gelbooru] add 'order-posts' option for favorites (#5220) 6 months ago			`favs = self._api_request(params, "favorite")`
[gelbooru] extract favorites without needing cookies (#3704) TODO: fix --range 2 years ago			`favs.reverse()`
[gelbooru] fix 'favorite' extractor (#4903) lots of +1/-1 and </<= mistakes 9 months ago
[gelbooru] fix --range for favorites (#3704) 2 years ago			`if skip:`
			`favs = favs[skip:]`
			`skip = 0`

[gelbooru] extract favorites without needing cookies (#3704) TODO: fix --range 2 years ago			`for fav in favs:`
[gelbooru] add 'date_favorited' metadata field 6 months ago			`for post in self._api_request({"id": fav["favorite"]}):`
			`post["date_favorited"] = text.parse_timestamp(fav["added"])`
			`yield post`
[gelbooru] extract favorites without needing cookies (#3704) TODO: fix --range 2 years ago
			`params["pid"] -= 1`
			`if params["pid"] < 0:`
			`return`
[gelbooru] handle changed API response format (#2157) 3 years ago
[gelbooru] use manual extraction ... to compensate for their disabled API. (https://gelbooru.com/index.php?page=forum&s=view&id=3875) This also adds an extractor for image-pools. 7 years ago
move extractors from booru.py into their own gelbooru_v02 module 4 years ago			`class GelbooruPostExtractor(GelbooruBase,`
			`gelbooru_v02.GelbooruV02PostExtractor):`
consistent extractor naming scheme + docstrings 8 years ago			`"""Extractor for single images from gelbooru.com"""`
[gelbooru] add 'favorite' extractor (#3704) requires logged in cookies to work 2 years ago			`pattern = (BASE_PATTERN +`
[gelbooru] allow alternate parameter order in post URLs (#2821) 2 years ago			`r"(?=(?:[^#]+&)?page=post(?:&\|#\|$))"`
			`r"(?=(?:[^#]+&)?s=view(?:&\|#\|$))"`
			`r"(?:[^#]+&)?id=(\d+)")`
remove test results in extractor modules and add generic example URLs 1 year ago			`example = "https://gelbooru.com/index.php?page=post&s=view&id=12345"`
[gelbooru] add extractor for '/redirect.php' URLs (#1530) 3 years ago

			`class GelbooruRedirectExtractor(GelbooruBase, Extractor):`
			`subcategory = "redirect"`
			`pattern = (r"(?:https?://)?(?:www\.)?gelbooru\.com"`
			`r"/redirect\.php\?s=([^&#]+)")`
remove test results in extractor modules and add generic example URLs 1 year ago			`example = "https://gelbooru.com/redirect.php?s=BASE64"`
[gelbooru] add extractor for '/redirect.php' URLs (#1530) 3 years ago
			`def __init__(self, match):`
			`Extractor.__init__(self, match)`
fix bug in test_init and update example URLs 1 year ago			`self.url_base64 = match.group(1)`
[gelbooru] add extractor for '/redirect.php' URLs (#1530) 3 years ago
			`def items(self):`
fix bug in test_init and update example URLs 1 year ago			`url = text.ensure_http_scheme(binascii.a2b_base64(`
			`self.url_base64).decode())`
[gelbooru] add extractor for '/redirect.php' URLs (#1530) 3 years ago			`data = {"_extractor": GelbooruPostExtractor}`
fix bug in test_init and update example URLs 1 year ago			`yield Message.Queue, url, data`