# gallery-dl/gallery_dl/extractor/furaffinity.py

# -*- coding: utf-8 -*-

# Copyright 2020-2022 Mike Fährmann
#
# This program is free software; you can redistribute it and/or modify
# it under the terms of the GNU General Public License version 2 as
# published by the Free Software Foundation.

"""Extractors for https://www.furaffinity.net/"""

from .common import Extractor, Message
from .. import text, util

# URL prefix shared by every extractor pattern in this module: the scheme
# is optional, and the host may be the bare domain or carry a "www." or
# "sfw." subdomain.
BASE_PATTERN = r"(?:https?://)?(?:www\.|sfw\.)?furaffinity\.net"


class FuraffinityExtractor(Extractor):
    """Base class for furaffinity extractors"""
    category = "furaffinity"
    directory_fmt = ("{category}", "{user!l}")
    filename_fmt = "{id}{title:? //}.{extension}"
    archive_fmt = "{id}"
    cookiedomain = ".furaffinity.net"
    root = "https://www.furaffinity.net"
    _warning = True

    def __init__(self, match):
        """Initialize per-instance state from the matched URL.

        The first capture group of the URL pattern is stored as 'user'.
        '_new_layout' starts out as None, meaning the site layout has not
        been detected yet.
        """
        Extractor.__init__(self, match)
        self._new_layout = None
        self.offset = 0
        self.user = match.group(1)

        # With descriptions="html" the description markup is kept and
        # only stripped of surrounding whitespace.
        keep_html = (self.config("descriptions") == "html")
        if keep_html:
            self._process_description = str.strip

    def items(self):
        """Yield Directory and Url messages for every parsable post.

        When the 'external' option is enabled, each 'href="http...' link
        found in a post's raw description is additionally yielded as a
        Queue message.
        """
        # Check for the session cookies only once; the flag is cleared on
        # the base class so later extractor instances skip the check.
        if self._warning:
            has_session = self._check_cookies(("a", "b"))
            if not has_session:
                self.log.warning("no 'a' and 'b' session cookies set")
            FuraffinityExtractor._warning = False

        follow_external = self.config("external", False)
        extra = self.metadata()

        for post_id in util.advance(self.posts(), self.offset):
            post = self._parse_post(post_id)
            if not post:
                # _parse_post() returned nothing usable for this post
                continue

            if extra:
                post.update(extra)
            yield Message.Directory, post
            yield Message.Url, post["url"], post

            if not follow_external:
                continue
            links = text.extract_iter(
                post["_description"], 'href="http', '"')
            for link in links:
                # the start marker swallowed the "http" prefix; restore it
                yield Message.Queue, "http" + link, post

    def metadata(self):
        """Return extra metadata to merge into every post, or None.

        The base implementation provides nothing; items() only merges the
        result when it is truthy.
        """
        return None

    def skip(self, num):
        """Record that 'num' more posts should be skipped; return 'num'.

        The accumulated offset is applied in items() before any post page
        is parsed.
        """
        self.offset = self.offset + num
        return num

    def _parse_post(self, post_id):
        """Fetch a submission page and scrape its metadata.

        Requests '{root}/view/{post_id}/' and reads the individual fields
        one after another from the returned HTML.

        Returns a dict holding 'id', 'url', 'tags', 'title', 'artist',
        'artist_url', 'user', 'date', 'description', '_description',
        'views', 'favorites', 'comments', 'rating', 'fa_category',
        'theme', 'species', 'gender', 'width' and 'height', in addition
        to whatever text.nameext_from_url() adds.
        Returns None, after logging a warning, when the page contains no
        download link.
        """
        url = "{}/view/{}/".format(self.root, post_id)
        # NOTE(review): 'extr' looks like a forward-only cursor over the
        # page (see the empty start markers used for "height" below), so
        # the order of the extr() calls presumably has to follow the order
        # of the markup - confirm against text.extract_from().
        extr = text.extract_from(self.request(url).text)

        # Decide once per extractor instance which site layout is served:
        # a first <meta> tag without "http-equiv=" counts as new layout.
        if self._new_layout is None:
            self._new_layout = ("http-equiv=" not in extr("<meta ", ">"))

        # The download link is the first href starting with "//d"; the
        # consumed prefix is put back when "url" is built below.
        path = extr('href="//d', '"')
        if not path:
            # No download link: report the page's "System Message" text
            # (terminated by </section>, else by </table>) and skip.
            self.log.warning(
                "Unable to download post %s (\"%s\")",
                post_id, text.remove_html(
                    extr('System Message', '</section>') or
                    extr('System Message', '</table>')
                )
            )
            return None

        # short aliases for the helpers used on nearly every field below
        pi = text.parse_int
        rh = text.remove_html

        data = text.nameext_from_url(path, {
            "id" : pi(post_id),
            "url": "https://d" + path,
        })

        if self._new_layout:
            data["tags"] = text.split_html(extr(
                'class="tags-row">', '</section>'))
            data["title"] = text.unescape(extr("<h2><p>", "</p></h2>"))
            data["artist"] = extr("<strong>", "<")
            # raw HTML; also scanned for external links by items()
            data["_description"] = extr('class="section-body">', '</div>')
            data["views"] = pi(rh(extr('class="views">', '</span>')))
            data["favorites"] = pi(rh(extr('class="favorites">', '</span>')))
            data["comments"] = pi(rh(extr('class="comments">', '</span>')))
            data["rating"] = rh(extr('class="rating">', '</span>'))
            data["fa_category"] = rh(extr('>Category</strong>', '</span>'))
            # theme is whatever text node comes right after the category
            data["theme"] = rh(extr('>', '<'))
            data["species"] = rh(extr('>Species</strong>', '</div>'))
            data["gender"] = rh(extr('>Gender</strong>', '</div>'))
            # size is read as "<width>x<height>p..." from one <span>
            data["width"] = pi(extr("<span>", "x"))
            data["height"] = pi(extr("", "p"))
        else:
            # old site layout
            data["title"] = text.unescape(extr("<h2>", "</h2>"))
            data["artist"] = extr(">", "<")
            data["fa_category"] = extr("<b>Category:</b>", "<").strip()
            data["theme"] = extr("<b>Theme:</b>", "<").strip()
            data["species"] = extr("<b>Species:</b>", "<").strip()
            data["gender"] = extr("<b>Gender:</b>", "<").strip()
            data["favorites"] = pi(extr("<b>Favorites:</b>", "<"))
            data["comments"] = pi(extr("<b>Comments:</b>", "<"))
            data["views"] = pi(extr("<b>Views:</b>", "<"))
            # size is read as "<width>x<height><" after the label
            data["width"] = pi(extr("<b>Resolution:</b>", "x"))
            data["height"] = pi(extr("", "<"))
            # Only every second element of the split result is kept.
            # NOTE(review): presumably the skipped elements are separators
            # between the tag links - confirm against the old markup.
            data["tags"] = text.split_html(extr(
                'id="keywords">', '</div>'))[::2]
            data["rating"] = extr('<img alt="', ' ')
            # raw HTML; also scanned for external links by items()
            data["_description"] = extr("</table>", "</table>")

        # artist name with underscores removed and lowercased
        data["artist_url"] = data["artist"].replace("_", "").lower()
        # fall back to the artist when no user was taken from the URL
        data["user"] = self.user or data["artist_url"]
        # the filename part before its first "." is parsed as a timestamp
        data["date"] = text.parse_timestamp(data["filename"].partition(".")[0])
        data["description"] = self._process_description(data["_description"])

        return data

    @staticmethod
    def _process_description(description):
        """Strip the HTML markup from 'description' and unescape the rest.

        This is the default; __init__() swaps it for str.strip when the
        'descriptions' option is set to "html".
        """
        without_tags = text.remove_html(description, "", "")
        return text.unescape(without_tags)

    def _pagination(self, path):
        """Yield post IDs from the numbered pages below '/{path}/{user}/'.

        Pages are requested starting at 1; iteration ends with the first
        page whose last extracted ID is empty or that yields no ID at all.
        """
        page_num = 1

        while True:
            page_url = "{}/{}/{}/{}/".format(
                self.root, path, self.user, page_num)
            html = self.request(page_url).text

            # stays None when the page contains no 'id="sid-' marker
            last_id = None
            for last_id in text.extract_iter(html, 'id="sid-', '"'):
                yield last_id

            if last_id:
                page_num += 1
            else:
                break

    def _pagination_favorites(self):
        """Yield post IDs from the user's favorites, following page links.

        The next page is taken from the href that follows 'right" href="'
        on the current page; iteration stops once that lookup comes back
        falsy.
        """
        next_path = "/favorites/{}/".format(self.user)

        while next_path:
            html = self.request(self.root + next_path).text
            for post_id in text.extract_iter(html, 'id="sid-', '"'):
                yield post_id
            next_path = text.extract(html, 'right" href="', '"')[0]

    def _pagination_search(self, query):
        """Yield post IDs from search results, advancing page by page.

        'query' is a mapping of form fields that override the defaults
        below. Its "page" entry, if present, is converted with
        text.parse_int() and used as the starting page. Iteration ends
        with the first result page whose last extracted ID is empty or
        that yields no ID at all.
        """
        endpoint = self.root + "/search/"

        # Default form fields, inserted in a fixed order.
        form = {
            "page"           : 0,
            "next_page"      : "Next",
            "order-by"       : "relevancy",
            "order-direction": "desc",
            "range"          : "all",
        }
        # every rating and submission type is enabled by default
        for switch in ("rating-general", "rating-mature", "rating-adult",
                       "type-art", "type-music", "type-flash",
                       "type-story", "type-photo", "type-poetry"):
            form[switch] = "on"
        form["mode"] = "extended"

        form.update(query)
        if "page" in query:
            # needs to be a number, since it is incremented below
            form["page"] = text.parse_int(query["page"])

        while True:
            html = self.request(endpoint, method="POST", data=form).text

            # stays None when the page contains no 'id="sid-' marker
            last_id = None
            for last_id in text.extract_iter(html, 'id="sid-', '"'):
                yield last_id

            if last_id:
                form["page"] += 1
            else:
                break


class FuraffinityGalleryExtractor(FuraffinityExtractor):
    """Extractor for a furaffinity user's gallery"""
    subcategory = "gallery"
    # the single capture group is the user name
    pattern = BASE_PATTERN + r"/gallery/([^/?#]+)"
    test = ("https://www.furaffinity.net/gallery/mirlinthloth/", {
        "pattern": r"https://d\d?\.f(uraffinity|acdn)\.net"
                   r"/art/mirlinthloth/\d+/\d+.\w+\.\w+",
        "range": "45-50",
        "count": 6,
    })

    def posts(self):
        """Return a generator of post IDs from the user's gallery pages."""
        # The section name is spelled out as a literal here.
        gallery_ids = self._pagination("gallery")
        return gallery_ids


class FuraffinityScrapsExtractor(FuraffinityExtractor):
    """Extractor for a furaffinity user's scraps"""
    subcategory = "scraps"
    # files go into a "Scraps" subdirectory of the user's directory
    directory_fmt = ("{category}", "{user!l}", "Scraps")
    # the single capture group is the user name
    pattern = BASE_PATTERN + r"/scraps/([^/?#]+)"
    test = ("https://www.furaffinity.net/scraps/mirlinthloth/", {
        "pattern": r"https://d\d?\.f(uraffinity|acdn)\.net"
                   r"/art/[^/]+(/stories)?/\d+/\d+.\w+.",
        "count": ">= 3",
    })

    def posts(self):
        """Return a generator of post IDs from the user's scraps pages."""
        # The section name is spelled out as a literal here.
        scrap_ids = self._pagination("scraps")
        return scrap_ids


class FuraffinityFavoriteExtractor(FuraffinityExtractor):
    """Extractor for a furaffinity user's favorites"""
    subcategory = "favorite"
    # files go into a "Favorites" subdirectory of the user's directory
    directory_fmt = ("{category}", "{user!l}", "Favorites")
    # the single capture group is the user name
    pattern = BASE_PATTERN + r"/favorites/([^/?#]+)"
    test = ("https://www.furaffinity.net/favorites/mirlinthloth/", {
        "pattern": r"https://d\d?\.f(uraffinity|acdn)\.net"
                   r"/art/[^/]+/\d+/\d+.\w+\.\w+",
        "range": "45-50",
        "count": 6,
    })

    def posts(self):
        """Return a generator of post IDs from the user's favorites."""
        # Favorites use their own link-following pagination helper
        # instead of the numbered pages used for gallery and scraps.
        favorite_ids = self._pagination_favorites()
        return favorite_ids


class FuraffinitySearchExtractor(FuraffinityExtractor):
    """Extractor for furaffinity search results"""
    subcategory = "search"
    directory_fmt = ("{category}", "Search", "{search}")
    # group 1: optional search term given as a path segment
    # group 2: the parameter string after the first "?" or "&"
    pattern = BASE_PATTERN + r"/search(?:/([^/?#]+))?/?[?&]([^#]+)"
    test = (
        ("https://www.furaffinity.net/search/?q=cute", {
            "pattern": r"https://d\d?\.f(uraffinity|acdn)\.net"
                       r"/art/[^/]+/\d+/\d+.\w+\.\w+",
            "range": "45-50",
            "count": 6,
        }),
        ("https://www.furaffinity.net/search/cute&rating-general=0", {
            "range": "1",
            "count": 1,
        }),
    )

    def __init__(self, match):
        """Parse the URL parameters into 'self.query'.

        A search term given as a path segment (stored as 'self.user' by
        the base class) becomes the "q" parameter, unless the parameter
        string already provides one.
        """
        FuraffinityExtractor.__init__(self, match)

        params = text.parse_query(match.group(2))
        path_term = self.user
        if path_term and "q" not in params:
            params["q"] = text.unquote(path_term)
        self.query = params

    def metadata(self):
        """Return the search term under 'search', as directory_fmt uses."""
        term = self.query.get("q")
        return {"search": term}

    def posts(self):
        """Return a generator of post IDs matching the search query."""
        result_ids = self._pagination_search(self.query)
        return result_ids


class FuraffinityPostExtractor(FuraffinityExtractor):
    """Extractor for individual posts on furaffinity"""
    subcategory = "post"
    # the single capture group is the numeric post ID
    pattern = BASE_PATTERN + r"/(?:view|full)/(\d+)"
    test = (
        ("https://www.furaffinity.net/view/21835115/", {
            "pattern": r"https://d\d*\.f(uraffinity|acdn)\.net/(download/)?art"
                       r"/mirlinthloth/music/1488278723/1480267446.mirlinthlot"
                       r"h_dj_fennmink_-_bude_s_4_ever\.mp3",
            "keyword": {
                "artist"     : "mirlinthloth",
                "artist_url" : "mirlinthloth",
                "date"       : "dt:2016-11-27 17:24:06",
                "description": "A Song made playing the game Cosmic DJ.",
                "extension"  : "mp3",
                "filename"   : r"re:\d+\.\w+_dj_fennmink_-_bude_s_4_ever",
                "id"         : 21835115,
                "tags"       : list,
                "title"      : "Bude's 4 Ever",
                "url"        : r"re:https://d\d?\.f(uraffinity|acdn)\.net/art",
                "user"       : "mirlinthloth",
                "views"      : int,
                "favorites"  : int,
                "comments"   : int,
                "rating"     : "General",
                "fa_category": "Music",
                "theme"      : "All",
                "species"    : "Unspecified / Any",
                "gender"     : "Any",
                "width"      : 120,
                "height"     : 120,
            },
        }),
        # 'external' option (#1492)
        ("https://www.furaffinity.net/view/42166511/", {
            "options": (("external", True),),
            "pattern": r"https://d\d*\.f(uraffinity|acdn)\.net/"
                       r"|http://www\.postybirb\.com",
            "count": 2,
        }),
        # no tags (#2277)
        ("https://www.furaffinity.net/view/45331225/", {
            "keyword": {
                "artist": "Kota_Remminders",
                "artist_url": "kotaremminders",
                "date": "dt:2022-01-03 17:49:33",
                "fa_category": "Adoptables",
                "filename": "1641232173.kotaremminders_chidopts1",
                "gender": "Any",
                "height": 905,
                "id": 45331225,
                "rating": "General",
                "species": "Unspecified / Any",
                "tags": [],
                "theme": "All",
                "title": "REMINDER",
                "width": 1280,
            },
        }),
        ("https://furaffinity.net/view/21835115/"),
        ("https://sfw.furaffinity.net/view/21835115/"),
        ("https://www.furaffinity.net/full/21835115/"),
    )

    def posts(self):
        """Return a 1-tuple with the post ID taken from the URL.

        The base class stored the ID in 'self.user'; that attribute is
        reset to None so each post's "user" field falls back to the
        post's artist.
        """
        post_id, self.user = self.user, None
        return (post_id,)


class FuraffinityUserExtractor(FuraffinityExtractor):
    """Extractor for furaffinity user profiles"""
    subcategory = "user"
    cookiedomain = None
    # the single capture group is the user name
    pattern = BASE_PATTERN + r"/user/([^/?#]+)"
    test = (
        ("https://www.furaffinity.net/user/mirlinthloth/", {
            "pattern": r"/gallery/mirlinthloth/$",
        }),
        ("https://www.furaffinity.net/user/mirlinthloth/", {
            "options": (("include", "all"),),
            "pattern": r"/(gallery|scraps|favorites)/mirlinthloth/$",
            "count": 3,
        }),
    )

    def items(self):
        """Delegate a profile URL to the gallery/scraps/favorites extractors.

        Builds one '{root}/{section}/{user}/' URL per section and passes
        the (extractor class, URL) pairs to _dispatch_extractors(), with
        ("gallery",) as its second argument.
        NOTE(review): that argument presumably names the sections used
        when no "include" option is given - confirm in the base class.
        """
        root, user = self.root, self.user

        def section_url(section):
            # Format in a single pass. The user name comes straight from
            # the URL and may contain "{" or "}"; feeding an already
            # formatted string through str.format() a second time would
            # interpret those characters as replacement fields.
            return "{}/{}/{}/".format(root, section, user)

        return self._dispatch_extractors((
            (FuraffinityGalleryExtractor , section_url("gallery")),
            (FuraffinityScrapsExtractor  , section_url("scraps")),
            (FuraffinityFavoriteExtractor, section_url("favorites")),
        ), ("gallery",))


class FuraffinityFollowingExtractor(FuraffinityExtractor):
    """Extractor for a furaffinity user's watched users"""
    subcategory = "following"
    # the single capture group is the user name
    pattern = BASE_PATTERN + r"/watchlist/by/([^/?#]+)"
    test = ("https://www.furaffinity.net/watchlist/by/mirlinthloth/", {
        "pattern": FuraffinityUserExtractor.pattern,
        "range": "176-225",
        "count": 50,
    })

    def items(self):
        """Yield a Queue message for every link on the watchlist pages.

        Each '<a href="...">' target on a page is queued with
        FuraffinityUserExtractor set as the extractor to handle it. The
        next page is the target of the last 'action="..."' attribute on
        the current page. Iteration ends when that target is missing or
        when the current URL already ends with it.
        """
        url = "{}/watchlist/by/{}/".format(self.root, self.user)
        data = {"_extractor": FuraffinityUserExtractor}

        while True:
            page = self.request(url).text

            for path in text.extract_iter(page, '<a href="', '"'):
                yield Message.Queue, self.root + path, data

            next_path = text.rextract(page, 'action="', '"')[0]
            # Stop instead of raising TypeError from str.endswith() when
            # the page has no 'action="' attribute.
            # NOTE(review): assumes rextract() reports a failed lookup
            # with a falsy value such as None - confirm.
            if not next_path or url.endswith(next_path):
                return
            url = self.root + next_path
[furaffinity] add extractors (#284) 5 years ago			`# -- coding: utf-8 --`

[furaffinity] improve new/old layout detection (fixes #2277) 3 years ago			`# Copyright 2020-2022 Mike Fährmann`
[furaffinity] add extractors (#284) 5 years ago			`#`
			`# This program is free software; you can redistribute it and/or modify`
			`# it under the terms of the GNU General Public License version 2 as`
			`# published by the Free Software Foundation.`

			`"""Extractors for https://www.furaffinity.net/"""`

			`from .common import Extractor, Message`
			`from .. import text, util`

[furaffinity] accept sfw.furaffinity.net URLs (closes #608) Just as an alias for regular URLs with no extra content filtering. 5 years ago			`BASE_PATTERN = r"(?:https?://)?(?:www\.\|sfw\.)?furaffinity\.net"`
[furaffinity] add extractors (#284) 5 years ago

			`class FuraffinityExtractor(Extractor):`
			`"""Base class for furaffinity extractors"""`
			`category = "furaffinity"`
			`directory_fmt = ("{category}", "{user!l}")`
[furaffinity] improve metadata extraction (fixes #1630) Fetch 'title' and 'artist' metadata from a different location, since for posts with an empty title the <title> element is completely empty and does not contain the artist's name. 3 years ago			`filename_fmt = "{id}{title:? //}.{extension}"`
[furaffinity] add extractors (#284) 5 years ago			`archive_fmt = "{id}"`
[furaffinity] support classic layout (#284) 5 years ago			`cookiedomain = ".furaffinity.net"`
[furaffinity] add extractors (#284) 5 years ago			`root = "https://www.furaffinity.net"`
[furaffinity] warn when no session cookies were found 3 years ago			`_warning = True`
[furaffinity] add extractors (#284) 5 years ago
			`def __init__(self, match):`
			`Extractor.__init__(self, match)`
			`self.user = match.group(1)`
			`self.offset = 0`
[furaffinity] improve new/old layout detection (fixes #2277) 3 years ago			`self._new_layout = None`
[furaffinity] add extractors (#284) 5 years ago
[furaffinity] add 'descriptions' option (#1231) 4 years ago			`if self.config("descriptions") == "html":`
[furaffinity] add 'external' option (closes #1492) 3 years ago			`self._process_description = str.strip`
[furaffinity] add 'descriptions' option (#1231) 4 years ago
[furaffinity] add extractors (#284) 5 years ago			`def items(self):`
[furaffinity] warn when no session cookies were found 3 years ago
			`if self._warning:`
			`if not self._check_cookies(("a", "b")):`
			`self.log.warning("no 'a' and 'b' session cookies set")`
			`FuraffinityExtractor._warning = False`

[furaffinity] add 'external' option (closes #1492) 3 years ago			`external = self.config("external", False)`
[furaffinity] add 'search' extractor (closes #915) 4 years ago			`metadata = self.metadata()`
[furaffinity] add extractors (#284) 5 years ago			`for post_id in util.advance(self.posts(), self.offset):`
			`post = self._parse_post(post_id)`
			`if post:`
[furaffinity] add 'search' extractor (closes #915) 4 years ago			`if metadata:`
			`post.update(metadata)`
[furaffinity] add extractors (#284) 5 years ago			`yield Message.Directory, post`
			`yield Message.Url, post["url"], post`

[furaffinity] add 'external' option (closes #1492) 3 years ago			`if external:`
			`for url in text.extract_iter(`
			`post["_description"], 'href="http', '"'):`
			`yield Message.Queue, "http" + url, post`

[furaffinity] add 'search' extractor (closes #915) 4 years ago			`def metadata(self):`
			`return None`

[furaffinity] add extractors (#284) 5 years ago			`def skip(self, num):`
			`self.offset += num`
			`return num`

			`def _parse_post(self, post_id):`
			`url = "{}/view/{}/".format(self.root, post_id)`
			`extr = text.extract_from(self.request(url).text)`
[furaffinity] support classic layout (#284) 5 years ago
[furaffinity] improve new/old layout detection (fixes #2277) 3 years ago			`if self._new_layout is None:`
			`self._new_layout = ("http-equiv=" not in extr("<meta ", ">"))`

			`path = extr('href="//d', '"')`
[furaffinity] support classic layout (#284) 5 years ago			`if not path:`
[furaffinity] add extractors (#284) 5 years ago			`self.log.warning(`
[furaffinity] support classic layout (#284) 5 years ago			`"Unable to download post %s (\"%s\")",`
			`post_id, text.remove_html(`
			`extr('System Message', '</section>') or`
			`extr('System Message', '</table>')`
			`)`
			`)`
[furaffinity] add extractors (#284) 5 years ago			`return None`

[furaffinity] extract more metadata - views - favorites - comments - rating - fa_category (since 'category' is already in use) - theme - species - gender - width - height 5 years ago			`pi = text.parse_int`
			`rh = text.remove_html`

[furaffinity] support classic layout (#284) 5 years ago			`data = text.nameext_from_url(path, {`
[furaffinity] improve metadata extraction (fixes #1630) Fetch 'title' and 'artist' metadata from a different location, since for posts with an empty title the <title> element is completely empty and does not contain the artist's name. 3 years ago			`"id" : pi(post_id),`
			`"url": "https://d" + path,`
[furaffinity] support classic layout (#284) 5 years ago			`})`

[furaffinity] improve new/old layout detection (fixes #2277) 3 years ago			`if self._new_layout:`
			`data["tags"] = text.split_html(extr(`
			`'class="tags-row">', '</section>'))`
[furaffinity] improve metadata extraction (fixes #1630) Fetch 'title' and 'artist' metadata from a different location, since for posts with an empty title the <title> element is completely empty and does not contain the artist's name. 3 years ago			`data["title"] = text.unescape(extr("<h2><p>", "</p></h2>"))`
			`data["artist"] = extr("<strong>", "<")`
[furaffinity] add 'external' option (closes #1492) 3 years ago			`data["_description"] = extr('class="section-body">', '</div>')`
[furaffinity] extract more metadata - views - favorites - comments - rating - fa_category (since 'category' is already in use) - theme - species - gender - width - height 5 years ago			`data["views"] = pi(rh(extr('class="views">', '</span>')))`
			`data["favorites"] = pi(rh(extr('class="favorites">', '</span>')))`
			`data["comments"] = pi(rh(extr('class="comments">', '</span>')))`
			`data["rating"] = rh(extr('class="rating">', '</span>'))`
			`data["fa_category"] = rh(extr('>Category</strong>', '</span>'))`
			`data["theme"] = rh(extr('>', '<'))`
			`data["species"] = rh(extr('>Species</strong>', '</div>'))`
			`data["gender"] = rh(extr('>Gender</strong>', '</div>'))`
			`data["width"] = pi(extr("<span>", "x"))`
			`data["height"] = pi(extr("", "p"))`
[furaffinity] support classic layout (#284) 5 years ago			`else:`
[furaffinity] extract more metadata - views - favorites - comments - rating - fa_category (since 'category' is already in use) - theme - species - gender - width - height 5 years ago			`# old site layout`
[furaffinity] improve metadata extraction (fixes #1630) Fetch 'title' and 'artist' metadata from a different location, since for posts with an empty title the <title> element is completely empty and does not contain the artist's name. 3 years ago			`data["title"] = text.unescape(extr("<h2>", "</h2>"))`
			`data["artist"] = extr(">", "<")`
[furaffinity] extract more metadata - views - favorites - comments - rating - fa_category (since 'category' is already in use) - theme - species - gender - width - height 5 years ago			`data["fa_category"] = extr("<b>Category:</b>", "<").strip()`
			`data["theme"] = extr("<b>Theme:</b>", "<").strip()`
			`data["species"] = extr("<b>Species:</b>", "<").strip()`
			`data["gender"] = extr("<b>Gender:</b>", "<").strip()`
			`data["favorites"] = pi(extr("<b>Favorites:</b>", "<"))`
			`data["comments"] = pi(extr("<b>Comments:</b>", "<"))`
			`data["views"] = pi(extr("<b>Views:</b>", "<"))`
			`data["width"] = pi(extr("<b>Resolution:</b>", "x"))`
			`data["height"] = pi(extr("", "<"))`
[furaffinity] support classic layout (#284) 5 years ago			`data["tags"] = text.split_html(extr(`
			`'id="keywords">', '</div>'))[::2]`
[furaffinity] extract more metadata - views - favorites - comments - rating - fa_category (since 'category' is already in use) - theme - species - gender - width - height 5 years ago			`data["rating"] = extr('<img alt="', ' ')`
[furaffinity] add 'external' option (closes #1492) 3 years ago			`data["_description"] = extr("</table>", "</table>")`
[furaffinity] improve metadata extraction (fixes #1630) Fetch 'title' and 'artist' metadata from a different location, since for posts with an empty title the <title> element is completely empty and does not contain the artist's name. 3 years ago
			`data["artist_url"] = data["artist"].replace("_", "").lower()`
			`data["user"] = self.user or data["artist_url"]`
[furaffinity] support classic layout (#284) 5 years ago			`data["date"] = text.parse_timestamp(data["filename"].partition(".")[0])`
[furaffinity] add 'external' option (closes #1492) 3 years ago			`data["description"] = self._process_description(data["_description"])`
[furaffinity] support classic layout (#284) 5 years ago
			`return data`
[furaffinity] add extractors (#284) 5 years ago
[furaffinity] add 'descriptions' option (#1231) 4 years ago			`@staticmethod`
			`def _process_description(description):`
			`return text.unescape(text.remove_html(description, "", ""))`

[furaffinity] fix using 'category-tranfer' (#1274) 3 years ago			`def _pagination(self, path):`
[furaffinity] add extractors (#284) 5 years ago			`num = 1`

			`while True:`
			`url = "{}/{}/{}/{}/".format(`
[furaffinity] fix using 'category-tranfer' (#1274) 3 years ago			`self.root, path, self.user, num)`
[furaffinity] add extractors (#284) 5 years ago			`page = self.request(url).text`
			`post_id = None`

			`for post_id in text.extract_iter(page, 'id="sid-', '"'):`
			`yield post_id`

			`if not post_id:`
			`return`
			`num += 1`

			`def _pagination_favorites(self):`
			`path = "/favorites/{}/".format(self.user)`

			`while path:`
			`page = self.request(self.root + path).text`
			`yield from text.extract_iter(page, 'id="sid-', '"')`
[furaffinity] support classic layout (#284) 5 years ago			`path = text.extract(page, 'right" href="', '"')[0]`
[furaffinity] add extractors (#284) 5 years ago
[furaffinity] add 'search' extractor (closes #915) 4 years ago			`def _pagination_search(self, query):`
			`url = self.root + "/search/"`
			`data = {`
			`"page" : 0,`
			`"next_page" : "Next",`
			`"order-by" : "relevancy",`
			`"order-direction": "desc",`
			`"range" : "all",`
			`"rating-general" : "on",`
			`"rating-mature" : "on",`
			`"rating-adult" : "on",`
			`"type-art" : "on",`
			`"type-music" : "on",`
			`"type-flash" : "on",`
			`"type-story" : "on",`
			`"type-photo" : "on",`
			`"type-poetry" : "on",`
			`"mode" : "extended",`
			`}`
			`data.update(query)`
			`if "page" in query:`
			`data["page"] = text.parse_int(query["page"])`

			`while True:`
			`page = self.request(url, method="POST", data=data).text`
			`post_id = None`

			`for post_id in text.extract_iter(page, 'id="sid-', '"'):`
			`yield post_id`

			`if not post_id:`
			`return`
			`data["page"] += 1`

[furaffinity] add extractors (#284) 5 years ago
			`class FuraffinityGalleryExtractor(FuraffinityExtractor):`
			`"""Extractor for a furaffinity user's gallery"""`
			`subcategory = "gallery"`
remove '&' from URL patterns '/?&#' -> '/?#' and '?&#' -> '?#' According to https://www.ietf.org/rfc/rfc3986.txt, URLs are "organized hierarchically" by using "the slash ("/"), question mark ("?"), and number sign ("#") characters to delimit components" 4 years ago			`pattern = BASE_PATTERN + r"/gallery/([^/?#]+)"`
[furaffinity] add extractors (#284) 5 years ago			`test = ("https://www.furaffinity.net/gallery/mirlinthloth/", {`
update extractor test results 4 years ago			`"pattern": r"https://d\d?\.f(uraffinity\|acdn)\.net"`
			`r"/art/mirlinthloth/\d+/\d+.\w+\.\w+",`
[furaffinity] add extractors (#284) 5 years ago			`"range": "45-50",`
			`"count": 6,`
			`})`

[furaffinity] fix using 'category-tranfer' (#1274) 3 years ago			`def posts(self):`
			`return self._pagination("gallery")`

[furaffinity] add extractors (#284) 5 years ago
			`class FuraffinityScrapsExtractor(FuraffinityExtractor):`
			`"""Extractor for a furaffinity user's scraps"""`
			`subcategory = "scraps"`
			`directory_fmt = ("{category}", "{user!l}", "Scraps")`
remove '&' from URL patterns '/?&#' -> '/?#' and '?&#' -> '?#' According to https://www.ietf.org/rfc/rfc3986.txt, URLs are "organized hierarchically" by using "the slash ("/"), question mark ("?"), and number sign ("#") characters to delimit components" 4 years ago			`pattern = BASE_PATTERN + r"/scraps/([^/?#]+)"`
[furaffinity] add extractors (#284) 5 years ago			`test = ("https://www.furaffinity.net/scraps/mirlinthloth/", {`
update extractor test results 4 years ago			`"pattern": r"https://d\d?\.f(uraffinity\|acdn)\.net"`
			`r"/art/[^/]+(/stories)?/\d+/\d+.\w+.",`
[furaffinity] add extractors (#284) 5 years ago			`"count": ">= 3",`
			`})`

[furaffinity] fix using 'category-tranfer' (#1274) 3 years ago			`def posts(self):`
			`return self._pagination("scraps")`

[furaffinity] add extractors (#284) 5 years ago
			`class FuraffinityFavoriteExtractor(FuraffinityExtractor):`
			`"""Extractor for a furaffinity user's favorites"""`
			`subcategory = "favorite"`
			`directory_fmt = ("{category}", "{user!l}", "Favorites")`
remove '&' from URL patterns '/?&#' -> '/?#' and '?&#' -> '?#' According to https://www.ietf.org/rfc/rfc3986.txt, URLs are "organized hierarchically" by using "the slash ("/"), question mark ("?"), and number sign ("#") characters to delimit components" 4 years ago			`pattern = BASE_PATTERN + r"/favorites/([^/?#]+)"`
[furaffinity] add extractors (#284) 5 years ago			`test = ("https://www.furaffinity.net/favorites/mirlinthloth/", {`
update extractor test results 4 years ago			`"pattern": r"https://d\d?\.f(uraffinity\|acdn)\.net"`
			`r"/art/[^/]+/\d+/\d+.\w+\.\w+",`
[furaffinity] add extractors (#284) 5 years ago			`"range": "45-50",`
			`"count": 6,`
			`})`

			`def posts(self):`
			`return self._pagination_favorites()`


[furaffinity] add 'search' extractor (closes #915) 4 years ago			`class FuraffinitySearchExtractor(FuraffinityExtractor):`
			`"""Extractor for furaffinity search results"""`
			`subcategory = "search"`
			`directory_fmt = ("{category}", "Search", "{search}")`
[furaffinity] expand URL pattern for searches (closes #1780) 3 years ago			`pattern = BASE_PATTERN + r"/search(?:/([^/?#]+))?/?[?&]([^#]+)"`
			`test = (`
			`("https://www.furaffinity.net/search/?q=cute", {`
			`"pattern": r"https://d\d?\.f(uraffinity\|acdn)\.net"`
			`r"/art/[^/]+/\d+/\d+.\w+\.\w+",`
			`"range": "45-50",`
			`"count": 6,`
			`}),`
			`("https://www.furaffinity.net/search/cute&rating-general=0", {`
			`"range": "1",`
			`"count": 1,`
			`}),`
			`)`

			`def __init__(self, match):`
			`FuraffinityExtractor.__init__(self, match)`
			`self.query = text.parse_query(match.group(2))`
			`if self.user and "q" not in self.query:`
[furaffinity] unquote search queries (#1958) instead of unescape (unquote -> url params, unescape -> html entities) 3 years ago			`self.query["q"] = text.unquote(self.user)`
[furaffinity] add 'search' extractor (closes #915) 4 years ago
			`def metadata(self):`
			`return {"search": self.query.get("q")}`

			`def posts(self):`
			`return self._pagination_search(self.query)`


[furaffinity] add extractors (#284) 5 years ago			`class FuraffinityPostExtractor(FuraffinityExtractor):`
			`"""Extractor for individual posts on furaffinity"""`
			`subcategory = "post"`
[furaffinity] support classic layout (#284) 5 years ago			`pattern = BASE_PATTERN + r"/(?:view\|full)/(\d+)"`
			`test = (`
			`("https://www.furaffinity.net/view/21835115/", {`
update extractor test results 4 years ago			`"pattern": r"https://d\d*\.f(uraffinity\|acdn)\.net/(download/)?art"`
			`r"/mirlinthloth/music/1488278723/1480267446.mirlinthlot"`
			`r"h_dj_fennmink_-_bude_s_4_ever\.mp3",`
[furaffinity] support classic layout (#284) 5 years ago			`"keyword": {`
			`"artist" : "mirlinthloth",`
[furaffinity] add 'artist_url' metadata field (closes #821) 4 years ago			`"artist_url" : "mirlinthloth",`
add tests for specific datetime values 5 years ago			`"date" : "dt:2016-11-27 17:24:06",`
[furaffinity] support classic layout (#284) 5 years ago			`"description": "A Song made playing the game Cosmic DJ.",`
			`"extension" : "mp3",`
			`"filename" : r"re:\d+\.\w+_dj_fennmink_-_bude_s_4_ever",`
			`"id" : 21835115,`
			`"tags" : list,`
			`"title" : "Bude's 4 Ever",`
update extractor test results 4 years ago			`"url" : r"re:https://d\d?\.f(uraffinity\|acdn)\.net/art",`
[furaffinity] support classic layout (#284) 5 years ago			`"user" : "mirlinthloth",`
[furaffinity] extract more metadata - views - favorites - comments - rating - fa_category (since 'category' is already in use) - theme - species - gender - width - height 5 years ago			`"views" : int,`
			`"favorites" : int,`
			`"comments" : int,`
			`"rating" : "General",`
			`"fa_category": "Music",`
			`"theme" : "All",`
			`"species" : "Unspecified / Any",`
			`"gender" : "Any",`
			`"width" : 120,`
			`"height" : 120,`
[furaffinity] support classic layout (#284) 5 years ago			`},`
			`}),`
[furaffinity] add 'external' option (closes #1492) 3 years ago			`# 'external' option (#1492)`
			`("https://www.furaffinity.net/view/42166511/", {`
			`"options": (("external", True),),`
			`"pattern": r"https://d\d*\.f(uraffinity\|acdn)\.net/"`
			`r"\|http://www\.postybirb\.com",`
			`"count": 2,`
			`}),`
[furaffinity] improve new/old layout detection (fixes #2277) 3 years ago			`# no tags (#2277)`
			`("https://www.furaffinity.net/view/45331225/", {`
			`"keyword": {`
			`"artist": "Kota_Remminders",`
			`"artist_url": "kotaremminders",`
			`"date": "dt:2022-01-03 17:49:33",`
			`"fa_category": "Adoptables",`
			`"filename": "1641232173.kotaremminders_chidopts1",`
			`"gender": "Any",`
			`"height": 905,`
			`"id": 45331225,`
			`"rating": "General",`
			`"species": "Unspecified / Any",`
			`"tags": [],`
			`"theme": "All",`
			`"title": "REMINDER",`
			`"width": 1280,`
			`},`
			`}),`
[furaffinity] accept sfw.furaffinity.net URLs (closes #608) Just as an alias for regular URLs with no extra content filtering. 5 years ago			`("https://furaffinity.net/view/21835115/"),`
			`("https://sfw.furaffinity.net/view/21835115/"),`
[furaffinity] support classic layout (#284) 5 years ago			`("https://www.furaffinity.net/full/21835115/"),`
			`)`
[furaffinity] add extractors (#284) 5 years ago
			`def posts(self):`
			`post_id = self.user`
			`self.user = None`
			`return (post_id,)`


			`class FuraffinityUserExtractor(FuraffinityExtractor):`
			`"""Extractor for furaffinity user profiles"""`
			`subcategory = "user"`
[furaffinity] support classic layout (#284) 5 years ago			`cookiedomain = None`
remove '&' from URL patterns '/?&#' -> '/?#' and '?&#' -> '?#' According to https://www.ietf.org/rfc/rfc3986.txt, URLs are "organized hierarchically" by using "the slash ("/"), question mark ("?"), and number sign ("#") characters to delimit components" 4 years ago			`pattern = BASE_PATTERN + r"/user/([^/?#]+)"`
[furaffinity] add extractors (#284) 5 years ago			`test = (`
			`("https://www.furaffinity.net/user/mirlinthloth/", {`
			`"pattern": r"/gallery/mirlinthloth/$",`
			`}),`
			`("https://www.furaffinity.net/user/mirlinthloth/", {`
			`"options": (("include", "all"),),`
			`"pattern": r"/(gallery\|scraps\|favorites)/mirlinthloth/$",`
			`"count": 3,`
			`}),`
			`)`

			`def items(self):`
			`base = "{}/{{}}/{}/".format(self.root, self.user)`
			`return self._dispatch_extractors((`
			`(FuraffinityGalleryExtractor , base.format("gallery")),`
			`(FuraffinityScrapsExtractor , base.format("scraps")),`
			`(FuraffinityFavoriteExtractor, base.format("favorites")),`
			`), ("gallery",))`
[furaffinity] add 'following' extractor (#515) 4 years ago

			`class FuraffinityFollowingExtractor(FuraffinityExtractor):`
			`"""Extractor for a furaffinity user's watched users"""`
			`subcategory = "following"`
remove '&' from URL patterns '/?&#' -> '/?#' and '?&#' -> '?#' According to https://www.ietf.org/rfc/rfc3986.txt, URLs are "organized hierarchically" by using "the slash ("/"), question mark ("?"), and number sign ("#") characters to delimit components" 4 years ago			`pattern = BASE_PATTERN + "/watchlist/by/([^/?#]+)"`
[furaffinity] add 'following' extractor (#515) 4 years ago			`test = ("https://www.furaffinity.net/watchlist/by/mirlinthloth/", {`
			`"pattern": FuraffinityUserExtractor.pattern,`
			`"range": "176-225",`
			`"count": 50,`
			`})`

			`def items(self):`
			`url = "{}/watchlist/by/{}/".format(self.root, self.user)`
			`data = {"_extractor": FuraffinityUserExtractor}`

			`while True:`
			`page = self.request(url).text`

			`for path in text.extract_iter(page, '<a href="', '"'):`
			`yield Message.Queue, self.root + path, data`

			`path = text.rextract(page, 'action="', '"')[0]`
			`if url.endswith(path):`
			`return`
			`url = self.root + path`