From 6f0735568ca1a88a37efaa52d9453b43c75f0b98 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Mike=20F=C3=A4hrmann?= Date: Thu, 15 Dec 2022 18:05:32 +0100 Subject: [PATCH] [2chen] fix file URLs --- gallery_dl/extractor/2chen.py | 13 ++++++++++--- 1 file changed, 10 insertions(+), 3 deletions(-) diff --git a/gallery_dl/extractor/2chen.py b/gallery_dl/extractor/2chen.py index 2cf8b305..d9674d86 100644 --- a/gallery_dl/extractor/2chen.py +++ b/gallery_dl/extractor/2chen.py @@ -20,6 +20,7 @@ class _2chenThreadExtractor(Extractor): pattern = r"(?:https?://)?2chen\.(?:moe|club)/([^/?#]+)/(\d+)" test = ( ("https://2chen.moe/tv/496715", { + "pattern": r"https://2chen\.su/assets/images/src/\w{40}\.\w+$", "count": ">= 179", }), ("https://2chen.club/tv/1", { @@ -39,13 +40,19 @@ class _2chenThreadExtractor(Extractor): page = self.request(url, encoding="utf-8", notfound="thread").text data = self.metadata(page) yield Message.Directory, data + for post in self.posts(page): - if not post["url"]: + + url = post["url"] + if not url: continue + if url[0] == "/": + url = self.root + url + post["url"] = url = url.partition("?")[0] + post.update(data) - post["url"] = self.root + post["url"] post["time"] = text.parse_int(post["date"].timestamp()) - yield Message.Url, post["url"], text.nameext_from_url( + yield Message.Url, url, text.nameext_from_url( post["filename"], post) def metadata(self, page):