# -*- coding: utf-8 -*- # Copyright 2016-2017 Mike Fährmann # # This program is free software; you can redistribute it and/or modify # it under the terms of the GNU General Public License version 2 as # published by the Free Software Foundation. """Extract hentaimanga from https://hentaihere.com/""" from .. import text from . import hentaicdn import re class HentaihereMangaExtractor(hentaicdn.HentaicdnMangaExtractor): """Extractor for mangas from hentaihere.com""" category = "hentaihere" pattern = [r"(?:https?://)?(?:www\.)?hentaihere\.com/m/S(\d+)/?$"] test = [ ("https://hentaihere.com/m/S13812", { "url": "d1ba6e28bb2162e844f8559c2b2725ba0a093559", }), ("https://hentaihere.com/m/S7608", { "url": "6c5239758dc93f6b1b4175922836c10391b174f7", }), ] def __init__(self, match): hentaicdn.HentaicdnMangaExtractor.__init__(self) self.gid = match.group(1) def get_chapters(self): return text.extract_iter( self.request("https://hentaihere.com/m/S" + self.gid).text, '

\n", "")[0] pattern = r"Page 1 \| (.+) $([^)]+)$ - Chapter \d+: (.+) by (.+) at " match = re.match(pattern, title) return { "gallery-id": self.gid, "title": match.group(1), "type": match.group(2), "chapter": self.chapter, "chapter-name": match.group(3), "author": match.group(4), "count": len(images), "lang": "en", "language": "English", }