# -*- coding: utf-8 -*- # Copyright 2015 Mike Fährmann # # This program is free software; you can redistribute it and/or modify # it under the terms of the GNU General Public License version 2 as # published by the Free Software Foundation. """Extract manga-chapters and entire manga from http://kissmanga.com/""" from .common import Extractor, Message from .. import text, cloudflare import re class KissmangaExtractor(Extractor): """Base class for kissmanga extractors""" category = "kissmanga" directory_fmt = ["{category}", "{manga}", "c{chapter:>03}{chapter-minor} - {title}"] filename_fmt = "{manga}_c{chapter:>03}{chapter-minor}_{page:>03}.{extension}" url_base = "http://kissmanga.com" def __init__(self, match): Extractor.__init__(self) self.url = match.group(0) class KissmangaMangaExtractor(KissmangaExtractor): """Extract all manga-chapters from kissmanga""" subcategory = "manga" pattern = [r"(?:https?://)?(?:www\.)?kissmanga\.com/Manga/[^/]+/?$"] test = [("http://kissmanga.com/Manga/Dropout", { "url": "992befdd64e178fe5af67de53f8b510860d968ca", })] def items(self): cloudflare.bypass_ddos_protection(self.session, self.url_base) yield Message.Version, 1 for chapter in self.get_chapters(): yield Message.Queue, self.url_base + chapter def get_chapters(self): """Return a list of all chapter urls""" page = self.request(self.url).text return reversed(list( text.extract_iter(page, '\n