[batoto] fix extraction of chapter URLs

pull/40/head
Mike Fährmann 7 years ago
parent 18e6ed1c7e
commit c7ec103e15
No known key found for this signature in database
GPG Key ID: 5680CA389D365A88

@@ -69,10 +69,10 @@ class BatotoMangaExtractor(BatotoExtractor, MangaExtractor):
def chapters(self, page):
# TODO: filter by language / translator
needle = ('<td style="border-top:0;">\n '
'<a href="https://bato.to/reader#')
pattern = (r'<td style="border-top:0;">\s+'
r'<a href="https?://bato\.to/reader#([^"]+)')
return [self.root + "/reader#" + mangahash
for mangahash in text.extract_iter(page, needle, '"')]
for mangahash in re.findall(pattern, page)]
class BatotoChapterExtractor(BatotoExtractor, AsynchronousExtractor):

@@ -291,7 +291,7 @@ class DeviantartCollectionExtractor(DeviantartExtractor):
r"/favourites/(\d+)/([^/?&#]+)"]
test = [("http://rosuuri.deviantart.com/favourites/58951174/Useful", {
"url": "22a3858a1efb150d11c3f4e63cf9082ad70c6ea0",
"keyword": "b4abbad60f87a42fb6c1a021cb3a8efd9d31bfb7",
"keyword": "e0ed920fb3dfdad9294be592be2eeb3dc1258a6a",
})]
def __init__(self, match):

@@ -58,7 +58,7 @@ skip = [
"exhentai", "kissmanga", "mangafox", "dynastyscans", "nijie",
"archivedmoe", "archiveofsins", "thebarchive",
# temporary issues
"mangapark",
"mangapark", "danbooru", "yandere", "pixiv",
]
# enable selective testing for direct calls
if __name__ == '__main__' and len(sys.argv) > 1:

Loading…
Cancel
Save