[mangahere] fix metadata extraction

pull/54/head
Mike Fährmann 7 years ago
parent 2d0cfb33e1
commit 305da540c3
No known key found for this signature in database
GPG Key ID: 5680CA389D365A88

@@ -92,9 +92,8 @@ class MangahereChapterExtractor(AsynchronousExtractor):
"""Collect metadata for extractor-job"""
manga, pos = text.extract(page, '<title>', '</title>')
chid , pos = text.extract(page, '.net/store/manga/', '/', pos)
_ , pos = text.extract(page, '<select class="wid60"', '', pos)
_ , pos = text.extract(page, '</select>', '', pos)
count, pos = text.extract(page, '>', '<', pos-30)
pages, pos = text.extract(page, ' class="wid60"', '</select>', pos)
count = re.findall(r">(\d+)<", pages)[-1]
manga = re.match((r"(.+) \d+(\.\d+)? - Read .+ Chapter "
r"\d+(\.\d+)? Online"), manga).group(1)
return {

@@ -73,8 +73,8 @@ skip = [
"exhentai", "kissmanga", "mangafox", "dynastyscans", "nijie",
"archivedmoe", "archiveofsins", "thebarchive",
# temporary issues
"imgtrex",
"loveisover", # certificate verify failed
"nyafuu",
"mangazuki",
]
# enable selective testing for direct calls
if __name__ == '__main__' and len(sys.argv) > 1:

Loading…
Cancel
Save