[imgyt] fix extraction

pull/40/head
Mike Fährmann 7 years ago
parent 4ad903b797
commit f32b1a0292
No known key found for this signature in database
GPG Key ID: 5680CA389D365A88

@@ -76,10 +76,10 @@ class ImgytImageExtractor(ImagehostImageExtractor):
https = True https = True
def get_info(self, page): def get_info(self, page):
url, pos = text.extract(page, '<img class="centred" src="', '"') url, pos = text.extract(page, "<img class='centred' src='", "'")
if not url: if not url:
raise exception.NotFoundError("image") raise exception.NotFoundError("image")
filename, pos = text.extract(page, ' alt="', '"', pos) filename, pos = text.extract(page, " alt='", "'", pos)
filename = (filename + splitext(url)[1]) if filename else url filename = (filename + splitext(url)[1]) if filename else url
return url, filename return url, filename
@@ -189,8 +189,7 @@ class HosturimageImageExtractor(ImagehostImageExtractor):
https = True https = True
def get_info(self, page): def get_info(self, page):
_ , pos = text.extract(page, '<div id="image_details">', '') url, pos = text.extract(page, "<img class='centred' src='", "'")
url, pos = text.extract(page, 'src="', '"', pos)
return url, url return url, url

@@ -67,6 +67,8 @@ skip = [
"archivedmoe", "archiveofsins", "thebarchive", "archivedmoe", "archiveofsins", "thebarchive",
# temporary issues # temporary issues
"luscious", # "high load" "luscious", # "high load"
"imgtrex", # 504
"hentaifoundry", # SSL cert expired
] ]
# enable selective testing for direct calls # enable selective testing for direct calls
if __name__ == '__main__' and len(sys.argv) > 1: if __name__ == '__main__' and len(sys.argv) > 1:

Loading…
Cancel
Save