[architizer] fix extraction (#4537)

pull/4571/head
Mike Fährmann 1 year ago
parent 6178177227
commit cb4798f07a
No known key found for this signature in database
GPG Key ID: 5680CA389D365A88

@ -29,11 +29,13 @@ class ArchitizerProjectExtractor(GalleryExtractor):
def metadata(self, page):
extr = text.extract_from(page)
extr('id="Pages"', "")
return {
"title" : extr("data-name='", "'"),
"slug" : extr("data-slug='", "'"),
"gid" : extr("data-gid='", "'").rpartition(".")[2],
"firm" : extr("data-firm-leaders-str='", "'"),
"title" : extr('data-name="', '"'),
"slug" : extr('data-slug="', '"'),
"gid" : extr('data-gid="', '"').rpartition(".")[2],
"firm" : extr('data-firm-leaders-str="', '"'),
"location" : extr("<h2>", "<").strip(),
"type" : text.unescape(text.remove_html(extr(
'<div class="title">Type</div>', '<br'))),
@ -52,7 +54,7 @@ class ArchitizerProjectExtractor(GalleryExtractor):
return [
(url, None)
for url in text.extract_iter(
page, "property='og:image:secure_url' content='", "?")
page, 'property="og:image:secure_url" content="', "?")
]

Loading…
Cancel
Save