More logical Mastodon parsing order (fixes parsing pages with lots of <h3>)

2024-10-23 02:19:05 +00:00 · 2022-09-02 22:01:39 +03:00 · 2022-09-02 22:01:39 +03:00 · 2906946ee9
commit 2906946ee9
parent 933ce8555f
1 changed files with 5 additions and 5 deletions
--- a/fetch_blocks.py
+++ b/fetch_blocks.py
@@ -39,11 +39,11 @@ def get_mastodon_blocks(domain: str) -> dict:
        return {}
    for header in doc.find_all("h3"):
-        for line in header.find_next_siblings("table")[0].find_all("tr")[1:]:
+        header_text = header.text
-            header_text = header.text
+        if header_text in translations:
-            if header_text in translations:
+            header_text = translations[header_text]
-                    header_text = translations[header_text]
+        if header_text in blocks:
-            if header_text in blocks:
+            for line in header.find_next_siblings("table")[0].find_all("tr")[1:]:
                blocks[header_text].append(
                    {
                        "domain": line.find("span").text,