From 06dabf8c03461094d16632e5efefd9c49ba8db74 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Tristan=20Dani=C3=ABl=20Maat?= Date: Sat, 9 Apr 2022 19:30:41 +0100 Subject: [PATCH] Work around other broken links --- qinghai/scrape.py | 7 +++++-- 1 file changed, 5 insertions(+), 2 deletions(-) diff --git a/qinghai/scrape.py b/qinghai/scrape.py index 812973a..f6b8025 100644 --- a/qinghai/scrape.py +++ b/qinghai/scrape.py @@ -35,8 +35,11 @@ def main(): writer.writerow(i, link[0], link[1]) for i, link in enumerate(links): - # Broken link - if i == 210: + # Broken links + # + # 275 was available as an iframe, and is parsed separately in + # scrape-iframe.py + if i in (210, 275, 453, 681, 703, 791, 871, 913, 914, 915): continue print(f"Downloading {link[0]} ({i}/{len(links)})")