diff --git a/shanxi/scrape-articles.py b/shanxi/scrape-articles.py index 63fb55c..8896064 100644 --- a/shanxi/scrape-articles.py +++ b/shanxi/scrape-articles.py @@ -12,6 +12,9 @@ def main(): with open("articles-shanxi/links.csv", "r") as f: links = read_links(f) + # Work around broken links: only process the first 254 entries + links = links[:254] + download_link_texts(links, "message-box", "articles-shanxi", encoding="UTF-8")