Browse Source

fix: should not check paper url
gov.cn change url frequently

NateScarlet 2 years ago
parent
commit
74303b42dd
1 changed files with 0 additions and 5 deletions
  1. 0 5
      scripts/fetch.py

+ 0 - 5
scripts/fetch.py

@@ -138,11 +138,6 @@ def get_paper(url: str) -> str:
         str: Extracted paper text.
         str: Extracted paper text.
     """
     """
 
 
-    assert re.match(
-        r"https?://www.gov.cn/zhengce/(zhengceku|content)/\d{4}-\d{2}/\d{2}/content_\d+.htm",
-        url,
-    ), "site changed, need human verify: %s" % (url,)
-
     response = requests.get(url)
     response = requests.get(url)
     _raise_for_status_200(response)
     _raise_for_status_200(response)
     response.encoding = "utf-8"
     response.encoding = "utf-8"