From f45ad35c6ac9ed5b8dc420d5a45d663037607129 Mon Sep 17 00:00:00 2001 From: oscar Date: Sun, 16 Mar 2025 15:51:17 +0800 Subject: [PATCH] iafd_scraper: log 404 and outdated pages at debug level in fetch_page --- scripts/iafd/src/iafd_scraper.py | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/scripts/iafd/src/iafd_scraper.py b/scripts/iafd/src/iafd_scraper.py index 823a2b9..ac1f096 100644 --- a/scripts/iafd/src/iafd_scraper.py +++ b/scripts/iafd/src/iafd_scraper.py @@ -47,14 +47,14 @@ def fetch_page(url, validator, max_retries=3, parser="html.parser", preprocessor # 处理 HTTP 状态码 if response.status_code == 404: - logging.warning(f"Page not found (404): {url}") + logging.debug(f"Page not found (404): {url}") return None, 404 # 直接返回 404,调用方可以跳过 response.raise_for_status() # 处理 HTTP 错误 # 过期的网页,与404相同处理 if "invalid or outdated page" in response.text.lower(): - logging.warning(f"invalid or outdated page: {url}") + logging.debug(f"invalid or outdated page: {url}") return None, 404 # 直接返回 404,调用方可以跳过 # 预处理 HTML(如果提供了 preprocessor)