From 6e9e4e34e1cc1bc70b47885bcaf7ecb8dcdf889b Mon Sep 17 00:00:00 2001 From: zzx Date: Thu, 25 Sep 2025 17:21:42 +0800 Subject: [PATCH] =?UTF-8?q?fix(spider):=E4=B8=BA=E5=8F=91=E5=B8=83?= =?UTF-8?q?=E6=97=B6=E9=97=B4=E6=8F=90=E5=8F=96=E6=B7=BB=E5=8A=A0=E5=BC=82?= =?UTF-8?q?=E5=B8=B8=E5=A4=84=E7=90=86?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit 当无法正确提取发布时间时,将其设置为空字符串作为默认值,以避免程序中断 --- spiders/ai_seo/metaso.py | 9 ++++++--- 1 file changed, 6 insertions(+), 3 deletions(-) diff --git a/spiders/ai_seo/metaso.py b/spiders/ai_seo/metaso.py index b153bc6..7e18293 100644 --- a/spiders/ai_seo/metaso.py +++ b/spiders/ai_seo/metaso.py @@ -78,9 +78,12 @@ class MetasoSpider(AbstractAiSeoSpider): # 抽取链接和标题 a = search_item.locator("xpath=./div[1]/a") # 抽取时间 - publish_date_element = search_item.locator("xpath=./div[2]/div") - publish_str = await publish_date_element.text_content() - search_result.publish_time = publish_str.replace('[', '').replace(']', '') + try: + publish_date_element = search_item.locator("xpath=./div[2]/div") + publish_str = await publish_date_element.text_content() + search_result.publish_time = publish_str.replace('[', '').replace(']', '') + except Exception as e: + search_result.publish_time = '' if await a.is_visible(): search_result.title = await a.text_content() search_result.url = await a.get_attribute('href')