From c411b4848fd6d8e8f7244ef6cb1c700ac14e3a21 Mon Sep 17 00:00:00 2001 From: JiaoTianBo Date: Tue, 24 Mar 2026 15:50:41 +0800 Subject: [PATCH] =?UTF-8?q?chore(crawler):=20=E7=A7=BB=E9=99=A4=20BossCraw?= =?UTF-8?q?ler=20=E4=B8=AD=E8=B0=83=E8=AF=95=E6=89=93=E5=8D=B0=E4=BB=A3?= =?UTF-8?q?=E7=A0=81?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit - 删除了打印 geek_data 和 geek_card 属性的调试语句 - 移除了候选人 name 和 source_id 解析时的调试输出 chore(ingestion): 去除数据验证失败时的调试打印 - 删除了验证失败后打印原始数据和标准化数据的调试信息 - 精简验证失败的日志输出,保持代码简洁 --- .../ylhp_hr_2_0/service/crawler/boss_crawler.py | 9 --------- .../service/ingestion/unified_ingestion_service.py | 6 ------ 2 files changed, 15 deletions(-) diff --git a/src/main/python/cn/yinlihupo/ylhp_hr_2_0/service/crawler/boss_crawler.py b/src/main/python/cn/yinlihupo/ylhp_hr_2_0/service/crawler/boss_crawler.py index f9f8c42..52ab225 100644 --- a/src/main/python/cn/yinlihupo/ylhp_hr_2_0/service/crawler/boss_crawler.py +++ b/src/main/python/cn/yinlihupo/ylhp_hr_2_0/service/crawler/boss_crawler.py @@ -138,13 +138,6 @@ class BossCrawler(BaseCrawler): # 获取 geekCard(Boss SDK 的数据通常在 geekCard 中) geek_card = getattr(geek_data, 'geekCard', None) or geek_data - # 调试:打印 geek_data 和 geek_card 的所有属性 - print(f"[DEBUG] geek_data type: {type(geek_data)}") - print(f"[DEBUG] geek_data attrs: {dir(geek_data) if hasattr(geek_data, '__dict__') else 'no __dict__'}") - if geek_card is not geek_data: - print(f"[DEBUG] geek_card type: {type(geek_card)}") - print(f"[DEBUG] geek_card attrs: {dir(geek_card) if hasattr(geek_card, '__dict__') else 'no __dict__'}") - # 从 SDK 返回的数据中提取候选人信息 source_id = (getattr(geek_data, 'geekId', '') or getattr(geek_data, 'encryptGeekId', '') or @@ -155,8 +148,6 @@ class BossCrawler(BaseCrawler): name = (getattr(geek_card, 'geekName', '') or getattr(geek_data, 'geekName', '')) - print(f"[DEBUG] Parsed name: '{name}', source_id: '{source_id}'") - # 解析薪资期望(Boss SDK 使用 salary 或 lowSalary/highSalary) salary_str = (getattr(geek_card, 'salary', '') or getattr(geek_data, 'salary', '')) diff --git a/src/main/python/cn/yinlihupo/ylhp_hr_2_0/service/ingestion/unified_ingestion_service.py b/src/main/python/cn/yinlihupo/ylhp_hr_2_0/service/ingestion/unified_ingestion_service.py index 3770a3a..6462e54 100644 --- a/src/main/python/cn/yinlihupo/ylhp_hr_2_0/service/ingestion/unified_ingestion_service.py +++ b/src/main/python/cn/yinlihupo/ylhp_hr_2_0/service/ingestion/unified_ingestion_service.py @@ -137,12 +137,6 @@ class UnifiedIngestionService: # 2. 数据验证 validation_result = self._validate(normalized) if not validation_result.is_valid: - # 打印原始数据和标准化数据,方便排查 - print(f"[数据验证失败] 错误: {validation_result.error_messages}") - print(f"[数据验证失败] 原始数据: {raw_data}") - print(f"[数据验证失败] 标准化后候选人: name={normalized.candidate.name}, " - f"source={normalized.candidate.source}, source_id={normalized.candidate.source_id}") - print(f"[数据验证失败] 标准化后简历: raw_content长度={len(normalized.resume.raw_content) if normalized.resume.raw_content else 0}") return IngestionResult.failed_result( errors=validation_result.error_messages, message="数据验证失败"