Skip to content

Commit cddef4e

Browse files
committed
x
1 parent 48f6f44 commit cddef4e

File tree

1 file changed

+0
-8
lines changed

1 file changed

+0
-8
lines changed

scripts/process_dataset.py

Lines changed: 0 additions & 8 deletions
Original file line number | Diff line number | Diff line change
@@ -27,11 +27,6 @@ def process_single_item(data: dict, verbose: bool = False) -> dict:
27 27
html = data.get('llm_webkit_html', '') # 预处理HTML
28 28
llm_response = data.get('llm_response_html', '') # LLM响应HTML
29 29

30-
if verbose:
31-
print(f"\n📝 字段信息:")
32-
print(f" llm_webkit_html 长度: {len(typical_raw_tag_html)}")
33-
print(f" llm_response_html 长度: {len(llm_response)}")
34-
35 30
# 检查必要字段
36 31
if not typical_raw_tag_html:
37 32
if verbose:
@@ -57,9 +52,6 @@ def process_single_item(data: dict, verbose: bool = False) -> dict:
57 52
# 提取 main_html
58 53
main_html = pre_data.get(PreDataJsonKey.TYPICAL_MAIN_HTML, "")
59 54

60-
if verbose:
61-
print(f" main_html 长度: {len(main_html)}")
62-
63 55
# 添加新字段
64 56
data['llm_webkit430_main_html'] = main_html
65 57

0 commit comments

Comments (0)