diff --git a/examples/basic_usage.py b/examples/basic_usage.py index e257867..65324a1 100755 --- a/examples/basic_usage.py +++ b/examples/basic_usage.py @@ -409,7 +409,7 @@ def _setup(self): def _extract_content(self, html, url=None): return ExtractionResult( content="抽取器A的结果", - content_list=[{"type": "paragraph", "content": "抽取器A的结果"}], + # content_list=[{"type": "paragraph", "content": "抽取器A的结果"}], success=True, confidence_score=0.9 ) @@ -420,7 +420,7 @@ def _setup(self): def _extract_content(self, html, url=None): return ExtractionResult( content="抽取器B的结果", - content_list=[{"type": "paragraph", "content": "抽取器B的结果"}], + # content_list=[{"type": "paragraph", "content": "抽取器B的结果"}], success=True, confidence_score=0.8 ) @@ -703,6 +703,7 @@ def hello_world(): try: demo_basic_mock_evaluation() demo_llm_webkit_evaluation() # 使用LLM-WebKit评测示例 + demo_extractor_comparison() print("\n✅ 示例运行完成!") except Exception as e: diff --git a/results/leaderboard.csv b/results/leaderboard.csv index 4bfa0d7..10177dc 100644 --- a/results/leaderboard.csv +++ b/results/leaderboard.csv @@ -1,3 +1,3 @@ -extractor,total_samples,success_rate,overall,table_extraction,formula_extraction -extractor_a,2,1.0,0.0,0.25,1.0 -extractor_b,2,1.0,0.0,0.25,1.0 +extractor,total_samples,success_rate,overall,code_edit,formula_edit,table_TEDS,table_edit,text_edit +extractor_a,2,1.0,0.4012,0.5,0.5,0.5,0.5,0.0062 +extractor_b,2,1.0,0.4012,0.5,0.5,0.5,0.5,0.0062