Skip to content

Commit 9a4c7fc

Browse files
committed
fix: TEDS algorithm optimization
1 parent cfbfd02 commit 9a4c7fc

File tree

3 files changed

+7
-579
lines changed

3 files changed

+7
-579
lines changed

requirements.txt

Lines changed: 5 additions & 13 deletions
Original file line numberDiff line numberDiff line change
@@ -1,13 +1,5 @@
1-
rapidFuzz
2-
setuptools
3-
jsonlines
4-
beautifulsoup4
5-
requests
6-
torch
7-
html2text
8-
resiliparse
9-
trafilatura
10-
# llm-web-kit==3.2.0
11-
https://github.com/opendatalab/magic-html/releases/download/magic_html-0.1.5-released/magic_html-0.1.5-py3-none-any.whl
12-
streamlit
13-
markdown
1+
# WebMainBench dependencies
2+
rapidfuzz>=3.0.0
3+
lxml>=4.6.0
4+
beautifulsoup4>=4.9.0
5+
apted>=1.2.0

tests/test_teds.py

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -220,7 +220,7 @@ def test_teds_structure_same_content_different(self):
220 220
groundtruth=gt,
221 221
table_edit_result=self.valid_table_edit_result
222 222
)
223-
assert result.score == 0.7999999999999999
223+
assert result.score == 0.96
224 224

225 225

226 226

@@ -326,7 +326,7 @@ def test_teds_content_similarity(self):
326 326
table2,
327 327
table_edit_result=self.valid_table_edit_result
328 328
)
329-
assert result.score == 0.3999999999999999
329+
assert result.score == 0.9318181818181819
330 330

331 331

332 332
class TestStructureTEDS(unittest.TestCase):

0 commit comments

Comments
 (0)