|
2 | 2 | "metadata": { |
3 | 3 | "dataset_name": "real_preprocessed_html_test", |
4 | 4 | "extractor_name": "llm-webkit", |
5 | | - "timestamp": "2025-08-13T14:53:57.558572", |
| 5 | + "timestamp": "2025-08-14T11:22:33.005587", |
6 | 6 | "total_samples": 2 |
7 | 7 | }, |
8 | 8 | "overall_metrics": { |
9 | | - "text_edit": 0.045309156685715835, |
| 9 | + "text_edit": 0.09025270758122739, |
10 | 10 | "code_edit": 0.0, |
11 | 11 | "table_edit": 0.0, |
12 | 12 | "table_TEDS": 0.0, |
13 | 13 | "formula_edit": 0.0, |
14 | | - "overall": 0.009061831337143167 |
| 14 | + "overall": 0.018050541516245477 |
15 | 15 | }, |
16 | 16 | "sample_results": [ |
17 | 17 | { |
18 | 18 | "sample_id": "33e291cd-5b26-48b1-977f-3c63b45e6d13", |
19 | 19 | "extraction_success": true, |
20 | | - "extraction_time": 0.6193361282348633, |
| 20 | + "extraction_time": 0.6739089488983154, |
21 | 21 | "metrics": { |
22 | 22 | "code_edit": { |
23 | 23 | "score": 0.0, |
|
99 | 99 | }, |
100 | 100 | { |
101 | 101 | "sample_id": "93898d00-0d6c-451d-9f99-4c386c6c2918", |
102 | | - "extraction_success": true, |
103 | | - "extraction_time": 0.0010640621185302734, |
104 | | - "metrics": { |
105 | | - "code_edit": { |
106 | | - "score": 0.0, |
107 | | - "success": false, |
108 | | - "details": { |
109 | | - "predicted_code_length": 0, |
110 | | - "groundtruth_code_length": 0, |
111 | | - "content_type": "code" |
112 | | - }, |
113 | | - "error": "Both predicted and groundtruth are empty" |
114 | | - }, |
115 | | - "formula_edit": { |
116 | | - "score": 0.0, |
117 | | - "success": false, |
118 | | - "details": { |
119 | | - "predicted_formula_length": 0, |
120 | | - "groundtruth_formula_length": 0, |
121 | | - "content_type": "formula" |
122 | | - }, |
123 | | - "error": "Both predicted and groundtruth are empty" |
124 | | - }, |
125 | | - "text_edit": { |
126 | | - "score": 0.00036560579020428197, |
127 | | - "success": true, |
128 | | - "details": { |
129 | | - "distance": 161317, |
130 | | - "predicted_length": 59, |
131 | | - "groundtruth_length": 161376, |
132 | | - "normalized": true, |
133 | | - "predicted_text_length": 59, |
134 | | - "groundtruth_text_length": 161376, |
135 | | - "content_type": "text" |
136 | | - } |
137 | | - }, |
138 | | - "table_edit": { |
139 | | - "score": 0.0, |
140 | | - "success": false, |
141 | | - "details": { |
142 | | - "predicted_table_length": 0, |
143 | | - "groundtruth_table_length": 0, |
144 | | - "content_type": "table" |
145 | | - }, |
146 | | - "error": "Both predicted and groundtruth are empty" |
147 | | - }, |
148 | | - "table_TEDS": { |
149 | | - "score": 0.0, |
150 | | - "success": false, |
151 | | - "details": { |
152 | | - "content_type": "table", |
153 | | - "algorithm": "TEDS" |
154 | | - }, |
155 | | - "error": "Skipped due to table_edit failure: unknown reason" |
156 | | - }, |
157 | | - "overall": { |
158 | | - "score": 0.00036560579020428197, |
159 | | - "success": true, |
160 | | - "details": { |
161 | | - "source": "average_of_all_metrics", |
162 | | - "description": "Overall score as average of all successful metrics", |
163 | | - "successful_metrics": 1, |
164 | | - "failed_metrics": 4, |
165 | | - "individual_scores": { |
166 | | - "text_edit": 0.00036560579020428197 |
167 | | - } |
168 | | - } |
169 | | - } |
170 | | - }, |
171 | | - "sample_metadata": { |
172 | | - "url": "https://www.15shuba.net/html/58/58618/index.html", |
173 | | - "domain": null, |
174 | | - "language": "zh", |
175 | | - "content_type": null, |
176 | | - "difficulty": null |
177 | | - } |
| 102 | + "extraction_success": false, |
| 103 | + "extraction_time": 0.0, |
| 104 | + "extraction_error": "Empty HTML input", |
| 105 | + "metrics": {} |
178 | 106 | } |
179 | 107 | ], |
180 | 108 | "category_metrics": null, |
181 | 109 | "error_analysis": { |
182 | 110 | "total_samples": 2, |
183 | | - "failed_count": 0, |
184 | | - "success_rate": 1.0, |
185 | | - "common_errors": {}, |
186 | | - "sample_errors": [] |
| 111 | + "failed_count": 1, |
| 112 | + "success_rate": 0.5, |
| 113 | + "common_errors": { |
| 114 | + "empty_input": 1 |
| 115 | + }, |
| 116 | + "sample_errors": [ |
| 117 | + { |
| 118 | + "sample_id": "93898d00-0d6c-451d-9f99-4c386c6c2918", |
| 119 | + "error": "Empty HTML input" |
| 120 | + } |
| 121 | + ] |
187 | 122 | }, |
188 | 123 | "extractor_config": { |
189 | 124 | "use_preprocessed_html": true, |
|
0 commit comments