@@ -129,8 +129,8 @@ def test_table_edit_metric(self):
129129 self .assertTrue (table_result .success )
130130 self .assertIsInstance (table_result .score , float )
131131 # 验证固定内容的确定分数
132- self .assertAlmostEqual (table_result .score , 0.868852 , places = 5 ,
133- msg = f"table_edit分数应该是0.868852 ,实际: { table_result .score } " )
132+ self .assertAlmostEqual (table_result .score , 0.7241379310344828 , places = 5 ,
133+ msg = f"table_edit分数应该是0.7241379310344828 ,实际: { table_result .score } " )
134134
135135 # 验证详细信息
136136 self .assertEqual (table_result .details ['content_type' ], 'table' )
@@ -874,47 +874,62 @@ def test_html_table_edit_distance(self):
874874 # 验证表格编辑距离(分隔符长度差异导致的固定分数)
875875 self .assertIn ("table_edit" , results )
876876 self .assertTrue (results ["table_edit" ].success )
877- self .assertAlmostEqual (results ["table_edit" ].score , 0.593573 , places = 5 ,
878- msg = f"table_edit分数应该是0.593573 ,实际: { results ['table_edit' ].score } " )
877+ self .assertAlmostEqual (results ["table_edit" ].score , 0.6237714987714988 , places = 5 ,
878+ msg = f"table_edit分数应该是0.6237714987714988 ,实际: { results ['table_edit' ].score } " )
879879
880880 # Verify the TEDS metric (expected score is just below 1.0, not a perfect score)
881881 self .assertIn ("table_TEDS" , results )
882882 self .assertTrue (results ["table_TEDS" ].success )
883883 self .assertAlmostEqual (results ["table_TEDS" ].score , 0.9984520490180891 , places = 5 ,
884884 msg = f"table_TEDS分数应该是0.9984520490180891,实际: { results ['table_TEDS' ].score } " )
885885
886- def test_table_sample_edit_distance (self ):
887- """测试表格样本的编辑距离"""
888- groundtruth = """## 销售数据统计
889-
890- | 产品 | 销量 | 收入 |
891- |------|------|------|
892- | 产品A | 100 | 1000 |
893- | 产品B | 200 | 3000 |"""
894-
895- predicted = """## 销售数据统计
896-
897- | 产品 | 销量 | 收入 |
898- |---|---|---|
899- | 产品A | 100 | 1000 |
900- | 产品B | 200 | 3000 |"""
901-
902- results = self .calculator .calculate_all (
903- predicted_content = predicted ,
904- groundtruth_content = groundtruth
905- )
906-
907- # 验证表格编辑距离(分隔符长度差异导致的固定分数)
908- self .assertIn ("table_edit" , results )
909- self .assertTrue (results ["table_edit" ].success )
910- self .assertAlmostEqual (results ["table_edit" ].score , 0.888889 , places = 5 ,
911- msg = f"table_edit分数应该是0.888889,实际: { results ['table_edit' ].score } " )
912-
913- # 验证TEDS指标(表格结构完全相同,满分)
914- self .assertIn ("table_TEDS" , results )
915- self .assertTrue (results ["table_TEDS" ].success )
916- self .assertAlmostEqual (results ["table_TEDS" ].score , 1.000000 , places = 5 ,
917- msg = f"table_TEDS分数应该是1.000000,实际: { results ['table_TEDS' ].score } " )
886+ def test_table_sample_edit_distance (self ):
887+ """测试渲染一致,表格样式不一致的编辑距离"""
888+ groundtruth = """## 销售数据统计
889+
890+ | 产品 | 销量 | 收入 |
891+ |------|------|------|
892+ | 产品A | 100 | 1000 |
893+ | 产品B | 200 | 3000 |"""
894+
895+ predicted = """## <table>
896+ <thead>
897+ <tr>
898+ <th>产品</th>
899+ <th>销量</th>
900+ <th>收入</th>
901+ </tr>
902+ </thead>
903+ <tbody>
904+ <tr>
905+ <td>产品A</td>
906+ <td>100</td>
907+ <td>1000</td>
908+ </tr>
909+ <tr>
910+ <td>产品B</td>
911+ <td>200</td>
912+ <td>3000</td>
913+ </tr>
914+ </tbody>
915+ </table>"""
916+
917+ results = self .calculator .calculate_all (
918+ predicted_content = predicted ,
919+ groundtruth_content = groundtruth
920+ )
921+
922+ # Verify the table edit-distance metric (Markdown ground truth vs. HTML prediction; expected score is 1.0)
923+ self .assertIn ("table_edit" , results )
924+ self .assertTrue (results ["table_edit" ].success )
925+ self .assertAlmostEqual (results ["table_edit" ].score , 1.0 , places = 5 ,
926+ msg = f"table_edit分数应该是1.0,实际: { results ['table_edit' ].score } " )
927+
928+ # Verify the TEDS metric (expected score is slightly below 1.0 for this Markdown-vs-HTML pair)
929+ self .assertIn ("table_TEDS" , results )
930+ self .assertTrue (results ["table_TEDS" ].success )
931+ self .assertAlmostEqual (results ["table_TEDS" ].score , 0.9806224310041104 , places = 5 ,
932+ msg = f"table_TEDS分数应该是0.9806224310041104,实际: { results ['table_TEDS' ].score } " )
918933
919934 def test_formula_sample_edit_distance (self ):
920935 """测试公式样本的编辑距离"""
0 commit comments