Files
docling-eval/docs/evaluations/DPBench/evaluation_DPBench_tableformer.json
Nikos Livathinos d04d016843 feat: Refactor the reading order evaluation to skip document items that have multiple provenances (#10)
- fix: Refactor/improve the code to save log files with evaluation tables and png files with the plots
and ensure to produce all the evaluations/visualizations in the docs/examples/benchmark_xxx.py files
- Introduce optional parameter in create methods for DP-Bench and OmniDocBench to generate
visualizations.
- Update the evaluation files (json/txt/png) in docs/evaluations per dataset. Update Readme.
- Update Readme with the OmniDocBench evaluation/visualization files
- Poetry: Move to docling 2.15.1

---------

Signed-off-by: Nikos Livathinos <nli@zurich.ibm.com>
2025-01-21 14:58:17 +01:00

738 lines
14 KiB
JSON

{
"TEDS": {
"bins": [
0.0,
0.05,
0.1,
0.15000000000000002,
0.2,
0.25,
0.30000000000000004,
0.35000000000000003,
0.4,
0.45,
0.5,
0.55,
0.6000000000000001,
0.65,
0.7000000000000001,
0.75,
0.8,
0.8500000000000001,
0.9,
0.9500000000000001,
1.0
],
"hist": [
0.0,
1.0,
0.0,
0.0,
0.0,
0.0,
0.0,
2.0,
1.0,
2.0,
1.0,
0.0,
1.0,
4.0,
3.0,
4.0,
6.0,
12.0,
13.0,
3.0
],
"mean": 0.7844150943396226,
"median": 0.854,
"std": 0.18453459483483392,
"total": 53
},
"TEDS_complex": {
"bins": [
0.0,
0.05,
0.1,
0.15000000000000002,
0.2,
0.25,
0.30000000000000004,
0.35000000000000003,
0.4,
0.45,
0.5,
0.55,
0.6000000000000001,
0.65,
0.7000000000000001,
0.75,
0.8,
0.8500000000000001,
0.9,
0.9500000000000001,
1.0
],
"hist": [
0.0,
0.0,
0.0,
0.0,
0.0,
0.0,
0.0,
0.0,
0.0,
0.0,
0.0,
0.0,
1.0,
1.0,
0.0,
1.0,
1.0,
3.0,
1.0,
0.0
],
"mean": 0.81025,
"median": 0.858,
"std": 0.10778119369484508,
"total": 8
},
"TEDS_simple": {
"bins": [
0.0,
0.05,
0.1,
0.15000000000000002,
0.2,
0.25,
0.30000000000000004,
0.35000000000000003,
0.4,
0.45,
0.5,
0.55,
0.6000000000000001,
0.65,
0.7000000000000001,
0.75,
0.8,
0.8500000000000001,
0.9,
0.9500000000000001,
1.0
],
"hist": [
0.0,
1.0,
0.0,
0.0,
0.0,
0.0,
0.0,
2.0,
1.0,
2.0,
1.0,
0.0,
0.0,
3.0,
3.0,
3.0,
5.0,
9.0,
12.0,
3.0
],
"mean": 0.7798222222222222,
"median": 0.854,
"std": 0.19558482104248842,
"total": 45
},
"TEDS_struct": {
"bins": [
0.0,
0.05,
0.1,
0.15000000000000002,
0.2,
0.25,
0.30000000000000004,
0.35000000000000003,
0.4,
0.45,
0.5,
0.55,
0.6000000000000001,
0.65,
0.7000000000000001,
0.75,
0.8,
0.8500000000000001,
0.9,
0.9500000000000001,
1.0
],
"hist": [
0.0,
1.0,
0.0,
0.0,
0.0,
0.0,
0.0,
0.0,
1.0,
0.0,
0.0,
1.0,
2.0,
1.0,
3.0,
4.0,
7.0,
14.0,
13.0,
6.0
],
"mean": 0.8341698113207547,
"median": 0.873,
"std": 0.1540224429012584,
"total": 53
},
"evaluations": [
{
"TEDS": 0.916,
"filename": "01030000000045.pdf",
"is_complex": false,
"pred_ncols": 3,
"pred_nrows": 9,
"table_id": 0,
"true_ncols": 3,
"true_nrows": 9
},
{
"TEDS": 0.874,
"filename": "01030000000046.pdf",
"is_complex": true,
"pred_ncols": 7,
"pred_nrows": 12,
"table_id": 0,
"true_ncols": 7,
"true_nrows": 12
},
{
"TEDS": 0.848,
"filename": "01030000000047.pdf",
"is_complex": true,
"pred_ncols": 7,
"pred_nrows": 10,
"table_id": 0,
"true_ncols": 7,
"true_nrows": 10
},
{
"TEDS": 0.909,
"filename": "01030000000051.pdf",
"is_complex": false,
"pred_ncols": 4,
"pred_nrows": 9,
"table_id": 0,
"true_ncols": 4,
"true_nrows": 9
},
{
"TEDS": 0.931,
"filename": "01030000000052.pdf",
"is_complex": false,
"pred_ncols": 4,
"pred_nrows": 12,
"table_id": 0,
"true_ncols": 4,
"true_nrows": 12
},
{
"TEDS": 0.911,
"filename": "01030000000053.pdf",
"is_complex": false,
"pred_ncols": 4,
"pred_nrows": 9,
"table_id": 0,
"true_ncols": 4,
"true_nrows": 9
},
{
"TEDS": 0.956,
"filename": "01030000000064.pdf",
"is_complex": false,
"pred_ncols": 3,
"pred_nrows": 11,
"table_id": 0,
"true_ncols": 3,
"true_nrows": 11
},
{
"TEDS": 0.87,
"filename": "01030000000078.pdf",
"is_complex": true,
"pred_ncols": 7,
"pred_nrows": 10,
"table_id": 0,
"true_ncols": 7,
"true_nrows": 10
},
{
"TEDS": 0.757,
"filename": "01030000000081.pdf",
"is_complex": false,
"pred_ncols": 3,
"pred_nrows": 3,
"table_id": 0,
"true_ncols": 3,
"true_nrows": 3
},
{
"TEDS": 0.897,
"filename": "01030000000081.pdf",
"is_complex": false,
"pred_ncols": 3,
"pred_nrows": 7,
"table_id": 1,
"true_ncols": 3,
"true_nrows": 7
},
{
"TEDS": 0.889,
"filename": "01030000000082.pdf",
"is_complex": false,
"pred_ncols": 4,
"pred_nrows": 7,
"table_id": 0,
"true_ncols": 4,
"true_nrows": 7
},
{
"TEDS": 0.871,
"filename": "01030000000082.pdf",
"is_complex": false,
"pred_ncols": 4,
"pred_nrows": 6,
"table_id": 1,
"true_ncols": 4,
"true_nrows": 6
},
{
"TEDS": 0.897,
"filename": "01030000000083.pdf",
"is_complex": false,
"pred_ncols": 5,
"pred_nrows": 8,
"table_id": 0,
"true_ncols": 5,
"true_nrows": 8
},
{
"TEDS": 0.854,
"filename": "01030000000083.pdf",
"is_complex": false,
"pred_ncols": 4,
"pred_nrows": 4,
"table_id": 1,
"true_ncols": 4,
"true_nrows": 4
},
{
"TEDS": 0.903,
"filename": "01030000000083.pdf",
"is_complex": false,
"pred_ncols": 4,
"pred_nrows": 6,
"table_id": 2,
"true_ncols": 4,
"true_nrows": 6
},
{
"TEDS": 0.853,
"filename": "01030000000084.pdf",
"is_complex": false,
"pred_ncols": 4,
"pred_nrows": 4,
"table_id": 0,
"true_ncols": 4,
"true_nrows": 4
},
{
"TEDS": 0.871,
"filename": "01030000000084.pdf",
"is_complex": false,
"pred_ncols": 4,
"pred_nrows": 6,
"table_id": 1,
"true_ncols": 4,
"true_nrows": 6
},
{
"TEDS": 0.702,
"filename": "01030000000088.pdf",
"is_complex": false,
"pred_ncols": 5,
"pred_nrows": 6,
"table_id": 0,
"true_ncols": 5,
"true_nrows": 6
},
{
"TEDS": 0.688,
"filename": "01030000000089.pdf",
"is_complex": false,
"pred_ncols": 5,
"pred_nrows": 5,
"table_id": 0,
"true_ncols": 5,
"true_nrows": 6
},
{
"TEDS": 0.532,
"filename": "01030000000090.pdf",
"is_complex": false,
"pred_ncols": 5,
"pred_nrows": 5,
"table_id": 0,
"true_ncols": 5,
"true_nrows": 7
},
{
"TEDS": 0.846,
"filename": "01030000000116.pdf",
"is_complex": false,
"pred_ncols": 4,
"pred_nrows": 5,
"table_id": 0,
"true_ncols": 4,
"true_nrows": 5
},
{
"TEDS": 0.662,
"filename": "01030000000116.pdf",
"is_complex": false,
"pred_ncols": 4,
"pred_nrows": 2,
"table_id": 1,
"true_ncols": 4,
"true_nrows": 2
},
{
"TEDS": 0.81,
"filename": "01030000000117.pdf",
"is_complex": false,
"pred_ncols": 4,
"pred_nrows": 4,
"table_id": 0,
"true_ncols": 4,
"true_nrows": 4
},
{
"TEDS": 0.919,
"filename": "01030000000119.pdf",
"is_complex": false,
"pred_ncols": 3,
"pred_nrows": 6,
"table_id": 0,
"true_ncols": 3,
"true_nrows": 6
},
{
"TEDS": 0.414,
"filename": "01030000000120.pdf",
"is_complex": false,
"pred_ncols": 5,
"pred_nrows": 2,
"table_id": 0,
"true_ncols": 5,
"true_nrows": 3
},
{
"TEDS": 0.377,
"filename": "01030000000121.pdf",
"is_complex": false,
"pred_ncols": 2,
"pred_nrows": 3,
"table_id": 0,
"true_ncols": 2,
"true_nrows": 2
},
{
"TEDS": 0.913,
"filename": "01030000000127.pdf",
"is_complex": false,
"pred_ncols": 4,
"pred_nrows": 9,
"table_id": 0,
"true_ncols": 4,
"true_nrows": 9
},
{
"TEDS": 0.839,
"filename": "01030000000127.pdf",
"is_complex": false,
"pred_ncols": 5,
"pred_nrows": 5,
"table_id": 1,
"true_ncols": 5,
"true_nrows": 5
},
{
"TEDS": 0.839,
"filename": "01030000000127.pdf",
"is_complex": false,
"pred_ncols": 5,
"pred_nrows": 5,
"table_id": 2,
"true_ncols": 5,
"true_nrows": 5
},
{
"TEDS": 0.955,
"filename": "01030000000128.pdf",
"is_complex": false,
"pred_ncols": 6,
"pred_nrows": 16,
"table_id": 0,
"true_ncols": 6,
"true_nrows": 16
},
{
"TEDS": 0.88,
"filename": "01030000000130.pdf",
"is_complex": false,
"pred_ncols": 3,
"pred_nrows": 6,
"table_id": 0,
"true_ncols": 3,
"true_nrows": 6
},
{
"TEDS": 0.933,
"filename": "01030000000132.pdf",
"is_complex": true,
"pred_ncols": 2,
"pred_nrows": 5,
"table_id": 0,
"true_ncols": 2,
"true_nrows": 5
},
{
"TEDS": 0.643,
"filename": "01030000000146.pdf",
"is_complex": true,
"pred_ncols": 2,
"pred_nrows": 9,
"table_id": 0,
"true_ncols": 2,
"true_nrows": 9
},
{
"TEDS": 0.659,
"filename": "01030000000147.pdf",
"is_complex": false,
"pred_ncols": 5,
"pred_nrows": 4,
"table_id": 0,
"true_ncols": 4,
"true_nrows": 4
},
{
"TEDS": 0.93,
"filename": "01030000000149.pdf",
"is_complex": false,
"pred_ncols": 1,
"pred_nrows": 8,
"table_id": 0,
"true_ncols": 1,
"true_nrows": 8
},
{
"TEDS": 0.868,
"filename": "01030000000150.pdf",
"is_complex": true,
"pred_ncols": 2,
"pred_nrows": 6,
"table_id": 0,
"true_ncols": 2,
"true_nrows": 6
},
{
"TEDS": 0.895,
"filename": "01030000000165.pdf",
"is_complex": false,
"pred_ncols": 2,
"pred_nrows": 6,
"table_id": 0,
"true_ncols": 2,
"true_nrows": 6
},
{
"TEDS": 0.719,
"filename": "01030000000166.pdf",
"is_complex": false,
"pred_ncols": 2,
"pred_nrows": 6,
"table_id": 0,
"true_ncols": 2,
"true_nrows": 7
},
{
"TEDS": 0.907,
"filename": "01030000000170.pdf",
"is_complex": false,
"pred_ncols": 6,
"pred_nrows": 8,
"table_id": 0,
"true_ncols": 6,
"true_nrows": 8
},
{
"TEDS": 0.917,
"filename": "01030000000170.pdf",
"is_complex": false,
"pred_ncols": 5,
"pred_nrows": 9,
"table_id": 1,
"true_ncols": 5,
"true_nrows": 9
},
{
"TEDS": 0.472,
"filename": "01030000000178.pdf",
"is_complex": false,
"pred_ncols": 3,
"pred_nrows": 7,
"table_id": 0,
"true_ncols": 3,
"true_nrows": 7
},
{
"TEDS": 0.489,
"filename": "01030000000180.pdf",
"is_complex": false,
"pred_ncols": 4,
"pred_nrows": 3,
"table_id": 0,
"true_ncols": 4,
"true_nrows": 3
},
{
"TEDS": 0.381,
"filename": "01030000000182.pdf",
"is_complex": false,
"pred_ncols": 4,
"pred_nrows": 3,
"table_id": 0,
"true_ncols": 4,
"true_nrows": 4
},
{
"TEDS": 0.65,
"filename": "01030000000187.pdf",
"is_complex": true,
"pred_ncols": 7,
"pred_nrows": 6,
"table_id": 0,
"true_ncols": 7,
"true_nrows": 6
},
{
"TEDS": 0.916,
"filename": "01030000000188.pdf",
"is_complex": false,
"pred_ncols": 10,
"pred_nrows": 14,
"table_id": 0,
"true_ncols": 10,
"true_nrows": 14
},
{
"TEDS": 0.795,
"filename": "01030000000189.pdf",
"is_complex": false,
"pred_ncols": 11,
"pred_nrows": 6,
"table_id": 0,
"true_ncols": 11,
"true_nrows": 6
},
{
"TEDS": 0.756,
"filename": "01030000000189.pdf",
"is_complex": false,
"pred_ncols": 10,
"pred_nrows": 4,
"table_id": 1,
"true_ncols": 10,
"true_nrows": 4
},
{
"TEDS": 0.957,
"filename": "01030000000189.pdf",
"is_complex": false,
"pred_ncols": 9,
"pred_nrows": 3,
"table_id": 2,
"true_ncols": 9,
"true_nrows": 3
},
{
"TEDS": 0.714,
"filename": "01030000000190.pdf",
"is_complex": false,
"pred_ncols": 8,
"pred_nrows": 3,
"table_id": 0,
"true_ncols": 8,
"true_nrows": 3
},
{
"TEDS": 0.822,
"filename": "01030000000190.pdf",
"is_complex": false,
"pred_ncols": 9,
"pred_nrows": 5,
"table_id": 1,
"true_ncols": 9,
"true_nrows": 5
},
{
"TEDS": 0.061,
"filename": "01030000000197.pdf",
"is_complex": false,
"pred_ncols": 1,
"pred_nrows": 10,
"table_id": 0,
"true_ncols": 2,
"true_nrows": 1
},
{
"TEDS": 0.911,
"filename": "01030000000197.pdf",
"is_complex": false,
"pred_ncols": 6,
"pred_nrows": 2,
"table_id": 1,
"true_ncols": 6,
"true_nrows": 2
},
{
"TEDS": 0.796,
"filename": "01030000000200.pdf",
"is_complex": true,
"pred_ncols": 4,
"pred_nrows": 10,
"table_id": 0,
"true_ncols": 4,
"true_nrows": 10
}
]
}