mirror of
https://github.com/docling-project/docling-eval.git
synced 2026-05-17 13:10:47 +00:00
d04d016843
- fix: Refactor/improve the code to save log files with evaluation tables and png files with the plots and ensure to produce all the evaluations/visualizations in the docs/examples/benchmark_xxx.py files - Introduce optional parameter in create methods for DP-Bench and OmniDocBench to generate visualizations. - Update the evaluation files (json/txt/png) in docs/evaluations per dataset. Update Readme. - Update Readme with the OmniDocBench evaluation/visualization files - Poetry: Move to docling 2.15.1 --------- Signed-off-by: Nikos Livathinos <nli@zurich.ibm.com>
738 lines
14 KiB
JSON
738 lines
14 KiB
JSON
{
|
|
"TEDS": {
|
|
"bins": [
|
|
0.0,
|
|
0.05,
|
|
0.1,
|
|
0.15000000000000002,
|
|
0.2,
|
|
0.25,
|
|
0.30000000000000004,
|
|
0.35000000000000003,
|
|
0.4,
|
|
0.45,
|
|
0.5,
|
|
0.55,
|
|
0.6000000000000001,
|
|
0.65,
|
|
0.7000000000000001,
|
|
0.75,
|
|
0.8,
|
|
0.8500000000000001,
|
|
0.9,
|
|
0.9500000000000001,
|
|
1.0
|
|
],
|
|
"hist": [
|
|
0.0,
|
|
1.0,
|
|
0.0,
|
|
0.0,
|
|
0.0,
|
|
0.0,
|
|
0.0,
|
|
2.0,
|
|
1.0,
|
|
2.0,
|
|
1.0,
|
|
0.0,
|
|
1.0,
|
|
4.0,
|
|
3.0,
|
|
4.0,
|
|
6.0,
|
|
12.0,
|
|
13.0,
|
|
3.0
|
|
],
|
|
"mean": 0.7844150943396226,
|
|
"median": 0.854,
|
|
"std": 0.18453459483483392,
|
|
"total": 53
|
|
},
|
|
"TEDS_complex": {
|
|
"bins": [
|
|
0.0,
|
|
0.05,
|
|
0.1,
|
|
0.15000000000000002,
|
|
0.2,
|
|
0.25,
|
|
0.30000000000000004,
|
|
0.35000000000000003,
|
|
0.4,
|
|
0.45,
|
|
0.5,
|
|
0.55,
|
|
0.6000000000000001,
|
|
0.65,
|
|
0.7000000000000001,
|
|
0.75,
|
|
0.8,
|
|
0.8500000000000001,
|
|
0.9,
|
|
0.9500000000000001,
|
|
1.0
|
|
],
|
|
"hist": [
|
|
0.0,
|
|
0.0,
|
|
0.0,
|
|
0.0,
|
|
0.0,
|
|
0.0,
|
|
0.0,
|
|
0.0,
|
|
0.0,
|
|
0.0,
|
|
0.0,
|
|
0.0,
|
|
1.0,
|
|
1.0,
|
|
0.0,
|
|
1.0,
|
|
1.0,
|
|
3.0,
|
|
1.0,
|
|
0.0
|
|
],
|
|
"mean": 0.81025,
|
|
"median": 0.858,
|
|
"std": 0.10778119369484508,
|
|
"total": 8
|
|
},
|
|
"TEDS_simple": {
|
|
"bins": [
|
|
0.0,
|
|
0.05,
|
|
0.1,
|
|
0.15000000000000002,
|
|
0.2,
|
|
0.25,
|
|
0.30000000000000004,
|
|
0.35000000000000003,
|
|
0.4,
|
|
0.45,
|
|
0.5,
|
|
0.55,
|
|
0.6000000000000001,
|
|
0.65,
|
|
0.7000000000000001,
|
|
0.75,
|
|
0.8,
|
|
0.8500000000000001,
|
|
0.9,
|
|
0.9500000000000001,
|
|
1.0
|
|
],
|
|
"hist": [
|
|
0.0,
|
|
1.0,
|
|
0.0,
|
|
0.0,
|
|
0.0,
|
|
0.0,
|
|
0.0,
|
|
2.0,
|
|
1.0,
|
|
2.0,
|
|
1.0,
|
|
0.0,
|
|
0.0,
|
|
3.0,
|
|
3.0,
|
|
3.0,
|
|
5.0,
|
|
9.0,
|
|
12.0,
|
|
3.0
|
|
],
|
|
"mean": 0.7798222222222222,
|
|
"median": 0.854,
|
|
"std": 0.19558482104248842,
|
|
"total": 45
|
|
},
|
|
"TEDS_struct": {
|
|
"bins": [
|
|
0.0,
|
|
0.05,
|
|
0.1,
|
|
0.15000000000000002,
|
|
0.2,
|
|
0.25,
|
|
0.30000000000000004,
|
|
0.35000000000000003,
|
|
0.4,
|
|
0.45,
|
|
0.5,
|
|
0.55,
|
|
0.6000000000000001,
|
|
0.65,
|
|
0.7000000000000001,
|
|
0.75,
|
|
0.8,
|
|
0.8500000000000001,
|
|
0.9,
|
|
0.9500000000000001,
|
|
1.0
|
|
],
|
|
"hist": [
|
|
0.0,
|
|
1.0,
|
|
0.0,
|
|
0.0,
|
|
0.0,
|
|
0.0,
|
|
0.0,
|
|
0.0,
|
|
1.0,
|
|
0.0,
|
|
0.0,
|
|
1.0,
|
|
2.0,
|
|
1.0,
|
|
3.0,
|
|
4.0,
|
|
7.0,
|
|
14.0,
|
|
13.0,
|
|
6.0
|
|
],
|
|
"mean": 0.8341698113207547,
|
|
"median": 0.873,
|
|
"std": 0.1540224429012584,
|
|
"total": 53
|
|
},
|
|
"evaluations": [
|
|
{
|
|
"TEDS": 0.916,
|
|
"filename": "01030000000045.pdf",
|
|
"is_complex": false,
|
|
"pred_ncols": 3,
|
|
"pred_nrows": 9,
|
|
"table_id": 0,
|
|
"true_ncols": 3,
|
|
"true_nrows": 9
|
|
},
|
|
{
|
|
"TEDS": 0.874,
|
|
"filename": "01030000000046.pdf",
|
|
"is_complex": true,
|
|
"pred_ncols": 7,
|
|
"pred_nrows": 12,
|
|
"table_id": 0,
|
|
"true_ncols": 7,
|
|
"true_nrows": 12
|
|
},
|
|
{
|
|
"TEDS": 0.848,
|
|
"filename": "01030000000047.pdf",
|
|
"is_complex": true,
|
|
"pred_ncols": 7,
|
|
"pred_nrows": 10,
|
|
"table_id": 0,
|
|
"true_ncols": 7,
|
|
"true_nrows": 10
|
|
},
|
|
{
|
|
"TEDS": 0.909,
|
|
"filename": "01030000000051.pdf",
|
|
"is_complex": false,
|
|
"pred_ncols": 4,
|
|
"pred_nrows": 9,
|
|
"table_id": 0,
|
|
"true_ncols": 4,
|
|
"true_nrows": 9
|
|
},
|
|
{
|
|
"TEDS": 0.931,
|
|
"filename": "01030000000052.pdf",
|
|
"is_complex": false,
|
|
"pred_ncols": 4,
|
|
"pred_nrows": 12,
|
|
"table_id": 0,
|
|
"true_ncols": 4,
|
|
"true_nrows": 12
|
|
},
|
|
{
|
|
"TEDS": 0.911,
|
|
"filename": "01030000000053.pdf",
|
|
"is_complex": false,
|
|
"pred_ncols": 4,
|
|
"pred_nrows": 9,
|
|
"table_id": 0,
|
|
"true_ncols": 4,
|
|
"true_nrows": 9
|
|
},
|
|
{
|
|
"TEDS": 0.956,
|
|
"filename": "01030000000064.pdf",
|
|
"is_complex": false,
|
|
"pred_ncols": 3,
|
|
"pred_nrows": 11,
|
|
"table_id": 0,
|
|
"true_ncols": 3,
|
|
"true_nrows": 11
|
|
},
|
|
{
|
|
"TEDS": 0.87,
|
|
"filename": "01030000000078.pdf",
|
|
"is_complex": true,
|
|
"pred_ncols": 7,
|
|
"pred_nrows": 10,
|
|
"table_id": 0,
|
|
"true_ncols": 7,
|
|
"true_nrows": 10
|
|
},
|
|
{
|
|
"TEDS": 0.757,
|
|
"filename": "01030000000081.pdf",
|
|
"is_complex": false,
|
|
"pred_ncols": 3,
|
|
"pred_nrows": 3,
|
|
"table_id": 0,
|
|
"true_ncols": 3,
|
|
"true_nrows": 3
|
|
},
|
|
{
|
|
"TEDS": 0.897,
|
|
"filename": "01030000000081.pdf",
|
|
"is_complex": false,
|
|
"pred_ncols": 3,
|
|
"pred_nrows": 7,
|
|
"table_id": 1,
|
|
"true_ncols": 3,
|
|
"true_nrows": 7
|
|
},
|
|
{
|
|
"TEDS": 0.889,
|
|
"filename": "01030000000082.pdf",
|
|
"is_complex": false,
|
|
"pred_ncols": 4,
|
|
"pred_nrows": 7,
|
|
"table_id": 0,
|
|
"true_ncols": 4,
|
|
"true_nrows": 7
|
|
},
|
|
{
|
|
"TEDS": 0.871,
|
|
"filename": "01030000000082.pdf",
|
|
"is_complex": false,
|
|
"pred_ncols": 4,
|
|
"pred_nrows": 6,
|
|
"table_id": 1,
|
|
"true_ncols": 4,
|
|
"true_nrows": 6
|
|
},
|
|
{
|
|
"TEDS": 0.897,
|
|
"filename": "01030000000083.pdf",
|
|
"is_complex": false,
|
|
"pred_ncols": 5,
|
|
"pred_nrows": 8,
|
|
"table_id": 0,
|
|
"true_ncols": 5,
|
|
"true_nrows": 8
|
|
},
|
|
{
|
|
"TEDS": 0.854,
|
|
"filename": "01030000000083.pdf",
|
|
"is_complex": false,
|
|
"pred_ncols": 4,
|
|
"pred_nrows": 4,
|
|
"table_id": 1,
|
|
"true_ncols": 4,
|
|
"true_nrows": 4
|
|
},
|
|
{
|
|
"TEDS": 0.903,
|
|
"filename": "01030000000083.pdf",
|
|
"is_complex": false,
|
|
"pred_ncols": 4,
|
|
"pred_nrows": 6,
|
|
"table_id": 2,
|
|
"true_ncols": 4,
|
|
"true_nrows": 6
|
|
},
|
|
{
|
|
"TEDS": 0.853,
|
|
"filename": "01030000000084.pdf",
|
|
"is_complex": false,
|
|
"pred_ncols": 4,
|
|
"pred_nrows": 4,
|
|
"table_id": 0,
|
|
"true_ncols": 4,
|
|
"true_nrows": 4
|
|
},
|
|
{
|
|
"TEDS": 0.871,
|
|
"filename": "01030000000084.pdf",
|
|
"is_complex": false,
|
|
"pred_ncols": 4,
|
|
"pred_nrows": 6,
|
|
"table_id": 1,
|
|
"true_ncols": 4,
|
|
"true_nrows": 6
|
|
},
|
|
{
|
|
"TEDS": 0.702,
|
|
"filename": "01030000000088.pdf",
|
|
"is_complex": false,
|
|
"pred_ncols": 5,
|
|
"pred_nrows": 6,
|
|
"table_id": 0,
|
|
"true_ncols": 5,
|
|
"true_nrows": 6
|
|
},
|
|
{
|
|
"TEDS": 0.688,
|
|
"filename": "01030000000089.pdf",
|
|
"is_complex": false,
|
|
"pred_ncols": 5,
|
|
"pred_nrows": 5,
|
|
"table_id": 0,
|
|
"true_ncols": 5,
|
|
"true_nrows": 6
|
|
},
|
|
{
|
|
"TEDS": 0.532,
|
|
"filename": "01030000000090.pdf",
|
|
"is_complex": false,
|
|
"pred_ncols": 5,
|
|
"pred_nrows": 5,
|
|
"table_id": 0,
|
|
"true_ncols": 5,
|
|
"true_nrows": 7
|
|
},
|
|
{
|
|
"TEDS": 0.846,
|
|
"filename": "01030000000116.pdf",
|
|
"is_complex": false,
|
|
"pred_ncols": 4,
|
|
"pred_nrows": 5,
|
|
"table_id": 0,
|
|
"true_ncols": 4,
|
|
"true_nrows": 5
|
|
},
|
|
{
|
|
"TEDS": 0.662,
|
|
"filename": "01030000000116.pdf",
|
|
"is_complex": false,
|
|
"pred_ncols": 4,
|
|
"pred_nrows": 2,
|
|
"table_id": 1,
|
|
"true_ncols": 4,
|
|
"true_nrows": 2
|
|
},
|
|
{
|
|
"TEDS": 0.81,
|
|
"filename": "01030000000117.pdf",
|
|
"is_complex": false,
|
|
"pred_ncols": 4,
|
|
"pred_nrows": 4,
|
|
"table_id": 0,
|
|
"true_ncols": 4,
|
|
"true_nrows": 4
|
|
},
|
|
{
|
|
"TEDS": 0.919,
|
|
"filename": "01030000000119.pdf",
|
|
"is_complex": false,
|
|
"pred_ncols": 3,
|
|
"pred_nrows": 6,
|
|
"table_id": 0,
|
|
"true_ncols": 3,
|
|
"true_nrows": 6
|
|
},
|
|
{
|
|
"TEDS": 0.414,
|
|
"filename": "01030000000120.pdf",
|
|
"is_complex": false,
|
|
"pred_ncols": 5,
|
|
"pred_nrows": 2,
|
|
"table_id": 0,
|
|
"true_ncols": 5,
|
|
"true_nrows": 3
|
|
},
|
|
{
|
|
"TEDS": 0.377,
|
|
"filename": "01030000000121.pdf",
|
|
"is_complex": false,
|
|
"pred_ncols": 2,
|
|
"pred_nrows": 3,
|
|
"table_id": 0,
|
|
"true_ncols": 2,
|
|
"true_nrows": 2
|
|
},
|
|
{
|
|
"TEDS": 0.913,
|
|
"filename": "01030000000127.pdf",
|
|
"is_complex": false,
|
|
"pred_ncols": 4,
|
|
"pred_nrows": 9,
|
|
"table_id": 0,
|
|
"true_ncols": 4,
|
|
"true_nrows": 9
|
|
},
|
|
{
|
|
"TEDS": 0.839,
|
|
"filename": "01030000000127.pdf",
|
|
"is_complex": false,
|
|
"pred_ncols": 5,
|
|
"pred_nrows": 5,
|
|
"table_id": 1,
|
|
"true_ncols": 5,
|
|
"true_nrows": 5
|
|
},
|
|
{
|
|
"TEDS": 0.839,
|
|
"filename": "01030000000127.pdf",
|
|
"is_complex": false,
|
|
"pred_ncols": 5,
|
|
"pred_nrows": 5,
|
|
"table_id": 2,
|
|
"true_ncols": 5,
|
|
"true_nrows": 5
|
|
},
|
|
{
|
|
"TEDS": 0.955,
|
|
"filename": "01030000000128.pdf",
|
|
"is_complex": false,
|
|
"pred_ncols": 6,
|
|
"pred_nrows": 16,
|
|
"table_id": 0,
|
|
"true_ncols": 6,
|
|
"true_nrows": 16
|
|
},
|
|
{
|
|
"TEDS": 0.88,
|
|
"filename": "01030000000130.pdf",
|
|
"is_complex": false,
|
|
"pred_ncols": 3,
|
|
"pred_nrows": 6,
|
|
"table_id": 0,
|
|
"true_ncols": 3,
|
|
"true_nrows": 6
|
|
},
|
|
{
|
|
"TEDS": 0.933,
|
|
"filename": "01030000000132.pdf",
|
|
"is_complex": true,
|
|
"pred_ncols": 2,
|
|
"pred_nrows": 5,
|
|
"table_id": 0,
|
|
"true_ncols": 2,
|
|
"true_nrows": 5
|
|
},
|
|
{
|
|
"TEDS": 0.643,
|
|
"filename": "01030000000146.pdf",
|
|
"is_complex": true,
|
|
"pred_ncols": 2,
|
|
"pred_nrows": 9,
|
|
"table_id": 0,
|
|
"true_ncols": 2,
|
|
"true_nrows": 9
|
|
},
|
|
{
|
|
"TEDS": 0.659,
|
|
"filename": "01030000000147.pdf",
|
|
"is_complex": false,
|
|
"pred_ncols": 5,
|
|
"pred_nrows": 4,
|
|
"table_id": 0,
|
|
"true_ncols": 4,
|
|
"true_nrows": 4
|
|
},
|
|
{
|
|
"TEDS": 0.93,
|
|
"filename": "01030000000149.pdf",
|
|
"is_complex": false,
|
|
"pred_ncols": 1,
|
|
"pred_nrows": 8,
|
|
"table_id": 0,
|
|
"true_ncols": 1,
|
|
"true_nrows": 8
|
|
},
|
|
{
|
|
"TEDS": 0.868,
|
|
"filename": "01030000000150.pdf",
|
|
"is_complex": true,
|
|
"pred_ncols": 2,
|
|
"pred_nrows": 6,
|
|
"table_id": 0,
|
|
"true_ncols": 2,
|
|
"true_nrows": 6
|
|
},
|
|
{
|
|
"TEDS": 0.895,
|
|
"filename": "01030000000165.pdf",
|
|
"is_complex": false,
|
|
"pred_ncols": 2,
|
|
"pred_nrows": 6,
|
|
"table_id": 0,
|
|
"true_ncols": 2,
|
|
"true_nrows": 6
|
|
},
|
|
{
|
|
"TEDS": 0.719,
|
|
"filename": "01030000000166.pdf",
|
|
"is_complex": false,
|
|
"pred_ncols": 2,
|
|
"pred_nrows": 6,
|
|
"table_id": 0,
|
|
"true_ncols": 2,
|
|
"true_nrows": 7
|
|
},
|
|
{
|
|
"TEDS": 0.907,
|
|
"filename": "01030000000170.pdf",
|
|
"is_complex": false,
|
|
"pred_ncols": 6,
|
|
"pred_nrows": 8,
|
|
"table_id": 0,
|
|
"true_ncols": 6,
|
|
"true_nrows": 8
|
|
},
|
|
{
|
|
"TEDS": 0.917,
|
|
"filename": "01030000000170.pdf",
|
|
"is_complex": false,
|
|
"pred_ncols": 5,
|
|
"pred_nrows": 9,
|
|
"table_id": 1,
|
|
"true_ncols": 5,
|
|
"true_nrows": 9
|
|
},
|
|
{
|
|
"TEDS": 0.472,
|
|
"filename": "01030000000178.pdf",
|
|
"is_complex": false,
|
|
"pred_ncols": 3,
|
|
"pred_nrows": 7,
|
|
"table_id": 0,
|
|
"true_ncols": 3,
|
|
"true_nrows": 7
|
|
},
|
|
{
|
|
"TEDS": 0.489,
|
|
"filename": "01030000000180.pdf",
|
|
"is_complex": false,
|
|
"pred_ncols": 4,
|
|
"pred_nrows": 3,
|
|
"table_id": 0,
|
|
"true_ncols": 4,
|
|
"true_nrows": 3
|
|
},
|
|
{
|
|
"TEDS": 0.381,
|
|
"filename": "01030000000182.pdf",
|
|
"is_complex": false,
|
|
"pred_ncols": 4,
|
|
"pred_nrows": 3,
|
|
"table_id": 0,
|
|
"true_ncols": 4,
|
|
"true_nrows": 4
|
|
},
|
|
{
|
|
"TEDS": 0.65,
|
|
"filename": "01030000000187.pdf",
|
|
"is_complex": true,
|
|
"pred_ncols": 7,
|
|
"pred_nrows": 6,
|
|
"table_id": 0,
|
|
"true_ncols": 7,
|
|
"true_nrows": 6
|
|
},
|
|
{
|
|
"TEDS": 0.916,
|
|
"filename": "01030000000188.pdf",
|
|
"is_complex": false,
|
|
"pred_ncols": 10,
|
|
"pred_nrows": 14,
|
|
"table_id": 0,
|
|
"true_ncols": 10,
|
|
"true_nrows": 14
|
|
},
|
|
{
|
|
"TEDS": 0.795,
|
|
"filename": "01030000000189.pdf",
|
|
"is_complex": false,
|
|
"pred_ncols": 11,
|
|
"pred_nrows": 6,
|
|
"table_id": 0,
|
|
"true_ncols": 11,
|
|
"true_nrows": 6
|
|
},
|
|
{
|
|
"TEDS": 0.756,
|
|
"filename": "01030000000189.pdf",
|
|
"is_complex": false,
|
|
"pred_ncols": 10,
|
|
"pred_nrows": 4,
|
|
"table_id": 1,
|
|
"true_ncols": 10,
|
|
"true_nrows": 4
|
|
},
|
|
{
|
|
"TEDS": 0.957,
|
|
"filename": "01030000000189.pdf",
|
|
"is_complex": false,
|
|
"pred_ncols": 9,
|
|
"pred_nrows": 3,
|
|
"table_id": 2,
|
|
"true_ncols": 9,
|
|
"true_nrows": 3
|
|
},
|
|
{
|
|
"TEDS": 0.714,
|
|
"filename": "01030000000190.pdf",
|
|
"is_complex": false,
|
|
"pred_ncols": 8,
|
|
"pred_nrows": 3,
|
|
"table_id": 0,
|
|
"true_ncols": 8,
|
|
"true_nrows": 3
|
|
},
|
|
{
|
|
"TEDS": 0.822,
|
|
"filename": "01030000000190.pdf",
|
|
"is_complex": false,
|
|
"pred_ncols": 9,
|
|
"pred_nrows": 5,
|
|
"table_id": 1,
|
|
"true_ncols": 9,
|
|
"true_nrows": 5
|
|
},
|
|
{
|
|
"TEDS": 0.061,
|
|
"filename": "01030000000197.pdf",
|
|
"is_complex": false,
|
|
"pred_ncols": 1,
|
|
"pred_nrows": 10,
|
|
"table_id": 0,
|
|
"true_ncols": 2,
|
|
"true_nrows": 1
|
|
},
|
|
{
|
|
"TEDS": 0.911,
|
|
"filename": "01030000000197.pdf",
|
|
"is_complex": false,
|
|
"pred_ncols": 6,
|
|
"pred_nrows": 2,
|
|
"table_id": 1,
|
|
"true_ncols": 6,
|
|
"true_nrows": 2
|
|
},
|
|
{
|
|
"TEDS": 0.796,
|
|
"filename": "01030000000200.pdf",
|
|
"is_complex": true,
|
|
"pred_ncols": 4,
|
|
"pred_nrows": 10,
|
|
"table_id": 0,
|
|
"true_ncols": 4,
|
|
"true_nrows": 10
|
|
}
|
|
]
|
|
} |