dingeszakkou2019muchstakeknowledge
/data/papers/dingeszakkou2019muchstakeknowledge/out/bundle.json{
"created_at": "2026-01-19T12:17:12.595824+00:00",
"paper_dir": "papers/dingeszakkou2019muchstakeknowledge",
"pdf": {
"path": "papers/dingeszakkou2019muchstakeknowledge/pdf/paper.pdf"
},
"tool_versions": {
"python": "3.14.2",
"meta-extract": "0.1.0",
"requests": "2.32.5",
"lxml": "6.0.2",
"pandas": "2.3.3",
"pypdf": "5.9.0",
"pypdfium2": "5.3.0",
"pillow": "12.1.0",
"grobid-client-python": "0.1.4",
"camelot-py": "1.0.9",
"tabula-py": "2.10.0"
},
"status": "ok",
"grobid": {
"url": "http://localhost:8070",
"tei_path": "papers/dingeszakkou2019muchstakeknowledge/out/tei.xml"
},
"text": {
"path": "papers/dingeszakkou2019muchstakeknowledge/out/text.txt"
},
"tables": {
"out_dir": "papers/dingeszakkou2019muchstakeknowledge/out/tables",
"camelot": {
"stream": [],
"lattice": [],
"filtered_out": {
"stream": 24,
"lattice": 2
},
"filtered_reasons": {
"stream": {
"filled_rows_ratio": 6,
"min_cols": 13,
"filled_rows": 5
},
"lattice": {
"sparse": 2
}
},
"filter": {
"min_rows": 2,
"min_cols": 2,
"min_non_empty_ratio": 0.2,
"min_filled_rows": 2,
"min_filled_cols": 2,
"min_filled_rows_ratio": 0.5,
"two_col_min_numeric_like_ratio": 0.35
},
"errors": []
},
"tabula": {
"lattice": [],
"stream": [
{
"page": 13,
"index": 1,
"csv_path": "papers/dingeszakkou2019muchstakeknowledge/out/tables/tabula_stream_p13_t1.csv",
"shape": [
15,
6
],
"stats": {
"rows": 15,
"cols": 6,
"non_empty_cells": 31,
"non_empty_ratio": 0.34444444444444444,
"filled_rows": 10,
"filled_cols": 5,
"filled_rows_ratio": 0.6666666666666666,
"numeric_like_ratio": 0.03225806451612903
},
"area": [
34.86615,
29.08344,
313.79535,
455.64056
]
}
],
"filtered_out": {
"lattice": 33,
"stream": 5
},
"filtered_reasons": {
"lattice": {
"min_rows": 31,
"sparse": 2
},
"stream": {
"min_cols": 3,
"filled_rows_ratio": 2
}
},
"filter": {
"min_rows": 2,
"min_cols": 2,
"min_non_empty_ratio": 0.2,
"min_filled_rows": 2,
"min_filled_cols": 2,
"min_filled_rows_ratio": 0.5,
"two_col_min_numeric_like_ratio": 0.35
},
"errors": [
{
"page": 1,
"mode": "lattice",
"error": "IllegalArgumentException('lines must be orthogonal, vertical and horizontal')"
}
],
"ignored_errors": {},
"pages": "all"
}
},
"images": {
"dir": "papers/dingeszakkou2019muchstakeknowledge/out/images",
"manifest": "papers/dingeszakkou2019muchstakeknowledge/out/images/manifest.json",
"embedded": {
"count": 2
},
"rendered_pages": {
"count": 1,
"pages": [
1
]
},
"figures": {
"count": 2,
"pages": [],
"rendered_pages": []
}
},
"errors": [],
"markdown": {
"path": "papers/dingeszakkou2019muchstakeknowledge/out/fulltext.md"
}
}