porteretalndpuzzleaboutknowledge
/data/papers/porteretalndpuzzleaboutknowledge/out/bundle.json
{
  "created_at": "2026-02-10T13:41:28.546878+00:00",
  "paper_dir": "papers/porteretalndpuzzleaboutknowledge",
  "pdf": {
    "path": "papers/porteretalndpuzzleaboutknowledge/pdf/paper.pdf"
  },
  "tool_versions": {
    "python": "3.14.2",
    "meta-extract": "0.1.0",
    "requests": "2.32.5",
    "lxml": "6.0.2",
    "pandas": "2.3.3",
    "pypdf": "5.9.0",
    "pypdfium2": "5.3.0",
    "pillow": "12.1.0",
    "grobid-client-python": "0.1.4",
    "camelot-py": "1.0.9",
    "tabula-py": "2.10.0"
  },
  "status": "ok",
  "grobid": {
    "url": "http://localhost:8070",
    "tei_path": "papers/porteretalndpuzzleaboutknowledge/out/tei.xml"
  },
  "text": {
    "path": "papers/porteretalndpuzzleaboutknowledge/out/text.txt"
  },
  "tables": {
    "out_dir": "papers/porteretalndpuzzleaboutknowledge/out/tables",
    "camelot": {
      "stream": [
        {
          "page": "4",
          "index": 1,
          "csv_path": "papers/porteretalndpuzzleaboutknowledge/out/tables/camelot_stream_p4_t1.csv",
          "shape": [
            22,
            10
          ],
          "stats": {
            "rows": 22,
            "cols": 10,
            "non_empty_cells": 168,
            "non_empty_ratio": 0.7636363636363637,
            "filled_rows": 19,
            "filled_cols": 10,
            "filled_rows_ratio": 0.8636363636363636,
            "numeric_like_ratio": 0.44642857142857145
          },
          "parsing_report": {
            "accuracy": 99.17,
            "whitespace": 23.64,
            "order": 1,
            "page": 4
          }
        },
        {
          "page": "7",
          "index": 2,
          "csv_path": "papers/porteretalndpuzzleaboutknowledge/out/tables/camelot_stream_p7_t2.csv",
          "shape": [
            11,
            8
          ],
          "stats": {
            "rows": 11,
            "cols": 8,
            "non_empty_cells": 56,
            "non_empty_ratio": 0.6363636363636364,
            "filled_rows": 11,
            "filled_cols": 8,
            "filled_rows_ratio": 1.0,
            "numeric_like_ratio": 0.4642857142857143
          },
          "parsing_report": {
            "accuracy": 96.22,
            "whitespace": 36.36,
            "order": 1,
            "page": 7
          }
        },
        {
          "page": "8",
          "index": 3,
          "csv_path": "papers/porteretalndpuzzleaboutknowledge/out/tables/camelot_stream_p8_t3.csv",
          "shape": [
            8,
            4
          ],
          "stats": {
            "rows": 8,
            "cols": 4,
            "non_empty_cells": 12,
            "non_empty_ratio": 0.375,
            "filled_rows": 4,
            "filled_cols": 2,
            "filled_rows_ratio": 0.5,
            "numeric_like_ratio": 0.08333333333333333
          },
          "parsing_report": {
            "accuracy": 65.55,
            "whitespace": 62.5,
            "order": 1,
            "page": 8
          }
        },
        {
          "page": "9",
          "index": 4,
          "csv_path": "papers/porteretalndpuzzleaboutknowledge/out/tables/camelot_stream_p9_t4.csv",
          "shape": [
            18,
            6
          ],
          "stats": {
            "rows": 18,
            "cols": 6,
            "non_empty_cells": 100,
            "non_empty_ratio": 0.9259259259259259,
            "filled_rows": 18,
            "filled_cols": 6,
            "filled_rows_ratio": 1.0,
            "numeric_like_ratio": 0.58
          },
          "parsing_report": {
            "accuracy": 99.3,
            "whitespace": 7.41,
            "order": 1,
            "page": 9
          }
        },
        {
          "page": "11",
          "index": 5,
          "csv_path": "papers/porteretalndpuzzleaboutknowledge/out/tables/camelot_stream_p11_t5.csv",
          "shape": [
            7,
            3
          ],
          "stats": {
            "rows": 7,
            "cols": 3,
            "non_empty_cells": 11,
            "non_empty_ratio": 0.5238095238095238,
            "filled_rows": 4,
            "filled_cols": 2,
            "filled_rows_ratio": 0.5714285714285714,
            "numeric_like_ratio": 0.09090909090909091
          },
          "parsing_report": {
            "accuracy": 71.65,
            "whitespace": 47.62,
            "order": 1,
            "page": 11
          }
        },
        {
          "page": "12",
          "index": 6,
          "csv_path": "papers/porteretalndpuzzleaboutknowledge/out/tables/camelot_stream_p12_t6.csv",
          "shape": [
            11,
            7
          ],
          "stats": {
            "rows": 11,
            "cols": 7,
            "non_empty_cells": 52,
            "non_empty_ratio": 0.6753246753246753,
            "filled_rows": 11,
            "filled_cols": 7,
            "filled_rows_ratio": 1.0,
            "numeric_like_ratio": 0.4230769230769231
          },
          "parsing_report": {
            "accuracy": 95.79,
            "whitespace": 32.47,
            "order": 1,
            "page": 12
          }
        },
        {
          "page": "13",
          "index": 7,
          "csv_path": "papers/porteretalndpuzzleaboutknowledge/out/tables/camelot_stream_p13_t7.csv",
          "shape": [
            20,
            6
          ],
          "stats": {
            "rows": 20,
            "cols": 6,
            "non_empty_cells": 100,
            "non_empty_ratio": 0.8333333333333334,
            "filled_rows": 18,
            "filled_cols": 6,
            "filled_rows_ratio": 0.9,
            "numeric_like_ratio": 0.64
          },
          "parsing_report": {
            "accuracy": 98.48,
            "whitespace": 16.67,
            "order": 1,
            "page": 13
          }
        }
      ],
      "lattice": [],
      "filtered_out": {
        "stream": 12,
        "lattice": 3
      },
      "filtered_reasons": {
        "stream": {
          "min_cols": 4,
          "filled_rows_ratio": 4,
          "filled_rows": 4
        },
        "lattice": {
          "sparse": 3
        }
      },
      "filter": {
        "min_rows": 2,
        "min_cols": 2,
        "min_non_empty_ratio": 0.2,
        "min_filled_rows": 2,
        "min_filled_cols": 2,
        "min_filled_rows_ratio": 0.5,
        "two_col_min_numeric_like_ratio": 0.35
      },
      "errors": []
    },
    "tabula": {
      "lattice": [],
      "stream": [
        {
          "page": 4,
          "index": 1,
          "csv_path": "papers/porteretalndpuzzleaboutknowledge/out/tables/tabula_stream_p4_t1.csv",
          "shape": [
            16,
            10
          ],
          "stats": {
            "rows": 16,
            "cols": 10,
            "non_empty_cells": 153,
            "non_empty_ratio": 0.95625,
            "filled_rows": 16,
            "filled_cols": 10,
            "filled_rows_ratio": 1.0,
            "numeric_like_ratio": 0.49019607843137253
          }
        },
        {
          "page": 9,
          "index": 2,
          "csv_path": "papers/porteretalndpuzzleaboutknowledge/out/tables/tabula_stream_p9_t2.csv",
          "shape": [
            16,
            4
          ],
          "stats": {
            "rows": 16,
            "cols": 4,
            "non_empty_cells": 64,
            "non_empty_ratio": 1.0,
            "filled_rows": 16,
            "filled_cols": 4,
            "filled_rows_ratio": 1.0,
            "numeric_like_ratio": 0.46875
          }
        },
        {
          "page": 13,
          "index": 3,
          "csv_path": "papers/porteretalndpuzzleaboutknowledge/out/tables/tabula_stream_p13_t3.csv",
          "shape": [
            16,
            4
          ],
          "stats": {
            "rows": 16,
            "cols": 4,
            "non_empty_cells": 64,
            "non_empty_ratio": 1.0,
            "filled_rows": 16,
            "filled_cols": 4,
            "filled_rows_ratio": 1.0,
            "numeric_like_ratio": 0.328125
          }
        }
      ],
      "filtered_out": {
        "lattice": 0,
        "stream": 4
      },
      "filtered_reasons": {
        "lattice": {},
        "stream": {
          "min_cols": 2,
          "two_col_low_numeric": 1,
          "filled_rows_ratio": 1
        }
      },
      "filter": {
        "min_rows": 2,
        "min_cols": 2,
        "min_non_empty_ratio": 0.2,
        "min_filled_rows": 2,
        "min_filled_cols": 2,
        "min_filled_rows_ratio": 0.5,
        "two_col_min_numeric_like_ratio": 0.35
      },
      "errors": [],
      "ignored_errors": {},
      "pages": "all"
    }
  },
  "images": {
    "dir": "papers/porteretalndpuzzleaboutknowledge/out/images",
    "manifest": "papers/porteretalndpuzzleaboutknowledge/out/images/manifest.json",
    "embedded": {
      "count": 24
    },
    "rendered_pages": {
      "count": 17,
      "pages": [
        1,
        2,
        3,
        4,
        5,
        6,
        7,
        8,
        9,
        10,
        11,
        12,
        13,
        14,
        15,
        16,
        17
      ]
    },
    "figures": {
      "count": 4,
      "pages": [],
      "rendered_pages": []
    }
  },
  "errors": [],
  "markdown": {
    "path": "papers/porteretalndpuzzleaboutknowledge/out/fulltext.md"
  }
}