sripadastanley2012empiricaltestsinterest
/data/papers/sripadastanley2012empiricaltestsinterest/out/bundle.json
{
  "created_at": "2026-01-19T11:42:56.452406+00:00",
  "paper_dir": "papers/sripadastanley2012empiricaltestsinterest",
  "pdf": {
    "path": "papers/sripadastanley2012empiricaltestsinterest/pdf/paper.pdf"
  },
  "tool_versions": {
    "python": "3.14.2",
    "meta-extract": "0.1.0",
    "requests": "2.32.5",
    "lxml": "6.0.2",
    "pandas": "2.3.3",
    "pypdf": "5.9.0",
    "pypdfium2": "5.3.0",
    "pillow": "12.1.0",
    "grobid-client-python": "0.1.4",
    "camelot-py": "1.0.9",
    "tabula-py": "2.10.0"
  },
  "status": "ok",
  "grobid": {
    "url": "http://localhost:8070",
    "tei_path": "papers/sripadastanley2012empiricaltestsinterest/out/tei.xml"
  },
  "text": {
    "path": "papers/sripadastanley2012empiricaltestsinterest/out/text.txt"
  },
  "tables": {
    "out_dir": "papers/sripadastanley2012empiricaltestsinterest/out/tables",
    "camelot": {
      "stream": [
        {
          "page": "22",
          "index": 1,
          "csv_path": "papers/sripadastanley2012empiricaltestsinterest/out/tables/camelot_stream_p22_t1.csv",
          "shape": [
            7,
            5
          ],
          "stats": {
            "rows": 7,
            "cols": 5,
            "non_empty_cells": 18,
            "non_empty_ratio": 0.5142857142857142,
            "filled_rows": 5,
            "filled_cols": 5,
            "filled_rows_ratio": 0.7142857142857143,
            "numeric_like_ratio": 0.05555555555555555
          },
          "parsing_report": {
            "accuracy": 87.7,
            "whitespace": 48.57,
            "order": 2,
            "page": 22
          }
        }
      ],
      "lattice": [],
      "filtered_out": {
        "stream": 30,
        "lattice": 0
      },
      "filtered_reasons": {
        "stream": {
          "min_cols": 20,
          "filled_rows": 7,
          "filled_rows_ratio": 3
        },
        "lattice": {}
      },
      "filter": {
        "min_rows": 2,
        "min_cols": 2,
        "min_non_empty_ratio": 0.2,
        "min_filled_rows": 2,
        "min_filled_cols": 2,
        "min_filled_rows_ratio": 0.5,
        "two_col_min_numeric_like_ratio": 0.35
      },
      "errors": []
    },
    "tabula": {
      "lattice": [],
      "stream": [],
      "filtered_out": {
        "lattice": 0,
        "stream": 6
      },
      "filtered_reasons": {
        "lattice": {},
        "stream": {
          "filled_rows": 3,
          "min_cols": 3
        }
      },
      "filter": {
        "min_rows": 2,
        "min_cols": 2,
        "min_non_empty_ratio": 0.2,
        "min_filled_rows": 2,
        "min_filled_cols": 2,
        "min_filled_rows_ratio": 0.5,
        "two_col_min_numeric_like_ratio": 0.35
      },
      "errors": [],
      "ignored_errors": {},
      "pages": "all"
    }
  },
  "images": {
    "dir": "papers/sripadastanley2012empiricaltestsinterest/out/images",
    "manifest": "papers/sripadastanley2012empiricaltestsinterest/out/images/manifest.json",
    "embedded": {
      "count": 4
    },
    "rendered_pages": {
      "count": 4,
      "pages": [
        1,
        9,
        13,
        14
      ]
    },
    "figures": {
      "count": 5,
      "pages": [
        9,
        13,
        14
      ],
      "rendered_pages": [
        9,
        13,
        14
      ]
    }
  },
  "errors": [],
  "markdown": {
    "path": "papers/sripadastanley2012empiricaltestsinterest/out/fulltext.md"
  }
}