nielsr/arxiv-chandra-ocr-2-include-images-demo-2604-08626-spacing-fix-v2-20260416 / 2604.08626 /2604.08626_metadata.json
| { | |
| "elapsed_seconds": 494.38, | |
| "failed_pages": [], | |
| "image_file_count": 13, | |
| "image_files": [ | |
| "images/page-001-55630241b036bf047e7cf52e082403ba_15_img.webp", | |
| "images/page-010-5a648852d523f787f68af04863ee55ce_1_img.webp", | |
| "images/page-013-32f5d64141b1ef58cfc2fa7677297999_1_img.webp", | |
| "images/page-018-c6495b5fdd93af46bbd49d9b08d63bd0_6_img.webp", | |
| "images/page-019-82ecac038b5b76c040da2d859190f7a4_1_img.webp", | |
| "images/page-019-82ecac038b5b76c040da2d859190f7a4_7_img.webp", | |
| "images/page-019-82ecac038b5b76c040da2d859190f7a4_9_img.webp", | |
| "images/page-019-82ecac038b5b76c040da2d859190f7a4_11_img.webp", | |
| "images/page-020-6c6ca935f7deb56cb5e502dec1b3f423_5_img.webp", | |
| "images/page-031-d84d510c0ccc79fd228c1cc2b91114ae_1_img.webp", | |
| "images/page-032-30ef5fcaccc98aa89bbc49752f2b082c_4_img.webp", | |
| "images/page-033-6e2a40b630398e1bbaee602a688c539a_3_img.webp", | |
| "images/page-033-6e2a40b630398e1bbaee602a688c539a_5_img.webp" | |
| ], | |
| "max_pages_per_paper": 200, | |
| "model_id": "datalab-to/chandra-ocr-2", | |
| "num_pages": 33, | |
| "num_pages_processed": 33, | |
| "pages": [ | |
| { | |
| "error": false, | |
| "image_count": 1, | |
| "image_files": [ | |
| "images/page-001-55630241b036bf047e7cf52e082403ba_15_img.webp" | |
| ], | |
| "num_chunks": 17, | |
| "page_number": 1, | |
| "token_count": 1703 | |
| }, | |
| { | |
| "error": false, | |
| "image_count": 0, | |
| "image_files": [], | |
| "num_chunks": 6, | |
| "page_number": 2, | |
| "token_count": 1411 | |
| }, | |
| { | |
| "error": false, | |
| "image_count": 0, | |
| "image_files": [], | |
| "num_chunks": 8, | |
| "page_number": 3, | |
| "token_count": 1724 | |
| }, | |
| { | |
| "error": false, | |
| "image_count": 0, | |
| "image_files": [], | |
| "num_chunks": 7, | |
| "page_number": 4, | |
| "token_count": 1338 | |
| }, | |
| { | |
| "error": false, | |
| "image_count": 0, | |
| "image_files": [], | |
| "num_chunks": 11, | |
| "page_number": 5, | |
| "token_count": 1606 | |
| }, | |
| { | |
| "error": false, | |
| "image_count": 0, | |
| "image_files": [], | |
| "num_chunks": 14, | |
| "page_number": 6, | |
| "token_count": 1732 | |
| }, | |
| { | |
| "error": false, | |
| "image_count": 0, | |
| "image_files": [], | |
| "num_chunks": 18, | |
| "page_number": 7, | |
| "token_count": 2095 | |
| }, | |
| { | |
| "error": false, | |
| "image_count": 0, | |
| "image_files": [], | |
| "num_chunks": 20, | |
| "page_number": 8, | |
| "token_count": 1995 | |
| }, | |
| { | |
| "error": false, | |
| "image_count": 0, | |
| "image_files": [], | |
| "num_chunks": 10, | |
| "page_number": 9, | |
| "token_count": 1455 | |
| }, | |
| { | |
| "error": false, | |
| "image_count": 1, | |
| "image_files": [ | |
| "images/page-010-5a648852d523f787f68af04863ee55ce_1_img.webp" | |
| ], | |
| "num_chunks": 10, | |
| "page_number": 10, | |
| "token_count": 1193 | |
| }, | |
| { | |
| "error": false, | |
| "image_count": 0, | |
| "image_files": [], | |
| "num_chunks": 14, | |
| "page_number": 11, | |
| "token_count": 1598 | |
| }, | |
| { | |
| "error": false, | |
| "image_count": 0, | |
| "image_files": [], | |
| "num_chunks": 12, | |
| "page_number": 12, | |
| "token_count": 2156 | |
| }, | |
| { | |
| "error": false, | |
| "image_count": 1, | |
| "image_files": [ | |
| "images/page-013-32f5d64141b1ef58cfc2fa7677297999_1_img.webp" | |
| ], | |
| "num_chunks": 12, | |
| "page_number": 13, | |
| "token_count": 2441 | |
| }, | |
| { | |
| "error": false, | |
| "image_count": 0, | |
| "image_files": [], | |
| "num_chunks": 11, | |
| "page_number": 14, | |
| "token_count": 1852 | |
| }, | |
| { | |
| "error": false, | |
| "image_count": 0, | |
| "image_files": [], | |
| "num_chunks": 13, | |
| "page_number": 15, | |
| "token_count": 2323 | |
| }, | |
| { | |
| "error": false, | |
| "image_count": 0, | |
| "image_files": [], | |
| "num_chunks": 10, | |
| "page_number": 16, | |
| "token_count": 2962 | |
| }, | |
| { | |
| "error": false, | |
| "image_count": 0, | |
| "image_files": [], | |
| "num_chunks": 14, | |
| "page_number": 17, | |
| "token_count": 2480 | |
| }, | |
| { | |
| "error": false, | |
| "image_count": 1, | |
| "image_files": [ | |
| "images/page-018-c6495b5fdd93af46bbd49d9b08d63bd0_6_img.webp" | |
| ], | |
| "num_chunks": 8, | |
| "page_number": 18, | |
| "token_count": 1108 | |
| }, | |
| { | |
| "error": false, | |
| "image_count": 4, | |
| "image_files": [ | |
| "images/page-019-82ecac038b5b76c040da2d859190f7a4_1_img.webp", | |
| "images/page-019-82ecac038b5b76c040da2d859190f7a4_7_img.webp", | |
| "images/page-019-82ecac038b5b76c040da2d859190f7a4_9_img.webp", | |
| "images/page-019-82ecac038b5b76c040da2d859190f7a4_11_img.webp" | |
| ], | |
| "num_chunks": 14, | |
| "page_number": 19, | |
| "token_count": 1088 | |
| }, | |
| { | |
| "error": false, | |
| "image_count": 1, | |
| "image_files": [ | |
| "images/page-020-6c6ca935f7deb56cb5e502dec1b3f423_5_img.webp" | |
| ], | |
| "num_chunks": 7, | |
| "page_number": 20, | |
| "token_count": 1193 | |
| }, | |
| { | |
| "error": false, | |
| "image_count": 0, | |
| "image_files": [], | |
| "num_chunks": 6, | |
| "page_number": 21, | |
| "token_count": 1327 | |
| }, | |
| { | |
| "error": false, | |
| "image_count": 0, | |
| "image_files": [], | |
| "num_chunks": 14, | |
| "page_number": 22, | |
| "token_count": 1372 | |
| }, | |
| { | |
| "error": false, | |
| "image_count": 0, | |
| "image_files": [], | |
| "num_chunks": 4, | |
| "page_number": 23, | |
| "token_count": 265 | |
| }, | |
| { | |
| "error": false, | |
| "image_count": 0, | |
| "image_files": [], | |
| "num_chunks": 3, | |
| "page_number": 24, | |
| "token_count": 2345 | |
| }, | |
| { | |
| "error": false, | |
| "image_count": 0, | |
| "image_files": [], | |
| "num_chunks": 2, | |
| "page_number": 25, | |
| "token_count": 2272 | |
| }, | |
| { | |
| "error": false, | |
| "image_count": 0, | |
| "image_files": [], | |
| "num_chunks": 2, | |
| "page_number": 26, | |
| "token_count": 2433 | |
| }, | |
| { | |
| "error": false, | |
| "image_count": 0, | |
| "image_files": [], | |
| "num_chunks": 2, | |
| "page_number": 27, | |
| "token_count": 1956 | |
| }, | |
| { | |
| "error": false, | |
| "image_count": 0, | |
| "image_files": [], | |
| "num_chunks": 22, | |
| "page_number": 28, | |
| "token_count": 1754 | |
| }, | |
| { | |
| "error": false, | |
| "image_count": 0, | |
| "image_files": [], | |
| "num_chunks": 19, | |
| "page_number": 29, | |
| "token_count": 1924 | |
| }, | |
| { | |
| "error": false, | |
| "image_count": 0, | |
| "image_files": [], | |
| "num_chunks": 16, | |
| "page_number": 30, | |
| "token_count": 1952 | |
| }, | |
| { | |
| "error": false, | |
| "image_count": 1, | |
| "image_files": [ | |
| "images/page-031-d84d510c0ccc79fd228c1cc2b91114ae_1_img.webp" | |
| ], | |
| "num_chunks": 9, | |
| "page_number": 31, | |
| "token_count": 1489 | |
| }, | |
| { | |
| "error": false, | |
| "image_count": 1, | |
| "image_files": [ | |
| "images/page-032-30ef5fcaccc98aa89bbc49752f2b082c_4_img.webp" | |
| ], | |
| "num_chunks": 6, | |
| "page_number": 32, | |
| "token_count": 469 | |
| }, | |
| { | |
| "error": false, | |
| "image_count": 2, | |
| "image_files": [ | |
| "images/page-033-6e2a40b630398e1bbaee602a688c539a_3_img.webp", | |
| "images/page-033-6e2a40b630398e1bbaee602a688c539a_5_img.webp" | |
| ], | |
| "num_chunks": 7, | |
| "page_number": 33, | |
| "token_count": 849 | |
| } | |
| ], | |
| "pages_with_images": 9, | |
| "paper_id": "2604.08626", | |
| "paper_url": "https://arxiv.org/abs/2604.08626", | |
| "pdf_exceeds_page_limit": false, | |
| "pdf_url": "https://arxiv.org/pdf/2604.08626.pdf", | |
| "processed_at": "2026-04-16T09:15:30.896239+00:00", | |
| "prompt_type": "ocr_layout", | |
| "script_version": "2026-04-16.1", | |
| "status": "success" | |
| } |
Xet Storage Details
- Size:
- 7.65 kB
- Xet hash:
- 19dabe1ff310a9bea2309bd7353c234477c4ccf50d80dc22eead7e385d1c0d06
·
Xet efficiently stores files, intelligently splitting them into unique chunks and accelerating uploads and downloads. More info.