nielsr/arxiv-chandra-ocr-2-include-images-demo-2604-08626-duplicate-caption-fix-20260416 / 2604.08626 /2604.08626_metadata.json
| { | |
| "elapsed_seconds": 761.61, | |
| "failed_pages": [], | |
| "image_file_count": 13, | |
| "image_files": [ | |
| "images/page-001-e4fa572fe03d87e9b0ec0f50011c4b0c_15_img.webp", | |
| "images/page-010-50697b74765f1f12205507327f8dba19_1_img.webp", | |
| "images/page-013-c12c65d4cc7192bdda37bab1f33607ac_1_img.webp", | |
| "images/page-018-7260ae3ee5287c1cc3046a3189f5e9e9_6_img.webp", | |
| "images/page-019-fced306a057e37b86c776666826a8d80_1_img.webp", | |
| "images/page-019-fced306a057e37b86c776666826a8d80_7_img.webp", | |
| "images/page-019-fced306a057e37b86c776666826a8d80_9_img.webp", | |
| "images/page-019-fced306a057e37b86c776666826a8d80_11_img.webp", | |
| "images/page-020-335ea2bc15a94d0256416ee66a7e04a6_5_img.webp", | |
| "images/page-031-a67bee2cc4eb1e8be8a8613450dd7c4a_1_img.webp", | |
| "images/page-032-69b10895cf19b5d757c56e4329946dd5_4_img.webp", | |
| "images/page-033-773237c979d59f81cbb4f7d463570c48_3_img.webp", | |
| "images/page-033-773237c979d59f81cbb4f7d463570c48_5_img.webp" | |
| ], | |
| "max_pages_per_paper": 200, | |
| "model_id": "datalab-to/chandra-ocr-2", | |
| "num_pages": 33, | |
| "num_pages_processed": 33, | |
| "pages": [ | |
| { | |
| "error": false, | |
| "image_count": 1, | |
| "image_files": [ | |
| "images/page-001-e4fa572fe03d87e9b0ec0f50011c4b0c_15_img.webp" | |
| ], | |
| "num_chunks": 17, | |
| "page_number": 1, | |
| "token_count": 1703 | |
| }, | |
| { | |
| "error": false, | |
| "image_count": 0, | |
| "image_files": [], | |
| "num_chunks": 6, | |
| "page_number": 2, | |
| "token_count": 1389 | |
| }, | |
| { | |
| "error": false, | |
| "image_count": 0, | |
| "image_files": [], | |
| "num_chunks": 8, | |
| "page_number": 3, | |
| "token_count": 1724 | |
| }, | |
| { | |
| "error": false, | |
| "image_count": 0, | |
| "image_files": [], | |
| "num_chunks": 7, | |
| "page_number": 4, | |
| "token_count": 1338 | |
| }, | |
| { | |
| "error": false, | |
| "image_count": 0, | |
| "image_files": [], | |
| "num_chunks": 11, | |
| "page_number": 5, | |
| "token_count": 1606 | |
| }, | |
| { | |
| "error": false, | |
| "image_count": 0, | |
| "image_files": [], | |
| "num_chunks": 14, | |
| "page_number": 6, | |
| "token_count": 1732 | |
| }, | |
| { | |
| "error": false, | |
| "image_count": 0, | |
| "image_files": [], | |
| "num_chunks": 18, | |
| "page_number": 7, | |
| "token_count": 2095 | |
| }, | |
| { | |
| "error": false, | |
| "image_count": 0, | |
| "image_files": [], | |
| "num_chunks": 20, | |
| "page_number": 8, | |
| "token_count": 1995 | |
| }, | |
| { | |
| "error": false, | |
| "image_count": 0, | |
| "image_files": [], | |
| "num_chunks": 10, | |
| "page_number": 9, | |
| "token_count": 1455 | |
| }, | |
| { | |
| "error": false, | |
| "image_count": 1, | |
| "image_files": [ | |
| "images/page-010-50697b74765f1f12205507327f8dba19_1_img.webp" | |
| ], | |
| "num_chunks": 10, | |
| "page_number": 10, | |
| "token_count": 1193 | |
| }, | |
| { | |
| "error": false, | |
| "image_count": 0, | |
| "image_files": [], | |
| "num_chunks": 14, | |
| "page_number": 11, | |
| "token_count": 1598 | |
| }, | |
| { | |
| "error": false, | |
| "image_count": 0, | |
| "image_files": [], | |
| "num_chunks": 12, | |
| "page_number": 12, | |
| "token_count": 2156 | |
| }, | |
| { | |
| "error": false, | |
| "image_count": 1, | |
| "image_files": [ | |
| "images/page-013-c12c65d4cc7192bdda37bab1f33607ac_1_img.webp" | |
| ], | |
| "num_chunks": 12, | |
| "page_number": 13, | |
| "token_count": 2441 | |
| }, | |
| { | |
| "error": false, | |
| "image_count": 0, | |
| "image_files": [], | |
| "num_chunks": 11, | |
| "page_number": 14, | |
| "token_count": 1852 | |
| }, | |
| { | |
| "error": false, | |
| "image_count": 0, | |
| "image_files": [], | |
| "num_chunks": 13, | |
| "page_number": 15, | |
| "token_count": 2323 | |
| }, | |
| { | |
| "error": false, | |
| "image_count": 0, | |
| "image_files": [], | |
| "num_chunks": 10, | |
| "page_number": 16, | |
| "token_count": 2962 | |
| }, | |
| { | |
| "error": false, | |
| "image_count": 0, | |
| "image_files": [], | |
| "num_chunks": 14, | |
| "page_number": 17, | |
| "token_count": 2480 | |
| }, | |
| { | |
| "error": false, | |
| "image_count": 1, | |
| "image_files": [ | |
| "images/page-018-7260ae3ee5287c1cc3046a3189f5e9e9_6_img.webp" | |
| ], | |
| "num_chunks": 8, | |
| "page_number": 18, | |
| "token_count": 1100 | |
| }, | |
| { | |
| "error": false, | |
| "image_count": 4, | |
| "image_files": [ | |
| "images/page-019-fced306a057e37b86c776666826a8d80_1_img.webp", | |
| "images/page-019-fced306a057e37b86c776666826a8d80_7_img.webp", | |
| "images/page-019-fced306a057e37b86c776666826a8d80_9_img.webp", | |
| "images/page-019-fced306a057e37b86c776666826a8d80_11_img.webp" | |
| ], | |
| "num_chunks": 14, | |
| "page_number": 19, | |
| "token_count": 1131 | |
| }, | |
| { | |
| "error": false, | |
| "image_count": 1, | |
| "image_files": [ | |
| "images/page-020-335ea2bc15a94d0256416ee66a7e04a6_5_img.webp" | |
| ], | |
| "num_chunks": 7, | |
| "page_number": 20, | |
| "token_count": 1075 | |
| }, | |
| { | |
| "error": false, | |
| "image_count": 0, | |
| "image_files": [], | |
| "num_chunks": 6, | |
| "page_number": 21, | |
| "token_count": 1327 | |
| }, | |
| { | |
| "error": false, | |
| "image_count": 0, | |
| "image_files": [], | |
| "num_chunks": 14, | |
| "page_number": 22, | |
| "token_count": 1372 | |
| }, | |
| { | |
| "error": false, | |
| "image_count": 0, | |
| "image_files": [], | |
| "num_chunks": 4, | |
| "page_number": 23, | |
| "token_count": 265 | |
| }, | |
| { | |
| "error": false, | |
| "image_count": 0, | |
| "image_files": [], | |
| "num_chunks": 3, | |
| "page_number": 24, | |
| "token_count": 2345 | |
| }, | |
| { | |
| "error": false, | |
| "image_count": 0, | |
| "image_files": [], | |
| "num_chunks": 2, | |
| "page_number": 25, | |
| "token_count": 2272 | |
| }, | |
| { | |
| "error": false, | |
| "image_count": 0, | |
| "image_files": [], | |
| "num_chunks": 2, | |
| "page_number": 26, | |
| "token_count": 2433 | |
| }, | |
| { | |
| "error": false, | |
| "image_count": 0, | |
| "image_files": [], | |
| "num_chunks": 2, | |
| "page_number": 27, | |
| "token_count": 1956 | |
| }, | |
| { | |
| "error": false, | |
| "image_count": 0, | |
| "image_files": [], | |
| "num_chunks": 22, | |
| "page_number": 28, | |
| "token_count": 1754 | |
| }, | |
| { | |
| "error": false, | |
| "image_count": 0, | |
| "image_files": [], | |
| "num_chunks": 19, | |
| "page_number": 29, | |
| "token_count": 1926 | |
| }, | |
| { | |
| "error": false, | |
| "image_count": 0, | |
| "image_files": [], | |
| "num_chunks": 16, | |
| "page_number": 30, | |
| "token_count": 1952 | |
| }, | |
| { | |
| "error": false, | |
| "image_count": 1, | |
| "image_files": [ | |
| "images/page-031-a67bee2cc4eb1e8be8a8613450dd7c4a_1_img.webp" | |
| ], | |
| "num_chunks": 9, | |
| "page_number": 31, | |
| "token_count": 1489 | |
| }, | |
| { | |
| "error": false, | |
| "image_count": 1, | |
| "image_files": [ | |
| "images/page-032-69b10895cf19b5d757c56e4329946dd5_4_img.webp" | |
| ], | |
| "num_chunks": 6, | |
| "page_number": 32, | |
| "token_count": 553 | |
| }, | |
| { | |
| "error": false, | |
| "image_count": 2, | |
| "image_files": [ | |
| "images/page-033-773237c979d59f81cbb4f7d463570c48_3_img.webp", | |
| "images/page-033-773237c979d59f81cbb4f7d463570c48_5_img.webp" | |
| ], | |
| "num_chunks": 7, | |
| "page_number": 33, | |
| "token_count": 970 | |
| } | |
| ], | |
| "pages_with_images": 9, | |
| "paper_id": "2604.08626", | |
| "paper_url": "https://arxiv.org/abs/2604.08626", | |
| "pdf_exceeds_page_limit": false, | |
| "pdf_url": "https://arxiv.org/pdf/2604.08626.pdf", | |
| "processed_at": "2026-04-16T10:00:19.253747+00:00", | |
| "prompt_type": "ocr_layout", | |
| "script_version": "2026-04-16.2", | |
| "status": "success" | |
| } |
Xet Storage Details
- Size:
- 7.65 kB
- Xet hash:
- 67d9399960226e1f9ef2f4716d5bfabdd9b451b61d3d8a78a20e0128ce91e304
·
Xet efficiently stores files, intelligently splitting them into unique chunks and accelerating uploads and downloads. More info.