nielsr/arxiv-chandra-ocr-2-include-images-demo-2604-08626-duplicate-caption-fix-v2-20260416 / 2604.08626 /2604.08626_metadata.json
| { | |
| "elapsed_seconds": 494.95, | |
| "failed_pages": [], | |
| "image_file_count": 13, | |
| "image_files": [ | |
| "images/page-001-d8a3d5757cf72bbaf6e3d3cdabc19729_15_img.webp", | |
| "images/page-010-4a91e1c0bea21f2590c87c3024980996_1_img.webp", | |
| "images/page-013-e9e9bd2bcff327a85d7c5a87f159b363_1_img.webp", | |
| "images/page-018-425b5373f0902973286b76cb90062164_6_img.webp", | |
| "images/page-019-cec07549f3334a6e0cb84d79319b19df_1_img.webp", | |
| "images/page-019-cec07549f3334a6e0cb84d79319b19df_7_img.webp", | |
| "images/page-019-cec07549f3334a6e0cb84d79319b19df_9_img.webp", | |
| "images/page-019-cec07549f3334a6e0cb84d79319b19df_11_img.webp", | |
| "images/page-020-1de4645f7582fc0c2af0ee1ba9494339_5_img.webp", | |
| "images/page-031-ba28b230879924d7bf3b777027a489b4_1_img.webp", | |
| "images/page-032-7ac683cffc8b23a4f9c4bdd3a305a668_4_img.webp", | |
| "images/page-033-53c0587955a088860be10e1c6e8299b0_3_img.webp", | |
| "images/page-033-53c0587955a088860be10e1c6e8299b0_5_img.webp" | |
| ], | |
| "max_pages_per_paper": 200, | |
| "model_id": "datalab-to/chandra-ocr-2", | |
| "num_pages": 33, | |
| "num_pages_processed": 33, | |
| "pages": [ | |
| { | |
| "error": false, | |
| "image_count": 1, | |
| "image_files": [ | |
| "images/page-001-d8a3d5757cf72bbaf6e3d3cdabc19729_15_img.webp" | |
| ], | |
| "num_chunks": 17, | |
| "page_number": 1, | |
| "token_count": 1703 | |
| }, | |
| { | |
| "error": false, | |
| "image_count": 0, | |
| "image_files": [], | |
| "num_chunks": 6, | |
| "page_number": 2, | |
| "token_count": 1363 | |
| }, | |
| { | |
| "error": false, | |
| "image_count": 0, | |
| "image_files": [], | |
| "num_chunks": 8, | |
| "page_number": 3, | |
| "token_count": 1724 | |
| }, | |
| { | |
| "error": false, | |
| "image_count": 0, | |
| "image_files": [], | |
| "num_chunks": 7, | |
| "page_number": 4, | |
| "token_count": 1239 | |
| }, | |
| { | |
| "error": false, | |
| "image_count": 0, | |
| "image_files": [], | |
| "num_chunks": 11, | |
| "page_number": 5, | |
| "token_count": 1606 | |
| }, | |
| { | |
| "error": false, | |
| "image_count": 0, | |
| "image_files": [], | |
| "num_chunks": 14, | |
| "page_number": 6, | |
| "token_count": 1732 | |
| }, | |
| { | |
| "error": false, | |
| "image_count": 0, | |
| "image_files": [], | |
| "num_chunks": 18, | |
| "page_number": 7, | |
| "token_count": 2095 | |
| }, | |
| { | |
| "error": false, | |
| "image_count": 0, | |
| "image_files": [], | |
| "num_chunks": 20, | |
| "page_number": 8, | |
| "token_count": 1995 | |
| }, | |
| { | |
| "error": false, | |
| "image_count": 0, | |
| "image_files": [], | |
| "num_chunks": 10, | |
| "page_number": 9, | |
| "token_count": 1443 | |
| }, | |
| { | |
| "error": false, | |
| "image_count": 1, | |
| "image_files": [ | |
| "images/page-010-4a91e1c0bea21f2590c87c3024980996_1_img.webp" | |
| ], | |
| "num_chunks": 10, | |
| "page_number": 10, | |
| "token_count": 1193 | |
| }, | |
| { | |
| "error": false, | |
| "image_count": 0, | |
| "image_files": [], | |
| "num_chunks": 14, | |
| "page_number": 11, | |
| "token_count": 1598 | |
| }, | |
| { | |
| "error": false, | |
| "image_count": 0, | |
| "image_files": [], | |
| "num_chunks": 12, | |
| "page_number": 12, | |
| "token_count": 2156 | |
| }, | |
| { | |
| "error": false, | |
| "image_count": 1, | |
| "image_files": [ | |
| "images/page-013-e9e9bd2bcff327a85d7c5a87f159b363_1_img.webp" | |
| ], | |
| "num_chunks": 12, | |
| "page_number": 13, | |
| "token_count": 2441 | |
| }, | |
| { | |
| "error": false, | |
| "image_count": 0, | |
| "image_files": [], | |
| "num_chunks": 11, | |
| "page_number": 14, | |
| "token_count": 1852 | |
| }, | |
| { | |
| "error": false, | |
| "image_count": 0, | |
| "image_files": [], | |
| "num_chunks": 13, | |
| "page_number": 15, | |
| "token_count": 2323 | |
| }, | |
| { | |
| "error": false, | |
| "image_count": 0, | |
| "image_files": [], | |
| "num_chunks": 10, | |
| "page_number": 16, | |
| "token_count": 2962 | |
| }, | |
| { | |
| "error": false, | |
| "image_count": 0, | |
| "image_files": [], | |
| "num_chunks": 14, | |
| "page_number": 17, | |
| "token_count": 2480 | |
| }, | |
| { | |
| "error": false, | |
| "image_count": 1, | |
| "image_files": [ | |
| "images/page-018-425b5373f0902973286b76cb90062164_6_img.webp" | |
| ], | |
| "num_chunks": 8, | |
| "page_number": 18, | |
| "token_count": 1113 | |
| }, | |
| { | |
| "error": false, | |
| "image_count": 4, | |
| "image_files": [ | |
| "images/page-019-cec07549f3334a6e0cb84d79319b19df_1_img.webp", | |
| "images/page-019-cec07549f3334a6e0cb84d79319b19df_7_img.webp", | |
| "images/page-019-cec07549f3334a6e0cb84d79319b19df_9_img.webp", | |
| "images/page-019-cec07549f3334a6e0cb84d79319b19df_11_img.webp" | |
| ], | |
| "num_chunks": 14, | |
| "page_number": 19, | |
| "token_count": 1088 | |
| }, | |
| { | |
| "error": false, | |
| "image_count": 1, | |
| "image_files": [ | |
| "images/page-020-1de4645f7582fc0c2af0ee1ba9494339_5_img.webp" | |
| ], | |
| "num_chunks": 7, | |
| "page_number": 20, | |
| "token_count": 1087 | |
| }, | |
| { | |
| "error": false, | |
| "image_count": 0, | |
| "image_files": [], | |
| "num_chunks": 6, | |
| "page_number": 21, | |
| "token_count": 1327 | |
| }, | |
| { | |
| "error": false, | |
| "image_count": 0, | |
| "image_files": [], | |
| "num_chunks": 14, | |
| "page_number": 22, | |
| "token_count": 1372 | |
| }, | |
| { | |
| "error": false, | |
| "image_count": 0, | |
| "image_files": [], | |
| "num_chunks": 4, | |
| "page_number": 23, | |
| "token_count": 265 | |
| }, | |
| { | |
| "error": false, | |
| "image_count": 0, | |
| "image_files": [], | |
| "num_chunks": 3, | |
| "page_number": 24, | |
| "token_count": 2345 | |
| }, | |
| { | |
| "error": false, | |
| "image_count": 0, | |
| "image_files": [], | |
| "num_chunks": 2, | |
| "page_number": 25, | |
| "token_count": 2272 | |
| }, | |
| { | |
| "error": false, | |
| "image_count": 0, | |
| "image_files": [], | |
| "num_chunks": 2, | |
| "page_number": 26, | |
| "token_count": 2433 | |
| }, | |
| { | |
| "error": false, | |
| "image_count": 0, | |
| "image_files": [], | |
| "num_chunks": 2, | |
| "page_number": 27, | |
| "token_count": 1956 | |
| }, | |
| { | |
| "error": false, | |
| "image_count": 0, | |
| "image_files": [], | |
| "num_chunks": 22, | |
| "page_number": 28, | |
| "token_count": 1754 | |
| }, | |
| { | |
| "error": false, | |
| "image_count": 0, | |
| "image_files": [], | |
| "num_chunks": 19, | |
| "page_number": 29, | |
| "token_count": 1924 | |
| }, | |
| { | |
| "error": false, | |
| "image_count": 0, | |
| "image_files": [], | |
| "num_chunks": 16, | |
| "page_number": 30, | |
| "token_count": 1952 | |
| }, | |
| { | |
| "error": false, | |
| "image_count": 1, | |
| "image_files": [ | |
| "images/page-031-ba28b230879924d7bf3b777027a489b4_1_img.webp" | |
| ], | |
| "num_chunks": 9, | |
| "page_number": 31, | |
| "token_count": 1489 | |
| }, | |
| { | |
| "error": false, | |
| "image_count": 1, | |
| "image_files": [ | |
| "images/page-032-7ac683cffc8b23a4f9c4bdd3a305a668_4_img.webp" | |
| ], | |
| "num_chunks": 6, | |
| "page_number": 32, | |
| "token_count": 491 | |
| }, | |
| { | |
| "error": false, | |
| "image_count": 2, | |
| "image_files": [ | |
| "images/page-033-53c0587955a088860be10e1c6e8299b0_3_img.webp", | |
| "images/page-033-53c0587955a088860be10e1c6e8299b0_5_img.webp" | |
| ], | |
| "num_chunks": 7, | |
| "page_number": 33, | |
| "token_count": 853 | |
| } | |
| ], | |
| "pages_with_images": 9, | |
| "paper_id": "2604.08626", | |
| "paper_url": "https://arxiv.org/abs/2604.08626", | |
| "pdf_exceeds_page_limit": false, | |
| "pdf_url": "https://arxiv.org/pdf/2604.08626.pdf", | |
| "processed_at": "2026-04-16T10:12:32.503852+00:00", | |
| "prompt_type": "ocr_layout", | |
| "script_version": "2026-04-16.3", | |
| "status": "success" | |
| } |
Xet Storage Details
- Size:
- 7.65 kB
- Xet hash:
- f3994efc15113a3eed3f1169253ee8adc420609342285b02a078be49102013c1
·
Xet efficiently stores files, intelligently splitting them into unique chunks and accelerating uploads and downloads. More info.