{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2026:G42JQESY3FNWCJSYNA6VNHWSVJ","short_pith_number":"pith:G42JQESY","canonical_record":{"source":{"id":"2605.22100","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by-nc-sa/4.0/","primary_cat":"cs.AI","submitted_at":"2026-05-21T07:36:41Z","cross_cats_sorted":[],"title_canon_sha256":"71fd11977fb1264365fe2ac73575a350778e08c86156722e4b1e5b0bca68d733","abstract_canon_sha256":"cd9ea6e5d1e0aad747e886ba8717c6b620d439854eb3d0d15f32329f6ac4bfc5"},"schema_version":"1.0"},"canonical_sha256":"3734981258d95b612658683d569ed2aa5f0a50f9e9fed787765972521d57ddde","source":{"kind":"arxiv","id":"2605.22100","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2605.22100","created_at":"2026-05-22T01:04:25Z"},{"alias_kind":"arxiv_version","alias_value":"2605.22100v1","created_at":"2026-05-22T01:04:25Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.22100","created_at":"2026-05-22T01:04:25Z"},{"alias_kind":"pith_short_12","alias_value":"G42JQESY3FNW","created_at":"2026-05-22T01:04:25Z"},{"alias_kind":"pith_short_16","alias_value":"G42JQESY3FNWCJSY","created_at":"2026-05-22T01:04:25Z"},{"alias_kind":"pith_short_8","alias_value":"G42JQESY","created_at":"2026-05-22T01:04:25Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2026:G42JQESY3FNWCJSYNA6VNHWSVJ","target":"record","payload":{"canonical_record":{"source":{"id":"2605.22100","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by-nc-sa/4.0/","primary_cat":"cs.AI","submitted_at":"2026-05-21T07:36:41Z","cross_cats_sorted":[],"title_canon_sha256":"71fd11977fb1264365fe2ac73575a350778e08c86156722e4b1e5b0bca68d733","abstract_canon_sha256":"cd9ea6e5d1e0aad747e886ba8717c6b620d439854eb3d0d15f32329f6ac4bfc5"},"schema_version":"1.0"},"canonical_sha256":"3734981258d95b612658683d569ed2aa5f0a50f9e9fed787765972521d57ddde","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-22T01:04:25.764167Z","signature_b64":"5rJxA9UsiwExdfUZpHWQCoNKznyZsFvJY9+AXTjqlXx7h49A4DekCYPsiGK2Ly4O848TBKoIoR5Xb5q49JFRBA==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"3734981258d95b612658683d569ed2aa5f0a50f9e9fed787765972521d57ddde","last_reissued_at":"2026-05-22T01:04:25.763474Z","signature_status":"signed_v1","first_computed_at":"2026-05-22T01:04:25.763474Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2605.22100","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-22T01:04:25Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"4CgbhG7iJ2OeQwyxu2YpI/BsHFZbBuTRH8nobatBdhliiepvNpgNlenWaj6Jl/e293Y8pWM+QXXl5laAm34UDQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-24T18:45:21.718234Z"},"content_sha256":"e090484ae9879299000f7d2a86ff5e8d072a9aa427a77bb5e4dc01929e55ec95","schema_version":"1.0","event_id":"sha256:e090484ae9879299000f7d2a86ff5e8d072a9aa427a77bb5e4dc01929e55ec95"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2026:G42JQESY3FNWCJSYNA6VNHWSVJ","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"MPDocBench-Parse: Benchmarking Practical Multi-page Document Parsing","license":"http://creativecommons.org/licenses/by-nc-sa/4.0/","headline":"","cross_cats":[],"primary_cat":"cs.AI","authors_text":"Bangbang Zhou, Feiyu Gao, Hangdi Xing, Hongtao Xie, Jianjun Xu, Jieping Ye, Ming Yan, Qi Zheng, Shuai Bai, Yifan Chen, Zhibo Yang","submitted_at":"2026-05-21T07:36:41Z","abstract_excerpt":"Document parsing converts visually rich documents into machine-readable structured representations, forming a crucial foundation for information systems. Although many benchmarks have been proposed for document parsing, they remain inadequate for realistic scenarios. Existing benchmarks either focus on specific tasks or assess only single-page, text-centric settings, making them insufficient for practical multi-page parsing. Moreover, they lack fine-grained evaluation of semantic continuity, hierarchical structure recovery, and visual content preservation. To address these gaps, we propose MPD"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2605.22100","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2605.22100/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-22T01:04:25Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"9PYAPhG4CiKisyv4aYOcxMf6ppXlDITsakHaTMAHOsh1oef9PaWi1xxk5Dwai4ofAeua4jPXJFAOyP8puMwpDA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-24T18:45:21.718989Z"},"content_sha256":"48704812a08cdc7d9234caed625106c1d8a48e47644d7f05dc49e9b835959585","schema_version":"1.0","event_id":"sha256:48704812a08cdc7d9234caed625106c1d8a48e47644d7f05dc49e9b835959585"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/G42JQESY3FNWCJSYNA6VNHWSVJ/bundle.json","state_url":"https://pith.science/pith/G42JQESY3FNWCJSYNA6VNHWSVJ/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/G42JQESY3FNWCJSYNA6VNHWSVJ/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-24T18:45:21Z","links":{"resolver":"https://pith.science/pith/G42JQESY3FNWCJSYNA6VNHWSVJ","bundle":"https://pith.science/pith/G42JQESY3FNWCJSYNA6VNHWSVJ/bundle.json","state":"https://pith.science/pith/G42JQESY3FNWCJSYNA6VNHWSVJ/state.json","well_known_bundle":"https://pith.science/.well-known/pith/G42JQESY3FNWCJSYNA6VNHWSVJ/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:G42JQESY3FNWCJSYNA6VNHWSVJ","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"cd9ea6e5d1e0aad747e886ba8717c6b620d439854eb3d0d15f32329f6ac4bfc5","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by-nc-sa/4.0/","primary_cat":"cs.AI","submitted_at":"2026-05-21T07:36:41Z","title_canon_sha256":"71fd11977fb1264365fe2ac73575a350778e08c86156722e4b1e5b0bca68d733"},"schema_version":"1.0","source":{"id":"2605.22100","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2605.22100","created_at":"2026-05-22T01:04:25Z"},{"alias_kind":"arxiv_version","alias_value":"2605.22100v1","created_at":"2026-05-22T01:04:25Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.22100","created_at":"2026-05-22T01:04:25Z"},{"alias_kind":"pith_short_12","alias_value":"G42JQESY3FNW","created_at":"2026-05-22T01:04:25Z"},{"alias_kind":"pith_short_16","alias_value":"G42JQESY3FNWCJSY","created_at":"2026-05-22T01:04:25Z"},{"alias_kind":"pith_short_8","alias_value":"G42JQESY","created_at":"2026-05-22T01:04:25Z"}],"graph_snapshots":[{"event_id":"sha256:48704812a08cdc7d9234caed625106c1d8a48e47644d7f05dc49e9b835959585","target":"graph","created_at":"2026-05-22T01:04:25Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2605.22100/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Document parsing converts visually rich documents into machine-readable structured representations, forming a crucial foundation for information systems. Although many benchmarks have been proposed for document parsing, they remain inadequate for realistic scenarios. Existing benchmarks either focus on specific tasks or assess only single-page, text-centric settings, making them insufficient for practical multi-page parsing. Moreover, they lack fine-grained evaluation of semantic continuity, hierarchical structure recovery, and visual content preservation. To address these gaps, we propose MPD","authors_text":"Bangbang Zhou, Feiyu Gao, Hangdi Xing, Hongtao Xie, Jianjun Xu, Jieping Ye, Ming Yan, Qi Zheng, Shuai Bai, Yifan Chen, Zhibo Yang","cross_cats":[],"headline":"","license":"http://creativecommons.org/licenses/by-nc-sa/4.0/","primary_cat":"cs.AI","submitted_at":"2026-05-21T07:36:41Z","title":"MPDocBench-Parse: Benchmarking Practical Multi-page Document Parsing"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2605.22100","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:e090484ae9879299000f7d2a86ff5e8d072a9aa427a77bb5e4dc01929e55ec95","target":"record","created_at":"2026-05-22T01:04:25Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"cd9ea6e5d1e0aad747e886ba8717c6b620d439854eb3d0d15f32329f6ac4bfc5","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by-nc-sa/4.0/","primary_cat":"cs.AI","submitted_at":"2026-05-21T07:36:41Z","title_canon_sha256":"71fd11977fb1264365fe2ac73575a350778e08c86156722e4b1e5b0bca68d733"},"schema_version":"1.0","source":{"id":"2605.22100","kind":"arxiv","version":1}},"canonical_sha256":"3734981258d95b612658683d569ed2aa5f0a50f9e9fed787765972521d57ddde","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"3734981258d95b612658683d569ed2aa5f0a50f9e9fed787765972521d57ddde","first_computed_at":"2026-05-22T01:04:25.763474Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-22T01:04:25.763474Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"5rJxA9UsiwExdfUZpHWQCoNKznyZsFvJY9+AXTjqlXx7h49A4DekCYPsiGK2Ly4O848TBKoIoR5Xb5q49JFRBA==","signature_status":"signed_v1","signed_at":"2026-05-22T01:04:25.764167Z","signed_message":"canonical_sha256_bytes"},"source_id":"2605.22100","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:e090484ae9879299000f7d2a86ff5e8d072a9aa427a77bb5e4dc01929e55ec95","sha256:48704812a08cdc7d9234caed625106c1d8a48e47644d7f05dc49e9b835959585"],"state_sha256":"406d7a3c030f4e4e0e004c0e64f487c93c7d120d7a068d444b03b1bdab0ae088"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"ky3rUaObZuIES9KBh+OHo1OI+y5elNJJ1YLf+3QVAmopP1viy8vdvwlx/q0Efo/riTz3Vkvd0nEA5fspRJ3xCw==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-24T18:45:21.723279Z","bundle_sha256":"e7f9ba63cdaaa20b157c8500b3023b532d2784bd2f3f1c68980dea679f41f724"}}