{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2026:ZBFQUHEPSWCQYPN7NCCXB4N4YH","short_pith_number":"pith:ZBFQUHEP","canonical_record":{"source":{"id":"2606.25343","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by-nc-sa/4.0/","primary_cat":"cs.CV","submitted_at":"2026-06-24T03:17:30Z","cross_cats_sorted":[],"title_canon_sha256":"6b3d0070d097d9e0ef9ea1f543599a56d6513f16131b2d21c75a9bb4a35e1ca6","abstract_canon_sha256":"d9b45f50b7ec8d6805f73102066ccf74fbbc05457a933e58fc699256f5a54b94"},"schema_version":"1.0"},"canonical_sha256":"c84b0a1c8f95850c3dbf688570f1bcc1e86741b64a472054282d9f77aa95e7bc","source":{"kind":"arxiv","id":"2606.25343","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.25343","created_at":"2026-06-25T01:18:02Z"},{"alias_kind":"arxiv_version","alias_value":"2606.25343v1","created_at":"2026-06-25T01:18:02Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.25343","created_at":"2026-06-25T01:18:02Z"},{"alias_kind":"pith_short_12","alias_value":"ZBFQUHEPSWCQ","created_at":"2026-06-25T01:18:02Z"},{"alias_kind":"pith_short_16","alias_value":"ZBFQUHEPSWCQYPN7","created_at":"2026-06-25T01:18:02Z"},{"alias_kind":"pith_short_8","alias_value":"ZBFQUHEP","created_at":"2026-06-25T01:18:02Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2026:ZBFQUHEPSWCQYPN7NCCXB4N4YH","target":"record","payload":{"canonical_record":{"source":{"id":"2606.25343","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by-nc-sa/4.0/","primary_cat":"cs.CV","submitted_at":"2026-06-24T03:17:30Z","cross_cats_sorted":[],"title_canon_sha256":"6b3d0070d097d9e0ef9ea1f543599a56d6513f16131b2d21c75a9bb4a35e1ca6","abstract_canon_sha256":"d9b45f50b7ec8d6805f73102066ccf74fbbc05457a933e58fc699256f5a54b94"},"schema_version":"1.0"},"canonical_sha256":"c84b0a1c8f95850c3dbf688570f1bcc1e86741b64a472054282d9f77aa95e7bc","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-06-25T01:18:02.647220Z","signature_b64":"Q/V4XOl+LkIkXoeL5xS8O9RMNR5qnvHevrGp6D3pU2OOvgsQXHE4vJ5kMcK8QJI4eC+yKEJu3DyLcavcgF+qDw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"c84b0a1c8f95850c3dbf688570f1bcc1e86741b64a472054282d9f77aa95e7bc","last_reissued_at":"2026-06-25T01:18:02.646860Z","signature_status":"signed_v1","first_computed_at":"2026-06-25T01:18:02.646860Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2606.25343","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-06-25T01:18:02Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"SEVBSRyMR69BmWYTQdcDameJ41KrrJXWfZX0R8fArJsF5iDscalaNSLcK6/9mclU78Yw/WS3wDoNaQwP3fLTDg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-30T08:35:44.737022Z"},"content_sha256":"2fda2eaf99ee60cf195642e7e93dbd542c766fffefea360994eeee9e4c040cc7","schema_version":"1.0","event_id":"sha256:2fda2eaf99ee60cf195642e7e93dbd542c766fffefea360994eeee9e4c040cc7"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2026:ZBFQUHEPSWCQYPN7NCCXB4N4YH","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Invoice Haystack: Benchmarking Document Retrieval and Visual Question Answering Under Strong Visual Homogeneity","license":"http://creativecommons.org/licenses/by-nc-sa/4.0/","headline":"","cross_cats":[],"primary_cat":"cs.CV","authors_text":"Basim Azam, Heethanjan Kanagalingam, Mokeeshan Vathanakumar, Sarah Monazam Erfani, Thenukan Pathmanathan","submitted_at":"2026-06-24T03:17:30Z","abstract_excerpt":"Vision Language Models have achieved near-human performance on single-document Visual Question Answering, yet their effectiveness degrades significantly when retrieving information from large collections of visually homogeneous documents. Existing multi-document benchmarks aggregate diverse document types, creating artificial separation in embedding space that does not reflect enterprise document repositories where thousands of records share identical visual templates. We identify this as embedding collapse and introduce Invoice Haystack, a benchmark with 1,500 anonymized invoice images paired"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.25343","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2606.25343/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-06-25T01:18:02Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"BsrE2R43tKRRBXyCl79RZ8jFMMGtkqvRBD5oI3yBg9mLQIWPhrjSo/JbvyBBXzyLfDxOuaqlN0M2BJbmiYqoBA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-30T08:35:44.737411Z"},"content_sha256":"8f5afddc51d2a4c96cd08c0b8d4a01fafa7d90bb1478c66830fde492f65ac432","schema_version":"1.0","event_id":"sha256:8f5afddc51d2a4c96cd08c0b8d4a01fafa7d90bb1478c66830fde492f65ac432"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/ZBFQUHEPSWCQYPN7NCCXB4N4YH/bundle.json","state_url":"https://pith.science/pith/ZBFQUHEPSWCQYPN7NCCXB4N4YH/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/ZBFQUHEPSWCQYPN7NCCXB4N4YH/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-30T08:35:44Z","links":{"resolver":"https://pith.science/pith/ZBFQUHEPSWCQYPN7NCCXB4N4YH","bundle":"https://pith.science/pith/ZBFQUHEPSWCQYPN7NCCXB4N4YH/bundle.json","state":"https://pith.science/pith/ZBFQUHEPSWCQYPN7NCCXB4N4YH/state.json","well_known_bundle":"https://pith.science/.well-known/pith/ZBFQUHEPSWCQYPN7NCCXB4N4YH/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:ZBFQUHEPSWCQYPN7NCCXB4N4YH","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"d9b45f50b7ec8d6805f73102066ccf74fbbc05457a933e58fc699256f5a54b94","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by-nc-sa/4.0/","primary_cat":"cs.CV","submitted_at":"2026-06-24T03:17:30Z","title_canon_sha256":"6b3d0070d097d9e0ef9ea1f543599a56d6513f16131b2d21c75a9bb4a35e1ca6"},"schema_version":"1.0","source":{"id":"2606.25343","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.25343","created_at":"2026-06-25T01:18:02Z"},{"alias_kind":"arxiv_version","alias_value":"2606.25343v1","created_at":"2026-06-25T01:18:02Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.25343","created_at":"2026-06-25T01:18:02Z"},{"alias_kind":"pith_short_12","alias_value":"ZBFQUHEPSWCQ","created_at":"2026-06-25T01:18:02Z"},{"alias_kind":"pith_short_16","alias_value":"ZBFQUHEPSWCQYPN7","created_at":"2026-06-25T01:18:02Z"},{"alias_kind":"pith_short_8","alias_value":"ZBFQUHEP","created_at":"2026-06-25T01:18:02Z"}],"graph_snapshots":[{"event_id":"sha256:8f5afddc51d2a4c96cd08c0b8d4a01fafa7d90bb1478c66830fde492f65ac432","target":"graph","created_at":"2026-06-25T01:18:02Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2606.25343/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Vision Language Models have achieved near-human performance on single-document Visual Question Answering, yet their effectiveness degrades significantly when retrieving information from large collections of visually homogeneous documents. Existing multi-document benchmarks aggregate diverse document types, creating artificial separation in embedding space that does not reflect enterprise document repositories where thousands of records share identical visual templates. We identify this as embedding collapse and introduce Invoice Haystack, a benchmark with 1,500 anonymized invoice images paired","authors_text":"Basim Azam, Heethanjan Kanagalingam, Mokeeshan Vathanakumar, Sarah Monazam Erfani, Thenukan Pathmanathan","cross_cats":[],"headline":"","license":"http://creativecommons.org/licenses/by-nc-sa/4.0/","primary_cat":"cs.CV","submitted_at":"2026-06-24T03:17:30Z","title":"Invoice Haystack: Benchmarking Document Retrieval and Visual Question Answering Under Strong Visual Homogeneity"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.25343","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:2fda2eaf99ee60cf195642e7e93dbd542c766fffefea360994eeee9e4c040cc7","target":"record","created_at":"2026-06-25T01:18:02Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"d9b45f50b7ec8d6805f73102066ccf74fbbc05457a933e58fc699256f5a54b94","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by-nc-sa/4.0/","primary_cat":"cs.CV","submitted_at":"2026-06-24T03:17:30Z","title_canon_sha256":"6b3d0070d097d9e0ef9ea1f543599a56d6513f16131b2d21c75a9bb4a35e1ca6"},"schema_version":"1.0","source":{"id":"2606.25343","kind":"arxiv","version":1}},"canonical_sha256":"c84b0a1c8f95850c3dbf688570f1bcc1e86741b64a472054282d9f77aa95e7bc","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"c84b0a1c8f95850c3dbf688570f1bcc1e86741b64a472054282d9f77aa95e7bc","first_computed_at":"2026-06-25T01:18:02.646860Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-06-25T01:18:02.646860Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"Q/V4XOl+LkIkXoeL5xS8O9RMNR5qnvHevrGp6D3pU2OOvgsQXHE4vJ5kMcK8QJI4eC+yKEJu3DyLcavcgF+qDw==","signature_status":"signed_v1","signed_at":"2026-06-25T01:18:02.647220Z","signed_message":"canonical_sha256_bytes"},"source_id":"2606.25343","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:2fda2eaf99ee60cf195642e7e93dbd542c766fffefea360994eeee9e4c040cc7","sha256:8f5afddc51d2a4c96cd08c0b8d4a01fafa7d90bb1478c66830fde492f65ac432"],"state_sha256":"e85d44505b7ada9dd3587342b28e263c320f2fe55b6dc2e121e61ee7e280a8de"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"in8lM2VqLT/7E+rxSYHVr6EB2aGb0q371zTD/zsyCB1f88J0fbthEV6khd6/2XDIXpJU21cKLTx50KvB21W/Aw==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-30T08:35:44.739428Z","bundle_sha256":"ef0945b4652d9638b1101ee11176affc1b2518eee9b11b16be0c46c708300be6"}}