{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:LIDOKKAOASHN6YZ25YHUOKXQZA","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"4331d20646806d67f55cc87e724d31f44ec552ac3654bd8874b37e8dc31d61d9","cross_cats_sorted":["cs.AI"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2026-06-02T21:31:47Z","title_canon_sha256":"d179c7a15c7fb9e8058a51d6fc24f450138c7d16827fa043d1c7251c0d61180a"},"schema_version":"1.0","source":{"id":"2606.04231","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.04231","created_at":"2026-06-04T01:08:59Z"},{"alias_kind":"arxiv_version","alias_value":"2606.04231v1","created_at":"2026-06-04T01:08:59Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.04231","created_at":"2026-06-04T01:08:59Z"},{"alias_kind":"pith_short_12","alias_value":"LIDOKKAOASHN","created_at":"2026-06-04T01:08:59Z"},{"alias_kind":"pith_short_16","alias_value":"LIDOKKAOASHN6YZ2","created_at":"2026-06-04T01:08:59Z"},{"alias_kind":"pith_short_8","alias_value":"LIDOKKAO","created_at":"2026-06-04T01:08:59Z"}],"graph_snapshots":[{"event_id":"sha256:3ccf5e12201e8ef54518cb122c679cbfabb48b9d54ad41d8fe02826f266fc629","target":"graph","created_at":"2026-06-04T01:08:59Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2606.04231/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Recent advances in multimodal retrieval-augmented generation (MM-RAG) have shifted toward minimal parsing, relying on page-level images for producing retriever embeddings and for answer generation. While efficient, this trend often neglects explicit handling of the rich, structured information in complex enterprise documents, instead depending on pre-trained embeddings or vision-language models to implicitly capture such structure. In this work, we take a more direct approach: MM-BizRAG proactively extracts and represents document structure via a document structure-aware split that dynamically","authors_text":"Adwait Ratnaparkhi, Aymen Kallala, Denis Kochedykov, Hanoz Bhathena, Parin Rajesh Jhaveri, Prateek Singh, Rachneet Kaur, Rohan Mittal, Yiqiao Jin, Zhen Zeng","cross_cats":["cs.AI"],"headline":"","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2026-06-02T21:31:47Z","title":"MM-BizRAG: Rethinking Multimodal Retrieval-Augmented Generation for General Purpose Enterprise Q&A"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.04231","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:d1c12c36f2caf21b21bfe8b8874a48e3eb262656cd69a61952ee0734dc4f4d36","target":"record","created_at":"2026-06-04T01:08:59Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"4331d20646806d67f55cc87e724d31f44ec552ac3654bd8874b37e8dc31d61d9","cross_cats_sorted":["cs.AI"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2026-06-02T21:31:47Z","title_canon_sha256":"d179c7a15c7fb9e8058a51d6fc24f450138c7d16827fa043d1c7251c0d61180a"},"schema_version":"1.0","source":{"id":"2606.04231","kind":"arxiv","version":1}},"canonical_sha256":"5a06e5280e048edf633aee0f472af0c81634b41ef749b67ef8f2b0734cb0c19a","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"5a06e5280e048edf633aee0f472af0c81634b41ef749b67ef8f2b0734cb0c19a","first_computed_at":"2026-06-04T01:08:59.377327Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-06-04T01:08:59.377327Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"I95khkWlASLz/ffHqubpKgBuYVe7th7/oiA44XtpAnBsxkriIxGPhzh4sWd4aJrXWtTrUaMCEIoNbFQuUTmFAg==","signature_status":"signed_v1","signed_at":"2026-06-04T01:08:59.377871Z","signed_message":"canonical_sha256_bytes"},"source_id":"2606.04231","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:d1c12c36f2caf21b21bfe8b8874a48e3eb262656cd69a61952ee0734dc4f4d36","sha256:3ccf5e12201e8ef54518cb122c679cbfabb48b9d54ad41d8fe02826f266fc629"],"state_sha256":"55b198ad652ad950bcca5b0f02b24fb5434979160387d2568994509ff5201daa"}