{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2025:AS7HDM7E4BQKWUALXJPBMZ52DC","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"22aee27774e31cd45074463c56de7a5dc4745195c96561575256a760bea526c9","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2025-08-20T08:17:45Z","title_canon_sha256":"baddfb8d0d1b77131aa72d2ff843920b70164daeb255013f17e0661e1b5ab90c"},"schema_version":"1.0","source":{"id":"2508.15851","kind":"arxiv","version":2}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2508.15851","created_at":"2026-06-05T01:15:15Z"},{"alias_kind":"arxiv_version","alias_value":"2508.15851v2","created_at":"2026-06-05T01:15:15Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2508.15851","created_at":"2026-06-05T01:15:15Z"},{"alias_kind":"pith_short_12","alias_value":"AS7HDM7E4BQK","created_at":"2026-06-05T01:15:15Z"},{"alias_kind":"pith_short_16","alias_value":"AS7HDM7E4BQKWUAL","created_at":"2026-06-05T01:15:15Z"},{"alias_kind":"pith_short_8","alias_value":"AS7HDM7E","created_at":"2026-06-05T01:15:15Z"}],"graph_snapshots":[{"event_id":"sha256:bbf04a4b452f8f5aed66b344887dd25b708ac56793b7a0dca3e2efab0890673f","target":"graph","created_at":"2026-06-05T01:15:15Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2508.15851/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Despite rapid progress in large language models (LLMs), current QA benchmarks still overlook the core challenge of real-world scientific information seeking: synthesizing multimodal evidence scattered across multiple documents and structural formats. Existing QA benchmarks remain narrow in scope, relying on unimodal text and short-span reasoning that fail to capture the complexity of real information seeking. We introduce DocHop-QA, a benchmark of 11,379 instances for evaluating multimodal, multi-document, multi-hop scientific QA. Built from publicly available PubMed articles, DocHop-QA incorp","authors_text":"Jinwoo Kim, Jiwon Park, Rina Carines Cabal, Seohyun Pyeon, Soyeon Caren Han, Yihao Ding, Zhenyuan He","cross_cats":[],"headline":"","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2025-08-20T08:17:45Z","title":"DocHop-QA: Towards Multi-Hop Reasoning over Multimodal Document Collections"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2508.15851","kind":"arxiv","version":2},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:5d62c389f206fd5c1d73465be64a1c0f193ec225efa545ff25954074b053ec4c","target":"record","created_at":"2026-06-05T01:15:15Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"22aee27774e31cd45074463c56de7a5dc4745195c96561575256a760bea526c9","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2025-08-20T08:17:45Z","title_canon_sha256":"baddfb8d0d1b77131aa72d2ff843920b70164daeb255013f17e0661e1b5ab90c"},"schema_version":"1.0","source":{"id":"2508.15851","kind":"arxiv","version":2}},"canonical_sha256":"04be71b3e4e060ab500bba5e1667ba188b913c14755101517b15c22808ff534b","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"04be71b3e4e060ab500bba5e1667ba188b913c14755101517b15c22808ff534b","first_computed_at":"2026-06-05T01:15:15.511107Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-06-05T01:15:15.511107Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"Aa6/Qt1ywZKq3swcuNMz8kpwcxUSDwKgzXPqMeurtkZaQWaoK7qPdG0nj+zgjNe6PJhMATHx7capTal6E9TUBQ==","signature_status":"signed_v1","signed_at":"2026-06-05T01:15:15.511860Z","signed_message":"canonical_sha256_bytes"},"source_id":"2508.15851","source_kind":"arxiv","source_version":2}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:5d62c389f206fd5c1d73465be64a1c0f193ec225efa545ff25954074b053ec4c","sha256:bbf04a4b452f8f5aed66b344887dd25b708ac56793b7a0dca3e2efab0890673f"],"state_sha256":"4d12c544f8f228eb14ee6d9d3474489e19735dcb80fbd6077d2fd11c59e0114c"}