{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2026:ZKQYAIYYBY36EK4TASZHRCSJTW","short_pith_number":"pith:ZKQYAIYY","canonical_record":{"source":{"id":"2606.19552","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2026-06-17T19:51:00Z","cross_cats_sorted":[],"title_canon_sha256":"d73f3db9788b448f8dde63341b2c1ca7df638d1ab02f0387687db84b29250151","abstract_canon_sha256":"7ce8960395b23a357802e620dc2c769b36a4383df282fed38fce0cef703bddf1"},"schema_version":"1.0"},"canonical_sha256":"caa18023180e37e22b9304b2788a499d975e82980cd94bd7543d11a9f685b848","source":{"kind":"arxiv","id":"2606.19552","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.19552","created_at":"2026-06-19T16:12:28Z"},{"alias_kind":"arxiv_version","alias_value":"2606.19552v1","created_at":"2026-06-19T16:12:28Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.19552","created_at":"2026-06-19T16:12:28Z"},{"alias_kind":"pith_short_12","alias_value":"ZKQYAIYYBY36","created_at":"2026-06-19T16:12:28Z"},{"alias_kind":"pith_short_16","alias_value":"ZKQYAIYYBY36EK4T","created_at":"2026-06-19T16:12:28Z"},{"alias_kind":"pith_short_8","alias_value":"ZKQYAIYY","created_at":"2026-06-19T16:12:28Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2026:ZKQYAIYYBY36EK4TASZHRCSJTW","target":"record","payload":{"canonical_record":{"source":{"id":"2606.19552","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2026-06-17T19:51:00Z","cross_cats_sorted":[],"title_canon_sha256":"d73f3db9788b448f8dde63341b2c1ca7df638d1ab02f0387687db84b29250151","abstract_canon_sha256":"7ce8960395b23a357802e620dc2c769b36a4383df282fed38fce0cef703bddf1"},"schema_version":"1.0"},"canonical_sha256":"caa18023180e37e22b9304b2788a499d975e82980cd94bd7543d11a9f685b848","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-06-19T16:12:28.752444Z","signature_b64":"Zpb03Vw2NVNmdlvbS4t9K8fYi890Jcl2RfJrVu0uP4YHY4Ed7J5cp7BuozkeflpFdvf8DguTjMA+d2Zp3Gt/BQ==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"caa18023180e37e22b9304b2788a499d975e82980cd94bd7543d11a9f685b848","last_reissued_at":"2026-06-19T16:12:28.752074Z","signature_status":"signed_v1","first_computed_at":"2026-06-19T16:12:28.752074Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2606.19552","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-06-19T16:12:28Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"JU3sU+flxN6xeGLNCTHqnkImMwQsVdGc71P8kn59xsi7oG8RrTAzC8MkDjlXHVGXhKyYb6qeZ/kNjr4lzau1BQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-24T03:32:44.759640Z"},"content_sha256":"6392b610ada9b0879705989fe27f340646aab4a9148878f8734887be28aa8d9e","schema_version":"1.0","event_id":"sha256:6392b610ada9b0879705989fe27f340646aab4a9148878f8734887be28aa8d9e"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2026:ZKQYAIYYBY36EK4TASZHRCSJTW","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"LaViSA: A Language and Vision Structural Ambiguity Benchmark","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":[],"primary_cat":"cs.CL","authors_text":"Koichiro Yoshino, Lee Sangmyeong, Shun Inadumi","submitted_at":"2026-06-17T19:51:00Z","abstract_excerpt":"Structural ambiguity arises when a single sentence admits multiple valid interpretations due to its syntactic structure, posing a fundamental challenge for language understanding. Visual scenes serve as useful cues for resolving such ambiguity, and Vision and Language Models (VLMs) need to be capable of deriving possible semantic interpretations from visual scenes. We introduce Language and Vision Structural Ambiguity (LaViSA), a benchmark designed to evaluate the ability of VLMs to resolve structural ambiguity leveraging visual scenes. LaViSA consists of ambiguous sentences, their disambiguat"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.19552","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2606.19552/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-06-19T16:12:28Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"1LqV4aeVBwFFzWiJF3G2yYd4Pw2/JixCEamAwBVscuXE1MAISaGMTmopGYc9MnB2qEn2Qit56chPe+ETFJU0Ag==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-24T03:32:44.760347Z"},"content_sha256":"68612a2f01853a01516f886703ba63f6130d2d1ac5936307705f587b49593918","schema_version":"1.0","event_id":"sha256:68612a2f01853a01516f886703ba63f6130d2d1ac5936307705f587b49593918"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/ZKQYAIYYBY36EK4TASZHRCSJTW/bundle.json","state_url":"https://pith.science/pith/ZKQYAIYYBY36EK4TASZHRCSJTW/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/ZKQYAIYYBY36EK4TASZHRCSJTW/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-24T03:32:44Z","links":{"resolver":"https://pith.science/pith/ZKQYAIYYBY36EK4TASZHRCSJTW","bundle":"https://pith.science/pith/ZKQYAIYYBY36EK4TASZHRCSJTW/bundle.json","state":"https://pith.science/pith/ZKQYAIYYBY36EK4TASZHRCSJTW/state.json","well_known_bundle":"https://pith.science/.well-known/pith/ZKQYAIYYBY36EK4TASZHRCSJTW/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:ZKQYAIYYBY36EK4TASZHRCSJTW","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"7ce8960395b23a357802e620dc2c769b36a4383df282fed38fce0cef703bddf1","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2026-06-17T19:51:00Z","title_canon_sha256":"d73f3db9788b448f8dde63341b2c1ca7df638d1ab02f0387687db84b29250151"},"schema_version":"1.0","source":{"id":"2606.19552","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.19552","created_at":"2026-06-19T16:12:28Z"},{"alias_kind":"arxiv_version","alias_value":"2606.19552v1","created_at":"2026-06-19T16:12:28Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.19552","created_at":"2026-06-19T16:12:28Z"},{"alias_kind":"pith_short_12","alias_value":"ZKQYAIYYBY36","created_at":"2026-06-19T16:12:28Z"},{"alias_kind":"pith_short_16","alias_value":"ZKQYAIYYBY36EK4T","created_at":"2026-06-19T16:12:28Z"},{"alias_kind":"pith_short_8","alias_value":"ZKQYAIYY","created_at":"2026-06-19T16:12:28Z"}],"graph_snapshots":[{"event_id":"sha256:68612a2f01853a01516f886703ba63f6130d2d1ac5936307705f587b49593918","target":"graph","created_at":"2026-06-19T16:12:28Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2606.19552/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Structural ambiguity arises when a single sentence admits multiple valid interpretations due to its syntactic structure, posing a fundamental challenge for language understanding. Visual scenes serve as useful cues for resolving such ambiguity, and Vision and Language Models (VLMs) need to be capable of deriving possible semantic interpretations from visual scenes. We introduce Language and Vision Structural Ambiguity (LaViSA), a benchmark designed to evaluate the ability of VLMs to resolve structural ambiguity leveraging visual scenes. LaViSA consists of ambiguous sentences, their disambiguat","authors_text":"Koichiro Yoshino, Lee Sangmyeong, Shun Inadumi","cross_cats":[],"headline":"","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2026-06-17T19:51:00Z","title":"LaViSA: A Language and Vision Structural Ambiguity Benchmark"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.19552","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:6392b610ada9b0879705989fe27f340646aab4a9148878f8734887be28aa8d9e","target":"record","created_at":"2026-06-19T16:12:28Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"7ce8960395b23a357802e620dc2c769b36a4383df282fed38fce0cef703bddf1","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2026-06-17T19:51:00Z","title_canon_sha256":"d73f3db9788b448f8dde63341b2c1ca7df638d1ab02f0387687db84b29250151"},"schema_version":"1.0","source":{"id":"2606.19552","kind":"arxiv","version":1}},"canonical_sha256":"caa18023180e37e22b9304b2788a499d975e82980cd94bd7543d11a9f685b848","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"caa18023180e37e22b9304b2788a499d975e82980cd94bd7543d11a9f685b848","first_computed_at":"2026-06-19T16:12:28.752074Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-06-19T16:12:28.752074Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"Zpb03Vw2NVNmdlvbS4t9K8fYi890Jcl2RfJrVu0uP4YHY4Ed7J5cp7BuozkeflpFdvf8DguTjMA+d2Zp3Gt/BQ==","signature_status":"signed_v1","signed_at":"2026-06-19T16:12:28.752444Z","signed_message":"canonical_sha256_bytes"},"source_id":"2606.19552","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:6392b610ada9b0879705989fe27f340646aab4a9148878f8734887be28aa8d9e","sha256:68612a2f01853a01516f886703ba63f6130d2d1ac5936307705f587b49593918"],"state_sha256":"a7c459e57063e5ad64a343b201b4dcf4eaa4828db58ecf1737bf7f77cc0ce541"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"EWcILmaLdnW81sbhBuJqpxeorxPRM1z4Nqo3DZzCQSRTEk/LywWNa9IPRnd8H03R89WTQOpa62uO6DZr1d/CAA==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-24T03:32:44.763480Z","bundle_sha256":"f65d17d5b1fec31637b9cbf77fcb6492691b58195a08ce71231ebd25e9ffad1f"}}