{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2026:V66ZROCGUS5MFQJL36ICPOMALA","short_pith_number":"pith:V66ZROCG","canonical_record":{"source":{"id":"2601.07820","kind":"arxiv","version":2},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2026-01-12T18:53:09Z","cross_cats_sorted":[],"title_canon_sha256":"e7f106e8caf16d3c415b49de51ac0567abc93112a826279e005b015969bddf1e","abstract_canon_sha256":"e2c4d2bab4f2f92f139ffe652035447ec8db097baf0211f3233447881a67d39f"},"schema_version":"1.0"},"canonical_sha256":"afbd98b846a4bac2c12bdf9027b980580f45af14f644d93886aa0be59b5e1bf8","source":{"kind":"arxiv","id":"2601.07820","version":2},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2601.07820","created_at":"2026-05-20T00:01:38Z"},{"alias_kind":"arxiv_version","alias_value":"2601.07820v2","created_at":"2026-05-20T00:01:38Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2601.07820","created_at":"2026-05-20T00:01:38Z"},{"alias_kind":"pith_short_12","alias_value":"V66ZROCGUS5M","created_at":"2026-05-20T00:01:38Z"},{"alias_kind":"pith_short_16","alias_value":"V66ZROCGUS5MFQJL","created_at":"2026-05-20T00:01:38Z"},{"alias_kind":"pith_short_8","alias_value":"V66ZROCG","created_at":"2026-05-20T00:01:38Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2026:V66ZROCGUS5MFQJL36ICPOMALA","target":"record","payload":{"canonical_record":{"source":{"id":"2601.07820","kind":"arxiv","version":2},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2026-01-12T18:53:09Z","cross_cats_sorted":[],"title_canon_sha256":"e7f106e8caf16d3c415b49de51ac0567abc93112a826279e005b015969bddf1e","abstract_canon_sha256":"e2c4d2bab4f2f92f139ffe652035447ec8db097baf0211f3233447881a67d39f"},"schema_version":"1.0"},"canonical_sha256":"afbd98b846a4bac2c12bdf9027b980580f45af14f644d93886aa0be59b5e1bf8","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-20T00:01:38.521723Z","signature_b64":"321PyfBjypmVYRgLZ8PLZLFcnOTZ6TR8zH1T1TECn0TYXKlLIqqWWt7IOWllKLQf7Byufk+ETYPpLP6kIKRqBA==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"afbd98b846a4bac2c12bdf9027b980580f45af14f644d93886aa0be59b5e1bf8","last_reissued_at":"2026-05-20T00:01:38.520993Z","signature_status":"signed_v1","first_computed_at":"2026-05-20T00:01:38.520993Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2601.07820","source_version":2,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-20T00:01:38Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"VIiyatqyNaJf7eLMFTDkvTakPBIBqx+GXkjyrtm1MG5nmYDbvhzbPKcM2Lc0XaoiqZhD/eAepJKVT0Br1gydAw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-22T21:47:32.639519Z"},"content_sha256":"facc65e0fd7b496e225ca30f1409c58e563186a3edc5277c3f8b69db207ce467","schema_version":"1.0","event_id":"sha256:facc65e0fd7b496e225ca30f1409c58e563186a3edc5277c3f8b69db207ce467"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2026:V66ZROCGUS5MFQJL36ICPOMALA","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Reference Games as a Testbed for the Alignment of Model Uncertainty and Clarification Requests","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":[],"primary_cat":"cs.CL","authors_text":"Hendrik Buschmeier, Judith Sieker, Manar Ali, Sina Zarrie{\\ss}","submitted_at":"2026-01-12T18:53:09Z","abstract_excerpt":"In human conversation, both interlocutors play an active role in maintaining mutual understanding. When listeners are uncertain about what speakers mean, for example, they can request clarification. It is an open question for language models whether they can assume a similar listener role, recognizing and expressing their own uncertainty through clarification. We argue that reference games are a suitable testbed to approach this question as they are controlled, self-contained, and make clarification needs explicit and measurable. To test this, we evaluate three vision-language models comparing"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2601.07820","kind":"arxiv","version":2},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2601.07820/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-20T00:01:38Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"sxPe11XhNNnN2Yq4XLYPxqHZfmTUntD7RlxhXKsdnOm6EcICEvzq1GdyjoBZnNDwHNIZAmQDwbNBs/4NBAZbDw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-22T21:47:32.640337Z"},"content_sha256":"fde624715e58c3d655153b9d781069d4bfb0e18e161cc3a2949f3bf292680423","schema_version":"1.0","event_id":"sha256:fde624715e58c3d655153b9d781069d4bfb0e18e161cc3a2949f3bf292680423"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/V66ZROCGUS5MFQJL36ICPOMALA/bundle.json","state_url":"https://pith.science/pith/V66ZROCGUS5MFQJL36ICPOMALA/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/V66ZROCGUS5MFQJL36ICPOMALA/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-22T21:47:32Z","links":{"resolver":"https://pith.science/pith/V66ZROCGUS5MFQJL36ICPOMALA","bundle":"https://pith.science/pith/V66ZROCGUS5MFQJL36ICPOMALA/bundle.json","state":"https://pith.science/pith/V66ZROCGUS5MFQJL36ICPOMALA/state.json","well_known_bundle":"https://pith.science/.well-known/pith/V66ZROCGUS5MFQJL36ICPOMALA/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:V66ZROCGUS5MFQJL36ICPOMALA","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"e2c4d2bab4f2f92f139ffe652035447ec8db097baf0211f3233447881a67d39f","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2026-01-12T18:53:09Z","title_canon_sha256":"e7f106e8caf16d3c415b49de51ac0567abc93112a826279e005b015969bddf1e"},"schema_version":"1.0","source":{"id":"2601.07820","kind":"arxiv","version":2}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2601.07820","created_at":"2026-05-20T00:01:38Z"},{"alias_kind":"arxiv_version","alias_value":"2601.07820v2","created_at":"2026-05-20T00:01:38Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2601.07820","created_at":"2026-05-20T00:01:38Z"},{"alias_kind":"pith_short_12","alias_value":"V66ZROCGUS5M","created_at":"2026-05-20T00:01:38Z"},{"alias_kind":"pith_short_16","alias_value":"V66ZROCGUS5MFQJL","created_at":"2026-05-20T00:01:38Z"},{"alias_kind":"pith_short_8","alias_value":"V66ZROCG","created_at":"2026-05-20T00:01:38Z"}],"graph_snapshots":[{"event_id":"sha256:fde624715e58c3d655153b9d781069d4bfb0e18e161cc3a2949f3bf292680423","target":"graph","created_at":"2026-05-20T00:01:38Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2601.07820/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"In human conversation, both interlocutors play an active role in maintaining mutual understanding. When listeners are uncertain about what speakers mean, for example, they can request clarification. It is an open question for language models whether they can assume a similar listener role, recognizing and expressing their own uncertainty through clarification. We argue that reference games are a suitable testbed to approach this question as they are controlled, self-contained, and make clarification needs explicit and measurable. To test this, we evaluate three vision-language models comparing","authors_text":"Hendrik Buschmeier, Judith Sieker, Manar Ali, Sina Zarrie{\\ss}","cross_cats":[],"headline":"","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2026-01-12T18:53:09Z","title":"Reference Games as a Testbed for the Alignment of Model Uncertainty and Clarification Requests"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2601.07820","kind":"arxiv","version":2},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:facc65e0fd7b496e225ca30f1409c58e563186a3edc5277c3f8b69db207ce467","target":"record","created_at":"2026-05-20T00:01:38Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"e2c4d2bab4f2f92f139ffe652035447ec8db097baf0211f3233447881a67d39f","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2026-01-12T18:53:09Z","title_canon_sha256":"e7f106e8caf16d3c415b49de51ac0567abc93112a826279e005b015969bddf1e"},"schema_version":"1.0","source":{"id":"2601.07820","kind":"arxiv","version":2}},"canonical_sha256":"afbd98b846a4bac2c12bdf9027b980580f45af14f644d93886aa0be59b5e1bf8","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"afbd98b846a4bac2c12bdf9027b980580f45af14f644d93886aa0be59b5e1bf8","first_computed_at":"2026-05-20T00:01:38.520993Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-20T00:01:38.520993Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"321PyfBjypmVYRgLZ8PLZLFcnOTZ6TR8zH1T1TECn0TYXKlLIqqWWt7IOWllKLQf7Byufk+ETYPpLP6kIKRqBA==","signature_status":"signed_v1","signed_at":"2026-05-20T00:01:38.521723Z","signed_message":"canonical_sha256_bytes"},"source_id":"2601.07820","source_kind":"arxiv","source_version":2}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:facc65e0fd7b496e225ca30f1409c58e563186a3edc5277c3f8b69db207ce467","sha256:fde624715e58c3d655153b9d781069d4bfb0e18e161cc3a2949f3bf292680423"],"state_sha256":"026b2379c0cab4b89bc4ca011cccdff776fec3c6f7695321fd81e355c9108327"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"wGWOqV/HmZhryWS68Uoj03NkxFvuLGkDEl9BvB7ZhcSmgJf+IQr3UJUzgsPE8Ia1YXCFxpbGoqilD02Uj/DYBA==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-22T21:47:32.644529Z","bundle_sha256":"70d5dcc7178a4f8ff65f3a1d4a0c305de7f81d54b9abe985980b2930ccf1264e"}}