{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2026:ADMVMVNO76R4XKGMYY6J2RG3RR","short_pith_number":"pith:ADMVMVNO","canonical_record":{"source":{"id":"2606.03437","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2026-06-02T10:20:56Z","cross_cats_sorted":[],"title_canon_sha256":"da9b1c6859f4d2e8ac38638533af6753e7de8c5845ae3c3e91400e1fd843a533","abstract_canon_sha256":"ecfe5c8982785c7888b8da34c9188c8a08dfc745f29d0772737aa1444c145399"},"schema_version":"1.0"},"canonical_sha256":"00d95655aeffa3cba8ccc63c9d44db8c53760cebda3def0fa6193055b7b61d97","source":{"kind":"arxiv","id":"2606.03437","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.03437","created_at":"2026-06-03T01:05:57Z"},{"alias_kind":"arxiv_version","alias_value":"2606.03437v1","created_at":"2026-06-03T01:05:57Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.03437","created_at":"2026-06-03T01:05:57Z"},{"alias_kind":"pith_short_12","alias_value":"ADMVMVNO76R4","created_at":"2026-06-03T01:05:57Z"},{"alias_kind":"pith_short_16","alias_value":"ADMVMVNO76R4XKGM","created_at":"2026-06-03T01:05:57Z"},{"alias_kind":"pith_short_8","alias_value":"ADMVMVNO","created_at":"2026-06-03T01:05:57Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2026:ADMVMVNO76R4XKGMYY6J2RG3RR","target":"record","payload":{"canonical_record":{"source":{"id":"2606.03437","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2026-06-02T10:20:56Z","cross_cats_sorted":[],"title_canon_sha256":"da9b1c6859f4d2e8ac38638533af6753e7de8c5845ae3c3e91400e1fd843a533","abstract_canon_sha256":"ecfe5c8982785c7888b8da34c9188c8a08dfc745f29d0772737aa1444c145399"},"schema_version":"1.0"},"canonical_sha256":"00d95655aeffa3cba8ccc63c9d44db8c53760cebda3def0fa6193055b7b61d97","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-06-03T01:05:57.768515Z","signature_b64":"Yh0+Pk1JELMaIIUe6uLV2TJqIabl4dKz4aPPmQZ6hE3cnv4ixITO4gxDH5i3nwfcS4/eqgYm88VHjDY7WEDeAA==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"00d95655aeffa3cba8ccc63c9d44db8c53760cebda3def0fa6193055b7b61d97","last_reissued_at":"2026-06-03T01:05:57.768167Z","signature_status":"signed_v1","first_computed_at":"2026-06-03T01:05:57.768167Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2606.03437","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-06-03T01:05:57Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"GGaaHTrNisev2eB8D+FVz6vyhmqdeVUWWlwfEmpR/jN8Tfto2mE2cQgNa+ESwHEFdQMTBiTTqPdip/4RRlaqAg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-06T20:39:09.655582Z"},"content_sha256":"8740d6ef6e9e8bdf37bc582359cee954577195d8728763e668d5dfd7e34f2773","schema_version":"1.0","event_id":"sha256:8740d6ef6e9e8bdf37bc582359cee954577195d8728763e668d5dfd7e34f2773"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2026:ADMVMVNO76R4XKGMYY6J2RG3RR","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Large Language Models Are Overconfident in Their Own Responses","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":[],"primary_cat":"cs.CL","authors_text":"Katharina von der Wense, Manuel Mager, Mario Sanz-Guerrero","submitted_at":"2026-06-02T10:20:56Z","abstract_excerpt":"Prior work has shown that instruction-tuned large language models (LLMs) are less well calibrated than their base pre-trained counterparts. However, little is known about the frequently used chat template's effect on the calibration of conversational LLMs. In this work, we investigate the mechanisms driving this miscalibration by decoupling the effects of the post-training algorithm and the chat format. We find that, while instruction tuning fundamentally harms calibration, the chat template aggravates the issue through an \"ownership bias\" -- models are significantly more confident in their ow"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.03437","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2606.03437/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-06-03T01:05:57Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"UAPLQHbxroEgDy3wXZ3POvrDFwrNSkqf2tGyLEe6lrQH+asjrsSubuXobq7rIS11h0+CEJrvX1/a6es4d7VnCg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-06T20:39:09.655953Z"},"content_sha256":"da66391ccd39cdf8d98b28a9bcafc7d788bf67b0bd49ee061aec63c98a07cc80","schema_version":"1.0","event_id":"sha256:da66391ccd39cdf8d98b28a9bcafc7d788bf67b0bd49ee061aec63c98a07cc80"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/ADMVMVNO76R4XKGMYY6J2RG3RR/bundle.json","state_url":"https://pith.science/pith/ADMVMVNO76R4XKGMYY6J2RG3RR/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/ADMVMVNO76R4XKGMYY6J2RG3RR/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-06T20:39:09Z","links":{"resolver":"https://pith.science/pith/ADMVMVNO76R4XKGMYY6J2RG3RR","bundle":"https://pith.science/pith/ADMVMVNO76R4XKGMYY6J2RG3RR/bundle.json","state":"https://pith.science/pith/ADMVMVNO76R4XKGMYY6J2RG3RR/state.json","well_known_bundle":"https://pith.science/.well-known/pith/ADMVMVNO76R4XKGMYY6J2RG3RR/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:ADMVMVNO76R4XKGMYY6J2RG3RR","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"ecfe5c8982785c7888b8da34c9188c8a08dfc745f29d0772737aa1444c145399","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2026-06-02T10:20:56Z","title_canon_sha256":"da9b1c6859f4d2e8ac38638533af6753e7de8c5845ae3c3e91400e1fd843a533"},"schema_version":"1.0","source":{"id":"2606.03437","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.03437","created_at":"2026-06-03T01:05:57Z"},{"alias_kind":"arxiv_version","alias_value":"2606.03437v1","created_at":"2026-06-03T01:05:57Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.03437","created_at":"2026-06-03T01:05:57Z"},{"alias_kind":"pith_short_12","alias_value":"ADMVMVNO76R4","created_at":"2026-06-03T01:05:57Z"},{"alias_kind":"pith_short_16","alias_value":"ADMVMVNO76R4XKGM","created_at":"2026-06-03T01:05:57Z"},{"alias_kind":"pith_short_8","alias_value":"ADMVMVNO","created_at":"2026-06-03T01:05:57Z"}],"graph_snapshots":[{"event_id":"sha256:da66391ccd39cdf8d98b28a9bcafc7d788bf67b0bd49ee061aec63c98a07cc80","target":"graph","created_at":"2026-06-03T01:05:57Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2606.03437/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Prior work has shown that instruction-tuned large language models (LLMs) are less well calibrated than their base pre-trained counterparts. However, little is known about the frequently used chat template's effect on the calibration of conversational LLMs. In this work, we investigate the mechanisms driving this miscalibration by decoupling the effects of the post-training algorithm and the chat format. We find that, while instruction tuning fundamentally harms calibration, the chat template aggravates the issue through an \"ownership bias\" -- models are significantly more confident in their ow","authors_text":"Katharina von der Wense, Manuel Mager, Mario Sanz-Guerrero","cross_cats":[],"headline":"","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2026-06-02T10:20:56Z","title":"Large Language Models Are Overconfident in Their Own Responses"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.03437","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:8740d6ef6e9e8bdf37bc582359cee954577195d8728763e668d5dfd7e34f2773","target":"record","created_at":"2026-06-03T01:05:57Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"ecfe5c8982785c7888b8da34c9188c8a08dfc745f29d0772737aa1444c145399","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2026-06-02T10:20:56Z","title_canon_sha256":"da9b1c6859f4d2e8ac38638533af6753e7de8c5845ae3c3e91400e1fd843a533"},"schema_version":"1.0","source":{"id":"2606.03437","kind":"arxiv","version":1}},"canonical_sha256":"00d95655aeffa3cba8ccc63c9d44db8c53760cebda3def0fa6193055b7b61d97","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"00d95655aeffa3cba8ccc63c9d44db8c53760cebda3def0fa6193055b7b61d97","first_computed_at":"2026-06-03T01:05:57.768167Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-06-03T01:05:57.768167Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"Yh0+Pk1JELMaIIUe6uLV2TJqIabl4dKz4aPPmQZ6hE3cnv4ixITO4gxDH5i3nwfcS4/eqgYm88VHjDY7WEDeAA==","signature_status":"signed_v1","signed_at":"2026-06-03T01:05:57.768515Z","signed_message":"canonical_sha256_bytes"},"source_id":"2606.03437","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:8740d6ef6e9e8bdf37bc582359cee954577195d8728763e668d5dfd7e34f2773","sha256:da66391ccd39cdf8d98b28a9bcafc7d788bf67b0bd49ee061aec63c98a07cc80"],"state_sha256":"398c11bbc40108cbddf4f4b4b0bdb3bed5fbd0eceb9a026c4089934213a6a858"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"b3YDryR86+xybzxYctdR0Cbdj6/i8eZH/UQP7TpufGAPHfFD2BxqayHC7uPEwydNDNvXoGnn926i9r4kInGYBQ==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-06T20:39:09.658106Z","bundle_sha256":"f1e2f953d69bf3bb883f8763eb2881af4f35edae430aab25f105b8a35ad8308a"}}