{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2026:EJUQGIVHSWV7JRY7Y76ZNVZ6UE","short_pith_number":"pith:EJUQGIVH","canonical_record":{"source":{"id":"2606.03969","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2026-06-02T17:53:45Z","cross_cats_sorted":["cs.AI"],"title_canon_sha256":"7b0a00ec983784f4a2785635e18727d4002761cd3ff4c3796d2fac42059d4171","abstract_canon_sha256":"8087974ea3b05b0d452df4647a099b54b20db7315c3b8583aae096d4c700048c"},"schema_version":"1.0"},"canonical_sha256":"22690322a795abf4c71fc7fd96d73ea1308588e9caca5c50c475846fcaacb1e4","source":{"kind":"arxiv","id":"2606.03969","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.03969","created_at":"2026-06-03T02:06:08Z"},{"alias_kind":"arxiv_version","alias_value":"2606.03969v1","created_at":"2026-06-03T02:06:08Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.03969","created_at":"2026-06-03T02:06:08Z"},{"alias_kind":"pith_short_12","alias_value":"EJUQGIVHSWV7","created_at":"2026-06-03T02:06:08Z"},{"alias_kind":"pith_short_16","alias_value":"EJUQGIVHSWV7JRY7","created_at":"2026-06-03T02:06:08Z"},{"alias_kind":"pith_short_8","alias_value":"EJUQGIVH","created_at":"2026-06-03T02:06:08Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2026:EJUQGIVHSWV7JRY7Y76ZNVZ6UE","target":"record","payload":{"canonical_record":{"source":{"id":"2606.03969","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2026-06-02T17:53:45Z","cross_cats_sorted":["cs.AI"],"title_canon_sha256":"7b0a00ec983784f4a2785635e18727d4002761cd3ff4c3796d2fac42059d4171","abstract_canon_sha256":"8087974ea3b05b0d452df4647a099b54b20db7315c3b8583aae096d4c700048c"},"schema_version":"1.0"},"canonical_sha256":"22690322a795abf4c71fc7fd96d73ea1308588e9caca5c50c475846fcaacb1e4","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-06-03T02:06:08.253035Z","signature_b64":"7DpC0gwLlProW5kKebZOvPGAfEN9mZK7Ic1ZYVSapptwU6kvvnibpKchrUqLXK9HRqy+RgiMuBWjEFhP7rKSCA==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"22690322a795abf4c71fc7fd96d73ea1308588e9caca5c50c475846fcaacb1e4","last_reissued_at":"2026-06-03T02:06:08.252615Z","signature_status":"signed_v1","first_computed_at":"2026-06-03T02:06:08.252615Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2606.03969","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-06-03T02:06:08Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"UtWPPSFzUuJHzwjfLqRH2NKzsv39ZyNyIe4w7yzxTSLBiUtataM874Lc5iv44xmUL0tyY4VSQAkaxWJxOhHVBA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-03T21:04:11.935231Z"},"content_sha256":"ea92acb9cd6406dafe2742b7214f04ad014aa2562a56917c21130873e23259b7","schema_version":"1.0","event_id":"sha256:ea92acb9cd6406dafe2742b7214f04ad014aa2562a56917c21130873e23259b7"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2026:EJUQGIVHSWV7JRY7Y76ZNVZ6UE","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Quantifying Faithful Confidence Expression in Large Reasoning Models","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.AI"],"primary_cat":"cs.CL","authors_text":"Areeb Gani, Arman Cohan, Asal Meskin, Gabrielle Kaili-May Liu","submitted_at":"2026-06-02T17:53:45Z","abstract_excerpt":"Reliable uncertainty communication is critical to the trustworthiness of LLMs, yet faithful calibration (FC)--the alignment between models' intrinsic and (linguistically) expressed confidence--is a persistent failure mode. This challenge is key for large reasoning models (LRMs), whose extended reasoning traces are often interpreted by users as evidence of deliberation, competence, and confidence. Despite the importance of FC and wide usage of LRMs, the extent to which LRMs can faithfully express their confidence remains poorly understood. Moreover, the prevailing paradigm to measure FC does no"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.03969","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2606.03969/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-06-03T02:06:08Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"Ufa4dOLvJt7Qgme5lqS1dIY+VKvDsF8aV8ZLOsFNJy90U0hPxd8E2SWS+bUs4Lr0c/xZ6tM1Zha8kUVbObamCw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-03T21:04:11.935654Z"},"content_sha256":"bf47096876d589962ce9f94e697848b9a5a5e44b7fa9af5308c49a6d5ba79fb5","schema_version":"1.0","event_id":"sha256:bf47096876d589962ce9f94e697848b9a5a5e44b7fa9af5308c49a6d5ba79fb5"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/EJUQGIVHSWV7JRY7Y76ZNVZ6UE/bundle.json","state_url":"https://pith.science/pith/EJUQGIVHSWV7JRY7Y76ZNVZ6UE/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/EJUQGIVHSWV7JRY7Y76ZNVZ6UE/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-03T21:04:11Z","links":{"resolver":"https://pith.science/pith/EJUQGIVHSWV7JRY7Y76ZNVZ6UE","bundle":"https://pith.science/pith/EJUQGIVHSWV7JRY7Y76ZNVZ6UE/bundle.json","state":"https://pith.science/pith/EJUQGIVHSWV7JRY7Y76ZNVZ6UE/state.json","well_known_bundle":"https://pith.science/.well-known/pith/EJUQGIVHSWV7JRY7Y76ZNVZ6UE/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:EJUQGIVHSWV7JRY7Y76ZNVZ6UE","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"8087974ea3b05b0d452df4647a099b54b20db7315c3b8583aae096d4c700048c","cross_cats_sorted":["cs.AI"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2026-06-02T17:53:45Z","title_canon_sha256":"7b0a00ec983784f4a2785635e18727d4002761cd3ff4c3796d2fac42059d4171"},"schema_version":"1.0","source":{"id":"2606.03969","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.03969","created_at":"2026-06-03T02:06:08Z"},{"alias_kind":"arxiv_version","alias_value":"2606.03969v1","created_at":"2026-06-03T02:06:08Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.03969","created_at":"2026-06-03T02:06:08Z"},{"alias_kind":"pith_short_12","alias_value":"EJUQGIVHSWV7","created_at":"2026-06-03T02:06:08Z"},{"alias_kind":"pith_short_16","alias_value":"EJUQGIVHSWV7JRY7","created_at":"2026-06-03T02:06:08Z"},{"alias_kind":"pith_short_8","alias_value":"EJUQGIVH","created_at":"2026-06-03T02:06:08Z"}],"graph_snapshots":[{"event_id":"sha256:bf47096876d589962ce9f94e697848b9a5a5e44b7fa9af5308c49a6d5ba79fb5","target":"graph","created_at":"2026-06-03T02:06:08Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2606.03969/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Reliable uncertainty communication is critical to the trustworthiness of LLMs, yet faithful calibration (FC)--the alignment between models' intrinsic and (linguistically) expressed confidence--is a persistent failure mode. This challenge is key for large reasoning models (LRMs), whose extended reasoning traces are often interpreted by users as evidence of deliberation, competence, and confidence. Despite the importance of FC and wide usage of LRMs, the extent to which LRMs can faithfully express their confidence remains poorly understood. Moreover, the prevailing paradigm to measure FC does no","authors_text":"Areeb Gani, Arman Cohan, Asal Meskin, Gabrielle Kaili-May Liu","cross_cats":["cs.AI"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2026-06-02T17:53:45Z","title":"Quantifying Faithful Confidence Expression in Large Reasoning Models"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.03969","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:ea92acb9cd6406dafe2742b7214f04ad014aa2562a56917c21130873e23259b7","target":"record","created_at":"2026-06-03T02:06:08Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"8087974ea3b05b0d452df4647a099b54b20db7315c3b8583aae096d4c700048c","cross_cats_sorted":["cs.AI"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2026-06-02T17:53:45Z","title_canon_sha256":"7b0a00ec983784f4a2785635e18727d4002761cd3ff4c3796d2fac42059d4171"},"schema_version":"1.0","source":{"id":"2606.03969","kind":"arxiv","version":1}},"canonical_sha256":"22690322a795abf4c71fc7fd96d73ea1308588e9caca5c50c475846fcaacb1e4","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"22690322a795abf4c71fc7fd96d73ea1308588e9caca5c50c475846fcaacb1e4","first_computed_at":"2026-06-03T02:06:08.252615Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-06-03T02:06:08.252615Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"7DpC0gwLlProW5kKebZOvPGAfEN9mZK7Ic1ZYVSapptwU6kvvnibpKchrUqLXK9HRqy+RgiMuBWjEFhP7rKSCA==","signature_status":"signed_v1","signed_at":"2026-06-03T02:06:08.253035Z","signed_message":"canonical_sha256_bytes"},"source_id":"2606.03969","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:ea92acb9cd6406dafe2742b7214f04ad014aa2562a56917c21130873e23259b7","sha256:bf47096876d589962ce9f94e697848b9a5a5e44b7fa9af5308c49a6d5ba79fb5"],"state_sha256":"92a5a7b24b5fc340e9530cf79ab52a82f5964907d6f9b620059eb6f4b07be52b"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"W/Rw8dy8Qy/blD7A8lZBqans39eDfguy2rXdFoiCxUKqvX3s1IIJjSFCN5sto6IfD0YcIsmWjrGffRYFqS9rCA==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-03T21:04:11.937806Z","bundle_sha256":"4047f095941a03764c931feca825aac8b18a4438d310a390057534a05193ffaf"}}