{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2026:3LCMPTRKHIGUKLWLAXNIK5PNSO","short_pith_number":"pith:3LCMPTRK","canonical_record":{"source":{"id":"2605.19369","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.SE","submitted_at":"2026-05-19T05:04:42Z","cross_cats_sorted":[],"title_canon_sha256":"b15e6fcfdb56bbb14163056efc90371c2b796e9742de5d616a5922d2a7e43ec4","abstract_canon_sha256":"6e8a40eebef0f7ae5f76b850fdc6abf89bb8003cd26e8a6969d4344540cd2b26"},"schema_version":"1.0"},"canonical_sha256":"dac4c7ce2a3a0d452ecb05da8575ed9385027c1612a83a8c7b8807c48f5552b0","source":{"kind":"arxiv","id":"2605.19369","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2605.19369","created_at":"2026-05-20T01:05:41Z"},{"alias_kind":"arxiv_version","alias_value":"2605.19369v1","created_at":"2026-05-20T01:05:41Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.19369","created_at":"2026-05-20T01:05:41Z"},{"alias_kind":"pith_short_12","alias_value":"3LCMPTRKHIGU","created_at":"2026-05-20T01:05:41Z"},{"alias_kind":"pith_short_16","alias_value":"3LCMPTRKHIGUKLWL","created_at":"2026-05-20T01:05:41Z"},{"alias_kind":"pith_short_8","alias_value":"3LCMPTRK","created_at":"2026-05-20T01:05:41Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2026:3LCMPTRKHIGUKLWLAXNIK5PNSO","target":"record","payload":{"canonical_record":{"source":{"id":"2605.19369","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.SE","submitted_at":"2026-05-19T05:04:42Z","cross_cats_sorted":[],"title_canon_sha256":"b15e6fcfdb56bbb14163056efc90371c2b796e9742de5d616a5922d2a7e43ec4","abstract_canon_sha256":"6e8a40eebef0f7ae5f76b850fdc6abf89bb8003cd26e8a6969d4344540cd2b26"},"schema_version":"1.0"},"canonical_sha256":"dac4c7ce2a3a0d452ecb05da8575ed9385027c1612a83a8c7b8807c48f5552b0","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-20T01:05:41.763044Z","signature_b64":"YaslGWkLL5Y6cg+Zd8n4RExWpiuHb24cMQAZWIsYP2JhwGahApy6W4a5gHXOWQow8u41CvVUVbaOnuYx+sDDBg==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"dac4c7ce2a3a0d452ecb05da8575ed9385027c1612a83a8c7b8807c48f5552b0","last_reissued_at":"2026-05-20T01:05:41.762428Z","signature_status":"signed_v1","first_computed_at":"2026-05-20T01:05:41.762428Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2605.19369","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-20T01:05:41Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"2u6SI7tUR55WrgiXVD00QuQYjE0vFxZHULJMSSNrKCtWTD6e6djXWn1t6xUyF9gpTGWhhxQMWTihLKXE//dLCw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-25T03:05:41.779024Z"},"content_sha256":"85ca6674ad38d95725cd022dbedab8ac0da8c22a5b3975908dbdc4640ce40693","schema_version":"1.0","event_id":"sha256:85ca6674ad38d95725cd022dbedab8ac0da8c22a5b3975908dbdc4640ce40693"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2026:3LCMPTRKHIGUKLWLAXNIK5PNSO","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"When to Answer and When to Defer: A Decision Framework for Reliable Code Predictions","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":[],"primary_cat":"cs.SE","authors_text":"Ravishka Rathnasuriya, Wei Yang","submitted_at":"2026-05-19T05:04:42Z","abstract_excerpt":"Code language models are increasingly adopted for both understanding and generative tasks. Despite their success, these models frequently produce overconfident incorrect predictions and underconfident correct predictions, undermining their reliability in deployment. Practical deployment demands three capabilities: accurately estimating the likelihood of correctness, abstaining on uncertain predictions, and invoking external mechanisms to validate or repair abstained outputs. Existing calibration and uncertainty estimation methods, primarily developed for natural language tasks, do not readily "},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2605.19369","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2605.19369/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-20T01:05:41Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"dF5QFksvrPC305TgkDfn3jRNMxUvdIX168z7pp9jTnzbSHL5tLTrqnbHdNZ+PPtSU4lAsKSsral4riyRw4j9Cg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-25T03:05:41.779733Z"},"content_sha256":"9891f66875c9ee5761a2fcb13eacd553c25fe93409ceec6837acaa1eb5046a6c","schema_version":"1.0","event_id":"sha256:9891f66875c9ee5761a2fcb13eacd553c25fe93409ceec6837acaa1eb5046a6c"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/3LCMPTRKHIGUKLWLAXNIK5PNSO/bundle.json","state_url":"https://pith.science/pith/3LCMPTRKHIGUKLWLAXNIK5PNSO/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/3LCMPTRKHIGUKLWLAXNIK5PNSO/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-25T03:05:41Z","links":{"resolver":"https://pith.science/pith/3LCMPTRKHIGUKLWLAXNIK5PNSO","bundle":"https://pith.science/pith/3LCMPTRKHIGUKLWLAXNIK5PNSO/bundle.json","state":"https://pith.science/pith/3LCMPTRKHIGUKLWLAXNIK5PNSO/state.json","well_known_bundle":"https://pith.science/.well-known/pith/3LCMPTRKHIGUKLWLAXNIK5PNSO/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:3LCMPTRKHIGUKLWLAXNIK5PNSO","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"6e8a40eebef0f7ae5f76b850fdc6abf89bb8003cd26e8a6969d4344540cd2b26","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.SE","submitted_at":"2026-05-19T05:04:42Z","title_canon_sha256":"b15e6fcfdb56bbb14163056efc90371c2b796e9742de5d616a5922d2a7e43ec4"},"schema_version":"1.0","source":{"id":"2605.19369","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2605.19369","created_at":"2026-05-20T01:05:41Z"},{"alias_kind":"arxiv_version","alias_value":"2605.19369v1","created_at":"2026-05-20T01:05:41Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.19369","created_at":"2026-05-20T01:05:41Z"},{"alias_kind":"pith_short_12","alias_value":"3LCMPTRKHIGU","created_at":"2026-05-20T01:05:41Z"},{"alias_kind":"pith_short_16","alias_value":"3LCMPTRKHIGUKLWL","created_at":"2026-05-20T01:05:41Z"},{"alias_kind":"pith_short_8","alias_value":"3LCMPTRK","created_at":"2026-05-20T01:05:41Z"}],"graph_snapshots":[{"event_id":"sha256:9891f66875c9ee5761a2fcb13eacd553c25fe93409ceec6837acaa1eb5046a6c","target":"graph","created_at":"2026-05-20T01:05:41Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2605.19369/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Code language models are increasingly adopted for both understanding and generative tasks. Despite their success, these models frequently produce overconfident incorrect predictions and underconfident correct predictions, undermining their reliability in deployment. Practical deployment demands three capabilities: accurately estimating the likelihood of correctness, abstaining on uncertain predictions, and invoking external mechanisms to validate or repair abstained outputs. Existing calibration and uncertainty estimation methods, primarily developed for natural language tasks, do not readily ","authors_text":"Ravishka Rathnasuriya, Wei Yang","cross_cats":[],"headline":"","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.SE","submitted_at":"2026-05-19T05:04:42Z","title":"When to Answer and When to Defer: A Decision Framework for Reliable Code Predictions"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2605.19369","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:85ca6674ad38d95725cd022dbedab8ac0da8c22a5b3975908dbdc4640ce40693","target":"record","created_at":"2026-05-20T01:05:41Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"6e8a40eebef0f7ae5f76b850fdc6abf89bb8003cd26e8a6969d4344540cd2b26","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.SE","submitted_at":"2026-05-19T05:04:42Z","title_canon_sha256":"b15e6fcfdb56bbb14163056efc90371c2b796e9742de5d616a5922d2a7e43ec4"},"schema_version":"1.0","source":{"id":"2605.19369","kind":"arxiv","version":1}},"canonical_sha256":"dac4c7ce2a3a0d452ecb05da8575ed9385027c1612a83a8c7b8807c48f5552b0","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"dac4c7ce2a3a0d452ecb05da8575ed9385027c1612a83a8c7b8807c48f5552b0","first_computed_at":"2026-05-20T01:05:41.762428Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-20T01:05:41.762428Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"YaslGWkLL5Y6cg+Zd8n4RExWpiuHb24cMQAZWIsYP2JhwGahApy6W4a5gHXOWQow8u41CvVUVbaOnuYx+sDDBg==","signature_status":"signed_v1","signed_at":"2026-05-20T01:05:41.763044Z","signed_message":"canonical_sha256_bytes"},"source_id":"2605.19369","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:85ca6674ad38d95725cd022dbedab8ac0da8c22a5b3975908dbdc4640ce40693","sha256:9891f66875c9ee5761a2fcb13eacd553c25fe93409ceec6837acaa1eb5046a6c"],"state_sha256":"53728ba793094d1e59b747eda3a17a8b297b32c799373f5b6ed0391da996996e"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"rS03ZSCcmg3zpUK/V8baUHUApLfJRPV8Pz9uIwMxf+cCzUoVe9+DH7s3c9VDktKp8jmnampWairZNS9iPpldCg==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-25T03:05:41.783179Z","bundle_sha256":"7e76abc0be83fd2c27fb2b380b05d39df8f79bf6c47fb5975e233c22baae85a2"}}