{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:JHWUX7UITFISSTSEXIMSMIAGBX","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"d9c5e1d5bddc84ded9f63c4fec20a7514f4e9f084aa64dfa305f36d9499c2561","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.AI","submitted_at":"2026-06-22T04:13:14Z","title_canon_sha256":"ad96f8be791a49486acedf0cda9d815874b003d03c422c02dd45c87395179e45"},"schema_version":"1.0","source":{"id":"2606.22830","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.22830","created_at":"2026-06-23T02:14:00Z"},{"alias_kind":"arxiv_version","alias_value":"2606.22830v1","created_at":"2026-06-23T02:14:00Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.22830","created_at":"2026-06-23T02:14:00Z"},{"alias_kind":"pith_short_12","alias_value":"JHWUX7UITFIS","created_at":"2026-06-23T02:14:00Z"},{"alias_kind":"pith_short_16","alias_value":"JHWUX7UITFISSTSE","created_at":"2026-06-23T02:14:00Z"},{"alias_kind":"pith_short_8","alias_value":"JHWUX7UI","created_at":"2026-06-23T02:14:00Z"}],"graph_snapshots":[{"event_id":"sha256:6b45dcd0a1e6b5040dee32fb72b18386c97fc255531d67b0ea68c41809342b1d","target":"graph","created_at":"2026-06-23T02:14:00Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2606.22830/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"On-policy distillation transfers reasoning ability through dense token-level supervision, yet the nature of the transferable signal remains unclear. We discover that reasoning chains contain two types of knowledge that require different discovery mechanisms: decisions (where to branch), which surface through student uncertainty, and evidence (intermediate steps that justify decisions), which hides in positions where the student is confident yet wrong. Current methods capture only decisions; the substantive knowledge in evidence tokens remains untransferred. We propose DEAR(Decision-Evidence Aw","authors_text":"Jinwei Xiao, Qi Gu, Wentao Chen, Xunliang Cai, Yueqing Sun, Yuxin Liu, Zhengxi Lu, Zhiyuan Yao, Zhuowen Han","cross_cats":[],"headline":"","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.AI","submitted_at":"2026-06-22T04:13:14Z","title":"Finding the Evidence: Discovering Decision-Supporting Tokens for On-Policy Reasoning Distillation"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.22830","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:df57668438996b5e8d6a45dd3c4f3d66f69b95e602fcd70a8d82823fc933eca9","target":"record","created_at":"2026-06-23T02:14:00Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"d9c5e1d5bddc84ded9f63c4fec20a7514f4e9f084aa64dfa305f36d9499c2561","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.AI","submitted_at":"2026-06-22T04:13:14Z","title_canon_sha256":"ad96f8be791a49486acedf0cda9d815874b003d03c422c02dd45c87395179e45"},"schema_version":"1.0","source":{"id":"2606.22830","kind":"arxiv","version":1}},"canonical_sha256":"49ed4bfe889951294e44ba192620060dc416111f63625c0e6e0a0803e1ad62dc","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"49ed4bfe889951294e44ba192620060dc416111f63625c0e6e0a0803e1ad62dc","first_computed_at":"2026-06-23T02:14:00.616017Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-06-23T02:14:00.616017Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"6zQv2nTjWmaGyU7Dahs1wwcFKIqSjUxY9AACuKBCNrHQdSAzhy8h5GxVRwm/jxsvKcYwetGhaL1Cf3bGHmvrCA==","signature_status":"signed_v1","signed_at":"2026-06-23T02:14:00.616438Z","signed_message":"canonical_sha256_bytes"},"source_id":"2606.22830","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:df57668438996b5e8d6a45dd3c4f3d66f69b95e602fcd70a8d82823fc933eca9","sha256:6b45dcd0a1e6b5040dee32fb72b18386c97fc255531d67b0ea68c41809342b1d"],"state_sha256":"43f6906c5915b77e3c83920774c2dcf42dcfe5a9b8ce6406e539acfedcee5542"}