{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:MLT7XTZEEZSPVUOJI7FK3EKYWS","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"5281f176771dda3bbf59cacb0bc26d93fcadeba0ddcc2292b766efe6762a318a","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2026-06-08T13:12:01Z","title_canon_sha256":"a367c9c0c4d1c244b59740df3237dbd229d07c5f523523f5e4fb4c9906caa62f"},"schema_version":"1.0","source":{"id":"2606.09456","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.09456","created_at":"2026-06-09T02:08:49Z"},{"alias_kind":"arxiv_version","alias_value":"2606.09456v1","created_at":"2026-06-09T02:08:49Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.09456","created_at":"2026-06-09T02:08:49Z"},{"alias_kind":"pith_short_12","alias_value":"MLT7XTZEEZSP","created_at":"2026-06-09T02:08:49Z"},{"alias_kind":"pith_short_16","alias_value":"MLT7XTZEEZSPVUOJ","created_at":"2026-06-09T02:08:49Z"},{"alias_kind":"pith_short_8","alias_value":"MLT7XTZE","created_at":"2026-06-09T02:08:49Z"}],"graph_snapshots":[{"event_id":"sha256:91b391bdb91447bfc56535404bff7fe4b683ebc47854ad782a52ed92a5df96d8","target":"graph","created_at":"2026-06-09T02:08:49Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2606.09456/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"On-Policy Distillation (OPD) has become a core technique in the post-training of Large Language Models (LLMs) for transferring knowledge from domain experts to student models. However, existing OPD distillation methods require teacher and student models to share the same tokenizer, restricting the applicability of OPD within the model series. Current mainstream practice typically employs Supervised Fine-Tuning (SFT) on teacher-generated responses for cross-tokenizer distillation, which fails to capture the rich knowledge embedded in the teacher's probability distribution. In this work, we enab","authors_text":"Dihong Gong, Dongyi Liu, Han Xiao, Jia Li, Yasheng Wang, Yifan Niu, Zelong Wang","cross_cats":[],"headline":"","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2026-06-08T13:12:01Z","title":"Breaking the Tokenizer Barrier: On-Policy Distillation across Model Families"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.09456","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:1a3069296fb979cc9174cc30977bdb7862614ddce70806ef6d5bb7b70f20fac6","target":"record","created_at":"2026-06-09T02:08:49Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"5281f176771dda3bbf59cacb0bc26d93fcadeba0ddcc2292b766efe6762a318a","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2026-06-08T13:12:01Z","title_canon_sha256":"a367c9c0c4d1c244b59740df3237dbd229d07c5f523523f5e4fb4c9906caa62f"},"schema_version":"1.0","source":{"id":"2606.09456","kind":"arxiv","version":1}},"canonical_sha256":"62e7fbcf242664fad1c947caad9158b4a289dfc56215c2e6f87df9ab6f4ac1bf","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"62e7fbcf242664fad1c947caad9158b4a289dfc56215c2e6f87df9ab6f4ac1bf","first_computed_at":"2026-06-09T02:08:49.516189Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-06-09T02:08:49.516189Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"WL/cTnL5g5oWdiq/0SqIlqmklPLlrd4r+BSHlapiUCNaklqsGHzUtFFjatj/eQeSfUAGKPvo4WBFcvrwWWoXBA==","signature_status":"signed_v1","signed_at":"2026-06-09T02:08:49.517061Z","signed_message":"canonical_sha256_bytes"},"source_id":"2606.09456","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:1a3069296fb979cc9174cc30977bdb7862614ddce70806ef6d5bb7b70f20fac6","sha256:91b391bdb91447bfc56535404bff7fe4b683ebc47854ad782a52ed92a5df96d8"],"state_sha256":"8c878743f0a9798ac7bab8007f72d55fa80dde75f9bf18dd0c7a9f8283a9c577"}