{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2025:TUKZJAAD5WKWHXVS7AMJ34SIMC","short_pith_number":"pith:TUKZJAAD","canonical_record":{"source":{"id":"2507.05386","kind":"arxiv","version":6},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2025-07-07T18:17:06Z","cross_cats_sorted":["cs.AI","cs.CL"],"title_canon_sha256":"98badf3560c2c435be51796e09628669640d6ba8fd2e23b033f22979b8fad922","abstract_canon_sha256":"189229dd5b7dbb2e68df03516168e0ab651530868b9e06f477b0d1531cfdfd09"},"schema_version":"1.0"},"canonical_sha256":"9d15948003ed9563deb2f8189df24860a25fdc594e9925766a992020ff2b50d8","source":{"kind":"arxiv","id":"2507.05386","version":6},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2507.05386","created_at":"2026-06-30T02:18:04Z"},{"alias_kind":"arxiv_version","alias_value":"2507.05386v6","created_at":"2026-06-30T02:18:04Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2507.05386","created_at":"2026-06-30T02:18:04Z"},{"alias_kind":"pith_short_12","alias_value":"TUKZJAAD5WKW","created_at":"2026-06-30T02:18:04Z"},{"alias_kind":"pith_short_16","alias_value":"TUKZJAAD5WKWHXVS","created_at":"2026-06-30T02:18:04Z"},{"alias_kind":"pith_short_8","alias_value":"TUKZJAAD","created_at":"2026-06-30T02:18:04Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2025:TUKZJAAD5WKWHXVS7AMJ34SIMC","target":"record","payload":{"canonical_record":{"source":{"id":"2507.05386","kind":"arxiv","version":6},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2025-07-07T18:17:06Z","cross_cats_sorted":["cs.AI","cs.CL"],"title_canon_sha256":"98badf3560c2c435be51796e09628669640d6ba8fd2e23b033f22979b8fad922","abstract_canon_sha256":"189229dd5b7dbb2e68df03516168e0ab651530868b9e06f477b0d1531cfdfd09"},"schema_version":"1.0"},"canonical_sha256":"9d15948003ed9563deb2f8189df24860a25fdc594e9925766a992020ff2b50d8","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-06-30T02:18:04.474580Z","signature_b64":"Yd3dHKdnw82Rk/MofNksS6lcTvdCyH1AHH3k1AS7rL2yicZXQJbBkN6Ifr41qjILWoJm9qQX5Tn3U7OhJFcZAA==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"9d15948003ed9563deb2f8189df24860a25fdc594e9925766a992020ff2b50d8","last_reissued_at":"2026-06-30T02:18:04.473780Z","signature_status":"signed_v1","first_computed_at":"2026-06-30T02:18:04.473780Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2507.05386","source_version":6,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-06-30T02:18:04Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"8GFg5gKbThZcnjgpXfzPVudtfTW+XR2yt6/RPUDmOvHCNouhQWUrwoQOd89WTf6f4u+z1Q5YUiH6a2atNdKHCw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-30T21:19:26.651280Z"},"content_sha256":"b3850179564e5d2e5f8d404424df7c45cd29f723c6483fc7f7ecaac2daee0cb3","schema_version":"1.0","event_id":"sha256:b3850179564e5d2e5f8d404424df7c45cd29f723c6483fc7f7ecaac2daee0cb3"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2025:TUKZJAAD5WKWHXVS7AMJ34SIMC","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Reinforcement Fine-Tuning Naturally Mitigates Forgetting in Continual Post-Training","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.AI","cs.CL"],"primary_cat":"cs.LG","authors_text":"Changyi Ma, Dong Yi, Fei Zhu, Gaofeng Meng, Haohan Zhao, Hongbin Liu, Hongbo Zhao, Qingfu Zhang, Rong Feng, Song Lai, Wenzhuo Liu, Xi Lin","submitted_at":"2025-07-07T18:17:06Z","abstract_excerpt":"Continual post-training (CPT) is a popular and effective technique for adapting foundation models like multimodal large language models to ever-evolving downstream tasks. While existing research primarily focuses on methods like data replay, model expansion, or parameter regularization, the fundamental role of the learning paradigm remains largely unexplored. This paper presents a comparative analysis of two core post-training paradigms: supervised fine-tuning (SFT) and reinforcement fine-tuning (RFT), investigating their respective impacts on knowledge retention during CPT. Our experiments ar"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2507.05386","kind":"arxiv","version":6},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2507.05386/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-06-30T02:18:04Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"vstC3ZOC6xafuhRhmSj5eRzjHqe8c8dY3oyULkWbiwRzRgOvy7reXpRscGylaiGD1/b8LiQl+l1iUGcWJN+VCg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-30T21:19:26.651676Z"},"content_sha256":"a99861a7b32feae88f66e211114d43a4498ac228c20faa25b5f6a998467e9733","schema_version":"1.0","event_id":"sha256:a99861a7b32feae88f66e211114d43a4498ac228c20faa25b5f6a998467e9733"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/TUKZJAAD5WKWHXVS7AMJ34SIMC/bundle.json","state_url":"https://pith.science/pith/TUKZJAAD5WKWHXVS7AMJ34SIMC/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/TUKZJAAD5WKWHXVS7AMJ34SIMC/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-30T21:19:26Z","links":{"resolver":"https://pith.science/pith/TUKZJAAD5WKWHXVS7AMJ34SIMC","bundle":"https://pith.science/pith/TUKZJAAD5WKWHXVS7AMJ34SIMC/bundle.json","state":"https://pith.science/pith/TUKZJAAD5WKWHXVS7AMJ34SIMC/state.json","well_known_bundle":"https://pith.science/.well-known/pith/TUKZJAAD5WKWHXVS7AMJ34SIMC/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2025:TUKZJAAD5WKWHXVS7AMJ34SIMC","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"189229dd5b7dbb2e68df03516168e0ab651530868b9e06f477b0d1531cfdfd09","cross_cats_sorted":["cs.AI","cs.CL"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2025-07-07T18:17:06Z","title_canon_sha256":"98badf3560c2c435be51796e09628669640d6ba8fd2e23b033f22979b8fad922"},"schema_version":"1.0","source":{"id":"2507.05386","kind":"arxiv","version":6}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2507.05386","created_at":"2026-06-30T02:18:04Z"},{"alias_kind":"arxiv_version","alias_value":"2507.05386v6","created_at":"2026-06-30T02:18:04Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2507.05386","created_at":"2026-06-30T02:18:04Z"},{"alias_kind":"pith_short_12","alias_value":"TUKZJAAD5WKW","created_at":"2026-06-30T02:18:04Z"},{"alias_kind":"pith_short_16","alias_value":"TUKZJAAD5WKWHXVS","created_at":"2026-06-30T02:18:04Z"},{"alias_kind":"pith_short_8","alias_value":"TUKZJAAD","created_at":"2026-06-30T02:18:04Z"}],"graph_snapshots":[{"event_id":"sha256:a99861a7b32feae88f66e211114d43a4498ac228c20faa25b5f6a998467e9733","target":"graph","created_at":"2026-06-30T02:18:04Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2507.05386/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Continual post-training (CPT) is a popular and effective technique for adapting foundation models like multimodal large language models to ever-evolving downstream tasks. While existing research primarily focuses on methods like data replay, model expansion, or parameter regularization, the fundamental role of the learning paradigm remains largely unexplored. This paper presents a comparative analysis of two core post-training paradigms: supervised fine-tuning (SFT) and reinforcement fine-tuning (RFT), investigating their respective impacts on knowledge retention during CPT. Our experiments ar","authors_text":"Changyi Ma, Dong Yi, Fei Zhu, Gaofeng Meng, Haohan Zhao, Hongbin Liu, Hongbo Zhao, Qingfu Zhang, Rong Feng, Song Lai, Wenzhuo Liu, Xi Lin","cross_cats":["cs.AI","cs.CL"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2025-07-07T18:17:06Z","title":"Reinforcement Fine-Tuning Naturally Mitigates Forgetting in Continual Post-Training"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2507.05386","kind":"arxiv","version":6},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:b3850179564e5d2e5f8d404424df7c45cd29f723c6483fc7f7ecaac2daee0cb3","target":"record","created_at":"2026-06-30T02:18:04Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"189229dd5b7dbb2e68df03516168e0ab651530868b9e06f477b0d1531cfdfd09","cross_cats_sorted":["cs.AI","cs.CL"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2025-07-07T18:17:06Z","title_canon_sha256":"98badf3560c2c435be51796e09628669640d6ba8fd2e23b033f22979b8fad922"},"schema_version":"1.0","source":{"id":"2507.05386","kind":"arxiv","version":6}},"canonical_sha256":"9d15948003ed9563deb2f8189df24860a25fdc594e9925766a992020ff2b50d8","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"9d15948003ed9563deb2f8189df24860a25fdc594e9925766a992020ff2b50d8","first_computed_at":"2026-06-30T02:18:04.473780Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-06-30T02:18:04.473780Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"Yd3dHKdnw82Rk/MofNksS6lcTvdCyH1AHH3k1AS7rL2yicZXQJbBkN6Ifr41qjILWoJm9qQX5Tn3U7OhJFcZAA==","signature_status":"signed_v1","signed_at":"2026-06-30T02:18:04.474580Z","signed_message":"canonical_sha256_bytes"},"source_id":"2507.05386","source_kind":"arxiv","source_version":6}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:b3850179564e5d2e5f8d404424df7c45cd29f723c6483fc7f7ecaac2daee0cb3","sha256:a99861a7b32feae88f66e211114d43a4498ac228c20faa25b5f6a998467e9733"],"state_sha256":"47052bbf3b61a7c662b9cfe0737ec37fa94e49f4ccd932391927bae9808b1867"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"F3AOKPbHjm/P7gDVRA0JsUEHxxfkIXAGTTh/eI3T7anRBuZn6qcYVM505U99N1V0rgOimmSeknzZXjfUeqXxBg==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-30T21:19:26.653803Z","bundle_sha256":"0572a92e39d2f5f8aa713703ede603f3c14b63847769a89955c2ae5a5cd6ee40"}}