{"record_type":"pith_number_record","schema_url":"https://pith.science/schemas/pith-number/v1.json","pith_number":"pith:2026:6TPOZUGUXWBVJZQQA7ROKOMCUC","short_pith_number":"pith:6TPOZUGU","schema_version":"1.0","canonical_sha256":"f4deecd0d4bd8354e61007e2e53982a0be4f6dc39eb4590c3164661bbd0823af","source":{"kind":"arxiv","id":"2606.17628","version":1},"attestation_state":"computed","paper":{"title":"OPD-Evolver: Cultivating Holistic Agent Evolver via On-Policy Distillation","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":[],"primary_cat":"cs.CL","authors_text":"Guibin Zhang, Shuicheng Yan, Wangchunshu Zhou, Xiaobin Hu, Xun Xu, Yanwei Yue, Zikun Su","submitted_at":"2026-06-16T07:33:53Z","abstract_excerpt":"Memory has become a standard substrate for self-evolving agents, yet retaining experience is not the same as learning how to evolve through it. Existing memory agents can store trajectories, retrieve reflections, or accumulate skills, but often lack the holistic competence to select useful experience, act on it, write reusable knowledge, and maintain a growing repository. We introduce OPD-Evolver, a slow-fast co-evolution framework that cultivates such an agent evolver through on-policy self-distillation. In the fast loop, OPD-Evolver interacts with a four-level memory hierarchy to read, use, "},"verification_status":{"content_addressed":true,"pith_receipt":true,"author_attested":false,"weak_author_claims":0,"strong_author_claims":0,"externally_anchored":false,"storage_verified":false,"citation_signatures":0,"replication_records":0,"graph_snapshot":true,"references_resolved":false,"formal_links_present":false},"canonical_record":{"source":{"id":"2606.17628","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2026-06-16T07:33:53Z","cross_cats_sorted":[],"title_canon_sha256":"ef3f395f1f799a0c36146ee84ba9e0c2671e5ae208803bb8ed0198ae52a1f02e","abstract_canon_sha256":"ee6a4b6aeb020f016d1a3d543af7f36316ea31f42b2df151efb387456f122d28"},"schema_version":"1.0"},"receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-06-19T16:10:17.631730Z","signature_b64":"+zNhoHgIKvHFjCVQQ4OZfksj3yCrmtuauYaqeK/JIKEtYq4lmA5cdr65RwBNium4nqx0jXj9rdy7G5z0I6aFCg==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"f4deecd0d4bd8354e61007e2e53982a0be4f6dc39eb4590c3164661bbd0823af","last_reissued_at":"2026-06-19T16:10:17.631390Z","signature_status":"signed_v1","first_computed_at":"2026-06-19T16:10:17.631390Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"graph_snapshot":{"paper":{"title":"OPD-Evolver: Cultivating Holistic Agent Evolver via On-Policy Distillation","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":[],"primary_cat":"cs.CL","authors_text":"Guibin Zhang, Shuicheng Yan, Wangchunshu Zhou, Xiaobin Hu, Xun Xu, Yanwei Yue, Zikun Su","submitted_at":"2026-06-16T07:33:53Z","abstract_excerpt":"Memory has become a standard substrate for self-evolving agents, yet retaining experience is not the same as learning how to evolve through it. Existing memory agents can store trajectories, retrieve reflections, or accumulate skills, but often lack the holistic competence to select useful experience, act on it, write reusable knowledge, and maintain a growing repository. We introduce OPD-Evolver, a slow-fast co-evolution framework that cultivates such an agent evolver through on-policy self-distillation. In the fast loop, OPD-Evolver interacts with a four-level memory hierarchy to read, use, "},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.17628","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2606.17628/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"aliases":[{"alias_kind":"arxiv","alias_value":"2606.17628","created_at":"2026-06-19T16:10:17.631452+00:00"},{"alias_kind":"arxiv_version","alias_value":"2606.17628v1","created_at":"2026-06-19T16:10:17.631452+00:00"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.17628","created_at":"2026-06-19T16:10:17.631452+00:00"},{"alias_kind":"pith_short_12","alias_value":"6TPOZUGUXWBV","created_at":"2026-06-19T16:10:17.631452+00:00"},{"alias_kind":"pith_short_16","alias_value":"6TPOZUGUXWBVJZQQ","created_at":"2026-06-19T16:10:17.631452+00:00"},{"alias_kind":"pith_short_8","alias_value":"6TPOZUGU","created_at":"2026-06-19T16:10:17.631452+00:00"}],"events":[],"event_summary":{},"paper_claims":[],"inbound_citations":{"count":0,"internal_anchor_count":0,"sample":[]},"formal_canon":{"evidence_count":0,"sample":[],"anchors":[]},"links":{"html":"https://pith.science/pith/6TPOZUGUXWBVJZQQA7ROKOMCUC","json":"https://pith.science/pith/6TPOZUGUXWBVJZQQA7ROKOMCUC.json","graph_json":"https://pith.science/api/pith-number/6TPOZUGUXWBVJZQQA7ROKOMCUC/graph.json","events_json":"https://pith.science/api/pith-number/6TPOZUGUXWBVJZQQA7ROKOMCUC/events.json","paper":"https://pith.science/paper/6TPOZUGU"},"agent_actions":{"view_html":"https://pith.science/pith/6TPOZUGUXWBVJZQQA7ROKOMCUC","download_json":"https://pith.science/pith/6TPOZUGUXWBVJZQQA7ROKOMCUC.json","view_paper":"https://pith.science/paper/6TPOZUGU","resolve_alias":"https://pith.science/api/pith-number/resolve?arxiv=2606.17628&json=true","fetch_graph":"https://pith.science/api/pith-number/6TPOZUGUXWBVJZQQA7ROKOMCUC/graph.json","fetch_events":"https://pith.science/api/pith-number/6TPOZUGUXWBVJZQQA7ROKOMCUC/events.json","actions":{"anchor_timestamp":"https://pith.science/pith/6TPOZUGUXWBVJZQQA7ROKOMCUC/action/timestamp_anchor","attest_storage":"https://pith.science/pith/6TPOZUGUXWBVJZQQA7ROKOMCUC/action/storage_attestation","attest_author":"https://pith.science/pith/6TPOZUGUXWBVJZQQA7ROKOMCUC/action/author_attestation","sign_citation":"https://pith.science/pith/6TPOZUGUXWBVJZQQA7ROKOMCUC/action/citation_signature","submit_replication":"https://pith.science/pith/6TPOZUGUXWBVJZQQA7ROKOMCUC/action/replication_record"}},"created_at":"2026-06-19T16:10:17.631452+00:00","updated_at":"2026-06-19T16:10:17.631452+00:00"}