{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2026:CKTYKVIQAQNR33DA43DJSJYRMJ","short_pith_number":"pith:CKTYKVIQ","canonical_record":{"source":{"id":"2606.18388","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2026-06-16T18:33:08Z","cross_cats_sorted":["cs.AI","cs.CL","cs.MA"],"title_canon_sha256":"fa6e2d1cd1b2c8ad33c5f9a589b46744424b850a95ea7b9f4739bdbbc204bffb","abstract_canon_sha256":"757cc79fecb68c85e7741317565d51aeb3605269e9334d2d743512afd4d5b685"},"schema_version":"1.0"},"canonical_sha256":"12a7855510041b1dec60e6c6992711624ccb42025694acfabf4f7baa5244460b","source":{"kind":"arxiv","id":"2606.18388","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.18388","created_at":"2026-06-19T16:11:00Z"},{"alias_kind":"arxiv_version","alias_value":"2606.18388v1","created_at":"2026-06-19T16:11:00Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.18388","created_at":"2026-06-19T16:11:00Z"},{"alias_kind":"pith_short_12","alias_value":"CKTYKVIQAQNR","created_at":"2026-06-19T16:11:00Z"},{"alias_kind":"pith_short_16","alias_value":"CKTYKVIQAQNR33DA","created_at":"2026-06-19T16:11:00Z"},{"alias_kind":"pith_short_8","alias_value":"CKTYKVIQ","created_at":"2026-06-19T16:11:00Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2026:CKTYKVIQAQNR33DA43DJSJYRMJ","target":"record","payload":{"canonical_record":{"source":{"id":"2606.18388","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2026-06-16T18:33:08Z","cross_cats_sorted":["cs.AI","cs.CL","cs.MA"],"title_canon_sha256":"fa6e2d1cd1b2c8ad33c5f9a589b46744424b850a95ea7b9f4739bdbbc204bffb","abstract_canon_sha256":"757cc79fecb68c85e7741317565d51aeb3605269e9334d2d743512afd4d5b685"},"schema_version":"1.0"},"canonical_sha256":"12a7855510041b1dec60e6c6992711624ccb42025694acfabf4f7baa5244460b","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-06-19T16:11:00.008812Z","signature_b64":"/gQPP+Ur7Ddx9vZcHrdCxGDosgKp820kZEouYLM6jqOjgTrUv2GOv30ogkBYiG4PyHPqvRBkGsFu/+1SHYXfBw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"12a7855510041b1dec60e6c6992711624ccb42025694acfabf4f7baa5244460b","last_reissued_at":"2026-06-19T16:11:00.008474Z","signature_status":"signed_v1","first_computed_at":"2026-06-19T16:11:00.008474Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2606.18388","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-06-19T16:11:00Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"VkFQESzNgvssl2zR/bN16+vJAnmFOhJ2oLn/HzRaSCagae8qn2X4C6i5csSGtCSYHPl+WEVQCTAymmiHEWPaAw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-07-02T09:21:17.028175Z"},"content_sha256":"ac7e0c1ca3505a5d00d29a7ec668fc01221f414f88c7f02485b0534039fd4d6a","schema_version":"1.0","event_id":"sha256:ac7e0c1ca3505a5d00d29a7ec668fc01221f414f88c7f02485b0534039fd4d6a"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2026:CKTYKVIQAQNR33DA43DJSJYRMJ","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"LLMZero: Discovering Adaptive Training Strategies for RL Post-Training via LLM Agents","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":["cs.AI","cs.CL","cs.MA"],"primary_cat":"cs.LG","authors_text":"Alex Zhang, Bernie Wang, Boran Han, Cuixiong Hu, George Karypis, Haoyang Fang, Huzefa Rangwala, Jiading Gai, Peng Tang, Shuai Zhang, Shuo Yang, Wei Zhu, Xuan Zhu, Zhenyu Pan","submitted_at":"2026-06-16T18:33:08Z","abstract_excerpt":"RL post-training strategies are dataset-dependent and reveal a recurring empirical pattern: capacity parameters accumulate monotonically across stages, while regularization parameters predominantly oscillate in response to shifting training dynamics. This distinction matters because fixed schedules commit all parameters to fixed trajectories and therefore cannot express the non-stationary exploration-exploitation tradeoffs that regularization must track; the principle provides actionable design rules for multi-stage training. We discover this through LLMZero, a system where LLM agents search o"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.18388","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2606.18388/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-06-19T16:11:00Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"xMlHnSIb0AfdJTA/lMsN5addelPchd0FEcANr9rS3VJxNCL239M7xnP7Bx62tZDsDm3Urm2B73o/8Zp2PIMzCA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-07-02T09:21:17.028564Z"},"content_sha256":"5b8fca1821e3793f06d260261e9d9ce1979d595f16bbba5d613884dc4630dd0b","schema_version":"1.0","event_id":"sha256:5b8fca1821e3793f06d260261e9d9ce1979d595f16bbba5d613884dc4630dd0b"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/CKTYKVIQAQNR33DA43DJSJYRMJ/bundle.json","state_url":"https://pith.science/pith/CKTYKVIQAQNR33DA43DJSJYRMJ/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/CKTYKVIQAQNR33DA43DJSJYRMJ/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-07-02T09:21:17Z","links":{"resolver":"https://pith.science/pith/CKTYKVIQAQNR33DA43DJSJYRMJ","bundle":"https://pith.science/pith/CKTYKVIQAQNR33DA43DJSJYRMJ/bundle.json","state":"https://pith.science/pith/CKTYKVIQAQNR33DA43DJSJYRMJ/state.json","well_known_bundle":"https://pith.science/.well-known/pith/CKTYKVIQAQNR33DA43DJSJYRMJ/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:CKTYKVIQAQNR33DA43DJSJYRMJ","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"757cc79fecb68c85e7741317565d51aeb3605269e9334d2d743512afd4d5b685","cross_cats_sorted":["cs.AI","cs.CL","cs.MA"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2026-06-16T18:33:08Z","title_canon_sha256":"fa6e2d1cd1b2c8ad33c5f9a589b46744424b850a95ea7b9f4739bdbbc204bffb"},"schema_version":"1.0","source":{"id":"2606.18388","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.18388","created_at":"2026-06-19T16:11:00Z"},{"alias_kind":"arxiv_version","alias_value":"2606.18388v1","created_at":"2026-06-19T16:11:00Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.18388","created_at":"2026-06-19T16:11:00Z"},{"alias_kind":"pith_short_12","alias_value":"CKTYKVIQAQNR","created_at":"2026-06-19T16:11:00Z"},{"alias_kind":"pith_short_16","alias_value":"CKTYKVIQAQNR33DA","created_at":"2026-06-19T16:11:00Z"},{"alias_kind":"pith_short_8","alias_value":"CKTYKVIQ","created_at":"2026-06-19T16:11:00Z"}],"graph_snapshots":[{"event_id":"sha256:5b8fca1821e3793f06d260261e9d9ce1979d595f16bbba5d613884dc4630dd0b","target":"graph","created_at":"2026-06-19T16:11:00Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2606.18388/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"RL post-training strategies are dataset-dependent and reveal a recurring empirical pattern: capacity parameters accumulate monotonically across stages, while regularization parameters predominantly oscillate in response to shifting training dynamics. This distinction matters because fixed schedules commit all parameters to fixed trajectories and therefore cannot express the non-stationary exploration-exploitation tradeoffs that regularization must track; the principle provides actionable design rules for multi-stage training. We discover this through LLMZero, a system where LLM agents search o","authors_text":"Alex Zhang, Bernie Wang, Boran Han, Cuixiong Hu, George Karypis, Haoyang Fang, Huzefa Rangwala, Jiading Gai, Peng Tang, Shuai Zhang, Shuo Yang, Wei Zhu, Xuan Zhu, Zhenyu Pan","cross_cats":["cs.AI","cs.CL","cs.MA"],"headline":"","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2026-06-16T18:33:08Z","title":"LLMZero: Discovering Adaptive Training Strategies for RL Post-Training via LLM Agents"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.18388","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:ac7e0c1ca3505a5d00d29a7ec668fc01221f414f88c7f02485b0534039fd4d6a","target":"record","created_at":"2026-06-19T16:11:00Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"757cc79fecb68c85e7741317565d51aeb3605269e9334d2d743512afd4d5b685","cross_cats_sorted":["cs.AI","cs.CL","cs.MA"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2026-06-16T18:33:08Z","title_canon_sha256":"fa6e2d1cd1b2c8ad33c5f9a589b46744424b850a95ea7b9f4739bdbbc204bffb"},"schema_version":"1.0","source":{"id":"2606.18388","kind":"arxiv","version":1}},"canonical_sha256":"12a7855510041b1dec60e6c6992711624ccb42025694acfabf4f7baa5244460b","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"12a7855510041b1dec60e6c6992711624ccb42025694acfabf4f7baa5244460b","first_computed_at":"2026-06-19T16:11:00.008474Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-06-19T16:11:00.008474Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"/gQPP+Ur7Ddx9vZcHrdCxGDosgKp820kZEouYLM6jqOjgTrUv2GOv30ogkBYiG4PyHPqvRBkGsFu/+1SHYXfBw==","signature_status":"signed_v1","signed_at":"2026-06-19T16:11:00.008812Z","signed_message":"canonical_sha256_bytes"},"source_id":"2606.18388","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:ac7e0c1ca3505a5d00d29a7ec668fc01221f414f88c7f02485b0534039fd4d6a","sha256:5b8fca1821e3793f06d260261e9d9ce1979d595f16bbba5d613884dc4630dd0b"],"state_sha256":"780c7c3634ef0d35938af6c221471bd0625d87ccc7c901d9f4f8f6035fc1777b"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"aKXiIDllG++sYPrVFQ9yUmanUKZeIdRqXU3+mJ2iJf3iNrEi7MhBCkphdnv7xdgOfGIux/5iQPDxQXr7DH51Dw==","signed_message":"bundle_sha256_bytes","signed_at":"2026-07-02T09:21:17.030650Z","bundle_sha256":"1ec9a0553be347bfff1baef9ca6b42d14552c7e60b9020ac85a5c887af3e4304"}}