{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2025:2NL7GLWHJD7KQYATOJB3NLUNPX","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"852234dd03922db1be81fcc4634741d71824379db6981f19dcf94dbb60bbb8b8","cross_cats_sorted":["cs.AI"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2025-05-30T17:59:01Z","title_canon_sha256":"33c56d9f2e98d048c1ca6a3059a987b228b0b887b0acd4a6a75091168adbb09e"},"schema_version":"1.0","source":{"id":"2505.24864","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2505.24864","created_at":"2026-05-18T20:46:59Z"},{"alias_kind":"arxiv_version","alias_value":"2505.24864v1","created_at":"2026-05-18T20:46:59Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2505.24864","created_at":"2026-05-18T20:46:59Z"},{"alias_kind":"pith_short_12","alias_value":"2NL7GLWHJD7K","created_at":"2026-05-18T20:46:59Z"},{"alias_kind":"pith_short_16","alias_value":"2NL7GLWHJD7KQYAT","created_at":"2026-05-18T20:46:59Z"},{"alias_kind":"pith_short_8","alias_value":"2NL7GLWH","created_at":"2026-05-18T20:46:59Z"}],"graph_snapshots":[{"event_id":"sha256:3aac1dfd1d0babeec06eedf2504487fdc72aa76f50743568c9bb86b3fd0c22a4","target":"graph","created_at":"2026-05-18T20:46:59Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Recent advances in reasoning-centric language models have highlighted reinforcement learning (RL) as a promising method for aligning models with verifiable rewards. However, it remains contentious whether RL truly expands a model's reasoning capabilities or merely amplifies high-reward outputs already latent in the base model's distribution, and whether continually scaling up RL compute reliably leads to improved reasoning performance. In this work, we challenge prevailing assumptions by demonstrating that prolonged RL (ProRL) training can uncover novel reasoning strategies that are inaccessib","authors_text":"Jan Kautz, Jian Hu, Mingjie Liu, Shizhe Diao, Ximing Lu, Xin Dong, Yejin Choi, Yi Dong","cross_cats":["cs.AI"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2025-05-30T17:59:01Z","title":"ProRL: Prolonged Reinforcement Learning Expands Reasoning Boundaries in Large Language Models"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2505.24864","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:a06ebed25eb900a97e13bc2bb0ac31f8b741c26864de1f1c767a544b4c915702","target":"record","created_at":"2026-05-18T20:46:59Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"852234dd03922db1be81fcc4634741d71824379db6981f19dcf94dbb60bbb8b8","cross_cats_sorted":["cs.AI"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2025-05-30T17:59:01Z","title_canon_sha256":"33c56d9f2e98d048c1ca6a3059a987b228b0b887b0acd4a6a75091168adbb09e"},"schema_version":"1.0","source":{"id":"2505.24864","kind":"arxiv","version":1}},"canonical_sha256":"d357f32ec748fea860137243b6ae8d7de6ae67e3dce0564037f0e4bbf5523562","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"d357f32ec748fea860137243b6ae8d7de6ae67e3dce0564037f0e4bbf5523562","first_computed_at":"2026-05-18T20:46:59.301239Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T20:46:59.301239Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"ztZ2pO4Al7bT2KgpDj/5i745xSrPwR/R37fEi17bmuPzrp2BU/HEyzyfslx1pxq48m81IKGFQZD/C1t6DrwcBA==","signature_status":"signed_v1","signed_at":"2026-05-18T20:46:59.303231Z","signed_message":"canonical_sha256_bytes"},"source_id":"2505.24864","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:a06ebed25eb900a97e13bc2bb0ac31f8b741c26864de1f1c767a544b4c915702","sha256:3aac1dfd1d0babeec06eedf2504487fdc72aa76f50743568c9bb86b3fd0c22a4"],"state_sha256":"d32f748e16be62f41f5e12bad9b7d60dcd9a57ed92227bbd216ef00bffbe6a52"}