{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:P4TVMM3P3AFKY523MIVTWABEQF","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"28d882b22246cf4f6b5b96a4fba0ba9b263a4c1444adc94b95ac0ecca19af885","cross_cats_sorted":["cs.LG"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.DC","submitted_at":"2026-05-20T07:55:06Z","title_canon_sha256":"8435d6d1fc2d72905ee5e7ca64cd6ec894d19da1791dc1df3ebea230a861d0e4"},"schema_version":"1.0","source":{"id":"2605.20863","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2605.20863","created_at":"2026-05-21T01:05:25Z"},{"alias_kind":"arxiv_version","alias_value":"2605.20863v1","created_at":"2026-05-21T01:05:25Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.20863","created_at":"2026-05-21T01:05:25Z"},{"alias_kind":"pith_short_12","alias_value":"P4TVMM3P3AFK","created_at":"2026-05-21T01:05:25Z"},{"alias_kind":"pith_short_16","alias_value":"P4TVMM3P3AFKY523","created_at":"2026-05-21T01:05:25Z"},{"alias_kind":"pith_short_8","alias_value":"P4TVMM3P","created_at":"2026-05-21T01:05:25Z"}],"graph_snapshots":[{"event_id":"sha256:0e6431c2dbf1ae860f25c9b8f828a1266ef10da3b911739278b2b2fa4964692f","target":"graph","created_at":"2026-05-21T01:05:25Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2605.20863/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Reinforcement learning with verifiable rewards (RLVR) has recently unlocked strong reasoning capabilities in large language models (LLMs), triggering rapid exploration of new algorithms and data. However, RLVR training is notoriously inefficient: long-tailed rollouts, tool-induced stalls, and asymmetric resource requirements between rollout and training introduce substantial idle time that cannot be eliminated by job-local optimizations such as synchronous pipelining, asynchronous rollout, or colocated execution.\n  We argue that this inefficiency is structural. While idle gaps are unavoidable ","authors_text":"Boyu Tian, Fangzheng Jiao, Guoteng Wang, Hangyu Wang, Menghao Zhang, Peng Sun, Ping Zhang, Qiaoling Chen, Siyuan Feng, Tian Tang, Xiaohe Hu, Yang You, Yanmin Jia, Yiqi Zhang, Zhen Jiang, Ziming Liu","cross_cats":["cs.LG"],"headline":"","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.DC","submitted_at":"2026-05-20T07:55:06Z","title":"PlexRL: Cluster-Level Orchestration of Serviceized LLM Execution for RLVR"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2605.20863","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:3875d326fa15a8e0846c5cb0934b93c6a8244e7253fba2e7fad6840cc4439e20","target":"record","created_at":"2026-05-21T01:05:25Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"28d882b22246cf4f6b5b96a4fba0ba9b263a4c1444adc94b95ac0ecca19af885","cross_cats_sorted":["cs.LG"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.DC","submitted_at":"2026-05-20T07:55:06Z","title_canon_sha256":"8435d6d1fc2d72905ee5e7ca64cd6ec894d19da1791dc1df3ebea230a861d0e4"},"schema_version":"1.0","source":{"id":"2605.20863","kind":"arxiv","version":1}},"canonical_sha256":"7f2756336fd80aac775b622b3b0024814b68ac38c163c810b31ef1f0a448dde3","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"7f2756336fd80aac775b622b3b0024814b68ac38c163c810b31ef1f0a448dde3","first_computed_at":"2026-05-21T01:05:25.136281Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-21T01:05:25.136281Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"wRRcnBrFiNLTWCkAB7D/IzGk90kg3sd1oMbcnLSoJ7KO14CfAEDF4tRIOmNUNrw/NghLp/FCva9CjbDl/fI5DQ==","signature_status":"signed_v1","signed_at":"2026-05-21T01:05:25.136990Z","signed_message":"canonical_sha256_bytes"},"source_id":"2605.20863","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:3875d326fa15a8e0846c5cb0934b93c6a8244e7253fba2e7fad6840cc4439e20","sha256:0e6431c2dbf1ae860f25c9b8f828a1266ef10da3b911739278b2b2fa4964692f"],"state_sha256":"5b5e39d8e05537027e157740acd8ee8eba683323cabfe32c87edf2b831e17db5"}