{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2025:MBWDFESSL7WNDK3QAUAJ25JCCL","short_pith_number":"pith:MBWDFESS","canonical_record":{"source":{"id":"2511.07317","kind":"arxiv","version":2},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2025-11-10T17:18:35Z","cross_cats_sorted":["cs.LG"],"title_canon_sha256":"5221e73bfb4279b156ce611fe2787980d048e37900da2c0caccb69fbc50ffa24","abstract_canon_sha256":"4ab8ae6dbf4088c78bae5c270d24486e1ca156f63a8dacfef0e5429f6da64863"},"schema_version":"1.0"},"canonical_sha256":"606c3292525fecd1ab7005009d752212f7685f34729661181cc7563037c4b256","source":{"kind":"arxiv","id":"2511.07317","version":2},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2511.07317","created_at":"2026-06-09T01:05:10Z"},{"alias_kind":"arxiv_version","alias_value":"2511.07317v2","created_at":"2026-06-09T01:05:10Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2511.07317","created_at":"2026-06-09T01:05:10Z"},{"alias_kind":"pith_short_12","alias_value":"MBWDFESSL7WN","created_at":"2026-06-09T01:05:10Z"},{"alias_kind":"pith_short_16","alias_value":"MBWDFESSL7WNDK3Q","created_at":"2026-06-09T01:05:10Z"},{"alias_kind":"pith_short_8","alias_value":"MBWDFESS","created_at":"2026-06-09T01:05:10Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2025:MBWDFESSL7WNDK3QAUAJ25JCCL","target":"record","payload":{"canonical_record":{"source":{"id":"2511.07317","kind":"arxiv","version":2},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2025-11-10T17:18:35Z","cross_cats_sorted":["cs.LG"],"title_canon_sha256":"5221e73bfb4279b156ce611fe2787980d048e37900da2c0caccb69fbc50ffa24","abstract_canon_sha256":"4ab8ae6dbf4088c78bae5c270d24486e1ca156f63a8dacfef0e5429f6da64863"},"schema_version":"1.0"},"canonical_sha256":"606c3292525fecd1ab7005009d752212f7685f34729661181cc7563037c4b256","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-06-09T01:05:10.480738Z","signature_b64":"3yoj+N6V/1/H4KiXBqQBkga8OH8v7qoJ7qkeG+BQBVeaRE9JKx0YDRCWOssOiS71A/ziBthk3Epve/uaGCCqDw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"606c3292525fecd1ab7005009d752212f7685f34729661181cc7563037c4b256","last_reissued_at":"2026-06-09T01:05:10.480235Z","signature_status":"signed_v1","first_computed_at":"2026-06-09T01:05:10.480235Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2511.07317","source_version":2,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-06-09T01:05:10Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"UkvtAr29seZL5ozJ7hHfeHJIvG/fa4HtMSXsOu6g6mzyDs1/HujUF8lCqjSVPWEkOyaWXF4kN3Lxe4+OedA9Dg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-10T11:27:51.912724Z"},"content_sha256":"8bb640b3c5fb248c5e6add05653770ca86988f791d1df49c229801ac3696a5ea","schema_version":"1.0","event_id":"sha256:8bb640b3c5fb248c5e6add05653770ca86988f791d1df49c229801ac3696a5ea"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2025:MBWDFESSL7WNDK3QAUAJ25JCCL","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"RLVE: Scaling Up Reinforcement Learning for Language Models with Adaptive Verifiable Environments","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":["cs.LG"],"primary_cat":"cs.CL","authors_text":"Chenyang Zhao, Hamish Ivison, Hannaneh Hajishirzi, Hao Peng, Jacqueline He, Lifan Yuan, Natasha Jaques, Pang Wei Koh, Runlong Zhou, Shuyue Stella Li, Simon Shaolei Du, Siting Li, Tong Chen, Yiping Wang, Yulia Tsvetkov, Zhiyuan Zeng, Zhuorui Ye","submitted_at":"2025-11-10T17:18:35Z","abstract_excerpt":"We introduce Reinforcement Learning (RL) with Adaptive Verifiable Environments (RLVE), an approach using verifiable environments that procedurally generate problems and provide algorithmically verifiable rewards, to scale up RL for language models (LMs). RLVE enables each verifiable environment to dynamically adapt its problem difficulty distribution to the policy model's capabilities as training progresses. In contrast, static data distributions often lead to vanishing learning signals when problems are either too easy or too hard for the policy. To implement RLVE, we create RLVE-Gym, a large"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2511.07317","kind":"arxiv","version":2},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2511.07317/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-06-09T01:05:10Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"3KXr7iE5FHPUVkKEExazDTG2KAP3C5jQ0i+J8gqmLj5tUSOk37c0DU273KEoLD+h5GTAHqosUlGVzBRgBRtSCA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-10T11:27:51.913525Z"},"content_sha256":"f9d5c6ddebd4fc36096fe37f6864e5ce041ae09a8f12967dbd6521d2f327880d","schema_version":"1.0","event_id":"sha256:f9d5c6ddebd4fc36096fe37f6864e5ce041ae09a8f12967dbd6521d2f327880d"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/MBWDFESSL7WNDK3QAUAJ25JCCL/bundle.json","state_url":"https://pith.science/pith/MBWDFESSL7WNDK3QAUAJ25JCCL/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/MBWDFESSL7WNDK3QAUAJ25JCCL/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-10T11:27:51Z","links":{"resolver":"https://pith.science/pith/MBWDFESSL7WNDK3QAUAJ25JCCL","bundle":"https://pith.science/pith/MBWDFESSL7WNDK3QAUAJ25JCCL/bundle.json","state":"https://pith.science/pith/MBWDFESSL7WNDK3QAUAJ25JCCL/state.json","well_known_bundle":"https://pith.science/.well-known/pith/MBWDFESSL7WNDK3QAUAJ25JCCL/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2025:MBWDFESSL7WNDK3QAUAJ25JCCL","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"4ab8ae6dbf4088c78bae5c270d24486e1ca156f63a8dacfef0e5429f6da64863","cross_cats_sorted":["cs.LG"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2025-11-10T17:18:35Z","title_canon_sha256":"5221e73bfb4279b156ce611fe2787980d048e37900da2c0caccb69fbc50ffa24"},"schema_version":"1.0","source":{"id":"2511.07317","kind":"arxiv","version":2}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2511.07317","created_at":"2026-06-09T01:05:10Z"},{"alias_kind":"arxiv_version","alias_value":"2511.07317v2","created_at":"2026-06-09T01:05:10Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2511.07317","created_at":"2026-06-09T01:05:10Z"},{"alias_kind":"pith_short_12","alias_value":"MBWDFESSL7WN","created_at":"2026-06-09T01:05:10Z"},{"alias_kind":"pith_short_16","alias_value":"MBWDFESSL7WNDK3Q","created_at":"2026-06-09T01:05:10Z"},{"alias_kind":"pith_short_8","alias_value":"MBWDFESS","created_at":"2026-06-09T01:05:10Z"}],"graph_snapshots":[{"event_id":"sha256:f9d5c6ddebd4fc36096fe37f6864e5ce041ae09a8f12967dbd6521d2f327880d","target":"graph","created_at":"2026-06-09T01:05:10Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2511.07317/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"We introduce Reinforcement Learning (RL) with Adaptive Verifiable Environments (RLVE), an approach using verifiable environments that procedurally generate problems and provide algorithmically verifiable rewards, to scale up RL for language models (LMs). RLVE enables each verifiable environment to dynamically adapt its problem difficulty distribution to the policy model's capabilities as training progresses. In contrast, static data distributions often lead to vanishing learning signals when problems are either too easy or too hard for the policy. To implement RLVE, we create RLVE-Gym, a large","authors_text":"Chenyang Zhao, Hamish Ivison, Hannaneh Hajishirzi, Hao Peng, Jacqueline He, Lifan Yuan, Natasha Jaques, Pang Wei Koh, Runlong Zhou, Shuyue Stella Li, Simon Shaolei Du, Siting Li, Tong Chen, Yiping Wang, Yulia Tsvetkov, Zhiyuan Zeng, Zhuorui Ye","cross_cats":["cs.LG"],"headline":"","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2025-11-10T17:18:35Z","title":"RLVE: Scaling Up Reinforcement Learning for Language Models with Adaptive Verifiable Environments"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2511.07317","kind":"arxiv","version":2},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:8bb640b3c5fb248c5e6add05653770ca86988f791d1df49c229801ac3696a5ea","target":"record","created_at":"2026-06-09T01:05:10Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"4ab8ae6dbf4088c78bae5c270d24486e1ca156f63a8dacfef0e5429f6da64863","cross_cats_sorted":["cs.LG"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2025-11-10T17:18:35Z","title_canon_sha256":"5221e73bfb4279b156ce611fe2787980d048e37900da2c0caccb69fbc50ffa24"},"schema_version":"1.0","source":{"id":"2511.07317","kind":"arxiv","version":2}},"canonical_sha256":"606c3292525fecd1ab7005009d752212f7685f34729661181cc7563037c4b256","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"606c3292525fecd1ab7005009d752212f7685f34729661181cc7563037c4b256","first_computed_at":"2026-06-09T01:05:10.480235Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-06-09T01:05:10.480235Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"3yoj+N6V/1/H4KiXBqQBkga8OH8v7qoJ7qkeG+BQBVeaRE9JKx0YDRCWOssOiS71A/ziBthk3Epve/uaGCCqDw==","signature_status":"signed_v1","signed_at":"2026-06-09T01:05:10.480738Z","signed_message":"canonical_sha256_bytes"},"source_id":"2511.07317","source_kind":"arxiv","source_version":2}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:8bb640b3c5fb248c5e6add05653770ca86988f791d1df49c229801ac3696a5ea","sha256:f9d5c6ddebd4fc36096fe37f6864e5ce041ae09a8f12967dbd6521d2f327880d"],"state_sha256":"637ce83e25f8eec06f66ac1ee7175a6bbb912c5b253724f52c3a388b1198c3d5"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"SAZgGCckszQVdZZPHjPZW2gPFbBAvW6/xQoi57YiA75eNzU2kvrDh6nYzrJtB+KTCAt+KfGK+v6tRWXrUYGDAQ==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-10T11:27:51.918546Z","bundle_sha256":"e9c6d9c80a6481fcd62b235380752507e8660ad78c3a76133024ae5ba29f1f80"}}