{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2025:DOUNEVZ4WPFSTK7C5IYVXPP2LS","short_pith_number":"pith:DOUNEVZ4","canonical_record":{"source":{"id":"2507.15778","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2025-07-21T16:34:01Z","cross_cats_sorted":[],"title_canon_sha256":"d7f7b081b9a47a2da71f5c5ccbc4c867bcf25a686a2ca5527b956f3bb0efec16","abstract_canon_sha256":"a04bd231108d166830be735f17c1d26f3ac349f7e553b2d478957e3449a2e952"},"schema_version":"1.0"},"canonical_sha256":"1ba8d2573cb3cb29abe2ea315bbdfa5c9dd669d1fa584fd77bc6c7eedad30de0","source":{"kind":"arxiv","id":"2507.15778","version":2},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2507.15778","created_at":"2026-05-20T00:00:22Z"},{"alias_kind":"arxiv_version","alias_value":"2507.15778v2","created_at":"2026-05-20T00:00:22Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2507.15778","created_at":"2026-05-20T00:00:22Z"},{"alias_kind":"pith_short_12","alias_value":"DOUNEVZ4WPFS","created_at":"2026-05-20T00:00:22Z"},{"alias_kind":"pith_short_16","alias_value":"DOUNEVZ4WPFSTK7C","created_at":"2026-05-20T00:00:22Z"},{"alias_kind":"pith_short_8","alias_value":"DOUNEVZ4","created_at":"2026-05-20T00:00:22Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2025:DOUNEVZ4WPFSTK7C5IYVXPP2LS","target":"record","payload":{"canonical_record":{"source":{"id":"2507.15778","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2025-07-21T16:34:01Z","cross_cats_sorted":[],"title_canon_sha256":"d7f7b081b9a47a2da71f5c5ccbc4c867bcf25a686a2ca5527b956f3bb0efec16","abstract_canon_sha256":"a04bd231108d166830be735f17c1d26f3ac349f7e553b2d478957e3449a2e952"},"schema_version":"1.0"},"canonical_sha256":"1ba8d2573cb3cb29abe2ea315bbdfa5c9dd669d1fa584fd77bc6c7eedad30de0","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-20T00:00:22.214918Z","signature_b64":"S+FqJsMOiemSbAYmZYvErkjoya6lr+aj99CXLT2qnMVUPIUk8H4z6VA1vbtCim6CtxheRfMMZDBHwwffnBV3DQ==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"1ba8d2573cb3cb29abe2ea315bbdfa5c9dd669d1fa584fd77bc6c7eedad30de0","last_reissued_at":"2026-05-20T00:00:22.214132Z","signature_status":"signed_v1","first_computed_at":"2026-05-20T00:00:22.214132Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2507.15778","source_version":2,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-20T00:00:22Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"t430S2Yu1KFEz3i/v9UpFaBjgLlHLTytjRYnlyliMzepiGN15F/fDUEKw+LBDrWg/Rv43RdfsFH4F3TQj++ICA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-21T05:22:12.719980Z"},"content_sha256":"643eef4ce6ac5b97366293d8ef8b6b75d6f7b15aa5963cf9f3dd6e73430a1d62","schema_version":"1.0","event_id":"sha256:643eef4ce6ac5b97366293d8ef8b6b75d6f7b15aa5963cf9f3dd6e73430a1d62"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2025:DOUNEVZ4WPFSTK7C5IYVXPP2LS","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Stabilizing Knowledge, Promoting Reasoning: Dual-Token Constraints for RLVR","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.CL","authors_text":"Fuzheng Zhang, Guorui Zhou, Jiakang Wang, Ling Pan, Runze Liu, Xiu Li","submitted_at":"2025-07-21T16:34:01Z","abstract_excerpt":"Reinforcement Learning with Verifiable Rewards (RLVR) has become an effective post-training method for improving the reasoning abilities of Large Language Models (LLMs). However, existing methods mainly apply uniform optimization constraints across all tokens, ignoring their heterogeneous roles. Prior work shows that high-entropy tokens are closely tied to reasoning, while low-entropy tokens primarily encode factual knowledge, and recent approaches attempt to exploit this distinction by isolating token updates via masking or asynchronous training. We argue that such isolation breaks the sequen"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2507.15778","kind":"arxiv","version":2},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2507.15778/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-20T00:00:22Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"7jXlhJQnCX5PtzjOOS2warFUscxMou6iYXTOHa5dM1PAAlfJEn36wdFuy0K/kW6gUEHR+CTAKfYnoHqduUYHDQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-21T05:22:12.720652Z"},"content_sha256":"be71d9d54863f6726c992d71a73345f471e64a2fb6f8f5714094c38585368733","schema_version":"1.0","event_id":"sha256:be71d9d54863f6726c992d71a73345f471e64a2fb6f8f5714094c38585368733"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/DOUNEVZ4WPFSTK7C5IYVXPP2LS/bundle.json","state_url":"https://pith.science/pith/DOUNEVZ4WPFSTK7C5IYVXPP2LS/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/DOUNEVZ4WPFSTK7C5IYVXPP2LS/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-21T05:22:12Z","links":{"resolver":"https://pith.science/pith/DOUNEVZ4WPFSTK7C5IYVXPP2LS","bundle":"https://pith.science/pith/DOUNEVZ4WPFSTK7C5IYVXPP2LS/bundle.json","state":"https://pith.science/pith/DOUNEVZ4WPFSTK7C5IYVXPP2LS/state.json","well_known_bundle":"https://pith.science/.well-known/pith/DOUNEVZ4WPFSTK7C5IYVXPP2LS/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2025:DOUNEVZ4WPFSTK7C5IYVXPP2LS","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"a04bd231108d166830be735f17c1d26f3ac349f7e553b2d478957e3449a2e952","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2025-07-21T16:34:01Z","title_canon_sha256":"d7f7b081b9a47a2da71f5c5ccbc4c867bcf25a686a2ca5527b956f3bb0efec16"},"schema_version":"1.0","source":{"id":"2507.15778","kind":"arxiv","version":2}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2507.15778","created_at":"2026-05-20T00:00:22Z"},{"alias_kind":"arxiv_version","alias_value":"2507.15778v2","created_at":"2026-05-20T00:00:22Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2507.15778","created_at":"2026-05-20T00:00:22Z"},{"alias_kind":"pith_short_12","alias_value":"DOUNEVZ4WPFS","created_at":"2026-05-20T00:00:22Z"},{"alias_kind":"pith_short_16","alias_value":"DOUNEVZ4WPFSTK7C","created_at":"2026-05-20T00:00:22Z"},{"alias_kind":"pith_short_8","alias_value":"DOUNEVZ4","created_at":"2026-05-20T00:00:22Z"}],"graph_snapshots":[{"event_id":"sha256:be71d9d54863f6726c992d71a73345f471e64a2fb6f8f5714094c38585368733","target":"graph","created_at":"2026-05-20T00:00:22Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2507.15778/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Reinforcement Learning with Verifiable Rewards (RLVR) has become an effective post-training method for improving the reasoning abilities of Large Language Models (LLMs). However, existing methods mainly apply uniform optimization constraints across all tokens, ignoring their heterogeneous roles. Prior work shows that high-entropy tokens are closely tied to reasoning, while low-entropy tokens primarily encode factual knowledge, and recent approaches attempt to exploit this distinction by isolating token updates via masking or asynchronous training. We argue that such isolation breaks the sequen","authors_text":"Fuzheng Zhang, Guorui Zhou, Jiakang Wang, Ling Pan, Runze Liu, Xiu Li","cross_cats":[],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2025-07-21T16:34:01Z","title":"Stabilizing Knowledge, Promoting Reasoning: Dual-Token Constraints for RLVR"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2507.15778","kind":"arxiv","version":2},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:643eef4ce6ac5b97366293d8ef8b6b75d6f7b15aa5963cf9f3dd6e73430a1d62","target":"record","created_at":"2026-05-20T00:00:22Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"a04bd231108d166830be735f17c1d26f3ac349f7e553b2d478957e3449a2e952","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2025-07-21T16:34:01Z","title_canon_sha256":"d7f7b081b9a47a2da71f5c5ccbc4c867bcf25a686a2ca5527b956f3bb0efec16"},"schema_version":"1.0","source":{"id":"2507.15778","kind":"arxiv","version":2}},"canonical_sha256":"1ba8d2573cb3cb29abe2ea315bbdfa5c9dd669d1fa584fd77bc6c7eedad30de0","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"1ba8d2573cb3cb29abe2ea315bbdfa5c9dd669d1fa584fd77bc6c7eedad30de0","first_computed_at":"2026-05-20T00:00:22.214132Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-20T00:00:22.214132Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"S+FqJsMOiemSbAYmZYvErkjoya6lr+aj99CXLT2qnMVUPIUk8H4z6VA1vbtCim6CtxheRfMMZDBHwwffnBV3DQ==","signature_status":"signed_v1","signed_at":"2026-05-20T00:00:22.214918Z","signed_message":"canonical_sha256_bytes"},"source_id":"2507.15778","source_kind":"arxiv","source_version":2}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:643eef4ce6ac5b97366293d8ef8b6b75d6f7b15aa5963cf9f3dd6e73430a1d62","sha256:be71d9d54863f6726c992d71a73345f471e64a2fb6f8f5714094c38585368733"],"state_sha256":"a75bf1da8e99ed0919898a96fc9fe07fd0cb51dc4b7dd1f0c7adbfd44c32f695"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"PflCAZau/JH7cxxOWXh7carKABljf0z1oAlZClu78fzt1YogINiCVAPFaNTW4ucKox5B4E2oCmX+wt/7I6cEDg==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-21T05:22:12.723680Z","bundle_sha256":"69f80fc54415c0d777e0cb35fa8ad5a84ea45298d9e44f1a701d1a64b0de182d"}}