{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2025:RLLBD3WSTZA47IHNV3WVL7XON4","short_pith_number":"pith:RLLBD3WS","canonical_record":{"source":{"id":"2507.21433","kind":"arxiv","version":3},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2025-07-29T02:05:51Z","cross_cats_sorted":["cs.AI"],"title_canon_sha256":"1ee423a8466bd8d6169947ba044f624f2219043a49246dd5c9a5316c19f43637","abstract_canon_sha256":"de9bf8c21d8a10d265b7608feb46c5eb3ba5c796f6080cd5b4df8ecd10a9915e"},"schema_version":"1.0"},"canonical_sha256":"8ad611eed29e41cfa0edaeed55feee6f247d2e50a053c620d1a2163523e6bc69","source":{"kind":"arxiv","id":"2507.21433","version":3},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2507.21433","created_at":"2026-05-17T23:39:17Z"},{"alias_kind":"arxiv_version","alias_value":"2507.21433v3","created_at":"2026-05-17T23:39:17Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2507.21433","created_at":"2026-05-17T23:39:17Z"},{"alias_kind":"pith_short_12","alias_value":"RLLBD3WSTZA4","created_at":"2026-05-18T12:33:37Z"},{"alias_kind":"pith_short_16","alias_value":"RLLBD3WSTZA47IHN","created_at":"2026-05-18T12:33:37Z"},{"alias_kind":"pith_short_8","alias_value":"RLLBD3WS","created_at":"2026-05-18T12:33:37Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2025:RLLBD3WSTZA47IHNV3WVL7XON4","target":"record","payload":{"canonical_record":{"source":{"id":"2507.21433","kind":"arxiv","version":3},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2025-07-29T02:05:51Z","cross_cats_sorted":["cs.AI"],"title_canon_sha256":"1ee423a8466bd8d6169947ba044f624f2219043a49246dd5c9a5316c19f43637","abstract_canon_sha256":"de9bf8c21d8a10d265b7608feb46c5eb3ba5c796f6080cd5b4df8ecd10a9915e"},"schema_version":"1.0"},"canonical_sha256":"8ad611eed29e41cfa0edaeed55feee6f247d2e50a053c620d1a2163523e6bc69","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-17T23:39:17.798668Z","signature_b64":"Vz3tB7/l4+H1TJ1N7wJO789GcB1tpyxEbxuq/bB4NWSij30amJIFooEWJszNxkXqqMJ19k5lInvZfC+P8Rk9BQ==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"8ad611eed29e41cfa0edaeed55feee6f247d2e50a053c620d1a2163523e6bc69","last_reissued_at":"2026-05-17T23:39:17.798003Z","signature_status":"signed_v1","first_computed_at":"2026-05-17T23:39:17.798003Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2507.21433","source_version":3,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-17T23:39:17Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"jycJ4xO9W5Emg26Dd1X3Nq5U8k7J43S6nQ2Bfc9UsyXVPvoGlLFJkGf4NyKRk2rXGfH/i+HSN8nUksKLq/mmAQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-21T15:13:17.971744Z"},"content_sha256":"51f5e738a5b92f87bdb9c0eb3d4d55b8946191a63b073754234a45a0aa6c5549","schema_version":"1.0","event_id":"sha256:51f5e738a5b92f87bdb9c0eb3d4d55b8946191a63b073754234a45a0aa6c5549"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2025:RLLBD3WSTZA47IHNV3WVL7XON4","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"ReasonCache: Accelerating Large Reasoning Model Serving through KV Cache Sharing","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.AI"],"primary_cat":"cs.LG","authors_text":"Hong Xu, Jingzong Li, Kaiwen Chen, Minchen Yu, Xin Tan","submitted_at":"2025-07-29T02:05:51Z","abstract_excerpt":"Large Reasoning Models (LRMs) are becoming integral to many AI inference systems, enhancing their capabilities with advanced reasoning. However, deploying these models in production environments presents a significant QoS challenge: the substantial memory overhead from their long, auto-regressive inference processes severely limits throughput and increases latency, thereby affecting the quality of service for concurrent users. We observe that LRMs frequently generate highly similar intermediate reasoning steps, which, in turn, correspond to highly similar KV cache states across layers. Buildin"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2507.21433","kind":"arxiv","version":3},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-17T23:39:17Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"BGg0aGBpkhZ3ntdV4TqbkQpH6MjwH50LGPZ1XPO4b19+VJeb3IzholPVzg27tY5Kf8c2Ts/3QZrUizVKfS67Dg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-21T15:13:17.972394Z"},"content_sha256":"2ba271edf9bbd844c6962b1f342c230bb59e2ee1187f6b63e98337229ff63242","schema_version":"1.0","event_id":"sha256:2ba271edf9bbd844c6962b1f342c230bb59e2ee1187f6b63e98337229ff63242"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/RLLBD3WSTZA47IHNV3WVL7XON4/bundle.json","state_url":"https://pith.science/pith/RLLBD3WSTZA47IHNV3WVL7XON4/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/RLLBD3WSTZA47IHNV3WVL7XON4/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-21T15:13:17Z","links":{"resolver":"https://pith.science/pith/RLLBD3WSTZA47IHNV3WVL7XON4","bundle":"https://pith.science/pith/RLLBD3WSTZA47IHNV3WVL7XON4/bundle.json","state":"https://pith.science/pith/RLLBD3WSTZA47IHNV3WVL7XON4/state.json","well_known_bundle":"https://pith.science/.well-known/pith/RLLBD3WSTZA47IHNV3WVL7XON4/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2025:RLLBD3WSTZA47IHNV3WVL7XON4","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"de9bf8c21d8a10d265b7608feb46c5eb3ba5c796f6080cd5b4df8ecd10a9915e","cross_cats_sorted":["cs.AI"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2025-07-29T02:05:51Z","title_canon_sha256":"1ee423a8466bd8d6169947ba044f624f2219043a49246dd5c9a5316c19f43637"},"schema_version":"1.0","source":{"id":"2507.21433","kind":"arxiv","version":3}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2507.21433","created_at":"2026-05-17T23:39:17Z"},{"alias_kind":"arxiv_version","alias_value":"2507.21433v3","created_at":"2026-05-17T23:39:17Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2507.21433","created_at":"2026-05-17T23:39:17Z"},{"alias_kind":"pith_short_12","alias_value":"RLLBD3WSTZA4","created_at":"2026-05-18T12:33:37Z"},{"alias_kind":"pith_short_16","alias_value":"RLLBD3WSTZA47IHN","created_at":"2026-05-18T12:33:37Z"},{"alias_kind":"pith_short_8","alias_value":"RLLBD3WS","created_at":"2026-05-18T12:33:37Z"}],"graph_snapshots":[{"event_id":"sha256:2ba271edf9bbd844c6962b1f342c230bb59e2ee1187f6b63e98337229ff63242","target":"graph","created_at":"2026-05-17T23:39:17Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Large Reasoning Models (LRMs) are becoming integral to many AI inference systems, enhancing their capabilities with advanced reasoning. However, deploying these models in production environments presents a significant QoS challenge: the substantial memory overhead from their long, auto-regressive inference processes severely limits throughput and increases latency, thereby affecting the quality of service for concurrent users. We observe that LRMs frequently generate highly similar intermediate reasoning steps, which, in turn, correspond to highly similar KV cache states across layers. Buildin","authors_text":"Hong Xu, Jingzong Li, Kaiwen Chen, Minchen Yu, Xin Tan","cross_cats":["cs.AI"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2025-07-29T02:05:51Z","title":"ReasonCache: Accelerating Large Reasoning Model Serving through KV Cache Sharing"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2507.21433","kind":"arxiv","version":3},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:51f5e738a5b92f87bdb9c0eb3d4d55b8946191a63b073754234a45a0aa6c5549","target":"record","created_at":"2026-05-17T23:39:17Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"de9bf8c21d8a10d265b7608feb46c5eb3ba5c796f6080cd5b4df8ecd10a9915e","cross_cats_sorted":["cs.AI"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2025-07-29T02:05:51Z","title_canon_sha256":"1ee423a8466bd8d6169947ba044f624f2219043a49246dd5c9a5316c19f43637"},"schema_version":"1.0","source":{"id":"2507.21433","kind":"arxiv","version":3}},"canonical_sha256":"8ad611eed29e41cfa0edaeed55feee6f247d2e50a053c620d1a2163523e6bc69","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"8ad611eed29e41cfa0edaeed55feee6f247d2e50a053c620d1a2163523e6bc69","first_computed_at":"2026-05-17T23:39:17.798003Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-17T23:39:17.798003Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"Vz3tB7/l4+H1TJ1N7wJO789GcB1tpyxEbxuq/bB4NWSij30amJIFooEWJszNxkXqqMJ19k5lInvZfC+P8Rk9BQ==","signature_status":"signed_v1","signed_at":"2026-05-17T23:39:17.798668Z","signed_message":"canonical_sha256_bytes"},"source_id":"2507.21433","source_kind":"arxiv","source_version":3}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:51f5e738a5b92f87bdb9c0eb3d4d55b8946191a63b073754234a45a0aa6c5549","sha256:2ba271edf9bbd844c6962b1f342c230bb59e2ee1187f6b63e98337229ff63242"],"state_sha256":"14bdf684780941cd20c56c156316a13cd0973a175416dae12e19d5c54535d892"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"ItYTjImWvYxSz+GNuFkL6GRMfnkX0bd1aqN3DuqbaAeh+S/XJnYbSfCUY5JN+ztsBmRFA6YjyJy7qtpQXB+nCg==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-21T15:13:17.975584Z","bundle_sha256":"a9c020d1c6cf44d6a8da8d875e89aa54b2478e32a441bcc6b83aa3ce57cf6dfc"}}