{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2025:U4UJ2ELZGA3OUGA3DULMXA67TX","short_pith_number":"pith:U4UJ2ELZ","canonical_record":{"source":{"id":"2510.00231","kind":"arxiv","version":2},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2025-09-30T19:55:26Z","cross_cats_sorted":["cs.AI"],"title_canon_sha256":"c601479fdd1965425b3cd2e4d82322594688318a3a822b96cbd93dec6a34f2eb","abstract_canon_sha256":"81a4a0ed10bfaa7c53b671a465caeeb0838cea35ddb320dc389b908cc99f8f87"},"schema_version":"1.0"},"canonical_sha256":"a7289d11793036ea181b1d16cb83df9de5baede13fda811e8cb878f36dc018ed","source":{"kind":"arxiv","id":"2510.00231","version":2},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2510.00231","created_at":"2026-05-17T23:39:17Z"},{"alias_kind":"arxiv_version","alias_value":"2510.00231v2","created_at":"2026-05-17T23:39:17Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2510.00231","created_at":"2026-05-17T23:39:17Z"},{"alias_kind":"pith_short_12","alias_value":"U4UJ2ELZGA3O","created_at":"2026-05-18T12:33:37Z"},{"alias_kind":"pith_short_16","alias_value":"U4UJ2ELZGA3OUGA3","created_at":"2026-05-18T12:33:37Z"},{"alias_kind":"pith_short_8","alias_value":"U4UJ2ELZ","created_at":"2026-05-18T12:33:37Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2025:U4UJ2ELZGA3OUGA3DULMXA67TX","target":"record","payload":{"canonical_record":{"source":{"id":"2510.00231","kind":"arxiv","version":2},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2025-09-30T19:55:26Z","cross_cats_sorted":["cs.AI"],"title_canon_sha256":"c601479fdd1965425b3cd2e4d82322594688318a3a822b96cbd93dec6a34f2eb","abstract_canon_sha256":"81a4a0ed10bfaa7c53b671a465caeeb0838cea35ddb320dc389b908cc99f8f87"},"schema_version":"1.0"},"canonical_sha256":"a7289d11793036ea181b1d16cb83df9de5baede13fda811e8cb878f36dc018ed","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-17T23:39:17.383585Z","signature_b64":"Rvu9FTJcywWhrUfnqRy0E8kyl1gJb7sS40QKWlPV5kpw6o6V5a4EC2Z/Pjl3YmCUXzWXmuPILxDXpH8uAcudCg==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"a7289d11793036ea181b1d16cb83df9de5baede13fda811e8cb878f36dc018ed","last_reissued_at":"2026-05-17T23:39:17.382808Z","signature_status":"signed_v1","first_computed_at":"2026-05-17T23:39:17.382808Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2510.00231","source_version":2,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-17T23:39:17Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"EVLseoHpdoZfksoluPosL95nZ+eydyF+6k0fWlFfAH4dwIJwSaIjI1Ss4wB39HMy+muQyT/ibUoUJmYA6627AQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-02T23:08:51.898501Z"},"content_sha256":"f4c9428684db6a062104487314b1e0607a330eeefc8f946c410cb1b186d56f73","schema_version":"1.0","event_id":"sha256:f4c9428684db6a062104487314b1e0607a330eeefc8f946c410cb1b186d56f73"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2025:U4UJ2ELZGA3OUGA3DULMXA67TX","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"The Pitfalls of KV Cache Compression","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":["cs.AI"],"primary_cat":"cs.LG","authors_text":"Aditya Grover, Alex Chen, Daniel Israel, Guy Van den Broeck, Renato Geh","submitted_at":"2025-09-30T19:55:26Z","abstract_excerpt":"KV cache compression promises increased throughput and efficiency with negligible loss in performance. While the gains in throughput are indisputable and recent literature has indeed shown minimal degradation on particular benchmarks, in general the consequences of compression in realistic scenarios such as multi-instruction prompting have been insufficiently studied. In this paper, we identify several pitfalls that practitioners should be aware of when deploying KV cache compressed LLMs. We evaluate five KV cache compression methods (StreamingLLM, SnapKV, TOVA, H2O, and K-Norm) on Llama3.1 8B"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2510.00231","kind":"arxiv","version":2},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-17T23:39:17Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"yvJQQbrKHTRq6QWQjCrn5tSBfGP6HSTZ2LuWw11zj1tquoA2fTdoSqkjouTCSm3dxxsSnaSQJyH1cN8SoBAXDA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-02T23:08:51.898840Z"},"content_sha256":"6adbfd77c165178864f5b3851a48f41f58c1232f1132b74c3d2032463aea15d9","schema_version":"1.0","event_id":"sha256:6adbfd77c165178864f5b3851a48f41f58c1232f1132b74c3d2032463aea15d9"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/U4UJ2ELZGA3OUGA3DULMXA67TX/bundle.json","state_url":"https://pith.science/pith/U4UJ2ELZGA3OUGA3DULMXA67TX/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/U4UJ2ELZGA3OUGA3DULMXA67TX/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-02T23:08:51Z","links":{"resolver":"https://pith.science/pith/U4UJ2ELZGA3OUGA3DULMXA67TX","bundle":"https://pith.science/pith/U4UJ2ELZGA3OUGA3DULMXA67TX/bundle.json","state":"https://pith.science/pith/U4UJ2ELZGA3OUGA3DULMXA67TX/state.json","well_known_bundle":"https://pith.science/.well-known/pith/U4UJ2ELZGA3OUGA3DULMXA67TX/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2025:U4UJ2ELZGA3OUGA3DULMXA67TX","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"81a4a0ed10bfaa7c53b671a465caeeb0838cea35ddb320dc389b908cc99f8f87","cross_cats_sorted":["cs.AI"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2025-09-30T19:55:26Z","title_canon_sha256":"c601479fdd1965425b3cd2e4d82322594688318a3a822b96cbd93dec6a34f2eb"},"schema_version":"1.0","source":{"id":"2510.00231","kind":"arxiv","version":2}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2510.00231","created_at":"2026-05-17T23:39:17Z"},{"alias_kind":"arxiv_version","alias_value":"2510.00231v2","created_at":"2026-05-17T23:39:17Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2510.00231","created_at":"2026-05-17T23:39:17Z"},{"alias_kind":"pith_short_12","alias_value":"U4UJ2ELZGA3O","created_at":"2026-05-18T12:33:37Z"},{"alias_kind":"pith_short_16","alias_value":"U4UJ2ELZGA3OUGA3","created_at":"2026-05-18T12:33:37Z"},{"alias_kind":"pith_short_8","alias_value":"U4UJ2ELZ","created_at":"2026-05-18T12:33:37Z"}],"graph_snapshots":[{"event_id":"sha256:6adbfd77c165178864f5b3851a48f41f58c1232f1132b74c3d2032463aea15d9","target":"graph","created_at":"2026-05-17T23:39:17Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"KV cache compression promises increased throughput and efficiency with negligible loss in performance. While the gains in throughput are indisputable and recent literature has indeed shown minimal degradation on particular benchmarks, in general the consequences of compression in realistic scenarios such as multi-instruction prompting have been insufficiently studied. In this paper, we identify several pitfalls that practitioners should be aware of when deploying KV cache compressed LLMs. We evaluate five KV cache compression methods (StreamingLLM, SnapKV, TOVA, H2O, and K-Norm) on Llama3.1 8B","authors_text":"Aditya Grover, Alex Chen, Daniel Israel, Guy Van den Broeck, Renato Geh","cross_cats":["cs.AI"],"headline":"","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2025-09-30T19:55:26Z","title":"The Pitfalls of KV Cache Compression"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2510.00231","kind":"arxiv","version":2},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:f4c9428684db6a062104487314b1e0607a330eeefc8f946c410cb1b186d56f73","target":"record","created_at":"2026-05-17T23:39:17Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"81a4a0ed10bfaa7c53b671a465caeeb0838cea35ddb320dc389b908cc99f8f87","cross_cats_sorted":["cs.AI"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2025-09-30T19:55:26Z","title_canon_sha256":"c601479fdd1965425b3cd2e4d82322594688318a3a822b96cbd93dec6a34f2eb"},"schema_version":"1.0","source":{"id":"2510.00231","kind":"arxiv","version":2}},"canonical_sha256":"a7289d11793036ea181b1d16cb83df9de5baede13fda811e8cb878f36dc018ed","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"a7289d11793036ea181b1d16cb83df9de5baede13fda811e8cb878f36dc018ed","first_computed_at":"2026-05-17T23:39:17.382808Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-17T23:39:17.382808Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"Rvu9FTJcywWhrUfnqRy0E8kyl1gJb7sS40QKWlPV5kpw6o6V5a4EC2Z/Pjl3YmCUXzWXmuPILxDXpH8uAcudCg==","signature_status":"signed_v1","signed_at":"2026-05-17T23:39:17.383585Z","signed_message":"canonical_sha256_bytes"},"source_id":"2510.00231","source_kind":"arxiv","source_version":2}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:f4c9428684db6a062104487314b1e0607a330eeefc8f946c410cb1b186d56f73","sha256:6adbfd77c165178864f5b3851a48f41f58c1232f1132b74c3d2032463aea15d9"],"state_sha256":"f4a58f5fde74c8bdc43c898f2fdf367ec1d00bea19475ee7b7cc83de17177168"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"5yz+th7THW7+AILToeQmzdQmKinzGnMm+qtGfC2bljQXtAGIHPDEdgaW7jV8gP5z5J21kSA8Bi6V3T/XnQUmCQ==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-02T23:08:51.900712Z","bundle_sha256":"cf040d097fc6cd9551beccd69663f90fee0c53df2ad055767836eb1ebd463c9b"}}