{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2025:MBWZHDAAQBYOPDA7UJ37HGPFNZ","short_pith_number":"pith:MBWZHDAA","canonical_record":{"source":{"id":"2505.19155","kind":"arxiv","version":2},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CV","submitted_at":"2025-05-25T14:09:28Z","cross_cats_sorted":["cs.CL"],"title_canon_sha256":"8383d6d73690403cf3c9c28906119092a8895d1cdae2f710cc8a5fa70cefb353","abstract_canon_sha256":"a9ee7423b1336a082d4d4a1c2477a6785f87906137d622720053910e40939eec"},"schema_version":"1.0"},"canonical_sha256":"606d938c008070e78c1fa277f399e56e5572147a1ff5b44205481849f6bbd2cf","source":{"kind":"arxiv","id":"2505.19155","version":2},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2505.19155","created_at":"2026-05-20T00:04:09Z"},{"alias_kind":"arxiv_version","alias_value":"2505.19155v2","created_at":"2026-05-20T00:04:09Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2505.19155","created_at":"2026-05-20T00:04:09Z"},{"alias_kind":"pith_short_12","alias_value":"MBWZHDAAQBYO","created_at":"2026-05-20T00:04:09Z"},{"alias_kind":"pith_short_16","alias_value":"MBWZHDAAQBYOPDA7","created_at":"2026-05-20T00:04:09Z"},{"alias_kind":"pith_short_8","alias_value":"MBWZHDAA","created_at":"2026-05-20T00:04:09Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2025:MBWZHDAAQBYOPDA7UJ37HGPFNZ","target":"record","payload":{"canonical_record":{"source":{"id":"2505.19155","kind":"arxiv","version":2},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CV","submitted_at":"2025-05-25T14:09:28Z","cross_cats_sorted":["cs.CL"],"title_canon_sha256":"8383d6d73690403cf3c9c28906119092a8895d1cdae2f710cc8a5fa70cefb353","abstract_canon_sha256":"a9ee7423b1336a082d4d4a1c2477a6785f87906137d622720053910e40939eec"},"schema_version":"1.0"},"canonical_sha256":"606d938c008070e78c1fa277f399e56e5572147a1ff5b44205481849f6bbd2cf","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-20T00:04:09.712737Z","signature_b64":"UxXL5wwLd5FynzSVznydwOrs1pN2N8vOx0vYWXIeimtJlxgL6QUr4gTzzC5S9M+p1Dt5JWcIwlXMhS39tHqCAw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"606d938c008070e78c1fa277f399e56e5572147a1ff5b44205481849f6bbd2cf","last_reissued_at":"2026-05-20T00:04:09.712069Z","signature_status":"signed_v1","first_computed_at":"2026-05-20T00:04:09.712069Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2505.19155","source_version":2,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-20T00:04:09Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"53Pq5SoS/zt3oqEwUC+xAt1u3FCoP8c3xHR8mmaB+24b+jOA69oJjH02cKFLvYuzIEx2zr8U65CTWHqWGSzpDQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-25T12:42:10.418301Z"},"content_sha256":"085aad87636e97f9eecd0692fcbb8c91d9c51a8a20a22e3585351aa9a20e361f","schema_version":"1.0","event_id":"sha256:085aad87636e97f9eecd0692fcbb8c91d9c51a8a20a22e3585351aa9a20e361f"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2025:MBWZHDAAQBYOPDA7UJ37HGPFNZ","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Sparse-to-Dense: A Free Lunch for Lossless Acceleration of Video Understanding in LLMs","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":["cs.CL"],"primary_cat":"cs.CV","authors_text":"Cunxiao Du, Fengzhuo Zhang, Jiawei Wu, Qian Liu, Sicheng Yu, Wei Gao, Xuan Zhang","submitted_at":"2025-05-25T14:09:28Z","abstract_excerpt":"Due to the auto-regressive nature of current video large language models (Video-LLMs), the inference latency increases as the input sequence length grows, posing challenges for the efficient processing of video sequences that are usually very long. We observe that during decoding, the attention scores of most tokens in Video-LLMs tend to be sparse and concentrated, with only certain tokens requiring comprehensive full attention. Based on this insight, we introduce Sparse-to-Dense (StD), a novel decoding strategy that integrates two distinct modules: one leveraging sparse top-K attention and th"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2505.19155","kind":"arxiv","version":2},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2505.19155/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-20T00:04:09Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"INupXnnpBdXR/rD2x5Hny7Z1cTtsgyEbRC6ePe2LEbMPmrjE4Va8SdhKa6yLGSyhQNhHrV45OLb3OxFaIb3ZDA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-25T12:42:10.419077Z"},"content_sha256":"046d595069fe43c29cc1496e8a8e57accc1e8b74eb7f10c1b71254eaa92aaab7","schema_version":"1.0","event_id":"sha256:046d595069fe43c29cc1496e8a8e57accc1e8b74eb7f10c1b71254eaa92aaab7"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/MBWZHDAAQBYOPDA7UJ37HGPFNZ/bundle.json","state_url":"https://pith.science/pith/MBWZHDAAQBYOPDA7UJ37HGPFNZ/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/MBWZHDAAQBYOPDA7UJ37HGPFNZ/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-25T12:42:10Z","links":{"resolver":"https://pith.science/pith/MBWZHDAAQBYOPDA7UJ37HGPFNZ","bundle":"https://pith.science/pith/MBWZHDAAQBYOPDA7UJ37HGPFNZ/bundle.json","state":"https://pith.science/pith/MBWZHDAAQBYOPDA7UJ37HGPFNZ/state.json","well_known_bundle":"https://pith.science/.well-known/pith/MBWZHDAAQBYOPDA7UJ37HGPFNZ/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2025:MBWZHDAAQBYOPDA7UJ37HGPFNZ","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"a9ee7423b1336a082d4d4a1c2477a6785f87906137d622720053910e40939eec","cross_cats_sorted":["cs.CL"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CV","submitted_at":"2025-05-25T14:09:28Z","title_canon_sha256":"8383d6d73690403cf3c9c28906119092a8895d1cdae2f710cc8a5fa70cefb353"},"schema_version":"1.0","source":{"id":"2505.19155","kind":"arxiv","version":2}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2505.19155","created_at":"2026-05-20T00:04:09Z"},{"alias_kind":"arxiv_version","alias_value":"2505.19155v2","created_at":"2026-05-20T00:04:09Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2505.19155","created_at":"2026-05-20T00:04:09Z"},{"alias_kind":"pith_short_12","alias_value":"MBWZHDAAQBYO","created_at":"2026-05-20T00:04:09Z"},{"alias_kind":"pith_short_16","alias_value":"MBWZHDAAQBYOPDA7","created_at":"2026-05-20T00:04:09Z"},{"alias_kind":"pith_short_8","alias_value":"MBWZHDAA","created_at":"2026-05-20T00:04:09Z"}],"graph_snapshots":[{"event_id":"sha256:046d595069fe43c29cc1496e8a8e57accc1e8b74eb7f10c1b71254eaa92aaab7","target":"graph","created_at":"2026-05-20T00:04:09Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2505.19155/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Due to the auto-regressive nature of current video large language models (Video-LLMs), the inference latency increases as the input sequence length grows, posing challenges for the efficient processing of video sequences that are usually very long. We observe that during decoding, the attention scores of most tokens in Video-LLMs tend to be sparse and concentrated, with only certain tokens requiring comprehensive full attention. Based on this insight, we introduce Sparse-to-Dense (StD), a novel decoding strategy that integrates two distinct modules: one leveraging sparse top-K attention and th","authors_text":"Cunxiao Du, Fengzhuo Zhang, Jiawei Wu, Qian Liu, Sicheng Yu, Wei Gao, Xuan Zhang","cross_cats":["cs.CL"],"headline":"","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CV","submitted_at":"2025-05-25T14:09:28Z","title":"Sparse-to-Dense: A Free Lunch for Lossless Acceleration of Video Understanding in LLMs"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2505.19155","kind":"arxiv","version":2},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:085aad87636e97f9eecd0692fcbb8c91d9c51a8a20a22e3585351aa9a20e361f","target":"record","created_at":"2026-05-20T00:04:09Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"a9ee7423b1336a082d4d4a1c2477a6785f87906137d622720053910e40939eec","cross_cats_sorted":["cs.CL"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CV","submitted_at":"2025-05-25T14:09:28Z","title_canon_sha256":"8383d6d73690403cf3c9c28906119092a8895d1cdae2f710cc8a5fa70cefb353"},"schema_version":"1.0","source":{"id":"2505.19155","kind":"arxiv","version":2}},"canonical_sha256":"606d938c008070e78c1fa277f399e56e5572147a1ff5b44205481849f6bbd2cf","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"606d938c008070e78c1fa277f399e56e5572147a1ff5b44205481849f6bbd2cf","first_computed_at":"2026-05-20T00:04:09.712069Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-20T00:04:09.712069Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"UxXL5wwLd5FynzSVznydwOrs1pN2N8vOx0vYWXIeimtJlxgL6QUr4gTzzC5S9M+p1Dt5JWcIwlXMhS39tHqCAw==","signature_status":"signed_v1","signed_at":"2026-05-20T00:04:09.712737Z","signed_message":"canonical_sha256_bytes"},"source_id":"2505.19155","source_kind":"arxiv","source_version":2}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:085aad87636e97f9eecd0692fcbb8c91d9c51a8a20a22e3585351aa9a20e361f","sha256:046d595069fe43c29cc1496e8a8e57accc1e8b74eb7f10c1b71254eaa92aaab7"],"state_sha256":"3e5b85abecc2cb353511c377d2bea2a675c5b00814b3abe83ea4b44c4298e40f"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"P6hM60yzQ0P4QumQGfgIPM7geT5Cd+MH56PeigkF3dC9t+4tohEu4KdVvxvq5B2+DS3Lg93wTqU2wf9sipJnCw==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-25T12:42:10.422641Z","bundle_sha256":"0a326148d9635438f72f81ca150dfb4af4d487390b55810f82a0b478b6fb0001"}}