{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2026:5B2BJGIXKA4VWUHOJVHZEJKV73","short_pith_number":"pith:5B2BJGIX","canonical_record":{"source":{"id":"2605.30010","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CV","submitted_at":"2026-05-28T14:36:44Z","cross_cats_sorted":[],"title_canon_sha256":"8576dc9760f568c462d4d2c2aa9c41c06d922561acf0bc4fa71c75cfeeafa956","abstract_canon_sha256":"160947f37d986e9204c917fd0df91248ddf34958f61df4bd44d681198fa6c642"},"schema_version":"1.0"},"canonical_sha256":"e87414991750395b50ee4d4f922555feefc3476770af8fa5459206804cb5088c","source":{"kind":"arxiv","id":"2605.30010","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2605.30010","created_at":"2026-05-29T02:06:06Z"},{"alias_kind":"arxiv_version","alias_value":"2605.30010v1","created_at":"2026-05-29T02:06:06Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.30010","created_at":"2026-05-29T02:06:06Z"},{"alias_kind":"pith_short_12","alias_value":"5B2BJGIXKA4V","created_at":"2026-05-29T02:06:06Z"},{"alias_kind":"pith_short_16","alias_value":"5B2BJGIXKA4VWUHO","created_at":"2026-05-29T02:06:06Z"},{"alias_kind":"pith_short_8","alias_value":"5B2BJGIX","created_at":"2026-05-29T02:06:06Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2026:5B2BJGIXKA4VWUHOJVHZEJKV73","target":"record","payload":{"canonical_record":{"source":{"id":"2605.30010","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CV","submitted_at":"2026-05-28T14:36:44Z","cross_cats_sorted":[],"title_canon_sha256":"8576dc9760f568c462d4d2c2aa9c41c06d922561acf0bc4fa71c75cfeeafa956","abstract_canon_sha256":"160947f37d986e9204c917fd0df91248ddf34958f61df4bd44d681198fa6c642"},"schema_version":"1.0"},"canonical_sha256":"e87414991750395b50ee4d4f922555feefc3476770af8fa5459206804cb5088c","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-29T02:06:06.754567Z","signature_b64":"i4tuaptA1OItpXshgXogdfaxpktgOsoO0UPT8TpPBmBEBc70LrMewzhz1Kq+pGhgsF+/eJ/mLw7Mf/glnvt5DA==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"e87414991750395b50ee4d4f922555feefc3476770af8fa5459206804cb5088c","last_reissued_at":"2026-05-29T02:06:06.753754Z","signature_status":"signed_v1","first_computed_at":"2026-05-29T02:06:06.753754Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2605.30010","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-29T02:06:06Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"ffAfLhBAGLOH5d8ZwRUG/Awk+8BfWJweribdh6u9HvJsWAf3uBxm/zVmrHDwsXBRkQaT2ldFiWAjioJJUS5eBQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-31T15:30:17.293761Z"},"content_sha256":"dee2ef50e3c8f1db5fe576bb1d137819968cf85b7adfcdb7563cd813da719fbe","schema_version":"1.0","event_id":"sha256:dee2ef50e3c8f1db5fe576bb1d137819968cf85b7adfcdb7563cd813da719fbe"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2026:5B2BJGIXKA4VWUHOJVHZEJKV73","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"EarlyTom: Early Token Compression Completes Fast Video Understanding","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":[],"primary_cat":"cs.CV","authors_text":"Chenhaowen Li, Hesong Wang, Huan Wang, Jian Chen, Lu Lu, Qiang Liu, Xin Jin","submitted_at":"2026-05-28T14:36:44Z","abstract_excerpt":"Video large language models (Video-LLMs) have demonstrated strong capabilities in video understanding tasks. However, their practical deployment is still hindered by the inefficiency introduced by processing massive amounts of visual tokens. Although recent approaches achieve extremely low token retention ratios while maintaining accuracy comparable to full-token baselines, most of them perform compression only at the late stage of prefilling, leaving the efficiency of the vision encoder unoptimized. In this paper, we first show that vision encoding contributes a large portion to the time-to-f"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2605.30010","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2605.30010/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-29T02:06:06Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"FZbGEzV7p8ccmt7QTiY3007P0HWgCbj9cmUEAY96SQQJp1nTu/LQvtZ3CMQGwMiRbIQGbQnFpB5EEdoeiZsPCw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-31T15:30:17.294632Z"},"content_sha256":"a35734ab6b48ea65304f76d89d9a1b898a61e761d3c1f2d35a49f221bf8933b6","schema_version":"1.0","event_id":"sha256:a35734ab6b48ea65304f76d89d9a1b898a61e761d3c1f2d35a49f221bf8933b6"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/5B2BJGIXKA4VWUHOJVHZEJKV73/bundle.json","state_url":"https://pith.science/pith/5B2BJGIXKA4VWUHOJVHZEJKV73/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/5B2BJGIXKA4VWUHOJVHZEJKV73/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-31T15:30:17Z","links":{"resolver":"https://pith.science/pith/5B2BJGIXKA4VWUHOJVHZEJKV73","bundle":"https://pith.science/pith/5B2BJGIXKA4VWUHOJVHZEJKV73/bundle.json","state":"https://pith.science/pith/5B2BJGIXKA4VWUHOJVHZEJKV73/state.json","well_known_bundle":"https://pith.science/.well-known/pith/5B2BJGIXKA4VWUHOJVHZEJKV73/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:5B2BJGIXKA4VWUHOJVHZEJKV73","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"160947f37d986e9204c917fd0df91248ddf34958f61df4bd44d681198fa6c642","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CV","submitted_at":"2026-05-28T14:36:44Z","title_canon_sha256":"8576dc9760f568c462d4d2c2aa9c41c06d922561acf0bc4fa71c75cfeeafa956"},"schema_version":"1.0","source":{"id":"2605.30010","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2605.30010","created_at":"2026-05-29T02:06:06Z"},{"alias_kind":"arxiv_version","alias_value":"2605.30010v1","created_at":"2026-05-29T02:06:06Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.30010","created_at":"2026-05-29T02:06:06Z"},{"alias_kind":"pith_short_12","alias_value":"5B2BJGIXKA4V","created_at":"2026-05-29T02:06:06Z"},{"alias_kind":"pith_short_16","alias_value":"5B2BJGIXKA4VWUHO","created_at":"2026-05-29T02:06:06Z"},{"alias_kind":"pith_short_8","alias_value":"5B2BJGIX","created_at":"2026-05-29T02:06:06Z"}],"graph_snapshots":[{"event_id":"sha256:a35734ab6b48ea65304f76d89d9a1b898a61e761d3c1f2d35a49f221bf8933b6","target":"graph","created_at":"2026-05-29T02:06:06Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2605.30010/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Video large language models (Video-LLMs) have demonstrated strong capabilities in video understanding tasks. However, their practical deployment is still hindered by the inefficiency introduced by processing massive amounts of visual tokens. Although recent approaches achieve extremely low token retention ratios while maintaining accuracy comparable to full-token baselines, most of them perform compression only at the late stage of prefilling, leaving the efficiency of the vision encoder unoptimized. In this paper, we first show that vision encoding contributes a large portion to the time-to-f","authors_text":"Chenhaowen Li, Hesong Wang, Huan Wang, Jian Chen, Lu Lu, Qiang Liu, Xin Jin","cross_cats":[],"headline":"","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CV","submitted_at":"2026-05-28T14:36:44Z","title":"EarlyTom: Early Token Compression Completes Fast Video Understanding"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2605.30010","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:dee2ef50e3c8f1db5fe576bb1d137819968cf85b7adfcdb7563cd813da719fbe","target":"record","created_at":"2026-05-29T02:06:06Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"160947f37d986e9204c917fd0df91248ddf34958f61df4bd44d681198fa6c642","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CV","submitted_at":"2026-05-28T14:36:44Z","title_canon_sha256":"8576dc9760f568c462d4d2c2aa9c41c06d922561acf0bc4fa71c75cfeeafa956"},"schema_version":"1.0","source":{"id":"2605.30010","kind":"arxiv","version":1}},"canonical_sha256":"e87414991750395b50ee4d4f922555feefc3476770af8fa5459206804cb5088c","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"e87414991750395b50ee4d4f922555feefc3476770af8fa5459206804cb5088c","first_computed_at":"2026-05-29T02:06:06.753754Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-29T02:06:06.753754Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"i4tuaptA1OItpXshgXogdfaxpktgOsoO0UPT8TpPBmBEBc70LrMewzhz1Kq+pGhgsF+/eJ/mLw7Mf/glnvt5DA==","signature_status":"signed_v1","signed_at":"2026-05-29T02:06:06.754567Z","signed_message":"canonical_sha256_bytes"},"source_id":"2605.30010","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:dee2ef50e3c8f1db5fe576bb1d137819968cf85b7adfcdb7563cd813da719fbe","sha256:a35734ab6b48ea65304f76d89d9a1b898a61e761d3c1f2d35a49f221bf8933b6"],"state_sha256":"00cfb6a485d280e43d7e8093d5312cc5ce68ee1b4d4b75010d0575a1c0cce09b"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"0JzqAUv7khePiA1et4IEr/a4ogfUQukPxPANyqAxV34bnnChwda77RTu8nbbPRVTn1rfMHsDXSVY1ginprRfAw==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-31T15:30:17.298885Z","bundle_sha256":"809ee2bf717bc16f109815e8ecef90225484744fe35dc0709d12e7b5117683e4"}}