{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:KY6JLRFO6DWHMVWM6LQSY7OUQ2","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"bd63be4649c25f0d4dd2462720814430754fecfb1029ed03d0755d5192b9d8bb","cross_cats_sorted":["cs.AI"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2026-01-30T05:16:12Z","title_canon_sha256":"13855a66af6c0a99e06a67418f41586ee2e5d82d2234e97cd49acefb147962b9"},"schema_version":"1.0","source":{"id":"2601.22574","kind":"arxiv","version":2}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2601.22574","created_at":"2026-06-08T01:03:56Z"},{"alias_kind":"arxiv_version","alias_value":"2601.22574v2","created_at":"2026-06-08T01:03:56Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2601.22574","created_at":"2026-06-08T01:03:56Z"},{"alias_kind":"pith_short_12","alias_value":"KY6JLRFO6DWH","created_at":"2026-06-08T01:03:56Z"},{"alias_kind":"pith_short_16","alias_value":"KY6JLRFO6DWHMVWM","created_at":"2026-06-08T01:03:56Z"},{"alias_kind":"pith_short_8","alias_value":"KY6JLRFO","created_at":"2026-06-08T01:03:56Z"}],"graph_snapshots":[{"event_id":"sha256:569268bd59eac1119cf611bbb4b56200fc58d373f4d5d45124818d9fe0befe0d","target":"graph","created_at":"2026-06-08T01:03:56Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2601.22574/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Although Video Large Multimodal Models have achieved strong performance in video understanding, they still suffer from hallucination. Existing inference-time intervention methods usually modify videos under the contrastive decoding framework, but their heuristic designs bring limited improvements and increase inference latency. To address these issues, we propose ViSSRes, an inference-time intervention method that enhances video representations through a lightweight MLP-style network. Specifically, we use a contrastive random walk approach to characterize the spatiotemporal consistency of vide","authors_text":"Han Bao, Jinman Zhao, Tong Zhang, Wenbin Xing, Wenzhi Chen, Xingguo Xu, Yuansheng Gao, Zonghui Wang","cross_cats":["cs.AI"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2026-01-30T05:16:12Z","title":"Enhancing Video Representations with Spatiotemporal-Semantic Residual to Mitigate Hallucinations in Video Large Multimodal Models"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2601.22574","kind":"arxiv","version":2},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:99dbc326b42a25922af2e40361e3cf1ca843afaba90e79f53c0bebd7a5de1b64","target":"record","created_at":"2026-06-08T01:03:56Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"bd63be4649c25f0d4dd2462720814430754fecfb1029ed03d0755d5192b9d8bb","cross_cats_sorted":["cs.AI"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2026-01-30T05:16:12Z","title_canon_sha256":"13855a66af6c0a99e06a67418f41586ee2e5d82d2234e97cd49acefb147962b9"},"schema_version":"1.0","source":{"id":"2601.22574","kind":"arxiv","version":2}},"canonical_sha256":"563c95c4aef0ec7656ccf2e12c7dd48685022b8184388b5cca054f2d6bdb9744","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"563c95c4aef0ec7656ccf2e12c7dd48685022b8184388b5cca054f2d6bdb9744","first_computed_at":"2026-06-08T01:03:56.607200Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-06-08T01:03:56.607200Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"mIXFfibm3PDJDcm2E2h0Esjz8Y6YbHagCn+xbv7L75gF56EZ9KcZrmf1THi0XBrFEXcwxnnlNJYgfGQ59YEiDw==","signature_status":"signed_v1","signed_at":"2026-06-08T01:03:56.608107Z","signed_message":"canonical_sha256_bytes"},"source_id":"2601.22574","source_kind":"arxiv","source_version":2}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:99dbc326b42a25922af2e40361e3cf1ca843afaba90e79f53c0bebd7a5de1b64","sha256:569268bd59eac1119cf611bbb4b56200fc58d373f4d5d45124818d9fe0befe0d"],"state_sha256":"39e6b4b42d6f66c9953dbd213b180fd46be9f6eb19c63cc20eb49e355c4aac78"}