{"record_type":"pith_number_record","schema_url":"https://pith.science/schemas/pith-number/v1.json","pith_number":"pith:2026:XYJRGK7MC4NKU7MXGE7KE66DGP","short_pith_number":"pith:XYJRGK7M","schema_version":"1.0","canonical_sha256":"be13132bec171aaa7d97313ea27bc333eb01c46697c2fe243a0fc5f395c8f4ad","source":{"kind":"arxiv","id":"2605.28604","version":1},"attestation_state":"computed","paper":{"title":"Mining Multi-Modality Spatio-Temporal Cues for Video Important Person Identification","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.AI"],"primary_cat":"cs.CV","authors_text":"Bin Yang, Mang Ye, Minglei Yang, Wenke Huang, Xiao Wang, Xin Xu, Zheng Wang","submitted_at":"2026-05-27T15:20:06Z","abstract_excerpt":"Identifying key individuals in video scenes is essential for applications such as automated video editing and intelligent surveillance. Current methods primarily focus on static images and immediate visual cues, overlooking the rich spatio-temporal information in videos. This leads to the phenomenon of Temporal Importance Shift (TIS), wherein individuals deemed significant in early frames may be demoted as the entire temporal context is considered. To address this, we introduce the Video Important Person (VIP) identification task, aimed at automatically identifying the most influential individ"},"verification_status":{"content_addressed":true,"pith_receipt":true,"author_attested":false,"weak_author_claims":0,"strong_author_claims":0,"externally_anchored":false,"storage_verified":false,"citation_signatures":0,"replication_records":0,"graph_snapshot":true,"references_resolved":false,"formal_links_present":false},"canonical_record":{"source":{"id":"2605.28604","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2026-05-27T15:20:06Z","cross_cats_sorted":["cs.AI"],"title_canon_sha256":"6a66802f0d78a0a3d7e1c0c962d0c8f0a84d5e1252e10b2c86d74842769d91f8","abstract_canon_sha256":"ccf3006d47783be9380fbe5383ad080153ea61270185c6afe7f1bbfc512fd04f"},"schema_version":"1.0"},"receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-28T02:04:57.566121Z","signature_b64":"fEUZYS2GZYumivrrJUYaxtQZzpKYi6PlgjPE9QNpSnya+UhX+EVnbSX9cnBQd16i9jazoZj/wL4Lq0pyHtFbCQ==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"be13132bec171aaa7d97313ea27bc333eb01c46697c2fe243a0fc5f395c8f4ad","last_reissued_at":"2026-05-28T02:04:57.565709Z","signature_status":"signed_v1","first_computed_at":"2026-05-28T02:04:57.565709Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"graph_snapshot":{"paper":{"title":"Mining Multi-Modality Spatio-Temporal Cues for Video Important Person Identification","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.AI"],"primary_cat":"cs.CV","authors_text":"Bin Yang, Mang Ye, Minglei Yang, Wenke Huang, Xiao Wang, Xin Xu, Zheng Wang","submitted_at":"2026-05-27T15:20:06Z","abstract_excerpt":"Identifying key individuals in video scenes is essential for applications such as automated video editing and intelligent surveillance. Current methods primarily focus on static images and immediate visual cues, overlooking the rich spatio-temporal information in videos. This leads to the phenomenon of Temporal Importance Shift (TIS), wherein individuals deemed significant in early frames may be demoted as the entire temporal context is considered. To address this, we introduce the Video Important Person (VIP) identification task, aimed at automatically identifying the most influential individ"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2605.28604","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2605.28604/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"aliases":[{"alias_kind":"arxiv","alias_value":"2605.28604","created_at":"2026-05-28T02:04:57.565767+00:00"},{"alias_kind":"arxiv_version","alias_value":"2605.28604v1","created_at":"2026-05-28T02:04:57.565767+00:00"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.28604","created_at":"2026-05-28T02:04:57.565767+00:00"},{"alias_kind":"pith_short_12","alias_value":"XYJRGK7MC4NK","created_at":"2026-05-28T02:04:57.565767+00:00"},{"alias_kind":"pith_short_16","alias_value":"XYJRGK7MC4NKU7MX","created_at":"2026-05-28T02:04:57.565767+00:00"},{"alias_kind":"pith_short_8","alias_value":"XYJRGK7M","created_at":"2026-05-28T02:04:57.565767+00:00"}],"events":[],"event_summary":{},"paper_claims":[],"inbound_citations":{"count":0,"internal_anchor_count":0,"sample":[]},"formal_canon":{"evidence_count":0,"sample":[],"anchors":[]},"links":{"html":"https://pith.science/pith/XYJRGK7MC4NKU7MXGE7KE66DGP","json":"https://pith.science/pith/XYJRGK7MC4NKU7MXGE7KE66DGP.json","graph_json":"https://pith.science/api/pith-number/XYJRGK7MC4NKU7MXGE7KE66DGP/graph.json","events_json":"https://pith.science/api/pith-number/XYJRGK7MC4NKU7MXGE7KE66DGP/events.json","paper":"https://pith.science/paper/XYJRGK7M"},"agent_actions":{"view_html":"https://pith.science/pith/XYJRGK7MC4NKU7MXGE7KE66DGP","download_json":"https://pith.science/pith/XYJRGK7MC4NKU7MXGE7KE66DGP.json","view_paper":"https://pith.science/paper/XYJRGK7M","resolve_alias":"https://pith.science/api/pith-number/resolve?arxiv=2605.28604&json=true","fetch_graph":"https://pith.science/api/pith-number/XYJRGK7MC4NKU7MXGE7KE66DGP/graph.json","fetch_events":"https://pith.science/api/pith-number/XYJRGK7MC4NKU7MXGE7KE66DGP/events.json","actions":{"anchor_timestamp":"https://pith.science/pith/XYJRGK7MC4NKU7MXGE7KE66DGP/action/timestamp_anchor","attest_storage":"https://pith.science/pith/XYJRGK7MC4NKU7MXGE7KE66DGP/action/storage_attestation","attest_author":"https://pith.science/pith/XYJRGK7MC4NKU7MXGE7KE66DGP/action/author_attestation","sign_citation":"https://pith.science/pith/XYJRGK7MC4NKU7MXGE7KE66DGP/action/citation_signature","submit_replication":"https://pith.science/pith/XYJRGK7MC4NKU7MXGE7KE66DGP/action/replication_record"}},"created_at":"2026-05-28T02:04:57.565767+00:00","updated_at":"2026-05-28T02:04:57.565767+00:00"}