{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2026:7SYRR3VBEYZNVKZDGFCYSAL2NQ","short_pith_number":"pith:7SYRR3VB","canonical_record":{"source":{"id":"2605.18547","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.AI","submitted_at":"2026-05-18T15:27:10Z","cross_cats_sorted":[],"title_canon_sha256":"8f4241e5787ca1ab09335f58911b0ed983eb33f507a74410f70db2d747af1ab6","abstract_canon_sha256":"7c96df8125ff15969bd55dfc5ad2ae2a6d6c4e20db94d4bc2c2f1e8bb7b7a0ed"},"schema_version":"1.0"},"canonical_sha256":"fcb118eea12632daab23314589017a6c392b7d7f16449f380c46cf017b779946","source":{"kind":"arxiv","id":"2605.18547","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2605.18547","created_at":"2026-05-20T00:06:07Z"},{"alias_kind":"arxiv_version","alias_value":"2605.18547v1","created_at":"2026-05-20T00:06:07Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.18547","created_at":"2026-05-20T00:06:07Z"},{"alias_kind":"pith_short_12","alias_value":"7SYRR3VBEYZN","created_at":"2026-05-20T00:06:07Z"},{"alias_kind":"pith_short_16","alias_value":"7SYRR3VBEYZNVKZD","created_at":"2026-05-20T00:06:07Z"},{"alias_kind":"pith_short_8","alias_value":"7SYRR3VB","created_at":"2026-05-20T00:06:07Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2026:7SYRR3VBEYZNVKZDGFCYSAL2NQ","target":"record","payload":{"canonical_record":{"source":{"id":"2605.18547","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.AI","submitted_at":"2026-05-18T15:27:10Z","cross_cats_sorted":[],"title_canon_sha256":"8f4241e5787ca1ab09335f58911b0ed983eb33f507a74410f70db2d747af1ab6","abstract_canon_sha256":"7c96df8125ff15969bd55dfc5ad2ae2a6d6c4e20db94d4bc2c2f1e8bb7b7a0ed"},"schema_version":"1.0"},"canonical_sha256":"fcb118eea12632daab23314589017a6c392b7d7f16449f380c46cf017b779946","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-20T00:06:07.075864Z","signature_b64":"8IA/HYMx1rK2vNjW1flyxuwNm/s3RLvcjfPzRQah24jf9Q7DuKioejx193WhqoOILvca+qoP2zFhz0ZAeztTAQ==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"fcb118eea12632daab23314589017a6c392b7d7f16449f380c46cf017b779946","last_reissued_at":"2026-05-20T00:06:07.075013Z","signature_status":"signed_v1","first_computed_at":"2026-05-20T00:06:07.075013Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2605.18547","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-20T00:06:07Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"ncLzW+WiAWDl1zzeHH1IX9bDDAKY+6QNLkqeqMjRlca4kKy9OdMLIAhVAeDuiw2UvYiRQw+aovBvgvoO1CXDDA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-22T00:47:53.602835Z"},"content_sha256":"02cf59c2210c96b69c1cca751f015966e0e6aaa92dc0bcb90e7be9b1eb7229d9","schema_version":"1.0","event_id":"sha256:02cf59c2210c96b69c1cca751f015966e0e6aaa92dc0bcb90e7be9b1eb7229d9"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2026:7SYRR3VBEYZNVKZDGFCYSAL2NQ","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"VISAFF: Speaker-Centered Visual Affective Feature Learning for Emotion Recognition in Conversation","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":[],"primary_cat":"cs.AI","authors_text":"Guojiang Shen, Linan ZHU, Xiangfan Chen, Xiangjie Kong, Xiao Han, Yuqian Fu, Zihao Zhai","submitted_at":"2026-05-18T15:27:10Z","abstract_excerpt":"Emotion Recognition in Conversation (ERC) is essential for effective human-machine interaction, aiming to identify speakers' emotional states in multi-turn dialogues. Early text-based methods struggle with complex scenarios like sarcasm because they inherently neglect vital non-verbal information. While recent Vision-Language Models (VLMs) address this by analyzing video directly, they are not inherently tailored for ERC and often focus on emotionally irrelevant background regions or passive listeners rather than the active speaker. Furthermore, fine-tuning these large models incurs prohibitiv"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2605.18547","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2605.18547/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-20T00:06:07Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"mgT5v/PeN45rLnDmeMqs2KLl6tJMsdn4gcMEOK3hplFXcd4mM/8gK8Wzr4RPi+e0KiQ0OrNbnGAs6zsgE11NCA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-22T00:47:53.603628Z"},"content_sha256":"2b1b3c549c96d03a33bf9c9ff54f7ed5f1c0287a85d1fb02531ac0094f47ef43","schema_version":"1.0","event_id":"sha256:2b1b3c549c96d03a33bf9c9ff54f7ed5f1c0287a85d1fb02531ac0094f47ef43"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/7SYRR3VBEYZNVKZDGFCYSAL2NQ/bundle.json","state_url":"https://pith.science/pith/7SYRR3VBEYZNVKZDGFCYSAL2NQ/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/7SYRR3VBEYZNVKZDGFCYSAL2NQ/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-22T00:47:53Z","links":{"resolver":"https://pith.science/pith/7SYRR3VBEYZNVKZDGFCYSAL2NQ","bundle":"https://pith.science/pith/7SYRR3VBEYZNVKZDGFCYSAL2NQ/bundle.json","state":"https://pith.science/pith/7SYRR3VBEYZNVKZDGFCYSAL2NQ/state.json","well_known_bundle":"https://pith.science/.well-known/pith/7SYRR3VBEYZNVKZDGFCYSAL2NQ/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:7SYRR3VBEYZNVKZDGFCYSAL2NQ","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"7c96df8125ff15969bd55dfc5ad2ae2a6d6c4e20db94d4bc2c2f1e8bb7b7a0ed","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.AI","submitted_at":"2026-05-18T15:27:10Z","title_canon_sha256":"8f4241e5787ca1ab09335f58911b0ed983eb33f507a74410f70db2d747af1ab6"},"schema_version":"1.0","source":{"id":"2605.18547","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2605.18547","created_at":"2026-05-20T00:06:07Z"},{"alias_kind":"arxiv_version","alias_value":"2605.18547v1","created_at":"2026-05-20T00:06:07Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.18547","created_at":"2026-05-20T00:06:07Z"},{"alias_kind":"pith_short_12","alias_value":"7SYRR3VBEYZN","created_at":"2026-05-20T00:06:07Z"},{"alias_kind":"pith_short_16","alias_value":"7SYRR3VBEYZNVKZD","created_at":"2026-05-20T00:06:07Z"},{"alias_kind":"pith_short_8","alias_value":"7SYRR3VB","created_at":"2026-05-20T00:06:07Z"}],"graph_snapshots":[{"event_id":"sha256:2b1b3c549c96d03a33bf9c9ff54f7ed5f1c0287a85d1fb02531ac0094f47ef43","target":"graph","created_at":"2026-05-20T00:06:07Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2605.18547/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Emotion Recognition in Conversation (ERC) is essential for effective human-machine interaction, aiming to identify speakers' emotional states in multi-turn dialogues. Early text-based methods struggle with complex scenarios like sarcasm because they inherently neglect vital non-verbal information. While recent Vision-Language Models (VLMs) address this by analyzing video directly, they are not inherently tailored for ERC and often focus on emotionally irrelevant background regions or passive listeners rather than the active speaker. Furthermore, fine-tuning these large models incurs prohibitiv","authors_text":"Guojiang Shen, Linan ZHU, Xiangfan Chen, Xiangjie Kong, Xiao Han, Yuqian Fu, Zihao Zhai","cross_cats":[],"headline":"","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.AI","submitted_at":"2026-05-18T15:27:10Z","title":"VISAFF: Speaker-Centered Visual Affective Feature Learning for Emotion Recognition in Conversation"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2605.18547","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:02cf59c2210c96b69c1cca751f015966e0e6aaa92dc0bcb90e7be9b1eb7229d9","target":"record","created_at":"2026-05-20T00:06:07Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"7c96df8125ff15969bd55dfc5ad2ae2a6d6c4e20db94d4bc2c2f1e8bb7b7a0ed","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.AI","submitted_at":"2026-05-18T15:27:10Z","title_canon_sha256":"8f4241e5787ca1ab09335f58911b0ed983eb33f507a74410f70db2d747af1ab6"},"schema_version":"1.0","source":{"id":"2605.18547","kind":"arxiv","version":1}},"canonical_sha256":"fcb118eea12632daab23314589017a6c392b7d7f16449f380c46cf017b779946","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"fcb118eea12632daab23314589017a6c392b7d7f16449f380c46cf017b779946","first_computed_at":"2026-05-20T00:06:07.075013Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-20T00:06:07.075013Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"8IA/HYMx1rK2vNjW1flyxuwNm/s3RLvcjfPzRQah24jf9Q7DuKioejx193WhqoOILvca+qoP2zFhz0ZAeztTAQ==","signature_status":"signed_v1","signed_at":"2026-05-20T00:06:07.075864Z","signed_message":"canonical_sha256_bytes"},"source_id":"2605.18547","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:02cf59c2210c96b69c1cca751f015966e0e6aaa92dc0bcb90e7be9b1eb7229d9","sha256:2b1b3c549c96d03a33bf9c9ff54f7ed5f1c0287a85d1fb02531ac0094f47ef43"],"state_sha256":"7d260c82e4108926f8b6c2c219de7daeb9009bc528e5842816028d17cb415078"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"0en2uuMbPYQ6bytIqLWOGodHuGSOsXvbwI/4iz7b0edULAjha6NyOibItGlf5nh3iTp+PuGPRGEaaME1Jy3ZAA==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-22T00:47:53.607494Z","bundle_sha256":"3f07aa3a8797544a745bba2d9f0d3eb41cd41b23c96daf0960165472d54d6890"}}