{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2017:ZE3T6DGMFUBLPIL4SDXPN4RCAZ","short_pith_number":"pith:ZE3T6DGM","canonical_record":{"source":{"id":"1704.08292","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2017-04-26T18:46:10Z","cross_cats_sorted":["cs.MM","cs.SD"],"title_canon_sha256":"9d926c92200795a3e8fd004b6b9d94ee047543eb1a0020e913ee22544bb5c195","abstract_canon_sha256":"e9e218f14cd5f4a7e6d98eb327d0b36ded7f3e1dd39b8bc61a604348e3074591"},"schema_version":"1.0"},"canonical_sha256":"c9373f0ccc2d02b7a17c90eef6f2220661e467e95ae4eecae3708e732b18502a","source":{"kind":"arxiv","id":"1704.08292","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1704.08292","created_at":"2026-05-18T00:45:28Z"},{"alias_kind":"arxiv_version","alias_value":"1704.08292v1","created_at":"2026-05-18T00:45:28Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1704.08292","created_at":"2026-05-18T00:45:28Z"},{"alias_kind":"pith_short_12","alias_value":"ZE3T6DGMFUBL","created_at":"2026-05-18T12:31:59Z"},{"alias_kind":"pith_short_16","alias_value":"ZE3T6DGMFUBLPIL4","created_at":"2026-05-18T12:31:59Z"},{"alias_kind":"pith_short_8","alias_value":"ZE3T6DGM","created_at":"2026-05-18T12:31:59Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2017:ZE3T6DGMFUBLPIL4SDXPN4RCAZ","target":"record","payload":{"canonical_record":{"source":{"id":"1704.08292","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2017-04-26T18:46:10Z","cross_cats_sorted":["cs.MM","cs.SD"],"title_canon_sha256":"9d926c92200795a3e8fd004b6b9d94ee047543eb1a0020e913ee22544bb5c195","abstract_canon_sha256":"e9e218f14cd5f4a7e6d98eb327d0b36ded7f3e1dd39b8bc61a604348e3074591"},"schema_version":"1.0"},"canonical_sha256":"c9373f0ccc2d02b7a17c90eef6f2220661e467e95ae4eecae3708e732b18502a","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:45:28.066354Z","signature_b64":"EVfwzr9nsjCYrNQVGl3DiIlk25SCTBBcsM7qGh7Fg0E2QMI1quYnnVfGuNSWixS4xe4XqDK2USY2HSR79FYgBQ==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"c9373f0ccc2d02b7a17c90eef6f2220661e467e95ae4eecae3708e732b18502a","last_reissued_at":"2026-05-18T00:45:28.065929Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:45:28.065929Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1704.08292","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:45:28Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"AZNtAVkNpfpHNwEiwqEAQcCS+X+Lxog5hD8F+7A5vNWvHdMKrYbllI3cN7Syo6pZMr5OepTXAkmhZts6SK1/AA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-24T03:31:49.677696Z"},"content_sha256":"96875996fd0153d71b1191c1681a908b803c6f137a46c14af0fa736901c4b935","schema_version":"1.0","event_id":"sha256:96875996fd0153d71b1191c1681a908b803c6f137a46c14af0fa736901c4b935"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2017:ZE3T6DGMFUBLPIL4SDXPN4RCAZ","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Deep Cross-Modal Audio-Visual Generation","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.MM","cs.SD"],"primary_cat":"cs.CV","authors_text":"Chenliang Xu, Lele Chen, Sudhanshu Srivastava, Zhiyao Duan","submitted_at":"2017-04-26T18:46:10Z","abstract_excerpt":"Cross-modal audio-visual perception has been a long-lasting topic in psychology and neurology, and various studies have discovered strong correlations in human perception of auditory and visual stimuli. Despite works in computational multimodal modeling, the problem of cross-modal audio-visual generation has not been systematically studied in the literature. In this paper, we make the first attempt to solve this cross-modal generation problem leveraging the power of deep generative adversarial training. Specifically, we use conditional generative adversarial networks to achieve cross-modal aud"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1704.08292","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:45:28Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"STs/gCISr6/M0DlB3XHQXxhGH4esuCP91SmAp0gbgahGwJ4QmdgXXSXjBHDcekteEPojbDVXEB78IKHrxp2UCQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-24T03:31:49.678366Z"},"content_sha256":"a7cfb13b856378cd2cf55f6f6c891fe7bb9f24d3c828664c428788276edc5e58","schema_version":"1.0","event_id":"sha256:a7cfb13b856378cd2cf55f6f6c891fe7bb9f24d3c828664c428788276edc5e58"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/ZE3T6DGMFUBLPIL4SDXPN4RCAZ/bundle.json","state_url":"https://pith.science/pith/ZE3T6DGMFUBLPIL4SDXPN4RCAZ/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/ZE3T6DGMFUBLPIL4SDXPN4RCAZ/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-24T03:31:49Z","links":{"resolver":"https://pith.science/pith/ZE3T6DGMFUBLPIL4SDXPN4RCAZ","bundle":"https://pith.science/pith/ZE3T6DGMFUBLPIL4SDXPN4RCAZ/bundle.json","state":"https://pith.science/pith/ZE3T6DGMFUBLPIL4SDXPN4RCAZ/state.json","well_known_bundle":"https://pith.science/.well-known/pith/ZE3T6DGMFUBLPIL4SDXPN4RCAZ/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2017:ZE3T6DGMFUBLPIL4SDXPN4RCAZ","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"e9e218f14cd5f4a7e6d98eb327d0b36ded7f3e1dd39b8bc61a604348e3074591","cross_cats_sorted":["cs.MM","cs.SD"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2017-04-26T18:46:10Z","title_canon_sha256":"9d926c92200795a3e8fd004b6b9d94ee047543eb1a0020e913ee22544bb5c195"},"schema_version":"1.0","source":{"id":"1704.08292","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1704.08292","created_at":"2026-05-18T00:45:28Z"},{"alias_kind":"arxiv_version","alias_value":"1704.08292v1","created_at":"2026-05-18T00:45:28Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1704.08292","created_at":"2026-05-18T00:45:28Z"},{"alias_kind":"pith_short_12","alias_value":"ZE3T6DGMFUBL","created_at":"2026-05-18T12:31:59Z"},{"alias_kind":"pith_short_16","alias_value":"ZE3T6DGMFUBLPIL4","created_at":"2026-05-18T12:31:59Z"},{"alias_kind":"pith_short_8","alias_value":"ZE3T6DGM","created_at":"2026-05-18T12:31:59Z"}],"graph_snapshots":[{"event_id":"sha256:a7cfb13b856378cd2cf55f6f6c891fe7bb9f24d3c828664c428788276edc5e58","target":"graph","created_at":"2026-05-18T00:45:28Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Cross-modal audio-visual perception has been a long-lasting topic in psychology and neurology, and various studies have discovered strong correlations in human perception of auditory and visual stimuli. Despite works in computational multimodal modeling, the problem of cross-modal audio-visual generation has not been systematically studied in the literature. In this paper, we make the first attempt to solve this cross-modal generation problem leveraging the power of deep generative adversarial training. Specifically, we use conditional generative adversarial networks to achieve cross-modal aud","authors_text":"Chenliang Xu, Lele Chen, Sudhanshu Srivastava, Zhiyao Duan","cross_cats":["cs.MM","cs.SD"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2017-04-26T18:46:10Z","title":"Deep Cross-Modal Audio-Visual Generation"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1704.08292","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:96875996fd0153d71b1191c1681a908b803c6f137a46c14af0fa736901c4b935","target":"record","created_at":"2026-05-18T00:45:28Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"e9e218f14cd5f4a7e6d98eb327d0b36ded7f3e1dd39b8bc61a604348e3074591","cross_cats_sorted":["cs.MM","cs.SD"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2017-04-26T18:46:10Z","title_canon_sha256":"9d926c92200795a3e8fd004b6b9d94ee047543eb1a0020e913ee22544bb5c195"},"schema_version":"1.0","source":{"id":"1704.08292","kind":"arxiv","version":1}},"canonical_sha256":"c9373f0ccc2d02b7a17c90eef6f2220661e467e95ae4eecae3708e732b18502a","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"c9373f0ccc2d02b7a17c90eef6f2220661e467e95ae4eecae3708e732b18502a","first_computed_at":"2026-05-18T00:45:28.065929Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:45:28.065929Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"EVfwzr9nsjCYrNQVGl3DiIlk25SCTBBcsM7qGh7Fg0E2QMI1quYnnVfGuNSWixS4xe4XqDK2USY2HSR79FYgBQ==","signature_status":"signed_v1","signed_at":"2026-05-18T00:45:28.066354Z","signed_message":"canonical_sha256_bytes"},"source_id":"1704.08292","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:96875996fd0153d71b1191c1681a908b803c6f137a46c14af0fa736901c4b935","sha256:a7cfb13b856378cd2cf55f6f6c891fe7bb9f24d3c828664c428788276edc5e58"],"state_sha256":"2e15f4dc78d87bcb090b0b06128bb7c68ac0a9a7330a0e88efcc727ffec50919"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"BbnKvoD5NMiy23Z1fTmFR4UzR3cRTqtjV/p0z6KOtQDpsjTndMibTldiQREuI6sAU8mJKnRs1JPsULnoax9iBw==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-24T03:31:49.681998Z","bundle_sha256":"b8b5cd21248eef9c980a90a8b42dd921b4aa4eeee66e9cf1e14bdac890da77fb"}}