{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2017:LPCKGKBR3CAO4OVZ2Q7HVJSTRB","short_pith_number":"pith:LPCKGKBR","canonical_record":{"source":{"id":"1712.01393","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2017-12-04T22:24:29Z","cross_cats_sorted":[],"title_canon_sha256":"ca3b8384c40c64bc2f24ba92d6c9f034bc9e3550f653a86c37125b7ef210418b","abstract_canon_sha256":"a7796e8df0f3b865494a3fb90b35c99ac7ba9a17ae0729f942b57af2cadd0a61"},"schema_version":"1.0"},"canonical_sha256":"5bc4a32831d880ee3ab9d43e7aa6538845bbdc7359e1671f66f899bcb35952a1","source":{"kind":"arxiv","id":"1712.01393","version":2},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1712.01393","created_at":"2026-05-18T00:14:28Z"},{"alias_kind":"arxiv_version","alias_value":"1712.01393v2","created_at":"2026-05-18T00:14:28Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1712.01393","created_at":"2026-05-18T00:14:28Z"},{"alias_kind":"pith_short_12","alias_value":"LPCKGKBR3CAO","created_at":"2026-05-18T12:31:28Z"},{"alias_kind":"pith_short_16","alias_value":"LPCKGKBR3CAO4OVZ","created_at":"2026-05-18T12:31:28Z"},{"alias_kind":"pith_short_8","alias_value":"LPCKGKBR","created_at":"2026-05-18T12:31:28Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2017:LPCKGKBR3CAO4OVZ2Q7HVJSTRB","target":"record","payload":{"canonical_record":{"source":{"id":"1712.01393","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2017-12-04T22:24:29Z","cross_cats_sorted":[],"title_canon_sha256":"ca3b8384c40c64bc2f24ba92d6c9f034bc9e3550f653a86c37125b7ef210418b","abstract_canon_sha256":"a7796e8df0f3b865494a3fb90b35c99ac7ba9a17ae0729f942b57af2cadd0a61"},"schema_version":"1.0"},"canonical_sha256":"5bc4a32831d880ee3ab9d43e7aa6538845bbdc7359e1671f66f899bcb35952a1","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:14:28.541756Z","signature_b64":"4bE0SKR4asNXjVnpRPeWtBDm1CL0fJ4Bk1CyPb6PSkybfUpi2ZUi7FUpz52iajIUq++6dByXUzeFGxYx3X9EBQ==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"5bc4a32831d880ee3ab9d43e7aa6538845bbdc7359e1671f66f899bcb35952a1","last_reissued_at":"2026-05-18T00:14:28.541079Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:14:28.541079Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1712.01393","source_version":2,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:14:28Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"+lRbc2hPjG2t+jWEFcQbBwJUIEXr6oR5R8wUWuwvhT85z5kBZg+n2kVHhhSebs32DJJ3di6zDfLIP/JcGIcGDQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-29T23:46:33.075832Z"},"content_sha256":"fcb4a01e1e0ebf72b3fff0a685826bccabaaa252ea98fb91f86e8cf43a28764d","schema_version":"1.0","event_id":"sha256:fcb4a01e1e0ebf72b3fff0a685826bccabaaa252ea98fb91f86e8cf43a28764d"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2017:LPCKGKBR3CAO4OVZ2Q7HVJSTRB","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Visual to Sound: Generating Natural Sound for Videos in the Wild","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.CV","authors_text":"Chen Fang, Tamara L. Berg, Trung Bui, Yipin Zhou, Zhaowen Wang","submitted_at":"2017-12-04T22:24:29Z","abstract_excerpt":"As two of the five traditional human senses (sight, hearing, taste, smell, and touch), vision and sound are basic sources through which humans understand the world. Often correlated during natural events, these two modalities combine to jointly affect human perception. In this paper, we pose the task of generating sound given visual input. Such capabilities could help enable applications in virtual reality (generating sound for virtual scenes automatically) or provide additional accessibility to images or videos for people with visual impairments. As a first step in this direction, we apply le"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1712.01393","kind":"arxiv","version":2},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:14:28Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"JYL2XWzOVU8qary+a+Stul8i/al9m5s7oKhOXPut0g8F2BCLWjESzTbCdYzXuG+5P8tPwlVKEPVYAfhwWGlbDQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-29T23:46:33.076483Z"},"content_sha256":"e8f39e1976f881beaa9619958ef4abff5669cf471a43d9080ec7810d6212a4b5","schema_version":"1.0","event_id":"sha256:e8f39e1976f881beaa9619958ef4abff5669cf471a43d9080ec7810d6212a4b5"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/LPCKGKBR3CAO4OVZ2Q7HVJSTRB/bundle.json","state_url":"https://pith.science/pith/LPCKGKBR3CAO4OVZ2Q7HVJSTRB/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/LPCKGKBR3CAO4OVZ2Q7HVJSTRB/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-29T23:46:33Z","links":{"resolver":"https://pith.science/pith/LPCKGKBR3CAO4OVZ2Q7HVJSTRB","bundle":"https://pith.science/pith/LPCKGKBR3CAO4OVZ2Q7HVJSTRB/bundle.json","state":"https://pith.science/pith/LPCKGKBR3CAO4OVZ2Q7HVJSTRB/state.json","well_known_bundle":"https://pith.science/.well-known/pith/LPCKGKBR3CAO4OVZ2Q7HVJSTRB/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2017:LPCKGKBR3CAO4OVZ2Q7HVJSTRB","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"a7796e8df0f3b865494a3fb90b35c99ac7ba9a17ae0729f942b57af2cadd0a61","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2017-12-04T22:24:29Z","title_canon_sha256":"ca3b8384c40c64bc2f24ba92d6c9f034bc9e3550f653a86c37125b7ef210418b"},"schema_version":"1.0","source":{"id":"1712.01393","kind":"arxiv","version":2}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1712.01393","created_at":"2026-05-18T00:14:28Z"},{"alias_kind":"arxiv_version","alias_value":"1712.01393v2","created_at":"2026-05-18T00:14:28Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1712.01393","created_at":"2026-05-18T00:14:28Z"},{"alias_kind":"pith_short_12","alias_value":"LPCKGKBR3CAO","created_at":"2026-05-18T12:31:28Z"},{"alias_kind":"pith_short_16","alias_value":"LPCKGKBR3CAO4OVZ","created_at":"2026-05-18T12:31:28Z"},{"alias_kind":"pith_short_8","alias_value":"LPCKGKBR","created_at":"2026-05-18T12:31:28Z"}],"graph_snapshots":[{"event_id":"sha256:e8f39e1976f881beaa9619958ef4abff5669cf471a43d9080ec7810d6212a4b5","target":"graph","created_at":"2026-05-18T00:14:28Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"As two of the five traditional human senses (sight, hearing, taste, smell, and touch), vision and sound are basic sources through which humans understand the world. Often correlated during natural events, these two modalities combine to jointly affect human perception. In this paper, we pose the task of generating sound given visual input. Such capabilities could help enable applications in virtual reality (generating sound for virtual scenes automatically) or provide additional accessibility to images or videos for people with visual impairments. As a first step in this direction, we apply le","authors_text":"Chen Fang, Tamara L. Berg, Trung Bui, Yipin Zhou, Zhaowen Wang","cross_cats":[],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2017-12-04T22:24:29Z","title":"Visual to Sound: Generating Natural Sound for Videos in the Wild"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1712.01393","kind":"arxiv","version":2},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:fcb4a01e1e0ebf72b3fff0a685826bccabaaa252ea98fb91f86e8cf43a28764d","target":"record","created_at":"2026-05-18T00:14:28Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"a7796e8df0f3b865494a3fb90b35c99ac7ba9a17ae0729f942b57af2cadd0a61","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2017-12-04T22:24:29Z","title_canon_sha256":"ca3b8384c40c64bc2f24ba92d6c9f034bc9e3550f653a86c37125b7ef210418b"},"schema_version":"1.0","source":{"id":"1712.01393","kind":"arxiv","version":2}},"canonical_sha256":"5bc4a32831d880ee3ab9d43e7aa6538845bbdc7359e1671f66f899bcb35952a1","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"5bc4a32831d880ee3ab9d43e7aa6538845bbdc7359e1671f66f899bcb35952a1","first_computed_at":"2026-05-18T00:14:28.541079Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:14:28.541079Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"4bE0SKR4asNXjVnpRPeWtBDm1CL0fJ4Bk1CyPb6PSkybfUpi2ZUi7FUpz52iajIUq++6dByXUzeFGxYx3X9EBQ==","signature_status":"signed_v1","signed_at":"2026-05-18T00:14:28.541756Z","signed_message":"canonical_sha256_bytes"},"source_id":"1712.01393","source_kind":"arxiv","source_version":2}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:fcb4a01e1e0ebf72b3fff0a685826bccabaaa252ea98fb91f86e8cf43a28764d","sha256:e8f39e1976f881beaa9619958ef4abff5669cf471a43d9080ec7810d6212a4b5"],"state_sha256":"319694ee47e167d26cc6455fb28e20d5fe0d4755ffaba062f523633e6274bf6b"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"ZaSk9iIhTSHPvVM5yX32tAqo9IMwbADJtlQd0n9qsigl739H3q88JfTnoLyYlaDR0wMUH0QVi+nY9d03oxg3BA==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-29T23:46:33.080287Z","bundle_sha256":"ef29af9299a9f591cc6cd3eab3efa7a994b38fc83cf80f867fd8e6376ae6dcce"}}