{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2018:UVJIO3A5UKGLHFR5ISVPLS6ZFG","short_pith_number":"pith:UVJIO3A5","canonical_record":{"source":{"id":"1804.02135","kind":"arxiv","version":3},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2018-04-06T05:27:14Z","cross_cats_sorted":["cs.SD","eess.AS"],"title_canon_sha256":"27ec8f5015005ee22fcfabe7d50f94468fe2c7aa1ad10a82ed7d2f30a7933cc6","abstract_canon_sha256":"d0e44c96beff0f6e5e05db306953156028bc827643da852863338e9a15634448"},"schema_version":"1.0"},"canonical_sha256":"a552876c1da28cb3963d44aaf5cbd92991ed6155fc2bf114437fb65ca2248881","source":{"kind":"arxiv","id":"1804.02135","version":3},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1804.02135","created_at":"2026-05-17T23:54:25Z"},{"alias_kind":"arxiv_version","alias_value":"1804.02135v3","created_at":"2026-05-17T23:54:25Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1804.02135","created_at":"2026-05-17T23:54:25Z"},{"alias_kind":"pith_short_12","alias_value":"UVJIO3A5UKGL","created_at":"2026-05-18T12:32:56Z"},{"alias_kind":"pith_short_16","alias_value":"UVJIO3A5UKGLHFR5","created_at":"2026-05-18T12:32:56Z"},{"alias_kind":"pith_short_8","alias_value":"UVJIO3A5","created_at":"2026-05-18T12:32:56Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2018:UVJIO3A5UKGLHFR5ISVPLS6ZFG","target":"record","payload":{"canonical_record":{"source":{"id":"1804.02135","kind":"arxiv","version":3},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2018-04-06T05:27:14Z","cross_cats_sorted":["cs.SD","eess.AS"],"title_canon_sha256":"27ec8f5015005ee22fcfabe7d50f94468fe2c7aa1ad10a82ed7d2f30a7933cc6","abstract_canon_sha256":"d0e44c96beff0f6e5e05db306953156028bc827643da852863338e9a15634448"},"schema_version":"1.0"},"canonical_sha256":"a552876c1da28cb3963d44aaf5cbd92991ed6155fc2bf114437fb65ca2248881","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-17T23:54:25.176631Z","signature_b64":"duZvI2lf/KMz+G0eu8yxE2eC58XdEj3w//7I8Up9N85siL1bCGYkmcTRYkjvEqxprzP4oU5RX63ADierQilEBA==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"a552876c1da28cb3963d44aaf5cbd92991ed6155fc2bf114437fb65ca2248881","last_reissued_at":"2026-05-17T23:54:25.175985Z","signature_status":"signed_v1","first_computed_at":"2026-05-17T23:54:25.175985Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1804.02135","source_version":3,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-17T23:54:25Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"E0zxXTI2UdxaN14UuqFifghIDQPlx09NOUeAjCU/jQLP+HQLRE2ypOEnMFcJnV4ACgrvJTjkPupQ1kTdY9AMCA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-25T18:44:34.858672Z"},"content_sha256":"478a938a41d5de9da217fb093296d04f6ff666a955da0dcfe6a04e7c5300b5e6","schema_version":"1.0","event_id":"sha256:478a938a41d5de9da217fb093296d04f6ff666a955da0dcfe6a04e7c5300b5e6"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2018:UVJIO3A5UKGLHFR5ISVPLS6ZFG","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Expressive Speech Synthesis via Modeling Expressions with Variational Autoencoder","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.SD","eess.AS"],"primary_cat":"cs.CL","authors_text":"Kei Akuzawa, Yusuke Iwasawa, Yutaka Matsuo","submitted_at":"2018-04-06T05:27:14Z","abstract_excerpt":"Recent advances in neural autoregressive models have improve the performance of speech synthesis (SS). However, as they lack the ability to model global characteristics of speech (such as speaker individualities or speaking styles), particularly when these characteristics have not been labeled, making neural autoregressive SS systems more expressive is still an open issue. In this paper, we propose to combine VoiceLoop, an autoregressive SS model, with Variational Autoencoder (VAE). This approach, unlike traditional autoregressive SS systems, uses VAE to model the global characteristics explic"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1804.02135","kind":"arxiv","version":3},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-17T23:54:25Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"/GneYYaJjhKj6OAcRZMiIw53YxBa/hFsf+LDmvAogl/3SlKa6Go/C9eu5nHSjkYKxVzSYFCUd05UAiKPigjfAg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-25T18:44:34.859455Z"},"content_sha256":"690b3b7442fcb7fa827a37ae129f3d0675f0fd735ebe5dd9a91006f9005edb35","schema_version":"1.0","event_id":"sha256:690b3b7442fcb7fa827a37ae129f3d0675f0fd735ebe5dd9a91006f9005edb35"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/UVJIO3A5UKGLHFR5ISVPLS6ZFG/bundle.json","state_url":"https://pith.science/pith/UVJIO3A5UKGLHFR5ISVPLS6ZFG/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/UVJIO3A5UKGLHFR5ISVPLS6ZFG/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-25T18:44:34Z","links":{"resolver":"https://pith.science/pith/UVJIO3A5UKGLHFR5ISVPLS6ZFG","bundle":"https://pith.science/pith/UVJIO3A5UKGLHFR5ISVPLS6ZFG/bundle.json","state":"https://pith.science/pith/UVJIO3A5UKGLHFR5ISVPLS6ZFG/state.json","well_known_bundle":"https://pith.science/.well-known/pith/UVJIO3A5UKGLHFR5ISVPLS6ZFG/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2018:UVJIO3A5UKGLHFR5ISVPLS6ZFG","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"d0e44c96beff0f6e5e05db306953156028bc827643da852863338e9a15634448","cross_cats_sorted":["cs.SD","eess.AS"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2018-04-06T05:27:14Z","title_canon_sha256":"27ec8f5015005ee22fcfabe7d50f94468fe2c7aa1ad10a82ed7d2f30a7933cc6"},"schema_version":"1.0","source":{"id":"1804.02135","kind":"arxiv","version":3}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1804.02135","created_at":"2026-05-17T23:54:25Z"},{"alias_kind":"arxiv_version","alias_value":"1804.02135v3","created_at":"2026-05-17T23:54:25Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1804.02135","created_at":"2026-05-17T23:54:25Z"},{"alias_kind":"pith_short_12","alias_value":"UVJIO3A5UKGL","created_at":"2026-05-18T12:32:56Z"},{"alias_kind":"pith_short_16","alias_value":"UVJIO3A5UKGLHFR5","created_at":"2026-05-18T12:32:56Z"},{"alias_kind":"pith_short_8","alias_value":"UVJIO3A5","created_at":"2026-05-18T12:32:56Z"}],"graph_snapshots":[{"event_id":"sha256:690b3b7442fcb7fa827a37ae129f3d0675f0fd735ebe5dd9a91006f9005edb35","target":"graph","created_at":"2026-05-17T23:54:25Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Recent advances in neural autoregressive models have improve the performance of speech synthesis (SS). However, as they lack the ability to model global characteristics of speech (such as speaker individualities or speaking styles), particularly when these characteristics have not been labeled, making neural autoregressive SS systems more expressive is still an open issue. In this paper, we propose to combine VoiceLoop, an autoregressive SS model, with Variational Autoencoder (VAE). This approach, unlike traditional autoregressive SS systems, uses VAE to model the global characteristics explic","authors_text":"Kei Akuzawa, Yusuke Iwasawa, Yutaka Matsuo","cross_cats":["cs.SD","eess.AS"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2018-04-06T05:27:14Z","title":"Expressive Speech Synthesis via Modeling Expressions with Variational Autoencoder"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1804.02135","kind":"arxiv","version":3},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:478a938a41d5de9da217fb093296d04f6ff666a955da0dcfe6a04e7c5300b5e6","target":"record","created_at":"2026-05-17T23:54:25Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"d0e44c96beff0f6e5e05db306953156028bc827643da852863338e9a15634448","cross_cats_sorted":["cs.SD","eess.AS"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2018-04-06T05:27:14Z","title_canon_sha256":"27ec8f5015005ee22fcfabe7d50f94468fe2c7aa1ad10a82ed7d2f30a7933cc6"},"schema_version":"1.0","source":{"id":"1804.02135","kind":"arxiv","version":3}},"canonical_sha256":"a552876c1da28cb3963d44aaf5cbd92991ed6155fc2bf114437fb65ca2248881","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"a552876c1da28cb3963d44aaf5cbd92991ed6155fc2bf114437fb65ca2248881","first_computed_at":"2026-05-17T23:54:25.175985Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-17T23:54:25.175985Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"duZvI2lf/KMz+G0eu8yxE2eC58XdEj3w//7I8Up9N85siL1bCGYkmcTRYkjvEqxprzP4oU5RX63ADierQilEBA==","signature_status":"signed_v1","signed_at":"2026-05-17T23:54:25.176631Z","signed_message":"canonical_sha256_bytes"},"source_id":"1804.02135","source_kind":"arxiv","source_version":3}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:478a938a41d5de9da217fb093296d04f6ff666a955da0dcfe6a04e7c5300b5e6","sha256:690b3b7442fcb7fa827a37ae129f3d0675f0fd735ebe5dd9a91006f9005edb35"],"state_sha256":"bc6502e0923252d8af8622b52008451815bfbe37b0f2ef584761acc2ed1d993e"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"2bRBaSqYXa6IiRHYe+DxH655yJyPVrJKerfcVtisMeT4ndpA9xLkl0f7SENx3YO3TsXIAGB9IjJDxxi2USJtDg==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-25T18:44:34.863043Z","bundle_sha256":"aaa1bdf9325bef3ada8f1cb855fae17a1b7b85f62a8f6ad40b3db1726383746d"}}