{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2018:XCIFDYZHTRPDRRFRAFV5F4YNLA","short_pith_number":"pith:XCIFDYZH","canonical_record":{"source":{"id":"1804.00920","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"eess.AS","submitted_at":"2018-04-03T11:43:36Z","cross_cats_sorted":["cs.CL","cs.SD","stat.ML"],"title_canon_sha256":"2b80e913b87ab4407ccf04d7f619e722773682769465e2de10e7f5f083606ebc","abstract_canon_sha256":"27457ca7f9c2280659daa7142cde45ec4bf8ddab794c5487812f1c7cb3a60ca8"},"schema_version":"1.0"},"canonical_sha256":"b89051e3279c5e38c4b1016bd2f30d58015feff62df2961566567199b56bbd07","source":{"kind":"arxiv","id":"1804.00920","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1804.00920","created_at":"2026-05-18T00:19:31Z"},{"alias_kind":"arxiv_version","alias_value":"1804.00920v1","created_at":"2026-05-18T00:19:31Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1804.00920","created_at":"2026-05-18T00:19:31Z"},{"alias_kind":"pith_short_12","alias_value":"XCIFDYZHTRPD","created_at":"2026-05-18T12:33:01Z"},{"alias_kind":"pith_short_16","alias_value":"XCIFDYZHTRPDRRFR","created_at":"2026-05-18T12:33:01Z"},{"alias_kind":"pith_short_8","alias_value":"XCIFDYZH","created_at":"2026-05-18T12:33:01Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2018:XCIFDYZHTRPDRRFRAFV5F4YNLA","target":"record","payload":{"canonical_record":{"source":{"id":"1804.00920","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"eess.AS","submitted_at":"2018-04-03T11:43:36Z","cross_cats_sorted":["cs.CL","cs.SD","stat.ML"],"title_canon_sha256":"2b80e913b87ab4407ccf04d7f619e722773682769465e2de10e7f5f083606ebc","abstract_canon_sha256":"27457ca7f9c2280659daa7142cde45ec4bf8ddab794c5487812f1c7cb3a60ca8"},"schema_version":"1.0"},"canonical_sha256":"b89051e3279c5e38c4b1016bd2f30d58015feff62df2961566567199b56bbd07","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:19:31.789266Z","signature_b64":"2h9cW0NsUm15pE3VQLiAtcP+bhgV2wWgohHqjBZoroKGW2k3LoSj17PADDcoVjwWLynetM2mchKO8NjeGIAPBw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"b89051e3279c5e38c4b1016bd2f30d58015feff62df2961566567199b56bbd07","last_reissued_at":"2026-05-18T00:19:31.788807Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:19:31.788807Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1804.00920","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:19:31Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"Qnq+6wmix/1+nCTLzTmjhyO0fK9zL6Ns4x7w1PD5dr3v7kIHth1/XZ3cqryPj5AgmwOw3+jNB1ONpLxZCI9XCQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-30T06:14:43.823028Z"},"content_sha256":"29093e55e03add484f210bcab143b0a0bbf5d05d3428a0bbf86b0ef810df7599","schema_version":"1.0","event_id":"sha256:29093e55e03add484f210bcab143b0a0bbf5d05d3428a0bbf86b0ef810df7599"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2018:XCIFDYZHTRPDRRFRAFV5F4YNLA","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Speech waveform synthesis from MFCC sequences with generative adversarial networks","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.CL","cs.SD","stat.ML"],"primary_cat":"eess.AS","authors_text":"Bajibabu Bollepalli, Hirokazu Kameoka, Junichi Yamagishi, Lauri Juvela, Manu Airaksinen, Paavo Alku, Xin Wang","submitted_at":"2018-04-03T11:43:36Z","abstract_excerpt":"This paper proposes a method for generating speech from filterbank mel frequency cepstral coefficients (MFCC), which are widely used in speech applications, such as ASR, but are generally considered unusable for speech synthesis. First, we predict fundamental frequency and voicing information from MFCCs with an autoregressive recurrent neural net. Second, the spectral envelope information contained in MFCCs is converted to all-pole filters, and a pitch-synchronous excitation model matched to these filters is trained. Finally, we introduce a generative adversarial network -based noise model to "},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1804.00920","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:19:31Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"q7PbMjBcc8OW6+0zzX1ERY2EBiycVr6Nkz07bR12XlZ6CLMSgD1JjBVPzQ9fkoMpgK3nsC3JlP3UoLsyuVjDCQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-30T06:14:43.823390Z"},"content_sha256":"d31fbe1668313c91f0d454564332276891a6e99da209aeeae31752f4bb132539","schema_version":"1.0","event_id":"sha256:d31fbe1668313c91f0d454564332276891a6e99da209aeeae31752f4bb132539"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/XCIFDYZHTRPDRRFRAFV5F4YNLA/bundle.json","state_url":"https://pith.science/pith/XCIFDYZHTRPDRRFRAFV5F4YNLA/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/XCIFDYZHTRPDRRFRAFV5F4YNLA/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-30T06:14:43Z","links":{"resolver":"https://pith.science/pith/XCIFDYZHTRPDRRFRAFV5F4YNLA","bundle":"https://pith.science/pith/XCIFDYZHTRPDRRFRAFV5F4YNLA/bundle.json","state":"https://pith.science/pith/XCIFDYZHTRPDRRFRAFV5F4YNLA/state.json","well_known_bundle":"https://pith.science/.well-known/pith/XCIFDYZHTRPDRRFRAFV5F4YNLA/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2018:XCIFDYZHTRPDRRFRAFV5F4YNLA","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"27457ca7f9c2280659daa7142cde45ec4bf8ddab794c5487812f1c7cb3a60ca8","cross_cats_sorted":["cs.CL","cs.SD","stat.ML"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"eess.AS","submitted_at":"2018-04-03T11:43:36Z","title_canon_sha256":"2b80e913b87ab4407ccf04d7f619e722773682769465e2de10e7f5f083606ebc"},"schema_version":"1.0","source":{"id":"1804.00920","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1804.00920","created_at":"2026-05-18T00:19:31Z"},{"alias_kind":"arxiv_version","alias_value":"1804.00920v1","created_at":"2026-05-18T00:19:31Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1804.00920","created_at":"2026-05-18T00:19:31Z"},{"alias_kind":"pith_short_12","alias_value":"XCIFDYZHTRPD","created_at":"2026-05-18T12:33:01Z"},{"alias_kind":"pith_short_16","alias_value":"XCIFDYZHTRPDRRFR","created_at":"2026-05-18T12:33:01Z"},{"alias_kind":"pith_short_8","alias_value":"XCIFDYZH","created_at":"2026-05-18T12:33:01Z"}],"graph_snapshots":[{"event_id":"sha256:d31fbe1668313c91f0d454564332276891a6e99da209aeeae31752f4bb132539","target":"graph","created_at":"2026-05-18T00:19:31Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"This paper proposes a method for generating speech from filterbank mel frequency cepstral coefficients (MFCC), which are widely used in speech applications, such as ASR, but are generally considered unusable for speech synthesis. First, we predict fundamental frequency and voicing information from MFCCs with an autoregressive recurrent neural net. Second, the spectral envelope information contained in MFCCs is converted to all-pole filters, and a pitch-synchronous excitation model matched to these filters is trained. Finally, we introduce a generative adversarial network -based noise model to ","authors_text":"Bajibabu Bollepalli, Hirokazu Kameoka, Junichi Yamagishi, Lauri Juvela, Manu Airaksinen, Paavo Alku, Xin Wang","cross_cats":["cs.CL","cs.SD","stat.ML"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"eess.AS","submitted_at":"2018-04-03T11:43:36Z","title":"Speech waveform synthesis from MFCC sequences with generative adversarial networks"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1804.00920","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:29093e55e03add484f210bcab143b0a0bbf5d05d3428a0bbf86b0ef810df7599","target":"record","created_at":"2026-05-18T00:19:31Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"27457ca7f9c2280659daa7142cde45ec4bf8ddab794c5487812f1c7cb3a60ca8","cross_cats_sorted":["cs.CL","cs.SD","stat.ML"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"eess.AS","submitted_at":"2018-04-03T11:43:36Z","title_canon_sha256":"2b80e913b87ab4407ccf04d7f619e722773682769465e2de10e7f5f083606ebc"},"schema_version":"1.0","source":{"id":"1804.00920","kind":"arxiv","version":1}},"canonical_sha256":"b89051e3279c5e38c4b1016bd2f30d58015feff62df2961566567199b56bbd07","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"b89051e3279c5e38c4b1016bd2f30d58015feff62df2961566567199b56bbd07","first_computed_at":"2026-05-18T00:19:31.788807Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:19:31.788807Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"2h9cW0NsUm15pE3VQLiAtcP+bhgV2wWgohHqjBZoroKGW2k3LoSj17PADDcoVjwWLynetM2mchKO8NjeGIAPBw==","signature_status":"signed_v1","signed_at":"2026-05-18T00:19:31.789266Z","signed_message":"canonical_sha256_bytes"},"source_id":"1804.00920","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:29093e55e03add484f210bcab143b0a0bbf5d05d3428a0bbf86b0ef810df7599","sha256:d31fbe1668313c91f0d454564332276891a6e99da209aeeae31752f4bb132539"],"state_sha256":"6b7e578901d86a87b78a57888e82519ef170491878f15ea8c79b14ef228f5ea0"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"9i2VsP4z5lKDjoWkh/YtLQ9Z4RQCQMvtMP4jf5k6McDGSDcQC/5fpBhPtIVmtAPgZ0sk+2q+sLFmd4k2fgNxBA==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-30T06:14:43.825492Z","bundle_sha256":"bdf4c6a3c41c151eb3328b3ccd50d7b8664c7d056eefc8d1c9072d9f4a8f05b0"}}