{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2018:ZDV72H4VSJEKRL2322NB2ZBMWB","short_pith_number":"pith:ZDV72H4V","canonical_record":{"source":{"id":"1803.08863","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2018-03-23T16:18:27Z","cross_cats_sorted":["eess.AS"],"title_canon_sha256":"cf6d34c4c2772bb144a4405d69a76e0e94cdfe09e7cf8d590fbe5ef581b59d2b","abstract_canon_sha256":"8a2948d030edc5c1e74c943afb5790cec32e7b1bfd2a1700a02bd5b901656be7"},"schema_version":"1.0"},"canonical_sha256":"c8ebfd1f959248a8af5bd69a1d642cb0407ac2cf60cbacd48e0a73441174b4ac","source":{"kind":"arxiv","id":"1803.08863","version":2},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1803.08863","created_at":"2026-05-18T00:01:15Z"},{"alias_kind":"arxiv_version","alias_value":"1803.08863v2","created_at":"2026-05-18T00:01:15Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1803.08863","created_at":"2026-05-18T00:01:15Z"},{"alias_kind":"pith_short_12","alias_value":"ZDV72H4VSJEK","created_at":"2026-05-18T12:33:07Z"},{"alias_kind":"pith_short_16","alias_value":"ZDV72H4VSJEKRL23","created_at":"2026-05-18T12:33:07Z"},{"alias_kind":"pith_short_8","alias_value":"ZDV72H4V","created_at":"2026-05-18T12:33:07Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2018:ZDV72H4VSJEKRL2322NB2ZBMWB","target":"record","payload":{"canonical_record":{"source":{"id":"1803.08863","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2018-03-23T16:18:27Z","cross_cats_sorted":["eess.AS"],"title_canon_sha256":"cf6d34c4c2772bb144a4405d69a76e0e94cdfe09e7cf8d590fbe5ef581b59d2b","abstract_canon_sha256":"8a2948d030edc5c1e74c943afb5790cec32e7b1bfd2a1700a02bd5b901656be7"},"schema_version":"1.0"},"canonical_sha256":"c8ebfd1f959248a8af5bd69a1d642cb0407ac2cf60cbacd48e0a73441174b4ac","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:01:15.084442Z","signature_b64":"DiCg5LNK8sny6OrKIBVQsXJQEfz3XToCUB5SaA93MLxqpfUrcKaTb07A+b8YeJdApHa3Vr55+ZHWzA1O0d0wCg==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"c8ebfd1f959248a8af5bd69a1d642cb0407ac2cf60cbacd48e0a73441174b4ac","last_reissued_at":"2026-05-18T00:01:15.084009Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:01:15.084009Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1803.08863","source_version":2,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:01:15Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"8k4tPkA1AZMg9DDcOEiOOb4T8P5cyPEI8S3FI5murnYah0CpsmmR27TyqrnxS4rNIvPpOwKE4cRjm3LX7FSnDQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-11T22:56:39.422036Z"},"content_sha256":"579106446fab616f2614c5e24ecfc2d906afa9392c7472460c1247577e15bee7","schema_version":"1.0","event_id":"sha256:579106446fab616f2614c5e24ecfc2d906afa9392c7472460c1247577e15bee7"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2018:ZDV72H4VSJEKRL2322NB2ZBMWB","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Multilingual bottleneck features for subword modeling in zero-resource languages","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["eess.AS"],"primary_cat":"cs.CL","authors_text":"Enno Hermann, Sharon Goldwater","submitted_at":"2018-03-23T16:18:27Z","abstract_excerpt":"How can we effectively develop speech technology for languages where no transcribed data is available? Many existing approaches use no annotated resources at all, yet it makes sense to leverage information from large annotated corpora in other languages, for example in the form of multilingual bottleneck features (BNFs) obtained from a supervised speech recognition system. In this work, we evaluate the benefits of BNFs for subword modeling (feature extraction) in six unseen languages on a word discrimination task. First we establish a strong unsupervised baseline by combining two existing meth"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1803.08863","kind":"arxiv","version":2},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:01:15Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"DuvsOq4vXdzSvrQ8yNHFN9Z/MN6I0R/ihmKfwykMVDc14Y4C+RJVDm+3J+FO12h6/HsEVV02rx9e/zmgJ5w6Ag==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-11T22:56:39.422871Z"},"content_sha256":"fa66b413434059a09bfd973b26a34362a529d5662e7e6377a0aaec91c62eab1e","schema_version":"1.0","event_id":"sha256:fa66b413434059a09bfd973b26a34362a529d5662e7e6377a0aaec91c62eab1e"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/ZDV72H4VSJEKRL2322NB2ZBMWB/bundle.json","state_url":"https://pith.science/pith/ZDV72H4VSJEKRL2322NB2ZBMWB/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/ZDV72H4VSJEKRL2322NB2ZBMWB/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-11T22:56:39Z","links":{"resolver":"https://pith.science/pith/ZDV72H4VSJEKRL2322NB2ZBMWB","bundle":"https://pith.science/pith/ZDV72H4VSJEKRL2322NB2ZBMWB/bundle.json","state":"https://pith.science/pith/ZDV72H4VSJEKRL2322NB2ZBMWB/state.json","well_known_bundle":"https://pith.science/.well-known/pith/ZDV72H4VSJEKRL2322NB2ZBMWB/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2018:ZDV72H4VSJEKRL2322NB2ZBMWB","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"8a2948d030edc5c1e74c943afb5790cec32e7b1bfd2a1700a02bd5b901656be7","cross_cats_sorted":["eess.AS"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2018-03-23T16:18:27Z","title_canon_sha256":"cf6d34c4c2772bb144a4405d69a76e0e94cdfe09e7cf8d590fbe5ef581b59d2b"},"schema_version":"1.0","source":{"id":"1803.08863","kind":"arxiv","version":2}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1803.08863","created_at":"2026-05-18T00:01:15Z"},{"alias_kind":"arxiv_version","alias_value":"1803.08863v2","created_at":"2026-05-18T00:01:15Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1803.08863","created_at":"2026-05-18T00:01:15Z"},{"alias_kind":"pith_short_12","alias_value":"ZDV72H4VSJEK","created_at":"2026-05-18T12:33:07Z"},{"alias_kind":"pith_short_16","alias_value":"ZDV72H4VSJEKRL23","created_at":"2026-05-18T12:33:07Z"},{"alias_kind":"pith_short_8","alias_value":"ZDV72H4V","created_at":"2026-05-18T12:33:07Z"}],"graph_snapshots":[{"event_id":"sha256:fa66b413434059a09bfd973b26a34362a529d5662e7e6377a0aaec91c62eab1e","target":"graph","created_at":"2026-05-18T00:01:15Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"How can we effectively develop speech technology for languages where no transcribed data is available? Many existing approaches use no annotated resources at all, yet it makes sense to leverage information from large annotated corpora in other languages, for example in the form of multilingual bottleneck features (BNFs) obtained from a supervised speech recognition system. In this work, we evaluate the benefits of BNFs for subword modeling (feature extraction) in six unseen languages on a word discrimination task. First we establish a strong unsupervised baseline by combining two existing meth","authors_text":"Enno Hermann, Sharon Goldwater","cross_cats":["eess.AS"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2018-03-23T16:18:27Z","title":"Multilingual bottleneck features for subword modeling in zero-resource languages"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1803.08863","kind":"arxiv","version":2},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:579106446fab616f2614c5e24ecfc2d906afa9392c7472460c1247577e15bee7","target":"record","created_at":"2026-05-18T00:01:15Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"8a2948d030edc5c1e74c943afb5790cec32e7b1bfd2a1700a02bd5b901656be7","cross_cats_sorted":["eess.AS"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2018-03-23T16:18:27Z","title_canon_sha256":"cf6d34c4c2772bb144a4405d69a76e0e94cdfe09e7cf8d590fbe5ef581b59d2b"},"schema_version":"1.0","source":{"id":"1803.08863","kind":"arxiv","version":2}},"canonical_sha256":"c8ebfd1f959248a8af5bd69a1d642cb0407ac2cf60cbacd48e0a73441174b4ac","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"c8ebfd1f959248a8af5bd69a1d642cb0407ac2cf60cbacd48e0a73441174b4ac","first_computed_at":"2026-05-18T00:01:15.084009Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:01:15.084009Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"DiCg5LNK8sny6OrKIBVQsXJQEfz3XToCUB5SaA93MLxqpfUrcKaTb07A+b8YeJdApHa3Vr55+ZHWzA1O0d0wCg==","signature_status":"signed_v1","signed_at":"2026-05-18T00:01:15.084442Z","signed_message":"canonical_sha256_bytes"},"source_id":"1803.08863","source_kind":"arxiv","source_version":2}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:579106446fab616f2614c5e24ecfc2d906afa9392c7472460c1247577e15bee7","sha256:fa66b413434059a09bfd973b26a34362a529d5662e7e6377a0aaec91c62eab1e"],"state_sha256":"62c817fee6683f71a97b93f913be22de2d2cca1d10c3a0ec16065a4bd61bb025"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"VWHN+1l0JTUisEVHRFJe0oRsnX+URUxYuQVNQL2gyw1djpLEkABTAYNA5PkksYawYJdYWUoOFfsOCKtYC//KDg==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-11T22:56:39.427801Z","bundle_sha256":"d90aa2d4bb55da4272f7f292a4871031340683d0b42d94a3d41cd3f5d0889847"}}