{"record_type":"pith_number_record","schema_url":"https://pith.science/schemas/pith-number/v1.json","pith_number":"pith:2018:SWV4BSQF6PJ6XLDUNRTXXH5IV6","short_pith_number":"pith:SWV4BSQF","schema_version":"1.0","canonical_sha256":"95abc0ca05f3d3ebac746c677b9fa8afbdefaa544c953a968e266d971f4772e8","source":{"kind":"arxiv","id":"1807.10945","version":1},"attestation_state":"computed","paper":{"title":"Acoustic and Textual Data Augmentation for Improved ASR of Code-Switching Speech","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.CL","authors_text":"David A. van Leeuwen, Emre Y{\\i}lmaz, Henk van den Heuvel","submitted_at":"2018-07-28T14:59:52Z","abstract_excerpt":"In this paper, we describe several techniques for improving the acoustic and language model of an automatic speech recognition (ASR) system operating on code-switching (CS) speech. We focus on the recognition of Frisian-Dutch radio broadcasts where one of the mixed languages, namely Frisian, is an under-resourced language. In previous work, we have proposed several automatic transcription strategies for CS speech to increase the amount of available training speech data. In this work, we explore how the acoustic modeling (AM) can benefit from monolingual speech data belonging to the high-resour"},"verification_status":{"content_addressed":true,"pith_receipt":true,"author_attested":false,"weak_author_claims":0,"strong_author_claims":0,"externally_anchored":false,"storage_verified":false,"citation_signatures":0,"replication_records":0,"graph_snapshot":true,"references_resolved":false,"formal_links_present":false},"canonical_record":{"source":{"id":"1807.10945","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2018-07-28T14:59:52Z","cross_cats_sorted":[],"title_canon_sha256":"b8f0131d1e6efb710c43a301e0bfa2cd3948a80bd187ec5ff8d8b7a25e571c8c","abstract_canon_sha256":"aeaabf593528463d883e448380f9939053d2ee850bad9ca2bcb816fda0ef4e55"},"schema_version":"1.0"},"receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:09:34.941579Z","signature_b64":"pLuh8GgVhucs7On57BWnpDpqbRYbj5SxPcVF5LTJ4+L6BhpTbJGgM35wdBxE4WizBuGCCHD1dzYMh3uW0jMMAw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"95abc0ca05f3d3ebac746c677b9fa8afbdefaa544c953a968e266d971f4772e8","last_reissued_at":"2026-05-18T00:09:34.941083Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:09:34.941083Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"graph_snapshot":{"paper":{"title":"Acoustic and Textual Data Augmentation for Improved ASR of Code-Switching Speech","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.CL","authors_text":"David A. van Leeuwen, Emre Y{\\i}lmaz, Henk van den Heuvel","submitted_at":"2018-07-28T14:59:52Z","abstract_excerpt":"In this paper, we describe several techniques for improving the acoustic and language model of an automatic speech recognition (ASR) system operating on code-switching (CS) speech. We focus on the recognition of Frisian-Dutch radio broadcasts where one of the mixed languages, namely Frisian, is an under-resourced language. In previous work, we have proposed several automatic transcription strategies for CS speech to increase the amount of available training speech data. In this work, we explore how the acoustic modeling (AM) can benefit from monolingual speech data belonging to the high-resour"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1807.10945","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"aliases":[{"alias_kind":"arxiv","alias_value":"1807.10945","created_at":"2026-05-18T00:09:34.941165+00:00"},{"alias_kind":"arxiv_version","alias_value":"1807.10945v1","created_at":"2026-05-18T00:09:34.941165+00:00"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1807.10945","created_at":"2026-05-18T00:09:34.941165+00:00"},{"alias_kind":"pith_short_12","alias_value":"SWV4BSQF6PJ6","created_at":"2026-05-18T12:32:53.628368+00:00"},{"alias_kind":"pith_short_16","alias_value":"SWV4BSQF6PJ6XLDU","created_at":"2026-05-18T12:32:53.628368+00:00"},{"alias_kind":"pith_short_8","alias_value":"SWV4BSQF","created_at":"2026-05-18T12:32:53.628368+00:00"}],"events":[],"event_summary":{},"paper_claims":[],"inbound_citations":{"count":0,"internal_anchor_count":0,"sample":[]},"formal_canon":{"evidence_count":0,"sample":[],"anchors":[]},"links":{"html":"https://pith.science/pith/SWV4BSQF6PJ6XLDUNRTXXH5IV6","json":"https://pith.science/pith/SWV4BSQF6PJ6XLDUNRTXXH5IV6.json","graph_json":"https://pith.science/api/pith-number/SWV4BSQF6PJ6XLDUNRTXXH5IV6/graph.json","events_json":"https://pith.science/api/pith-number/SWV4BSQF6PJ6XLDUNRTXXH5IV6/events.json","paper":"https://pith.science/paper/SWV4BSQF"},"agent_actions":{"view_html":"https://pith.science/pith/SWV4BSQF6PJ6XLDUNRTXXH5IV6","download_json":"https://pith.science/pith/SWV4BSQF6PJ6XLDUNRTXXH5IV6.json","view_paper":"https://pith.science/paper/SWV4BSQF","resolve_alias":"https://pith.science/api/pith-number/resolve?arxiv=1807.10945&json=true","fetch_graph":"https://pith.science/api/pith-number/SWV4BSQF6PJ6XLDUNRTXXH5IV6/graph.json","fetch_events":"https://pith.science/api/pith-number/SWV4BSQF6PJ6XLDUNRTXXH5IV6/events.json","actions":{"anchor_timestamp":"https://pith.science/pith/SWV4BSQF6PJ6XLDUNRTXXH5IV6/action/timestamp_anchor","attest_storage":"https://pith.science/pith/SWV4BSQF6PJ6XLDUNRTXXH5IV6/action/storage_attestation","attest_author":"https://pith.science/pith/SWV4BSQF6PJ6XLDUNRTXXH5IV6/action/author_attestation","sign_citation":"https://pith.science/pith/SWV4BSQF6PJ6XLDUNRTXXH5IV6/action/citation_signature","submit_replication":"https://pith.science/pith/SWV4BSQF6PJ6XLDUNRTXXH5IV6/action/replication_record"}},"created_at":"2026-05-18T00:09:34.941165+00:00","updated_at":"2026-05-18T00:09:34.941165+00:00"}