{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2018:SWV4BSQF6PJ6XLDUNRTXXH5IV6","short_pith_number":"pith:SWV4BSQF","canonical_record":{"source":{"id":"1807.10945","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2018-07-28T14:59:52Z","cross_cats_sorted":[],"title_canon_sha256":"b8f0131d1e6efb710c43a301e0bfa2cd3948a80bd187ec5ff8d8b7a25e571c8c","abstract_canon_sha256":"aeaabf593528463d883e448380f9939053d2ee850bad9ca2bcb816fda0ef4e55"},"schema_version":"1.0"},"canonical_sha256":"95abc0ca05f3d3ebac746c677b9fa8afbdefaa544c953a968e266d971f4772e8","source":{"kind":"arxiv","id":"1807.10945","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1807.10945","created_at":"2026-05-18T00:09:34Z"},{"alias_kind":"arxiv_version","alias_value":"1807.10945v1","created_at":"2026-05-18T00:09:34Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1807.10945","created_at":"2026-05-18T00:09:34Z"},{"alias_kind":"pith_short_12","alias_value":"SWV4BSQF6PJ6","created_at":"2026-05-18T12:32:53Z"},{"alias_kind":"pith_short_16","alias_value":"SWV4BSQF6PJ6XLDU","created_at":"2026-05-18T12:32:53Z"},{"alias_kind":"pith_short_8","alias_value":"SWV4BSQF","created_at":"2026-05-18T12:32:53Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2018:SWV4BSQF6PJ6XLDUNRTXXH5IV6","target":"record","payload":{"canonical_record":{"source":{"id":"1807.10945","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2018-07-28T14:59:52Z","cross_cats_sorted":[],"title_canon_sha256":"b8f0131d1e6efb710c43a301e0bfa2cd3948a80bd187ec5ff8d8b7a25e571c8c","abstract_canon_sha256":"aeaabf593528463d883e448380f9939053d2ee850bad9ca2bcb816fda0ef4e55"},"schema_version":"1.0"},"canonical_sha256":"95abc0ca05f3d3ebac746c677b9fa8afbdefaa544c953a968e266d971f4772e8","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:09:34.941579Z","signature_b64":"pLuh8GgVhucs7On57BWnpDpqbRYbj5SxPcVF5LTJ4+L6BhpTbJGgM35wdBxE4WizBuGCCHD1dzYMh3uW0jMMAw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"95abc0ca05f3d3ebac746c677b9fa8afbdefaa544c953a968e266d971f4772e8","last_reissued_at":"2026-05-18T00:09:34.941083Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:09:34.941083Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1807.10945","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:09:34Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"JuSvYkQpUZd2xZwp6vhKBDDWD8EJ9JKRCb/IQ9GV7/e6+5o/73AtczsD9K7jPn8PckLO6wwkzbPxO775pcucBg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-30T00:49:11.155032Z"},"content_sha256":"06c21c249848e8416160327095119b34c54d21aac91839eeb20794ec9b1f0af9","schema_version":"1.0","event_id":"sha256:06c21c249848e8416160327095119b34c54d21aac91839eeb20794ec9b1f0af9"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2018:SWV4BSQF6PJ6XLDUNRTXXH5IV6","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Acoustic and Textual Data Augmentation for Improved ASR of Code-Switching Speech","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.CL","authors_text":"David A. van Leeuwen, Emre Y{\\i}lmaz, Henk van den Heuvel","submitted_at":"2018-07-28T14:59:52Z","abstract_excerpt":"In this paper, we describe several techniques for improving the acoustic and language model of an automatic speech recognition (ASR) system operating on code-switching (CS) speech. We focus on the recognition of Frisian-Dutch radio broadcasts where one of the mixed languages, namely Frisian, is an under-resourced language. In previous work, we have proposed several automatic transcription strategies for CS speech to increase the amount of available training speech data. In this work, we explore how the acoustic modeling (AM) can benefit from monolingual speech data belonging to the high-resour"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1807.10945","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:09:34Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"Nm07YPXUWCn/QUl4opPnRMRjsKNeS3LtA8klADh5hYhMidY2lXX7/XCmiNEGjSIFyjQKPKapAUfHu2OCjK1xDw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-30T00:49:11.155690Z"},"content_sha256":"8456b8cc77276b98b0947891f2f8c728ed628011fc61c14843663ed648fbbca3","schema_version":"1.0","event_id":"sha256:8456b8cc77276b98b0947891f2f8c728ed628011fc61c14843663ed648fbbca3"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/SWV4BSQF6PJ6XLDUNRTXXH5IV6/bundle.json","state_url":"https://pith.science/pith/SWV4BSQF6PJ6XLDUNRTXXH5IV6/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/SWV4BSQF6PJ6XLDUNRTXXH5IV6/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-30T00:49:11Z","links":{"resolver":"https://pith.science/pith/SWV4BSQF6PJ6XLDUNRTXXH5IV6","bundle":"https://pith.science/pith/SWV4BSQF6PJ6XLDUNRTXXH5IV6/bundle.json","state":"https://pith.science/pith/SWV4BSQF6PJ6XLDUNRTXXH5IV6/state.json","well_known_bundle":"https://pith.science/.well-known/pith/SWV4BSQF6PJ6XLDUNRTXXH5IV6/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2018:SWV4BSQF6PJ6XLDUNRTXXH5IV6","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"aeaabf593528463d883e448380f9939053d2ee850bad9ca2bcb816fda0ef4e55","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2018-07-28T14:59:52Z","title_canon_sha256":"b8f0131d1e6efb710c43a301e0bfa2cd3948a80bd187ec5ff8d8b7a25e571c8c"},"schema_version":"1.0","source":{"id":"1807.10945","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1807.10945","created_at":"2026-05-18T00:09:34Z"},{"alias_kind":"arxiv_version","alias_value":"1807.10945v1","created_at":"2026-05-18T00:09:34Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1807.10945","created_at":"2026-05-18T00:09:34Z"},{"alias_kind":"pith_short_12","alias_value":"SWV4BSQF6PJ6","created_at":"2026-05-18T12:32:53Z"},{"alias_kind":"pith_short_16","alias_value":"SWV4BSQF6PJ6XLDU","created_at":"2026-05-18T12:32:53Z"},{"alias_kind":"pith_short_8","alias_value":"SWV4BSQF","created_at":"2026-05-18T12:32:53Z"}],"graph_snapshots":[{"event_id":"sha256:8456b8cc77276b98b0947891f2f8c728ed628011fc61c14843663ed648fbbca3","target":"graph","created_at":"2026-05-18T00:09:34Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"In this paper, we describe several techniques for improving the acoustic and language model of an automatic speech recognition (ASR) system operating on code-switching (CS) speech. We focus on the recognition of Frisian-Dutch radio broadcasts where one of the mixed languages, namely Frisian, is an under-resourced language. In previous work, we have proposed several automatic transcription strategies for CS speech to increase the amount of available training speech data. In this work, we explore how the acoustic modeling (AM) can benefit from monolingual speech data belonging to the high-resour","authors_text":"David A. van Leeuwen, Emre Y{\\i}lmaz, Henk van den Heuvel","cross_cats":[],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2018-07-28T14:59:52Z","title":"Acoustic and Textual Data Augmentation for Improved ASR of Code-Switching Speech"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1807.10945","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:06c21c249848e8416160327095119b34c54d21aac91839eeb20794ec9b1f0af9","target":"record","created_at":"2026-05-18T00:09:34Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"aeaabf593528463d883e448380f9939053d2ee850bad9ca2bcb816fda0ef4e55","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2018-07-28T14:59:52Z","title_canon_sha256":"b8f0131d1e6efb710c43a301e0bfa2cd3948a80bd187ec5ff8d8b7a25e571c8c"},"schema_version":"1.0","source":{"id":"1807.10945","kind":"arxiv","version":1}},"canonical_sha256":"95abc0ca05f3d3ebac746c677b9fa8afbdefaa544c953a968e266d971f4772e8","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"95abc0ca05f3d3ebac746c677b9fa8afbdefaa544c953a968e266d971f4772e8","first_computed_at":"2026-05-18T00:09:34.941083Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:09:34.941083Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"pLuh8GgVhucs7On57BWnpDpqbRYbj5SxPcVF5LTJ4+L6BhpTbJGgM35wdBxE4WizBuGCCHD1dzYMh3uW0jMMAw==","signature_status":"signed_v1","signed_at":"2026-05-18T00:09:34.941579Z","signed_message":"canonical_sha256_bytes"},"source_id":"1807.10945","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:06c21c249848e8416160327095119b34c54d21aac91839eeb20794ec9b1f0af9","sha256:8456b8cc77276b98b0947891f2f8c728ed628011fc61c14843663ed648fbbca3"],"state_sha256":"7ca3a6deae9cddf125eaa3a44fee1cb2655be87842444008a46163ebc5b3ac01"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"/42FDHGghxnXA2dfYKwlV8nK+fyFd0BxWwCt3bKGUeIvDfCm2KpdZLjFofTuryafaAISSgWaYKnPFMI7d0LMCw==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-30T00:49:11.159293Z","bundle_sha256":"9c17079e6c13a4b9a23783f16e32371b56d488dabad0595f2572a5b7ec9a35af"}}