{"record_type":"pith_number_record","schema_url":"https://pith.science/schemas/pith-number/v1.json","pith_number":"pith:2026:ZPK4HX4OEYXT3JQOACPMKEIJX3","short_pith_number":"pith:ZPK4HX4O","schema_version":"1.0","canonical_sha256":"cbd5c3df8e262f3da60e009ec51109bec9259f1ded294eb6d3933e8408802050","source":{"kind":"arxiv","id":"2606.12911","version":1},"attestation_state":"computed","paper":{"title":"PiDA: Phonetically-Informed Data Augmentation for Robust Vietnamese Speech Translation","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":[],"primary_cat":"cs.CL","authors_text":"Dung D. Le, Giang Son Nguyen, Hieu Minh Truong, Nhu Vo, Tung X. Nguyen, Wray Buntine","submitted_at":"2026-06-11T05:09:59Z","abstract_excerpt":"Cascaded speech translation (ST) systems suffer from error propagation when Automatic Speech Recognition (ASR) outputs incorrect transcripts. We present the first systematic categorization of ASR errors for Vietnamese ST, classifying substitution errors by phonetic cause and quantifying their impact on downstream Neural Machine Translation (NMT) performance using Linear Mixed-Effects Modelling. We confirm that most ASR substitution errors arise from phonetic confusions rather than random noise, and that these phonetic errors significantly degrade ST quality. Motivated by this finding, we propo"},"verification_status":{"content_addressed":true,"pith_receipt":true,"author_attested":false,"weak_author_claims":0,"strong_author_claims":0,"externally_anchored":false,"storage_verified":false,"citation_signatures":0,"replication_records":0,"graph_snapshot":true,"references_resolved":false,"formal_links_present":false},"canonical_record":{"source":{"id":"2606.12911","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2026-06-11T05:09:59Z","cross_cats_sorted":[],"title_canon_sha256":"81567fec6216d81da4042cd0ba3d07b740a227a3e75bba6b58dda850b8cb5d7a","abstract_canon_sha256":"23b9e64d0105638a8d4f0d6fba4aab8ca4e5d3bfe74432564dae2312add07a12"},"schema_version":"1.0"},"receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-06-12T01:09:34.201181Z","signature_b64":"WjRzpZhPNtKOKHRbbNRAeN05cKgDto7LTGJFPKyt64/yTIjZt8yw1g+wP5uIj5bBemxHvgLQNIO6+2uJcyHZAQ==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"cbd5c3df8e262f3da60e009ec51109bec9259f1ded294eb6d3933e8408802050","last_reissued_at":"2026-06-12T01:09:34.200587Z","signature_status":"signed_v1","first_computed_at":"2026-06-12T01:09:34.200587Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"graph_snapshot":{"paper":{"title":"PiDA: Phonetically-Informed Data Augmentation for Robust Vietnamese Speech Translation","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":[],"primary_cat":"cs.CL","authors_text":"Dung D. Le, Giang Son Nguyen, Hieu Minh Truong, Nhu Vo, Tung X. Nguyen, Wray Buntine","submitted_at":"2026-06-11T05:09:59Z","abstract_excerpt":"Cascaded speech translation (ST) systems suffer from error propagation when Automatic Speech Recognition (ASR) outputs incorrect transcripts. We present the first systematic categorization of ASR errors for Vietnamese ST, classifying substitution errors by phonetic cause and quantifying their impact on downstream Neural Machine Translation (NMT) performance using Linear Mixed-Effects Modelling. We confirm that most ASR substitution errors arise from phonetic confusions rather than random noise, and that these phonetic errors significantly degrade ST quality. Motivated by this finding, we propo"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.12911","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2606.12911/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"aliases":[{"alias_kind":"arxiv","alias_value":"2606.12911","created_at":"2026-06-12T01:09:34.200638+00:00"},{"alias_kind":"arxiv_version","alias_value":"2606.12911v1","created_at":"2026-06-12T01:09:34.200638+00:00"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.12911","created_at":"2026-06-12T01:09:34.200638+00:00"},{"alias_kind":"pith_short_12","alias_value":"ZPK4HX4OEYXT","created_at":"2026-06-12T01:09:34.200638+00:00"},{"alias_kind":"pith_short_16","alias_value":"ZPK4HX4OEYXT3JQO","created_at":"2026-06-12T01:09:34.200638+00:00"},{"alias_kind":"pith_short_8","alias_value":"ZPK4HX4O","created_at":"2026-06-12T01:09:34.200638+00:00"}],"events":[],"event_summary":{},"paper_claims":[],"inbound_citations":{"count":0,"internal_anchor_count":0,"sample":[]},"formal_canon":{"evidence_count":0,"sample":[],"anchors":[]},"links":{"html":"https://pith.science/pith/ZPK4HX4OEYXT3JQOACPMKEIJX3","json":"https://pith.science/pith/ZPK4HX4OEYXT3JQOACPMKEIJX3.json","graph_json":"https://pith.science/api/pith-number/ZPK4HX4OEYXT3JQOACPMKEIJX3/graph.json","events_json":"https://pith.science/api/pith-number/ZPK4HX4OEYXT3JQOACPMKEIJX3/events.json","paper":"https://pith.science/paper/ZPK4HX4O"},"agent_actions":{"view_html":"https://pith.science/pith/ZPK4HX4OEYXT3JQOACPMKEIJX3","download_json":"https://pith.science/pith/ZPK4HX4OEYXT3JQOACPMKEIJX3.json","view_paper":"https://pith.science/paper/ZPK4HX4O","resolve_alias":"https://pith.science/api/pith-number/resolve?arxiv=2606.12911&json=true","fetch_graph":"https://pith.science/api/pith-number/ZPK4HX4OEYXT3JQOACPMKEIJX3/graph.json","fetch_events":"https://pith.science/api/pith-number/ZPK4HX4OEYXT3JQOACPMKEIJX3/events.json","actions":{"anchor_timestamp":"https://pith.science/pith/ZPK4HX4OEYXT3JQOACPMKEIJX3/action/timestamp_anchor","attest_storage":"https://pith.science/pith/ZPK4HX4OEYXT3JQOACPMKEIJX3/action/storage_attestation","attest_author":"https://pith.science/pith/ZPK4HX4OEYXT3JQOACPMKEIJX3/action/author_attestation","sign_citation":"https://pith.science/pith/ZPK4HX4OEYXT3JQOACPMKEIJX3/action/citation_signature","submit_replication":"https://pith.science/pith/ZPK4HX4OEYXT3JQOACPMKEIJX3/action/replication_record"}},"created_at":"2026-06-12T01:09:34.200638+00:00","updated_at":"2026-06-12T01:09:34.200638+00:00"}