{"record_type":"pith_number_record","schema_url":"https://pith.science/schemas/pith-number/v1.json","pith_number":"pith:2026:ML3DFPIMXIH5OJ7PGSTYTPV565","short_pith_number":"pith:ML3DFPIM","schema_version":"1.0","canonical_sha256":"62f632bd0cba0fd727ef34a789bebdf75aeb91e067274dea17747ebdbc83b385","source":{"kind":"arxiv","id":"2605.27874","version":1},"attestation_state":"computed","paper":{"title":"Syllabic-Structure Decoder for Automatic Speech Recognition in Vietnamese","license":"http://creativecommons.org/licenses/by-nc-sa/4.0/","headline":"","cross_cats":[],"primary_cat":"cs.CL","authors_text":"Kiet Van Nguyen, Long Hoang Huu Nguyen, Ngan Luu-Thuy Nguyen, Nghia Hieu Nguyen, Quan Ngoc Hoang","submitted_at":"2026-05-27T02:51:09Z","abstract_excerpt":"Most Automatic Speech Recognition (ASR) systems formulate transcription as a prediction problem over orthographic units such as characters, subwords, or words. Although effective, such representations do not explicitly reflect the phonetic structure of speech and often require large vocabularies to maintain adequate coverage. In this work, we are motivated from the phonemic features of Vietnamese to propose a Syllabic-Structure Decoder for ASR, which models speech at the phoneme level instead of the orthographic level. Our approach explicitly captures the phonological composition of syllables,"},"verification_status":{"content_addressed":true,"pith_receipt":true,"author_attested":false,"weak_author_claims":0,"strong_author_claims":0,"externally_anchored":false,"storage_verified":false,"citation_signatures":0,"replication_records":0,"graph_snapshot":true,"references_resolved":false,"formal_links_present":false},"canonical_record":{"source":{"id":"2605.27874","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by-nc-sa/4.0/","primary_cat":"cs.CL","submitted_at":"2026-05-27T02:51:09Z","cross_cats_sorted":[],"title_canon_sha256":"a54949395352c681cda26b81e7e495c3f330f3bc35017812a1568e5afe583332","abstract_canon_sha256":"a9a620979d56c18fe314c3bad58caf916ffa8f2ee70876236951c39f8fb34118"},"schema_version":"1.0"},"receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-28T01:04:51.019765Z","signature_b64":"SmM6M0+ARED3f2rtFdfgUEOntB6mENfkD1uhYrqt3gtTSr/w4167ubDjMuwxY1VXZ6Aq7sqdE/2lVlgoUzAPDw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"62f632bd0cba0fd727ef34a789bebdf75aeb91e067274dea17747ebdbc83b385","last_reissued_at":"2026-05-28T01:04:51.019360Z","signature_status":"signed_v1","first_computed_at":"2026-05-28T01:04:51.019360Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"graph_snapshot":{"paper":{"title":"Syllabic-Structure Decoder for Automatic Speech Recognition in Vietnamese","license":"http://creativecommons.org/licenses/by-nc-sa/4.0/","headline":"","cross_cats":[],"primary_cat":"cs.CL","authors_text":"Kiet Van Nguyen, Long Hoang Huu Nguyen, Ngan Luu-Thuy Nguyen, Nghia Hieu Nguyen, Quan Ngoc Hoang","submitted_at":"2026-05-27T02:51:09Z","abstract_excerpt":"Most Automatic Speech Recognition (ASR) systems formulate transcription as a prediction problem over orthographic units such as characters, subwords, or words. Although effective, such representations do not explicitly reflect the phonetic structure of speech and often require large vocabularies to maintain adequate coverage. In this work, we are motivated from the phonemic features of Vietnamese to propose a Syllabic-Structure Decoder for ASR, which models speech at the phoneme level instead of the orthographic level. Our approach explicitly captures the phonological composition of syllables,"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2605.27874","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2605.27874/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"aliases":[{"alias_kind":"arxiv","alias_value":"2605.27874","created_at":"2026-05-28T01:04:51.019421+00:00"},{"alias_kind":"arxiv_version","alias_value":"2605.27874v1","created_at":"2026-05-28T01:04:51.019421+00:00"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.27874","created_at":"2026-05-28T01:04:51.019421+00:00"},{"alias_kind":"pith_short_12","alias_value":"ML3DFPIMXIH5","created_at":"2026-05-28T01:04:51.019421+00:00"},{"alias_kind":"pith_short_16","alias_value":"ML3DFPIMXIH5OJ7P","created_at":"2026-05-28T01:04:51.019421+00:00"},{"alias_kind":"pith_short_8","alias_value":"ML3DFPIM","created_at":"2026-05-28T01:04:51.019421+00:00"}],"events":[],"event_summary":{},"paper_claims":[],"inbound_citations":{"count":0,"internal_anchor_count":0,"sample":[]},"formal_canon":{"evidence_count":0,"sample":[],"anchors":[]},"links":{"html":"https://pith.science/pith/ML3DFPIMXIH5OJ7PGSTYTPV565","json":"https://pith.science/pith/ML3DFPIMXIH5OJ7PGSTYTPV565.json","graph_json":"https://pith.science/api/pith-number/ML3DFPIMXIH5OJ7PGSTYTPV565/graph.json","events_json":"https://pith.science/api/pith-number/ML3DFPIMXIH5OJ7PGSTYTPV565/events.json","paper":"https://pith.science/paper/ML3DFPIM"},"agent_actions":{"view_html":"https://pith.science/pith/ML3DFPIMXIH5OJ7PGSTYTPV565","download_json":"https://pith.science/pith/ML3DFPIMXIH5OJ7PGSTYTPV565.json","view_paper":"https://pith.science/paper/ML3DFPIM","resolve_alias":"https://pith.science/api/pith-number/resolve?arxiv=2605.27874&json=true","fetch_graph":"https://pith.science/api/pith-number/ML3DFPIMXIH5OJ7PGSTYTPV565/graph.json","fetch_events":"https://pith.science/api/pith-number/ML3DFPIMXIH5OJ7PGSTYTPV565/events.json","actions":{"anchor_timestamp":"https://pith.science/pith/ML3DFPIMXIH5OJ7PGSTYTPV565/action/timestamp_anchor","attest_storage":"https://pith.science/pith/ML3DFPIMXIH5OJ7PGSTYTPV565/action/storage_attestation","attest_author":"https://pith.science/pith/ML3DFPIMXIH5OJ7PGSTYTPV565/action/author_attestation","sign_citation":"https://pith.science/pith/ML3DFPIMXIH5OJ7PGSTYTPV565/action/citation_signature","submit_replication":"https://pith.science/pith/ML3DFPIMXIH5OJ7PGSTYTPV565/action/replication_record"}},"created_at":"2026-05-28T01:04:51.019421+00:00","updated_at":"2026-05-28T01:04:51.019421+00:00"}