{"record_type":"pith_number_record","schema_url":"https://pith.science/schemas/pith-number/v1.json","pith_number":"pith:2018:CG6T4KERCIHBSWVZAOMSP5F5K2","short_pith_number":"pith:CG6T4KER","schema_version":"1.0","canonical_sha256":"11bd3e2891120e195ab9039927f4bd5685b83f1523cf02c931d8bf8dd33c023d","source":{"kind":"arxiv","id":"1811.03189","version":1},"attestation_state":"computed","paper":{"title":"Towards Fluent Translations from Disfluent Speech","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.CL","authors_text":"Alex Waibel, Elizabeth Salesky, Jan Niehues, Susanne Burger","submitted_at":"2018-11-07T23:47:01Z","abstract_excerpt":"When translating from speech, special consideration for conversational speech phenomena such as disfluencies is necessary. Most machine translation training data consists of well-formed written texts, causing issues when translating spontaneous speech. Previous work has introduced an intermediate step between speech recognition (ASR) and machine translation (MT) to remove disfluencies, making the data better-matched to typical translation text and significantly improving performance. However, with the rise of end-to-end speech translation systems, this intermediate step must be incorporated in"},"verification_status":{"content_addressed":true,"pith_receipt":true,"author_attested":false,"weak_author_claims":0,"strong_author_claims":0,"externally_anchored":false,"storage_verified":false,"citation_signatures":0,"replication_records":0,"graph_snapshot":true,"references_resolved":false,"formal_links_present":false},"canonical_record":{"source":{"id":"1811.03189","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2018-11-07T23:47:01Z","cross_cats_sorted":[],"title_canon_sha256":"4d9c5f32bd0f540a58c0c378768700096704f6b98d70f4ee0753927a3ab25840","abstract_canon_sha256":"ca16b60d7381defca0f13d228bce67db320eced458262d36ff3fdeebf4f10950"},"schema_version":"1.0"},"receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:01:18.892181Z","signature_b64":"oJS0gG73wEaNI1u57v5Eo2+ISQViX3L+jcXWD6rpTSe2YS3q9TfNd2ANEqANg0DXJxCkk6PKU2zd395bBDHeDw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"11bd3e2891120e195ab9039927f4bd5685b83f1523cf02c931d8bf8dd33c023d","last_reissued_at":"2026-05-18T00:01:18.891782Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:01:18.891782Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"graph_snapshot":{"paper":{"title":"Towards Fluent Translations from Disfluent Speech","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.CL","authors_text":"Alex Waibel, Elizabeth Salesky, Jan Niehues, Susanne Burger","submitted_at":"2018-11-07T23:47:01Z","abstract_excerpt":"When translating from speech, special consideration for conversational speech phenomena such as disfluencies is necessary. Most machine translation training data consists of well-formed written texts, causing issues when translating spontaneous speech. Previous work has introduced an intermediate step between speech recognition (ASR) and machine translation (MT) to remove disfluencies, making the data better-matched to typical translation text and significantly improving performance. However, with the rise of end-to-end speech translation systems, this intermediate step must be incorporated in"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1811.03189","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"aliases":[{"alias_kind":"arxiv","alias_value":"1811.03189","created_at":"2026-05-18T00:01:18.891847+00:00"},{"alias_kind":"arxiv_version","alias_value":"1811.03189v1","created_at":"2026-05-18T00:01:18.891847+00:00"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1811.03189","created_at":"2026-05-18T00:01:18.891847+00:00"},{"alias_kind":"pith_short_12","alias_value":"CG6T4KERCIHB","created_at":"2026-05-18T12:32:16.446611+00:00"},{"alias_kind":"pith_short_16","alias_value":"CG6T4KERCIHBSWVZ","created_at":"2026-05-18T12:32:16.446611+00:00"},{"alias_kind":"pith_short_8","alias_value":"CG6T4KER","created_at":"2026-05-18T12:32:16.446611+00:00"}],"events":[],"event_summary":{},"paper_claims":[],"inbound_citations":{"count":0,"internal_anchor_count":0,"sample":[]},"formal_canon":{"evidence_count":0,"sample":[],"anchors":[]},"links":{"html":"https://pith.science/pith/CG6T4KERCIHBSWVZAOMSP5F5K2","json":"https://pith.science/pith/CG6T4KERCIHBSWVZAOMSP5F5K2.json","graph_json":"https://pith.science/api/pith-number/CG6T4KERCIHBSWVZAOMSP5F5K2/graph.json","events_json":"https://pith.science/api/pith-number/CG6T4KERCIHBSWVZAOMSP5F5K2/events.json","paper":"https://pith.science/paper/CG6T4KER"},"agent_actions":{"view_html":"https://pith.science/pith/CG6T4KERCIHBSWVZAOMSP5F5K2","download_json":"https://pith.science/pith/CG6T4KERCIHBSWVZAOMSP5F5K2.json","view_paper":"https://pith.science/paper/CG6T4KER","resolve_alias":"https://pith.science/api/pith-number/resolve?arxiv=1811.03189&json=true","fetch_graph":"https://pith.science/api/pith-number/CG6T4KERCIHBSWVZAOMSP5F5K2/graph.json","fetch_events":"https://pith.science/api/pith-number/CG6T4KERCIHBSWVZAOMSP5F5K2/events.json","actions":{"anchor_timestamp":"https://pith.science/pith/CG6T4KERCIHBSWVZAOMSP5F5K2/action/timestamp_anchor","attest_storage":"https://pith.science/pith/CG6T4KERCIHBSWVZAOMSP5F5K2/action/storage_attestation","attest_author":"https://pith.science/pith/CG6T4KERCIHBSWVZAOMSP5F5K2/action/author_attestation","sign_citation":"https://pith.science/pith/CG6T4KERCIHBSWVZAOMSP5F5K2/action/citation_signature","submit_replication":"https://pith.science/pith/CG6T4KERCIHBSWVZAOMSP5F5K2/action/replication_record"}},"created_at":"2026-05-18T00:01:18.891847+00:00","updated_at":"2026-05-18T00:01:18.891847+00:00"}