{"record_type":"pith_number_record","schema_url":"https://pith.science/schemas/pith-number/v1.json","pith_number":"pith:2019:4KKAYHRXWDCLJAEJNJQIHSDMDF","short_pith_number":"pith:4KKAYHRX","schema_version":"1.0","canonical_sha256":"e2940c1e37b0c4b480896a6083c86c196a3ff6829b46b4b80ff4f3945e99073d","source":{"kind":"arxiv","id":"1901.04112","version":1},"attestation_state":"computed","paper":{"title":"Unsupervised Neural Machine Translation with SMT as Posterior Regularization","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.CL","authors_text":"Ming Zhou, Shuai Ma, Shujie Liu, Shuo Ren, Zhirui Zhang","submitted_at":"2019-01-14T03:34:27Z","abstract_excerpt":"Without real bilingual corpus available, unsupervised Neural Machine Translation (NMT) typically requires pseudo parallel data generated with the back-translation method for the model training. However, due to weak supervision, the pseudo data inevitably contain noises and errors that will be accumulated and reinforced in the subsequent training process, leading to bad translation performance. To address this issue, we introduce phrase based Statistic Machine Translation (SMT) models which are robust to noisy data, as posterior regularizations to guide the training of unsupervised NMT models i"},"verification_status":{"content_addressed":true,"pith_receipt":true,"author_attested":false,"weak_author_claims":0,"strong_author_claims":0,"externally_anchored":false,"storage_verified":false,"citation_signatures":0,"replication_records":0,"graph_snapshot":true,"references_resolved":false,"formal_links_present":false},"canonical_record":{"source":{"id":"1901.04112","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2019-01-14T03:34:27Z","cross_cats_sorted":[],"title_canon_sha256":"b6ab3cab2eed3985f94abb157c6710cb708dec960cdab134727356cb12dbb0e3","abstract_canon_sha256":"c016d121ff8df79db43d36d3341a6c23c370d826f4be4b754781000723fd474b"},"schema_version":"1.0"},"receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-17T23:56:26.259026Z","signature_b64":"UMtr2Et2P9vuiAsbTrJ0dEO5Y5/NMzTe51C0VOmbKl7rZRxWJXgzKwUe22RcNRiQPx/FRSct0aqs5ERUWEwtCg==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"e2940c1e37b0c4b480896a6083c86c196a3ff6829b46b4b80ff4f3945e99073d","last_reissued_at":"2026-05-17T23:56:26.258576Z","signature_status":"signed_v1","first_computed_at":"2026-05-17T23:56:26.258576Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"graph_snapshot":{"paper":{"title":"Unsupervised Neural Machine Translation with SMT as Posterior Regularization","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.CL","authors_text":"Ming Zhou, Shuai Ma, Shujie Liu, Shuo Ren, Zhirui Zhang","submitted_at":"2019-01-14T03:34:27Z","abstract_excerpt":"Without real bilingual corpus available, unsupervised Neural Machine Translation (NMT) typically requires pseudo parallel data generated with the back-translation method for the model training. However, due to weak supervision, the pseudo data inevitably contain noises and errors that will be accumulated and reinforced in the subsequent training process, leading to bad translation performance. To address this issue, we introduce phrase based Statistic Machine Translation (SMT) models which are robust to noisy data, as posterior regularizations to guide the training of unsupervised NMT models i"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1901.04112","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"aliases":[{"alias_kind":"arxiv","alias_value":"1901.04112","created_at":"2026-05-17T23:56:26.258658+00:00"},{"alias_kind":"arxiv_version","alias_value":"1901.04112v1","created_at":"2026-05-17T23:56:26.258658+00:00"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1901.04112","created_at":"2026-05-17T23:56:26.258658+00:00"},{"alias_kind":"pith_short_12","alias_value":"4KKAYHRXWDCL","created_at":"2026-05-18T12:33:10.108867+00:00"},{"alias_kind":"pith_short_16","alias_value":"4KKAYHRXWDCLJAEJ","created_at":"2026-05-18T12:33:10.108867+00:00"},{"alias_kind":"pith_short_8","alias_value":"4KKAYHRX","created_at":"2026-05-18T12:33:10.108867+00:00"}],"events":[],"event_summary":{},"paper_claims":[],"inbound_citations":{"count":1,"internal_anchor_count":1,"sample":[{"citing_arxiv_id":"2009.10297","citing_title":"CodeBLEU: a Method for Automatic Evaluation of Code Synthesis","ref_index":9,"is_internal_anchor":true}]},"formal_canon":{"evidence_count":0,"sample":[],"anchors":[]},"links":{"html":"https://pith.science/pith/4KKAYHRXWDCLJAEJNJQIHSDMDF","json":"https://pith.science/pith/4KKAYHRXWDCLJAEJNJQIHSDMDF.json","graph_json":"https://pith.science/api/pith-number/4KKAYHRXWDCLJAEJNJQIHSDMDF/graph.json","events_json":"https://pith.science/api/pith-number/4KKAYHRXWDCLJAEJNJQIHSDMDF/events.json","paper":"https://pith.science/paper/4KKAYHRX"},"agent_actions":{"view_html":"https://pith.science/pith/4KKAYHRXWDCLJAEJNJQIHSDMDF","download_json":"https://pith.science/pith/4KKAYHRXWDCLJAEJNJQIHSDMDF.json","view_paper":"https://pith.science/paper/4KKAYHRX","resolve_alias":"https://pith.science/api/pith-number/resolve?arxiv=1901.04112&json=true","fetch_graph":"https://pith.science/api/pith-number/4KKAYHRXWDCLJAEJNJQIHSDMDF/graph.json","fetch_events":"https://pith.science/api/pith-number/4KKAYHRXWDCLJAEJNJQIHSDMDF/events.json","actions":{"anchor_timestamp":"https://pith.science/pith/4KKAYHRXWDCLJAEJNJQIHSDMDF/action/timestamp_anchor","attest_storage":"https://pith.science/pith/4KKAYHRXWDCLJAEJNJQIHSDMDF/action/storage_attestation","attest_author":"https://pith.science/pith/4KKAYHRXWDCLJAEJNJQIHSDMDF/action/author_attestation","sign_citation":"https://pith.science/pith/4KKAYHRXWDCLJAEJNJQIHSDMDF/action/citation_signature","submit_replication":"https://pith.science/pith/4KKAYHRXWDCLJAEJNJQIHSDMDF/action/replication_record"}},"created_at":"2026-05-17T23:56:26.258658+00:00","updated_at":"2026-05-17T23:56:26.258658+00:00"}