{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2018:HX4HN6ITVMUUKB54Z5AMOI25IY","short_pith_number":"pith:HX4HN6IT","canonical_record":{"source":{"id":"1811.01064","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2018-11-02T19:41:44Z","cross_cats_sorted":[],"title_canon_sha256":"eabb0a9bf9fb71f7edf803825c6696d345c38fb405b80e8378dade683c156883","abstract_canon_sha256":"0db50be72b01230e0e27277f4761fbd9595fe9a79266ac464b8b1bd5d953f89c"},"schema_version":"1.0"},"canonical_sha256":"3df876f913ab294507bccf40c7235d462b66ce27db3ef8a639aa10d95d7f7e10","source":{"kind":"arxiv","id":"1811.01064","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1811.01064","created_at":"2026-05-18T00:01:37Z"},{"alias_kind":"arxiv_version","alias_value":"1811.01064v1","created_at":"2026-05-18T00:01:37Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1811.01064","created_at":"2026-05-18T00:01:37Z"},{"alias_kind":"pith_short_12","alias_value":"HX4HN6ITVMUU","created_at":"2026-05-18T12:32:28Z"},{"alias_kind":"pith_short_16","alias_value":"HX4HN6ITVMUUKB54","created_at":"2026-05-18T12:32:28Z"},{"alias_kind":"pith_short_8","alias_value":"HX4HN6IT","created_at":"2026-05-18T12:32:28Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2018:HX4HN6ITVMUUKB54Z5AMOI25IY","target":"record","payload":{"canonical_record":{"source":{"id":"1811.01064","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2018-11-02T19:41:44Z","cross_cats_sorted":[],"title_canon_sha256":"eabb0a9bf9fb71f7edf803825c6696d345c38fb405b80e8378dade683c156883","abstract_canon_sha256":"0db50be72b01230e0e27277f4761fbd9595fe9a79266ac464b8b1bd5d953f89c"},"schema_version":"1.0"},"canonical_sha256":"3df876f913ab294507bccf40c7235d462b66ce27db3ef8a639aa10d95d7f7e10","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:01:37.163104Z","signature_b64":"0xGJflpXkisnczuPjHO03bLZjy6RKVLSR52XK74Z8BLLvEbB8rmVP2fWDNrTnC8x/Tds5c2dr+BlyfSRIPiPAA==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"3df876f913ab294507bccf40c7235d462b66ce27db3ef8a639aa10d95d7f7e10","last_reissued_at":"2026-05-18T00:01:37.162698Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:01:37.162698Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1811.01064","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:01:37Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"NFaTR/+fiCOrsZX8Q1F3SXAAriA+ADgaAYFjZgFvkf4xihuhZ3OlKLaDXUh3sptHxKwCTcwkog4Gq49jrzZvAA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-30T16:00:00.584853Z"},"content_sha256":"d64eeb09dcd469983d8e94463e9efed9a5e39e362b2af9270431068e2d5cecc8","schema_version":"1.0","event_id":"sha256:d64eeb09dcd469983d8e94463e9efed9a5e39e362b2af9270431068e2d5cecc8"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2018:HX4HN6ITVMUUKB54Z5AMOI25IY","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Neural Machine Translation into Language Varieties","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.CL","authors_text":"Aliia Erofeeva, Marcello Federico, Surafel M. Lakew","submitted_at":"2018-11-02T19:41:44Z","abstract_excerpt":"Both research and commercial machine translation have so far neglected the importance of properly handling the spelling, lexical and grammar divergences occurring among language varieties. Notable cases are standard national varieties such as Brazilian and European Portuguese, and Canadian and European French, which popular online machine translation services are not keeping distinct. We show that an evident side effect of modeling such varieties as unique classes is the generation of inconsistent translations. In this work, we investigate the problem of training neural machine translation fro"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1811.01064","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:01:37Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"kE+N1+UtjVIeoh/q/nH7+JAVLZ3Zb25T4ahZRBcEMoFSW7xjLO893rt7D5cAwsbnzx6dBW2+/qFma+t6HuRZAw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-30T16:00:00.585188Z"},"content_sha256":"aee5c2e5eb5242f5249796ffbe369aa052fe8e2a2875eb94f5a1ab3e6bb65278","schema_version":"1.0","event_id":"sha256:aee5c2e5eb5242f5249796ffbe369aa052fe8e2a2875eb94f5a1ab3e6bb65278"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/HX4HN6ITVMUUKB54Z5AMOI25IY/bundle.json","state_url":"https://pith.science/pith/HX4HN6ITVMUUKB54Z5AMOI25IY/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/HX4HN6ITVMUUKB54Z5AMOI25IY/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-30T16:00:00Z","links":{"resolver":"https://pith.science/pith/HX4HN6ITVMUUKB54Z5AMOI25IY","bundle":"https://pith.science/pith/HX4HN6ITVMUUKB54Z5AMOI25IY/bundle.json","state":"https://pith.science/pith/HX4HN6ITVMUUKB54Z5AMOI25IY/state.json","well_known_bundle":"https://pith.science/.well-known/pith/HX4HN6ITVMUUKB54Z5AMOI25IY/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2018:HX4HN6ITVMUUKB54Z5AMOI25IY","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"0db50be72b01230e0e27277f4761fbd9595fe9a79266ac464b8b1bd5d953f89c","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2018-11-02T19:41:44Z","title_canon_sha256":"eabb0a9bf9fb71f7edf803825c6696d345c38fb405b80e8378dade683c156883"},"schema_version":"1.0","source":{"id":"1811.01064","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1811.01064","created_at":"2026-05-18T00:01:37Z"},{"alias_kind":"arxiv_version","alias_value":"1811.01064v1","created_at":"2026-05-18T00:01:37Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1811.01064","created_at":"2026-05-18T00:01:37Z"},{"alias_kind":"pith_short_12","alias_value":"HX4HN6ITVMUU","created_at":"2026-05-18T12:32:28Z"},{"alias_kind":"pith_short_16","alias_value":"HX4HN6ITVMUUKB54","created_at":"2026-05-18T12:32:28Z"},{"alias_kind":"pith_short_8","alias_value":"HX4HN6IT","created_at":"2026-05-18T12:32:28Z"}],"graph_snapshots":[{"event_id":"sha256:aee5c2e5eb5242f5249796ffbe369aa052fe8e2a2875eb94f5a1ab3e6bb65278","target":"graph","created_at":"2026-05-18T00:01:37Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Both research and commercial machine translation have so far neglected the importance of properly handling the spelling, lexical and grammar divergences occurring among language varieties. Notable cases are standard national varieties such as Brazilian and European Portuguese, and Canadian and European French, which popular online machine translation services are not keeping distinct. We show that an evident side effect of modeling such varieties as unique classes is the generation of inconsistent translations. In this work, we investigate the problem of training neural machine translation fro","authors_text":"Aliia Erofeeva, Marcello Federico, Surafel M. Lakew","cross_cats":[],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2018-11-02T19:41:44Z","title":"Neural Machine Translation into Language Varieties"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1811.01064","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:d64eeb09dcd469983d8e94463e9efed9a5e39e362b2af9270431068e2d5cecc8","target":"record","created_at":"2026-05-18T00:01:37Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"0db50be72b01230e0e27277f4761fbd9595fe9a79266ac464b8b1bd5d953f89c","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2018-11-02T19:41:44Z","title_canon_sha256":"eabb0a9bf9fb71f7edf803825c6696d345c38fb405b80e8378dade683c156883"},"schema_version":"1.0","source":{"id":"1811.01064","kind":"arxiv","version":1}},"canonical_sha256":"3df876f913ab294507bccf40c7235d462b66ce27db3ef8a639aa10d95d7f7e10","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"3df876f913ab294507bccf40c7235d462b66ce27db3ef8a639aa10d95d7f7e10","first_computed_at":"2026-05-18T00:01:37.162698Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:01:37.162698Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"0xGJflpXkisnczuPjHO03bLZjy6RKVLSR52XK74Z8BLLvEbB8rmVP2fWDNrTnC8x/Tds5c2dr+BlyfSRIPiPAA==","signature_status":"signed_v1","signed_at":"2026-05-18T00:01:37.163104Z","signed_message":"canonical_sha256_bytes"},"source_id":"1811.01064","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:d64eeb09dcd469983d8e94463e9efed9a5e39e362b2af9270431068e2d5cecc8","sha256:aee5c2e5eb5242f5249796ffbe369aa052fe8e2a2875eb94f5a1ab3e6bb65278"],"state_sha256":"f6e5fffcdc5e903e5bbe85bc018520f114cd9d7a6e15de2fb90527bacebd5b17"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"j9vz/Pepcqb1FoPZh0BnP6Jod0vKH7EDUpmnRnYj1ot19mlucjS/hjA4tJJ1SvoDpEdOBPljzoe3R+/dEd3HAA==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-30T16:00:00.587359Z","bundle_sha256":"7ac57300d152880b16fc2793fa1ddadc00ba50e8891f98d17051fc5504ec6f07"}}