{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2018:I5U3FZFGEX4KMGIZEMEKMUJET6","short_pith_number":"pith:I5U3FZFG","canonical_record":{"source":{"id":"1809.00196","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2018-09-01T14:33:11Z","cross_cats_sorted":[],"title_canon_sha256":"622a9769fac477a2a6c49720b1c543ff81605e65f34648a3adde487a5e8ee8a7","abstract_canon_sha256":"baa1f3e0b384f274696666e397a9875a4a0ff77395f6ef02c8aa7792ada103b0"},"schema_version":"1.0"},"canonical_sha256":"4769b2e4a625f8a619192308a651249f9af5a33356c0192e44eb6045ebe78c66","source":{"kind":"arxiv","id":"1809.00196","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1809.00196","created_at":"2026-05-18T00:06:35Z"},{"alias_kind":"arxiv_version","alias_value":"1809.00196v1","created_at":"2026-05-18T00:06:35Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1809.00196","created_at":"2026-05-18T00:06:35Z"},{"alias_kind":"pith_short_12","alias_value":"I5U3FZFGEX4K","created_at":"2026-05-18T12:32:28Z"},{"alias_kind":"pith_short_16","alias_value":"I5U3FZFGEX4KMGIZ","created_at":"2026-05-18T12:32:28Z"},{"alias_kind":"pith_short_8","alias_value":"I5U3FZFG","created_at":"2026-05-18T12:32:28Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2018:I5U3FZFGEX4KMGIZEMEKMUJET6","target":"record","payload":{"canonical_record":{"source":{"id":"1809.00196","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2018-09-01T14:33:11Z","cross_cats_sorted":[],"title_canon_sha256":"622a9769fac477a2a6c49720b1c543ff81605e65f34648a3adde487a5e8ee8a7","abstract_canon_sha256":"baa1f3e0b384f274696666e397a9875a4a0ff77395f6ef02c8aa7792ada103b0"},"schema_version":"1.0"},"canonical_sha256":"4769b2e4a625f8a619192308a651249f9af5a33356c0192e44eb6045ebe78c66","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:06:35.795052Z","signature_b64":"4LF3CeQsr0sLrKbQfWvZHQSrn1gYPpcUhvPU+0l6fEUEj7Wxiez/v5KgnwALVDzDF9n34YR6Xq+yQu9Ln1ZNCg==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"4769b2e4a625f8a619192308a651249f9af5a33356c0192e44eb6045ebe78c66","last_reissued_at":"2026-05-18T00:06:35.794671Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:06:35.794671Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1809.00196","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:06:35Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"lYrGIVZhOBUQ7t/R1m3KSVV05h+gIZXcNL/L3Ehn3ckXqC4IXB+T5xRa5UEv3MwcF1vW0IV4/LtC76w+ubvIAw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-08T23:15:22.247558Z"},"content_sha256":"77b990d51d178ee9ada4cda18f52be41b1d11be0841eede381cfbdecdbb03fd5","schema_version":"1.0","event_id":"sha256:77b990d51d178ee9ada4cda18f52be41b1d11be0841eede381cfbdecdbb03fd5"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2018:I5U3FZFGEX4KMGIZEMEKMUJET6","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Microsoft's Submission to the WMT2018 News Translation Task: How I Learned to Stop Worrying and Love the Data","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.CL","authors_text":"Marcin Junczys-Dowmunt","submitted_at":"2018-09-01T14:33:11Z","abstract_excerpt":"This paper describes the Microsoft submission to the WMT2018 news translation shared task. We participated in one language direction -- English-German. Our system follows current best-practice and combines state-of-the-art models with new data filtering (dual conditional cross-entropy filtering) and sentence weighting methods. We trained fairly standard Transformer-big models with an updated version of Edinburgh's training scheme for WMT2017 and experimented with different filtering schemes for Paracrawl. According to automatic metrics (BLEU) we reached the highest score for this subtask with "},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1809.00196","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:06:35Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"6dyjIB9Ks44cFcTw56zQOo9rCTHiCaA8o9xNyYiPIOYcwZUjMkyOyKiHcAAnW2EXJNtpdm/ZknJd2PMcdXP9Ag==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-08T23:15:22.247900Z"},"content_sha256":"6bc8841bed5b3c72e94531ac1ca2e071299db4f9615ef2e346f4591cacd829d5","schema_version":"1.0","event_id":"sha256:6bc8841bed5b3c72e94531ac1ca2e071299db4f9615ef2e346f4591cacd829d5"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/I5U3FZFGEX4KMGIZEMEKMUJET6/bundle.json","state_url":"https://pith.science/pith/I5U3FZFGEX4KMGIZEMEKMUJET6/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/I5U3FZFGEX4KMGIZEMEKMUJET6/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-08T23:15:22Z","links":{"resolver":"https://pith.science/pith/I5U3FZFGEX4KMGIZEMEKMUJET6","bundle":"https://pith.science/pith/I5U3FZFGEX4KMGIZEMEKMUJET6/bundle.json","state":"https://pith.science/pith/I5U3FZFGEX4KMGIZEMEKMUJET6/state.json","well_known_bundle":"https://pith.science/.well-known/pith/I5U3FZFGEX4KMGIZEMEKMUJET6/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2018:I5U3FZFGEX4KMGIZEMEKMUJET6","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"baa1f3e0b384f274696666e397a9875a4a0ff77395f6ef02c8aa7792ada103b0","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2018-09-01T14:33:11Z","title_canon_sha256":"622a9769fac477a2a6c49720b1c543ff81605e65f34648a3adde487a5e8ee8a7"},"schema_version":"1.0","source":{"id":"1809.00196","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1809.00196","created_at":"2026-05-18T00:06:35Z"},{"alias_kind":"arxiv_version","alias_value":"1809.00196v1","created_at":"2026-05-18T00:06:35Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1809.00196","created_at":"2026-05-18T00:06:35Z"},{"alias_kind":"pith_short_12","alias_value":"I5U3FZFGEX4K","created_at":"2026-05-18T12:32:28Z"},{"alias_kind":"pith_short_16","alias_value":"I5U3FZFGEX4KMGIZ","created_at":"2026-05-18T12:32:28Z"},{"alias_kind":"pith_short_8","alias_value":"I5U3FZFG","created_at":"2026-05-18T12:32:28Z"}],"graph_snapshots":[{"event_id":"sha256:6bc8841bed5b3c72e94531ac1ca2e071299db4f9615ef2e346f4591cacd829d5","target":"graph","created_at":"2026-05-18T00:06:35Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"This paper describes the Microsoft submission to the WMT2018 news translation shared task. We participated in one language direction -- English-German. Our system follows current best-practice and combines state-of-the-art models with new data filtering (dual conditional cross-entropy filtering) and sentence weighting methods. We trained fairly standard Transformer-big models with an updated version of Edinburgh's training scheme for WMT2017 and experimented with different filtering schemes for Paracrawl. According to automatic metrics (BLEU) we reached the highest score for this subtask with ","authors_text":"Marcin Junczys-Dowmunt","cross_cats":[],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2018-09-01T14:33:11Z","title":"Microsoft's Submission to the WMT2018 News Translation Task: How I Learned to Stop Worrying and Love the Data"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1809.00196","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:77b990d51d178ee9ada4cda18f52be41b1d11be0841eede381cfbdecdbb03fd5","target":"record","created_at":"2026-05-18T00:06:35Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"baa1f3e0b384f274696666e397a9875a4a0ff77395f6ef02c8aa7792ada103b0","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2018-09-01T14:33:11Z","title_canon_sha256":"622a9769fac477a2a6c49720b1c543ff81605e65f34648a3adde487a5e8ee8a7"},"schema_version":"1.0","source":{"id":"1809.00196","kind":"arxiv","version":1}},"canonical_sha256":"4769b2e4a625f8a619192308a651249f9af5a33356c0192e44eb6045ebe78c66","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"4769b2e4a625f8a619192308a651249f9af5a33356c0192e44eb6045ebe78c66","first_computed_at":"2026-05-18T00:06:35.794671Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:06:35.794671Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"4LF3CeQsr0sLrKbQfWvZHQSrn1gYPpcUhvPU+0l6fEUEj7Wxiez/v5KgnwALVDzDF9n34YR6Xq+yQu9Ln1ZNCg==","signature_status":"signed_v1","signed_at":"2026-05-18T00:06:35.795052Z","signed_message":"canonical_sha256_bytes"},"source_id":"1809.00196","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:77b990d51d178ee9ada4cda18f52be41b1d11be0841eede381cfbdecdbb03fd5","sha256:6bc8841bed5b3c72e94531ac1ca2e071299db4f9615ef2e346f4591cacd829d5"],"state_sha256":"9ecc3645fbafbcd7187d1312a5df9550a4657232a4a1e4a47c9ea8761cb34f2d"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"uTz0yTOYJzunWSatPI7CZsEFcOXEH+QjNq6YhIB1BKjs/2+y+fkCRY+B3WnaAA7A4UfOEGSGerIxMa1sB8ZrCA==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-08T23:15:22.249791Z","bundle_sha256":"7def0ae7c4a9a723736657a3062d5914a24a838ecd5e4731c0bbb1437020e8b2"}}