{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2019:NK5QVKFK5CV4MZ5ZUA5FAXQWDB","short_pith_number":"pith:NK5QVKFK","canonical_record":{"source":{"id":"1906.12068","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2019-06-28T07:31:33Z","cross_cats_sorted":["cs.LG"],"title_canon_sha256":"2bd034810efae74b245c5bf5e7c65fbd4de719806369c1266160ec3bb07455f3","abstract_canon_sha256":"e51feac838d34bd8142f0fe562aa88b903601b0793eec5be9c7342794242a8fa"},"schema_version":"1.0"},"canonical_sha256":"6abb0aa8aae8abc667b9a03a505e16184c15f8940aa83321e40c21dd6aa85f34","source":{"kind":"arxiv","id":"1906.12068","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1906.12068","created_at":"2026-05-17T23:41:59Z"},{"alias_kind":"arxiv_version","alias_value":"1906.12068v1","created_at":"2026-05-17T23:41:59Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1906.12068","created_at":"2026-05-17T23:41:59Z"},{"alias_kind":"pith_short_12","alias_value":"NK5QVKFK5CV4","created_at":"2026-05-18T12:33:24Z"},{"alias_kind":"pith_short_16","alias_value":"NK5QVKFK5CV4MZ5Z","created_at":"2026-05-18T12:33:24Z"},{"alias_kind":"pith_short_8","alias_value":"NK5QVKFK","created_at":"2026-05-18T12:33:24Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2019:NK5QVKFK5CV4MZ5ZUA5FAXQWDB","target":"record","payload":{"canonical_record":{"source":{"id":"1906.12068","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2019-06-28T07:31:33Z","cross_cats_sorted":["cs.LG"],"title_canon_sha256":"2bd034810efae74b245c5bf5e7c65fbd4de719806369c1266160ec3bb07455f3","abstract_canon_sha256":"e51feac838d34bd8142f0fe562aa88b903601b0793eec5be9c7342794242a8fa"},"schema_version":"1.0"},"canonical_sha256":"6abb0aa8aae8abc667b9a03a505e16184c15f8940aa83321e40c21dd6aa85f34","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-17T23:41:59.349330Z","signature_b64":"R7Vdt6ICJwmKiCqWlV117SNvkW2sp599V5gKPVeGpNy+xwYz/8TuHoJkJkQeiDm6g/seZp3WWxiRlJFDQYeKAw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"6abb0aa8aae8abc667b9a03a505e16184c15f8940aa83321e40c21dd6aa85f34","last_reissued_at":"2026-05-17T23:41:59.348823Z","signature_status":"signed_v1","first_computed_at":"2026-05-17T23:41:59.348823Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1906.12068","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-17T23:41:59Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"AO2dePOFz7HvVqNYRsH7rbGOe/3SbQttM0J6Qknsn3pk8g05JghVb2It7m3oY713pGIoKsClG6NJ1UE8UgstAg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-07T20:53:43.502607Z"},"content_sha256":"928c7951d4c1db79fc8566070204f88c3d4db92ac2d30637ff87e8632e096401","schema_version":"1.0","event_id":"sha256:928c7951d4c1db79fc8566070204f88c3d4db92ac2d30637ff87e8632e096401"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2019:NK5QVKFK5CV4MZ5ZUA5FAXQWDB","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Lost in Translation: Loss and Decay of Linguistic Richness in Machine Translation","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":["cs.LG"],"primary_cat":"cs.CL","authors_text":"Andy Way, Dimitar Shterionov, Eva Vanmassenhove","submitted_at":"2019-06-28T07:31:33Z","abstract_excerpt":"This work presents an empirical approach to quantifying the loss of lexical richness in Machine Translation (MT) systems compared to Human Translation (HT). Our experiments show how current MT systems indeed fail to render the lexical diversity of human generated or translated text. The inability of MT systems to generate diverse outputs and its tendency to exacerbate already frequent patterns while ignoring less frequent ones, might be the underlying cause for, among others, the currently heavily debated issues related to gender biased output. Can we indeed, aside from biased data, talk about"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1906.12068","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-17T23:41:59Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"PVeQT7OIGluKnnAduWK160QPr/zw/viOR9XrjIVh/5IhR5QtgTi++wpi0LPqWamo+QjHAnfSuZ24ZzPa3zTsBw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-07T20:53:43.503354Z"},"content_sha256":"17bb04134086ac4bb6458bd9ac8785fd56c4734bd9608f0b461b1f5073d304d1","schema_version":"1.0","event_id":"sha256:17bb04134086ac4bb6458bd9ac8785fd56c4734bd9608f0b461b1f5073d304d1"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/NK5QVKFK5CV4MZ5ZUA5FAXQWDB/bundle.json","state_url":"https://pith.science/pith/NK5QVKFK5CV4MZ5ZUA5FAXQWDB/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/NK5QVKFK5CV4MZ5ZUA5FAXQWDB/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-07T20:53:43Z","links":{"resolver":"https://pith.science/pith/NK5QVKFK5CV4MZ5ZUA5FAXQWDB","bundle":"https://pith.science/pith/NK5QVKFK5CV4MZ5ZUA5FAXQWDB/bundle.json","state":"https://pith.science/pith/NK5QVKFK5CV4MZ5ZUA5FAXQWDB/state.json","well_known_bundle":"https://pith.science/.well-known/pith/NK5QVKFK5CV4MZ5ZUA5FAXQWDB/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2019:NK5QVKFK5CV4MZ5ZUA5FAXQWDB","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"e51feac838d34bd8142f0fe562aa88b903601b0793eec5be9c7342794242a8fa","cross_cats_sorted":["cs.LG"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2019-06-28T07:31:33Z","title_canon_sha256":"2bd034810efae74b245c5bf5e7c65fbd4de719806369c1266160ec3bb07455f3"},"schema_version":"1.0","source":{"id":"1906.12068","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1906.12068","created_at":"2026-05-17T23:41:59Z"},{"alias_kind":"arxiv_version","alias_value":"1906.12068v1","created_at":"2026-05-17T23:41:59Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1906.12068","created_at":"2026-05-17T23:41:59Z"},{"alias_kind":"pith_short_12","alias_value":"NK5QVKFK5CV4","created_at":"2026-05-18T12:33:24Z"},{"alias_kind":"pith_short_16","alias_value":"NK5QVKFK5CV4MZ5Z","created_at":"2026-05-18T12:33:24Z"},{"alias_kind":"pith_short_8","alias_value":"NK5QVKFK","created_at":"2026-05-18T12:33:24Z"}],"graph_snapshots":[{"event_id":"sha256:17bb04134086ac4bb6458bd9ac8785fd56c4734bd9608f0b461b1f5073d304d1","target":"graph","created_at":"2026-05-17T23:41:59Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"This work presents an empirical approach to quantifying the loss of lexical richness in Machine Translation (MT) systems compared to Human Translation (HT). Our experiments show how current MT systems indeed fail to render the lexical diversity of human generated or translated text. The inability of MT systems to generate diverse outputs and its tendency to exacerbate already frequent patterns while ignoring less frequent ones, might be the underlying cause for, among others, the currently heavily debated issues related to gender biased output. Can we indeed, aside from biased data, talk about","authors_text":"Andy Way, Dimitar Shterionov, Eva Vanmassenhove","cross_cats":["cs.LG"],"headline":"","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2019-06-28T07:31:33Z","title":"Lost in Translation: Loss and Decay of Linguistic Richness in Machine Translation"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1906.12068","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:928c7951d4c1db79fc8566070204f88c3d4db92ac2d30637ff87e8632e096401","target":"record","created_at":"2026-05-17T23:41:59Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"e51feac838d34bd8142f0fe562aa88b903601b0793eec5be9c7342794242a8fa","cross_cats_sorted":["cs.LG"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2019-06-28T07:31:33Z","title_canon_sha256":"2bd034810efae74b245c5bf5e7c65fbd4de719806369c1266160ec3bb07455f3"},"schema_version":"1.0","source":{"id":"1906.12068","kind":"arxiv","version":1}},"canonical_sha256":"6abb0aa8aae8abc667b9a03a505e16184c15f8940aa83321e40c21dd6aa85f34","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"6abb0aa8aae8abc667b9a03a505e16184c15f8940aa83321e40c21dd6aa85f34","first_computed_at":"2026-05-17T23:41:59.348823Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-17T23:41:59.348823Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"R7Vdt6ICJwmKiCqWlV117SNvkW2sp599V5gKPVeGpNy+xwYz/8TuHoJkJkQeiDm6g/seZp3WWxiRlJFDQYeKAw==","signature_status":"signed_v1","signed_at":"2026-05-17T23:41:59.349330Z","signed_message":"canonical_sha256_bytes"},"source_id":"1906.12068","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:928c7951d4c1db79fc8566070204f88c3d4db92ac2d30637ff87e8632e096401","sha256:17bb04134086ac4bb6458bd9ac8785fd56c4734bd9608f0b461b1f5073d304d1"],"state_sha256":"08b0036ffd7902a20caf96a9ad87a4f8788f2cd68bb38ebfbbdb246b7488c6a6"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"OAjNmvXIUDgmHTsGel1iqlXoUGOFBFvaG5Ml2byyuba7RLcVIbrNpxTA2E4ZypJ5qFF7O2zaShq+RI2wvk/eDA==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-07T20:53:43.507986Z","bundle_sha256":"58f4497162e3998b0dc7a3d73882be155e88b1d56f4b5a9173cb1c614c5ca2ea"}}