{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2019:6XOKZRHJEAGXHOT3HGEZIWLSYM","short_pith_number":"pith:6XOKZRHJ","canonical_record":{"source":{"id":"1906.03785","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2019-06-10T03:28:57Z","cross_cats_sorted":[],"title_canon_sha256":"88d21b71a93461ddd18b19e6def5a92d321176a4901b65decb567c238969954f","abstract_canon_sha256":"9e3c65975fb3cbe01584cc2c0ebcefee831c5681e7bd1be60f5936b6da8da513"},"schema_version":"1.0"},"canonical_sha256":"f5dcacc4e9200d73ba7b3989945972c329dc847b1a86b1ae169b32dba34ec80d","source":{"kind":"arxiv","id":"1906.03785","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1906.03785","created_at":"2026-05-17T23:43:44Z"},{"alias_kind":"arxiv_version","alias_value":"1906.03785v1","created_at":"2026-05-17T23:43:44Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1906.03785","created_at":"2026-05-17T23:43:44Z"},{"alias_kind":"pith_short_12","alias_value":"6XOKZRHJEAGX","created_at":"2026-05-18T12:33:10Z"},{"alias_kind":"pith_short_16","alias_value":"6XOKZRHJEAGXHOT3","created_at":"2026-05-18T12:33:10Z"},{"alias_kind":"pith_short_8","alias_value":"6XOKZRHJ","created_at":"2026-05-18T12:33:10Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2019:6XOKZRHJEAGXHOT3HGEZIWLSYM","target":"record","payload":{"canonical_record":{"source":{"id":"1906.03785","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2019-06-10T03:28:57Z","cross_cats_sorted":[],"title_canon_sha256":"88d21b71a93461ddd18b19e6def5a92d321176a4901b65decb567c238969954f","abstract_canon_sha256":"9e3c65975fb3cbe01584cc2c0ebcefee831c5681e7bd1be60f5936b6da8da513"},"schema_version":"1.0"},"canonical_sha256":"f5dcacc4e9200d73ba7b3989945972c329dc847b1a86b1ae169b32dba34ec80d","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-17T23:43:44.986101Z","signature_b64":"JxBNY89Z1oEgFUNf2zEnP7w84H5v5Jr+Jr723wXov2oCjYi9telvMetDbdunosTKok6J1FlMcVt+5TIz17BuCQ==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"f5dcacc4e9200d73ba7b3989945972c329dc847b1a86b1ae169b32dba34ec80d","last_reissued_at":"2026-05-17T23:43:44.985377Z","signature_status":"signed_v1","first_computed_at":"2026-05-17T23:43:44.985377Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1906.03785","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-17T23:43:44Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"204ogdKf7GBJKntPzWE3+dPbKuKToB+7YfT7VmpSBxXuCEhBHfPHCEuzHtLp2FG9cnL34UhSsBheX0JuYcc9Aw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-04T06:48:40.108895Z"},"content_sha256":"6a7f30224c103ff5626b884272024677da45683442d8fc1a014ccd0465cb0116","schema_version":"1.0","event_id":"sha256:6a7f30224c103ff5626b884272024677da45683442d8fc1a014ccd0465cb0116"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2019:6XOKZRHJEAGXHOT3HGEZIWLSYM","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Generalized Data Augmentation for Low-Resource Translation","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.CL","authors_text":"Antonios Anastasopoulos, Graham Neubig, Mengzhou Xia, Xiang Kong","submitted_at":"2019-06-10T03:28:57Z","abstract_excerpt":"Translation to or from low-resource languages LRLs poses challenges for machine translation in terms of both adequacy and fluency. Data augmentation utilizing large amounts of monolingual data is regarded as an effective way to alleviate these problems. In this paper, we propose a general framework for data augmentation in low-resource machine translation that not only uses target-side monolingual data, but also pivots through a related high-resource language HRL. Specifically, we experiment with a two-step pivoting method to convert high-resource data to the LRL, making use of available resou"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1906.03785","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-17T23:43:44Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"a4wX1EgzcxLxCcgcp4utRZCJadDKp26g9eHSXQ2afdYXSDR9xJovV0uU9kSz8taNfsyzdssXK0dCw+a5PxmhAQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-04T06:48:40.109246Z"},"content_sha256":"99f20fa96ea2f1d19854acb2d009740c969bf470bcb2d5b3475e50241d53ca5e","schema_version":"1.0","event_id":"sha256:99f20fa96ea2f1d19854acb2d009740c969bf470bcb2d5b3475e50241d53ca5e"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/6XOKZRHJEAGXHOT3HGEZIWLSYM/bundle.json","state_url":"https://pith.science/pith/6XOKZRHJEAGXHOT3HGEZIWLSYM/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/6XOKZRHJEAGXHOT3HGEZIWLSYM/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-04T06:48:40Z","links":{"resolver":"https://pith.science/pith/6XOKZRHJEAGXHOT3HGEZIWLSYM","bundle":"https://pith.science/pith/6XOKZRHJEAGXHOT3HGEZIWLSYM/bundle.json","state":"https://pith.science/pith/6XOKZRHJEAGXHOT3HGEZIWLSYM/state.json","well_known_bundle":"https://pith.science/.well-known/pith/6XOKZRHJEAGXHOT3HGEZIWLSYM/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2019:6XOKZRHJEAGXHOT3HGEZIWLSYM","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"9e3c65975fb3cbe01584cc2c0ebcefee831c5681e7bd1be60f5936b6da8da513","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2019-06-10T03:28:57Z","title_canon_sha256":"88d21b71a93461ddd18b19e6def5a92d321176a4901b65decb567c238969954f"},"schema_version":"1.0","source":{"id":"1906.03785","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1906.03785","created_at":"2026-05-17T23:43:44Z"},{"alias_kind":"arxiv_version","alias_value":"1906.03785v1","created_at":"2026-05-17T23:43:44Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1906.03785","created_at":"2026-05-17T23:43:44Z"},{"alias_kind":"pith_short_12","alias_value":"6XOKZRHJEAGX","created_at":"2026-05-18T12:33:10Z"},{"alias_kind":"pith_short_16","alias_value":"6XOKZRHJEAGXHOT3","created_at":"2026-05-18T12:33:10Z"},{"alias_kind":"pith_short_8","alias_value":"6XOKZRHJ","created_at":"2026-05-18T12:33:10Z"}],"graph_snapshots":[{"event_id":"sha256:99f20fa96ea2f1d19854acb2d009740c969bf470bcb2d5b3475e50241d53ca5e","target":"graph","created_at":"2026-05-17T23:43:44Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Translation to or from low-resource languages LRLs poses challenges for machine translation in terms of both adequacy and fluency. Data augmentation utilizing large amounts of monolingual data is regarded as an effective way to alleviate these problems. In this paper, we propose a general framework for data augmentation in low-resource machine translation that not only uses target-side monolingual data, but also pivots through a related high-resource language HRL. Specifically, we experiment with a two-step pivoting method to convert high-resource data to the LRL, making use of available resou","authors_text":"Antonios Anastasopoulos, Graham Neubig, Mengzhou Xia, Xiang Kong","cross_cats":[],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2019-06-10T03:28:57Z","title":"Generalized Data Augmentation for Low-Resource Translation"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1906.03785","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:6a7f30224c103ff5626b884272024677da45683442d8fc1a014ccd0465cb0116","target":"record","created_at":"2026-05-17T23:43:44Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"9e3c65975fb3cbe01584cc2c0ebcefee831c5681e7bd1be60f5936b6da8da513","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2019-06-10T03:28:57Z","title_canon_sha256":"88d21b71a93461ddd18b19e6def5a92d321176a4901b65decb567c238969954f"},"schema_version":"1.0","source":{"id":"1906.03785","kind":"arxiv","version":1}},"canonical_sha256":"f5dcacc4e9200d73ba7b3989945972c329dc847b1a86b1ae169b32dba34ec80d","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"f5dcacc4e9200d73ba7b3989945972c329dc847b1a86b1ae169b32dba34ec80d","first_computed_at":"2026-05-17T23:43:44.985377Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-17T23:43:44.985377Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"JxBNY89Z1oEgFUNf2zEnP7w84H5v5Jr+Jr723wXov2oCjYi9telvMetDbdunosTKok6J1FlMcVt+5TIz17BuCQ==","signature_status":"signed_v1","signed_at":"2026-05-17T23:43:44.986101Z","signed_message":"canonical_sha256_bytes"},"source_id":"1906.03785","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:6a7f30224c103ff5626b884272024677da45683442d8fc1a014ccd0465cb0116","sha256:99f20fa96ea2f1d19854acb2d009740c969bf470bcb2d5b3475e50241d53ca5e"],"state_sha256":"514fd969e4c9d5a50dc6038b46fcaf8ef40d43dad242867e5f3e2b3d329ec765"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"zsxrfkAgWX9FjyEFBg+QzG9fCF26+dHFrrOaoCgNmVwHwab/ozcc87Dbtpbuw/3VaXUtPp+Xjyk3WxKYcpacDQ==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-04T06:48:40.111333Z","bundle_sha256":"b79718a8a73b2deebbac167ce6f0a6fce85bd001bf78128e1a47594d25741637"}}