{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2019:K4BPE5VYM7AOY3LYHB57GELLNL","short_pith_number":"pith:K4BPE5VY","canonical_record":{"source":{"id":"1903.09460","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by-nc-sa/4.0/","primary_cat":"cs.CL","submitted_at":"2019-03-22T11:55:21Z","cross_cats_sorted":[],"title_canon_sha256":"bac7dffad7b8f58d7416ce8c83f45f32eb0998e8d6e7b0cca2e457510f86556b","abstract_canon_sha256":"a2b071f9764db131b41d8810bcf4834f49e71da50916c9552728ea1aa3448090"},"schema_version":"1.0"},"canonical_sha256":"5702f276b867c0ec6d78387bf3116b6acf6179971eb89a5eccef1458957ba52a","source":{"kind":"arxiv","id":"1903.09460","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1903.09460","created_at":"2026-05-17T23:50:39Z"},{"alias_kind":"arxiv_version","alias_value":"1903.09460v1","created_at":"2026-05-17T23:50:39Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1903.09460","created_at":"2026-05-17T23:50:39Z"},{"alias_kind":"pith_short_12","alias_value":"K4BPE5VYM7AO","created_at":"2026-05-18T12:33:21Z"},{"alias_kind":"pith_short_16","alias_value":"K4BPE5VYM7AOY3LY","created_at":"2026-05-18T12:33:21Z"},{"alias_kind":"pith_short_8","alias_value":"K4BPE5VY","created_at":"2026-05-18T12:33:21Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2019:K4BPE5VYM7AOY3LYHB57GELLNL","target":"record","payload":{"canonical_record":{"source":{"id":"1903.09460","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by-nc-sa/4.0/","primary_cat":"cs.CL","submitted_at":"2019-03-22T11:55:21Z","cross_cats_sorted":[],"title_canon_sha256":"bac7dffad7b8f58d7416ce8c83f45f32eb0998e8d6e7b0cca2e457510f86556b","abstract_canon_sha256":"a2b071f9764db131b41d8810bcf4834f49e71da50916c9552728ea1aa3448090"},"schema_version":"1.0"},"canonical_sha256":"5702f276b867c0ec6d78387bf3116b6acf6179971eb89a5eccef1458957ba52a","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-17T23:50:39.573680Z","signature_b64":"ntxajEhGQmy4sxBfrn6gqETsPvEbQCORA29Nk20Z3X9IbGnicjVJbBg4yKJVvROFAZxXiWfVp8/SzImYLagoCA==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"5702f276b867c0ec6d78387bf3116b6acf6179971eb89a5eccef1458957ba52a","last_reissued_at":"2026-05-17T23:50:39.573227Z","signature_status":"signed_v1","first_computed_at":"2026-05-17T23:50:39.573227Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1903.09460","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-17T23:50:39Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"25dLLnSrAintySZINq+iw1l6MG1lyLUW2UuVidYzkwA5oQbPJYFB1Pr0jyaxVR7bVmCrmSlsELEcHfJrsvm1CA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-26T13:32:32.631819Z"},"content_sha256":"43a1a6ff84953777177287b85e6773a956cf48844de1f9338de4c92d946614dd","schema_version":"1.0","event_id":"sha256:43a1a6ff84953777177287b85e6773a956cf48844de1f9338de4c92d946614dd"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2019:K4BPE5VYM7AOY3LYHB57GELLNL","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Data Augmentation via Dependency Tree Morphing for Low-Resource Languages","license":"http://creativecommons.org/licenses/by-nc-sa/4.0/","headline":"","cross_cats":[],"primary_cat":"cs.CL","authors_text":"G\\\"ozde G\\\"ul \\c{S}ahin, Mark Steedman","submitted_at":"2019-03-22T11:55:21Z","abstract_excerpt":"Neural NLP systems achieve high scores in the presence of sizable training dataset. Lack of such datasets leads to poor system performances in the case low-resource languages. We present two simple text augmentation techniques using dependency trees, inspired from image processing. We crop sentences by removing dependency links, and we rotate sentences by moving the tree fragments around the root. We apply these techniques to augment the training sets of low-resource languages in Universal Dependencies project. We implement a character-level sequence tagging model and evaluate the augmented da"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1903.09460","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-17T23:50:39Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"7hTeQayKzg+wzP4clMs0+DPkVEJVFun/f6S4oOV/ujdVUPaPFVGyoBBdShmW0W3iwMw7qQSUXTzQJZlfZW7/BQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-26T13:32:32.632488Z"},"content_sha256":"84e2ecd44ebc9a1ac44f9b303e2373085dc841a984f3cda4f870beb87afd8e6b","schema_version":"1.0","event_id":"sha256:84e2ecd44ebc9a1ac44f9b303e2373085dc841a984f3cda4f870beb87afd8e6b"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/K4BPE5VYM7AOY3LYHB57GELLNL/bundle.json","state_url":"https://pith.science/pith/K4BPE5VYM7AOY3LYHB57GELLNL/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/K4BPE5VYM7AOY3LYHB57GELLNL/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-26T13:32:32Z","links":{"resolver":"https://pith.science/pith/K4BPE5VYM7AOY3LYHB57GELLNL","bundle":"https://pith.science/pith/K4BPE5VYM7AOY3LYHB57GELLNL/bundle.json","state":"https://pith.science/pith/K4BPE5VYM7AOY3LYHB57GELLNL/state.json","well_known_bundle":"https://pith.science/.well-known/pith/K4BPE5VYM7AOY3LYHB57GELLNL/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2019:K4BPE5VYM7AOY3LYHB57GELLNL","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"a2b071f9764db131b41d8810bcf4834f49e71da50916c9552728ea1aa3448090","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by-nc-sa/4.0/","primary_cat":"cs.CL","submitted_at":"2019-03-22T11:55:21Z","title_canon_sha256":"bac7dffad7b8f58d7416ce8c83f45f32eb0998e8d6e7b0cca2e457510f86556b"},"schema_version":"1.0","source":{"id":"1903.09460","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1903.09460","created_at":"2026-05-17T23:50:39Z"},{"alias_kind":"arxiv_version","alias_value":"1903.09460v1","created_at":"2026-05-17T23:50:39Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1903.09460","created_at":"2026-05-17T23:50:39Z"},{"alias_kind":"pith_short_12","alias_value":"K4BPE5VYM7AO","created_at":"2026-05-18T12:33:21Z"},{"alias_kind":"pith_short_16","alias_value":"K4BPE5VYM7AOY3LY","created_at":"2026-05-18T12:33:21Z"},{"alias_kind":"pith_short_8","alias_value":"K4BPE5VY","created_at":"2026-05-18T12:33:21Z"}],"graph_snapshots":[{"event_id":"sha256:84e2ecd44ebc9a1ac44f9b303e2373085dc841a984f3cda4f870beb87afd8e6b","target":"graph","created_at":"2026-05-17T23:50:39Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Neural NLP systems achieve high scores in the presence of sizable training dataset. Lack of such datasets leads to poor system performances in the case low-resource languages. We present two simple text augmentation techniques using dependency trees, inspired from image processing. We crop sentences by removing dependency links, and we rotate sentences by moving the tree fragments around the root. We apply these techniques to augment the training sets of low-resource languages in Universal Dependencies project. We implement a character-level sequence tagging model and evaluate the augmented da","authors_text":"G\\\"ozde G\\\"ul \\c{S}ahin, Mark Steedman","cross_cats":[],"headline":"","license":"http://creativecommons.org/licenses/by-nc-sa/4.0/","primary_cat":"cs.CL","submitted_at":"2019-03-22T11:55:21Z","title":"Data Augmentation via Dependency Tree Morphing for Low-Resource Languages"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1903.09460","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:43a1a6ff84953777177287b85e6773a956cf48844de1f9338de4c92d946614dd","target":"record","created_at":"2026-05-17T23:50:39Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"a2b071f9764db131b41d8810bcf4834f49e71da50916c9552728ea1aa3448090","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by-nc-sa/4.0/","primary_cat":"cs.CL","submitted_at":"2019-03-22T11:55:21Z","title_canon_sha256":"bac7dffad7b8f58d7416ce8c83f45f32eb0998e8d6e7b0cca2e457510f86556b"},"schema_version":"1.0","source":{"id":"1903.09460","kind":"arxiv","version":1}},"canonical_sha256":"5702f276b867c0ec6d78387bf3116b6acf6179971eb89a5eccef1458957ba52a","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"5702f276b867c0ec6d78387bf3116b6acf6179971eb89a5eccef1458957ba52a","first_computed_at":"2026-05-17T23:50:39.573227Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-17T23:50:39.573227Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"ntxajEhGQmy4sxBfrn6gqETsPvEbQCORA29Nk20Z3X9IbGnicjVJbBg4yKJVvROFAZxXiWfVp8/SzImYLagoCA==","signature_status":"signed_v1","signed_at":"2026-05-17T23:50:39.573680Z","signed_message":"canonical_sha256_bytes"},"source_id":"1903.09460","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:43a1a6ff84953777177287b85e6773a956cf48844de1f9338de4c92d946614dd","sha256:84e2ecd44ebc9a1ac44f9b303e2373085dc841a984f3cda4f870beb87afd8e6b"],"state_sha256":"83afd843c4f4d5f8d53ebf88c1841a41318d8c7cc1e8f946c939e5971d0cf69b"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"b9B5s4P3WlW/Xcgnl5nEusGs6ueDdRXj5sYw2SSAkcbtAbXZd6pYbd1bkBYd2N1AN/msp7qkAsX8rDKvMpSUAQ==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-26T13:32:32.636105Z","bundle_sha256":"1ce152b02b186275e7a968fccee8cae73520b44ed1ab5604eaa94261bb5314e4"}}