{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2017:33MC73KKMZDY7PIL2LLLG47FSB","short_pith_number":"pith:33MC73KK","canonical_record":{"source":{"id":"1709.01643","kind":"arxiv","version":3},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"stat.ML","submitted_at":"2017-09-06T01:17:31Z","cross_cats_sorted":["cs.CV","cs.LG"],"title_canon_sha256":"36bdba74959139bdf584787826b631afa2d9209301bbe488456ee7db1457427b","abstract_canon_sha256":"4ab0a3b71df8ace39f4fc0613fff2fe0041fbb26fc61711c1940eb440ffadfbc"},"schema_version":"1.0"},"canonical_sha256":"ded82fed4a66478fbd0bd2d6b373e5905e6baaf209de1c1f96b626e949c2c7fd","source":{"kind":"arxiv","id":"1709.01643","version":3},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1709.01643","created_at":"2026-05-17T23:58:54Z"},{"alias_kind":"arxiv_version","alias_value":"1709.01643v3","created_at":"2026-05-17T23:58:54Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1709.01643","created_at":"2026-05-17T23:58:54Z"},{"alias_kind":"pith_short_12","alias_value":"33MC73KKMZDY","created_at":"2026-05-18T12:30:55Z"},{"alias_kind":"pith_short_16","alias_value":"33MC73KKMZDY7PIL","created_at":"2026-05-18T12:30:55Z"},{"alias_kind":"pith_short_8","alias_value":"33MC73KK","created_at":"2026-05-18T12:30:55Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2017:33MC73KKMZDY7PIL2LLLG47FSB","target":"record","payload":{"canonical_record":{"source":{"id":"1709.01643","kind":"arxiv","version":3},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"stat.ML","submitted_at":"2017-09-06T01:17:31Z","cross_cats_sorted":["cs.CV","cs.LG"],"title_canon_sha256":"36bdba74959139bdf584787826b631afa2d9209301bbe488456ee7db1457427b","abstract_canon_sha256":"4ab0a3b71df8ace39f4fc0613fff2fe0041fbb26fc61711c1940eb440ffadfbc"},"schema_version":"1.0"},"canonical_sha256":"ded82fed4a66478fbd0bd2d6b373e5905e6baaf209de1c1f96b626e949c2c7fd","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-17T23:58:54.668622Z","signature_b64":"PRDQUZ45erzFOeJCTT1CMZtszIb6SjTg0GmNjiiImV9ZETw3L7lQEsQ8vosStVMFCh/gk5crAzfOV3kFuDgZCw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"ded82fed4a66478fbd0bd2d6b373e5905e6baaf209de1c1f96b626e949c2c7fd","last_reissued_at":"2026-05-17T23:58:54.668076Z","signature_status":"signed_v1","first_computed_at":"2026-05-17T23:58:54.668076Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1709.01643","source_version":3,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-17T23:58:54Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"8gPfqbdIbx1cPjekVXfoE4c6r02tfhOB3bOJUs7Ll5Oc+vCW8ejRiZQazxyJ0FXdJhAdpReYfFAHRKvzXtn0Bw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-09T21:35:36.775051Z"},"content_sha256":"806792dc42e17472bae19df6a2593aa790bf45d3c28bc81b377a63595e6fa311","schema_version":"1.0","event_id":"sha256:806792dc42e17472bae19df6a2593aa790bf45d3c28bc81b377a63595e6fa311"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2017:33MC73KKMZDY7PIL2LLLG47FSB","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Learning to Compose Domain-Specific Transformations for Data Augmentation","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.CV","cs.LG"],"primary_cat":"stat.ML","authors_text":"Alexander J. Ratner, Christopher R\\'e, Henry R. Ehrenberg, Jared Dunnmon, Zeshan Hussain","submitted_at":"2017-09-06T01:17:31Z","abstract_excerpt":"Data augmentation is a ubiquitous technique for increasing the size of labeled training sets by leveraging task-specific data transformations that preserve class labels. While it is often easy for domain experts to specify individual transformations, constructing and tuning the more sophisticated compositions typically needed to achieve state-of-the-art results is a time-consuming manual task in practice. We propose a method for automating this process by learning a generative sequence model over user-specified transformation functions using a generative adversarial approach. Our method can ma"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1709.01643","kind":"arxiv","version":3},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-17T23:58:54Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"KHcQMB2CaXGmLyTQz3bM8N6H39dsFZxa7bte/ra+9NLvSiKehaR/Agb/Cnpk1Ne27nVpdENqEJMtXqQyy+rgAg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-09T21:35:36.775723Z"},"content_sha256":"0f85fcdb5fb50358b886ab0b760cee3816ad65283e8d9fd66831e6e3a9ba81f1","schema_version":"1.0","event_id":"sha256:0f85fcdb5fb50358b886ab0b760cee3816ad65283e8d9fd66831e6e3a9ba81f1"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/33MC73KKMZDY7PIL2LLLG47FSB/bundle.json","state_url":"https://pith.science/pith/33MC73KKMZDY7PIL2LLLG47FSB/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/33MC73KKMZDY7PIL2LLLG47FSB/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-09T21:35:36Z","links":{"resolver":"https://pith.science/pith/33MC73KKMZDY7PIL2LLLG47FSB","bundle":"https://pith.science/pith/33MC73KKMZDY7PIL2LLLG47FSB/bundle.json","state":"https://pith.science/pith/33MC73KKMZDY7PIL2LLLG47FSB/state.json","well_known_bundle":"https://pith.science/.well-known/pith/33MC73KKMZDY7PIL2LLLG47FSB/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2017:33MC73KKMZDY7PIL2LLLG47FSB","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"4ab0a3b71df8ace39f4fc0613fff2fe0041fbb26fc61711c1940eb440ffadfbc","cross_cats_sorted":["cs.CV","cs.LG"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"stat.ML","submitted_at":"2017-09-06T01:17:31Z","title_canon_sha256":"36bdba74959139bdf584787826b631afa2d9209301bbe488456ee7db1457427b"},"schema_version":"1.0","source":{"id":"1709.01643","kind":"arxiv","version":3}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1709.01643","created_at":"2026-05-17T23:58:54Z"},{"alias_kind":"arxiv_version","alias_value":"1709.01643v3","created_at":"2026-05-17T23:58:54Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1709.01643","created_at":"2026-05-17T23:58:54Z"},{"alias_kind":"pith_short_12","alias_value":"33MC73KKMZDY","created_at":"2026-05-18T12:30:55Z"},{"alias_kind":"pith_short_16","alias_value":"33MC73KKMZDY7PIL","created_at":"2026-05-18T12:30:55Z"},{"alias_kind":"pith_short_8","alias_value":"33MC73KK","created_at":"2026-05-18T12:30:55Z"}],"graph_snapshots":[{"event_id":"sha256:0f85fcdb5fb50358b886ab0b760cee3816ad65283e8d9fd66831e6e3a9ba81f1","target":"graph","created_at":"2026-05-17T23:58:54Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Data augmentation is a ubiquitous technique for increasing the size of labeled training sets by leveraging task-specific data transformations that preserve class labels. While it is often easy for domain experts to specify individual transformations, constructing and tuning the more sophisticated compositions typically needed to achieve state-of-the-art results is a time-consuming manual task in practice. We propose a method for automating this process by learning a generative sequence model over user-specified transformation functions using a generative adversarial approach. Our method can ma","authors_text":"Alexander J. Ratner, Christopher R\\'e, Henry R. Ehrenberg, Jared Dunnmon, Zeshan Hussain","cross_cats":["cs.CV","cs.LG"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"stat.ML","submitted_at":"2017-09-06T01:17:31Z","title":"Learning to Compose Domain-Specific Transformations for Data Augmentation"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1709.01643","kind":"arxiv","version":3},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:806792dc42e17472bae19df6a2593aa790bf45d3c28bc81b377a63595e6fa311","target":"record","created_at":"2026-05-17T23:58:54Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"4ab0a3b71df8ace39f4fc0613fff2fe0041fbb26fc61711c1940eb440ffadfbc","cross_cats_sorted":["cs.CV","cs.LG"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"stat.ML","submitted_at":"2017-09-06T01:17:31Z","title_canon_sha256":"36bdba74959139bdf584787826b631afa2d9209301bbe488456ee7db1457427b"},"schema_version":"1.0","source":{"id":"1709.01643","kind":"arxiv","version":3}},"canonical_sha256":"ded82fed4a66478fbd0bd2d6b373e5905e6baaf209de1c1f96b626e949c2c7fd","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"ded82fed4a66478fbd0bd2d6b373e5905e6baaf209de1c1f96b626e949c2c7fd","first_computed_at":"2026-05-17T23:58:54.668076Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-17T23:58:54.668076Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"PRDQUZ45erzFOeJCTT1CMZtszIb6SjTg0GmNjiiImV9ZETw3L7lQEsQ8vosStVMFCh/gk5crAzfOV3kFuDgZCw==","signature_status":"signed_v1","signed_at":"2026-05-17T23:58:54.668622Z","signed_message":"canonical_sha256_bytes"},"source_id":"1709.01643","source_kind":"arxiv","source_version":3}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:806792dc42e17472bae19df6a2593aa790bf45d3c28bc81b377a63595e6fa311","sha256:0f85fcdb5fb50358b886ab0b760cee3816ad65283e8d9fd66831e6e3a9ba81f1"],"state_sha256":"9d6460315310216ba64405ee2bdc0a0f6f83eee95169c91886cfb9b535b5f71c"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"ROO4wJA04ttMIxgnekGry1w8JT1ZtJKxdy/N3QDxjGRPcBAsDQHtAOcxKFhnIbNa9neNep/ajCJfMeT/f3SEBg==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-09T21:35:36.779689Z","bundle_sha256":"7df6c623dc7927fe6c4862a01f5a50faf9430b67b567f4bc36dd08ed2200944e"}}