{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2017:TA6W2F4ZL3GRAGZN63XQDO75PO","short_pith_number":"pith:TA6W2F4Z","canonical_record":{"source":{"id":"1703.09327","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2017-03-27T22:26:16Z","cross_cats_sorted":[],"title_canon_sha256":"b384e798bbc9468bb0b3f7808e35a904ce0b0e8dcd21fe964866aa4b392247be","abstract_canon_sha256":"547aac6092381f12f708575d0e3d00b1812bbd007cc26037b064bc81c969821d"},"schema_version":"1.0"},"canonical_sha256":"983d6d17995ecd101b2df6ef01bbfd7ba2d24e22d4d3f7efcc7084757f200915","source":{"kind":"arxiv","id":"1703.09327","version":2},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1703.09327","created_at":"2026-05-18T00:24:42Z"},{"alias_kind":"arxiv_version","alias_value":"1703.09327v2","created_at":"2026-05-18T00:24:42Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1703.09327","created_at":"2026-05-18T00:24:42Z"},{"alias_kind":"pith_short_12","alias_value":"TA6W2F4ZL3GR","created_at":"2026-05-18T12:31:43Z"},{"alias_kind":"pith_short_16","alias_value":"TA6W2F4ZL3GRAGZN","created_at":"2026-05-18T12:31:43Z"},{"alias_kind":"pith_short_8","alias_value":"TA6W2F4Z","created_at":"2026-05-18T12:31:43Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2017:TA6W2F4ZL3GRAGZN63XQDO75PO","target":"record","payload":{"canonical_record":{"source":{"id":"1703.09327","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2017-03-27T22:26:16Z","cross_cats_sorted":[],"title_canon_sha256":"b384e798bbc9468bb0b3f7808e35a904ce0b0e8dcd21fe964866aa4b392247be","abstract_canon_sha256":"547aac6092381f12f708575d0e3d00b1812bbd007cc26037b064bc81c969821d"},"schema_version":"1.0"},"canonical_sha256":"983d6d17995ecd101b2df6ef01bbfd7ba2d24e22d4d3f7efcc7084757f200915","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:24:42.951593Z","signature_b64":"DH0VFgivHR5wzv7FUmxP0x0m2yUX98cEo02VQr0e66vJff5YbjH5nweXkOeqQ6miE2OUMJFqHCnNllV1mMJWAQ==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"983d6d17995ecd101b2df6ef01bbfd7ba2d24e22d4d3f7efcc7084757f200915","last_reissued_at":"2026-05-18T00:24:42.951101Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:24:42.951101Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1703.09327","source_version":2,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:24:42Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"l5EXDVbRxE4eSY98pEZQwz7DAsqzYTla36kc7o3LZce/wwe02AMlICH9efZY6Hj1NviBkZpWj3WYqH0JxE4oBA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-03T00:05:43.441607Z"},"content_sha256":"acb1884e88d0c3e60da3a769ac18d2fe390ed81c8fa2c852ea5c1e93daf47759","schema_version":"1.0","event_id":"sha256:acb1884e88d0c3e60da3a769ac18d2fe390ed81c8fa2c852ea5c1e93daf47759"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2017:TA6W2F4ZL3GRAGZN63XQDO75PO","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"DART: Noise Injection for Robust Imitation Learning","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.LG","authors_text":"Anca Dragan, Jonathan Lee, Ken Goldberg, Michael Laskey, Roy Fox","submitted_at":"2017-03-27T22:26:16Z","abstract_excerpt":"One approach to Imitation Learning is Behavior Cloning, in which a robot observes a supervisor and infers a control policy. A known problem with this \"off-policy\" approach is that the robot's errors compound when drifting away from the supervisor's demonstrations. On-policy, techniques alleviate this by iteratively collecting corrective actions for the current robot policy. However, these techniques can be tedious for human supervisors, add significant computation burden, and may visit dangerous states during training. We propose an off-policy approach that injects noise into the supervisor's "},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1703.09327","kind":"arxiv","version":2},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:24:42Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"J4A+CJvxcEGRhlxgtAOEw6+WnqhJs6n1hl4y4eMWkBvfEWS8mXs8nuu6BHY6UJH2leaxtqcdV5hrofT2J167CQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-03T00:05:43.441951Z"},"content_sha256":"d5ffe697045094f5c08975769541eb02265da180d034361fbe35ad73913ae1ed","schema_version":"1.0","event_id":"sha256:d5ffe697045094f5c08975769541eb02265da180d034361fbe35ad73913ae1ed"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/TA6W2F4ZL3GRAGZN63XQDO75PO/bundle.json","state_url":"https://pith.science/pith/TA6W2F4ZL3GRAGZN63XQDO75PO/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/TA6W2F4ZL3GRAGZN63XQDO75PO/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-03T00:05:43Z","links":{"resolver":"https://pith.science/pith/TA6W2F4ZL3GRAGZN63XQDO75PO","bundle":"https://pith.science/pith/TA6W2F4ZL3GRAGZN63XQDO75PO/bundle.json","state":"https://pith.science/pith/TA6W2F4ZL3GRAGZN63XQDO75PO/state.json","well_known_bundle":"https://pith.science/.well-known/pith/TA6W2F4ZL3GRAGZN63XQDO75PO/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2017:TA6W2F4ZL3GRAGZN63XQDO75PO","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"547aac6092381f12f708575d0e3d00b1812bbd007cc26037b064bc81c969821d","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2017-03-27T22:26:16Z","title_canon_sha256":"b384e798bbc9468bb0b3f7808e35a904ce0b0e8dcd21fe964866aa4b392247be"},"schema_version":"1.0","source":{"id":"1703.09327","kind":"arxiv","version":2}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1703.09327","created_at":"2026-05-18T00:24:42Z"},{"alias_kind":"arxiv_version","alias_value":"1703.09327v2","created_at":"2026-05-18T00:24:42Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1703.09327","created_at":"2026-05-18T00:24:42Z"},{"alias_kind":"pith_short_12","alias_value":"TA6W2F4ZL3GR","created_at":"2026-05-18T12:31:43Z"},{"alias_kind":"pith_short_16","alias_value":"TA6W2F4ZL3GRAGZN","created_at":"2026-05-18T12:31:43Z"},{"alias_kind":"pith_short_8","alias_value":"TA6W2F4Z","created_at":"2026-05-18T12:31:43Z"}],"graph_snapshots":[{"event_id":"sha256:d5ffe697045094f5c08975769541eb02265da180d034361fbe35ad73913ae1ed","target":"graph","created_at":"2026-05-18T00:24:42Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"One approach to Imitation Learning is Behavior Cloning, in which a robot observes a supervisor and infers a control policy. A known problem with this \"off-policy\" approach is that the robot's errors compound when drifting away from the supervisor's demonstrations. On-policy, techniques alleviate this by iteratively collecting corrective actions for the current robot policy. However, these techniques can be tedious for human supervisors, add significant computation burden, and may visit dangerous states during training. We propose an off-policy approach that injects noise into the supervisor's ","authors_text":"Anca Dragan, Jonathan Lee, Ken Goldberg, Michael Laskey, Roy Fox","cross_cats":[],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2017-03-27T22:26:16Z","title":"DART: Noise Injection for Robust Imitation Learning"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1703.09327","kind":"arxiv","version":2},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:acb1884e88d0c3e60da3a769ac18d2fe390ed81c8fa2c852ea5c1e93daf47759","target":"record","created_at":"2026-05-18T00:24:42Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"547aac6092381f12f708575d0e3d00b1812bbd007cc26037b064bc81c969821d","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2017-03-27T22:26:16Z","title_canon_sha256":"b384e798bbc9468bb0b3f7808e35a904ce0b0e8dcd21fe964866aa4b392247be"},"schema_version":"1.0","source":{"id":"1703.09327","kind":"arxiv","version":2}},"canonical_sha256":"983d6d17995ecd101b2df6ef01bbfd7ba2d24e22d4d3f7efcc7084757f200915","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"983d6d17995ecd101b2df6ef01bbfd7ba2d24e22d4d3f7efcc7084757f200915","first_computed_at":"2026-05-18T00:24:42.951101Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:24:42.951101Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"DH0VFgivHR5wzv7FUmxP0x0m2yUX98cEo02VQr0e66vJff5YbjH5nweXkOeqQ6miE2OUMJFqHCnNllV1mMJWAQ==","signature_status":"signed_v1","signed_at":"2026-05-18T00:24:42.951593Z","signed_message":"canonical_sha256_bytes"},"source_id":"1703.09327","source_kind":"arxiv","source_version":2}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:acb1884e88d0c3e60da3a769ac18d2fe390ed81c8fa2c852ea5c1e93daf47759","sha256:d5ffe697045094f5c08975769541eb02265da180d034361fbe35ad73913ae1ed"],"state_sha256":"5be622d237f7783589ea17d7c0c76d7f6bd14380d0516c7bc1338324b7734a81"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"+Efc1rY3X0Vs7asaF38Z3CcBZsJCHenj0C/DtppP/94vCR4UkpSPnCJSsGb+09LRYy4hOsHVi3nVhkn4ENpWCA==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-03T00:05:43.443920Z","bundle_sha256":"0fd19595eb1bc9a36500cce96f2dc4763a51342873222a904d102d954f9a9264"}}