{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2017:7P7YFZ3FPLSZAT3BTSFHT5WQLH","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"b30da16143d9d6eca20b06ea1f7e1e252f8f018e4eff8972b61d3d6a2cff309b","cross_cats_sorted":["cs.RO"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2017-11-18T00:53:20Z","title_canon_sha256":"919a6a40ed1e1cc755163ee54034f691a138b7e73369e41682a318826b3f6b68"},"schema_version":"1.0","source":{"id":"1711.06782","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1711.06782","created_at":"2026-05-18T00:30:15Z"},{"alias_kind":"arxiv_version","alias_value":"1711.06782v1","created_at":"2026-05-18T00:30:15Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1711.06782","created_at":"2026-05-18T00:30:15Z"},{"alias_kind":"pith_short_12","alias_value":"7P7YFZ3FPLSZ","created_at":"2026-05-18T12:31:05Z"},{"alias_kind":"pith_short_16","alias_value":"7P7YFZ3FPLSZAT3B","created_at":"2026-05-18T12:31:05Z"},{"alias_kind":"pith_short_8","alias_value":"7P7YFZ3F","created_at":"2026-05-18T12:31:05Z"}],"graph_snapshots":[{"event_id":"sha256:842ccf5a7bcb34bc75099dae6ecaaafe874ea8eae9fe9ae4a6c6247171f6530f","target":"graph","created_at":"2026-05-18T00:30:15Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Deep reinforcement learning algorithms can learn complex behavioral skills, but real-world application of these methods requires a large amount of experience to be collected by the agent. In practical settings, such as robotics, this involves repeatedly attempting a task, resetting the environment between each attempt. However, not all tasks are easily or automatically reversible. In practice, this learning process requires extensive human intervention. In this work, we propose an autonomous method for safe and efficient reinforcement learning that simultaneously learns a forward and reset pol","authors_text":"Benjamin Eysenbach, Julian Ibarz, Sergey Levine, Shixiang Gu","cross_cats":["cs.RO"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2017-11-18T00:53:20Z","title":"Leave no Trace: Learning to Reset for Safe and Autonomous Reinforcement Learning"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1711.06782","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:10659945c6d595dbcb6de32ada06f2fc96408fb3f86147aac42ba97cefc3a93f","target":"record","created_at":"2026-05-18T00:30:15Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"b30da16143d9d6eca20b06ea1f7e1e252f8f018e4eff8972b61d3d6a2cff309b","cross_cats_sorted":["cs.RO"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2017-11-18T00:53:20Z","title_canon_sha256":"919a6a40ed1e1cc755163ee54034f691a138b7e73369e41682a318826b3f6b68"},"schema_version":"1.0","source":{"id":"1711.06782","kind":"arxiv","version":1}},"canonical_sha256":"fbff82e7657ae5904f619c8a79f6d059d6e32a6108251f1f5c7bf3d0b576ec79","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"fbff82e7657ae5904f619c8a79f6d059d6e32a6108251f1f5c7bf3d0b576ec79","first_computed_at":"2026-05-18T00:30:15.621999Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:30:15.621999Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"LXf95uTrJbMev+ZIAzNEo3BRlRHqE6jHOjS01KwYZVHwNxCeUCIAPSCxlXlC/7kBFMlBy0n5gIiSn+O98vizBA==","signature_status":"signed_v1","signed_at":"2026-05-18T00:30:15.622636Z","signed_message":"canonical_sha256_bytes"},"source_id":"1711.06782","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:10659945c6d595dbcb6de32ada06f2fc96408fb3f86147aac42ba97cefc3a93f","sha256:842ccf5a7bcb34bc75099dae6ecaaafe874ea8eae9fe9ae4a6c6247171f6530f"],"state_sha256":"62799a20507a47edb4304b4bd38f3b46acfbf5ce6b669ce0ccb327a717016e89"}