{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2018:ADYWB55JHSY2W427RD66YVWVG4","short_pith_number":"pith:ADYWB55J","canonical_record":{"source":{"id":"1802.01744","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2018-02-06T00:45:12Z","cross_cats_sorted":["cs.HC","cs.RO"],"title_canon_sha256":"2fa228e82b1f8a74dd8a835530d9eef8e2cc2a6250f7511cc13d7080dec16453","abstract_canon_sha256":"404431db3013b57711e016849999f7cc802a72252665bc22549dbd760f931600"},"schema_version":"1.0"},"canonical_sha256":"00f160f7a93cb1ab735f88fdec56d53733e074bd6e3d8472fa0c6378f963138d","source":{"kind":"arxiv","id":"1802.01744","version":2},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1802.01744","created_at":"2026-05-18T00:15:09Z"},{"alias_kind":"arxiv_version","alias_value":"1802.01744v2","created_at":"2026-05-18T00:15:09Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1802.01744","created_at":"2026-05-18T00:15:09Z"},{"alias_kind":"pith_short_12","alias_value":"ADYWB55JHSY2","created_at":"2026-05-18T12:32:13Z"},{"alias_kind":"pith_short_16","alias_value":"ADYWB55JHSY2W427","created_at":"2026-05-18T12:32:13Z"},{"alias_kind":"pith_short_8","alias_value":"ADYWB55J","created_at":"2026-05-18T12:32:13Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2018:ADYWB55JHSY2W427RD66YVWVG4","target":"record","payload":{"canonical_record":{"source":{"id":"1802.01744","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2018-02-06T00:45:12Z","cross_cats_sorted":["cs.HC","cs.RO"],"title_canon_sha256":"2fa228e82b1f8a74dd8a835530d9eef8e2cc2a6250f7511cc13d7080dec16453","abstract_canon_sha256":"404431db3013b57711e016849999f7cc802a72252665bc22549dbd760f931600"},"schema_version":"1.0"},"canonical_sha256":"00f160f7a93cb1ab735f88fdec56d53733e074bd6e3d8472fa0c6378f963138d","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:15:09.773995Z","signature_b64":"W41NdvMOFX2GXMZOgN6lrBpZi4njsduJiT1fyaEhqFmJSWWLbS05O+J4mnSzsUjCHrrV/3Q17kX+Dzjb06wuAw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"00f160f7a93cb1ab735f88fdec56d53733e074bd6e3d8472fa0c6378f963138d","last_reissued_at":"2026-05-18T00:15:09.773478Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:15:09.773478Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1802.01744","source_version":2,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:15:09Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"E+kSHQRDAXRVwe97B3qSz7PFxLYkXaQkLme+tIZZh/pJpFQiSFhXixm5653pC3Mku9NZyMNiqePOZefnmZM8DQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-22T08:08:37.251216Z"},"content_sha256":"ae66a1b079c3f16949571ee956115890f5f5be5640bbe760ac4038c6eb55c431","schema_version":"1.0","event_id":"sha256:ae66a1b079c3f16949571ee956115890f5f5be5640bbe760ac4038c6eb55c431"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2018:ADYWB55JHSY2W427RD66YVWVG4","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Shared Autonomy via Deep Reinforcement Learning","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.HC","cs.RO"],"primary_cat":"cs.LG","authors_text":"Anca D. Dragan, Sergey Levine, Siddharth Reddy","submitted_at":"2018-02-06T00:45:12Z","abstract_excerpt":"In shared autonomy, user input is combined with semi-autonomous control to achieve a common goal. The goal is often unknown ex-ante, so prior work enables agents to infer the goal from user input and assist with the task. Such methods tend to assume some combination of knowledge of the dynamics of the environment, the user's policy given their goal, and the set of possible goals the user might target, which limits their application to real-world scenarios. We propose a deep reinforcement learning framework for model-free shared autonomy that lifts these assumptions. We use human-in-the-loop re"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1802.01744","kind":"arxiv","version":2},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:15:09Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"06kA8LMXUbApS7/GBTW82ze7XDpJQUwnoFWLU10lpqs9jS4VmNdG0yi5OIm9z5UXLgzeZhmJnkqW/eByMD3RCg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-22T08:08:37.251807Z"},"content_sha256":"a1da7a233823b54c5ecee38f920d0df72370412f8ba832f9229493da7003ad83","schema_version":"1.0","event_id":"sha256:a1da7a233823b54c5ecee38f920d0df72370412f8ba832f9229493da7003ad83"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/ADYWB55JHSY2W427RD66YVWVG4/bundle.json","state_url":"https://pith.science/pith/ADYWB55JHSY2W427RD66YVWVG4/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/ADYWB55JHSY2W427RD66YVWVG4/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-22T08:08:37Z","links":{"resolver":"https://pith.science/pith/ADYWB55JHSY2W427RD66YVWVG4","bundle":"https://pith.science/pith/ADYWB55JHSY2W427RD66YVWVG4/bundle.json","state":"https://pith.science/pith/ADYWB55JHSY2W427RD66YVWVG4/state.json","well_known_bundle":"https://pith.science/.well-known/pith/ADYWB55JHSY2W427RD66YVWVG4/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2018:ADYWB55JHSY2W427RD66YVWVG4","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"404431db3013b57711e016849999f7cc802a72252665bc22549dbd760f931600","cross_cats_sorted":["cs.HC","cs.RO"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2018-02-06T00:45:12Z","title_canon_sha256":"2fa228e82b1f8a74dd8a835530d9eef8e2cc2a6250f7511cc13d7080dec16453"},"schema_version":"1.0","source":{"id":"1802.01744","kind":"arxiv","version":2}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1802.01744","created_at":"2026-05-18T00:15:09Z"},{"alias_kind":"arxiv_version","alias_value":"1802.01744v2","created_at":"2026-05-18T00:15:09Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1802.01744","created_at":"2026-05-18T00:15:09Z"},{"alias_kind":"pith_short_12","alias_value":"ADYWB55JHSY2","created_at":"2026-05-18T12:32:13Z"},{"alias_kind":"pith_short_16","alias_value":"ADYWB55JHSY2W427","created_at":"2026-05-18T12:32:13Z"},{"alias_kind":"pith_short_8","alias_value":"ADYWB55J","created_at":"2026-05-18T12:32:13Z"}],"graph_snapshots":[{"event_id":"sha256:a1da7a233823b54c5ecee38f920d0df72370412f8ba832f9229493da7003ad83","target":"graph","created_at":"2026-05-18T00:15:09Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"In shared autonomy, user input is combined with semi-autonomous control to achieve a common goal. The goal is often unknown ex-ante, so prior work enables agents to infer the goal from user input and assist with the task. Such methods tend to assume some combination of knowledge of the dynamics of the environment, the user's policy given their goal, and the set of possible goals the user might target, which limits their application to real-world scenarios. We propose a deep reinforcement learning framework for model-free shared autonomy that lifts these assumptions. We use human-in-the-loop re","authors_text":"Anca D. Dragan, Sergey Levine, Siddharth Reddy","cross_cats":["cs.HC","cs.RO"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2018-02-06T00:45:12Z","title":"Shared Autonomy via Deep Reinforcement Learning"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1802.01744","kind":"arxiv","version":2},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:ae66a1b079c3f16949571ee956115890f5f5be5640bbe760ac4038c6eb55c431","target":"record","created_at":"2026-05-18T00:15:09Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"404431db3013b57711e016849999f7cc802a72252665bc22549dbd760f931600","cross_cats_sorted":["cs.HC","cs.RO"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2018-02-06T00:45:12Z","title_canon_sha256":"2fa228e82b1f8a74dd8a835530d9eef8e2cc2a6250f7511cc13d7080dec16453"},"schema_version":"1.0","source":{"id":"1802.01744","kind":"arxiv","version":2}},"canonical_sha256":"00f160f7a93cb1ab735f88fdec56d53733e074bd6e3d8472fa0c6378f963138d","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"00f160f7a93cb1ab735f88fdec56d53733e074bd6e3d8472fa0c6378f963138d","first_computed_at":"2026-05-18T00:15:09.773478Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:15:09.773478Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"W41NdvMOFX2GXMZOgN6lrBpZi4njsduJiT1fyaEhqFmJSWWLbS05O+J4mnSzsUjCHrrV/3Q17kX+Dzjb06wuAw==","signature_status":"signed_v1","signed_at":"2026-05-18T00:15:09.773995Z","signed_message":"canonical_sha256_bytes"},"source_id":"1802.01744","source_kind":"arxiv","source_version":2}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:ae66a1b079c3f16949571ee956115890f5f5be5640bbe760ac4038c6eb55c431","sha256:a1da7a233823b54c5ecee38f920d0df72370412f8ba832f9229493da7003ad83"],"state_sha256":"a82ea5850239732fd0f69e0d0e82d415a63a53a1828976c183c1aace206ef7b5"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"WRaoDIe/QDP0L9Rlw8/FwcK7DlTuig9qxGdtATstmlN3g3CJKCqbMYrTiXEFZE7CaL3vL372v2wZ48j3uJgCBA==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-22T08:08:37.254847Z","bundle_sha256":"a28e5a39a31069fc5168aea39f728ca74a2389d7d7cda8dc8522cc84471d580b"}}