{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2016:NCK5X3SVWQUKKQA2DIJONXJ3KF","short_pith_number":"pith:NCK5X3SV","canonical_record":{"source":{"id":"1606.06979","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.HC","submitted_at":"2016-06-22T15:09:04Z","cross_cats_sorted":["cs.AI","cs.RO"],"title_canon_sha256":"6bd7782087bb43b63f780f6d293d4c6d6cd51d830f8898622cf8061fccc8a737","abstract_canon_sha256":"ae6548278b1002bd1ec028771815f447c59a4eecf09be88880fe0733f4e51d3e"},"schema_version":"1.0"},"canonical_sha256":"6895dbee55b428a5401a1a12e6dd3b516afd96285d3a8d2a3d6fbf4cdeb7d4d6","source":{"kind":"arxiv","id":"1606.06979","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1606.06979","created_at":"2026-05-18T01:12:00Z"},{"alias_kind":"arxiv_version","alias_value":"1606.06979v1","created_at":"2026-05-18T01:12:00Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1606.06979","created_at":"2026-05-18T01:12:00Z"},{"alias_kind":"pith_short_12","alias_value":"NCK5X3SVWQUK","created_at":"2026-05-18T12:30:32Z"},{"alias_kind":"pith_short_16","alias_value":"NCK5X3SVWQUKKQA2","created_at":"2026-05-18T12:30:32Z"},{"alias_kind":"pith_short_8","alias_value":"NCK5X3SV","created_at":"2026-05-18T12:30:32Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2016:NCK5X3SVWQUKKQA2DIJONXJ3KF","target":"record","payload":{"canonical_record":{"source":{"id":"1606.06979","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.HC","submitted_at":"2016-06-22T15:09:04Z","cross_cats_sorted":["cs.AI","cs.RO"],"title_canon_sha256":"6bd7782087bb43b63f780f6d293d4c6d6cd51d830f8898622cf8061fccc8a737","abstract_canon_sha256":"ae6548278b1002bd1ec028771815f447c59a4eecf09be88880fe0733f4e51d3e"},"schema_version":"1.0"},"canonical_sha256":"6895dbee55b428a5401a1a12e6dd3b516afd96285d3a8d2a3d6fbf4cdeb7d4d6","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T01:12:00.794850Z","signature_b64":"SiZcAL+H9XrY6PcXgGPzEatmW3UcgdlZkVv51GutrRrNFX/ICApGZ7YUGlICpnKcH4Fwz9KvxY4s92pBr/lmAA==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"6895dbee55b428a5401a1a12e6dd3b516afd96285d3a8d2a3d6fbf4cdeb7d4d6","last_reissued_at":"2026-05-18T01:12:00.794488Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T01:12:00.794488Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1606.06979","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T01:12:00Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"d2Fgen2AFMKJPT8tJdQSnkC3NEi/y+6okdPK+5Q/bVFhKWRRlc7xbGOK2uGDr7UIm/Pobu52C1NaeEsTzGIZDA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-09T00:12:14.031064Z"},"content_sha256":"1996481232da92cb867c00ff24ef7024dea1a0d5ad7ed6eafa8da2959300c32f","schema_version":"1.0","event_id":"sha256:1996481232da92cb867c00ff24ef7024dea1a0d5ad7ed6eafa8da2959300c32f"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2016:NCK5X3SVWQUKKQA2DIJONXJ3KF","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Simultaneous Control and Human Feedback in the Training of a Robotic Agent with Actor-Critic Reinforcement Learning","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.AI","cs.RO"],"primary_cat":"cs.HC","authors_text":"Kory W. Mathewson, Patrick M. Pilarski","submitted_at":"2016-06-22T15:09:04Z","abstract_excerpt":"This paper contributes a preliminary report on the advantages and disadvantages of incorporating simultaneous human control and feedback signals in the training of a reinforcement learning robotic agent. While robotic human-machine interfaces have become increasingly complex in both form and function, control remains challenging for users. This has resulted in an increasing gap between user control approaches and the number of robotic motors which can be controlled. One way to address this gap is to shift some autonomy to the robot. Semi-autonomous actions of the robotic agent can then be shap"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1606.06979","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T01:12:00Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"hDwfFFRCfEfFsqYWQ/nM1iXz7cas8BYACp//2gDwQqqyCiR39EghT3PDugB+DSV5sPU8kCr3Se6Qr8zjeLHYBg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-09T00:12:14.031632Z"},"content_sha256":"723580874f329543022289ad17a89118355adaf146257ef091af1f43120aef65","schema_version":"1.0","event_id":"sha256:723580874f329543022289ad17a89118355adaf146257ef091af1f43120aef65"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/NCK5X3SVWQUKKQA2DIJONXJ3KF/bundle.json","state_url":"https://pith.science/pith/NCK5X3SVWQUKKQA2DIJONXJ3KF/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/NCK5X3SVWQUKKQA2DIJONXJ3KF/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-09T00:12:14Z","links":{"resolver":"https://pith.science/pith/NCK5X3SVWQUKKQA2DIJONXJ3KF","bundle":"https://pith.science/pith/NCK5X3SVWQUKKQA2DIJONXJ3KF/bundle.json","state":"https://pith.science/pith/NCK5X3SVWQUKKQA2DIJONXJ3KF/state.json","well_known_bundle":"https://pith.science/.well-known/pith/NCK5X3SVWQUKKQA2DIJONXJ3KF/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2016:NCK5X3SVWQUKKQA2DIJONXJ3KF","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"ae6548278b1002bd1ec028771815f447c59a4eecf09be88880fe0733f4e51d3e","cross_cats_sorted":["cs.AI","cs.RO"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.HC","submitted_at":"2016-06-22T15:09:04Z","title_canon_sha256":"6bd7782087bb43b63f780f6d293d4c6d6cd51d830f8898622cf8061fccc8a737"},"schema_version":"1.0","source":{"id":"1606.06979","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1606.06979","created_at":"2026-05-18T01:12:00Z"},{"alias_kind":"arxiv_version","alias_value":"1606.06979v1","created_at":"2026-05-18T01:12:00Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1606.06979","created_at":"2026-05-18T01:12:00Z"},{"alias_kind":"pith_short_12","alias_value":"NCK5X3SVWQUK","created_at":"2026-05-18T12:30:32Z"},{"alias_kind":"pith_short_16","alias_value":"NCK5X3SVWQUKKQA2","created_at":"2026-05-18T12:30:32Z"},{"alias_kind":"pith_short_8","alias_value":"NCK5X3SV","created_at":"2026-05-18T12:30:32Z"}],"graph_snapshots":[{"event_id":"sha256:723580874f329543022289ad17a89118355adaf146257ef091af1f43120aef65","target":"graph","created_at":"2026-05-18T01:12:00Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"This paper contributes a preliminary report on the advantages and disadvantages of incorporating simultaneous human control and feedback signals in the training of a reinforcement learning robotic agent. While robotic human-machine interfaces have become increasingly complex in both form and function, control remains challenging for users. This has resulted in an increasing gap between user control approaches and the number of robotic motors which can be controlled. One way to address this gap is to shift some autonomy to the robot. Semi-autonomous actions of the robotic agent can then be shap","authors_text":"Kory W. Mathewson, Patrick M. Pilarski","cross_cats":["cs.AI","cs.RO"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.HC","submitted_at":"2016-06-22T15:09:04Z","title":"Simultaneous Control and Human Feedback in the Training of a Robotic Agent with Actor-Critic Reinforcement Learning"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1606.06979","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:1996481232da92cb867c00ff24ef7024dea1a0d5ad7ed6eafa8da2959300c32f","target":"record","created_at":"2026-05-18T01:12:00Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"ae6548278b1002bd1ec028771815f447c59a4eecf09be88880fe0733f4e51d3e","cross_cats_sorted":["cs.AI","cs.RO"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.HC","submitted_at":"2016-06-22T15:09:04Z","title_canon_sha256":"6bd7782087bb43b63f780f6d293d4c6d6cd51d830f8898622cf8061fccc8a737"},"schema_version":"1.0","source":{"id":"1606.06979","kind":"arxiv","version":1}},"canonical_sha256":"6895dbee55b428a5401a1a12e6dd3b516afd96285d3a8d2a3d6fbf4cdeb7d4d6","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"6895dbee55b428a5401a1a12e6dd3b516afd96285d3a8d2a3d6fbf4cdeb7d4d6","first_computed_at":"2026-05-18T01:12:00.794488Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T01:12:00.794488Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"SiZcAL+H9XrY6PcXgGPzEatmW3UcgdlZkVv51GutrRrNFX/ICApGZ7YUGlICpnKcH4Fwz9KvxY4s92pBr/lmAA==","signature_status":"signed_v1","signed_at":"2026-05-18T01:12:00.794850Z","signed_message":"canonical_sha256_bytes"},"source_id":"1606.06979","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:1996481232da92cb867c00ff24ef7024dea1a0d5ad7ed6eafa8da2959300c32f","sha256:723580874f329543022289ad17a89118355adaf146257ef091af1f43120aef65"],"state_sha256":"4b46620633eaa742acd04baab7724b6658e84670163dbcbc51893daa8e0945d6"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"J5ecPp8nKvNPS4TWLXITxKUVEKR22efGiuwWgcoQIh6GWHP45PdGr5qLDY0HCovX+CQe2lsu1BoV5liiyItnAg==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-09T00:12:14.034172Z","bundle_sha256":"3347b745ecd07fb014e091062c96177c00097ad5a8922edc01d272828880e4b0"}}