{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2019:SGMQAHDOMBP4QXMPNJR3SEHV6P","short_pith_number":"pith:SGMQAHDO","canonical_record":{"source":{"id":"1901.02161","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2019-01-08T05:23:03Z","cross_cats_sorted":["stat.ML"],"title_canon_sha256":"382e845386cfe09ad512bbecd8fe66950035988a2e51695bda22c7f886e70b2e","abstract_canon_sha256":"339bf88315cbeea7a666f5405c47d9f4f67c31c87bcdd0b16fbed8d2c9e19581"},"schema_version":"1.0"},"canonical_sha256":"9199001c6e605fc85d8f6a63b910f5f3ee1041eeeaf2420679b6ab2bd0ddaa72","source":{"kind":"arxiv","id":"1901.02161","version":2},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1901.02161","created_at":"2026-05-17T23:44:21Z"},{"alias_kind":"arxiv_version","alias_value":"1901.02161v2","created_at":"2026-05-17T23:44:21Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1901.02161","created_at":"2026-05-17T23:44:21Z"},{"alias_kind":"pith_short_12","alias_value":"SGMQAHDOMBP4","created_at":"2026-05-18T12:33:27Z"},{"alias_kind":"pith_short_16","alias_value":"SGMQAHDOMBP4QXMP","created_at":"2026-05-18T12:33:27Z"},{"alias_kind":"pith_short_8","alias_value":"SGMQAHDO","created_at":"2026-05-18T12:33:27Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2019:SGMQAHDOMBP4QXMPNJR3SEHV6P","target":"record","payload":{"canonical_record":{"source":{"id":"1901.02161","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2019-01-08T05:23:03Z","cross_cats_sorted":["stat.ML"],"title_canon_sha256":"382e845386cfe09ad512bbecd8fe66950035988a2e51695bda22c7f886e70b2e","abstract_canon_sha256":"339bf88315cbeea7a666f5405c47d9f4f67c31c87bcdd0b16fbed8d2c9e19581"},"schema_version":"1.0"},"canonical_sha256":"9199001c6e605fc85d8f6a63b910f5f3ee1041eeeaf2420679b6ab2bd0ddaa72","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-17T23:44:21.861939Z","signature_b64":"4AIabSFFxSlEtzQjBb3uX08yXZgYYKwNa77hnz03JR6nbU2Y/EhgKJdjj6yPmfM+IpA2n5vxTiuiN86Hor36CQ==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"9199001c6e605fc85d8f6a63b910f5f3ee1041eeeaf2420679b6ab2bd0ddaa72","last_reissued_at":"2026-05-17T23:44:21.861219Z","signature_status":"signed_v1","first_computed_at":"2026-05-17T23:44:21.861219Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1901.02161","source_version":2,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-17T23:44:21Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"v7f4m45fwEM2xTWqoE1MwP7d6YokNI4ICpcQ0vYHANub5Y9ubGHOpTgOSif9BSMUM1XUsAwEwnuqDrx8VXnKCA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-26T09:47:48.561985Z"},"content_sha256":"dcc0b131384c6109f3e32740c3f15ff8249abcb6063dcd4f7a5cb8d3c4c1f716","schema_version":"1.0","event_id":"sha256:dcc0b131384c6109f3e32740c3f15ff8249abcb6063dcd4f7a5cb8d3c4c1f716"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2019:SGMQAHDOMBP4QXMPNJR3SEHV6P","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Risk-Aware Active Inverse Reinforcement Learning","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["stat.ML"],"primary_cat":"cs.LG","authors_text":"Daniel S. Brown, Scott Niekum, Yuchen Cui","submitted_at":"2019-01-08T05:23:03Z","abstract_excerpt":"Active learning from demonstration allows a robot to query a human for specific types of input to achieve efficient learning. Existing work has explored a variety of active query strategies; however, to our knowledge, none of these strategies directly minimize the performance risk of the policy the robot is learning. Utilizing recent advances in performance bounds for inverse reinforcement learning, we propose a risk-aware active inverse reinforcement learning algorithm that focuses active queries on areas of the state space with the potential for large generalization error. We show that risk-"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1901.02161","kind":"arxiv","version":2},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-17T23:44:21Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"1BErqXagU3GafJ/a14j876fIo4xiDVwCOfJRY2hTsPflzH9Fhck+3M4dEgA91+7eamjdbiB/omEJ8ao+duMBBg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-26T09:47:48.562660Z"},"content_sha256":"0bc24b4768bd59fcbe1d0847abb232f817841f9c53ea69073a0dd3cebf52a780","schema_version":"1.0","event_id":"sha256:0bc24b4768bd59fcbe1d0847abb232f817841f9c53ea69073a0dd3cebf52a780"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/SGMQAHDOMBP4QXMPNJR3SEHV6P/bundle.json","state_url":"https://pith.science/pith/SGMQAHDOMBP4QXMPNJR3SEHV6P/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/SGMQAHDOMBP4QXMPNJR3SEHV6P/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-26T09:47:48Z","links":{"resolver":"https://pith.science/pith/SGMQAHDOMBP4QXMPNJR3SEHV6P","bundle":"https://pith.science/pith/SGMQAHDOMBP4QXMPNJR3SEHV6P/bundle.json","state":"https://pith.science/pith/SGMQAHDOMBP4QXMPNJR3SEHV6P/state.json","well_known_bundle":"https://pith.science/.well-known/pith/SGMQAHDOMBP4QXMPNJR3SEHV6P/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2019:SGMQAHDOMBP4QXMPNJR3SEHV6P","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"339bf88315cbeea7a666f5405c47d9f4f67c31c87bcdd0b16fbed8d2c9e19581","cross_cats_sorted":["stat.ML"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2019-01-08T05:23:03Z","title_canon_sha256":"382e845386cfe09ad512bbecd8fe66950035988a2e51695bda22c7f886e70b2e"},"schema_version":"1.0","source":{"id":"1901.02161","kind":"arxiv","version":2}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1901.02161","created_at":"2026-05-17T23:44:21Z"},{"alias_kind":"arxiv_version","alias_value":"1901.02161v2","created_at":"2026-05-17T23:44:21Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1901.02161","created_at":"2026-05-17T23:44:21Z"},{"alias_kind":"pith_short_12","alias_value":"SGMQAHDOMBP4","created_at":"2026-05-18T12:33:27Z"},{"alias_kind":"pith_short_16","alias_value":"SGMQAHDOMBP4QXMP","created_at":"2026-05-18T12:33:27Z"},{"alias_kind":"pith_short_8","alias_value":"SGMQAHDO","created_at":"2026-05-18T12:33:27Z"}],"graph_snapshots":[{"event_id":"sha256:0bc24b4768bd59fcbe1d0847abb232f817841f9c53ea69073a0dd3cebf52a780","target":"graph","created_at":"2026-05-17T23:44:21Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Active learning from demonstration allows a robot to query a human for specific types of input to achieve efficient learning. Existing work has explored a variety of active query strategies; however, to our knowledge, none of these strategies directly minimize the performance risk of the policy the robot is learning. Utilizing recent advances in performance bounds for inverse reinforcement learning, we propose a risk-aware active inverse reinforcement learning algorithm that focuses active queries on areas of the state space with the potential for large generalization error. We show that risk-","authors_text":"Daniel S. Brown, Scott Niekum, Yuchen Cui","cross_cats":["stat.ML"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2019-01-08T05:23:03Z","title":"Risk-Aware Active Inverse Reinforcement Learning"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1901.02161","kind":"arxiv","version":2},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:dcc0b131384c6109f3e32740c3f15ff8249abcb6063dcd4f7a5cb8d3c4c1f716","target":"record","created_at":"2026-05-17T23:44:21Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"339bf88315cbeea7a666f5405c47d9f4f67c31c87bcdd0b16fbed8d2c9e19581","cross_cats_sorted":["stat.ML"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2019-01-08T05:23:03Z","title_canon_sha256":"382e845386cfe09ad512bbecd8fe66950035988a2e51695bda22c7f886e70b2e"},"schema_version":"1.0","source":{"id":"1901.02161","kind":"arxiv","version":2}},"canonical_sha256":"9199001c6e605fc85d8f6a63b910f5f3ee1041eeeaf2420679b6ab2bd0ddaa72","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"9199001c6e605fc85d8f6a63b910f5f3ee1041eeeaf2420679b6ab2bd0ddaa72","first_computed_at":"2026-05-17T23:44:21.861219Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-17T23:44:21.861219Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"4AIabSFFxSlEtzQjBb3uX08yXZgYYKwNa77hnz03JR6nbU2Y/EhgKJdjj6yPmfM+IpA2n5vxTiuiN86Hor36CQ==","signature_status":"signed_v1","signed_at":"2026-05-17T23:44:21.861939Z","signed_message":"canonical_sha256_bytes"},"source_id":"1901.02161","source_kind":"arxiv","source_version":2}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:dcc0b131384c6109f3e32740c3f15ff8249abcb6063dcd4f7a5cb8d3c4c1f716","sha256:0bc24b4768bd59fcbe1d0847abb232f817841f9c53ea69073a0dd3cebf52a780"],"state_sha256":"2f039a03fd58eee67fd588eaab2344835e7ae2d8451027350f766ae910e3d23d"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"4XXri0faVgUmTEk1wrqYv341mYl1NiHQpvDPMMWs2nOzQoiyO1+q3nZQSKyyu+SfcZlZxWDod+MTl+sAJebrBQ==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-26T09:47:48.566275Z","bundle_sha256":"4350e623acc0c731381996826d1cacae79fd37fc72e3e2812472a75327b91035"}}