{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2017:WFEZ3GZI4N5RUJTDFLKW5CMLCW","short_pith_number":"pith:WFEZ3GZI","canonical_record":{"source":{"id":"1707.09055","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.SY","submitted_at":"2017-07-27T21:44:37Z","cross_cats_sorted":[],"title_canon_sha256":"b495d58dbee975b88bc0ec4b53316ed228a29cf3d285ad9b980aca57c92edd3e","abstract_canon_sha256":"fb849a87100a65492e905633936c10f1c2c39e3ec5d3a220ab842d59b6bb5176"},"schema_version":"1.0"},"canonical_sha256":"b1499d9b28e37b1a26632ad56e898b158ddfb4ce0ce87d016f9eba41e7b14a14","source":{"kind":"arxiv","id":"1707.09055","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1707.09055","created_at":"2026-05-18T00:39:17Z"},{"alias_kind":"arxiv_version","alias_value":"1707.09055v1","created_at":"2026-05-18T00:39:17Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1707.09055","created_at":"2026-05-18T00:39:17Z"},{"alias_kind":"pith_short_12","alias_value":"WFEZ3GZI4N5R","created_at":"2026-05-18T12:31:53Z"},{"alias_kind":"pith_short_16","alias_value":"WFEZ3GZI4N5RUJTD","created_at":"2026-05-18T12:31:53Z"},{"alias_kind":"pith_short_8","alias_value":"WFEZ3GZI","created_at":"2026-05-18T12:31:53Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2017:WFEZ3GZI4N5RUJTDFLKW5CMLCW","target":"record","payload":{"canonical_record":{"source":{"id":"1707.09055","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.SY","submitted_at":"2017-07-27T21:44:37Z","cross_cats_sorted":[],"title_canon_sha256":"b495d58dbee975b88bc0ec4b53316ed228a29cf3d285ad9b980aca57c92edd3e","abstract_canon_sha256":"fb849a87100a65492e905633936c10f1c2c39e3ec5d3a220ab842d59b6bb5176"},"schema_version":"1.0"},"canonical_sha256":"b1499d9b28e37b1a26632ad56e898b158ddfb4ce0ce87d016f9eba41e7b14a14","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:39:17.222956Z","signature_b64":"itYjypE4r+DIzmwcgKOtsvh1t8UAPT4PCO1FB+vtQDOnH0u8ddyQS1+iX1jW5k4YOpWoYEpvu+kfnKkLGibfAQ==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"b1499d9b28e37b1a26632ad56e898b158ddfb4ce0ce87d016f9eba41e7b14a14","last_reissued_at":"2026-05-18T00:39:17.222296Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:39:17.222296Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1707.09055","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:39:17Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"3dMAoEbaUfNI1Leik1K6pJbuM8JH6IO5oVwty5OEY+pQ6Ze3tPml31nWwcXYA33N0bKr0o9zMs6CCGfOPwh2Ag==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-27T00:33:10.740419Z"},"content_sha256":"d630683cd061cf82f30a25eef81ac4161a24a21253c7729360050c553b976fa5","schema_version":"1.0","event_id":"sha256:d630683cd061cf82f30a25eef81ac4161a24a21253c7729360050c553b976fa5"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2017:WFEZ3GZI4N5RUJTDFLKW5CMLCW","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Simultaneous active parameter estimation and control using sampling-based Bayesian reinforcement learning","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.SY","authors_text":"Mykel Kochenderfer, Patrick Slade, Preston Culbertson, Zachary Sunberg","submitted_at":"2017-07-27T21:44:37Z","abstract_excerpt":"Robots performing manipulation tasks must operate under uncertainty about both their pose and the dynamics of the system. In order to remain robust to modeling error and shifts in payload dynamics, agents must simultaneously perform estimation and control tasks. However, the optimal estimation actions are often not the optimal actions for accomplishing the control tasks, and thus agents trade between exploration and exploitation. This work frames the problem as a Bayes-adaptive Markov decision process and solves it online using Monte Carlo tree search and an extended Kalman filter to handle Ga"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1707.09055","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:39:17Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"ecEIEkS5LIuG8XTXGb0C53VFR3PQDAq/1DYSpWneHgPhr1rVflR2+K3nwyDvWQrt86pcgMw9yEiKNwfp1RclDg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-27T00:33:10.741048Z"},"content_sha256":"2fbc3bca1cf49868d20f280c95711970217cced9a28f549846cd3909fb97b13a","schema_version":"1.0","event_id":"sha256:2fbc3bca1cf49868d20f280c95711970217cced9a28f549846cd3909fb97b13a"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/WFEZ3GZI4N5RUJTDFLKW5CMLCW/bundle.json","state_url":"https://pith.science/pith/WFEZ3GZI4N5RUJTDFLKW5CMLCW/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/WFEZ3GZI4N5RUJTDFLKW5CMLCW/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-27T00:33:10Z","links":{"resolver":"https://pith.science/pith/WFEZ3GZI4N5RUJTDFLKW5CMLCW","bundle":"https://pith.science/pith/WFEZ3GZI4N5RUJTDFLKW5CMLCW/bundle.json","state":"https://pith.science/pith/WFEZ3GZI4N5RUJTDFLKW5CMLCW/state.json","well_known_bundle":"https://pith.science/.well-known/pith/WFEZ3GZI4N5RUJTDFLKW5CMLCW/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2017:WFEZ3GZI4N5RUJTDFLKW5CMLCW","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"fb849a87100a65492e905633936c10f1c2c39e3ec5d3a220ab842d59b6bb5176","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.SY","submitted_at":"2017-07-27T21:44:37Z","title_canon_sha256":"b495d58dbee975b88bc0ec4b53316ed228a29cf3d285ad9b980aca57c92edd3e"},"schema_version":"1.0","source":{"id":"1707.09055","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1707.09055","created_at":"2026-05-18T00:39:17Z"},{"alias_kind":"arxiv_version","alias_value":"1707.09055v1","created_at":"2026-05-18T00:39:17Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1707.09055","created_at":"2026-05-18T00:39:17Z"},{"alias_kind":"pith_short_12","alias_value":"WFEZ3GZI4N5R","created_at":"2026-05-18T12:31:53Z"},{"alias_kind":"pith_short_16","alias_value":"WFEZ3GZI4N5RUJTD","created_at":"2026-05-18T12:31:53Z"},{"alias_kind":"pith_short_8","alias_value":"WFEZ3GZI","created_at":"2026-05-18T12:31:53Z"}],"graph_snapshots":[{"event_id":"sha256:2fbc3bca1cf49868d20f280c95711970217cced9a28f549846cd3909fb97b13a","target":"graph","created_at":"2026-05-18T00:39:17Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Robots performing manipulation tasks must operate under uncertainty about both their pose and the dynamics of the system. In order to remain robust to modeling error and shifts in payload dynamics, agents must simultaneously perform estimation and control tasks. However, the optimal estimation actions are often not the optimal actions for accomplishing the control tasks, and thus agents trade between exploration and exploitation. This work frames the problem as a Bayes-adaptive Markov decision process and solves it online using Monte Carlo tree search and an extended Kalman filter to handle Ga","authors_text":"Mykel Kochenderfer, Patrick Slade, Preston Culbertson, Zachary Sunberg","cross_cats":[],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.SY","submitted_at":"2017-07-27T21:44:37Z","title":"Simultaneous active parameter estimation and control using sampling-based Bayesian reinforcement learning"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1707.09055","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:d630683cd061cf82f30a25eef81ac4161a24a21253c7729360050c553b976fa5","target":"record","created_at":"2026-05-18T00:39:17Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"fb849a87100a65492e905633936c10f1c2c39e3ec5d3a220ab842d59b6bb5176","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.SY","submitted_at":"2017-07-27T21:44:37Z","title_canon_sha256":"b495d58dbee975b88bc0ec4b53316ed228a29cf3d285ad9b980aca57c92edd3e"},"schema_version":"1.0","source":{"id":"1707.09055","kind":"arxiv","version":1}},"canonical_sha256":"b1499d9b28e37b1a26632ad56e898b158ddfb4ce0ce87d016f9eba41e7b14a14","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"b1499d9b28e37b1a26632ad56e898b158ddfb4ce0ce87d016f9eba41e7b14a14","first_computed_at":"2026-05-18T00:39:17.222296Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:39:17.222296Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"itYjypE4r+DIzmwcgKOtsvh1t8UAPT4PCO1FB+vtQDOnH0u8ddyQS1+iX1jW5k4YOpWoYEpvu+kfnKkLGibfAQ==","signature_status":"signed_v1","signed_at":"2026-05-18T00:39:17.222956Z","signed_message":"canonical_sha256_bytes"},"source_id":"1707.09055","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:d630683cd061cf82f30a25eef81ac4161a24a21253c7729360050c553b976fa5","sha256:2fbc3bca1cf49868d20f280c95711970217cced9a28f549846cd3909fb97b13a"],"state_sha256":"86873a33531502c24237e47fc0c638a3955c01ec148485aa323402453c61d3fa"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"mfDd+k9+dxkOwrqmj0h5s1nHDGDi0xpL9T5bEWDwHNIV+K0DiWRBYnX8E2kgEqiVFhzGuU/BPMuDODh8E92RCA==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-27T00:33:10.744836Z","bundle_sha256":"2097d6018f73722d9da005f2c30e1b77260b2fd2a9a454f38118a0897f70efe2"}}