{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2015:XHV7ZNEAG4ASTW3O4ELRW7Q5D5","short_pith_number":"pith:XHV7ZNEA","canonical_record":{"source":{"id":"1509.06824","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2015-09-23T02:04:18Z","cross_cats_sorted":["cs.RO"],"title_canon_sha256":"552c4966bf5f318831806dd4f7bdc469159fd93bb745581e40d6cfe1a4b04a32","abstract_canon_sha256":"a29f7edb16d8c88682538abead494c7704d0a2531ad9ec32c40ba2efff6a8d1c"},"schema_version":"1.0"},"canonical_sha256":"b9ebfcb480370129db6ee1171b7e1d1f468f211c310356241107ddb341b9266c","source":{"kind":"arxiv","id":"1509.06824","version":2},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1509.06824","created_at":"2026-05-18T01:19:05Z"},{"alias_kind":"arxiv_version","alias_value":"1509.06824v2","created_at":"2026-05-18T01:19:05Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1509.06824","created_at":"2026-05-18T01:19:05Z"},{"alias_kind":"pith_short_12","alias_value":"XHV7ZNEAG4AS","created_at":"2026-05-18T12:29:50Z"},{"alias_kind":"pith_short_16","alias_value":"XHV7ZNEAG4ASTW3O","created_at":"2026-05-18T12:29:50Z"},{"alias_kind":"pith_short_8","alias_value":"XHV7ZNEA","created_at":"2026-05-18T12:29:50Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2015:XHV7ZNEAG4ASTW3O4ELRW7Q5D5","target":"record","payload":{"canonical_record":{"source":{"id":"1509.06824","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2015-09-23T02:04:18Z","cross_cats_sorted":["cs.RO"],"title_canon_sha256":"552c4966bf5f318831806dd4f7bdc469159fd93bb745581e40d6cfe1a4b04a32","abstract_canon_sha256":"a29f7edb16d8c88682538abead494c7704d0a2531ad9ec32c40ba2efff6a8d1c"},"schema_version":"1.0"},"canonical_sha256":"b9ebfcb480370129db6ee1171b7e1d1f468f211c310356241107ddb341b9266c","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T01:19:05.801755Z","signature_b64":"LoWpysZ1Da9iViseuLeNv/83/jsJ/By6o8YLxOQ5JL3G75vrPQqa+KTXVPT8FJwx6Uwc7ihZqQgL44UWLfAHAQ==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"b9ebfcb480370129db6ee1171b7e1d1f468f211c310356241107ddb341b9266c","last_reissued_at":"2026-05-18T01:19:05.801059Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T01:19:05.801059Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1509.06824","source_version":2,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T01:19:05Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"konxhyWZTUCmVFJ/8mVrqU6YPkqaCEtQQkMuQf6O18w84n7rmGpK8Aw3rarusko7kwhPPrW8oT/IIS15eywMAw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-12T03:43:57.020235Z"},"content_sha256":"4a074c5c27c36bdc9fe0f070a0d870969329d931dcc116bfaf8613c1031a5025","schema_version":"1.0","event_id":"sha256:4a074c5c27c36bdc9fe0f070a0d870969329d931dcc116bfaf8613c1031a5025"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2015:XHV7ZNEAG4ASTW3O4ELRW7Q5D5","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Model-based Reinforcement Learning with Parametrized Physical Models and Optimism-Driven Exploration","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.RO"],"primary_cat":"cs.LG","authors_text":"Christopher Xie, Pieter Abbeel, Sachin Patil, Sergey Levine, Teodor Moldovan","submitted_at":"2015-09-23T02:04:18Z","abstract_excerpt":"In this paper, we present a robotic model-based reinforcement learning method that combines ideas from model identification and model predictive control. We use a feature-based representation of the dynamics that allows the dynamics model to be fitted with a simple least squares procedure, and the features are identified from a high-level specification of the robot's morphology, consisting of the number and connectivity structure of its links. Model predictive control is then used to choose the actions under an optimistic model of the dynamics, which produces an efficient and goal-directed exp"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1509.06824","kind":"arxiv","version":2},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T01:19:05Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"P1e7X8PEBFd7s4Za7Wp+9P+pQl1wU1gHCjcj4BfvPje/WU2eL1z7Cvoq4kWjoWuepIk/fvL0Ub1tKmsmB6svAQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-12T03:43:57.020967Z"},"content_sha256":"d5f48b9fc2b54fc0af0320c42ef6551c13df5bd7ae37531bbb0e384e7ff739d8","schema_version":"1.0","event_id":"sha256:d5f48b9fc2b54fc0af0320c42ef6551c13df5bd7ae37531bbb0e384e7ff739d8"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/XHV7ZNEAG4ASTW3O4ELRW7Q5D5/bundle.json","state_url":"https://pith.science/pith/XHV7ZNEAG4ASTW3O4ELRW7Q5D5/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/XHV7ZNEAG4ASTW3O4ELRW7Q5D5/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-12T03:43:57Z","links":{"resolver":"https://pith.science/pith/XHV7ZNEAG4ASTW3O4ELRW7Q5D5","bundle":"https://pith.science/pith/XHV7ZNEAG4ASTW3O4ELRW7Q5D5/bundle.json","state":"https://pith.science/pith/XHV7ZNEAG4ASTW3O4ELRW7Q5D5/state.json","well_known_bundle":"https://pith.science/.well-known/pith/XHV7ZNEAG4ASTW3O4ELRW7Q5D5/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2015:XHV7ZNEAG4ASTW3O4ELRW7Q5D5","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"a29f7edb16d8c88682538abead494c7704d0a2531ad9ec32c40ba2efff6a8d1c","cross_cats_sorted":["cs.RO"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2015-09-23T02:04:18Z","title_canon_sha256":"552c4966bf5f318831806dd4f7bdc469159fd93bb745581e40d6cfe1a4b04a32"},"schema_version":"1.0","source":{"id":"1509.06824","kind":"arxiv","version":2}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1509.06824","created_at":"2026-05-18T01:19:05Z"},{"alias_kind":"arxiv_version","alias_value":"1509.06824v2","created_at":"2026-05-18T01:19:05Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1509.06824","created_at":"2026-05-18T01:19:05Z"},{"alias_kind":"pith_short_12","alias_value":"XHV7ZNEAG4AS","created_at":"2026-05-18T12:29:50Z"},{"alias_kind":"pith_short_16","alias_value":"XHV7ZNEAG4ASTW3O","created_at":"2026-05-18T12:29:50Z"},{"alias_kind":"pith_short_8","alias_value":"XHV7ZNEA","created_at":"2026-05-18T12:29:50Z"}],"graph_snapshots":[{"event_id":"sha256:d5f48b9fc2b54fc0af0320c42ef6551c13df5bd7ae37531bbb0e384e7ff739d8","target":"graph","created_at":"2026-05-18T01:19:05Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"In this paper, we present a robotic model-based reinforcement learning method that combines ideas from model identification and model predictive control. We use a feature-based representation of the dynamics that allows the dynamics model to be fitted with a simple least squares procedure, and the features are identified from a high-level specification of the robot's morphology, consisting of the number and connectivity structure of its links. Model predictive control is then used to choose the actions under an optimistic model of the dynamics, which produces an efficient and goal-directed exp","authors_text":"Christopher Xie, Pieter Abbeel, Sachin Patil, Sergey Levine, Teodor Moldovan","cross_cats":["cs.RO"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2015-09-23T02:04:18Z","title":"Model-based Reinforcement Learning with Parametrized Physical Models and Optimism-Driven Exploration"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1509.06824","kind":"arxiv","version":2},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:4a074c5c27c36bdc9fe0f070a0d870969329d931dcc116bfaf8613c1031a5025","target":"record","created_at":"2026-05-18T01:19:05Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"a29f7edb16d8c88682538abead494c7704d0a2531ad9ec32c40ba2efff6a8d1c","cross_cats_sorted":["cs.RO"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2015-09-23T02:04:18Z","title_canon_sha256":"552c4966bf5f318831806dd4f7bdc469159fd93bb745581e40d6cfe1a4b04a32"},"schema_version":"1.0","source":{"id":"1509.06824","kind":"arxiv","version":2}},"canonical_sha256":"b9ebfcb480370129db6ee1171b7e1d1f468f211c310356241107ddb341b9266c","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"b9ebfcb480370129db6ee1171b7e1d1f468f211c310356241107ddb341b9266c","first_computed_at":"2026-05-18T01:19:05.801059Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T01:19:05.801059Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"LoWpysZ1Da9iViseuLeNv/83/jsJ/By6o8YLxOQ5JL3G75vrPQqa+KTXVPT8FJwx6Uwc7ihZqQgL44UWLfAHAQ==","signature_status":"signed_v1","signed_at":"2026-05-18T01:19:05.801755Z","signed_message":"canonical_sha256_bytes"},"source_id":"1509.06824","source_kind":"arxiv","source_version":2}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:4a074c5c27c36bdc9fe0f070a0d870969329d931dcc116bfaf8613c1031a5025","sha256:d5f48b9fc2b54fc0af0320c42ef6551c13df5bd7ae37531bbb0e384e7ff739d8"],"state_sha256":"a552c31b49636b0da9bc63372c1348dd06010e78d6ab78c07e0951e5de20da5e"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"NDtjSIhWRcknIvUGLHfDCn6lfJqktpSyS45/WD2K9mRuAsUYVsYpcuEeNy/xSgxhFKvG7cGzOxAqRDO6rlORAg==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-12T03:43:57.024654Z","bundle_sha256":"d5010799e176ca631c57433b2115184e8ebe1f49d380dcfb6208c23e9886c1cf"}}