{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2015:FZKNBEUNJDAIHLOM7E7UXEC33M","short_pith_number":"pith:FZKNBEUN","canonical_record":{"source":{"id":"1509.06791","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2015-09-22T21:27:27Z","cross_cats_sorted":["cs.RO"],"title_canon_sha256":"7cd5c7f872ceec7b26ae84f6422212a53421893899c9a658401c876b7f276395","abstract_canon_sha256":"31c78b40f165e7b7609a7a585784976812f9ad57de9268eec87a68af18f3860e"},"schema_version":"1.0"},"canonical_sha256":"2e54d0928d48c083adccf93f4b905bdb3a782eb77d982457da4f8d4ab9004f66","source":{"kind":"arxiv","id":"1509.06791","version":2},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1509.06791","created_at":"2026-05-18T01:20:42Z"},{"alias_kind":"arxiv_version","alias_value":"1509.06791v2","created_at":"2026-05-18T01:20:42Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1509.06791","created_at":"2026-05-18T01:20:42Z"},{"alias_kind":"pith_short_12","alias_value":"FZKNBEUNJDAI","created_at":"2026-05-18T12:29:22Z"},{"alias_kind":"pith_short_16","alias_value":"FZKNBEUNJDAIHLOM","created_at":"2026-05-18T12:29:22Z"},{"alias_kind":"pith_short_8","alias_value":"FZKNBEUN","created_at":"2026-05-18T12:29:22Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2015:FZKNBEUNJDAIHLOM7E7UXEC33M","target":"record","payload":{"canonical_record":{"source":{"id":"1509.06791","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2015-09-22T21:27:27Z","cross_cats_sorted":["cs.RO"],"title_canon_sha256":"7cd5c7f872ceec7b26ae84f6422212a53421893899c9a658401c876b7f276395","abstract_canon_sha256":"31c78b40f165e7b7609a7a585784976812f9ad57de9268eec87a68af18f3860e"},"schema_version":"1.0"},"canonical_sha256":"2e54d0928d48c083adccf93f4b905bdb3a782eb77d982457da4f8d4ab9004f66","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T01:20:42.976435Z","signature_b64":"gog09y4L1ln6WHEm40ELxPtIt/5qM9sWC8R7tDDfJHEhq5a0Xx8+qMZAR+Q3ooUIJF0mPNkOo4Ogw04y6DEZDQ==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"2e54d0928d48c083adccf93f4b905bdb3a782eb77d982457da4f8d4ab9004f66","last_reissued_at":"2026-05-18T01:20:42.975726Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T01:20:42.975726Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1509.06791","source_version":2,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T01:20:42Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"4le5OAf/fZR0293IbuYUYo000073CwFHuZwmf5bme7geCEPaletkXMRM5C+GuItx2lx5ShPhmRY3JBYkxPo6Dw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-31T09:48:06.319284Z"},"content_sha256":"d789b08bb48f12f7749db60fc227aff6818e624f47583570b9eec805b075d561","schema_version":"1.0","event_id":"sha256:d789b08bb48f12f7749db60fc227aff6818e624f47583570b9eec805b075d561"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2015:FZKNBEUNJDAIHLOM7E7UXEC33M","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Learning Deep Control Policies for Autonomous Aerial Vehicles with MPC-Guided Policy Search","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.RO"],"primary_cat":"cs.LG","authors_text":"Gregory Kahn, Pieter Abbeel, Sergey Levine, Tianhao Zhang","submitted_at":"2015-09-22T21:27:27Z","abstract_excerpt":"Model predictive control (MPC) is an effective method for controlling robotic systems, particularly autonomous aerial vehicles such as quadcopters. However, application of MPC can be computationally demanding, and typically requires estimating the state of the system, which can be challenging in complex, unstructured environments. Reinforcement learning can in principle forego the need for explicit state estimation and acquire a policy that directly maps sensor readings to actions, but is difficult to apply to unstable systems that are liable to fail catastrophically during training before an "},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1509.06791","kind":"arxiv","version":2},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T01:20:42Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"cQrMhRugsXPDVUWoG8d+b3rrzyh28rWyJopMEBmcOFzCBtkR4bLwdlfj8ZmiHAW2anYdeq1bZNzOjuJL6UH8Dw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-31T09:48:06.319994Z"},"content_sha256":"c8c9c516b5cf3fc1fd8b962453440b60f2247b672d952253f3913f31e854d757","schema_version":"1.0","event_id":"sha256:c8c9c516b5cf3fc1fd8b962453440b60f2247b672d952253f3913f31e854d757"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/FZKNBEUNJDAIHLOM7E7UXEC33M/bundle.json","state_url":"https://pith.science/pith/FZKNBEUNJDAIHLOM7E7UXEC33M/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/FZKNBEUNJDAIHLOM7E7UXEC33M/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-31T09:48:06Z","links":{"resolver":"https://pith.science/pith/FZKNBEUNJDAIHLOM7E7UXEC33M","bundle":"https://pith.science/pith/FZKNBEUNJDAIHLOM7E7UXEC33M/bundle.json","state":"https://pith.science/pith/FZKNBEUNJDAIHLOM7E7UXEC33M/state.json","well_known_bundle":"https://pith.science/.well-known/pith/FZKNBEUNJDAIHLOM7E7UXEC33M/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2015:FZKNBEUNJDAIHLOM7E7UXEC33M","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"31c78b40f165e7b7609a7a585784976812f9ad57de9268eec87a68af18f3860e","cross_cats_sorted":["cs.RO"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2015-09-22T21:27:27Z","title_canon_sha256":"7cd5c7f872ceec7b26ae84f6422212a53421893899c9a658401c876b7f276395"},"schema_version":"1.0","source":{"id":"1509.06791","kind":"arxiv","version":2}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1509.06791","created_at":"2026-05-18T01:20:42Z"},{"alias_kind":"arxiv_version","alias_value":"1509.06791v2","created_at":"2026-05-18T01:20:42Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1509.06791","created_at":"2026-05-18T01:20:42Z"},{"alias_kind":"pith_short_12","alias_value":"FZKNBEUNJDAI","created_at":"2026-05-18T12:29:22Z"},{"alias_kind":"pith_short_16","alias_value":"FZKNBEUNJDAIHLOM","created_at":"2026-05-18T12:29:22Z"},{"alias_kind":"pith_short_8","alias_value":"FZKNBEUN","created_at":"2026-05-18T12:29:22Z"}],"graph_snapshots":[{"event_id":"sha256:c8c9c516b5cf3fc1fd8b962453440b60f2247b672d952253f3913f31e854d757","target":"graph","created_at":"2026-05-18T01:20:42Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Model predictive control (MPC) is an effective method for controlling robotic systems, particularly autonomous aerial vehicles such as quadcopters. However, application of MPC can be computationally demanding, and typically requires estimating the state of the system, which can be challenging in complex, unstructured environments. Reinforcement learning can in principle forego the need for explicit state estimation and acquire a policy that directly maps sensor readings to actions, but is difficult to apply to unstable systems that are liable to fail catastrophically during training before an ","authors_text":"Gregory Kahn, Pieter Abbeel, Sergey Levine, Tianhao Zhang","cross_cats":["cs.RO"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2015-09-22T21:27:27Z","title":"Learning Deep Control Policies for Autonomous Aerial Vehicles with MPC-Guided Policy Search"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1509.06791","kind":"arxiv","version":2},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:d789b08bb48f12f7749db60fc227aff6818e624f47583570b9eec805b075d561","target":"record","created_at":"2026-05-18T01:20:42Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"31c78b40f165e7b7609a7a585784976812f9ad57de9268eec87a68af18f3860e","cross_cats_sorted":["cs.RO"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2015-09-22T21:27:27Z","title_canon_sha256":"7cd5c7f872ceec7b26ae84f6422212a53421893899c9a658401c876b7f276395"},"schema_version":"1.0","source":{"id":"1509.06791","kind":"arxiv","version":2}},"canonical_sha256":"2e54d0928d48c083adccf93f4b905bdb3a782eb77d982457da4f8d4ab9004f66","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"2e54d0928d48c083adccf93f4b905bdb3a782eb77d982457da4f8d4ab9004f66","first_computed_at":"2026-05-18T01:20:42.975726Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T01:20:42.975726Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"gog09y4L1ln6WHEm40ELxPtIt/5qM9sWC8R7tDDfJHEhq5a0Xx8+qMZAR+Q3ooUIJF0mPNkOo4Ogw04y6DEZDQ==","signature_status":"signed_v1","signed_at":"2026-05-18T01:20:42.976435Z","signed_message":"canonical_sha256_bytes"},"source_id":"1509.06791","source_kind":"arxiv","source_version":2}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:d789b08bb48f12f7749db60fc227aff6818e624f47583570b9eec805b075d561","sha256:c8c9c516b5cf3fc1fd8b962453440b60f2247b672d952253f3913f31e854d757"],"state_sha256":"bb3aac9e85f87372b8dd3460650d92fbca5a822d43c1df16bcbf6b935b3d90dd"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"Wj8wMJ4esJS2N4M0uUvlHE8wlojgBmme3ziL5awVM5qlciGZRNbRbMGRkFxdTVw1gBbFMftleS+waT1BRiO+BA==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-31T09:48:06.323843Z","bundle_sha256":"26a4ade08827466c5b207106ab266b369edf5d4fd9ebb31896ff85e3e4e2400c"}}