{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2020:FYIKN2JAIIAZBTDYOMJMPQUODM","short_pith_number":"pith:FYIKN2JA","canonical_record":{"source":{"id":"2011.04021","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.AI","submitted_at":"2020-11-08T16:55:16Z","cross_cats_sorted":["cs.LG"],"title_canon_sha256":"c37e7f1fa8bcdaaf3ce64e5dd2554cb644bc70429b05e5c94a735e01fd44754c","abstract_canon_sha256":"0c6f79abb5b3c53e7d719cecbc0cb39973afc2867062f615b409719679852d0a"},"schema_version":"1.0"},"canonical_sha256":"2e10a6e920420190cc787312c7c28e1b31b6a83f633277b18b0ef4cfc33f4d71","source":{"kind":"arxiv","id":"2011.04021","version":2},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2011.04021","created_at":"2026-07-05T02:23:59Z"},{"alias_kind":"arxiv_version","alias_value":"2011.04021v2","created_at":"2026-07-05T02:23:59Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2011.04021","created_at":"2026-07-05T02:23:59Z"},{"alias_kind":"pith_short_12","alias_value":"FYIKN2JAIIAZ","created_at":"2026-07-05T02:23:59Z"},{"alias_kind":"pith_short_16","alias_value":"FYIKN2JAIIAZBTDY","created_at":"2026-07-05T02:23:59Z"},{"alias_kind":"pith_short_8","alias_value":"FYIKN2JA","created_at":"2026-07-05T02:23:59Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2020:FYIKN2JAIIAZBTDYOMJMPQUODM","target":"record","payload":{"canonical_record":{"source":{"id":"2011.04021","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.AI","submitted_at":"2020-11-08T16:55:16Z","cross_cats_sorted":["cs.LG"],"title_canon_sha256":"c37e7f1fa8bcdaaf3ce64e5dd2554cb644bc70429b05e5c94a735e01fd44754c","abstract_canon_sha256":"0c6f79abb5b3c53e7d719cecbc0cb39973afc2867062f615b409719679852d0a"},"schema_version":"1.0"},"canonical_sha256":"2e10a6e920420190cc787312c7c28e1b31b6a83f633277b18b0ef4cfc33f4d71","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-07-05T02:23:59.522006Z","signature_b64":"LKRHMttbRc4aLMQQbKp8FB2V5+Fo+J5umM+ftx+5K5nDWQm6rH5f/cpc4GTzqhKki17I2srbnRwtdm/OFbe2CQ==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"2e10a6e920420190cc787312c7c28e1b31b6a83f633277b18b0ef4cfc33f4d71","last_reissued_at":"2026-07-05T02:23:59.521502Z","signature_status":"signed_v1","first_computed_at":"2026-07-05T02:23:59.521502Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2011.04021","source_version":2,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-07-05T02:23:59Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"ZHAOBfD37A89VmivB+Bib2sxDsKzUNrJs2ciRGiW0w8XrQzd4gptsRpeeBaYO67oW0HTTWkHq2ZxRK6gHtn3BQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-07-05T11:50:04.177962Z"},"content_sha256":"504c3d064e0faace3d6e2756c4ce47b76a5ead08ac68c9fe51bea22d2a6fa3b3","schema_version":"1.0","event_id":"sha256:504c3d064e0faace3d6e2756c4ce47b76a5ead08ac68c9fe51bea22d2a6fa3b3"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2020:FYIKN2JAIIAZBTDYOMJMPQUODM","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"On the role of planning in model-based deep reinforcement learning","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.LG"],"primary_cat":"cs.AI","authors_text":"Abram L. Friesen, Arthur Guez, Fabio Viola, Feryal Behbahani, Jessica B. Hamrick, Lars Buesing, Petar Veli\\v{c}kovi\\'c, Sims Witherspoon, Th\\'eophane Weber, Thomas Anthony","submitted_at":"2020-11-08T16:55:16Z","abstract_excerpt":"Model-based planning is often thought to be necessary for deep, careful reasoning and generalization in artificial agents. While recent successes of model-based reinforcement learning (MBRL) with deep function approximation have strengthened this hypothesis, the resulting diversity of model-based methods has also made it difficult to track which components drive success and why. In this paper, we seek to disentangle the contributions of recent methods by focusing on three questions: (1) How does planning benefit MBRL agents? (2) Within planning, what choices drive performance? (3) To what exte"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2011.04021","kind":"arxiv","version":2},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2011.04021/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-07-05T02:23:59Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"t3Q7fNsArgfXx4XbCmm+bk+jZc476zMJrFvzSXkPG8hQRMRHjxHJpqBoGcMsruuHstJ4d8fH50xsw8nQXIPmCQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-07-05T11:50:04.178352Z"},"content_sha256":"1cca86d86030f9988e61cea583f92583695d97bda7cb1d6525acd10fb434623c","schema_version":"1.0","event_id":"sha256:1cca86d86030f9988e61cea583f92583695d97bda7cb1d6525acd10fb434623c"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/FYIKN2JAIIAZBTDYOMJMPQUODM/bundle.json","state_url":"https://pith.science/pith/FYIKN2JAIIAZBTDYOMJMPQUODM/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/FYIKN2JAIIAZBTDYOMJMPQUODM/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-07-05T11:50:04Z","links":{"resolver":"https://pith.science/pith/FYIKN2JAIIAZBTDYOMJMPQUODM","bundle":"https://pith.science/pith/FYIKN2JAIIAZBTDYOMJMPQUODM/bundle.json","state":"https://pith.science/pith/FYIKN2JAIIAZBTDYOMJMPQUODM/state.json","well_known_bundle":"https://pith.science/.well-known/pith/FYIKN2JAIIAZBTDYOMJMPQUODM/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2020:FYIKN2JAIIAZBTDYOMJMPQUODM","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"0c6f79abb5b3c53e7d719cecbc0cb39973afc2867062f615b409719679852d0a","cross_cats_sorted":["cs.LG"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.AI","submitted_at":"2020-11-08T16:55:16Z","title_canon_sha256":"c37e7f1fa8bcdaaf3ce64e5dd2554cb644bc70429b05e5c94a735e01fd44754c"},"schema_version":"1.0","source":{"id":"2011.04021","kind":"arxiv","version":2}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2011.04021","created_at":"2026-07-05T02:23:59Z"},{"alias_kind":"arxiv_version","alias_value":"2011.04021v2","created_at":"2026-07-05T02:23:59Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2011.04021","created_at":"2026-07-05T02:23:59Z"},{"alias_kind":"pith_short_12","alias_value":"FYIKN2JAIIAZ","created_at":"2026-07-05T02:23:59Z"},{"alias_kind":"pith_short_16","alias_value":"FYIKN2JAIIAZBTDY","created_at":"2026-07-05T02:23:59Z"},{"alias_kind":"pith_short_8","alias_value":"FYIKN2JA","created_at":"2026-07-05T02:23:59Z"}],"graph_snapshots":[{"event_id":"sha256:1cca86d86030f9988e61cea583f92583695d97bda7cb1d6525acd10fb434623c","target":"graph","created_at":"2026-07-05T02:23:59Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2011.04021/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Model-based planning is often thought to be necessary for deep, careful reasoning and generalization in artificial agents. While recent successes of model-based reinforcement learning (MBRL) with deep function approximation have strengthened this hypothesis, the resulting diversity of model-based methods has also made it difficult to track which components drive success and why. In this paper, we seek to disentangle the contributions of recent methods by focusing on three questions: (1) How does planning benefit MBRL agents? (2) Within planning, what choices drive performance? (3) To what exte","authors_text":"Abram L. Friesen, Arthur Guez, Fabio Viola, Feryal Behbahani, Jessica B. Hamrick, Lars Buesing, Petar Veli\\v{c}kovi\\'c, Sims Witherspoon, Th\\'eophane Weber, Thomas Anthony","cross_cats":["cs.LG"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.AI","submitted_at":"2020-11-08T16:55:16Z","title":"On the role of planning in model-based deep reinforcement learning"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2011.04021","kind":"arxiv","version":2},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:504c3d064e0faace3d6e2756c4ce47b76a5ead08ac68c9fe51bea22d2a6fa3b3","target":"record","created_at":"2026-07-05T02:23:59Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"0c6f79abb5b3c53e7d719cecbc0cb39973afc2867062f615b409719679852d0a","cross_cats_sorted":["cs.LG"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.AI","submitted_at":"2020-11-08T16:55:16Z","title_canon_sha256":"c37e7f1fa8bcdaaf3ce64e5dd2554cb644bc70429b05e5c94a735e01fd44754c"},"schema_version":"1.0","source":{"id":"2011.04021","kind":"arxiv","version":2}},"canonical_sha256":"2e10a6e920420190cc787312c7c28e1b31b6a83f633277b18b0ef4cfc33f4d71","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"2e10a6e920420190cc787312c7c28e1b31b6a83f633277b18b0ef4cfc33f4d71","first_computed_at":"2026-07-05T02:23:59.521502Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-07-05T02:23:59.521502Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"LKRHMttbRc4aLMQQbKp8FB2V5+Fo+J5umM+ftx+5K5nDWQm6rH5f/cpc4GTzqhKki17I2srbnRwtdm/OFbe2CQ==","signature_status":"signed_v1","signed_at":"2026-07-05T02:23:59.522006Z","signed_message":"canonical_sha256_bytes"},"source_id":"2011.04021","source_kind":"arxiv","source_version":2}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:504c3d064e0faace3d6e2756c4ce47b76a5ead08ac68c9fe51bea22d2a6fa3b3","sha256:1cca86d86030f9988e61cea583f92583695d97bda7cb1d6525acd10fb434623c"],"state_sha256":"546f3490d827b676ab16ac6ab4b8f2ab868204b9cc83a64820a2c6fc86bed88e"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"uMaRCBXdN7P6vcd/P1JH6/qXX3iJs2K7OBdagsC/YoCEabvQs0TnooQbE44kMbc32Ue6QStqOiZpSMKCPZppCg==","signed_message":"bundle_sha256_bytes","signed_at":"2026-07-05T11:50:04.180405Z","bundle_sha256":"09d27847094fa87ba11b447471edb452ff11edb492c9516c92527dc78ebacb3e"}}