{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2019:MK2QANQ2KLGG5O2TAI4OVUGJBX","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"02185ddffe06763c67fdf0bfcc1e62c29130e5435d3ec7f628e713707e5c01d8","cross_cats_sorted":["cs.AI","cs.RO","stat.ML"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2019-03-18T12:52:57Z","title_canon_sha256":"8fde190e964fdeec0756e50b72e92f8f31b6332d4f26839d09132c83b867ab19"},"schema_version":"1.0","source":{"id":"1903.07400","kind":"arxiv","version":2}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1903.07400","created_at":"2026-05-17T23:42:48Z"},{"alias_kind":"arxiv_version","alias_value":"1903.07400v2","created_at":"2026-05-17T23:42:48Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1903.07400","created_at":"2026-05-17T23:42:48Z"},{"alias_kind":"pith_short_12","alias_value":"MK2QANQ2KLGG","created_at":"2026-05-18T12:33:21Z"},{"alias_kind":"pith_short_16","alias_value":"MK2QANQ2KLGG5O2T","created_at":"2026-05-18T12:33:21Z"},{"alias_kind":"pith_short_8","alias_value":"MK2QANQ2","created_at":"2026-05-18T12:33:21Z"}],"graph_snapshots":[{"event_id":"sha256:920e4e856efc0e4a0ad01776ac52d182961bfa2a1b252a7ff6783f85b9b97928","target":"graph","created_at":"2026-05-17T23:42:48Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Exploration in sparse reward reinforcement learning remains an open challenge. Many state-of-the-art methods use intrinsic motivation to complement the sparse extrinsic reward signal, giving the agent more opportunities to receive feedback during exploration. Commonly these signals are added as bonus rewards, which results in a mixture policy that neither conducts exploration nor task fulfillment resolutely. In this paper, we instead learn separate intrinsic and extrinsic task policies and schedule between these different drives to accelerate exploration and stabilize learning. Moreover, we in","authors_text":"Jingwei Zhang, Joschka Boedecker, Nicolai Dorka, Niklas Wetzel, Wolfram Burgard","cross_cats":["cs.AI","cs.RO","stat.ML"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2019-03-18T12:52:57Z","title":"Scheduled Intrinsic Drive: A Hierarchical Take on Intrinsically Motivated Exploration"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1903.07400","kind":"arxiv","version":2},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:0bd2545426897e495bfc4a8309382d3a3cb969ef6ee2c7a5899048216cfb1039","target":"record","created_at":"2026-05-17T23:42:48Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"02185ddffe06763c67fdf0bfcc1e62c29130e5435d3ec7f628e713707e5c01d8","cross_cats_sorted":["cs.AI","cs.RO","stat.ML"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2019-03-18T12:52:57Z","title_canon_sha256":"8fde190e964fdeec0756e50b72e92f8f31b6332d4f26839d09132c83b867ab19"},"schema_version":"1.0","source":{"id":"1903.07400","kind":"arxiv","version":2}},"canonical_sha256":"62b500361a52cc6ebb530238ead0c90dcf8d0542b8d2622e389f4fcf40a03ab4","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"62b500361a52cc6ebb530238ead0c90dcf8d0542b8d2622e389f4fcf40a03ab4","first_computed_at":"2026-05-17T23:42:48.312169Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-17T23:42:48.312169Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"9aNMCNdykEqOO9x3i4KTHrA2ihTkIc8mq22qugTU+poQe14vCBscQXyNkO36eX2qjHh9vu9kc2nNlrTQWjySBA==","signature_status":"signed_v1","signed_at":"2026-05-17T23:42:48.312729Z","signed_message":"canonical_sha256_bytes"},"source_id":"1903.07400","source_kind":"arxiv","source_version":2}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:0bd2545426897e495bfc4a8309382d3a3cb969ef6ee2c7a5899048216cfb1039","sha256:920e4e856efc0e4a0ad01776ac52d182961bfa2a1b252a7ff6783f85b9b97928"],"state_sha256":"3adb9e411ea81acecd83f65b8b5e85a7527824e21c88c3b15ec7d229854c205e"}