{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2018:7WPL54D6SCIUN35CWQ5QKIKCWW","short_pith_number":"pith:7WPL54D6","canonical_record":{"source":{"id":"1802.08294","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2018-02-22T20:42:19Z","cross_cats_sorted":[],"title_canon_sha256":"48a6768a4076fce304179f72ef79fd56e1791035a8fce449016de2039fbb56da","abstract_canon_sha256":"f2cb8d1536389fc30f2335b2ac0fe8ce66450118677669d452f5c57a2316e026"},"schema_version":"1.0"},"canonical_sha256":"fd9ebef07e909146efa2b43b052142b5bb065fde7be9fffaab9aca0738a10cb2","source":{"kind":"arxiv","id":"1802.08294","version":2},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1802.08294","created_at":"2026-05-18T00:11:49Z"},{"alias_kind":"arxiv_version","alias_value":"1802.08294v2","created_at":"2026-05-18T00:11:49Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1802.08294","created_at":"2026-05-18T00:11:49Z"},{"alias_kind":"pith_short_12","alias_value":"7WPL54D6SCIU","created_at":"2026-05-18T12:32:11Z"},{"alias_kind":"pith_short_16","alias_value":"7WPL54D6SCIUN35C","created_at":"2026-05-18T12:32:11Z"},{"alias_kind":"pith_short_8","alias_value":"7WPL54D6","created_at":"2026-05-18T12:32:11Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2018:7WPL54D6SCIUN35CWQ5QKIKCWW","target":"record","payload":{"canonical_record":{"source":{"id":"1802.08294","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2018-02-22T20:42:19Z","cross_cats_sorted":[],"title_canon_sha256":"48a6768a4076fce304179f72ef79fd56e1791035a8fce449016de2039fbb56da","abstract_canon_sha256":"f2cb8d1536389fc30f2335b2ac0fe8ce66450118677669d452f5c57a2316e026"},"schema_version":"1.0"},"canonical_sha256":"fd9ebef07e909146efa2b43b052142b5bb065fde7be9fffaab9aca0738a10cb2","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:11:49.814080Z","signature_b64":"QiNIhs/9SZ/nelQug6FZppw7M341JyXWwKPM7WqpS0kz5nZLMsV78kENfmaJJYH6mbFFqvvefjB8bJF9E49TCQ==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"fd9ebef07e909146efa2b43b052142b5bb065fde7be9fffaab9aca0738a10cb2","last_reissued_at":"2026-05-18T00:11:49.813508Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:11:49.813508Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1802.08294","source_version":2,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:11:49Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"XMlKM8lNusCDJs41rGRsZHPCNrHq5+yxaU07EvmuSUssewmlyF0FAujGo79NrR0ToNduOTBWpB0PFlFJB0s3BA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-30T06:32:20.519214Z"},"content_sha256":"79be12e8614e9ab6b47b83fe0888008b304c0a6c86c5e495902a403384b1e90a","schema_version":"1.0","event_id":"sha256:79be12e8614e9ab6b47b83fe0888008b304c0a6c86c5e495902a403384b1e90a"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2018:7WPL54D6SCIUN35CWQ5QKIKCWW","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Unicorn: Continual Learning with a Universal, Off-policy Agent","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.LG","authors_text":"Andr\\'e Barreto, Augustin \\v{Z}\\'idek, Dan Horgan, Daniel J. Mankowitz, David Silver, Hado van Hasselt, John Quan, Junhyuk Oh, Matteo Hessel, Tom Schaul","submitted_at":"2018-02-22T20:42:19Z","abstract_excerpt":"Some real-world domains are best characterized as a single task, but for others this perspective is limiting. Instead, some tasks continually grow in complexity, in tandem with the agent's competence. In continual learning, also referred to as lifelong learning, there are no explicit task boundaries or curricula. As learning agents have become more powerful, continual learning remains one of the frontiers that has resisted quick progress. To test continual learning capabilities we consider a challenging 3D domain with an implicit sequence of tasks and sparse rewards. We propose a novel agent a"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1802.08294","kind":"arxiv","version":2},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:11:49Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"NuxLqFq+eI0F7PzbjIvoHipy2i4zNM9jMbGkVO+uGcYi0hZ1YCv8e/02JtCCkE7IG+11BcNQiGWjuEZjZZtfBg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-30T06:32:20.519573Z"},"content_sha256":"1c2d3d047e916e79061f85e481f811d20dcc66ba067a01191c324f20676d6741","schema_version":"1.0","event_id":"sha256:1c2d3d047e916e79061f85e481f811d20dcc66ba067a01191c324f20676d6741"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/7WPL54D6SCIUN35CWQ5QKIKCWW/bundle.json","state_url":"https://pith.science/pith/7WPL54D6SCIUN35CWQ5QKIKCWW/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/7WPL54D6SCIUN35CWQ5QKIKCWW/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-30T06:32:20Z","links":{"resolver":"https://pith.science/pith/7WPL54D6SCIUN35CWQ5QKIKCWW","bundle":"https://pith.science/pith/7WPL54D6SCIUN35CWQ5QKIKCWW/bundle.json","state":"https://pith.science/pith/7WPL54D6SCIUN35CWQ5QKIKCWW/state.json","well_known_bundle":"https://pith.science/.well-known/pith/7WPL54D6SCIUN35CWQ5QKIKCWW/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2018:7WPL54D6SCIUN35CWQ5QKIKCWW","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"f2cb8d1536389fc30f2335b2ac0fe8ce66450118677669d452f5c57a2316e026","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2018-02-22T20:42:19Z","title_canon_sha256":"48a6768a4076fce304179f72ef79fd56e1791035a8fce449016de2039fbb56da"},"schema_version":"1.0","source":{"id":"1802.08294","kind":"arxiv","version":2}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1802.08294","created_at":"2026-05-18T00:11:49Z"},{"alias_kind":"arxiv_version","alias_value":"1802.08294v2","created_at":"2026-05-18T00:11:49Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1802.08294","created_at":"2026-05-18T00:11:49Z"},{"alias_kind":"pith_short_12","alias_value":"7WPL54D6SCIU","created_at":"2026-05-18T12:32:11Z"},{"alias_kind":"pith_short_16","alias_value":"7WPL54D6SCIUN35C","created_at":"2026-05-18T12:32:11Z"},{"alias_kind":"pith_short_8","alias_value":"7WPL54D6","created_at":"2026-05-18T12:32:11Z"}],"graph_snapshots":[{"event_id":"sha256:1c2d3d047e916e79061f85e481f811d20dcc66ba067a01191c324f20676d6741","target":"graph","created_at":"2026-05-18T00:11:49Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Some real-world domains are best characterized as a single task, but for others this perspective is limiting. Instead, some tasks continually grow in complexity, in tandem with the agent's competence. In continual learning, also referred to as lifelong learning, there are no explicit task boundaries or curricula. As learning agents have become more powerful, continual learning remains one of the frontiers that has resisted quick progress. To test continual learning capabilities we consider a challenging 3D domain with an implicit sequence of tasks and sparse rewards. We propose a novel agent a","authors_text":"Andr\\'e Barreto, Augustin \\v{Z}\\'idek, Dan Horgan, Daniel J. Mankowitz, David Silver, Hado van Hasselt, John Quan, Junhyuk Oh, Matteo Hessel, Tom Schaul","cross_cats":[],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2018-02-22T20:42:19Z","title":"Unicorn: Continual Learning with a Universal, Off-policy Agent"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1802.08294","kind":"arxiv","version":2},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:79be12e8614e9ab6b47b83fe0888008b304c0a6c86c5e495902a403384b1e90a","target":"record","created_at":"2026-05-18T00:11:49Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"f2cb8d1536389fc30f2335b2ac0fe8ce66450118677669d452f5c57a2316e026","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2018-02-22T20:42:19Z","title_canon_sha256":"48a6768a4076fce304179f72ef79fd56e1791035a8fce449016de2039fbb56da"},"schema_version":"1.0","source":{"id":"1802.08294","kind":"arxiv","version":2}},"canonical_sha256":"fd9ebef07e909146efa2b43b052142b5bb065fde7be9fffaab9aca0738a10cb2","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"fd9ebef07e909146efa2b43b052142b5bb065fde7be9fffaab9aca0738a10cb2","first_computed_at":"2026-05-18T00:11:49.813508Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:11:49.813508Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"QiNIhs/9SZ/nelQug6FZppw7M341JyXWwKPM7WqpS0kz5nZLMsV78kENfmaJJYH6mbFFqvvefjB8bJF9E49TCQ==","signature_status":"signed_v1","signed_at":"2026-05-18T00:11:49.814080Z","signed_message":"canonical_sha256_bytes"},"source_id":"1802.08294","source_kind":"arxiv","source_version":2}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:79be12e8614e9ab6b47b83fe0888008b304c0a6c86c5e495902a403384b1e90a","sha256:1c2d3d047e916e79061f85e481f811d20dcc66ba067a01191c324f20676d6741"],"state_sha256":"2fe3b86e5a64c15c5c10bec72f70808b2495b7b563da8bec78cc243a39468527"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"7phl8TFdXlYCdriAAg5dvHtsvyNzKPKDSUHb1Sq6rxEQ3g07xbqf6eIK3dTgoQBa6BKMarG/wg09mPxB8DLwDg==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-30T06:32:20.521491Z","bundle_sha256":"b80b55edacb6042c5864d511d5fb5e0394914b8bd026f398fd851c449c387d64"}}