{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2018:ARC2YQRYPS2PF2SH5QHSZCWITE","short_pith_number":"pith:ARC2YQRY","canonical_record":{"source":{"id":"1807.04742","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2018-07-12T17:51:16Z","cross_cats_sorted":["cs.CV","cs.RO","stat.ML"],"title_canon_sha256":"dc56d94c4334e95b2f2ba5db058048fcbdfe6a63e650884fc1378ae23b0e557a","abstract_canon_sha256":"f369cf5237e888ac876267a032adac7c8bb1911548ef036267a043adbc009f1c"},"schema_version":"1.0"},"canonical_sha256":"0445ac42387cb4f2ea47ec0f2c8ac89900fb47a7c935c9ada0f0ab785505e955","source":{"kind":"arxiv","id":"1807.04742","version":2},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1807.04742","created_at":"2026-05-17T23:59:16Z"},{"alias_kind":"arxiv_version","alias_value":"1807.04742v2","created_at":"2026-05-17T23:59:16Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1807.04742","created_at":"2026-05-17T23:59:16Z"},{"alias_kind":"pith_short_12","alias_value":"ARC2YQRYPS2P","created_at":"2026-05-18T12:32:13Z"},{"alias_kind":"pith_short_16","alias_value":"ARC2YQRYPS2PF2SH","created_at":"2026-05-18T12:32:13Z"},{"alias_kind":"pith_short_8","alias_value":"ARC2YQRY","created_at":"2026-05-18T12:32:13Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2018:ARC2YQRYPS2PF2SH5QHSZCWITE","target":"record","payload":{"canonical_record":{"source":{"id":"1807.04742","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2018-07-12T17:51:16Z","cross_cats_sorted":["cs.CV","cs.RO","stat.ML"],"title_canon_sha256":"dc56d94c4334e95b2f2ba5db058048fcbdfe6a63e650884fc1378ae23b0e557a","abstract_canon_sha256":"f369cf5237e888ac876267a032adac7c8bb1911548ef036267a043adbc009f1c"},"schema_version":"1.0"},"canonical_sha256":"0445ac42387cb4f2ea47ec0f2c8ac89900fb47a7c935c9ada0f0ab785505e955","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-17T23:59:16.705731Z","signature_b64":"TY9s4HlHRBD621qylGW+34wqzJ0JKT6wfH8qCanhm1jzM0YeTVCBD/JPhOV6lfw6mCxLvqt20+x9CkCb+aMtDA==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"0445ac42387cb4f2ea47ec0f2c8ac89900fb47a7c935c9ada0f0ab785505e955","last_reissued_at":"2026-05-17T23:59:16.705092Z","signature_status":"signed_v1","first_computed_at":"2026-05-17T23:59:16.705092Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1807.04742","source_version":2,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-17T23:59:16Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"d6ZIgvGpld2VKURV179CX2s4Jd0xCvY9Vil2lfaHoQHbkAu0VLXjKHOk7vSZnBCc2j51aYnXDQ+MYCTHc0tfDQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-11T21:05:03.576158Z"},"content_sha256":"cb1745e96069d856655ae2f3ca4e00c900cfb8740d1c78b9ad1d4e780f7da975","schema_version":"1.0","event_id":"sha256:cb1745e96069d856655ae2f3ca4e00c900cfb8740d1c78b9ad1d4e780f7da975"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2018:ARC2YQRYPS2PF2SH5QHSZCWITE","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Visual Reinforcement Learning with Imagined Goals","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.CV","cs.RO","stat.ML"],"primary_cat":"cs.LG","authors_text":"Ashvin Nair, Murtaza Dalal, Sergey Levine, Shikhar Bahl, Steven Lin, Vitchyr Pong","submitted_at":"2018-07-12T17:51:16Z","abstract_excerpt":"For an autonomous agent to fulfill a wide range of user-specified goals at test time, it must be able to learn broadly applicable and general-purpose skill repertoires. Furthermore, to provide the requisite level of generality, these skills must handle raw sensory input such as images. In this paper, we propose an algorithm that acquires such general-purpose skills by combining unsupervised representation learning and reinforcement learning of goal-conditioned policies. Since the particular goals that might be required at test-time are not known in advance, the agent performs a self-supervised"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1807.04742","kind":"arxiv","version":2},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-17T23:59:16Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"pFcqPm/Ztk2ngO6BOdev0/kFrceAvxouhwuXwRZ1JA2Es7AoCqE6VkMbd63SbbQXD4nhoCWvkDZZCarWJPd7AQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-11T21:05:03.576946Z"},"content_sha256":"33174e36b672feeb1c73b9663b86d0199c8308122ac0d9e2958901f69158b816","schema_version":"1.0","event_id":"sha256:33174e36b672feeb1c73b9663b86d0199c8308122ac0d9e2958901f69158b816"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/ARC2YQRYPS2PF2SH5QHSZCWITE/bundle.json","state_url":"https://pith.science/pith/ARC2YQRYPS2PF2SH5QHSZCWITE/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/ARC2YQRYPS2PF2SH5QHSZCWITE/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-11T21:05:03Z","links":{"resolver":"https://pith.science/pith/ARC2YQRYPS2PF2SH5QHSZCWITE","bundle":"https://pith.science/pith/ARC2YQRYPS2PF2SH5QHSZCWITE/bundle.json","state":"https://pith.science/pith/ARC2YQRYPS2PF2SH5QHSZCWITE/state.json","well_known_bundle":"https://pith.science/.well-known/pith/ARC2YQRYPS2PF2SH5QHSZCWITE/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2018:ARC2YQRYPS2PF2SH5QHSZCWITE","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"f369cf5237e888ac876267a032adac7c8bb1911548ef036267a043adbc009f1c","cross_cats_sorted":["cs.CV","cs.RO","stat.ML"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2018-07-12T17:51:16Z","title_canon_sha256":"dc56d94c4334e95b2f2ba5db058048fcbdfe6a63e650884fc1378ae23b0e557a"},"schema_version":"1.0","source":{"id":"1807.04742","kind":"arxiv","version":2}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1807.04742","created_at":"2026-05-17T23:59:16Z"},{"alias_kind":"arxiv_version","alias_value":"1807.04742v2","created_at":"2026-05-17T23:59:16Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1807.04742","created_at":"2026-05-17T23:59:16Z"},{"alias_kind":"pith_short_12","alias_value":"ARC2YQRYPS2P","created_at":"2026-05-18T12:32:13Z"},{"alias_kind":"pith_short_16","alias_value":"ARC2YQRYPS2PF2SH","created_at":"2026-05-18T12:32:13Z"},{"alias_kind":"pith_short_8","alias_value":"ARC2YQRY","created_at":"2026-05-18T12:32:13Z"}],"graph_snapshots":[{"event_id":"sha256:33174e36b672feeb1c73b9663b86d0199c8308122ac0d9e2958901f69158b816","target":"graph","created_at":"2026-05-17T23:59:16Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"For an autonomous agent to fulfill a wide range of user-specified goals at test time, it must be able to learn broadly applicable and general-purpose skill repertoires. Furthermore, to provide the requisite level of generality, these skills must handle raw sensory input such as images. In this paper, we propose an algorithm that acquires such general-purpose skills by combining unsupervised representation learning and reinforcement learning of goal-conditioned policies. Since the particular goals that might be required at test-time are not known in advance, the agent performs a self-supervised","authors_text":"Ashvin Nair, Murtaza Dalal, Sergey Levine, Shikhar Bahl, Steven Lin, Vitchyr Pong","cross_cats":["cs.CV","cs.RO","stat.ML"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2018-07-12T17:51:16Z","title":"Visual Reinforcement Learning with Imagined Goals"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1807.04742","kind":"arxiv","version":2},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:cb1745e96069d856655ae2f3ca4e00c900cfb8740d1c78b9ad1d4e780f7da975","target":"record","created_at":"2026-05-17T23:59:16Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"f369cf5237e888ac876267a032adac7c8bb1911548ef036267a043adbc009f1c","cross_cats_sorted":["cs.CV","cs.RO","stat.ML"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2018-07-12T17:51:16Z","title_canon_sha256":"dc56d94c4334e95b2f2ba5db058048fcbdfe6a63e650884fc1378ae23b0e557a"},"schema_version":"1.0","source":{"id":"1807.04742","kind":"arxiv","version":2}},"canonical_sha256":"0445ac42387cb4f2ea47ec0f2c8ac89900fb47a7c935c9ada0f0ab785505e955","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"0445ac42387cb4f2ea47ec0f2c8ac89900fb47a7c935c9ada0f0ab785505e955","first_computed_at":"2026-05-17T23:59:16.705092Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-17T23:59:16.705092Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"TY9s4HlHRBD621qylGW+34wqzJ0JKT6wfH8qCanhm1jzM0YeTVCBD/JPhOV6lfw6mCxLvqt20+x9CkCb+aMtDA==","signature_status":"signed_v1","signed_at":"2026-05-17T23:59:16.705731Z","signed_message":"canonical_sha256_bytes"},"source_id":"1807.04742","source_kind":"arxiv","source_version":2}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:cb1745e96069d856655ae2f3ca4e00c900cfb8740d1c78b9ad1d4e780f7da975","sha256:33174e36b672feeb1c73b9663b86d0199c8308122ac0d9e2958901f69158b816"],"state_sha256":"0f970d9142b73c1a157c7633d8365504e4a4093101c0f0e59f10a21601d7c9e3"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"ZS/42GPQKz+146m4LuCPod3ppgIOowjReTFvABTZPfi+QONpOHpfCnXJ7uP1z8KQRyXQM+H8ZeHiDVZ/a7APDQ==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-11T21:05:03.581011Z","bundle_sha256":"46f44e94a7c32b9c3e0ce7920fcab9752161a2c373fbd1cec1055a70a2afdc71"}}