{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2019:TKP3XHO6ZHB65EWS26RP4O7YLQ","short_pith_number":"pith:TKP3XHO6","canonical_record":{"source":{"id":"1905.12621","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2019-05-27T09:25:16Z","cross_cats_sorted":["stat.ML"],"title_canon_sha256":"dc96ac0053a2aa0734b8c545783501e7cdc212a62145f6d6671e0683a4bdb0cc","abstract_canon_sha256":"412e99f1c3370f8146f297d4a2ae4c2f4ba41607cf1e4871235aac73b680c8d0"},"schema_version":"1.0"},"canonical_sha256":"9a9fbb9ddec9c3ee92d2d7a2fe3bf85c22861add793cf12e0be5554faebbf1ef","source":{"kind":"arxiv","id":"1905.12621","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1905.12621","created_at":"2026-05-17T23:44:41Z"},{"alias_kind":"arxiv_version","alias_value":"1905.12621v1","created_at":"2026-05-17T23:44:41Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1905.12621","created_at":"2026-05-17T23:44:41Z"},{"alias_kind":"pith_short_12","alias_value":"TKP3XHO6ZHB6","created_at":"2026-05-18T12:33:30Z"},{"alias_kind":"pith_short_16","alias_value":"TKP3XHO6ZHB65EWS","created_at":"2026-05-18T12:33:30Z"},{"alias_kind":"pith_short_8","alias_value":"TKP3XHO6","created_at":"2026-05-18T12:33:30Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2019:TKP3XHO6ZHB65EWS26RP4O7YLQ","target":"record","payload":{"canonical_record":{"source":{"id":"1905.12621","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2019-05-27T09:25:16Z","cross_cats_sorted":["stat.ML"],"title_canon_sha256":"dc96ac0053a2aa0734b8c545783501e7cdc212a62145f6d6671e0683a4bdb0cc","abstract_canon_sha256":"412e99f1c3370f8146f297d4a2ae4c2f4ba41607cf1e4871235aac73b680c8d0"},"schema_version":"1.0"},"canonical_sha256":"9a9fbb9ddec9c3ee92d2d7a2fe3bf85c22861add793cf12e0be5554faebbf1ef","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-17T23:44:41.886041Z","signature_b64":"ReBKmIDfCPCWezMnn14amNFzEVgjhadhAhYhrKqDdxc5k/u9VwUq+MDindiypqOME7NqJGSAq9wjCDuycfrzAQ==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"9a9fbb9ddec9c3ee92d2d7a2fe3bf85c22861add793cf12e0be5554faebbf1ef","last_reissued_at":"2026-05-17T23:44:41.885547Z","signature_status":"signed_v1","first_computed_at":"2026-05-17T23:44:41.885547Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1905.12621","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-17T23:44:41Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"45iwogymAkwb6HeRYv1M35uG4HcWUotdqhubzhsBIxSMaAKVRcBtuQ8cnemA0wFMFBP/bLG7HlWsegueWP1jBg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-09T03:43:25.760026Z"},"content_sha256":"cf403547496340a4e25774a8610f32cd0f3f43b216e8564593638babe805393d","schema_version":"1.0","event_id":"sha256:cf403547496340a4e25774a8610f32cd0f3f43b216e8564593638babe805393d"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2019:TKP3XHO6ZHB65EWS26RP4O7YLQ","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Learning latent state representation for speeding up exploration","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["stat.ML"],"primary_cat":"cs.LG","authors_text":"Abhishek Gupta, Giulia Vezzani, Lorenzo Natale, Pieter Abbeel","submitted_at":"2019-05-27T09:25:16Z","abstract_excerpt":"Exploration is an extremely challenging problem in reinforcement learning, especially in high dimensional state and action spaces and when only sparse rewards are available. Effective representations can indicate which components of the state are task relevant and thus reduce the dimensionality of the space to explore. In this work, we take a representation learning viewpoint on exploration, utilizing prior experience to learn effective latent representations, which can subsequently indicate which regions to explore. Prior experience on separate but related tasks help learn representations of "},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1905.12621","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-17T23:44:41Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"VP02QDAFzWcCPqXopNfZHryniLMt1i9EcG+Q20+bB0ivf7jvtLfyYKjTGqxN01kkEJr4sRfPboKUFzWSHY6MAg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-09T03:43:25.760745Z"},"content_sha256":"ef9bf4ba9db5b3f22a3942bac25985d347d9fc47f1ffc6c1cb958f61c076c6e5","schema_version":"1.0","event_id":"sha256:ef9bf4ba9db5b3f22a3942bac25985d347d9fc47f1ffc6c1cb958f61c076c6e5"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/TKP3XHO6ZHB65EWS26RP4O7YLQ/bundle.json","state_url":"https://pith.science/pith/TKP3XHO6ZHB65EWS26RP4O7YLQ/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/TKP3XHO6ZHB65EWS26RP4O7YLQ/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-09T03:43:25Z","links":{"resolver":"https://pith.science/pith/TKP3XHO6ZHB65EWS26RP4O7YLQ","bundle":"https://pith.science/pith/TKP3XHO6ZHB65EWS26RP4O7YLQ/bundle.json","state":"https://pith.science/pith/TKP3XHO6ZHB65EWS26RP4O7YLQ/state.json","well_known_bundle":"https://pith.science/.well-known/pith/TKP3XHO6ZHB65EWS26RP4O7YLQ/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2019:TKP3XHO6ZHB65EWS26RP4O7YLQ","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"412e99f1c3370f8146f297d4a2ae4c2f4ba41607cf1e4871235aac73b680c8d0","cross_cats_sorted":["stat.ML"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2019-05-27T09:25:16Z","title_canon_sha256":"dc96ac0053a2aa0734b8c545783501e7cdc212a62145f6d6671e0683a4bdb0cc"},"schema_version":"1.0","source":{"id":"1905.12621","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1905.12621","created_at":"2026-05-17T23:44:41Z"},{"alias_kind":"arxiv_version","alias_value":"1905.12621v1","created_at":"2026-05-17T23:44:41Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1905.12621","created_at":"2026-05-17T23:44:41Z"},{"alias_kind":"pith_short_12","alias_value":"TKP3XHO6ZHB6","created_at":"2026-05-18T12:33:30Z"},{"alias_kind":"pith_short_16","alias_value":"TKP3XHO6ZHB65EWS","created_at":"2026-05-18T12:33:30Z"},{"alias_kind":"pith_short_8","alias_value":"TKP3XHO6","created_at":"2026-05-18T12:33:30Z"}],"graph_snapshots":[{"event_id":"sha256:ef9bf4ba9db5b3f22a3942bac25985d347d9fc47f1ffc6c1cb958f61c076c6e5","target":"graph","created_at":"2026-05-17T23:44:41Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Exploration is an extremely challenging problem in reinforcement learning, especially in high dimensional state and action spaces and when only sparse rewards are available. Effective representations can indicate which components of the state are task relevant and thus reduce the dimensionality of the space to explore. In this work, we take a representation learning viewpoint on exploration, utilizing prior experience to learn effective latent representations, which can subsequently indicate which regions to explore. Prior experience on separate but related tasks help learn representations of ","authors_text":"Abhishek Gupta, Giulia Vezzani, Lorenzo Natale, Pieter Abbeel","cross_cats":["stat.ML"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2019-05-27T09:25:16Z","title":"Learning latent state representation for speeding up exploration"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1905.12621","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:cf403547496340a4e25774a8610f32cd0f3f43b216e8564593638babe805393d","target":"record","created_at":"2026-05-17T23:44:41Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"412e99f1c3370f8146f297d4a2ae4c2f4ba41607cf1e4871235aac73b680c8d0","cross_cats_sorted":["stat.ML"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2019-05-27T09:25:16Z","title_canon_sha256":"dc96ac0053a2aa0734b8c545783501e7cdc212a62145f6d6671e0683a4bdb0cc"},"schema_version":"1.0","source":{"id":"1905.12621","kind":"arxiv","version":1}},"canonical_sha256":"9a9fbb9ddec9c3ee92d2d7a2fe3bf85c22861add793cf12e0be5554faebbf1ef","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"9a9fbb9ddec9c3ee92d2d7a2fe3bf85c22861add793cf12e0be5554faebbf1ef","first_computed_at":"2026-05-17T23:44:41.885547Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-17T23:44:41.885547Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"ReBKmIDfCPCWezMnn14amNFzEVgjhadhAhYhrKqDdxc5k/u9VwUq+MDindiypqOME7NqJGSAq9wjCDuycfrzAQ==","signature_status":"signed_v1","signed_at":"2026-05-17T23:44:41.886041Z","signed_message":"canonical_sha256_bytes"},"source_id":"1905.12621","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:cf403547496340a4e25774a8610f32cd0f3f43b216e8564593638babe805393d","sha256:ef9bf4ba9db5b3f22a3942bac25985d347d9fc47f1ffc6c1cb958f61c076c6e5"],"state_sha256":"7d766b01878d1ed3e92aa1ef7b002232aa63a73aab56fc3bbaa5deb7e962f45b"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"1y1rDxdRnDqILnfMpxjTUigaV2vuSQQpOAsibBnKbjTxlR6GGafRovcFJra+y3dBB/qRzBF2vh7xlc3LBGj0Cg==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-09T03:43:25.764532Z","bundle_sha256":"ff375c65e613c41f9e30beb22a01d846695fb87172cd907e7efcacfb7693bc13"}}