{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2018:T6UMGKV3LIED2JMDIO7Z72VBUS","short_pith_number":"pith:T6UMGKV3","canonical_record":{"source":{"id":"1812.07452","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2018-12-18T16:08:57Z","cross_cats_sorted":["cs.AI","stat.ML"],"title_canon_sha256":"ec9de4919603795d7377c85fae807b4cbc965f267b5a97fad4a4679ed7556401","abstract_canon_sha256":"01345bc2028335bcc0ccd78988f610cc299e209ac4f0b806572c5c3ec40850eb"},"schema_version":"1.0"},"canonical_sha256":"9fa8c32abb5a083d258343bf9feaa1a48be74bf68dc297309c93d166758f5ac1","source":{"kind":"arxiv","id":"1812.07452","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1812.07452","created_at":"2026-05-17T23:58:00Z"},{"alias_kind":"arxiv_version","alias_value":"1812.07452v1","created_at":"2026-05-17T23:58:00Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1812.07452","created_at":"2026-05-17T23:58:00Z"},{"alias_kind":"pith_short_12","alias_value":"T6UMGKV3LIED","created_at":"2026-05-18T12:32:53Z"},{"alias_kind":"pith_short_16","alias_value":"T6UMGKV3LIED2JMD","created_at":"2026-05-18T12:32:53Z"},{"alias_kind":"pith_short_8","alias_value":"T6UMGKV3","created_at":"2026-05-18T12:32:53Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2018:T6UMGKV3LIED2JMDIO7Z72VBUS","target":"record","payload":{"canonical_record":{"source":{"id":"1812.07452","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2018-12-18T16:08:57Z","cross_cats_sorted":["cs.AI","stat.ML"],"title_canon_sha256":"ec9de4919603795d7377c85fae807b4cbc965f267b5a97fad4a4679ed7556401","abstract_canon_sha256":"01345bc2028335bcc0ccd78988f610cc299e209ac4f0b806572c5c3ec40850eb"},"schema_version":"1.0"},"canonical_sha256":"9fa8c32abb5a083d258343bf9feaa1a48be74bf68dc297309c93d166758f5ac1","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-17T23:58:00.468391Z","signature_b64":"6qcg2NRmRjLEyXwwYQTzKwFnyrJZHavqvJJbbruabKef4U6jzh1eXIKuojlAkx0TXLt4Qw+eVkmS9kwgzI7wDA==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"9fa8c32abb5a083d258343bf9feaa1a48be74bf68dc297309c93d166758f5ac1","last_reissued_at":"2026-05-17T23:58:00.467784Z","signature_status":"signed_v1","first_computed_at":"2026-05-17T23:58:00.467784Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1812.07452","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-17T23:58:00Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"ZTo552hQZ08TTaep4F4vSYMrmp+px2BLn3pcBHV1phQb2Zfx6IM8MKp//B6K7pdqGY+iOqt6lah08OwZiPqRDg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-24T16:25:48.262106Z"},"content_sha256":"479f3d26e2a2fb4a05fa463dd6fa0aef8c74de046e4bbc8c88f4b29cef6c0b80","schema_version":"1.0","event_id":"sha256:479f3d26e2a2fb4a05fa463dd6fa0aef8c74de046e4bbc8c88f4b29cef6c0b80"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2018:T6UMGKV3LIED2JMDIO7Z72VBUS","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Domain Adaptation for Reinforcement Learning on the Atari","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.AI","stat.ML"],"primary_cat":"cs.LG","authors_text":"George Vogiatzis, Maria Chli, Thomas Carr","submitted_at":"2018-12-18T16:08:57Z","abstract_excerpt":"Deep reinforcement learning agents have recently been successful across a variety of discrete and continuous control tasks; however, they can be slow to train and require a large number of interactions with the environment to learn a suitable policy. This is borne out by the fact that a reinforcement learning agent has no prior knowledge of the world, no pre-existing data to depend on and so must devote considerable time to exploration. Transfer learning can alleviate some of the problems by leveraging learning done on some source task to help learning on some target task. Our work presents an"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1812.07452","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-17T23:58:00Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"LaBnlyQPNz+U4zJcw8qMWmL2+tZRPrXQqusoasJsRXYc43VXjDfH7LElJQ+klhXpjmpyNF7hcFRr1e4dPd9PCg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-24T16:25:48.262469Z"},"content_sha256":"ceebe32b9e9206834fde4379d64f477de21c093b0513b89bd74423b1a7289a50","schema_version":"1.0","event_id":"sha256:ceebe32b9e9206834fde4379d64f477de21c093b0513b89bd74423b1a7289a50"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/T6UMGKV3LIED2JMDIO7Z72VBUS/bundle.json","state_url":"https://pith.science/pith/T6UMGKV3LIED2JMDIO7Z72VBUS/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/T6UMGKV3LIED2JMDIO7Z72VBUS/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-24T16:25:48Z","links":{"resolver":"https://pith.science/pith/T6UMGKV3LIED2JMDIO7Z72VBUS","bundle":"https://pith.science/pith/T6UMGKV3LIED2JMDIO7Z72VBUS/bundle.json","state":"https://pith.science/pith/T6UMGKV3LIED2JMDIO7Z72VBUS/state.json","well_known_bundle":"https://pith.science/.well-known/pith/T6UMGKV3LIED2JMDIO7Z72VBUS/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2018:T6UMGKV3LIED2JMDIO7Z72VBUS","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"01345bc2028335bcc0ccd78988f610cc299e209ac4f0b806572c5c3ec40850eb","cross_cats_sorted":["cs.AI","stat.ML"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2018-12-18T16:08:57Z","title_canon_sha256":"ec9de4919603795d7377c85fae807b4cbc965f267b5a97fad4a4679ed7556401"},"schema_version":"1.0","source":{"id":"1812.07452","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1812.07452","created_at":"2026-05-17T23:58:00Z"},{"alias_kind":"arxiv_version","alias_value":"1812.07452v1","created_at":"2026-05-17T23:58:00Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1812.07452","created_at":"2026-05-17T23:58:00Z"},{"alias_kind":"pith_short_12","alias_value":"T6UMGKV3LIED","created_at":"2026-05-18T12:32:53Z"},{"alias_kind":"pith_short_16","alias_value":"T6UMGKV3LIED2JMD","created_at":"2026-05-18T12:32:53Z"},{"alias_kind":"pith_short_8","alias_value":"T6UMGKV3","created_at":"2026-05-18T12:32:53Z"}],"graph_snapshots":[{"event_id":"sha256:ceebe32b9e9206834fde4379d64f477de21c093b0513b89bd74423b1a7289a50","target":"graph","created_at":"2026-05-17T23:58:00Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Deep reinforcement learning agents have recently been successful across a variety of discrete and continuous control tasks; however, they can be slow to train and require a large number of interactions with the environment to learn a suitable policy. This is borne out by the fact that a reinforcement learning agent has no prior knowledge of the world, no pre-existing data to depend on and so must devote considerable time to exploration. Transfer learning can alleviate some of the problems by leveraging learning done on some source task to help learning on some target task. Our work presents an","authors_text":"George Vogiatzis, Maria Chli, Thomas Carr","cross_cats":["cs.AI","stat.ML"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2018-12-18T16:08:57Z","title":"Domain Adaptation for Reinforcement Learning on the Atari"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1812.07452","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:479f3d26e2a2fb4a05fa463dd6fa0aef8c74de046e4bbc8c88f4b29cef6c0b80","target":"record","created_at":"2026-05-17T23:58:00Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"01345bc2028335bcc0ccd78988f610cc299e209ac4f0b806572c5c3ec40850eb","cross_cats_sorted":["cs.AI","stat.ML"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2018-12-18T16:08:57Z","title_canon_sha256":"ec9de4919603795d7377c85fae807b4cbc965f267b5a97fad4a4679ed7556401"},"schema_version":"1.0","source":{"id":"1812.07452","kind":"arxiv","version":1}},"canonical_sha256":"9fa8c32abb5a083d258343bf9feaa1a48be74bf68dc297309c93d166758f5ac1","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"9fa8c32abb5a083d258343bf9feaa1a48be74bf68dc297309c93d166758f5ac1","first_computed_at":"2026-05-17T23:58:00.467784Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-17T23:58:00.467784Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"6qcg2NRmRjLEyXwwYQTzKwFnyrJZHavqvJJbbruabKef4U6jzh1eXIKuojlAkx0TXLt4Qw+eVkmS9kwgzI7wDA==","signature_status":"signed_v1","signed_at":"2026-05-17T23:58:00.468391Z","signed_message":"canonical_sha256_bytes"},"source_id":"1812.07452","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:479f3d26e2a2fb4a05fa463dd6fa0aef8c74de046e4bbc8c88f4b29cef6c0b80","sha256:ceebe32b9e9206834fde4379d64f477de21c093b0513b89bd74423b1a7289a50"],"state_sha256":"c2b0d7a38eb3bb4946d2ae5d144d4a7f38a9966c3ffa816290c4cb468c530ef6"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"wyOUj+jyV7E7v3QlPKxP+Vp7YRlqNd/TeaZPfop7t6uI1568Uynrfbdu3w0HLgkjxu0stVO7iWzQ0sFpTBQVBQ==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-24T16:25:48.264348Z","bundle_sha256":"64d97849268858d2f9b813866f8b265092af87247290e46de840e779ee2543ac"}}