{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2018:7BIMGNMH6PDMKL75B7YM3RGCYP","short_pith_number":"pith:7BIMGNMH","canonical_record":{"source":{"id":"1806.10729","kind":"arxiv","version":5},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2018-06-28T01:16:11Z","cross_cats_sorted":["cs.AI","stat.ML"],"title_canon_sha256":"9843b21eb3500d780249a9f679f4f4372c9959c237079643d97b958e409eb082","abstract_canon_sha256":"791b05255c4de7cf675b1a0006d0c96ba4f88c5a5ee0dd5d47017411463753d1"},"schema_version":"1.0"},"canonical_sha256":"f850c33587f3c6c52ffd0ff0cdc4c2c3edb3aaf5c76af0c31a54765e29173834","source":{"kind":"arxiv","id":"1806.10729","version":5},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1806.10729","created_at":"2026-05-17T23:59:38Z"},{"alias_kind":"arxiv_version","alias_value":"1806.10729v5","created_at":"2026-05-17T23:59:38Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1806.10729","created_at":"2026-05-17T23:59:38Z"},{"alias_kind":"pith_short_12","alias_value":"7BIMGNMH6PDM","created_at":"2026-05-18T12:32:11Z"},{"alias_kind":"pith_short_16","alias_value":"7BIMGNMH6PDMKL75","created_at":"2026-05-18T12:32:11Z"},{"alias_kind":"pith_short_8","alias_value":"7BIMGNMH","created_at":"2026-05-18T12:32:11Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2018:7BIMGNMH6PDMKL75B7YM3RGCYP","target":"record","payload":{"canonical_record":{"source":{"id":"1806.10729","kind":"arxiv","version":5},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2018-06-28T01:16:11Z","cross_cats_sorted":["cs.AI","stat.ML"],"title_canon_sha256":"9843b21eb3500d780249a9f679f4f4372c9959c237079643d97b958e409eb082","abstract_canon_sha256":"791b05255c4de7cf675b1a0006d0c96ba4f88c5a5ee0dd5d47017411463753d1"},"schema_version":"1.0"},"canonical_sha256":"f850c33587f3c6c52ffd0ff0cdc4c2c3edb3aaf5c76af0c31a54765e29173834","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-17T23:59:38.625965Z","signature_b64":"mCnJ5pPY034sWMT2mKsIijmhp03/sTlpPxD85fnuijefszvzNzQD/lNrjOCHG905tuTz4O8RK5LHYAEYJklMDw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"f850c33587f3c6c52ffd0ff0cdc4c2c3edb3aaf5c76af0c31a54765e29173834","last_reissued_at":"2026-05-17T23:59:38.625183Z","signature_status":"signed_v1","first_computed_at":"2026-05-17T23:59:38.625183Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1806.10729","source_version":5,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-17T23:59:38Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"DPtY8y4FIdYltGvru8laXlWt4J1w6nUntKQUng5ZriFdRw97FAtSy9t53WH1BdzS0rwLf8w8AlILAL0SRmjTAA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-29T22:28:25.155632Z"},"content_sha256":"380bc0becfd2126d48d59e00b5f874d6bb65c3e415b8275f257da897756e2b51","schema_version":"1.0","event_id":"sha256:380bc0becfd2126d48d59e00b5f874d6bb65c3e415b8275f257da897756e2b51"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2018:7BIMGNMH6PDMKL75B7YM3RGCYP","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Illuminating Generalization in Deep Reinforcement Learning through Procedural Level Generation","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.AI","stat.ML"],"primary_cat":"cs.LG","authors_text":"Ahmed Khalifa, Julian Togelius, Niels Justesen, Philip Bontrager, Ruben Rodriguez Torrado, Sebastian Risi","submitted_at":"2018-06-28T01:16:11Z","abstract_excerpt":"Deep reinforcement learning (RL) has shown impressive results in a variety of domains, learning directly from high-dimensional sensory streams. However, when neural networks are trained in a fixed environment, such as a single level in a video game, they will usually overfit and fail to generalize to new levels. When RL models overfit, even slight modifications to the environment can result in poor agent performance. This paper explores how procedurally generated levels during training can increase generality. We show that for some games procedural level generation enables generalization to ne"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1806.10729","kind":"arxiv","version":5},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-17T23:59:38Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"ZCq2Lk66P9Zc5y4ZhwDDZoN1ITWj7YiAbB2E1jHXRwY60QrrMtnXYLU298kPjeVTe1CO4GGsW/ZiXXZbRwwlAA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-29T22:28:25.156304Z"},"content_sha256":"4cf6a1ce792736931eb019b50c76afcbf3de3771af48bf62a935047d06867f52","schema_version":"1.0","event_id":"sha256:4cf6a1ce792736931eb019b50c76afcbf3de3771af48bf62a935047d06867f52"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/7BIMGNMH6PDMKL75B7YM3RGCYP/bundle.json","state_url":"https://pith.science/pith/7BIMGNMH6PDMKL75B7YM3RGCYP/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/7BIMGNMH6PDMKL75B7YM3RGCYP/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-29T22:28:25Z","links":{"resolver":"https://pith.science/pith/7BIMGNMH6PDMKL75B7YM3RGCYP","bundle":"https://pith.science/pith/7BIMGNMH6PDMKL75B7YM3RGCYP/bundle.json","state":"https://pith.science/pith/7BIMGNMH6PDMKL75B7YM3RGCYP/state.json","well_known_bundle":"https://pith.science/.well-known/pith/7BIMGNMH6PDMKL75B7YM3RGCYP/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2018:7BIMGNMH6PDMKL75B7YM3RGCYP","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"791b05255c4de7cf675b1a0006d0c96ba4f88c5a5ee0dd5d47017411463753d1","cross_cats_sorted":["cs.AI","stat.ML"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2018-06-28T01:16:11Z","title_canon_sha256":"9843b21eb3500d780249a9f679f4f4372c9959c237079643d97b958e409eb082"},"schema_version":"1.0","source":{"id":"1806.10729","kind":"arxiv","version":5}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1806.10729","created_at":"2026-05-17T23:59:38Z"},{"alias_kind":"arxiv_version","alias_value":"1806.10729v5","created_at":"2026-05-17T23:59:38Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1806.10729","created_at":"2026-05-17T23:59:38Z"},{"alias_kind":"pith_short_12","alias_value":"7BIMGNMH6PDM","created_at":"2026-05-18T12:32:11Z"},{"alias_kind":"pith_short_16","alias_value":"7BIMGNMH6PDMKL75","created_at":"2026-05-18T12:32:11Z"},{"alias_kind":"pith_short_8","alias_value":"7BIMGNMH","created_at":"2026-05-18T12:32:11Z"}],"graph_snapshots":[{"event_id":"sha256:4cf6a1ce792736931eb019b50c76afcbf3de3771af48bf62a935047d06867f52","target":"graph","created_at":"2026-05-17T23:59:38Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Deep reinforcement learning (RL) has shown impressive results in a variety of domains, learning directly from high-dimensional sensory streams. However, when neural networks are trained in a fixed environment, such as a single level in a video game, they will usually overfit and fail to generalize to new levels. When RL models overfit, even slight modifications to the environment can result in poor agent performance. This paper explores how procedurally generated levels during training can increase generality. We show that for some games procedural level generation enables generalization to ne","authors_text":"Ahmed Khalifa, Julian Togelius, Niels Justesen, Philip Bontrager, Ruben Rodriguez Torrado, Sebastian Risi","cross_cats":["cs.AI","stat.ML"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2018-06-28T01:16:11Z","title":"Illuminating Generalization in Deep Reinforcement Learning through Procedural Level Generation"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1806.10729","kind":"arxiv","version":5},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:380bc0becfd2126d48d59e00b5f874d6bb65c3e415b8275f257da897756e2b51","target":"record","created_at":"2026-05-17T23:59:38Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"791b05255c4de7cf675b1a0006d0c96ba4f88c5a5ee0dd5d47017411463753d1","cross_cats_sorted":["cs.AI","stat.ML"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2018-06-28T01:16:11Z","title_canon_sha256":"9843b21eb3500d780249a9f679f4f4372c9959c237079643d97b958e409eb082"},"schema_version":"1.0","source":{"id":"1806.10729","kind":"arxiv","version":5}},"canonical_sha256":"f850c33587f3c6c52ffd0ff0cdc4c2c3edb3aaf5c76af0c31a54765e29173834","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"f850c33587f3c6c52ffd0ff0cdc4c2c3edb3aaf5c76af0c31a54765e29173834","first_computed_at":"2026-05-17T23:59:38.625183Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-17T23:59:38.625183Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"mCnJ5pPY034sWMT2mKsIijmhp03/sTlpPxD85fnuijefszvzNzQD/lNrjOCHG905tuTz4O8RK5LHYAEYJklMDw==","signature_status":"signed_v1","signed_at":"2026-05-17T23:59:38.625965Z","signed_message":"canonical_sha256_bytes"},"source_id":"1806.10729","source_kind":"arxiv","source_version":5}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:380bc0becfd2126d48d59e00b5f874d6bb65c3e415b8275f257da897756e2b51","sha256:4cf6a1ce792736931eb019b50c76afcbf3de3771af48bf62a935047d06867f52"],"state_sha256":"e18d2247b9bcf0a18ba57d07a538394d5b09207020d4a6fa4a77af6a5da7df50"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"EN/6H70KuEcnDjNtVn0wiH8Ov1LiMDN63uj/4Ke7hbmZrUuVmrxm/OfzBd1+QQOlm6Ux53puWuzlNikvyPIjCw==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-29T22:28:25.159793Z","bundle_sha256":"b7dd2f9532a376d91cabea3880d4d74a8078bd318263c13ce9534042a0b085a9"}}