{"record_type":"pith_number_record","schema_url":"https://pith.science/schemas/pith-number/v1.json","pith_number":"pith:2015:F2LZEFTFOQ5JLJJA2RL6GIBNUD","short_pith_number":"pith:F2LZEFTF","schema_version":"1.0","canonical_sha256":"2e97921665743a95a520d457e3202da0e17bd767815522d4b8639cdf84b746a7","source":{"kind":"arxiv","id":"1512.01563","version":2},"attestation_state":"computed","paper":{"title":"State of the Art Control of Atari Games Using Shallow Reinforcement Learning","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.LG","authors_text":"Erik Talvitie, Marlos C. Machado, Michael Bowling, Yitao Liang","submitted_at":"2015-12-04T21:06:04Z","abstract_excerpt":"The recently introduced Deep Q-Networks (DQN) algorithm has gained attention as one of the first successful combinations of deep neural networks and reinforcement learning. Its promise was demonstrated in the Arcade Learning Environment (ALE), a challenging framework composed of dozens of Atari 2600 games used to evaluate general competency in AI. It achieved dramatically better results than earlier approaches, showing that its ability to learn good representations is quite robust and general. This paper attempts to understand the principles that underlie DQN's impressive performance and to be"},"verification_status":{"content_addressed":true,"pith_receipt":true,"author_attested":false,"weak_author_claims":0,"strong_author_claims":0,"externally_anchored":false,"storage_verified":false,"citation_signatures":0,"replication_records":0,"graph_snapshot":true,"references_resolved":false,"formal_links_present":false},"canonical_record":{"source":{"id":"1512.01563","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2015-12-04T21:06:04Z","cross_cats_sorted":[],"title_canon_sha256":"31c6cca8acc36950e467538d7fb22708931aca23d766c46943b9009c0177b469","abstract_canon_sha256":"00d8213ca0bfe44b28a149036a5785bed6874a41cacb06e0798c3526180d7e7c"},"schema_version":"1.0"},"receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T01:16:29.408603Z","signature_b64":"wUDJkKU/yD8tHROK2F6v6KvomySizT9sjAZiA+cJutxFesJzmH55A7JZef8M8q2u+sK7pjF/sgFlZ+1ffoC1AA==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"2e97921665743a95a520d457e3202da0e17bd767815522d4b8639cdf84b746a7","last_reissued_at":"2026-05-18T01:16:29.408092Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T01:16:29.408092Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"graph_snapshot":{"paper":{"title":"State of the Art Control of Atari Games Using Shallow Reinforcement Learning","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.LG","authors_text":"Erik Talvitie, Marlos C. Machado, Michael Bowling, Yitao Liang","submitted_at":"2015-12-04T21:06:04Z","abstract_excerpt":"The recently introduced Deep Q-Networks (DQN) algorithm has gained attention as one of the first successful combinations of deep neural networks and reinforcement learning. Its promise was demonstrated in the Arcade Learning Environment (ALE), a challenging framework composed of dozens of Atari 2600 games used to evaluate general competency in AI. It achieved dramatically better results than earlier approaches, showing that its ability to learn good representations is quite robust and general. This paper attempts to understand the principles that underlie DQN's impressive performance and to be"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1512.01563","kind":"arxiv","version":2},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"aliases":[{"alias_kind":"arxiv","alias_value":"1512.01563","created_at":"2026-05-18T01:16:29.408157+00:00"},{"alias_kind":"arxiv_version","alias_value":"1512.01563v2","created_at":"2026-05-18T01:16:29.408157+00:00"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1512.01563","created_at":"2026-05-18T01:16:29.408157+00:00"},{"alias_kind":"pith_short_12","alias_value":"F2LZEFTFOQ5J","created_at":"2026-05-18T12:29:19.899920+00:00"},{"alias_kind":"pith_short_16","alias_value":"F2LZEFTFOQ5JLJJA","created_at":"2026-05-18T12:29:19.899920+00:00"},{"alias_kind":"pith_short_8","alias_value":"F2LZEFTF","created_at":"2026-05-18T12:29:19.899920+00:00"}],"events":[],"event_summary":{},"paper_claims":[],"inbound_citations":{"count":0,"internal_anchor_count":0,"sample":[]},"formal_canon":{"evidence_count":0,"sample":[],"anchors":[]},"links":{"html":"https://pith.science/pith/F2LZEFTFOQ5JLJJA2RL6GIBNUD","json":"https://pith.science/pith/F2LZEFTFOQ5JLJJA2RL6GIBNUD.json","graph_json":"https://pith.science/api/pith-number/F2LZEFTFOQ5JLJJA2RL6GIBNUD/graph.json","events_json":"https://pith.science/api/pith-number/F2LZEFTFOQ5JLJJA2RL6GIBNUD/events.json","paper":"https://pith.science/paper/F2LZEFTF"},"agent_actions":{"view_html":"https://pith.science/pith/F2LZEFTFOQ5JLJJA2RL6GIBNUD","download_json":"https://pith.science/pith/F2LZEFTFOQ5JLJJA2RL6GIBNUD.json","view_paper":"https://pith.science/paper/F2LZEFTF","resolve_alias":"https://pith.science/api/pith-number/resolve?arxiv=1512.01563&json=true","fetch_graph":"https://pith.science/api/pith-number/F2LZEFTFOQ5JLJJA2RL6GIBNUD/graph.json","fetch_events":"https://pith.science/api/pith-number/F2LZEFTFOQ5JLJJA2RL6GIBNUD/events.json","actions":{"anchor_timestamp":"https://pith.science/pith/F2LZEFTFOQ5JLJJA2RL6GIBNUD/action/timestamp_anchor","attest_storage":"https://pith.science/pith/F2LZEFTFOQ5JLJJA2RL6GIBNUD/action/storage_attestation","attest_author":"https://pith.science/pith/F2LZEFTFOQ5JLJJA2RL6GIBNUD/action/author_attestation","sign_citation":"https://pith.science/pith/F2LZEFTFOQ5JLJJA2RL6GIBNUD/action/citation_signature","submit_replication":"https://pith.science/pith/F2LZEFTFOQ5JLJJA2RL6GIBNUD/action/replication_record"}},"created_at":"2026-05-18T01:16:29.408157+00:00","updated_at":"2026-05-18T01:16:29.408157+00:00"}