{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2016:JJOK62EJWLCVMOY364RHBJNAMH","short_pith_number":"pith:JJOK62EJ","canonical_record":{"source":{"id":"1611.02205","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2016-11-07T18:33:38Z","cross_cats_sorted":["cs.AI"],"title_canon_sha256":"b3b08c38d3dbea2b0008aaf0d86c7f3cf90587014c27362f092eb7b071471eb9","abstract_canon_sha256":"4c33f707ed18401144eafa5976b5d4d7ff5927d20df7ca685565e05ab69f88b7"},"schema_version":"1.0"},"canonical_sha256":"4a5caf6889b2c5563b1bf72270a5a061c1e14f13e7821699ca2858626e28cfcc","source":{"kind":"arxiv","id":"1611.02205","version":2},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1611.02205","created_at":"2026-05-18T00:51:13Z"},{"alias_kind":"arxiv_version","alias_value":"1611.02205v2","created_at":"2026-05-18T00:51:13Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1611.02205","created_at":"2026-05-18T00:51:13Z"},{"alias_kind":"pith_short_12","alias_value":"JJOK62EJWLCV","created_at":"2026-05-18T12:30:25Z"},{"alias_kind":"pith_short_16","alias_value":"JJOK62EJWLCVMOY3","created_at":"2026-05-18T12:30:25Z"},{"alias_kind":"pith_short_8","alias_value":"JJOK62EJ","created_at":"2026-05-18T12:30:25Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2016:JJOK62EJWLCVMOY364RHBJNAMH","target":"record","payload":{"canonical_record":{"source":{"id":"1611.02205","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2016-11-07T18:33:38Z","cross_cats_sorted":["cs.AI"],"title_canon_sha256":"b3b08c38d3dbea2b0008aaf0d86c7f3cf90587014c27362f092eb7b071471eb9","abstract_canon_sha256":"4c33f707ed18401144eafa5976b5d4d7ff5927d20df7ca685565e05ab69f88b7"},"schema_version":"1.0"},"canonical_sha256":"4a5caf6889b2c5563b1bf72270a5a061c1e14f13e7821699ca2858626e28cfcc","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:51:13.296682Z","signature_b64":"nO0GxWlp7+qD6BKoqWr0EAIQlbjP5EU+Z+sqe7ncM0huXcssHmrOvpMzRqby7iVlBzYdlUYsYBBIdJcLaSspAQ==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"4a5caf6889b2c5563b1bf72270a5a061c1e14f13e7821699ca2858626e28cfcc","last_reissued_at":"2026-05-18T00:51:13.295932Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:51:13.295932Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1611.02205","source_version":2,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:51:13Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"BOoPQYOC3zw43y+Gexc9XVCHlaB8o6aInna8oD4e8KcIE46/Afyrfd9ql2A/GCM0qNItk+p6bf6AgdUtqwxGDw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-27T01:51:19.425891Z"},"content_sha256":"c05ad6486a41bf4c07ba63c9bf3ac37bbdf52108e5f8e2e661b8b6d6d2d3cb08","schema_version":"1.0","event_id":"sha256:c05ad6486a41bf4c07ba63c9bf3ac37bbdf52108e5f8e2e661b8b6d6d2d3cb08"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2016:JJOK62EJWLCVMOY364RHBJNAMH","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Playing SNES in the Retro Learning Environment","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.AI"],"primary_cat":"cs.LG","authors_text":"Itay Hubara, Nadav Bhonker, Shai Rozenberg","submitted_at":"2016-11-07T18:33:38Z","abstract_excerpt":"Mastering a video game requires skill, tactics and strategy. While these attributes may be acquired naturally by human players, teaching them to a computer program is a far more challenging task. In recent years, extensive research was carried out in the field of reinforcement learning and numerous algorithms were introduced, aiming to learn how to perform human tasks such as playing video games. As a result, the Arcade Learning Environment (ALE) (Bellemare et al., 2013) has become a commonly used benchmark environment allowing algorithms to train on various Atari 2600 games. In many games the"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1611.02205","kind":"arxiv","version":2},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:51:13Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"oYcFRa92PFRZtjQ6jk7JVPN9Rh0yYxweAWQX9+6p95opRj/OTUHPVMhuiIENQtHPzPRCoEpkszxaet2cKLSEAw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-27T01:51:19.426563Z"},"content_sha256":"631e24cdf89ee61b5486aa9a3937e46001c830b6a9094facb14dea80bd0ae8f0","schema_version":"1.0","event_id":"sha256:631e24cdf89ee61b5486aa9a3937e46001c830b6a9094facb14dea80bd0ae8f0"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/JJOK62EJWLCVMOY364RHBJNAMH/bundle.json","state_url":"https://pith.science/pith/JJOK62EJWLCVMOY364RHBJNAMH/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/JJOK62EJWLCVMOY364RHBJNAMH/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-27T01:51:19Z","links":{"resolver":"https://pith.science/pith/JJOK62EJWLCVMOY364RHBJNAMH","bundle":"https://pith.science/pith/JJOK62EJWLCVMOY364RHBJNAMH/bundle.json","state":"https://pith.science/pith/JJOK62EJWLCVMOY364RHBJNAMH/state.json","well_known_bundle":"https://pith.science/.well-known/pith/JJOK62EJWLCVMOY364RHBJNAMH/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2016:JJOK62EJWLCVMOY364RHBJNAMH","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"4c33f707ed18401144eafa5976b5d4d7ff5927d20df7ca685565e05ab69f88b7","cross_cats_sorted":["cs.AI"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2016-11-07T18:33:38Z","title_canon_sha256":"b3b08c38d3dbea2b0008aaf0d86c7f3cf90587014c27362f092eb7b071471eb9"},"schema_version":"1.0","source":{"id":"1611.02205","kind":"arxiv","version":2}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1611.02205","created_at":"2026-05-18T00:51:13Z"},{"alias_kind":"arxiv_version","alias_value":"1611.02205v2","created_at":"2026-05-18T00:51:13Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1611.02205","created_at":"2026-05-18T00:51:13Z"},{"alias_kind":"pith_short_12","alias_value":"JJOK62EJWLCV","created_at":"2026-05-18T12:30:25Z"},{"alias_kind":"pith_short_16","alias_value":"JJOK62EJWLCVMOY3","created_at":"2026-05-18T12:30:25Z"},{"alias_kind":"pith_short_8","alias_value":"JJOK62EJ","created_at":"2026-05-18T12:30:25Z"}],"graph_snapshots":[{"event_id":"sha256:631e24cdf89ee61b5486aa9a3937e46001c830b6a9094facb14dea80bd0ae8f0","target":"graph","created_at":"2026-05-18T00:51:13Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Mastering a video game requires skill, tactics and strategy. While these attributes may be acquired naturally by human players, teaching them to a computer program is a far more challenging task. In recent years, extensive research was carried out in the field of reinforcement learning and numerous algorithms were introduced, aiming to learn how to perform human tasks such as playing video games. As a result, the Arcade Learning Environment (ALE) (Bellemare et al., 2013) has become a commonly used benchmark environment allowing algorithms to train on various Atari 2600 games. In many games the","authors_text":"Itay Hubara, Nadav Bhonker, Shai Rozenberg","cross_cats":["cs.AI"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2016-11-07T18:33:38Z","title":"Playing SNES in the Retro Learning Environment"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1611.02205","kind":"arxiv","version":2},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:c05ad6486a41bf4c07ba63c9bf3ac37bbdf52108e5f8e2e661b8b6d6d2d3cb08","target":"record","created_at":"2026-05-18T00:51:13Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"4c33f707ed18401144eafa5976b5d4d7ff5927d20df7ca685565e05ab69f88b7","cross_cats_sorted":["cs.AI"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2016-11-07T18:33:38Z","title_canon_sha256":"b3b08c38d3dbea2b0008aaf0d86c7f3cf90587014c27362f092eb7b071471eb9"},"schema_version":"1.0","source":{"id":"1611.02205","kind":"arxiv","version":2}},"canonical_sha256":"4a5caf6889b2c5563b1bf72270a5a061c1e14f13e7821699ca2858626e28cfcc","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"4a5caf6889b2c5563b1bf72270a5a061c1e14f13e7821699ca2858626e28cfcc","first_computed_at":"2026-05-18T00:51:13.295932Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:51:13.295932Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"nO0GxWlp7+qD6BKoqWr0EAIQlbjP5EU+Z+sqe7ncM0huXcssHmrOvpMzRqby7iVlBzYdlUYsYBBIdJcLaSspAQ==","signature_status":"signed_v1","signed_at":"2026-05-18T00:51:13.296682Z","signed_message":"canonical_sha256_bytes"},"source_id":"1611.02205","source_kind":"arxiv","source_version":2}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:c05ad6486a41bf4c07ba63c9bf3ac37bbdf52108e5f8e2e661b8b6d6d2d3cb08","sha256:631e24cdf89ee61b5486aa9a3937e46001c830b6a9094facb14dea80bd0ae8f0"],"state_sha256":"7cec94f5e17b2bc245576df02aa2de272a03ad88e953849c7f4154d2019a2c9b"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"sqK/JIttO69SRlaG/UCyJMIhc6y21TZnpMo0wThzU3AbnVUaaiHv3lYVOclroOGqL/c4Ocxu26x5NlWDBXE2DA==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-27T01:51:19.429938Z","bundle_sha256":"62fdf0a2d96768d80d0aeaecda5c9a74b800ba9e60eb8da962615123f6b1237e"}}