{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2018:V3RQ63HELZOGZJ6TPBOEPTW4TF","short_pith_number":"pith:V3RQ63HE","canonical_record":{"source":{"id":"1801.08841","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.AI","submitted_at":"2018-01-26T15:12:31Z","cross_cats_sorted":["cs.GT"],"title_canon_sha256":"a8b4f4322eed19d3582749f2459715df1cba4de9e1547aff3d02034d5dca1fcf","abstract_canon_sha256":"1a9745f2d75bfcc11c9061f38c89a46ad2d96b354110bfdd4e61d006ef99f50a"},"schema_version":"1.0"},"canonical_sha256":"aee30f6ce45e5c6ca7d3785c47cedc9940c7958635fc1cddc562246dbc9adc63","source":{"kind":"arxiv","id":"1801.08841","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1801.08841","created_at":"2026-05-18T00:25:02Z"},{"alias_kind":"arxiv_version","alias_value":"1801.08841v1","created_at":"2026-05-18T00:25:02Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1801.08841","created_at":"2026-05-18T00:25:02Z"},{"alias_kind":"pith_short_12","alias_value":"V3RQ63HELZOG","created_at":"2026-05-18T12:32:56Z"},{"alias_kind":"pith_short_16","alias_value":"V3RQ63HELZOGZJ6T","created_at":"2026-05-18T12:32:56Z"},{"alias_kind":"pith_short_8","alias_value":"V3RQ63HE","created_at":"2026-05-18T12:32:56Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2018:V3RQ63HELZOGZJ6TPBOEPTW4TF","target":"record","payload":{"canonical_record":{"source":{"id":"1801.08841","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.AI","submitted_at":"2018-01-26T15:12:31Z","cross_cats_sorted":["cs.GT"],"title_canon_sha256":"a8b4f4322eed19d3582749f2459715df1cba4de9e1547aff3d02034d5dca1fcf","abstract_canon_sha256":"1a9745f2d75bfcc11c9061f38c89a46ad2d96b354110bfdd4e61d006ef99f50a"},"schema_version":"1.0"},"canonical_sha256":"aee30f6ce45e5c6ca7d3785c47cedc9940c7958635fc1cddc562246dbc9adc63","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:25:02.893551Z","signature_b64":"+LW/8sDGsy9VNxhcs8LmZKdOER26FJUKCl5sTwQV1MOd6Z9B6j0Hcfb9jUUSyYOppUHdWq0Lbp0cbo1MjxSCCg==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"aee30f6ce45e5c6ca7d3785c47cedc9940c7958635fc1cddc562246dbc9adc63","last_reissued_at":"2026-05-18T00:25:02.893109Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:25:02.893109Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1801.08841","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:25:02Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"oiRijUeRirpjK5MdGSNo+0V1ZTL+ZVWvpNcW80p+cWN4HoWG0GpyojOeg2WEXmrZWcuBGFCR9ORZj6vbHqwTCg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-21T21:35:27.705895Z"},"content_sha256":"3e6955c7cd6d5297b9d39f5cd7951bbd316ee868a1d1bc01aa8c8fcd68d0dce0","schema_version":"1.0","event_id":"sha256:3e6955c7cd6d5297b9d39f5cd7951bbd316ee868a1d1bc01aa8c8fcd68d0dce0"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2018:V3RQ63HELZOGZJ6TPBOEPTW4TF","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"FlashRL: A Reinforcement Learning Platform for Flash Games","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.GT"],"primary_cat":"cs.AI","authors_text":"Morten Goodwin, Ole-Christoffer Granmo, Per-Arne Andersen","submitted_at":"2018-01-26T15:12:31Z","abstract_excerpt":"Reinforcement Learning (RL) is a research area that has blossomed tremendously in recent years and has shown remarkable potential in among others successfully playing computer games. However, there only exists a few game platforms that provide diversity in tasks and state-space needed to advance RL algorithms. The existing platforms offer RL access to Atari- and a few web-based games, but no platform fully expose access to Flash games. This is unfortunate because applying RL to Flash games have potential to push the research of RL algorithms.\n  This paper introduces the Flash Reinforcement Lea"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1801.08841","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:25:02Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"0QIwly6k1h9HTz2zrRQ/DmDT5DR52lA/vQKWj+UQYd0biL1Zusx/o7d+GPPUPFb5+08qcLSH5kKEQqOl7pyXBg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-21T21:35:27.706250Z"},"content_sha256":"17c788c82dab7966d885ad802b0d723ec72df496a38e4f54b7d337734b7cfa3d","schema_version":"1.0","event_id":"sha256:17c788c82dab7966d885ad802b0d723ec72df496a38e4f54b7d337734b7cfa3d"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/V3RQ63HELZOGZJ6TPBOEPTW4TF/bundle.json","state_url":"https://pith.science/pith/V3RQ63HELZOGZJ6TPBOEPTW4TF/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/V3RQ63HELZOGZJ6TPBOEPTW4TF/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-21T21:35:27Z","links":{"resolver":"https://pith.science/pith/V3RQ63HELZOGZJ6TPBOEPTW4TF","bundle":"https://pith.science/pith/V3RQ63HELZOGZJ6TPBOEPTW4TF/bundle.json","state":"https://pith.science/pith/V3RQ63HELZOGZJ6TPBOEPTW4TF/state.json","well_known_bundle":"https://pith.science/.well-known/pith/V3RQ63HELZOGZJ6TPBOEPTW4TF/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2018:V3RQ63HELZOGZJ6TPBOEPTW4TF","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"1a9745f2d75bfcc11c9061f38c89a46ad2d96b354110bfdd4e61d006ef99f50a","cross_cats_sorted":["cs.GT"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.AI","submitted_at":"2018-01-26T15:12:31Z","title_canon_sha256":"a8b4f4322eed19d3582749f2459715df1cba4de9e1547aff3d02034d5dca1fcf"},"schema_version":"1.0","source":{"id":"1801.08841","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1801.08841","created_at":"2026-05-18T00:25:02Z"},{"alias_kind":"arxiv_version","alias_value":"1801.08841v1","created_at":"2026-05-18T00:25:02Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1801.08841","created_at":"2026-05-18T00:25:02Z"},{"alias_kind":"pith_short_12","alias_value":"V3RQ63HELZOG","created_at":"2026-05-18T12:32:56Z"},{"alias_kind":"pith_short_16","alias_value":"V3RQ63HELZOGZJ6T","created_at":"2026-05-18T12:32:56Z"},{"alias_kind":"pith_short_8","alias_value":"V3RQ63HE","created_at":"2026-05-18T12:32:56Z"}],"graph_snapshots":[{"event_id":"sha256:17c788c82dab7966d885ad802b0d723ec72df496a38e4f54b7d337734b7cfa3d","target":"graph","created_at":"2026-05-18T00:25:02Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Reinforcement Learning (RL) is a research area that has blossomed tremendously in recent years and has shown remarkable potential in among others successfully playing computer games. However, there only exists a few game platforms that provide diversity in tasks and state-space needed to advance RL algorithms. The existing platforms offer RL access to Atari- and a few web-based games, but no platform fully expose access to Flash games. This is unfortunate because applying RL to Flash games have potential to push the research of RL algorithms.\n  This paper introduces the Flash Reinforcement Lea","authors_text":"Morten Goodwin, Ole-Christoffer Granmo, Per-Arne Andersen","cross_cats":["cs.GT"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.AI","submitted_at":"2018-01-26T15:12:31Z","title":"FlashRL: A Reinforcement Learning Platform for Flash Games"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1801.08841","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:3e6955c7cd6d5297b9d39f5cd7951bbd316ee868a1d1bc01aa8c8fcd68d0dce0","target":"record","created_at":"2026-05-18T00:25:02Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"1a9745f2d75bfcc11c9061f38c89a46ad2d96b354110bfdd4e61d006ef99f50a","cross_cats_sorted":["cs.GT"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.AI","submitted_at":"2018-01-26T15:12:31Z","title_canon_sha256":"a8b4f4322eed19d3582749f2459715df1cba4de9e1547aff3d02034d5dca1fcf"},"schema_version":"1.0","source":{"id":"1801.08841","kind":"arxiv","version":1}},"canonical_sha256":"aee30f6ce45e5c6ca7d3785c47cedc9940c7958635fc1cddc562246dbc9adc63","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"aee30f6ce45e5c6ca7d3785c47cedc9940c7958635fc1cddc562246dbc9adc63","first_computed_at":"2026-05-18T00:25:02.893109Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:25:02.893109Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"+LW/8sDGsy9VNxhcs8LmZKdOER26FJUKCl5sTwQV1MOd6Z9B6j0Hcfb9jUUSyYOppUHdWq0Lbp0cbo1MjxSCCg==","signature_status":"signed_v1","signed_at":"2026-05-18T00:25:02.893551Z","signed_message":"canonical_sha256_bytes"},"source_id":"1801.08841","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:3e6955c7cd6d5297b9d39f5cd7951bbd316ee868a1d1bc01aa8c8fcd68d0dce0","sha256:17c788c82dab7966d885ad802b0d723ec72df496a38e4f54b7d337734b7cfa3d"],"state_sha256":"167ed06935721bd4f12e5b3a4a1019d44f28fa102a430d1ca4d7cde43cbb7555"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"6/GDICQ8Ka0/DAp0kJuORdhVp28UjHEJejZUffZwFJYjoyNcOCLJqXBuhj11ZifI9/+OPsyh8vagP6XzpWvuDw==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-21T21:35:27.709195Z","bundle_sha256":"01cf1aae6f27096590d3ba03caa1d5e9835a571e6b9b6437c0b731218f80ebd7"}}