{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2019:LMMQHYOHEYZHWB5LRM5WUIGWGM","short_pith_number":"pith:LMMQHYOH","canonical_record":{"source":{"id":"1903.04311","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2019-03-11T14:11:20Z","cross_cats_sorted":["cs.AI","cs.NE"],"title_canon_sha256":"5ac442429e3536630d5a5759ebadb5f9f413a39a6e21d3e6f960dc514f1002bc","abstract_canon_sha256":"1487a88ad459ac01d66a2329b06874579a59c5d428fe823bb45e967470ea6cc1"},"schema_version":"1.0"},"canonical_sha256":"5b1903e1c726327b07ab8b3b6a20d6331d3028fdc3fc36a87910a1a094bc4672","source":{"kind":"arxiv","id":"1903.04311","version":2},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1903.04311","created_at":"2026-05-17T23:48:50Z"},{"alias_kind":"arxiv_version","alias_value":"1903.04311v2","created_at":"2026-05-17T23:48:50Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1903.04311","created_at":"2026-05-17T23:48:50Z"},{"alias_kind":"pith_short_12","alias_value":"LMMQHYOHEYZH","created_at":"2026-05-18T12:33:21Z"},{"alias_kind":"pith_short_16","alias_value":"LMMQHYOHEYZHWB5L","created_at":"2026-05-18T12:33:21Z"},{"alias_kind":"pith_short_8","alias_value":"LMMQHYOH","created_at":"2026-05-18T12:33:21Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2019:LMMQHYOHEYZHWB5LRM5WUIGWGM","target":"record","payload":{"canonical_record":{"source":{"id":"1903.04311","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2019-03-11T14:11:20Z","cross_cats_sorted":["cs.AI","cs.NE"],"title_canon_sha256":"5ac442429e3536630d5a5759ebadb5f9f413a39a6e21d3e6f960dc514f1002bc","abstract_canon_sha256":"1487a88ad459ac01d66a2329b06874579a59c5d428fe823bb45e967470ea6cc1"},"schema_version":"1.0"},"canonical_sha256":"5b1903e1c726327b07ab8b3b6a20d6331d3028fdc3fc36a87910a1a094bc4672","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-17T23:48:50.040339Z","signature_b64":"N64DYCn/1ykVocL+su4NGdZKYk/6YZXeQgKKR26h4KQCUuVG/94sipUobVwp4aNnyxxuK7jp/h6o8NkxII95Cg==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"5b1903e1c726327b07ab8b3b6a20d6331d3028fdc3fc36a87910a1a094bc4672","last_reissued_at":"2026-05-17T23:48:50.039801Z","signature_status":"signed_v1","first_computed_at":"2026-05-17T23:48:50.039801Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1903.04311","source_version":2,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-17T23:48:50Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"66SZz6NXGtwE6GOWrbSqeMUeBjTjfQJQxuFuI1JJ1gU1udTFh5pkCcKaLbXRQ04c7B419KLHTfo//ymZkwjyCw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-04T14:01:53.353836Z"},"content_sha256":"ca7b0845f4d878135e35f74cb0a24ccd63be83b9bce3845e21dc7e873e5f174b","schema_version":"1.0","event_id":"sha256:ca7b0845f4d878135e35f74cb0a24ccd63be83b9bce3845e21dc7e873e5f174b"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2019:LMMQHYOHEYZHWB5LRM5WUIGWGM","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Deep Recurrent Q-Learning vs Deep Q-Learning on a simple Partially Observable Markov Decision Process with Minecraft","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.AI","cs.NE"],"primary_cat":"cs.LG","authors_text":"Cl\\'ement Romac, Vincent B\\'eraud","submitted_at":"2019-03-11T14:11:20Z","abstract_excerpt":"Deep Q-Learning has been successfully applied to a wide variety of tasks in the past several years. However, the architecture of the vanilla Deep Q-Network is not suited to deal with partially observable environments such as 3D video games. For this, recurrent layers have been added to the Deep Q-Network in order to allow it to handle past dependencies. We here use Minecraft for its customization advantages and design two very simple missions that can be frames as Partially Observable Markov Decision Process. We compare on these missions the Deep Q-Network and the Deep Recurrent Q-Network in o"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1903.04311","kind":"arxiv","version":2},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-17T23:48:50Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"eIfOT8fgUlJDHd/N2ApiwrNVOkRaMBcrCOB4MlI13grC44Jrn1B5Sw6wbiib+xk72TP3A0keReWhCrp1l1eDCQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-04T14:01:53.354215Z"},"content_sha256":"bf29178d7cc271d698740ba4c1604777116a8634a88a70487744421b3244118e","schema_version":"1.0","event_id":"sha256:bf29178d7cc271d698740ba4c1604777116a8634a88a70487744421b3244118e"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/LMMQHYOHEYZHWB5LRM5WUIGWGM/bundle.json","state_url":"https://pith.science/pith/LMMQHYOHEYZHWB5LRM5WUIGWGM/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/LMMQHYOHEYZHWB5LRM5WUIGWGM/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-04T14:01:53Z","links":{"resolver":"https://pith.science/pith/LMMQHYOHEYZHWB5LRM5WUIGWGM","bundle":"https://pith.science/pith/LMMQHYOHEYZHWB5LRM5WUIGWGM/bundle.json","state":"https://pith.science/pith/LMMQHYOHEYZHWB5LRM5WUIGWGM/state.json","well_known_bundle":"https://pith.science/.well-known/pith/LMMQHYOHEYZHWB5LRM5WUIGWGM/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2019:LMMQHYOHEYZHWB5LRM5WUIGWGM","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"1487a88ad459ac01d66a2329b06874579a59c5d428fe823bb45e967470ea6cc1","cross_cats_sorted":["cs.AI","cs.NE"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2019-03-11T14:11:20Z","title_canon_sha256":"5ac442429e3536630d5a5759ebadb5f9f413a39a6e21d3e6f960dc514f1002bc"},"schema_version":"1.0","source":{"id":"1903.04311","kind":"arxiv","version":2}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1903.04311","created_at":"2026-05-17T23:48:50Z"},{"alias_kind":"arxiv_version","alias_value":"1903.04311v2","created_at":"2026-05-17T23:48:50Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1903.04311","created_at":"2026-05-17T23:48:50Z"},{"alias_kind":"pith_short_12","alias_value":"LMMQHYOHEYZH","created_at":"2026-05-18T12:33:21Z"},{"alias_kind":"pith_short_16","alias_value":"LMMQHYOHEYZHWB5L","created_at":"2026-05-18T12:33:21Z"},{"alias_kind":"pith_short_8","alias_value":"LMMQHYOH","created_at":"2026-05-18T12:33:21Z"}],"graph_snapshots":[{"event_id":"sha256:bf29178d7cc271d698740ba4c1604777116a8634a88a70487744421b3244118e","target":"graph","created_at":"2026-05-17T23:48:50Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Deep Q-Learning has been successfully applied to a wide variety of tasks in the past several years. However, the architecture of the vanilla Deep Q-Network is not suited to deal with partially observable environments such as 3D video games. For this, recurrent layers have been added to the Deep Q-Network in order to allow it to handle past dependencies. We here use Minecraft for its customization advantages and design two very simple missions that can be frames as Partially Observable Markov Decision Process. We compare on these missions the Deep Q-Network and the Deep Recurrent Q-Network in o","authors_text":"Cl\\'ement Romac, Vincent B\\'eraud","cross_cats":["cs.AI","cs.NE"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2019-03-11T14:11:20Z","title":"Deep Recurrent Q-Learning vs Deep Q-Learning on a simple Partially Observable Markov Decision Process with Minecraft"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1903.04311","kind":"arxiv","version":2},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:ca7b0845f4d878135e35f74cb0a24ccd63be83b9bce3845e21dc7e873e5f174b","target":"record","created_at":"2026-05-17T23:48:50Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"1487a88ad459ac01d66a2329b06874579a59c5d428fe823bb45e967470ea6cc1","cross_cats_sorted":["cs.AI","cs.NE"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2019-03-11T14:11:20Z","title_canon_sha256":"5ac442429e3536630d5a5759ebadb5f9f413a39a6e21d3e6f960dc514f1002bc"},"schema_version":"1.0","source":{"id":"1903.04311","kind":"arxiv","version":2}},"canonical_sha256":"5b1903e1c726327b07ab8b3b6a20d6331d3028fdc3fc36a87910a1a094bc4672","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"5b1903e1c726327b07ab8b3b6a20d6331d3028fdc3fc36a87910a1a094bc4672","first_computed_at":"2026-05-17T23:48:50.039801Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-17T23:48:50.039801Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"N64DYCn/1ykVocL+su4NGdZKYk/6YZXeQgKKR26h4KQCUuVG/94sipUobVwp4aNnyxxuK7jp/h6o8NkxII95Cg==","signature_status":"signed_v1","signed_at":"2026-05-17T23:48:50.040339Z","signed_message":"canonical_sha256_bytes"},"source_id":"1903.04311","source_kind":"arxiv","source_version":2}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:ca7b0845f4d878135e35f74cb0a24ccd63be83b9bce3845e21dc7e873e5f174b","sha256:bf29178d7cc271d698740ba4c1604777116a8634a88a70487744421b3244118e"],"state_sha256":"b5cb6eee6d36ab782d5450b007bdb59c06536cbe791137f9365201166a415f7b"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"sjlgkGRunrZDAp4X4oT+gQPelzIkkIUXJtFADeVHdSJ0KXnwoP8ZrxKrjF8YwarT4M++INT7s8cf5h63qd6bDw==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-04T14:01:53.356378Z","bundle_sha256":"c3d091412ba24b1b65e6a276bd907f947b29b5c491adfcbfa290be3d153711b0"}}