{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2018:MMRBVIC6MMVSSQTJBU4H7VQ3WY","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"d38669087336242360f25d0fb90d90c0db2dd2d5b6e462c3e367d6fd814eb188","cross_cats_sorted":["cs.LG","stat.ML"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.AI","submitted_at":"2018-03-14T16:59:17Z","title_canon_sha256":"a4b8292a159ce3f4ea29bcee8bf88ce5bcd633ca6313176866adea6411416811"},"schema_version":"1.0","source":{"id":"1803.05402","kind":"arxiv","version":5}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1803.05402","created_at":"2026-05-18T00:06:25Z"},{"alias_kind":"arxiv_version","alias_value":"1803.05402v5","created_at":"2026-05-18T00:06:25Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1803.05402","created_at":"2026-05-18T00:06:25Z"},{"alias_kind":"pith_short_12","alias_value":"MMRBVIC6MMVS","created_at":"2026-05-18T12:32:37Z"},{"alias_kind":"pith_short_16","alias_value":"MMRBVIC6MMVSSQTJ","created_at":"2026-05-18T12:32:37Z"},{"alias_kind":"pith_short_8","alias_value":"MMRBVIC6","created_at":"2026-05-18T12:32:37Z"}],"graph_snapshots":[{"event_id":"sha256:44dca6640cd6fa88fd934070f6a44d8e77a5e120d02e3a9bb0931c0e45aab563","target":"graph","created_at":"2026-05-18T00:06:25Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"In this work we describe a novel deep reinforcement learning architecture that allows multiple actions to be selected at every time-step in an efficient manner. Multi-action policies allow complex behaviours to be learnt that would otherwise be hard to achieve when using single action selection techniques. We use both imitation learning and temporal difference (TD) reinforcement learning (RL) to provide a 4x improvement in training time and 2.5x improvement in performance over single action selection TD RL. We demonstrate the capabilities of this network using a complex in-house 3D game. Mimic","authors_text":"Henrik Holst, Jack Harmer, Joakim Bergdahl, Jorge del Val, Kristoffer Sj\\\"o\\\"o, Linus Gissl\\'en, Magnus Nordin, Tom Olsson","cross_cats":["cs.LG","stat.ML"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.AI","submitted_at":"2018-03-14T16:59:17Z","title":"Imitation Learning with Concurrent Actions in 3D Games"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1803.05402","kind":"arxiv","version":5},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:6c80da0ae2148fa08def6c8ea4bbf8713d0e7e4c5312a037aa79f561af10096e","target":"record","created_at":"2026-05-18T00:06:25Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"d38669087336242360f25d0fb90d90c0db2dd2d5b6e462c3e367d6fd814eb188","cross_cats_sorted":["cs.LG","stat.ML"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.AI","submitted_at":"2018-03-14T16:59:17Z","title_canon_sha256":"a4b8292a159ce3f4ea29bcee8bf88ce5bcd633ca6313176866adea6411416811"},"schema_version":"1.0","source":{"id":"1803.05402","kind":"arxiv","version":5}},"canonical_sha256":"63221aa05e632b2942690d387fd61bb623f164204a2cae3ff65417b8dcf7a00f","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"63221aa05e632b2942690d387fd61bb623f164204a2cae3ff65417b8dcf7a00f","first_computed_at":"2026-05-18T00:06:25.090218Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:06:25.090218Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"sFiPvGjMymZLvew81W7rTi6Zm4DNlfjdJlIpKAEZ+TkoQHBilLQilbfuy2lwqxbgv39mjd8FAzto7ykZeG6XBA==","signature_status":"signed_v1","signed_at":"2026-05-18T00:06:25.090937Z","signed_message":"canonical_sha256_bytes"},"source_id":"1803.05402","source_kind":"arxiv","source_version":5}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:6c80da0ae2148fa08def6c8ea4bbf8713d0e7e4c5312a037aa79f561af10096e","sha256:44dca6640cd6fa88fd934070f6a44d8e77a5e120d02e3a9bb0931c0e45aab563"],"state_sha256":"5ece6cc352d79cd90b87e996a22110799a3b047623ada243c21b2ad83e428764"}