{"record_type":"pith_number_record","schema_url":"https://pith.science/schemas/pith-number/v1.json","pith_number":"pith:2016:H2KM56DCYCJMY2MR2Q5UCTHIBY","short_pith_number":"pith:H2KM56DC","schema_version":"1.0","canonical_sha256":"3e94cef862c092cc6991d43b414ce80e1ff0392797fc70934252d8b5bdd94a41","source":{"kind":"arxiv","id":"1602.04936","version":1},"attestation_state":"computed","paper":{"title":"Reinforcement Learning approach for Real Time Strategy Games Battle city and S3","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":[],"primary_cat":"cs.AI","authors_text":"Amit Patel, Harshit Sethy","submitted_at":"2016-02-16T08:17:17Z","abstract_excerpt":"In this paper we proposed reinforcement learning algorithms with the generalized reward function. In our proposed method we use Q-learning and SARSA algorithms with generalised reward function to train the reinforcement learning agent. We evaluated the performance of our proposed algorithms on two real-time strategy games called BattleCity and S3. There are two main advantages of having such an approach as compared to other works in RTS. (1) We can ignore the concept of a simulator which is often game specific and is usually hard coded in any type of RTS games (2) our system can learn from int"},"verification_status":{"content_addressed":true,"pith_receipt":true,"author_attested":false,"weak_author_claims":0,"strong_author_claims":0,"externally_anchored":false,"storage_verified":false,"citation_signatures":0,"replication_records":0,"graph_snapshot":true,"references_resolved":false,"formal_links_present":false},"canonical_record":{"source":{"id":"1602.04936","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.AI","submitted_at":"2016-02-16T08:17:17Z","cross_cats_sorted":[],"title_canon_sha256":"f3ac8f5ae6342775970accb52e56f097b1133e80c3c9e7f6a84a35fcc96144c5","abstract_canon_sha256":"5cc4fe92aff259f181b0bd190e70ab2f2f8268a6f3a956dfca3a13a4b75f462b"},"schema_version":"1.0"},"receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T01:20:37.822691Z","signature_b64":"BP3ivtzaiKD5J9doLZRzd04xgAqyqKqYsMi3EWeyDXWFcWgUCqfG086DJzce9Z+xt7EHqXMz6V1/AXRWGctFBQ==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"3e94cef862c092cc6991d43b414ce80e1ff0392797fc70934252d8b5bdd94a41","last_reissued_at":"2026-05-18T01:20:37.822313Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T01:20:37.822313Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"graph_snapshot":{"paper":{"title":"Reinforcement Learning approach for Real Time Strategy Games Battle city and S3","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":[],"primary_cat":"cs.AI","authors_text":"Amit Patel, Harshit Sethy","submitted_at":"2016-02-16T08:17:17Z","abstract_excerpt":"In this paper we proposed reinforcement learning algorithms with the generalized reward function. In our proposed method we use Q-learning and SARSA algorithms with generalised reward function to train the reinforcement learning agent. We evaluated the performance of our proposed algorithms on two real-time strategy games called BattleCity and S3. There are two main advantages of having such an approach as compared to other works in RTS. (1) We can ignore the concept of a simulator which is often game specific and is usually hard coded in any type of RTS games (2) our system can learn from int"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1602.04936","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"aliases":[{"alias_kind":"arxiv","alias_value":"1602.04936","created_at":"2026-05-18T01:20:37.822377+00:00"},{"alias_kind":"arxiv_version","alias_value":"1602.04936v1","created_at":"2026-05-18T01:20:37.822377+00:00"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1602.04936","created_at":"2026-05-18T01:20:37.822377+00:00"},{"alias_kind":"pith_short_12","alias_value":"H2KM56DCYCJM","created_at":"2026-05-18T12:30:19.053100+00:00"},{"alias_kind":"pith_short_16","alias_value":"H2KM56DCYCJMY2MR","created_at":"2026-05-18T12:30:19.053100+00:00"},{"alias_kind":"pith_short_8","alias_value":"H2KM56DC","created_at":"2026-05-18T12:30:19.053100+00:00"}],"events":[],"event_summary":{},"paper_claims":[],"inbound_citations":{"count":0,"internal_anchor_count":0,"sample":[]},"formal_canon":{"evidence_count":0,"sample":[],"anchors":[]},"links":{"html":"https://pith.science/pith/H2KM56DCYCJMY2MR2Q5UCTHIBY","json":"https://pith.science/pith/H2KM56DCYCJMY2MR2Q5UCTHIBY.json","graph_json":"https://pith.science/api/pith-number/H2KM56DCYCJMY2MR2Q5UCTHIBY/graph.json","events_json":"https://pith.science/api/pith-number/H2KM56DCYCJMY2MR2Q5UCTHIBY/events.json","paper":"https://pith.science/paper/H2KM56DC"},"agent_actions":{"view_html":"https://pith.science/pith/H2KM56DCYCJMY2MR2Q5UCTHIBY","download_json":"https://pith.science/pith/H2KM56DCYCJMY2MR2Q5UCTHIBY.json","view_paper":"https://pith.science/paper/H2KM56DC","resolve_alias":"https://pith.science/api/pith-number/resolve?arxiv=1602.04936&json=true","fetch_graph":"https://pith.science/api/pith-number/H2KM56DCYCJMY2MR2Q5UCTHIBY/graph.json","fetch_events":"https://pith.science/api/pith-number/H2KM56DCYCJMY2MR2Q5UCTHIBY/events.json","actions":{"anchor_timestamp":"https://pith.science/pith/H2KM56DCYCJMY2MR2Q5UCTHIBY/action/timestamp_anchor","attest_storage":"https://pith.science/pith/H2KM56DCYCJMY2MR2Q5UCTHIBY/action/storage_attestation","attest_author":"https://pith.science/pith/H2KM56DCYCJMY2MR2Q5UCTHIBY/action/author_attestation","sign_citation":"https://pith.science/pith/H2KM56DCYCJMY2MR2Q5UCTHIBY/action/citation_signature","submit_replication":"https://pith.science/pith/H2KM56DCYCJMY2MR2Q5UCTHIBY/action/replication_record"}},"created_at":"2026-05-18T01:20:37.822377+00:00","updated_at":"2026-05-18T01:20:37.822377+00:00"}