{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2014:3KF7OTHL6ZWOAAIWCUCTWQFCJI","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"51c1f9283a462aab2f55fc3e050ec7d70c504d86fad74220072b227b6d307b8d","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/3.0/","primary_cat":"cs.AI","submitted_at":"2014-02-18T23:01:13Z","title_canon_sha256":"bce73438242d3408f7dd7c76242264f7082894f8468acb9c1548e40e46b927fd"},"schema_version":"1.0","source":{"id":"1402.4525","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1402.4525","created_at":"2026-05-18T02:58:34Z"},{"alias_kind":"arxiv_version","alias_value":"1402.4525v1","created_at":"2026-05-18T02:58:34Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1402.4525","created_at":"2026-05-18T02:58:34Z"},{"alias_kind":"pith_short_12","alias_value":"3KF7OTHL6ZWO","created_at":"2026-05-18T12:28:11Z"},{"alias_kind":"pith_short_16","alias_value":"3KF7OTHL6ZWOAAIW","created_at":"2026-05-18T12:28:11Z"},{"alias_kind":"pith_short_8","alias_value":"3KF7OTHL","created_at":"2026-05-18T12:28:11Z"}],"graph_snapshots":[{"event_id":"sha256:ec90d0a8c4b7006c878c41394d3d9a41dbf47a83957ad077adbf751aac6bbe06","target":"graph","created_at":"2026-05-18T02:58:34Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Collecting and maintaining accurate world knowledge in a dynamic, complex, adversarial, and stochastic environment such as the RoboCup 3D Soccer Simulation is a challenging task. Knowledge should be learned in real-time with time constraints. We use recently introduced Off-Policy Gradient Descent algorithms within Reinforcement Learning that illustrate learnable knowledge representations for dynamic role assignments. The results show that the agents have learned competitive policies against the top teams from the RoboCup 2012 competitions for three vs three, five vs five, and seven vs seven ag","authors_text":"Andreas Seekircher, Saminda Abeyruwan, Ubbo Visser","cross_cats":[],"headline":"","license":"http://creativecommons.org/licenses/by/3.0/","primary_cat":"cs.AI","submitted_at":"2014-02-18T23:01:13Z","title":"Off-Policy General Value Functions to Represent Dynamic Role Assignments in RoboCup 3D Soccer Simulation"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1402.4525","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:c26d7768a95dc7ed50a6285664e6f1b2c74d33e2a18ce32036773c3e8f72c27f","target":"record","created_at":"2026-05-18T02:58:34Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"51c1f9283a462aab2f55fc3e050ec7d70c504d86fad74220072b227b6d307b8d","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/3.0/","primary_cat":"cs.AI","submitted_at":"2014-02-18T23:01:13Z","title_canon_sha256":"bce73438242d3408f7dd7c76242264f7082894f8468acb9c1548e40e46b927fd"},"schema_version":"1.0","source":{"id":"1402.4525","kind":"arxiv","version":1}},"canonical_sha256":"da8bf74cebf66ce0011615053b40a24a104804eff496e2b435b1255717d05fd0","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"da8bf74cebf66ce0011615053b40a24a104804eff496e2b435b1255717d05fd0","first_computed_at":"2026-05-18T02:58:34.006703Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T02:58:34.006703Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"LFFOGddiDC4h0uxWs530ROhATxyGHUexxaLqdtS9g9uGM0IvfXgC9LOL4qqWLwqD4Bv7X3SD2r4nJY/5743aBA==","signature_status":"signed_v1","signed_at":"2026-05-18T02:58:34.007310Z","signed_message":"canonical_sha256_bytes"},"source_id":"1402.4525","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:c26d7768a95dc7ed50a6285664e6f1b2c74d33e2a18ce32036773c3e8f72c27f","sha256:ec90d0a8c4b7006c878c41394d3d9a41dbf47a83957ad077adbf751aac6bbe06"],"state_sha256":"3c8c24df8751bcc56ed190681d40ea6ead600aa11b8fa1fa621ee4963555bbb5"}