{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2018:JZ7HL5XUATFYZ722WTQ74ULFIF","short_pith_number":"pith:JZ7HL5XU","canonical_record":{"source":{"id":"1810.02912","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2018-10-05T23:45:14Z","cross_cats_sorted":["cs.AI","cs.MA","stat.ML"],"title_canon_sha256":"24dc353d56b4affc2f4b44d10f29f01f8ba5d3f9d3e037dbd14b706b7c12d627","abstract_canon_sha256":"8c0e8409d348c6ded4b83fd193a5caf7e2a3cea06e22c4c4b6b4a41f314c510b"},"schema_version":"1.0"},"canonical_sha256":"4e7e75f6f404cb8cff5ab4e1fe5165415bc81550ac6568c34f6a8bb3606d2bea","source":{"kind":"arxiv","id":"1810.02912","version":2},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1810.02912","created_at":"2026-05-17T23:44:58Z"},{"alias_kind":"arxiv_version","alias_value":"1810.02912v2","created_at":"2026-05-17T23:44:58Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1810.02912","created_at":"2026-05-17T23:44:58Z"},{"alias_kind":"pith_short_12","alias_value":"JZ7HL5XUATFY","created_at":"2026-05-18T12:32:33Z"},{"alias_kind":"pith_short_16","alias_value":"JZ7HL5XUATFYZ722","created_at":"2026-05-18T12:32:33Z"},{"alias_kind":"pith_short_8","alias_value":"JZ7HL5XU","created_at":"2026-05-18T12:32:33Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2018:JZ7HL5XUATFYZ722WTQ74ULFIF","target":"record","payload":{"canonical_record":{"source":{"id":"1810.02912","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2018-10-05T23:45:14Z","cross_cats_sorted":["cs.AI","cs.MA","stat.ML"],"title_canon_sha256":"24dc353d56b4affc2f4b44d10f29f01f8ba5d3f9d3e037dbd14b706b7c12d627","abstract_canon_sha256":"8c0e8409d348c6ded4b83fd193a5caf7e2a3cea06e22c4c4b6b4a41f314c510b"},"schema_version":"1.0"},"canonical_sha256":"4e7e75f6f404cb8cff5ab4e1fe5165415bc81550ac6568c34f6a8bb3606d2bea","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-17T23:44:58.885577Z","signature_b64":"d+AtYKr7YoNDMbPdZZWM8EXJMbIdeg3zxFS6Uspkjz1EW1LA9ru/bFErEZFe3BVvU6hCoV96fn2rFjf+vzn+AA==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"4e7e75f6f404cb8cff5ab4e1fe5165415bc81550ac6568c34f6a8bb3606d2bea","last_reissued_at":"2026-05-17T23:44:58.884976Z","signature_status":"signed_v1","first_computed_at":"2026-05-17T23:44:58.884976Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1810.02912","source_version":2,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-17T23:44:58Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"FFleY/b19NGt17L2bEujClgvF8G9RSplhM9qQYtvskNfWX/3UTT24S3UkctCy6eaUA8N0z5J8Lq0O9kaL8UrAw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-21T12:40:05.856944Z"},"content_sha256":"37db0b207df8ac6bb9123c29a532a0e74c805eb307768054c5163c0873396143","schema_version":"1.0","event_id":"sha256:37db0b207df8ac6bb9123c29a532a0e74c805eb307768054c5163c0873396143"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2018:JZ7HL5XUATFYZ722WTQ74ULFIF","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Actor-Attention-Critic for Multi-Agent Reinforcement Learning","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.AI","cs.MA","stat.ML"],"primary_cat":"cs.LG","authors_text":"Fei Sha, Shariq Iqbal","submitted_at":"2018-10-05T23:45:14Z","abstract_excerpt":"Reinforcement learning in multi-agent scenarios is important for real-world applications but presents challenges beyond those seen in single-agent settings. We present an actor-critic algorithm that trains decentralized policies in multi-agent settings, using centrally computed critics that share an attention mechanism which selects relevant information for each agent at every timestep. This attention mechanism enables more effective and scalable learning in complex multi-agent environments, when compared to recent approaches. Our approach is applicable not only to cooperative settings with sh"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1810.02912","kind":"arxiv","version":2},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-17T23:44:58Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"v5PBNQfJ9YfhdZ3Tj5rJlTCuolTmZQUqIEvc8/p95TZT4Fv9IcDMGMdCmnSQYF3Eeiiwoc+XC7gTUbA2rJD8DA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-21T12:40:05.857300Z"},"content_sha256":"d1e6411a7c5b6046125056491842a75183dbedc8afec86b1e57f615b2272298d","schema_version":"1.0","event_id":"sha256:d1e6411a7c5b6046125056491842a75183dbedc8afec86b1e57f615b2272298d"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/JZ7HL5XUATFYZ722WTQ74ULFIF/bundle.json","state_url":"https://pith.science/pith/JZ7HL5XUATFYZ722WTQ74ULFIF/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/JZ7HL5XUATFYZ722WTQ74ULFIF/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-21T12:40:05Z","links":{"resolver":"https://pith.science/pith/JZ7HL5XUATFYZ722WTQ74ULFIF","bundle":"https://pith.science/pith/JZ7HL5XUATFYZ722WTQ74ULFIF/bundle.json","state":"https://pith.science/pith/JZ7HL5XUATFYZ722WTQ74ULFIF/state.json","well_known_bundle":"https://pith.science/.well-known/pith/JZ7HL5XUATFYZ722WTQ74ULFIF/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2018:JZ7HL5XUATFYZ722WTQ74ULFIF","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"8c0e8409d348c6ded4b83fd193a5caf7e2a3cea06e22c4c4b6b4a41f314c510b","cross_cats_sorted":["cs.AI","cs.MA","stat.ML"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2018-10-05T23:45:14Z","title_canon_sha256":"24dc353d56b4affc2f4b44d10f29f01f8ba5d3f9d3e037dbd14b706b7c12d627"},"schema_version":"1.0","source":{"id":"1810.02912","kind":"arxiv","version":2}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1810.02912","created_at":"2026-05-17T23:44:58Z"},{"alias_kind":"arxiv_version","alias_value":"1810.02912v2","created_at":"2026-05-17T23:44:58Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1810.02912","created_at":"2026-05-17T23:44:58Z"},{"alias_kind":"pith_short_12","alias_value":"JZ7HL5XUATFY","created_at":"2026-05-18T12:32:33Z"},{"alias_kind":"pith_short_16","alias_value":"JZ7HL5XUATFYZ722","created_at":"2026-05-18T12:32:33Z"},{"alias_kind":"pith_short_8","alias_value":"JZ7HL5XU","created_at":"2026-05-18T12:32:33Z"}],"graph_snapshots":[{"event_id":"sha256:d1e6411a7c5b6046125056491842a75183dbedc8afec86b1e57f615b2272298d","target":"graph","created_at":"2026-05-17T23:44:58Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Reinforcement learning in multi-agent scenarios is important for real-world applications but presents challenges beyond those seen in single-agent settings. We present an actor-critic algorithm that trains decentralized policies in multi-agent settings, using centrally computed critics that share an attention mechanism which selects relevant information for each agent at every timestep. This attention mechanism enables more effective and scalable learning in complex multi-agent environments, when compared to recent approaches. Our approach is applicable not only to cooperative settings with sh","authors_text":"Fei Sha, Shariq Iqbal","cross_cats":["cs.AI","cs.MA","stat.ML"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2018-10-05T23:45:14Z","title":"Actor-Attention-Critic for Multi-Agent Reinforcement Learning"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1810.02912","kind":"arxiv","version":2},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:37db0b207df8ac6bb9123c29a532a0e74c805eb307768054c5163c0873396143","target":"record","created_at":"2026-05-17T23:44:58Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"8c0e8409d348c6ded4b83fd193a5caf7e2a3cea06e22c4c4b6b4a41f314c510b","cross_cats_sorted":["cs.AI","cs.MA","stat.ML"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2018-10-05T23:45:14Z","title_canon_sha256":"24dc353d56b4affc2f4b44d10f29f01f8ba5d3f9d3e037dbd14b706b7c12d627"},"schema_version":"1.0","source":{"id":"1810.02912","kind":"arxiv","version":2}},"canonical_sha256":"4e7e75f6f404cb8cff5ab4e1fe5165415bc81550ac6568c34f6a8bb3606d2bea","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"4e7e75f6f404cb8cff5ab4e1fe5165415bc81550ac6568c34f6a8bb3606d2bea","first_computed_at":"2026-05-17T23:44:58.884976Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-17T23:44:58.884976Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"d+AtYKr7YoNDMbPdZZWM8EXJMbIdeg3zxFS6Uspkjz1EW1LA9ru/bFErEZFe3BVvU6hCoV96fn2rFjf+vzn+AA==","signature_status":"signed_v1","signed_at":"2026-05-17T23:44:58.885577Z","signed_message":"canonical_sha256_bytes"},"source_id":"1810.02912","source_kind":"arxiv","source_version":2}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:37db0b207df8ac6bb9123c29a532a0e74c805eb307768054c5163c0873396143","sha256:d1e6411a7c5b6046125056491842a75183dbedc8afec86b1e57f615b2272298d"],"state_sha256":"fabe4d9bd943b1a9ee60f0b2e2b8d90deca1f49c72d12e7a01915798d9178c49"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"Y8+S5d80d95QHocPAELM7Qigi5d3xL0b5uc6o9DRAYw1vBXzyBuTkGwYeaBA/fSES8Hpimhr4UyBwMc3BY42BA==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-21T12:40:05.859518Z","bundle_sha256":"492c12e2232d33a3469a1d8413946ed7f0defdc745e0f5c8e99bf381e60646f1"}}