{"record_type":"pith_number_record","schema_url":"https://pith.science/schemas/pith-number/v1.json","pith_number":"pith:2018:QPRW2DV45W2DP4TYY3WVJU5JEQ","short_pith_number":"pith:QPRW2DV4","schema_version":"1.0","canonical_sha256":"83e36d0ebcedb437f278c6ed54d3a92425f14139f31949cc50a7d2e3a38a4368","source":{"kind":"arxiv","id":"1802.08757","version":2},"attestation_state":"computed","paper":{"title":"Fully Decentralized Multi-Agent Reinforcement Learning with Networked Agents","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.AI","cs.MA","math.OC","stat.ML"],"primary_cat":"cs.LG","authors_text":"Han Liu, Kaiqing Zhang, Tamer Ba\\c{s}ar, Tong Zhang, Zhuoran Yang","submitted_at":"2018-02-23T22:53:32Z","abstract_excerpt":"We consider the problem of \\emph{fully decentralized} multi-agent reinforcement learning (MARL), where the agents are located at the nodes of a time-varying communication network. Specifically, we assume that the reward functions of the agents might correspond to different tasks, and are only known to the corresponding agent. Moreover, each agent makes individual decisions based on both the information observed locally and the messages received from its neighbors over the network. Within this setting, the collective goal of the agents is to maximize the globally averaged return over the networ"},"verification_status":{"content_addressed":true,"pith_receipt":true,"author_attested":false,"weak_author_claims":0,"strong_author_claims":0,"externally_anchored":false,"storage_verified":false,"citation_signatures":0,"replication_records":0,"graph_snapshot":true,"references_resolved":false,"formal_links_present":false},"canonical_record":{"source":{"id":"1802.08757","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2018-02-23T22:53:32Z","cross_cats_sorted":["cs.AI","cs.MA","math.OC","stat.ML"],"title_canon_sha256":"d5ed6c4e131f82f729404c0ebe0d34b7a92945683f864aa2b11cbf2ac2c2e7ee","abstract_canon_sha256":"ee4e89ae3b6ff44ffe46f7904c1887e222efeb2fec27b42f240545b11ebda089"},"schema_version":"1.0"},"receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:22:32.953071Z","signature_b64":"6A8g2/Yt9wIvQEJveDGHS0ZiZ7TL+qqsHaVY5j8QocSwmeQv6bRcREhjIhCeV3sjUGPZAhbpGxsBidIo7f4DCw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"83e36d0ebcedb437f278c6ed54d3a92425f14139f31949cc50a7d2e3a38a4368","last_reissued_at":"2026-05-18T00:22:32.952592Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:22:32.952592Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"graph_snapshot":{"paper":{"title":"Fully Decentralized Multi-Agent Reinforcement Learning with Networked Agents","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.AI","cs.MA","math.OC","stat.ML"],"primary_cat":"cs.LG","authors_text":"Han Liu, Kaiqing Zhang, Tamer Ba\\c{s}ar, Tong Zhang, Zhuoran Yang","submitted_at":"2018-02-23T22:53:32Z","abstract_excerpt":"We consider the problem of \\emph{fully decentralized} multi-agent reinforcement learning (MARL), where the agents are located at the nodes of a time-varying communication network. Specifically, we assume that the reward functions of the agents might correspond to different tasks, and are only known to the corresponding agent. Moreover, each agent makes individual decisions based on both the information observed locally and the messages received from its neighbors over the network. Within this setting, the collective goal of the agents is to maximize the globally averaged return over the networ"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1802.08757","kind":"arxiv","version":2},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"aliases":[{"alias_kind":"arxiv","alias_value":"1802.08757","created_at":"2026-05-18T00:22:32.952662+00:00"},{"alias_kind":"arxiv_version","alias_value":"1802.08757v2","created_at":"2026-05-18T00:22:32.952662+00:00"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1802.08757","created_at":"2026-05-18T00:22:32.952662+00:00"},{"alias_kind":"pith_short_12","alias_value":"QPRW2DV45W2D","created_at":"2026-05-18T12:32:46.962924+00:00"},{"alias_kind":"pith_short_16","alias_value":"QPRW2DV45W2DP4TY","created_at":"2026-05-18T12:32:46.962924+00:00"},{"alias_kind":"pith_short_8","alias_value":"QPRW2DV4","created_at":"2026-05-18T12:32:46.962924+00:00"}],"events":[],"event_summary":{},"paper_claims":[],"inbound_citations":{"count":0,"internal_anchor_count":0,"sample":[]},"formal_canon":{"evidence_count":0,"sample":[],"anchors":[]},"links":{"html":"https://pith.science/pith/QPRW2DV45W2DP4TYY3WVJU5JEQ","json":"https://pith.science/pith/QPRW2DV45W2DP4TYY3WVJU5JEQ.json","graph_json":"https://pith.science/api/pith-number/QPRW2DV45W2DP4TYY3WVJU5JEQ/graph.json","events_json":"https://pith.science/api/pith-number/QPRW2DV45W2DP4TYY3WVJU5JEQ/events.json","paper":"https://pith.science/paper/QPRW2DV4"},"agent_actions":{"view_html":"https://pith.science/pith/QPRW2DV45W2DP4TYY3WVJU5JEQ","download_json":"https://pith.science/pith/QPRW2DV45W2DP4TYY3WVJU5JEQ.json","view_paper":"https://pith.science/paper/QPRW2DV4","resolve_alias":"https://pith.science/api/pith-number/resolve?arxiv=1802.08757&json=true","fetch_graph":"https://pith.science/api/pith-number/QPRW2DV45W2DP4TYY3WVJU5JEQ/graph.json","fetch_events":"https://pith.science/api/pith-number/QPRW2DV45W2DP4TYY3WVJU5JEQ/events.json","actions":{"anchor_timestamp":"https://pith.science/pith/QPRW2DV45W2DP4TYY3WVJU5JEQ/action/timestamp_anchor","attest_storage":"https://pith.science/pith/QPRW2DV45W2DP4TYY3WVJU5JEQ/action/storage_attestation","attest_author":"https://pith.science/pith/QPRW2DV45W2DP4TYY3WVJU5JEQ/action/author_attestation","sign_citation":"https://pith.science/pith/QPRW2DV45W2DP4TYY3WVJU5JEQ/action/citation_signature","submit_replication":"https://pith.science/pith/QPRW2DV45W2DP4TYY3WVJU5JEQ/action/replication_record"}},"created_at":"2026-05-18T00:22:32.952662+00:00","updated_at":"2026-05-18T00:22:32.952662+00:00"}