{"record_type":"pith_number_record","schema_url":"https://pith.science/schemas/pith-number/v1.json","pith_number":"pith:2017:ZXHKGNW5LTN7ZUXE3L7EBFO7TY","short_pith_number":"pith:ZXHKGNW5","schema_version":"1.0","canonical_sha256":"cdcea336dd5cdbfcd2e4dafe4095df9e02e57f2b018425fb1ce21909bdc29c5b","source":{"kind":"arxiv","id":"1706.03235","version":3},"attestation_state":"computed","paper":{"title":"ACCNet: Actor-Coordinator-Critic Net for \"Learning-to-Communicate\" with Deep Multi-agent Reinforcement Learning","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.LG"],"primary_cat":"cs.AI","authors_text":"Hangyu Mao, Yan Ni, Zhen Xiao, Zhibo Gong","submitted_at":"2017-06-10T13:50:23Z","abstract_excerpt":"Communication is a critical factor for the big multi-agent world to stay organized and productive. Typically, most previous multi-agent \"learning-to-communicate\" studies try to predefine the communication protocols or use technologies such as tabular reinforcement learning and evolutionary algorithm, which can not generalize to changing environment or large collection of agents.\n  In this paper, we propose an Actor-Coordinator-Critic Net (ACCNet) framework for solving \"learning-to-communicate\" problem. The ACCNet naturally combines the powerful actor-critic reinforcement learning technology wi"},"verification_status":{"content_addressed":true,"pith_receipt":true,"author_attested":false,"weak_author_claims":0,"strong_author_claims":0,"externally_anchored":false,"storage_verified":false,"citation_signatures":0,"replication_records":0,"graph_snapshot":true,"references_resolved":false,"formal_links_present":false},"canonical_record":{"source":{"id":"1706.03235","kind":"arxiv","version":3},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.AI","submitted_at":"2017-06-10T13:50:23Z","cross_cats_sorted":["cs.LG"],"title_canon_sha256":"09576b70ac5bf50fe05bfb9c8643275ea7f4976e8b3a4b208bf209114751b09a","abstract_canon_sha256":"883b0c586aae239036f40683451ba207fa25a4c5dcb97901297d69b376c6cdf7"},"schema_version":"1.0"},"receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:31:50.909311Z","signature_b64":"cvFluYUatWI9uDFZ+z6IvZZBpJPcua9DTcTrMs1UJnTIuG2rhZ2ft2914w28qp6KzY6pOmWqwJo9a6gjgKqHCA==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"cdcea336dd5cdbfcd2e4dafe4095df9e02e57f2b018425fb1ce21909bdc29c5b","last_reissued_at":"2026-05-18T00:31:50.908717Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:31:50.908717Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"graph_snapshot":{"paper":{"title":"ACCNet: Actor-Coordinator-Critic Net for \"Learning-to-Communicate\" with Deep Multi-agent Reinforcement Learning","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.LG"],"primary_cat":"cs.AI","authors_text":"Hangyu Mao, Yan Ni, Zhen Xiao, Zhibo Gong","submitted_at":"2017-06-10T13:50:23Z","abstract_excerpt":"Communication is a critical factor for the big multi-agent world to stay organized and productive. Typically, most previous multi-agent \"learning-to-communicate\" studies try to predefine the communication protocols or use technologies such as tabular reinforcement learning and evolutionary algorithm, which can not generalize to changing environment or large collection of agents.\n  In this paper, we propose an Actor-Coordinator-Critic Net (ACCNet) framework for solving \"learning-to-communicate\" problem. The ACCNet naturally combines the powerful actor-critic reinforcement learning technology wi"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1706.03235","kind":"arxiv","version":3},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"aliases":[{"alias_kind":"arxiv","alias_value":"1706.03235","created_at":"2026-05-18T00:31:50.908806+00:00"},{"alias_kind":"arxiv_version","alias_value":"1706.03235v3","created_at":"2026-05-18T00:31:50.908806+00:00"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1706.03235","created_at":"2026-05-18T00:31:50.908806+00:00"},{"alias_kind":"pith_short_12","alias_value":"ZXHKGNW5LTN7","created_at":"2026-05-18T12:31:59.375834+00:00"},{"alias_kind":"pith_short_16","alias_value":"ZXHKGNW5LTN7ZUXE","created_at":"2026-05-18T12:31:59.375834+00:00"},{"alias_kind":"pith_short_8","alias_value":"ZXHKGNW5","created_at":"2026-05-18T12:31:59.375834+00:00"}],"events":[],"event_summary":{},"paper_claims":[],"inbound_citations":{"count":0,"internal_anchor_count":0,"sample":[]},"formal_canon":{"evidence_count":0,"sample":[],"anchors":[]},"links":{"html":"https://pith.science/pith/ZXHKGNW5LTN7ZUXE3L7EBFO7TY","json":"https://pith.science/pith/ZXHKGNW5LTN7ZUXE3L7EBFO7TY.json","graph_json":"https://pith.science/api/pith-number/ZXHKGNW5LTN7ZUXE3L7EBFO7TY/graph.json","events_json":"https://pith.science/api/pith-number/ZXHKGNW5LTN7ZUXE3L7EBFO7TY/events.json","paper":"https://pith.science/paper/ZXHKGNW5"},"agent_actions":{"view_html":"https://pith.science/pith/ZXHKGNW5LTN7ZUXE3L7EBFO7TY","download_json":"https://pith.science/pith/ZXHKGNW5LTN7ZUXE3L7EBFO7TY.json","view_paper":"https://pith.science/paper/ZXHKGNW5","resolve_alias":"https://pith.science/api/pith-number/resolve?arxiv=1706.03235&json=true","fetch_graph":"https://pith.science/api/pith-number/ZXHKGNW5LTN7ZUXE3L7EBFO7TY/graph.json","fetch_events":"https://pith.science/api/pith-number/ZXHKGNW5LTN7ZUXE3L7EBFO7TY/events.json","actions":{"anchor_timestamp":"https://pith.science/pith/ZXHKGNW5LTN7ZUXE3L7EBFO7TY/action/timestamp_anchor","attest_storage":"https://pith.science/pith/ZXHKGNW5LTN7ZUXE3L7EBFO7TY/action/storage_attestation","attest_author":"https://pith.science/pith/ZXHKGNW5LTN7ZUXE3L7EBFO7TY/action/author_attestation","sign_citation":"https://pith.science/pith/ZXHKGNW5LTN7ZUXE3L7EBFO7TY/action/citation_signature","submit_replication":"https://pith.science/pith/ZXHKGNW5LTN7ZUXE3L7EBFO7TY/action/replication_record"}},"created_at":"2026-05-18T00:31:50.908806+00:00","updated_at":"2026-05-18T00:31:50.908806+00:00"}