{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2018:5HS32WKTEI46XSDITP2WKBG2BT","short_pith_number":"pith:5HS32WKT","canonical_record":{"source":{"id":"1802.05438","kind":"arxiv","version":5},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.MA","submitted_at":"2018-02-15T09:07:57Z","cross_cats_sorted":["cs.AI","cs.LG"],"title_canon_sha256":"9798d5b299fba6fc0f60e9bffeb8b80b011f1ee31a5567b892b25375b2487cb3","abstract_canon_sha256":"91c4ac4d30db6f8ffa74190feff6df2a055ff6b7ff9f7047814817a2ee1baf23"},"schema_version":"1.0"},"canonical_sha256":"e9e5bd59532239ebc8689bf56504da0cf72ff0750be0e2c466295a7ae03c697c","source":{"kind":"arxiv","id":"1802.05438","version":5},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1802.05438","created_at":"2026-07-05T01:59:25Z"},{"alias_kind":"arxiv_version","alias_value":"1802.05438v5","created_at":"2026-07-05T01:59:25Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1802.05438","created_at":"2026-07-05T01:59:25Z"},{"alias_kind":"pith_short_12","alias_value":"5HS32WKTEI46","created_at":"2026-07-05T01:59:25Z"},{"alias_kind":"pith_short_16","alias_value":"5HS32WKTEI46XSDI","created_at":"2026-07-05T01:59:25Z"},{"alias_kind":"pith_short_8","alias_value":"5HS32WKT","created_at":"2026-07-05T01:59:25Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2018:5HS32WKTEI46XSDITP2WKBG2BT","target":"record","payload":{"canonical_record":{"source":{"id":"1802.05438","kind":"arxiv","version":5},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.MA","submitted_at":"2018-02-15T09:07:57Z","cross_cats_sorted":["cs.AI","cs.LG"],"title_canon_sha256":"9798d5b299fba6fc0f60e9bffeb8b80b011f1ee31a5567b892b25375b2487cb3","abstract_canon_sha256":"91c4ac4d30db6f8ffa74190feff6df2a055ff6b7ff9f7047814817a2ee1baf23"},"schema_version":"1.0"},"canonical_sha256":"e9e5bd59532239ebc8689bf56504da0cf72ff0750be0e2c466295a7ae03c697c","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-07-05T01:59:25.210618Z","signature_b64":"AVScxT4rEgjkKqOnpMNi1J/lttlj0n8Y2hkehi0v+w5ezohxzSiiytfwPhbXIDlSZ8ryYCNRw93Oef79nAtKAw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"e9e5bd59532239ebc8689bf56504da0cf72ff0750be0e2c466295a7ae03c697c","last_reissued_at":"2026-07-05T01:59:25.210255Z","signature_status":"signed_v1","first_computed_at":"2026-07-05T01:59:25.210255Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1802.05438","source_version":5,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-07-05T01:59:25Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"Fc0m6vuZAbfK6k9z9aBCYulfHqkZledkv4ezRhRupwYjccqYfpdmV714vsVciACAC6ZfFEfVH9ylDDSlfinwCw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-07-05T13:09:36.322208Z"},"content_sha256":"5e9b66e2b206fb666ea52abb1e170a5c94c9dfbfd2c3ea2b2436083f9ca04218","schema_version":"1.0","event_id":"sha256:5e9b66e2b206fb666ea52abb1e170a5c94c9dfbfd2c3ea2b2436083f9ca04218"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2018:5HS32WKTEI46XSDITP2WKBG2BT","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Mean Field Multi-Agent Reinforcement Learning","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.AI","cs.LG"],"primary_cat":"cs.MA","authors_text":"Jun Wang, Ming Zhou, Minne Li, Rui Luo, Weinan Zhang, Yaodong Yang","submitted_at":"2018-02-15T09:07:57Z","abstract_excerpt":"Existing multi-agent reinforcement learning methods are limited typically to a small number of agents. When the agent number increases largely, the learning becomes intractable due to the curse of the dimensionality and the exponential growth of agent interactions. In this paper, we present \\emph{Mean Field Reinforcement Learning} where the interactions within the population of agents are approximated by those between a single agent and the average effect from the overall population or neighboring agents; the interplay between the two entities is mutually reinforced: the learning of the indivi"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1802.05438","kind":"arxiv","version":5},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/1802.05438/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-07-05T01:59:25Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"1wbIyCv092CT0lXBu/ZyVEmB2q8zoBHi54BSCzcMNwWUbZhll1P0OMgqSsTcldQ3kaBTdy7o+G1FNVUKTAIICg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-07-05T13:09:36.322878Z"},"content_sha256":"b508dc93f733e82f9a01660bf1c6d2aa4ac1ac9309e365d5fdc06bfc81fafbcd","schema_version":"1.0","event_id":"sha256:b508dc93f733e82f9a01660bf1c6d2aa4ac1ac9309e365d5fdc06bfc81fafbcd"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/5HS32WKTEI46XSDITP2WKBG2BT/bundle.json","state_url":"https://pith.science/pith/5HS32WKTEI46XSDITP2WKBG2BT/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/5HS32WKTEI46XSDITP2WKBG2BT/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-07-05T13:09:36Z","links":{"resolver":"https://pith.science/pith/5HS32WKTEI46XSDITP2WKBG2BT","bundle":"https://pith.science/pith/5HS32WKTEI46XSDITP2WKBG2BT/bundle.json","state":"https://pith.science/pith/5HS32WKTEI46XSDITP2WKBG2BT/state.json","well_known_bundle":"https://pith.science/.well-known/pith/5HS32WKTEI46XSDITP2WKBG2BT/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2018:5HS32WKTEI46XSDITP2WKBG2BT","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"91c4ac4d30db6f8ffa74190feff6df2a055ff6b7ff9f7047814817a2ee1baf23","cross_cats_sorted":["cs.AI","cs.LG"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.MA","submitted_at":"2018-02-15T09:07:57Z","title_canon_sha256":"9798d5b299fba6fc0f60e9bffeb8b80b011f1ee31a5567b892b25375b2487cb3"},"schema_version":"1.0","source":{"id":"1802.05438","kind":"arxiv","version":5}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1802.05438","created_at":"2026-07-05T01:59:25Z"},{"alias_kind":"arxiv_version","alias_value":"1802.05438v5","created_at":"2026-07-05T01:59:25Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1802.05438","created_at":"2026-07-05T01:59:25Z"},{"alias_kind":"pith_short_12","alias_value":"5HS32WKTEI46","created_at":"2026-07-05T01:59:25Z"},{"alias_kind":"pith_short_16","alias_value":"5HS32WKTEI46XSDI","created_at":"2026-07-05T01:59:25Z"},{"alias_kind":"pith_short_8","alias_value":"5HS32WKT","created_at":"2026-07-05T01:59:25Z"}],"graph_snapshots":[{"event_id":"sha256:b508dc93f733e82f9a01660bf1c6d2aa4ac1ac9309e365d5fdc06bfc81fafbcd","target":"graph","created_at":"2026-07-05T01:59:25Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/1802.05438/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Existing multi-agent reinforcement learning methods are limited typically to a small number of agents. When the agent number increases largely, the learning becomes intractable due to the curse of the dimensionality and the exponential growth of agent interactions. In this paper, we present \\emph{Mean Field Reinforcement Learning} where the interactions within the population of agents are approximated by those between a single agent and the average effect from the overall population or neighboring agents; the interplay between the two entities is mutually reinforced: the learning of the indivi","authors_text":"Jun Wang, Ming Zhou, Minne Li, Rui Luo, Weinan Zhang, Yaodong Yang","cross_cats":["cs.AI","cs.LG"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.MA","submitted_at":"2018-02-15T09:07:57Z","title":"Mean Field Multi-Agent Reinforcement Learning"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1802.05438","kind":"arxiv","version":5},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:5e9b66e2b206fb666ea52abb1e170a5c94c9dfbfd2c3ea2b2436083f9ca04218","target":"record","created_at":"2026-07-05T01:59:25Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"91c4ac4d30db6f8ffa74190feff6df2a055ff6b7ff9f7047814817a2ee1baf23","cross_cats_sorted":["cs.AI","cs.LG"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.MA","submitted_at":"2018-02-15T09:07:57Z","title_canon_sha256":"9798d5b299fba6fc0f60e9bffeb8b80b011f1ee31a5567b892b25375b2487cb3"},"schema_version":"1.0","source":{"id":"1802.05438","kind":"arxiv","version":5}},"canonical_sha256":"e9e5bd59532239ebc8689bf56504da0cf72ff0750be0e2c466295a7ae03c697c","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"e9e5bd59532239ebc8689bf56504da0cf72ff0750be0e2c466295a7ae03c697c","first_computed_at":"2026-07-05T01:59:25.210255Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-07-05T01:59:25.210255Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"AVScxT4rEgjkKqOnpMNi1J/lttlj0n8Y2hkehi0v+w5ezohxzSiiytfwPhbXIDlSZ8ryYCNRw93Oef79nAtKAw==","signature_status":"signed_v1","signed_at":"2026-07-05T01:59:25.210618Z","signed_message":"canonical_sha256_bytes"},"source_id":"1802.05438","source_kind":"arxiv","source_version":5}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:5e9b66e2b206fb666ea52abb1e170a5c94c9dfbfd2c3ea2b2436083f9ca04218","sha256:b508dc93f733e82f9a01660bf1c6d2aa4ac1ac9309e365d5fdc06bfc81fafbcd"],"state_sha256":"de4b87b3ca1aa38cf9e1652eefd4c783e77a4e2c17be83bce6fc69b38ab95360"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"qqlqasgu/K+g8YCDQ4/ikOZIUUwmvyz1i6U0ZZrSVM+vCMaVhIQ/CbTWt6RwxoBO1dRyoQHqeq++GtiOJIddCA==","signed_message":"bundle_sha256_bytes","signed_at":"2026-07-05T13:09:36.326809Z","bundle_sha256":"53dd8f7d280f7506f68096a1d72340e67c528efae9878a4802d233a9de853dd6"}}