{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2025:G3PBFQPDS7Z2MOUMS6FFR4YJMR","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"10123f820de9c9cc70a63e57ba4d4385d4ae9773dd0e0df8c412195ccc0f7bf3","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.RO","submitted_at":"2025-09-17T19:30:27Z","title_canon_sha256":"bf0ae994bb55fb88a299bdc462173a44513772ec20f20c3ad60254716174069f"},"schema_version":"1.0","source":{"id":"2509.14380","kind":"arxiv","version":3}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2509.14380","created_at":"2026-06-08T01:05:02Z"},{"alias_kind":"arxiv_version","alias_value":"2509.14380v3","created_at":"2026-06-08T01:05:02Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2509.14380","created_at":"2026-06-08T01:05:02Z"},{"alias_kind":"pith_short_12","alias_value":"G3PBFQPDS7Z2","created_at":"2026-06-08T01:05:02Z"},{"alias_kind":"pith_short_16","alias_value":"G3PBFQPDS7Z2MOUM","created_at":"2026-06-08T01:05:02Z"},{"alias_kind":"pith_short_8","alias_value":"G3PBFQPD","created_at":"2026-06-08T01:05:02Z"}],"graph_snapshots":[{"event_id":"sha256:65c742aa396d5f8648a0f26891dc31c369da88d3601a7e6512e814147f38e5ee","target":"graph","created_at":"2026-06-08T01:05:02Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2509.14380/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Multi-Agent Reinforcement Learning (MARL) provides a powerful framework for learning coordination in multi-agent systems. However, applying MARL to robotics remains challenging due to their high-dimensional continuous joint action spaces, complex reward design, and non-stationarity from concurrently learning agents. On the other hand, humans often learn complex coordination with the help of coaches, who guide learning through carefully designed curricula and detailed feedback. Building on the reasoning capabilities of foundation models, we argue that these models can similarly coach robots to ","authors_text":"Jonghoon Ock, Kanghyun Ryu, Negar Mehr, Seoyeon Choi","cross_cats":[],"headline":"","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.RO","submitted_at":"2025-09-17T19:30:27Z","title":"CRAFT: Coaching Reinforcement Learning Autonomously using Foundation Models for Multi-Robot Coordination Tasks"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2509.14380","kind":"arxiv","version":3},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:bb5dc47116a533ca65ec8803764967aaeb088edbce93464badafe855a19f69ba","target":"record","created_at":"2026-06-08T01:05:02Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"10123f820de9c9cc70a63e57ba4d4385d4ae9773dd0e0df8c412195ccc0f7bf3","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.RO","submitted_at":"2025-09-17T19:30:27Z","title_canon_sha256":"bf0ae994bb55fb88a299bdc462173a44513772ec20f20c3ad60254716174069f"},"schema_version":"1.0","source":{"id":"2509.14380","kind":"arxiv","version":3}},"canonical_sha256":"36de12c1e397f3a63a8c978a58f30964466ecc5aaed91df4e3ae1c4c4619c7cf","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"36de12c1e397f3a63a8c978a58f30964466ecc5aaed91df4e3ae1c4c4619c7cf","first_computed_at":"2026-06-08T01:05:02.979424Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-06-08T01:05:02.979424Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"XToF54NRElfsSws1cf6j8hvAveBxJ6zDIjtcR1AgZnKeoyQNqtqy5vn5/JsLHrMoBdRee30/VsAKqLYPTpjcBg==","signature_status":"signed_v1","signed_at":"2026-06-08T01:05:02.980437Z","signed_message":"canonical_sha256_bytes"},"source_id":"2509.14380","source_kind":"arxiv","source_version":3}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:bb5dc47116a533ca65ec8803764967aaeb088edbce93464badafe855a19f69ba","sha256:65c742aa396d5f8648a0f26891dc31c369da88d3601a7e6512e814147f38e5ee"],"state_sha256":"293e989df3ffab222649cd89233bde41442d0328a617f735df528ef14d5d1996"}