{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2026:LXKEYMNJGPBMHP5WHXR6S57A4Q","short_pith_number":"pith:LXKEYMNJ","canonical_record":{"source":{"id":"2605.26646","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.AI","submitted_at":"2026-05-26T07:30:03Z","cross_cats_sorted":["cs.CL","cs.MA"],"title_canon_sha256":"ab9dcccf1d81af46e8c46a71b8093659ee01d59dcb961cbf85d9c1aece3bfcf4","abstract_canon_sha256":"fad35e7854e513a31cf406b699ee177f10f10fca3dc5889b35066b93c8e54ef2"},"schema_version":"1.0"},"canonical_sha256":"5dd44c31a933c2c3bfb63de3e977e0e402dc5d56048ad7aca3c971ee97f2d148","source":{"kind":"arxiv","id":"2605.26646","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2605.26646","created_at":"2026-05-27T01:06:03Z"},{"alias_kind":"arxiv_version","alias_value":"2605.26646v1","created_at":"2026-05-27T01:06:03Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.26646","created_at":"2026-05-27T01:06:03Z"},{"alias_kind":"pith_short_12","alias_value":"LXKEYMNJGPBM","created_at":"2026-05-27T01:06:03Z"},{"alias_kind":"pith_short_16","alias_value":"LXKEYMNJGPBMHP5W","created_at":"2026-05-27T01:06:03Z"},{"alias_kind":"pith_short_8","alias_value":"LXKEYMNJ","created_at":"2026-05-27T01:06:03Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2026:LXKEYMNJGPBMHP5WHXR6S57A4Q","target":"record","payload":{"canonical_record":{"source":{"id":"2605.26646","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.AI","submitted_at":"2026-05-26T07:30:03Z","cross_cats_sorted":["cs.CL","cs.MA"],"title_canon_sha256":"ab9dcccf1d81af46e8c46a71b8093659ee01d59dcb961cbf85d9c1aece3bfcf4","abstract_canon_sha256":"fad35e7854e513a31cf406b699ee177f10f10fca3dc5889b35066b93c8e54ef2"},"schema_version":"1.0"},"canonical_sha256":"5dd44c31a933c2c3bfb63de3e977e0e402dc5d56048ad7aca3c971ee97f2d148","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-27T01:06:03.929155Z","signature_b64":"Cp5c7KGZlu7fWSNhR0HnsOMY49sm4Ok0vFvPGEdRa4IR7flGCVO476UmmctsAQBCm63vPS6ZofWmjkvqZxYACw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"5dd44c31a933c2c3bfb63de3e977e0e402dc5d56048ad7aca3c971ee97f2d148","last_reissued_at":"2026-05-27T01:06:03.928303Z","signature_status":"signed_v1","first_computed_at":"2026-05-27T01:06:03.928303Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2605.26646","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-27T01:06:03Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"d4VquPK548IDrvGusG96pSUMRUlCfMjpHaQVnVm6LMom3Mmc18FwYNwII0ylgCK3oExRWKGqkI7kWcaTaPpDAw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-27T18:29:17.887396Z"},"content_sha256":"e9ce04f0e097171c7dab87b406502afcfb302873b28868c60467164b4ae37266","schema_version":"1.0","event_id":"sha256:e9ce04f0e097171c7dab87b406502afcfb302873b28868c60467164b4ae37266"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2026:LXKEYMNJGPBMHP5WHXR6S57A4Q","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"UnityMAS-O: A General RL Optimization Framework for LLM-Based Multi-Agent Systems","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":["cs.CL","cs.MA"],"primary_cat":"cs.AI","authors_text":"Bin Zhang, Biqing Qi, Erhan Zhang, Haitao Li, Jiaxin Mao, Jinyuan Feng, Lingyong Yan, Qi Liu, Rui Li, Shijie Wang, Wei Yang, Xiaochi Wei, Yan Gao, Yao Hu, Yiqun Chen, Yi Wu, Zechun Niu","submitted_at":"2026-05-26T07:30:03Z","abstract_excerpt":"LLM-based multi-agent systems decompose complex tasks into interacting roles, but most remain manually orchestrated by prompts, tools, and control rules, while agents are rarely optimized through a unified reinforcement learning interface. Existing RL post-training frameworks mainly target single-policy optimization and lack abstractions for user-defined multi-agent workflows, structured interaction, role-specific credit assignment, and configurable parameter sharing.\n  We present UnityMAS-O, a general RL optimization framework for LLM-based multi-agent systems. UnityMAS-O treats the complete "},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2605.26646","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2605.26646/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-27T01:06:03Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"b1uougG4yiDeIMvoUdfqgmU95/UiulQvW81d+DBzzAQiuzKd528pA8p3ouARG+O8ytPNBB/RgSlsjD1qTPNxDg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-27T18:29:17.887977Z"},"content_sha256":"9e55bf3174e5cdc57f096275f2f610e89b5f96f7d0de68956fd147eb28e88c41","schema_version":"1.0","event_id":"sha256:9e55bf3174e5cdc57f096275f2f610e89b5f96f7d0de68956fd147eb28e88c41"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/LXKEYMNJGPBMHP5WHXR6S57A4Q/bundle.json","state_url":"https://pith.science/pith/LXKEYMNJGPBMHP5WHXR6S57A4Q/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/LXKEYMNJGPBMHP5WHXR6S57A4Q/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-27T18:29:17Z","links":{"resolver":"https://pith.science/pith/LXKEYMNJGPBMHP5WHXR6S57A4Q","bundle":"https://pith.science/pith/LXKEYMNJGPBMHP5WHXR6S57A4Q/bundle.json","state":"https://pith.science/pith/LXKEYMNJGPBMHP5WHXR6S57A4Q/state.json","well_known_bundle":"https://pith.science/.well-known/pith/LXKEYMNJGPBMHP5WHXR6S57A4Q/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:LXKEYMNJGPBMHP5WHXR6S57A4Q","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"fad35e7854e513a31cf406b699ee177f10f10fca3dc5889b35066b93c8e54ef2","cross_cats_sorted":["cs.CL","cs.MA"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.AI","submitted_at":"2026-05-26T07:30:03Z","title_canon_sha256":"ab9dcccf1d81af46e8c46a71b8093659ee01d59dcb961cbf85d9c1aece3bfcf4"},"schema_version":"1.0","source":{"id":"2605.26646","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2605.26646","created_at":"2026-05-27T01:06:03Z"},{"alias_kind":"arxiv_version","alias_value":"2605.26646v1","created_at":"2026-05-27T01:06:03Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.26646","created_at":"2026-05-27T01:06:03Z"},{"alias_kind":"pith_short_12","alias_value":"LXKEYMNJGPBM","created_at":"2026-05-27T01:06:03Z"},{"alias_kind":"pith_short_16","alias_value":"LXKEYMNJGPBMHP5W","created_at":"2026-05-27T01:06:03Z"},{"alias_kind":"pith_short_8","alias_value":"LXKEYMNJ","created_at":"2026-05-27T01:06:03Z"}],"graph_snapshots":[{"event_id":"sha256:9e55bf3174e5cdc57f096275f2f610e89b5f96f7d0de68956fd147eb28e88c41","target":"graph","created_at":"2026-05-27T01:06:03Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2605.26646/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"LLM-based multi-agent systems decompose complex tasks into interacting roles, but most remain manually orchestrated by prompts, tools, and control rules, while agents are rarely optimized through a unified reinforcement learning interface. Existing RL post-training frameworks mainly target single-policy optimization and lack abstractions for user-defined multi-agent workflows, structured interaction, role-specific credit assignment, and configurable parameter sharing.\n  We present UnityMAS-O, a general RL optimization framework for LLM-based multi-agent systems. UnityMAS-O treats the complete ","authors_text":"Bin Zhang, Biqing Qi, Erhan Zhang, Haitao Li, Jiaxin Mao, Jinyuan Feng, Lingyong Yan, Qi Liu, Rui Li, Shijie Wang, Wei Yang, Xiaochi Wei, Yan Gao, Yao Hu, Yiqun Chen, Yi Wu, Zechun Niu","cross_cats":["cs.CL","cs.MA"],"headline":"","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.AI","submitted_at":"2026-05-26T07:30:03Z","title":"UnityMAS-O: A General RL Optimization Framework for LLM-Based Multi-Agent Systems"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2605.26646","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:e9ce04f0e097171c7dab87b406502afcfb302873b28868c60467164b4ae37266","target":"record","created_at":"2026-05-27T01:06:03Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"fad35e7854e513a31cf406b699ee177f10f10fca3dc5889b35066b93c8e54ef2","cross_cats_sorted":["cs.CL","cs.MA"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.AI","submitted_at":"2026-05-26T07:30:03Z","title_canon_sha256":"ab9dcccf1d81af46e8c46a71b8093659ee01d59dcb961cbf85d9c1aece3bfcf4"},"schema_version":"1.0","source":{"id":"2605.26646","kind":"arxiv","version":1}},"canonical_sha256":"5dd44c31a933c2c3bfb63de3e977e0e402dc5d56048ad7aca3c971ee97f2d148","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"5dd44c31a933c2c3bfb63de3e977e0e402dc5d56048ad7aca3c971ee97f2d148","first_computed_at":"2026-05-27T01:06:03.928303Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-27T01:06:03.928303Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"Cp5c7KGZlu7fWSNhR0HnsOMY49sm4Ok0vFvPGEdRa4IR7flGCVO476UmmctsAQBCm63vPS6ZofWmjkvqZxYACw==","signature_status":"signed_v1","signed_at":"2026-05-27T01:06:03.929155Z","signed_message":"canonical_sha256_bytes"},"source_id":"2605.26646","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:e9ce04f0e097171c7dab87b406502afcfb302873b28868c60467164b4ae37266","sha256:9e55bf3174e5cdc57f096275f2f610e89b5f96f7d0de68956fd147eb28e88c41"],"state_sha256":"c9a44595c44c5a8788db7fb0db128d21301905bf07837fa4acacde94333093ae"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"kBKZrhjp/zuNdvXtP7nEX8Mf+c/eyo5LpKkSdX9tdzsUt66KRa7YGyckD50XE9EDiOhJmhFAgLyP3Q8RufknDg==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-27T18:29:17.891118Z","bundle_sha256":"73e7b5c5cf752ba6d3e09a560545208968d4336b567f38af020029735927ca68"}}