{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2026:RVL2XL3FLHYA5HMII57FZRU6YF","short_pith_number":"pith:RVL2XL3F","canonical_record":{"source":{"id":"2605.14289","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2026-05-14T02:48:23Z","cross_cats_sorted":["cs.AI","cs.CL","cs.CR"],"title_canon_sha256":"945de5ef473298834c078e322335fed3d5ebf902138f911257bc0e96ae13a74d","abstract_canon_sha256":"3168e50b2f266609e6f77c079ccd113d5d261985456fd3d68a23c56b8de5c1ce"},"schema_version":"1.0"},"canonical_sha256":"8d57abaf6559f00e9d88477e5cc69ec14c5bc0c71a7818f05cdcb4dc1b3e09b9","source":{"kind":"arxiv","id":"2605.14289","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2605.14289","created_at":"2026-05-17T23:39:10Z"},{"alias_kind":"arxiv_version","alias_value":"2605.14289v1","created_at":"2026-05-17T23:39:10Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.14289","created_at":"2026-05-17T23:39:10Z"},{"alias_kind":"pith_short_12","alias_value":"RVL2XL3FLHYA","created_at":"2026-05-18T12:33:37Z"},{"alias_kind":"pith_short_16","alias_value":"RVL2XL3FLHYA5HMI","created_at":"2026-05-18T12:33:37Z"},{"alias_kind":"pith_short_8","alias_value":"RVL2XL3F","created_at":"2026-05-18T12:33:37Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2026:RVL2XL3FLHYA5HMII57FZRU6YF","target":"record","payload":{"canonical_record":{"source":{"id":"2605.14289","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2026-05-14T02:48:23Z","cross_cats_sorted":["cs.AI","cs.CL","cs.CR"],"title_canon_sha256":"945de5ef473298834c078e322335fed3d5ebf902138f911257bc0e96ae13a74d","abstract_canon_sha256":"3168e50b2f266609e6f77c079ccd113d5d261985456fd3d68a23c56b8de5c1ce"},"schema_version":"1.0"},"canonical_sha256":"8d57abaf6559f00e9d88477e5cc69ec14c5bc0c71a7818f05cdcb4dc1b3e09b9","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-17T23:39:10.214578Z","signature_b64":"l27SaBqYHUwEu2n0zzxxrdUG1HZoKMjcNMCeFthWhmvleJi9acCxJTe/1zl7Fw6vGqEyJpz/lqS7O7ciqreYBg==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"8d57abaf6559f00e9d88477e5cc69ec14c5bc0c71a7818f05cdcb4dc1b3e09b9","last_reissued_at":"2026-05-17T23:39:10.213906Z","signature_status":"signed_v1","first_computed_at":"2026-05-17T23:39:10.213906Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2605.14289","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-17T23:39:10Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"hAeoj257rqpPo0XLuL3TieDEMAbim55yp2Cp/Hi/f0CmCbCsu964iSr/38lTr89doSUBKznF7qHJqzolVrfOAQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-26T21:20:55.463148Z"},"content_sha256":"35b98a8c452f17feb260e35766201aea547d7bb4944345ad502ff9a79708c66a","schema_version":"1.0","event_id":"sha256:35b98a8c452f17feb260e35766201aea547d7bb4944345ad502ff9a79708c66a"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2026:RVL2XL3FLHYA5HMII57FZRU6YF","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"MetaMoE: Diversity-Aware Proxy Selection for Privacy-Preserving Mixture-of-Experts Unification","license":"http://creativecommons.org/licenses/by/4.0/","headline":"MetaMoE unifies domain-specialized experts into a single MoE via diversity-aware public proxy selection that approximates private data distributions for router training and expert alignment.","cross_cats":["cs.AI","cs.CL","cs.CR"],"primary_cat":"cs.LG","authors_text":"Shuhao Chen, Sinno Jialin Pan, Weisen Jiang","submitted_at":"2026-05-14T02:48:23Z","abstract_excerpt":"Mixture-of-Experts (MoE) models scale capacity by combining specialized experts, but most existing approaches assume centralized access to training data. In practice, data are distributed across clients and cannot be shared due to privacy constraints, making unified MoE training challenging. We propose MetaMoE, a privacy-preserving framework that unifies independently trained, domain-specialized experts into a single MoE using public proxy data as surrogates for inaccessible private data. Central to MetaMoE is diversity-aware proxy selection, which selects client-domain-relevant and diverse sa"},"claims":{"count":3,"items":[{"kind":"strongest_claim","text":"Experiments on computer vision and natural language processing benchmarks demonstrate that MetaMoE consistently outperforms recent privacy-preserving MoE unification methods.","source":"verdict.strongest_claim","status":"machine_extracted","claim_id":"C1","attestation":"unclaimed"},{"kind":"weakest_assumption","text":"Public proxy data selected for domain relevance and diversity can sufficiently approximate inaccessible private data distributions to supervise router learning and expert alignment without introducing large distribution shift.","source":"verdict.weakest_assumption","status":"machine_extracted","claim_id":"C2","attestation":"unclaimed"},{"kind":"one_line_summary","text":"MetaMoE unifies domain-specialized experts into a single MoE via diversity-aware public proxy selection that approximates private data distributions for router training and expert alignment.","source":"verdict.one_line_summary","status":"machine_extracted","claim_id":"C3","attestation":"unclaimed"}],"snapshot_sha256":"69944ccc1638eef657e98a5fdebbd50855d320053230e40bb8c99b331a9a9f0a"},"source":{"id":"2605.14289","kind":"arxiv","version":1},"verdict":{"id":"bca359f4-6e5b-4ac8-bb2d-d3e7bcc9f0f9","model_set":{"reader":"grok-4.3"},"created_at":"2026-05-15T02:21:07.014636Z","strongest_claim":"Experiments on computer vision and natural language processing benchmarks demonstrate that MetaMoE consistently outperforms recent privacy-preserving MoE unification methods.","one_line_summary":"MetaMoE unifies domain-specialized experts into a single MoE via diversity-aware public proxy selection that approximates private data distributions for router training and expert alignment.","pipeline_version":"pith-pipeline@v0.9.0","weakest_assumption":"Public proxy data selected for domain relevance and diversity can sufficiently approximate inaccessible private data distributions to supervise router learning and expert alignment without introducing large distribution shift.","pith_extraction_headline":""},"references":{"count":12,"sample":[{"doi":"","year":null,"title":"Mixture-of-loras: An efficient multitask tuning for large language models","work_id":"4171e7c2-3d4b-4f02-a497-41ccc1952779","ref_index":1,"cited_arxiv_id":"","is_internal_anchor":false},{"doi":"","year":null,"title":"Branch-train-merge: Embarrassingly parallel training of ex- pert language models.arXiv preprint arXiv:2208.03306","work_id":"53f249ec-fe00-4890-9c6f-64582a367d17","ref_index":2,"cited_arxiv_id":"","is_internal_anchor":false},{"doi":"","year":null,"title":"The flan collection: Designing data and methods for effective instruction tuning","work_id":"56b2f752-8022-4d66-983c-2bb9cb4b2b77","ref_index":3,"cited_arxiv_id":"2301.13688","is_internal_anchor":false},{"doi":"","year":null,"title":"Model Merging in LLMs, MLLMs, and Beyond: Methods, Theories, Applications and Opportunities","work_id":"add1bfdb-f9a2-4280-a81e-ae663e81b3e3","ref_index":4,"cited_arxiv_id":"2408.07666","is_internal_anchor":true},{"doi":"","year":2025,"title":"12 Title Suppressed Due to Excessive Size A. Computation of Relevance Score Following FlexOlmo (Shi et al., 2025), we compute the relevance score g(x,D p) of a public sample x∈ D 0 with respect to a c","work_id":"64905843-7d63-45b8-ac80-4111eab60b00","ref_index":5,"cited_arxiv_id":"","is_internal_anchor":false}],"resolved_work":12,"snapshot_sha256":"898f3d9bbd639c0ce1445b8aa997909294506afea47909a22801800e44f824a4","internal_anchors":1},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":"bca359f4-6e5b-4ac8-bb2d-d3e7bcc9f0f9"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-17T23:39:10Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"Gz2zKEY+3GGyxFfeVPWTIhtbntCqNaRKRD538qHrIHjKvMAB6pH8GEWpEyWHaNxbU7OcTJ/nbUVaHb1NlF/xDg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-26T21:20:55.463779Z"},"content_sha256":"e2f43dfbfac48f3744e436f1b63b4c4932dcd2d9a176d1b043c8af2f2ffacc62","schema_version":"1.0","event_id":"sha256:e2f43dfbfac48f3744e436f1b63b4c4932dcd2d9a176d1b043c8af2f2ffacc62"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/RVL2XL3FLHYA5HMII57FZRU6YF/bundle.json","state_url":"https://pith.science/pith/RVL2XL3FLHYA5HMII57FZRU6YF/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/RVL2XL3FLHYA5HMII57FZRU6YF/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-26T21:20:55Z","links":{"resolver":"https://pith.science/pith/RVL2XL3FLHYA5HMII57FZRU6YF","bundle":"https://pith.science/pith/RVL2XL3FLHYA5HMII57FZRU6YF/bundle.json","state":"https://pith.science/pith/RVL2XL3FLHYA5HMII57FZRU6YF/state.json","well_known_bundle":"https://pith.science/.well-known/pith/RVL2XL3FLHYA5HMII57FZRU6YF/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:RVL2XL3FLHYA5HMII57FZRU6YF","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"3168e50b2f266609e6f77c079ccd113d5d261985456fd3d68a23c56b8de5c1ce","cross_cats_sorted":["cs.AI","cs.CL","cs.CR"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2026-05-14T02:48:23Z","title_canon_sha256":"945de5ef473298834c078e322335fed3d5ebf902138f911257bc0e96ae13a74d"},"schema_version":"1.0","source":{"id":"2605.14289","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2605.14289","created_at":"2026-05-17T23:39:10Z"},{"alias_kind":"arxiv_version","alias_value":"2605.14289v1","created_at":"2026-05-17T23:39:10Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.14289","created_at":"2026-05-17T23:39:10Z"},{"alias_kind":"pith_short_12","alias_value":"RVL2XL3FLHYA","created_at":"2026-05-18T12:33:37Z"},{"alias_kind":"pith_short_16","alias_value":"RVL2XL3FLHYA5HMI","created_at":"2026-05-18T12:33:37Z"},{"alias_kind":"pith_short_8","alias_value":"RVL2XL3F","created_at":"2026-05-18T12:33:37Z"}],"graph_snapshots":[{"event_id":"sha256:e2f43dfbfac48f3744e436f1b63b4c4932dcd2d9a176d1b043c8af2f2ffacc62","target":"graph","created_at":"2026-05-17T23:39:10Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":3,"items":[{"attestation":"unclaimed","claim_id":"C1","kind":"strongest_claim","source":"verdict.strongest_claim","status":"machine_extracted","text":"Experiments on computer vision and natural language processing benchmarks demonstrate that MetaMoE consistently outperforms recent privacy-preserving MoE unification methods."},{"attestation":"unclaimed","claim_id":"C2","kind":"weakest_assumption","source":"verdict.weakest_assumption","status":"machine_extracted","text":"Public proxy data selected for domain relevance and diversity can sufficiently approximate inaccessible private data distributions to supervise router learning and expert alignment without introducing large distribution shift."},{"attestation":"unclaimed","claim_id":"C3","kind":"one_line_summary","source":"verdict.one_line_summary","status":"machine_extracted","text":"MetaMoE unifies domain-specialized experts into a single MoE via diversity-aware public proxy selection that approximates private data distributions for router training and expert alignment."}],"snapshot_sha256":"69944ccc1638eef657e98a5fdebbd50855d320053230e40bb8c99b331a9a9f0a"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Mixture-of-Experts (MoE) models scale capacity by combining specialized experts, but most existing approaches assume centralized access to training data. In practice, data are distributed across clients and cannot be shared due to privacy constraints, making unified MoE training challenging. We propose MetaMoE, a privacy-preserving framework that unifies independently trained, domain-specialized experts into a single MoE using public proxy data as surrogates for inaccessible private data. Central to MetaMoE is diversity-aware proxy selection, which selects client-domain-relevant and diverse sa","authors_text":"Shuhao Chen, Sinno Jialin Pan, Weisen Jiang","cross_cats":["cs.AI","cs.CL","cs.CR"],"headline":"MetaMoE unifies domain-specialized experts into a single MoE via diversity-aware public proxy selection that approximates private data distributions for router training and expert alignment.","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2026-05-14T02:48:23Z","title":"MetaMoE: Diversity-Aware Proxy Selection for Privacy-Preserving Mixture-of-Experts Unification"},"references":{"count":12,"internal_anchors":1,"resolved_work":12,"sample":[{"cited_arxiv_id":"","doi":"","is_internal_anchor":false,"ref_index":1,"title":"Mixture-of-loras: An efficient multitask tuning for large language models","work_id":"4171e7c2-3d4b-4f02-a497-41ccc1952779","year":null},{"cited_arxiv_id":"","doi":"","is_internal_anchor":false,"ref_index":2,"title":"Branch-train-merge: Embarrassingly parallel training of ex- pert language models.arXiv preprint arXiv:2208.03306","work_id":"53f249ec-fe00-4890-9c6f-64582a367d17","year":null},{"cited_arxiv_id":"2301.13688","doi":"","is_internal_anchor":false,"ref_index":3,"title":"The flan collection: Designing data and methods for effective instruction tuning","work_id":"56b2f752-8022-4d66-983c-2bb9cb4b2b77","year":null},{"cited_arxiv_id":"2408.07666","doi":"","is_internal_anchor":true,"ref_index":4,"title":"Model Merging in LLMs, MLLMs, and Beyond: Methods, Theories, Applications and Opportunities","work_id":"add1bfdb-f9a2-4280-a81e-ae663e81b3e3","year":null},{"cited_arxiv_id":"","doi":"","is_internal_anchor":false,"ref_index":5,"title":"12 Title Suppressed Due to Excessive Size A. Computation of Relevance Score Following FlexOlmo (Shi et al., 2025), we compute the relevance score g(x,D p) of a public sample x∈ D 0 with respect to a c","work_id":"64905843-7d63-45b8-ac80-4111eab60b00","year":2025}],"snapshot_sha256":"898f3d9bbd639c0ce1445b8aa997909294506afea47909a22801800e44f824a4"},"source":{"id":"2605.14289","kind":"arxiv","version":1},"verdict":{"created_at":"2026-05-15T02:21:07.014636Z","id":"bca359f4-6e5b-4ac8-bb2d-d3e7bcc9f0f9","model_set":{"reader":"grok-4.3"},"one_line_summary":"MetaMoE unifies domain-specialized experts into a single MoE via diversity-aware public proxy selection that approximates private data distributions for router training and expert alignment.","pipeline_version":"pith-pipeline@v0.9.0","pith_extraction_headline":"","strongest_claim":"Experiments on computer vision and natural language processing benchmarks demonstrate that MetaMoE consistently outperforms recent privacy-preserving MoE unification methods.","weakest_assumption":"Public proxy data selected for domain relevance and diversity can sufficiently approximate inaccessible private data distributions to supervise router learning and expert alignment without introducing large distribution shift."}},"verdict_id":"bca359f4-6e5b-4ac8-bb2d-d3e7bcc9f0f9"}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:35b98a8c452f17feb260e35766201aea547d7bb4944345ad502ff9a79708c66a","target":"record","created_at":"2026-05-17T23:39:10Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"3168e50b2f266609e6f77c079ccd113d5d261985456fd3d68a23c56b8de5c1ce","cross_cats_sorted":["cs.AI","cs.CL","cs.CR"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2026-05-14T02:48:23Z","title_canon_sha256":"945de5ef473298834c078e322335fed3d5ebf902138f911257bc0e96ae13a74d"},"schema_version":"1.0","source":{"id":"2605.14289","kind":"arxiv","version":1}},"canonical_sha256":"8d57abaf6559f00e9d88477e5cc69ec14c5bc0c71a7818f05cdcb4dc1b3e09b9","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"8d57abaf6559f00e9d88477e5cc69ec14c5bc0c71a7818f05cdcb4dc1b3e09b9","first_computed_at":"2026-05-17T23:39:10.213906Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-17T23:39:10.213906Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"l27SaBqYHUwEu2n0zzxxrdUG1HZoKMjcNMCeFthWhmvleJi9acCxJTe/1zl7Fw6vGqEyJpz/lqS7O7ciqreYBg==","signature_status":"signed_v1","signed_at":"2026-05-17T23:39:10.214578Z","signed_message":"canonical_sha256_bytes"},"source_id":"2605.14289","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:35b98a8c452f17feb260e35766201aea547d7bb4944345ad502ff9a79708c66a","sha256:e2f43dfbfac48f3744e436f1b63b4c4932dcd2d9a176d1b043c8af2f2ffacc62"],"state_sha256":"8fcdc7efa4d7dca0d93664176c0299d8e9a56705d6742b209e9ad4973fe9ebb8"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"lIG+nJSH+bfLU4PC9OLIFejB6VQ3z6qY9kBFyduqxJMvQ1dBm3ol8/jgOZ94mzZManRVlYhLzM12svYnJOb0Cg==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-26T21:20:55.467082Z","bundle_sha256":"75577be2e0b88343b3cab27b61148f9e3737ecce2a5f1c9a6321e23b71b779e9"}}