{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:43CNLIMOYJUQY3SF6NKQTFV6W7","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"51fc8d79b634e9b52de1b192e26fa6237cf048ce1a0c2601a14752599a09446a","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2026-03-30T02:40:20Z","title_canon_sha256":"79ea05b6d676e8d1b5bb1074f07ebaa7ca0dc93f0b562b9173db98b679719ce0"},"schema_version":"1.0","source":{"id":"2603.27965","kind":"arxiv","version":2}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2603.27965","created_at":"2026-07-03T01:17:19Z"},{"alias_kind":"arxiv_version","alias_value":"2603.27965v2","created_at":"2026-07-03T01:17:19Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2603.27965","created_at":"2026-07-03T01:17:19Z"},{"alias_kind":"pith_short_12","alias_value":"43CNLIMOYJUQ","created_at":"2026-07-03T01:17:19Z"},{"alias_kind":"pith_short_16","alias_value":"43CNLIMOYJUQY3SF","created_at":"2026-07-03T01:17:19Z"},{"alias_kind":"pith_short_8","alias_value":"43CNLIMO","created_at":"2026-07-03T01:17:19Z"}],"graph_snapshots":[{"event_id":"sha256:914f789a318b4cf85e8ad9cefdd5456faeb788b59991db42d77569576c3a88da","target":"graph","created_at":"2026-07-03T01:17:19Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2603.27965/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Mixture-of-Experts (MoE) models substantially improve performance by increasing the capacity of dense architectures. However, directly training MoE models requires considerable computational resources and introduces extra overhead in parameter storage and deployment. Therefore, it is critical to develop an approach that leverages the multi-expert capability of MoE to enhance performance while incurring minimal additional cost. To this end, we propose a novel pre-training approach, termed ExFusion, which improves the efficiency of Transformer training through multi-expert fusion. Specifically, ","authors_text":"Daize Dong, Jiacheng Ruan, Suncheng Xiang, Ting Liu, Tong Zhu, Xiaoye Qu, Yu Cheng, Yuzhuo Fu","cross_cats":[],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2026-03-30T02:40:20Z","title":"ExFusion: Efficient Transformer Training via Multi-Experts Fusion"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2603.27965","kind":"arxiv","version":2},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:96db3a0319b22adaa74cefa021e5d55012841cb2adf6f528b1df4d195b63fb1c","target":"record","created_at":"2026-07-03T01:17:19Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"51fc8d79b634e9b52de1b192e26fa6237cf048ce1a0c2601a14752599a09446a","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2026-03-30T02:40:20Z","title_canon_sha256":"79ea05b6d676e8d1b5bb1074f07ebaa7ca0dc93f0b562b9173db98b679719ce0"},"schema_version":"1.0","source":{"id":"2603.27965","kind":"arxiv","version":2}},"canonical_sha256":"e6c4d5a18ec2690c6e45f3550996beb7dbdc9a236cadbbb78419a0cbf1b7b1dc","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"e6c4d5a18ec2690c6e45f3550996beb7dbdc9a236cadbbb78419a0cbf1b7b1dc","first_computed_at":"2026-07-03T01:17:19.337441Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-07-03T01:17:19.337441Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"uNyM68Dk0TqaQosuc8KV3saYhHa0mD7gb9APD9U9XEL3RaBWFrOx10fab+vITLBZKJQP3xl/tHm2iDC4fC0PBg==","signature_status":"signed_v1","signed_at":"2026-07-03T01:17:19.337914Z","signed_message":"canonical_sha256_bytes"},"source_id":"2603.27965","source_kind":"arxiv","source_version":2}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:96db3a0319b22adaa74cefa021e5d55012841cb2adf6f528b1df4d195b63fb1c","sha256:914f789a318b4cf85e8ad9cefdd5456faeb788b59991db42d77569576c3a88da"],"state_sha256":"b2f9966d940178fc97bef12140aafdf8b9b6a091d987159d5c34cf61414b0636"}