{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:I4NQOE5JZ2Y7ADKD737KQGJHF7","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"3731f7dcd36f35538f652383ec88c2639d7346c842006b88e7d1b3c9fcc9e319","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2026-06-20T04:10:34Z","title_canon_sha256":"d451b5ae543e07485868d28c11cf687a183efc71a3f7c1c9f82e130f4ddcaff4"},"schema_version":"1.0","source":{"id":"2606.21868","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.21868","created_at":"2026-06-23T02:13:01Z"},{"alias_kind":"arxiv_version","alias_value":"2606.21868v1","created_at":"2026-06-23T02:13:01Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.21868","created_at":"2026-06-23T02:13:01Z"},{"alias_kind":"pith_short_12","alias_value":"I4NQOE5JZ2Y7","created_at":"2026-06-23T02:13:01Z"},{"alias_kind":"pith_short_16","alias_value":"I4NQOE5JZ2Y7ADKD","created_at":"2026-06-23T02:13:01Z"},{"alias_kind":"pith_short_8","alias_value":"I4NQOE5J","created_at":"2026-06-23T02:13:01Z"}],"graph_snapshots":[{"event_id":"sha256:d00c97057370adf75f8bd7c120f9adfc51dde8e1afbf997c295dea41ed1f8780","target":"graph","created_at":"2026-06-23T02:13:01Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2606.21868/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Modern Mixture-of-Experts (MoE) models place most of their parameters in expert layers, yet only a small fraction of those experts are used for any token. The unused weights must still be stored where the GPU can reach them. On commodity GPUs the common fix is layer-level CPU offloading, which keeps memory low but streams all of a layer's experts across PCIe on every forward pass, losing much of MoE's sparsity benefit. We cast low-resource MoE serving as a working-set management problem on the GPU: routed expert weights and the key-value (KV) cache are two streams of memory demand competing fo","authors_text":"Jiamu Zhang, Liangjie Hong, Liang Wu, Mayank Darbari","cross_cats":[],"headline":"","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2026-06-20T04:10:34Z","title":"WiSP: A Working-Set View of Mixture-of-Experts Serving on Extremely Low-Resource Hardware"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.21868","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:32318f41d91e5fb9610dde05261300de391f4bc31f08eb7e88e5afabe2c7afd9","target":"record","created_at":"2026-06-23T02:13:01Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"3731f7dcd36f35538f652383ec88c2639d7346c842006b88e7d1b3c9fcc9e319","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2026-06-20T04:10:34Z","title_canon_sha256":"d451b5ae543e07485868d28c11cf687a183efc71a3f7c1c9f82e130f4ddcaff4"},"schema_version":"1.0","source":{"id":"2606.21868","kind":"arxiv","version":1}},"canonical_sha256":"471b0713a9ceb1f00d43fefea819272fce6265284283282945c450cd6faaf6e1","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"471b0713a9ceb1f00d43fefea819272fce6265284283282945c450cd6faaf6e1","first_computed_at":"2026-06-23T02:13:01.457559Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-06-23T02:13:01.457559Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"NHZAosSa8k3LkAQeS2LuqPlw7NkzINeJ4drzEnDScTNx2cO1sCrgLKr2mTEMfg9aIOrig+bIoYT40hylW4VnCw==","signature_status":"signed_v1","signed_at":"2026-06-23T02:13:01.457903Z","signed_message":"canonical_sha256_bytes"},"source_id":"2606.21868","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:32318f41d91e5fb9610dde05261300de391f4bc31f08eb7e88e5afabe2c7afd9","sha256:d00c97057370adf75f8bd7c120f9adfc51dde8e1afbf997c295dea41ed1f8780"],"state_sha256":"00c1521aa21bd94092a98bce499023c5592c0ce0b6b436b938afb950099995c7"}