{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2026:3ILHTJ55PMRS3KSJP6JGJYCUXZ","short_pith_number":"pith:3ILHTJ55","canonical_record":{"source":{"id":"2603.22774","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.AR","submitted_at":"2026-03-24T04:06:27Z","cross_cats_sorted":["cs.DC"],"title_canon_sha256":"1c456ff73655f29eea5f714ad9a39f377a7ddb439248589ccd80bd24c777736b","abstract_canon_sha256":"b18bbb050ecf934b83fad490534dadad585e888c454209ded254bcbbe209aff9"},"schema_version":"1.0"},"canonical_sha256":"da1679a7bd7b232daa497f9264e054be4c40eb7c919cb3af098bbc5d417ee9f3","source":{"kind":"arxiv","id":"2603.22774","version":2},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2603.22774","created_at":"2026-05-26T02:04:09Z"},{"alias_kind":"arxiv_version","alias_value":"2603.22774v2","created_at":"2026-05-26T02:04:09Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2603.22774","created_at":"2026-05-26T02:04:09Z"},{"alias_kind":"pith_short_12","alias_value":"3ILHTJ55PMRS","created_at":"2026-05-26T02:04:09Z"},{"alias_kind":"pith_short_16","alias_value":"3ILHTJ55PMRS3KSJ","created_at":"2026-05-26T02:04:09Z"},{"alias_kind":"pith_short_8","alias_value":"3ILHTJ55","created_at":"2026-05-26T02:04:09Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2026:3ILHTJ55PMRS3KSJP6JGJYCUXZ","target":"record","payload":{"canonical_record":{"source":{"id":"2603.22774","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.AR","submitted_at":"2026-03-24T04:06:27Z","cross_cats_sorted":["cs.DC"],"title_canon_sha256":"1c456ff73655f29eea5f714ad9a39f377a7ddb439248589ccd80bd24c777736b","abstract_canon_sha256":"b18bbb050ecf934b83fad490534dadad585e888c454209ded254bcbbe209aff9"},"schema_version":"1.0"},"canonical_sha256":"da1679a7bd7b232daa497f9264e054be4c40eb7c919cb3af098bbc5d417ee9f3","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-26T02:04:09.541604Z","signature_b64":"+3KIMn3tdDZZBL7xk0exqNBGqdhvqTvLA7nPcD8B1KLHTP07p21f1Uw9NBC6mI//RxR+XIsVnYrTxBZx51jICw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"da1679a7bd7b232daa497f9264e054be4c40eb7c919cb3af098bbc5d417ee9f3","last_reissued_at":"2026-05-26T02:04:09.540664Z","signature_status":"signed_v1","first_computed_at":"2026-05-26T02:04:09.540664Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2603.22774","source_version":2,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-26T02:04:09Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"L4gu8q3B608HZDKFaUAfU0B4qpeTaZsk6cgEY/w/rC9AVgVMRkWH6fCnLvR3pfLyoKtZsyiZ7TK+ktm+eC7sAw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-23T16:46:30.998552Z"},"content_sha256":"91c36ba654baf9817ba148d2ab5b2270c193bdd4bfe6129b045cc2b61b3151c9","schema_version":"1.0","event_id":"sha256:91c36ba654baf9817ba148d2ab5b2270c193bdd4bfe6129b045cc2b61b3151c9"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2026:3ILHTJ55PMRS3KSJP6JGJYCUXZ","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Characterizing CPU-Induced Slowdowns in Multi-GPU LLM Inference","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.DC"],"primary_cat":"cs.AR","authors_text":"Aaron Jezghani, Euijun Chung, Hyesoon Kim, Yuxiao Jia","submitted_at":"2026-03-24T04:06:27Z","abstract_excerpt":"Large-scale machine learning workloads increasingly rely on multi-GPU systems, yet their performance is often limited by an overlooked component: the CPU. Through a detailed study of modern large language model (LLM) inference and serving workloads, we find that multi-GPU performance frequently degrades not because GPUs are saturated, but because CPUs fail to keep the GPUs busy. Under limited CPU allocations, systems exhibit symptoms such as delayed kernel launch, stalled communication, and increased tokenization latency, leading to severe GPU underutilization even when ample GPU resources are"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2603.22774","kind":"arxiv","version":2},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2603.22774/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-26T02:04:09Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"RGNyJFx1xADBUgV0PoSjZ8DCe62F0iW6oMCSgCD/rSRIVmwSlJtjP3nCA5NMfd3zA6IZcLDirIXyuXtsp9UWAQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-23T16:46:30.998942Z"},"content_sha256":"4c805aa9d252f6a0358a0b20c808d04834723c4337f6912625ec8da89a76fed9","schema_version":"1.0","event_id":"sha256:4c805aa9d252f6a0358a0b20c808d04834723c4337f6912625ec8da89a76fed9"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/3ILHTJ55PMRS3KSJP6JGJYCUXZ/bundle.json","state_url":"https://pith.science/pith/3ILHTJ55PMRS3KSJP6JGJYCUXZ/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/3ILHTJ55PMRS3KSJP6JGJYCUXZ/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-23T16:46:30Z","links":{"resolver":"https://pith.science/pith/3ILHTJ55PMRS3KSJP6JGJYCUXZ","bundle":"https://pith.science/pith/3ILHTJ55PMRS3KSJP6JGJYCUXZ/bundle.json","state":"https://pith.science/pith/3ILHTJ55PMRS3KSJP6JGJYCUXZ/state.json","well_known_bundle":"https://pith.science/.well-known/pith/3ILHTJ55PMRS3KSJP6JGJYCUXZ/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:3ILHTJ55PMRS3KSJP6JGJYCUXZ","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"b18bbb050ecf934b83fad490534dadad585e888c454209ded254bcbbe209aff9","cross_cats_sorted":["cs.DC"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.AR","submitted_at":"2026-03-24T04:06:27Z","title_canon_sha256":"1c456ff73655f29eea5f714ad9a39f377a7ddb439248589ccd80bd24c777736b"},"schema_version":"1.0","source":{"id":"2603.22774","kind":"arxiv","version":2}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2603.22774","created_at":"2026-05-26T02:04:09Z"},{"alias_kind":"arxiv_version","alias_value":"2603.22774v2","created_at":"2026-05-26T02:04:09Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2603.22774","created_at":"2026-05-26T02:04:09Z"},{"alias_kind":"pith_short_12","alias_value":"3ILHTJ55PMRS","created_at":"2026-05-26T02:04:09Z"},{"alias_kind":"pith_short_16","alias_value":"3ILHTJ55PMRS3KSJ","created_at":"2026-05-26T02:04:09Z"},{"alias_kind":"pith_short_8","alias_value":"3ILHTJ55","created_at":"2026-05-26T02:04:09Z"}],"graph_snapshots":[{"event_id":"sha256:4c805aa9d252f6a0358a0b20c808d04834723c4337f6912625ec8da89a76fed9","target":"graph","created_at":"2026-05-26T02:04:09Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2603.22774/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Large-scale machine learning workloads increasingly rely on multi-GPU systems, yet their performance is often limited by an overlooked component: the CPU. Through a detailed study of modern large language model (LLM) inference and serving workloads, we find that multi-GPU performance frequently degrades not because GPUs are saturated, but because CPUs fail to keep the GPUs busy. Under limited CPU allocations, systems exhibit symptoms such as delayed kernel launch, stalled communication, and increased tokenization latency, leading to severe GPU underutilization even when ample GPU resources are","authors_text":"Aaron Jezghani, Euijun Chung, Hyesoon Kim, Yuxiao Jia","cross_cats":["cs.DC"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.AR","submitted_at":"2026-03-24T04:06:27Z","title":"Characterizing CPU-Induced Slowdowns in Multi-GPU LLM Inference"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2603.22774","kind":"arxiv","version":2},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:91c36ba654baf9817ba148d2ab5b2270c193bdd4bfe6129b045cc2b61b3151c9","target":"record","created_at":"2026-05-26T02:04:09Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"b18bbb050ecf934b83fad490534dadad585e888c454209ded254bcbbe209aff9","cross_cats_sorted":["cs.DC"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.AR","submitted_at":"2026-03-24T04:06:27Z","title_canon_sha256":"1c456ff73655f29eea5f714ad9a39f377a7ddb439248589ccd80bd24c777736b"},"schema_version":"1.0","source":{"id":"2603.22774","kind":"arxiv","version":2}},"canonical_sha256":"da1679a7bd7b232daa497f9264e054be4c40eb7c919cb3af098bbc5d417ee9f3","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"da1679a7bd7b232daa497f9264e054be4c40eb7c919cb3af098bbc5d417ee9f3","first_computed_at":"2026-05-26T02:04:09.540664Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-26T02:04:09.540664Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"+3KIMn3tdDZZBL7xk0exqNBGqdhvqTvLA7nPcD8B1KLHTP07p21f1Uw9NBC6mI//RxR+XIsVnYrTxBZx51jICw==","signature_status":"signed_v1","signed_at":"2026-05-26T02:04:09.541604Z","signed_message":"canonical_sha256_bytes"},"source_id":"2603.22774","source_kind":"arxiv","source_version":2}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:91c36ba654baf9817ba148d2ab5b2270c193bdd4bfe6129b045cc2b61b3151c9","sha256:4c805aa9d252f6a0358a0b20c808d04834723c4337f6912625ec8da89a76fed9"],"state_sha256":"1927a4dc3c047cf0bd658912b6498cedc08395732460a8fbcfadb3d652ed2ae0"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"L0+CCthcHcep0uilMGT34W5bN483eDRpnv8asGpEmOva1bFiWGO4BweSedWhVOCbtsAbU8DAXEyASfxxDbUgDg==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-23T16:46:31.001092Z","bundle_sha256":"3f815ffcace127ca19ff9a48c2e98aeb4bdbb8d9bd9986f8e5028d60397b2248"}}