{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2026:ZSADPI3RHHXRHXUAVD5CR4UKHV","short_pith_number":"pith:ZSADPI3R","canonical_record":{"source":{"id":"2605.19593","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.AI","submitted_at":"2026-05-19T09:39:16Z","cross_cats_sorted":["cs.DC"],"title_canon_sha256":"a961b1622695450c28234129164829eab2a5f5fef279bd7e917d449940272f0b","abstract_canon_sha256":"a12929b3aac98eb87dd1cbfba4d28ed62f5b162edf65e50c55ad521ff1d76adc"},"schema_version":"1.0"},"canonical_sha256":"cc8037a37139ef13de80a8fa28f28a3d495eca8b0c61d50e8851e9bb140aabd4","source":{"kind":"arxiv","id":"2605.19593","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2605.19593","created_at":"2026-05-20T01:05:53Z"},{"alias_kind":"arxiv_version","alias_value":"2605.19593v1","created_at":"2026-05-20T01:05:53Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.19593","created_at":"2026-05-20T01:05:53Z"},{"alias_kind":"pith_short_12","alias_value":"ZSADPI3RHHXR","created_at":"2026-05-20T01:05:53Z"},{"alias_kind":"pith_short_16","alias_value":"ZSADPI3RHHXRHXUA","created_at":"2026-05-20T01:05:53Z"},{"alias_kind":"pith_short_8","alias_value":"ZSADPI3R","created_at":"2026-05-20T01:05:53Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2026:ZSADPI3RHHXRHXUAVD5CR4UKHV","target":"record","payload":{"canonical_record":{"source":{"id":"2605.19593","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.AI","submitted_at":"2026-05-19T09:39:16Z","cross_cats_sorted":["cs.DC"],"title_canon_sha256":"a961b1622695450c28234129164829eab2a5f5fef279bd7e917d449940272f0b","abstract_canon_sha256":"a12929b3aac98eb87dd1cbfba4d28ed62f5b162edf65e50c55ad521ff1d76adc"},"schema_version":"1.0"},"canonical_sha256":"cc8037a37139ef13de80a8fa28f28a3d495eca8b0c61d50e8851e9bb140aabd4","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-20T01:05:53.385863Z","signature_b64":"rTvgvw5mcp1BW49n3h6VFn1ndit86hc9ls7LR7aN9Kwm9GZhNwigTnDsrSZvQq4j0YVZNG1Rh2c1MohcJNGKDA==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"cc8037a37139ef13de80a8fa28f28a3d495eca8b0c61d50e8851e9bb140aabd4","last_reissued_at":"2026-05-20T01:05:53.385062Z","signature_status":"signed_v1","first_computed_at":"2026-05-20T01:05:53.385062Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2605.19593","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-20T01:05:53Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"DDgf3g+SSBR959Pf5Zk0QTOm36k2yuPP1cDYCJMlfR3x+QNV+Fb4gBio/UZg1YysncY3L1RWtFewjwiGdDrIBQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-23T13:21:15.316627Z"},"content_sha256":"84520b3c90abf416cbb46a64157e74be3a5cd140695fa99e2292c8c2c474da22","schema_version":"1.0","event_id":"sha256:84520b3c90abf416cbb46a64157e74be3a5cd140695fa99e2292c8c2c474da22"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2026:ZSADPI3RHHXRHXUAVD5CR4UKHV","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Towards Multi-Model LLM Schedulers: Empirical Insights into Offloading and Preemption","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":["cs.DC"],"primary_cat":"cs.AI","authors_text":"Alexey Rolich, Andrea Baiocchi, Francesca Cuomo, Mert Yildiz, Pietro Spadaccino","submitted_at":"2026-05-19T09:39:16Z","abstract_excerpt":"Modern deployments of Large Language Models (LLMs) increasingly require serving multiple models with diverse architectures, sizes, and specialization on shared, heterogeneous hardware. This setting introduces new challenges for resource allocation, dispatching, and scheduling, particularly under GPU memory constraints where partial CPU-GPU offloading and preemption become necessary. While existing systems primarily optimize throughput for a single model, comparatively little work addresses multi-model scheduling under these conditions. In this paper, we present an empirical study of how differ"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2605.19593","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2605.19593/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-20T01:05:53Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"6tEtZzi1VRoXmARI7moBr/ViyHdGGVHykYJV+Khv99Ct5e3NTcuZtjqF1WkPTQw39YeKMmD/vtxhLHUf0bY1Cw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-23T13:21:15.317392Z"},"content_sha256":"43eb00e2ab413a7909de1fe47c4f59da67a7b0a231c9509aad444441c1f0ef61","schema_version":"1.0","event_id":"sha256:43eb00e2ab413a7909de1fe47c4f59da67a7b0a231c9509aad444441c1f0ef61"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/ZSADPI3RHHXRHXUAVD5CR4UKHV/bundle.json","state_url":"https://pith.science/pith/ZSADPI3RHHXRHXUAVD5CR4UKHV/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/ZSADPI3RHHXRHXUAVD5CR4UKHV/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-23T13:21:15Z","links":{"resolver":"https://pith.science/pith/ZSADPI3RHHXRHXUAVD5CR4UKHV","bundle":"https://pith.science/pith/ZSADPI3RHHXRHXUAVD5CR4UKHV/bundle.json","state":"https://pith.science/pith/ZSADPI3RHHXRHXUAVD5CR4UKHV/state.json","well_known_bundle":"https://pith.science/.well-known/pith/ZSADPI3RHHXRHXUAVD5CR4UKHV/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:ZSADPI3RHHXRHXUAVD5CR4UKHV","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"a12929b3aac98eb87dd1cbfba4d28ed62f5b162edf65e50c55ad521ff1d76adc","cross_cats_sorted":["cs.DC"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.AI","submitted_at":"2026-05-19T09:39:16Z","title_canon_sha256":"a961b1622695450c28234129164829eab2a5f5fef279bd7e917d449940272f0b"},"schema_version":"1.0","source":{"id":"2605.19593","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2605.19593","created_at":"2026-05-20T01:05:53Z"},{"alias_kind":"arxiv_version","alias_value":"2605.19593v1","created_at":"2026-05-20T01:05:53Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.19593","created_at":"2026-05-20T01:05:53Z"},{"alias_kind":"pith_short_12","alias_value":"ZSADPI3RHHXR","created_at":"2026-05-20T01:05:53Z"},{"alias_kind":"pith_short_16","alias_value":"ZSADPI3RHHXRHXUA","created_at":"2026-05-20T01:05:53Z"},{"alias_kind":"pith_short_8","alias_value":"ZSADPI3R","created_at":"2026-05-20T01:05:53Z"}],"graph_snapshots":[{"event_id":"sha256:43eb00e2ab413a7909de1fe47c4f59da67a7b0a231c9509aad444441c1f0ef61","target":"graph","created_at":"2026-05-20T01:05:53Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2605.19593/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Modern deployments of Large Language Models (LLMs) increasingly require serving multiple models with diverse architectures, sizes, and specialization on shared, heterogeneous hardware. This setting introduces new challenges for resource allocation, dispatching, and scheduling, particularly under GPU memory constraints where partial CPU-GPU offloading and preemption become necessary. While existing systems primarily optimize throughput for a single model, comparatively little work addresses multi-model scheduling under these conditions. In this paper, we present an empirical study of how differ","authors_text":"Alexey Rolich, Andrea Baiocchi, Francesca Cuomo, Mert Yildiz, Pietro Spadaccino","cross_cats":["cs.DC"],"headline":"","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.AI","submitted_at":"2026-05-19T09:39:16Z","title":"Towards Multi-Model LLM Schedulers: Empirical Insights into Offloading and Preemption"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2605.19593","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:84520b3c90abf416cbb46a64157e74be3a5cd140695fa99e2292c8c2c474da22","target":"record","created_at":"2026-05-20T01:05:53Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"a12929b3aac98eb87dd1cbfba4d28ed62f5b162edf65e50c55ad521ff1d76adc","cross_cats_sorted":["cs.DC"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.AI","submitted_at":"2026-05-19T09:39:16Z","title_canon_sha256":"a961b1622695450c28234129164829eab2a5f5fef279bd7e917d449940272f0b"},"schema_version":"1.0","source":{"id":"2605.19593","kind":"arxiv","version":1}},"canonical_sha256":"cc8037a37139ef13de80a8fa28f28a3d495eca8b0c61d50e8851e9bb140aabd4","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"cc8037a37139ef13de80a8fa28f28a3d495eca8b0c61d50e8851e9bb140aabd4","first_computed_at":"2026-05-20T01:05:53.385062Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-20T01:05:53.385062Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"rTvgvw5mcp1BW49n3h6VFn1ndit86hc9ls7LR7aN9Kwm9GZhNwigTnDsrSZvQq4j0YVZNG1Rh2c1MohcJNGKDA==","signature_status":"signed_v1","signed_at":"2026-05-20T01:05:53.385863Z","signed_message":"canonical_sha256_bytes"},"source_id":"2605.19593","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:84520b3c90abf416cbb46a64157e74be3a5cd140695fa99e2292c8c2c474da22","sha256:43eb00e2ab413a7909de1fe47c4f59da67a7b0a231c9509aad444441c1f0ef61"],"state_sha256":"e03e952d25757bf9c113aa7d9f551d6fd7765167a0f19e4001f7f50853238b2c"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"j5DU+Hwjn0gKl8CUOdb4qKZg5mw9cNRvObdasVqSm7tc6u/eXqKljY4OxFzP9QETg+o9w1cEhWHK0EVclM5uCQ==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-23T13:21:15.321712Z","bundle_sha256":"7514a0cf71f9d75f33a5a626ef9611480cb875f0413fc2a33ab1ac0e70db9092"}}