{"record_type":"pith_number_record","schema_url":"https://pith.science/schemas/pith-number/v1.json","pith_number":"pith:2026:EIOSARSDM5IK2LKKUH75IE4R7B","short_pith_number":"pith:EIOSARSD","schema_version":"1.0","canonical_sha256":"221d2046436750ad2d4aa1ffd41391f84f0f04cfc9e5f471c2b42a24dca35614","source":{"kind":"arxiv","id":"2605.27744","version":1},"attestation_state":"computed","paper":{"title":"A Policy-Driven Runtime Layer for Agentic LLM Serving","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":[],"primary_cat":"cs.AI","authors_text":"Chaeeun Kim, Liting Hu, Rui Zhang","submitted_at":"2026-05-26T22:38:34Z","abstract_excerpt":"Multi-agent LLM systems have become the dominant production workload, but the serving stack was not built for them. The agent framework above knows agent identities, role, schemas, and dispatch structure but never sees an engine-level event; the serving engine below sees every event but knows nothing about agents. A surprising number of cross-cutting policies depend on both: prefix caching, batch shaping, speculative execution, fairness, tool-result memoization, safety enforcement, and more. Each lives in the seam between the two layers and is currently solved by a one-off patch into one neigh"},"verification_status":{"content_addressed":true,"pith_receipt":true,"author_attested":false,"weak_author_claims":0,"strong_author_claims":0,"externally_anchored":false,"storage_verified":false,"citation_signatures":0,"replication_records":0,"graph_snapshot":true,"references_resolved":false,"formal_links_present":false},"canonical_record":{"source":{"id":"2605.27744","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.AI","submitted_at":"2026-05-26T22:38:34Z","cross_cats_sorted":[],"title_canon_sha256":"b8f9fa0efc3fcb8cfa0c86b8562db7e772958b4bd6a710d67463c37a28232ea2","abstract_canon_sha256":"930595fc028870ee99aef9e0173380051a1cf44b135b449d8f2ea8a17f54e162"},"schema_version":"1.0"},"receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-28T01:04:47.743727Z","signature_b64":"9KZKh9OWdUEck0WXX1RA8snTEf8RO2+denGt+U5Br5hyrvAbn0a3PedoDtckmX6Up7XmBD+b0Zuvh4Q/dW7qAQ==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"221d2046436750ad2d4aa1ffd41391f84f0f04cfc9e5f471c2b42a24dca35614","last_reissued_at":"2026-05-28T01:04:47.743376Z","signature_status":"signed_v1","first_computed_at":"2026-05-28T01:04:47.743376Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"graph_snapshot":{"paper":{"title":"A Policy-Driven Runtime Layer for Agentic LLM Serving","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":[],"primary_cat":"cs.AI","authors_text":"Chaeeun Kim, Liting Hu, Rui Zhang","submitted_at":"2026-05-26T22:38:34Z","abstract_excerpt":"Multi-agent LLM systems have become the dominant production workload, but the serving stack was not built for them. The agent framework above knows agent identities, role, schemas, and dispatch structure but never sees an engine-level event; the serving engine below sees every event but knows nothing about agents. A surprising number of cross-cutting policies depend on both: prefix caching, batch shaping, speculative execution, fairness, tool-result memoization, safety enforcement, and more. Each lives in the seam between the two layers and is currently solved by a one-off patch into one neigh"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2605.27744","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2605.27744/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"aliases":[{"alias_kind":"arxiv","alias_value":"2605.27744","created_at":"2026-05-28T01:04:47.743433+00:00"},{"alias_kind":"arxiv_version","alias_value":"2605.27744v1","created_at":"2026-05-28T01:04:47.743433+00:00"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.27744","created_at":"2026-05-28T01:04:47.743433+00:00"},{"alias_kind":"pith_short_12","alias_value":"EIOSARSDM5IK","created_at":"2026-05-28T01:04:47.743433+00:00"},{"alias_kind":"pith_short_16","alias_value":"EIOSARSDM5IK2LKK","created_at":"2026-05-28T01:04:47.743433+00:00"},{"alias_kind":"pith_short_8","alias_value":"EIOSARSD","created_at":"2026-05-28T01:04:47.743433+00:00"}],"events":[],"event_summary":{},"paper_claims":[],"inbound_citations":{"count":0,"internal_anchor_count":0,"sample":[]},"formal_canon":{"evidence_count":0,"sample":[],"anchors":[]},"links":{"html":"https://pith.science/pith/EIOSARSDM5IK2LKKUH75IE4R7B","json":"https://pith.science/pith/EIOSARSDM5IK2LKKUH75IE4R7B.json","graph_json":"https://pith.science/api/pith-number/EIOSARSDM5IK2LKKUH75IE4R7B/graph.json","events_json":"https://pith.science/api/pith-number/EIOSARSDM5IK2LKKUH75IE4R7B/events.json","paper":"https://pith.science/paper/EIOSARSD"},"agent_actions":{"view_html":"https://pith.science/pith/EIOSARSDM5IK2LKKUH75IE4R7B","download_json":"https://pith.science/pith/EIOSARSDM5IK2LKKUH75IE4R7B.json","view_paper":"https://pith.science/paper/EIOSARSD","resolve_alias":"https://pith.science/api/pith-number/resolve?arxiv=2605.27744&json=true","fetch_graph":"https://pith.science/api/pith-number/EIOSARSDM5IK2LKKUH75IE4R7B/graph.json","fetch_events":"https://pith.science/api/pith-number/EIOSARSDM5IK2LKKUH75IE4R7B/events.json","actions":{"anchor_timestamp":"https://pith.science/pith/EIOSARSDM5IK2LKKUH75IE4R7B/action/timestamp_anchor","attest_storage":"https://pith.science/pith/EIOSARSDM5IK2LKKUH75IE4R7B/action/storage_attestation","attest_author":"https://pith.science/pith/EIOSARSDM5IK2LKKUH75IE4R7B/action/author_attestation","sign_citation":"https://pith.science/pith/EIOSARSDM5IK2LKKUH75IE4R7B/action/citation_signature","submit_replication":"https://pith.science/pith/EIOSARSDM5IK2LKKUH75IE4R7B/action/replication_record"}},"created_at":"2026-05-28T01:04:47.743433+00:00","updated_at":"2026-05-28T01:04:47.743433+00:00"}