{"record_type":"pith_number_record","schema_url":"https://pith.science/schemas/pith-number/v1.json","pith_number":"pith:2026:3TSWZUZFODHZPEYPOPHGUAK3NR","short_pith_number":"pith:3TSWZUZF","schema_version":"1.0","canonical_sha256":"dce56cd32570cf97930f73ce6a015b6c5c7756af8438d46c034b1ee023b0a336","source":{"kind":"arxiv","id":"2606.13126","version":1},"attestation_state":"computed","paper":{"title":"MiniPIC: Flexible Position-Independent Caching in <100LOC","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":["cs.AI","cs.CL"],"primary_cat":"cs.LG","authors_text":"Nathan Ordonez (1), Thomas Parnell (1) ((1) IBM Research)","submitted_at":"2026-06-11T09:51:36Z","abstract_excerpt":"Retrieval-augmented and agentic workloads repeatedly prefill recurring predictable structured inputs (which we call \"spans\") such as documents and code files. Yet, prefix caching in engines such as vLLM cannot reuse their KV entries unless they share identical prefixes with another request, while Position-Independent Caching (PIC) implementations within production-grade inference servers typically either require substantial server code changes or keep KV state outside the server, incurring host-to-device transfer overhead. We present Minimalistic PIC (MiniPIC): a minimal, flexible and fast vLL"},"verification_status":{"content_addressed":true,"pith_receipt":true,"author_attested":false,"weak_author_claims":0,"strong_author_claims":0,"externally_anchored":false,"storage_verified":false,"citation_signatures":0,"replication_records":0,"graph_snapshot":true,"references_resolved":false,"formal_links_present":false},"canonical_record":{"source":{"id":"2606.13126","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2026-06-11T09:51:36Z","cross_cats_sorted":["cs.AI","cs.CL"],"title_canon_sha256":"4077084500bf314a3709482b976e92b256b16feb1ac4f9b6b83e38f705428021","abstract_canon_sha256":"bb124ee50bc30f569b08d9cef628fd8cc2afc81a8c29bcf4c0be0b4f17d1d650"},"schema_version":"1.0"},"receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-06-12T01:09:41.672423Z","signature_b64":"xejIkQQvQSnEFDizE3YLYs1TL0zr66dpP/hIRh8wbyi+YbIXi0XR6nb/8j7Dy8O9DpcNN/eeIVRIl//0Df/IBQ==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"dce56cd32570cf97930f73ce6a015b6c5c7756af8438d46c034b1ee023b0a336","last_reissued_at":"2026-06-12T01:09:41.671621Z","signature_status":"signed_v1","first_computed_at":"2026-06-12T01:09:41.671621Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"graph_snapshot":{"paper":{"title":"MiniPIC: Flexible Position-Independent Caching in <100LOC","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":["cs.AI","cs.CL"],"primary_cat":"cs.LG","authors_text":"Nathan Ordonez (1), Thomas Parnell (1) ((1) IBM Research)","submitted_at":"2026-06-11T09:51:36Z","abstract_excerpt":"Retrieval-augmented and agentic workloads repeatedly prefill recurring predictable structured inputs (which we call \"spans\") such as documents and code files. Yet, prefix caching in engines such as vLLM cannot reuse their KV entries unless they share identical prefixes with another request, while Position-Independent Caching (PIC) implementations within production-grade inference servers typically either require substantial server code changes or keep KV state outside the server, incurring host-to-device transfer overhead. We present Minimalistic PIC (MiniPIC): a minimal, flexible and fast vLL"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.13126","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2606.13126/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"aliases":[{"alias_kind":"arxiv","alias_value":"2606.13126","created_at":"2026-06-12T01:09:41.671750+00:00"},{"alias_kind":"arxiv_version","alias_value":"2606.13126v1","created_at":"2026-06-12T01:09:41.671750+00:00"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.13126","created_at":"2026-06-12T01:09:41.671750+00:00"},{"alias_kind":"pith_short_12","alias_value":"3TSWZUZFODHZ","created_at":"2026-06-12T01:09:41.671750+00:00"},{"alias_kind":"pith_short_16","alias_value":"3TSWZUZFODHZPEYP","created_at":"2026-06-12T01:09:41.671750+00:00"},{"alias_kind":"pith_short_8","alias_value":"3TSWZUZF","created_at":"2026-06-12T01:09:41.671750+00:00"}],"events":[],"event_summary":{},"paper_claims":[],"inbound_citations":{"count":0,"internal_anchor_count":0,"sample":[]},"formal_canon":{"evidence_count":0,"sample":[],"anchors":[]},"links":{"html":"https://pith.science/pith/3TSWZUZFODHZPEYPOPHGUAK3NR","json":"https://pith.science/pith/3TSWZUZFODHZPEYPOPHGUAK3NR.json","graph_json":"https://pith.science/api/pith-number/3TSWZUZFODHZPEYPOPHGUAK3NR/graph.json","events_json":"https://pith.science/api/pith-number/3TSWZUZFODHZPEYPOPHGUAK3NR/events.json","paper":"https://pith.science/paper/3TSWZUZF"},"agent_actions":{"view_html":"https://pith.science/pith/3TSWZUZFODHZPEYPOPHGUAK3NR","download_json":"https://pith.science/pith/3TSWZUZFODHZPEYPOPHGUAK3NR.json","view_paper":"https://pith.science/paper/3TSWZUZF","resolve_alias":"https://pith.science/api/pith-number/resolve?arxiv=2606.13126&json=true","fetch_graph":"https://pith.science/api/pith-number/3TSWZUZFODHZPEYPOPHGUAK3NR/graph.json","fetch_events":"https://pith.science/api/pith-number/3TSWZUZFODHZPEYPOPHGUAK3NR/events.json","actions":{"anchor_timestamp":"https://pith.science/pith/3TSWZUZFODHZPEYPOPHGUAK3NR/action/timestamp_anchor","attest_storage":"https://pith.science/pith/3TSWZUZFODHZPEYPOPHGUAK3NR/action/storage_attestation","attest_author":"https://pith.science/pith/3TSWZUZFODHZPEYPOPHGUAK3NR/action/author_attestation","sign_citation":"https://pith.science/pith/3TSWZUZFODHZPEYPOPHGUAK3NR/action/citation_signature","submit_replication":"https://pith.science/pith/3TSWZUZFODHZPEYPOPHGUAK3NR/action/replication_record"}},"created_at":"2026-06-12T01:09:41.671750+00:00","updated_at":"2026-06-12T01:09:41.671750+00:00"}