{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2026:HMVWYJAQUTOFK55DGA2FAEPBHY","short_pith_number":"pith:HMVWYJAQ","canonical_record":{"source":{"id":"2604.13519","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2026-04-15T06:05:11Z","cross_cats_sorted":[],"title_canon_sha256":"2c6ec7183739b2bddb5024a79df32a78fcd014ad84a21dcd8ba7001d713652f5","abstract_canon_sha256":"7583a852c4ce65075affcfa8f9326141373c1cb82145c15065b021a4f373098e"},"schema_version":"1.0"},"canonical_sha256":"3b2b6c2410a4dc5577a330345011e13e0ce86ffec626c2749bc4f32707ff4856","source":{"kind":"arxiv","id":"2604.13519","version":2},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2604.13519","created_at":"2026-05-29T01:05:09Z"},{"alias_kind":"arxiv_version","alias_value":"2604.13519v2","created_at":"2026-05-29T01:05:09Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2604.13519","created_at":"2026-05-29T01:05:09Z"},{"alias_kind":"pith_short_12","alias_value":"HMVWYJAQUTOF","created_at":"2026-05-29T01:05:09Z"},{"alias_kind":"pith_short_16","alias_value":"HMVWYJAQUTOFK55D","created_at":"2026-05-29T01:05:09Z"},{"alias_kind":"pith_short_8","alias_value":"HMVWYJAQ","created_at":"2026-05-29T01:05:09Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2026:HMVWYJAQUTOFK55DGA2FAEPBHY","target":"record","payload":{"canonical_record":{"source":{"id":"2604.13519","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2026-04-15T06:05:11Z","cross_cats_sorted":[],"title_canon_sha256":"2c6ec7183739b2bddb5024a79df32a78fcd014ad84a21dcd8ba7001d713652f5","abstract_canon_sha256":"7583a852c4ce65075affcfa8f9326141373c1cb82145c15065b021a4f373098e"},"schema_version":"1.0"},"canonical_sha256":"3b2b6c2410a4dc5577a330345011e13e0ce86ffec626c2749bc4f32707ff4856","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-29T01:05:09.801690Z","signature_b64":"TBrTeMdDNUg1uxhF48x7rSN/VTugqHWK9H2SgAdZUphPxcfYmPY016om1yx0OjsLefKN23XUWpRpgoG16SISAg==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"3b2b6c2410a4dc5577a330345011e13e0ce86ffec626c2749bc4f32707ff4856","last_reissued_at":"2026-05-29T01:05:09.800715Z","signature_status":"signed_v1","first_computed_at":"2026-05-29T01:05:09.800715Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2604.13519","source_version":2,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-29T01:05:09Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"7FxvZwrguP/2tds2Qs2Qwy30RQGefjZ8GFInvtUmjCcW367hXRtioQDkXLrTZT1A0hg3alhZh/zQIsZUPTB0AA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-30T09:30:48.489889Z"},"content_sha256":"2df40d92da02139a41d5f4cc14356c67f1dc510ea551cb841ca66752298951c2","schema_version":"1.0","event_id":"sha256:2df40d92da02139a41d5f4cc14356c67f1dc510ea551cb841ca66752298951c2"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2026:HMVWYJAQUTOFK55DGA2FAEPBHY","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"ToolSpec: Accelerating Tool Calling via Schema-Aware and Retrieval-Augmented Speculative Decoding","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"ToolSpec accelerates LLM tool calling up to 4.2 times by using tool schemas and past calls for accurate speculative drafts.","cross_cats":[],"primary_cat":"cs.CL","authors_text":"Cunxiao Du, Heming Xia, Mingbo Song, Wenjie Li, Yongqi Li","submitted_at":"2026-04-15T06:05:11Z","abstract_excerpt":"Tool calling has greatly expanded the practical utility of large language models (LLMs) by enabling them to interact with external applications. As LLM capabilities advance, effective tool use increasingly involves multi-step, multi-turn interactions to solve complex tasks. However, the resulting growth in tool interactions incurs substantial latency, posing a key challenge for real-time LLM serving. Through empirical analysis, we find that tool-calling traces are highly structured, conform to constrained schemas, and often exhibit recurring invocation patterns. Motivated by this, we propose T"},"claims":{"count":4,"items":[{"kind":"strongest_claim","text":"ToolSpec achieves up to a 4.2x speedup, substantially outperforming existing training-free speculative decoding methods.","source":"verdict.strongest_claim","status":"machine_extracted","claim_id":"C1","attestation":"unclaimed"},{"kind":"weakest_assumption","text":"Tool-calling traces are highly structured, conform to constrained schemas, and often exhibit recurring invocation patterns that can be exploited for accurate draft generation.","source":"verdict.weakest_assumption","status":"machine_extracted","claim_id":"C2","attestation":"unclaimed"},{"kind":"one_line_summary","text":"ToolSpec accelerates LLM tool calling by up to 4.2x via schema-aware finite-state machine drafting and retrieval of similar past invocations.","source":"verdict.one_line_summary","status":"machine_extracted","claim_id":"C3","attestation":"unclaimed"},{"kind":"headline","text":"ToolSpec accelerates LLM tool calling up to 4.2 times by using tool schemas and past calls for accurate speculative drafts.","source":"verdict.pith_extraction.headline","status":"machine_extracted","claim_id":"C4","attestation":"unclaimed"}],"snapshot_sha256":"24add4ad1756d276843d6c93ec0be08f7b1f329f6480bbc9b3f6d533e9ff3bf1"},"source":{"id":"2604.13519","kind":"arxiv","version":2},"verdict":{"id":"b8ac1bf8-9d52-40d8-ad10-a2b3469d6d2f","model_set":{"reader":"grok-4.3"},"created_at":"2026-05-10T14:14:13.569618Z","strongest_claim":"ToolSpec achieves up to a 4.2x speedup, substantially outperforming existing training-free speculative decoding methods.","one_line_summary":"ToolSpec accelerates LLM tool calling by up to 4.2x via schema-aware finite-state machine drafting and retrieval of similar past invocations.","pipeline_version":"pith-pipeline@v0.9.0","weakest_assumption":"Tool-calling traces are highly structured, conform to constrained schemas, and often exhibit recurring invocation patterns that can be exploited for accurate draft generation.","pith_extraction_headline":"ToolSpec accelerates LLM tool calling up to 4.2 times by using tool schemas and past calls for accurate speculative drafts."},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2604.13519/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":"b8ac1bf8-9d52-40d8-ad10-a2b3469d6d2f"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-29T01:05:09Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"569m1jZaeWZsZQja3h35CtK55WcpuhRqqcCXvuYL6HuhgAllnJBZ9yEQIJ5WfKSPGbAixGom+VrWXiJbDWTQDA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-30T09:30:48.490343Z"},"content_sha256":"7cd9af7cb3c1c422d9d327de49e1b490ccb2b8c700a30d82f615a32272883d5f","schema_version":"1.0","event_id":"sha256:7cd9af7cb3c1c422d9d327de49e1b490ccb2b8c700a30d82f615a32272883d5f"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/HMVWYJAQUTOFK55DGA2FAEPBHY/bundle.json","state_url":"https://pith.science/pith/HMVWYJAQUTOFK55DGA2FAEPBHY/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/HMVWYJAQUTOFK55DGA2FAEPBHY/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-30T09:30:48Z","links":{"resolver":"https://pith.science/pith/HMVWYJAQUTOFK55DGA2FAEPBHY","bundle":"https://pith.science/pith/HMVWYJAQUTOFK55DGA2FAEPBHY/bundle.json","state":"https://pith.science/pith/HMVWYJAQUTOFK55DGA2FAEPBHY/state.json","well_known_bundle":"https://pith.science/.well-known/pith/HMVWYJAQUTOFK55DGA2FAEPBHY/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:HMVWYJAQUTOFK55DGA2FAEPBHY","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"7583a852c4ce65075affcfa8f9326141373c1cb82145c15065b021a4f373098e","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2026-04-15T06:05:11Z","title_canon_sha256":"2c6ec7183739b2bddb5024a79df32a78fcd014ad84a21dcd8ba7001d713652f5"},"schema_version":"1.0","source":{"id":"2604.13519","kind":"arxiv","version":2}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2604.13519","created_at":"2026-05-29T01:05:09Z"},{"alias_kind":"arxiv_version","alias_value":"2604.13519v2","created_at":"2026-05-29T01:05:09Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2604.13519","created_at":"2026-05-29T01:05:09Z"},{"alias_kind":"pith_short_12","alias_value":"HMVWYJAQUTOF","created_at":"2026-05-29T01:05:09Z"},{"alias_kind":"pith_short_16","alias_value":"HMVWYJAQUTOFK55D","created_at":"2026-05-29T01:05:09Z"},{"alias_kind":"pith_short_8","alias_value":"HMVWYJAQ","created_at":"2026-05-29T01:05:09Z"}],"graph_snapshots":[{"event_id":"sha256:7cd9af7cb3c1c422d9d327de49e1b490ccb2b8c700a30d82f615a32272883d5f","target":"graph","created_at":"2026-05-29T01:05:09Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":4,"items":[{"attestation":"unclaimed","claim_id":"C1","kind":"strongest_claim","source":"verdict.strongest_claim","status":"machine_extracted","text":"ToolSpec achieves up to a 4.2x speedup, substantially outperforming existing training-free speculative decoding methods."},{"attestation":"unclaimed","claim_id":"C2","kind":"weakest_assumption","source":"verdict.weakest_assumption","status":"machine_extracted","text":"Tool-calling traces are highly structured, conform to constrained schemas, and often exhibit recurring invocation patterns that can be exploited for accurate draft generation."},{"attestation":"unclaimed","claim_id":"C3","kind":"one_line_summary","source":"verdict.one_line_summary","status":"machine_extracted","text":"ToolSpec accelerates LLM tool calling by up to 4.2x via schema-aware finite-state machine drafting and retrieval of similar past invocations."},{"attestation":"unclaimed","claim_id":"C4","kind":"headline","source":"verdict.pith_extraction.headline","status":"machine_extracted","text":"ToolSpec accelerates LLM tool calling up to 4.2 times by using tool schemas and past calls for accurate speculative drafts."}],"snapshot_sha256":"24add4ad1756d276843d6c93ec0be08f7b1f329f6480bbc9b3f6d533e9ff3bf1"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2604.13519/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Tool calling has greatly expanded the practical utility of large language models (LLMs) by enabling them to interact with external applications. As LLM capabilities advance, effective tool use increasingly involves multi-step, multi-turn interactions to solve complex tasks. However, the resulting growth in tool interactions incurs substantial latency, posing a key challenge for real-time LLM serving. Through empirical analysis, we find that tool-calling traces are highly structured, conform to constrained schemas, and often exhibit recurring invocation patterns. Motivated by this, we propose T","authors_text":"Cunxiao Du, Heming Xia, Mingbo Song, Wenjie Li, Yongqi Li","cross_cats":[],"headline":"ToolSpec accelerates LLM tool calling up to 4.2 times by using tool schemas and past calls for accurate speculative drafts.","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2026-04-15T06:05:11Z","title":"ToolSpec: Accelerating Tool Calling via Schema-Aware and Retrieval-Augmented Speculative Decoding"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2604.13519","kind":"arxiv","version":2},"verdict":{"created_at":"2026-05-10T14:14:13.569618Z","id":"b8ac1bf8-9d52-40d8-ad10-a2b3469d6d2f","model_set":{"reader":"grok-4.3"},"one_line_summary":"ToolSpec accelerates LLM tool calling by up to 4.2x via schema-aware finite-state machine drafting and retrieval of similar past invocations.","pipeline_version":"pith-pipeline@v0.9.0","pith_extraction_headline":"ToolSpec accelerates LLM tool calling up to 4.2 times by using tool schemas and past calls for accurate speculative drafts.","strongest_claim":"ToolSpec achieves up to a 4.2x speedup, substantially outperforming existing training-free speculative decoding methods.","weakest_assumption":"Tool-calling traces are highly structured, conform to constrained schemas, and often exhibit recurring invocation patterns that can be exploited for accurate draft generation."}},"verdict_id":"b8ac1bf8-9d52-40d8-ad10-a2b3469d6d2f"}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:2df40d92da02139a41d5f4cc14356c67f1dc510ea551cb841ca66752298951c2","target":"record","created_at":"2026-05-29T01:05:09Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"7583a852c4ce65075affcfa8f9326141373c1cb82145c15065b021a4f373098e","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2026-04-15T06:05:11Z","title_canon_sha256":"2c6ec7183739b2bddb5024a79df32a78fcd014ad84a21dcd8ba7001d713652f5"},"schema_version":"1.0","source":{"id":"2604.13519","kind":"arxiv","version":2}},"canonical_sha256":"3b2b6c2410a4dc5577a330345011e13e0ce86ffec626c2749bc4f32707ff4856","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"3b2b6c2410a4dc5577a330345011e13e0ce86ffec626c2749bc4f32707ff4856","first_computed_at":"2026-05-29T01:05:09.800715Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-29T01:05:09.800715Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"TBrTeMdDNUg1uxhF48x7rSN/VTugqHWK9H2SgAdZUphPxcfYmPY016om1yx0OjsLefKN23XUWpRpgoG16SISAg==","signature_status":"signed_v1","signed_at":"2026-05-29T01:05:09.801690Z","signed_message":"canonical_sha256_bytes"},"source_id":"2604.13519","source_kind":"arxiv","source_version":2}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:2df40d92da02139a41d5f4cc14356c67f1dc510ea551cb841ca66752298951c2","sha256:7cd9af7cb3c1c422d9d327de49e1b490ccb2b8c700a30d82f615a32272883d5f"],"state_sha256":"be2b233e28470f497f9d4e2a9f84b9875fa22f2e83d58434a242650bafea6c17"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"jE2ZAHVzsnnE/1GRP31im4T6QMAxwqK49PjVsw56MWw3sdMGZ1oFULBG7wlO1IKRNEIvUUrK/ZSuRDjxl46yAA==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-30T09:30:48.492770Z","bundle_sha256":"384ed11b5c8df3ac0e3eddd1010c3b383022487801a19282f18159004abce777"}}