{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2026:SIM6TG3OBTWZ7JCSRYREGR24C3","short_pith_number":"pith:SIM6TG3O","canonical_record":{"source":{"id":"2605.07243","kind":"arxiv","version":2},"metadata":{"license":"http://creativecommons.org/licenses/by-sa/4.0/","primary_cat":"cs.CL","submitted_at":"2026-05-08T04:59:48Z","cross_cats_sorted":[],"title_canon_sha256":"5bff5a50ecbee5f77c9aecdd5baf193b926eb9723deb9830a2e24616d150909b","abstract_canon_sha256":"26629a6a38f26d2cec8f5bc8d534060fe4fdc55871d7b9049aff8f3a1f22fc8d"},"schema_version":"1.0"},"canonical_sha256":"9219e99b6e0ced9fa4528e2243475c16c2e450882845b14915eb57663c1e3550","source":{"kind":"arxiv","id":"2605.07243","version":2},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2605.07243","created_at":"2026-05-22T02:04:42Z"},{"alias_kind":"arxiv_version","alias_value":"2605.07243v2","created_at":"2026-05-22T02:04:42Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.07243","created_at":"2026-05-22T02:04:42Z"},{"alias_kind":"pith_short_12","alias_value":"SIM6TG3OBTWZ","created_at":"2026-05-22T02:04:42Z"},{"alias_kind":"pith_short_16","alias_value":"SIM6TG3OBTWZ7JCS","created_at":"2026-05-22T02:04:42Z"},{"alias_kind":"pith_short_8","alias_value":"SIM6TG3O","created_at":"2026-05-22T02:04:42Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2026:SIM6TG3OBTWZ7JCSRYREGR24C3","target":"record","payload":{"canonical_record":{"source":{"id":"2605.07243","kind":"arxiv","version":2},"metadata":{"license":"http://creativecommons.org/licenses/by-sa/4.0/","primary_cat":"cs.CL","submitted_at":"2026-05-08T04:59:48Z","cross_cats_sorted":[],"title_canon_sha256":"5bff5a50ecbee5f77c9aecdd5baf193b926eb9723deb9830a2e24616d150909b","abstract_canon_sha256":"26629a6a38f26d2cec8f5bc8d534060fe4fdc55871d7b9049aff8f3a1f22fc8d"},"schema_version":"1.0"},"canonical_sha256":"9219e99b6e0ced9fa4528e2243475c16c2e450882845b14915eb57663c1e3550","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-22T02:04:42.061224Z","signature_b64":"qo4637x+zN2uJmv05pM5mTpifr1UMjSOJry0C0YbR/RXNSnjmG1s57X/QrmcfAMyP0MtCgtuA0Imash3CoD8BA==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"9219e99b6e0ced9fa4528e2243475c16c2e450882845b14915eb57663c1e3550","last_reissued_at":"2026-05-22T02:04:42.060356Z","signature_status":"signed_v1","first_computed_at":"2026-05-22T02:04:42.060356Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2605.07243","source_version":2,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-22T02:04:42Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"cdoklXD+O8Lns/nFrm1lrJTkANi2D/4bQVdPNXkA1o+1KuwJKqrc7XU/AxdtycEiA1c19yvRLgWIJpptcCneAQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-25T15:45:58.874581Z"},"content_sha256":"80475c2226e4aba9b1707cc9668e3deb5bb06760205a7957d85465b3b99175e0","schema_version":"1.0","event_id":"sha256:80475c2226e4aba9b1707cc9668e3deb5bb06760205a7957d85465b3b99175e0"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2026:SIM6TG3OBTWZ7JCSRYREGR24C3","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"SpecBlock: Block-Iterative Speculative Decoding with Dynamic Tree Drafting","license":"http://creativecommons.org/licenses/by-sa/4.0/","headline":"SpecBlock accelerates LLM inference by generating blocks of dependent tokens iteratively with hidden-state inheritance and dynamic branching.","cross_cats":[],"primary_cat":"cs.CL","authors_text":"Fan Deng, Hao Chen, Jiajie Xu, Jian Yang, Jiarun Liu, Jia Zhu, Qiang Xu, Weijie Shi, Xiangjun Huang, Xiaofang Zhou, Yaguang Wu, Yehong Xu","submitted_at":"2026-05-08T04:59:48Z","abstract_excerpt":"Speculative decoding accelerates LLM inference by drafting a tree of candidate continuations and verifying it in one target forward. Existing drafters fall into two camps with opposite weaknesses. Autoregressive drafters such as EAGLE-3 preserve dependence along each draft path but call the drafter once per tree depth, making drafting a non-trivial share of per-iteration latency. Parallel drafters cut drafter calls by predicting multiple future positions in one forward, but each position is predicted without seeing the others, producing paths the verifier rejects. In this paper, we propose Spe"},"claims":{"count":4,"items":[{"kind":"strongest_claim","text":"Experiments show that SpecBlock improves mean speedup by 8-13% over EAGLE-3 at 44-52% of its drafting cost, and cost-aware adaptation extends this lead to 11-19%.","source":"verdict.strongest_claim","status":"machine_extracted","claim_id":"C1","attestation":"unclaimed"},{"kind":"weakest_assumption","text":"That the layer-wise hidden-state shift within blocks and selective inheritance across blocks will preserve sufficient path dependence to keep acceptance rates high enough to offset the added mechanisms, without the rank head or mask introducing new training-inference mismatches.","source":"verdict.weakest_assumption","status":"machine_extracted","claim_id":"C2","attestation":"unclaimed"},{"kind":"one_line_summary","text":"SpecBlock achieves 8-19% higher speedup than EAGLE-3 in LLM speculative decoding by using repeated block expansions with hidden-state inheritance, a dynamic rank head, and a valid-prefix training mask.","source":"verdict.one_line_summary","status":"machine_extracted","claim_id":"C3","attestation":"unclaimed"},{"kind":"headline","text":"SpecBlock accelerates LLM inference by generating blocks of dependent tokens iteratively with hidden-state inheritance and dynamic branching.","source":"verdict.pith_extraction.headline","status":"machine_extracted","claim_id":"C4","attestation":"unclaimed"}],"snapshot_sha256":"de7a9d70a60ab86e00eb21d075281d0bea9920f632741c66bc1fff86a60aeaf6"},"source":{"id":"2605.07243","kind":"arxiv","version":2},"verdict":{"id":"3183e005-1106-415d-a51d-23b2020379bc","model_set":{"reader":"grok-4.3"},"created_at":"2026-05-11T02:24:01.144351Z","strongest_claim":"Experiments show that SpecBlock improves mean speedup by 8-13% over EAGLE-3 at 44-52% of its drafting cost, and cost-aware adaptation extends this lead to 11-19%.","one_line_summary":"SpecBlock achieves 8-19% higher speedup than EAGLE-3 in LLM speculative decoding by using repeated block expansions with hidden-state inheritance, a dynamic rank head, and a valid-prefix training mask.","pipeline_version":"pith-pipeline@v0.9.0","weakest_assumption":"That the layer-wise hidden-state shift within blocks and selective inheritance across blocks will preserve sufficient path dependence to keep acceptance rates high enough to offset the added mechanisms, without the rank head or mask introducing new training-inference mismatches.","pith_extraction_headline":"SpecBlock accelerates LLM inference by generating blocks of dependent tokens iteratively with hidden-state inheritance and dynamic branching."},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2605.07243/integrity.json","findings":[],"available":true,"detectors_run":[{"name":"claim_evidence","ran_at":"2026-05-20T11:22:03.274502Z","status":"completed","version":"1.0.0","findings_count":0},{"name":"ai_meta_artifact","ran_at":"2026-05-20T06:34:29.468482Z","status":"completed","version":"1.0.0","findings_count":0},{"name":"doi_title_agreement","ran_at":"2026-05-19T17:01:19.371021Z","status":"completed","version":"1.0.0","findings_count":0},{"name":"doi_compliance","ran_at":"2026-05-19T12:00:20.327047Z","status":"completed","version":"1.0.0","findings_count":0}],"snapshot_sha256":"da1c36f4dbdc57cfa08933f7e0b62bffb78336e9cdaf23c72bb58f9804e5ebdf"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":2,"snapshot_sha256":"4cfdf25e9ee7ee168c07404f17de3d43d46f90488f4a4dd327381345bab290af"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":"3183e005-1106-415d-a51d-23b2020379bc"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-22T02:04:42Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"PlpPEUoBRERe48n49IGPIgaiIItSxTC1H4BKTc5Xn5gEHq03PJLveZHo7+alNUNvpODro0D9Ma+ka0hlbv/uBQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-25T15:45:58.875585Z"},"content_sha256":"c4e5caa7616c888dd39ab8cafeacc5e69cc50789d2e800186878abc35c169ff1","schema_version":"1.0","event_id":"sha256:c4e5caa7616c888dd39ab8cafeacc5e69cc50789d2e800186878abc35c169ff1"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/SIM6TG3OBTWZ7JCSRYREGR24C3/bundle.json","state_url":"https://pith.science/pith/SIM6TG3OBTWZ7JCSRYREGR24C3/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/SIM6TG3OBTWZ7JCSRYREGR24C3/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-25T15:45:58Z","links":{"resolver":"https://pith.science/pith/SIM6TG3OBTWZ7JCSRYREGR24C3","bundle":"https://pith.science/pith/SIM6TG3OBTWZ7JCSRYREGR24C3/bundle.json","state":"https://pith.science/pith/SIM6TG3OBTWZ7JCSRYREGR24C3/state.json","well_known_bundle":"https://pith.science/.well-known/pith/SIM6TG3OBTWZ7JCSRYREGR24C3/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:SIM6TG3OBTWZ7JCSRYREGR24C3","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"26629a6a38f26d2cec8f5bc8d534060fe4fdc55871d7b9049aff8f3a1f22fc8d","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by-sa/4.0/","primary_cat":"cs.CL","submitted_at":"2026-05-08T04:59:48Z","title_canon_sha256":"5bff5a50ecbee5f77c9aecdd5baf193b926eb9723deb9830a2e24616d150909b"},"schema_version":"1.0","source":{"id":"2605.07243","kind":"arxiv","version":2}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2605.07243","created_at":"2026-05-22T02:04:42Z"},{"alias_kind":"arxiv_version","alias_value":"2605.07243v2","created_at":"2026-05-22T02:04:42Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.07243","created_at":"2026-05-22T02:04:42Z"},{"alias_kind":"pith_short_12","alias_value":"SIM6TG3OBTWZ","created_at":"2026-05-22T02:04:42Z"},{"alias_kind":"pith_short_16","alias_value":"SIM6TG3OBTWZ7JCS","created_at":"2026-05-22T02:04:42Z"},{"alias_kind":"pith_short_8","alias_value":"SIM6TG3O","created_at":"2026-05-22T02:04:42Z"}],"graph_snapshots":[{"event_id":"sha256:c4e5caa7616c888dd39ab8cafeacc5e69cc50789d2e800186878abc35c169ff1","target":"graph","created_at":"2026-05-22T02:04:42Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":4,"items":[{"attestation":"unclaimed","claim_id":"C1","kind":"strongest_claim","source":"verdict.strongest_claim","status":"machine_extracted","text":"Experiments show that SpecBlock improves mean speedup by 8-13% over EAGLE-3 at 44-52% of its drafting cost, and cost-aware adaptation extends this lead to 11-19%."},{"attestation":"unclaimed","claim_id":"C2","kind":"weakest_assumption","source":"verdict.weakest_assumption","status":"machine_extracted","text":"That the layer-wise hidden-state shift within blocks and selective inheritance across blocks will preserve sufficient path dependence to keep acceptance rates high enough to offset the added mechanisms, without the rank head or mask introducing new training-inference mismatches."},{"attestation":"unclaimed","claim_id":"C3","kind":"one_line_summary","source":"verdict.one_line_summary","status":"machine_extracted","text":"SpecBlock achieves 8-19% higher speedup than EAGLE-3 in LLM speculative decoding by using repeated block expansions with hidden-state inheritance, a dynamic rank head, and a valid-prefix training mask."},{"attestation":"unclaimed","claim_id":"C4","kind":"headline","source":"verdict.pith_extraction.headline","status":"machine_extracted","text":"SpecBlock accelerates LLM inference by generating blocks of dependent tokens iteratively with hidden-state inheritance and dynamic branching."}],"snapshot_sha256":"de7a9d70a60ab86e00eb21d075281d0bea9920f632741c66bc1fff86a60aeaf6"},"formal_canon":{"evidence_count":2,"snapshot_sha256":"4cfdf25e9ee7ee168c07404f17de3d43d46f90488f4a4dd327381345bab290af"},"integrity":{"available":true,"clean":true,"detectors_run":[{"findings_count":0,"name":"claim_evidence","ran_at":"2026-05-20T11:22:03.274502Z","status":"completed","version":"1.0.0"},{"findings_count":0,"name":"ai_meta_artifact","ran_at":"2026-05-20T06:34:29.468482Z","status":"completed","version":"1.0.0"},{"findings_count":0,"name":"doi_title_agreement","ran_at":"2026-05-19T17:01:19.371021Z","status":"completed","version":"1.0.0"},{"findings_count":0,"name":"doi_compliance","ran_at":"2026-05-19T12:00:20.327047Z","status":"completed","version":"1.0.0"}],"endpoint":"/pith/2605.07243/integrity.json","findings":[],"snapshot_sha256":"da1c36f4dbdc57cfa08933f7e0b62bffb78336e9cdaf23c72bb58f9804e5ebdf","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Speculative decoding accelerates LLM inference by drafting a tree of candidate continuations and verifying it in one target forward. Existing drafters fall into two camps with opposite weaknesses. Autoregressive drafters such as EAGLE-3 preserve dependence along each draft path but call the drafter once per tree depth, making drafting a non-trivial share of per-iteration latency. Parallel drafters cut drafter calls by predicting multiple future positions in one forward, but each position is predicted without seeing the others, producing paths the verifier rejects. In this paper, we propose Spe","authors_text":"Fan Deng, Hao Chen, Jiajie Xu, Jian Yang, Jiarun Liu, Jia Zhu, Qiang Xu, Weijie Shi, Xiangjun Huang, Xiaofang Zhou, Yaguang Wu, Yehong Xu","cross_cats":[],"headline":"SpecBlock accelerates LLM inference by generating blocks of dependent tokens iteratively with hidden-state inheritance and dynamic branching.","license":"http://creativecommons.org/licenses/by-sa/4.0/","primary_cat":"cs.CL","submitted_at":"2026-05-08T04:59:48Z","title":"SpecBlock: Block-Iterative Speculative Decoding with Dynamic Tree Drafting"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2605.07243","kind":"arxiv","version":2},"verdict":{"created_at":"2026-05-11T02:24:01.144351Z","id":"3183e005-1106-415d-a51d-23b2020379bc","model_set":{"reader":"grok-4.3"},"one_line_summary":"SpecBlock achieves 8-19% higher speedup than EAGLE-3 in LLM speculative decoding by using repeated block expansions with hidden-state inheritance, a dynamic rank head, and a valid-prefix training mask.","pipeline_version":"pith-pipeline@v0.9.0","pith_extraction_headline":"SpecBlock accelerates LLM inference by generating blocks of dependent tokens iteratively with hidden-state inheritance and dynamic branching.","strongest_claim":"Experiments show that SpecBlock improves mean speedup by 8-13% over EAGLE-3 at 44-52% of its drafting cost, and cost-aware adaptation extends this lead to 11-19%.","weakest_assumption":"That the layer-wise hidden-state shift within blocks and selective inheritance across blocks will preserve sufficient path dependence to keep acceptance rates high enough to offset the added mechanisms, without the rank head or mask introducing new training-inference mismatches."}},"verdict_id":"3183e005-1106-415d-a51d-23b2020379bc"}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:80475c2226e4aba9b1707cc9668e3deb5bb06760205a7957d85465b3b99175e0","target":"record","created_at":"2026-05-22T02:04:42Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"26629a6a38f26d2cec8f5bc8d534060fe4fdc55871d7b9049aff8f3a1f22fc8d","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by-sa/4.0/","primary_cat":"cs.CL","submitted_at":"2026-05-08T04:59:48Z","title_canon_sha256":"5bff5a50ecbee5f77c9aecdd5baf193b926eb9723deb9830a2e24616d150909b"},"schema_version":"1.0","source":{"id":"2605.07243","kind":"arxiv","version":2}},"canonical_sha256":"9219e99b6e0ced9fa4528e2243475c16c2e450882845b14915eb57663c1e3550","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"9219e99b6e0ced9fa4528e2243475c16c2e450882845b14915eb57663c1e3550","first_computed_at":"2026-05-22T02:04:42.060356Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-22T02:04:42.060356Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"qo4637x+zN2uJmv05pM5mTpifr1UMjSOJry0C0YbR/RXNSnjmG1s57X/QrmcfAMyP0MtCgtuA0Imash3CoD8BA==","signature_status":"signed_v1","signed_at":"2026-05-22T02:04:42.061224Z","signed_message":"canonical_sha256_bytes"},"source_id":"2605.07243","source_kind":"arxiv","source_version":2}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:80475c2226e4aba9b1707cc9668e3deb5bb06760205a7957d85465b3b99175e0","sha256:c4e5caa7616c888dd39ab8cafeacc5e69cc50789d2e800186878abc35c169ff1"],"state_sha256":"c78feb867378219d2b2082c7639128225fdcfe6866e2c6261159d11943981d21"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"jte8zJOAbY0P5ySpIs9OCGT/OoGa7DCWBeSjwYrliJqSLc4cpNOKrYxYBjBXLAqGEw4ETovwb2aMsG5NLoeMCA==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-25T15:45:58.880143Z","bundle_sha256":"3b88c2ee49d508f6d044e1a1a61a88101953a4bb42b65fbb8116c39e6af6df86"}}