{"record_type":"pith_number_record","schema_url":"https://pith.science/schemas/pith-number/v1.json","pith_number":"pith:2026:N46WSXLFR2PLTKFA3CZ7PY6GN3","short_pith_number":"pith:N46WSXLF","schema_version":"1.0","canonical_sha256":"6f3d695d658e9eb9a8a0d8b3f7e3c66ec2617046d2841305622e6eb9becfdac6","source":{"kind":"arxiv","id":"2605.18500","version":1},"attestation_state":"computed","paper":{"title":"Implicit Hierarchical GRPO: Decoupling Tool Invocation from Execution for Tool-Integrated Mathematical Reasoning","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.CL","authors_text":"Guojun Yin, Jiajun Chai, Jinyang Wu, Li Wang, Wei Lin, Xiaodong Lu, Xiaohan Wang, Zipeng Zhang","submitted_at":"2026-05-18T14:54:49Z","abstract_excerpt":"Large language models (LLMs) have increasingly leveraged tool invocation to enhance their reasoning capabilities. However, existing approaches typically tightly couple tool invocation with immediate execution. Such immediate tool interaction may disrupt the reasoning coherence of LLMs and constrain their expressivity, ultimately degrading reasoning performance. To this end, for the first time, we propose and formalize the problem of decoupling tool invocation from execution during reasoning, and introduce delayed execution with explicit control to enhance tool-integrated reasoning (TIR). Furth"},"verification_status":{"content_addressed":true,"pith_receipt":true,"author_attested":false,"weak_author_claims":0,"strong_author_claims":0,"externally_anchored":false,"storage_verified":false,"citation_signatures":0,"replication_records":0,"graph_snapshot":true,"references_resolved":false,"formal_links_present":false},"canonical_record":{"source":{"id":"2605.18500","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2026-05-18T14:54:49Z","cross_cats_sorted":[],"title_canon_sha256":"9bfcaa672763e2bf0b2bbc8401db6a73efa6f4abf089c471b97422afbc1fb1c0","abstract_canon_sha256":"cba08a12d18c6a127260783ad91733dce75af22ca3e578a04164aaf88f80f814"},"schema_version":"1.0"},"receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-20T00:06:04.446059Z","signature_b64":"Az7uwshtEJrcIcKfqKphi6x/sJJ/o0Yd0s6C1+Q4c7HlcMtyKAln/7PbA8GAIJS0r9kOrv5Vf2lObTanND9BCw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"6f3d695d658e9eb9a8a0d8b3f7e3c66ec2617046d2841305622e6eb9becfdac6","last_reissued_at":"2026-05-20T00:06:04.445282Z","signature_status":"signed_v1","first_computed_at":"2026-05-20T00:06:04.445282Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"graph_snapshot":{"paper":{"title":"Implicit Hierarchical GRPO: Decoupling Tool Invocation from Execution for Tool-Integrated Mathematical Reasoning","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.CL","authors_text":"Guojun Yin, Jiajun Chai, Jinyang Wu, Li Wang, Wei Lin, Xiaodong Lu, Xiaohan Wang, Zipeng Zhang","submitted_at":"2026-05-18T14:54:49Z","abstract_excerpt":"Large language models (LLMs) have increasingly leveraged tool invocation to enhance their reasoning capabilities. However, existing approaches typically tightly couple tool invocation with immediate execution. Such immediate tool interaction may disrupt the reasoning coherence of LLMs and constrain their expressivity, ultimately degrading reasoning performance. To this end, for the first time, we propose and formalize the problem of decoupling tool invocation from execution during reasoning, and introduce delayed execution with explicit control to enhance tool-integrated reasoning (TIR). Furth"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2605.18500","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2605.18500/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"aliases":[{"alias_kind":"arxiv","alias_value":"2605.18500","created_at":"2026-05-20T00:06:04.445401+00:00"},{"alias_kind":"arxiv_version","alias_value":"2605.18500v1","created_at":"2026-05-20T00:06:04.445401+00:00"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.18500","created_at":"2026-05-20T00:06:04.445401+00:00"},{"alias_kind":"pith_short_12","alias_value":"N46WSXLFR2PL","created_at":"2026-05-20T00:06:04.445401+00:00"},{"alias_kind":"pith_short_16","alias_value":"N46WSXLFR2PLTKFA","created_at":"2026-05-20T00:06:04.445401+00:00"},{"alias_kind":"pith_short_8","alias_value":"N46WSXLF","created_at":"2026-05-20T00:06:04.445401+00:00"}],"events":[],"event_summary":{},"paper_claims":[],"inbound_citations":{"count":0,"internal_anchor_count":0,"sample":[]},"formal_canon":{"evidence_count":0,"sample":[],"anchors":[]},"links":{"html":"https://pith.science/pith/N46WSXLFR2PLTKFA3CZ7PY6GN3","json":"https://pith.science/pith/N46WSXLFR2PLTKFA3CZ7PY6GN3.json","graph_json":"https://pith.science/api/pith-number/N46WSXLFR2PLTKFA3CZ7PY6GN3/graph.json","events_json":"https://pith.science/api/pith-number/N46WSXLFR2PLTKFA3CZ7PY6GN3/events.json","paper":"https://pith.science/paper/N46WSXLF"},"agent_actions":{"view_html":"https://pith.science/pith/N46WSXLFR2PLTKFA3CZ7PY6GN3","download_json":"https://pith.science/pith/N46WSXLFR2PLTKFA3CZ7PY6GN3.json","view_paper":"https://pith.science/paper/N46WSXLF","resolve_alias":"https://pith.science/api/pith-number/resolve?arxiv=2605.18500&json=true","fetch_graph":"https://pith.science/api/pith-number/N46WSXLFR2PLTKFA3CZ7PY6GN3/graph.json","fetch_events":"https://pith.science/api/pith-number/N46WSXLFR2PLTKFA3CZ7PY6GN3/events.json","actions":{"anchor_timestamp":"https://pith.science/pith/N46WSXLFR2PLTKFA3CZ7PY6GN3/action/timestamp_anchor","attest_storage":"https://pith.science/pith/N46WSXLFR2PLTKFA3CZ7PY6GN3/action/storage_attestation","attest_author":"https://pith.science/pith/N46WSXLFR2PLTKFA3CZ7PY6GN3/action/author_attestation","sign_citation":"https://pith.science/pith/N46WSXLFR2PLTKFA3CZ7PY6GN3/action/citation_signature","submit_replication":"https://pith.science/pith/N46WSXLFR2PLTKFA3CZ7PY6GN3/action/replication_record"}},"created_at":"2026-05-20T00:06:04.445401+00:00","updated_at":"2026-05-20T00:06:04.445401+00:00"}