{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:FQBBRCMKCRXVCYF7TPZNQ7Y63C","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"f323f0d306229f5b20287c5c0015ea271036215dc99af197e509144c8b2daa08","cross_cats_sorted":["cs.AI"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2026-04-12T19:38:19Z","title_canon_sha256":"3f0f4dfa332fc874642ee8db1f05601013ee065ea51efc86a8f45f516bdcd645"},"schema_version":"1.0","source":{"id":"2604.10788","kind":"arxiv","version":2}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2604.10788","created_at":"2026-06-02T01:03:47Z"},{"alias_kind":"arxiv_version","alias_value":"2604.10788v2","created_at":"2026-06-02T01:03:47Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2604.10788","created_at":"2026-06-02T01:03:47Z"},{"alias_kind":"pith_short_12","alias_value":"FQBBRCMKCRXV","created_at":"2026-06-02T01:03:47Z"},{"alias_kind":"pith_short_16","alias_value":"FQBBRCMKCRXVCYF7","created_at":"2026-06-02T01:03:47Z"},{"alias_kind":"pith_short_8","alias_value":"FQBBRCMK","created_at":"2026-06-02T01:03:47Z"}],"graph_snapshots":[{"event_id":"sha256:b5a9d7614af2f2ead596fea4821c280c6eb296e547a1da93d499283737b3502a","target":"graph","created_at":"2026-06-02T01:03:47Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":4,"items":[{"attestation":"unclaimed","claim_id":"C1","kind":"strongest_claim","source":"verdict.strongest_claim","status":"machine_extracted","text":"Experiment results show that TInR-U achieves superior performance in both in-domain and out-of-domain settings, highlighting its effectiveness and efficiency."},{"attestation":"unclaimed","claim_id":"C2","kind":"weakest_assumption","source":"verdict.weakest_assumption","status":"machine_extracted","text":"That tool knowledge can be reliably internalized into LLM parameters through the described three-phase pipeline such that reasoning and tool use remain coordinated without external documentation at inference time."},{"attestation":"unclaimed","claim_id":"C3","kind":"one_line_summary","source":"verdict.one_line_summary","status":"machine_extracted","text":"TInR-U internalizes tool knowledge into LLMs via bidirectional alignment, supervised fine-tuning, and reinforcement learning, outperforming standard tool-integrated reasoning in both in-domain and out-of-domain evaluations."},{"attestation":"unclaimed","claim_id":"C4","kind":"headline","source":"verdict.pith_extraction.headline","status":"machine_extracted","text":"Internalizing tool knowledge into LLMs enables coordinated reasoning and tool use without external documentation at inference time."}],"snapshot_sha256":"38e95db467ff9d4842e77ebc584bf9ec9d066f43203631fc763368d03e385e71"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2604.10788/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Tool-Integrated Reasoning (TIR) has emerged as a promising direction by extending Large Language Models' (LLMs) capabilities with external tools during reasoning. Existing TIR methods typically rely on external tool documentation during reasoning. However, this leads to tool mastery difficulty, tool size constraints, and inference inefficiency. To mitigate these issues, we explore Tool-Internalized Reasoning (TInR), aiming at facilitating reasoning with tool knowledge internalized into LLMs. Achieving this goal presents notable requirements, including tool internalization and tool-reasoning co","authors_text":"Fan Liu, Hongru Wang, Min Yang, Qiancheng Xu, Wenjie Li, Yongqi Li","cross_cats":["cs.AI"],"headline":"Internalizing tool knowledge into LLMs enables coordinated reasoning and tool use without external documentation at inference time.","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2026-04-12T19:38:19Z","title":"TInR: Exploring Tool-Internalized Reasoning in Large Language Models"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2604.10788","kind":"arxiv","version":2},"verdict":{"created_at":"2026-05-10T15:11:26.086235Z","id":"3b8ba365-23d6-4758-b363-7b7284395d42","model_set":{"reader":"grok-4.3"},"one_line_summary":"TInR-U internalizes tool knowledge into LLMs via bidirectional alignment, supervised fine-tuning, and reinforcement learning, outperforming standard tool-integrated reasoning in both in-domain and out-of-domain evaluations.","pipeline_version":"pith-pipeline@v0.9.0","pith_extraction_headline":"Internalizing tool knowledge into LLMs enables coordinated reasoning and tool use without external documentation at inference time.","strongest_claim":"Experiment results show that TInR-U achieves superior performance in both in-domain and out-of-domain settings, highlighting its effectiveness and efficiency.","weakest_assumption":"That tool knowledge can be reliably internalized into LLM parameters through the described three-phase pipeline such that reasoning and tool use remain coordinated without external documentation at inference time."}},"verdict_id":"3b8ba365-23d6-4758-b363-7b7284395d42"}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:9fe15837214bd525750b980ae1f7d461b7c1d314da67ab292017f06eb50e576e","target":"record","created_at":"2026-06-02T01:03:47Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"f323f0d306229f5b20287c5c0015ea271036215dc99af197e509144c8b2daa08","cross_cats_sorted":["cs.AI"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2026-04-12T19:38:19Z","title_canon_sha256":"3f0f4dfa332fc874642ee8db1f05601013ee065ea51efc86a8f45f516bdcd645"},"schema_version":"1.0","source":{"id":"2604.10788","kind":"arxiv","version":2}},"canonical_sha256":"2c0218898a146f5160bf9bf2d87f1ed883c05e106f236ca3900a5cb0c2772316","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"2c0218898a146f5160bf9bf2d87f1ed883c05e106f236ca3900a5cb0c2772316","first_computed_at":"2026-06-02T01:03:47.029686Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-06-02T01:03:47.029686Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"3UUGszrNQXcM3LtLcVMD0T/H2tFelFzduvHE93xM36KiPGiOmVuVgEqdJuuT3b6etvaa2RuHVka467ILJxO7Dw==","signature_status":"signed_v1","signed_at":"2026-06-02T01:03:47.030258Z","signed_message":"canonical_sha256_bytes"},"source_id":"2604.10788","source_kind":"arxiv","source_version":2}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:9fe15837214bd525750b980ae1f7d461b7c1d314da67ab292017f06eb50e576e","sha256:b5a9d7614af2f2ead596fea4821c280c6eb296e547a1da93d499283737b3502a"],"state_sha256":"a42aa5c07f1683cf9f5f17d098f7117561088a1f161ee3f51b8b3e24aeac63b4"}