{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2026:HXZE5YRMHKYHWOVZYE7THI2DU2","short_pith_number":"pith:HXZE5YRM","canonical_record":{"source":{"id":"2606.00096","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by-sa/4.0/","primary_cat":"cs.CV","submitted_at":"2026-05-25T13:06:59Z","cross_cats_sorted":["cs.AI"],"title_canon_sha256":"c2f6726818e61b318cf3644e01e47ee43bf39a3bdc2f381085bc90eefed6708f","abstract_canon_sha256":"7402d63716d1c7978ba71f6549ff919e10af1d9a5d7c9d20e2facac052a9fac6"},"schema_version":"1.0"},"canonical_sha256":"3df24ee22c3ab07b3ab9c13f33a343a6bfb453d2bacd141fd3afd1e207fa1c87","source":{"kind":"arxiv","id":"2606.00096","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.00096","created_at":"2026-06-02T00:03:14Z"},{"alias_kind":"arxiv_version","alias_value":"2606.00096v1","created_at":"2026-06-02T00:03:14Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.00096","created_at":"2026-06-02T00:03:14Z"},{"alias_kind":"pith_short_12","alias_value":"HXZE5YRMHKYH","created_at":"2026-06-02T00:03:14Z"},{"alias_kind":"pith_short_16","alias_value":"HXZE5YRMHKYHWOVZ","created_at":"2026-06-02T00:03:14Z"},{"alias_kind":"pith_short_8","alias_value":"HXZE5YRM","created_at":"2026-06-02T00:03:14Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2026:HXZE5YRMHKYHWOVZYE7THI2DU2","target":"record","payload":{"canonical_record":{"source":{"id":"2606.00096","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by-sa/4.0/","primary_cat":"cs.CV","submitted_at":"2026-05-25T13:06:59Z","cross_cats_sorted":["cs.AI"],"title_canon_sha256":"c2f6726818e61b318cf3644e01e47ee43bf39a3bdc2f381085bc90eefed6708f","abstract_canon_sha256":"7402d63716d1c7978ba71f6549ff919e10af1d9a5d7c9d20e2facac052a9fac6"},"schema_version":"1.0"},"canonical_sha256":"3df24ee22c3ab07b3ab9c13f33a343a6bfb453d2bacd141fd3afd1e207fa1c87","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-06-02T00:03:14.877897Z","signature_b64":"rkfOrnAetGfd/MuJIst4SdDz7a78aCMqgdpHV54YMBWSFLfTCnXEyLUExYrv+UYyc1vcdP+y4G7w6XnvSW1KBw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"3df24ee22c3ab07b3ab9c13f33a343a6bfb453d2bacd141fd3afd1e207fa1c87","last_reissued_at":"2026-06-02T00:03:14.877344Z","signature_status":"signed_v1","first_computed_at":"2026-06-02T00:03:14.877344Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2606.00096","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-06-02T00:03:14Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"npDDP1NK9h6Wfm+vBSKaayahlcy6gjvzS5GlxdMHMLR1kL8OjA+VWhzcHwDbwEDsRynoipYe25qgxUaOrr48Aw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-04T07:09:47.960795Z"},"content_sha256":"40319fed3cab9e9ecdfedfd9826bf7325f94f664f3255b4263d723f37d9c1533","schema_version":"1.0","event_id":"sha256:40319fed3cab9e9ecdfedfd9826bf7325f94f664f3255b4263d723f37d9c1533"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2026:HXZE5YRMHKYHWOVZYE7THI2DU2","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Diversity Over Frequency: Rethinking Tool Use in Visual Chain-of-Thought Agents","license":"http://creativecommons.org/licenses/by-sa/4.0/","headline":"","cross_cats":["cs.AI"],"primary_cat":"cs.CV","authors_text":"Dong-Hee Kim, Donghyun Kim, Reuben Tan","submitted_at":"2026-05-25T13:06:59Z","abstract_excerpt":"Visual agents employ external visual tools within visual chains of thought to incorporate fine-grained evidence. While prior work has mainly studied these tools in visual search tasks, their role in more complex visual reasoning remains underexplored. In this paper, we move beyond simple visual search tasks to investigate more challenging tasks, including 3D spatial reasoning and medical visual question answering, where agents must integrate tool-acquired local evidence with the global context.\n  We identify a {tool-use collapse phenomenon: models progressively stop using tools while still ach"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.00096","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2606.00096/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-06-02T00:03:14Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"P4RtOSz8FxsJ+dviW8W4WIpYdooW+7Rb104Fmw+1T5srCKRS27AtTdbMRyVMK0/pPmXqnStNKnAjv+y2j949AQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-04T07:09:47.961192Z"},"content_sha256":"cdbb386de254823f27a4fbd5ca90ef3e48a5b1a0389181bbaa6082d16886155d","schema_version":"1.0","event_id":"sha256:cdbb386de254823f27a4fbd5ca90ef3e48a5b1a0389181bbaa6082d16886155d"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/HXZE5YRMHKYHWOVZYE7THI2DU2/bundle.json","state_url":"https://pith.science/pith/HXZE5YRMHKYHWOVZYE7THI2DU2/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/HXZE5YRMHKYHWOVZYE7THI2DU2/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-04T07:09:47Z","links":{"resolver":"https://pith.science/pith/HXZE5YRMHKYHWOVZYE7THI2DU2","bundle":"https://pith.science/pith/HXZE5YRMHKYHWOVZYE7THI2DU2/bundle.json","state":"https://pith.science/pith/HXZE5YRMHKYHWOVZYE7THI2DU2/state.json","well_known_bundle":"https://pith.science/.well-known/pith/HXZE5YRMHKYHWOVZYE7THI2DU2/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:HXZE5YRMHKYHWOVZYE7THI2DU2","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"7402d63716d1c7978ba71f6549ff919e10af1d9a5d7c9d20e2facac052a9fac6","cross_cats_sorted":["cs.AI"],"license":"http://creativecommons.org/licenses/by-sa/4.0/","primary_cat":"cs.CV","submitted_at":"2026-05-25T13:06:59Z","title_canon_sha256":"c2f6726818e61b318cf3644e01e47ee43bf39a3bdc2f381085bc90eefed6708f"},"schema_version":"1.0","source":{"id":"2606.00096","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.00096","created_at":"2026-06-02T00:03:14Z"},{"alias_kind":"arxiv_version","alias_value":"2606.00096v1","created_at":"2026-06-02T00:03:14Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.00096","created_at":"2026-06-02T00:03:14Z"},{"alias_kind":"pith_short_12","alias_value":"HXZE5YRMHKYH","created_at":"2026-06-02T00:03:14Z"},{"alias_kind":"pith_short_16","alias_value":"HXZE5YRMHKYHWOVZ","created_at":"2026-06-02T00:03:14Z"},{"alias_kind":"pith_short_8","alias_value":"HXZE5YRM","created_at":"2026-06-02T00:03:14Z"}],"graph_snapshots":[{"event_id":"sha256:cdbb386de254823f27a4fbd5ca90ef3e48a5b1a0389181bbaa6082d16886155d","target":"graph","created_at":"2026-06-02T00:03:14Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2606.00096/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Visual agents employ external visual tools within visual chains of thought to incorporate fine-grained evidence. While prior work has mainly studied these tools in visual search tasks, their role in more complex visual reasoning remains underexplored. In this paper, we move beyond simple visual search tasks to investigate more challenging tasks, including 3D spatial reasoning and medical visual question answering, where agents must integrate tool-acquired local evidence with the global context.\n  We identify a {tool-use collapse phenomenon: models progressively stop using tools while still ach","authors_text":"Dong-Hee Kim, Donghyun Kim, Reuben Tan","cross_cats":["cs.AI"],"headline":"","license":"http://creativecommons.org/licenses/by-sa/4.0/","primary_cat":"cs.CV","submitted_at":"2026-05-25T13:06:59Z","title":"Diversity Over Frequency: Rethinking Tool Use in Visual Chain-of-Thought Agents"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.00096","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:40319fed3cab9e9ecdfedfd9826bf7325f94f664f3255b4263d723f37d9c1533","target":"record","created_at":"2026-06-02T00:03:14Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"7402d63716d1c7978ba71f6549ff919e10af1d9a5d7c9d20e2facac052a9fac6","cross_cats_sorted":["cs.AI"],"license":"http://creativecommons.org/licenses/by-sa/4.0/","primary_cat":"cs.CV","submitted_at":"2026-05-25T13:06:59Z","title_canon_sha256":"c2f6726818e61b318cf3644e01e47ee43bf39a3bdc2f381085bc90eefed6708f"},"schema_version":"1.0","source":{"id":"2606.00096","kind":"arxiv","version":1}},"canonical_sha256":"3df24ee22c3ab07b3ab9c13f33a343a6bfb453d2bacd141fd3afd1e207fa1c87","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"3df24ee22c3ab07b3ab9c13f33a343a6bfb453d2bacd141fd3afd1e207fa1c87","first_computed_at":"2026-06-02T00:03:14.877344Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-06-02T00:03:14.877344Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"rkfOrnAetGfd/MuJIst4SdDz7a78aCMqgdpHV54YMBWSFLfTCnXEyLUExYrv+UYyc1vcdP+y4G7w6XnvSW1KBw==","signature_status":"signed_v1","signed_at":"2026-06-02T00:03:14.877897Z","signed_message":"canonical_sha256_bytes"},"source_id":"2606.00096","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:40319fed3cab9e9ecdfedfd9826bf7325f94f664f3255b4263d723f37d9c1533","sha256:cdbb386de254823f27a4fbd5ca90ef3e48a5b1a0389181bbaa6082d16886155d"],"state_sha256":"94e47ab9acca92a31cfc0ed3b43b6fe6b13de88290d51bab094c3ab963c6b658"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"KmhsMIquC+DcPQxjnUd6w1JlGg5ALZ/9iVVVO+j9oKvuvJW4eP2qFIYYU5tesJEcCpMlvfH2Ar4TYytg5mhnCQ==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-04T07:09:47.964325Z","bundle_sha256":"ca95bfeff898cf33f83443e3551cb96a344ee89fc9418d2685e3f3b862cff567"}}