{"record_type":"pith_number_record","schema_url":"https://pith.science/schemas/pith-number/v1.json","pith_number":"pith:2026:SRG3IOMYVS6GEX5HESL5U7EYHL","short_pith_number":"pith:SRG3IOMY","schema_version":"1.0","canonical_sha256":"944db43998acbc625fa72497da7c983ad15cc74f9967f152f013b6b090543e67","source":{"kind":"arxiv","id":"2605.28465","version":1},"attestation_state":"computed","paper":{"title":"Beyond One Path: Evaluating and Enhancing Divergent Thinking in Interactive LLM Agents","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.CL","authors_text":"Hwanhee Lee, Ingeol Baek, Jeonghyun Park, Jihyeong Park","submitted_at":"2026-05-27T13:33:23Z","abstract_excerpt":"Divergent thinking is a core dimension of creativity, yet existing evaluations of Large Language Models (LLMs) treat them as single-turn text generations, failing to capture how an agent reasons through iterative interaction. To address this, we introduce MUTATE, an interactive benchmark designed to evaluate agentic divergent thinking at two levels: path-level, where an agent discovers multiple alternative paths to the same goal, and action-level, where individual actions require non-typical, mechanism-shifting object uses. Unlike success-only evaluations, MUTATE scores both completed paths an"},"verification_status":{"content_addressed":true,"pith_receipt":true,"author_attested":false,"weak_author_claims":0,"strong_author_claims":0,"externally_anchored":false,"storage_verified":false,"citation_signatures":0,"replication_records":0,"graph_snapshot":true,"references_resolved":false,"formal_links_present":false},"canonical_record":{"source":{"id":"2605.28465","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2026-05-27T13:33:23Z","cross_cats_sorted":[],"title_canon_sha256":"61aa321027f4a8094c96671cd326a9392b4a8dd87458c634525b364beb89c7e7","abstract_canon_sha256":"68836260b02c2fced0a548802d48a32db4390ef0e1c0b95236482fbc8b2e64a2"},"schema_version":"1.0"},"receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-28T02:04:53.837535Z","signature_b64":"E0+Zx/m7DjrCf450tIIuW2R5QPvZ7y5/G/3dm79MGNsOXri+9hbb1OEtDx0Bv4tDAe4/bN2m2QfnfU6bYcYSAg==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"944db43998acbc625fa72497da7c983ad15cc74f9967f152f013b6b090543e67","last_reissued_at":"2026-05-28T02:04:53.837119Z","signature_status":"signed_v1","first_computed_at":"2026-05-28T02:04:53.837119Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"graph_snapshot":{"paper":{"title":"Beyond One Path: Evaluating and Enhancing Divergent Thinking in Interactive LLM Agents","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.CL","authors_text":"Hwanhee Lee, Ingeol Baek, Jeonghyun Park, Jihyeong Park","submitted_at":"2026-05-27T13:33:23Z","abstract_excerpt":"Divergent thinking is a core dimension of creativity, yet existing evaluations of Large Language Models (LLMs) treat them as single-turn text generations, failing to capture how an agent reasons through iterative interaction. To address this, we introduce MUTATE, an interactive benchmark designed to evaluate agentic divergent thinking at two levels: path-level, where an agent discovers multiple alternative paths to the same goal, and action-level, where individual actions require non-typical, mechanism-shifting object uses. Unlike success-only evaluations, MUTATE scores both completed paths an"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2605.28465","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2605.28465/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"aliases":[{"alias_kind":"arxiv","alias_value":"2605.28465","created_at":"2026-05-28T02:04:53.837184+00:00"},{"alias_kind":"arxiv_version","alias_value":"2605.28465v1","created_at":"2026-05-28T02:04:53.837184+00:00"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.28465","created_at":"2026-05-28T02:04:53.837184+00:00"},{"alias_kind":"pith_short_12","alias_value":"SRG3IOMYVS6G","created_at":"2026-05-28T02:04:53.837184+00:00"},{"alias_kind":"pith_short_16","alias_value":"SRG3IOMYVS6GEX5H","created_at":"2026-05-28T02:04:53.837184+00:00"},{"alias_kind":"pith_short_8","alias_value":"SRG3IOMY","created_at":"2026-05-28T02:04:53.837184+00:00"}],"events":[],"event_summary":{},"paper_claims":[],"inbound_citations":{"count":0,"internal_anchor_count":0,"sample":[]},"formal_canon":{"evidence_count":0,"sample":[],"anchors":[]},"links":{"html":"https://pith.science/pith/SRG3IOMYVS6GEX5HESL5U7EYHL","json":"https://pith.science/pith/SRG3IOMYVS6GEX5HESL5U7EYHL.json","graph_json":"https://pith.science/api/pith-number/SRG3IOMYVS6GEX5HESL5U7EYHL/graph.json","events_json":"https://pith.science/api/pith-number/SRG3IOMYVS6GEX5HESL5U7EYHL/events.json","paper":"https://pith.science/paper/SRG3IOMY"},"agent_actions":{"view_html":"https://pith.science/pith/SRG3IOMYVS6GEX5HESL5U7EYHL","download_json":"https://pith.science/pith/SRG3IOMYVS6GEX5HESL5U7EYHL.json","view_paper":"https://pith.science/paper/SRG3IOMY","resolve_alias":"https://pith.science/api/pith-number/resolve?arxiv=2605.28465&json=true","fetch_graph":"https://pith.science/api/pith-number/SRG3IOMYVS6GEX5HESL5U7EYHL/graph.json","fetch_events":"https://pith.science/api/pith-number/SRG3IOMYVS6GEX5HESL5U7EYHL/events.json","actions":{"anchor_timestamp":"https://pith.science/pith/SRG3IOMYVS6GEX5HESL5U7EYHL/action/timestamp_anchor","attest_storage":"https://pith.science/pith/SRG3IOMYVS6GEX5HESL5U7EYHL/action/storage_attestation","attest_author":"https://pith.science/pith/SRG3IOMYVS6GEX5HESL5U7EYHL/action/author_attestation","sign_citation":"https://pith.science/pith/SRG3IOMYVS6GEX5HESL5U7EYHL/action/citation_signature","submit_replication":"https://pith.science/pith/SRG3IOMYVS6GEX5HESL5U7EYHL/action/replication_record"}},"created_at":"2026-05-28T02:04:53.837184+00:00","updated_at":"2026-05-28T02:04:53.837184+00:00"}