{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:L7ZVS4ZDB5LRWGUHEDFW4EDLCL","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"b9e98dc505f5b2d931a6898c0de72203e07056db2c5cee3b8fcc38a998b185c0","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2026-06-30T16:22:12Z","title_canon_sha256":"7e662cc30dddccb71f5ae074e29c698991d985bc8b951ac34499440f9a9a84a3"},"schema_version":"1.0","source":{"id":"2606.31916","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.31916","created_at":"2026-07-01T01:18:19Z"},{"alias_kind":"arxiv_version","alias_value":"2606.31916v1","created_at":"2026-07-01T01:18:19Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.31916","created_at":"2026-07-01T01:18:19Z"},{"alias_kind":"pith_short_12","alias_value":"L7ZVS4ZDB5LR","created_at":"2026-07-01T01:18:19Z"},{"alias_kind":"pith_short_16","alias_value":"L7ZVS4ZDB5LRWGUH","created_at":"2026-07-01T01:18:19Z"},{"alias_kind":"pith_short_8","alias_value":"L7ZVS4ZD","created_at":"2026-07-01T01:18:19Z"}],"graph_snapshots":[{"event_id":"sha256:9cc343fdd475af6b1d2eb2df7b1a45234a7c2ad3681495fb5f0a2648367bcf31","target":"graph","created_at":"2026-07-01T01:18:19Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2606.31916/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Theory of Mind (ToM) benchmarks for Large Language Models (LLMs) typically rely on passive question-answering formats, but the deployment of LLMs in increasingly agentic and autonomous forms demands new evaluations. In this paper we evaluate an agent's ability to induce specific belief states in other agents by taking actions rather than using conversational persuasion, a capability we call Non-Conversational Planning ToM (NCP-ToM). NCP-ToM is likely to be essential for many agent use-cases, including within user-assistant interactions and pedagogical contexts, but may also present manipulatio","authors_text":"Ben Slater, John Burden, Lucy G. Cheke, Matteo G. Mecattaf, Winnie Street","cross_cats":[],"headline":"","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2026-06-30T16:22:12Z","title":"Theory of Mind and Persuasion Beyond Conversation: Assessing the Capacity of LLMs to Induce Belief States via Planning and Action"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.31916","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:224e45b0401c8450f2074f56104b5e233b8905d02d7e5004c38eb22a36eeba25","target":"record","created_at":"2026-07-01T01:18:19Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"b9e98dc505f5b2d931a6898c0de72203e07056db2c5cee3b8fcc38a998b185c0","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2026-06-30T16:22:12Z","title_canon_sha256":"7e662cc30dddccb71f5ae074e29c698991d985bc8b951ac34499440f9a9a84a3"},"schema_version":"1.0","source":{"id":"2606.31916","kind":"arxiv","version":1}},"canonical_sha256":"5ff35973230f571b1a8720cb6e106b12d5dbf30b595b5e553bc1471a34b7fdd2","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"5ff35973230f571b1a8720cb6e106b12d5dbf30b595b5e553bc1471a34b7fdd2","first_computed_at":"2026-07-01T01:18:19.442347Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-07-01T01:18:19.442347Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"SZLJbXN+5wJrbDeTcxJpZ9qTktfPUwcaCAiawS4vVierMrwdaGLByp/7lLdXGEgcm4fBLX6KGYiIY0QNAlg1Bw==","signature_status":"signed_v1","signed_at":"2026-07-01T01:18:19.442807Z","signed_message":"canonical_sha256_bytes"},"source_id":"2606.31916","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:224e45b0401c8450f2074f56104b5e233b8905d02d7e5004c38eb22a36eeba25","sha256:9cc343fdd475af6b1d2eb2df7b1a45234a7c2ad3681495fb5f0a2648367bcf31"],"state_sha256":"bd6a17e9faa35744a1cd0a901a9375c73d045beb99f090d59f5e615d0ed15f3f"}