{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:WSDI4MEDOFJVWG4UHF3SGYU2UQ","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"fdcdd5cebd5e900c30ad8c423d9d42d96a00ea372e1d2658abeaab40a2017f14","cross_cats_sorted":["cs.CL"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.AI","submitted_at":"2026-06-08T15:51:51Z","title_canon_sha256":"6d5c8a29894005245b312237385beebfdaf35e03cb15ebaf083f6f37bc8d9140"},"schema_version":"1.0","source":{"id":"2606.09669","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.09669","created_at":"2026-06-09T02:09:02Z"},{"alias_kind":"arxiv_version","alias_value":"2606.09669v1","created_at":"2026-06-09T02:09:02Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.09669","created_at":"2026-06-09T02:09:02Z"},{"alias_kind":"pith_short_12","alias_value":"WSDI4MEDOFJV","created_at":"2026-06-09T02:09:02Z"},{"alias_kind":"pith_short_16","alias_value":"WSDI4MEDOFJVWG4U","created_at":"2026-06-09T02:09:02Z"},{"alias_kind":"pith_short_8","alias_value":"WSDI4MED","created_at":"2026-06-09T02:09:02Z"}],"graph_snapshots":[{"event_id":"sha256:170c011611bcd48d4b00d6117683ec9a9b255e8d26e6104b01f7abe1134cee91","target":"graph","created_at":"2026-06-09T02:09:02Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2606.09669/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Spatial reasoning is a foundational capability for multimodal large language models (MLLMs) to perceive and operate within the physical world. However, existing benchmarks predominantly rely on passive evaluation (e.g., static VQA) or simulator-specific pipelines, failing to assess general interactive spatial understanding. We introduce SpatialWorld, a unified benchmark designed specifically for evaluating the interactive spatial understanding of multimodal agents in complex real-world tasks. Integrating eight heterogeneous simulation backends under a shared, simulator-agnostic protocol, Spati","authors_text":"Bohan Zeng, Bo Wang, Guoqing Huang, Hailong Qu, Haoyang Huang, Hengkang Qiao, Hongcheng Gao, Hongyixuan Yuan, Jiahao Wang, Jianhui Liu, Jingyi Tang, Junming Yang, Nan Duan, Olive Huang, Shihong Huang, Wenbo Li, Wenjie Li, Wentao Zhang, Yi Li, Yinpeng Dong, Zihao Huang","cross_cats":["cs.CL"],"headline":"","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.AI","submitted_at":"2026-06-08T15:51:51Z","title":"SpatialWorld: Benchmarking Interactive Spatial Reasoning of Multimodal Agents in Real-World Tasks"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.09669","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:9dd3df47605e0f058d1214e70d880a549682dce06daee20017e06a54475115ee","target":"record","created_at":"2026-06-09T02:09:02Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"fdcdd5cebd5e900c30ad8c423d9d42d96a00ea372e1d2658abeaab40a2017f14","cross_cats_sorted":["cs.CL"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.AI","submitted_at":"2026-06-08T15:51:51Z","title_canon_sha256":"6d5c8a29894005245b312237385beebfdaf35e03cb15ebaf083f6f37bc8d9140"},"schema_version":"1.0","source":{"id":"2606.09669","kind":"arxiv","version":1}},"canonical_sha256":"b4868e308371535b1b94397723629aa42dbe2fc3a746e1ab12ddc7c6d551637b","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"b4868e308371535b1b94397723629aa42dbe2fc3a746e1ab12ddc7c6d551637b","first_computed_at":"2026-06-09T02:09:02.778487Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-06-09T02:09:02.778487Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"lsCLJYmtXyX788btd8jY1LaKtZZf1MRvhd6x9Sqpix0qmxWxDOKB/6FtDzMIL45Nxb74r4j/7pdpbqTjrwYyCQ==","signature_status":"signed_v1","signed_at":"2026-06-09T02:09:02.779017Z","signed_message":"canonical_sha256_bytes"},"source_id":"2606.09669","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:9dd3df47605e0f058d1214e70d880a549682dce06daee20017e06a54475115ee","sha256:170c011611bcd48d4b00d6117683ec9a9b255e8d26e6104b01f7abe1134cee91"],"state_sha256":"a0d5bfe49446d2e9e5c0bb79b8f08e2ed04f15e4510bb5c97e80eaa6b2af2fcc"}