{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:WOJCDMMPO53E3CKOL2ZH3CBAGV","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"8394121beff83c1ea43a3e800eb7c5bf5bdb6b3bc007ac472078faf32dff7406","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.AI","submitted_at":"2026-05-28T04:58:15Z","title_canon_sha256":"b235403c26beff89d41f578b7ab39bc2b122b32c998256ddd8af874091da665c"},"schema_version":"1.0","source":{"id":"2605.29360","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2605.29360","created_at":"2026-05-29T01:05:35Z"},{"alias_kind":"arxiv_version","alias_value":"2605.29360v1","created_at":"2026-05-29T01:05:35Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.29360","created_at":"2026-05-29T01:05:35Z"},{"alias_kind":"pith_short_12","alias_value":"WOJCDMMPO53E","created_at":"2026-05-29T01:05:35Z"},{"alias_kind":"pith_short_16","alias_value":"WOJCDMMPO53E3CKO","created_at":"2026-05-29T01:05:35Z"},{"alias_kind":"pith_short_8","alias_value":"WOJCDMMP","created_at":"2026-05-29T01:05:35Z"}],"graph_snapshots":[{"event_id":"sha256:c1ff1d58f910b89a41e660af2764504f82ac2ad27f6a3fa3be74164fb43b4f67","target":"graph","created_at":"2026-05-29T01:05:35Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2605.29360/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Action-conditioned world models are increasingly used as scalable simulators for robot learning, yet current evaluations provide limited evidence that their predictions are reliable under the actions they condition on. Existing benchmarks largely emphasize visual fidelity, leaving unclear whether predicted futures are physically plausible, faithful to commanded actions, and calibrated to failure when actions should not succeed. We introduce \\textsc{MiraBench}, a hierarchical benchmark that defines \\emph{action-conditioned reliability} as a core evaluation target for robotic world models. MiraB","authors_text":"Boyuan Chen, Jiaming Ji, Jiawei Chen, Jiayi Zhou, Juntao Dai, Tianzhuo Yang, Yaodong Yang, Zhaoyi Zhang, Zihan Shen, Zirui Mi","cross_cats":[],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.AI","submitted_at":"2026-05-28T04:58:15Z","title":"MiraBench: Evaluating Action-Conditioned Reliability in Robotic World Models"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2605.29360","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:5bfc23f2647562c88b873800980866aad7c21e5a0ae1dde35ef8534e2c119965","target":"record","created_at":"2026-05-29T01:05:35Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"8394121beff83c1ea43a3e800eb7c5bf5bdb6b3bc007ac472078faf32dff7406","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.AI","submitted_at":"2026-05-28T04:58:15Z","title_canon_sha256":"b235403c26beff89d41f578b7ab39bc2b122b32c998256ddd8af874091da665c"},"schema_version":"1.0","source":{"id":"2605.29360","kind":"arxiv","version":1}},"canonical_sha256":"b39221b18f77764d894e5eb27d8820356d3df54109c17ac5ef9698b1fb00093a","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"b39221b18f77764d894e5eb27d8820356d3df54109c17ac5ef9698b1fb00093a","first_computed_at":"2026-05-29T01:05:35.231414Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-29T01:05:35.231414Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"N7F4GMoZhtBHZPZzBwQmoL+elFQlmsF1R9b149quSWrIL3mxMcHYiZTLyQzhAaqODEv6wmgsK+ZHL1GjNZ8OCg==","signature_status":"signed_v1","signed_at":"2026-05-29T01:05:35.231994Z","signed_message":"canonical_sha256_bytes"},"source_id":"2605.29360","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:5bfc23f2647562c88b873800980866aad7c21e5a0ae1dde35ef8534e2c119965","sha256:c1ff1d58f910b89a41e660af2764504f82ac2ad27f6a3fa3be74164fb43b4f67"],"state_sha256":"8bcc51b0fbeb696042e518de24ad871109e0558b3486b58520e0d4b801e65371"}