{"record_type":"pith_number_record","schema_url":"https://pith.science/schemas/pith-number/v1.json","pith_number":"pith:2026:DXDMSGWCV6QIG3K64AHHJMIG33","short_pith_number":"pith:DXDMSGWC","schema_version":"1.0","canonical_sha256":"1dc6c91ac2afa0836d5ee00e74b106decd2a7482d8f4535d052e4ecdbdc5a34b","source":{"kind":"arxiv","id":"2605.27589","version":1},"attestation_state":"computed","paper":{"title":"What-If World: A Causal Benchmark for General World Models in Embodied Scenarios","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":[],"primary_cat":"cs.CV","authors_text":"Alicia Yu, Fnu Suya, Jiaqi Ma, Jinghuai Zhang, Kaiyuan Zhang, Kunlin Cai, Mohammad Rostami, Pranav Bodapati, Rui Song, Yuan Tian","submitted_at":"2026-05-26T19:02:26Z","abstract_excerpt":"Video generation models are increasingly used as world simulators for tasks like driving and robotic manipulation. What matters in these settings is not whether a single video looks right, but whether the model's output changes when its input changes. We test this by giving a model two prompts describing the same scene with one physical detail varied, and checking whether the two videos diverge the way physics predicts. The wording difference between the prompts is small by design, since only one variable is changed, but the correct physical difference is not. A model that misses this can stil"},"verification_status":{"content_addressed":true,"pith_receipt":true,"author_attested":false,"weak_author_claims":0,"strong_author_claims":0,"externally_anchored":false,"storage_verified":false,"citation_signatures":0,"replication_records":0,"graph_snapshot":true,"references_resolved":false,"formal_links_present":false},"canonical_record":{"source":{"id":"2605.27589","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CV","submitted_at":"2026-05-26T19:02:26Z","cross_cats_sorted":[],"title_canon_sha256":"5ba40671539519f47eec04294c552ad4511618b8973abcdc1eb1d476241cbf71","abstract_canon_sha256":"37607f1aeb14ebd8dcf21f0e270a39f0837ffdecd0397c47d77fd4ecd6952af0"},"schema_version":"1.0"},"receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-28T01:04:17.096926Z","signature_b64":"MuYD4ludOk9E30HyjdaOaSaS9J+4F22itGtF3oi4PlPAxAWtLfvtHKSVBBvtmm6G7427Nzdc/YMcyuTAd+teDg==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"1dc6c91ac2afa0836d5ee00e74b106decd2a7482d8f4535d052e4ecdbdc5a34b","last_reissued_at":"2026-05-28T01:04:17.096519Z","signature_status":"signed_v1","first_computed_at":"2026-05-28T01:04:17.096519Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"graph_snapshot":{"paper":{"title":"What-If World: A Causal Benchmark for General World Models in Embodied Scenarios","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":[],"primary_cat":"cs.CV","authors_text":"Alicia Yu, Fnu Suya, Jiaqi Ma, Jinghuai Zhang, Kaiyuan Zhang, Kunlin Cai, Mohammad Rostami, Pranav Bodapati, Rui Song, Yuan Tian","submitted_at":"2026-05-26T19:02:26Z","abstract_excerpt":"Video generation models are increasingly used as world simulators for tasks like driving and robotic manipulation. What matters in these settings is not whether a single video looks right, but whether the model's output changes when its input changes. We test this by giving a model two prompts describing the same scene with one physical detail varied, and checking whether the two videos diverge the way physics predicts. The wording difference between the prompts is small by design, since only one variable is changed, but the correct physical difference is not. A model that misses this can stil"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2605.27589","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2605.27589/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"aliases":[{"alias_kind":"arxiv","alias_value":"2605.27589","created_at":"2026-05-28T01:04:17.096574+00:00"},{"alias_kind":"arxiv_version","alias_value":"2605.27589v1","created_at":"2026-05-28T01:04:17.096574+00:00"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.27589","created_at":"2026-05-28T01:04:17.096574+00:00"},{"alias_kind":"pith_short_12","alias_value":"DXDMSGWCV6QI","created_at":"2026-05-28T01:04:17.096574+00:00"},{"alias_kind":"pith_short_16","alias_value":"DXDMSGWCV6QIG3K6","created_at":"2026-05-28T01:04:17.096574+00:00"},{"alias_kind":"pith_short_8","alias_value":"DXDMSGWC","created_at":"2026-05-28T01:04:17.096574+00:00"}],"events":[],"event_summary":{},"paper_claims":[],"inbound_citations":{"count":0,"internal_anchor_count":0,"sample":[]},"formal_canon":{"evidence_count":0,"sample":[],"anchors":[]},"links":{"html":"https://pith.science/pith/DXDMSGWCV6QIG3K64AHHJMIG33","json":"https://pith.science/pith/DXDMSGWCV6QIG3K64AHHJMIG33.json","graph_json":"https://pith.science/api/pith-number/DXDMSGWCV6QIG3K64AHHJMIG33/graph.json","events_json":"https://pith.science/api/pith-number/DXDMSGWCV6QIG3K64AHHJMIG33/events.json","paper":"https://pith.science/paper/DXDMSGWC"},"agent_actions":{"view_html":"https://pith.science/pith/DXDMSGWCV6QIG3K64AHHJMIG33","download_json":"https://pith.science/pith/DXDMSGWCV6QIG3K64AHHJMIG33.json","view_paper":"https://pith.science/paper/DXDMSGWC","resolve_alias":"https://pith.science/api/pith-number/resolve?arxiv=2605.27589&json=true","fetch_graph":"https://pith.science/api/pith-number/DXDMSGWCV6QIG3K64AHHJMIG33/graph.json","fetch_events":"https://pith.science/api/pith-number/DXDMSGWCV6QIG3K64AHHJMIG33/events.json","actions":{"anchor_timestamp":"https://pith.science/pith/DXDMSGWCV6QIG3K64AHHJMIG33/action/timestamp_anchor","attest_storage":"https://pith.science/pith/DXDMSGWCV6QIG3K64AHHJMIG33/action/storage_attestation","attest_author":"https://pith.science/pith/DXDMSGWCV6QIG3K64AHHJMIG33/action/author_attestation","sign_citation":"https://pith.science/pith/DXDMSGWCV6QIG3K64AHHJMIG33/action/citation_signature","submit_replication":"https://pith.science/pith/DXDMSGWCV6QIG3K64AHHJMIG33/action/replication_record"}},"created_at":"2026-05-28T01:04:17.096574+00:00","updated_at":"2026-05-28T01:04:17.096574+00:00"}