{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2026:JT2CNRU6OXDJXEAPI4DJAXXFBF","short_pith_number":"pith:JT2CNRU6","canonical_record":{"source":{"id":"2605.18601","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2026-05-18T16:12:52Z","cross_cats_sorted":[],"title_canon_sha256":"1e93d45b85952716eae122d35271d0c044ee51b00aa26bc3d4ae36afde74fb3c","abstract_canon_sha256":"80ee1428ec532aef4059eae80261c6d0902db1b499255a3cc7a21cb83e4a60f1"},"schema_version":"1.0"},"canonical_sha256":"4cf426c69e75c69b900f4706905ee509662b36fd6226f96f912f2515211473b5","source":{"kind":"arxiv","id":"2605.18601","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2605.18601","created_at":"2026-05-20T00:06:10Z"},{"alias_kind":"arxiv_version","alias_value":"2605.18601v1","created_at":"2026-05-20T00:06:10Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.18601","created_at":"2026-05-20T00:06:10Z"},{"alias_kind":"pith_short_12","alias_value":"JT2CNRU6OXDJ","created_at":"2026-05-20T00:06:10Z"},{"alias_kind":"pith_short_16","alias_value":"JT2CNRU6OXDJXEAP","created_at":"2026-05-20T00:06:10Z"},{"alias_kind":"pith_short_8","alias_value":"JT2CNRU6","created_at":"2026-05-20T00:06:10Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2026:JT2CNRU6OXDJXEAPI4DJAXXFBF","target":"record","payload":{"canonical_record":{"source":{"id":"2605.18601","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2026-05-18T16:12:52Z","cross_cats_sorted":[],"title_canon_sha256":"1e93d45b85952716eae122d35271d0c044ee51b00aa26bc3d4ae36afde74fb3c","abstract_canon_sha256":"80ee1428ec532aef4059eae80261c6d0902db1b499255a3cc7a21cb83e4a60f1"},"schema_version":"1.0"},"canonical_sha256":"4cf426c69e75c69b900f4706905ee509662b36fd6226f96f912f2515211473b5","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-20T00:06:10.340502Z","signature_b64":"1N6PMg+rfRyVwto5YAY5LSMbTO8OTbff8V0/5///WYHXEkjcu6+KFgI54lx651aR1q6znlMj9MzYypPRaOweCA==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"4cf426c69e75c69b900f4706905ee509662b36fd6226f96f912f2515211473b5","last_reissued_at":"2026-05-20T00:06:10.339716Z","signature_status":"signed_v1","first_computed_at":"2026-05-20T00:06:10.339716Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2605.18601","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-20T00:06:10Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"qiYDJfGiNGtnX48nwqyqtm0zk+nLdkhD7G4o8armU99a2KXalUj4aTmOYCj2Q2jQCuwtNhZUAWROUZ2Xn3jUDw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-25T12:39:32.069075Z"},"content_sha256":"899e6fbe5ba6ebcd697f467225cc50582e0752947fd9e0db4806e020bcd4bac3","schema_version":"1.0","event_id":"sha256:899e6fbe5ba6ebcd697f467225cc50582e0752947fd9e0db4806e020bcd4bac3"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2026:JT2CNRU6OXDJXEAPI4DJAXXFBF","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Incantation: Natural Language as the Action Interface for Multi-Entity Video World Models","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.CV","authors_text":"Fan Cheng, Huangji Wang, Jian Zhao, Qianyu Peng, Ruili Feng, Shangwen Zhu, Xiangrui Ke, Xinyu Cui, Yeying Jin, Zeqing Wang, Zhaohu Xing, Zhao Pu, Zhilei Shu, Zizhao Tong","submitted_at":"2026-05-18T16:12:52Z","abstract_excerpt":"Modern interactive video world models have achieved impressive visual fidelity, yet lack fine-grained multi-entity control and cross-entity, cross-world generalization. We trace this gap to the action interface: standard control protocols (e.g. animation IDs, device inputs, scene-level captions) bind action semantics to specific entities or engines at design time. We propose natural language as the interface to unlock expressiveness that no prior interface can achieve, and we present Incantation, the first interactive video world model with per-latent-frame (0.25 s) natural-language conditioni"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2605.18601","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2605.18601/integrity.json","findings":[],"available":true,"detectors_run":[{"name":"claim_evidence","ran_at":"2026-05-20T00:01:59.255259Z","status":"completed","version":"1.0.0","findings_count":0}],"snapshot_sha256":"872624663d2a3c4a475d853f0e3906bac0afb6987e6a847aa8bc864300582364"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-20T00:06:10Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"x+YcZGj8oYFtiTwAOCuVYgJp6rv5NFbp7DmkKE00i+XARslJ/FLB8AJJUaDijKJLllxaTgnmxB/CeSPcxJMUBQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-25T12:39:32.069844Z"},"content_sha256":"dbc1183a6ff81bb9fdb5457847dd6ca665dd4ad980bd1397c340fb7aea0ecce0","schema_version":"1.0","event_id":"sha256:dbc1183a6ff81bb9fdb5457847dd6ca665dd4ad980bd1397c340fb7aea0ecce0"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/JT2CNRU6OXDJXEAPI4DJAXXFBF/bundle.json","state_url":"https://pith.science/pith/JT2CNRU6OXDJXEAPI4DJAXXFBF/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/JT2CNRU6OXDJXEAPI4DJAXXFBF/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-25T12:39:32Z","links":{"resolver":"https://pith.science/pith/JT2CNRU6OXDJXEAPI4DJAXXFBF","bundle":"https://pith.science/pith/JT2CNRU6OXDJXEAPI4DJAXXFBF/bundle.json","state":"https://pith.science/pith/JT2CNRU6OXDJXEAPI4DJAXXFBF/state.json","well_known_bundle":"https://pith.science/.well-known/pith/JT2CNRU6OXDJXEAPI4DJAXXFBF/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:JT2CNRU6OXDJXEAPI4DJAXXFBF","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"80ee1428ec532aef4059eae80261c6d0902db1b499255a3cc7a21cb83e4a60f1","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2026-05-18T16:12:52Z","title_canon_sha256":"1e93d45b85952716eae122d35271d0c044ee51b00aa26bc3d4ae36afde74fb3c"},"schema_version":"1.0","source":{"id":"2605.18601","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2605.18601","created_at":"2026-05-20T00:06:10Z"},{"alias_kind":"arxiv_version","alias_value":"2605.18601v1","created_at":"2026-05-20T00:06:10Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.18601","created_at":"2026-05-20T00:06:10Z"},{"alias_kind":"pith_short_12","alias_value":"JT2CNRU6OXDJ","created_at":"2026-05-20T00:06:10Z"},{"alias_kind":"pith_short_16","alias_value":"JT2CNRU6OXDJXEAP","created_at":"2026-05-20T00:06:10Z"},{"alias_kind":"pith_short_8","alias_value":"JT2CNRU6","created_at":"2026-05-20T00:06:10Z"}],"graph_snapshots":[{"event_id":"sha256:dbc1183a6ff81bb9fdb5457847dd6ca665dd4ad980bd1397c340fb7aea0ecce0","target":"graph","created_at":"2026-05-20T00:06:10Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[{"findings_count":0,"name":"claim_evidence","ran_at":"2026-05-20T00:01:59.255259Z","status":"completed","version":"1.0.0"}],"endpoint":"/pith/2605.18601/integrity.json","findings":[],"snapshot_sha256":"872624663d2a3c4a475d853f0e3906bac0afb6987e6a847aa8bc864300582364","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Modern interactive video world models have achieved impressive visual fidelity, yet lack fine-grained multi-entity control and cross-entity, cross-world generalization. We trace this gap to the action interface: standard control protocols (e.g. animation IDs, device inputs, scene-level captions) bind action semantics to specific entities or engines at design time. We propose natural language as the interface to unlock expressiveness that no prior interface can achieve, and we present Incantation, the first interactive video world model with per-latent-frame (0.25 s) natural-language conditioni","authors_text":"Fan Cheng, Huangji Wang, Jian Zhao, Qianyu Peng, Ruili Feng, Shangwen Zhu, Xiangrui Ke, Xinyu Cui, Yeying Jin, Zeqing Wang, Zhaohu Xing, Zhao Pu, Zhilei Shu, Zizhao Tong","cross_cats":[],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2026-05-18T16:12:52Z","title":"Incantation: Natural Language as the Action Interface for Multi-Entity Video World Models"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2605.18601","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:899e6fbe5ba6ebcd697f467225cc50582e0752947fd9e0db4806e020bcd4bac3","target":"record","created_at":"2026-05-20T00:06:10Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"80ee1428ec532aef4059eae80261c6d0902db1b499255a3cc7a21cb83e4a60f1","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2026-05-18T16:12:52Z","title_canon_sha256":"1e93d45b85952716eae122d35271d0c044ee51b00aa26bc3d4ae36afde74fb3c"},"schema_version":"1.0","source":{"id":"2605.18601","kind":"arxiv","version":1}},"canonical_sha256":"4cf426c69e75c69b900f4706905ee509662b36fd6226f96f912f2515211473b5","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"4cf426c69e75c69b900f4706905ee509662b36fd6226f96f912f2515211473b5","first_computed_at":"2026-05-20T00:06:10.339716Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-20T00:06:10.339716Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"1N6PMg+rfRyVwto5YAY5LSMbTO8OTbff8V0/5///WYHXEkjcu6+KFgI54lx651aR1q6znlMj9MzYypPRaOweCA==","signature_status":"signed_v1","signed_at":"2026-05-20T00:06:10.340502Z","signed_message":"canonical_sha256_bytes"},"source_id":"2605.18601","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:899e6fbe5ba6ebcd697f467225cc50582e0752947fd9e0db4806e020bcd4bac3","sha256:dbc1183a6ff81bb9fdb5457847dd6ca665dd4ad980bd1397c340fb7aea0ecce0"],"state_sha256":"1a7af12076b3ddffa85d602117a334a2aba6c85d0aff7ba563c4755d80d58965"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"lBg0G2XLX7eBvthZm/JC+u9dJDYKX3tR5zWmy/PUXhzh/rSy4ZavxNG1wP5YlvhG4DD1DGCIASqzYGzXmnrmBQ==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-25T12:39:32.073295Z","bundle_sha256":"5a533da159df301a0e017cb0af80265c08a7722ae717b89b26efbef023fc3b6e"}}