{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2026:RXSMKM7MLRNF4VP2BUVBEBVDQA","short_pith_number":"pith:RXSMKM7M","canonical_record":{"source":{"id":"2606.30054","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CV","submitted_at":"2026-06-29T09:45:15Z","cross_cats_sorted":[],"title_canon_sha256":"41e0506a51364980994283c434880e3b3532bb44dd23dcc446e571e5442bff00","abstract_canon_sha256":"0568b43610d0532b852f8c0bc28e4607cdf33e58b300b6064ab22ddf5e4a061a"},"schema_version":"1.0"},"canonical_sha256":"8de4c533ec5c5a5e55fa0d2a1206a3803e4cca4d5344637788a9dc4a3b6d697c","source":{"kind":"arxiv","id":"2606.30054","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.30054","created_at":"2026-06-30T02:17:47Z"},{"alias_kind":"arxiv_version","alias_value":"2606.30054v1","created_at":"2026-06-30T02:17:47Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.30054","created_at":"2026-06-30T02:17:47Z"},{"alias_kind":"pith_short_12","alias_value":"RXSMKM7MLRNF","created_at":"2026-06-30T02:17:47Z"},{"alias_kind":"pith_short_16","alias_value":"RXSMKM7MLRNF4VP2","created_at":"2026-06-30T02:17:47Z"},{"alias_kind":"pith_short_8","alias_value":"RXSMKM7M","created_at":"2026-06-30T02:17:47Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2026:RXSMKM7MLRNF4VP2BUVBEBVDQA","target":"record","payload":{"canonical_record":{"source":{"id":"2606.30054","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CV","submitted_at":"2026-06-29T09:45:15Z","cross_cats_sorted":[],"title_canon_sha256":"41e0506a51364980994283c434880e3b3532bb44dd23dcc446e571e5442bff00","abstract_canon_sha256":"0568b43610d0532b852f8c0bc28e4607cdf33e58b300b6064ab22ddf5e4a061a"},"schema_version":"1.0"},"canonical_sha256":"8de4c533ec5c5a5e55fa0d2a1206a3803e4cca4d5344637788a9dc4a3b6d697c","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-06-30T02:17:47.662223Z","signature_b64":"GG2jYe1W6yfTYUlb1iNdVH05b4FDuN2YGZ91boMaOFNXYczcCyGQOIM/QFC5I+uuet5wcy25j3YNeEXOBX+lDg==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"8de4c533ec5c5a5e55fa0d2a1206a3803e4cca4d5344637788a9dc4a3b6d697c","last_reissued_at":"2026-06-30T02:17:47.661710Z","signature_status":"signed_v1","first_computed_at":"2026-06-30T02:17:47.661710Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2606.30054","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-06-30T02:17:47Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"ZAQunHwLdLGO+Ws+iofuzfQPYfV8uIcarHLNAcMmAOyLwLwLfQcEBg8TlL6G10OSTOJLJ776ZAsD3txzesE4Dw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-30T13:59:58.191954Z"},"content_sha256":"b4c14c31679666317651ca9999f51a63950c7e12650d7ed8b2ebdb8a342c9baa","schema_version":"1.0","event_id":"sha256:b4c14c31679666317651ca9999f51a63950c7e12650d7ed8b2ebdb8a342c9baa"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2026:RXSMKM7MLRNF4VP2BUVBEBVDQA","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Illuminating Unified Multimodal Model for Free-form Interleaved Text-Image Generation","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":[],"primary_cat":"cs.CV","authors_text":"Chonghuinan Wang, Chunwei Wang, Fan Li, Jiaqi Xu, Junwei Yang, Renjing Pei, Wangmeng Zuo, Wei Zhang, Xiaohe Wu, Yecong Wan, Zhikai Chen, Zhixin Wang","submitted_at":"2026-06-29T09:45:15Z","abstract_excerpt":"The advancement of generative AI models capable of producing text and image marks a critical step forward in the realm of multimodal intelligence, particularly for tasks involving the interleaving of both modalities. To advance this intelligence to the next stage, it is crucial for models to autonomously generate free-form interleaved text-image sequences. In this paper, we introduce ILLUME-X, an advanced unified multimodal paradigm that enables high-quality, free-form interleaved text-image generation by improving multimodal data efficiency and stabilizing the multimodal training process. ILL"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.30054","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2606.30054/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-06-30T02:17:47Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"SCfmXKaKVBkgU4umLmiUwQVvuWh4KtWqO9GLb7lIK5i5DDeKhfE+FUHoQGCXfSxRGajCXadxNSnPi+c1IpLrBQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-30T13:59:58.192345Z"},"content_sha256":"b467fb2748a21899cc32aae1d171253f3abca8d1750b56c1d1ab4bea61a7c0a8","schema_version":"1.0","event_id":"sha256:b467fb2748a21899cc32aae1d171253f3abca8d1750b56c1d1ab4bea61a7c0a8"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/RXSMKM7MLRNF4VP2BUVBEBVDQA/bundle.json","state_url":"https://pith.science/pith/RXSMKM7MLRNF4VP2BUVBEBVDQA/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/RXSMKM7MLRNF4VP2BUVBEBVDQA/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-30T13:59:58Z","links":{"resolver":"https://pith.science/pith/RXSMKM7MLRNF4VP2BUVBEBVDQA","bundle":"https://pith.science/pith/RXSMKM7MLRNF4VP2BUVBEBVDQA/bundle.json","state":"https://pith.science/pith/RXSMKM7MLRNF4VP2BUVBEBVDQA/state.json","well_known_bundle":"https://pith.science/.well-known/pith/RXSMKM7MLRNF4VP2BUVBEBVDQA/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:RXSMKM7MLRNF4VP2BUVBEBVDQA","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"0568b43610d0532b852f8c0bc28e4607cdf33e58b300b6064ab22ddf5e4a061a","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CV","submitted_at":"2026-06-29T09:45:15Z","title_canon_sha256":"41e0506a51364980994283c434880e3b3532bb44dd23dcc446e571e5442bff00"},"schema_version":"1.0","source":{"id":"2606.30054","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.30054","created_at":"2026-06-30T02:17:47Z"},{"alias_kind":"arxiv_version","alias_value":"2606.30054v1","created_at":"2026-06-30T02:17:47Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.30054","created_at":"2026-06-30T02:17:47Z"},{"alias_kind":"pith_short_12","alias_value":"RXSMKM7MLRNF","created_at":"2026-06-30T02:17:47Z"},{"alias_kind":"pith_short_16","alias_value":"RXSMKM7MLRNF4VP2","created_at":"2026-06-30T02:17:47Z"},{"alias_kind":"pith_short_8","alias_value":"RXSMKM7M","created_at":"2026-06-30T02:17:47Z"}],"graph_snapshots":[{"event_id":"sha256:b467fb2748a21899cc32aae1d171253f3abca8d1750b56c1d1ab4bea61a7c0a8","target":"graph","created_at":"2026-06-30T02:17:47Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2606.30054/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"The advancement of generative AI models capable of producing text and image marks a critical step forward in the realm of multimodal intelligence, particularly for tasks involving the interleaving of both modalities. To advance this intelligence to the next stage, it is crucial for models to autonomously generate free-form interleaved text-image sequences. In this paper, we introduce ILLUME-X, an advanced unified multimodal paradigm that enables high-quality, free-form interleaved text-image generation by improving multimodal data efficiency and stabilizing the multimodal training process. ILL","authors_text":"Chonghuinan Wang, Chunwei Wang, Fan Li, Jiaqi Xu, Junwei Yang, Renjing Pei, Wangmeng Zuo, Wei Zhang, Xiaohe Wu, Yecong Wan, Zhikai Chen, Zhixin Wang","cross_cats":[],"headline":"","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CV","submitted_at":"2026-06-29T09:45:15Z","title":"Illuminating Unified Multimodal Model for Free-form Interleaved Text-Image Generation"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.30054","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:b4c14c31679666317651ca9999f51a63950c7e12650d7ed8b2ebdb8a342c9baa","target":"record","created_at":"2026-06-30T02:17:47Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"0568b43610d0532b852f8c0bc28e4607cdf33e58b300b6064ab22ddf5e4a061a","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CV","submitted_at":"2026-06-29T09:45:15Z","title_canon_sha256":"41e0506a51364980994283c434880e3b3532bb44dd23dcc446e571e5442bff00"},"schema_version":"1.0","source":{"id":"2606.30054","kind":"arxiv","version":1}},"canonical_sha256":"8de4c533ec5c5a5e55fa0d2a1206a3803e4cca4d5344637788a9dc4a3b6d697c","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"8de4c533ec5c5a5e55fa0d2a1206a3803e4cca4d5344637788a9dc4a3b6d697c","first_computed_at":"2026-06-30T02:17:47.661710Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-06-30T02:17:47.661710Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"GG2jYe1W6yfTYUlb1iNdVH05b4FDuN2YGZ91boMaOFNXYczcCyGQOIM/QFC5I+uuet5wcy25j3YNeEXOBX+lDg==","signature_status":"signed_v1","signed_at":"2026-06-30T02:17:47.662223Z","signed_message":"canonical_sha256_bytes"},"source_id":"2606.30054","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:b4c14c31679666317651ca9999f51a63950c7e12650d7ed8b2ebdb8a342c9baa","sha256:b467fb2748a21899cc32aae1d171253f3abca8d1750b56c1d1ab4bea61a7c0a8"],"state_sha256":"f2618b6c4dfd4774a0d1e5ff3e5ef857b029456d60d94047541930042bec4f6c"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"Lhs5hXzOUVKgX91gxiWIyJmYTdgIsKwRQ6K16MYdx2gtcER5lmHWcB9xMiAiiFyd4DvqK6xVzIHQ6hhm2PA4AQ==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-30T13:59:58.194361Z","bundle_sha256":"2b13a5bb1e028c7e4ca8b45d3309dadfeac06267b94c9c93d86376a610b99a37"}}