{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2026:UV2W7EERDOESOABOZG2OKDUNJI","short_pith_number":"pith:UV2W7EER","canonical_record":{"source":{"id":"2605.14270","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CV","submitted_at":"2026-05-14T02:14:09Z","cross_cats_sorted":[],"title_canon_sha256":"a8472a8d08f536ec2bd0dcf679c4a7122f7afd7f8e9eb268ec5371e480df7ac8","abstract_canon_sha256":"ec2ce47ae512cbd714bc8f33cd09fd4119f46b878f970d0994a0eda7af641263"},"schema_version":"1.0"},"canonical_sha256":"a5756f90911b8927002ec9b4e50e8d4a0556ca347a1ae91b050b92aac68158e7","source":{"kind":"arxiv","id":"2605.14270","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2605.14270","created_at":"2026-05-17T23:39:10Z"},{"alias_kind":"arxiv_version","alias_value":"2605.14270v1","created_at":"2026-05-17T23:39:10Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.14270","created_at":"2026-05-17T23:39:10Z"},{"alias_kind":"pith_short_12","alias_value":"UV2W7EERDOES","created_at":"2026-05-18T12:33:37Z"},{"alias_kind":"pith_short_16","alias_value":"UV2W7EERDOESOABO","created_at":"2026-05-18T12:33:37Z"},{"alias_kind":"pith_short_8","alias_value":"UV2W7EER","created_at":"2026-05-18T12:33:37Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2026:UV2W7EERDOESOABOZG2OKDUNJI","target":"record","payload":{"canonical_record":{"source":{"id":"2605.14270","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CV","submitted_at":"2026-05-14T02:14:09Z","cross_cats_sorted":[],"title_canon_sha256":"a8472a8d08f536ec2bd0dcf679c4a7122f7afd7f8e9eb268ec5371e480df7ac8","abstract_canon_sha256":"ec2ce47ae512cbd714bc8f33cd09fd4119f46b878f970d0994a0eda7af641263"},"schema_version":"1.0"},"canonical_sha256":"a5756f90911b8927002ec9b4e50e8d4a0556ca347a1ae91b050b92aac68158e7","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-17T23:39:10.405357Z","signature_b64":"UQetcYtZymwhKTqPHiTqdfnCg+BVQX5R4z3icf9kz5WTzTHCPO3sgzEkmDl68pTwXehpX6X9vcvxAhNxkRThAw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"a5756f90911b8927002ec9b4e50e8d4a0556ca347a1ae91b050b92aac68158e7","last_reissued_at":"2026-05-17T23:39:10.404862Z","signature_status":"signed_v1","first_computed_at":"2026-05-17T23:39:10.404862Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2605.14270","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-17T23:39:10Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"G2yuN8Ou1ABt15rwMJ8y4LFqzB3j1EihasnMauMJjgPnykSST2k2R5+Q6FkANBnUGHFtQjmJQwnkQlFybAvPBA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-10T03:50:46.804545Z"},"content_sha256":"4c6ed9fd970bd2647ce16acb37b7c0a6eec8ad5557b1e1a58b205936499f1074","schema_version":"1.0","event_id":"sha256:4c6ed9fd970bd2647ce16acb37b7c0a6eec8ad5557b1e1a58b205936499f1074"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2026:UV2W7EERDOESOABOZG2OKDUNJI","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Diagnosing and Correcting Concept Omission in Multimodal Diffusion Transformers","license":"http://creativecommons.org/licenses/by/4.0/","headline":"Text embeddings in multimodal diffusion transformers encode a detectable omission signal that can be amplified to include missing concepts in generated images.","cross_cats":[],"primary_cat":"cs.CV","authors_text":"Chaehun Shin, Jaihyun Lew, Jungbeom Lee, Kanghyun Baek, Sungroh Yoon","submitted_at":"2026-05-14T02:14:09Z","abstract_excerpt":"Multimodal Diffusion Transformers (MM-DiTs) have achieved remarkable progress in text-to-image generation, yet they frequently suffer from concept omission, where specified objects or attributes fail to emerge in the generated image. By performing linear probing on text tokens, we demonstrate that text embeddings can distinguish a characteristic `omission signal' representing the absence of target concepts. Leveraging this insight, we propose Omission Signal Intervention (OSI), which amplifies the omission signal to actively catalyze the generation of missing concepts. Comprehensive experiment"},"claims":{"count":4,"items":[{"kind":"strongest_claim","text":"By performing linear probing on text tokens, we demonstrate that text embeddings can distinguish a characteristic `omission signal' representing the absence of target concepts. Leveraging this insight, we propose Omission Signal Intervention (OSI), which amplifies the omission signal to actively catalyze the generation of missing concepts.","source":"verdict.strongest_claim","status":"machine_extracted","claim_id":"C1","attestation":"unclaimed"},{"kind":"weakest_assumption","text":"That the omission signal identified by linear probing is causal for concept omission and that amplifying it will reliably add missing concepts without introducing new artifacts or degrading image quality.","source":"verdict.weakest_assumption","status":"machine_extracted","claim_id":"C2","attestation":"unclaimed"},{"kind":"one_line_summary","text":"Text embeddings in MM-DiTs contain a detectable omission signal for missing concepts, and amplifying it via OSI reduces concept omission in generated images on FLUX.1-Dev and SD3.5-Medium.","source":"verdict.one_line_summary","status":"machine_extracted","claim_id":"C3","attestation":"unclaimed"},{"kind":"headline","text":"Text embeddings in multimodal diffusion transformers encode a detectable omission signal that can be amplified to include missing concepts in generated images.","source":"verdict.pith_extraction.headline","status":"machine_extracted","claim_id":"C4","attestation":"unclaimed"}],"snapshot_sha256":"954e2cbd0a87c40dca67382805c2cc94c91ed14909da65ca63386e32c7f3924a"},"source":{"id":"2605.14270","kind":"arxiv","version":1},"verdict":{"id":"87ab0f90-4d39-413b-8492-147c9670aa34","model_set":{"reader":"grok-4.3"},"created_at":"2026-05-15T02:42:56.787920Z","strongest_claim":"By performing linear probing on text tokens, we demonstrate that text embeddings can distinguish a characteristic `omission signal' representing the absence of target concepts. Leveraging this insight, we propose Omission Signal Intervention (OSI), which amplifies the omission signal to actively catalyze the generation of missing concepts.","one_line_summary":"Text embeddings in MM-DiTs contain a detectable omission signal for missing concepts, and amplifying it via OSI reduces concept omission in generated images on FLUX.1-Dev and SD3.5-Medium.","pipeline_version":"pith-pipeline@v0.9.0","weakest_assumption":"That the omission signal identified by linear probing is causal for concept omission and that amplifying it will reliably add missing concepts without introducing new artifacts or degrading image quality.","pith_extraction_headline":"Text embeddings in multimodal diffusion transformers encode a detectable omission signal that can be amplified to include missing concepts in generated images."},"references":{"count":57,"sample":[{"doi":"","year":null,"title":"Advances in Neural Information Processing Systems , volume=","work_id":"0044a7c0-5f55-4983-aef9-b2869094bc21","ref_index":1,"cited_arxiv_id":"","is_internal_anchor":false},{"doi":"","year":null,"title":"arXiv preprint arXiv:2411.14257 , year=","work_id":"04270402-51cd-4d44-93c3-e0b3b5661b57","ref_index":2,"cited_arxiv_id":"","is_internal_anchor":false},{"doi":"","year":2025,"title":"Lv, Zhengyao and Pan, Tianlin and Si, Chenyang and Chen, Zhaoxi and Zuo, Wangmeng and Liu, Ziwei and Wong, Kwan-Yee K. , title =. Proceedings of the IEEE/CVF International Conference on Computer Visio","work_id":"eb151b1e-d27a-47cc-b298-ee1cbbe72ca7","ref_index":3,"cited_arxiv_id":"","is_internal_anchor":false},{"doi":"","year":null,"title":"arXiv preprint arXiv:2509.18096 (2025) 4","work_id":"1d9fc1c1-c3b4-45a1-8912-e8dc6c1279dd","ref_index":4,"cited_arxiv_id":"","is_internal_anchor":false},{"doi":"","year":2023,"title":"ACM transactions on Graphics (TOG) , volume=","work_id":"4b7b98c5-9008-4a51-82e5-743acca79a8e","ref_index":5,"cited_arxiv_id":"","is_internal_anchor":false}],"resolved_work":57,"snapshot_sha256":"ad93b249747715b0d86c716884d808d805079e5af8057f9166892928a04aeeae","internal_anchors":6},"formal_canon":{"evidence_count":2,"snapshot_sha256":"09dd5c6cc10568a43870bcc33d46a71e8683b4ca379daca0c6b65198da41601b"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":"87ab0f90-4d39-413b-8492-147c9670aa34"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-17T23:39:10Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"udi7m6xUtZdnz5FpWd5pm+G75tHrcRUgAGI16P7dysX0+lHaVgSXr4nVLf9X0lqVM8hUuNXru7Grr/BVUUO8DQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-10T03:50:46.805728Z"},"content_sha256":"40f417c2feb907a57c3095e0cab3c268ef051b2033ec6ffaf3541d456cebc3b0","schema_version":"1.0","event_id":"sha256:40f417c2feb907a57c3095e0cab3c268ef051b2033ec6ffaf3541d456cebc3b0"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/UV2W7EERDOESOABOZG2OKDUNJI/bundle.json","state_url":"https://pith.science/pith/UV2W7EERDOESOABOZG2OKDUNJI/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/UV2W7EERDOESOABOZG2OKDUNJI/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-10T03:50:46Z","links":{"resolver":"https://pith.science/pith/UV2W7EERDOESOABOZG2OKDUNJI","bundle":"https://pith.science/pith/UV2W7EERDOESOABOZG2OKDUNJI/bundle.json","state":"https://pith.science/pith/UV2W7EERDOESOABOZG2OKDUNJI/state.json","well_known_bundle":"https://pith.science/.well-known/pith/UV2W7EERDOESOABOZG2OKDUNJI/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:UV2W7EERDOESOABOZG2OKDUNJI","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"ec2ce47ae512cbd714bc8f33cd09fd4119f46b878f970d0994a0eda7af641263","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CV","submitted_at":"2026-05-14T02:14:09Z","title_canon_sha256":"a8472a8d08f536ec2bd0dcf679c4a7122f7afd7f8e9eb268ec5371e480df7ac8"},"schema_version":"1.0","source":{"id":"2605.14270","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2605.14270","created_at":"2026-05-17T23:39:10Z"},{"alias_kind":"arxiv_version","alias_value":"2605.14270v1","created_at":"2026-05-17T23:39:10Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.14270","created_at":"2026-05-17T23:39:10Z"},{"alias_kind":"pith_short_12","alias_value":"UV2W7EERDOES","created_at":"2026-05-18T12:33:37Z"},{"alias_kind":"pith_short_16","alias_value":"UV2W7EERDOESOABO","created_at":"2026-05-18T12:33:37Z"},{"alias_kind":"pith_short_8","alias_value":"UV2W7EER","created_at":"2026-05-18T12:33:37Z"}],"graph_snapshots":[{"event_id":"sha256:40f417c2feb907a57c3095e0cab3c268ef051b2033ec6ffaf3541d456cebc3b0","target":"graph","created_at":"2026-05-17T23:39:10Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":4,"items":[{"attestation":"unclaimed","claim_id":"C1","kind":"strongest_claim","source":"verdict.strongest_claim","status":"machine_extracted","text":"By performing linear probing on text tokens, we demonstrate that text embeddings can distinguish a characteristic `omission signal' representing the absence of target concepts. Leveraging this insight, we propose Omission Signal Intervention (OSI), which amplifies the omission signal to actively catalyze the generation of missing concepts."},{"attestation":"unclaimed","claim_id":"C2","kind":"weakest_assumption","source":"verdict.weakest_assumption","status":"machine_extracted","text":"That the omission signal identified by linear probing is causal for concept omission and that amplifying it will reliably add missing concepts without introducing new artifacts or degrading image quality."},{"attestation":"unclaimed","claim_id":"C3","kind":"one_line_summary","source":"verdict.one_line_summary","status":"machine_extracted","text":"Text embeddings in MM-DiTs contain a detectable omission signal for missing concepts, and amplifying it via OSI reduces concept omission in generated images on FLUX.1-Dev and SD3.5-Medium."},{"attestation":"unclaimed","claim_id":"C4","kind":"headline","source":"verdict.pith_extraction.headline","status":"machine_extracted","text":"Text embeddings in multimodal diffusion transformers encode a detectable omission signal that can be amplified to include missing concepts in generated images."}],"snapshot_sha256":"954e2cbd0a87c40dca67382805c2cc94c91ed14909da65ca63386e32c7f3924a"},"formal_canon":{"evidence_count":2,"snapshot_sha256":"09dd5c6cc10568a43870bcc33d46a71e8683b4ca379daca0c6b65198da41601b"},"paper":{"abstract_excerpt":"Multimodal Diffusion Transformers (MM-DiTs) have achieved remarkable progress in text-to-image generation, yet they frequently suffer from concept omission, where specified objects or attributes fail to emerge in the generated image. By performing linear probing on text tokens, we demonstrate that text embeddings can distinguish a characteristic `omission signal' representing the absence of target concepts. Leveraging this insight, we propose Omission Signal Intervention (OSI), which amplifies the omission signal to actively catalyze the generation of missing concepts. Comprehensive experiment","authors_text":"Chaehun Shin, Jaihyun Lew, Jungbeom Lee, Kanghyun Baek, Sungroh Yoon","cross_cats":[],"headline":"Text embeddings in multimodal diffusion transformers encode a detectable omission signal that can be amplified to include missing concepts in generated images.","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CV","submitted_at":"2026-05-14T02:14:09Z","title":"Diagnosing and Correcting Concept Omission in Multimodal Diffusion Transformers"},"references":{"count":57,"internal_anchors":6,"resolved_work":57,"sample":[{"cited_arxiv_id":"","doi":"","is_internal_anchor":false,"ref_index":1,"title":"Advances in Neural Information Processing Systems , volume=","work_id":"0044a7c0-5f55-4983-aef9-b2869094bc21","year":null},{"cited_arxiv_id":"","doi":"","is_internal_anchor":false,"ref_index":2,"title":"arXiv preprint arXiv:2411.14257 , year=","work_id":"04270402-51cd-4d44-93c3-e0b3b5661b57","year":null},{"cited_arxiv_id":"","doi":"","is_internal_anchor":false,"ref_index":3,"title":"Lv, Zhengyao and Pan, Tianlin and Si, Chenyang and Chen, Zhaoxi and Zuo, Wangmeng and Liu, Ziwei and Wong, Kwan-Yee K. , title =. Proceedings of the IEEE/CVF International Conference on Computer Visio","work_id":"eb151b1e-d27a-47cc-b298-ee1cbbe72ca7","year":2025},{"cited_arxiv_id":"","doi":"","is_internal_anchor":false,"ref_index":4,"title":"arXiv preprint arXiv:2509.18096 (2025) 4","work_id":"1d9fc1c1-c3b4-45a1-8912-e8dc6c1279dd","year":null},{"cited_arxiv_id":"","doi":"","is_internal_anchor":false,"ref_index":5,"title":"ACM transactions on Graphics (TOG) , volume=","work_id":"4b7b98c5-9008-4a51-82e5-743acca79a8e","year":2023}],"snapshot_sha256":"ad93b249747715b0d86c716884d808d805079e5af8057f9166892928a04aeeae"},"source":{"id":"2605.14270","kind":"arxiv","version":1},"verdict":{"created_at":"2026-05-15T02:42:56.787920Z","id":"87ab0f90-4d39-413b-8492-147c9670aa34","model_set":{"reader":"grok-4.3"},"one_line_summary":"Text embeddings in MM-DiTs contain a detectable omission signal for missing concepts, and amplifying it via OSI reduces concept omission in generated images on FLUX.1-Dev and SD3.5-Medium.","pipeline_version":"pith-pipeline@v0.9.0","pith_extraction_headline":"Text embeddings in multimodal diffusion transformers encode a detectable omission signal that can be amplified to include missing concepts in generated images.","strongest_claim":"By performing linear probing on text tokens, we demonstrate that text embeddings can distinguish a characteristic `omission signal' representing the absence of target concepts. Leveraging this insight, we propose Omission Signal Intervention (OSI), which amplifies the omission signal to actively catalyze the generation of missing concepts.","weakest_assumption":"That the omission signal identified by linear probing is causal for concept omission and that amplifying it will reliably add missing concepts without introducing new artifacts or degrading image quality."}},"verdict_id":"87ab0f90-4d39-413b-8492-147c9670aa34"}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:4c6ed9fd970bd2647ce16acb37b7c0a6eec8ad5557b1e1a58b205936499f1074","target":"record","created_at":"2026-05-17T23:39:10Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"ec2ce47ae512cbd714bc8f33cd09fd4119f46b878f970d0994a0eda7af641263","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CV","submitted_at":"2026-05-14T02:14:09Z","title_canon_sha256":"a8472a8d08f536ec2bd0dcf679c4a7122f7afd7f8e9eb268ec5371e480df7ac8"},"schema_version":"1.0","source":{"id":"2605.14270","kind":"arxiv","version":1}},"canonical_sha256":"a5756f90911b8927002ec9b4e50e8d4a0556ca347a1ae91b050b92aac68158e7","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"a5756f90911b8927002ec9b4e50e8d4a0556ca347a1ae91b050b92aac68158e7","first_computed_at":"2026-05-17T23:39:10.404862Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-17T23:39:10.404862Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"UQetcYtZymwhKTqPHiTqdfnCg+BVQX5R4z3icf9kz5WTzTHCPO3sgzEkmDl68pTwXehpX6X9vcvxAhNxkRThAw==","signature_status":"signed_v1","signed_at":"2026-05-17T23:39:10.405357Z","signed_message":"canonical_sha256_bytes"},"source_id":"2605.14270","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:4c6ed9fd970bd2647ce16acb37b7c0a6eec8ad5557b1e1a58b205936499f1074","sha256:40f417c2feb907a57c3095e0cab3c268ef051b2033ec6ffaf3541d456cebc3b0"],"state_sha256":"c20129bfdcb1f9d0b0c8c75752023a6576e7224470d8e70b438e6e552f5d8cd1"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"8oPFuM7JBoduHb/1GSE+tKdpd0iwKfX7XziTcfCPhbSQ48wLk+dfuX4l+A+dae5j4AhOg7Zvwht0TueZ6frYBg==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-10T03:50:46.811144Z","bundle_sha256":"411d4a5259fd4493ad19bb2cb294739c8279b06f733fc1d3ce05c37ec877c368"}}