{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2026:J7V6AKU5W7NYW2367TSYDW4L65","short_pith_number":"pith:J7V6AKU5","canonical_record":{"source":{"id":"2605.13999","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2026-05-13T18:08:16Z","cross_cats_sorted":[],"title_canon_sha256":"ea0d26734fdc97cdf6fecf4d4a4e6e8c5fec0f9b6812536716058507d2cf62aa","abstract_canon_sha256":"f3a02ca88f918fa7d5f92f7bda1e6270c4c9abc34503a96afaad3ebca256c6a8"},"schema_version":"1.0"},"canonical_sha256":"4febe02a9db7db8b6b7efce581db8bf740a05d4b3feab80df64d0b6cd164dd04","source":{"kind":"arxiv","id":"2605.13999","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2605.13999","created_at":"2026-05-17T23:39:13Z"},{"alias_kind":"arxiv_version","alias_value":"2605.13999v1","created_at":"2026-05-17T23:39:13Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.13999","created_at":"2026-05-17T23:39:13Z"},{"alias_kind":"pith_short_12","alias_value":"J7V6AKU5W7NY","created_at":"2026-05-18T12:33:37Z"},{"alias_kind":"pith_short_16","alias_value":"J7V6AKU5W7NYW236","created_at":"2026-05-18T12:33:37Z"},{"alias_kind":"pith_short_8","alias_value":"J7V6AKU5","created_at":"2026-05-18T12:33:37Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2026:J7V6AKU5W7NYW2367TSYDW4L65","target":"record","payload":{"canonical_record":{"source":{"id":"2605.13999","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2026-05-13T18:08:16Z","cross_cats_sorted":[],"title_canon_sha256":"ea0d26734fdc97cdf6fecf4d4a4e6e8c5fec0f9b6812536716058507d2cf62aa","abstract_canon_sha256":"f3a02ca88f918fa7d5f92f7bda1e6270c4c9abc34503a96afaad3ebca256c6a8"},"schema_version":"1.0"},"canonical_sha256":"4febe02a9db7db8b6b7efce581db8bf740a05d4b3feab80df64d0b6cd164dd04","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-17T23:39:13.174161Z","signature_b64":"MWMEbooxMd8ERYEY6SNoD4uvZB4X1yJyvtmPLCOl1aS6UUy/dpEgd1kqtt71nEzCVJh8l5EPxTranCputqTrCQ==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"4febe02a9db7db8b6b7efce581db8bf740a05d4b3feab80df64d0b6cd164dd04","last_reissued_at":"2026-05-17T23:39:13.173623Z","signature_status":"signed_v1","first_computed_at":"2026-05-17T23:39:13.173623Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2605.13999","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-17T23:39:13Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"JBQ3EzWo/P2pyM60sULVu7d3pR6cEIMaW5zOvqe69pZkYS3jUF8ElzBc/M2gOJC0D1qKQyTCaF6cKGc35XvkDA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-07T17:40:36.883648Z"},"content_sha256":"b196fb495760aec3b283d5784259202f40435eb0227e02523e71a70827f1e5ef","schema_version":"1.0","event_id":"sha256:b196fb495760aec3b283d5784259202f40435eb0227e02523e71a70827f1e5ef"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2026:J7V6AKU5W7NYW2367TSYDW4L65","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Support Before Frequency in Discrete Diffusion","license":"http://creativecommons.org/licenses/by/4.0/","headline":"Discrete diffusion models learn data support before frequencies.","cross_cats":[],"primary_cat":"cs.LG","authors_text":"Adrian M\\\"uller, Antoine Gonon, Niao He, Ya-Ping Hsieh, Zebang Shen","submitted_at":"2026-05-13T18:08:16Z","abstract_excerpt":"Discrete diffusion models are increasingly competitive for language modeling, yet it remains unclear how their denoising objectives organize learning. Although these objectives target the full data distribution, we show that the exact reverse process induces a hierarchy between coarse support information and finer frequency information. For uniform and absorbing (a.k.a. masking) diffusion, we prove that, in the small-noise regime of the final denoising steps, each single-token reverse edit decomposes into a leading scale, determined by whether it moves toward the data support (e.g., grammatica"},"claims":{"count":4,"items":[{"kind":"strongest_claim","text":"the exact reverse process induces a hierarchy between coarse support information and finer frequency information... discrete diffusion models learn data support before data frequencies","source":"verdict.strongest_claim","status":"machine_extracted","claim_id":"C1","attestation":"unclaimed"},{"kind":"weakest_assumption","text":"the decomposition into leading scale and finer coefficient holds in the small-noise regime of the final denoising steps","source":"verdict.weakest_assumption","status":"machine_extracted","claim_id":"C2","attestation":"unclaimed"},{"kind":"one_line_summary","text":"Discrete diffusion models learn data support before frequencies because the exact reverse process decomposes edits into a dominant validity scale and a finer probability coefficient.","source":"verdict.one_line_summary","status":"machine_extracted","claim_id":"C3","attestation":"unclaimed"},{"kind":"headline","text":"Discrete diffusion models learn data support before frequencies.","source":"verdict.pith_extraction.headline","status":"machine_extracted","claim_id":"C4","attestation":"unclaimed"}],"snapshot_sha256":"fe2755bec9e80ac5656d8d473b5a14b5f6374af94b994e138b0ecd8467736a38"},"source":{"id":"2605.13999","kind":"arxiv","version":1},"verdict":{"id":"c9179bd8-5abe-4559-a376-f4906381af4a","model_set":{"reader":"grok-4.3"},"created_at":"2026-05-15T05:45:02.233637Z","strongest_claim":"the exact reverse process induces a hierarchy between coarse support information and finer frequency information... discrete diffusion models learn data support before data frequencies","one_line_summary":"Discrete diffusion models learn data support before frequencies because the exact reverse process decomposes edits into a dominant validity scale and a finer probability coefficient.","pipeline_version":"pith-pipeline@v0.9.0","weakest_assumption":"the decomposition into leading scale and finer coefficient holds in the small-noise regime of the final denoising steps","pith_extraction_headline":"Discrete diffusion models learn data support before frequencies."},"references":{"count":37,"sample":[{"doi":"","year":1963,"title":"Thompson, A. C. , title =. Proceedings of the American Mathematical Society , volume =. 1963 , doi =","work_id":"d9369e7f-e917-4d1e-9b32-1a6cbeb4a4db","ref_index":1,"cited_arxiv_id":"","is_internal_anchor":false},{"doi":"","year":null,"title":"Advances in Neural Information Processing Systems , volume=","work_id":"22361021-9b89-4016-80aa-c572a4450d42","ref_index":2,"cited_arxiv_id":"","is_internal_anchor":false},{"doi":"","year":null,"title":"S., and Kuleshov, V","work_id":"ce8df7d8-7fe0-475b-8258-108354ad295b","ref_index":3,"cited_arxiv_id":"","is_internal_anchor":false},{"doi":"","year":null,"title":"Proceedings of the 42nd International Conference on Machine Learning , series=","work_id":"4aa3a434-36c8-41d8-8a28-843b5f56bce0","ref_index":4,"cited_arxiv_id":"","is_internal_anchor":false},{"doi":"","year":null,"title":"The Diffusion Duality, Chapter II:","work_id":"69a68fd3-9b09-4d29-b4b6-bde058d7d86c","ref_index":5,"cited_arxiv_id":"","is_internal_anchor":false}],"resolved_work":37,"snapshot_sha256":"54e7e8c4e548c9ce6518d627d27ac25187789ea1ff8a13d2ec6e0dd1a26659dc","internal_anchors":6},"formal_canon":{"evidence_count":2,"snapshot_sha256":"2f3f47c3295ced330db290f51c04a15ba6dd45366c5bd3eb348a53738612a590"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":"c9179bd8-5abe-4559-a376-f4906381af4a"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-17T23:39:13Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"aRKnU/VtoHt7U7Yj5KTacyyBvBGNv2DcqxywPYbccYwBNt3kwXu9mWf8p0jE0Lm/qaZy8jZn917gtUNzr/rqBg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-07T17:40:36.884677Z"},"content_sha256":"de072c827a2c37fd14cd4a0f5254088145d0e46a23c69584e0cbc8a681d97930","schema_version":"1.0","event_id":"sha256:de072c827a2c37fd14cd4a0f5254088145d0e46a23c69584e0cbc8a681d97930"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/J7V6AKU5W7NYW2367TSYDW4L65/bundle.json","state_url":"https://pith.science/pith/J7V6AKU5W7NYW2367TSYDW4L65/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/J7V6AKU5W7NYW2367TSYDW4L65/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-07T17:40:36Z","links":{"resolver":"https://pith.science/pith/J7V6AKU5W7NYW2367TSYDW4L65","bundle":"https://pith.science/pith/J7V6AKU5W7NYW2367TSYDW4L65/bundle.json","state":"https://pith.science/pith/J7V6AKU5W7NYW2367TSYDW4L65/state.json","well_known_bundle":"https://pith.science/.well-known/pith/J7V6AKU5W7NYW2367TSYDW4L65/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:J7V6AKU5W7NYW2367TSYDW4L65","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"f3a02ca88f918fa7d5f92f7bda1e6270c4c9abc34503a96afaad3ebca256c6a8","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2026-05-13T18:08:16Z","title_canon_sha256":"ea0d26734fdc97cdf6fecf4d4a4e6e8c5fec0f9b6812536716058507d2cf62aa"},"schema_version":"1.0","source":{"id":"2605.13999","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2605.13999","created_at":"2026-05-17T23:39:13Z"},{"alias_kind":"arxiv_version","alias_value":"2605.13999v1","created_at":"2026-05-17T23:39:13Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.13999","created_at":"2026-05-17T23:39:13Z"},{"alias_kind":"pith_short_12","alias_value":"J7V6AKU5W7NY","created_at":"2026-05-18T12:33:37Z"},{"alias_kind":"pith_short_16","alias_value":"J7V6AKU5W7NYW236","created_at":"2026-05-18T12:33:37Z"},{"alias_kind":"pith_short_8","alias_value":"J7V6AKU5","created_at":"2026-05-18T12:33:37Z"}],"graph_snapshots":[{"event_id":"sha256:de072c827a2c37fd14cd4a0f5254088145d0e46a23c69584e0cbc8a681d97930","target":"graph","created_at":"2026-05-17T23:39:13Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":4,"items":[{"attestation":"unclaimed","claim_id":"C1","kind":"strongest_claim","source":"verdict.strongest_claim","status":"machine_extracted","text":"the exact reverse process induces a hierarchy between coarse support information and finer frequency information... discrete diffusion models learn data support before data frequencies"},{"attestation":"unclaimed","claim_id":"C2","kind":"weakest_assumption","source":"verdict.weakest_assumption","status":"machine_extracted","text":"the decomposition into leading scale and finer coefficient holds in the small-noise regime of the final denoising steps"},{"attestation":"unclaimed","claim_id":"C3","kind":"one_line_summary","source":"verdict.one_line_summary","status":"machine_extracted","text":"Discrete diffusion models learn data support before frequencies because the exact reverse process decomposes edits into a dominant validity scale and a finer probability coefficient."},{"attestation":"unclaimed","claim_id":"C4","kind":"headline","source":"verdict.pith_extraction.headline","status":"machine_extracted","text":"Discrete diffusion models learn data support before frequencies."}],"snapshot_sha256":"fe2755bec9e80ac5656d8d473b5a14b5f6374af94b994e138b0ecd8467736a38"},"formal_canon":{"evidence_count":2,"snapshot_sha256":"2f3f47c3295ced330db290f51c04a15ba6dd45366c5bd3eb348a53738612a590"},"paper":{"abstract_excerpt":"Discrete diffusion models are increasingly competitive for language modeling, yet it remains unclear how their denoising objectives organize learning. Although these objectives target the full data distribution, we show that the exact reverse process induces a hierarchy between coarse support information and finer frequency information. For uniform and absorbing (a.k.a. masking) diffusion, we prove that, in the small-noise regime of the final denoising steps, each single-token reverse edit decomposes into a leading scale, determined by whether it moves toward the data support (e.g., grammatica","authors_text":"Adrian M\\\"uller, Antoine Gonon, Niao He, Ya-Ping Hsieh, Zebang Shen","cross_cats":[],"headline":"Discrete diffusion models learn data support before frequencies.","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2026-05-13T18:08:16Z","title":"Support Before Frequency in Discrete Diffusion"},"references":{"count":37,"internal_anchors":6,"resolved_work":37,"sample":[{"cited_arxiv_id":"","doi":"","is_internal_anchor":false,"ref_index":1,"title":"Thompson, A. C. , title =. Proceedings of the American Mathematical Society , volume =. 1963 , doi =","work_id":"d9369e7f-e917-4d1e-9b32-1a6cbeb4a4db","year":1963},{"cited_arxiv_id":"","doi":"","is_internal_anchor":false,"ref_index":2,"title":"Advances in Neural Information Processing Systems , volume=","work_id":"22361021-9b89-4016-80aa-c572a4450d42","year":null},{"cited_arxiv_id":"","doi":"","is_internal_anchor":false,"ref_index":3,"title":"S., and Kuleshov, V","work_id":"ce8df7d8-7fe0-475b-8258-108354ad295b","year":null},{"cited_arxiv_id":"","doi":"","is_internal_anchor":false,"ref_index":4,"title":"Proceedings of the 42nd International Conference on Machine Learning , series=","work_id":"4aa3a434-36c8-41d8-8a28-843b5f56bce0","year":null},{"cited_arxiv_id":"","doi":"","is_internal_anchor":false,"ref_index":5,"title":"The Diffusion Duality, Chapter II:","work_id":"69a68fd3-9b09-4d29-b4b6-bde058d7d86c","year":null}],"snapshot_sha256":"54e7e8c4e548c9ce6518d627d27ac25187789ea1ff8a13d2ec6e0dd1a26659dc"},"source":{"id":"2605.13999","kind":"arxiv","version":1},"verdict":{"created_at":"2026-05-15T05:45:02.233637Z","id":"c9179bd8-5abe-4559-a376-f4906381af4a","model_set":{"reader":"grok-4.3"},"one_line_summary":"Discrete diffusion models learn data support before frequencies because the exact reverse process decomposes edits into a dominant validity scale and a finer probability coefficient.","pipeline_version":"pith-pipeline@v0.9.0","pith_extraction_headline":"Discrete diffusion models learn data support before frequencies.","strongest_claim":"the exact reverse process induces a hierarchy between coarse support information and finer frequency information... discrete diffusion models learn data support before data frequencies","weakest_assumption":"the decomposition into leading scale and finer coefficient holds in the small-noise regime of the final denoising steps"}},"verdict_id":"c9179bd8-5abe-4559-a376-f4906381af4a"}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:b196fb495760aec3b283d5784259202f40435eb0227e02523e71a70827f1e5ef","target":"record","created_at":"2026-05-17T23:39:13Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"f3a02ca88f918fa7d5f92f7bda1e6270c4c9abc34503a96afaad3ebca256c6a8","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2026-05-13T18:08:16Z","title_canon_sha256":"ea0d26734fdc97cdf6fecf4d4a4e6e8c5fec0f9b6812536716058507d2cf62aa"},"schema_version":"1.0","source":{"id":"2605.13999","kind":"arxiv","version":1}},"canonical_sha256":"4febe02a9db7db8b6b7efce581db8bf740a05d4b3feab80df64d0b6cd164dd04","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"4febe02a9db7db8b6b7efce581db8bf740a05d4b3feab80df64d0b6cd164dd04","first_computed_at":"2026-05-17T23:39:13.173623Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-17T23:39:13.173623Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"MWMEbooxMd8ERYEY6SNoD4uvZB4X1yJyvtmPLCOl1aS6UUy/dpEgd1kqtt71nEzCVJh8l5EPxTranCputqTrCQ==","signature_status":"signed_v1","signed_at":"2026-05-17T23:39:13.174161Z","signed_message":"canonical_sha256_bytes"},"source_id":"2605.13999","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:b196fb495760aec3b283d5784259202f40435eb0227e02523e71a70827f1e5ef","sha256:de072c827a2c37fd14cd4a0f5254088145d0e46a23c69584e0cbc8a681d97930"],"state_sha256":"976ea88391ad42f8946a6f9ff50cb4962511ff9a4dfb0fe03a1e7b327b470f7c"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"wt7juGi1XdqjD+pWMQ+K4cxifkAuQGrKWaCHnw+KHGFv+9B0NlsBQ4l02RILfzHHJo8gMTjJinygDOm2WwTyAA==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-07T17:40:36.889826Z","bundle_sha256":"ba94c9e4fbfa66c07de65a06bb020b40eb79960c98c193e8bfcf6f894a2ec4fc"}}