{"record_type":"pith_number_record","schema_url":"https://pith.science/schemas/pith-number/v1.json","pith_number":"pith:2026:W7NBKMVHNFGEO77K5SN475LPHC","short_pith_number":"pith:W7NBKMVH","schema_version":"1.0","canonical_sha256":"b7da1532a7694c477feaec9bcff56f38ab5b46f6930f81829196aa191da515fe","source":{"kind":"arxiv","id":"2606.04486","version":1},"attestation_state":"computed","paper":{"title":"Global Sketch-Based Watermarking for Diffusion Language Models","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":["cs.CL","cs.LG","stat.ML"],"primary_cat":"cs.CR","authors_text":"Daniel Zhao","submitted_at":"2026-06-03T06:08:58Z","abstract_excerpt":"Watermarking methods for language models have been studied extensively in the autoregressive setting, where tokens are generated sequentially. These works largely focus on local-context schemes that perturb the next token's distribution as a function of its preceding tokens. In diffusion language models, distributions over many unresolved positions are jointly sampled, allowing additive statistics of the entire sequence to be tractable during generation. We propose a watermark for masked diffusion language models that controls a global, vector-valued sketch representation of the text. Compared"},"verification_status":{"content_addressed":true,"pith_receipt":true,"author_attested":false,"weak_author_claims":0,"strong_author_claims":0,"externally_anchored":false,"storage_verified":false,"citation_signatures":0,"replication_records":0,"graph_snapshot":true,"references_resolved":false,"formal_links_present":false},"canonical_record":{"source":{"id":"2606.04486","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CR","submitted_at":"2026-06-03T06:08:58Z","cross_cats_sorted":["cs.CL","cs.LG","stat.ML"],"title_canon_sha256":"9bb8b29a0f49c0611d32aa329664509b4dac60539e5015b2128fa36792ee53be","abstract_canon_sha256":"3c7a1ecb217ecde438813ae1adfba11e171a695a3edc7df7cecb08b6e9f26c1a"},"schema_version":"1.0"},"receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-06-04T01:09:10.166423Z","signature_b64":"9URrmN//dIUx3EmliZ1xrPNvqvo4Y8l/9QEFax52e/lF+Ia82cP5rr/VvxdUejjKjM2npS6cu/2OlheKAHgJDw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"b7da1532a7694c477feaec9bcff56f38ab5b46f6930f81829196aa191da515fe","last_reissued_at":"2026-06-04T01:09:10.165735Z","signature_status":"signed_v1","first_computed_at":"2026-06-04T01:09:10.165735Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"graph_snapshot":{"paper":{"title":"Global Sketch-Based Watermarking for Diffusion Language Models","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":["cs.CL","cs.LG","stat.ML"],"primary_cat":"cs.CR","authors_text":"Daniel Zhao","submitted_at":"2026-06-03T06:08:58Z","abstract_excerpt":"Watermarking methods for language models have been studied extensively in the autoregressive setting, where tokens are generated sequentially. These works largely focus on local-context schemes that perturb the next token's distribution as a function of its preceding tokens. In diffusion language models, distributions over many unresolved positions are jointly sampled, allowing additive statistics of the entire sequence to be tractable during generation. We propose a watermark for masked diffusion language models that controls a global, vector-valued sketch representation of the text. Compared"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.04486","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2606.04486/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"aliases":[{"alias_kind":"arxiv","alias_value":"2606.04486","created_at":"2026-06-04T01:09:10.165839+00:00"},{"alias_kind":"arxiv_version","alias_value":"2606.04486v1","created_at":"2026-06-04T01:09:10.165839+00:00"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.04486","created_at":"2026-06-04T01:09:10.165839+00:00"},{"alias_kind":"pith_short_12","alias_value":"W7NBKMVHNFGE","created_at":"2026-06-04T01:09:10.165839+00:00"},{"alias_kind":"pith_short_16","alias_value":"W7NBKMVHNFGEO77K","created_at":"2026-06-04T01:09:10.165839+00:00"},{"alias_kind":"pith_short_8","alias_value":"W7NBKMVH","created_at":"2026-06-04T01:09:10.165839+00:00"}],"events":[],"event_summary":{},"paper_claims":[],"inbound_citations":{"count":0,"internal_anchor_count":0,"sample":[]},"formal_canon":{"evidence_count":0,"sample":[],"anchors":[]},"links":{"html":"https://pith.science/pith/W7NBKMVHNFGEO77K5SN475LPHC","json":"https://pith.science/pith/W7NBKMVHNFGEO77K5SN475LPHC.json","graph_json":"https://pith.science/api/pith-number/W7NBKMVHNFGEO77K5SN475LPHC/graph.json","events_json":"https://pith.science/api/pith-number/W7NBKMVHNFGEO77K5SN475LPHC/events.json","paper":"https://pith.science/paper/W7NBKMVH"},"agent_actions":{"view_html":"https://pith.science/pith/W7NBKMVHNFGEO77K5SN475LPHC","download_json":"https://pith.science/pith/W7NBKMVHNFGEO77K5SN475LPHC.json","view_paper":"https://pith.science/paper/W7NBKMVH","resolve_alias":"https://pith.science/api/pith-number/resolve?arxiv=2606.04486&json=true","fetch_graph":"https://pith.science/api/pith-number/W7NBKMVHNFGEO77K5SN475LPHC/graph.json","fetch_events":"https://pith.science/api/pith-number/W7NBKMVHNFGEO77K5SN475LPHC/events.json","actions":{"anchor_timestamp":"https://pith.science/pith/W7NBKMVHNFGEO77K5SN475LPHC/action/timestamp_anchor","attest_storage":"https://pith.science/pith/W7NBKMVHNFGEO77K5SN475LPHC/action/storage_attestation","attest_author":"https://pith.science/pith/W7NBKMVHNFGEO77K5SN475LPHC/action/author_attestation","sign_citation":"https://pith.science/pith/W7NBKMVHNFGEO77K5SN475LPHC/action/citation_signature","submit_replication":"https://pith.science/pith/W7NBKMVHNFGEO77K5SN475LPHC/action/replication_record"}},"created_at":"2026-06-04T01:09:10.165839+00:00","updated_at":"2026-06-04T01:09:10.165839+00:00"}