{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2026:LTJFUCK5ZM3BSYLOHFN27E7Y3B","short_pith_number":"pith:LTJFUCK5","canonical_record":{"source":{"id":"2605.27268","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2026-05-26T16:44:25Z","cross_cats_sorted":["cs.AI"],"title_canon_sha256":"4f565736fe728e0535c9a20da4d4138170dcf4fd4cd8a4fea40366c34c9af145","abstract_canon_sha256":"c2454c63f4ce3958b128f4ffa96e718cffcfc978869d3dbcb7320b6c4052d0f1"},"schema_version":"1.0"},"canonical_sha256":"5cd25a095dcb3619616e395baf93f8d85686a1934ef7ab16852a8bd953a7b55b","source":{"kind":"arxiv","id":"2605.27268","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2605.27268","created_at":"2026-05-27T02:06:09Z"},{"alias_kind":"arxiv_version","alias_value":"2605.27268v1","created_at":"2026-05-27T02:06:09Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.27268","created_at":"2026-05-27T02:06:09Z"},{"alias_kind":"pith_short_12","alias_value":"LTJFUCK5ZM3B","created_at":"2026-05-27T02:06:09Z"},{"alias_kind":"pith_short_16","alias_value":"LTJFUCK5ZM3BSYLO","created_at":"2026-05-27T02:06:09Z"},{"alias_kind":"pith_short_8","alias_value":"LTJFUCK5","created_at":"2026-05-27T02:06:09Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2026:LTJFUCK5ZM3BSYLOHFN27E7Y3B","target":"record","payload":{"canonical_record":{"source":{"id":"2605.27268","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2026-05-26T16:44:25Z","cross_cats_sorted":["cs.AI"],"title_canon_sha256":"4f565736fe728e0535c9a20da4d4138170dcf4fd4cd8a4fea40366c34c9af145","abstract_canon_sha256":"c2454c63f4ce3958b128f4ffa96e718cffcfc978869d3dbcb7320b6c4052d0f1"},"schema_version":"1.0"},"canonical_sha256":"5cd25a095dcb3619616e395baf93f8d85686a1934ef7ab16852a8bd953a7b55b","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-27T02:06:09.121158Z","signature_b64":"T5F0DKVr4VM0kmoXxySlsNkQ0K6s+PDGq+c5rvChyzMktZvxBJ+6jw6xkeqNIDQbGmlJbJZqkp6jgcqbYLN9Dw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"5cd25a095dcb3619616e395baf93f8d85686a1934ef7ab16852a8bd953a7b55b","last_reissued_at":"2026-05-27T02:06:09.120688Z","signature_status":"signed_v1","first_computed_at":"2026-05-27T02:06:09.120688Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2605.27268","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-27T02:06:09Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"aoeJrQmbl/QhZaMNCdSVErNJa60TH+djhGxs0I/ANPgkUJZL6On9bYGyzP0XQjI0epJela103s6QfoGjlk95Dg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-01T16:09:42.411774Z"},"content_sha256":"70b66153e3289a852936b5230ea4ace71a7dea921ae2061ed6555c902e90f22e","schema_version":"1.0","event_id":"sha256:70b66153e3289a852936b5230ea4ace71a7dea921ae2061ed6555c902e90f22e"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2026:LTJFUCK5ZM3BSYLOHFN27E7Y3B","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Lost in Sampling: Assessing Lexical Reachability in LLMs via the Word Coverage Score (WCS)","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":["cs.AI"],"primary_cat":"cs.CL","authors_text":"Carlos Arriaga, Javier Conde, Javier Coronado-Bl\\'azquez, Pedro Reviriego, Samer Awad, Tairan Fu","submitted_at":"2026-05-26T16:44:25Z","abstract_excerpt":"Modern Large Language Models (LLMs) are often criticized for producing repetitive and homogeneous text, despite possessing vast latent vocabularies. While previous research has focused on model knowledge and training data, we investigate the role of decoding mechanics in suppressing linguistic diversity. We introduce the Word Coverage Score (WCS), a metric that quantifies the extent to which contextually appropriate human vocabulary is mathematically pruned by standard sampling filters (e.g., Top-$p$, Top-$k$, and Min-$p$). Rather than assessing static knowledge, the WCS measures the lexical s"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2605.27268","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2605.27268/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-27T02:06:09Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"iTt38U2eVo0k+9vtliyZLsernBP2nQmTI46GltE32lpFPivzTAcbQJfXOwU1tzB0uNcdEpU7hrnjUw/go2ZpCg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-01T16:09:42.412150Z"},"content_sha256":"98f2316d69fd75652661bfdae504e35a6e392a4318a41fd851c86c1af8c7b23a","schema_version":"1.0","event_id":"sha256:98f2316d69fd75652661bfdae504e35a6e392a4318a41fd851c86c1af8c7b23a"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/LTJFUCK5ZM3BSYLOHFN27E7Y3B/bundle.json","state_url":"https://pith.science/pith/LTJFUCK5ZM3BSYLOHFN27E7Y3B/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/LTJFUCK5ZM3BSYLOHFN27E7Y3B/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-01T16:09:42Z","links":{"resolver":"https://pith.science/pith/LTJFUCK5ZM3BSYLOHFN27E7Y3B","bundle":"https://pith.science/pith/LTJFUCK5ZM3BSYLOHFN27E7Y3B/bundle.json","state":"https://pith.science/pith/LTJFUCK5ZM3BSYLOHFN27E7Y3B/state.json","well_known_bundle":"https://pith.science/.well-known/pith/LTJFUCK5ZM3BSYLOHFN27E7Y3B/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:LTJFUCK5ZM3BSYLOHFN27E7Y3B","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"c2454c63f4ce3958b128f4ffa96e718cffcfc978869d3dbcb7320b6c4052d0f1","cross_cats_sorted":["cs.AI"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2026-05-26T16:44:25Z","title_canon_sha256":"4f565736fe728e0535c9a20da4d4138170dcf4fd4cd8a4fea40366c34c9af145"},"schema_version":"1.0","source":{"id":"2605.27268","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2605.27268","created_at":"2026-05-27T02:06:09Z"},{"alias_kind":"arxiv_version","alias_value":"2605.27268v1","created_at":"2026-05-27T02:06:09Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.27268","created_at":"2026-05-27T02:06:09Z"},{"alias_kind":"pith_short_12","alias_value":"LTJFUCK5ZM3B","created_at":"2026-05-27T02:06:09Z"},{"alias_kind":"pith_short_16","alias_value":"LTJFUCK5ZM3BSYLO","created_at":"2026-05-27T02:06:09Z"},{"alias_kind":"pith_short_8","alias_value":"LTJFUCK5","created_at":"2026-05-27T02:06:09Z"}],"graph_snapshots":[{"event_id":"sha256:98f2316d69fd75652661bfdae504e35a6e392a4318a41fd851c86c1af8c7b23a","target":"graph","created_at":"2026-05-27T02:06:09Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2605.27268/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Modern Large Language Models (LLMs) are often criticized for producing repetitive and homogeneous text, despite possessing vast latent vocabularies. While previous research has focused on model knowledge and training data, we investigate the role of decoding mechanics in suppressing linguistic diversity. We introduce the Word Coverage Score (WCS), a metric that quantifies the extent to which contextually appropriate human vocabulary is mathematically pruned by standard sampling filters (e.g., Top-$p$, Top-$k$, and Min-$p$). Rather than assessing static knowledge, the WCS measures the lexical s","authors_text":"Carlos Arriaga, Javier Conde, Javier Coronado-Bl\\'azquez, Pedro Reviriego, Samer Awad, Tairan Fu","cross_cats":["cs.AI"],"headline":"","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2026-05-26T16:44:25Z","title":"Lost in Sampling: Assessing Lexical Reachability in LLMs via the Word Coverage Score (WCS)"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2605.27268","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:70b66153e3289a852936b5230ea4ace71a7dea921ae2061ed6555c902e90f22e","target":"record","created_at":"2026-05-27T02:06:09Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"c2454c63f4ce3958b128f4ffa96e718cffcfc978869d3dbcb7320b6c4052d0f1","cross_cats_sorted":["cs.AI"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2026-05-26T16:44:25Z","title_canon_sha256":"4f565736fe728e0535c9a20da4d4138170dcf4fd4cd8a4fea40366c34c9af145"},"schema_version":"1.0","source":{"id":"2605.27268","kind":"arxiv","version":1}},"canonical_sha256":"5cd25a095dcb3619616e395baf93f8d85686a1934ef7ab16852a8bd953a7b55b","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"5cd25a095dcb3619616e395baf93f8d85686a1934ef7ab16852a8bd953a7b55b","first_computed_at":"2026-05-27T02:06:09.120688Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-27T02:06:09.120688Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"T5F0DKVr4VM0kmoXxySlsNkQ0K6s+PDGq+c5rvChyzMktZvxBJ+6jw6xkeqNIDQbGmlJbJZqkp6jgcqbYLN9Dw==","signature_status":"signed_v1","signed_at":"2026-05-27T02:06:09.121158Z","signed_message":"canonical_sha256_bytes"},"source_id":"2605.27268","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:70b66153e3289a852936b5230ea4ace71a7dea921ae2061ed6555c902e90f22e","sha256:98f2316d69fd75652661bfdae504e35a6e392a4318a41fd851c86c1af8c7b23a"],"state_sha256":"48377419f30d86cc53a4796081f5d547eedc25291f89fb479c299ef4af6ef9b7"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"m5CKHIpWAVU/w3ykNQ2BhvP2X7oODXYo9Es+e5pSD2EIoWKD70Lyv63pQrmNNQaGHFd6nUmXrdn7CN7Uo77aBw==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-01T16:09:42.414127Z","bundle_sha256":"284d13ebfec7a3bbde61dfde503a73b0cc836cc212543505be8c5af88f5a3f14"}}