{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2026:EZGAHWMB7Y4X7TQ3JWCQXNA3DT","short_pith_number":"pith:EZGAHWMB","canonical_record":{"source":{"id":"2605.21227","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2026-05-20T14:19:55Z","cross_cats_sorted":[],"title_canon_sha256":"99cc1f72f65b93a401ff4d9d63517b935366e9035623b21513890426856ac488","abstract_canon_sha256":"d50cccb1ba203e1cbbcc9ab37368e5eef6a723ec7508fd9630a5c1d04746f3f4"},"schema_version":"1.0"},"canonical_sha256":"264c03d981fe397fce1b4d850bb41b1cf12612f2f6c66e26aaa73d902a2b92e0","source":{"kind":"arxiv","id":"2605.21227","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2605.21227","created_at":"2026-05-21T01:05:44Z"},{"alias_kind":"arxiv_version","alias_value":"2605.21227v1","created_at":"2026-05-21T01:05:44Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.21227","created_at":"2026-05-21T01:05:44Z"},{"alias_kind":"pith_short_12","alias_value":"EZGAHWMB7Y4X","created_at":"2026-05-21T01:05:44Z"},{"alias_kind":"pith_short_16","alias_value":"EZGAHWMB7Y4X7TQ3","created_at":"2026-05-21T01:05:44Z"},{"alias_kind":"pith_short_8","alias_value":"EZGAHWMB","created_at":"2026-05-21T01:05:44Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2026:EZGAHWMB7Y4X7TQ3JWCQXNA3DT","target":"record","payload":{"canonical_record":{"source":{"id":"2605.21227","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2026-05-20T14:19:55Z","cross_cats_sorted":[],"title_canon_sha256":"99cc1f72f65b93a401ff4d9d63517b935366e9035623b21513890426856ac488","abstract_canon_sha256":"d50cccb1ba203e1cbbcc9ab37368e5eef6a723ec7508fd9630a5c1d04746f3f4"},"schema_version":"1.0"},"canonical_sha256":"264c03d981fe397fce1b4d850bb41b1cf12612f2f6c66e26aaa73d902a2b92e0","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-21T01:05:44.434059Z","signature_b64":"zN0yXdpmyVDt+6yG2GAcu0fUqNXFcV9FqWtubdBFigXZiZD41u4qL1lJnVUmLP1BlUlAINpcZTHkLrKvP/tvBw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"264c03d981fe397fce1b4d850bb41b1cf12612f2f6c66e26aaa73d902a2b92e0","last_reissued_at":"2026-05-21T01:05:44.433271Z","signature_status":"signed_v1","first_computed_at":"2026-05-21T01:05:44.433271Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2605.21227","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-21T01:05:44Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"lurI88kK1EsbOGCHFi+H84sNGiJpezPHEXfj9aLnWgR73j0KD9Xkm/Yex3euPzH2iXZGMY1sSXKf6V5x1/cVDA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-26T08:36:14.084647Z"},"content_sha256":"4fc8f05db40ac1f4b047f0c22e6c30feb1c30abf77c0fa9c601212093f8055ec","schema_version":"1.0","event_id":"sha256:4fc8f05db40ac1f4b047f0c22e6c30feb1c30abf77c0fa9c601212093f8055ec"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2026:EZGAHWMB7Y4X7TQ3JWCQXNA3DT","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Do LLMs Know What Luxembourgish Borrows? Probing Lexical Neology in Low-Resource Multilingual Models","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":[],"primary_cat":"cs.CL","authors_text":"Nina Hosseini-Kivanani","submitted_at":"2026-05-20T14:19:55Z","abstract_excerpt":"Large language models (LLMs) are increasingly used for writing assistance in small contact languages, yet it is unclear whether they respect community norms around lexical borrowing and neology. We introduce LexNeo-Bench, a 3{,}050-instance token-level benchmark derived from LuxBorrow, a large-scale Luxembourgish news corpus, where target tokens are labelled as native or as French, German, or English borrowings. Using this benchmark, we probe three multilingual LLMs across 34 prompt settings on two tasks: borrowing type classification and a binary lexical-innovation proxy (borrowing versus nat"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2605.21227","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2605.21227/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-21T01:05:44Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"FaVFMjSdUSD3FfaFljoHv73/e37UxQ4kWr9Sdf6rzz5uryN27sFhy3Ro3nPnZ/t2CGMGSeBqs9uA+BMHclu6AQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-26T08:36:14.085421Z"},"content_sha256":"c1198f14d960e876a709998f31f8cb23ca432732a908f312ef4c3d248c0b66b5","schema_version":"1.0","event_id":"sha256:c1198f14d960e876a709998f31f8cb23ca432732a908f312ef4c3d248c0b66b5"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/EZGAHWMB7Y4X7TQ3JWCQXNA3DT/bundle.json","state_url":"https://pith.science/pith/EZGAHWMB7Y4X7TQ3JWCQXNA3DT/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/EZGAHWMB7Y4X7TQ3JWCQXNA3DT/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-26T08:36:14Z","links":{"resolver":"https://pith.science/pith/EZGAHWMB7Y4X7TQ3JWCQXNA3DT","bundle":"https://pith.science/pith/EZGAHWMB7Y4X7TQ3JWCQXNA3DT/bundle.json","state":"https://pith.science/pith/EZGAHWMB7Y4X7TQ3JWCQXNA3DT/state.json","well_known_bundle":"https://pith.science/.well-known/pith/EZGAHWMB7Y4X7TQ3JWCQXNA3DT/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:EZGAHWMB7Y4X7TQ3JWCQXNA3DT","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"d50cccb1ba203e1cbbcc9ab37368e5eef6a723ec7508fd9630a5c1d04746f3f4","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2026-05-20T14:19:55Z","title_canon_sha256":"99cc1f72f65b93a401ff4d9d63517b935366e9035623b21513890426856ac488"},"schema_version":"1.0","source":{"id":"2605.21227","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2605.21227","created_at":"2026-05-21T01:05:44Z"},{"alias_kind":"arxiv_version","alias_value":"2605.21227v1","created_at":"2026-05-21T01:05:44Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.21227","created_at":"2026-05-21T01:05:44Z"},{"alias_kind":"pith_short_12","alias_value":"EZGAHWMB7Y4X","created_at":"2026-05-21T01:05:44Z"},{"alias_kind":"pith_short_16","alias_value":"EZGAHWMB7Y4X7TQ3","created_at":"2026-05-21T01:05:44Z"},{"alias_kind":"pith_short_8","alias_value":"EZGAHWMB","created_at":"2026-05-21T01:05:44Z"}],"graph_snapshots":[{"event_id":"sha256:c1198f14d960e876a709998f31f8cb23ca432732a908f312ef4c3d248c0b66b5","target":"graph","created_at":"2026-05-21T01:05:44Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2605.21227/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Large language models (LLMs) are increasingly used for writing assistance in small contact languages, yet it is unclear whether they respect community norms around lexical borrowing and neology. We introduce LexNeo-Bench, a 3{,}050-instance token-level benchmark derived from LuxBorrow, a large-scale Luxembourgish news corpus, where target tokens are labelled as native or as French, German, or English borrowings. Using this benchmark, we probe three multilingual LLMs across 34 prompt settings on two tasks: borrowing type classification and a binary lexical-innovation proxy (borrowing versus nat","authors_text":"Nina Hosseini-Kivanani","cross_cats":[],"headline":"","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2026-05-20T14:19:55Z","title":"Do LLMs Know What Luxembourgish Borrows? Probing Lexical Neology in Low-Resource Multilingual Models"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2605.21227","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:4fc8f05db40ac1f4b047f0c22e6c30feb1c30abf77c0fa9c601212093f8055ec","target":"record","created_at":"2026-05-21T01:05:44Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"d50cccb1ba203e1cbbcc9ab37368e5eef6a723ec7508fd9630a5c1d04746f3f4","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2026-05-20T14:19:55Z","title_canon_sha256":"99cc1f72f65b93a401ff4d9d63517b935366e9035623b21513890426856ac488"},"schema_version":"1.0","source":{"id":"2605.21227","kind":"arxiv","version":1}},"canonical_sha256":"264c03d981fe397fce1b4d850bb41b1cf12612f2f6c66e26aaa73d902a2b92e0","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"264c03d981fe397fce1b4d850bb41b1cf12612f2f6c66e26aaa73d902a2b92e0","first_computed_at":"2026-05-21T01:05:44.433271Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-21T01:05:44.433271Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"zN0yXdpmyVDt+6yG2GAcu0fUqNXFcV9FqWtubdBFigXZiZD41u4qL1lJnVUmLP1BlUlAINpcZTHkLrKvP/tvBw==","signature_status":"signed_v1","signed_at":"2026-05-21T01:05:44.434059Z","signed_message":"canonical_sha256_bytes"},"source_id":"2605.21227","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:4fc8f05db40ac1f4b047f0c22e6c30feb1c30abf77c0fa9c601212093f8055ec","sha256:c1198f14d960e876a709998f31f8cb23ca432732a908f312ef4c3d248c0b66b5"],"state_sha256":"7b0b583b20f30291bea388fb7c6bfd7b7b3396a2cb43c6c5eb6c41848c1653ba"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"PhrsKidVI7tw0xvzd1qFXN7FBT2tMB1LmsNx8i487br3uoSzoYcIMM7gWZtO7dN1AEGT2DJM9o9ERtK7fn3OCQ==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-26T08:36:14.090269Z","bundle_sha256":"c64c99062caadaf2eaa34e445e15cc84bcd1891e4e45137523e7b0ebd4df3759"}}