{"record_type":"pith_number_record","schema_url":"https://pith.science/schemas/pith-number/v1.json","pith_number":"pith:2025:L5WER2GQQTI45O7WGUXHOFYKT6","short_pith_number":"pith:L5WER2GQ","schema_version":"1.0","canonical_sha256":"5f6c48e8d084d1cebbf6352e77170a9fb839529a8149ea6ffbeb5ee56dfca7cd","source":{"kind":"arxiv","id":"2509.21820","version":2},"attestation_state":"computed","paper":{"title":"Can LLMs Generate and Solve Linguistic Olympiad Puzzles?","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.CL","authors_text":"Elena Filatova, Neh Majmudar","submitted_at":"2025-09-26T03:26:28Z","abstract_excerpt":"In this paper, we introduce a combination of novel and exciting tasks: the solution and generation of linguistic puzzles. We focus on puzzles used in Linguistic Olympiads for high school students. We first extend the existing benchmark for the task of solving linguistic puzzles. We explore the use of Large Language Models (LLMs), including recent state-of-the-art models such as OpenAI's o1, for solving linguistic puzzles, analyzing their performance across various linguistic topics. We demonstrate that LLMs outperform humans on most puzzles types, except for those centered on writing systems, "},"verification_status":{"content_addressed":true,"pith_receipt":true,"author_attested":false,"weak_author_claims":0,"strong_author_claims":0,"externally_anchored":false,"storage_verified":false,"citation_signatures":0,"replication_records":0,"graph_snapshot":true,"references_resolved":false,"formal_links_present":false},"canonical_record":{"source":{"id":"2509.21820","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2025-09-26T03:26:28Z","cross_cats_sorted":[],"title_canon_sha256":"41f29fab3bf93724455e548eb3601f0a6e77ea3ed1a31e358ae65009c8df7c0c","abstract_canon_sha256":"210e30103ad148d7b29faa9728f771dd6e7276b16a09a5f74c0d39ac8b30be9e"},"schema_version":"1.0"},"receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-20T00:04:13.818312Z","signature_b64":"uNUQAdn8GmCCTZaK3FummAFOpQF9pAfkmkh1FIBSQmV5uiTFwHDMnpYaNAJFSFyEpE+DRCRimuBGWlQVv5VsBQ==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"5f6c48e8d084d1cebbf6352e77170a9fb839529a8149ea6ffbeb5ee56dfca7cd","last_reissued_at":"2026-05-20T00:04:13.817440Z","signature_status":"signed_v1","first_computed_at":"2026-05-20T00:04:13.817440Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"graph_snapshot":{"paper":{"title":"Can LLMs Generate and Solve Linguistic Olympiad Puzzles?","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.CL","authors_text":"Elena Filatova, Neh Majmudar","submitted_at":"2025-09-26T03:26:28Z","abstract_excerpt":"In this paper, we introduce a combination of novel and exciting tasks: the solution and generation of linguistic puzzles. We focus on puzzles used in Linguistic Olympiads for high school students. We first extend the existing benchmark for the task of solving linguistic puzzles. We explore the use of Large Language Models (LLMs), including recent state-of-the-art models such as OpenAI's o1, for solving linguistic puzzles, analyzing their performance across various linguistic topics. We demonstrate that LLMs outperform humans on most puzzles types, except for those centered on writing systems, "},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2509.21820","kind":"arxiv","version":2},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2509.21820/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"aliases":[{"alias_kind":"arxiv","alias_value":"2509.21820","created_at":"2026-05-20T00:04:13.817597+00:00"},{"alias_kind":"arxiv_version","alias_value":"2509.21820v2","created_at":"2026-05-20T00:04:13.817597+00:00"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2509.21820","created_at":"2026-05-20T00:04:13.817597+00:00"},{"alias_kind":"pith_short_12","alias_value":"L5WER2GQQTI4","created_at":"2026-05-20T00:04:13.817597+00:00"},{"alias_kind":"pith_short_16","alias_value":"L5WER2GQQTI45O7W","created_at":"2026-05-20T00:04:13.817597+00:00"},{"alias_kind":"pith_short_8","alias_value":"L5WER2GQ","created_at":"2026-05-20T00:04:13.817597+00:00"}],"events":[],"event_summary":{},"paper_claims":[],"inbound_citations":{"count":0,"internal_anchor_count":0,"sample":[]},"formal_canon":{"evidence_count":0,"sample":[],"anchors":[]},"links":{"html":"https://pith.science/pith/L5WER2GQQTI45O7WGUXHOFYKT6","json":"https://pith.science/pith/L5WER2GQQTI45O7WGUXHOFYKT6.json","graph_json":"https://pith.science/api/pith-number/L5WER2GQQTI45O7WGUXHOFYKT6/graph.json","events_json":"https://pith.science/api/pith-number/L5WER2GQQTI45O7WGUXHOFYKT6/events.json","paper":"https://pith.science/paper/L5WER2GQ"},"agent_actions":{"view_html":"https://pith.science/pith/L5WER2GQQTI45O7WGUXHOFYKT6","download_json":"https://pith.science/pith/L5WER2GQQTI45O7WGUXHOFYKT6.json","view_paper":"https://pith.science/paper/L5WER2GQ","resolve_alias":"https://pith.science/api/pith-number/resolve?arxiv=2509.21820&json=true","fetch_graph":"https://pith.science/api/pith-number/L5WER2GQQTI45O7WGUXHOFYKT6/graph.json","fetch_events":"https://pith.science/api/pith-number/L5WER2GQQTI45O7WGUXHOFYKT6/events.json","actions":{"anchor_timestamp":"https://pith.science/pith/L5WER2GQQTI45O7WGUXHOFYKT6/action/timestamp_anchor","attest_storage":"https://pith.science/pith/L5WER2GQQTI45O7WGUXHOFYKT6/action/storage_attestation","attest_author":"https://pith.science/pith/L5WER2GQQTI45O7WGUXHOFYKT6/action/author_attestation","sign_citation":"https://pith.science/pith/L5WER2GQQTI45O7WGUXHOFYKT6/action/citation_signature","submit_replication":"https://pith.science/pith/L5WER2GQQTI45O7WGUXHOFYKT6/action/replication_record"}},"created_at":"2026-05-20T00:04:13.817597+00:00","updated_at":"2026-05-20T00:04:13.817597+00:00"}