{"record_type":"pith_number_record","schema_url":"https://pith.science/schemas/pith-number/v1.json","pith_number":"pith:2025:OH5GGPU3PS4MP5V5ODPJ5KUKA3","short_pith_number":"pith:OH5GGPU3","schema_version":"1.0","canonical_sha256":"71fa633e9b7cb8c7f6bd70de9eaa8a06fcbb1e58ec3c312677d3a81ad15a9d26","source":{"kind":"arxiv","id":"2510.03415","version":3},"attestation_state":"computed","paper":{"title":"LLMs Lean on Priors, Not Programming Language Semantics","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":["cs.AI","cs.CL","cs.SE"],"primary_cat":"cs.PL","authors_text":"Aditya Thimmaiah, Jayanth Srinivasa, Jiyang Zhang, Junyi Jessy Li, Milos Gligoric","submitted_at":"2025-10-03T18:23:26Z","abstract_excerpt":"Recent work asks whether large language models (LLMs) condition their reasoning on explicit rules rather than statistical regularities from pretraining. Program execution provides a canonical instance: formal semantics define behavior through symbolic transition rules that can be systematically altered under distribution shift. We investigate whether LLMs can condition their reasoning on formal semantics through program execution and introduce PLSemanticsBench, pairing featherweight C programs with two semantic systems -- small-step operational semantics and K semantics -- and probing four cap"},"verification_status":{"content_addressed":true,"pith_receipt":true,"author_attested":false,"weak_author_claims":0,"strong_author_claims":0,"externally_anchored":false,"storage_verified":false,"citation_signatures":0,"replication_records":0,"graph_snapshot":true,"references_resolved":false,"formal_links_present":false},"canonical_record":{"source":{"id":"2510.03415","kind":"arxiv","version":3},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.PL","submitted_at":"2025-10-03T18:23:26Z","cross_cats_sorted":["cs.AI","cs.CL","cs.SE"],"title_canon_sha256":"410ee2dae51fa3e37f69dafeb364f35b6a5be5b586b2f8578e343bc538738ea1","abstract_canon_sha256":"c67101530bd45661d5a039fca13d5db0ebf4d4f86dc5422f5e313fdb40eeb18b"},"schema_version":"1.0"},"receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-06-01T02:03:27.896953Z","signature_b64":"f5dPBEHaIMDLBc3dLN7fHrfxjeotSRDB9hyU0jCYW0ylw1bND1zRTaHqY7Go3msziChTJqtUOeLJDNVbVFqHDQ==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"71fa633e9b7cb8c7f6bd70de9eaa8a06fcbb1e58ec3c312677d3a81ad15a9d26","last_reissued_at":"2026-06-01T02:03:27.896197Z","signature_status":"signed_v1","first_computed_at":"2026-06-01T02:03:27.896197Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"graph_snapshot":{"paper":{"title":"LLMs Lean on Priors, Not Programming Language Semantics","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":["cs.AI","cs.CL","cs.SE"],"primary_cat":"cs.PL","authors_text":"Aditya Thimmaiah, Jayanth Srinivasa, Jiyang Zhang, Junyi Jessy Li, Milos Gligoric","submitted_at":"2025-10-03T18:23:26Z","abstract_excerpt":"Recent work asks whether large language models (LLMs) condition their reasoning on explicit rules rather than statistical regularities from pretraining. Program execution provides a canonical instance: formal semantics define behavior through symbolic transition rules that can be systematically altered under distribution shift. We investigate whether LLMs can condition their reasoning on formal semantics through program execution and introduce PLSemanticsBench, pairing featherweight C programs with two semantic systems -- small-step operational semantics and K semantics -- and probing four cap"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2510.03415","kind":"arxiv","version":3},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2510.03415/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"aliases":[{"alias_kind":"arxiv","alias_value":"2510.03415","created_at":"2026-06-01T02:03:27.896332+00:00"},{"alias_kind":"arxiv_version","alias_value":"2510.03415v3","created_at":"2026-06-01T02:03:27.896332+00:00"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2510.03415","created_at":"2026-06-01T02:03:27.896332+00:00"},{"alias_kind":"pith_short_12","alias_value":"OH5GGPU3PS4M","created_at":"2026-06-01T02:03:27.896332+00:00"},{"alias_kind":"pith_short_16","alias_value":"OH5GGPU3PS4MP5V5","created_at":"2026-06-01T02:03:27.896332+00:00"},{"alias_kind":"pith_short_8","alias_value":"OH5GGPU3","created_at":"2026-06-01T02:03:27.896332+00:00"}],"events":[],"event_summary":{},"paper_claims":[],"inbound_citations":{"count":0,"internal_anchor_count":0,"sample":[]},"formal_canon":{"evidence_count":0,"sample":[],"anchors":[]},"links":{"html":"https://pith.science/pith/OH5GGPU3PS4MP5V5ODPJ5KUKA3","json":"https://pith.science/pith/OH5GGPU3PS4MP5V5ODPJ5KUKA3.json","graph_json":"https://pith.science/api/pith-number/OH5GGPU3PS4MP5V5ODPJ5KUKA3/graph.json","events_json":"https://pith.science/api/pith-number/OH5GGPU3PS4MP5V5ODPJ5KUKA3/events.json","paper":"https://pith.science/paper/OH5GGPU3"},"agent_actions":{"view_html":"https://pith.science/pith/OH5GGPU3PS4MP5V5ODPJ5KUKA3","download_json":"https://pith.science/pith/OH5GGPU3PS4MP5V5ODPJ5KUKA3.json","view_paper":"https://pith.science/paper/OH5GGPU3","resolve_alias":"https://pith.science/api/pith-number/resolve?arxiv=2510.03415&json=true","fetch_graph":"https://pith.science/api/pith-number/OH5GGPU3PS4MP5V5ODPJ5KUKA3/graph.json","fetch_events":"https://pith.science/api/pith-number/OH5GGPU3PS4MP5V5ODPJ5KUKA3/events.json","actions":{"anchor_timestamp":"https://pith.science/pith/OH5GGPU3PS4MP5V5ODPJ5KUKA3/action/timestamp_anchor","attest_storage":"https://pith.science/pith/OH5GGPU3PS4MP5V5ODPJ5KUKA3/action/storage_attestation","attest_author":"https://pith.science/pith/OH5GGPU3PS4MP5V5ODPJ5KUKA3/action/author_attestation","sign_citation":"https://pith.science/pith/OH5GGPU3PS4MP5V5ODPJ5KUKA3/action/citation_signature","submit_replication":"https://pith.science/pith/OH5GGPU3PS4MP5V5ODPJ5KUKA3/action/replication_record"}},"created_at":"2026-06-01T02:03:27.896332+00:00","updated_at":"2026-06-01T02:03:27.896332+00:00"}