{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2026:HXAK6GFK7BSFKXXQYIWSG234HS","short_pith_number":"pith:HXAK6GFK","canonical_record":{"source":{"id":"2605.23035","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2026-05-21T21:00:24Z","cross_cats_sorted":["cs.AI","q-bio.NC"],"title_canon_sha256":"1fb68ab92a5f222d71876809c24756d0cb3c2c0d5699639eaac2ccfdb05a0e68","abstract_canon_sha256":"23921f4d2249848a580eb9dc702d86e377f7fc7182f7104e7d9dd366fa78c750"},"schema_version":"1.0"},"canonical_sha256":"3dc0af18aaf864555ef0c22d236b7c3cb89e49e352187816ba71faeafece6084","source":{"kind":"arxiv","id":"2605.23035","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2605.23035","created_at":"2026-05-25T02:01:35Z"},{"alias_kind":"arxiv_version","alias_value":"2605.23035v1","created_at":"2026-05-25T02:01:35Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.23035","created_at":"2026-05-25T02:01:35Z"},{"alias_kind":"pith_short_12","alias_value":"HXAK6GFK7BSF","created_at":"2026-05-25T02:01:35Z"},{"alias_kind":"pith_short_16","alias_value":"HXAK6GFK7BSFKXXQ","created_at":"2026-05-25T02:01:35Z"},{"alias_kind":"pith_short_8","alias_value":"HXAK6GFK","created_at":"2026-05-25T02:01:35Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2026:HXAK6GFK7BSFKXXQYIWSG234HS","target":"record","payload":{"canonical_record":{"source":{"id":"2605.23035","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2026-05-21T21:00:24Z","cross_cats_sorted":["cs.AI","q-bio.NC"],"title_canon_sha256":"1fb68ab92a5f222d71876809c24756d0cb3c2c0d5699639eaac2ccfdb05a0e68","abstract_canon_sha256":"23921f4d2249848a580eb9dc702d86e377f7fc7182f7104e7d9dd366fa78c750"},"schema_version":"1.0"},"canonical_sha256":"3dc0af18aaf864555ef0c22d236b7c3cb89e49e352187816ba71faeafece6084","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-25T02:01:35.535323Z","signature_b64":"Jv0KiF7De6uezeAKP2f+ubdu4nyIMtpTSC9O5rZMCifvCXRVaI7SRkzQCoTLKiJuEg3b8o3oGdqGu1J/T95YAw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"3dc0af18aaf864555ef0c22d236b7c3cb89e49e352187816ba71faeafece6084","last_reissued_at":"2026-05-25T02:01:35.534765Z","signature_status":"signed_v1","first_computed_at":"2026-05-25T02:01:35.534765Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2605.23035","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-25T02:01:35Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"mqsky74AF8WuSyKWqupE+7yuRO7Obz9hklYKhox/3jWN+6ZhFEVaUpsj/7RVHYZ+hQdmXEwdCgUv3dDIGldSAQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-28T01:37:49.714498Z"},"content_sha256":"ac9f443c4f3287f8f17584e2d7842633cdbecd8207f00748d44e7a5a4d71a18b","schema_version":"1.0","event_id":"sha256:ac9f443c4f3287f8f17584e2d7842633cdbecd8207f00748d44e7a5a4d71a18b"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2026:HXAK6GFK7BSFKXXQYIWSG234HS","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Sparse Autoencoders Map Brain-LLM Alignment onto Cortical Semantic Topography","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":["cs.AI","q-bio.NC"],"primary_cat":"cs.CL","authors_text":"Dongxin Guo, Jikun Wu, Siu Ming Yiu","submitted_at":"2026-05-21T21:00:24Z","abstract_excerpt":"Intermediate layers of large language models (LLMs) best predict human brain responses to language, one of the most robust findings in computational neurolinguistics, yet why remains mechanistically unexplained. We address this gap by bridging sparse autoencoders (SAEs) from mechanistic interpretability with neural encoding models, decomposing GPT-2 XL and Llama-3.1-8B into 16K-32K interpretable features per layer. A human-validated taxonomy ($\\kappa \\geq 0.74$) reveals that semantic features alone recover 94% of peak encoding performance ($r=0.285$), substantially exceeding variance-matched b"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2605.23035","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2605.23035/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-25T02:01:35Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"efKHCoFfLKUKiPqySX+aNkyhIKZsJmHMhsn7OwmTUqbxaiWZA0YmStUVR0R5S9+YgquBIvgTswE/YD4vvyE7AQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-28T01:37:49.714988Z"},"content_sha256":"2ed5200d519b7ec8e0534ee03252df826f1983f395324e5707b296595e6657a5","schema_version":"1.0","event_id":"sha256:2ed5200d519b7ec8e0534ee03252df826f1983f395324e5707b296595e6657a5"},{"event_type":"integrity_finding","subject_pith_number":"pith:2026:HXAK6GFK7BSFKXXQYIWSG234HS","target":"integrity","payload":{"note":"DOI in the printed bibliography is fragmented by whitespace or line breaks. A longer candidate (10.1162/TACL\\_A\\_00548) was visible in the surrounding text but could not be confirmed against doi.org as printed.","snippet":"Byung. Why Does Surprisal From Larger Transformer-Based Language Models Provide a Poorer Fit to Human Reading Times? , journal =. 2023 , burl =. doi:10.1162/TACL\\_A\\_00548 , timestamp =","arxiv_id":"2605.23035","detector":"doi_compliance","evidence":{"ref_index":50,"verdict_class":"incontrovertible","resolved_title":null,"printed_excerpt":"Byung. Why Does Surprisal From Larger Transformer-Based Language Models Provide a Poorer Fit to Human Reading Times? , journal =. 2023 , burl =. doi:10.1162/TACL\\_A\\_00548 , timestamp =","reconstructed_doi":"10.1162/TACL\\_A\\_00548"},"severity":"advisory","ref_index":50,"audited_at":"2026-05-25T05:48:23.920055Z","event_type":"pith.integrity.v1","detected_doi":"10.1162/TACL\\_A\\_00548","detector_url":"https://pith.science/pith-integrity-protocol#doi_compliance","external_url":null,"finding_type":"recoverable_identifier","evidence_hash":"9f17ef93854eeae9f834711e8062cd710b27156f939bc3e72189b56b38d8f208","paper_version":1,"verdict_class":"incontrovertible","resolved_title":null,"detector_version":"1.0.0","detected_arxiv_id":null,"integrity_event_id":7474,"payload_sha256":"71b07d36b46b89aec76dae2274a48e1e9480a22e1f5d245173256bed8aef0217","signature_b64":"4xlySM5bnwkQqnxANxjt9eftVc0Pu5ehPvCYPkHZt0HFO8Xueg9iNS7GL7OJl0/oXhAWndsOEjNNegwzMnLGCQ==","signing_key_id":"pith-v1-2026-05"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-25T05:49:54Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"H5FAa46RFqrfop7fdHgSKXZfQZ57nqH7f7Hel2Rd9bh/so+LDx2TTWeSyRIYYy/Mt64PI3u2OhgsUIlCxBX8Aw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-28T01:37:49.715988Z"},"content_sha256":"92c15c5bad75acafc77d9995704e770f77ccc0ef24a9d2bf4aef4df5d8ebd096","schema_version":"1.0","event_id":"sha256:92c15c5bad75acafc77d9995704e770f77ccc0ef24a9d2bf4aef4df5d8ebd096"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/HXAK6GFK7BSFKXXQYIWSG234HS/bundle.json","state_url":"https://pith.science/pith/HXAK6GFK7BSFKXXQYIWSG234HS/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/HXAK6GFK7BSFKXXQYIWSG234HS/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-28T01:37:49Z","links":{"resolver":"https://pith.science/pith/HXAK6GFK7BSFKXXQYIWSG234HS","bundle":"https://pith.science/pith/HXAK6GFK7BSFKXXQYIWSG234HS/bundle.json","state":"https://pith.science/pith/HXAK6GFK7BSFKXXQYIWSG234HS/state.json","well_known_bundle":"https://pith.science/.well-known/pith/HXAK6GFK7BSFKXXQYIWSG234HS/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:HXAK6GFK7BSFKXXQYIWSG234HS","merge_version":"pith-open-graph-merge-v1","event_count":3,"valid_event_count":3,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"23921f4d2249848a580eb9dc702d86e377f7fc7182f7104e7d9dd366fa78c750","cross_cats_sorted":["cs.AI","q-bio.NC"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2026-05-21T21:00:24Z","title_canon_sha256":"1fb68ab92a5f222d71876809c24756d0cb3c2c0d5699639eaac2ccfdb05a0e68"},"schema_version":"1.0","source":{"id":"2605.23035","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2605.23035","created_at":"2026-05-25T02:01:35Z"},{"alias_kind":"arxiv_version","alias_value":"2605.23035v1","created_at":"2026-05-25T02:01:35Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.23035","created_at":"2026-05-25T02:01:35Z"},{"alias_kind":"pith_short_12","alias_value":"HXAK6GFK7BSF","created_at":"2026-05-25T02:01:35Z"},{"alias_kind":"pith_short_16","alias_value":"HXAK6GFK7BSFKXXQ","created_at":"2026-05-25T02:01:35Z"},{"alias_kind":"pith_short_8","alias_value":"HXAK6GFK","created_at":"2026-05-25T02:01:35Z"}],"graph_snapshots":[{"event_id":"sha256:2ed5200d519b7ec8e0534ee03252df826f1983f395324e5707b296595e6657a5","target":"graph","created_at":"2026-05-25T02:01:35Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2605.23035/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Intermediate layers of large language models (LLMs) best predict human brain responses to language, one of the most robust findings in computational neurolinguistics, yet why remains mechanistically unexplained. We address this gap by bridging sparse autoencoders (SAEs) from mechanistic interpretability with neural encoding models, decomposing GPT-2 XL and Llama-3.1-8B into 16K-32K interpretable features per layer. A human-validated taxonomy ($\\kappa \\geq 0.74$) reveals that semantic features alone recover 94% of peak encoding performance ($r=0.285$), substantially exceeding variance-matched b","authors_text":"Dongxin Guo, Jikun Wu, Siu Ming Yiu","cross_cats":["cs.AI","q-bio.NC"],"headline":"","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2026-05-21T21:00:24Z","title":"Sparse Autoencoders Map Brain-LLM Alignment onto Cortical Semantic Topography"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2605.23035","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:ac9f443c4f3287f8f17584e2d7842633cdbecd8207f00748d44e7a5a4d71a18b","target":"record","created_at":"2026-05-25T02:01:35Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"23921f4d2249848a580eb9dc702d86e377f7fc7182f7104e7d9dd366fa78c750","cross_cats_sorted":["cs.AI","q-bio.NC"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2026-05-21T21:00:24Z","title_canon_sha256":"1fb68ab92a5f222d71876809c24756d0cb3c2c0d5699639eaac2ccfdb05a0e68"},"schema_version":"1.0","source":{"id":"2605.23035","kind":"arxiv","version":1}},"canonical_sha256":"3dc0af18aaf864555ef0c22d236b7c3cb89e49e352187816ba71faeafece6084","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"3dc0af18aaf864555ef0c22d236b7c3cb89e49e352187816ba71faeafece6084","first_computed_at":"2026-05-25T02:01:35.534765Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-25T02:01:35.534765Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"Jv0KiF7De6uezeAKP2f+ubdu4nyIMtpTSC9O5rZMCifvCXRVaI7SRkzQCoTLKiJuEg3b8o3oGdqGu1J/T95YAw==","signature_status":"signed_v1","signed_at":"2026-05-25T02:01:35.535323Z","signed_message":"canonical_sha256_bytes"},"source_id":"2605.23035","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:ac9f443c4f3287f8f17584e2d7842633cdbecd8207f00748d44e7a5a4d71a18b","sha256:2ed5200d519b7ec8e0534ee03252df826f1983f395324e5707b296595e6657a5","sha256:92c15c5bad75acafc77d9995704e770f77ccc0ef24a9d2bf4aef4df5d8ebd096"],"state_sha256":"e85e619a206178b4263e7a7c0f0ca18ecb4007225464c8916fd372d32a3fff91"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"sVG2LwVg5BHDxg8R00haisupg17iRR/L1LtDJxUVj3PiX41Pm4+V0t1zkl93cdzVVjSnPfkmxVh2woOajSoBDg==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-28T01:37:49.718261Z","bundle_sha256":"8a3f06d77bb1a93d581f2d5750d6162f39424bbc8d8a95f2314ff13839215612"}}