{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2026:DUG2N5UN4FXJG6E7OZE4HD5Y4D","short_pith_number":"pith:DUG2N5UN","canonical_record":{"source":{"id":"2605.29358","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.AI","submitted_at":"2026-05-28T04:57:47Z","cross_cats_sorted":[],"title_canon_sha256":"36936086a9e48f35927f37cf07492990240a2ccd98775d3cc73ffb8cdfa7f3fe","abstract_canon_sha256":"30659655a2ac591ace5c17b4766375b00654ceff7c74251aafa80de9dee1aed4"},"schema_version":"1.0"},"canonical_sha256":"1d0da6f68de16e93789f7649c38fb8e0d1be25f4458eaa3de177436aa995b0da","source":{"kind":"arxiv","id":"2605.29358","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2605.29358","created_at":"2026-05-29T01:05:35Z"},{"alias_kind":"arxiv_version","alias_value":"2605.29358v1","created_at":"2026-05-29T01:05:35Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.29358","created_at":"2026-05-29T01:05:35Z"},{"alias_kind":"pith_short_12","alias_value":"DUG2N5UN4FXJ","created_at":"2026-05-29T01:05:35Z"},{"alias_kind":"pith_short_16","alias_value":"DUG2N5UN4FXJG6E7","created_at":"2026-05-29T01:05:35Z"},{"alias_kind":"pith_short_8","alias_value":"DUG2N5UN","created_at":"2026-05-29T01:05:35Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2026:DUG2N5UN4FXJG6E7OZE4HD5Y4D","target":"record","payload":{"canonical_record":{"source":{"id":"2605.29358","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.AI","submitted_at":"2026-05-28T04:57:47Z","cross_cats_sorted":[],"title_canon_sha256":"36936086a9e48f35927f37cf07492990240a2ccd98775d3cc73ffb8cdfa7f3fe","abstract_canon_sha256":"30659655a2ac591ace5c17b4766375b00654ceff7c74251aafa80de9dee1aed4"},"schema_version":"1.0"},"canonical_sha256":"1d0da6f68de16e93789f7649c38fb8e0d1be25f4458eaa3de177436aa995b0da","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-29T01:05:35.100094Z","signature_b64":"RLJCnUM9IaVrFGoXvbnkC+devhyHOYIQxiqNepGmdft7bO4rMp75CBwqXJeaHnusORezSHceX14mdvOkXM9UAA==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"1d0da6f68de16e93789f7649c38fb8e0d1be25f4458eaa3de177436aa995b0da","last_reissued_at":"2026-05-29T01:05:35.099638Z","signature_status":"signed_v1","first_computed_at":"2026-05-29T01:05:35.099638Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2605.29358","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-29T01:05:35Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"T09nVXWrtpbcWW5c2iIS2NgeFoBVA5ZPQWx35GId9TtydcD6bhGsj3vVNOB5lgWVnzLcrI/EKqUSy7DEzF3dDw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-30T11:04:28.630490Z"},"content_sha256":"9962f27c5f6f272310cc49966321b08273492a67cbe5a7cd89211125fbad6721","schema_version":"1.0","event_id":"sha256:9962f27c5f6f272310cc49966321b08273492a67cbe5a7cd89211125fbad6721"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2026:DUG2N5UN4FXJG6E7OZE4HD5Y4D","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Scaling Monosemanticity: Extracting Interpretable Features from Claude 3 Sonnet","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":[],"primary_cat":"cs.AI","authors_text":"Adam Jermyn, Adam Pearce, Adly Templeton, Alex Tamkin, Andy Jones, Brian Chen, Callum McDougall, C. Daniel Freeman, Chris Olah, Craig Citro, Edward Rees, Emmanuel Ameisen, Esin Durmus, Francesco Mosconi, Hoagy Cunningham, Jack Lindsey, Jonathan Marcus, Joshua Batson, Monte MacDiarmid, Nicholas L Turner, Shan Carter, Theodore R. Sumers, Tom Conerly, Tom Henighan, Trenton Bricken, Tristan Hume","submitted_at":"2026-05-28T04:57:47Z","abstract_excerpt":"We demonstrate that sparse autoencoders can extract interpretable features from Claude 3 Sonnet, a production-scale language model, addressing the open question of whether dictionary learning methods scale beyond small transformers. We trained sparse autoencoders with up to 34 million features on the model's middle layer residual stream, using scaling laws to guide hyperparameter selection. The resulting features are multilingual and multimodal (generalizing to images despite text-only training), respond to both concrete instances and abstract discussions of concepts, and can be used to steer "},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2605.29358","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2605.29358/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-29T01:05:35Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"97Fo0WuwLhYWikT4W0vuUYXntwUOvLfdiok2yGWQZ1nqJP/nBtUyhqv49KgCqgD7w13PokRyMHuhPY+xD1rMBg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-30T11:04:28.631252Z"},"content_sha256":"03142d65c30f35e02338c21d4f7b08b481f92404e27c3977e68ba2edd21eee7d","schema_version":"1.0","event_id":"sha256:03142d65c30f35e02338c21d4f7b08b481f92404e27c3977e68ba2edd21eee7d"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/DUG2N5UN4FXJG6E7OZE4HD5Y4D/bundle.json","state_url":"https://pith.science/pith/DUG2N5UN4FXJG6E7OZE4HD5Y4D/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/DUG2N5UN4FXJG6E7OZE4HD5Y4D/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-30T11:04:28Z","links":{"resolver":"https://pith.science/pith/DUG2N5UN4FXJG6E7OZE4HD5Y4D","bundle":"https://pith.science/pith/DUG2N5UN4FXJG6E7OZE4HD5Y4D/bundle.json","state":"https://pith.science/pith/DUG2N5UN4FXJG6E7OZE4HD5Y4D/state.json","well_known_bundle":"https://pith.science/.well-known/pith/DUG2N5UN4FXJG6E7OZE4HD5Y4D/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:DUG2N5UN4FXJG6E7OZE4HD5Y4D","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"30659655a2ac591ace5c17b4766375b00654ceff7c74251aafa80de9dee1aed4","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.AI","submitted_at":"2026-05-28T04:57:47Z","title_canon_sha256":"36936086a9e48f35927f37cf07492990240a2ccd98775d3cc73ffb8cdfa7f3fe"},"schema_version":"1.0","source":{"id":"2605.29358","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2605.29358","created_at":"2026-05-29T01:05:35Z"},{"alias_kind":"arxiv_version","alias_value":"2605.29358v1","created_at":"2026-05-29T01:05:35Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.29358","created_at":"2026-05-29T01:05:35Z"},{"alias_kind":"pith_short_12","alias_value":"DUG2N5UN4FXJ","created_at":"2026-05-29T01:05:35Z"},{"alias_kind":"pith_short_16","alias_value":"DUG2N5UN4FXJG6E7","created_at":"2026-05-29T01:05:35Z"},{"alias_kind":"pith_short_8","alias_value":"DUG2N5UN","created_at":"2026-05-29T01:05:35Z"}],"graph_snapshots":[{"event_id":"sha256:03142d65c30f35e02338c21d4f7b08b481f92404e27c3977e68ba2edd21eee7d","target":"graph","created_at":"2026-05-29T01:05:35Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2605.29358/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"We demonstrate that sparse autoencoders can extract interpretable features from Claude 3 Sonnet, a production-scale language model, addressing the open question of whether dictionary learning methods scale beyond small transformers. We trained sparse autoencoders with up to 34 million features on the model's middle layer residual stream, using scaling laws to guide hyperparameter selection. The resulting features are multilingual and multimodal (generalizing to images despite text-only training), respond to both concrete instances and abstract discussions of concepts, and can be used to steer ","authors_text":"Adam Jermyn, Adam Pearce, Adly Templeton, Alex Tamkin, Andy Jones, Brian Chen, Callum McDougall, C. Daniel Freeman, Chris Olah, Craig Citro, Edward Rees, Emmanuel Ameisen, Esin Durmus, Francesco Mosconi, Hoagy Cunningham, Jack Lindsey, Jonathan Marcus, Joshua Batson, Monte MacDiarmid, Nicholas L Turner, Shan Carter, Theodore R. Sumers, Tom Conerly, Tom Henighan, Trenton Bricken, Tristan Hume","cross_cats":[],"headline":"","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.AI","submitted_at":"2026-05-28T04:57:47Z","title":"Scaling Monosemanticity: Extracting Interpretable Features from Claude 3 Sonnet"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2605.29358","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:9962f27c5f6f272310cc49966321b08273492a67cbe5a7cd89211125fbad6721","target":"record","created_at":"2026-05-29T01:05:35Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"30659655a2ac591ace5c17b4766375b00654ceff7c74251aafa80de9dee1aed4","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.AI","submitted_at":"2026-05-28T04:57:47Z","title_canon_sha256":"36936086a9e48f35927f37cf07492990240a2ccd98775d3cc73ffb8cdfa7f3fe"},"schema_version":"1.0","source":{"id":"2605.29358","kind":"arxiv","version":1}},"canonical_sha256":"1d0da6f68de16e93789f7649c38fb8e0d1be25f4458eaa3de177436aa995b0da","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"1d0da6f68de16e93789f7649c38fb8e0d1be25f4458eaa3de177436aa995b0da","first_computed_at":"2026-05-29T01:05:35.099638Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-29T01:05:35.099638Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"RLJCnUM9IaVrFGoXvbnkC+devhyHOYIQxiqNepGmdft7bO4rMp75CBwqXJeaHnusORezSHceX14mdvOkXM9UAA==","signature_status":"signed_v1","signed_at":"2026-05-29T01:05:35.100094Z","signed_message":"canonical_sha256_bytes"},"source_id":"2605.29358","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:9962f27c5f6f272310cc49966321b08273492a67cbe5a7cd89211125fbad6721","sha256:03142d65c30f35e02338c21d4f7b08b481f92404e27c3977e68ba2edd21eee7d"],"state_sha256":"4f547e596cbd7acd1cebd37a1d3bea7a06d5201334d09aa50f99ea370103daef"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"kBZ5TouX73L0udtPRyzbNHBj5v2l9shd5cUM0T8x47oYk7ZmAv35+7USGo219WSxjfJyNjQsGHbHWPLIsI3qAA==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-30T11:04:28.635301Z","bundle_sha256":"43aec2563fe7fd1dffee7e40df2662651f095c4737d70671515945592845842e"}}