{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2026:TVQUCMNG3TAP6UQQ3ZP5INE4ME","short_pith_number":"pith:TVQUCMNG","canonical_record":{"source":{"id":"2606.26155","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.AI","submitted_at":"2026-06-23T20:10:53Z","cross_cats_sorted":[],"title_canon_sha256":"518aaa0dc732829f6a8b0ddfc45413001f6f87296af33075d3bb669dc767bc26","abstract_canon_sha256":"fa35162ecc407015117ae44256f66481cda3a3168f39b2ae5a9ec1943c229041"},"schema_version":"1.0"},"canonical_sha256":"9d614131a6dcc0ff5210de5fd4349c6116431904fb2eeea0b465f18059f75cac","source":{"kind":"arxiv","id":"2606.26155","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.26155","created_at":"2026-06-26T00:15:27Z"},{"alias_kind":"arxiv_version","alias_value":"2606.26155v1","created_at":"2026-06-26T00:15:27Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.26155","created_at":"2026-06-26T00:15:27Z"},{"alias_kind":"pith_short_12","alias_value":"TVQUCMNG3TAP","created_at":"2026-06-26T00:15:27Z"},{"alias_kind":"pith_short_16","alias_value":"TVQUCMNG3TAP6UQQ","created_at":"2026-06-26T00:15:27Z"},{"alias_kind":"pith_short_8","alias_value":"TVQUCMNG","created_at":"2026-06-26T00:15:27Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2026:TVQUCMNG3TAP6UQQ3ZP5INE4ME","target":"record","payload":{"canonical_record":{"source":{"id":"2606.26155","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.AI","submitted_at":"2026-06-23T20:10:53Z","cross_cats_sorted":[],"title_canon_sha256":"518aaa0dc732829f6a8b0ddfc45413001f6f87296af33075d3bb669dc767bc26","abstract_canon_sha256":"fa35162ecc407015117ae44256f66481cda3a3168f39b2ae5a9ec1943c229041"},"schema_version":"1.0"},"canonical_sha256":"9d614131a6dcc0ff5210de5fd4349c6116431904fb2eeea0b465f18059f75cac","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-06-26T00:15:27.442672Z","signature_b64":"dWiGLwt2jmFrkkQcYtXiHBChMe2GQPIzNLXeBxVnM4X4twND7GDNniSVatcX2lj7g6hosoUgttbOHxYuKr/tAA==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"9d614131a6dcc0ff5210de5fd4349c6116431904fb2eeea0b465f18059f75cac","last_reissued_at":"2026-06-26T00:15:27.442135Z","signature_status":"signed_v1","first_computed_at":"2026-06-26T00:15:27.442135Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2606.26155","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-06-26T00:15:27Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"d0m+TnGHYK6JQPGIBhRODtamWt2ekwuAuPtwOniB4Bo4QJuzRHSmtj5m+Zg0UbLmHHOefgeo9d/lMGj9ghZ6DQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-07-05T02:45:25.868800Z"},"content_sha256":"1f9714a757d8c772ab7196e704831772de6ffd8f28ade733f1c7f03f7a082101","schema_version":"1.0","event_id":"sha256:1f9714a757d8c772ab7196e704831772de6ffd8f28ade733f1c7f03f7a082101"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2026:TVQUCMNG3TAP6UQQ3ZP5INE4ME","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Detecting and Controlling Sycophancy with Cascading Linear Features","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":[],"primary_cat":"cs.AI","authors_text":"Chris Bregler, Maty Bohacek, Nicholas Dufour, Rishub Jain, Roma Patel, Thomas Leung","submitted_at":"2026-06-23T20:10:53Z","abstract_excerpt":"Interpreting and controlling model behaviors through activation steering methods requires many pairs of contrastive samples that clearly exhibit desired or undesired behavior. These data pairs determine the degree to which interpretability frameworks can reliably detect model features responsible for a behavior, and therefore the ability to steer models toward or away from such behavior. In this work, we present an iterative data generation pipeline that isolates cascading linear features responsible for a behavior. Specifically, we show how moving beyond simple binary pairs of samples, and in"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.26155","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2606.26155/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-06-26T00:15:27Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"LFoYt9VM7n2lcbn8ONMrkSkF6yPlTuJ6YHuBQOsdgI3XDFot8YplCMtXGu4X8aCptCFT2p+y4/Svmmhqi94NCA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-07-05T02:45:25.869168Z"},"content_sha256":"3e9686e081a59e53cc8447a7e94e7480d593d6cde3596f61bd056e4b37d80e86","schema_version":"1.0","event_id":"sha256:3e9686e081a59e53cc8447a7e94e7480d593d6cde3596f61bd056e4b37d80e86"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/TVQUCMNG3TAP6UQQ3ZP5INE4ME/bundle.json","state_url":"https://pith.science/pith/TVQUCMNG3TAP6UQQ3ZP5INE4ME/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/TVQUCMNG3TAP6UQQ3ZP5INE4ME/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-07-05T02:45:25Z","links":{"resolver":"https://pith.science/pith/TVQUCMNG3TAP6UQQ3ZP5INE4ME","bundle":"https://pith.science/pith/TVQUCMNG3TAP6UQQ3ZP5INE4ME/bundle.json","state":"https://pith.science/pith/TVQUCMNG3TAP6UQQ3ZP5INE4ME/state.json","well_known_bundle":"https://pith.science/.well-known/pith/TVQUCMNG3TAP6UQQ3ZP5INE4ME/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:TVQUCMNG3TAP6UQQ3ZP5INE4ME","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"fa35162ecc407015117ae44256f66481cda3a3168f39b2ae5a9ec1943c229041","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.AI","submitted_at":"2026-06-23T20:10:53Z","title_canon_sha256":"518aaa0dc732829f6a8b0ddfc45413001f6f87296af33075d3bb669dc767bc26"},"schema_version":"1.0","source":{"id":"2606.26155","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.26155","created_at":"2026-06-26T00:15:27Z"},{"alias_kind":"arxiv_version","alias_value":"2606.26155v1","created_at":"2026-06-26T00:15:27Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.26155","created_at":"2026-06-26T00:15:27Z"},{"alias_kind":"pith_short_12","alias_value":"TVQUCMNG3TAP","created_at":"2026-06-26T00:15:27Z"},{"alias_kind":"pith_short_16","alias_value":"TVQUCMNG3TAP6UQQ","created_at":"2026-06-26T00:15:27Z"},{"alias_kind":"pith_short_8","alias_value":"TVQUCMNG","created_at":"2026-06-26T00:15:27Z"}],"graph_snapshots":[{"event_id":"sha256:3e9686e081a59e53cc8447a7e94e7480d593d6cde3596f61bd056e4b37d80e86","target":"graph","created_at":"2026-06-26T00:15:27Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2606.26155/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Interpreting and controlling model behaviors through activation steering methods requires many pairs of contrastive samples that clearly exhibit desired or undesired behavior. These data pairs determine the degree to which interpretability frameworks can reliably detect model features responsible for a behavior, and therefore the ability to steer models toward or away from such behavior. In this work, we present an iterative data generation pipeline that isolates cascading linear features responsible for a behavior. Specifically, we show how moving beyond simple binary pairs of samples, and in","authors_text":"Chris Bregler, Maty Bohacek, Nicholas Dufour, Rishub Jain, Roma Patel, Thomas Leung","cross_cats":[],"headline":"","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.AI","submitted_at":"2026-06-23T20:10:53Z","title":"Detecting and Controlling Sycophancy with Cascading Linear Features"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.26155","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:1f9714a757d8c772ab7196e704831772de6ffd8f28ade733f1c7f03f7a082101","target":"record","created_at":"2026-06-26T00:15:27Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"fa35162ecc407015117ae44256f66481cda3a3168f39b2ae5a9ec1943c229041","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.AI","submitted_at":"2026-06-23T20:10:53Z","title_canon_sha256":"518aaa0dc732829f6a8b0ddfc45413001f6f87296af33075d3bb669dc767bc26"},"schema_version":"1.0","source":{"id":"2606.26155","kind":"arxiv","version":1}},"canonical_sha256":"9d614131a6dcc0ff5210de5fd4349c6116431904fb2eeea0b465f18059f75cac","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"9d614131a6dcc0ff5210de5fd4349c6116431904fb2eeea0b465f18059f75cac","first_computed_at":"2026-06-26T00:15:27.442135Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-06-26T00:15:27.442135Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"dWiGLwt2jmFrkkQcYtXiHBChMe2GQPIzNLXeBxVnM4X4twND7GDNniSVatcX2lj7g6hosoUgttbOHxYuKr/tAA==","signature_status":"signed_v1","signed_at":"2026-06-26T00:15:27.442672Z","signed_message":"canonical_sha256_bytes"},"source_id":"2606.26155","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:1f9714a757d8c772ab7196e704831772de6ffd8f28ade733f1c7f03f7a082101","sha256:3e9686e081a59e53cc8447a7e94e7480d593d6cde3596f61bd056e4b37d80e86"],"state_sha256":"968fa346c12482667098b732aa3eaf6e0041679709120b3295dfaccc3d126938"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"B3BeQKB7UPcxyhwJvGIo7lXl7zi4vTQvLFUTiYrp4PqI79o2cECgJou7NuKHxiVeWjeQAVYJ/SHBhXHe/+WLCQ==","signed_message":"bundle_sha256_bytes","signed_at":"2026-07-05T02:45:25.871090Z","bundle_sha256":"b2adb8dcd9b5e3b7af72ef589f98dec22b5330f2debd093a4b78cdf846d9b270"}}