{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2026:6CPH4PCDD5XSFMCBR7PQK2MFSF","short_pith_number":"pith:6CPH4PCD","canonical_record":{"source":{"id":"2606.02211","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2026-06-01T13:10:49Z","cross_cats_sorted":["cs.AI"],"title_canon_sha256":"a9dd3eea768a0f3b63e201acf7f9ec16c594cb67c9317a6d71f5a34aeac8c17a","abstract_canon_sha256":"5b194b02cf6967b277482d8fc6f8c2271eefaf6dec10203d16fc961533eac243"},"schema_version":"1.0"},"canonical_sha256":"f09e7e3c431f6f22b0418fdf056985915b58e834533955916f013f6864c71901","source":{"kind":"arxiv","id":"2606.02211","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.02211","created_at":"2026-06-02T03:04:53Z"},{"alias_kind":"arxiv_version","alias_value":"2606.02211v1","created_at":"2026-06-02T03:04:53Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.02211","created_at":"2026-06-02T03:04:53Z"},{"alias_kind":"pith_short_12","alias_value":"6CPH4PCDD5XS","created_at":"2026-06-02T03:04:53Z"},{"alias_kind":"pith_short_16","alias_value":"6CPH4PCDD5XSFMCB","created_at":"2026-06-02T03:04:53Z"},{"alias_kind":"pith_short_8","alias_value":"6CPH4PCD","created_at":"2026-06-02T03:04:53Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2026:6CPH4PCDD5XSFMCBR7PQK2MFSF","target":"record","payload":{"canonical_record":{"source":{"id":"2606.02211","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2026-06-01T13:10:49Z","cross_cats_sorted":["cs.AI"],"title_canon_sha256":"a9dd3eea768a0f3b63e201acf7f9ec16c594cb67c9317a6d71f5a34aeac8c17a","abstract_canon_sha256":"5b194b02cf6967b277482d8fc6f8c2271eefaf6dec10203d16fc961533eac243"},"schema_version":"1.0"},"canonical_sha256":"f09e7e3c431f6f22b0418fdf056985915b58e834533955916f013f6864c71901","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-06-02T03:04:53.201828Z","signature_b64":"AfF/GtfC2GPZErGBu1MNb1z26TRP3jr/w0PMnuCCrXX4pUFOMfuvkeUL3khyrBROdPK8HjK6rNdMUUL3R0GzAg==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"f09e7e3c431f6f22b0418fdf056985915b58e834533955916f013f6864c71901","last_reissued_at":"2026-06-02T03:04:53.201484Z","signature_status":"signed_v1","first_computed_at":"2026-06-02T03:04:53.201484Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2606.02211","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-06-02T03:04:53Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"AEliWwGpP0rpDBBGQ9P5niLtVfx2Wa4ZtAgxYt+xBOcoHFNEZMwMJXK9BV04kDf5Wmu5TjpyOt4nEhYUWT0OCA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-10T09:34:51.805071Z"},"content_sha256":"c53c233396ca39535bbb071d1b4b703051f094f319961a3f35f5c4d82ecf4e24","schema_version":"1.0","event_id":"sha256:c53c233396ca39535bbb071d1b4b703051f094f319961a3f35f5c4d82ecf4e24"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2026:6CPH4PCDD5XSFMCBR7PQK2MFSF","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Consistency Training while Mitigating Obfuscation via Rate Matching","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":["cs.AI"],"primary_cat":"cs.CL","authors_text":"David Demitri Africa, Jannes Elstner, Prakhar Gupta, Sohaib Imran","submitted_at":"2026-06-01T13:10:49Z","abstract_excerpt":"Large language models are often influenced by extraneous input features, such as cues revealing a user's preferred answer. Consistency training reduces this influence by training models to behave similarly across inputs with and without the extraneous feature. However, existing methods train for consistency over entire responses or internal activations, which also constrains whether the model verbalises said extraneous features. We show this leads to obfuscation, where the model learns not to mention a cue while remaining influenced by it, which may undermine monitorability. To address this, w"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.02211","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2606.02211/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-06-02T03:04:53Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"XhMMd6tUTL1fVEGR8fTgB7AIt2ZWANffdLdDL42xSX+WbIV+j4E6xUjBnmWE7mR7gMLyKYW/39hLiCcSE9vGCw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-10T09:34:51.805841Z"},"content_sha256":"cd7216392ebb7ecadc2a0d4eb0c11972b5fcd50eca90aca95fdfa83ce637f309","schema_version":"1.0","event_id":"sha256:cd7216392ebb7ecadc2a0d4eb0c11972b5fcd50eca90aca95fdfa83ce637f309"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/6CPH4PCDD5XSFMCBR7PQK2MFSF/bundle.json","state_url":"https://pith.science/pith/6CPH4PCDD5XSFMCBR7PQK2MFSF/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/6CPH4PCDD5XSFMCBR7PQK2MFSF/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-10T09:34:51Z","links":{"resolver":"https://pith.science/pith/6CPH4PCDD5XSFMCBR7PQK2MFSF","bundle":"https://pith.science/pith/6CPH4PCDD5XSFMCBR7PQK2MFSF/bundle.json","state":"https://pith.science/pith/6CPH4PCDD5XSFMCBR7PQK2MFSF/state.json","well_known_bundle":"https://pith.science/.well-known/pith/6CPH4PCDD5XSFMCBR7PQK2MFSF/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:6CPH4PCDD5XSFMCBR7PQK2MFSF","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"5b194b02cf6967b277482d8fc6f8c2271eefaf6dec10203d16fc961533eac243","cross_cats_sorted":["cs.AI"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2026-06-01T13:10:49Z","title_canon_sha256":"a9dd3eea768a0f3b63e201acf7f9ec16c594cb67c9317a6d71f5a34aeac8c17a"},"schema_version":"1.0","source":{"id":"2606.02211","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.02211","created_at":"2026-06-02T03:04:53Z"},{"alias_kind":"arxiv_version","alias_value":"2606.02211v1","created_at":"2026-06-02T03:04:53Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.02211","created_at":"2026-06-02T03:04:53Z"},{"alias_kind":"pith_short_12","alias_value":"6CPH4PCDD5XS","created_at":"2026-06-02T03:04:53Z"},{"alias_kind":"pith_short_16","alias_value":"6CPH4PCDD5XSFMCB","created_at":"2026-06-02T03:04:53Z"},{"alias_kind":"pith_short_8","alias_value":"6CPH4PCD","created_at":"2026-06-02T03:04:53Z"}],"graph_snapshots":[{"event_id":"sha256:cd7216392ebb7ecadc2a0d4eb0c11972b5fcd50eca90aca95fdfa83ce637f309","target":"graph","created_at":"2026-06-02T03:04:53Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2606.02211/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Large language models are often influenced by extraneous input features, such as cues revealing a user's preferred answer. Consistency training reduces this influence by training models to behave similarly across inputs with and without the extraneous feature. However, existing methods train for consistency over entire responses or internal activations, which also constrains whether the model verbalises said extraneous features. We show this leads to obfuscation, where the model learns not to mention a cue while remaining influenced by it, which may undermine monitorability. To address this, w","authors_text":"David Demitri Africa, Jannes Elstner, Prakhar Gupta, Sohaib Imran","cross_cats":["cs.AI"],"headline":"","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2026-06-01T13:10:49Z","title":"Consistency Training while Mitigating Obfuscation via Rate Matching"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.02211","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:c53c233396ca39535bbb071d1b4b703051f094f319961a3f35f5c4d82ecf4e24","target":"record","created_at":"2026-06-02T03:04:53Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"5b194b02cf6967b277482d8fc6f8c2271eefaf6dec10203d16fc961533eac243","cross_cats_sorted":["cs.AI"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2026-06-01T13:10:49Z","title_canon_sha256":"a9dd3eea768a0f3b63e201acf7f9ec16c594cb67c9317a6d71f5a34aeac8c17a"},"schema_version":"1.0","source":{"id":"2606.02211","kind":"arxiv","version":1}},"canonical_sha256":"f09e7e3c431f6f22b0418fdf056985915b58e834533955916f013f6864c71901","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"f09e7e3c431f6f22b0418fdf056985915b58e834533955916f013f6864c71901","first_computed_at":"2026-06-02T03:04:53.201484Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-06-02T03:04:53.201484Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"AfF/GtfC2GPZErGBu1MNb1z26TRP3jr/w0PMnuCCrXX4pUFOMfuvkeUL3khyrBROdPK8HjK6rNdMUUL3R0GzAg==","signature_status":"signed_v1","signed_at":"2026-06-02T03:04:53.201828Z","signed_message":"canonical_sha256_bytes"},"source_id":"2606.02211","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:c53c233396ca39535bbb071d1b4b703051f094f319961a3f35f5c4d82ecf4e24","sha256:cd7216392ebb7ecadc2a0d4eb0c11972b5fcd50eca90aca95fdfa83ce637f309"],"state_sha256":"90819958a5ae34349af8dcc271c7d2f76983395ab93ec704b6df88a95241a457"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"ib8nsTYwIZvQxGVHhULhkgEjye3rVOl4xw59/iznBCKScHbetF40eTXZvAR3k9d3pKelwaWO3+uF1yeL4hsrBw==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-10T09:34:51.810192Z","bundle_sha256":"4b2230258d0f1fdb79a90dbd897578c5b66cd43e2fa15735bb3501a82eaabc92"}}