{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2026:6QGFT45FHVLF4BMFA4OC2QMLR5","short_pith_number":"pith:6QGFT45F","canonical_record":{"source":{"id":"2606.08044","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2026-06-06T08:10:56Z","cross_cats_sorted":["cs.AI","cs.CL"],"title_canon_sha256":"9d7dd8d2b38696e6e60f17a6cae9f2f183f6622bf52880217498bbd3c4fd3833","abstract_canon_sha256":"556e1c4aae084ba071779e956758a5bcda175856c95bcc780756c134daa8d5ff"},"schema_version":"1.0"},"canonical_sha256":"f40c59f3a53d565e0585071c2d418b8f54f470302c2299c0d93120e5d4ef9c7c","source":{"kind":"arxiv","id":"2606.08044","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.08044","created_at":"2026-06-09T01:05:24Z"},{"alias_kind":"arxiv_version","alias_value":"2606.08044v1","created_at":"2026-06-09T01:05:24Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.08044","created_at":"2026-06-09T01:05:24Z"},{"alias_kind":"pith_short_12","alias_value":"6QGFT45FHVLF","created_at":"2026-06-09T01:05:24Z"},{"alias_kind":"pith_short_16","alias_value":"6QGFT45FHVLF4BMF","created_at":"2026-06-09T01:05:24Z"},{"alias_kind":"pith_short_8","alias_value":"6QGFT45F","created_at":"2026-06-09T01:05:24Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2026:6QGFT45FHVLF4BMFA4OC2QMLR5","target":"record","payload":{"canonical_record":{"source":{"id":"2606.08044","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2026-06-06T08:10:56Z","cross_cats_sorted":["cs.AI","cs.CL"],"title_canon_sha256":"9d7dd8d2b38696e6e60f17a6cae9f2f183f6622bf52880217498bbd3c4fd3833","abstract_canon_sha256":"556e1c4aae084ba071779e956758a5bcda175856c95bcc780756c134daa8d5ff"},"schema_version":"1.0"},"canonical_sha256":"f40c59f3a53d565e0585071c2d418b8f54f470302c2299c0d93120e5d4ef9c7c","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-06-09T01:05:24.237070Z","signature_b64":"+XTlk69gxc3XJ6OsfM/wgNQCSQsRAn2s/Jc835/J9C+k6KHk7gs9+o9U/S1iKL57Sapnq13I6k3jm0Sdk4pZDQ==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"f40c59f3a53d565e0585071c2d418b8f54f470302c2299c0d93120e5d4ef9c7c","last_reissued_at":"2026-06-09T01:05:24.236505Z","signature_status":"signed_v1","first_computed_at":"2026-06-09T01:05:24.236505Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2606.08044","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-06-09T01:05:24Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"GE1XLxw3buMT7Hje+yLkYrFhu80Ld0IBJ9xphLd+MlvRUin1mfdZsWHYJxTIy6i4CARi7lcg8ZDNd9dnXtEACA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-20T12:14:00.116330Z"},"content_sha256":"2f221a9b451db8e67e7862c9e40591109cfb3a8ae1e97e2cff6b52ff501de9b6","schema_version":"1.0","event_id":"sha256:2f221a9b451db8e67e7862c9e40591109cfb3a8ae1e97e2cff6b52ff501de9b6"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2026:6QGFT45FHVLF4BMFA4OC2QMLR5","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"When Behavioral Safety Evaluation Fails: A Representation-Level Perspective","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":["cs.AI","cs.CL"],"primary_cat":"cs.LG","authors_text":"Anders Gj{\\o}lbye, Enyi Jiang, Sanmi Koyejo, Yibo Jacky Zhang","submitted_at":"2026-06-06T08:10:56Z","abstract_excerpt":"Large Language Model (LLM) safety has often been evaluated at the behavior level, which provides limited evidence of internal robustness, as these evaluations target outputs rather than representation-level vulnerability under intervention. We formalize this discrepancy as the audit gap: the difference between behavioral safety and robustness under intervention. To study this gap, we construct dissociated models that preserve safe outward behavior while remaining vulnerable in the latent space. We introduce an intervention-based evaluation framework to test model robustness through soft interv"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.08044","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2606.08044/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-06-09T01:05:24Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"EMqR8z7N5nhaiIEhGCDRDYixA963sqjbPU6L+8HtjV1VkrERJiG4hC6LtByFeff4XoGjpnwITiVioMHW5rVhCw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-20T12:14:00.116736Z"},"content_sha256":"2584bb0b382515969ab0ca461dbbb5e1d4c1a14190c1530759dc0dbe7b33fa96","schema_version":"1.0","event_id":"sha256:2584bb0b382515969ab0ca461dbbb5e1d4c1a14190c1530759dc0dbe7b33fa96"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/6QGFT45FHVLF4BMFA4OC2QMLR5/bundle.json","state_url":"https://pith.science/pith/6QGFT45FHVLF4BMFA4OC2QMLR5/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/6QGFT45FHVLF4BMFA4OC2QMLR5/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-20T12:14:00Z","links":{"resolver":"https://pith.science/pith/6QGFT45FHVLF4BMFA4OC2QMLR5","bundle":"https://pith.science/pith/6QGFT45FHVLF4BMFA4OC2QMLR5/bundle.json","state":"https://pith.science/pith/6QGFT45FHVLF4BMFA4OC2QMLR5/state.json","well_known_bundle":"https://pith.science/.well-known/pith/6QGFT45FHVLF4BMFA4OC2QMLR5/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:6QGFT45FHVLF4BMFA4OC2QMLR5","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"556e1c4aae084ba071779e956758a5bcda175856c95bcc780756c134daa8d5ff","cross_cats_sorted":["cs.AI","cs.CL"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2026-06-06T08:10:56Z","title_canon_sha256":"9d7dd8d2b38696e6e60f17a6cae9f2f183f6622bf52880217498bbd3c4fd3833"},"schema_version":"1.0","source":{"id":"2606.08044","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.08044","created_at":"2026-06-09T01:05:24Z"},{"alias_kind":"arxiv_version","alias_value":"2606.08044v1","created_at":"2026-06-09T01:05:24Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.08044","created_at":"2026-06-09T01:05:24Z"},{"alias_kind":"pith_short_12","alias_value":"6QGFT45FHVLF","created_at":"2026-06-09T01:05:24Z"},{"alias_kind":"pith_short_16","alias_value":"6QGFT45FHVLF4BMF","created_at":"2026-06-09T01:05:24Z"},{"alias_kind":"pith_short_8","alias_value":"6QGFT45F","created_at":"2026-06-09T01:05:24Z"}],"graph_snapshots":[{"event_id":"sha256:2584bb0b382515969ab0ca461dbbb5e1d4c1a14190c1530759dc0dbe7b33fa96","target":"graph","created_at":"2026-06-09T01:05:24Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2606.08044/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Large Language Model (LLM) safety has often been evaluated at the behavior level, which provides limited evidence of internal robustness, as these evaluations target outputs rather than representation-level vulnerability under intervention. We formalize this discrepancy as the audit gap: the difference between behavioral safety and robustness under intervention. To study this gap, we construct dissociated models that preserve safe outward behavior while remaining vulnerable in the latent space. We introduce an intervention-based evaluation framework to test model robustness through soft interv","authors_text":"Anders Gj{\\o}lbye, Enyi Jiang, Sanmi Koyejo, Yibo Jacky Zhang","cross_cats":["cs.AI","cs.CL"],"headline":"","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2026-06-06T08:10:56Z","title":"When Behavioral Safety Evaluation Fails: A Representation-Level Perspective"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.08044","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:2f221a9b451db8e67e7862c9e40591109cfb3a8ae1e97e2cff6b52ff501de9b6","target":"record","created_at":"2026-06-09T01:05:24Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"556e1c4aae084ba071779e956758a5bcda175856c95bcc780756c134daa8d5ff","cross_cats_sorted":["cs.AI","cs.CL"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2026-06-06T08:10:56Z","title_canon_sha256":"9d7dd8d2b38696e6e60f17a6cae9f2f183f6622bf52880217498bbd3c4fd3833"},"schema_version":"1.0","source":{"id":"2606.08044","kind":"arxiv","version":1}},"canonical_sha256":"f40c59f3a53d565e0585071c2d418b8f54f470302c2299c0d93120e5d4ef9c7c","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"f40c59f3a53d565e0585071c2d418b8f54f470302c2299c0d93120e5d4ef9c7c","first_computed_at":"2026-06-09T01:05:24.236505Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-06-09T01:05:24.236505Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"+XTlk69gxc3XJ6OsfM/wgNQCSQsRAn2s/Jc835/J9C+k6KHk7gs9+o9U/S1iKL57Sapnq13I6k3jm0Sdk4pZDQ==","signature_status":"signed_v1","signed_at":"2026-06-09T01:05:24.237070Z","signed_message":"canonical_sha256_bytes"},"source_id":"2606.08044","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:2f221a9b451db8e67e7862c9e40591109cfb3a8ae1e97e2cff6b52ff501de9b6","sha256:2584bb0b382515969ab0ca461dbbb5e1d4c1a14190c1530759dc0dbe7b33fa96"],"state_sha256":"d3a1184b9e857c8468b1739cb6a60e378558d7fd2ebbea8ebc322a595393ec77"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"jTVp4pp2VrJzi6bGaOkdDyS+c5Y5gT3V8qdubLa76W/qFp9CvVNWIl3hrMpSMedqA2V9FJ7Fz2qkMhw4Ye9pBg==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-20T12:14:00.118968Z","bundle_sha256":"5b4e2aeb9d19c8a5cffc28a18227470f7b5900657a62cacb51965437ba4d8e08"}}