{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:PSAVKVWW7JB4VENVAVVVOVSSCW","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"df5733a0ca469b16a87e703a1ecb07f1a3e07824dbc2e41ff0e41e58f9449134","cross_cats_sorted":["cs.AI"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CR","submitted_at":"2026-05-15T20:46:46Z","title_canon_sha256":"3cb634ce04f3de19af96b3ee794d5b50fad63538b55d1d22223b8695f43cb2d0"},"schema_version":"1.0","source":{"id":"2605.16626","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2605.16626","created_at":"2026-05-20T00:02:33Z"},{"alias_kind":"arxiv_version","alias_value":"2605.16626v1","created_at":"2026-05-20T00:02:33Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.16626","created_at":"2026-05-20T00:02:33Z"},{"alias_kind":"pith_short_12","alias_value":"PSAVKVWW7JB4","created_at":"2026-05-20T00:02:33Z"},{"alias_kind":"pith_short_16","alias_value":"PSAVKVWW7JB4VENV","created_at":"2026-05-20T00:02:33Z"},{"alias_kind":"pith_short_8","alias_value":"PSAVKVWW","created_at":"2026-05-20T00:02:33Z"}],"graph_snapshots":[{"event_id":"sha256:98b7a7ab3251eab5983fcbfd94248a8fefe2077c455a1fd030a920b9651d09c2","target":"graph","created_at":"2026-05-20T00:02:33Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[{"findings_count":0,"name":"claim_evidence","ran_at":"2026-05-19T19:21:56.757891Z","status":"completed","version":"1.0.0"},{"findings_count":0,"name":"ai_meta_artifact","ran_at":"2026-05-19T18:33:26.584678Z","status":"skipped","version":"1.0.0"}],"endpoint":"/pith/2605.16626/integrity.json","findings":[],"snapshot_sha256":"137f3789de904472a64defe5979b0b17fd79f6f2d9590d5e4d77d0e52e4d0d0c","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Since autonomous coding agents generate complex behaviors at high-volume, we may want to use other LLMs to monitor actions to reduce the risk from dangerous misaligned behavior. To better understand the limitations of such monitors against the diverse attack strategies that a coding agent could use, we present SLEIGHT-Bench (Subtle Low-itEration Insight-Guided Harmful Transcripts), a benchmark of synthetic transcripts containing 40 attacks across 11 categories, each showing a coding agent covertly pursuing a harmful objective (e.g. weight exfiltration, credential theft, unmonitored rogue deplo","authors_text":"Colin Toft, Elle Najt, Fabien Roger, Joe Benton, Tyler Tracy","cross_cats":["cs.AI"],"headline":"","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CR","submitted_at":"2026-05-15T20:46:46Z","title":"SLEIGHT-Bench: A Benchmark of Evasion Attacks Against Agent Monitors"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2605.16626","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:c094bddc0ff3ca381a2c640aef077144f9ce22a9ab56a591a88aeffbb9c5a2e7","target":"record","created_at":"2026-05-20T00:02:33Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"df5733a0ca469b16a87e703a1ecb07f1a3e07824dbc2e41ff0e41e58f9449134","cross_cats_sorted":["cs.AI"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CR","submitted_at":"2026-05-15T20:46:46Z","title_canon_sha256":"3cb634ce04f3de19af96b3ee794d5b50fad63538b55d1d22223b8695f43cb2d0"},"schema_version":"1.0","source":{"id":"2605.16626","kind":"arxiv","version":1}},"canonical_sha256":"7c815556d6fa43ca91b5056b575652158c81dd2e69a68a67ee2241440c8a509e","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"7c815556d6fa43ca91b5056b575652158c81dd2e69a68a67ee2241440c8a509e","first_computed_at":"2026-05-20T00:02:33.132310Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-20T00:02:33.132310Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"7p4Amx2oY9wP/NJMeqIFhRVU8xoVZk13JhRr4JUZ4R7dyn4b23d0ik60rQfTBADuBdt7NR0jhoPez0G5MVxiCA==","signature_status":"signed_v1","signed_at":"2026-05-20T00:02:33.133134Z","signed_message":"canonical_sha256_bytes"},"source_id":"2605.16626","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:c094bddc0ff3ca381a2c640aef077144f9ce22a9ab56a591a88aeffbb9c5a2e7","sha256:98b7a7ab3251eab5983fcbfd94248a8fefe2077c455a1fd030a920b9651d09c2"],"state_sha256":"9a69edf8d6f4fa1ba0b1e7c41febaa7c4662c7aff41858f3861edfe58803a357"}