{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2025:DFIU34BCCQOZB2JAZKRJU5LQHU","short_pith_number":"pith:DFIU34BC","canonical_record":{"source":{"id":"2505.11063","kind":"arxiv","version":3},"metadata":{"license":"http://creativecommons.org/licenses/by-nc-nd/4.0/","primary_cat":"cs.AI","submitted_at":"2025-05-16T10:00:15Z","cross_cats_sorted":["cs.CR"],"title_canon_sha256":"711b59bb075838dcc34c55d068321e3b16b81ccab1ea61fb1e6bff2a9d3b0d72","abstract_canon_sha256":"d23495679e14b62432017021b0edf3af2e642ef6dd299162375d8688d9397698"},"schema_version":"1.0"},"canonical_sha256":"19514df022141d90e920caa29a75703d28b3d6939cb366a928f241e37564e11d","source":{"kind":"arxiv","id":"2505.11063","version":3},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2505.11063","created_at":"2026-05-27T01:05:34Z"},{"alias_kind":"arxiv_version","alias_value":"2505.11063v3","created_at":"2026-05-27T01:05:34Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2505.11063","created_at":"2026-05-27T01:05:34Z"},{"alias_kind":"pith_short_12","alias_value":"DFIU34BCCQOZ","created_at":"2026-05-27T01:05:34Z"},{"alias_kind":"pith_short_16","alias_value":"DFIU34BCCQOZB2JA","created_at":"2026-05-27T01:05:34Z"},{"alias_kind":"pith_short_8","alias_value":"DFIU34BC","created_at":"2026-05-27T01:05:34Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2025:DFIU34BCCQOZB2JAZKRJU5LQHU","target":"record","payload":{"canonical_record":{"source":{"id":"2505.11063","kind":"arxiv","version":3},"metadata":{"license":"http://creativecommons.org/licenses/by-nc-nd/4.0/","primary_cat":"cs.AI","submitted_at":"2025-05-16T10:00:15Z","cross_cats_sorted":["cs.CR"],"title_canon_sha256":"711b59bb075838dcc34c55d068321e3b16b81ccab1ea61fb1e6bff2a9d3b0d72","abstract_canon_sha256":"d23495679e14b62432017021b0edf3af2e642ef6dd299162375d8688d9397698"},"schema_version":"1.0"},"canonical_sha256":"19514df022141d90e920caa29a75703d28b3d6939cb366a928f241e37564e11d","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-27T01:05:34.702024Z","signature_b64":"xOht33MC0SegRxVRNM+tjAhkfNFwlOEq054MzpMAl/VKMx07cyA3V8Ziy7w018JPqo9VwyZ6fJUN/15fdNKfAg==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"19514df022141d90e920caa29a75703d28b3d6939cb366a928f241e37564e11d","last_reissued_at":"2026-05-27T01:05:34.701297Z","signature_status":"signed_v1","first_computed_at":"2026-05-27T01:05:34.701297Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2505.11063","source_version":3,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-27T01:05:34Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"jDE1bXkQWJisktsEDX/8of6MvWEbXDjnQybBEKCeZd9AD/+wGf05TsHADlTqcP5wuzPs4KSjBz+451jKo0edBQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-01T03:29:24.802695Z"},"content_sha256":"0b99b9ff3ed5fe636e5e5ceb2c3e39ccdd0d3a12b67ca6dfe2082127fc821407","schema_version":"1.0","event_id":"sha256:0b99b9ff3ed5fe636e5e5ceb2c3e39ccdd0d3a12b67ca6dfe2082127fc821407"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2025:DFIU34BCCQOZB2JAZKRJU5LQHU","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Think Twice Before You Act: Enhancing Agent Behavioral Safety with Thought Correction","license":"http://creativecommons.org/licenses/by-nc-nd/4.0/","headline":"","cross_cats":["cs.CR"],"primary_cat":"cs.AI","authors_text":"Changyue Jiang, Geng Hong, Min Yang, Wenqi Zhang, Xudong Pan","submitted_at":"2025-05-16T10:00:15Z","abstract_excerpt":"LLM-based agents solve complex tasks through iterative reasoning, tool use, and environment interaction, where each intermediate thought directly shapes subsequent actions. Small deviations in these thoughts can therefore propagate into unsafe behaviors, yet existing guardrails typically operate only on final outputs or require intrusive model modifications. We introduce Thought-Aligner, a lightweight plug-in safety model that performs causal correction on unsafe thoughts before action execution, without altering the underlying agent. The corrected thoughts are fed back into the agent, steerin"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2505.11063","kind":"arxiv","version":3},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2505.11063/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-27T01:05:34Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"Mr3tvFGdEeqeHXCmx4fPDNL3Pe9HGRiyoVlaS4IT62a0SQKpRj2nItpBeJun4TTmS6Tj3Q07eLx4RfwMxb/PCg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-01T03:29:24.803077Z"},"content_sha256":"1b9303071af733782bbc954d8da9f96212c012aed03b883d879329d782ff3f1e","schema_version":"1.0","event_id":"sha256:1b9303071af733782bbc954d8da9f96212c012aed03b883d879329d782ff3f1e"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/DFIU34BCCQOZB2JAZKRJU5LQHU/bundle.json","state_url":"https://pith.science/pith/DFIU34BCCQOZB2JAZKRJU5LQHU/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/DFIU34BCCQOZB2JAZKRJU5LQHU/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-01T03:29:24Z","links":{"resolver":"https://pith.science/pith/DFIU34BCCQOZB2JAZKRJU5LQHU","bundle":"https://pith.science/pith/DFIU34BCCQOZB2JAZKRJU5LQHU/bundle.json","state":"https://pith.science/pith/DFIU34BCCQOZB2JAZKRJU5LQHU/state.json","well_known_bundle":"https://pith.science/.well-known/pith/DFIU34BCCQOZB2JAZKRJU5LQHU/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2025:DFIU34BCCQOZB2JAZKRJU5LQHU","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"d23495679e14b62432017021b0edf3af2e642ef6dd299162375d8688d9397698","cross_cats_sorted":["cs.CR"],"license":"http://creativecommons.org/licenses/by-nc-nd/4.0/","primary_cat":"cs.AI","submitted_at":"2025-05-16T10:00:15Z","title_canon_sha256":"711b59bb075838dcc34c55d068321e3b16b81ccab1ea61fb1e6bff2a9d3b0d72"},"schema_version":"1.0","source":{"id":"2505.11063","kind":"arxiv","version":3}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2505.11063","created_at":"2026-05-27T01:05:34Z"},{"alias_kind":"arxiv_version","alias_value":"2505.11063v3","created_at":"2026-05-27T01:05:34Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2505.11063","created_at":"2026-05-27T01:05:34Z"},{"alias_kind":"pith_short_12","alias_value":"DFIU34BCCQOZ","created_at":"2026-05-27T01:05:34Z"},{"alias_kind":"pith_short_16","alias_value":"DFIU34BCCQOZB2JA","created_at":"2026-05-27T01:05:34Z"},{"alias_kind":"pith_short_8","alias_value":"DFIU34BC","created_at":"2026-05-27T01:05:34Z"}],"graph_snapshots":[{"event_id":"sha256:1b9303071af733782bbc954d8da9f96212c012aed03b883d879329d782ff3f1e","target":"graph","created_at":"2026-05-27T01:05:34Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2505.11063/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"LLM-based agents solve complex tasks through iterative reasoning, tool use, and environment interaction, where each intermediate thought directly shapes subsequent actions. Small deviations in these thoughts can therefore propagate into unsafe behaviors, yet existing guardrails typically operate only on final outputs or require intrusive model modifications. We introduce Thought-Aligner, a lightweight plug-in safety model that performs causal correction on unsafe thoughts before action execution, without altering the underlying agent. The corrected thoughts are fed back into the agent, steerin","authors_text":"Changyue Jiang, Geng Hong, Min Yang, Wenqi Zhang, Xudong Pan","cross_cats":["cs.CR"],"headline":"","license":"http://creativecommons.org/licenses/by-nc-nd/4.0/","primary_cat":"cs.AI","submitted_at":"2025-05-16T10:00:15Z","title":"Think Twice Before You Act: Enhancing Agent Behavioral Safety with Thought Correction"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2505.11063","kind":"arxiv","version":3},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:0b99b9ff3ed5fe636e5e5ceb2c3e39ccdd0d3a12b67ca6dfe2082127fc821407","target":"record","created_at":"2026-05-27T01:05:34Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"d23495679e14b62432017021b0edf3af2e642ef6dd299162375d8688d9397698","cross_cats_sorted":["cs.CR"],"license":"http://creativecommons.org/licenses/by-nc-nd/4.0/","primary_cat":"cs.AI","submitted_at":"2025-05-16T10:00:15Z","title_canon_sha256":"711b59bb075838dcc34c55d068321e3b16b81ccab1ea61fb1e6bff2a9d3b0d72"},"schema_version":"1.0","source":{"id":"2505.11063","kind":"arxiv","version":3}},"canonical_sha256":"19514df022141d90e920caa29a75703d28b3d6939cb366a928f241e37564e11d","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"19514df022141d90e920caa29a75703d28b3d6939cb366a928f241e37564e11d","first_computed_at":"2026-05-27T01:05:34.701297Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-27T01:05:34.701297Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"xOht33MC0SegRxVRNM+tjAhkfNFwlOEq054MzpMAl/VKMx07cyA3V8Ziy7w018JPqo9VwyZ6fJUN/15fdNKfAg==","signature_status":"signed_v1","signed_at":"2026-05-27T01:05:34.702024Z","signed_message":"canonical_sha256_bytes"},"source_id":"2505.11063","source_kind":"arxiv","source_version":3}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:0b99b9ff3ed5fe636e5e5ceb2c3e39ccdd0d3a12b67ca6dfe2082127fc821407","sha256:1b9303071af733782bbc954d8da9f96212c012aed03b883d879329d782ff3f1e"],"state_sha256":"f1e7337f9aa57c3d1bda548586f205666b0a4e25840049047d6133899fa1f23b"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"0pBIxJRErE+uu2L9S1xT9S2SVqSOxBPcm1a1msERvnT7VB1IeLazcC+74RoClT+kjMcTB1JBgLH/gZI93sFrDQ==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-01T03:29:24.805210Z","bundle_sha256":"db5f7237017707579d0eb72ac986fc955e025dcc81f37547a8394dc70682c8f6"}}