{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2026:PIOHWAR645K2FC7SZYL3WA257P","short_pith_number":"pith:PIOHWAR6","canonical_record":{"source":{"id":"2603.03205","kind":"arxiv","version":2},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2026-03-03T17:59:35Z","cross_cats_sorted":[],"title_canon_sha256":"1df978e18a5c759c347db9bc885f58c564b77b39139618c091724e6c0f5191c9","abstract_canon_sha256":"7fd198f5b62a52f10e53f0905903e55618d0e8ac9297d92570ad40b263f3c262"},"schema_version":"1.0"},"canonical_sha256":"7a1c7b023ee755a28bf2ce17bb035dfbd2f9d422f1cd68f29e162b977761e31c","source":{"kind":"arxiv","id":"2603.03205","version":2},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2603.03205","created_at":"2026-06-04T01:08:47Z"},{"alias_kind":"arxiv_version","alias_value":"2603.03205v2","created_at":"2026-06-04T01:08:47Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2603.03205","created_at":"2026-06-04T01:08:47Z"},{"alias_kind":"pith_short_12","alias_value":"PIOHWAR645K2","created_at":"2026-06-04T01:08:47Z"},{"alias_kind":"pith_short_16","alias_value":"PIOHWAR645K2FC7S","created_at":"2026-06-04T01:08:47Z"},{"alias_kind":"pith_short_8","alias_value":"PIOHWAR6","created_at":"2026-06-04T01:08:47Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2026:PIOHWAR645K2FC7SZYL3WA257P","target":"record","payload":{"canonical_record":{"source":{"id":"2603.03205","kind":"arxiv","version":2},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2026-03-03T17:59:35Z","cross_cats_sorted":[],"title_canon_sha256":"1df978e18a5c759c347db9bc885f58c564b77b39139618c091724e6c0f5191c9","abstract_canon_sha256":"7fd198f5b62a52f10e53f0905903e55618d0e8ac9297d92570ad40b263f3c262"},"schema_version":"1.0"},"canonical_sha256":"7a1c7b023ee755a28bf2ce17bb035dfbd2f9d422f1cd68f29e162b977761e31c","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-06-04T01:08:47.021469Z","signature_b64":"gP6FRVwoQ/ekOUllYmrLli1bGkPfij++CdTO8qKZMsYZUl5+20RvkAXnDdQ9qTlqRHkloPNV2Em8TYZBkmIdDw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"7a1c7b023ee755a28bf2ce17bb035dfbd2f9d422f1cd68f29e162b977761e31c","last_reissued_at":"2026-06-04T01:08:47.020701Z","signature_status":"signed_v1","first_computed_at":"2026-06-04T01:08:47.020701Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2603.03205","source_version":2,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-06-04T01:08:47Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"s2tMShB1Lx76jZsXN0+7rZdIfNSX1aRH/Ye+pG+WAWEgeOIRW09vrt8Ce2UHbLQnyCkio1+p2zw2D0+k66iYDQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-10T12:52:36.377283Z"},"content_sha256":"2cd9ba56f08b345c53571a57b15eeff1382e084b63c4d4326227d4acc2145f52","schema_version":"1.0","event_id":"sha256:2cd9ba56f08b345c53571a57b15eeff1382e084b63c4d4326227d4acc2145f52"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2026:PIOHWAR645K2FC7SZYL3WA257P","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Learning When to Act or Refuse: Guarding Agentic Reasoning Models for Safe Multi-Step Tool Use","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":[],"primary_cat":"cs.CL","authors_text":"Ahmed Awadallah, Akshay Nambi, Aradhye Agarwal, Gurdit Siyan, Joykirat Singh, Yash Pandya","submitted_at":"2026-03-03T17:59:35Z","abstract_excerpt":"Agentic language models operate in a fundamentally different safety regime than chat models: they must plan, call tools, and execute long-horizon actions where a single misstep, such as accessing files or entering credentials, can cause irreversible harm. Existing alignment methods, largely optimized for static generation and task completion, break down in these settings due to sequential decision-making, adversarial tool feedback, and overconfident intermediate reasoning. We introduce MOSAIC, a post-training framework that aligns agents for safe multi-step tool use by making safety decisions "},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2603.03205","kind":"arxiv","version":2},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2603.03205/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-06-04T01:08:47Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"Jen6SRk6CiHuhjSpdhPwhiqxEw7t/s3CWNkE9O8Z1DI+7abSA7NLNJna/IUJkREFOQMa77showMk8KpyNJX/BQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-10T12:52:36.378097Z"},"content_sha256":"acf88ed54db22387b2889737408b5db2293e2e267ce330c16daca55d924209cd","schema_version":"1.0","event_id":"sha256:acf88ed54db22387b2889737408b5db2293e2e267ce330c16daca55d924209cd"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/PIOHWAR645K2FC7SZYL3WA257P/bundle.json","state_url":"https://pith.science/pith/PIOHWAR645K2FC7SZYL3WA257P/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/PIOHWAR645K2FC7SZYL3WA257P/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-10T12:52:36Z","links":{"resolver":"https://pith.science/pith/PIOHWAR645K2FC7SZYL3WA257P","bundle":"https://pith.science/pith/PIOHWAR645K2FC7SZYL3WA257P/bundle.json","state":"https://pith.science/pith/PIOHWAR645K2FC7SZYL3WA257P/state.json","well_known_bundle":"https://pith.science/.well-known/pith/PIOHWAR645K2FC7SZYL3WA257P/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:PIOHWAR645K2FC7SZYL3WA257P","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"7fd198f5b62a52f10e53f0905903e55618d0e8ac9297d92570ad40b263f3c262","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2026-03-03T17:59:35Z","title_canon_sha256":"1df978e18a5c759c347db9bc885f58c564b77b39139618c091724e6c0f5191c9"},"schema_version":"1.0","source":{"id":"2603.03205","kind":"arxiv","version":2}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2603.03205","created_at":"2026-06-04T01:08:47Z"},{"alias_kind":"arxiv_version","alias_value":"2603.03205v2","created_at":"2026-06-04T01:08:47Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2603.03205","created_at":"2026-06-04T01:08:47Z"},{"alias_kind":"pith_short_12","alias_value":"PIOHWAR645K2","created_at":"2026-06-04T01:08:47Z"},{"alias_kind":"pith_short_16","alias_value":"PIOHWAR645K2FC7S","created_at":"2026-06-04T01:08:47Z"},{"alias_kind":"pith_short_8","alias_value":"PIOHWAR6","created_at":"2026-06-04T01:08:47Z"}],"graph_snapshots":[{"event_id":"sha256:acf88ed54db22387b2889737408b5db2293e2e267ce330c16daca55d924209cd","target":"graph","created_at":"2026-06-04T01:08:47Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2603.03205/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Agentic language models operate in a fundamentally different safety regime than chat models: they must plan, call tools, and execute long-horizon actions where a single misstep, such as accessing files or entering credentials, can cause irreversible harm. Existing alignment methods, largely optimized for static generation and task completion, break down in these settings due to sequential decision-making, adversarial tool feedback, and overconfident intermediate reasoning. We introduce MOSAIC, a post-training framework that aligns agents for safe multi-step tool use by making safety decisions ","authors_text":"Ahmed Awadallah, Akshay Nambi, Aradhye Agarwal, Gurdit Siyan, Joykirat Singh, Yash Pandya","cross_cats":[],"headline":"","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2026-03-03T17:59:35Z","title":"Learning When to Act or Refuse: Guarding Agentic Reasoning Models for Safe Multi-Step Tool Use"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2603.03205","kind":"arxiv","version":2},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:2cd9ba56f08b345c53571a57b15eeff1382e084b63c4d4326227d4acc2145f52","target":"record","created_at":"2026-06-04T01:08:47Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"7fd198f5b62a52f10e53f0905903e55618d0e8ac9297d92570ad40b263f3c262","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2026-03-03T17:59:35Z","title_canon_sha256":"1df978e18a5c759c347db9bc885f58c564b77b39139618c091724e6c0f5191c9"},"schema_version":"1.0","source":{"id":"2603.03205","kind":"arxiv","version":2}},"canonical_sha256":"7a1c7b023ee755a28bf2ce17bb035dfbd2f9d422f1cd68f29e162b977761e31c","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"7a1c7b023ee755a28bf2ce17bb035dfbd2f9d422f1cd68f29e162b977761e31c","first_computed_at":"2026-06-04T01:08:47.020701Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-06-04T01:08:47.020701Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"gP6FRVwoQ/ekOUllYmrLli1bGkPfij++CdTO8qKZMsYZUl5+20RvkAXnDdQ9qTlqRHkloPNV2Em8TYZBkmIdDw==","signature_status":"signed_v1","signed_at":"2026-06-04T01:08:47.021469Z","signed_message":"canonical_sha256_bytes"},"source_id":"2603.03205","source_kind":"arxiv","source_version":2}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:2cd9ba56f08b345c53571a57b15eeff1382e084b63c4d4326227d4acc2145f52","sha256:acf88ed54db22387b2889737408b5db2293e2e267ce330c16daca55d924209cd"],"state_sha256":"cac897ae79a98cb28108ef69938930383e18bca4d85789e105208f4766af8688"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"ctay6mgD1quihHbNJmCi5IRmVZaTCkIalyNxW/y4GUckN5yhhtZCjAAJ7VGVan+eiKQSkPx8aWDWQylLqW80DA==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-10T12:52:36.381966Z","bundle_sha256":"cc2f0430859346a4dfe7b07f5dc0434258733f79025ccf07010917c1b3099ccd"}}