{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2026:F5GTU5NN47TFPIUJEKLNXTADMG","short_pith_number":"pith:F5GTU5NN","canonical_record":{"source":{"id":"2606.03601","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.SE","submitted_at":"2026-06-02T13:07:12Z","cross_cats_sorted":["cs.AI"],"title_canon_sha256":"532b07cc5142a45d904fd815ed1ad3e907b5fc25f2fc9d3c60cf4e8371ed737d","abstract_canon_sha256":"1556dd409a9dc898d7874028a9070d0888ce592a208e0996f66a335bf0871db7"},"schema_version":"1.0"},"canonical_sha256":"2f4d3a75ade7e657a2892296dbcc03619d20955fa4a7e8328d3b1f13e52fd2a5","source":{"kind":"arxiv","id":"2606.03601","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.03601","created_at":"2026-06-03T01:06:02Z"},{"alias_kind":"arxiv_version","alias_value":"2606.03601v1","created_at":"2026-06-03T01:06:02Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.03601","created_at":"2026-06-03T01:06:02Z"},{"alias_kind":"pith_short_12","alias_value":"F5GTU5NN47TF","created_at":"2026-06-03T01:06:02Z"},{"alias_kind":"pith_short_16","alias_value":"F5GTU5NN47TFPIUJ","created_at":"2026-06-03T01:06:02Z"},{"alias_kind":"pith_short_8","alias_value":"F5GTU5NN","created_at":"2026-06-03T01:06:02Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2026:F5GTU5NN47TFPIUJEKLNXTADMG","target":"record","payload":{"canonical_record":{"source":{"id":"2606.03601","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.SE","submitted_at":"2026-06-02T13:07:12Z","cross_cats_sorted":["cs.AI"],"title_canon_sha256":"532b07cc5142a45d904fd815ed1ad3e907b5fc25f2fc9d3c60cf4e8371ed737d","abstract_canon_sha256":"1556dd409a9dc898d7874028a9070d0888ce592a208e0996f66a335bf0871db7"},"schema_version":"1.0"},"canonical_sha256":"2f4d3a75ade7e657a2892296dbcc03619d20955fa4a7e8328d3b1f13e52fd2a5","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-06-03T01:06:02.046258Z","signature_b64":"/cgDvguaEMmG4aylqFUPsrdjrrSyOQsB8syz6CSYJdPi5mkMYLt59kFYn3edTWpx4WvO1PovJXM8+wNMMO4NAw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"2f4d3a75ade7e657a2892296dbcc03619d20955fa4a7e8328d3b1f13e52fd2a5","last_reissued_at":"2026-06-03T01:06:02.045779Z","signature_status":"signed_v1","first_computed_at":"2026-06-03T01:06:02.045779Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2606.03601","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-06-03T01:06:02Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"BiI9pz4HWz4hpFh3Fs/GkeTdyLoq5ng3aP1NC6lW/YxTifQg3rmpuBm9CuhStu7BVKBxsQTxnEpGT/F8WMgEDQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-11T07:14:11.003074Z"},"content_sha256":"a218c956e359ac6d87836a94c3cfe1b540def3ae9138a2cdd9c643f870404540","schema_version":"1.0","event_id":"sha256:a218c956e359ac6d87836a94c3cfe1b540def3ae9138a2cdd9c643f870404540"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2026:F5GTU5NN47TFPIUJEKLNXTADMG","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"DDOR: Delta Debugging for Explainable Overrefusal Testing and Repair","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.AI"],"primary_cat":"cs.SE","authors_text":"Dongxia Wang, Haonan Zhang, Jun Sun, Peixin Zhang, Qinyan Zhou","submitted_at":"2026-06-02T13:07:12Z","abstract_excerpt":"While safety alignment and guardrails help large language models (LLMs) avoid harmful outputs, they can also induce overrefusal, i.e., unwarranted rejection of benign queries that merely appear risky. We present DDOR (Delta Debugging for OverRefusal), a fully automated and explainable framework for overrefusal testing and repair in a black-box setting, where only model inputs and outputs are accessible and internal safety mechanisms remain opaque. DDOR applies delta debugging to localize minimal refusal-triggering fragments (mRTFs) that provide phrase-level, explainable evidence for why a refu"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.03601","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2606.03601/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-06-03T01:06:02Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"64dEYGiOsTXDnWNOMt/54pGkfvxCdbKHw6DXl0w5BhAYOOFCwATlPuHAK33eCWvLyrk7VebJZ9gaaNBVb+BuAw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-11T07:14:11.003699Z"},"content_sha256":"60fe6a617bab17bfc4db08e7fcde0adcd54f48c1e91575a02fd0777457712e12","schema_version":"1.0","event_id":"sha256:60fe6a617bab17bfc4db08e7fcde0adcd54f48c1e91575a02fd0777457712e12"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/F5GTU5NN47TFPIUJEKLNXTADMG/bundle.json","state_url":"https://pith.science/pith/F5GTU5NN47TFPIUJEKLNXTADMG/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/F5GTU5NN47TFPIUJEKLNXTADMG/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-11T07:14:11Z","links":{"resolver":"https://pith.science/pith/F5GTU5NN47TFPIUJEKLNXTADMG","bundle":"https://pith.science/pith/F5GTU5NN47TFPIUJEKLNXTADMG/bundle.json","state":"https://pith.science/pith/F5GTU5NN47TFPIUJEKLNXTADMG/state.json","well_known_bundle":"https://pith.science/.well-known/pith/F5GTU5NN47TFPIUJEKLNXTADMG/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:F5GTU5NN47TFPIUJEKLNXTADMG","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"1556dd409a9dc898d7874028a9070d0888ce592a208e0996f66a335bf0871db7","cross_cats_sorted":["cs.AI"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.SE","submitted_at":"2026-06-02T13:07:12Z","title_canon_sha256":"532b07cc5142a45d904fd815ed1ad3e907b5fc25f2fc9d3c60cf4e8371ed737d"},"schema_version":"1.0","source":{"id":"2606.03601","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.03601","created_at":"2026-06-03T01:06:02Z"},{"alias_kind":"arxiv_version","alias_value":"2606.03601v1","created_at":"2026-06-03T01:06:02Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.03601","created_at":"2026-06-03T01:06:02Z"},{"alias_kind":"pith_short_12","alias_value":"F5GTU5NN47TF","created_at":"2026-06-03T01:06:02Z"},{"alias_kind":"pith_short_16","alias_value":"F5GTU5NN47TFPIUJ","created_at":"2026-06-03T01:06:02Z"},{"alias_kind":"pith_short_8","alias_value":"F5GTU5NN","created_at":"2026-06-03T01:06:02Z"}],"graph_snapshots":[{"event_id":"sha256:60fe6a617bab17bfc4db08e7fcde0adcd54f48c1e91575a02fd0777457712e12","target":"graph","created_at":"2026-06-03T01:06:02Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2606.03601/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"While safety alignment and guardrails help large language models (LLMs) avoid harmful outputs, they can also induce overrefusal, i.e., unwarranted rejection of benign queries that merely appear risky. We present DDOR (Delta Debugging for OverRefusal), a fully automated and explainable framework for overrefusal testing and repair in a black-box setting, where only model inputs and outputs are accessible and internal safety mechanisms remain opaque. DDOR applies delta debugging to localize minimal refusal-triggering fragments (mRTFs) that provide phrase-level, explainable evidence for why a refu","authors_text":"Dongxia Wang, Haonan Zhang, Jun Sun, Peixin Zhang, Qinyan Zhou","cross_cats":["cs.AI"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.SE","submitted_at":"2026-06-02T13:07:12Z","title":"DDOR: Delta Debugging for Explainable Overrefusal Testing and Repair"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.03601","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:a218c956e359ac6d87836a94c3cfe1b540def3ae9138a2cdd9c643f870404540","target":"record","created_at":"2026-06-03T01:06:02Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"1556dd409a9dc898d7874028a9070d0888ce592a208e0996f66a335bf0871db7","cross_cats_sorted":["cs.AI"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.SE","submitted_at":"2026-06-02T13:07:12Z","title_canon_sha256":"532b07cc5142a45d904fd815ed1ad3e907b5fc25f2fc9d3c60cf4e8371ed737d"},"schema_version":"1.0","source":{"id":"2606.03601","kind":"arxiv","version":1}},"canonical_sha256":"2f4d3a75ade7e657a2892296dbcc03619d20955fa4a7e8328d3b1f13e52fd2a5","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"2f4d3a75ade7e657a2892296dbcc03619d20955fa4a7e8328d3b1f13e52fd2a5","first_computed_at":"2026-06-03T01:06:02.045779Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-06-03T01:06:02.045779Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"/cgDvguaEMmG4aylqFUPsrdjrrSyOQsB8syz6CSYJdPi5mkMYLt59kFYn3edTWpx4WvO1PovJXM8+wNMMO4NAw==","signature_status":"signed_v1","signed_at":"2026-06-03T01:06:02.046258Z","signed_message":"canonical_sha256_bytes"},"source_id":"2606.03601","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:a218c956e359ac6d87836a94c3cfe1b540def3ae9138a2cdd9c643f870404540","sha256:60fe6a617bab17bfc4db08e7fcde0adcd54f48c1e91575a02fd0777457712e12"],"state_sha256":"a0687f65ca2dca55956dffe2fb899b2e518435c7ca6e8c9a7a05ed59993e3c0f"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"k6QWScjYNYdSXLFEy2WAoP91jlSK6XhihZEYYvg6RYu0zH3TNWdBU5V05IFJ/Aneg0OqZyZayEwk8T42iIFPAA==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-11T07:14:11.007623Z","bundle_sha256":"313c7769aeb0e159d6ba2e17458544c0bee420343a55578c501d57d6253dceac"}}