{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2025:ZBRVHMNJUHEOZPUAMBQI5CVQNV","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"4d6b957593c211930249a368e3d0933aefe5c914467af9eb0761db48b360d285","cross_cats_sorted":["cs.LG"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2025-05-23T08:41:45Z","title_canon_sha256":"61cb3ff584e494c103edcd8842ec7b38213a45ee11db04a3a3a656c6f7879475"},"schema_version":"1.0","source":{"id":"2505.17630","kind":"arxiv","version":4}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2505.17630","created_at":"2026-06-02T03:04:32Z"},{"alias_kind":"arxiv_version","alias_value":"2505.17630v4","created_at":"2026-06-02T03:04:32Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2505.17630","created_at":"2026-06-02T03:04:32Z"},{"alias_kind":"pith_short_12","alias_value":"ZBRVHMNJUHEO","created_at":"2026-06-02T03:04:32Z"},{"alias_kind":"pith_short_16","alias_value":"ZBRVHMNJUHEOZPUA","created_at":"2026-06-02T03:04:32Z"},{"alias_kind":"pith_short_8","alias_value":"ZBRVHMNJ","created_at":"2026-06-02T03:04:32Z"}],"graph_snapshots":[{"event_id":"sha256:26d11438cd5d5869f142e7ac4f13da9195eea0a5ce6c7ca590f594e586d3ad9c","target":"graph","created_at":"2026-06-02T03:04:32Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2505.17630/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Circuit localization methods aim to identify the subset of model components responsible for specific behaviors in large language models, enabling detailed mechanistic analysis. Most existing methods assume components act independently and estimate importance by perturbing each component in isolation. However, components in neural networks interact, and ignoring these interactions leads to systematic misestimation of component importance. We find that one particularly problematic interaction is attention self-repair, in which softmax redistribution causes gradients for influential attention sco","authors_text":"Casper L. Christensen, Jing Huang, Joakim Edin, Lars Maal{\\o}e, Maria Maistro, R\\'obert Csord\\'as, Tuukka Ruotsalo, Zhengxuan Wu","cross_cats":["cs.LG"],"headline":"","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2025-05-23T08:41:45Z","title":"Correcting Gradient-Based Circuit Localization via Interaction-Aware Backpropagation"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2505.17630","kind":"arxiv","version":4},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:4a13ffa0b2c2f7528997312ea8331ecdc140831a274e68b914dd880bf7248d2d","target":"record","created_at":"2026-06-02T03:04:32Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"4d6b957593c211930249a368e3d0933aefe5c914467af9eb0761db48b360d285","cross_cats_sorted":["cs.LG"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2025-05-23T08:41:45Z","title_canon_sha256":"61cb3ff584e494c103edcd8842ec7b38213a45ee11db04a3a3a656c6f7879475"},"schema_version":"1.0","source":{"id":"2505.17630","kind":"arxiv","version":4}},"canonical_sha256":"c86353b1a9a1c8ecbe8060608e8ab06d56e70e14b74ea59149749e3a9a26b124","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"c86353b1a9a1c8ecbe8060608e8ab06d56e70e14b74ea59149749e3a9a26b124","first_computed_at":"2026-06-02T03:04:32.602084Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-06-02T03:04:32.602084Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"60LsuqZeAvouuAXNa+vtYZ8B/6FoDcVDPKs3uMndPRjjwMS+4fDMF/XLbTiwAVHTem8gGzzvlVguAkp9eYQ+Aw==","signature_status":"signed_v1","signed_at":"2026-06-02T03:04:32.602621Z","signed_message":"canonical_sha256_bytes"},"source_id":"2505.17630","source_kind":"arxiv","source_version":4}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:4a13ffa0b2c2f7528997312ea8331ecdc140831a274e68b914dd880bf7248d2d","sha256:26d11438cd5d5869f142e7ac4f13da9195eea0a5ce6c7ca590f594e586d3ad9c"],"state_sha256":"0ed450edd10f610863045b41b3e76d0df264adb5345bbe2f5051ee342304c68f"}