{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:TAT4UUMRG4NLJVNLESMRIIM5W4","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"49b2c8c73669007481167fd29bb3a4a8bd8f4668bf9ae90e789b23f01bcd17df","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.SE","submitted_at":"2026-06-04T01:49:07Z","title_canon_sha256":"245ca3bf3baf1707f71095e2149601e92cd4561d605fab6b935617f69bfe3b1f"},"schema_version":"1.0","source":{"id":"2606.05574","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.05574","created_at":"2026-06-05T01:14:55Z"},{"alias_kind":"arxiv_version","alias_value":"2606.05574v1","created_at":"2026-06-05T01:14:55Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.05574","created_at":"2026-06-05T01:14:55Z"},{"alias_kind":"pith_short_12","alias_value":"TAT4UUMRG4NL","created_at":"2026-06-05T01:14:55Z"},{"alias_kind":"pith_short_16","alias_value":"TAT4UUMRG4NLJVNL","created_at":"2026-06-05T01:14:55Z"},{"alias_kind":"pith_short_8","alias_value":"TAT4UUMR","created_at":"2026-06-05T01:14:55Z"}],"graph_snapshots":[{"event_id":"sha256:9be745831a966a6ae072961880141747ae71c0858955857d1695a71caf12464a","target":"graph","created_at":"2026-06-05T01:14:55Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2606.05574/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Code Agents have achieved remarkable advances in recent years, exhibiting strong capabilities across a wide range of software engineering tasks. However, their misuse often produces bloated and disorganized code that impairing readability, extensibility, and robustness. Despite this risk, existing benchmarks largely evaluate functional correctness rather than long-term maintainability of code agents. In this paper, we propose SmellBench, an extensible code refactoring benchmark that proactively injects code smells into clean code snippets from real-world repositories. This design enables the g","authors_text":"BinBin Hu, Fake Lin, Jun Zhou, Tong Xu, Xi Zhu, Zhiqiang Zhang, Zhi Zheng, Ziqi Liu, Ziwei Zhao","cross_cats":[],"headline":"","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.SE","submitted_at":"2026-06-04T01:49:07Z","title":"SmellBench: Towards Fine-Grained Evaluation of Code Agents on Refactoring Tasks"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.05574","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:3c8ce4939478e2346ce927e908f11f0f42bced5c5e34d95e12ec5e78fbe6879f","target":"record","created_at":"2026-06-05T01:14:55Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"49b2c8c73669007481167fd29bb3a4a8bd8f4668bf9ae90e789b23f01bcd17df","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.SE","submitted_at":"2026-06-04T01:49:07Z","title_canon_sha256":"245ca3bf3baf1707f71095e2149601e92cd4561d605fab6b935617f69bfe3b1f"},"schema_version":"1.0","source":{"id":"2606.05574","kind":"arxiv","version":1}},"canonical_sha256":"9827ca5191371ab4d5ab249914219db71780f186810181703ade85bd7047a2dc","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"9827ca5191371ab4d5ab249914219db71780f186810181703ade85bd7047a2dc","first_computed_at":"2026-06-05T01:14:55.324009Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-06-05T01:14:55.324009Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"PNXcsz1ik91sFsLB/En2fyKKnRnU4Ay05dJ+upuy4sz/pbd2vLqDyTTpsKQswqKE2o04ubpCHJ5lJSDqbIXzAQ==","signature_status":"signed_v1","signed_at":"2026-06-05T01:14:55.324468Z","signed_message":"canonical_sha256_bytes"},"source_id":"2606.05574","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:3c8ce4939478e2346ce927e908f11f0f42bced5c5e34d95e12ec5e78fbe6879f","sha256:9be745831a966a6ae072961880141747ae71c0858955857d1695a71caf12464a"],"state_sha256":"57e3d6fe142db246d0755fb02bc34726e2b4ae54496ded2e09b83d8db73d9487"}