{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:HSJLAE76WQUPOVJQBDMNXOMLXS","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"ca003c1f24770c4dfcc4a2cd386971446953a223432c693fae1663990d22295c","cross_cats_sorted":["cs.MA"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.SE","submitted_at":"2026-06-04T15:58:30Z","title_canon_sha256":"4737d15e6b5e92adaf542e5f0968f55c34c8de3b304de9a0f510a16eb9c4d350"},"schema_version":"1.0","source":{"id":"2606.06324","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.06324","created_at":"2026-06-05T01:15:41Z"},{"alias_kind":"arxiv_version","alias_value":"2606.06324v1","created_at":"2026-06-05T01:15:41Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.06324","created_at":"2026-06-05T01:15:41Z"},{"alias_kind":"pith_short_12","alias_value":"HSJLAE76WQUP","created_at":"2026-06-05T01:15:41Z"},{"alias_kind":"pith_short_16","alias_value":"HSJLAE76WQUPOVJQ","created_at":"2026-06-05T01:15:41Z"},{"alias_kind":"pith_short_8","alias_value":"HSJLAE76","created_at":"2026-06-05T01:15:41Z"}],"graph_snapshots":[{"event_id":"sha256:d19ef39702a70bbb60fbbc31c0f9fc153d35d58564821420300d282bfe18035e","target":"graph","created_at":"2026-06-05T01:15:41Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2606.06324/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"LLM-based agents increasingly rely on harnesses that provide execution environments, tool interfaces, context, lifecycle orchestration, observability, verification, and governance. Existing self-improving agents and automatic harness evolution methods mainly improve agents through runtime supervision, prompt optimization, workflow search, or harness modification based on final outcomes. However, they often fail to diagnose where the responsible evidence lies in failed trajectories and which harness layer causes the unreliable behavior, resulting in broad, indirect, or poorly scoped changes. Th","authors_text":"Junjie Wang, Mengzhuo Chen, Qing Wang, Yawen Wang, Zhe Liu","cross_cats":["cs.MA"],"headline":"","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.SE","submitted_at":"2026-06-04T15:58:30Z","title":"From Failed Trajectories to Reliable LLM Agents: Diagnosing and Repairing Harness Flaws"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.06324","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:2e7b653c6429accea69b9734d2242b15cc7b498f5de21f02eb9eeaf5ed08dd14","target":"record","created_at":"2026-06-05T01:15:41Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"ca003c1f24770c4dfcc4a2cd386971446953a223432c693fae1663990d22295c","cross_cats_sorted":["cs.MA"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.SE","submitted_at":"2026-06-04T15:58:30Z","title_canon_sha256":"4737d15e6b5e92adaf542e5f0968f55c34c8de3b304de9a0f510a16eb9c4d350"},"schema_version":"1.0","source":{"id":"2606.06324","kind":"arxiv","version":1}},"canonical_sha256":"3c92b013feb428f7553008d8dbb98bbc80827887e6b6e4e7bfaa2f2cd59b0360","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"3c92b013feb428f7553008d8dbb98bbc80827887e6b6e4e7bfaa2f2cd59b0360","first_computed_at":"2026-06-05T01:15:41.950855Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-06-05T01:15:41.950855Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"YNl3HEbIg+FBGwVB82d3baS/0plHTxzQ6wtpDI158a/c22C03C1cWfdZFm5tTjBWzYHbs/ZsxNOJHFNTPSW9AQ==","signature_status":"signed_v1","signed_at":"2026-06-05T01:15:41.951271Z","signed_message":"canonical_sha256_bytes"},"source_id":"2606.06324","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:2e7b653c6429accea69b9734d2242b15cc7b498f5de21f02eb9eeaf5ed08dd14","sha256:d19ef39702a70bbb60fbbc31c0f9fc153d35d58564821420300d282bfe18035e"],"state_sha256":"936f5b33a53297f209de6008bdd5e63548d1068216c411c508baafeeae108701"}