{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2026:4AONZB43SJNCAGSDFT2QTCF6OO","short_pith_number":"pith:4AONZB43","canonical_record":{"source":{"id":"2605.24134","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.MA","submitted_at":"2026-05-22T18:52:34Z","cross_cats_sorted":[],"title_canon_sha256":"f205f3816c5623e8a0269f1c7e77b6a9b632807aea4ef2c06d748943e95f71d3","abstract_canon_sha256":"7349b0aef96f11a7d509eeb0de70bc28baf622060902562c41695f0448283bb6"},"schema_version":"1.0"},"canonical_sha256":"e01cdc879b925a201a432cf50988be73a6913e37676064bee602384d5cb77d30","source":{"kind":"arxiv","id":"2605.24134","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2605.24134","created_at":"2026-05-26T01:02:48Z"},{"alias_kind":"arxiv_version","alias_value":"2605.24134v1","created_at":"2026-05-26T01:02:48Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.24134","created_at":"2026-05-26T01:02:48Z"},{"alias_kind":"pith_short_12","alias_value":"4AONZB43SJNC","created_at":"2026-05-26T01:02:48Z"},{"alias_kind":"pith_short_16","alias_value":"4AONZB43SJNCAGSD","created_at":"2026-05-26T01:02:48Z"},{"alias_kind":"pith_short_8","alias_value":"4AONZB43","created_at":"2026-05-26T01:02:48Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2026:4AONZB43SJNCAGSDFT2QTCF6OO","target":"record","payload":{"canonical_record":{"source":{"id":"2605.24134","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.MA","submitted_at":"2026-05-22T18:52:34Z","cross_cats_sorted":[],"title_canon_sha256":"f205f3816c5623e8a0269f1c7e77b6a9b632807aea4ef2c06d748943e95f71d3","abstract_canon_sha256":"7349b0aef96f11a7d509eeb0de70bc28baf622060902562c41695f0448283bb6"},"schema_version":"1.0"},"canonical_sha256":"e01cdc879b925a201a432cf50988be73a6913e37676064bee602384d5cb77d30","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-26T01:02:48.050983Z","signature_b64":"eayEDI+3gSjPs0/UVMAxFCGpNSaqEvMZKnbNf9YQGDnLy8CbG+Qx5ObKC7jS39ZxsJKaGpPmmalBVhbJruZwAQ==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"e01cdc879b925a201a432cf50988be73a6913e37676064bee602384d5cb77d30","last_reissued_at":"2026-05-26T01:02:48.050233Z","signature_status":"signed_v1","first_computed_at":"2026-05-26T01:02:48.050233Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2605.24134","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-26T01:02:48Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"hhYaAc0vXbghdI7UL/ITUxNvfztAnHTk1ghk4Bs0GYn/cEALIJ7c/eYT9jpnQtQopLkXxe+FED8QkpwhGmNsBw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-07-02T10:56:22.552756Z"},"content_sha256":"15c880a6eb6292602a5609f85ae40919022ea5fd72c5bfccadee4a7bc4341835","schema_version":"1.0","event_id":"sha256:15c880a6eb6292602a5609f85ae40919022ea5fd72c5bfccadee4a7bc4341835"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2026:4AONZB43SJNCAGSDFT2QTCF6OO","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"ProofAgent Harness: Open Infrastructure for Adversarial Evaluation of AI Agents","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":[],"primary_cat":"cs.MA","authors_text":"Fouad Bousetouane","submitted_at":"2026-05-22T18:52:34Z","abstract_excerpt":"AI agents are entering high-risk production settings, where they use tools, retain context, follow policies, handle private data, and interact with users over multiple turns. Yet many evaluation methods still judge isolated outputs or static tasks, missing failures that emerge through trajectory, pressure, and adversarial interaction. We introduce ProofAgent Harness, open infrastructure for scalable, auditable, and adversarial AI agent evaluation. The harness provides evaluation infrastructure around an agent: it curates evaluation intelligence, runs adversarial multi-turn trials, captures beh"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2605.24134","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2605.24134/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-26T01:02:48Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"tHXsBzMiqPjD69WU5YCUv4tzP09Si+MJNGTL0/Cn1R5sqZ6IgUOJefyc5/RFCWPLVTvDx4MQRCdDAIeAFhGsDQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-07-02T10:56:22.553125Z"},"content_sha256":"f22d7133ceb806a7e2407c7250b55e3dc7b39467c73e7115fb31f597bb36b17e","schema_version":"1.0","event_id":"sha256:f22d7133ceb806a7e2407c7250b55e3dc7b39467c73e7115fb31f597bb36b17e"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/4AONZB43SJNCAGSDFT2QTCF6OO/bundle.json","state_url":"https://pith.science/pith/4AONZB43SJNCAGSDFT2QTCF6OO/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/4AONZB43SJNCAGSDFT2QTCF6OO/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-07-02T10:56:22Z","links":{"resolver":"https://pith.science/pith/4AONZB43SJNCAGSDFT2QTCF6OO","bundle":"https://pith.science/pith/4AONZB43SJNCAGSDFT2QTCF6OO/bundle.json","state":"https://pith.science/pith/4AONZB43SJNCAGSDFT2QTCF6OO/state.json","well_known_bundle":"https://pith.science/.well-known/pith/4AONZB43SJNCAGSDFT2QTCF6OO/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:4AONZB43SJNCAGSDFT2QTCF6OO","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"7349b0aef96f11a7d509eeb0de70bc28baf622060902562c41695f0448283bb6","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.MA","submitted_at":"2026-05-22T18:52:34Z","title_canon_sha256":"f205f3816c5623e8a0269f1c7e77b6a9b632807aea4ef2c06d748943e95f71d3"},"schema_version":"1.0","source":{"id":"2605.24134","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2605.24134","created_at":"2026-05-26T01:02:48Z"},{"alias_kind":"arxiv_version","alias_value":"2605.24134v1","created_at":"2026-05-26T01:02:48Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.24134","created_at":"2026-05-26T01:02:48Z"},{"alias_kind":"pith_short_12","alias_value":"4AONZB43SJNC","created_at":"2026-05-26T01:02:48Z"},{"alias_kind":"pith_short_16","alias_value":"4AONZB43SJNCAGSD","created_at":"2026-05-26T01:02:48Z"},{"alias_kind":"pith_short_8","alias_value":"4AONZB43","created_at":"2026-05-26T01:02:48Z"}],"graph_snapshots":[{"event_id":"sha256:f22d7133ceb806a7e2407c7250b55e3dc7b39467c73e7115fb31f597bb36b17e","target":"graph","created_at":"2026-05-26T01:02:48Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2605.24134/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"AI agents are entering high-risk production settings, where they use tools, retain context, follow policies, handle private data, and interact with users over multiple turns. Yet many evaluation methods still judge isolated outputs or static tasks, missing failures that emerge through trajectory, pressure, and adversarial interaction. We introduce ProofAgent Harness, open infrastructure for scalable, auditable, and adversarial AI agent evaluation. The harness provides evaluation infrastructure around an agent: it curates evaluation intelligence, runs adversarial multi-turn trials, captures beh","authors_text":"Fouad Bousetouane","cross_cats":[],"headline":"","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.MA","submitted_at":"2026-05-22T18:52:34Z","title":"ProofAgent Harness: Open Infrastructure for Adversarial Evaluation of AI Agents"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2605.24134","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:15c880a6eb6292602a5609f85ae40919022ea5fd72c5bfccadee4a7bc4341835","target":"record","created_at":"2026-05-26T01:02:48Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"7349b0aef96f11a7d509eeb0de70bc28baf622060902562c41695f0448283bb6","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.MA","submitted_at":"2026-05-22T18:52:34Z","title_canon_sha256":"f205f3816c5623e8a0269f1c7e77b6a9b632807aea4ef2c06d748943e95f71d3"},"schema_version":"1.0","source":{"id":"2605.24134","kind":"arxiv","version":1}},"canonical_sha256":"e01cdc879b925a201a432cf50988be73a6913e37676064bee602384d5cb77d30","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"e01cdc879b925a201a432cf50988be73a6913e37676064bee602384d5cb77d30","first_computed_at":"2026-05-26T01:02:48.050233Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-26T01:02:48.050233Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"eayEDI+3gSjPs0/UVMAxFCGpNSaqEvMZKnbNf9YQGDnLy8CbG+Qx5ObKC7jS39ZxsJKaGpPmmalBVhbJruZwAQ==","signature_status":"signed_v1","signed_at":"2026-05-26T01:02:48.050983Z","signed_message":"canonical_sha256_bytes"},"source_id":"2605.24134","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:15c880a6eb6292602a5609f85ae40919022ea5fd72c5bfccadee4a7bc4341835","sha256:f22d7133ceb806a7e2407c7250b55e3dc7b39467c73e7115fb31f597bb36b17e"],"state_sha256":"8a6dcea257ffb883beaebb300b71e547b530f3eefb771fabfb3bdafa37dc76b0"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"LLxJIMAcx/7sk83PRr99kJ3PR9zm/XtbsR0Y8z/yJK0OJ46OMqAXLekvb07jjpDl+poUe8XpHHUDY2/YHigCBA==","signed_message":"bundle_sha256_bytes","signed_at":"2026-07-02T10:56:22.555160Z","bundle_sha256":"4a14ea3fa742ea2cd9ef81a73872ae66c15b666642c32d54bda8e1607db3f399"}}