{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2026:RLPSQLQAPCLKHYR5KM3RA7AKSF","short_pith_number":"pith:RLPSQLQA","canonical_record":{"source":{"id":"2605.16679","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by-sa/4.0/","primary_cat":"cs.CL","submitted_at":"2026-05-15T22:34:31Z","cross_cats_sorted":["cs.AI"],"title_canon_sha256":"750e2358a343bae048180e9793fcafc4a5a1427809a1ab1734de95ff220d3cf5","abstract_canon_sha256":"0f9434e166353d9fa5596cb8fe9f44a918eb1321152c495d049129cfb1f123b1"},"schema_version":"1.0"},"canonical_sha256":"8adf282e007896a3e23d5337107c0a915bc2d41f0fd91e303e3cb24984e569aa","source":{"kind":"arxiv","id":"2605.16679","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2605.16679","created_at":"2026-05-20T00:02:36Z"},{"alias_kind":"arxiv_version","alias_value":"2605.16679v1","created_at":"2026-05-20T00:02:36Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.16679","created_at":"2026-05-20T00:02:36Z"},{"alias_kind":"pith_short_12","alias_value":"RLPSQLQAPCLK","created_at":"2026-05-20T00:02:36Z"},{"alias_kind":"pith_short_16","alias_value":"RLPSQLQAPCLKHYR5","created_at":"2026-05-20T00:02:36Z"},{"alias_kind":"pith_short_8","alias_value":"RLPSQLQA","created_at":"2026-05-20T00:02:36Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2026:RLPSQLQAPCLKHYR5KM3RA7AKSF","target":"record","payload":{"canonical_record":{"source":{"id":"2605.16679","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by-sa/4.0/","primary_cat":"cs.CL","submitted_at":"2026-05-15T22:34:31Z","cross_cats_sorted":["cs.AI"],"title_canon_sha256":"750e2358a343bae048180e9793fcafc4a5a1427809a1ab1734de95ff220d3cf5","abstract_canon_sha256":"0f9434e166353d9fa5596cb8fe9f44a918eb1321152c495d049129cfb1f123b1"},"schema_version":"1.0"},"canonical_sha256":"8adf282e007896a3e23d5337107c0a915bc2d41f0fd91e303e3cb24984e569aa","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-20T00:02:36.216783Z","signature_b64":"I5UABhph/J9lSnegdF9fLbju/ZtobNIwUsS0R0OOyidQsz0sEJ2cFfNJweFnL3qdELP3KxwqbNowvpuuf1KmDw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"8adf282e007896a3e23d5337107c0a915bc2d41f0fd91e303e3cb24984e569aa","last_reissued_at":"2026-05-20T00:02:36.215893Z","signature_status":"signed_v1","first_computed_at":"2026-05-20T00:02:36.215893Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2605.16679","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-20T00:02:36Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"45SDDvS0krb0CmBcCc0w5NFDFNcFmZBM73UkgnynHwspqGI9E+YoPavqIfjpTk72KspdHaGCU+H5qFsyKrTRAQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-21T02:02:44.860276Z"},"content_sha256":"6d6a63aee62bcad8c48b357574071706d9e33bb3f04e79c8950636b750ccec2f","schema_version":"1.0","event_id":"sha256:6d6a63aee62bcad8c48b357574071706d9e33bb3f04e79c8950636b750ccec2f"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2026:RLPSQLQAPCLKHYR5KM3RA7AKSF","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"CHI-Bench: Can AI Agents Automate End-to-End, Long-Horizon, Policy-Rich Healthcare Workflows?","license":"http://creativecommons.org/licenses/by-sa/4.0/","headline":"","cross_cats":["cs.AI"],"primary_cat":"cs.CL","authors_text":"Biwei Huang, Caiming Xiong, Carl Yang, Chenyu You, Deon Metelski, Eric P. Xing, Fan Feng, Fangli Geng, Frank Wang, Hang Jiang, Hank Capps MD, Haolin Chen, Hua Wei, Joonyul Lee, Kevin Riley, Kun Zhang, Leon Qi, Lingjing Kong, Philip S. Yu, Qingsong Wen, Sanmi Koyejo, Steve Brown, Tao Xia, Tianyi Zeng, T. Y. Alvin Liu, Weiran Yao, Xiangchen Song, Yanjie Fu, Yuan Yuan, Yue Zhao, Zeyu Tang, Zhiwei Liu, Zixian Ma","submitted_at":"2026-05-15T22:34:31Z","abstract_excerpt":"End-to-end automation of realistic healthcare operations stresses three capabilities underrepresented in current benchmarks: policy density, decisions must be grounded in a large library of medical, insurance, and operational rules; Multi-role composition: a single task requires the agent to play multiple roles with handoffs; and multilateral interaction: intermediate workflow steps are multi-turn dialogs, such as peer-to-peer review and patient outreach. We introduce $\\chi$-Bench, a benchmark of long-horizon healthcare workflows across three domains: provider prior authorization, payer utiliz"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2605.16679","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2605.16679/integrity.json","findings":[],"available":true,"detectors_run":[{"name":"claim_evidence","ran_at":"2026-05-19T19:01:56.384077Z","status":"completed","version":"1.0.0","findings_count":0},{"name":"ai_meta_artifact","ran_at":"2026-05-19T18:33:26.503164Z","status":"skipped","version":"1.0.0","findings_count":0}],"snapshot_sha256":"dce68f6b97015f09cbafa183240ae52d412a0175c7cb471aed29df4e485b03ed"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-20T00:02:36Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"6tzH5ijTaXCJcG+qXmoVf95mO+UFnUBuylaOcz7b6HsNbjormNlJyyT0+qnokRU8w6LzMvyfnwNhXaDMRdx1Bw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-21T02:02:44.860787Z"},"content_sha256":"9716f24e046b92758334eb3132f47ba9f46984153b423e591c22785610961694","schema_version":"1.0","event_id":"sha256:9716f24e046b92758334eb3132f47ba9f46984153b423e591c22785610961694"},{"event_type":"integrity_finding","subject_pith_number":"pith:2026:RLPSQLQAPCLKHYR5KM3RA7AKSF","target":"integrity","payload":{"note":"DOI in the printed bibliography is fragmented by whitespace or line breaks. A longer candidate (10.3122/jabfm.2018.01.170133.PMC4809054) was visible in the surrounding text but could not be confirmed against doi.org as printed.","snippet":"A. Cuellar, A. H. Krist, L. M. Nichols, and A. J. Kuzel. Facilitators and barriers to care coordination in patient-centered medical homes (PCMHs) from coordinators’ perspectives. Journal of the American Board of Family Medicine, 31(1):90–10","arxiv_id":"2605.16679","detector":"doi_compliance","evidence":{"ref_index":11,"verdict_class":"incontrovertible","resolved_title":null,"printed_excerpt":"A. Cuellar, A. H. Krist, L. M. Nichols, and A. J. Kuzel. Facilitators and barriers to care coordination in patient-centered medical homes (PCMHs) from coordinators’ perspectives. Journal of the American Board of Family Medicine, 31(1):90–10","reconstructed_doi":"10.3122/jabfm.2018.01.170133.PMC4809054"},"severity":"advisory","ref_index":11,"audited_at":"2026-05-20T17:52:44.197655Z","event_type":"pith.integrity.v1","detected_doi":"10.3122/jabfm.2018.01.170133.PMC4809054","detector_url":"https://pith.science/pith-integrity-protocol#doi_compliance","external_url":null,"finding_type":"recoverable_identifier","evidence_hash":"ed878828783d903c639b98d29eb7308f66c60cb6d391ce7433ff43814fc5e7f9","paper_version":2,"verdict_class":"incontrovertible","resolved_title":null,"detector_version":"1.0.0","detected_arxiv_id":null,"integrity_event_id":5385,"payload_sha256":"63dd30ea0975adf336468821796550099b7095bcbdb74b9e3ab6a01f7b6dc2f7","signature_b64":"6Y0tQM84a285xx8iuMOyEt0/sCE5E3LdR3S+PyQ3vr9y+UKqiHE/RYudgvPWqtA8bdLRn3pymo2LgAFmAfdwBw==","signing_key_id":"pith-v1-2026-05"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-20T17:53:20Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"jo0XNtx+/PhLSL+lhKeDtKXvy5hd2QBekaUADJVIZatUXretwTsgsrSKQ/nwLftas0l2/eeUP1vvOFTGTSTKAA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-21T02:02:44.861854Z"},"content_sha256":"f24c9f20f71c942f856987c451006c549b3b7c67ba3b10fc38e21b76a071d2f7","schema_version":"1.0","event_id":"sha256:f24c9f20f71c942f856987c451006c549b3b7c67ba3b10fc38e21b76a071d2f7"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/RLPSQLQAPCLKHYR5KM3RA7AKSF/bundle.json","state_url":"https://pith.science/pith/RLPSQLQAPCLKHYR5KM3RA7AKSF/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/RLPSQLQAPCLKHYR5KM3RA7AKSF/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-21T02:02:44Z","links":{"resolver":"https://pith.science/pith/RLPSQLQAPCLKHYR5KM3RA7AKSF","bundle":"https://pith.science/pith/RLPSQLQAPCLKHYR5KM3RA7AKSF/bundle.json","state":"https://pith.science/pith/RLPSQLQAPCLKHYR5KM3RA7AKSF/state.json","well_known_bundle":"https://pith.science/.well-known/pith/RLPSQLQAPCLKHYR5KM3RA7AKSF/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:RLPSQLQAPCLKHYR5KM3RA7AKSF","merge_version":"pith-open-graph-merge-v1","event_count":3,"valid_event_count":3,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"0f9434e166353d9fa5596cb8fe9f44a918eb1321152c495d049129cfb1f123b1","cross_cats_sorted":["cs.AI"],"license":"http://creativecommons.org/licenses/by-sa/4.0/","primary_cat":"cs.CL","submitted_at":"2026-05-15T22:34:31Z","title_canon_sha256":"750e2358a343bae048180e9793fcafc4a5a1427809a1ab1734de95ff220d3cf5"},"schema_version":"1.0","source":{"id":"2605.16679","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2605.16679","created_at":"2026-05-20T00:02:36Z"},{"alias_kind":"arxiv_version","alias_value":"2605.16679v1","created_at":"2026-05-20T00:02:36Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.16679","created_at":"2026-05-20T00:02:36Z"},{"alias_kind":"pith_short_12","alias_value":"RLPSQLQAPCLK","created_at":"2026-05-20T00:02:36Z"},{"alias_kind":"pith_short_16","alias_value":"RLPSQLQAPCLKHYR5","created_at":"2026-05-20T00:02:36Z"},{"alias_kind":"pith_short_8","alias_value":"RLPSQLQA","created_at":"2026-05-20T00:02:36Z"}],"graph_snapshots":[{"event_id":"sha256:9716f24e046b92758334eb3132f47ba9f46984153b423e591c22785610961694","target":"graph","created_at":"2026-05-20T00:02:36Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[{"findings_count":0,"name":"claim_evidence","ran_at":"2026-05-19T19:01:56.384077Z","status":"completed","version":"1.0.0"},{"findings_count":0,"name":"ai_meta_artifact","ran_at":"2026-05-19T18:33:26.503164Z","status":"skipped","version":"1.0.0"}],"endpoint":"/pith/2605.16679/integrity.json","findings":[],"snapshot_sha256":"dce68f6b97015f09cbafa183240ae52d412a0175c7cb471aed29df4e485b03ed","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"End-to-end automation of realistic healthcare operations stresses three capabilities underrepresented in current benchmarks: policy density, decisions must be grounded in a large library of medical, insurance, and operational rules; Multi-role composition: a single task requires the agent to play multiple roles with handoffs; and multilateral interaction: intermediate workflow steps are multi-turn dialogs, such as peer-to-peer review and patient outreach. We introduce $\\chi$-Bench, a benchmark of long-horizon healthcare workflows across three domains: provider prior authorization, payer utiliz","authors_text":"Biwei Huang, Caiming Xiong, Carl Yang, Chenyu You, Deon Metelski, Eric P. Xing, Fan Feng, Fangli Geng, Frank Wang, Hang Jiang, Hank Capps MD, Haolin Chen, Hua Wei, Joonyul Lee, Kevin Riley, Kun Zhang, Leon Qi, Lingjing Kong, Philip S. Yu, Qingsong Wen, Sanmi Koyejo, Steve Brown, Tao Xia, Tianyi Zeng, T. Y. Alvin Liu, Weiran Yao, Xiangchen Song, Yanjie Fu, Yuan Yuan, Yue Zhao, Zeyu Tang, Zhiwei Liu, Zixian Ma","cross_cats":["cs.AI"],"headline":"","license":"http://creativecommons.org/licenses/by-sa/4.0/","primary_cat":"cs.CL","submitted_at":"2026-05-15T22:34:31Z","title":"CHI-Bench: Can AI Agents Automate End-to-End, Long-Horizon, Policy-Rich Healthcare Workflows?"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2605.16679","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:6d6a63aee62bcad8c48b357574071706d9e33bb3f04e79c8950636b750ccec2f","target":"record","created_at":"2026-05-20T00:02:36Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"0f9434e166353d9fa5596cb8fe9f44a918eb1321152c495d049129cfb1f123b1","cross_cats_sorted":["cs.AI"],"license":"http://creativecommons.org/licenses/by-sa/4.0/","primary_cat":"cs.CL","submitted_at":"2026-05-15T22:34:31Z","title_canon_sha256":"750e2358a343bae048180e9793fcafc4a5a1427809a1ab1734de95ff220d3cf5"},"schema_version":"1.0","source":{"id":"2605.16679","kind":"arxiv","version":1}},"canonical_sha256":"8adf282e007896a3e23d5337107c0a915bc2d41f0fd91e303e3cb24984e569aa","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"8adf282e007896a3e23d5337107c0a915bc2d41f0fd91e303e3cb24984e569aa","first_computed_at":"2026-05-20T00:02:36.215893Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-20T00:02:36.215893Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"I5UABhph/J9lSnegdF9fLbju/ZtobNIwUsS0R0OOyidQsz0sEJ2cFfNJweFnL3qdELP3KxwqbNowvpuuf1KmDw==","signature_status":"signed_v1","signed_at":"2026-05-20T00:02:36.216783Z","signed_message":"canonical_sha256_bytes"},"source_id":"2605.16679","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:6d6a63aee62bcad8c48b357574071706d9e33bb3f04e79c8950636b750ccec2f","sha256:9716f24e046b92758334eb3132f47ba9f46984153b423e591c22785610961694","sha256:f24c9f20f71c942f856987c451006c549b3b7c67ba3b10fc38e21b76a071d2f7"],"state_sha256":"4234d4f4f5908b4553962406837df4617ec5ed216052ca389ad28dfe443f9fcc"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"OAtG7UuxJUQ1V5s/9comc4JFPRgeCvresZ9OofpYzBNUNo2XoHD2EAe3aB1h/nvmbNdNXZUM/9AL2Kj0eBnEAw==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-21T02:02:44.864295Z","bundle_sha256":"fe55b0e4daa8d791772d6d710d7402ad660bef61b86d49a7a2d088a3e4104504"}}