{"record_type":"pith_number_record","schema_url":"https://pith.science/schemas/pith-number/v1.json","pith_number":"pith:2026:JY7ZLVRONCWJQOLOEHEERJ2X36","short_pith_number":"pith:JY7ZLVRO","schema_version":"1.0","canonical_sha256":"4e3f95d62e68ac98396e21c848a757dfab8b9272007e5632727a27b9fa283dae","source":{"kind":"arxiv","id":"2605.22300","version":1},"attestation_state":"computed","paper":{"title":"Cross-domain benchmarks reveal when coordinated AI agents improve scientific inference from partial evidence","license":"http://creativecommons.org/licenses/by-nc-nd/4.0/","headline":"","cross_cats":["cs.LG","cs.MA"],"primary_cat":"cs.AI","authors_text":"Fiona Y. Wong, Markus J. Buehler","submitted_at":"2026-05-21T10:46:50Z","abstract_excerpt":"Scientific evidence often spans instruments, databases, and disciplines, so no single source records the full phenomenon. This makes it difficult to determine when coordinated AI agents add value over simpler scientific workflows. We evaluate this question with a cross-domain benchmark spanning four scientific tasks: mapping molecular structure into musical representations, detecting historical paradigm shifts in science, identifying vector-borne disease emergence, and vetting transiting-exoplanet candidates. Each case uses a frozen evaluation panel, predefined scoring protocols, explicit base"},"verification_status":{"content_addressed":true,"pith_receipt":true,"author_attested":false,"weak_author_claims":0,"strong_author_claims":0,"externally_anchored":false,"storage_verified":false,"citation_signatures":0,"replication_records":0,"graph_snapshot":true,"references_resolved":false,"formal_links_present":false},"canonical_record":{"source":{"id":"2605.22300","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by-nc-nd/4.0/","primary_cat":"cs.AI","submitted_at":"2026-05-21T10:46:50Z","cross_cats_sorted":["cs.LG","cs.MA"],"title_canon_sha256":"dc7706feb0d7e58f1643a073b3438e49f5ecd0fe20896fd04fee79a8d656e017","abstract_canon_sha256":"e9b2b946a886a073e3f70f5498e854b08bb76fc9c0aee4c0c40fad51ac7549e4"},"schema_version":"1.0"},"receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-22T01:04:36.840290Z","signature_b64":"i4CuFQql2JRvkhUs8X8G1A6eTMhVla/deVpYk3D6X6/SyfQtwx4WpgmcglykgNI0/U4+9y2m/78ibBAqHCNyDQ==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"4e3f95d62e68ac98396e21c848a757dfab8b9272007e5632727a27b9fa283dae","last_reissued_at":"2026-05-22T01:04:36.839561Z","signature_status":"signed_v1","first_computed_at":"2026-05-22T01:04:36.839561Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"graph_snapshot":{"paper":{"title":"Cross-domain benchmarks reveal when coordinated AI agents improve scientific inference from partial evidence","license":"http://creativecommons.org/licenses/by-nc-nd/4.0/","headline":"","cross_cats":["cs.LG","cs.MA"],"primary_cat":"cs.AI","authors_text":"Fiona Y. Wong, Markus J. Buehler","submitted_at":"2026-05-21T10:46:50Z","abstract_excerpt":"Scientific evidence often spans instruments, databases, and disciplines, so no single source records the full phenomenon. This makes it difficult to determine when coordinated AI agents add value over simpler scientific workflows. We evaluate this question with a cross-domain benchmark spanning four scientific tasks: mapping molecular structure into musical representations, detecting historical paradigm shifts in science, identifying vector-borne disease emergence, and vetting transiting-exoplanet candidates. Each case uses a frozen evaluation panel, predefined scoring protocols, explicit base"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2605.22300","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2605.22300/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"aliases":[{"alias_kind":"arxiv","alias_value":"2605.22300","created_at":"2026-05-22T01:04:36.839697+00:00"},{"alias_kind":"arxiv_version","alias_value":"2605.22300v1","created_at":"2026-05-22T01:04:36.839697+00:00"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.22300","created_at":"2026-05-22T01:04:36.839697+00:00"},{"alias_kind":"pith_short_12","alias_value":"JY7ZLVRONCWJ","created_at":"2026-05-22T01:04:36.839697+00:00"},{"alias_kind":"pith_short_16","alias_value":"JY7ZLVRONCWJQOLO","created_at":"2026-05-22T01:04:36.839697+00:00"},{"alias_kind":"pith_short_8","alias_value":"JY7ZLVRO","created_at":"2026-05-22T01:04:36.839697+00:00"}],"events":[],"event_summary":{},"paper_claims":[],"inbound_citations":{"count":0,"internal_anchor_count":0,"sample":[]},"formal_canon":{"evidence_count":0,"sample":[],"anchors":[]},"links":{"html":"https://pith.science/pith/JY7ZLVRONCWJQOLOEHEERJ2X36","json":"https://pith.science/pith/JY7ZLVRONCWJQOLOEHEERJ2X36.json","graph_json":"https://pith.science/api/pith-number/JY7ZLVRONCWJQOLOEHEERJ2X36/graph.json","events_json":"https://pith.science/api/pith-number/JY7ZLVRONCWJQOLOEHEERJ2X36/events.json","paper":"https://pith.science/paper/JY7ZLVRO"},"agent_actions":{"view_html":"https://pith.science/pith/JY7ZLVRONCWJQOLOEHEERJ2X36","download_json":"https://pith.science/pith/JY7ZLVRONCWJQOLOEHEERJ2X36.json","view_paper":"https://pith.science/paper/JY7ZLVRO","resolve_alias":"https://pith.science/api/pith-number/resolve?arxiv=2605.22300&json=true","fetch_graph":"https://pith.science/api/pith-number/JY7ZLVRONCWJQOLOEHEERJ2X36/graph.json","fetch_events":"https://pith.science/api/pith-number/JY7ZLVRONCWJQOLOEHEERJ2X36/events.json","actions":{"anchor_timestamp":"https://pith.science/pith/JY7ZLVRONCWJQOLOEHEERJ2X36/action/timestamp_anchor","attest_storage":"https://pith.science/pith/JY7ZLVRONCWJQOLOEHEERJ2X36/action/storage_attestation","attest_author":"https://pith.science/pith/JY7ZLVRONCWJQOLOEHEERJ2X36/action/author_attestation","sign_citation":"https://pith.science/pith/JY7ZLVRONCWJQOLOEHEERJ2X36/action/citation_signature","submit_replication":"https://pith.science/pith/JY7ZLVRONCWJQOLOEHEERJ2X36/action/replication_record"}},"created_at":"2026-05-22T01:04:36.839697+00:00","updated_at":"2026-05-22T01:04:36.839697+00:00"}