{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2026:2EUCEFTYFNC2ZF4RKEWOHMVSRW","short_pith_number":"pith:2EUCEFTY","canonical_record":{"source":{"id":"2605.21482","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.AI","submitted_at":"2026-05-20T17:59:03Z","cross_cats_sorted":[],"title_canon_sha256":"1e7122a99fd92404679130308878613ffd38ed7a8aed9006049c2119feeccc0a","abstract_canon_sha256":"b9c6addde6c6256fc1439ab99e392899d086f8d40f7feea1880342f4114fc616"},"schema_version":"1.0"},"canonical_sha256":"d1282216782b45ac9791512ce3b2b28d913b37baf452eb5064bdedd721fcc2e2","source":{"kind":"arxiv","id":"2605.21482","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2605.21482","created_at":"2026-05-21T02:05:39Z"},{"alias_kind":"arxiv_version","alias_value":"2605.21482v1","created_at":"2026-05-21T02:05:39Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.21482","created_at":"2026-05-21T02:05:39Z"},{"alias_kind":"pith_short_12","alias_value":"2EUCEFTYFNC2","created_at":"2026-05-21T02:05:39Z"},{"alias_kind":"pith_short_16","alias_value":"2EUCEFTYFNC2ZF4R","created_at":"2026-05-21T02:05:39Z"},{"alias_kind":"pith_short_8","alias_value":"2EUCEFTY","created_at":"2026-05-21T02:05:39Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2026:2EUCEFTYFNC2ZF4RKEWOHMVSRW","target":"record","payload":{"canonical_record":{"source":{"id":"2605.21482","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.AI","submitted_at":"2026-05-20T17:59:03Z","cross_cats_sorted":[],"title_canon_sha256":"1e7122a99fd92404679130308878613ffd38ed7a8aed9006049c2119feeccc0a","abstract_canon_sha256":"b9c6addde6c6256fc1439ab99e392899d086f8d40f7feea1880342f4114fc616"},"schema_version":"1.0"},"canonical_sha256":"d1282216782b45ac9791512ce3b2b28d913b37baf452eb5064bdedd721fcc2e2","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-21T02:05:39.393965Z","signature_b64":"ltB9a7ZVFOhfknk/TX2CRJ78W41k7b/pDT3ZOO5B+DRx6JTW+GCkvfpufcedyJv+XWVCx2gnlt6tacPEAewrAQ==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"d1282216782b45ac9791512ce3b2b28d913b37baf452eb5064bdedd721fcc2e2","last_reissued_at":"2026-05-21T02:05:39.393125Z","signature_status":"signed_v1","first_computed_at":"2026-05-21T02:05:39.393125Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2605.21482","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-21T02:05:39Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"6qX7KnvGgW3wVGxGRsUjX6B9v0BraXtJ35KZkq4gb/1AD+ylo7XMOcmMu1rilUnJwWyYGAZgdFhRUyUQ2LQxDA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-26T16:54:41.383051Z"},"content_sha256":"e0fd58b632199b778b2ee9e10e24d2ff2cd05e4d944ea7067e61e0db8cd60256","schema_version":"1.0","event_id":"sha256:e0fd58b632199b778b2ee9e10e24d2ff2cd05e4d944ea7067e61e0db8cd60256"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2026:2EUCEFTYFNC2ZF4RKEWOHMVSRW","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"DeepWeb-Bench: A Deep Research Benchmark Demanding Massive Cross-Source Evidence and Long-Horizon Derivation","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.AI","authors_text":"Baoqing Sun, Chongyang Pan, Haiyang Shen, Jiuzheng Wang, Mugeng Liu, Peilun Jia, Siqi Zhong, Sixiong Xie, Xiang Jing, Yun Ma, Zhuofan Shi","submitted_at":"2026-05-20T17:59:03Z","abstract_excerpt":"Deep research, in which an agent searches the open web, collects evidence, and derives an answer through extended reasoning, is a prominent use case for frontier language models. Frontier deep research products score high on existing benchmarks, making it difficult to distinguish their capabilities from current evaluation data alone. We introduce DeepWeb-Bench, a deep research benchmark that is substantially harder than existing benchmarks for the current frontier. Difficulty comes from three properties of the data itself: each task requires massive evidence collection, cross-source reconcilia"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2605.21482","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2605.21482/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-21T02:05:39Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"p3GSd/qBUPZtfhcHQGWgh7d9XUqXRo1SXptKdQ3rDvIim+sTAd4gUwnCyGjkRwgG7s/chBEsdqUA19+TJu46Cw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-26T16:54:41.383478Z"},"content_sha256":"52f15b608ee702daa37ba7b3540397b94f66846cc148edc753953465946127ae","schema_version":"1.0","event_id":"sha256:52f15b608ee702daa37ba7b3540397b94f66846cc148edc753953465946127ae"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/2EUCEFTYFNC2ZF4RKEWOHMVSRW/bundle.json","state_url":"https://pith.science/pith/2EUCEFTYFNC2ZF4RKEWOHMVSRW/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/2EUCEFTYFNC2ZF4RKEWOHMVSRW/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-26T16:54:41Z","links":{"resolver":"https://pith.science/pith/2EUCEFTYFNC2ZF4RKEWOHMVSRW","bundle":"https://pith.science/pith/2EUCEFTYFNC2ZF4RKEWOHMVSRW/bundle.json","state":"https://pith.science/pith/2EUCEFTYFNC2ZF4RKEWOHMVSRW/state.json","well_known_bundle":"https://pith.science/.well-known/pith/2EUCEFTYFNC2ZF4RKEWOHMVSRW/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:2EUCEFTYFNC2ZF4RKEWOHMVSRW","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"b9c6addde6c6256fc1439ab99e392899d086f8d40f7feea1880342f4114fc616","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.AI","submitted_at":"2026-05-20T17:59:03Z","title_canon_sha256":"1e7122a99fd92404679130308878613ffd38ed7a8aed9006049c2119feeccc0a"},"schema_version":"1.0","source":{"id":"2605.21482","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2605.21482","created_at":"2026-05-21T02:05:39Z"},{"alias_kind":"arxiv_version","alias_value":"2605.21482v1","created_at":"2026-05-21T02:05:39Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.21482","created_at":"2026-05-21T02:05:39Z"},{"alias_kind":"pith_short_12","alias_value":"2EUCEFTYFNC2","created_at":"2026-05-21T02:05:39Z"},{"alias_kind":"pith_short_16","alias_value":"2EUCEFTYFNC2ZF4R","created_at":"2026-05-21T02:05:39Z"},{"alias_kind":"pith_short_8","alias_value":"2EUCEFTY","created_at":"2026-05-21T02:05:39Z"}],"graph_snapshots":[{"event_id":"sha256:52f15b608ee702daa37ba7b3540397b94f66846cc148edc753953465946127ae","target":"graph","created_at":"2026-05-21T02:05:39Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2605.21482/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Deep research, in which an agent searches the open web, collects evidence, and derives an answer through extended reasoning, is a prominent use case for frontier language models. Frontier deep research products score high on existing benchmarks, making it difficult to distinguish their capabilities from current evaluation data alone. We introduce DeepWeb-Bench, a deep research benchmark that is substantially harder than existing benchmarks for the current frontier. Difficulty comes from three properties of the data itself: each task requires massive evidence collection, cross-source reconcilia","authors_text":"Baoqing Sun, Chongyang Pan, Haiyang Shen, Jiuzheng Wang, Mugeng Liu, Peilun Jia, Siqi Zhong, Sixiong Xie, Xiang Jing, Yun Ma, Zhuofan Shi","cross_cats":[],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.AI","submitted_at":"2026-05-20T17:59:03Z","title":"DeepWeb-Bench: A Deep Research Benchmark Demanding Massive Cross-Source Evidence and Long-Horizon Derivation"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2605.21482","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:e0fd58b632199b778b2ee9e10e24d2ff2cd05e4d944ea7067e61e0db8cd60256","target":"record","created_at":"2026-05-21T02:05:39Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"b9c6addde6c6256fc1439ab99e392899d086f8d40f7feea1880342f4114fc616","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.AI","submitted_at":"2026-05-20T17:59:03Z","title_canon_sha256":"1e7122a99fd92404679130308878613ffd38ed7a8aed9006049c2119feeccc0a"},"schema_version":"1.0","source":{"id":"2605.21482","kind":"arxiv","version":1}},"canonical_sha256":"d1282216782b45ac9791512ce3b2b28d913b37baf452eb5064bdedd721fcc2e2","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"d1282216782b45ac9791512ce3b2b28d913b37baf452eb5064bdedd721fcc2e2","first_computed_at":"2026-05-21T02:05:39.393125Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-21T02:05:39.393125Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"ltB9a7ZVFOhfknk/TX2CRJ78W41k7b/pDT3ZOO5B+DRx6JTW+GCkvfpufcedyJv+XWVCx2gnlt6tacPEAewrAQ==","signature_status":"signed_v1","signed_at":"2026-05-21T02:05:39.393965Z","signed_message":"canonical_sha256_bytes"},"source_id":"2605.21482","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:e0fd58b632199b778b2ee9e10e24d2ff2cd05e4d944ea7067e61e0db8cd60256","sha256:52f15b608ee702daa37ba7b3540397b94f66846cc148edc753953465946127ae"],"state_sha256":"e2d40ba9e0edb2c1ca97ef781459da718a9e5a611ee75afb6223bc63d6d2d0ed"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"lw/+o1Pzr4gtExg410s5QQFa+QCFBEpPmJc7Kx5b1BnFIphPbPsjMiLST5OxULgkwE7adsIXzIAVViRzV7nZCw==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-26T16:54:41.386836Z","bundle_sha256":"14544fcb3e9656267a12886cec2f19a6be69ed298c0d55ef69a94bbbe019507b"}}