{"record_type":"pith_number_record","schema_url":"https://pith.science/schemas/pith-number/v1.json","pith_number":"pith:2026:2LOP3U2AZFG6RQVHIS262VFRAK","short_pith_number":"pith:2LOP3U2A","schema_version":"1.0","canonical_sha256":"d2dcfdd340c94de8c2a744b5ed54b1028b57eb64a73e9fa619bad312169463e3","source":{"kind":"arxiv","id":"2606.15345","version":2},"attestation_state":"computed","paper":{"title":"Beyond Monolingual Deep Research: Evaluating Agents and Retrievers with Cross-Lingual BrowseComp-Plus","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.IR"],"primary_cat":"cs.CL","authors_text":"Fuheng Zhao, Heli Qi, Hitomi Yanaka, Naoto Yokoya, Puxuan Yu, Qingcheng Zeng, Rui Yang, Weihao Xuan, Yuheng Lu","submitted_at":"2026-06-13T15:11:52Z","abstract_excerpt":"Deep research agents are increasingly evaluated on their ability to search for evidence, reason over retrieved sources, and produce grounded answers. Existing browsing benchmarks, however, largely assume that the user's query and the supporting evidence are written in the same language, leaving open whether agentic search systems can operate when relevant evidence appears in another language. We introduce XBCP (Cross-lingual BrowseComp-Plus), a controlled benchmark that preserves the English question-and-answer space of BrowseComp-Plus but varies the languages of the supporting documents. XBCP"},"verification_status":{"content_addressed":true,"pith_receipt":true,"author_attested":false,"weak_author_claims":0,"strong_author_claims":0,"externally_anchored":false,"storage_verified":false,"citation_signatures":0,"replication_records":0,"graph_snapshot":true,"references_resolved":false,"formal_links_present":false},"canonical_record":{"source":{"id":"2606.15345","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2026-06-13T15:11:52Z","cross_cats_sorted":["cs.IR"],"title_canon_sha256":"2b083da9ad874c732517a88097666132adca4fe1234a7e5f3bbbcec22ebf19ab","abstract_canon_sha256":"b045c76f30f95e0006b2e4556cad9faa42bb0acbcab860a9ded5acb71bb18133"},"schema_version":"1.0"},"receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-06-19T16:11:37.531044Z","signature_b64":"6eTqYry2iZvgLEQ2Z8Nj/A1UiMUIx41GEv/C0ZXSfMQJzWt0re0nedpiUxPqnb/QzkgwVuutSlVwJp5F9cXNCw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"d2dcfdd340c94de8c2a744b5ed54b1028b57eb64a73e9fa619bad312169463e3","last_reissued_at":"2026-06-19T16:11:37.530607Z","signature_status":"signed_v1","first_computed_at":"2026-06-19T16:11:37.530607Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"graph_snapshot":{"paper":{"title":"Beyond Monolingual Deep Research: Evaluating Agents and Retrievers with Cross-Lingual BrowseComp-Plus","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.IR"],"primary_cat":"cs.CL","authors_text":"Fuheng Zhao, Heli Qi, Hitomi Yanaka, Naoto Yokoya, Puxuan Yu, Qingcheng Zeng, Rui Yang, Weihao Xuan, Yuheng Lu","submitted_at":"2026-06-13T15:11:52Z","abstract_excerpt":"Deep research agents are increasingly evaluated on their ability to search for evidence, reason over retrieved sources, and produce grounded answers. Existing browsing benchmarks, however, largely assume that the user's query and the supporting evidence are written in the same language, leaving open whether agentic search systems can operate when relevant evidence appears in another language. We introduce XBCP (Cross-lingual BrowseComp-Plus), a controlled benchmark that preserves the English question-and-answer space of BrowseComp-Plus but varies the languages of the supporting documents. XBCP"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.15345","kind":"arxiv","version":2},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2606.15345/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"aliases":[{"alias_kind":"arxiv","alias_value":"2606.15345","created_at":"2026-06-19T16:11:37.530665+00:00"},{"alias_kind":"arxiv_version","alias_value":"2606.15345v2","created_at":"2026-06-19T16:11:37.530665+00:00"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.15345","created_at":"2026-06-19T16:11:37.530665+00:00"},{"alias_kind":"pith_short_12","alias_value":"2LOP3U2AZFG6","created_at":"2026-06-19T16:11:37.530665+00:00"},{"alias_kind":"pith_short_16","alias_value":"2LOP3U2AZFG6RQVH","created_at":"2026-06-19T16:11:37.530665+00:00"},{"alias_kind":"pith_short_8","alias_value":"2LOP3U2A","created_at":"2026-06-19T16:11:37.530665+00:00"}],"events":[],"event_summary":{},"paper_claims":[],"inbound_citations":{"count":0,"internal_anchor_count":0,"sample":[]},"formal_canon":{"evidence_count":0,"sample":[],"anchors":[]},"links":{"html":"https://pith.science/pith/2LOP3U2AZFG6RQVHIS262VFRAK","json":"https://pith.science/pith/2LOP3U2AZFG6RQVHIS262VFRAK.json","graph_json":"https://pith.science/api/pith-number/2LOP3U2AZFG6RQVHIS262VFRAK/graph.json","events_json":"https://pith.science/api/pith-number/2LOP3U2AZFG6RQVHIS262VFRAK/events.json","paper":"https://pith.science/paper/2LOP3U2A"},"agent_actions":{"view_html":"https://pith.science/pith/2LOP3U2AZFG6RQVHIS262VFRAK","download_json":"https://pith.science/pith/2LOP3U2AZFG6RQVHIS262VFRAK.json","view_paper":"https://pith.science/paper/2LOP3U2A","resolve_alias":"https://pith.science/api/pith-number/resolve?arxiv=2606.15345&json=true","fetch_graph":"https://pith.science/api/pith-number/2LOP3U2AZFG6RQVHIS262VFRAK/graph.json","fetch_events":"https://pith.science/api/pith-number/2LOP3U2AZFG6RQVHIS262VFRAK/events.json","actions":{"anchor_timestamp":"https://pith.science/pith/2LOP3U2AZFG6RQVHIS262VFRAK/action/timestamp_anchor","attest_storage":"https://pith.science/pith/2LOP3U2AZFG6RQVHIS262VFRAK/action/storage_attestation","attest_author":"https://pith.science/pith/2LOP3U2AZFG6RQVHIS262VFRAK/action/author_attestation","sign_citation":"https://pith.science/pith/2LOP3U2AZFG6RQVHIS262VFRAK/action/citation_signature","submit_replication":"https://pith.science/pith/2LOP3U2AZFG6RQVHIS262VFRAK/action/replication_record"}},"created_at":"2026-06-19T16:11:37.530665+00:00","updated_at":"2026-06-19T16:11:37.530665+00:00"}