{"record_type":"pith_number_record","schema_url":"https://pith.science/schemas/pith-number/v1.json","pith_number":"pith:2022:IPSR7HEVLWVEOETEGULDKGU2SD","short_pith_number":"pith:IPSR7HEV","schema_version":"1.0","canonical_sha256":"43e51f9c955daa4712643516351a9a90e65a1dae6e788e9b17655442057f73e0","source":{"kind":"arxiv","id":"2201.07754","version":3},"attestation_state":"computed","paper":{"title":"Grep-BiasIR: A Dataset for Investigating Gender Representation-Bias in Information Retrieval Results","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.IR","authors_text":"Emilia Parada-Cabaleiro, Gertraud Medicus, Klara Krieg, Markus Schedl, Navid Rekabsaz, Oleg Lesota","submitted_at":"2022-01-19T17:50:18Z","abstract_excerpt":"The provided contents by information retrieval (IR) systems can reflect the existing societal biases and stereotypes. Such biases in retrieval results can lead to further establishing and strengthening stereotypes in society and also in the systems. To facilitate the studies of gender bias in the retrieval results of IR systems, we introduce Gender Representation-Bias for Information Retrieval (Grep-BiasIR), a novel thoroughly-audited dataset consisting of 118 bias-sensitive neutral search queries. The set of queries covers a wide range of gender-related topics, for which a biased representati"},"verification_status":{"content_addressed":true,"pith_receipt":true,"author_attested":false,"weak_author_claims":0,"strong_author_claims":0,"externally_anchored":false,"storage_verified":false,"citation_signatures":0,"replication_records":0,"graph_snapshot":true,"references_resolved":false,"formal_links_present":false},"canonical_record":{"source":{"id":"2201.07754","kind":"arxiv","version":3},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.IR","submitted_at":"2022-01-19T17:50:18Z","cross_cats_sorted":[],"title_canon_sha256":"adaea4d0fe0d4ecfe787d8b248170ab743eaecf4a9dd4c9125e7b6b5a77902c6","abstract_canon_sha256":"8127ebfb5985e4dfecefc200dc01df5f27aa35d9f4754f50b297e33c4d78003b"},"schema_version":"1.0"},"receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-07-05T05:31:34.630934Z","signature_b64":"tbIEGiPGp+yX5jQuKU9kAU0dxMNW91R1xTycxkCTE3G7D5nCoFP/rMhouBMMfdSZYo5FdSdap1lwgJ/AVIpADQ==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"43e51f9c955daa4712643516351a9a90e65a1dae6e788e9b17655442057f73e0","last_reissued_at":"2026-07-05T05:31:34.630487Z","signature_status":"signed_v1","first_computed_at":"2026-07-05T05:31:34.630487Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"graph_snapshot":{"paper":{"title":"Grep-BiasIR: A Dataset for Investigating Gender Representation-Bias in Information Retrieval Results","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.IR","authors_text":"Emilia Parada-Cabaleiro, Gertraud Medicus, Klara Krieg, Markus Schedl, Navid Rekabsaz, Oleg Lesota","submitted_at":"2022-01-19T17:50:18Z","abstract_excerpt":"The provided contents by information retrieval (IR) systems can reflect the existing societal biases and stereotypes. Such biases in retrieval results can lead to further establishing and strengthening stereotypes in society and also in the systems. To facilitate the studies of gender bias in the retrieval results of IR systems, we introduce Gender Representation-Bias for Information Retrieval (Grep-BiasIR), a novel thoroughly-audited dataset consisting of 118 bias-sensitive neutral search queries. The set of queries covers a wide range of gender-related topics, for which a biased representati"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2201.07754","kind":"arxiv","version":3},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2201.07754/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"aliases":[{"alias_kind":"arxiv","alias_value":"2201.07754","created_at":"2026-07-05T05:31:34.630534+00:00"},{"alias_kind":"arxiv_version","alias_value":"2201.07754v3","created_at":"2026-07-05T05:31:34.630534+00:00"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2201.07754","created_at":"2026-07-05T05:31:34.630534+00:00"},{"alias_kind":"pith_short_12","alias_value":"IPSR7HEVLWVE","created_at":"2026-07-05T05:31:34.630534+00:00"},{"alias_kind":"pith_short_16","alias_value":"IPSR7HEVLWVEOETE","created_at":"2026-07-05T05:31:34.630534+00:00"},{"alias_kind":"pith_short_8","alias_value":"IPSR7HEV","created_at":"2026-07-05T05:31:34.630534+00:00"}],"events":[],"event_summary":{},"paper_claims":[],"inbound_citations":{"count":0,"internal_anchor_count":0,"sample":[]},"formal_canon":{"evidence_count":0,"sample":[],"anchors":[]},"links":{"html":"https://pith.science/pith/IPSR7HEVLWVEOETEGULDKGU2SD","json":"https://pith.science/pith/IPSR7HEVLWVEOETEGULDKGU2SD.json","graph_json":"https://pith.science/api/pith-number/IPSR7HEVLWVEOETEGULDKGU2SD/graph.json","events_json":"https://pith.science/api/pith-number/IPSR7HEVLWVEOETEGULDKGU2SD/events.json","paper":"https://pith.science/paper/IPSR7HEV"},"agent_actions":{"view_html":"https://pith.science/pith/IPSR7HEVLWVEOETEGULDKGU2SD","download_json":"https://pith.science/pith/IPSR7HEVLWVEOETEGULDKGU2SD.json","view_paper":"https://pith.science/paper/IPSR7HEV","resolve_alias":"https://pith.science/api/pith-number/resolve?arxiv=2201.07754&json=true","fetch_graph":"https://pith.science/api/pith-number/IPSR7HEVLWVEOETEGULDKGU2SD/graph.json","fetch_events":"https://pith.science/api/pith-number/IPSR7HEVLWVEOETEGULDKGU2SD/events.json","actions":{"anchor_timestamp":"https://pith.science/pith/IPSR7HEVLWVEOETEGULDKGU2SD/action/timestamp_anchor","attest_storage":"https://pith.science/pith/IPSR7HEVLWVEOETEGULDKGU2SD/action/storage_attestation","attest_author":"https://pith.science/pith/IPSR7HEVLWVEOETEGULDKGU2SD/action/author_attestation","sign_citation":"https://pith.science/pith/IPSR7HEVLWVEOETEGULDKGU2SD/action/citation_signature","submit_replication":"https://pith.science/pith/IPSR7HEVLWVEOETEGULDKGU2SD/action/replication_record"}},"created_at":"2026-07-05T05:31:34.630534+00:00","updated_at":"2026-07-05T05:31:34.630534+00:00"}