{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:P6HZQIN2QM6BUV3B27HPELY3JC","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"fb9343d7b6a6fe1ca807a48de349a9bd6f1b331166f7ee75c7d6c209378ae88e","cross_cats_sorted":["cs.IR"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.DB","submitted_at":"2026-05-15T09:47:44Z","title_canon_sha256":"a36530d23550d6b31da3480d03dcb111072589ebe0d22fb7a41ea0628b7a2b55"},"schema_version":"1.0","source":{"id":"2605.15790","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2605.15790","created_at":"2026-05-20T00:01:18Z"},{"alias_kind":"arxiv_version","alias_value":"2605.15790v1","created_at":"2026-05-20T00:01:18Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.15790","created_at":"2026-05-20T00:01:18Z"},{"alias_kind":"pith_short_12","alias_value":"P6HZQIN2QM6B","created_at":"2026-05-20T00:01:18Z"},{"alias_kind":"pith_short_16","alias_value":"P6HZQIN2QM6BUV3B","created_at":"2026-05-20T00:01:18Z"},{"alias_kind":"pith_short_8","alias_value":"P6HZQIN2","created_at":"2026-05-20T00:01:18Z"}],"graph_snapshots":[{"event_id":"sha256:23b8202a03e87024db9bc9dccb5f21bede3a0ca9fa2e62517f01db8243790981","target":"graph","created_at":"2026-05-20T00:01:18Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":4,"items":[{"attestation":"unclaimed","claim_id":"C1","kind":"strongest_claim","source":"verdict.strongest_claim","status":"machine_extracted","text":"Experimental results show that our method effectively mitigates generation bias while preserving relevance."},{"attestation":"unclaimed","claim_id":"C2","kind":"weakest_assumption","source":"verdict.weakest_assumption","status":"machine_extracted","text":"The position-aware model of bias propagation combined with controlled bias injection via reranking accurately represents how retrieval choices affect downstream generation bias in top-k settings."},{"attestation":"unclaimed","claim_id":"C3","kind":"one_line_summary","source":"verdict.one_line_summary","status":"machine_extracted","text":"Introduces FARO, a scalable quadratic optimization approach for fairness-aware top-k retrieval in RAG that mitigates generation bias via controlled reranking and position-aware propagation modeling."},{"attestation":"unclaimed","claim_id":"C4","kind":"headline","source":"verdict.pith_extraction.headline","status":"machine_extracted","text":"Retrieval optimization that models position-dependent bias propagation can reduce unfairness in RAG outputs while maintaining document relevance."}],"snapshot_sha256":"e5590612494e99838b948847041669d0f98483c9e3a7c1f6498ecb1a624bac89"},"formal_canon":{"evidence_count":2,"snapshot_sha256":"e2cd21f3d2e9dc1838a682ba089d717a3f328426ee81b3f2c3875c0bdc585ae6"},"integrity":{"available":true,"clean":true,"detectors_run":[{"findings_count":0,"name":"doi_compliance","ran_at":"2026-05-19T19:31:29.713275Z","status":"completed","version":"1.0.0"},{"findings_count":0,"name":"doi_title_agreement","ran_at":"2026-05-19T19:31:19.102646Z","status":"completed","version":"1.0.0"},{"findings_count":0,"name":"ai_meta_artifact","ran_at":"2026-05-19T17:33:48.745052Z","status":"skipped","version":"1.0.0"},{"findings_count":0,"name":"claim_evidence","ran_at":"2026-05-19T17:21:55.913721Z","status":"completed","version":"1.0.0"}],"endpoint":"/pith/2605.15790/integrity.json","findings":[],"snapshot_sha256":"b3e475a1831eb076fa84ba800da240f1d29636814dd929a3e69fb25404342a53","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Retrieval-Augmented Generation (RAG) improves reliability of large language models by incorporating external knowledge, but the retrieval process can introduce bias that propagates to generated outputs. This issue is particularly challenging in top-k settings, where multiple documents jointly influence generation. We propose a fairness-aware retrieval framework that models and controls this bias. Our approach combines controlled bias injection via reranking, a position-aware model of bias propagation, and an optimization formulation that balances relevance and fairness. We further introduce a ","authors_text":"Jyrki Nummenmaa, Kostas Stefanidis, Vasilis Efthymiou, Yingqi Zhao","cross_cats":["cs.IR"],"headline":"Retrieval optimization that models position-dependent bias propagation can reduce unfairness in RAG outputs while maintaining document relevance.","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.DB","submitted_at":"2026-05-15T09:47:44Z","title":"Fairness-Aware Retrieval Optimization for Retrieval-Augmented Generation"},"references":{"count":37,"internal_anchors":7,"resolved_work":37,"sample":[{"cited_arxiv_id":"","doi":"","is_internal_anchor":false,"ref_index":1,"title":"URL:https://papers.nips.cc/paper_files/paper/ 2017/hash/3f5ee243547dee91fbd053c1c4a845aa-Abstract.html","work_id":"2e440f68-a8ae-4725-a9e2-5bb4e5df8a26","year":2017},{"cited_arxiv_id":"2001.08361","doi":"","is_internal_anchor":true,"ref_index":2,"title":"Scaling Laws for Neural Language Models","work_id":"b7dd8749-9c45-4977-ab9b-64478dce1ae8","year":2020},{"cited_arxiv_id":"","doi":"10.1145/3571730","is_internal_anchor":false,"ref_index":3,"title":"Barret Zoph, Irwan Bello, Sameer Kumar, Nan Du, Yanping Huang, Jeff Dean, Noam Shazeer, and William Fedus","work_id":"aa2fb99f-beb8-463c-8cd4-c575e96e2512","year":2023},{"cited_arxiv_id":"","doi":"","is_internal_anchor":false,"ref_index":4,"title":"P. Lewis, E. Perez, A. Piktus, F. Petroni, V. Karpukhin, N. Goyal, H. Küttler, M. Lewis, W.-t. Yih, T. Rocktäschel, S. Riedel, D. Kiela, Retrieval-augmented generation for knowledge-intensive nlp task","work_id":"8a5c7cee-dade-462a-98ee-6e113a181d9d","year":2020},{"cited_arxiv_id":"","doi":"","is_internal_anchor":false,"ref_index":5,"title":"M. Hu, H. Wu, Z. Guan, R. Zhu, D. Guo, D. Qi, S. Li, No Free Lunch: Retrieval-Augmented Generation Undermines Fairness in LLMs, Even for Vig- 36 ilant Users, 2024. URL:http://arxiv.org/abs/2410.07589.","work_id":"483b402b-cc8b-4253-9c72-ad94aa6bb2be","year":2024}],"snapshot_sha256":"0bf5a9188b887a210601ff8767c5f459851435dbd2c4a5b32148caf96c6bbff2"},"source":{"id":"2605.15790","kind":"arxiv","version":1},"verdict":{"created_at":"2026-05-19T19:22:29.557138Z","id":"6323b9c8-04b2-4133-9da1-06a4242da12d","model_set":{"reader":"grok-4.3"},"one_line_summary":"Introduces FARO, a scalable quadratic optimization approach for fairness-aware top-k retrieval in RAG that mitigates generation bias via controlled reranking and position-aware propagation modeling.","pipeline_version":"pith-pipeline@v0.9.0","pith_extraction_headline":"Retrieval optimization that models position-dependent bias propagation can reduce unfairness in RAG outputs while maintaining document relevance.","strongest_claim":"Experimental results show that our method effectively mitigates generation bias while preserving relevance.","weakest_assumption":"The position-aware model of bias propagation combined with controlled bias injection via reranking accurately represents how retrieval choices affect downstream generation bias in top-k settings."}},"verdict_id":"6323b9c8-04b2-4133-9da1-06a4242da12d"}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:869326736e79267003aa0b9eb6447c595aca8665e8ab99e6ea49b2da3b099fdc","target":"record","created_at":"2026-05-20T00:01:18Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"fb9343d7b6a6fe1ca807a48de349a9bd6f1b331166f7ee75c7d6c209378ae88e","cross_cats_sorted":["cs.IR"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.DB","submitted_at":"2026-05-15T09:47:44Z","title_canon_sha256":"a36530d23550d6b31da3480d03dcb111072589ebe0d22fb7a41ea0628b7a2b55"},"schema_version":"1.0","source":{"id":"2605.15790","kind":"arxiv","version":1}},"canonical_sha256":"7f8f9821ba833c1a5761d7cef22f1b48ab6a5e2e103ca6e3d9d34ffd38649c0f","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"7f8f9821ba833c1a5761d7cef22f1b48ab6a5e2e103ca6e3d9d34ffd38649c0f","first_computed_at":"2026-05-20T00:01:18.453135Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-20T00:01:18.453135Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"iDoPIZadxJfRWa2+pWPFPW4MOkae0oZ/muVxbt9Kpz4tw78Fi93v8rvZc/+3v0m0xqne1UKsnxQCYhigFrmACw==","signature_status":"signed_v1","signed_at":"2026-05-20T00:01:18.453905Z","signed_message":"canonical_sha256_bytes"},"source_id":"2605.15790","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:869326736e79267003aa0b9eb6447c595aca8665e8ab99e6ea49b2da3b099fdc","sha256:23b8202a03e87024db9bc9dccb5f21bede3a0ca9fa2e62517f01db8243790981"],"state_sha256":"df8dc86b29769186962e939f5898b54a8c48baf5f902d8155fc160ca1f2ceaf4"}