{"record_type":"pith_number_record","schema_url":"https://pith.science/schemas/pith-number/v1.json","pith_number":"pith:2022:YNR7PILYEZSMAPV2FCSRJPFNTN","short_pith_number":"pith:YNR7PILY","schema_version":"1.0","canonical_sha256":"c363f7a1782664c03eba28a514bcad9b6c7df13d9e10e213e0583ecc30c2501a","source":{"kind":"arxiv","id":"2203.04462","version":1},"attestation_state":"computed","paper":{"title":"Downstream Fairness Caveats with Synthetic Healthcare Data","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.LG","authors_text":"Dennis Wei, Ioana Baldini, Jiaming Zeng, Karan Bhanot, Kristin P. Bennett","submitted_at":"2022-03-09T00:52:47Z","abstract_excerpt":"This paper evaluates synthetically generated healthcare data for biases and investigates the effect of fairness mitigation techniques on utility-fairness. Privacy laws limit access to health data such as Electronic Medical Records (EMRs) to preserve patient privacy. Albeit essential, these laws hinder research reproducibility. Synthetic data is a viable solution that can enable access to data similar to real healthcare data without privacy risks. Healthcare datasets may have biases in which certain protected groups might experience worse outcomes than others. With the real data having biases, "},"verification_status":{"content_addressed":true,"pith_receipt":true,"author_attested":false,"weak_author_claims":0,"strong_author_claims":0,"externally_anchored":false,"storage_verified":false,"citation_signatures":0,"replication_records":0,"graph_snapshot":true,"references_resolved":false,"formal_links_present":false},"canonical_record":{"source":{"id":"2203.04462","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2022-03-09T00:52:47Z","cross_cats_sorted":[],"title_canon_sha256":"8f213fe8b8427d72aa7eed4cc97067074ec82fe4090a0e9aa62819a2cb70b9fe","abstract_canon_sha256":"1c4cf767ea7657ebbbf500bd1e5d4cd9667a4fae11ea75052c6128962c841828"},"schema_version":"1.0"},"receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-07-05T04:03:18.639258Z","signature_b64":"JLj0MwZMgjpyrmofBCEdYhDXeNhXCA8AA/ZMygAI4ra9A4NZ3HtI2E9T2R/o7OiAUv96ylP7YYtl/8wVEWURAA==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"c363f7a1782664c03eba28a514bcad9b6c7df13d9e10e213e0583ecc30c2501a","last_reissued_at":"2026-07-05T04:03:18.638840Z","signature_status":"signed_v1","first_computed_at":"2026-07-05T04:03:18.638840Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"graph_snapshot":{"paper":{"title":"Downstream Fairness Caveats with Synthetic Healthcare Data","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.LG","authors_text":"Dennis Wei, Ioana Baldini, Jiaming Zeng, Karan Bhanot, Kristin P. Bennett","submitted_at":"2022-03-09T00:52:47Z","abstract_excerpt":"This paper evaluates synthetically generated healthcare data for biases and investigates the effect of fairness mitigation techniques on utility-fairness. Privacy laws limit access to health data such as Electronic Medical Records (EMRs) to preserve patient privacy. Albeit essential, these laws hinder research reproducibility. Synthetic data is a viable solution that can enable access to data similar to real healthcare data without privacy risks. Healthcare datasets may have biases in which certain protected groups might experience worse outcomes than others. With the real data having biases, "},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2203.04462","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2203.04462/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"aliases":[{"alias_kind":"arxiv","alias_value":"2203.04462","created_at":"2026-07-05T04:03:18.638893+00:00"},{"alias_kind":"arxiv_version","alias_value":"2203.04462v1","created_at":"2026-07-05T04:03:18.638893+00:00"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2203.04462","created_at":"2026-07-05T04:03:18.638893+00:00"},{"alias_kind":"pith_short_12","alias_value":"YNR7PILYEZSM","created_at":"2026-07-05T04:03:18.638893+00:00"},{"alias_kind":"pith_short_16","alias_value":"YNR7PILYEZSMAPV2","created_at":"2026-07-05T04:03:18.638893+00:00"},{"alias_kind":"pith_short_8","alias_value":"YNR7PILY","created_at":"2026-07-05T04:03:18.638893+00:00"}],"events":[],"event_summary":{},"paper_claims":[],"inbound_citations":{"count":0,"internal_anchor_count":0,"sample":[]},"formal_canon":{"evidence_count":0,"sample":[],"anchors":[]},"links":{"html":"https://pith.science/pith/YNR7PILYEZSMAPV2FCSRJPFNTN","json":"https://pith.science/pith/YNR7PILYEZSMAPV2FCSRJPFNTN.json","graph_json":"https://pith.science/api/pith-number/YNR7PILYEZSMAPV2FCSRJPFNTN/graph.json","events_json":"https://pith.science/api/pith-number/YNR7PILYEZSMAPV2FCSRJPFNTN/events.json","paper":"https://pith.science/paper/YNR7PILY"},"agent_actions":{"view_html":"https://pith.science/pith/YNR7PILYEZSMAPV2FCSRJPFNTN","download_json":"https://pith.science/pith/YNR7PILYEZSMAPV2FCSRJPFNTN.json","view_paper":"https://pith.science/paper/YNR7PILY","resolve_alias":"https://pith.science/api/pith-number/resolve?arxiv=2203.04462&json=true","fetch_graph":"https://pith.science/api/pith-number/YNR7PILYEZSMAPV2FCSRJPFNTN/graph.json","fetch_events":"https://pith.science/api/pith-number/YNR7PILYEZSMAPV2FCSRJPFNTN/events.json","actions":{"anchor_timestamp":"https://pith.science/pith/YNR7PILYEZSMAPV2FCSRJPFNTN/action/timestamp_anchor","attest_storage":"https://pith.science/pith/YNR7PILYEZSMAPV2FCSRJPFNTN/action/storage_attestation","attest_author":"https://pith.science/pith/YNR7PILYEZSMAPV2FCSRJPFNTN/action/author_attestation","sign_citation":"https://pith.science/pith/YNR7PILYEZSMAPV2FCSRJPFNTN/action/citation_signature","submit_replication":"https://pith.science/pith/YNR7PILYEZSMAPV2FCSRJPFNTN/action/replication_record"}},"created_at":"2026-07-05T04:03:18.638893+00:00","updated_at":"2026-07-05T04:03:18.638893+00:00"}