{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2017:67SSZHDSV4XA7PFWYT3MTTLJRP","short_pith_number":"pith:67SSZHDS","canonical_record":{"source":{"id":"1707.01623","kind":"arxiv","version":2},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"q-bio.QM","submitted_at":"2017-07-06T03:03:57Z","cross_cats_sorted":["cs.LG","cs.NE"],"title_canon_sha256":"6d28963f3796d1ccdfe6f5f50efae0adf671e299d2cd99c6e9efbb2a8583a5a3","abstract_canon_sha256":"c9b7fbf340b462c3e51fd1f48990a6c31b79b0a2a7b92ade371df24667098ed4"},"schema_version":"1.0"},"canonical_sha256":"f7e52c9c72af2e0fbcb6c4f6c9cd698becb0547b97945d3063b4d7f2a5326e7e","source":{"kind":"arxiv","id":"1707.01623","version":2},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1707.01623","created_at":"2026-05-18T00:17:19Z"},{"alias_kind":"arxiv_version","alias_value":"1707.01623v2","created_at":"2026-05-18T00:17:19Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1707.01623","created_at":"2026-05-18T00:17:19Z"},{"alias_kind":"pith_short_12","alias_value":"67SSZHDSV4XA","created_at":"2026-05-18T12:31:03Z"},{"alias_kind":"pith_short_16","alias_value":"67SSZHDSV4XA7PFW","created_at":"2026-05-18T12:31:03Z"},{"alias_kind":"pith_short_8","alias_value":"67SSZHDS","created_at":"2026-05-18T12:31:03Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2017:67SSZHDSV4XA7PFWYT3MTTLJRP","target":"record","payload":{"canonical_record":{"source":{"id":"1707.01623","kind":"arxiv","version":2},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"q-bio.QM","submitted_at":"2017-07-06T03:03:57Z","cross_cats_sorted":["cs.LG","cs.NE"],"title_canon_sha256":"6d28963f3796d1ccdfe6f5f50efae0adf671e299d2cd99c6e9efbb2a8583a5a3","abstract_canon_sha256":"c9b7fbf340b462c3e51fd1f48990a6c31b79b0a2a7b92ade371df24667098ed4"},"schema_version":"1.0"},"canonical_sha256":"f7e52c9c72af2e0fbcb6c4f6c9cd698becb0547b97945d3063b4d7f2a5326e7e","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:17:19.293681Z","signature_b64":"3ZpND247GenZZ2FpE4e1xcJvTcEDqYskN3HqPijoTzR0L5e1zVdciVxsMA1fAT51oeDLt3fN5pE5yfPEuOuSDg==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"f7e52c9c72af2e0fbcb6c4f6c9cd698becb0547b97945d3063b4d7f2a5326e7e","last_reissued_at":"2026-05-18T00:17:19.293174Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:17:19.293174Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1707.01623","source_version":2,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:17:19Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"6vr8ycxFlUbITb2vTKcZLZhcTKseKhfEmhYOtTm1gFcy0lihff3TIu/uYzWv9aaYRf6mt0LdW/ch8gmeM3PkCw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-23T17:56:38.814976Z"},"content_sha256":"456fd123bfaf40b415ffffaa9d16e62e6fdb2797d634a4d383dee3d511bc9451","schema_version":"1.0","event_id":"sha256:456fd123bfaf40b415ffffaa9d16e62e6fdb2797d634a4d383dee3d511bc9451"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2017:67SSZHDSV4XA7PFWYT3MTTLJRP","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"RIDDLE: Race and ethnicity Imputation from Disease history with Deep LEarning","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":["cs.LG","cs.NE"],"primary_cat":"q-bio.QM","authors_text":"Andrey Rzhetsky, Ji-Sung Kim, Xin Gao","submitted_at":"2017-07-06T03:03:57Z","abstract_excerpt":"Anonymized electronic medical records are an increasingly popular source of research data. However, these datasets often lack race and ethnicity information. This creates problems for researchers modeling human disease, as race and ethnicity are powerful confounders for many health exposures and treatment outcomes; race and ethnicity are closely linked to population-specific genetic variation. We showed that deep neural networks generate more accurate estimates for missing racial and ethnic information than competing methods (e.g., logistic regression, random forest). RIDDLE yielded significan"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1707.01623","kind":"arxiv","version":2},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:17:19Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"Hglu0ZC+S2NYa1GqqmzsyMupU/6ha93Tb4OQ0Trz65TlTM6aJpqHOC0/ZGM4p8t5NNqVPrmyOI9R1WjgTH5NBg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-23T17:56:38.815347Z"},"content_sha256":"788f86f66e363395a5aaf1ebc4349c784f767e319083726e300864b619652ce8","schema_version":"1.0","event_id":"sha256:788f86f66e363395a5aaf1ebc4349c784f767e319083726e300864b619652ce8"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/67SSZHDSV4XA7PFWYT3MTTLJRP/bundle.json","state_url":"https://pith.science/pith/67SSZHDSV4XA7PFWYT3MTTLJRP/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/67SSZHDSV4XA7PFWYT3MTTLJRP/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-23T17:56:38Z","links":{"resolver":"https://pith.science/pith/67SSZHDSV4XA7PFWYT3MTTLJRP","bundle":"https://pith.science/pith/67SSZHDSV4XA7PFWYT3MTTLJRP/bundle.json","state":"https://pith.science/pith/67SSZHDSV4XA7PFWYT3MTTLJRP/state.json","well_known_bundle":"https://pith.science/.well-known/pith/67SSZHDSV4XA7PFWYT3MTTLJRP/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2017:67SSZHDSV4XA7PFWYT3MTTLJRP","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"c9b7fbf340b462c3e51fd1f48990a6c31b79b0a2a7b92ade371df24667098ed4","cross_cats_sorted":["cs.LG","cs.NE"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"q-bio.QM","submitted_at":"2017-07-06T03:03:57Z","title_canon_sha256":"6d28963f3796d1ccdfe6f5f50efae0adf671e299d2cd99c6e9efbb2a8583a5a3"},"schema_version":"1.0","source":{"id":"1707.01623","kind":"arxiv","version":2}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1707.01623","created_at":"2026-05-18T00:17:19Z"},{"alias_kind":"arxiv_version","alias_value":"1707.01623v2","created_at":"2026-05-18T00:17:19Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1707.01623","created_at":"2026-05-18T00:17:19Z"},{"alias_kind":"pith_short_12","alias_value":"67SSZHDSV4XA","created_at":"2026-05-18T12:31:03Z"},{"alias_kind":"pith_short_16","alias_value":"67SSZHDSV4XA7PFW","created_at":"2026-05-18T12:31:03Z"},{"alias_kind":"pith_short_8","alias_value":"67SSZHDS","created_at":"2026-05-18T12:31:03Z"}],"graph_snapshots":[{"event_id":"sha256:788f86f66e363395a5aaf1ebc4349c784f767e319083726e300864b619652ce8","target":"graph","created_at":"2026-05-18T00:17:19Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Anonymized electronic medical records are an increasingly popular source of research data. However, these datasets often lack race and ethnicity information. This creates problems for researchers modeling human disease, as race and ethnicity are powerful confounders for many health exposures and treatment outcomes; race and ethnicity are closely linked to population-specific genetic variation. We showed that deep neural networks generate more accurate estimates for missing racial and ethnic information than competing methods (e.g., logistic regression, random forest). RIDDLE yielded significan","authors_text":"Andrey Rzhetsky, Ji-Sung Kim, Xin Gao","cross_cats":["cs.LG","cs.NE"],"headline":"","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"q-bio.QM","submitted_at":"2017-07-06T03:03:57Z","title":"RIDDLE: Race and ethnicity Imputation from Disease history with Deep LEarning"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1707.01623","kind":"arxiv","version":2},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:456fd123bfaf40b415ffffaa9d16e62e6fdb2797d634a4d383dee3d511bc9451","target":"record","created_at":"2026-05-18T00:17:19Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"c9b7fbf340b462c3e51fd1f48990a6c31b79b0a2a7b92ade371df24667098ed4","cross_cats_sorted":["cs.LG","cs.NE"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"q-bio.QM","submitted_at":"2017-07-06T03:03:57Z","title_canon_sha256":"6d28963f3796d1ccdfe6f5f50efae0adf671e299d2cd99c6e9efbb2a8583a5a3"},"schema_version":"1.0","source":{"id":"1707.01623","kind":"arxiv","version":2}},"canonical_sha256":"f7e52c9c72af2e0fbcb6c4f6c9cd698becb0547b97945d3063b4d7f2a5326e7e","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"f7e52c9c72af2e0fbcb6c4f6c9cd698becb0547b97945d3063b4d7f2a5326e7e","first_computed_at":"2026-05-18T00:17:19.293174Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:17:19.293174Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"3ZpND247GenZZ2FpE4e1xcJvTcEDqYskN3HqPijoTzR0L5e1zVdciVxsMA1fAT51oeDLt3fN5pE5yfPEuOuSDg==","signature_status":"signed_v1","signed_at":"2026-05-18T00:17:19.293681Z","signed_message":"canonical_sha256_bytes"},"source_id":"1707.01623","source_kind":"arxiv","source_version":2}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:456fd123bfaf40b415ffffaa9d16e62e6fdb2797d634a4d383dee3d511bc9451","sha256:788f86f66e363395a5aaf1ebc4349c784f767e319083726e300864b619652ce8"],"state_sha256":"4303c780f6a5603a996515902b010466516cbe7f69103d44f6fb4c9417ec842d"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"ChwGDzfqqLViTa4nxRW1WrcK2V0v3MqAp3yx5caqzuxzWESINKhjmwG4efxQLRhlxWxB3NOfxzcM9c7uxiGbAw==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-23T17:56:38.817875Z","bundle_sha256":"30845bc4643552bd6f24ee8812ccfdcdcbb19fe2fa569f3e19b206fc953e99ba"}}