{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2017:HY4JOTAW2X2XDJXXTNUTHA5EIT","short_pith_number":"pith:HY4JOTAW","canonical_record":{"source":{"id":"1706.01513","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CY","submitted_at":"2017-06-01T20:34:41Z","cross_cats_sorted":["cs.LG","stat.ML"],"title_canon_sha256":"7a48d69f7974289f5e48a5e61d97b2f86f3fb308e8d38f5897e5392db45c8e7b","abstract_canon_sha256":"8be306a870eff2800b72788eb58c589f67239ead000d7f62b81f7d29b265ba1a"},"schema_version":"1.0"},"canonical_sha256":"3e38974c16d5f571a6f79b693383a444ebd743ca867864d1f0518e8e15aa99b5","source":{"kind":"arxiv","id":"1706.01513","version":2},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1706.01513","created_at":"2026-05-18T00:25:04Z"},{"alias_kind":"arxiv_version","alias_value":"1706.01513v2","created_at":"2026-05-18T00:25:04Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1706.01513","created_at":"2026-05-18T00:25:04Z"},{"alias_kind":"pith_short_12","alias_value":"HY4JOTAW2X2X","created_at":"2026-05-18T12:31:21Z"},{"alias_kind":"pith_short_16","alias_value":"HY4JOTAW2X2XDJXX","created_at":"2026-05-18T12:31:21Z"},{"alias_kind":"pith_short_8","alias_value":"HY4JOTAW","created_at":"2026-05-18T12:31:21Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2017:HY4JOTAW2X2XDJXXTNUTHA5EIT","target":"record","payload":{"canonical_record":{"source":{"id":"1706.01513","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CY","submitted_at":"2017-06-01T20:34:41Z","cross_cats_sorted":["cs.LG","stat.ML"],"title_canon_sha256":"7a48d69f7974289f5e48a5e61d97b2f86f3fb308e8d38f5897e5392db45c8e7b","abstract_canon_sha256":"8be306a870eff2800b72788eb58c589f67239ead000d7f62b81f7d29b265ba1a"},"schema_version":"1.0"},"canonical_sha256":"3e38974c16d5f571a6f79b693383a444ebd743ca867864d1f0518e8e15aa99b5","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:25:04.157634Z","signature_b64":"tlgn4pPHnE77pPsXrVoarB+nOGyF0IXn2StefJxdbyVC17PCnusV6PJ4bz3kzlgb20nOzyrdApVLotIeQj75BQ==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"3e38974c16d5f571a6f79b693383a444ebd743ca867864d1f0518e8e15aa99b5","last_reissued_at":"2026-05-18T00:25:04.156947Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:25:04.156947Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1706.01513","source_version":2,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:25:04Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"EbOCDlz1WNCDpQEoaE1Eu+8C5wfcHZ71o7XJKetkdIq8lbkyt3ldzquT45muQx0nuWd0N3YhMvzJE8wmvEL8Ag==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-08T21:23:19.218589Z"},"content_sha256":"aa0f6b89500f1bf6973102a8dc803580f1a214cabc1a091df3bd13130bd6a5b5","schema_version":"1.0","event_id":"sha256:aa0f6b89500f1bf6973102a8dc803580f1a214cabc1a091df3bd13130bd6a5b5"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2017:HY4JOTAW2X2XDJXXTNUTHA5EIT","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Beyond Volume: The Impact of Complex Healthcare Data on the Machine Learning Pipeline","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.LG","stat.ML"],"primary_cat":"cs.CY","authors_text":"Chao Huang, Keith Feldman, Louis Faust, Nitesh V. Chawla, Xian Wu","submitted_at":"2017-06-01T20:34:41Z","abstract_excerpt":"From medical charts to national census, healthcare has traditionally operated under a paper-based paradigm. However, the past decade has marked a long and arduous transformation bringing healthcare into the digital age. Ranging from electronic health records, to digitized imaging and laboratory reports, to public health datasets, today, healthcare now generates an incredible amount of digital information. Such a wealth of data presents an exciting opportunity for integrated machine learning solutions to address problems across multiple facets of healthcare practice and administration. Unfortun"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1706.01513","kind":"arxiv","version":2},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:25:04Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"Do5uJ9fyb9IrfoNblQ4vG5dZ/OaOQYhW18gVKHQJTrc92sXVdPOoy87Hj6LNN63Zr36y8bufSsrYGxZDALsACw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-08T21:23:19.219293Z"},"content_sha256":"b810328ac24feb84e2a5fb6f13889cac8db0987841cc3e3a97b2f5398d6bdca4","schema_version":"1.0","event_id":"sha256:b810328ac24feb84e2a5fb6f13889cac8db0987841cc3e3a97b2f5398d6bdca4"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/HY4JOTAW2X2XDJXXTNUTHA5EIT/bundle.json","state_url":"https://pith.science/pith/HY4JOTAW2X2XDJXXTNUTHA5EIT/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/HY4JOTAW2X2XDJXXTNUTHA5EIT/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-08T21:23:19Z","links":{"resolver":"https://pith.science/pith/HY4JOTAW2X2XDJXXTNUTHA5EIT","bundle":"https://pith.science/pith/HY4JOTAW2X2XDJXXTNUTHA5EIT/bundle.json","state":"https://pith.science/pith/HY4JOTAW2X2XDJXXTNUTHA5EIT/state.json","well_known_bundle":"https://pith.science/.well-known/pith/HY4JOTAW2X2XDJXXTNUTHA5EIT/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2017:HY4JOTAW2X2XDJXXTNUTHA5EIT","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"8be306a870eff2800b72788eb58c589f67239ead000d7f62b81f7d29b265ba1a","cross_cats_sorted":["cs.LG","stat.ML"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CY","submitted_at":"2017-06-01T20:34:41Z","title_canon_sha256":"7a48d69f7974289f5e48a5e61d97b2f86f3fb308e8d38f5897e5392db45c8e7b"},"schema_version":"1.0","source":{"id":"1706.01513","kind":"arxiv","version":2}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1706.01513","created_at":"2026-05-18T00:25:04Z"},{"alias_kind":"arxiv_version","alias_value":"1706.01513v2","created_at":"2026-05-18T00:25:04Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1706.01513","created_at":"2026-05-18T00:25:04Z"},{"alias_kind":"pith_short_12","alias_value":"HY4JOTAW2X2X","created_at":"2026-05-18T12:31:21Z"},{"alias_kind":"pith_short_16","alias_value":"HY4JOTAW2X2XDJXX","created_at":"2026-05-18T12:31:21Z"},{"alias_kind":"pith_short_8","alias_value":"HY4JOTAW","created_at":"2026-05-18T12:31:21Z"}],"graph_snapshots":[{"event_id":"sha256:b810328ac24feb84e2a5fb6f13889cac8db0987841cc3e3a97b2f5398d6bdca4","target":"graph","created_at":"2026-05-18T00:25:04Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"From medical charts to national census, healthcare has traditionally operated under a paper-based paradigm. However, the past decade has marked a long and arduous transformation bringing healthcare into the digital age. Ranging from electronic health records, to digitized imaging and laboratory reports, to public health datasets, today, healthcare now generates an incredible amount of digital information. Such a wealth of data presents an exciting opportunity for integrated machine learning solutions to address problems across multiple facets of healthcare practice and administration. Unfortun","authors_text":"Chao Huang, Keith Feldman, Louis Faust, Nitesh V. Chawla, Xian Wu","cross_cats":["cs.LG","stat.ML"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CY","submitted_at":"2017-06-01T20:34:41Z","title":"Beyond Volume: The Impact of Complex Healthcare Data on the Machine Learning Pipeline"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1706.01513","kind":"arxiv","version":2},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:aa0f6b89500f1bf6973102a8dc803580f1a214cabc1a091df3bd13130bd6a5b5","target":"record","created_at":"2026-05-18T00:25:04Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"8be306a870eff2800b72788eb58c589f67239ead000d7f62b81f7d29b265ba1a","cross_cats_sorted":["cs.LG","stat.ML"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CY","submitted_at":"2017-06-01T20:34:41Z","title_canon_sha256":"7a48d69f7974289f5e48a5e61d97b2f86f3fb308e8d38f5897e5392db45c8e7b"},"schema_version":"1.0","source":{"id":"1706.01513","kind":"arxiv","version":2}},"canonical_sha256":"3e38974c16d5f571a6f79b693383a444ebd743ca867864d1f0518e8e15aa99b5","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"3e38974c16d5f571a6f79b693383a444ebd743ca867864d1f0518e8e15aa99b5","first_computed_at":"2026-05-18T00:25:04.156947Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:25:04.156947Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"tlgn4pPHnE77pPsXrVoarB+nOGyF0IXn2StefJxdbyVC17PCnusV6PJ4bz3kzlgb20nOzyrdApVLotIeQj75BQ==","signature_status":"signed_v1","signed_at":"2026-05-18T00:25:04.157634Z","signed_message":"canonical_sha256_bytes"},"source_id":"1706.01513","source_kind":"arxiv","source_version":2}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:aa0f6b89500f1bf6973102a8dc803580f1a214cabc1a091df3bd13130bd6a5b5","sha256:b810328ac24feb84e2a5fb6f13889cac8db0987841cc3e3a97b2f5398d6bdca4"],"state_sha256":"35e85c52ed3f90882e7897e476ce2253bab390421c89b1e41991249e044a922e"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"IDeY6go2ZKSTURl9wYsbbyP+kDuyCcW/jDJOt2Pj9PWBhE4z8Q+a0YjAqNZMPGCZIVx6mkXBTcEVhsxDHtBxCQ==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-08T21:23:19.223789Z","bundle_sha256":"1d6e89416616f29e3e6432f862ef5b89433194f4fdf214cf245de256cc7b93fe"}}