{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2019:2BFLNK5RFPWSHEQPMSZILMYUZB","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"ecec3f0f8a4b0bd5ca86a46468b070d477a1f5530221dae81d1d7e6cf75a2d2c","cross_cats_sorted":["cs.CL","stat.AP","stat.ML"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2019-04-29T22:15:22Z","title_canon_sha256":"835ffc4a9f8dc5d510544277a9c1de4679a197b9513311619f1cfca28ddb2c79"},"schema_version":"1.0","source":{"id":"1904.12973","kind":"arxiv","version":2}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1904.12973","created_at":"2026-05-17T23:47:06Z"},{"alias_kind":"arxiv_version","alias_value":"1904.12973v2","created_at":"2026-05-17T23:47:06Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1904.12973","created_at":"2026-05-17T23:47:06Z"},{"alias_kind":"pith_short_12","alias_value":"2BFLNK5RFPWS","created_at":"2026-05-18T12:33:07Z"},{"alias_kind":"pith_short_16","alias_value":"2BFLNK5RFPWSHEQP","created_at":"2026-05-18T12:33:07Z"},{"alias_kind":"pith_short_8","alias_value":"2BFLNK5R","created_at":"2026-05-18T12:33:07Z"}],"graph_snapshots":[{"event_id":"sha256:899f940f6449b2ac79b6ee9778d8a059e324abd2d35c627f13a827052b93fb15","target":"graph","created_at":"2026-05-17T23:47:06Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"The recent adoption of Electronic Health Records (EHRs) by health care providers has introduced an important source of data that provides detailed and highly specific insights into patient phenotypes over large cohorts. These datasets, in combination with machine learning and statistical approaches, generate new opportunities for research and clinical care. However, many methods require the patient representations to be in structured formats, while the information in the EHR is often locked in unstructured texts designed for human readability. In this work, we develop the methodology to automa","authors_text":"Andreas Wicki, Fernando Perez Cruz, Gunnar R\\\"atsch, Julia E. Vogt, Kjong Lehmann, Melanie F. Pradier, Stefan G. Stark, Stephanie L. Hyland","cross_cats":["cs.CL","stat.AP","stat.ML"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2019-04-29T22:15:22Z","title":"Unsupervised Extraction of Phenotypes from Cancer Clinical Notes for Association Studies"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1904.12973","kind":"arxiv","version":2},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:371529c318b6457644b9d7de3e4dae1f826aaa7d4e7c0e83982eab9a16b7bde4","target":"record","created_at":"2026-05-17T23:47:06Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"ecec3f0f8a4b0bd5ca86a46468b070d477a1f5530221dae81d1d7e6cf75a2d2c","cross_cats_sorted":["cs.CL","stat.AP","stat.ML"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2019-04-29T22:15:22Z","title_canon_sha256":"835ffc4a9f8dc5d510544277a9c1de4679a197b9513311619f1cfca28ddb2c79"},"schema_version":"1.0","source":{"id":"1904.12973","kind":"arxiv","version":2}},"canonical_sha256":"d04ab6abb12bed23920f64b285b314c8751ba7970b3aeb249aacc67e4c670059","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"d04ab6abb12bed23920f64b285b314c8751ba7970b3aeb249aacc67e4c670059","first_computed_at":"2026-05-17T23:47:06.924154Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-17T23:47:06.924154Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"nQmKuc1eUPx3wlwDMnT+18FSjKIUHNroXAN32vwGipdzy7At2dbZvPxaK8NN3UqgZHA+o2nbOE04iOvpK07OBg==","signature_status":"signed_v1","signed_at":"2026-05-17T23:47:06.924734Z","signed_message":"canonical_sha256_bytes"},"source_id":"1904.12973","source_kind":"arxiv","source_version":2}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:371529c318b6457644b9d7de3e4dae1f826aaa7d4e7c0e83982eab9a16b7bde4","sha256:899f940f6449b2ac79b6ee9778d8a059e324abd2d35c627f13a827052b93fb15"],"state_sha256":"705c5ddff576cd7f53100c2e390e1fef42e61fe8fdec066c5041e0e86f76e88f"}