{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2020:XDXLGQ6G2FTU5F7BGE5CR4625Z","short_pith_number":"pith:XDXLGQ6G","canonical_record":{"source":{"id":"2005.06624","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2020-05-08T14:04:18Z","cross_cats_sorted":["cs.LG"],"title_canon_sha256":"4cea616f3297459cc26187ca2f613753ad2bf6e94b21948f911b088f935b9e07","abstract_canon_sha256":"09fbc370ad920e35d6da31ea847605dc428aec02d2ac67cad0128faee3510ee5"},"schema_version":"1.0"},"canonical_sha256":"b8eeb343c6d1674e97e1313a28f3daee6e929474af8efb721299732fbffa3010","source":{"kind":"arxiv","id":"2005.06624","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2005.06624","created_at":"2026-07-05T01:02:48Z"},{"alias_kind":"arxiv_version","alias_value":"2005.06624v1","created_at":"2026-07-05T01:02:48Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2005.06624","created_at":"2026-07-05T01:02:48Z"},{"alias_kind":"pith_short_12","alias_value":"XDXLGQ6G2FTU","created_at":"2026-07-05T01:02:48Z"},{"alias_kind":"pith_short_16","alias_value":"XDXLGQ6G2FTU5F7B","created_at":"2026-07-05T01:02:48Z"},{"alias_kind":"pith_short_8","alias_value":"XDXLGQ6G","created_at":"2026-07-05T01:02:48Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2020:XDXLGQ6G2FTU5F7BGE5CR4625Z","target":"record","payload":{"canonical_record":{"source":{"id":"2005.06624","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2020-05-08T14:04:18Z","cross_cats_sorted":["cs.LG"],"title_canon_sha256":"4cea616f3297459cc26187ca2f613753ad2bf6e94b21948f911b088f935b9e07","abstract_canon_sha256":"09fbc370ad920e35d6da31ea847605dc428aec02d2ac67cad0128faee3510ee5"},"schema_version":"1.0"},"canonical_sha256":"b8eeb343c6d1674e97e1313a28f3daee6e929474af8efb721299732fbffa3010","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-07-05T01:02:48.829351Z","signature_b64":"O91iuXjqSsvyTf3W772PjRn37XS6mC2eJ5vr6ataRoPInry5PESNiQXYbc+wAxYC+o+JwmjbIJ+qQLF4GJwJDw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"b8eeb343c6d1674e97e1313a28f3daee6e929474af8efb721299732fbffa3010","last_reissued_at":"2026-07-05T01:02:48.828902Z","signature_status":"signed_v1","first_computed_at":"2026-07-05T01:02:48.828902Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2005.06624","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-07-05T01:02:48Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"aLaIc5VvR+6XuswIX45aLTQibMejDxG+E4XYNYeweFPMddR/xXwF84KT7n6moa71gVtg0UjNWx3uYIFZyK0oAw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-07-05T12:22:30.270550Z"},"content_sha256":"7cc9608365e621364834cc4c2368a0caaafe1eaaa984e87bcb4fc6b0f8e4d32a","schema_version":"1.0","event_id":"sha256:7cc9608365e621364834cc4c2368a0caaafe1eaaa984e87bcb4fc6b0f8e4d32a"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2020:XDXLGQ6G2FTU5F7BGE5CR4625Z","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Comparative Analysis of Text Classification Approaches in Electronic Health Records","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.LG"],"primary_cat":"cs.CL","authors_text":"Angus Roberts, Aurelie Mascio, Daniel Bean, Rebecca Bendayan, Richard Dobson, Robert Stewart, Zeljko Kraljevic","submitted_at":"2020-05-08T14:04:18Z","abstract_excerpt":"Text classification tasks which aim at harvesting and/or organizing information from electronic health records are pivotal to support clinical and translational research. However these present specific challenges compared to other classification tasks, notably due to the particular nature of the medical lexicon and language used in clinical records. Recent advances in embedding methods have shown promising results for several clinical tasks, yet there is no exhaustive comparison of such approaches with other commonly used word representations and classification models. In this work, we analyse"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2005.06624","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2005.06624/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-07-05T01:02:48Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"ZCZfidijVD0FPDyWWkMM7jS6uUk/oEUaidXBlICHa5hnEbvxa2sNTaMuGdxuEBHi1BPClV3ukbgGefTgJ99nBQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-07-05T12:22:30.270927Z"},"content_sha256":"94fd0a3d0303f275ce8003f5001ccd4e185dced6a8345c9f37e689a708bdad54","schema_version":"1.0","event_id":"sha256:94fd0a3d0303f275ce8003f5001ccd4e185dced6a8345c9f37e689a708bdad54"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/XDXLGQ6G2FTU5F7BGE5CR4625Z/bundle.json","state_url":"https://pith.science/pith/XDXLGQ6G2FTU5F7BGE5CR4625Z/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/XDXLGQ6G2FTU5F7BGE5CR4625Z/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-07-05T12:22:30Z","links":{"resolver":"https://pith.science/pith/XDXLGQ6G2FTU5F7BGE5CR4625Z","bundle":"https://pith.science/pith/XDXLGQ6G2FTU5F7BGE5CR4625Z/bundle.json","state":"https://pith.science/pith/XDXLGQ6G2FTU5F7BGE5CR4625Z/state.json","well_known_bundle":"https://pith.science/.well-known/pith/XDXLGQ6G2FTU5F7BGE5CR4625Z/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2020:XDXLGQ6G2FTU5F7BGE5CR4625Z","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"09fbc370ad920e35d6da31ea847605dc428aec02d2ac67cad0128faee3510ee5","cross_cats_sorted":["cs.LG"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2020-05-08T14:04:18Z","title_canon_sha256":"4cea616f3297459cc26187ca2f613753ad2bf6e94b21948f911b088f935b9e07"},"schema_version":"1.0","source":{"id":"2005.06624","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2005.06624","created_at":"2026-07-05T01:02:48Z"},{"alias_kind":"arxiv_version","alias_value":"2005.06624v1","created_at":"2026-07-05T01:02:48Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2005.06624","created_at":"2026-07-05T01:02:48Z"},{"alias_kind":"pith_short_12","alias_value":"XDXLGQ6G2FTU","created_at":"2026-07-05T01:02:48Z"},{"alias_kind":"pith_short_16","alias_value":"XDXLGQ6G2FTU5F7B","created_at":"2026-07-05T01:02:48Z"},{"alias_kind":"pith_short_8","alias_value":"XDXLGQ6G","created_at":"2026-07-05T01:02:48Z"}],"graph_snapshots":[{"event_id":"sha256:94fd0a3d0303f275ce8003f5001ccd4e185dced6a8345c9f37e689a708bdad54","target":"graph","created_at":"2026-07-05T01:02:48Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2005.06624/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Text classification tasks which aim at harvesting and/or organizing information from electronic health records are pivotal to support clinical and translational research. However these present specific challenges compared to other classification tasks, notably due to the particular nature of the medical lexicon and language used in clinical records. Recent advances in embedding methods have shown promising results for several clinical tasks, yet there is no exhaustive comparison of such approaches with other commonly used word representations and classification models. In this work, we analyse","authors_text":"Angus Roberts, Aurelie Mascio, Daniel Bean, Rebecca Bendayan, Richard Dobson, Robert Stewart, Zeljko Kraljevic","cross_cats":["cs.LG"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2020-05-08T14:04:18Z","title":"Comparative Analysis of Text Classification Approaches in Electronic Health Records"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2005.06624","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:7cc9608365e621364834cc4c2368a0caaafe1eaaa984e87bcb4fc6b0f8e4d32a","target":"record","created_at":"2026-07-05T01:02:48Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"09fbc370ad920e35d6da31ea847605dc428aec02d2ac67cad0128faee3510ee5","cross_cats_sorted":["cs.LG"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2020-05-08T14:04:18Z","title_canon_sha256":"4cea616f3297459cc26187ca2f613753ad2bf6e94b21948f911b088f935b9e07"},"schema_version":"1.0","source":{"id":"2005.06624","kind":"arxiv","version":1}},"canonical_sha256":"b8eeb343c6d1674e97e1313a28f3daee6e929474af8efb721299732fbffa3010","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"b8eeb343c6d1674e97e1313a28f3daee6e929474af8efb721299732fbffa3010","first_computed_at":"2026-07-05T01:02:48.828902Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-07-05T01:02:48.828902Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"O91iuXjqSsvyTf3W772PjRn37XS6mC2eJ5vr6ataRoPInry5PESNiQXYbc+wAxYC+o+JwmjbIJ+qQLF4GJwJDw==","signature_status":"signed_v1","signed_at":"2026-07-05T01:02:48.829351Z","signed_message":"canonical_sha256_bytes"},"source_id":"2005.06624","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:7cc9608365e621364834cc4c2368a0caaafe1eaaa984e87bcb4fc6b0f8e4d32a","sha256:94fd0a3d0303f275ce8003f5001ccd4e185dced6a8345c9f37e689a708bdad54"],"state_sha256":"f6c504b153830177300bf4300422a79e21788c11bb16054f2569bdb9aab0f492"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"CIP0VwO6LwDdYykUiSJOpXMn1aHy8qN3NMAY9bjdlcXamt/nWPXMk0HDI3zVKYGcbY/wkaK+AGa9xDLSr4qyAg==","signed_message":"bundle_sha256_bytes","signed_at":"2026-07-05T12:22:30.272850Z","bundle_sha256":"01968143e565e9d2a2d2e9071518566d99019a3d2dd729483135cec51f159ae7"}}