{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2018:E6IPE6Z22Y3TE4ONKN6PCS4DDF","short_pith_number":"pith:E6IPE6Z2","canonical_record":{"source":{"id":"1808.09397","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.IR","submitted_at":"2018-08-28T16:43:19Z","cross_cats_sorted":[],"title_canon_sha256":"a165b66298ea3e16fa3d82b0b6af0efc7cef96c959de4b28cf899caa6edad7fd","abstract_canon_sha256":"0e4657f6ce6bdd8114eb67adeed7726dd24fc5c978cd6ee0e449cf38ec420592"},"schema_version":"1.0"},"canonical_sha256":"2790f27b3ad6373271cd537cf14b831962909a8a3b4539f65e4db15b3048c21a","source":{"kind":"arxiv","id":"1808.09397","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1808.09397","created_at":"2026-05-18T00:07:01Z"},{"alias_kind":"arxiv_version","alias_value":"1808.09397v1","created_at":"2026-05-18T00:07:01Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1808.09397","created_at":"2026-05-18T00:07:01Z"},{"alias_kind":"pith_short_12","alias_value":"E6IPE6Z22Y3T","created_at":"2026-05-18T12:32:19Z"},{"alias_kind":"pith_short_16","alias_value":"E6IPE6Z22Y3TE4ON","created_at":"2026-05-18T12:32:19Z"},{"alias_kind":"pith_short_8","alias_value":"E6IPE6Z2","created_at":"2026-05-18T12:32:19Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2018:E6IPE6Z22Y3TE4ONKN6PCS4DDF","target":"record","payload":{"canonical_record":{"source":{"id":"1808.09397","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.IR","submitted_at":"2018-08-28T16:43:19Z","cross_cats_sorted":[],"title_canon_sha256":"a165b66298ea3e16fa3d82b0b6af0efc7cef96c959de4b28cf899caa6edad7fd","abstract_canon_sha256":"0e4657f6ce6bdd8114eb67adeed7726dd24fc5c978cd6ee0e449cf38ec420592"},"schema_version":"1.0"},"canonical_sha256":"2790f27b3ad6373271cd537cf14b831962909a8a3b4539f65e4db15b3048c21a","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:07:01.506581Z","signature_b64":"pYIDzic+HWZKjn03odd5kwNOJTdGBmVC6kobv/6pNW1h4Obhjdwt8PHvoby5LR0IIMkILlh7nRY1p806KwIBDg==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"2790f27b3ad6373271cd537cf14b831962909a8a3b4539f65e4db15b3048c21a","last_reissued_at":"2026-05-18T00:07:01.506075Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:07:01.506075Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1808.09397","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:07:01Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"jFzi+7PIJ5N/LiHtNYhrZUjviMvtAoZGFItITbjCCjFsLwYgn/ioVs2W/k3twYjgEbnCrx2V8nP8aFF5a7lYAg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-28T16:39:53.148297Z"},"content_sha256":"68f0f4992cb1ec7241ae62b162b2e8e904579bbb88a43ddc91fdfef8666fd9c9","schema_version":"1.0","event_id":"sha256:68f0f4992cb1ec7241ae62b162b2e8e904579bbb88a43ddc91fdfef8666fd9c9"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2018:E6IPE6Z22Y3TE4ONKN6PCS4DDF","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"MedSTS: A Resource for Clinical Semantic Textual Similarity","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.IR","authors_text":"Feichen Shen, Hongfang Liu, Liwei Wang, Majid Rastegar-Mojarad, Naveed Afzal, Sunyang Fu, Yanshan Wang","submitted_at":"2018-08-28T16:43:19Z","abstract_excerpt":"The wide adoption of electronic health records (EHRs) has enabled a wide range of applications leveraging EHR data. However, the meaningful use of EHR data largely depends on our ability to efficiently extract and consolidate information embedded in clinical text where natural language processing (NLP) techniques are essential. Semantic textual similarity (STS) that measures the semantic similarity between text snippets plays a significant role in many NLP applications. In the general NLP domain, STS shared tasks have made available a huge collection of text snippet pairs with manual annotatio"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1808.09397","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:07:01Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"Paq1wVLttjfwxTUFw2M4b+MuEJxFSGh0Rreqescpcwvem8qQ8rLXTP0Oi+si8eops4jQzlmBZK2lteUHzcx0Aw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-28T16:39:53.148954Z"},"content_sha256":"3df7f1add0b217b2a6e2fae24410698336f22b64bd5a26f0520764bb078e51b6","schema_version":"1.0","event_id":"sha256:3df7f1add0b217b2a6e2fae24410698336f22b64bd5a26f0520764bb078e51b6"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/E6IPE6Z22Y3TE4ONKN6PCS4DDF/bundle.json","state_url":"https://pith.science/pith/E6IPE6Z22Y3TE4ONKN6PCS4DDF/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/E6IPE6Z22Y3TE4ONKN6PCS4DDF/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-28T16:39:53Z","links":{"resolver":"https://pith.science/pith/E6IPE6Z22Y3TE4ONKN6PCS4DDF","bundle":"https://pith.science/pith/E6IPE6Z22Y3TE4ONKN6PCS4DDF/bundle.json","state":"https://pith.science/pith/E6IPE6Z22Y3TE4ONKN6PCS4DDF/state.json","well_known_bundle":"https://pith.science/.well-known/pith/E6IPE6Z22Y3TE4ONKN6PCS4DDF/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2018:E6IPE6Z22Y3TE4ONKN6PCS4DDF","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"0e4657f6ce6bdd8114eb67adeed7726dd24fc5c978cd6ee0e449cf38ec420592","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.IR","submitted_at":"2018-08-28T16:43:19Z","title_canon_sha256":"a165b66298ea3e16fa3d82b0b6af0efc7cef96c959de4b28cf899caa6edad7fd"},"schema_version":"1.0","source":{"id":"1808.09397","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1808.09397","created_at":"2026-05-18T00:07:01Z"},{"alias_kind":"arxiv_version","alias_value":"1808.09397v1","created_at":"2026-05-18T00:07:01Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1808.09397","created_at":"2026-05-18T00:07:01Z"},{"alias_kind":"pith_short_12","alias_value":"E6IPE6Z22Y3T","created_at":"2026-05-18T12:32:19Z"},{"alias_kind":"pith_short_16","alias_value":"E6IPE6Z22Y3TE4ON","created_at":"2026-05-18T12:32:19Z"},{"alias_kind":"pith_short_8","alias_value":"E6IPE6Z2","created_at":"2026-05-18T12:32:19Z"}],"graph_snapshots":[{"event_id":"sha256:3df7f1add0b217b2a6e2fae24410698336f22b64bd5a26f0520764bb078e51b6","target":"graph","created_at":"2026-05-18T00:07:01Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"The wide adoption of electronic health records (EHRs) has enabled a wide range of applications leveraging EHR data. However, the meaningful use of EHR data largely depends on our ability to efficiently extract and consolidate information embedded in clinical text where natural language processing (NLP) techniques are essential. Semantic textual similarity (STS) that measures the semantic similarity between text snippets plays a significant role in many NLP applications. In the general NLP domain, STS shared tasks have made available a huge collection of text snippet pairs with manual annotatio","authors_text":"Feichen Shen, Hongfang Liu, Liwei Wang, Majid Rastegar-Mojarad, Naveed Afzal, Sunyang Fu, Yanshan Wang","cross_cats":[],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.IR","submitted_at":"2018-08-28T16:43:19Z","title":"MedSTS: A Resource for Clinical Semantic Textual Similarity"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1808.09397","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:68f0f4992cb1ec7241ae62b162b2e8e904579bbb88a43ddc91fdfef8666fd9c9","target":"record","created_at":"2026-05-18T00:07:01Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"0e4657f6ce6bdd8114eb67adeed7726dd24fc5c978cd6ee0e449cf38ec420592","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.IR","submitted_at":"2018-08-28T16:43:19Z","title_canon_sha256":"a165b66298ea3e16fa3d82b0b6af0efc7cef96c959de4b28cf899caa6edad7fd"},"schema_version":"1.0","source":{"id":"1808.09397","kind":"arxiv","version":1}},"canonical_sha256":"2790f27b3ad6373271cd537cf14b831962909a8a3b4539f65e4db15b3048c21a","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"2790f27b3ad6373271cd537cf14b831962909a8a3b4539f65e4db15b3048c21a","first_computed_at":"2026-05-18T00:07:01.506075Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:07:01.506075Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"pYIDzic+HWZKjn03odd5kwNOJTdGBmVC6kobv/6pNW1h4Obhjdwt8PHvoby5LR0IIMkILlh7nRY1p806KwIBDg==","signature_status":"signed_v1","signed_at":"2026-05-18T00:07:01.506581Z","signed_message":"canonical_sha256_bytes"},"source_id":"1808.09397","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:68f0f4992cb1ec7241ae62b162b2e8e904579bbb88a43ddc91fdfef8666fd9c9","sha256:3df7f1add0b217b2a6e2fae24410698336f22b64bd5a26f0520764bb078e51b6"],"state_sha256":"8dd3cad4b6bdf7c8711470a979f37484d5517544adfd15a8f9d9c62aa75df9f6"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"utp8MQgZ403YWk5UHqi+Q6/HCHKSsM8GaWjgKKYFUnKdORcJTtU9AtFFHxYeivLCKvOQHQKBgDhh0INUeEIBCw==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-28T16:39:53.152432Z","bundle_sha256":"622406d94a6254e8724f94f36a301c4595ed297be9b8b46a2e05dae04c9f7422"}}