{"record_type":"pith_number_record","schema_url":"https://pith.science/schemas/pith-number/v1.json","pith_number":"pith:2020:2K3TRM62POZTRL3EJOBSIMEIVX","short_pith_number":"pith:2K3TRM62","schema_version":"1.0","canonical_sha256":"d2b738b3da7bb338af644b83243088adf73dc05afc98ebc63e9598b444c4bfeb","source":{"kind":"arxiv","id":"2012.04545","version":1},"attestation_state":"computed","paper":{"title":"Discovering key topics from short, real-world medical inquiries via natural language processing and unsupervised learning","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":["cs.CL","cs.IR"],"primary_cat":"cs.LG","authors_text":"Andreas Mattern, Angelo Ziletti, Christoph Berns, David Ruau, Jagatheswari Virayah, Jennifer Liang, Marion Schwaerzler, Oliver Treichel, Stephanie Kammerath, Thomas Weber, Xin Ma","submitted_at":"2020-12-08T16:37:34Z","abstract_excerpt":"Millions of unsolicited medical inquiries are received by pharmaceutical companies every year. It has been hypothesized that these inquiries represent a treasure trove of information, potentially giving insight into matters regarding medicinal products and the associated medical treatments. However, due to the large volume and specialized nature of the inquiries, it is difficult to perform timely, recurrent, and comprehensive analyses. Here, we propose a machine learning approach based on natural language processing and unsupervised learning to automatically discover key topics in real-world m"},"verification_status":{"content_addressed":true,"pith_receipt":true,"author_attested":false,"weak_author_claims":0,"strong_author_claims":0,"externally_anchored":false,"storage_verified":false,"citation_signatures":0,"replication_records":0,"graph_snapshot":true,"references_resolved":false,"formal_links_present":false},"canonical_record":{"source":{"id":"2012.04545","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2020-12-08T16:37:34Z","cross_cats_sorted":["cs.CL","cs.IR"],"title_canon_sha256":"7eb2479afbc5e23415176d7a9f74ef68420cce9efc6f3980551082d5c9197dae","abstract_canon_sha256":"b1fddbfa0b5d6e84096bc468614b697577bd173396de19eba6a8de327a7f6536"},"schema_version":"1.0"},"receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-07-05T03:26:14.473190Z","signature_b64":"Qp0XFoZ03OFRB9mjbPvsWBk7yK7wpYTGu/pavk9B7CTLRlzbMGfrC7Te8IgyJVG6CaNergCzuJ4EaqV1U7+rDg==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"d2b738b3da7bb338af644b83243088adf73dc05afc98ebc63e9598b444c4bfeb","last_reissued_at":"2026-07-05T03:26:14.472709Z","signature_status":"signed_v1","first_computed_at":"2026-07-05T03:26:14.472709Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"graph_snapshot":{"paper":{"title":"Discovering key topics from short, real-world medical inquiries via natural language processing and unsupervised learning","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":["cs.CL","cs.IR"],"primary_cat":"cs.LG","authors_text":"Andreas Mattern, Angelo Ziletti, Christoph Berns, David Ruau, Jagatheswari Virayah, Jennifer Liang, Marion Schwaerzler, Oliver Treichel, Stephanie Kammerath, Thomas Weber, Xin Ma","submitted_at":"2020-12-08T16:37:34Z","abstract_excerpt":"Millions of unsolicited medical inquiries are received by pharmaceutical companies every year. It has been hypothesized that these inquiries represent a treasure trove of information, potentially giving insight into matters regarding medicinal products and the associated medical treatments. However, due to the large volume and specialized nature of the inquiries, it is difficult to perform timely, recurrent, and comprehensive analyses. Here, we propose a machine learning approach based on natural language processing and unsupervised learning to automatically discover key topics in real-world m"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2012.04545","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2012.04545/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"aliases":[{"alias_kind":"arxiv","alias_value":"2012.04545","created_at":"2026-07-05T03:26:14.472768+00:00"},{"alias_kind":"arxiv_version","alias_value":"2012.04545v1","created_at":"2026-07-05T03:26:14.472768+00:00"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2012.04545","created_at":"2026-07-05T03:26:14.472768+00:00"},{"alias_kind":"pith_short_12","alias_value":"2K3TRM62POZT","created_at":"2026-07-05T03:26:14.472768+00:00"},{"alias_kind":"pith_short_16","alias_value":"2K3TRM62POZTRL3E","created_at":"2026-07-05T03:26:14.472768+00:00"},{"alias_kind":"pith_short_8","alias_value":"2K3TRM62","created_at":"2026-07-05T03:26:14.472768+00:00"}],"events":[],"event_summary":{},"paper_claims":[],"inbound_citations":{"count":0,"internal_anchor_count":0,"sample":[]},"formal_canon":{"evidence_count":0,"sample":[],"anchors":[]},"links":{"html":"https://pith.science/pith/2K3TRM62POZTRL3EJOBSIMEIVX","json":"https://pith.science/pith/2K3TRM62POZTRL3EJOBSIMEIVX.json","graph_json":"https://pith.science/api/pith-number/2K3TRM62POZTRL3EJOBSIMEIVX/graph.json","events_json":"https://pith.science/api/pith-number/2K3TRM62POZTRL3EJOBSIMEIVX/events.json","paper":"https://pith.science/paper/2K3TRM62"},"agent_actions":{"view_html":"https://pith.science/pith/2K3TRM62POZTRL3EJOBSIMEIVX","download_json":"https://pith.science/pith/2K3TRM62POZTRL3EJOBSIMEIVX.json","view_paper":"https://pith.science/paper/2K3TRM62","resolve_alias":"https://pith.science/api/pith-number/resolve?arxiv=2012.04545&json=true","fetch_graph":"https://pith.science/api/pith-number/2K3TRM62POZTRL3EJOBSIMEIVX/graph.json","fetch_events":"https://pith.science/api/pith-number/2K3TRM62POZTRL3EJOBSIMEIVX/events.json","actions":{"anchor_timestamp":"https://pith.science/pith/2K3TRM62POZTRL3EJOBSIMEIVX/action/timestamp_anchor","attest_storage":"https://pith.science/pith/2K3TRM62POZTRL3EJOBSIMEIVX/action/storage_attestation","attest_author":"https://pith.science/pith/2K3TRM62POZTRL3EJOBSIMEIVX/action/author_attestation","sign_citation":"https://pith.science/pith/2K3TRM62POZTRL3EJOBSIMEIVX/action/citation_signature","submit_replication":"https://pith.science/pith/2K3TRM62POZTRL3EJOBSIMEIVX/action/replication_record"}},"created_at":"2026-07-05T03:26:14.472768+00:00","updated_at":"2026-07-05T03:26:14.472768+00:00"}