{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:HGIVJKTWIJ3CK4OF2EE7WMOIBG","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"99db161044d609542d3abf9025b4d982c36a6e76e98886b25e610c828b27969b","cross_cats_sorted":["cs.AI"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2026-01-14T20:23:02Z","title_canon_sha256":"bef7540f3030555cd491355b190137ad4c93bfdd98724bb6e8f23473aa99b5f6"},"schema_version":"1.0","source":{"id":"2601.09853","kind":"arxiv","version":3}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2601.09853","created_at":"2026-06-04T01:08:39Z"},{"alias_kind":"arxiv_version","alias_value":"2601.09853v3","created_at":"2026-06-04T01:08:39Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2601.09853","created_at":"2026-06-04T01:08:39Z"},{"alias_kind":"pith_short_12","alias_value":"HGIVJKTWIJ3C","created_at":"2026-06-04T01:08:39Z"},{"alias_kind":"pith_short_16","alias_value":"HGIVJKTWIJ3CK4OF","created_at":"2026-06-04T01:08:39Z"},{"alias_kind":"pith_short_8","alias_value":"HGIVJKTW","created_at":"2026-06-04T01:08:39Z"}],"graph_snapshots":[{"event_id":"sha256:6750f3354cad77c0dc5db30bfaa66a9edcd103d9c1bfc015803764bee6d971b1","target":"graph","created_at":"2026-06-04T01:08:39Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":4,"items":[{"attestation":"unclaimed","claim_id":"C1","kind":"strongest_claim","source":"verdict.strongest_claim","status":"machine_extracted","text":"Our analysis reveals that LLMs often fail to redirect problematic questions, even when the problematic premise is detected, and provide answers that could lead to suboptimal medical decision making."},{"attestation":"unclaimed","claim_id":"C2","kind":"weakest_assumption","source":"verdict.weakest_assumption","status":"machine_extracted","text":"The semi-automated pipeline accurately identifies real-world health questions that require redirection due to embedded false premises, and clinician responses provide the appropriate benchmark."},{"attestation":"unclaimed","claim_id":"C3","kind":"one_line_summary","source":"verdict.one_line_summary","status":"machine_extracted","text":"LLMs often fail to redirect health questions containing misconceptions, unlike clinicians, exposing safety gaps in patient-facing medical AI."},{"attestation":"unclaimed","claim_id":"C4","kind":"headline","source":"verdict.pith_extraction.headline","status":"machine_extracted","text":"LLMs often accept false premises in real health questions instead of redirecting to correct the misconception."}],"snapshot_sha256":"203fb0db009f8ec91c3638b3ea6591c76f7946a528bb5750f164341bf91ecbe8"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2601.09853/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Real-world health questions from patients often unintentionally embed false assumptions or premises. In such cases, safe medical communication typically involves redirection: addressing the implicit misconception and then responding to the underlying patient context, rather than the original question. While large language models (LLMs) are increasingly being used by lay users for medical advice, they have not yet been tested for this crucial competency. Therefore, in this work, we investigate how LLMs react to false premises embedded within real-world health questions. We develop a semi-automa","authors_text":"Ayman Ali, Lionel Wong, Monica Agrawal, Sraavya Sambara, Vishala Mishra, Yuan Pu","cross_cats":["cs.AI"],"headline":"LLMs often accept false premises in real health questions instead of redirecting to correct the misconception.","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2026-01-14T20:23:02Z","title":"MedRedFlag: Investigating how LLMs Redirect Misconceptions in Real-World Health Communication"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2601.09853","kind":"arxiv","version":3},"verdict":{"created_at":"2026-05-16T14:08:12.238173Z","id":"8d41c629-a507-4810-ada0-3052f19d289e","model_set":{"reader":"grok-4.3"},"one_line_summary":"LLMs often fail to redirect health questions containing misconceptions, unlike clinicians, exposing safety gaps in patient-facing medical AI.","pipeline_version":"pith-pipeline@v0.9.0","pith_extraction_headline":"LLMs often accept false premises in real health questions instead of redirecting to correct the misconception.","strongest_claim":"Our analysis reveals that LLMs often fail to redirect problematic questions, even when the problematic premise is detected, and provide answers that could lead to suboptimal medical decision making.","weakest_assumption":"The semi-automated pipeline accurately identifies real-world health questions that require redirection due to embedded false premises, and clinician responses provide the appropriate benchmark."}},"verdict_id":"8d41c629-a507-4810-ada0-3052f19d289e"}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:fdac162e3babc8e55bbba27854461508e4e17b134bb7b5bbe344fbcaecdebf63","target":"record","created_at":"2026-06-04T01:08:39Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"99db161044d609542d3abf9025b4d982c36a6e76e98886b25e610c828b27969b","cross_cats_sorted":["cs.AI"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2026-01-14T20:23:02Z","title_canon_sha256":"bef7540f3030555cd491355b190137ad4c93bfdd98724bb6e8f23473aa99b5f6"},"schema_version":"1.0","source":{"id":"2601.09853","kind":"arxiv","version":3}},"canonical_sha256":"399154aa7642762571c5d109fb31c809bf91bb7889328c45630a561817deadc6","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"399154aa7642762571c5d109fb31c809bf91bb7889328c45630a561817deadc6","first_computed_at":"2026-06-04T01:08:39.847334Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-06-04T01:08:39.847334Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"pC9WUw5C02b2meTu0jDXlb00hiWYSIPHGAFetQaIGKIl5/pDdseEZCjDXrPMtnYlv2hYYRzcJAiAMzS3OtoXBg==","signature_status":"signed_v1","signed_at":"2026-06-04T01:08:39.848010Z","signed_message":"canonical_sha256_bytes"},"source_id":"2601.09853","source_kind":"arxiv","source_version":3}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:fdac162e3babc8e55bbba27854461508e4e17b134bb7b5bbe344fbcaecdebf63","sha256:6750f3354cad77c0dc5db30bfaa66a9edcd103d9c1bfc015803764bee6d971b1"],"state_sha256":"f33bd261c3d9788bb2d3e94e430771697c9523a612695080c1689ae6659c9bdd"}