{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:RNKXLNDJ2QDKTSDATG4OXGQADK","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"c6d9e7e83fdcada655b8c37716b8a9ee5232d129d28c8bbb00fe95ea4891bc80","cross_cats_sorted":["cs.AI","cs.IR","cs.LG"],"license":"http://creativecommons.org/licenses/by-nc-nd/4.0/","primary_cat":"cs.CL","submitted_at":"2026-05-13T10:06:38Z","title_canon_sha256":"9897394a88de9f227fdf8de1a9f4fe89e4f681206ce22204e0a58a01c6eadc41"},"schema_version":"1.0","source":{"id":"2605.13292","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2605.13292","created_at":"2026-05-18T02:44:49Z"},{"alias_kind":"arxiv_version","alias_value":"2605.13292v1","created_at":"2026-05-18T02:44:49Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.13292","created_at":"2026-05-18T02:44:49Z"},{"alias_kind":"pith_short_12","alias_value":"RNKXLNDJ2QDK","created_at":"2026-05-18T12:33:37Z"},{"alias_kind":"pith_short_16","alias_value":"RNKXLNDJ2QDKTSDA","created_at":"2026-05-18T12:33:37Z"},{"alias_kind":"pith_short_8","alias_value":"RNKXLNDJ","created_at":"2026-05-18T12:33:37Z"}],"graph_snapshots":[{"event_id":"sha256:1bdef930807cd6df2c71a2869f86fc71096cc6e7774f9100e2b426a71b1f0fd1","target":"graph","created_at":"2026-05-18T02:44:49Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":4,"items":[{"attestation":"unclaimed","claim_id":"C1","kind":"strongest_claim","source":"verdict.strongest_claim","status":"machine_extracted","text":"We introduce IndicMedDialog, a parallel multi-turn medical dialogue dataset spanning English and nine Indic languages... Building on this dataset, we fine-tune IndicMedLM via parameter-efficient adaptation... and validate clinical plausibility through medical expert evaluation."},{"attestation":"unclaimed","claim_id":"C2","kind":"weakest_assumption","source":"verdict.weakest_assumption","status":"machine_extracted","text":"The assumption that LLM-generated synthetic consultations, after translation with TranslateGemma and native-speaker verification, produce clinically plausible multi-turn dialogues that faithfully represent real patient-provider interactions without introducing systematic biases or factual errors."},{"attestation":"unclaimed","claim_id":"C3","kind":"one_line_summary","source":"verdict.one_line_summary","status":"machine_extracted","text":"A parallel multi-turn medical dialogue dataset spanning English and nine Indic languages is created from synthetic consultations to enable personalized AI healthcare interactions."},{"attestation":"unclaimed","claim_id":"C4","kind":"headline","source":"verdict.pith_extraction.headline","status":"machine_extracted","text":"IndicMedDialog supplies parallel multi-turn medical dialogues in English and nine Indic languages to support personalized symptom-elicitation models."}],"snapshot_sha256":"782364865667287f6575d7c7b5c4a4ed4cc3a79475bd78f0b6f278996fb065a6"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Most existing medical dialogue systems operate in a single-turn question--answering paradigm or rely on template-based datasets, limiting conversational realism and multilingual applicability. We introduce IndicMedDialog, a parallel multi-turn medical dialogue dataset spanning English and nine Indic languages: Assamese, Bengali, Gujarati, Hindi, Marathi, Punjabi, Tamil, Telugu, and Urdu. The dataset extends MDDial with LLM-generated synthetic consultations, translated using TranslateGemma, verified by native speakers, and refined through a script-aware post-processing pipeline to correct phone","authors_text":"Piyush Patel, Shubham Kumar Nigam, Suparnojit Sarkar","cross_cats":["cs.AI","cs.IR","cs.LG"],"headline":"IndicMedDialog supplies parallel multi-turn medical dialogues in English and nine Indic languages to support personalized symptom-elicitation models.","license":"http://creativecommons.org/licenses/by-nc-nd/4.0/","primary_cat":"cs.CL","submitted_at":"2026-05-13T10:06:38Z","title":"IndicMedDialog: A Parallel Multi-Turn Medical Dialogue Dataset for Accessible Healthcare in Indic Languages"},"references":{"count":44,"internal_anchors":8,"resolved_work":44,"sample":[{"cited_arxiv_id":"","doi":"","is_internal_anchor":false,"ref_index":1,"title":"Findings of the Association for Computational Linguistics: EMNLP 2024 , pages=","work_id":"20248839-bcd4-47c1-bec1-a4a048743cf8","year":2024},{"cited_arxiv_id":"","doi":"","is_internal_anchor":false,"ref_index":2,"title":"arXiv preprint arXiv:2308.08147 , year=","work_id":"cc378513-cbea-4d77-8737-597402d227ce","year":null},{"cited_arxiv_id":"2505.19630","doi":"","is_internal_anchor":true,"ref_index":3,"title":"Real-World Doctor Agent with Proactive Consultation through Multi-Agent Reinforcement Learning","work_id":"23afdfee-e306-49ad-873c-211334e6416a","year":null},{"cited_arxiv_id":"","doi":"","is_internal_anchor":false,"ref_index":4,"title":"Proceedings of the 2020 conference on empirical methods in natural language processing (EMNLP) , pages=","work_id":"f57864c4-6d2e-4692-bcc8-acc5c2dc05a9","year":2020},{"cited_arxiv_id":"","doi":"","is_internal_anchor":false,"ref_index":5,"title":"CCF International Conference on Natural Language Processing and Chinese Computing , pages=","work_id":"a3400c06-5077-4dc9-a9d2-7963397047d3","year":2022}],"snapshot_sha256":"59dd021b8dc861fa880a303af8b43d9520994cf63000366f80260b49f29fa6fe"},"source":{"id":"2605.13292","kind":"arxiv","version":1},"verdict":{"created_at":"2026-05-14T19:00:32.441240Z","id":"8522d356-9916-4dee-bb05-193e227de195","model_set":{"reader":"grok-4.3"},"one_line_summary":"A parallel multi-turn medical dialogue dataset spanning English and nine Indic languages is created from synthetic consultations to enable personalized AI healthcare interactions.","pipeline_version":"pith-pipeline@v0.9.0","pith_extraction_headline":"IndicMedDialog supplies parallel multi-turn medical dialogues in English and nine Indic languages to support personalized symptom-elicitation models.","strongest_claim":"We introduce IndicMedDialog, a parallel multi-turn medical dialogue dataset spanning English and nine Indic languages... Building on this dataset, we fine-tune IndicMedLM via parameter-efficient adaptation... and validate clinical plausibility through medical expert evaluation.","weakest_assumption":"The assumption that LLM-generated synthetic consultations, after translation with TranslateGemma and native-speaker verification, produce clinically plausible multi-turn dialogues that faithfully represent real patient-provider interactions without introducing systematic biases or factual errors."}},"verdict_id":"8522d356-9916-4dee-bb05-193e227de195"}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:87a01f85388d3f4691cd3c3bba50d0cdffd9d4cd0f7d8e773bde49dbe909de80","target":"record","created_at":"2026-05-18T02:44:49Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"c6d9e7e83fdcada655b8c37716b8a9ee5232d129d28c8bbb00fe95ea4891bc80","cross_cats_sorted":["cs.AI","cs.IR","cs.LG"],"license":"http://creativecommons.org/licenses/by-nc-nd/4.0/","primary_cat":"cs.CL","submitted_at":"2026-05-13T10:06:38Z","title_canon_sha256":"9897394a88de9f227fdf8de1a9f4fe89e4f681206ce22204e0a58a01c6eadc41"},"schema_version":"1.0","source":{"id":"2605.13292","kind":"arxiv","version":1}},"canonical_sha256":"8b5575b469d406a9c86099b8eb9a001a98f95bafcb88901c0008de9639d7f4d2","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"8b5575b469d406a9c86099b8eb9a001a98f95bafcb88901c0008de9639d7f4d2","first_computed_at":"2026-05-18T02:44:49.111874Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T02:44:49.111874Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"IjLtIjH7QTbfbN6MxFvlqBzGTQ2iSvBc2I4MK3tAp9kRNgf6U5fl9DsLkauQ7tFW1H0/9Qsj+nmQc866fKg6DQ==","signature_status":"signed_v1","signed_at":"2026-05-18T02:44:49.112362Z","signed_message":"canonical_sha256_bytes"},"source_id":"2605.13292","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:87a01f85388d3f4691cd3c3bba50d0cdffd9d4cd0f7d8e773bde49dbe909de80","sha256:1bdef930807cd6df2c71a2869f86fc71096cc6e7774f9100e2b426a71b1f0fd1"],"state_sha256":"c993ac459756818e82d71e252bac6b2df79682a2b9fa93c4d18816fbb563e4a5"}