{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2018:KZA5Y7NUWG5HG3PDZ5DKPPO7KY","short_pith_number":"pith:KZA5Y7NU","canonical_record":{"source":{"id":"1811.09417","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2018-11-23T10:20:02Z","cross_cats_sorted":[],"title_canon_sha256":"411b720ba67b0889bb4aafacd746bff92d609c15f42ec5c3bd547eb1e86e567f","abstract_canon_sha256":"33f83cd24c7c7d808d13bbc896dc02d023d7aaebb81369bf50b1dd34d54b32b4"},"schema_version":"1.0"},"canonical_sha256":"5641dc7db4b1ba736de3cf46a7bddf560e630be289735ff39650d234a00b9f9d","source":{"kind":"arxiv","id":"1811.09417","version":2},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1811.09417","created_at":"2026-05-17T23:59:37Z"},{"alias_kind":"arxiv_version","alias_value":"1811.09417v2","created_at":"2026-05-17T23:59:37Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1811.09417","created_at":"2026-05-17T23:59:37Z"},{"alias_kind":"pith_short_12","alias_value":"KZA5Y7NUWG5H","created_at":"2026-05-18T12:32:33Z"},{"alias_kind":"pith_short_16","alias_value":"KZA5Y7NUWG5HG3PD","created_at":"2026-05-18T12:32:33Z"},{"alias_kind":"pith_short_8","alias_value":"KZA5Y7NU","created_at":"2026-05-18T12:32:33Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2018:KZA5Y7NUWG5HG3PDZ5DKPPO7KY","target":"record","payload":{"canonical_record":{"source":{"id":"1811.09417","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2018-11-23T10:20:02Z","cross_cats_sorted":[],"title_canon_sha256":"411b720ba67b0889bb4aafacd746bff92d609c15f42ec5c3bd547eb1e86e567f","abstract_canon_sha256":"33f83cd24c7c7d808d13bbc896dc02d023d7aaebb81369bf50b1dd34d54b32b4"},"schema_version":"1.0"},"canonical_sha256":"5641dc7db4b1ba736de3cf46a7bddf560e630be289735ff39650d234a00b9f9d","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-17T23:59:37.900997Z","signature_b64":"Wh/+PTNvWZrQFyqbnZQQ/STyjpkgS7HooS92OA29xLxLUXDvjuec178sDB+V4G0EQFnd3kw8+frTJ3q68GMcAw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"5641dc7db4b1ba736de3cf46a7bddf560e630be289735ff39650d234a00b9f9d","last_reissued_at":"2026-05-17T23:59:37.900394Z","signature_status":"signed_v1","first_computed_at":"2026-05-17T23:59:37.900394Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1811.09417","source_version":2,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-17T23:59:37Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"EhL8Y5sg11Bym45ljdyIcKVo3eS7MlngWAGXAI31P7g7glEo2ohtggONODlm78PBv+Wqbyh4EGUOx5mgIohJBw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-05T02:33:47.384047Z"},"content_sha256":"3b0bb4e4158ae75e74a81e61c23126c029545b0758530dda7edba177139f3851","schema_version":"1.0","event_id":"sha256:3b0bb4e4158ae75e74a81e61c23126c029545b0758530dda7edba177139f3851"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2018:KZA5Y7NUWG5HG3PDZ5DKPPO7KY","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Natural language understanding for task oriented dialog in the biomedical domain in a low resources context","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.CL","authors_text":"Anita Burgun, Antoine Neuraz, Leonardo Campillos Llanos, Sophie Rosset","submitted_at":"2018-11-23T10:20:02Z","abstract_excerpt":"In the biomedical domain, the lack of sharable datasets often limit the possibility of developing natural language processing systems, especially dialogue applications and natural language understanding models. To overcome this issue, we explore data generation using templates and terminologies and data augmentation approaches. Namely, we report our experiments using paraphrasing and word representations learned on a large EHR corpus with Fasttext and ELMo, to learn a NLU model without any available dataset. We evaluate on a NLU task of natural language queries in EHRs divided in slot-filling "},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1811.09417","kind":"arxiv","version":2},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-17T23:59:37Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"N72IZ9thVGCVSr70O1RWl+g77+G0p5Jn/sae30oOjx4WRAlFphMwgRMFh14V+02yHdxGUm5MJFZT0k70JPBNBw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-05T02:33:47.384447Z"},"content_sha256":"6a7a000da7ebf123af3a7882bcb349346ac0366efbf9391c891682bd018703c1","schema_version":"1.0","event_id":"sha256:6a7a000da7ebf123af3a7882bcb349346ac0366efbf9391c891682bd018703c1"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/KZA5Y7NUWG5HG3PDZ5DKPPO7KY/bundle.json","state_url":"https://pith.science/pith/KZA5Y7NUWG5HG3PDZ5DKPPO7KY/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/KZA5Y7NUWG5HG3PDZ5DKPPO7KY/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-05T02:33:47Z","links":{"resolver":"https://pith.science/pith/KZA5Y7NUWG5HG3PDZ5DKPPO7KY","bundle":"https://pith.science/pith/KZA5Y7NUWG5HG3PDZ5DKPPO7KY/bundle.json","state":"https://pith.science/pith/KZA5Y7NUWG5HG3PDZ5DKPPO7KY/state.json","well_known_bundle":"https://pith.science/.well-known/pith/KZA5Y7NUWG5HG3PDZ5DKPPO7KY/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2018:KZA5Y7NUWG5HG3PDZ5DKPPO7KY","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"33f83cd24c7c7d808d13bbc896dc02d023d7aaebb81369bf50b1dd34d54b32b4","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2018-11-23T10:20:02Z","title_canon_sha256":"411b720ba67b0889bb4aafacd746bff92d609c15f42ec5c3bd547eb1e86e567f"},"schema_version":"1.0","source":{"id":"1811.09417","kind":"arxiv","version":2}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1811.09417","created_at":"2026-05-17T23:59:37Z"},{"alias_kind":"arxiv_version","alias_value":"1811.09417v2","created_at":"2026-05-17T23:59:37Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1811.09417","created_at":"2026-05-17T23:59:37Z"},{"alias_kind":"pith_short_12","alias_value":"KZA5Y7NUWG5H","created_at":"2026-05-18T12:32:33Z"},{"alias_kind":"pith_short_16","alias_value":"KZA5Y7NUWG5HG3PD","created_at":"2026-05-18T12:32:33Z"},{"alias_kind":"pith_short_8","alias_value":"KZA5Y7NU","created_at":"2026-05-18T12:32:33Z"}],"graph_snapshots":[{"event_id":"sha256:6a7a000da7ebf123af3a7882bcb349346ac0366efbf9391c891682bd018703c1","target":"graph","created_at":"2026-05-17T23:59:37Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"In the biomedical domain, the lack of sharable datasets often limit the possibility of developing natural language processing systems, especially dialogue applications and natural language understanding models. To overcome this issue, we explore data generation using templates and terminologies and data augmentation approaches. Namely, we report our experiments using paraphrasing and word representations learned on a large EHR corpus with Fasttext and ELMo, to learn a NLU model without any available dataset. We evaluate on a NLU task of natural language queries in EHRs divided in slot-filling ","authors_text":"Anita Burgun, Antoine Neuraz, Leonardo Campillos Llanos, Sophie Rosset","cross_cats":[],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2018-11-23T10:20:02Z","title":"Natural language understanding for task oriented dialog in the biomedical domain in a low resources context"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1811.09417","kind":"arxiv","version":2},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:3b0bb4e4158ae75e74a81e61c23126c029545b0758530dda7edba177139f3851","target":"record","created_at":"2026-05-17T23:59:37Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"33f83cd24c7c7d808d13bbc896dc02d023d7aaebb81369bf50b1dd34d54b32b4","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2018-11-23T10:20:02Z","title_canon_sha256":"411b720ba67b0889bb4aafacd746bff92d609c15f42ec5c3bd547eb1e86e567f"},"schema_version":"1.0","source":{"id":"1811.09417","kind":"arxiv","version":2}},"canonical_sha256":"5641dc7db4b1ba736de3cf46a7bddf560e630be289735ff39650d234a00b9f9d","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"5641dc7db4b1ba736de3cf46a7bddf560e630be289735ff39650d234a00b9f9d","first_computed_at":"2026-05-17T23:59:37.900394Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-17T23:59:37.900394Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"Wh/+PTNvWZrQFyqbnZQQ/STyjpkgS7HooS92OA29xLxLUXDvjuec178sDB+V4G0EQFnd3kw8+frTJ3q68GMcAw==","signature_status":"signed_v1","signed_at":"2026-05-17T23:59:37.900997Z","signed_message":"canonical_sha256_bytes"},"source_id":"1811.09417","source_kind":"arxiv","source_version":2}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:3b0bb4e4158ae75e74a81e61c23126c029545b0758530dda7edba177139f3851","sha256:6a7a000da7ebf123af3a7882bcb349346ac0366efbf9391c891682bd018703c1"],"state_sha256":"ed41710ee1ee6a9d0699eb506a58f31f9c399e69b5fb0a9974db4eb7717c2f5a"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"HHBIHaPgT8HLJmM+IgsSzoqN9U2/LywP6SjOPivylayce2IRkCeew1KyVe/Fh5mppmmHr1GQyItRgQunufomDA==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-05T02:33:47.386577Z","bundle_sha256":"f39876efb159014df1c31550e9c3d42cf8b98b87e50ba635b400958f72d0af23"}}