@inproceedings{a3d4365b36d2423893b37ae07b2d6ef0,
title = "A bootstrapping approach to symptom entity extraction on Chinese electronic medical records",
abstract = "Symptom entities are widely distributed in Chinese electronic medical records. Previous approaches on symptom entity extraction usually extract continuous strings as symptom entities and require massive human efforts on corpus annotation. We describe the symptom entity as two-tuples of and design a soft pattern matching method to locate them in sentences in the EMR. Our bootstrapping approach which only requires a few annotated symptom tuples and it allows iterative extraction from mass electronic medical record databases without human supervision. Furthermore, the described method annotates symptom entities in EMR by the extracted tuples. Starting with 60 annotated entities, our approach reached an F value of 81.40 \% in the extraction task of 3,150 entities from 992 sets of electronic medical records.",
keywords = "Bootstrapping, Electronic medical record, Named entity extraction, Soft matching",
author = "Tianyi Qin and Yi Guan",
note = "Publisher Copyright: {\textcopyright} Springer International Publishing AG 2016.; 15th China National Conference on Chinese Computational Linguistics, CCL 2016 and 4th International Symposium on Natural Language Processing Based on Naturally Annotated Big Data, NLP-NABD 2016 ; Conference date: 15-10-2016 Through 16-10-2016",
year = "2016",
doi = "10.1007/978-3-319-47674-2\_34",
language = "英语",
isbn = "9783319476735",
series = "Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics)",
publisher = "Springer Verlag",
pages = "413--423",
editor = "Maosong Sun and Zhiyuan Liu and Yang Liu and Hongfei Lin and Xuanjing Huang",
booktitle = "Chinese Computational Linguistics and Natural Language Processing Based on Naturally Annotated Big Data - 15th China National Conference, CCL 2016 and 4th International Symposium, NLP-NABD 2016, Proceedings",
address = "德国",
}