% Conference paper introducing CPIE (Clause+Pattern-guided Information
% Extraction), published in the ACM-BCB 2018 proceedings.
% Notes for maintainers:
%   - The citation key is a repository-generated identifier; it is kept as-is
%     so existing citations of this entry keep resolving.
%   - address holds the publisher's location, not the conference venue.
%   - day, language, keywords and abstract are not among the standard BibTeX
%     fields; styles that do not know them should simply ignore them. They
%     are retained as metadata.
@inproceedings{8a7707a26a6347758c70a3aac2ac2f5b,
  author    = {Wang, Xuan and Zhang, Yu and Li, Qi and Chen, Yinyin and Han, Jiawei},
  title     = {Open Information Extraction with Meta-pattern Discovery in Biomedical Literature},
  booktitle = {{ACM-BCB} 2018 - Proceedings of the 2018 {ACM} International Conference on Bioinformatics, Computational Biology, and Health Informatics},
  publisher = {Association for Computing Machinery},
  address   = {New York, NY, USA},
  pages     = {291--300},
  year      = {2018},
  month     = aug,
  day       = {15},
  doi       = {10.1145/3233547.3233594},
  language  = {English (US)},
  keywords  = {Biomedical information extraction, Open information extraction, Pattern mining, Text mining},
  note      = {Publisher Copyright: {\textcopyright} 2018 ACM. 9th ACM International Conference on Bioinformatics, Computational Biology, and Health Informatics, ACM-BCB 2018; Conference date: 29-08-2018 Through 01-09-2018},
  abstract  = {Biomedical open information extraction (BioOpenIE) is a novel paradigm to automatically extract structured information from unstructured text with no or little supervision. It does not require any pre-specified relation types but aims to extract all the relation tuples from the corpus. A major challenge for open information extraction (OpenIE) is that it produces massive surface-name formed relation tuples that cannot be directly used for downstream applications. We propose a novel framework CPIE (Clause+Pattern-guided Information Extraction) that incorporates clause extraction and meta-pattern discovery to extract structured relation tuples with little supervision. Compared with previous OpenIE methods, CPIE produces massive but more structured output that can be directly used for downstream applications. We first detect short clauses from input sentences. Then we extract quality textual patterns and perform synonymous pattern grouping to identify relation types. Last, we obtain the corresponding relation tuples by matching each quality pattern in the text. Experiments show that CPIE achieves the highest precision in comparison with state-of-the-art OpenIE baselines, and also keeps the distinctiveness and simplicity of the extracted relation tuples. CPIE shows great potential in effectively dealing with real-world biomedical literature with complicated sentence structures and rich information.},
}