@inproceedings{3c8e8f36193b4c2b8bddbb0803b036ec,
title = "An automatic unsupervised querying algorithm for efficient information extraction in biomedical domain",
abstract = "In the domain of bioinformatics, extracting a relation such as protein-protein iriterations from a large database of text documents is a challenging task. One major issue with biomedical information extraction is how to efficiently digest the sheersize of unstructured biomedical data corpus. Often, among these huge biomedical data, only a small fraction of the documents contain information that is relevant to the extraction task. We propose a novel query expansion algorithm to automatically discover the characteristics of documents that are useful for extraction of a target relation. Our technique introduces a hybrid query re-weighting algorithm combining the modified Robertson Sparck-Jones query ranking algorithm with a keyphrase extraction algorithm. Our technique also adopts a novel query translation technique that incorporates POS categories to query translation. We conduct a series of experiments and report the experimental results. The results show that our technique is able to retrieve more documents that contain protein-protein pairs from MEDLINE as iteration increases. Our technique is also compared with SLIPPER, a supervised rule-based query expansion technique. The results show that our technique outperforms SLIPPER from 17.90% to 29.98 better in four iterations.",
author = "Min Song and Song, {Il Yeol} and Xiaohua Hu and Allen, {Robert B.}",
year = "2005",
doi = "10.1007/11430919_22",
language = "English",
isbn = "3540260765",
series = "Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics)",
publisher = "Springer Verlag",
pages = "173--179",
booktitle = "Advances in Knowledge Discovery and Data Mining - 9th Pacific-Asia Conference, PAKDD 2005, Proceedings",
address = "Germany",
note = "9th Pacific-Asia Conference on Advances in Knowledge Discovery and Data Mining, PAKDD 2005 ; Conference date: 18-05-2005 Through 20-05-2005",
}