% Question-answering bibliography.
%
% Layout: one entry per block, one field per line, every value brace-delimited.
% Citation keys are kept exactly as they were so existing \cite commands keep
% working. Fields such as added-at, biburl, interhash, intrahash, keywords,
% library, timestamp, ee and optpages are not known to the standard styles and
% are carried along unchanged as bookkeeping data (the biburl values point at
% bibsonomy.org, so this is presumably a BibSonomy export -- confirm).
% Special characters in abstracts are LaTeX-escaped so that styles which print
% the abstract do not break.

@inproceedings{Tutos:2010,
  abstract = {This paper describes an evaluation of the answerability of a set of clinical questions posed by physicians. The clinical questions belong to two categories of the five-leaf high-level hierarchical Evidence Taxonomy created by Ely and his colleagues: Intervention and Non Intervention. The questions are passed to two search engines (PubMed, Google), two question-answering systems (MedQA, Answers.com's BrainBoost), and a dictionary (OneLook) for locating the answers to the question corpus. The output of the systems is judged by a human and scored according to the Mean Reciprocal Rank (MRR). The results show the need for question modification and analyse the impact of specific types of modifications. The results also show that No Intervention questions are easier to answer than Intervention questions. Further, generic search engines like Google obtain higher MRR than specialised systems and even higher than a version of Google based on specialised literature (PubMed) only. In addition, an analysis of the location of the answer in the returned documents is provided.},
  added-at = {2010-02-03T05:18:03.000+0100},
  author = {Tutos, Andreea and Moll{\'a}, Diego},
  biburl = {http://www.bibsonomy.org/bibtex/276e4958f59a96bfab2f1d14d5a735174/diego_ma},
  booktitle = {Proceedings HIKM 2010},
  interhash = {a2d36c4e380ca7fa0f579de76f9984d3},
  intrahash = {76e4958f59a96bfab2f1d14d5a735174},
  keywords = {molla_medicalnlp search inf-retr question_answering biomedical molla_publication},
  optpages = {8 pages},
  timestamp = {2010-02-03T05:18:03.000+0100},
  title = {A Study on the Use of Search Engines for Answering Clinical Questions},
  year = {2010}
}

@incollection{Shen:2005,
  abstract = {In this paper, we explore the syntactic relation patterns for open domain factoid question answering. We propose a pattern extraction method to extract the various relations between the proper answers and different types of question words, including target words, head words, subject words and verbs, from syntactic trees. We further propose a QA-specific tree kernel to partially match the syntactic relation patterns. It makes the more tolerant matching between two patterns and helps to solve the data sparseness problem. Lastly, we incorporate the patterns into a Maximum Entropy Model to rank the answer candidates. The experiment on TREC questions shows that the syntactic relation patterns help to improve the performance by 6.91 MRR based on the common features.},
  added-at = {2009-11-11T22:33:15.000+0100},
  author = {Shen, Dan and Kruijff, Geert-Jan M. and Klakow, Dietrich},
  biburl = {http://www.bibsonomy.org/bibtex/2a36b72928b449ac746792a05d0ec2d7c/diego_ma},
  booktitle = {Natural Language Processing -- IJCNLP 2005: Second International Joint Conference, Jeju Island, Korea, October 11-13, 2005. Proceedings.},
  editor = {Dale, Robert and Wong, Kam-Fai and Su, Jian and Kwong, Oi Yee},
  interhash = {cb28273b2a1837858d716919cca0c5ed},
  intrahash = {a36b72928b449ac746792a05d0ec2d7c},
  keywords = {question_answering machine_learning},
  publisher = {Springer-Verlag},
  timestamp = {2009-11-11T22:33:15.000+0100},
  title = {Exploring Syntactic Relation Patterns for Question Answering},
  url = {http://www.aclweb.org/anthology-new/I/I05/I05-1045.pdf},
  year = {2005}
}

@inproceedings{Shen:2006,
  abstract = {In this paper, we explore correlation of dependency relation paths to rank candidate answers in answer extraction. Using the correlation measure, we compare dependency relations of a candidate answer and mapped question phrases in sentence with the corresponding relations in question. Different from previous studies, we propose an approximate phrase mapping algorithm and incorporate the mapping score into the correlation measure. The correlations are further incorporated into a Maximum Entropy-based ranking model which estimates path weights from training. Experimental results show that our method significantly outperforms state-of-the-art syntactic relation-based methods by up to 20\% in MRR.},
  added-at = {2009-11-11T22:33:09.000+0100},
  address = {Sydney},
  author = {Shen, Dan and Klakow, Dietrich},
  biburl = {http://www.bibsonomy.org/bibtex/2b385d2d62a1cec0bcaa6f01019112f65/diego_ma},
  booktitle = {Proceedings COLING/ACL 2006},
  interhash = {6966be5911653238e919c7e841c639d8},
  intrahash = {b385d2d62a1cec0bcaa6f01019112f65},
  keywords = {question_answering machine_learning dependencies DG},
  pages = {889--896},
  timestamp = {2009-11-11T22:33:09.000+0100},
  title = {Exploring Correlation of Dependency Relation Paths for Answer Extraction},
  url = {http://acl.ldc.upenn.edu/P/P06/P06-1112.pdf},
  year = {2006}
}

@inproceedings{Ravichandran:2003,
  abstract = {In this paper, we show that we can obtain a good baseline performance for Question Answering (QA) by using only 4 simple features. Using these features, we contrast two approaches used for a Maximum Entropy based QA system. We view the QA problem as a classification problem and as a reranking problem. Our results indicate that the QA system viewed as a reranker clearly outperforms the QA system used as a classifier. Both systems are trained using the same data.},
  added-at = {2009-11-11T21:29:27.000+0100},
  author = {Ravichandran, Deepak and Hovy, Eduard and Och, Franz Josef},
  biburl = {http://www.bibsonomy.org/bibtex/2a27d23a8d3286099674171fc5307141c/diego_ma},
  booktitle = {Proc. ACL03 workshop on Multilingual Summarization and Question Answering},
  interhash = {0b74ba3543cd82189f339e300d293813},
  intrahash = {a27d23a8d3286099674171fc5307141c},
  keywords = {question_answering statistical_nlp maxent},
  timestamp = {2009-11-11T21:29:27.000+0100},
  title = {Statistical {QA} - Classifier vs. Re-ranker: What's the Difference?},
  url = {http://acl.ldc.upenn.edu/acl2003/mlsum/pdfs/Ravichandran.pdf},
  year = {2003}
}

@inproceedings{Cao:2009,
  abstract = {Question answering is different from information retrieval in that it attempts to answer questions by providing summaries from numerous retrieved documents rather than by simply providing a list of documents that requires users to do additional work. However, the quality of answers that question answering provides has not been investigated extensively, and the practical approach to presenting question answers still needs more study. In addition to factoid answering using phrases or entities, most question answering systems use a sentence-based approach for generating answers. However, many sentences are often only meaningful or understandable in their context, and a passage-based presentation can often provide richer, more coherent context. However, passage-based presentations may introduce additional noise that places greater burden on users. In this study, we performed a quantitative evaluation on the two kinds of presentation produced by our online clinical question answering system, AskHERMES (http://www.AskHERMES.org). The overall finding is that, although irrelevant context can hurt the quality of an answer, the passage-based approach is generally more effective in that it provides richer context and matching across sentences.},
  added-at = {2009-10-21T23:50:43.000+0200},
  author = {Cao, Yong-gang and Ely, John and Antieau, Lamont and Yu, Hong},
  biburl = {http://www.bibsonomy.org/bibtex/2827423c54365f46397adff2acf5be1d8/diego_ma},
  booktitle = {Proc BioNLP 2009},
  interhash = {14a5f834a262696999eacebc7f973000},
  intrahash = {827423c54365f46397adff2acf5be1d8},
  keywords = {biomedical question_answering evaluation},
  pages = {171--178},
  timestamp = {2009-10-21T23:50:43.000+0200},
  title = {Evaluation of the Clinical Question Answering Presentation},
  url = {http://www.aclweb.org/anthology-new/W/W09/#1300},
  year = {2009}
}

@article{Harabagiu:2007,
  abstract = {Generating summaries that meet the information needs of a user relies on (1) several forms of question decomposition; (2) different summarization approaches; and (3) textual inference for combining the summarization strategies. This novel framework for summarization has the advantage of producing highly responsive summaries, as indicated by the evaluation results.},
  added-at = {2009-10-21T23:09:17.000+0200},
  author = {Harabagiu, Sandra and Hickl, Andrew and Lacatusu, Finley},
  biburl = {http://www.bibsonomy.org/bibtex/2dffae72016582208b1c20bb067790f93/diego_ma},
  interhash = {30f97c12497058459d13feb3784fb993},
  intrahash = {dffae72016582208b1c20bb067790f93},
  journal = {Information Processing \& Management},
  keywords = {summarisation question_answering},
  pages = {1619--1642},
  timestamp = {2009-10-21T23:09:17.000+0200},
  title = {Satisfying Information Needs with Multi-document Summaries},
  url = {http://portal.acm.org/citation.cfm?id=1285158},
  volume = {43},
  year = {2007}
}

@inproceedings{Green:1961,
  added-at = {2009-09-17T23:46:31.000+0200},
  address = {Los Angeles, CA},
  author = {Green, B. F. and Wolf, A. K. and Chomsky, C. and Laughery, K.},
  biburl = {http://www.bibsonomy.org/bibtex/2f671771de41cbe6596c576ab578568e2/diego_ma},
  booktitle = {Proceedings Western Joint IRE-AIEE-ACM Computing Conference},
  interhash = {b79d23ae18618ae1e722c4050b1575ba},
  intrahash = {f671771de41cbe6596c576ab578568e2},
  keywords = {question_answering},
  pages = {219--224},
  timestamp = {2009-09-17T23:46:31.000+0200},
  title = {{BASEBALL}: An Automatic Question Answerer},
  volume = {19},
  year = {1961}
}

@article{Bouma:2005:3,
  added-at = {2009-09-15T17:22:44.000+0200},
  author = {Bouma, Gosse and Fahmi, Ismail and Mur, Jori and {van Noord}, Gertjan and {van der Plas}, Lonneke and Tiedemann, J{\"o}rg},
  biburl = {http://www.bibsonomy.org/bibtex/279bc05bc334f9825d321071ca3825244/diego_ma},
  interhash = {653c2639b94e99bf470ba9bb26ab6342},
  intrahash = {79bc05bc334f9825d321071ca3825244},
  journal = {Traitement Automatique des Langues (TAL)},
  keywords = {question_answering DG},
  number = {3},
  pages = {15--39},
  timestamp = {2009-09-15T17:22:44.000+0200},
  title = {Linguistic Knowledge and Question Answering},
  url = {http://www.let.rug.nl/~gosse/papers.html},
  volume = {46},
  year = {2005}
}

@inproceedings{Lin:2007,
  abstract = {Access to clinical evidence is a critical component of the practice of evidence-based medicine. Advanced retrieval systems can supplement precompiled secondary sources to assist physicians in making sound clinical decisions. This study explores one particular issue related to the design of such retrieval systems: the effective organization of search results to facilitate rapid understanding and synthesis of potentially relevant information. We hypothesize that grouping retrieved MEDLINE\textregistered{} citations into semantically-coherent clusters, based on automatically-extracted interventions from the abstract text, represents an effective strategy for presenting results, compared to a traditional ranked list. Experiments with our implemented system appear to support this claim.},
  added-at = {2009-08-28T22:25:10.000+0200},
  author = {Lin, Jimmy and Demner-Fushman, Dina},
  biburl = {http://www.bibsonomy.org/bibtex/2286a5fe4fa5220c95046aca38a75f533/diego_ma},
  booktitle = {AMIA Annu Symp Proc.},
  interhash = {a894d568ce76fdc46ac489aeb707471d},
  intrahash = {286a5fe4fa5220c95046aca38a75f533},
  keywords = {question_answering biomedical},
  pages = {458--462},
  timestamp = {2009-08-28T22:25:10.000+0200},
  title = {Semantic Clustering of Answers to Clinical Questions},
  url = {http://www.pubmedcentral.nih.gov/articlerender.fcgi?artid=2655873},
  year = {2007}
}

% NOTE(review): the key below is "Hong:2008" although the first author's
% family name is Yu; the key is kept as-is so existing citations still resolve.
@inproceedings{Hong:2008,
  abstract = {Automatically extracting information needs from ad hoc clinical questions is an important step towards medical question answering. In this work, we first explored supervised machine-learning approaches to automatically classify an ad hoc clinical question into general topics. We then explored both unsupervised and supervised methods for automatically extracting keywords from an ad hoc clinical question. Our methods were evaluated on the 4,654 clinical questions maintained by the National Library of Medicine. Our best systems or methods showed F-score of 76\% for the task of question-general topic classification and of 58\% for extracting keywords from ad hoc clinical questions.},
  added-at = {2009-08-28T21:57:28.000+0200},
  author = {Yu, Hong and Cao, Yong-gang},
  biburl = {http://www.bibsonomy.org/bibtex/2f8f917ddef747ce10972cdf3c5cebae8/diego_ma},
  booktitle = {AMIA Annu Symp Proc.},
  interhash = {8a99115444657c334df420f4153cd102},
  intrahash = {f8f917ddef747ce10972cdf3c5cebae8},
  keywords = {biomedical question_answering question_analysis},
  pages = {96--100},
  timestamp = {2009-08-28T21:57:28.000+0200},
  title = {Automatically Extracting Information Needs from Ad Hoc Clinical Questions},
  year = {2008}
}

@inproceedings{Demner-Fushman:2006,
  added-at = {2009-08-28T21:47:37.000+0200},
  author = {Demner-Fushman, Dina and Lin, Jimmy},
  biburl = {http://www.bibsonomy.org/bibtex/29b9991ab29887cfb95d1e3aa30921a5a/diego_ma},
  booktitle = {Proceedings ACL},
  date = {2006-11-03},
  ee = {http://acl.ldc.upenn.edu/P/P06/P06-1106.pdf},
  interhash = {547a66cdb2c9f3ff1781443740b1dd85},
  intrahash = {9b9991ab29887cfb95d1e3aa30921a5a},
  keywords = {clinical clustering question_answering summarisation},
  publisher = {The Association for Computational Linguistics},
  timestamp = {2009-08-28T21:47:37.000+0200},
  title = {Answer Extraction, Semantic Clustering, and Extractive Summarization for Clinical Question Answering},
  url = {http://dblp.uni-trier.de/db/conf/acl/acl2006.html\#Demner-FushmanL06},
  year = {2006}
}

@inproceedings{Huang:2006,
  abstract = {The paradigm of evidence-based medicine (EBM) recommends that physicians formulate clinical questions in terms of the problem/population, intervention, comparison, and outcome. Together, these elements comprise a PICO frame. Although this framework was developed to facilitate the formulation of clinical queries, the ability of PICO structures to represent physicians' information needs has not been empirically investigated. This paper evaluates the adequacy and suitability of PICO frames as a knowledge representation by analyzing 59 real-world primary-care clinical questions. We discovered that only two questions in our corpus contain all four PICO elements, and that 37\% of questions contain both intervention and outcome. Our study reveals prevalent structural patterns for the four types of clinical questions: therapy, diagnosis, prognosis, and etiology. We found that the PICO framework is primarily centered on therapy questions, and is less suitable for representing other types of clinical information needs. Challenges in mapping natural language questions into PICO structures are also discussed. Although we point out limitations of the PICO framework, our work as a whole reaffirms its value as a tool to assist physicians practicing EBM.},
  added-at = {2009-08-28T21:46:37.000+0200},
  author = {Huang, Xiaoli and Lin, Jimmy and Demner-Fushman, Dina},
  biburl = {http://www.bibsonomy.org/bibtex/27fff9d054c3c86a475fb9fda29e9a905/diego_ma},
  booktitle = {AMIA Annu Symp Proc.},
  interhash = {348be73b32f29ae783785b25d0c9a1b7},
  intrahash = {7fff9d054c3c86a475fb9fda29e9a905},
  keywords = {PICO biomedical question_answering},
  pages = {359--363},
  timestamp = {2009-08-28T21:46:37.000+0200},
  title = {Evaluation of {PICO} as a Knowledge Representation for Clinical Questions},
  url = {http://www.pubmedcentral.nih.gov/articlerender.fcgi?tool=pubmed&pubmedid=17238363},
  year = {2006}
}

@inproceedings{Dang:2008b,
  added-at = {2009-08-17T09:24:28.000+0200},
  author = {Dang, Hoa Tran},
  biburl = {http://www.bibsonomy.org/bibtex/21be0ee9a7553672c1912fdb3d2496121/diego_ma},
  booktitle = {Proc. TAC 2008},
  interhash = {d2441a48504ae8b04119ecc7f6a13398},
  intrahash = {1be0ee9a7553672c1912fdb3d2496121},
  keywords = {summarisation question_answering},
  library = {Unknown (August 2009)},
  timestamp = {2009-08-17T09:24:28.000+0200},
  title = {Overview of the {TAC} 2008 Opinion Question Answering and Summarization Tasks},
  year = {2008}
}

@inproceedings{Yu:2005,
  abstract = {Research has shown that answers do not exist in biomedical corpora for many questions posed by physicians. We have therefore developed a question filtering component that determines whether or not a posed question is answerable. Using 200 clinical questions that have been annotated by physicians to be answerable or unanswerable, we have explored the use of supervised machine-learning algorithms to automatically classify questions into one of these two categories. We also have incorporated semantic features from a large biomedical knowledge terminology. Our results show that incorporating semantic features in general enhances the performance of question classification and the best system is a probabilistic indexing system that achieves an 80.5\% accuracy. Our analysis also shows that stop words may play an important role for separating Answerable from Unanswerable.},
  added-at = {2009-08-14T09:16:09.000+0200},
  author = {Yu, Hong and Sable, Carl},
  biburl = {http://www.bibsonomy.org/bibtex/261167a4bef4dfea2596b14a905ad46e0/diego_ma},
  booktitle = {Proc. IJCAI'05 Workshop on Knowledge and Reasoning for Answering Questions},
  interhash = {44a3aa191951f053b00ac9f83fd96cf4},
  intrahash = {61167a4bef4dfea2596b14a905ad46e0},
  keywords = {question_classification question_answering biomedical answerability},
  library = {Web (August 2009)},
  timestamp = {2009-08-14T09:16:09.000+0200},
  title = {Being {Erlang Shen}: Identifying Answerable Questions},
  url = {http://www.uwm.edu/~hongyu/publications.html},
  year = {2005}
}

@inproceedings{Yu:2005b,
  abstract = {We present supervised machine-learning approaches to automatically classify medical questions based on a hierarchical evidence taxonomy created by physicians. We show that SVMs is the best classifier for this task and that a ladder approach, which incorporates the knowledge representation of the hierarchical evidence taxonomy, leads to the highest performance. We have explored the use of features from a large, robust biomedical knowledge resource, namely, the Unified Medical Language System (UMLS), and we have found that performance is generally enhanced by including these features in addition to bag-of-words.},
  added-at = {2009-08-14T09:16:01.000+0200},
  author = {Yu, Hong and Sable, Carl and Zhu, Hai Ran},
  biburl = {http://www.bibsonomy.org/bibtex/2536edeb935472f74ddf66a0d4deb20fd/diego_ma},
  booktitle = {Proc. AAAI'05 Workshop on Question Answering in Restricted Domains},
  interhash = {53370a14e66634dd4250c7f2b8114ff3},
  intrahash = {536edeb935472f74ddf66a0d4deb20fd},
  keywords = {question_classification question_answering biomedical},
  library = {Web (August 2009)},
  timestamp = {2009-08-14T09:16:01.000+0200},
  title = {Classifying Medical Questions based on an Evidence Taxonomy},
  url = {http://www.uwm.edu/~hongyu/publications.html},
  year = {2005}
}

@inproceedings{Terol:2006,
  abstract = {Nowadays, there is an increasing interest in research on QA over restricted domains. Concretely, in this paper we will show the process of question analysis in a medical QA system. This system is able to obtain answers to different natural language questions according to a question taxonomy. In this system we combine the use of NLP techniques and biomedical resources. The main NLP technique is the use of logic forms and the pattern matching technique in this question analysis performance.},
  added-at = {2009-07-22T09:58:28.000+0200},
  author = {Terol, Rafael M. and Mart{\'\i}nez-Barco, Patricio and Palomar, Manuel},
  biburl = {http://www.bibsonomy.org/bibtex/2c1668fd0f8578440a8ec619d9e02b46e/diego_ma},
  booktitle = {MICAI 2006: Advances in Artificial Intelligence},
  date = {2006-11-09},
  description = {dblp},
  editor = {Gelbukh, Alexander F. and Garc{\'\i}a, Carlos A. Reyes},
  ee = {http://dx.doi.org/10.1007/11925231_95},
  interhash = {361d56bedfd4e7a6635e69d00dd25ed6},
  intrahash = {c1668fd0f8578440a8ec619d9e02b46e},
  isbn = {3-540-49026-4},
  keywords = {questions question_answering biomedical},
  library = {Web},
  pages = {996--1006},
  publisher = {Springer},
  series = {Lecture Notes in Computer Science},
  timestamp = {2009-07-22T09:58:28.000+0200},
  title = {Applying {NLP} Techniques and Biomedical Resources to Medical Questions in {QA} Performance},
  url = {http://www.springerlink.com/content/788w3483g2723927/},
  volume = {4293},
  year = {2006}
}

@inproceedings{Awadallah:2006,
  abstract = {Answering multiple-choice questions, where a set of possible answers is provided together with the question, constitutes a simplified but nevertheless challenging area in question answering research. This paper introduces and evaluates two novel techniques for answer selection. It furthermore analyses in how far performance figures obtained using the English language Web as data source can be transferred to less dominant languages on the Web, such as Arabic. Result evaluation is based on questions from both the English and the Arabic versions of the TV show ``Who wants to be a Millionaire?'' as well as on the TREC-2002 QA data.},
  added-at = {2009-05-27T07:50:20.000+0200},
  author = {Awadallah, Rawia and Rauber, Andreas},
  biburl = {http://www.bibsonomy.org/bibtex/252a06bb724d6a7adc387ce1ce8c54491/diego_ma},
  booktitle = {Proceedings of the 28th European Conference on Information Retrieval (ECIR 2006)},
  interhash = {99f24b6b3fa89a0f348bd0b75552301c},
  intrahash = {52a06bb724d6a7adc387ce1ce8c54491},
  keywords = {multiple_choice www question_answering},
  library = {Mine (May 2009)},
  pages = {515--518},
  timestamp = {2009-05-27T07:50:20.000+0200},
  title = {Web-based Multiple Choice Question Answering for {English} and {Arabic} Questions},
  url = {http://www.ifs.tuwien.ac.at/~andi/lop.html},
  year = {2006}
}

@inproceedings{Schlaefer:2006a,
  abstract = {The Ephyra QA system has been developed as a flexible open-domain QA framework. This framework allows us to combine several techniques for question analysis and answer extraction and to incorporate multiple knowledge bases to best fit the requirements of the TREC QA track, in which we participated this year for the first time. The techniques used include pattern learning and matching, answer type analysis and redundancy elimination through filters. In this paper, we give an overview of the Ephyra system as used within TREC 2006 and analyze the system's performance in the QA track.},
  added-at = {2009-03-31T10:24:13.000+0200},
  author = {Schlaefer, Nico and Gieselmann, Petra and Sautter, Guido},
  biburl = {http://www.bibsonomy.org/bibtex/2f18e676141d1db1689a7d41776cb55d7/diego_ma},
  booktitle = {Proceedings of the Fifteenth Text REtrieval Conference (TREC)},
  interhash = {d1465aa0b873e8aead56a34e6a59e3c2},
  intrahash = {f18e676141d1db1689a7d41776cb55d7},
  keywords = {question_answering ephyra},
  timestamp = {2009-03-31T10:24:13.000+0200},
  title = {The {Ephyra} {QA} System at {TREC} 2006},
  url = {http://www.cs.cmu.edu/~nico/pubs/trec2006\_schlaefer.pdf},
  year = {2006}
}

@inproceedings{vanZaanen:2008,
  added-at = {2009-03-31T10:22:24.000+0200},
  author = {van Zaanen, Menno},
  biburl = {http://www.bibsonomy.org/bibtex/2d30ebb040a32223b88ca07c845f3f9eb/diego_ma},
  booktitle = {Working Notes of CLEF 2008},
  interhash = {bf5c884ad0110f6d797aab8d8ba0d9fd},
  intrahash = {d30ebb040a32223b88ca07c845f3f9eb},
  keywords = {question_answering},
  timestamp = {2009-03-31T10:22:24.000+0200},
  title = {Multi-lingual Question Answering using {OpenEphyra}},
  url = {http://www.clef-campaign.org/2008/working\_notes/CLEF2008WN-Contents.html},
  year = {2008}
}

% NOTE(review): the doi below looks like the DOI of the whole volume rather
% than of this chapter, and year (2007) differs from the "/2008" that used to
% be appended to the volume number -- confirm against the publisher record.
@inproceedings{Turmo:2007,
  abstract = {This paper describes QAST, a pilot track of CLEF 2007 aimed at evaluating the task of Question Answering in Speech Transcripts. The paper summarizes the evaluation framework, the systems that participated and the results achieved. These results have shown that question answering technology can be useful to deal with spontaneous speech transcripts, so for manually transcribed speech as for automatically recognized speech. The loss in accuracy from dealing with manual transcripts to dealing with automatic ones implies that there is room for future research in this area.},
  added-at = {2009-03-27T09:05:20.000+0100},
  address = {Berlin / Heidelberg},
  author = {Turmo, Jordi and Comas, Pere R. and Ayache, Christelle and Mostefa, Djamel and Rosset, Sophie and Lamel, Lori},
  biburl = {http://www.bibsonomy.org/bibtex/27a93e5480645ac89d78ec7bb158b35b1/diego_ma},
  booktitle = {Advances in Multilingual and Multimodal Information Retrieval},
  doi = {10.1007/978-3-540-85760-0},
  interhash = {3236a27ba9183e4421ee05eba183d532},
  intrahash = {7a93e5480645ac89d78ec7bb158b35b1},
  keywords = {speech question_answering},
  library = {Web (March 2009)},
  pages = {249--256},
  publisher = {Springer},
  series = {Lecture Notes in Computer Science},
  timestamp = {2009-03-27T09:05:20.000+0100},
  title = {Overview of {QAST 2007}},
  url = {http://www.springerlink.com/content/d511437177k776q0/},
  volume = {5152},
  year = {2007}
}