<?xml version="1.0" encoding="UTF-8"?>
<rdf:RDF xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" xmlns:burst="http://xmlns.com/burst/0.1/" xmlns:xsd="http://www.w3.org/2001/XMLSchema#" xmlns="http://purl.org/rss/1.0/" xmlns:admin="http://webns.net/mvcb/" xmlns:rdfs="http://www.w3.org/2000/01/rdf-schema#" xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:owl="http://www.w3.org/2002/07/owl#" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:syn="http://purl.org/rss/1.0/modules/syndication/" xmlns:swrc="http://swrc.ontoware.org/ontology#" xmlns:cc="http://web.resource.org/cc/"><channel rdf:about="http://www.bibsonomy.org/user/diego_ma/named_entities"><title>BibSonomy publications for /user/diego_ma/named_entities</title><link>http://www.bibsonomy.org/burst/user/diego_ma/named_entities</link><description>BibSonomy RSS feed for /user/diego_ma/named_entities</description><dc:date>2010-03-21T18:46:03+01:00</dc:date><items><rdf:Seq><rdf:li rdf:resource="http://www.bibsonomy.org/bibtex/26331703e11ece23065a9fda52e0827ad/diego_ma"/><rdf:li rdf:resource="http://www.bibsonomy.org/bibtex/264e2ff61c23df0f5f02914ea091dc158/diego_ma"/><rdf:li rdf:resource="http://www.bibsonomy.org/bibtex/28d8585e90538626d8169eeeb8dda4d97/diego_ma"/><rdf:li rdf:resource="http://www.bibsonomy.org/bibtex/2202b97875a0ca06dba67da3f7febfc86/diego_ma"/><rdf:li rdf:resource="http://www.bibsonomy.org/bibtex/2753c74267baabe14fe6d420b78043998/diego_ma"/><rdf:li rdf:resource="http://www.bibsonomy.org/bibtex/22b0790ca9fa1c810363f5df441fc1254/diego_ma"/><rdf:li rdf:resource="http://www.bibsonomy.org/bibtex/28a56675983754175b10280cc944d8e92/diego_ma"/><rdf:li rdf:resource="http://www.bibsonomy.org/bibtex/222f9837dac4a70418136ddfff25b241d/diego_ma"/><rdf:li rdf:resource="http://www.bibsonomy.org/bibtex/2cf5005cce6fad851c7227451f85c4fcb/diego_ma"/><rdf:li rdf:resource="http://www.bibsonomy.org/bibtex/2f9d2c45fe747b42f22f5da88cf71fd41/diego_ma"/><rdf:li 
rdf:resource="http://www.bibsonomy.org/bibtex/2fe587667402ffc32b6d0d635db627a7d/diego_ma"/><rdf:li rdf:resource="http://www.bibsonomy.org/bibtex/2a97c64b39d5d713400082f785d734d5b/diego_ma"/><rdf:li rdf:resource="http://www.bibsonomy.org/bibtex/2d4f233fd44172dfcf0d98dd03bc781e1/diego_ma"/><rdf:li rdf:resource="http://www.bibsonomy.org/bibtex/2ce8cc5153963e37fc34d9b71c2bbcc93/diego_ma"/></rdf:Seq></items></channel><item rdf:about="http://www.bibsonomy.org/bibtex/26331703e11ece23065a9fda52e0827ad/diego_ma"><title>A Survey of Named Entity Recognition and Classification</title><link>http://www.bibsonomy.org/bibtex/26331703e11ece23065a9fda52e0827ad/diego_ma</link><dc:creator>diego_ma</dc:creator><dc:date>2009-07-06T10:21:03+02:00</dc:date><dc:subject>named_entities survey </dc:subject><content:encoded>&lt;span style=&#034;color:#555555;&#034;&gt;Nadeau, &lt;a href=&#034;http://www.bibsonomy.org/author/David&#034;&gt;David&lt;/a&gt;  and Sekine, &lt;a href=&#034;http://www.bibsonomy.org/author/Satoshi&#034;&gt;Satoshi&lt;/a&gt;  &lt;/span&gt;&lt;em&gt;Journal of Linguisticae Investigationes&lt;/em&gt;&lt;em&gt;30(1):1-20&lt;/em&gt;(&lt;em&gt;2007&lt;/em&gt;)</content:encoded><taxo:topics><rdf:Bag><rdf:li rdf:resource="http://www.bibsonomy.org/tag/named_entities"/><rdf:li rdf:resource="http://www.bibsonomy.org/tag/survey"/></rdf:Bag></taxo:topics><burst:publication><rdf:Description rdf:about="http://www.bibsonomy.org/bibtex/26331703e11ece23065a9fda52e0827ad/diego_ma"><owl:sameAs rdf:resource="http://www.bibsonomy.org/uri/bibtex/26331703e11ece23065a9fda52e0827ad/diego_ma"/><rdf:type rdf:resource="http://swrc.ontoware.org/ontology#Article"/><owl:sameAs rdf:resource="http://nlp.cs.nyu.edu/sekine/papers/li07.pdf"/><swrc:date>Mon Jul 06 10:21:03 CEST 2009</swrc:date><swrc:journal>Journal of Linguisticae Investigationes</swrc:journal><swrc:number>1</swrc:number><swrc:pages>1-20</swrc:pages><swrc:title>A Survey of Named Entity Recognition and 
Classification</swrc:title><swrc:volume>30</swrc:volume><swrc:year>2007</swrc:year><swrc:keywords>named_entities survey </swrc:keywords><swrc:hasExtraField><swrc:Field swrc:value="Mine (July 2009)" swrc:key="library"/></swrc:hasExtraField><swrc:author><rdf:Seq><rdf:_1><swrc:Person swrc:name="Nadeau, David"/></rdf:_1><rdf:_2><swrc:Person swrc:name="Sekine, Satoshi"/></rdf:_2></rdf:Seq></swrc:author></rdf:Description></burst:publication></item><item rdf:about="http://www.bibsonomy.org/bibtex/264e2ff61c23df0f5f02914ea091dc158/diego_ma"><title>Named Entity Recognition for Question Answering</title><link>http://www.bibsonomy.org/bibtex/264e2ff61c23df0f5f02914ea091dc158/diego_ma</link><dc:creator>diego_ma</dc:creator><dc:date>2008-10-10T05:18:00+02:00</dc:date><dc:subject>named_entities AnswerFinder molla_publication </dc:subject><content:encoded>&lt;span style=&#034;color:#555555;&#034;&gt;Diego &lt;a href=&#034;http://www.bibsonomy.org/author/Moll{\&amp;#039;a}&#034;&gt;Moll&amp;#225;&lt;/a&gt;  and Menno van &lt;a href=&#034;http://www.bibsonomy.org/author/Zaanen&#034;&gt;Zaanen&lt;/a&gt;  and Daniel &lt;a href=&#034;http://www.bibsonomy.org/author/Smith&#034;&gt;Smith&lt;/a&gt;  &lt;/span&gt;&lt;em&gt;Proceedings ALTW 2006, &lt;/em&gt;&lt;em&gt;page 51-58. 
&lt;/em&gt;(&lt;em&gt;2006&lt;/em&gt;)</content:encoded><taxo:topics><rdf:Bag><rdf:li rdf:resource="http://www.bibsonomy.org/tag/named_entities"/><rdf:li rdf:resource="http://www.bibsonomy.org/tag/AnswerFinder"/><rdf:li rdf:resource="http://www.bibsonomy.org/tag/molla_publication"/></rdf:Bag></taxo:topics><burst:publication><rdf:Description rdf:about="http://www.bibsonomy.org/bibtex/264e2ff61c23df0f5f02914ea091dc158/diego_ma"><owl:sameAs rdf:resource="http://www.bibsonomy.org/uri/bibtex/264e2ff61c23df0f5f02914ea091dc158/diego_ma"/><rdf:type rdf:resource="http://swrc.ontoware.org/ontology#InProceedings"/><swrc:date>Fri Oct 10 05:18:00 CEST 2008</swrc:date><swrc:booktitle>Proceedings ALTW 2006</swrc:booktitle><swrc:pages>51-58</swrc:pages><swrc:title>Named Entity Recognition for Question Answering</swrc:title><swrc:year>2006</swrc:year><swrc:keywords>named_entities AnswerFinder molla_publication </swrc:keywords><swrc:abstract>Current text-based question answering (QA) systems usually contain a named entity recogniser (NER) as a core component. Named entity recognition as traditionally been developed as a component for information extraction systems, and current techniques are focused on this end use. However, no formal assessment has been done on the characteristics of a NER within the task of question answering. In this paper we present a NER that aims at higher recall by allowing multiple entity labels to strings. The NER is embedded in a question answering system and the overall QA system performance is compared to that of one with a traditional variation of the NER that only allows single entity labels. 
It is shown that the added noise produced introduced by the additional labels is offset by the higher recall gained, therefore enabling the QA system to have a better chance to find the answer.</swrc:abstract><swrc:author><rdf:Seq><rdf:_1><swrc:Person swrc:name="Diego Moll{\&#039;a}"/></rdf:_1><rdf:_2><swrc:Person swrc:name="Menno van Zaanen"/></rdf:_2><rdf:_3><swrc:Person swrc:name="Daniel Smith"/></rdf:_3></rdf:Seq></swrc:author></rdf:Description></burst:publication></item><item rdf:about="http://www.bibsonomy.org/bibtex/28d8585e90538626d8169eeeb8dda4d97/diego_ma"><title>A Named Entity Recogniser for Question Answering</title><link>http://www.bibsonomy.org/bibtex/28d8585e90538626d8169eeeb8dda4d97/diego_ma</link><dc:creator>diego_ma</dc:creator><dc:date>2008-01-29T07:22:25+01:00</dc:date><dc:subject>AnswerFinder named_entities molla_publication </dc:subject><content:encoded>&lt;span style=&#034;color:#555555;&#034;&gt;Menno van &lt;a href=&#034;http://www.bibsonomy.org/author/Zaanen&#034;&gt;Zaanen&lt;/a&gt;  and Diego &lt;a href=&#034;http://www.bibsonomy.org/author/Moll\&amp;#039;a&#034;&gt;Moll\&#039;a&lt;/a&gt;  &lt;/span&gt;&lt;em&gt;Proceedings PACLING 2007, &lt;/em&gt;(&lt;em&gt;2007&lt;/em&gt;)</content:encoded><taxo:topics><rdf:Bag><rdf:li rdf:resource="http://www.bibsonomy.org/tag/AnswerFinder"/><rdf:li rdf:resource="http://www.bibsonomy.org/tag/named_entities"/><rdf:li rdf:resource="http://www.bibsonomy.org/tag/molla_publication"/></rdf:Bag></taxo:topics><burst:publication><rdf:Description rdf:about="http://www.bibsonomy.org/bibtex/28d8585e90538626d8169eeeb8dda4d97/diego_ma"><owl:sameAs rdf:resource="http://www.bibsonomy.org/uri/bibtex/28d8585e90538626d8169eeeb8dda4d97/diego_ma"/><rdf:type rdf:resource="http://swrc.ontoware.org/ontology#InProceedings"/><swrc:date>Tue Jan 29 07:22:25 CET 2008</swrc:date><swrc:booktitle>Proceedings PACLING 2007</swrc:booktitle><swrc:title>A Named Entity Recogniser for Question 
Answering</swrc:title><swrc:year>2007</swrc:year><swrc:keywords>AnswerFinder named_entities molla_publication </swrc:keywords><swrc:abstract>Named Entity Recognisers (NERs) are typically used by question answering (QA) systems as means to preselect answer candidates. However, there has not been much work on the formal assessment of the use of NERs for QA nor on their optimal parameters. In this paper we investigate the main characteristics of a NER for QA. The results show that it is important to maintain high recall to retain all possible answers on the one hand, while high precision is essential during the final answer selection phase. We present a NER designed for QA, which aims at having a high recall.</swrc:abstract><swrc:author><rdf:Seq><rdf:_1><swrc:Person swrc:name="Menno van Zaanen"/></rdf:_1><rdf:_2><swrc:Person swrc:name="Diego Moll\&#039;a"/></rdf:_2></rdf:Seq></swrc:author></rdf:Description></burst:publication></item><item rdf:about="http://www.bibsonomy.org/bibtex/2202b97875a0ca06dba67da3f7febfc86/diego_ma"><title>Named Entity Recognition in Question Answering of Speech Data</title><link>http://www.bibsonomy.org/bibtex/2202b97875a0ca06dba67da3f7febfc86/diego_ma</link><dc:creator>diego_ma</dc:creator><dc:date>2008-01-29T07:21:37+01:00</dc:date><dc:subject>AnswerFinder named_entities speech molla_publication </dc:subject><content:encoded>&lt;span style=&#034;color:#555555;&#034;&gt;Diego &lt;a href=&#034;http://www.bibsonomy.org/author/Moll{\&amp;#039;a}&#034;&gt;Moll&amp;#225;&lt;/a&gt;  and Menno van &lt;a href=&#034;http://www.bibsonomy.org/author/Zaanen&#034;&gt;Zaanen&lt;/a&gt;  and Steve &lt;a href=&#034;http://www.bibsonomy.org/author/Cassidy&#034;&gt;Cassidy&lt;/a&gt;  &lt;/span&gt;&lt;em&gt;Proc. ALTW 2007, &lt;/em&gt;&lt;em&gt; 5, &lt;/em&gt;&lt;em&gt;page 57-65. 
&lt;/em&gt;(&lt;em&gt;2007&lt;/em&gt;)</content:encoded><taxo:topics><rdf:Bag><rdf:li rdf:resource="http://www.bibsonomy.org/tag/AnswerFinder"/><rdf:li rdf:resource="http://www.bibsonomy.org/tag/named_entities"/><rdf:li rdf:resource="http://www.bibsonomy.org/tag/speech"/><rdf:li rdf:resource="http://www.bibsonomy.org/tag/molla_publication"/></rdf:Bag></taxo:topics><burst:publication><rdf:Description rdf:about="http://www.bibsonomy.org/bibtex/2202b97875a0ca06dba67da3f7febfc86/diego_ma"><owl:sameAs rdf:resource="http://www.bibsonomy.org/uri/bibtex/2202b97875a0ca06dba67da3f7febfc86/diego_ma"/><rdf:type rdf:resource="http://swrc.ontoware.org/ontology#InProceedings"/><owl:sameAs rdf:resource="http://www.alta.asn.au/events/altw2007/cdrom/index.html"/><swrc:date>Tue Jan 29 07:21:37 CET 2008</swrc:date><swrc:booktitle>Proc. ALTW 2007</swrc:booktitle><swrc:pages>57-65</swrc:pages><swrc:title>Named Entity Recognition in Question Answering of Speech Data</swrc:title><swrc:volume>5</swrc:volume><swrc:year>2007</swrc:year><swrc:keywords>AnswerFinder named_entities speech molla_publication </swrc:keywords><swrc:abstract>Question answering on speech transcripts (QAst) is a pilot track of the CLEF competition. In this paper we present our contribution to QAst, which is centred on a study of Named Entity (NE) recognition on speech transcripts, and how it impacts on the accuracy of the final question answering system. We have ported AFNER, the NE recogniser of the AnswerFinder question-answering project, to the set of answer types expected in the QAst track. AFNER uses a combination of regular expressions, lists of names (gazetteers) and machine learning to find NeWS in the data. The machine learning component was trained on a development set of the AMI corpus. In the process we identified various problems with scalability of the system and the existence of errors of the extracted annotation, which lead to relatively poor performance in general. 
Performance was yet comparable with state of the art, and the system was second (out of three participants) in one of the QAst subtasks.</swrc:abstract><swrc:author><rdf:Seq><rdf:_1><swrc:Person swrc:name="Diego Moll{\&#039;a}"/></rdf:_1><rdf:_2><swrc:Person swrc:name="Menno van Zaanen"/></rdf:_2><rdf:_3><swrc:Person swrc:name="Steve Cassidy"/></rdf:_3></rdf:Seq></swrc:author><swrc:editor><rdf:Seq><rdf:_1><swrc:Person swrc:name="Nathalie Colineau"/></rdf:_1><rdf:_2><swrc:Person swrc:name="Mark Dras"/></rdf:_2></rdf:Seq></swrc:editor></rdf:Description></burst:publication></item><item rdf:about="http://www.bibsonomy.org/bibtex/2753c74267baabe14fe6d420b78043998/diego_ma"><title>Named Entity Recognition using an HMM-based Chunk Tagger</title><link>http://www.bibsonomy.org/bibtex/2753c74267baabe14fe6d420b78043998/diego_ma</link><dc:creator>diego_ma</dc:creator><dc:date>2007-12-14T02:48:42+01:00</dc:date><dc:subject>named_entities machine_learning </dc:subject><content:encoded>&lt;span style=&#034;color:#555555;&#034;&gt;GuoDong &lt;a href=&#034;http://www.bibsonomy.org/author/Zhou&#034;&gt;Zhou&lt;/a&gt;  and Jian &lt;a href=&#034;http://www.bibsonomy.org/author/Su&#034;&gt;Su&lt;/a&gt;  &lt;/span&gt;&lt;em&gt;Proc. 40th Annual Meeting of the Association for Computational Linguistics ACL 2002, &lt;/em&gt;(&lt;em&gt;2002&lt;/em&gt;)</content:encoded><taxo:topics><rdf:Bag><rdf:li rdf:resource="http://www.bibsonomy.org/tag/named_entities"/><rdf:li rdf:resource="http://www.bibsonomy.org/tag/machine_learning"/></rdf:Bag></taxo:topics><burst:publication><rdf:Description rdf:about="http://www.bibsonomy.org/bibtex/2753c74267baabe14fe6d420b78043998/diego_ma"><owl:sameAs rdf:resource="http://www.bibsonomy.org/uri/bibtex/2753c74267baabe14fe6d420b78043998/diego_ma"/><rdf:type rdf:resource="http://swrc.ontoware.org/ontology#InProceedings"/><swrc:date>Fri Dec 14 02:48:42 CET 2007</swrc:date><swrc:booktitle>Proc. 
40th Annual Meeting of the Association for Computational Linguistics (ACL 2002)</swrc:booktitle><swrc:title>Named Entity Recognition using an {HMM}-based Chunk Tagger</swrc:title><swrc:year>2002</swrc:year><swrc:keywords>named_entities machine_learning </swrc:keywords><swrc:abstract>This paper proposes a Hidden Markov Model (HMM) and an HMM-based chunk tagger, from which a named entity (NE) recognition (NER) system is built to recognize and classify names, times and numerical quantities. Through the HMM, our system is able to apply and integrate four types of internal and external evidences: 1) simple deterministic internal feature of the words, such as capitalization and digitalization; 2) internal semantic feature of important triggers; 3) internal gazetteer feature; 4) external macro context feature. In this way, the NER problem can be resolved effectively. Evaluation of our system on MUC-6 and MUC-7 English NE tasks achieves F-measures of 96.6% and 94.1% respectively. It shows that the performance is significantly better than reported by any other machine-learning system. 
Moreover, the performance is even consistently better than those based on handcrafted rules.</swrc:abstract><swrc:author><rdf:Seq><rdf:_1><swrc:Person swrc:name="GuoDong Zhou"/></rdf:_1><rdf:_2><swrc:Person swrc:name="Jian Su"/></rdf:_2></rdf:Seq></swrc:author></rdf:Description></burst:publication></item><item rdf:about="http://www.bibsonomy.org/bibtex/22b0790ca9fa1c810363f5df441fc1254/diego_ma"><title>Named Entity Recognition from Spontaneous Open-Domain Speech</title><link>http://www.bibsonomy.org/bibtex/22b0790ca9fa1c810363f5df441fc1254/diego_ma</link><dc:creator>diego_ma</dc:creator><dc:date>2007-12-14T02:47:08+01:00</dc:date><dc:subject>named_entities speech </dc:subject><content:encoded>&lt;span style=&#034;color:#555555;&#034;&gt;Mihai &lt;a href=&#034;http://www.bibsonomy.org/author/Surdeanu&#034;&gt;Surdeanu&lt;/a&gt;  and Jordi &lt;a href=&#034;http://www.bibsonomy.org/author/Turmo&#034;&gt;Turmo&lt;/a&gt;  and Eli &lt;a href=&#034;http://www.bibsonomy.org/author/Comelles&#034;&gt;Comelles&lt;/a&gt;  &lt;/span&gt;&lt;em&gt;Proceedings Interspeech-05, &lt;/em&gt;&lt;em&gt;Lisbon, &lt;/em&gt;(&lt;em&gt;2005&lt;/em&gt;)</content:encoded><taxo:topics><rdf:Bag><rdf:li rdf:resource="http://www.bibsonomy.org/tag/named_entities"/><rdf:li rdf:resource="http://www.bibsonomy.org/tag/speech"/></rdf:Bag></taxo:topics><burst:publication><rdf:Description rdf:about="http://www.bibsonomy.org/bibtex/22b0790ca9fa1c810363f5df441fc1254/diego_ma"><owl:sameAs rdf:resource="http://www.bibsonomy.org/uri/bibtex/22b0790ca9fa1c810363f5df441fc1254/diego_ma"/><rdf:type rdf:resource="http://swrc.ontoware.org/ontology#InProceedings"/><owl:sameAs rdf:resource="http://www.lsi.upc.edu/~comelles/"/><swrc:date>Fri Dec 14 02:47:08 CET 2007</swrc:date><swrc:address>Lisbon</swrc:address><swrc:booktitle>Proceedings Interspeech-05</swrc:booktitle><swrc:title>Named Entity Recognition from Spontaneous Open-Domain Speech</swrc:title><swrc:year>2005</swrc:year><swrc:keywords>named_entities speech 
</swrc:keywords><swrc:abstract>This paper presents an analysis of named entity recognition and classification in spontaneous speech transcripts. We annotated a significant fraction of the Switchboard corpus with six named entity classes and investigated a battery of machine learning models that include lexical, syntactic, and semantic attributes. The best recognition and classification model obtains promising results, approaching within 5% a system evaluated on clean textual data.</swrc:abstract><swrc:author><rdf:Seq><rdf:_1><swrc:Person swrc:name="Mihai Surdeanu"/></rdf:_1><rdf:_2><swrc:Person swrc:name="Jordi Turmo"/></rdf:_2><rdf:_3><swrc:Person swrc:name="Eli Comelles"/></rdf:_3></rdf:Seq></swrc:author></rdf:Description></burst:publication></item><item rdf:about="http://www.bibsonomy.org/bibtex/28a56675983754175b10280cc944d8e92/diego_ma"><title>Reducing Question Answering Input Data Using Named Entity Recognition</title><link>http://www.bibsonomy.org/bibtex/28a56675983754175b10280cc944d8e92/diego_ma</link><dc:creator>diego_ma</dc:creator><dc:date>2007-12-14T02:44:32+01:00</dc:date><dc:subject>question_answering named_entities </dc:subject><content:encoded>&lt;span style=&#034;color:#555555;&#034;&gt;Elisa &lt;a href=&#034;http://www.bibsonomy.org/author/Noguera&#034;&gt;Noguera&lt;/a&gt;  and Antonio &lt;a href=&#034;http://www.bibsonomy.org/author/Toral&#034;&gt;Toral&lt;/a&gt;  and Fernando &lt;a href=&#034;http://www.bibsonomy.org/author/Llopis&#034;&gt;Llopis&lt;/a&gt;  and Rafael &lt;a href=&#034;http://www.bibsonomy.org/author/Mu{\~n}oz&#034;&gt;Mu&amp;#241;oz&lt;/a&gt;  &lt;/span&gt;&lt;em&gt;Proceedings of the 8th International Conference on Text, Speech \&amp;amp; Dialogue, &lt;/em&gt;&lt;em&gt;page 428-434. 
&lt;/em&gt;(&lt;em&gt;2005&lt;/em&gt;)</content:encoded><taxo:topics><rdf:Bag><rdf:li rdf:resource="http://www.bibsonomy.org/tag/question_answering"/><rdf:li rdf:resource="http://www.bibsonomy.org/tag/named_entities"/></rdf:Bag></taxo:topics><burst:publication><rdf:Description rdf:about="http://www.bibsonomy.org/bibtex/28a56675983754175b10280cc944d8e92/diego_ma"><owl:sameAs rdf:resource="http://www.bibsonomy.org/uri/bibtex/28a56675983754175b10280cc944d8e92/diego_ma"/><rdf:type rdf:resource="http://swrc.ontoware.org/ontology#InProceedings"/><owl:sameAs rdf:resource="http://dx.doi.org/10.1007/11551874_55"/><swrc:date>Fri Dec 14 02:44:32 CET 2007</swrc:date><swrc:booktitle>Proceedings of the 8th International Conference on Text, Speech \&amp; Dialogue</swrc:booktitle><swrc:pages>428-434</swrc:pages><swrc:title>Reducing Question Answering Input Data Using Named Entity Recognition</swrc:title><swrc:year>2005</swrc:year><swrc:keywords>question_answering named_entities </swrc:keywords><swrc:abstract>In a previous paper we proved that Named Entity Recognition plays an important role to improve Question Answering by both increasing the quality of the data and by reducing its quantity. Here we present a more in-depth discussion, studying several ways in which NER can be applied in order to produce a maximum data reduction. 
We achieve a 60% reduction without significant data loss and a 92.5% with a reasonable implication in data quality.</swrc:abstract><swrc:author><rdf:Seq><rdf:_1><swrc:Person swrc:name="Elisa Noguera"/></rdf:_1><rdf:_2><swrc:Person swrc:name="Antonio Toral"/></rdf:_2><rdf:_3><swrc:Person swrc:name="Fernando Llopis"/></rdf:_3><rdf:_4><swrc:Person swrc:name="Rafael Mu{\~n}oz"/></rdf:_4></rdf:Seq></swrc:author></rdf:Description></burst:publication></item><item rdf:about="http://www.bibsonomy.org/bibtex/222f9837dac4a70418136ddfff25b241d/diego_ma"><title>Orthographic Case Restoration Using Supervised Learning without Manual Annotation</title><link>http://www.bibsonomy.org/bibtex/222f9837dac4a70418136ddfff25b241d/diego_ma</link><dc:creator>diego_ma</dc:creator><dc:date>2007-12-14T02:44:29+01:00</dc:date><dc:subject>named_entities question_answering speech </dc:subject><content:encoded>&lt;span style=&#034;color:#555555;&#034;&gt;Cheng &lt;a href=&#034;http://www.bibsonomy.org/author/Niu&#034;&gt;Niu&lt;/a&gt;  and Wei &lt;a href=&#034;http://www.bibsonomy.org/author/Li&#034;&gt;Li&lt;/a&gt;  and  &lt;a href=&#034;http://www.bibsonomy.org/author/Jihong&#034;&gt;Jihong&lt;/a&gt;  and Rohini &lt;a href=&#034;http://www.bibsonomy.org/author/Shrihari&#034;&gt;Shrihari&lt;/a&gt;  &lt;/span&gt;&lt;em&gt;International Journal on Artificial Intelligence Tools&lt;/em&gt;&lt;em&gt;13(1):141-156&lt;/em&gt;(&lt;em&gt;2004&lt;/em&gt;)</content:encoded><taxo:topics><rdf:Bag><rdf:li rdf:resource="http://www.bibsonomy.org/tag/named_entities"/><rdf:li rdf:resource="http://www.bibsonomy.org/tag/question_answering"/><rdf:li rdf:resource="http://www.bibsonomy.org/tag/speech"/></rdf:Bag></taxo:topics><burst:publication><rdf:Description rdf:about="http://www.bibsonomy.org/bibtex/222f9837dac4a70418136ddfff25b241d/diego_ma"><owl:sameAs rdf:resource="http://www.bibsonomy.org/uri/bibtex/222f9837dac4a70418136ddfff25b241d/diego_ma"/><rdf:type 
rdf:resource="http://swrc.ontoware.org/ontology#Article"/><owl:sameAs rdf:resource="http://homepage.mac.com/liwei999/WeiLi/Publications.html"/><swrc:date>Fri Dec 14 02:44:29 CET 2007</swrc:date><swrc:journal>International Journal on Artificial Intelligence Tools</swrc:journal><swrc:number>1</swrc:number><swrc:pages>141-156</swrc:pages><swrc:title>Orthographic Case Restoration Using Supervised Learning without Manual Annotation</swrc:title><swrc:volume>13</swrc:volume><swrc:year>2004</swrc:year><swrc:keywords>named_entities question_answering speech </swrc:keywords><swrc:abstract>One challenge in text processing is the treatment of case insensitive documents such as speech recognition results. The traditional approach is to re-train a language model excluding case-related features. This paper presents an alternative two-step approach whereby a preprocessing module (Step 1) is designed to restore case-sensitive form which is subsequently processed by the original system (Step 2). Step 1 is mainly implemented as a Hidden Markov Model trained on a large raw corpus of case sensitive documents. 
It is demonstrated that this approach (i) outperforms the feature exclusion approach for named entity tagging, (ii) leads to limited degradation for parsing, relationship extraction and case insensitive question answering, (iii) reduces system complexity, and (iv) has wide applicability: the restored text can be used in both statistical model and rule-based systems.</swrc:abstract><swrc:author><rdf:Seq><rdf:_1><swrc:Person swrc:name="Cheng Niu"/></rdf:_1><rdf:_2><swrc:Person swrc:name="Wei Li"/></rdf:_2><rdf:_3><swrc:Person swrc:name=" Jihong"/></rdf:_3><rdf:_4><swrc:Person swrc:name="Rohini Shrihari"/></rdf:_4></rdf:Seq></swrc:author></rdf:Description></burst:publication></item><item rdf:about="http://www.bibsonomy.org/bibtex/2cf5005cce6fad851c7227451f85c4fcb/diego_ma"><title>Named Entity recognition without gazetteers</title><link>http://www.bibsonomy.org/bibtex/2cf5005cce6fad851c7227451f85c4fcb/diego_ma</link><dc:creator>diego_ma</dc:creator><dc:date>2007-12-14T02:43:23+01:00</dc:date><dc:subject>named_entities </dc:subject><content:encoded>&lt;span style=&#034;color:#555555;&#034;&gt;Andrei &lt;a href=&#034;http://www.bibsonomy.org/author/Mikheev&#034;&gt;Mikheev&lt;/a&gt;  and Marc &lt;a href=&#034;http://www.bibsonomy.org/author/Moens&#034;&gt;Moens&lt;/a&gt;  and Claire &lt;a href=&#034;http://www.bibsonomy.org/author/Grover&#034;&gt;Grover&lt;/a&gt;  &lt;/span&gt;&lt;em&gt;Proceedings of the Association for Computational Linguistics, &lt;/em&gt;&lt;em&gt;page 1--8. 
&lt;/em&gt;&lt;em&gt;Association for Computational Linguistics, &lt;/em&gt;(&lt;em&gt;1999&lt;/em&gt;)</content:encoded><taxo:topics><rdf:Bag><rdf:li rdf:resource="http://www.bibsonomy.org/tag/named_entities"/></rdf:Bag></taxo:topics><burst:publication><rdf:Description rdf:about="http://www.bibsonomy.org/bibtex/2cf5005cce6fad851c7227451f85c4fcb/diego_ma"><owl:sameAs rdf:resource="http://www.bibsonomy.org/uri/bibtex/2cf5005cce6fad851c7227451f85c4fcb/diego_ma"/><rdf:type rdf:resource="http://swrc.ontoware.org/ontology#InProceedings"/><swrc:date>Fri Dec 14 02:43:23 CET 2007</swrc:date><swrc:booktitle>Proceedings of the Association for Computational Linguistics</swrc:booktitle><swrc:pages>1--8</swrc:pages><swrc:publisher><swrc:Organization swrc:name="Association for Computational Linguistics"/></swrc:publisher><swrc:title>Named Entity recognition without gazetteers</swrc:title><swrc:year>1999</swrc:year><swrc:keywords>named_entities </swrc:keywords><swrc:author><rdf:Seq><rdf:_1><swrc:Person swrc:name="Andrei Mikheev"/></rdf:_1><rdf:_2><swrc:Person swrc:name="Marc Moens"/></rdf:_2><rdf:_3><swrc:Person swrc:name="Claire Grover"/></rdf:_3></rdf:Seq></swrc:author></rdf:Description></burst:publication></item><item rdf:about="http://www.bibsonomy.org/bibtex/2f9d2c45fe747b42f22f5da88cf71fd41/diego_ma"><title>Two Applications of Information Extraction to Biological Science Journal Articles: Enzyme Interactions and Protein Structures</title><link>http://www.bibsonomy.org/bibtex/2f9d2c45fe747b42f22f5da88cf71fd41/diego_ma</link><dc:creator>diego_ma</dc:creator><dc:date>2007-12-14T02:40:53+01:00</dc:date><dc:subject>inf_extraction named_entities </dc:subject><content:encoded>&lt;span style=&#034;color:#555555;&#034;&gt;Kevin &lt;a href=&#034;http://www.bibsonomy.org/author/Humphreys&#034;&gt;Humphreys&lt;/a&gt;  and George &lt;a href=&#034;http://www.bibsonomy.org/author/Demetriou&#034;&gt;Demetriou&lt;/a&gt;  and Robert &lt;a 
href=&#034;http://www.bibsonomy.org/author/Gaizauskas&#034;&gt;Gaizauskas&lt;/a&gt;  &lt;/span&gt;&lt;em&gt;Proceedings of the Pacific Symposium on Biocomputing&#039; 00 PSB&#039;00, &lt;/em&gt;&lt;em&gt;page 502-513. &lt;/em&gt;&lt;em&gt;Honolulu, Hawaii, &lt;/em&gt;(&lt;em&gt;2000&lt;/em&gt;)</content:encoded><taxo:topics><rdf:Bag><rdf:li rdf:resource="http://www.bibsonomy.org/tag/inf_extraction"/><rdf:li rdf:resource="http://www.bibsonomy.org/tag/named_entities"/></rdf:Bag></taxo:topics><burst:publication><rdf:Description rdf:about="http://www.bibsonomy.org/bibtex/2f9d2c45fe747b42f22f5da88cf71fd41/diego_ma"><owl:sameAs rdf:resource="http://www.bibsonomy.org/uri/bibtex/2f9d2c45fe747b42f22f5da88cf71fd41/diego_ma"/><rdf:type rdf:resource="http://swrc.ontoware.org/ontology#InProceedings"/><owl:sameAs rdf:resource="http://www.bionlp.org/psb2000/humphreys.pdf"/><swrc:date>Fri Dec 14 02:40:53 CET 2007</swrc:date><swrc:booktitle>Proceedings of the Pacific Symposium on Biocomputing&#039; 00 (PSB&#039;00)</swrc:booktitle><swrc:organization><swrc:Organization swrc:name="Honolulu, Hawaii"/></swrc:organization><swrc:pages>502-513</swrc:pages><swrc:title>Two Applications of Information Extraction to Biological Science Journal Articles: Enzyme Interactions and Protein Structures</swrc:title><swrc:year>2000</swrc:year><swrc:keywords>inf_extraction named_entities </swrc:keywords><swrc:abstract>Information extraction technology, as defined and developed through the U.S. DARPA Message Understanding Conferences (MUCs), has proved successful at extracting information primarily from newswire texts and primarily in domains concerned with human activity. In this paper we consider the application of this technology to the extraction of information from scientific journal papers in the area of molecular biology. 
In particular, we describe how an information extraction system designed to participate in the MUC exercises has been modified for two bioinformatics applications: EMPathIE, concerned with enzyme and metabolic pathways; and PASTA, concerned with protein structure. Progress to date provides convincing grounds for believing that IE techniques will deliver novel and effective ways for scientists to make use of the core literature which defines their disciplines.</swrc:abstract><swrc:author><rdf:Seq><rdf:_1><swrc:Person swrc:name="Kevin Humphreys"/></rdf:_1><rdf:_2><swrc:Person swrc:name="George Demetriou"/></rdf:_2><rdf:_3><swrc:Person swrc:name="Robert Gaizauskas"/></rdf:_3></rdf:Seq></swrc:author></rdf:Description></burst:publication></item><item rdf:about="http://www.bibsonomy.org/bibtex/2fe587667402ffc32b6d0d635db627a7d/diego_ma"><title>Learning to Recognize Names Across Languages</title><link>http://www.bibsonomy.org/bibtex/2fe587667402ffc32b6d0d635db627a7d/diego_ma</link><dc:creator>diego_ma</dc:creator><dc:date>2007-12-14T02:39:12+01:00</dc:date><dc:subject>named_entities </dc:subject><content:encoded>&lt;span style=&#034;color:#555555;&#034;&gt;Anthony F. &lt;a href=&#034;http://www.bibsonomy.org/author/Gallippi&#034;&gt;Gallippi&lt;/a&gt;  &lt;/span&gt;&lt;em&gt;Proc. COLING 1996, &lt;/em&gt;&lt;em&gt;page 424-429. &lt;/em&gt;(&lt;em&gt;1996&lt;/em&gt;)</content:encoded><taxo:topics><rdf:Bag><rdf:li rdf:resource="http://www.bibsonomy.org/tag/named_entities"/></rdf:Bag></taxo:topics><burst:publication><rdf:Description rdf:about="http://www.bibsonomy.org/bibtex/2fe587667402ffc32b6d0d635db627a7d/diego_ma"><owl:sameAs rdf:resource="http://www.bibsonomy.org/uri/bibtex/2fe587667402ffc32b6d0d635db627a7d/diego_ma"/><rdf:type rdf:resource="http://swrc.ontoware.org/ontology#InProceedings"/><owl:sameAs rdf:resource="http://acl.ldc.upenn.edu/C/C96/C96-1072.pdf"/><swrc:date>Fri Dec 14 02:39:12 CET 2007</swrc:date><swrc:booktitle>Proc. 
COLING 1996</swrc:booktitle><swrc:pages>424-429</swrc:pages><swrc:title>Learning to Recognize Names Across Languages</swrc:title><swrc:year>1996</swrc:year><swrc:keywords>named_entities </swrc:keywords><swrc:abstract>The development of natural language proccessing (NLP) systems that perform machine translation (MT) and information retrieval (IR) has highlighted the need for the automatic recognition of proper names. While various name recognizers have been developed, they suffer from being too limited; some only recognize one name class, and all are language specific. This work develops an approach to multilingual name recognition that allows a system optimized for one language to be ported to another with little additional effort and resources. An initial core set of linguistic features, useful for name recognition in most languages, is identified. When porting to a new language, these features need to be converted (partly by hand, partly by on-line lists), after which point machine learning (ML) techniques build decision trees that map features to name classes. A system initially optimized for English has been successfully ported to Spanish and Japanese. Only a few days of human effort for each new language results in performance levels comparable to that of the best current English systems.</swrc:abstract><swrc:author><rdf:Seq><rdf:_1><swrc:Person swrc:name="Anthony F. 
Gallippi"/></rdf:_1></rdf:Seq></swrc:author></rdf:Description></burst:publication></item><item rdf:about="http://www.bibsonomy.org/bibtex/2a97c64b39d5d713400082f785d734d5b/diego_ma"><title>Fine Grained Classification of Named Entities</title><link>http://www.bibsonomy.org/bibtex/2a97c64b39d5d713400082f785d734d5b/diego_ma</link><dc:creator>diego_ma</dc:creator><dc:date>2007-12-14T02:38:51+01:00</dc:date><dc:subject>machine_learning named_entities </dc:subject><content:encoded>&lt;span style=&#034;color:#555555;&#034;&gt;Michael &lt;a href=&#034;http://www.bibsonomy.org/author/Fleischman&#034;&gt;Fleischman&lt;/a&gt;  and Eduard &lt;a href=&#034;http://www.bibsonomy.org/author/Hovy&#034;&gt;Hovy&lt;/a&gt;  &lt;/span&gt;&lt;em&gt;Proceedings of Coling 2002, &lt;/em&gt;&lt;em&gt;Taipei, Taiwan, &lt;/em&gt;(&lt;em&gt;2002&lt;/em&gt;)</content:encoded><taxo:topics><rdf:Bag><rdf:li rdf:resource="http://www.bibsonomy.org/tag/machine_learning"/><rdf:li rdf:resource="http://www.bibsonomy.org/tag/named_entities"/></rdf:Bag></taxo:topics><burst:publication><rdf:Description rdf:about="http://www.bibsonomy.org/bibtex/2a97c64b39d5d713400082f785d734d5b/diego_ma"><owl:sameAs rdf:resource="http://www.bibsonomy.org/uri/bibtex/2a97c64b39d5d713400082f785d734d5b/diego_ma"/><rdf:type rdf:resource="http://swrc.ontoware.org/ontology#InProceedings"/><owl:sameAs rdf:resource="http://www.mit.edu/~mbf/COLING_02.pdf"/><swrc:date>Fri Dec 14 02:38:51 CET 2007</swrc:date><swrc:address>Taipei, Taiwan</swrc:address><swrc:booktitle>Proceedings of Coling 2002</swrc:booktitle><swrc:title>Fine Grained Classification of Named Entities</swrc:title><swrc:year>2002</swrc:year><swrc:keywords>machine_learning named_entities </swrc:keywords><swrc:abstract>While Named Entity extraction is useful in many natural language applications, the coarse categories that most NE extractors work with prove insufficient for complex applications such as Question Answering and Ontology generation. 
We examine one coarse category of named entities, persons, and describe a method for automatically classifying person instances into eight finer-grained subcategories. We present a supervised learning method that considers the local context surrounding the entity as well as more global semantic information derived from topic signatures and WordNet. We reinforce this method with an algorithm that takes advantage of the presence of entities in multiple contexts.</swrc:abstract><swrc:author><rdf:Seq><rdf:_1><swrc:Person swrc:name="Michael Fleischman"/></rdf:_1><rdf:_2><swrc:Person swrc:name="Eduard Hovy"/></rdf:_2></rdf:Seq></swrc:author></rdf:Description></burst:publication></item><item rdf:about="http://www.bibsonomy.org/bibtex/2d4f233fd44172dfcf0d98dd03bc781e1/diego_ma"><title>Named Entity Recognition: A Maximum Entropy Approach Using Global Information</title><link>http://www.bibsonomy.org/bibtex/2d4f233fd44172dfcf0d98dd03bc781e1/diego_ma</link><dc:creator>diego_ma</dc:creator><dc:date>2007-12-14T02:37:20+01:00</dc:date><dc:subject>named_entities machine_learning </dc:subject><content:encoded>&lt;span style=&#034;color:#555555;&#034;&gt;Haoi Leong &lt;a href=&#034;http://www.bibsonomy.org/author/Chieu&#034;&gt;Chieu&lt;/a&gt;  and Hwee Tou &lt;a href=&#034;http://www.bibsonomy.org/author/Ng&#034;&gt;Ng&lt;/a&gt;  &lt;/span&gt;&lt;em&gt;Proceedings COLING 2002, &lt;/em&gt;(&lt;em&gt;2002&lt;/em&gt;)</content:encoded><taxo:topics><rdf:Bag><rdf:li rdf:resource="http://www.bibsonomy.org/tag/named_entities"/><rdf:li rdf:resource="http://www.bibsonomy.org/tag/machine_learning"/></rdf:Bag></taxo:topics><burst:publication><rdf:Description rdf:about="http://www.bibsonomy.org/bibtex/2d4f233fd44172dfcf0d98dd03bc781e1/diego_ma"><owl:sameAs rdf:resource="http://www.bibsonomy.org/uri/bibtex/2d4f233fd44172dfcf0d98dd03bc781e1/diego_ma"/><rdf:type rdf:resource="http://swrc.ontoware.org/ontology#InProceedings"/><swrc:date>Fri Dec 14 02:37:20 CET 
2007</swrc:date><swrc:booktitle>Proceedings COLING 2002</swrc:booktitle><swrc:title>Named Entity Recognition: A Maximum Entropy Approach Using Global Information</swrc:title><swrc:year>2002</swrc:year><swrc:keywords>named_entities machine_learning </swrc:keywords><swrc:abstract>This paper presents a maximum entropy-based named entity recognizer (NER). It differs from previous machine learning-based NERs in that it uses information from the whole document to classify each word, with just one classifier. Previous work that involves the gathering of information from the whole document often uses a secondary classifier, which corrects the mistakes of a primary sentence-based classifier. In this paper, we show that the maximum entropy framework is able to make use of global information directly, and achieves performance that is comparable to the best previous machine learning-based NERs on MUC-6 and MUC-7 test data.</swrc:abstract><swrc:author><rdf:Seq><rdf:_1><swrc:Person swrc:name="Haoi Leong Chieu"/></rdf:_1><rdf:_2><swrc:Person swrc:name="Hwee Tou Ng"/></rdf:_2></rdf:Seq></swrc:author></rdf:Description></burst:publication></item><item rdf:about="http://www.bibsonomy.org/bibtex/2ce8cc5153963e37fc34d9b71c2bbcc93/diego_ma"><title>The Role of Named Entities in Text Classification</title><link>http://www.bibsonomy.org/bibtex/2ce8cc5153963e37fc34d9b71c2bbcc93/diego_ma</link><dc:creator>diego_ma</dc:creator><dc:date>2007-12-14T02:35:36+01:00</dc:date><dc:subject>named_entities text_categorisation </dc:subject><content:encoded>&lt;span style=&#034;color:#555555;&#034;&gt;Quintin &lt;a href=&#034;http://www.bibsonomy.org/author/Armour&#034;&gt;Armour&lt;/a&gt;  and Nathalie &lt;a href=&#034;http://www.bibsonomy.org/author/Japkowicz&#034;&gt;Japkowicz&lt;/a&gt;  and Stan &lt;a href=&#034;http://www.bibsonomy.org/author/Matwin&#034;&gt;Matwin&lt;/a&gt;  &lt;/span&gt;&lt;em&gt;Proceedings CLiNE 2005, &lt;/em&gt;&lt;em&gt;Gatineau, Canada, 
&lt;/em&gt;(&lt;em&gt;2005&lt;/em&gt;)</content:encoded><taxo:topics><rdf:Bag><rdf:li rdf:resource="http://www.bibsonomy.org/tag/named_entities"/><rdf:li rdf:resource="http://www.bibsonomy.org/tag/text_categorisation"/></rdf:Bag></taxo:topics><burst:publication><rdf:Description rdf:about="http://www.bibsonomy.org/bibtex/2ce8cc5153963e37fc34d9b71c2bbcc93/diego_ma"><owl:sameAs rdf:resource="http://www.bibsonomy.org/uri/bibtex/2ce8cc5153963e37fc34d9b71c2bbcc93/diego_ma"/><rdf:type rdf:resource="http://swrc.ontoware.org/ontology#InProceedings"/><owl:sameAs rdf:resource="http://www.crtl.ca/cline05/cline05_papers/ArmourJapkowiczMatwin.pdf"/><swrc:date>Fri Dec 14 02:35:36 CET 2007</swrc:date><swrc:address>Gatineau, Canada</swrc:address><swrc:booktitle>Proceedings CLiNE 2005</swrc:booktitle><swrc:title>The Role of Named Entities in Text Classification</swrc:title><swrc:year>2005</swrc:year><swrc:keywords>named_entities text_categorisation </swrc:keywords><swrc:abstract>Named entities are typically associated with names of people, places and organizations and constitute a group of textual elements present in almost any type of document. The general techniques used to extract them and their variable-length property also makes them an attractive type of attribute to study in text classification. In this paper, several data sets are characterized as being either dependent or independent of named entities with a Naive Bayes based ranking technique. Using this characterization, results are presented which find named entities to be in fact useful in classification tasks, and that accuracy can be improved by considering them as a special type of attribute. 
Namely, the inclusion of regular terms, named entity representation and the frequency with which a classifier is retrained all have an impact on the classification of documents where named entities are important.</swrc:abstract><swrc:author><rdf:Seq><rdf:_1><swrc:Person swrc:name="Quintin Armour"/></rdf:_1><rdf:_2><swrc:Person swrc:name="Nathalie Japkowicz"/></rdf:_2><rdf:_3><swrc:Person swrc:name="Stan Matwin"/></rdf:_3></rdf:Seq></swrc:author></rdf:Description></burst:publication></item></rdf:RDF>