<?xml version="1.0" encoding="UTF-8"?>
<rdf:RDF xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" xmlns:burst="http://xmlns.com/burst/0.1/" xmlns:xsd="http://www.w3.org/2001/XMLSchema#" xmlns="http://purl.org/rss/1.0/" xmlns:admin="http://webns.net/mvcb/" xmlns:rdfs="http://www.w3.org/2000/01/rdf-schema#" xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:owl="http://www.w3.org/2002/07/owl#" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:syn="http://purl.org/rss/1.0/modules/syndication/" xmlns:swrc="http://swrc.ontoware.org/ontology#" xmlns:cc="http://web.resource.org/cc/"><channel rdf:about="http://www.bibsonomy.org/user/diego_ma/speech"><title>BibSonomy publications for /user/diego_ma/speech</title><link>http://www.bibsonomy.org/burst/user/diego_ma/speech</link><description>BibSonomy RSS feed for /user/diego_ma/speech</description><dc:date>2010-03-21T23:12:47+01:00</dc:date><items><rdf:Seq><rdf:li rdf:resource="http://www.bibsonomy.org/bibtex/26257e754b51b741ad15bb64e6243cddd/diego_ma"/><rdf:li rdf:resource="http://www.bibsonomy.org/bibtex/2202b97875a0ca06dba67da3f7febfc86/diego_ma"/><rdf:li rdf:resource="http://www.bibsonomy.org/bibtex/242ac1cbf4626a8dea0a229f643aafed4/diego_ma"/><rdf:li rdf:resource="http://www.bibsonomy.org/bibtex/22b0790ca9fa1c810363f5df441fc1254/diego_ma"/><rdf:li rdf:resource="http://www.bibsonomy.org/bibtex/2367f6005012e81d06a91489496bf0263/diego_ma"/><rdf:li rdf:resource="http://www.bibsonomy.org/bibtex/24ed799d4431231eb901d366520b7b231/diego_ma"/><rdf:li rdf:resource="http://www.bibsonomy.org/bibtex/222f9837dac4a70418136ddfff25b241d/diego_ma"/><rdf:li rdf:resource="http://www.bibsonomy.org/bibtex/2853da4a16ae749b8256e19ac458685c6/diego_ma"/><rdf:li rdf:resource="http://www.bibsonomy.org/bibtex/29d0c0e63dfcb696cf90b0981309a0b69/diego_ma"/><rdf:li rdf:resource="http://www.bibsonomy.org/bibtex/27f5c7977cedc4baf876d55e19e9e99b1/diego_ma"/><rdf:li 
rdf:resource="http://www.bibsonomy.org/bibtex/21f732440eb7a503828db1c6ae4b8eecf/diego_ma"/><rdf:li rdf:resource="http://www.bibsonomy.org/bibtex/290f103cb00fcd31d7ec0268544a895a1/diego_ma"/><rdf:li rdf:resource="http://www.bibsonomy.org/bibtex/29bb0d14d65d2b1982f99d20c0eda83bb/diego_ma"/><rdf:li rdf:resource="http://www.bibsonomy.org/bibtex/2a43fbdd1cd0f2de278eda8fbdb4886ee/diego_ma"/><rdf:li rdf:resource="http://www.bibsonomy.org/bibtex/241937fd5a5b3382411f8f8292800cc20/diego_ma"/><rdf:li rdf:resource="http://www.bibsonomy.org/bibtex/25e436b40d3816733a62c66429217820f/diego_ma"/><rdf:li rdf:resource="http://www.bibsonomy.org/bibtex/2b6e21bef2c26443ad9baab6bd97fac24/diego_ma"/><rdf:li rdf:resource="http://www.bibsonomy.org/bibtex/2a1cda268226866da44d71e407d59cd09/diego_ma"/></rdf:Seq></items></channel><item rdf:about="http://www.bibsonomy.org/bibtex/26257e754b51b741ad15bb64e6243cddd/diego_ma"><title>Overview of QAST 2007</title><link>http://www.bibsonomy.org/bibtex/26257e754b51b741ad15bb64e6243cddd/diego_ma</link><dc:creator>diego_ma</dc:creator><dc:date>2009-03-27T09:05:20+01:00</dc:date><dc:subject>speech question_answering </dc:subject><content:encoded>&lt;span style=&#034;color:#555555;&#034;&gt;Turmo, &lt;a href=&#034;http://www.bibsonomy.org/author/Jordi&#034;&gt;Jordi&lt;/a&gt;  and Comas, Pere &lt;a href=&#034;http://www.bibsonomy.org/author/R.&#034;&gt;R.&lt;/a&gt;  and Ayache, &lt;a href=&#034;http://www.bibsonomy.org/author/Christelle&#034;&gt;Christelle&lt;/a&gt;  and Mostefa, &lt;a href=&#034;http://www.bibsonomy.org/author/Djamel&#034;&gt;Djamel&lt;/a&gt;  and Rosset, &lt;a href=&#034;http://www.bibsonomy.org/author/Sophie&#034;&gt;Sophie&lt;/a&gt;  and Lamel, &lt;a href=&#034;http://www.bibsonomy.org/author/Lori&#034;&gt;Lori&lt;/a&gt;  &lt;/span&gt;&lt;em&gt;Advances in Multilingual and Multimodal Information Retrieval, &lt;/em&gt;&lt;em&gt;volume 5152/2008 of Lecture Notes in Computer Science, &lt;/em&gt;&lt;em&gt;page 249-256. 
&lt;/em&gt;&lt;em&gt;Berlin / Heidelberg, &lt;/em&gt;&lt;em&gt;Springer, &lt;/em&gt;(&lt;em&gt;2007&lt;/em&gt;)</content:encoded><taxo:topics><rdf:Bag><rdf:li rdf:resource="http://www.bibsonomy.org/tag/speech"/><rdf:li rdf:resource="http://www.bibsonomy.org/tag/question_answering"/></rdf:Bag></taxo:topics><burst:publication><rdf:Description rdf:about="http://www.bibsonomy.org/bibtex/26257e754b51b741ad15bb64e6243cddd/diego_ma"><owl:sameAs rdf:resource="http://www.bibsonomy.org/uri/bibtex/26257e754b51b741ad15bb64e6243cddd/diego_ma"/><rdf:type rdf:resource="http://swrc.ontoware.org/ontology#InProceedings"/><owl:sameAs rdf:resource="http://www.springerlink.com/content/d511437177k776q0/"/><swrc:date>Fri Mar 27 09:05:20 CET 2009</swrc:date><swrc:address>Berlin / Heidelberg</swrc:address><swrc:booktitle>Advances in Multilingual and Multimodal Information Retrieval</swrc:booktitle><swrc:pages>249-256</swrc:pages><swrc:publisher><swrc:Organization swrc:name="Springer"/></swrc:publisher><swrc:series>Lecture Notes in Computer Science</swrc:series><swrc:title>Overview of {QAST 2007}</swrc:title><swrc:volume>5152/2008</swrc:volume><swrc:year>2007</swrc:year><swrc:keywords>speech question_answering </swrc:keywords><swrc:abstract>This paper describes QAST, a pilot track of CLEF 2007 aimed at evaluating the task of Question Answering in Speech Transcripts. The paper summarizes the evaluation framework, the systems that participated and the results achieved. These results have shown that question answering technology can be useful to deal with spontaneous speech transcripts, so for manually transcribed speech as for automatically recognized speech. 
The loss in accuracy from dealing with manual transcripts to dealing with automatic ones implies that there is room for future research in this area.</swrc:abstract><swrc:hasExtraField><swrc:Field swrc:value="Web (March 2009)" swrc:key="library"/></swrc:hasExtraField><swrc:hasExtraField><swrc:Field swrc:value="10.1007/978-3-540-85760-0" swrc:key="doi"/></swrc:hasExtraField><swrc:author><rdf:Seq><rdf:_1><swrc:Person swrc:name="Turmo, Jordi"/></rdf:_1><rdf:_2><swrc:Person swrc:name="Comas, Pere R."/></rdf:_2><rdf:_3><swrc:Person swrc:name="Ayache, Christelle"/></rdf:_3><rdf:_4><swrc:Person swrc:name="Mostefa, Djamel"/></rdf:_4><rdf:_5><swrc:Person swrc:name="Rosset, Sophie"/></rdf:_5><rdf:_6><swrc:Person swrc:name="Lamel, Lori"/></rdf:_6></rdf:Seq></swrc:author></rdf:Description></burst:publication></item><item rdf:about="http://www.bibsonomy.org/bibtex/2202b97875a0ca06dba67da3f7febfc86/diego_ma"><title>Named Entity Recognition in Question Answering of Speech Data</title><link>http://www.bibsonomy.org/bibtex/2202b97875a0ca06dba67da3f7febfc86/diego_ma</link><dc:creator>diego_ma</dc:creator><dc:date>2008-01-29T07:21:37+01:00</dc:date><dc:subject>AnswerFinder named_entities speech molla_publication </dc:subject><content:encoded>&lt;span style=&#034;color:#555555;&#034;&gt;Diego &lt;a href=&#034;http://www.bibsonomy.org/author/Moll{\&amp;#039;a}&#034;&gt;Moll&amp;#225;&lt;/a&gt;  and Menno van &lt;a href=&#034;http://www.bibsonomy.org/author/Zaanen&#034;&gt;Zaanen&lt;/a&gt;  and Steve &lt;a href=&#034;http://www.bibsonomy.org/author/Cassidy&#034;&gt;Cassidy&lt;/a&gt;  &lt;/span&gt;&lt;em&gt;Proc. ALTW 2007, &lt;/em&gt;&lt;em&gt; 5, &lt;/em&gt;&lt;em&gt;page 57-65. 
&lt;/em&gt;(&lt;em&gt;2007&lt;/em&gt;)</content:encoded><taxo:topics><rdf:Bag><rdf:li rdf:resource="http://www.bibsonomy.org/tag/AnswerFinder"/><rdf:li rdf:resource="http://www.bibsonomy.org/tag/named_entities"/><rdf:li rdf:resource="http://www.bibsonomy.org/tag/speech"/><rdf:li rdf:resource="http://www.bibsonomy.org/tag/molla_publication"/></rdf:Bag></taxo:topics><burst:publication><rdf:Description rdf:about="http://www.bibsonomy.org/bibtex/2202b97875a0ca06dba67da3f7febfc86/diego_ma"><owl:sameAs rdf:resource="http://www.bibsonomy.org/uri/bibtex/2202b97875a0ca06dba67da3f7febfc86/diego_ma"/><rdf:type rdf:resource="http://swrc.ontoware.org/ontology#InProceedings"/><owl:sameAs rdf:resource="http://www.alta.asn.au/events/altw2007/cdrom/index.html"/><swrc:date>Tue Jan 29 07:21:37 CET 2008</swrc:date><swrc:booktitle>Proc. ALTW 2007</swrc:booktitle><swrc:pages>57-65</swrc:pages><swrc:title>Named Entity Recognition in Question Answering of Speech Data</swrc:title><swrc:volume>5</swrc:volume><swrc:year>2007</swrc:year><swrc:keywords>AnswerFinder named_entities speech molla_publication </swrc:keywords><swrc:abstract>Question answering on speech transcripts (QAst) is a pilot track of the CLEF competition. In this paper we present our contribution to QAst, which is centred on a study of Named Entity (NE) recognition on speech transcripts, and how it impacts on the accuracy of the final question answering system. We have ported AFNER, the NE recogniser of the AnswerFinder question-answering project, to the set of answer types expected in the QAst track. AFNER uses a combination of regular expressions, lists of names (gazetteers) and machine learning to find NEs in the data. The machine learning component was trained on a development set of the AMI corpus. In the process we identified various problems with scalability of the system and the existence of errors of the extracted annotation, which lead to relatively poor performance in general. 
Performance was yet comparable with state of the art, and the system was second (out of three participants) in one of the QAst subtasks.</swrc:abstract><swrc:author><rdf:Seq><rdf:_1><swrc:Person swrc:name="Diego Moll{\&#039;a}"/></rdf:_1><rdf:_2><swrc:Person swrc:name="Menno van Zaanen"/></rdf:_2><rdf:_3><swrc:Person swrc:name="Steve Cassidy"/></rdf:_3></rdf:Seq></swrc:author><swrc:editor><rdf:Seq><rdf:_1><swrc:Person swrc:name="Nathalie Colineau"/></rdf:_1><rdf:_2><swrc:Person swrc:name="Mark Dras"/></rdf:_2></rdf:Seq></swrc:editor></rdf:Description></burst:publication></item><item rdf:about="http://www.bibsonomy.org/bibtex/242ac1cbf4626a8dea0a229f643aafed4/diego_ma"><title>Advances in Automatic Meeting Record Creation and Access</title><link>http://www.bibsonomy.org/bibtex/242ac1cbf4626a8dea0a229f643aafed4/diego_ma</link><dc:creator>diego_ma</dc:creator><dc:date>2007-12-14T02:47:57+01:00</dc:date><dc:subject>speech </dc:subject><content:encoded>&lt;span style=&#034;color:#555555;&#034;&gt;Alex &lt;a href=&#034;http://www.bibsonomy.org/author/Waibel&#034;&gt;Waibel&lt;/a&gt;  and Michael &lt;a href=&#034;http://www.bibsonomy.org/author/Ben&#034;&gt;Ben&lt;/a&gt;  and Florian &lt;a href=&#034;http://www.bibsonomy.org/author/Metze&#034;&gt;Metze&lt;/a&gt;  and Klaus &lt;a href=&#034;http://www.bibsonomy.org/author/Ries&#034;&gt;Ries&lt;/a&gt;  and Thomas &lt;a href=&#034;http://www.bibsonomy.org/author/Schaaf&#034;&gt;Schaaf&lt;/a&gt;  and Tanja &lt;a href=&#034;http://www.bibsonomy.org/author/Schultz&#034;&gt;Schultz&lt;/a&gt;  and Hagen &lt;a href=&#034;http://www.bibsonomy.org/author/Soltau&#034;&gt;Soltau&lt;/a&gt;  and Hua &lt;a href=&#034;http://www.bibsonomy.org/author/Yu&#034;&gt;Yu&lt;/a&gt;  and Klaus &lt;a href=&#034;http://www.bibsonomy.org/author/Zechner&#034;&gt;Zechner&lt;/a&gt;  &lt;/span&gt;&lt;em&gt;Proc. 
ICASSP 2001, &lt;/em&gt;(&lt;em&gt;2001&lt;/em&gt;)</content:encoded><taxo:topics><rdf:Bag><rdf:li rdf:resource="http://www.bibsonomy.org/tag/speech"/></rdf:Bag></taxo:topics><burst:publication><rdf:Description rdf:about="http://www.bibsonomy.org/bibtex/242ac1cbf4626a8dea0a229f643aafed4/diego_ma"><owl:sameAs rdf:resource="http://www.bibsonomy.org/uri/bibtex/242ac1cbf4626a8dea0a229f643aafed4/diego_ma"/><rdf:type rdf:resource="http://swrc.ontoware.org/ontology#InProceedings"/><swrc:date>Fri Dec 14 02:47:57 CET 2007</swrc:date><swrc:booktitle>Proc. ICASSP 2001</swrc:booktitle><swrc:title>Advances in Automatic Meeting Record Creation and Access</swrc:title><swrc:year>2001</swrc:year><swrc:keywords>speech </swrc:keywords><swrc:author><rdf:Seq><rdf:_1><swrc:Person swrc:name="Alex Waibel"/></rdf:_1><rdf:_2><swrc:Person swrc:name="Michael Ben"/></rdf:_2><rdf:_3><swrc:Person swrc:name="Florian Metze"/></rdf:_3><rdf:_4><swrc:Person swrc:name="Klaus Ries"/></rdf:_4><rdf:_5><swrc:Person swrc:name="Thomas Schaaf"/></rdf:_5><rdf:_6><swrc:Person swrc:name="Tanja Schultz"/></rdf:_6><rdf:_7><swrc:Person swrc:name="Hagen Soltau"/></rdf:_7><rdf:_8><swrc:Person swrc:name="Hua Yu"/></rdf:_8><rdf:_9><swrc:Person swrc:name="Klaus Zechner"/></rdf:_9></rdf:Seq></swrc:author></rdf:Description></burst:publication></item><item rdf:about="http://www.bibsonomy.org/bibtex/22b0790ca9fa1c810363f5df441fc1254/diego_ma"><title>Named Entity Recognition from Spontaneous Open-Domain Speech</title><link>http://www.bibsonomy.org/bibtex/22b0790ca9fa1c810363f5df441fc1254/diego_ma</link><dc:creator>diego_ma</dc:creator><dc:date>2007-12-14T02:47:08+01:00</dc:date><dc:subject>named_entities speech </dc:subject><content:encoded>&lt;span style=&#034;color:#555555;&#034;&gt;Mihai &lt;a href=&#034;http://www.bibsonomy.org/author/Surdeanu&#034;&gt;Surdeanu&lt;/a&gt;  and Jordi &lt;a href=&#034;http://www.bibsonomy.org/author/Turmo&#034;&gt;Turmo&lt;/a&gt;  and Eli &lt;a 
href=&#034;http://www.bibsonomy.org/author/Comelles&#034;&gt;Comelles&lt;/a&gt;  &lt;/span&gt;&lt;em&gt;Proceedings Interspeech-05, &lt;/em&gt;&lt;em&gt;Lisbon, &lt;/em&gt;(&lt;em&gt;2005&lt;/em&gt;)</content:encoded><taxo:topics><rdf:Bag><rdf:li rdf:resource="http://www.bibsonomy.org/tag/named_entities"/><rdf:li rdf:resource="http://www.bibsonomy.org/tag/speech"/></rdf:Bag></taxo:topics><burst:publication><rdf:Description rdf:about="http://www.bibsonomy.org/bibtex/22b0790ca9fa1c810363f5df441fc1254/diego_ma"><owl:sameAs rdf:resource="http://www.bibsonomy.org/uri/bibtex/22b0790ca9fa1c810363f5df441fc1254/diego_ma"/><rdf:type rdf:resource="http://swrc.ontoware.org/ontology#InProceedings"/><owl:sameAs rdf:resource="http://www.lsi.upc.edu/~comelles/"/><swrc:date>Fri Dec 14 02:47:08 CET 2007</swrc:date><swrc:address>Lisbon</swrc:address><swrc:booktitle>Proceedings Interspeech-05</swrc:booktitle><swrc:title>Named Entity Recognition from Spontaneous Open-Domain Speech</swrc:title><swrc:year>2005</swrc:year><swrc:keywords>named_entities speech </swrc:keywords><swrc:abstract>This paper presents an analysis of named entity recognition and classification in spontaneous speech transcripts. We annotated a significant fraction of the Switchboard corpus with six named entity classes and investigated a battery of machine learning models that include lexical, syntactic, and semantic attributes. 
The best recognition and classification model obtains promising results, approaching within 5% a system evaluated on clean textual data.</swrc:abstract><swrc:author><rdf:Seq><rdf:_1><swrc:Person swrc:name="Mihai Surdeanu"/></rdf:_1><rdf:_2><swrc:Person swrc:name="Jordi Turmo"/></rdf:_2><rdf:_3><swrc:Person swrc:name="Eli Comelles"/></rdf:_3></rdf:Seq></swrc:author></rdf:Description></burst:publication></item><item rdf:about="http://www.bibsonomy.org/bibtex/2367f6005012e81d06a91489496bf0263/diego_ma"><title>Indexing, Browsing and Searching of Digital Video and Digital Audio Information</title><link>http://www.bibsonomy.org/bibtex/2367f6005012e81d06a91489496bf0263/diego_ma</link><dc:creator>diego_ma</dc:creator><dc:date>2007-12-14T02:46:43+01:00</dc:date><dc:subject>inf_retrieval speech video </dc:subject><content:encoded>&lt;span style=&#034;color:#555555;&#034;&gt;Alan F. &lt;a href=&#034;http://www.bibsonomy.org/author/Smeaton&#034;&gt;Smeaton&lt;/a&gt;  &lt;/span&gt;&lt;em&gt;Lectures on Information Retrieval, &lt;/em&gt;&lt;em&gt;Springer-Verlag, &lt;/em&gt;(&lt;em&gt;2001&lt;/em&gt;)</content:encoded><taxo:topics><rdf:Bag><rdf:li rdf:resource="http://www.bibsonomy.org/tag/inf_retrieval"/><rdf:li rdf:resource="http://www.bibsonomy.org/tag/speech"/><rdf:li rdf:resource="http://www.bibsonomy.org/tag/video"/></rdf:Bag></taxo:topics><burst:publication><rdf:Description rdf:about="http://www.bibsonomy.org/bibtex/2367f6005012e81d06a91489496bf0263/diego_ma"><owl:sameAs rdf:resource="http://www.bibsonomy.org/uri/bibtex/2367f6005012e81d06a91489496bf0263/diego_ma"/><rdf:type rdf:resource="http://swrc.ontoware.org/ontology#InCollection"/><swrc:date>Fri Dec 14 02:46:43 CET 2007</swrc:date><swrc:booktitle>Lectures on Information Retrieval</swrc:booktitle><swrc:pages>93-110</swrc:pages><swrc:publisher><swrc:Organization swrc:name="Springer-Verlag"/></swrc:publisher><swrc:series>Lecture Notes in Computer Science</swrc:series><swrc:title>Indexing, Browsing and Searching of 
Digital Video and Digital Audio Information</swrc:title><swrc:year>2001</swrc:year><swrc:keywords>inf_retrieval speech video </swrc:keywords><swrc:abstract>In this chapter we examine various techniques for providing content access to information stored in a continuous medium, namely digital audio and digital video. Our coverage of audio is centered around post-processing the output of automatic recognition of speech or phones and we describe the various approaches that have been taken in this area. In order to give reasonable coverage of the possibilities and limitations of content-based access to digital video information we sketch out at a high level, the approaches taken in various video compression algorithms, principally the MPEG family. We then address approaches to shot and scene boundary detection, choosing representative frames for browsing and for search, and various browsing interfaces that have been developed. We finish with an overview of the likely developments in this area in the future.</swrc:abstract><swrc:author><rdf:Seq><rdf:_1><swrc:Person swrc:name="Alan F. Smeaton"/></rdf:_1></rdf:Seq></swrc:author></rdf:Description></burst:publication></item><item rdf:about="http://www.bibsonomy.org/bibtex/24ed799d4431231eb901d366520b7b231/diego_ma"><title>Survey of Current Speech Technology</title><link>http://www.bibsonomy.org/bibtex/24ed799d4431231eb901d366520b7b231/diego_ma</link><dc:creator>diego_ma</dc:creator><dc:date>2007-12-14T02:46:02+01:00</dc:date><dc:subject>speech </dc:subject><content:encoded>&lt;span style=&#034;color:#555555;&#034;&gt;Alexander I. &lt;a href=&#034;http://www.bibsonomy.org/author/Rudnicky&#034;&gt;Rudnicky&lt;/a&gt;  and Alexander G. 
&lt;a href=&#034;http://www.bibsonomy.org/author/Hauptmann&#034;&gt;Hauptmann&lt;/a&gt;  and Kai-Fu &lt;a href=&#034;http://www.bibsonomy.org/author/Lee&#034;&gt;Lee&lt;/a&gt;  &lt;/span&gt;&lt;em&gt;Communications of the ACM&lt;/em&gt;&lt;em&gt;37(3):52-57&lt;/em&gt;(&lt;em&gt;1994&lt;/em&gt;)</content:encoded><taxo:topics><rdf:Bag><rdf:li rdf:resource="http://www.bibsonomy.org/tag/speech"/></rdf:Bag></taxo:topics><burst:publication><rdf:Description rdf:about="http://www.bibsonomy.org/bibtex/24ed799d4431231eb901d366520b7b231/diego_ma"><owl:sameAs rdf:resource="http://www.bibsonomy.org/uri/bibtex/24ed799d4431231eb901d366520b7b231/diego_ma"/><rdf:type rdf:resource="http://swrc.ontoware.org/ontology#Article"/><swrc:date>Fri Dec 14 02:46:02 CET 2007</swrc:date><swrc:journal>Communications of the ACM</swrc:journal><swrc:number>3</swrc:number><swrc:pages>52-57</swrc:pages><swrc:title>Survey of Current Speech Technology</swrc:title><swrc:volume>37</swrc:volume><swrc:year>1994</swrc:year><swrc:keywords>speech </swrc:keywords><swrc:abstract>Speech recognition and speech synthesis are technologies of particular interest for their support of direct communication between humans and computers through a communications mode humans commonly use among themselves and at which they are highly skilled. Both manipulate speech in terms of its information content; recognition transforms human speech into text to be used literally (e.g., for dictation) or interpreted as commands to control applications, and synthesis allows the generation of spoken utterances from text.</swrc:abstract><swrc:author><rdf:Seq><rdf:_1><swrc:Person swrc:name="Alexander I. Rudnicky"/></rdf:_1><rdf:_2><swrc:Person swrc:name="Alexander G. 
Hauptmann"/></rdf:_2><rdf:_3><swrc:Person swrc:name="Kai-Fu Lee"/></rdf:_3></rdf:Seq></swrc:author></rdf:Description></burst:publication></item><item rdf:about="http://www.bibsonomy.org/bibtex/222f9837dac4a70418136ddfff25b241d/diego_ma"><title>Orthographic Case Restoration Using Supervised Learning without Manual Annotation</title><link>http://www.bibsonomy.org/bibtex/222f9837dac4a70418136ddfff25b241d/diego_ma</link><dc:creator>diego_ma</dc:creator><dc:date>2007-12-14T02:44:29+01:00</dc:date><dc:subject>named_entities question_answering speech </dc:subject><content:encoded>&lt;span style=&#034;color:#555555;&#034;&gt;Cheng &lt;a href=&#034;http://www.bibsonomy.org/author/Niu&#034;&gt;Niu&lt;/a&gt;  and Wei &lt;a href=&#034;http://www.bibsonomy.org/author/Li&#034;&gt;Li&lt;/a&gt;  and  &lt;a href=&#034;http://www.bibsonomy.org/author/Jihong&#034;&gt;Jihong&lt;/a&gt;  and Rohini &lt;a href=&#034;http://www.bibsonomy.org/author/Shrihari&#034;&gt;Shrihari&lt;/a&gt;  &lt;/span&gt;&lt;em&gt;International Journal on Artificial Intelligence Tools&lt;/em&gt;&lt;em&gt;13(1):141-156&lt;/em&gt;(&lt;em&gt;2004&lt;/em&gt;)</content:encoded><taxo:topics><rdf:Bag><rdf:li rdf:resource="http://www.bibsonomy.org/tag/named_entities"/><rdf:li rdf:resource="http://www.bibsonomy.org/tag/question_answering"/><rdf:li rdf:resource="http://www.bibsonomy.org/tag/speech"/></rdf:Bag></taxo:topics><burst:publication><rdf:Description rdf:about="http://www.bibsonomy.org/bibtex/222f9837dac4a70418136ddfff25b241d/diego_ma"><owl:sameAs rdf:resource="http://www.bibsonomy.org/uri/bibtex/222f9837dac4a70418136ddfff25b241d/diego_ma"/><rdf:type rdf:resource="http://swrc.ontoware.org/ontology#Article"/><owl:sameAs rdf:resource="http://homepage.mac.com/liwei999/WeiLi/Publications.html"/><swrc:date>Fri Dec 14 02:44:29 CET 2007</swrc:date><swrc:journal>International Journal on Artificial Intelligence Tools</swrc:journal><swrc:number>1</swrc:number><swrc:pages>141-156</swrc:pages><swrc:title>Orthographic Case 
Restoration Using Supervised Learning without Manual Annotation</swrc:title><swrc:volume>13</swrc:volume><swrc:year>2004</swrc:year><swrc:keywords>named_entities question_answering speech </swrc:keywords><swrc:abstract>One challenge in text processing is the treatment of case insensitive documents such as speech recognition results. The traditional approach is to re-train a language model excluding case-related features. This paper presents an alternative two-step approach whereby a preprocessing module (Step 1) is designed to restore case-sensitive form which is subsequently processed by the original system (Step 2). Step 1 is mainly implemented as a Hidden Markov Model trained on a large raw corpus of case sensitive documents. It is demonstrated that this approach (i) outperforms the feature exclusion approach for named entity tagging, (ii) leads to limited degradation for parsing, relationship extraction and case insensitive question answering, (iii) reduces system complexity, and (iv) has wide applicability: the restored text can be used in both statistical model and rule-based systems.</swrc:abstract><swrc:author><rdf:Seq><rdf:_1><swrc:Person swrc:name="Cheng Niu"/></rdf:_1><rdf:_2><swrc:Person swrc:name="Wei Li"/></rdf:_2><rdf:_3><swrc:Person swrc:name=" Jihong"/></rdf:_3><rdf:_4><swrc:Person swrc:name="Rohini Shrihari"/></rdf:_4></rdf:Seq></swrc:author></rdf:Description></burst:publication></item><item rdf:about="http://www.bibsonomy.org/bibtex/2853da4a16ae749b8256e19ac458685c6/diego_ma"><title>From Multimedia Retrieval to Knowledge Management</title><link>http://www.bibsonomy.org/bibtex/2853da4a16ae749b8256e19ac458685c6/diego_ma</link><dc:creator>diego_ma</dc:creator><dc:date>2007-12-14T02:44:14+01:00</dc:date><dc:subject>inf_retrieval speech multimedia </dc:subject><content:encoded>&lt;span style=&#034;color:#555555;&#034;&gt;Pedro J. 
&lt;a href=&#034;http://www.bibsonomy.org/author/Moreno&#034;&gt;Moreno&lt;/a&gt;  and J-M Van &lt;a href=&#034;http://www.bibsonomy.org/author/Thong&#034;&gt;Thong&lt;/a&gt;  and Beth &lt;a href=&#034;http://www.bibsonomy.org/author/Logan&#034;&gt;Logan&lt;/a&gt;  and Gareth J.F. &lt;a href=&#034;http://www.bibsonomy.org/author/Jones&#034;&gt;Jones&lt;/a&gt;  &lt;/span&gt;&lt;em&gt;IEEE Computer&lt;/em&gt;(&lt;em&gt;2002&lt;/em&gt;)</content:encoded><taxo:topics><rdf:Bag><rdf:li rdf:resource="http://www.bibsonomy.org/tag/inf_retrieval"/><rdf:li rdf:resource="http://www.bibsonomy.org/tag/speech"/><rdf:li rdf:resource="http://www.bibsonomy.org/tag/multimedia"/></rdf:Bag></taxo:topics><burst:publication><rdf:Description rdf:about="http://www.bibsonomy.org/bibtex/2853da4a16ae749b8256e19ac458685c6/diego_ma"><owl:sameAs rdf:resource="http://www.bibsonomy.org/uri/bibtex/2853da4a16ae749b8256e19ac458685c6/diego_ma"/><rdf:type rdf:resource="http://swrc.ontoware.org/ontology#Article"/><swrc:date>Fri Dec 14 02:44:14 CET 2007</swrc:date><swrc:journal>IEEE Computer</swrc:journal><swrc:number>4</swrc:number><swrc:title>From Multimedia Retrieval to Knowledge Management</swrc:title><swrc:volume>35</swrc:volume><swrc:year>2002</swrc:year><swrc:keywords>inf_retrieval speech multimedia </swrc:keywords><swrc:abstract>The authors suggest ways in which speech-based multimedia information retrieval technologies can evolve into full-fledged knowledge management systems in which audio, video, and images contribute as much as textual sources</swrc:abstract><swrc:author><rdf:Seq><rdf:_1><swrc:Person swrc:name="Pedro J. Moreno"/></rdf:_1><rdf:_2><swrc:Person swrc:name="J-M Van Thong"/></rdf:_2><rdf:_3><swrc:Person swrc:name="Beth Logan"/></rdf:_3><rdf:_4><swrc:Person swrc:name="Gareth J.F. 
Jones"/></rdf:_4></rdf:Seq></swrc:author></rdf:Description></burst:publication></item><item rdf:about="http://www.bibsonomy.org/bibtex/29d0c0e63dfcb696cf90b0981309a0b69/diego_ma"><title>Spoken Dialogue Technology: Enabling the Conversational User Interface</title><link>http://www.bibsonomy.org/bibtex/29d0c0e63dfcb696cf90b0981309a0b69/diego_ma</link><dc:creator>diego_ma</dc:creator><dc:date>2007-12-14T02:43:14+01:00</dc:date><dc:subject>speech dialogue_system </dc:subject><content:encoded>&lt;span style=&#034;color:#555555;&#034;&gt;Michael F. &lt;a href=&#034;http://www.bibsonomy.org/author/McTear&#034;&gt;McTear&lt;/a&gt;  &lt;/span&gt;&lt;em&gt;ACM Computing Surveys&lt;/em&gt;&lt;em&gt;34(1):90-169&lt;/em&gt;(&lt;em&gt;2002&lt;/em&gt;)</content:encoded><taxo:topics><rdf:Bag><rdf:li rdf:resource="http://www.bibsonomy.org/tag/speech"/><rdf:li rdf:resource="http://www.bibsonomy.org/tag/dialogue_system"/></rdf:Bag></taxo:topics><burst:publication><rdf:Description rdf:about="http://www.bibsonomy.org/bibtex/29d0c0e63dfcb696cf90b0981309a0b69/diego_ma"><owl:sameAs rdf:resource="http://www.bibsonomy.org/uri/bibtex/29d0c0e63dfcb696cf90b0981309a0b69/diego_ma"/><rdf:type rdf:resource="http://swrc.ontoware.org/ontology#Article"/><owl:sameAs rdf:resource="http://portal.acm.org/citation.cfm?id=505285"/><swrc:date>Fri Dec 14 02:43:14 CET 2007</swrc:date><swrc:journal>ACM Computing Surveys</swrc:journal><swrc:number>1</swrc:number><swrc:pages>90-169</swrc:pages><swrc:title>Spoken Dialogue Technology: Enabling the Conversational User Interface</swrc:title><swrc:volume>34</swrc:volume><swrc:year>2002</swrc:year><swrc:keywords>speech dialogue_system </swrc:keywords><swrc:abstract>Spoken dialogue systems allow users to interact with computer-based applications such as databases and expert systems by using natural spoken language. 
The origins of spoken dialogue systems can be traced back to Artificial Intelligence research in the 1950s concerned with developing conversational interfaces. However, it is only within the last decade or so, with major advances in speech technology, that large-scale working systems have been developed and, in some cases, introduced into commercial environments. As a result many major telecommunications and software companies have become aware of the potential for spoken dialogue technology to provide solutions in newly developing areas such as computer-telephony integration. Voice portals, which provide a speech-based interface between a telephone user and Web-based services, are the most recent application of spoken dialogue technology. This article describes the main components of the technology---speech recognition, language understanding, dialogue management, communication with an external source such as a database, language generation, speech synthesis---and shows how these component technologies can be integrated into a spoken dialogue system. The article describes in detail the methods that have been adopted in some well-known dialogue systems, explores different system architectures, considers issues of specification, design, and evaluation, reviews some currently available dialogue development toolkits, and outlines prospects for future development.</swrc:abstract><swrc:author><rdf:Seq><rdf:_1><swrc:Person swrc:name="Michael F. 
McTear"/></rdf:_1></rdf:Seq></swrc:author></rdf:Description></burst:publication></item><item rdf:about="http://www.bibsonomy.org/bibtex/27f5c7977cedc4baf876d55e19e9e99b1/diego_ma"><title>Question Answering on a Case Insensitive Corpus</title><link>http://www.bibsonomy.org/bibtex/27f5c7977cedc4baf876d55e19e9e99b1/diego_ma</link><dc:creator>diego_ma</dc:creator><dc:date>2007-12-14T02:42:23+01:00</dc:date><dc:subject>question_answering speech </dc:subject><content:encoded>&lt;span style=&#034;color:#555555;&#034;&gt;Wei &lt;a href=&#034;http://www.bibsonomy.org/author/Li&#034;&gt;Li&lt;/a&gt;  and Rohini &lt;a href=&#034;http://www.bibsonomy.org/author/Srihari&#034;&gt;Srihari&lt;/a&gt;  and Cheng &lt;a href=&#034;http://www.bibsonomy.org/author/Niu&#034;&gt;Niu&lt;/a&gt;  and Xiaoge &lt;a href=&#034;http://www.bibsonomy.org/author/Li&#034;&gt;Li&lt;/a&gt;  &lt;/span&gt;&lt;em&gt;Proc. ACL 2003 Workshop on Multilingual Summarization and Question Answering, &lt;/em&gt;&lt;em&gt;page 84-93. &lt;/em&gt;(&lt;em&gt;2003&lt;/em&gt;)</content:encoded><taxo:topics><rdf:Bag><rdf:li rdf:resource="http://www.bibsonomy.org/tag/question_answering"/><rdf:li rdf:resource="http://www.bibsonomy.org/tag/speech"/></rdf:Bag></taxo:topics><burst:publication><rdf:Description rdf:about="http://www.bibsonomy.org/bibtex/27f5c7977cedc4baf876d55e19e9e99b1/diego_ma"><owl:sameAs rdf:resource="http://www.bibsonomy.org/uri/bibtex/27f5c7977cedc4baf876d55e19e9e99b1/diego_ma"/><rdf:type rdf:resource="http://swrc.ontoware.org/ontology#InProceedings"/><swrc:date>Fri Dec 14 02:42:23 CET 2007</swrc:date><swrc:booktitle>Proc. ACL 2003 Workshop on Multilingual Summarization and Question Answering</swrc:booktitle><swrc:pages>84-93</swrc:pages><swrc:title>Question Answering on a Case Insensitive Corpus</swrc:title><swrc:year>2003</swrc:year><swrc:keywords>question_answering speech </swrc:keywords><swrc:abstract>Most question answering (QA) systems rely on both keyword index and Named Entity (NE) tagging. 
The corpus from which the QA systems attempt to retrieve answers is usually mixed case text. However, there are numerous corpora that consist of case insensitive documents, e.g. speech recognition results. This paper presents a successful approach to QA on a case insensitive corpus, whereby a preprocessing module is designed to restore the case-sensitive form. The document pool with the restored case then feeds the QA system, which remains unchanged. The case restoration preprocessing is implemented as a Hidden Markov Model trained on a large raw corpus of case sensitive documents. It is demonstrated that this approach leads to very limited degradation in QA benchmarking (2.8%), mainly due to the limited degradation in the underlying information extraction support.</swrc:abstract><swrc:author><rdf:Seq><rdf:_1><swrc:Person swrc:name="Wei Li"/></rdf:_1><rdf:_2><swrc:Person swrc:name="Rohini Srihari"/></rdf:_2><rdf:_3><swrc:Person swrc:name="Cheng Niu"/></rdf:_3><rdf:_4><swrc:Person swrc:name="Xiaoge Li"/></rdf:_4></rdf:Seq></swrc:author></rdf:Description></burst:publication></item><item rdf:about="http://www.bibsonomy.org/bibtex/21f732440eb7a503828db1c6ae4b8eecf/diego_ma"><title>Let's Hear it for Audio Mining</title><link>http://www.bibsonomy.org/bibtex/21f732440eb7a503828db1c6ae4b8eecf/diego_ma</link><dc:creator>diego_ma</dc:creator><dc:date>2007-12-14T02:42:12+01:00</dc:date><dc:subject>speech </dc:subject><content:encoded>&lt;span style=&#034;color:#555555;&#034;&gt;Neal &lt;a href=&#034;http://www.bibsonomy.org/author/Leavitt&#034;&gt;Leavitt&lt;/a&gt;  &lt;/span&gt;&lt;em&gt;IEEE Computer&lt;/em&gt;&lt;em&gt;35(10):23-25&lt;/em&gt;(&lt;em&gt;2002&lt;/em&gt;)</content:encoded><taxo:topics><rdf:Bag><rdf:li rdf:resource="http://www.bibsonomy.org/tag/speech"/></rdf:Bag></taxo:topics><burst:publication><rdf:Description rdf:about="http://www.bibsonomy.org/bibtex/21f732440eb7a503828db1c6ae4b8eecf/diego_ma"><owl:sameAs 
rdf:resource="http://www.bibsonomy.org/uri/bibtex/21f732440eb7a503828db1c6ae4b8eecf/diego_ma"/><rdf:type rdf:resource="http://swrc.ontoware.org/ontology#Article"/><swrc:date>Fri Dec 14 02:42:12 CET 2007</swrc:date><swrc:journal>IEEE Computer</swrc:journal><swrc:number>10</swrc:number><swrc:pages>23-25</swrc:pages><swrc:title>Let&#039;s Hear it for Audio Mining</swrc:title><swrc:volume>35</swrc:volume><swrc:year>2002</swrc:year><swrc:keywords>speech </swrc:keywords><swrc:author><rdf:Seq><rdf:_1><swrc:Person swrc:name="Neal Leavitt"/></rdf:_1></rdf:Seq></swrc:author></rdf:Description></burst:publication></item><item rdf:about="http://www.bibsonomy.org/bibtex/290f103cb00fcd31d7ec0268544a895a1/diego_ma"><title>Getting the Answers</title><link>http://www.bibsonomy.org/bibtex/290f103cb00fcd31d7ec0268544a895a1/diego_ma</link><dc:creator>diego_ma</dc:creator><dc:date>2007-12-14T02:41:47+01:00</dc:date><dc:subject>speech inf_retrieval </dc:subject><content:encoded>&lt;span style=&#034;color:#555555;&#034;&gt;Pamela &lt;a href=&#034;http://www.bibsonomy.org/author/Kramer&#034;&gt;Kramer&lt;/a&gt;  &lt;/span&gt;&lt;em&gt;http://www.research.ibm.com/ thinkresearch/ pages/ 2002/ 20020411_meetingminer.shtml, &lt;/em&gt;(&lt;em&gt;2002&lt;/em&gt;) &lt;em&gt;Last visited 6 February 2004
		    .
	    &lt;/em&gt;</content:encoded><taxo:topics><rdf:Bag><rdf:li rdf:resource="http://www.bibsonomy.org/tag/speech"/><rdf:li rdf:resource="http://www.bibsonomy.org/tag/inf_retrieval"/></rdf:Bag></taxo:topics><burst:publication><rdf:Description rdf:about="http://www.bibsonomy.org/bibtex/290f103cb00fcd31d7ec0268544a895a1/diego_ma"><owl:sameAs rdf:resource="http://www.bibsonomy.org/uri/bibtex/290f103cb00fcd31d7ec0268544a895a1/diego_ma"/><rdf:type rdf:resource="http://swrc.ontoware.org/ontology#Misc"/><owl:sameAs rdf:resource="http://www.research.ibm.com/thinkresearch/pages/2002/20020411_meetingminer.shtml"/><swrc:date>Fri Dec 14 02:41:47 CET 2007</swrc:date><swrc:howpublished>\myurl{http://www.research.ibm.com/ thinkresearch/ pages/ 2002/ 20020411_meetingminer.shtml}</swrc:howpublished><swrc:note>Last visited 6 February 2004</swrc:note><swrc:title>Getting the Answers</swrc:title><swrc:year>2002</swrc:year><swrc:keywords>speech inf_retrieval </swrc:keywords><swrc:author><rdf:Seq><rdf:_1><swrc:Person swrc:name="Pamela Kramer"/></rdf:_1></rdf:Seq></swrc:author></rdf:Description></burst:publication></item><item rdf:about="http://www.bibsonomy.org/bibtex/29bb0d14d65d2b1982f99d20c0eda83bb/diego_ma"><title>A Statistical Approach to Automatic Speech Summarization</title><link>http://www.bibsonomy.org/bibtex/29bb0d14d65d2b1982f99d20c0eda83bb/diego_ma</link><dc:creator>diego_ma</dc:creator><dc:date>2007-12-14T02:40:45+01:00</dc:date><dc:subject>speech summarisation </dc:subject><content:encoded>&lt;span style=&#034;color:#555555;&#034;&gt;Chiori &lt;a href=&#034;http://www.bibsonomy.org/author/Hori&#034;&gt;Hori&lt;/a&gt;  and Sadaoki &lt;a href=&#034;http://www.bibsonomy.org/author/Furui&#034;&gt;Furui&lt;/a&gt;  and Rob &lt;a href=&#034;http://www.bibsonomy.org/author/Malkin&#034;&gt;Malkin&lt;/a&gt;  and Hua &lt;a href=&#034;http://www.bibsonomy.org/author/Yu&#034;&gt;Yu&lt;/a&gt;  and Alex &lt;a href=&#034;http://www.bibsonomy.org/author/Waibel&#034;&gt;Waibel&lt;/a&gt;  
&lt;/span&gt;&lt;em&gt;EURASIP Journal on Applied Signal Processing&lt;/em&gt;(&lt;em&gt;2003&lt;/em&gt;)</content:encoded><taxo:topics><rdf:Bag><rdf:li rdf:resource="http://www.bibsonomy.org/tag/speech"/><rdf:li rdf:resource="http://www.bibsonomy.org/tag/summarisation"/></rdf:Bag></taxo:topics><burst:publication><rdf:Description rdf:about="http://www.bibsonomy.org/bibtex/29bb0d14d65d2b1982f99d20c0eda83bb/diego_ma"><owl:sameAs rdf:resource="http://www.bibsonomy.org/uri/bibtex/29bb0d14d65d2b1982f99d20c0eda83bb/diego_ma"/><rdf:type rdf:resource="http://swrc.ontoware.org/ontology#Article"/><owl:sameAs rdf:resource="http://asp.hindawi.com/volume-2003/S1110865703211112.html"/><swrc:date>Fri Dec 14 02:40:45 CET 2007</swrc:date><swrc:journal>EURASIP Journal on Applied Signal Processing</swrc:journal><swrc:pages>1-12</swrc:pages><swrc:title>A Statistical Approach to Automatic Speech Summarization</swrc:title><swrc:volume>2</swrc:volume><swrc:year>2003</swrc:year><swrc:keywords>speech summarisation </swrc:keywords><swrc:abstract>This paper proposes a statistical approach to automatic speech summarization. In our method, a set of words maximizing a summarization score indicating the appropriateness of summarization is extracted from automatically transcribed speech and then concatenated to create a summary. The extraction process is performed using a dynamic programming (DP) technique based on a target compression ratio. In this paper, we demonstrate how an English news broadcast transcribed by a speech recognizer is automatically summarized. We adapted our method, which was originally proposed for Japanese, to English by modifying the model for estimating word concatenation probabilities based on a dependency structure in the original speech given by a stochastic dependency context free grammar (SDCFG). We also propose a method of summarizing multiple utterances using a two-level DP technique. 
The automatically summarized sentences are evaluated by summarization accuracy based on a comparison with a manual summary of speech that has been correctly transcribed by human subjects. Our experimental results indicate that the method we propose can effectively extract relatively important information and remove redundant and irrelevant information from English news broadcasts.</swrc:abstract><swrc:author><rdf:Seq><rdf:_1><swrc:Person swrc:name="Chiori Hori"/></rdf:_1><rdf:_2><swrc:Person swrc:name="Sadaoki Furui"/></rdf:_2><rdf:_3><swrc:Person swrc:name="Rob Malkin"/></rdf:_3><rdf:_4><swrc:Person swrc:name="Hua Yu"/></rdf:_4><rdf:_5><swrc:Person swrc:name="Alex Waibel"/></rdf:_5></rdf:Seq></swrc:author></rdf:Description></burst:publication></item><item rdf:about="http://www.bibsonomy.org/bibtex/2a43fbdd1cd0f2de278eda8fbdb4886ee/diego_ma"><title>Automated Natural Spoken Dialog</title><link>http://www.bibsonomy.org/bibtex/2a43fbdd1cd0f2de278eda8fbdb4886ee/diego_ma</link><dc:creator>diego_ma</dc:creator><dc:date>2007-12-14T02:39:27+01:00</dc:date><dc:subject>speech dialogue_system </dc:subject><content:encoded>&lt;span style=&#034;color:#555555;&#034;&gt;Allen L. &lt;a href=&#034;http://www.bibsonomy.org/author/Gorin&#034;&gt;Gorin&lt;/a&gt;  and Alicia &lt;a href=&#034;http://www.bibsonomy.org/author/Abella&#034;&gt;Abella&lt;/a&gt;  and Tirso &lt;a href=&#034;http://www.bibsonomy.org/author/Alonso&#034;&gt;Alonso&lt;/a&gt;  and Giuseppe &lt;a href=&#034;http://www.bibsonomy.org/author/Riccardi&#034;&gt;Riccardi&lt;/a&gt;  and Jeremy H. 
&lt;a href=&#034;http://www.bibsonomy.org/author/Wright&#034;&gt;Wright&lt;/a&gt;  &lt;/span&gt;&lt;em&gt;IEEE Computer&lt;/em&gt;&lt;em&gt;35(4):51-56&lt;/em&gt;(&lt;em&gt;2002&lt;/em&gt;)</content:encoded><taxo:topics><rdf:Bag><rdf:li rdf:resource="http://www.bibsonomy.org/tag/speech"/><rdf:li rdf:resource="http://www.bibsonomy.org/tag/dialogue_system"/></rdf:Bag></taxo:topics><burst:publication><rdf:Description rdf:about="http://www.bibsonomy.org/bibtex/2a43fbdd1cd0f2de278eda8fbdb4886ee/diego_ma"><owl:sameAs rdf:resource="http://www.bibsonomy.org/uri/bibtex/2a43fbdd1cd0f2de278eda8fbdb4886ee/diego_ma"/><rdf:type rdf:resource="http://swrc.ontoware.org/ontology#Article"/><swrc:date>Fri Dec 14 02:39:27 CET 2007</swrc:date><swrc:journal>IEEE Computer</swrc:journal><swrc:number>4</swrc:number><swrc:pages>51-56</swrc:pages><swrc:title>Automated Natural Spoken Dialog</swrc:title><swrc:volume>35</swrc:volume><swrc:year>2002</swrc:year><swrc:keywords>speech dialogue_system </swrc:keywords><swrc:abstract>The next generation of voice-based interface technology will enable easy-to-use automation of new and existing communication services, making human-machine interaction more natural.</swrc:abstract><swrc:author><rdf:Seq><rdf:_1><swrc:Person swrc:name="Allen L. Gorin"/></rdf:_1><rdf:_2><swrc:Person swrc:name="Alicia Abella"/></rdf:_2><rdf:_3><swrc:Person swrc:name="Tirso Alonso"/></rdf:_3><rdf:_4><swrc:Person swrc:name="Giuseppe Riccardi"/></rdf:_4><rdf:_5><swrc:Person swrc:name="Jeremy H. 
Wright"/></rdf:_5></rdf:Seq></swrc:author></rdf:Description></burst:publication></item><item rdf:about="http://www.bibsonomy.org/bibtex/241937fd5a5b3382411f8f8292800cc20/diego_ma"><title>Towards Speech as a Knowledge Resource</title><link>http://www.bibsonomy.org/bibtex/241937fd5a5b3382411f8f8292800cc20/diego_ma</link><dc:creator>diego_ma</dc:creator><dc:date>2007-12-14T02:36:42+01:00</dc:date><dc:subject>speech inf_retrieval inf_extraction </dc:subject><content:encoded>&lt;span style=&#034;color:#555555;&#034;&gt;E. W. &lt;a href=&#034;http://www.bibsonomy.org/author/Brown&#034;&gt;Brown&lt;/a&gt;  and S. &lt;a href=&#034;http://www.bibsonomy.org/author/Srinivasan&#034;&gt;Srinivasan&lt;/a&gt;  and A. &lt;a href=&#034;http://www.bibsonomy.org/author/Coden&#034;&gt;Coden&lt;/a&gt;  and D. &lt;a href=&#034;http://www.bibsonomy.org/author/Ponceleon&#034;&gt;Ponceleon&lt;/a&gt;  and J.W. &lt;a href=&#034;http://www.bibsonomy.org/author/Cooper&#034;&gt;Cooper&lt;/a&gt;  and A. &lt;a href=&#034;http://www.bibsonomy.org/author/Amir&#034;&gt;Amir&lt;/a&gt;  &lt;/span&gt;&lt;em&gt;IBM Systems Journal&lt;/em&gt;&lt;em&gt;40(4):985-1001&lt;/em&gt;&lt;em&gt;Dec 2001. 
&lt;/em&gt;</content:encoded><taxo:topics><rdf:Bag><rdf:li rdf:resource="http://www.bibsonomy.org/tag/speech"/><rdf:li rdf:resource="http://www.bibsonomy.org/tag/inf_retrieval"/><rdf:li rdf:resource="http://www.bibsonomy.org/tag/inf_extraction"/></rdf:Bag></taxo:topics><burst:publication><rdf:Description rdf:about="http://www.bibsonomy.org/bibtex/241937fd5a5b3382411f8f8292800cc20/diego_ma"><owl:sameAs rdf:resource="http://www.bibsonomy.org/uri/bibtex/241937fd5a5b3382411f8f8292800cc20/diego_ma"/><rdf:type rdf:resource="http://swrc.ontoware.org/ontology#Article"/><owl:sameAs rdf:resource="http://www.findarticles.com/cf_dls/m0ISJ/4_40/82373866/p1/article.jhtml"/><swrc:date>Fri Dec 14 02:36:42 CET 2007</swrc:date><swrc:journal>IBM Systems Journal</swrc:journal><swrc:month>Dec</swrc:month><swrc:number>4</swrc:number><swrc:pages>985-1001</swrc:pages><swrc:title>Towards Speech as a Knowledge Resource</swrc:title><swrc:volume>40</swrc:volume><swrc:year>2001</swrc:year><swrc:keywords>speech inf_retrieval inf_extraction </swrc:keywords><swrc:abstract>Speech is a tantalizing mode of human communication. On the one hand, humans understand speech with ease and use speech to express complex ideas, information, and knowledge. On the other hand, automatic speech recognition with computers is very hard, and extracting knowledge from speech is even harder. Nevertheless, the potential reward for solving this problem drives us to pursue it. Before we can exploit speech as a knowledge resource, however, we must understand the current state of the art in speech recognition and the relevant, successful applications of speech recognition in the related areas of multimedia indexing and search. 
In this paper we advocate the study of speech as a knowledge resource, provide a brief introduction to the state of the art in speech recognition, describe a number of systems that use speech recognition to enable multimedia analysis, indexing, and search, and present a number of exploratory applications of speech recognition that move toward the goal of exploiting speech as a knowledge resource...</swrc:abstract><swrc:author><rdf:Seq><rdf:_1><swrc:Person swrc:name="E. W. Brown"/></rdf:_1><rdf:_2><swrc:Person swrc:name="S. Srinivasan"/></rdf:_2><rdf:_3><swrc:Person swrc:name="A. Coden"/></rdf:_3><rdf:_4><swrc:Person swrc:name="D. Ponceleon"/></rdf:_4><rdf:_5><swrc:Person swrc:name="J.W. Cooper"/></rdf:_5><rdf:_6><swrc:Person swrc:name="A. Amir"/></rdf:_6></rdf:Seq></swrc:author></rdf:Description></burst:publication></item><item rdf:about="http://www.bibsonomy.org/bibtex/25e436b40d3816733a62c66429217820f/diego_ma"><title>Natural Language Processing to Improve Speech Recognition</title><link>http://www.bibsonomy.org/bibtex/25e436b40d3816733a62c66429217820f/diego_ma</link><dc:creator>diego_ma</dc:creator><dc:date>2007-12-14T02:36:28+01:00</dc:date><dc:subject>NLP speech </dc:subject><content:encoded>&lt;span style=&#034;color:#555555;&#034;&gt; &lt;a href=&#034;http://www.bibsonomy.org/author/Brainhat&#034;&gt;Brainhat&lt;/a&gt;  &lt;/span&gt;&lt;em&gt;On-line publication, &lt;/em&gt;(&lt;em&gt;2001&lt;/em&gt;)</content:encoded><taxo:topics><rdf:Bag><rdf:li rdf:resource="http://www.bibsonomy.org/tag/NLP"/><rdf:li rdf:resource="http://www.bibsonomy.org/tag/speech"/></rdf:Bag></taxo:topics><burst:publication><rdf:Description rdf:about="http://www.bibsonomy.org/bibtex/25e436b40d3816733a62c66429217820f/diego_ma"><owl:sameAs rdf:resource="http://www.bibsonomy.org/uri/bibtex/25e436b40d3816733a62c66429217820f/diego_ma"/><rdf:type rdf:resource="http://swrc.ontoware.org/ontology#Misc"/><owl:sameAs rdf:resource="http://www.brainhat.com/White\%20paper.pdf"/><swrc:date>Fri Dec 14 
02:36:28 CET 2007</swrc:date><swrc:howpublished>On-line publication</swrc:howpublished><swrc:title>Natural Language Processing to Improve Speech Recognition</swrc:title><swrc:year>2001</swrc:year><swrc:keywords>NLP speech </swrc:keywords><swrc:author><rdf:Seq><rdf:_1><swrc:Person swrc:name=" Brainhat"/></rdf:_1></rdf:Seq></swrc:author></rdf:Description></burst:publication></item><item rdf:about="http://www.bibsonomy.org/bibtex/2b6e21bef2c26443ad9baab6bd97fac24/diego_ma"><title>A Formal Framework for Linguistic Annotation</title><link>http://www.bibsonomy.org/bibtex/2b6e21bef2c26443ad9baab6bd97fac24/diego_ma</link><dc:creator>diego_ma</dc:creator><dc:date>2007-12-14T02:36:05+01:00</dc:date><dc:subject>annotation speech </dc:subject><content:encoded>&lt;span style=&#034;color:#555555;&#034;&gt;Steven &lt;a href=&#034;http://www.bibsonomy.org/author/Bird&#034;&gt;Bird&lt;/a&gt;  and Mark &lt;a href=&#034;http://www.bibsonomy.org/author/Liberman&#034;&gt;Liberman&lt;/a&gt;  &lt;/span&gt;&lt;em&gt;Speech Communication&lt;/em&gt;&lt;em&gt;33(1,2):23-60&lt;/em&gt;(&lt;em&gt;2003&lt;/em&gt;)</content:encoded><taxo:topics><rdf:Bag><rdf:li rdf:resource="http://www.bibsonomy.org/tag/annotation"/><rdf:li rdf:resource="http://www.bibsonomy.org/tag/speech"/></rdf:Bag></taxo:topics><burst:publication><rdf:Description rdf:about="http://www.bibsonomy.org/bibtex/2b6e21bef2c26443ad9baab6bd97fac24/diego_ma"><owl:sameAs rdf:resource="http://www.bibsonomy.org/uri/bibtex/2b6e21bef2c26443ad9baab6bd97fac24/diego_ma"/><rdf:type rdf:resource="http://swrc.ontoware.org/ontology#Article"/><owl:sameAs rdf:resource="http://www.ldc.upenn.edu/sb/home/publications.html"/><swrc:date>Fri Dec 14 02:36:05 CET 2007</swrc:date><swrc:journal>Speech Communication</swrc:journal><swrc:number>1,2</swrc:number><swrc:pages>23-60</swrc:pages><swrc:title>A Formal Framework for Linguistic Annotation</swrc:title><swrc:volume>33</swrc:volume><swrc:year>2003</swrc:year><swrc:keywords>annotation speech 
</swrc:keywords><swrc:abstract>`Linguistic annotation&#039; covers any descriptive or analytic notations applied to raw language data. The basic data may be in the form of time functions - audio, video and/or physiological recordings - or it may be textual. The added notations may include transcriptions of all sorts (from phonetic features to discourse structures), part-of-speech and sense tagging, syntactic analysis, `named entity&#039; identification, co-reference annotation, and so on. While there are several ongoing efforts to provide formats and tools for such annotations and to publish annotated linguistic databases, the lack of widely accepted standards is becoming a critical problem. Proposed standards, to the extent they exist, have focused on file formats. This paper focuses instead on the logical structure of linguistic annotations. We survey a wide variety of existing annotation formats and demonstrate a common conceptual core, the annotation graph. This provides a formal framework for constructing, maintaining and searching linguistic annotations, while remaining consistent with many alternative data structures and file formats.</swrc:abstract><swrc:author><rdf:Seq><rdf:_1><swrc:Person swrc:name="Steven Bird"/></rdf:_1><rdf:_2><swrc:Person swrc:name="Mark Liberman"/></rdf:_2></rdf:Seq></swrc:author></rdf:Description></burst:publication></item><item rdf:about="http://www.bibsonomy.org/bibtex/2a1cda268226866da44d71e407d59cd09/diego_ma"><title>Named Entity Recognition in Speech: Approach and Results Using the TextPro System</title><link>http://www.bibsonomy.org/bibtex/2a1cda268226866da44d71e407d59cd09/diego_ma</link><dc:creator>diego_ma</dc:creator><dc:date>2007-12-14T02:35:35+01:00</dc:date><dc:subject>speech inf_extraction </dc:subject><content:encoded>&lt;span style=&#034;color:#555555;&#034;&gt;Douglas E. 
&lt;a href=&#034;http://www.bibsonomy.org/author/Appelt&#034;&gt;Appelt&lt;/a&gt;  and David &lt;a href=&#034;http://www.bibsonomy.org/author/Martin&#034;&gt;Martin&lt;/a&gt;  &lt;/span&gt;&lt;em&gt;Proc. DARPA Broadcast News Workshop, &lt;/em&gt;&lt;em&gt;page 51-54. &lt;/em&gt;(&lt;em&gt;1999&lt;/em&gt;)</content:encoded><taxo:topics><rdf:Bag><rdf:li rdf:resource="http://www.bibsonomy.org/tag/speech"/><rdf:li rdf:resource="http://www.bibsonomy.org/tag/inf_extraction"/></rdf:Bag></taxo:topics><burst:publication><rdf:Description rdf:about="http://www.bibsonomy.org/bibtex/2a1cda268226866da44d71e407d59cd09/diego_ma"><owl:sameAs rdf:resource="http://www.bibsonomy.org/uri/bibtex/2a1cda268226866da44d71e407d59cd09/diego_ma"/><rdf:type rdf:resource="http://swrc.ontoware.org/ontology#InProceedings"/><owl:sameAs rdf:resource="http://www.speech.sri.com/projects/sieve/publications.html"/><swrc:date>Fri Dec 14 02:35:35 CET 2007</swrc:date><swrc:booktitle>Proc. DARPA Broadcast News Workshop</swrc:booktitle><swrc:pages>51-54</swrc:pages><swrc:title>Named Entity Recognition in Speech: Approach and Results Using the {TextPro} System</swrc:title><swrc:year>1999</swrc:year><swrc:keywords>speech inf_extraction </swrc:keywords><swrc:abstract>This paper describes the application of the TextPro system to the task of recognition of named entities in speech. TextPro is a lightweight engine for interpreting cascaded finite-state transducers. Although originally intended for processing text, the experience of this evaluation demonstrates the system can easily be adapted to processing transcripts generated by a speech recognizer as well.</swrc:abstract><swrc:author><rdf:Seq><rdf:_1><swrc:Person swrc:name="Douglas E. Appelt"/></rdf:_1><rdf:_2><swrc:Person swrc:name="David Martin"/></rdf:_2></rdf:Seq></swrc:author></rdf:Description></burst:publication></item></rdf:RDF>