% Bibliography on spoken dialogue systems and tutoring dialogue systems.
% Layout: one field per line; bibliographic fields first, then the
% BibSonomy bookkeeping fields (added-at, timestamp, biburl, interhash,
% intrahash), which standard styles ignore.

% Survey article on spoken dialogue technology.
@article{McTear:2002,
  author    = {McTear, Michael F.},
  title     = {Spoken Dialogue Technology: Enabling the Conversational User Interface},
  journal   = {ACM Computing Surveys},
  volume    = {34},
  number    = {1},
  pages     = {90--169},
  year      = {2002},
  url       = {http://portal.acm.org/citation.cfm?id=505285},
  abstract  = {Spoken dialogue systems allow users to interact with computer-based applications such as databases and expert systems by using natural spoken language. The origins of spoken dialogue systems can be traced back to Artificial Intelligence research in the 1950s concerned with developing conversational interfaces. However, it is only within the last decade or so, with major advances in speech technology, that large-scale working systems have been developed and, in some cases, introduced into commercial environments. As a result many major telecommunications and software companies have become aware of the potential for spoken dialogue technology to provide solutions in newly developing areas such as computer-telephony integration. Voice portals, which provide a speech-based interface between a telephone user and Web-based services, are the most recent application of spoken dialogue technology. This article describes the main components of the technology---speech recognition, language understanding, dialogue management, communication with an external source such as a database, language generation, speech synthesis---and shows how these component technologies can be integrated into a spoken dialogue system. The article describes in detail the methods that have been adopted in some well-known dialogue systems, explores different system architectures, considers issues of specification, design, and evaluation, reviews some currently available dialogue development toolkits, and outlines prospects for future development.},
  keywords  = {speech dialogue_system},
  added-at  = {2007-12-14T02:43:14.000+0100},
  timestamp = {2007-12-14T02:43:14.000+0100},
  biburl    = {http://www.bibsonomy.org/bibtex/29d0c0e63dfcb696cf90b0981309a0b69/diego_ma},
  interhash = {e808979df60268c15d5684ca9398c479},
  intrahash = {9d0c0e63dfcb696cf90b0981309a0b69},
}

% Second of two 1998 papers by the same authors (hence the "b" key suffix).
@inproceedings{Kim:1998b,
  author    = {Kim, Jung Hee and Freedman, Reva and Evens, Martha W.},
  title     = {Responding to Unexpected Student Utterances in {CIRCSIM}-Tutor v.3: Analysis of transcripts},
  booktitle = {Proceedings of the 11th International Florida Artificial Intelligence Research Symposium},
  address   = {Sanibel Island},
  pages     = {153--157},
  year      = {1998},
  keywords  = {tutoring_system dialogue_system},
  added-at  = {2007-12-14T02:41:35.000+0100},
  timestamp = {2007-12-14T02:41:35.000+0100},
  biburl    = {http://www.bibsonomy.org/bibtex/215f6f0f4ef402f161b5f5047a4618d81/diego_ma},
  interhash = {c87b0e408d927ebd76aef89f7eccad65},
  intrahash = {15f6f0f4ef402f161b5f5047a4618d81},
}

@inproceedings{Kim:1998,
  author    = {Kim, Jung Hee and Freedman, Reva and Evens, Martha W.},
  title     = {Relationship between Tutorial Goals and Sentence Structure in a Corpus of Tutoring Transcripts},
  booktitle = {Proceedings of Midwest Artificial Intelligence and Cognitive Science Society Conference},
  address   = {Dayton},
  pages     = {124--131},
  year      = {1998},
  keywords  = {tutoring_system dialogue_system},
  added-at  = {2007-12-14T02:41:34.000+0100},
  timestamp = {2007-12-14T02:41:34.000+0100},
  biburl    = {http://www.bibsonomy.org/bibtex/200917d770c1fb36933fc8f145829bd19/diego_ma},
  interhash = {6eaa67a9180472e1ee118468a48e0102},
  intrahash = {00917d770c1fb36933fc8f145829bd19},
}

@article{Gorin:2002,
  author    = {Gorin, Allen L. and Abella, Alicia and Alonso, Tirso and Riccardi, Giuseppe and Wright, Jeremy H.},
  title     = {Automated Natural Spoken Dialog},
  journal   = {IEEE Computer},
  volume    = {35},
  number    = {4},
  pages     = {51--56},
  year      = {2002},
  abstract  = {The next generation of voice-based interface technology will enable easy-to-use automation of new and existing communication services, making human-machine interaction more natural.},
  keywords  = {speech dialogue_system},
  added-at  = {2007-12-14T02:39:27.000+0100},
  timestamp = {2007-12-14T02:39:27.000+0100},
  biburl    = {http://www.bibsonomy.org/bibtex/2a43fbdd1cd0f2de278eda8fbdb4886ee/diego_ma},
  interhash = {89e6100d573df5a18574fa342ddc3fb3},
  intrahash = {a43fbdd1cd0f2de278eda8fbdb4886ee},
}

% The original record carried "Forthcoming" in the year field and a
% placeholder instead of a URL. The year is taken from the citation key and
% the booktitle; the qualifier now lives in note, and the placeholder is kept
% in an ignored field until a real URL is found.
@inproceedings{Glass:1997,
  author        = {Glass, Michael},
  title         = {Some Phenomena Handled by the {CIRCSIM}-Tutor Version 3 Input Understander},
  booktitle     = {Proceedings of the 1997 Florida Artificial Intelligence Research Symposium, FLAIRS},
  year          = {1997},
  note          = {Forthcoming},
  internal-note = {TODO: find the real URL; the url field originally read: CIRCSIM's web page?},
  keywords      = {tutoring_system dialogue_system},
  added-at      = {2007-12-14T02:39:26.000+0100},
  timestamp     = {2007-12-14T02:39:26.000+0100},
  biburl        = {http://www.bibsonomy.org/bibtex/2d16a826c5f66eab8e686fcaa0ded944c/diego_ma},
  interhash     = {724811282e9c809b027ecbb180f1eea2},
  intrahash     = {d16a826c5f66eab8e686fcaa0ded944c},
}

% The url holds a raw tilde; the url field is expected to be typeset
% verbatim by the bibliography style.
@inproceedings{Freedman:1998,
  author    = {Freedman, Reva and Brandle, Stefan and Glass, Michael and Kim, Jung Hee and Zhou, Yujian and Evens, Martha W.},
  title     = {System Demonstration Content Planning as the Basis for an Intelligent Tutoring System},
  booktitle = {Proceedings of the Ninth International Workshop on Natural Language Generation (INLG-9)},
  address   = {Niagara-on-the-Lake, Ontario},
  pages     = {280--283},
  year      = {1998},
  url       = {http://www.csam.iit.edu/~circsim},
  keywords  = {tutoring_system dialogue_system},
  added-at  = {2007-12-14T02:39:03.000+0100},
  timestamp = {2007-12-14T02:39:03.000+0100},
  biburl    = {http://www.bibsonomy.org/bibtex/23b1cbaaf74cac4315f21ec4ca8272852/diego_ma},
  interhash = {7708357e9b564b95fea552473f51a225},
  intrahash = {3b1cbaaf74cac4315f21ec4ca8272852},
}

% {ITS} is braced so sentence-casing styles keep the acronym upper-case.
@inproceedings{Freedman:1996,
  author    = {Freedman, Reva},
  title     = {Using a Text Planner to Model the Behavior of Human Tutors in an {ITS}},
  booktitle = {Online Proceedings of the 1996 Midwest Artificial Intelligence and Cognitive Science Conference},
  editor    = {Gasser, Michael},
  year      = {1996},
  url       = {http://www.cs.indiana.edu/event/maics96/Proceedings/Freedman/freedman.html},
  keywords  = {tutoring_system dialogue_system},
  added-at  = {2007-12-14T02:39:02.000+0100},
  timestamp = {2007-12-14T02:39:02.000+0100},
  biburl    = {http://www.bibsonomy.org/bibtex/231fa7099581296dd44c5ec5b1cd05a41/diego_ma},
  interhash = {9117a0a97561c374ee83755b2175fffe},
  intrahash = {31fa7099581296dd44c5ec5b1cd05a41},
}

@inproceedings{Freedman:1997,
  author    = {Freedman, Reva},
  title     = {Degrees of Mixed-Initiative Interaction in an Intelligent Tutoring System},
  booktitle = {Proceedings of the AAAI 1997 Spring Symposium on Computational Models for Mixed-Initiative Interaction},
  year      = {1997},
  keywords  = {tutoring_system dialogue_system},
  added-at  = {2007-12-14T02:39:01.000+0100},
  timestamp = {2007-12-14T02:39:01.000+0100},
  biburl    = {http://www.bibsonomy.org/bibtex/2cb2be4522cf29495632413ddee182f6c/diego_ma},
  interhash = {09d673c117cd3e912ddcbced2a2e6d00},
  intrahash = {cb2be4522cf29495632413ddee182f6c},
}

% The publications-page link was stored in note in the original record; it
% is now in url, like the other entries in this file.
@inproceedings{Ballim:2000,
  author    = {Ballim, Afzal and Pallotta, Vincenzo},
  title     = {The role of robust semantic analysis in spoken language dialogue systems},
  booktitle = {Proceedings of the 3rd International Workshop on Human-Computer Conversation},
  address   = {Bellagio, Italy},
  year      = {2000},
  url       = {http://lithwww.epfl.ch/~pallotta/publications.html},
  abstract  = {In this paper we summarized a framework for designing grammar-based procedure for the automatic extraction of the semantic content from spoken queries. Starting with a case study and following an approach which combines the notions of fuzziness and robustness in sentence parsing, we showed we built practical domain-dependent rules which can be applied whenever it is possible to superimpose a sentence-level semantic structure to a text without relying on a previous deep syntactical analysis. This kind of procedure can be also profitably used as a pre-processing tool in order to cut out part of the sentence which have been recognized to have no relevance in the understanding process. In the case of particular dialogue applications where there is no need to build a complex semantic structure (e.g. word spotting or excerpting) the presented methodology may represent an efficient alternative solution to a sequential composition of deep linguistic analysis modules. Even if the query generation problem may not seem a critical application it should be held in mind that the sentence processing must be done on-line. Having this kind of constraints we cannot design our system without caring for efficiency and thus provide an immediate response. Another critical issue is related to whole robustness of the system. In our case study we tried to make experiences on how it is possible to deal with an unreliable and noisy input without asking the user for any repetition or clarification. This may correspond to a similar problem one may have when processing text coming from informal writing such as e-mails, news and in many cases Web pages where it is often the case to have irrelevant surrounding information.},
  keywords  = {dialogue_system},
  added-at  = {2007-12-14T02:35:44.000+0100},
  timestamp = {2007-12-14T02:35:44.000+0100},
  biburl    = {http://www.bibsonomy.org/bibtex/2b01763dc61196816d5e4770b26688ac5/diego_ma},
  interhash = {6ffc798a029c7b184b05f9ec76bc2ed7},
  intrahash = {b01763dc61196816d5e4770b26688ac5},
}