% Chapter (pp. 151--181) by Taibi, Marenzi and Ahmad in a volume edited by
% Baldry, Bianchi and Loiacono; entry exported from BibSonomy.
% NOTE(review): the authors differ from the editors, so the incollection type
% with a booktitle would be the more specific choice, but the volume title is
% not recorded here -- confirm against the publisher page and add it.
% NOTE(review): volume and number are both 1; verify which one the publisher
% actually uses (classic styles warn when both are present).
@inbook{taibi2019sweet,
  author    = {Taibi, Davide and Marenzi, Ivana and Ahmad, Qazi Asim Ijaz},
  title     = {Ain't that sweet. {Reflections} on scene level indexing and annotation in the {House Corpus Project}},
  editor    = {Baldry, Anthony and Bianchi, Francesca and Loiacono, Anna},
  publisher = {ESE - Salento University Publishing},
  volume    = 1,
  number    = 1,
  pages     = {151--181},
  year      = 2019,
  isbn      = {978-88-8305-153-1},
  doi       = {10.1285/i9788883051531p151},
  abstract  = {This paper outlines the strategies, rationale and potential uses motivating the construction of the House Corpus, a one-million-word corpus that can be accessed by authorised users through the MWSWeb site (Taibi et al. 2015a) at http://openmws.itd.cnr.it. Part 1 illustrates the tools and techniques used to index the corpus data -- transcriptions of all 177 episodes in the House MD series (original US version). In particular, it describes the commercially available Elasticsearch (https://www.elastic.co), used as an indexing, annotational and search tool. Part 2 explains that this is a multimedia corpus allowing viewings of different types of scene. The 6000-plus scenes in the corpus have been annotated in terms of their typological features: Location type (e.g. patient's hospital room; medical lab etc.); Event type (handover; differential diagnosis; precipitating medical event; patient examination etc.) and Character Group type...},
  keywords  = {myown sysrelevantforl3s},
  added-at  = {2020-01-23T19:23:45.000+0100},
  timestamp = {2020-01-23T19:23:45.000+0100},
  biburl    = {https://www.bibsonomy.org/bibtex/2705b48406849dd49fa3bf985c922abc0/marenzi},
  interhash = {04a02f646ae1c173830bd4f915acf519},
  intrahash = {705b48406849dd49fa3bf985c922abc0},
}