% Conference paper from JCDL 2010 (Tahmasebi, Niklas, Theuerkauf, Risse).
% The record originates from a BibSonomy export (see biburl). The fields
% added-at, biburl, interhash, intrahash, keywords and timestamp are
% BibSonomy bookkeeping; they are not standard BibTeX fields and are kept
% only for round-tripping.
% NOTE(review): the doi value was derived from the doid parameter of the
% ACM url plus the ACM prefix 10.1145 -- confirm against the ACM Digital Library.
@inproceedings{conf/jcdl/TahmasebiNTR10,
  author    = {Tahmasebi, Nina and Niklas, Kai and Theuerkauf, Thomas and Risse, Thomas},
  title     = {Using Word Sense Discrimination on Historic Document Collections},
  booktitle = {Proc.\ of 10th {ACM/IEEE} Joint Conference on Digital Libraries ({JCDL}), Surfers Paradise, Gold Coast, Australia, June 21--25, 2010},
  pages     = {89--98},
  year      = {2010},
  doi       = {10.1145/1816123.1816137},
  url       = {http://dl.acm.org/citation.cfm?doid=1816123.1816137},
  abstract  = {Word sense discrimination is the first, important step towards automatic detection of language evolution within large, historic document collections. By comparing the found word senses over time, we can reveal and use important information that will improve understanding and accessibility of a digital archive. Algorithms for word sense discrimination have been developed while keeping today's language in mind and have thus been evaluated on well selected, modern datasets. The quality of the word senses found in the discrimination step has a large impact on the detection of language evolution. Therefore, as a first step, we verify that word sense discrimination can successfully be applied to digitized historic documents and that the results correctly correspond to word senses. Because accessibility of digitized historic collections is influenced also by the quality of the optical character recognition (OCR), as a second step we investigate the effects of OCR errors on word sense discrimination results. All evaluations in this paper are performed on The Times Archive, a collection of newspaper articles from 1785--1985.},
  keywords  = {JCDL2010 myown},
  added-at  = {2013-05-30T15:49:30.000+0200},
  timestamp = {2017-08-12T12:25:23.000+0200},
  biburl    = {https://www.bibsonomy.org/bibtex/2aa3ce92fd3df220678a4606dd6b1d989/tahmasebi},
  interhash = {0c00c5b69e96f0999c8fe6760a6f07c8},
  intrahash = {aa3ce92fd3df220678a4606dd6b1d989},
}