HERMIT: Flexible clustering for the SemEval-2 WSI task
D. Jurgens, and K. Stevens. Proceedings of the 5th International Workshop on Semantic Evaluation, page 359--362. Stroudsburg, PA, USA, Association for Computational Linguistics, (2010)
Abstract
A single word may have multiple unspecified meanings in a corpus. Word sense induction aims to discover these different meanings through word use, and knowledge-lean algorithms attempt this without using external lexical resources. We propose a new method for identifying the different senses that uses a flexible clustering strategy to automatically determine the number of senses, rather than predefining it. We demonstrate the effectiveness using the SemEval-2 WSI task, achieving competitive scores on both the V-Measure and Recall metrics, depending on the parameter configuration.
%0 Conference Paper
%1 hermit
%A Jurgens, David
%A Stevens, Keith
%B Proceedings of the 5th International Workshop on Semantic Evaluation
%C Stroudsburg, PA, USA
%D 2010
%I Association for Computational Linguistics
%K 2010 dimensionality hermit index random reduction semeval vector wsi
%P 359--362
%T HERMIT: Flexible clustering for the SemEval-2 WSI task
%U http://dl.acm.org/citation.cfm?id=1859664.1859744
%X A single word may have multiple unspecified meanings in a corpus. Word sense induction aims to discover these different meanings through word use, and knowledge-lean algorithms attempt this without using external lexical resources. We propose a new method for identifying the different senses that uses a flexible clustering strategy to automatically determine the number of senses, rather than predefining it. We demonstrate the effectiveness using the SemEval-2 WSI task, achieving competitive scores on both the V-Measure and Recall metrics, depending on the parameter configuration.
@inproceedings{hermit,
abstract = {A single word may have multiple unspecified meanings in a corpus. Word sense induction aims to discover these different meanings through word use, and knowledge-lean algorithms attempt this without using external lexical resources. We propose a new method for identifying the different senses that uses a flexible clustering strategy to automatically determine the number of senses, rather than predefining it. We demonstrate the effectiveness using the SemEval-2 WSI task, achieving competitive scores on both the V-Measure and Recall metrics, depending on the parameter configuration.},
acmid = {1859744},
added-at = {2011-09-07T13:32:24.000+0200},
address = {Stroudsburg, PA, USA},
author = {Jurgens, David and Stevens, Keith},
biburl = {https://www.bibsonomy.org/bibtex/2e8352c8efd12a683efa8d54b1c17291d/jil},
booktitle = {Proceedings of the 5th International Workshop on Semantic Evaluation},
interhash = {8240e1dfea18f65df155e09f93d79672},
intrahash = {e8352c8efd12a683efa8d54b1c17291d},
keywords = {2010 dimensionality hermit index random reduction semeval vector wsi},
location = {Los Angeles, California},
numpages = {4},
pages = {359--362},
publisher = {Association for Computational Linguistics},
series = {SemEval '10},
timestamp = {2013-11-23T20:11:51.000+0100},
title = {HERMIT: Flexible clustering for the SemEval-2 WSI task},
url = {http://dl.acm.org/citation.cfm?id=1859664.1859744},
year = 2010
}