Recently, the relation between the entropy of words (a new measure from Information Theory introduced by
Montemurro in 2001) and the role of words in literary texts, as well as the capacity of entropy for clustering words, has
been shown. Our final goal is to investigate if and how the list of ranked words (using entropy) can be useful in other
more practical contexts, such as information retrieval task or automatic classification of bio-medical textual data. In this
work, we analyze the effectiveness of the keywords selected by the Montemurro's approach to capture the semantics
behind biomedical text collections, and using the spectrum of words we offer a visual representation of the text's
content. Besides, we compare the resulting keyword lists with the ones obtained with TF-IDF measure, and discuss
some of the most interesting facts obtained from this comparison.
%0 Conference Paper
%1 esposti2010visual
%A Esposti, Mirko Degli
%A Danger, Roxana
%A Paolo, Rosso
%A Garcia-Blasco, Sandra
%B Network Tools and Applications in Biology (NETTAB 2010), Biological Wikis
%C Napoli, Italy
%D 2010
%E Facchiano, Angelo
%E Romano, Paolo
%K biomedical entropy information-theory myown sgarcia visualization
%P 139-142
%T Visual characterization of biomedical texts with word entropy
%U http://repository.dlsi.ua.es/518/1/DegliEspostiEtAl_NETTAB10.pdf
%X Recently, the relation between the entropy of words (a new measure from Information Theory introduced by
Montemurro in 2001) and the role of words in literary texts, as well as the capacity of entropy for clustering words, has
been shown. Our final goal is to investigate if and how the list of ranked words (using entropy) can be useful in other
more practical contexts, such as information retrieval task or automatic classification of bio-medical textual data. In this
work, we analyze the effectiveness of the keywords selected by the Montemurro's approach to capture the semantics
behind biomedical text collections, and using the spectrum of words we offer a visual representation of the text's
content. Besides, we compare the resulting keyword lists with the ones obtained with TF-IDF measure, and discuss
some of the most interesting facts obtained from this comparison.
@inproceedings{esposti2010visual,
abstract = {Recently, the relation between the entropy of words (a new measure from Information Theory introduced by
Montemurro in 2001) and the role of words in literary texts, as well as the capacity of entropy for clustering words, has
been shown. Our final goal is to investigate if and how the list of ranked words (using entropy) can be useful in other
more practical contexts, such as information retrieval task or automatic classification of bio-medical textual data. In this
work, we analyze the effectiveness of the keywords selected by the Montemurro's approach to capture the semantics
behind biomedical text collections, and using the spectrum of words we offer a visual representation of the text's
content. Besides, we compare the resulting keyword lists with the ones obtained with TF-IDF measure, and discuss
some of the most interesting facts obtained from this comparison.
},
added-at = {2011-06-15T13:34:20.000+0200},
address = {Napoli, Italy},
author = {Esposti, Mirko Degli and Danger, Roxana and Paolo, Rosso and Garcia-Blasco, Sandra},
biburl = {https://www.bibsonomy.org/bibtex/28576936755ae07df4bcdf68cd1ee324a/bitsnbrains},
booktitle = {Network Tools and Applications in Biology (NETTAB 2010), Biological Wikis},
editor = {Facchiano, Angelo and Romano, Paolo},
interhash = {39e4f5c53360b8040a7099249f5635b7},
intrahash = {8576936755ae07df4bcdf68cd1ee324a},
keywords = {biomedical entropy information-theory myown sgarcia visualization},
pages = {139-142},
timestamp = {2011-06-15T14:33:03.000+0200},
title = {Visual characterization of biomedical texts with word entropy},
url = {http://repository.dlsi.ua.es/518/1/DegliEspostiEtAl_NETTAB10.pdf},
year = 2010
}