Technical terms (henceforth called terms), are important elements for digital libraries. In this paper we present a domain-independent method for the automatic extraction of multi-word terms, from machine-readable special language corpora.
The method, (C-value/NC-value), combines linguistic and statistical information. The first part, C-value, enhances the common statistical measure of frequency of occurrence for term extraction, making it sensitive to a particular type of multi-word terms, the nested terms. The second part, NC-value, gives: 1) a method for the extraction of term context words (words that tend to appear with terms), 2) the incorporation of information from term context words to the extraction of terms.
Description
CiteULike: Automatic recognition of multi-word terms: the C-value/NC-value method
%0 Journal Article
%1 Frantzi00keyphreaseExtraction
%A Frantzi, Katerina
%A Ananiadou, Sophia
%A Mima, Hideki
%D 2000
%J International Journal on Digital Libraries
%K 00 Frantzi c-value extraction keyphrease nc-value
%N 2
%P 115--130
%T Automatic recognition of multi-word terms: the C-value/NC-value method
%U http://dx.doi.org/10.1007/s007999900023
%V 3
%X Technical terms (henceforth called terms), are important elements for digital libraries. In this paper we present a domain-independent method for the automatic extraction of multi-word terms, from machine-readable special language corpora.
The method, (C-value/NC-value), combines linguistic and statistical information. The first part, C-value, enhances the common statistical measure of frequency of occurrence for term extraction, making it sensitive to a particular type of multi-word terms, the nested terms. The second part, NC-value, gives: 1) a method for the extraction of term context words (words that tend to appear with terms), 2) the incorporation of information from term context words to the extraction of terms.
@comment{Journal article introducing the C-value/NC-value method for multi-word term extraction, as exported from BibSonomy (see the biburl field). The citation key is intentionally left unchanged so that existing citations keep resolving. Fields such as added-at, biburl, day, description, interhash, intrahash, keywords and timestamp are BibSonomy bookkeeping, not standard BibTeX fields.}
@article{Frantzi00keyphreaseExtraction,
  abstract    = {Technical terms (henceforth called terms), are important elements for digital libraries. In this paper we present a domain-independent method for the automatic extraction of multi-word terms, from machine-readable special language corpora.
The method, (C-value/NC-value), combines linguistic and statistical information. The first part, C-value, enhances the common statistical measure of frequency of occurrence for term extraction, making it sensitive to a particular type of multi-word terms, the nested terms. The second part, NC-value, gives: 1) a method for the extraction of term context words (words that tend to appear with terms), 2) the incorporation of information from term context words to the extraction of terms.},
  added-at    = {2010-03-10T21:56:27.000+0100},
  author      = {Frantzi, Katerina and Ananiadou, Sophia and Mima, Hideki},
  biburl      = {https://www.bibsonomy.org/bibtex/248642e2a0c949926b954005850e637fb/lee_peck},
  day         = 25,
  description = {CiteULike: Automatic recognition of multi-word terms: the C-value/NC-value method},
  doi         = {10.1007/s007999900023},
  interhash   = {69324838535b4a1bb1aa25e503264378},
  intrahash   = {48642e2a0c949926b954005850e637fb},
  journal     = {International Journal on Digital Libraries},
  keywords    = {00 Frantzi c-value extraction keyphrease nc-value},
  month       = aug,
  number      = 2,
  pages       = {115--130},
  timestamp   = {2010-03-10T21:56:27.000+0100},
  title       = {Automatic recognition of multi-word terms: the {C-value/NC-value} method},
  url         = {http://dx.doi.org/10.1007/s007999900023},
  volume      = 3,
  year        = 2000
}