In this paper we address the problem of discovering missing hypertext links in Wikipedia. The method we propose consists of two steps: first, we compute a cluster of highly similar pages around a given page, and then we identify candidate links from those similar pages that might be missing on the given page. The main innovation is in the algorithm that we use for identifying similar pages, LTRank, which ranks pages using co-citation and page title information. Both LTRank and the link discovery method are manually evaluated and show acceptable results, especially given the simplicity of the methods and conservativeness of the evaluation criteria.
%0 Conference Paper
%1 Adafre:2005:DML:1134271.1134284
%A Adafre, Sisay Fissaha
%A de Rijke, Maarten
%B Proceedings of the 3rd international workshop on Link discovery
%C New York, NY, USA
%D 2005
%I ACM
%K links missing seminar ss2015 talk wikipedia
%P 90--97
%R 10.1145/1134271.1134284
%T Discovering missing links in Wikipedia
%U http://doi.acm.org/10.1145/1134271.1134284
%X In this paper we address the problem of discovering missing hypertext links in Wikipedia. The method we propose consists of two steps: first, we compute a cluster of highly similar pages around a given page, and then we identify candidate links from those similar pages that might be missing on the given page. The main innovation is in the algorithm that we use for identifying similar pages, LTRank, which ranks pages using co-citation and page title information. Both LTRank and the link discovery method are manually evaluated and show acceptable results, especially given the simplicity of the methods and conservativeness of the evaluation criteria.
%@ 1-59593-215-1
% Conference paper published by ACM in the LinkKDD '05 series. "Wikipedia" is brace-protected in the title so that sentence-casing styles keep its capital letter.
@inproceedings{Adafre:2005:DML:1134271.1134284,
  abstract    = {In this paper we address the problem of discovering missing hypertext links in Wikipedia. The method we propose consists of two steps: first, we compute a cluster of highly similar pages around a given page, and then we identify candidate links from those similar pages that might be missing on the given page. The main innovation is in the algorithm that we use for identifying similar pages, LTRank, which ranks pages using co-citation and page title information. Both LTRank and the link discovery method are manually evaluated and show acceptable results, especially given the simplicity of the methods and conservativeness of the evaluation criteria.},
  acmid       = {1134284},
  added-at    = {2015-06-17T22:22:36.000+0200},
  address     = {New York, NY, USA},
  author      = {Adafre, Sisay Fissaha and de Rijke, Maarten},
  biburl      = {https://www.bibsonomy.org/bibtex/2bba5ab3fba5c66ad99da35cccfd075aa/magnuslechner},
  booktitle   = {Proceedings of the 3rd international workshop on Link discovery},
  description = {Discovering missing links in Wikipedia},
  doi         = {10.1145/1134271.1134284},
  interhash   = {4e320a2ee75ba8f52d8e7bdc3af25e5a},
  intrahash   = {bba5ab3fba5c66ad99da35cccfd075aa},
  isbn        = {1-59593-215-1},
  keywords    = {links missing seminar ss2015 talk wikipedia},
  location    = {Chicago, Illinois},
  numpages    = {8},
  pages       = {90--97},
  publisher   = {ACM},
  series      = {LinkKDD '05},
  timestamp   = {2015-06-17T22:22:36.000+0200},
  title       = {Discovering missing links in {Wikipedia}},
  url         = {http://doi.acm.org/10.1145/1134271.1134284},
  year        = {2005},
}