The Web graph is a giant social network whose properties have been measured and modeled extensively in recent years. Most such studies concentrate on the graph structure alone, and do not consider textual properties of the nodes. Consequently, Web communities have been characterized purely in terms of graph structure and not on page content. We propose that a topic taxonomy such as Yahoo! or the Open Directory provides a useful framework for understanding the structure of content-based clusters ...
%0 Conference Paper
%1 citeulike:348185
%A Chakrabarti, S.
%A Joshi, M.
%A Punera, K.
%A Pennock, D.
%B Proc. 11th International World Wide Web Conference
%D 2002
%I ACM Press
%K structure web
%T The structure of broad topics on the Web
%U http://citeseer.ist.psu.edu/515762.html
%X The Web graph is a giant social network whose properties have been measured and modeled extensively in recent years. Most such studies concentrate on the graph structure alone, and do not consider textual properties of the nodes. Consequently, Web communities have been characterized purely in terms of graph structure and not on page content. We propose that a topic taxonomy such as Yahoo! or the Open Directory provides a useful framework for understanding the structure of content-based clusters ...
@inproceedings{citeulike:348185,
  abstract             = {The Web graph is a giant social network whose properties have been measured and modeled extensively in recent years. Most such studies concentrate on the graph structure alone, and do not consider textual properties of the nodes. Consequently, Web communities have been characterized purely in terms of graph structure and not on page content. We propose that a topic taxonomy such as Yahoo! or the Open Directory provides a useful framework for understanding the structure of content-based clusters ...},
  added-at             = {2007-08-18T13:22:24.000+0200},
  author               = {Chakrabarti, S. and Joshi, M. and Punera, K. and Pennock, D.},
  biburl               = {https://www.bibsonomy.org/bibtex/2e4bf1fe4057d90961bdd3394eea41ae5/a_olympia},
  booktitle            = {Proc. 11th International World Wide Web Conference},
  citeulike-article-id = {348185},
  description          = {citeulike},
  interhash            = {bbeafbf042320a27ec0a5fae7ba5b3b3},
  intrahash            = {e4bf1fe4057d90961bdd3394eea41ae5},
  keywords             = {structure web},
  priority             = {2},
  publisher            = {ACM Press},
  timestamp            = {2007-08-18T13:22:37.000+0200},
  title                = {The structure of broad topics on the {Web}},
  url                  = {http://citeseer.ist.psu.edu/515762.html},
  year                 = {2002},
}