% Three records describing the same WebDB 2000 workshop paper by Haveliwala,
% Gionis and Indyk, each taken from a different BibSonomy post (see biburl).
% All three citation keys are kept so that existing \cite commands keep
% resolving; cite only ONE of them per document, otherwise the paper shows up
% several times in the bibliography.

% Record 1: carries a CiteULike id; the abstract is truncated ("...") in the
% exported data and is reproduced as found.
@inproceedings{Haveliwala00ScalableTechniquesClusteringWeb,
  author               = {Haveliwala, Taher H. and Gionis, Aristides and Indyk, Piotr},
  title                = {Scalable Techniques for Clustering the Web},
  booktitle            = {{WebDB} (Informal Proceedings)},
  pages                = {129--134},
  year                 = {2000},
  url                  = {http://citeseer.ist.psu.edu/haveliwala00scalable.html},
  biburl               = {http://www.bibsonomy.org/bibtex/26a9c1bc0c0c42ad9f5072528f5b7bcff/mgrani},
  abstract             = {Clustering is one of the most crucial techniques for dealing with the massive amount of information present on the web. Clustering can either be performed once offline, independent of search queries, or performed online on the results of search queries. Our offline approach aims to efficiently cluster similar pages on the web, using the technique of Locality-Sensitive Hashing (LSH), in which web pages are hashed in such a way that similar pages have a much higher probability of collision than...},
  priority             = {2},
  citeulike-article-id = {446846},
  keywords             = {clustering, web},
}

% Record 2: the only record with the full proceedings title and editors.
@inproceedings{haveliwala00scalable,
  author    = {Haveliwala, Taher H. and Gionis, Aristides and Indyk, Piotr},
  title     = {Scalable Techniques for Clustering the Web},
  booktitle = {Proceedings of the Third International Workshop on the Web and Databases, {WebDB} 2000, in conjunction with {ACM} {PODS/SIGMOD} 2000},
  editor    = {Suciu, Dan and Vossen, Gottfried},
  pages     = {129--134},
  year      = {2000},
  url       = {http://www.research.att.com/conf/webdb2000/PAPERS/8c.ps},
  biburl    = {http://www.bibsonomy.org/bibtex/239497aee54a82587f4c921dd9ee36275/msn},
  language  = {english},
  keywords  = {cites.gradu mrefs research.clustering},
}

% Record 3: dblp-derived record.
% NOTE(review): the original carried date = 2002-01-03 next to year = 2000.
% That value is presumably the dblp record-modification stamp, not the
% publication date; under biblatex a date field overrides year, so it has been
% moved to the ignored timestamp field. Confirm against the dblp record.
@inproceedings{conf/webdb/HaveliwalaGI00,
  author      = {Haveliwala, Taher H. and Gionis, Aristides and Indyk, Piotr},
  title       = {Scalable Techniques for Clustering the Web},
  booktitle   = {{WebDB} (Informal Proceedings)},
  pages       = {129--134},
  year        = {2000},
  url         = {http://dblp.uni-trier.de/db/conf/webdb/webdb2000.html#HaveliwalaGI00},
  ee          = {http://www.research.att.com/conf/webdb2000/PAPERS/8c.ps},
  biburl      = {http://www.bibsonomy.org/bibtex/2107992a29fb16a42299a53ee1cfa75d7/dblp},
  description = {dblp},
  timestamp   = {2002-01-03},
  keywords    = {dblp},
}