% Broder's SEQUENCES '97 paper on document resemblance and containment
% (tagged "on shingles" in the description field).  The added-at, biburl,
% interhash, intrahash and timestamp fields are BibSonomy export metadata;
% standard styles ignore unknown fields, so they are kept for provenance.
@inproceedings{broder1997,
  author      = {Broder, Andrei Z.},
  title       = {On the Resemblance and Containment of Documents},
  booktitle   = {{SEQUENCES} '97: Proceedings of the Compression and Complexity of Sequences 1997},
  pages       = {21--29},
  publisher   = {IEEE Computer Society},
  address     = {Washington, DC, USA},
  year        = 1997,
  doi         = {10.1109/SEQUEN.1997.666900},
  keywords    = {INFLUENTIAL information-retrieval similarity},
  description = {on shingles},
  added-at    = {2009-08-19T01:22:38.000+0200},
  timestamp   = {2009-08-19T01:22:38.000+0200},
  biburl      = {http://www.bibsonomy.org/bibtex/278b3f3faced79adfcda4e3a57f7e57ff/mstrohm},
  interhash   = {3e9b05638c537f23a276ef4e09d4b9d4},
  intrahash   = {78b3f3faced79adfcda4e3a57f7e57ff},
}