The popularity of social bookmarking sites has made them prime targets for spammers. Many of these systems require an administrator's time and energy to manually filter or remove spam. Here we discuss the motivations of social spam, and present a study of automatic detection of spammers in a social tagging system. We identify and analyze six distinct features that address various properties of social spam, finding that each of these features provides for a helpful signal to discriminate spammers from legitimate users. These features are then used in various machine learning algorithms for classification, achieving over 98% accuracy in detecting social spammers with 2% false positives. These promising results provide a new baseline for future efforts on social spam. We make our dataset publicly available to the research community.
%0 Conference Paper
%1 social-spam-markines
%A Markines, Benjamin
%A Cattuto, Ciro
%A Menczer, Filippo
%B Proceedings of the 5th International Workshop on Adversarial Information Retrieval on the Web
%C New York, New York, USA
%D 2009
%E Fetterly, Dennis
%E Gyöngyi, Zoltán
%I ACM Press
%K qual social-spam
%P 41--48
%R 10.1145/1531914.1531924
%T Social spam detection
%U http://dx.doi.org/10.1145/1531914.1531924
%X The popularity of social bookmarking sites has made them prime targets for spammers. Many of these systems require an administrator's time and energy to manually filter or remove spam. Here we discuss the motivations of social spam, and present a study of automatic detection of spammers in a social tagging system. We identify and analyze six distinct features that address various properties of social spam, finding that each of these features provides for a helpful signal to discriminate spammers from legitimate users. These features are then used in various machine learning algorithms for classification, achieving over 98% accuracy in detecting social spammers with 2% false positives. These promising results provide a new baseline for future efforts on social spam. We make our dataset publicly available to the research community.
%@ 9781605584386
% Markines, Cattuto and Menczer (2009): workshop paper on automatic detection
% of spammers in a social tagging system, published in the AIRWeb '09 proceedings.
% Field notes:
%   - address is the publisher's city; the conference city is kept in venue.
%   - Accented letters in editor use the {\"o} / {\'a} special-character form
%     so that classic BibTeX sorts and labels the names correctly.
%   - added-at, biburl, citeulike-*, interhash, intrahash, posted-at, priority
%     and timestamp are bookkeeping fields carried over from the export; they
%     are not standard BibTeX fields.
@inproceedings{social-spam-markines,
  abstract             = {The popularity of social bookmarking sites has made them prime targets for spammers. Many of these systems require an administrator's time and energy to manually filter or remove spam. Here we discuss the motivations of social spam, and present a study of automatic detection of spammers in a social tagging system. We identify and analyze six distinct features that address various properties of social spam, finding that each of these features provides for a helpful signal to discriminate spammers from legitimate users. These features are then used in various machine learning algorithms for classification, achieving over 98\% accuracy in detecting social spammers with 2\% false positives. These promising results provide a new baseline for future efforts on social spam. We make our dataset publicly available to the research community.},
  added-at             = {2011-09-28T23:59:32.000+0200},
  address              = {New York, New York, USA},
  author               = {Markines, Benjamin and Cattuto, Ciro and Menczer, Filippo},
  biburl               = {https://www.bibsonomy.org/bibtex/26d924143a07b29e39da7f227a4a7bcd8/dimitargn},
  booktitle            = {Proceedings of the 5th International Workshop on Adversarial Information Retrieval on the Web},
  citeulike-article-id = {4524185},
  citeulike-linkout-0  = {http://portal.acm.org/citation.cfm?id=1531914.1531924},
  citeulike-linkout-1  = {http://dx.doi.org/10.1145/1531914.1531924},
  doi                  = {10.1145/1531914.1531924},
  editor               = {Fetterly, Dennis and Gy{\"o}ngyi, Zolt{\'a}n},
  interhash            = {50847302da776b6e04e53209a0b54699},
  intrahash            = {6d924143a07b29e39da7f227a4a7bcd8},
  isbn                 = {9781605584386},
  keywords             = {qual social-spam},
  pages                = {41--48},
  posted-at            = {2011-09-09 19:05:29},
  priority             = {3},
  publisher            = {ACM Press},
  series               = {AIRWeb '09},
  timestamp            = {2011-10-13T17:44:57.000+0200},
  title                = {Social Spam Detection},
  url                  = {http://dx.doi.org/10.1145/1531914.1531924},
  venue                = {Madrid, Spain},
  year                 = {2009},
}