% JRC45828 -- four-page workshop paper, so it is typed as @inproceedings
% rather than @book.
% NOTE(review): booktitle was absent from the exported record; it is inferred
%   from the workshop URL (AIRWeb 2008) -- confirm against the publisher record.
% NOTE(review): the exported record carries only author initials; expand to
%   full given names once verified.
% NOTE(review): address holds the workshop location as given in the export,
%   not the publisher's city.
@inproceedings{JRC45828,
  author       = {Piskorski, J. and Sydow, M. and Weiss, D.},
  title        = {Exploring Linguistic Features for {Web} Spam Detection: A Preliminary Study},
  booktitle    = {Proceedings of the 4th International Workshop on Adversarial Information Retrieval on the {Web} ({AIRWeb} 2008)},
  pages        = {1--4},
  publisher    = {ACM},
  address      = {Beijing, China},
  year         = {2008},
  url          = {http://airweb.cse.lehigh.edu/2008/submissions/piskorski_2008_linguistic_analysis_spam.pdf},
  workshop-url = {http://airweb.cse.lehigh.edu/2008},
  abstract     = {We study the usability of linguistic features in the Web spam classification task. The features were computed on two Web spam corpora: Webspam-Uk2006 and Webspam-Uk2007, we make them publicly available for other researchers. Preliminary analysis seems to indicate that certain linguistic features may be useful for the spam-detection task when combined with features studied elsewhere.},
}