% Chapter in the edited volume "Applied Soft Computing Technologies" (2006).
% Typed as incollection because the chapter authors differ from the volume
% editors; classic styles only print booktitle/editor for that entry type.
% publisher is inferred from the DOI prefix (10.1007) and the ISBN prefix
% (3-540) -- TODO confirm against the publisher record.
% NOTE(review): editor names "Baets" and "Koeppen" look like export artefacts
% (possibly "De Baets" and an umlaut spelling) -- verify before relying on them.
@incollection{1f02b7234a0d4324b3209fc08bd8ccd9,
  author    = {Tantu{\u{g}}, A. C{\"u}neyd and Eryi{\u{g}}it, G{\"u}l{\c{s}}en},
  title     = {Performance analysis of Na{\"i}ve {Bayes} classification, Support Vector Machines and Neural Networks for spam categorization},
  editor    = {Abraham, Ajith and Baets, Bernard and Koeppen, Mario and Nickolay, Bertram},
  booktitle = {Applied Soft Computing Technologies},
  series    = {Advances in Soft Computing},
  publisher = {Springer},
  year      = {2006},
  pages     = {495--504},
  doi       = {10.1007/3-540-31662-0_38},
  isbn      = {3540316493},
  language  = {English},
  abstract  = {Spam mail recognition is a new growing field which brings together the topic of natural language processing and machine learning as it is in essence a two class classification of natural language texts. An important feature of spam recognition is that it is a cost-sensitive classification: misclassification of a nonspam mail as spam is generally a more severe error than misclassifying a spam mail as non-spam. In order to be compared, the methods applied to this field should be all evaluated with the same corpus and within the same cost-sensitive framework. In this paper, the performances of Support Vector Machines (SVM), Neural Networks (NN) and Na{\"i}ve Bayes (NB) techniques are compared using a publicly available corpus (LINGSPAM) for different cost scenarios. The training time complexities of the methods are also evaluated. The results show that NN has significantly better performance than the two other, having acceptable training times. NB gives better results than SVM when the cost is extremely high while in all other cases SVM outperforms NB.},
}