A. Chandra, M. Suaib, and D. Beg. Informatics Engineering, an International Journal (IEIJ), 2 (3):
01 - 07(September 2014)
Abstract
Web spam is a big challenge for quality of search engine results. It is very important for search engines to detect web spam accurately. In this paper we present 32 low cost quality factors to classify spam and ham pages on real time basis. These features can be divided in to three categories: (i) URL features, (ii) Content features, and (iii) Link features. We developed a classifier using Resilient Back-propagation learning algorithm of neural network and obtained good accuracy. This classifier can be applied to search engine results on real time because calculation of these features require very little CPU resources.
%0 Journal Article
%1 chandra2014quality
%A Chandra, Ashish
%A Suaib, Mohammad
%A Beg, Dr. Rizwan
%D 2014
%J Informatics Engineering, an International Journal (IEIJ)
%K Classifier Detection Engine Network Neural Search Spam Web
%N 3
%P 01 - 07
%T Low Cost Page Quality Factors To Detect Web Spam
%U http://airccse.org/journal/ieij/vol2.html
%V 2
%X Web spam is a big challenge for quality of search engine results. It is very important for search engines to detect web spam accurately. In this paper we present 32 low cost quality factors to classify spam and ham pages on real time basis. These features can be divided in to three categories: (i) URL features, (ii) Content features, and (iii) Link features. We developed a classifier using Resilient Back-propagation learning algorithm of neural network and obtained good accuracy. This classifier can be applied to search engine results on real time because calculation of these features require very little CPU resources.
@article{chandra2014quality,
abstract = {Web spam is a big challenge for quality of search engine results. It is very important for search engines to detect web spam accurately. In this paper we present 32 low cost quality factors to classify spam and ham pages on real time basis. These features can be divided in to three categories: (i) URL features, (ii) Content features, and (iii) Link features. We developed a classifier using Resilient Back-propagation learning algorithm of neural network and obtained good accuracy. This classifier can be applied to search engine results on real time because calculation of these features require very little CPU resources.},
added-at = {2020-10-29T11:07:03.000+0100},
author = {Chandra, Ashish and Suaib, Mohammad and Beg, Dr. Rizwan},
biburl = {https://www.bibsonomy.org/bibtex/2ad22099c7f0493f71c682088aaf39104/ieij1},
interhash = {f1b2c279b86db523f314b7b4d5d11878},
intrahash = {ad22099c7f0493f71c682088aaf39104},
journal = {Informatics Engineering, an International Journal (IEIJ)},
keywords = {Classifier Detection Engine Network Neural Search Spam Web},
month = {September},
number = 3,
pages = {01 - 07},
timestamp = {2020-10-29T11:08:09.000+0100},
title = {Low Cost Page Quality Factors To Detect Web Spam},
url = {http://airccse.org/journal/ieij/vol2.html},
volume = 2,
year = 2014
}