Web crawlers are one of the most crucial components in search engines and their optimization would have a great effect on improving the searching efficiency. In this paper, we introduce an intelligent crawler called Gcrawler that uses a genetic algorithm for improving its crawling performance. Gcrawler estimates the best path for crawling on one hand and expands its initial keywords by using a genetic algorithm during the crawling on the other hand. This is the first crawler that acts intelligently without any relevance feedback or training. All the processes are online and there is no need for direct interaction with the users.
Beschreibung
IEEEXplore# Enhancing focused crawling with genetic algorithms
%0 Conference Paper
%1 Shokouhi:2005
%A Shokouhi, M.
%A Chubak, P.
%A Raeesy, Z.
%B Information Technology: Coding and Computing, 2005. ITCC 2005. International Conference on
%D 2005
%K crawl p:diss p:holmes soc
%P 503-508
%R 10.1109/ITCC.2005.145
%T Enhancing focused crawling with genetic algorithms
%U http://ieeexplore.ieee.org/xpl/freeabs_all.jsp?arnumber=1425193
%V 2
%X Web crawlers are one of the most crucial components in search engines and their optimization would have a great effect on improving the searching efficiency. In this paper, we introduce an intelligent crawler called Gcrawler that uses a genetic algorithm for improving its crawling performance. Gcrawler estimates the best path for crawling on one hand and expands its initial keywords by using a genetic algorithm during the crawling on the other hand. This is the first crawler that acts intelligently without any relevance feedback or training. All the processes are online and there is no need for direct interaction with the users.
%@ 0-7695-2315-3
@comment{Shokouhi:2005 -- conference paper in the ITCC 2005 proceedings, volume 2. The pages field holds only the page range; the volume number is recorded in the volume field.}
@inproceedings{Shokouhi:2005,
  abstract    = {Web crawlers are one of the most crucial components in search engines and their optimization would have a great effect on improving the searching efficiency. In this paper, we introduce an intelligent crawler called Gcrawler that uses a genetic algorithm for improving its crawling performance. Gcrawler estimates the best path for crawling on one hand and expands its initial keywords by using a genetic algorithm during the crawling on the other hand. This is the first crawler that acts intelligently without any relevance feedback or training. All the processes are online and there is no need for direct interaction with the users.},
  added-at    = {2008-06-12T12:54:27.000+0200},
  author      = {Shokouhi, M. and Chubak, P. and Raeesy, Z.},
  biburl      = {https://www.bibsonomy.org/bibtex/2ee8ca7e2b66b1782cd29a42a33d9aba6/enterldestodes},
  booktitle   = {International Conference on Information Technology: Coding and Computing ({ITCC} 2005)},
  description = {IEEEXplore# Enhancing focused crawling with genetic algorithms},
  doi         = {10.1109/ITCC.2005.145},
  interhash   = {5caf396ed144f7974c2302b7e6ce38fb},
  intrahash   = {ee8ca7e2b66b1782cd29a42a33d9aba6},
  isbn        = {0-7695-2315-3},
  keywords    = {crawl p:diss p:holmes soc},
  pages       = {503--508},
  timestamp   = {2009-03-03T12:34:12.000+0100},
  title       = {Enhancing focused crawling with genetic algorithms},
  url         = {http://ieeexplore.ieee.org/xpl/freeabs_all.jsp?arnumber=1425193},
  volume      = {2},
  year        = {2005},
}