The coverage and recency of the major World Wide Web search engines was analyzed, yielding some surprising results. The coverage of any one engine is significantly limited: No single engine indexes more than about one-third of the "indexable Web," the coverage of the six engines investigated varies by an order of magnitude, and
combining the results of the six engines yields about 3.5 times as many documents on average as compared with the results from only one engine. Analysis of the overlap between pairs of engines gives an estimated lower bound on the size of the indexable Web of 320 million pages.
%0 Journal Article
%1 lawrence98searching
%A Lawrence, S.
%A Giles, C.
%D 1998
%J Science
%K search-engines
%P 98-100
%T Searching the world wide web
%U http://citeseer.comp.nus.edu.sg/lawrence98searching.html
%V 280
%X The coverage and recency of the major World Wide Web search engines was analyzed, yielding some surprising results. The coverage of any one engine is significantly limited: No single engine indexes more than about one-third of the "indexable Web," the coverage of the six engines investigated varies by an order of magnitude, and
combining the results of the six engines yields about 3.5 times as many documents on average as compared with the results from only one engine. Analysis of the overlap between pairs of engines gives an estimated lower bound on the size of the indexable Web of 320 million pages.
@comment{
  lawrence98searching -- journal article in Science, volume 280 (1998),
  pages 98 to 100, by S. Lawrence and C. Giles.

  Conventions used in this entry:
    * pages uses the double-hyphen range form (98--100).
    * month uses the predefined three-letter macro (apr), unquoted, so the
      bibliography style controls how it is printed.
    * "World Wide Web" in the title is brace-protected so that styles which
      sentence-case titles keep its capitals.
    * added-at, biburl, interhash, intrahash and timestamp are non-standard
      fields that appear to come from the BibSonomy export (see biburl);
      standard styles ignore unknown fields.

  NOTE(review): author given names are stored as initials only and there is
  no doi field; neither can be derived from this record -- fill in from the
  publisher page if available.
}
@article{lawrence98searching,
  author    = {Lawrence, S. and Giles, C.},
  title     = {Searching the {World Wide Web}},
  journal   = {Science},
  volume    = {280},
  pages     = {98--100},
  year      = {1998},
  month     = apr,
  day       = {03},
  url       = {http://citeseer.comp.nus.edu.sg/lawrence98searching.html},
  keywords  = {search-engines},
  abstract  = {The coverage and recency of the major World Wide Web search engines was analyzed, yielding some surprising results. The coverage of any one engine is significantly limited: No single engine indexes more than about one-third of the "indexable Web," the coverage of the six engines investigated varies by an order of magnitude, and
combining the results of the six engines yields about 3.5 times as many documents on average as compared with the results from only one engine. Analysis of the overlap between pairs of engines gives an estimated lower bound on the size of the indexable Web of 320 million pages.},
  added-at  = {2006-10-30T08:38:23.000+0100},
  timestamp = {2006-10-30T08:38:23.000+0100},
  biburl    = {https://www.bibsonomy.org/bibtex/2c77ff07c7801271cd31e54a850edf430/grahl},
  interhash = {596cb9ed4212110df808fb642427d7f2},
  intrahash = {c77ff07c7801271cd31e54a850edf430},
}