Sidra is a new indexing and ranking system for large-scale Web collections. Sidra creates multiple distributed indexes, organized and partitioned by different ranking criteria, aimed at supporting contextualized queries over hypertexts and their metadata. This paper presents the architecture of Sidra and the algorithms used to create its indexes. Performance measurements on the Portuguese Web data show that Sidra's indexing times and scalability are comparable to those of global Web search engines.
%0 Journal Article
%1 costa2005distributed
%A Costa, M.
%A Silva, M.
%D 2005
%J IEEE Latin America Transactions
%K archive index search web alexandria
%N 1
%P 2-8
%R 10.1109/TLA.2005.1468656
%T Distributed Indexing of Large-Scale Web Collections
%U http://ieeexplore.ieee.org/xpls/abs_all.jsp?arnumber=1468656
%V 3
%X Sidra is a new indexing and ranking system for large-scale Web collections. Sidra creates multiple distributed indexes, organized and partitioned by different ranking criteria, aimed at supporting contextualized queries over hypertexts and their metadata. This paper presents the architecture of Sidra and the algorithms used to create its indexes. Performance measurements on the Portuguese Web data show that Sidra's indexing times and scalability are comparable to those of global Web search engines.
% BibTeX record for the journal article (exported from BibSonomy, see biburl).
% The page range uses "--" (en-dash) and the proper noun "Web" in the title is
% brace-protected so sentence-casing styles keep its capital letter.
@article{costa2005distributed,
  abstract  = {Sidra is a new indexing and ranking system for large-scale Web collections. Sidra creates multiple distributed indexes, organized and partitioned by different ranking criteria, aimed at supporting contextualized queries over hypertexts and their metadata. This paper presents the architecture of Sidra and the algorithms used to create its indexes. Performance measurements on the Portuguese Web data show that Sidra's indexing times and scalability are comparable to those of global Web search engines.},
  added-at  = {2012-09-26T13:39:25.000+0200},
  author    = {Costa, M. and Silva, M.},
  biburl    = {https://www.bibsonomy.org/bibtex/2c927cddd9fc8fb672198081f868e4efb/jaeschke},
  doi       = {10.1109/TLA.2005.1468656},
  interhash = {aa19ebf217dc3ff7b18d4b4f18ef0f21},
  intrahash = {c927cddd9fc8fb672198081f868e4efb},
  issn      = {1548-0992},
  journal   = {IEEE Latin America Transactions},
  keywords  = {archive index search web alexandria},
  month     = mar,
  number    = 1,
  pages     = {2--8},
  timestamp = {2014-07-28T15:57:31.000+0200},
  title     = {Distributed Indexing of Large-Scale {Web} Collections},
  url       = {http://ieeexplore.ieee.org/xpls/abs_all.jsp?arnumber=1468656},
  volume    = 3,
  year      = 2005
}