M. Costa, D. Gomes, F. Couto, and M. Silva. A Survey of Web Archive Search Architectures. Proceedings of the 22nd International Conference on World Wide Web Companion, pages 1045--1050. Republic and Canton of Geneva, Switzerland, International World Wide Web Conferences Steering Committee, (2013)
Abstract
Web archives already hold more than 282 billion documents and users demand full-text search to explore this historical information. This survey provides an overview of web archive search architectures designed for time-travel search, i.e. full-text search on the web within a user-specified time interval. Performance, scalability and ease of management are important aspects to take in consideration when choosing a system architecture. We compare these aspects and initialize the discussion of which search architecture is more suitable for a large-scale web archive.
%0 Conference Paper
%1 costa2013survey
%A Costa, Miguel
%A Gomes, Daniel
%A Couto, Francisco
%A Silva, Mário
%B Proceedings of the 22nd International Conference on World Wide Web Companion
%C Republic and Canton of Geneva, Switzerland
%D 2013
%I International World Wide Web Conferences Steering Committee
%K architecture archive index internet search survey web
%P 1045--1050
%T A Survey of Web Archive Search Architectures
%U http://dl.acm.org/citation.cfm?id=2487788.2488116
%X Web archives already hold more than 282 billion documents and users demand full-text search to explore this historical information. This survey provides an overview of web archive search architectures designed for time-travel search, i.e. full-text search on the web within a user-specified time interval. Performance, scalability and ease of management are important aspects to take in consideration when choosing a system architecture. We compare these aspects and initialize the discussion of which search architecture is more suitable for a large-scale web archive.
%@ 978-1-4503-2038-2
% Costa, Gomes, Couto, Silva: survey paper in the WWW '13 Companion proceedings.
% The accent in the last author's given name is written as a brace group that
% starts with the control sequence, so classic BibTeX treats it as a single
% letter when sorting and building labels.
% The doi value is derived from the ACM identifier that also appears in the url
% field (NOTE(review): confirm against the ACM Digital Library record).
@inproceedings{costa2013survey,
  author    = {Costa, Miguel and Gomes, Daniel and Couto, Francisco and Silva, M{\'a}rio},
  title     = {A Survey of Web Archive Search Architectures},
  booktitle = {Proceedings of the 22nd International Conference on World Wide Web Companion},
  series    = {WWW '13 Companion},
  pages     = {1045--1050},
  numpages  = {6},
  year      = {2013},
  publisher = {International World Wide Web Conferences Steering Committee},
  address   = {Republic and Canton of Geneva, Switzerland},
  location  = {Rio de Janeiro, Brazil},
  isbn      = {978-1-4503-2038-2},
  doi       = {10.1145/2487788.2488116},
  url       = {http://dl.acm.org/citation.cfm?id=2487788.2488116},
  acmid     = {2488116},
  keywords  = {architecture archive index internet search survey web},
  abstract  = {Web archives already hold more than 282 billion documents and users demand full-text search to explore this historical information. This survey provides an overview of web archive search architectures designed for time-travel search, i.e. full-text search on the web within a user-specified time interval. Performance, scalability and ease of management are important aspects to take in consideration when choosing a system architecture. We compare these aspects and initialize the discussion of which search architecture is more suitable for a large-scale web archive.},
  added-at  = {2015-02-10T13:22:55.000+0100},
  timestamp = {2015-03-19T15:56:54.000+0100},
  biburl    = {https://www.bibsonomy.org/bibtex/21f57c4c796ddb0facd96de352f07bdea/jaeschke},
  interhash = {4459b35e98be0b9169dad35db7f12409},
  intrahash = {1f57c4c796ddb0facd96de352f07bdea},
}