Dataspace management has been recently identified as a new agenda for information management [17, 22] and information integration [23]. In sharp contrast to standard information integration architectures, a dataspace management system is a <i>data-coexistence approach:</i> it does not require <i>any</i> investments in semantic integration before querying services on the data are provided. Rather, a dataspace can be gradually enhanced over time by defining relationships among the data. Defining those integration semantics gradually is termed <i>pay-as-you-go</i> information integration [17], as time and effort (pay) are needed over time (go) to provide integration semantics. The benefits are better query results (gain). This paper is the first to explore pay-as-you-go information integration in dataspaces. We provide a technique for declarative pay-as-you-go information integration named iTrails. The core idea of our approach is to declaratively add lightweight 'hints' (trails) to a <i>search engine</i> thus allowing gradual enrichment of loosely integrated data sources. Our experiments confirm that iTrails can be efficiently implemented introducing only little overhead during query execution. At the same time iTrails strongly improves the quality of query results. Furthermore, we present rewriting and pruning techniques that allow us to scale iTrails to tens of thousands of trail definitions with minimal growth in the rewritten query size.
%0 Conference Paper
%1 Vaz_Salles:2007:IPI:1325851.1325927
%A Vaz Salles, Marcos Antonio
%A Dittrich, Jens-Peter
%A Karakashian, Shant Kirakos
%A Girard, Olivier René
%A Blunschi, Lukas
%B Proceedings of the 33rd international conference on Very large data bases
%D 2007
%I VLDB Endowment
%K dataspaces iTrails information_integration pay-as-you-go toread
%P 663--674
%T iTrails: pay-as-you-go information integration in dataspaces
%U http://dl.acm.org/citation.cfm?id=1325851.1325927
%X Dataspace management has been recently identified as a new agenda for information management [17, 22] and information integration [23]. In sharp contrast to standard information integration architectures, a dataspace management system is a <i>data-coexistence approach:</i> it does not require <i>any</i> investments in semantic integration before querying services on the data are provided. Rather, a dataspace can be gradually enhanced over time by defining relationships among the data. Defining those integration semantics gradually is termed <i>pay-as-you-go</i> information integration [17], as time and effort (pay) are needed over time (go) to provide integration semantics. The benefits are better query results (gain). This paper is the first to explore pay-as-you-go information integration in dataspaces. We provide a technique for declarative pay-as-you-go information integration named iTrails. The core idea of our approach is to declaratively add lightweight 'hints' (trails) to a <i>search engine</i> thus allowing gradual enrichment of loosely integrated data sources. Our experiments confirm that iTrails can be efficiently implemented introducing only little overhead during query execution. At the same time iTrails strongly improves the quality of query results. Furthermore, we present rewriting and pruning techniques that allow us to scale iTrails to tens of thousands of trail definitions with minimal growth in the rewritten query size.
%@ 978-1-59593-649-3
% Conference paper introducing iTrails (VLDB 2007 proceedings, pages 663--674).
% The fields added-at, biburl, interhash, intrahash and timestamp are
% BibSonomy bookkeeping; acmid and numpages come from the ACM Digital Library
% export. Fields a bibliography style does not know are silently skipped.
% In the title, braces protect the camelCase system name from style recasing.
@inproceedings{Vaz_Salles:2007:IPI:1325851.1325927,
  abstract  = {Dataspace management has been recently identified as a new agenda for information management [17, 22] and information integration [23]. In sharp contrast to standard information integration architectures, a dataspace management system is a \emph{data-coexistence approach:} it does not require \emph{any} investments in semantic integration before querying services on the data are provided. Rather, a dataspace can be gradually enhanced over time by defining relationships among the data. Defining those integration semantics gradually is termed \emph{pay-as-you-go} information integration [17], as time and effort (pay) are needed over time (go) to provide integration semantics. The benefits are better query results (gain). This paper is the first to explore pay-as-you-go information integration in dataspaces. We provide a technique for declarative pay-as-you-go information integration named iTrails. The core idea of our approach is to declaratively add lightweight 'hints' (trails) to a \emph{search engine} thus allowing gradual enrichment of loosely integrated data sources. Our experiments confirm that iTrails can be efficiently implemented introducing only little overhead during query execution. At the same time iTrails strongly improves the quality of query results. Furthermore, we present rewriting and pruning techniques that allow us to scale iTrails to tens of thousands of trail definitions with minimal growth in the rewritten query size.},
  acmid     = {1325927},
  added-at  = {2011-11-24T08:37:42.000+0100},
  author    = {Vaz Salles, Marcos Antonio and Dittrich, Jens-Peter and Karakashian, Shant Kirakos and Girard, Olivier Ren{\'e} and Blunschi, Lukas},
  biburl    = {https://www.bibsonomy.org/bibtex/26c7398feb4124d78ce82625db5b5978c/schmidt2},
  booktitle = {Proceedings of the 33rd International Conference on Very Large Data Bases},
  interhash = {2ab9274a3def4e081e6efdf9a8dfa9fd},
  intrahash = {6c7398feb4124d78ce82625db5b5978c},
  isbn      = {978-1-59593-649-3},
  keywords  = {dataspaces iTrails information_integration pay-as-you-go toread},
  location  = {Vienna, Austria},
  numpages  = {12},
  pages     = {663--674},
  publisher = {VLDB Endowment},
  series    = {VLDB '07},
  timestamp = {2011-12-13T16:30:44.000+0100},
  title     = {{iTrails}: Pay-as-you-go Information Integration in Dataspaces},
  url       = {http://dl.acm.org/citation.cfm?id=1325851.1325927},
  year      = {2007},
}