The Internet constitutes a potential huge store of parallel text that may be collected to be exploited by many applications
such as multilingual information retrieval, machine translation, etc. These applications usually require at least sentence-aligned bilingual text. This paper presents new aligners designed for improving the performance of classical sentence-level aligners while aligning structured text such as HTML. The new aligners are compared with other well-known geometric aligners.
%0 Book Section
%1 sanchez2006eam
%A Sánchez-Villamil, Enrique
%A Santos-Antón, Susana
%A Ortiz-Rojas, Sergio
%A Forcada, Mikel
%B Advances in Natural Language Processing
%C Berlin / Heidelberg
%D 2006
%I Springer
%K alignment apertium bitextor crawling
%P 280--290
%T Evaluation of Alignment Methods for HTML Parallel Text
%U http://dx.doi.org/10.1007/11816508_29
%V 4139
%X The Internet constitutes a potential huge store of parallel text that may be collected to be exploited by many applications
such as multilingual information retrieval, machine translation, etc. These applications usually require at least sentence-aligned bilingual text. This paper presents new aligners designed for improving the performance of classical sentence-level aligners while aligning structured text such as HTML. The new aligners are compared with other well-known geometric aligners.
@comment{sanchez2006eam: chapter in an edited volume, series volume 4139. The fields added-at, biburl, interhash, intrahash and timestamp are not standard BibTeX fields and are ignored by standard styles; they appear to be BibSonomy export metadata, see biburl.}
@incollection{sanchez2006eam,
  author    = {S{\'{a}}nchez-Villamil, Enrique and Santos-Ant{\'{o}}n, Susana and Ortiz-Rojas, Sergio and Forcada, Mikel},
  title     = {Evaluation of Alignment Methods for {HTML} Parallel Text},
  booktitle = {Advances in Natural Language Processing},
  series    = {Lecture Notes in Computer Science},
  volume    = {4139},
  pages     = {280--290},
  publisher = {Springer},
  address   = {Berlin / Heidelberg},
  year      = {2006},
  doi       = {10.1007/11816508_29},
  url       = {http://dx.doi.org/10.1007/11816508_29},
  keywords  = {alignment apertium bitextor crawling},
  abstract  = {The Internet constitutes a potential huge store of parallel text that may be collected to be exploited by many applications
such as multilingual information retrieval, machine translation, etc. These applications usually require at least sentence-aligned bilingual text. This paper presents new aligners designed for improving the performance of classical sentence-level aligners while aligning structured text such as HTML. The new aligners are compared with other well-known geometric aligners.},
  added-at  = {2009-09-17T15:36:10.000+0200},
  timestamp = {2009-09-17T15:36:11.000+0200},
  biburl    = {https://www.bibsonomy.org/bibtex/2a97156878c1c4d365c67f832f0793fa4/unhammer},
  interhash = {0271bd44d698de148432e7585d86f6f4},
  intrahash = {a97156878c1c4d365c67f832f0793fa4},
}