R. Moore. Proceedings of the 42nd Annual Meeting of the Association for Computational Linguistics, Barcelona, Spain, pages 518-525. (2004)
Abstract
We investigate a number of simple methods for
improving the word-alignment accuracy of IBM
Model 1. We demonstrate reduction in alignment
error rate of approximately 30% resulting from (1)
giving extra weight to the probability of alignment
to the null word, (2) smoothing probability estimates for rare words, and (3) using a simple heuristic estimation method to initialize, or replace, EM
training of model parameters.
%0 Conference Paper
%1 Moore93
%A Moore, Robert C.
%B Proceedings of the 42nd Annual Meeting of the Association for Computational Linguistics, Barcelona, Spain
%D 2004
%K article statistics algorithm machinetranslation
%P 518-525
%T Improving IBM Word Alignment Model 1
%U http://dblp.uni-trier.de/db/conf/acl/acl2004.html#Moore04
%X We investigate a number of simple methods for
improving the word-alignment accuracy of IBM
Model 1. We demonstrate reduction in alignment
error rate of approximately 30% resulting from (1)
giving extra weight to the probability of alignment
to the null word, (2) smoothing probability estimates for rare words, and (3) using a simple heuristic estimation method to initialize, or replace, EM
training of model parameters.
@inproceedings{Moore93,
  author        = {Moore, Robert C.},
  title         = {Improving {IBM} Word Alignment {Model} 1},
  booktitle     = {Proceedings of the 42nd Annual Meeting of the Association for Computational Linguistics, Barcelona, Spain},
  pages         = {518--525},
  year          = {2004},
  url           = {http://dblp.uni-trier.de/db/conf/acl/acl2004.html#Moore04},
  abstract      = {We investigate a number of simple methods for
                   improving the word-alignment accuracy of IBM
                   Model 1. We demonstrate reduction in alignment
                   error rate of approximately 30\% resulting from (1)
                   giving extra weight to the probability of alignment
                   to the null word, (2) smoothing probability estimates
                   for rare words, and (3) using a simple heuristic
                   estimation method to initialize, or replace, EM
                   training of model parameters.},
  keywords      = {article statistics algorithm machinetranslation},
  internal-note = {Citation key kept as Moore93 so existing citations still resolve; the publication year is 2004.},
  added-at      = {2006-11-11T18:58:29.000+0100},
  timestamp     = {2006-11-11T18:58:29.000+0100},
  biburl        = {https://www.bibsonomy.org/bibtex/21f76344cdbef366bf00193359acd487e/tmalsburg},
  interhash     = {40cd8e09e13cdce75a1607aa94c65691},
  intrahash     = {1f76344cdbef366bf00193359acd487e},
}