% Callison-Burch, Bannard & Schroeder (ACL 2005): suffix-array phrase tables for SMT.
% Cleanup of an auto-exported record:
%   - dropped `series`, which merely repeated `booktitle` verbatim;
%   - authors rewritten in unambiguous "Last, First" form;
%   - `month` derived from the conference date recorded in `note`;
%   - NOTE(review): the city in `address` was added from the ACL Anthology record
%     for this paper (export only said "United States") -- confirm before relying on it.
@inproceedings{ea8c2d7565da49f28ba12a3d1b830973,
  author    = {Callison-Burch, Chris and Bannard, Colin and Schroeder, Josh},
  title     = {Scaling phrase-based statistical machine translation to larger corpora and longer phrases},
  booktitle = {{ACL}-05 - 43rd Annual Meeting of the Association for Computational Linguistics, Proceedings of the Conference},
  year      = {2005},
  month     = jun,
  pages     = {255--262},
  publisher = {Association for Computational Linguistics},
  address   = {Ann Arbor, Michigan, United States},
  doi       = {10.3115/1219840.1219872},
  isbn      = {1932432515},
  language  = {English},
  note      = {43rd Annual Meeting of the Association for Computational Linguistics, ACL-05 ; Conference date: 25-06-2005 Through 30-06-2005},
  abstract  = {In this paper we describe a novel data structure for phrase-based statistical machine translation which allows for the retrieval of arbitrarily long phrases while simultaneously using less memory than is required by current decoder implementations. We detail the computational complexity and average retrieval times for looking up phrase translations in our suffix array-based data structure. We show how sampling can be used to reduce the retrieval time by orders of magnitude with no loss in translation quality.},
}