% Conference paper: Kirschenbaum and Wintner, EACL 2009 proceedings, pp. 433--441.
% The citation key is a machine-generated export identifier; it is kept as-is
% so that existing \cite commands continue to resolve.
% NOTE(review): "address" holds a country rather than a publisher city, as
% exported; replace with the publisher's city once confirmed.
@inproceedings{b7598628e5ab42a9b26ae4fe5bcc3db2,
  author    = {Kirschenbaum, Amit and Wintner, Shuly},
  title     = {Lightly Supervised Transliteration for Machine Translation},
  booktitle = {{EACL} 2009 -- 12th Conference of the European Chapter of the Association for Computational Linguistics, Proceedings},
  year      = {2009},
  pages     = {433--441},
  publisher = {Association for Computational Linguistics (ACL)},
  address   = {United States},
  doi       = {10.3115/1609067.1609115},
  isbn      = {9781932432169},
  language  = {English},
  note      = {12th Conference of the European Chapter of the Association for Computational Linguistics, {EACL} 2009; conference date: 30 March -- 3 April 2009},
  abstract  = {We present a Hebrew to English transliteration method in the context of a machine translation system. Our method uses machine learning to determine which terms are to be transliterated rather than translated. The training corpus for this purpose includes only positive examples, acquired semi-automatically. Our classifier reduces more than 38\% of the errors made by a baseline method. The identified terms are then transliterated. We present an SMT-based transliteration model trained with a parallel corpus extracted from Wikipedia using a fairly simple method which requires minimal knowledge. The correct result is produced in more than 76\% of the cases, and in 92\% of the instances it is one of the top-5 results. We also demonstrate a small improvement in the performance of a Hebrew-to-English MT system that uses our transliteration module.},
}