% Conference paper in the IJCNLP 2011 proceedings (Sajjad, Durrani, Schmid, Fraser).
% NOTE(review): `address` holds a country rather than a publisher city, and the
% copyright line in `note` names AFNLP while `publisher` names ACL -- confirm both
% against the printed proceedings before relying on them.
@inproceedings{404fe4e0a80b4d2fb40aff95c745a675,
  author    = {Sajjad, Hassan and Durrani, Nadir and Schmid, Helmut and Fraser, Alexander},
  title     = {Comparing Two Techniques for Learning Transliteration Models Using a Parallel Corpus},
  booktitle = {{IJCNLP} 2011 - Proceedings of the 5th International Joint Conference on Natural Language Processing},
  editor    = {Wang, Haifeng and Yarowsky, David},
  pages     = {129--137},
  publisher = {Association for Computational Linguistics (ACL)},
  address   = {United States},
  year      = {2011},
  language  = {English},
  note      = {Publisher Copyright: {\textcopyright} 2011 AFNLP; 5th International Joint Conference on Natural Language Processing, IJCNLP 2011 ; Conference date: 08-11-2011 Through 13-11-2011},
  abstract  = {We compare the use of an unsupervised transliteration mining method and a rule-based method to automatically extract lists of transliteration word pairs from a parallel corpus of Hindi/Urdu. We build joint source channel models on the automatically aligned orthographic transliteration units of the automatically extracted lists of transliteration pairs resulting in two transliteration systems. We compare our systems with three transliteration systems available on the web, and show that our systems have better performance. We perform an extensive analysis of the results of using both methods and show evidence that the unsupervised transliteration mining method is superior for applications requiring high recall transliteration lists, while the rule-based method is useful for obtaining high precision lists.},
}