% Conference paper: "MESS" string similarity measure, FIRE 2015 proceedings
% (ACM International Conference Proceeding Series).
% Names are stored as "Last, First" so BibTeX splits them unambiguously.
% Acronyms in title/series/booktitle are brace-protected against style recasing.
% The "day" and "language" fields are ignored by the standard BibTeX styles and
% are retained only as metadata from the original export.
@inproceedings{e3fc59a6e1044771b4abab76c0d46238,
  author    = {Londhe, Nikhil and Gopalakrishnan, Vishrawas and Srihari, Rohini K. and Zhang, Aidong},
  title     = {{MESS}: A multilingual error based string similarity measure for transliterated name variants},
  booktitle = {{FIRE} 2015 - Proceedings of the 7th Annual Meeting of the Forum for Information Retrieval Evaluation},
  editor    = {Majumder, Prasenjit and Mitra, Mandar and Agrawal, Madhulika and Mehta, Parth},
  series    = {{ACM} International Conference Proceeding Series},
  publisher = {Association for Computing Machinery},
  address   = {New York, NY, USA},
  pages     = {47--50},
  year      = {2015},
  month     = dec,
  day       = {4},
  doi       = {10.1145/2838706.2838716},
  language  = {English},
  abstract  = {Cross-lingual name matching is an important problem in the fields of machine translation and data mining. Though well studied, it lacks a generic solution largely due to issues like language specific nuances, resource scarcity, etc. Most of the proposed unsupervised approaches focus on a small subset of languages, mostly English and its derivatives, and employ specific handcrafted rules that do not port well to other languages. In this paper, we propose a generic multilingual solution that instead adds simple probabilistic extensions to existing string similarity methods. Not only does our solution depend only on freely available open source resources but we also demonstrate the superiority of our approach on 60 language pairs drawn across language families.},
  note      = {Publisher Copyright: {\textcopyright} 2015 ACM. 7th Annual Meeting of the Forum for Information Retrieval Evaluation, FIRE 2015. Conference date: 04-12-2015 through 06-12-2015},
}