@inproceedings{8cfa969409e34e2eb66d42a6509a138c,
title = "Transcript mapping for handwritten English documents",
abstract = "Transcript mapping or text alignment with handwritten documents is the automatic alignment of words in a text file with word images in a handwritten document. Such a mapping has several applications in fields ranging from machine learning where large quantities of truth data are required for evaluating handwriting recognition algorithms, to data mining where word image indexes are used in ranked retrieval of scanned documents in a digital library. The alignment also aids {"}writer identity{"} verification algorithms. Interfaces which display scanned handwritten documents may use this alignment to highlight manuscript tokens when a person examines the corresponding transcript word. We propose an adaptation of the True DTW dynamic programming algorithm for English handwritten documents. The integration of the dissimilarity scores from a word-model word recognizer and Levenshtein distance between the recognized word and lexicon word, as a cost metric in the DTW algorithm leading to a fast and accurate alignment, is our primary contribution. Results provided, confirm the effectiveness of our approach.",
keywords = "Levenshtein distance, Mapping, Segmentation, Transcript, True DTW",
author = "Damien Jose and Anurag Bharadwaj and Venu Govindaraju",
year = "2008",
doi = "10.1117/12.766489",
language = "English",
isbn = "9780819469878",
series = "Proceedings of SPIE - The International Society for Optical Engineering",
booktitle = "Document Recognition and Retrieval XV",
note = "Document Recognition and Retrieval XV ; Conference date: 29-01-2008 Through 31-01-2008",
}