% Conference paper in the SPIE "Document Recognition and Retrieval XIX" proceedings (2012).
% booktitle: the exported record read "SPIE-IS and T Electronic Imaging"; this is presumably a
%   mangled ampersand ("IS&T") -- NOTE(review): confirm against the publisher's record.
% Acronyms and the roman numeral are brace-protected so recasing styles leave them intact.
% The abstract is kept verbatim from the exported record; do not copy-edit it.
@inproceedings{7ee785b78fd24570acd54696a9625443,
  author    = {Porwal, Utkarsh and Rajan, Sreeranga and Govindaraju, Venu},
  title     = {An oracle-based co-training framework for writer identification in offline handwriting},
  booktitle = {Proceedings of {SPIE-IS\&T} Electronic Imaging -- Document Recognition and Retrieval {XIX}},
  series    = {Proceedings of {SPIE} -- The International Society for Optical Engineering},
  year      = {2012},
  doi       = {10.1117/12.912221},
  isbn      = {9780819489449},
  language  = {English},
  keywords  = {Classifier, Co-training, Labeled and Unlabeled data, Oracle, Views, Writer Identification},
  abstract  = {State-of-the-art techniques for writer identification have been centered primarily on enhancing the performance of the system for writer identification. Machine learning algorithms have been used extensively to improve the accuracy of such system assuming sufficient amount of data is available for training. Little attention has been paid to the prospect of harnessing the information tapped in a large amount of un-annotated data. This paper focuses on co-training based framework that can be used for iterative labeling of the unlabeled data set exploiting the independence between the multiple views (features) of the data. This paradigm relaxes the assumption of sufficiency of the data available and tries to generate labeled data from unlabeled data set along with improving the accuracy of the system. However, performance of co-training based framework is dependent on the effectiveness of the algorithm used for the selection of data points to be added in the labeled set. We propose an Oracle based approach for data selection that learns the patterns in the score distribution of classes for labeled data points and then predicts the labels (writers) of the unlabeled data point. This method for selection statistically learns the class distribution and predicts the most probable class unlike traditional selection algorithms which were based on heuristic approaches. We conducted experiments on publicly available IAM dataset and illustrate the efficacy of the proposed approach.},
  note      = {Document Recognition and Retrieval XIX; Conference date: 25-01-2012 Through 26-01-2012},
}