@inproceedings{b7aaeee4dbcb4015b912b818f8f62d8f,
title = "Transductive learning for reading handwritten tibetan manuscripts",
abstract = "We examine the use case of performing handwritten character recognition (HCR) on a newly compiled collection of Tibetan historical documents, which presents multiple challenges, including inherent challenges such as image quality and the lack of word separation, and dataset challenges such as a lack of supervised training data. To tackle these challenges, we introduce an end-to-end unsupervised full-document HCR approach composed of unsupervised line segmentation and a convolutional recurrent neural network, trained using solely synthetic data. Various augmentations are applied to these synthesized images, and we compare the effect of each augmentation on the HCR results. Since we work on a collection of historical manuscripts, we can fit the model to the available test data. During training, our network has access to both the labeled synthetic training data and the unlabeled images of the test set, and we adapt and evaluate four different semi-supervised learning and domain adaptation approaches for transductive learning in HCR. We test our approach on a set of 167 images from the 'Kadam' collection, containing 829 lines. We show that correct data augmentation is crucial for the success of HCR trained solely on synthetic data and that using an effective transductive learning approach drastically improves results.",
keywords = "CRNN, Domain Adaptation, Handwritten Recognition, Historical Document Analysis, Neural Network, Synthetic Data, Transductive Learning",
author = "Sivan Keret and Lior Wolf and Nachum Dershowitz and Eric Werner and Orna Almogi and Dorji Wangchuk",
note = "Publisher Copyright: {\textcopyright} 2019 IEEE.; 15th IAPR International Conference on Document Analysis and Recognition, ICDAR 2019 ; Conference date: 20-09-2019 Through 25-09-2019",
year = "2019",
month = sep,
doi = "10.1109/ICDAR.2019.00043",
language = "الإنجليزيّة",
series = "Proceedings of the International Conference on Document Analysis and Recognition, ICDAR",
publisher = "IEEE Computer Society",
pages = "214--221",
booktitle = "Proceedings - 15th IAPR International Conference on Document Analysis and Recognition, ICDAR 2019",
address = "الولايات المتّحدة",
}