@inproceedings{36d1eaafe71140cf82e7312566ddbe4f,
title = "Bayesian active learning for keyword spotting in handwritten documents",
abstract = "We propose the Bayesian Active Learning by Disagreement (BALD) model for keyword spotting in handwritten documents. In the context of keyword spotting in handwritten documents, the background text is all regions in the document that do not contain the keywords. The model tries to learn certain characteristics of the keyword and background text in an active learning framework. It takes into account the local character level scores and global word level scores to distinguish keywords from non-keywords. We propose to apply the bayesian active learning strategy to identify the regions of sample space from which more meaningful labeled samples of keywords and non-keywords can be extracted. This work is an extension to our previous work which used a variational dynamic background model to model the large variations of background text. The approach has been tested on IAM dataset for English. The results show that a decent background model can be learned in a more quicker and efficient manner using the BALD framework. The approach outperforms our prior work and other state of the art approaches.",
keywords = "Bayesian Active Learning, Handwriting Recognition, Spotting",
author = "Gaurav Kumar and Venu Govindaraju",
note = "Publisher Copyright: {\textcopyright} 2014 IEEE.; 22nd International Conference on Pattern Recognition, ICPR 2014 ; Conference date: 24-08-2014 Through 28-08-2014",
year = "2014",
month = dec,
day = "4",
doi = "10.1109/ICPR.2014.356",
language = "English",
series = "Proceedings - International Conference on Pattern Recognition",
publisher = "Institute of Electrical and Electronics Engineers Inc.",
pages = "2041--2046",
booktitle = "Proceedings - International Conference on Pattern Recognition",
address = "United States",
}