% Conference paper in the ICFHR 2022 proceedings; record exported from refbase.
% - Author names use "Last, First" form so the compound surname "De Gregorio" is kept whole.
% - The repeated optkeywords/optnote fields are merged: a field name may appear only once per entry.
% - The "opt"-prefixed fields are unknown to bibliography styles and are therefore never printed.
% - NOTE(review): series was added so that volume 13639 reads as a series number; LNCS is
%   inferred from the Springer DOI prefix and the volume number -- confirm against the publisher page.
@InProceedings{GiuseppeDeGregorio2022,
  author      = {De Gregorio, Giuseppe and Biswas, Sanket and Souibgui, Mohamed Ali and Bensalah, Asma and Llados, Josep and Fornes, Alicia and Marcelli, Angelo},
  title       = {A Few Shot Multi-representation Approach for N-Gram Spotting in Historical Manuscripts},
  booktitle   = {Frontiers in Handwriting Recognition. International Conference on Frontiers in Handwriting Recognition (ICFHR2022)},
  series      = {Lecture Notes in Computer Science},
  volume      = {13639},
  pages       = {3--12},
  year        = {2022},
  doi         = {10.1007/978-3-031-21648-0_1},
  abstract    = {Despite recent advances in automatic text recognition, the performance remains moderate when it comes to historical manuscripts. This is mainly because of the scarcity of available labelled data to train the data-hungry Handwritten Text Recognition (HTR) models. The Keyword Spotting System (KWS) provides a valid alternative to HTR due to the reduction in error rate, but it is usually limited to a closed reference vocabulary. In this paper, we propose a few-shot learning paradigm for spotting sequences of a few characters (N-gram) that requires a small amount of labelled training data. We exhibit that recognition of important n-grams could reduce the system{\textquoteright}s dependency on vocabulary. In this case, an out-of-vocabulary (OOV) word in an input handwritten line image could be a sequence of n-grams that belong to the lexicon. An extensive experimental evaluation of our proposed multi-representation approach was carried out on a subset of Bentham{\textquoteright}s historical manuscript collections to obtain some really promising results in this direction.},
  optkeywords = {N-gram spotting, Few-shot learning, Multimodal understanding, Historical handwritten collections},
  optnote     = {DAG; 600.121; 600.162; 602.230; 600.140; exported from refbase (http://refbase.cvc.uab.es/show.php?record=3733), last updated on Tue, 25 Apr 2023 16:07:26 +0200},
  file        = {:http://refbase.cvc.uab.es/files/GBS2022.pdf:PDF},
}