% Conference paper on transcript-to-image alignment for historical documents (DRR 2015, SPIE).
% The citation key is kept exactly as found so existing \cite commands keep resolving.
% NOTE(review): month/day say 1 Jan 2015 while the note gives a February conference date;
% the 1 Jan value looks like an exporter placeholder - confirm against the publisher record.
% NOTE(review): address holds a country, not a publisher city - confirm and refine if needed.
@inproceedings{d3e8fff9bf404204a1859da508d8debd,
  author    = {Rabaev, Irina and Cohen, Rafi and El-Sana, Jihad and Kedem, Klara},
  title     = {Aligning transcript of historical documents using dynamic programming},
  booktitle = {Proceedings of {SPIE}-{IS\&T} Electronic Imaging - Document Recognition and Retrieval XXII},
  editor    = {Lamiroy, Bart and Ringger, Eric K.},
  series    = {Proceedings of {SPIE} - The International Society for Optical Engineering},
  publisher = {SPIE},
  address   = {United States},
  year      = {2015},
  month     = jan,
  day       = {1},
  doi       = {10.1117/12.2076062},
  language  = {English},
  keywords  = {GSC features, HOG features, LBP features, alignment, dynamic programming, historical documents, profile-based features},
  abstract  = {We present a simple and accurate approach for aligning historical documents with their corresponding transcription. First, a representative of each letter in the historical document is cropped. Then, the transcription is transformed to synthetic word images by representing the letters in the transcription by the cropped letters. These synthetic word images are aligned to groups of connected components in the original text, along each line, using dynamic programming. For measuring image similarities we experimented with a variety of feature extraction and matching methods. The presented alignment algorithm was tested on two historical datasets and provided excellent results.},
  note      = {Publisher Copyright: {\textcopyright} 2015 SPIE.; 22nd Document Recognition and Retrieval Conference, DRR 2015 ; Conference date: 11-02-2015 Through 12-02-2015},
}