% Conference paper in the ICIAR 2011 proceedings (Springer LNCS), cleaned up from an auto-export.
% - Given names are no longer wrapped in escaped braces, and all authors use "Last, First" form.
% - The "PART 2" label that was stored in the number and edition fields now lives in booktitle.
% - The DOI is stored bare (no LaTeX escaping); use a doi/url-aware style to typeset it.
% - TODO(review): the export carried no LNCS volume number; add a volume field once confirmed.
% - NOTE(review): address holds a country, not the publisher's city; confirm and refine.
@inproceedings{c28489418b9f4f869e1e23846e52ca8c,
  author    = {Mahmoud, Sabri A. and Ahmad, Irfan and Alshayeb, Mohammed and Al-Khatib, Wasfi G.},
  title     = {A database for offline {Arabic} handwritten text recognition},
  booktitle = {Image Analysis and Recognition - 8th International Conference, {ICIAR} 2011, Proceedings, Part {II}},
  series    = {Lecture Notes in Computer Science},
  publisher = {Springer Verlag},
  address   = {Germany},
  year      = {2011},
  pages     = {397--406},
  doi       = {10.1007/978-3-642-21596-4_40},
  isbn      = {978-3-642-21595-7},
  language  = {English},
  keywords  = {Arabic Handwritten Text Database, Arabic OCR, Document Analysis, Form Processing},
  abstract  = {Arabic handwritten text recognition has not received the same attention as that directed towards Latin script-based languages. In this paper, we present our efforts to develop a comprehensive Arabic Handwritten Text database (AHTD). At this stage, the database will consist of text written by 1000 writers from different countries. Currently, it has data from over 300 writers. It is composed of an images database containing images of the written text at various resolutions, and a ground truth database that contains meta-data describing the written text at the page, paragraph, and line levels. Tools to extract paragraphs from pages, segment paragraphs into lines have also been developed. Segmentation of lines into words will follow. The database will be made freely available to researchers world-wide. It is hoped that the AHTD database will stir research efforts in various handwritten-related problems such as text recognition, and writer identification and verification.},
}