% Cowell and Hussain, IV 2001 conference paper (pp. 181--185).
% {Arabic} and {IV} are braced so that sentence-casing styles keep their capitals.
@inproceedings{5e1b12af1f26471f8dcb4207c224033d,
  author    = {Cowell, John and Hussain, Fiaz},
  title     = {Thinning {Arabic} characters for feature extraction},
  booktitle = {Proceedings - 5th International Conference on Information Visualisation, {IV} 2001},
  series    = {Proceedings of the International Conference on Information Visualisation},
  editor    = {Khosrowshahi, F. and Banissi, E. and Sarfraz, M. and Ursyn, A.},
  publisher = {Institute of Electrical and Electronics Engineers Inc.},
  pages     = {181--185},
  year      = {2001},
  doi       = {10.1109/IV.2001.942056},
  language  = {English},
  keywords  = {Arabic, Characters, OCR, Optical character recognition, Thinning, Urdu},
  note      = {Publisher Copyright: {\textcopyright} 2001 IEEE.; 5th International Conference on Information Visualisation, IV 2001 ; Conference date: 25-07-2001 Through 27-07-2001},
  abstract  = {A successful approach to the recognition of Latin characters is to extract features from that character such as the number of strokes, stroke intersections and holes, and to use ad-hoc tests to differentiate between characters which have similar features. The first stage in this process is to produce thinned 1 pixel thick representations of the characters to simplify feature extraction. This approach works well with printed Latin characters which are of high quality. With poor quality characters, however, the thinning process itself is not straightforward and can introduce errors which are manifested in the later stages of the recognition process. The recognition of poor quality Arabic characters is a particular problem since the characters are calligraphic with printed characters having widely varying stroke thicknesses to simulate the drawing of the character with a calligraphy pen or brush. This paper describes the problems encountered when thinning large poor quality Arabic characters prior to the extraction of their features and submission to a syntactic recognition system.},
}