% Conference paper in the ICCSPA 2013 proceedings. The proceedings title is
% stored in booktitle only; it is not a publication series, so no series field.
@inproceedings{eeb234234a1e430fb5c5a06976249446,
  author    = {Nahar, Khalid M. O. and Al-Khatib, Wasfi G. and Elshafei, Moustafa and Al-Muhtaseb, Husni and Alghamdi, Mansour M.},
  title     = {Data-driven {Arabic} phoneme recognition using varying number of {HMM} states},
  booktitle = {2013 1st International Conference on Communications, Signal Processing and Their Applications, {ICCSPA} 2013},
  year      = {2013},
  doi       = {10.1109/ICCSPA.2013.6487258},
  isbn      = {9781467328210},
  language  = {English},
  keywords  = {Arabic Speech Recognition, KFUPM Arabic speech, Phoneme recognition, corpus HMM},
  abstract  = {Continuous Arabic Speech Recognition, appears in many real life applications. Its speed, accuracy and improvement are highly dependent on the accuracy of the language phonemes set. The main goal of this research is to recognize and transcribe the Arabic phonemes based on a data-driven approach. We built a phoneme recognizer based on a data driven approach using HTK tool. Different numbers of Gaussian mixtures with different numbers of HMM states were used in modeling the Arabic phonemes in order to reach the best configuration. The corpus used consists of about 4000 files, representing 5 recorded hours of modern standard Arabic of TV-News. The maximum phoneme recognition accuracy reached was 56.79%. This result is very encouraging and shows the viability of our approach as compared to using a fixed number of HMM states.},
}