% Conference paper in the LREC 2020 proceedings.
% - Author and editor names are stored in "Last, First" form so they parse unambiguously.
% - {Arabic} and {LREC} are brace-protected so sentence-casing styles keep their capitals.
% - The proceedings name lives only in booktitle; it was also duplicated verbatim in a
%   series field, which makes styles that print series show it twice.
% - The funding/copyright text is kept in annote instead of note so that standard styles
%   do not print the whole acknowledgement in the reference list.
@inproceedings{64bc0e039b6148df89ef23629886c8cc,
  author    = {{Al Khalil}, Muhamed and Habash, Nizar and Jiang, Zhengyang},
  title     = {A Large-Scale Leveled Readability Lexicon for Standard {Arabic}},
  booktitle = {{LREC} 2020 -- 12th International Conference on Language Resources and Evaluation, Conference Proceedings},
  editor    = {Calzolari, Nicoletta and Bechet, Frederic and Blache, Philippe and Choukri, Khalid and Cieri, Christopher and Declerck, Thierry and Goggi, Sara and Isahara, Hitoshi and Maegaard, Bente and Mariani, Joseph and Mazo, Helene and Moreno, Asuncion and Odijk, Jan and Piperidis, Stelios},
  publisher = {European Language Resources Association (ELRA)},
  year      = {2020},
  pages     = {3053--3062},
  isbn      = {9791095546344},
  language  = {English (US)},
  keywords  = {Arabic, Lexicon, Readability},
  abstract  = {We present a large-scale 26,000-lemma leveled readability lexicon for Modern Standard Arabic. The lexicon was manually annotated in triplicate by language professionals from three regions in the Arab world. The annotations show a high degree of agreement; and major differences were limited to regional variations. Comparing lemma readability levels with their frequencies provided good insights in the benefits and pitfalls of frequency-based readability approaches. The lexicon will be publicly available.},
  annote    = {Funding Information: The work on this project is funded by a New York University Abu Dhabi Research Enhancement Fund grant. We would like to thank Ramy Eskander and his team of annotators at Ramitechs.com for their valuable help, productive discussions and feedback throughout the annotation process. Publisher Copyright: {\textcopyright} European Language Resources Association (ELRA), licensed under CC-BY-NC},
}