% Conference paper in the IHIET 2019 proceedings (Springer, Advances in
% Intelligent Systems and Computing). The citation key is kept as-is so that
% existing \cite commands keep resolving. `address` is the publisher's
% location, not the conference venue; the conference dates are recorded in
% `note`.
@inproceedings{4161f667e1b748db96e22288b4f31962,
  author    = {Palma, Diego and Soto, Christian and Veliz, M{\'o}nica and Riffo, Bernardo and Guti{\'e}rrez, Antonio},
  title     = {A data-driven methodology to assess text complexity based on syntactic and semantic measurements},
  booktitle = {Human Interaction and Emerging Technologies -- Proceedings of the 1st International Conference on Human Interaction and Emerging Technologies, {IHIET} 2019},
  editor    = {Ahram, Tareq and Taiar, Redha and Colson, Serge and Choplin, Arnaud},
  series    = {Advances in Intelligent Systems and Computing},
  publisher = {Springer},
  address   = {Cham},
  year      = {2020},
  pages     = {509--515},
  isbn      = {9783030256289},
  doi       = {10.1007/978-3-030-25629-6_79},
  language  = {English},
  keywords  = {Artificial intelligence, Educational systems, Machine learning, Natural language processing, Text difficulty assessment},
  abstract  = {In this paper we propose a data driven methodology to assess text complexity of Spanish school texts. We model the problem as a classification task, that can be solved in a data-driven fashion using machine learning techniques. We show empirically that the discriminative power of the classifier depends on school grade level. Our proposal includes multiple predictors that capture different dimensions of text complexity such as coherence and cohesion. We provide an importance analysis of predictors across several complexity levels. Finally, we assess the model performance using accuracy and correlation measurements. The proposed model achieves accuracies of 0.7.},
  note      = {Publisher Copyright: {\textcopyright} 2020, Springer Nature Switzerland AG.; 1st International Conference on Human Interaction and Emerging Technologies, IHIET 2019 ; Conference date: 22-08-2019 Through 24-08-2019},
}