@inproceedings{62d9873b44f2464b9bea6c4a30e8ef72,
title = "The performance-actionability trade-off in retention prediction at middle school",
abstract = "Predicting students' retention risk is one of the major trends in machine learning applications in education. While early identification of at-risk students allows timely planning and implementation of measures to prevent adverse outcomes, there is a trade-off between the predictive model's performance and the prediction window size, or model performance and its actionability. In this study, we used a dataset of 83,596 unique Portuguese students in grades 5th to 9th to predict retention at or before the end of 9th grade. We explored how different prediction window sizes impact the predictive model's performance, the feature importance, and the models' bias. The models with the shorter prediction window performed better in terms of precision, but the model with the largest prediction window showed a higher lift over the existing rule-based model. Prediction window size impacted the importance of demographic features and model's fairness. Our results contribute to the extant discussion on predicting retention, by adding empirical evidence about the models' added value in performance versus the existing practice, suggesting types of data to collect and use, and discussing education-specific challenges of responsible data science.",
keywords = "feature importance, model bias, model performance, prediction window, school retention",
author = "Susana Lavado and Miguel Mateus and Leid Zejnilovic",
note = "Funding Information: This work was supported by Funda{\c c}{\~a}o para a Ci{\^e}ncia e a Tecnologia (UIDB/00124/2020, UIDP/00124/2020 and Social Sciences DataLab - PIN-FRA/22209/2016), POR Lisboa and POR Norte (Social Sciences DataLab, PINFRA/ 22209/ 2016), and BPI {"}La Caixa{"} Foundation. Publisher Copyright: {\textcopyright} 2022 IEEE.; 21st IEEE International Conference on Machine Learning and Applications, ICMLA 2022 ; Conference date: 12-12-2022 Through 14-12-2022",
year = "2022",
doi = "10.1109/ICMLA55696.2022.00087",
language = "English",
series = "Proceedings - 21st IEEE International Conference on Machine Learning and Applications, ICMLA 2022",
publisher = "Institute of Electrical and Electronics Engineers (IEEE)",
pages = "531--536",
editor = "Wani, {M. Arif} and Mehmed Kantardzic and Vasile Palade and Daniel Neagu and Longzhi Yang and Kit-Yan Chan",
booktitle = "Proceedings - 21st IEEE International Conference on Machine Learning and Applications, ICMLA 2022",
address = "United States",
}