@EdWorkingPaper{ai24-1081, title = "Leveraging Modern Machine Learning to Improve Early Warning Systems and Reduce Chronic Absenteeism in Early Childhood", author = "Tiffany Wu, Christina Weiland", institution = "Annenberg Institute at Brown University", number = "1081", year = "2024", month = "November", URL = "http://www.edworkingpapers.com/ai24-1081", abstract = {Chronic absenteeism is a critical issue that has been linked to many adverse student outcomes. The current study focuses on improving a key system already in place in many school districtsÑearly warning systems (EWSs)Ñin order to decrease chronic absenteeism in studentsÕ earliest schooling years. Using a demographically diverse population of students followed from PreK to third grade in Boston Public Schools (N=6,698), we demonstrate how and why two modern machine learning algorithmsÑthe Synthetic Minority Oversampling Technique (SMOTE) and Extreme Gradient Boosting (XGBoost)Ñcan improve EWS accuracy in proactively identifying students who are at risk of becoming chronically absent. The best-performing XGBoost model with SMOTE was approximately 52 percentage points more accurate (in terms of recall rate) than the logistic regression model closest to those used in current EWSs in correctly predicting students who would be chronically absent in third grade. Our analyses introduce varying probability thresholds and the incorporation of different years of data, showing the potential of these models to cater to school districts aiming to leverage machine learning predictions while adhering to budgetary or intervention constraints.}, }