% Journal article exported from the publisher site (American Journal of Water
% Resources, vol. 13, no. 3). Accented characters use LaTeX escapes so the
% entry works with both classic BibTeX and Biber.
@article{ajwr20251333,
  author    = {OUEDRAOGO, Issoufou and SANDWIDI, W. J. P. and KABORE, Fatoumata and KONARE, Mahamadou and OUATTARA, Cheick Abdramane},
  title     = {Predictive Modelling of Groundwater Quality in the {Nakanb{\'e}} River Basin Using Machine Learning Techniques},
  journal   = {American Journal of Water Resources},
  volume    = {13},
  number    = {3},
  pages     = {86--96},
  year      = {2025},
  publisher = {Science and Education Publishing},
  issn      = {2333-4819},
  doi       = {10.12691/ajwr-13-3-3},
  url       = {https://pubs.sciepub.com/ajwr/13/3/3},
  abstract  = {Continuous monitoring of groundwater quality is essential for protecting public health and the environment, particularly in vulnerable regions such as Burkina Faso's Nakanb{\'e} Basin, where groundwater serves as a primary source of potable water. This study aimed to develop and evaluate machine learning (ML) models to predict two key water quality parameters: Total Dissolved Solids (TDS) and Total Alkalinity (TA), using data provided by the General Directorate of Water Resources (DGRE). A total of 1,765 groundwater samples were analyzed, encompassing nineteen physicochemical parameters. Prior to modelling, multicollinearity analysis was conducted to ensure the reliability of the input variables. Three regression algorithms Random Forest Regression (RFR), Multiple Linear Regression (MLR), and Decision Tree Regression (DTR) were compared for their predictive performance. Among them, Random Forest demonstrated the highest accuracy, with the highest R2 and lowest error metrics (MAE, RMSE) across both training and testing datasets for both TDS and TA. While MLR offered consistent and interpretable results, particularly for TA, DTR exhibited strong overfitting, with lower generalizability on test data. The results highlight the superiority of ensemble learning approaches, particularly RFR, in capturing complex, nonlinear relationships within groundwater quality datasets. ML application in this context provides a cost-effective and scalable alternative to conventional laboratory-based monitoring methods. It also enables the identification of influential water quality parameters, supports risk assessment of contamination, and contributes to evidence-based water resource management strategies. These findings demonstrate the potential of ML tools to enhance groundwater monitoring and advance sustainable water governance in arid and semi-arid regions.},
}
