@inproceedings{20d11409c4ae4959b8584d2936c49f53,
  author      = {Simonetto, Thibault and Cordy, Maxime and Ghamizi, Salah and Le Traon, Yves and Lefebvre, Cl{\'e}ment and Boystov, Andrey and Goujon, Anne},
  title       = {On the Impact of Industrial Delays when Mitigating Distribution Drifts: An Empirical Study on Real-World Financial Systems},
  booktitle   = {Discovering Drift Phenomena in Evolving Landscapes -- 1st International Workshop, {DELTA} 2024, Proceedings},
  editor      = {Piangerelli, Marco and Prenkaj, Bardh and Rotalinti, Ylenia and Joshi, Ananya and Stilo, Giovanni},
  series      = {Lecture Notes in Computer Science},
  publisher   = {Springer Nature Switzerland},
  address     = {Cham},
  year        = {2025},
  pages       = {57--73},
  doi         = {10.1007/978-3-031-82346-6_4},
  isbn        = {9783031823459},
  language    = {English},
  keywords    = {AI in finance, ML, distribution-drift, real-world system},
  abstract    = {An increasing number of financial software systems rely on machine learning models to support human decision-makers. Although these models have shown satisfactory performance to support human decision-makers in classifying financial transactions, the maintenance of such ML systems remains a challenge. After deployment in production, the performance of the models tends to degrade over time due to concept drift. Methods have been proposed to detect concept drift and retrain new models upon detection to mitigate the drop in performance. However, little is known about the effectiveness of such methods in an industrial context. In particular, their evaluation fails to consider the delay between the detection of the drift and the deployment of a new model. This delay is inherent to the strict quality assurance and manual validation processes that financial (and other critical) institutions impose on their software systems. To circumvent this limitation, we formalize the problem of retraining ML models against distribution drift in the presence of delay and propose a novel protocol to evaluate drift detectors. We report on an empirical study conducted on the transaction system of our industrial partner, BGL BNP Paribas, and two publicly available datasets: Lending Club Loan Data and Electricity. We release our tool and benchmark on GitHub (code available at https://github.com/serval-uni-lu/drift-robustness). We demonstrate for the first time how ignoring the delays in the evaluation of the drift detectors overestimates their ability to mitigate performance drift, up to 39.86\% for our industrial application.},
  note        = {Publisher Copyright: {\textcopyright} The Author(s), under exclusive license to Springer Nature Switzerland AG 2025.},
  eventtitle  = {1st International Workshop on Discovering Drift Phenomena in Evolving Landscapes, {DELTA} 2024},
  eventdate   = {2024-08-26},
  review-note = {TODO confirm against the DOI record: (1) spelling of the author surname "Boystov" (possibly "Boytsov"); (2) publisher/address were set from the copyright line in the note field; (3) the LNCS volume number is not recorded here.},
}