@inproceedings{05027e5e5a8947b2820f556472a9d8b2,
title = "CFDB: Machine Learning Model Analysis via Databases of CounterFactuals",
abstract = "Data Scientists often design and train complex Machine Learning models that evolve over time due to re-training on new data, a revised architecture, or both. To assist Data Scientists in this process, many methods for analyzing models have been recently developed. A prominent approach for model analysis is based on the notion of Counterfactuals. A counterfactual (CF) intuitively explains the label assigned by the model to a particular instance by identifying perturbations to the instance that lead to a different predicted label. A large body of recent literature has demonstrated the usefulness of CFs for deriving insights on the model at large. The analyzed CFs come in various flavors and are applied to instances chosen based on various criteria, in the context of different analysis goals. In this work we propose to demonstrate CFDB (Counterfactuals Database), a unified framework for querying Counterfactuals. CFDB allows to consolidate common approaches in CF-based analysis and to provide multiple levels of abstractions in a relational framework. We will demonstrate CFDB in the context of the Lending Club Loan Data, showing its usefulness by formulating and executing multiple analyses over evolving classifiers for Loan Approval.",
keywords = "counterfactuals, databases",
author = "Idan Meyuhas and {Ben Arie}, Aviv and Yair Horesh and Daniel Deutch",
note = "Publisher Copyright: {\textcopyright} 2022 ACM.; 2022 ACM SIGMOD International Conference on the Management of Data, SIGMOD 2022 ; Conference date: 12-06-2022 Through 17-06-2022",
year = "2022",
month = jun,
day = "10",
doi = "https://doi.org/10.1145/3514221.3520162",
language = "الإنجليزيّة",
series = "Proceedings of the ACM SIGMOD International Conference on Management of Data",
pages = "2401--2404",
booktitle = "SIGMOD 2022 - Proceedings of the 2022 International Conference on Management of Data",
}