% Conference paper (pp. 160--173) in the "Explainable Artificial Intelligence"
% proceedings, Communications in Computer and Information Science series.
% Names are stored in "Last, First" form so the compound surname
% "Alonso Moral" is parsed as one family name.
% Braces in the title protect "ShapGAP" and "XAI" from sentence-casing styles.
% NOTE(review): "address" holds a country, not the publisher's city -- confirm
% and replace with the city of publication.
% NOTE(review): "series" has no matching "volume" number -- add it once
% verified against the publisher record.
@inproceedings{004e3c134fb041c0b1ad4543deb5e880,
title = "Beyond Prediction Similarity: {ShapGAP} for Evaluating Faithful Surrogate Models in {XAI}",
abstract = "The growing importance of Explainable Artificial Intelligence (XAI) has highlighted the need to understand the decision-making processes of black-box models. Surrogation, emulating a black-box model (BB) with a white-box model (WB), is crucial in applications where BBs are unavailable due to security or practical concerns. Traditional fidelity measures only evaluate the similarity of the final predictions, which can lead to a significant limitation: considering a WB faithful even when it has the same prediction as the BB but with a completely different rationale. Addressing this limitation is crucial to develop Trustworthy AI practical applications beyond XAI. To address this issue, we introduce ShapGAP, a novel metric that assesses the faithfulness of surrogate models by comparing their reasoning paths, using SHAP explanations as a proxy. We validate the effectiveness of ShapGAP by applying it to real-world datasets from healthcare and finance domains, comparing its performance against traditional fidelity measures. Our results show that ShapGAP enables better understanding and trust in XAI systems, revealing the potential dangers of relying on models with high task accuracy but unfaithful explanations. ShapGAP serves as a valuable tool for identifying faithful surrogate models, paving the way for more reliable and Trustworthy AI applications.",
keywords = "Black-box, Explainable Artificial Intelligence (XAI), Faithfulness, Fidelity Measures, Interpretability, SHAP, Surrogate Models, White-box",
author = "Mariotti, Ettore and Sivaprasad, Adarsa and Alonso Moral, Jose Maria",
year = "2023",
month = oct,
day = "30",
doi = "10.1007/978-3-031-44064-9_10",
language = "English",
isbn = "978-3-031-44063-2",
series = "Communications in Computer and Information Science",
publisher = "Springer Nature",
pages = "160--173",
editor = "Longo, Luca",
booktitle = "Explainable Artificial Intelligence",
address = "United Kingdom",
note = "First World Conference, xAI 2023 ; Conference date: 26-07-2023 Through 28-07-2023",
}