<?xml version="1.0" encoding="UTF-8"?>
<TEI xml:space="preserve" xmlns="http://www.tei-c.org/ns/1.0" 
xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" 
xsi:schemaLocation="http://www.tei-c.org/ns/1.0 https://raw.githubusercontent.com/kermitt2/grobid/master/grobid-home/schemas/xsd/Grobid.xsd"
 xmlns:xlink="http://www.w3.org/1999/xlink">
	<teiHeader xml:lang="en">
		<fileDesc>
			<titleStmt>
				<title level="a" type="main">Applying explanation methods for the iterative refinement of an ANN-based depression screening tool</title>
			</titleStmt>
			<publicationStmt>
				<publisher/>
				<availability status="unknown"><licence/></availability>
			</publicationStmt>
			<sourceDesc>
				<biblStruct>
					<analytic>
						<author>
							<persName><forename type="first">Cristian</forename><forename type="middle">E</forename><surname>Sosa-Espadas</surname></persName>
							<affiliation key="aff0">
								<orgName type="department">Department of Systems and Computing</orgName>
								<orgName type="institution">Tecnológico Nacional de México/IT de Mérida</orgName>
								<address>
									<settlement>Merida</settlement>
									<country key="MX">Mexico</country>
								</address>
							</affiliation>
							<affiliation key="aff1">
								<orgName type="department">AAAIMX Student Chapter at Yucatan</orgName>
								<orgName type="laboratory">AAAIMX</orgName>
								<orgName type="institution">Association for the Advancement of Artificial Intelligence</orgName>
								<address>
									<country>Mexico, Mexico</country>
								</address>
							</affiliation>
						</author>
						<author>
							<persName><forename type="first">Manuel</forename><surname>Cetina-Aguilar</surname></persName>
							<affiliation key="aff0">
								<orgName type="department">Department of Systems and Computing</orgName>
								<orgName type="institution">Tecnológico Nacional de México/IT de Mérida</orgName>
								<address>
									<settlement>Merida</settlement>
									<country key="MX">Mexico</country>
								</address>
							</affiliation>
							<affiliation key="aff1">
								<orgName type="department">AAAIMX Student Chapter at Yucatan</orgName>
								<orgName type="laboratory">AAAIMX</orgName>
								<orgName type="institution">Association for the Advancement of Artificial Intelligence</orgName>
								<address>
									<country>Mexico, Mexico</country>
								</address>
							</affiliation>
						</author>
						<author>
							<persName><forename type="first">Jose</forename><forename type="middle">A</forename><surname>Soladrero</surname></persName>
							<affiliation key="aff0">
								<orgName type="department">Department of Systems and Computing</orgName>
								<orgName type="institution">Tecnológico Nacional de México/IT de Mérida</orgName>
								<address>
									<settlement>Merida</settlement>
									<country key="MX">Mexico</country>
								</address>
							</affiliation>
							<affiliation key="aff1">
								<orgName type="department">AAAIMX Student Chapter at Yucatan</orgName>
								<orgName type="laboratory">AAAIMX</orgName>
								<orgName type="institution">Association for the Advancement of Artificial Intelligence</orgName>
								<address>
									<country>Mexico, Mexico</country>
								</address>
							</affiliation>
						</author>
						<author>
							<persName><forename type="first">Jesus</forename><forename type="middle">M</forename><surname>Darias</surname></persName>
							<affiliation key="aff2">
								<orgName type="department" key="dep1">Department of Software Engineering and Artificial Intelligence</orgName>
								<orgName type="department" key="dep2">Instituto de Tecnologías del Conocimiento</orgName>
								<orgName type="institution">Universidad Complutense de Madrid</orgName>
								<address>
									<country key="ES">Spain</country>
								</address>
							</affiliation>
						</author>
						<author>
							<persName><forename type="first">Esteban</forename><forename type="middle">E</forename><surname>Brito-Borges</surname></persName>
							<affiliation key="aff0">
								<orgName type="department">Department of Systems and Computing</orgName>
								<orgName type="institution">Tecnológico Nacional de México/IT de Mérida</orgName>
								<address>
									<settlement>Merida</settlement>
									<country key="MX">Mexico</country>
								</address>
							</affiliation>
							<affiliation key="aff1">
								<orgName type="department">AAAIMX Student Chapter at Yucatan</orgName>
								<orgName type="laboratory">AAAIMX</orgName>
								<orgName type="institution">Association for the Advancement of Artificial Intelligence</orgName>
								<address>
									<country>Mexico, Mexico</country>
								</address>
							</affiliation>
						</author>
						<author>
							<persName><forename type="first">Nora</forename><forename type="middle">L</forename><surname>Cuevas-Cuevas</surname></persName>
							<affiliation key="aff0">
								<orgName type="department">Department of Systems and Computing</orgName>
								<orgName type="institution">Tecnológico Nacional de México/IT de Mérida</orgName>
								<address>
									<settlement>Merida</settlement>
									<country key="MX">Mexico</country>
								</address>
							</affiliation>
							<affiliation key="aff1">
								<orgName type="department">AAAIMX Student Chapter at Yucatan</orgName>
								<orgName type="laboratory">AAAIMX</orgName>
								<orgName type="institution">Association for the Advancement of Artificial Intelligence</orgName>
								<address>
									<country>Mexico, Mexico</country>
								</address>
							</affiliation>
						</author>
						<author role="corresp">
							<persName><forename type="first">Mauricio</forename><forename type="middle">G</forename><surname>Orozco-Del-Castillo</surname></persName>
							<email>mauricio.orozco@itmerida.edu.mx</email>
							<affiliation key="aff0">
								<orgName type="department">Department of Systems and Computing</orgName>
								<orgName type="institution">Tecnológico Nacional de México/IT de Mérida</orgName>
								<address>
									<settlement>Merida</settlement>
									<country key="MX">Mexico</country>
								</address>
							</affiliation>
							<affiliation key="aff1">
								<orgName type="department">AAAIMX Student Chapter at Yucatan</orgName>
								<orgName type="laboratory">AAAIMX</orgName>
								<orgName type="institution">Association for the Advancement of Artificial Intelligence</orgName>
								<address>
									<country>Mexico, Mexico</country>
								</address>
							</affiliation>
						</author>
						<title level="a" type="main">Applying explanation methods for the iterative refinement of an ANN-based depression screening tool</title>
					</analytic>
					<monogr>
						<idno type="ISSN">1613-0073</idno>
					</monogr>
					<idno type="MD5">2103B519583B07A068815BC01947ECC8</idno>
				</biblStruct>
			</sourceDesc>
		</fileDesc>
		<encodingDesc>
			<appInfo>
				<application version="0.7.2" ident="GROBID" when="2023-06-19T14:46+0000">
					<desc>GROBID - A machine learning software for extracting information from scholarly documents</desc>
					<ref target="https://github.com/kermitt2/grobid"/>
				</application>
			</appInfo>
		</encodingDesc>
		<profileDesc>
			<textClass>
				<keywords>
					<term>Explainable Artificial Intelligence, Depression, Mental Health, Artificial Neural Networks Orozco-del-Castillo) 0000-0002-0933-5152 (C. E. Sosa-Espadas)</term>
					<term>0000-0002-2423-0711 (M. Cetina-Aguilar)</term>
					<term>0000-0001-5864-275X (J. A. Soladrero)</term>
					<term>0000-0002-2173-1422 (J. M. Darias)</term>
					<term>0000-0002-4257-944X (E. E. Brito-Borges)</term>
					<term>0000-0002-5477-6176 (N. L. Cuevas-Cuevas)</term>
					<term>0000-0001-5793-6449 (M. G. Orozco-del-Castillo)</term>
				</keywords>
			</textClass>
			<abstract>
<div xmlns="http://www.tei-c.org/ns/1.0"><p>Depression, as one of many mental health disorders, is a serious health and economy problem, affecting over 300 million people of all ages. The diagnosis of depression is a very complex and time-consuming task for mental health professionals, who usually rely on self-report questionnaires as a screening process. However, the items used in these questionnaires are sometimes subjective, particularly to certain demographics, and could require much time and effort from the patient. In recent years, artificial intelligence techniques, such as artificial neural networks, have been commonly used to screen for depression, however, they operate as black-box models, i.e., they lack explainability and interpretability which are mandatory in health-related fields. In this work we propose not only an artificial neural network, but also a set of explainable artificial intelligence techniques to refine a large set of items from a psychological questionnaire into a more concise, explainable one.</p></div>
			</abstract>
		</profileDesc>
	</teiHeader>
	<text xml:lang="en">
		<body>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="1.">Introduction</head><p>The rise in mental health conditions in recent years has become a serious health and economy problem, accounting for over a trillion USD each year <ref type="bibr" target="#b0">[1]</ref>. Particularly, depression has become one of the most common mental health conditions in the modern era, affecting over 300 million people of all ages <ref type="bibr" target="#b1">[2]</ref>, and the number of patients and associated medical costs keep increasing <ref type="bibr" target="#b2">[3]</ref>. While most of the patients seeking medical treatment for depression are in their 50s or 60s <ref type="bibr" target="#b2">[3]</ref>, these issues develop much earlier. It is estimated that over 20% of the world's children and adolescents suffer from a mental condition <ref type="bibr" target="#b0">[1]</ref>, including 8% of young adults between the ages of 18 and 22 <ref type="bibr" target="#b1">[2]</ref>, which can lead to suicide, the second leading cause of death among adolescents and young adults <ref type="bibr" target="#b14">(15)</ref><ref type="bibr" target="#b15">(16)</ref><ref type="bibr" target="#b16">(17)</ref><ref type="bibr" target="#b17">(18)</ref><ref type="bibr" target="#b18">(19)</ref><ref type="bibr" target="#b19">(20)</ref><ref type="bibr" target="#b20">(21)</ref><ref type="bibr">(22)</ref><ref type="bibr">(23)</ref><ref type="bibr">(24)</ref><ref type="bibr">(25)</ref><ref type="bibr">(26)</ref><ref type="bibr">(27)</ref><ref type="bibr">(28)</ref><ref type="bibr">(29)</ref>  <ref type="bibr" target="#b0">[1]</ref>. The fact that very few people in this age group seek medical attention is attributed to an unawareness of their illness, and only seek intervention until their symptoms become severe <ref type="bibr" target="#b1">[2]</ref>. This makes research focused on developing more effective detection techniques a mandatory task; if found early, depression has a high cure rate <ref type="bibr" target="#b2">[3]</ref>.</p><p>The goal of this research is the development and refinement of a screening tool that allows the early identification of students with high risk of depression, probably due to the COVID-19 pandemic. This tool is based on an Artificial Neural Network (ANN) applied over a dataset collected from 157 users that completed a questionnaire with 102 items related to to the symptoms of Major Depression Disorder (MDD), Generalized Anxiety Disorder (GAD) and Antisocial Personality Disorder (APD). The choice of a ANN model is rooted on the very high performance demonstrated by this technique for classification tasks.</p><p>For the current work, however, we want not only to create the ANN model, but to understand the impact of each item, so we can refine the questionnaire and achieve a higher depression screening performance. Here, the ANN models have a major drawback regarding its explainability, as they are considered "black-boxes" that are not interpretable. Therefore, in order to improve our screening tool we propose the application of several explanation methods along an iterative refinement process that mimics the general structure of a case-based reasoning (CBR) system.</p><p>Paper runs as follows. Section 2 presents the background of this work. Section 3 describes the dataset and the ANN screening model. Then, Section 4 describes our iterative refinement process using explanation methods. Section 5 presents the evaluation results and section 6 concludes the paper and opens lines of future work.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="2.">Background</head><p>There is a wide range of self-report questionnaires and inventories to assess different mental illnesses and emotional states, such as the Beck Depression Inventory for depression <ref type="bibr" target="#b3">[4]</ref>, the Attention Deficit and Hyperactivity Disorder (ADHD) Screening Questionnaire (ADHD-SQ) <ref type="bibr" target="#b4">[5]</ref>, the Aspiration Index <ref type="bibr" target="#b5">[6]</ref> for the measurement of intrinsic and extrinsic aspirations, the Adult ADHD Self-Report Scale, the Borderline Personality Questionnaire <ref type="bibr" target="#b6">[7]</ref>, the Common Beliefs Survey III-Short Form <ref type="bibr" target="#b7">[8]</ref>, depression, anxiety and antisocial items <ref type="bibr" target="#b8">[9]</ref> designed from the Diagnostic Statistical Manual-V (DSM-V), the Generalized Anxiety Disorder 7 (GAD-7) <ref type="bibr" target="#b9">[10]</ref>, the reduced scale of the Morningness-Eveningness Questionnaire <ref type="bibr" target="#b10">[11]</ref>, the Rosenberg Self-Esteem Scale <ref type="bibr" target="#b11">[12]</ref>, the State-Trait Anxiety Inventory <ref type="bibr" target="#b12">[13,</ref><ref type="bibr" target="#b13">14]</ref> the Five Facet Mindfulness Questionnaire <ref type="bibr" target="#b14">[15]</ref>, etc. Nevertheless, these self-reports usually need to collect a lot of information in the form of a large number of items to be addressed <ref type="bibr" target="#b15">[16]</ref>, which usually lowers the quality of the answers as the user progresses throughout the questionnaire <ref type="bibr" target="#b16">[17]</ref>.</p><p>On the other hand, ANN models have demonstrated their extraordinary performance for classification tasks, being a very suitable tool for the screening of mental illnesses <ref type="bibr" target="#b8">[9]</ref>. However, they are black-box methods that do not allow to understand the internal data patterns that led to classification. This way, eXplainable Artificial Intelligence (XAI) proposes several methods to understand such models <ref type="bibr" target="#b17">[18]</ref>.</p><p>An XAI system must be able to explain what it has done, what is happening, and whats is going to happen <ref type="bibr" target="#b17">[18]</ref>. In order to do this, each explanation of this kind of systems depends on the tasks, skill, and expectations that the user has, and the models to be used in this systems must be transparent and accessible for their decisions and recommendations <ref type="bibr" target="#b17">[18]</ref>.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="3.">Dataset and Classification Model</head><p>The dataset used on this project corresponds to the one described in <ref type="bibr" target="#b8">[9]</ref>. It consists of the answers from 157 users who answered a screening questionnaire of 102 items related to the symptoms of MDD, GAD and APD as reported by the DSM-V. The user demographic consisted of students between 18 and 23 years old, all of them enrolled at the Tecnológico Nacional de México (TecNM)/Instituto Tecnológico de Mérida (ITM), at Mérida, Yucatán, Mexico. Questions have a binary nature, where the users answered either "true" or "false" with respect to their agreement with certain statements. Additionally, there is a "expected answers datasheet" with the values that are supposed to reflect symptoms of mental conditions. This validation artifact was created by the psychologist who designed the questionnaire and contains the expected answers that a person with either MDD, GAD, or APD would most probably choose.</p><p>An additional independent variable corresponding to physical symptoms of MDD, GAD, and APD was measured through 15 complementary items. Then, a "potential depression score" (PDS) was calculated by averaging these answers and used to estimate the actual depression risk for each individual. This hypothesis of correlation between the initial 102 items and the PDS value was confirmed by our previous results. This way, an ANN can be trained on this dataset, where PDS is used as the target value for training and prediction.</p><p>The PDS variable is codified as a discrete value (ranging from 1 to 5). Initial attempts to estimate this value using a prediction ANN model did not achieve acceptable results. Therefore, the ANN was redesigned as a classification model with five classes. After the initial statistical analysis of the PDS values, a clear imbalance was found, with the highest concentration of users having scores around 3, and the lowest concentrations being located near 1 or 5. Due to this particularity, we decided to combine the five values into three new classes (1,2: Low; 3: Medium; and 4,5: High). This recodification of the target variable also presented a little imbalance, therefore we performed an upsampling process using the SMOTE technique <ref type="bibr" target="#b18">[19]</ref> to further diminish this problem.</p><p>As reported in <ref type="bibr" target="#b8">[9]</ref>, a neural classifier was trained on the dataset so relationships between physical symptoms of MDD and the remaining 102 items were found. The ANN follows a multilayer perceptron (MLP) architecture, with paramethers 𝛼 and learning-rate optimized to achieve the highest accuracy. On the test dataset (1/3 of the total items), the model presented a global accuracy of 64%. Additional performance results per target class can be appreciated in Figure <ref type="figure" target="#fig_0">1</ref> (right).</p><p>However, at this point it is critical to understand the target performance metric. Figure <ref type="figure" target="#fig_0">1</ref> shows the corresponding confusion matrix where we can observe the misclassifications returned by the ANN. Having in mind that the goal is to achieve the highest depression screening performance, there is a clear error to minimize: false negative ratio or "recall" for class "High PDS", i.e., those individuals that having an actual high risk of depression were classified by the ANN as low or medium risk, represented in Figure <ref type="figure" target="#fig_0">1</ref> at the lower row of the matrix. This false negative ratio represents individuals with a high PDS that will not be identified by the screening tool, and therefore would not receive further psychological support. Additionally, we can appreciate that precision for class "high" is very good (right column), meaning that when the ANN identifies an individual as high PDS, it is very confident. The other way around -individuals without actual risk of depression being classified as high PDS-does not imply a high risk in terms of their mental health. These individuals will be identified (incorrectly) by the screening tool and receive a deeper evaluation by the psychologists, who will ultimately discard any risk.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="4.">Iterative Refinement Method</head><p>The proposed method to refine the ANN-based depression screening tool is based on the identification of potentially anomalous items through explanation methods that provide insights of the prediction model. This process follows a cycle analogous to CBR, where a set of candidate items are identified (retrieved) and proposed for its revision by an expert user. Finally, once anomalous items are confirmed, they are used to modify the prediction model. This way, we propose an iterative process consisting on the following steps:</p><p>1. First, the classification model is introspected with explanation methods to identify those items that may lead to a lower performance (recall for class "high") according to the "expected answers datasheet". 2. Next, these answers are proposed to the expert (psychologist) as potential anomalous items. Here we will distinguish between two different anomalous items:</p><p>Inconsistent items that cause an opposite effect to the expected classification (i.e., answers that are expected to predict high PDS but according to the model do decrease the probability to be classified that way). Irrelevant items, on the other hand, are not significant according to the explanation method and do not have any remarkable effect in the classification. This process is illustrated in Figure <ref type="figure" target="#fig_1">2</ref> and is detailed as follows.</p><p>The first step for each iteration is the identification of the anomalous items of the questionnaire. Although there are several explanation methods to perform this task, we have chosen Accumulated Local Effects (ALE). ALE describes how items influence the results of the ANN, based on the differences in the predictions. When applied to our model, ALE returns a plot for each questionnaire item. Each plot contains three lines, representing -on average-the influence of that item for the classification as High, Medium, and Low classes. The x-axis represents the possible answers (0-false, and 1-true) and the y-axis corresponds to the influence of the probability to be classified as each class. Figure <ref type="figure" target="#fig_2">3</ref> shows two of these plots, where we can observe, for example, that answering true (1 in x-axis) to questionnaire item 1 decreases significantly the possibility to be classified as low PDS, whereas it increases (with less influence) the classification as medium or high PDS. If we read the question "Most of the time I have difficulty concentrating on simple task", we can intuitively confirm that the ANN model is working properly, since the "expected answers datasheet" defines that answering "true" is an indicator of higher PDS. If we look at the ALE plot on the right, we can observe that the slopes of the lines is not high enough to consider that item 2 has a clear impact on the classifications. This way, the slope of each line in the ALE plot is significant in order to determine if an item 𝐼 has an impact on the classification. So, the slope (𝑚) for each class is calculated obtaining the ( − −− → 𝐴𝐿𝐸 𝐼 ) slope vector for each class.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head>ICCBR'22 Workshop Proceedings</head><formula xml:id="formula_0">− −− → 𝐴𝐿𝐸 𝐼 = ⟨𝑚 𝐻 , 𝑚 𝑀 , 𝑚 𝐿 ⟩.<label>(1)</label></formula><p>Then, we can define thresholds 𝑠 + and 𝑠 − to identify the minimum positive slope and maximum negative slope to consider that an item has impact on the classification of any of the considered classes.</p><p>Once defined these thresholds, we proceed to the identification of anomalous questions. To do so, we only need to identify items with influence (𝑠 &gt; 𝑠 + or 𝑠 &lt; 𝑠 − ) that are opposite to the values defined int "expected answers datasheet".</p><p>To understand this process we can use the examples presented in Figure <ref type="figure" target="#fig_4">4</ref>. The expected answer to item 3 "My friends have told me that I look different" to diagnose high PDS according to the psychologist is 1. However, the ALE plot (on the left) shows that the behavior of the ANN model is the other way around: answer 1 contributes to be classified as medium PDS but decreases the possibility of belonging to classes medium and high, that is a very anomalous behaviour. The ALE plot on the right side also presents an opposite behaviour where a positive answer increases possibility of classification as low but decreases medium and high.</p><p>This way, in order to detect anomalous questions, it is essential to analyze the vectors ( − −− → 𝐴𝐿𝐸 𝐼 ) that contain the slopes of the items. Then we have defined several anomalies in the questionnaire items according to the following conditions:</p><p>• Inconsistent items for class "High": Items that, with their theoretical expected answers, promoted false High PDS predictions or false non-High PDS predictions, respectively.</p><p>-Items with 𝑚 𝐻 &gt; 𝑠 + and expected answer False, OR -Items with 𝑚 𝐻 &lt; 𝑠 − and with expected True. • Inconsistent items for class "Low": Items that, with their theoretical expected answers, promoted false Low PDS predictions or false non-Low PDS predictions, respectively. -Items with 𝑚 𝐿 &gt; 𝑠 + and with expected answer True, OR -Items with 𝑚 𝐿 &gt; 𝑠 − and with expected answer False.</p><p>• Irrelevant Items: Items that do not make any difference to discern between PDS classes.</p><p>-Items with either high or Low PDS importance values being in the range [𝑠 − , 𝑠 + ].</p><p>We need to clarify that questions can be anomalous for the High PDS class, but that does not automatically makes them anomalous for the Low class. Therefore, items can be anomalous either for one class or both.</p><p>At this point, it is very important to note that the identification of anomalous items is based on the comparison to the expected answers according to the expert. However, we should consider that these expectations may be wrong due to many factors: population features, individual disorders, etc. This way, the items identified in the previous step should be considered as "potentially anomalous items" until the expert confirms that the behavior of the ANN model is correct or not. This revision process (similar to the one performed by the CBR cycle) can be really complex for users that may not have any kind of skill on machine learning. Therefore, we propose the use of additional introspective XAI methods to support this task. Concretely, we provide support to this decision making process through several explanation methods such as LIME and SHAP.</p><p>The purpose of SHAP <ref type="bibr" target="#b19">[20]</ref> is to explain the prediction of a particular instance by computing the contribution of each feature to the prediction. These contributions are computed using Shapley values, which are obtained by arranging the features in different coalitions and calculating the average marginal contribution of a feature. In simpler words, SHAP is an indicator of the contribution of a feature to the outputted probability. Local interpretable model-agnostic explanations (LIME) <ref type="bibr" target="#b20">[21]</ref> is a tool that provides explanations for individual instances relying on local surrogates. A local surrogate is an interpretable model that intends to replicate the behavior of the black-box model for instances similar to the one being analyzed. The explanation gives us the contributions of each feature according to the created surrogate. In our case, both methods are able to measure the impact of each item in the accuracy of the ANN. Therefore, we  can plot this effect using a heat-map, as presented in Figures <ref type="figure" target="#fig_5">5</ref> and Figure <ref type="figure" target="#fig_6">6</ref> where we use a blue-color scale to indicate the impact of items behaving correctly according to the "expected answers datasheet" and a red-color scale for inconsistent items. Consequently, irrelevant items appear with a color close to white. As we can see, both XAI methods reflect similar anomalies in the classification model. These heat-maps can be used by the psychologist to decide whether an item is actually an anomaly of the ANN model or it describes a certain pattern that makes sense.</p><p>With anomalous items detected and confirmed by the expert, our underlying hypothesis is that it is possible to filter these questions from the dataset in order to achieve a higher prediction performance. Specifically, curating the questionnaire removing High PDS anomalous questions should help the classifier model to more easily identify High PDS instances. This can also degrade the prediction performance of other classes, but in the use case of depression screening, we already mentioned that it is more important to identify those individuals with a high level of depression, even at the cost of having false negative predictions for the Medium PDS and Low PDS classes.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="5.">Evaluation</head><p>Our questionnaire refinement process is evaluated in this section. The removal of items is performed in an iterative fashion over the dataset, creating multiple curated versions of our model. On each iteration, the detected High PDS anomalous questions are removed. Here we are assuming that the psychologist will confirm the inconsistent impact of every potentially  anomalous item. Then the ANN is retrained over the remaining questionnaire items to verify the prediction performance of the classifier. Global accuracy performance on each iteration is displayed in Figure <ref type="figure" target="#fig_7">7</ref> (left). As this figure reflects, global accuracy ranges between .5 to .6, reflecting that our process does not have a significant impact on the global performance the model.</p><p>Also, the number of inputs used to train the classification model on each iteration is presented in Figure <ref type="figure" target="#fig_7">7</ref> (right). From 102 original items, our refinement process reduced that number down to approximately 40 questions.</p><p>Since the main objective of removing questions was to improve the identification of people in the High PDS class, it is also useful to analyse the recall metrics . Corresponding results are presented in Figure <ref type="figure" target="#fig_8">8</ref>.</p><p>Although recall decreases for the Medium PDS and Low PDS classes, the High PDS presents an important raise, which indicates that the ANN has achieved a better ability to detect individuals with a high presence of depression symptoms, which was the goal of our research.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="6.">Conclusions</head><p>This paper introduces an iterative refinement method that uses XAI techniques, such as ALE, SHAP and LIME, in order to remove irrelevant or anomalous features that could have a negative impact on an ANN-based depression screening tool. Concretely, we have defined a questionnaire refinement process that, in an iterative fashion, uses the ALE technique in order to identify anomalous questions and remove them, producing a curated set of items that enhances the prediction metrics for our target classes, namely, those representing individuals with a high risk of depression.</p><p>The main conclusion of this work is that it is possible to use XAI methods not only for the explanation of a black-box model, but also for its improvement and refinement. To do so, we propose an iterative cycle following the global cycle of CBR, where potentially anomalous items are retrieved using the ALE method, and later revised by the clinician using other XAI methods such as LIME or SHAP. The last step consists on retaining this changes into the model to begin a new iteration.</p><p>As future work, our paper can be enhanced in multiples ways. First and foremost, a larger dataset of users' answers is always desirable for data-oriented tasks, such as training classification models. This grants more confidence on the results obtained during the evaluation process, as well as stability, due to bias of any type being diluted as the number of instances grow.</p><p>In a similar way, another suggestion to increase the reach of the project is to expand the user demographic on which the questionnaire was applied. Students from other universities can manifest different subsets of depression symptoms, and extending the population stratification the data is being collected from, a better understanding on how to perform depression screening can be obtained.</p><p>Also, on a more technical level, different feature importance techniques can be applied to measure the relevance each questionnaire item has in the depression screening process. ALE provides one approach, but we could also use LIME or SHAP in this step instead of applying them for the revision.</p><p>Finally, removing not only High PS anomalous questions, but anomalous items with Low PS anomalies or even the irrelevant items is our immediate future work to improve the performance of our system.</p></div><figure xmlns="http://www.tei-c.org/ns/1.0" xml:id="fig_0"><head>Figure 1 :</head><label>1</label><figDesc>Figure 1: Confusion matrix (left) and performance metrics (right) for the original ANN model. Axis values 0, 1, and 2 represent classes "low", "medium" and "high" respectively.</figDesc><graphic coords="4,303.89,181.17,166.67,53.26" type="bitmap" /></figure>
<figure xmlns="http://www.tei-c.org/ns/1.0" xml:id="fig_1"><head>Figure 2 :</head><label>2</label><figDesc>Figure 2: Global schema of the proposed iterative refinement method through XAI methods.</figDesc><graphic coords="5,110.13,84.19,375.03,234.06" type="bitmap" /></figure>
<figure xmlns="http://www.tei-c.org/ns/1.0" xml:id="fig_2"><head>3 .</head><label>3</label><figDesc>The expert will confirm or discard the abnormal behaviour of these items through a deeper analysis supported by additional introspective XAI methods. 4. Those items confirmed by the expert are removed from the dataset, and a new model is trained. Continuing to the next iteration from step 1.</figDesc></figure>
<figure xmlns="http://www.tei-c.org/ns/1.0" xml:id="fig_3"><head>Figure 3 :</head><label>3</label><figDesc>Figure 3: Example of non anomalous questions.</figDesc><graphic coords="6,89.29,84.19,416.70,162.00" type="bitmap" /></figure>
<figure xmlns="http://www.tei-c.org/ns/1.0" xml:id="fig_4"><head>Figure 4 :</head><label>4</label><figDesc>Figure 4: Example of two anomalous questions where the High PDS is negative and the expected answer being positive.</figDesc><graphic coords="7,89.29,84.19,416.68,155.94" type="bitmap" /></figure>
<figure xmlns="http://www.tei-c.org/ns/1.0" xml:id="fig_5"><head>Figure 5 :</head><label>5</label><figDesc>Figure 5: Heat-map reflecting the impact of every item in the model according to SHAP. Red color scale is used for inconsistent items.</figDesc><graphic coords="8,89.29,84.19,416.69,95.26" type="bitmap" /></figure>
<figure xmlns="http://www.tei-c.org/ns/1.0" xml:id="fig_6"><head>Figure 6 :</head><label>6</label><figDesc>Figure 6: Heat-map reflecting the impact of every item in the model according to LIME. Red color scale is used for inconsistent items.</figDesc><graphic coords="8,89.29,223.73,416.69,95.68" type="bitmap" /></figure>
<figure xmlns="http://www.tei-c.org/ns/1.0" xml:id="fig_7"><head>Figure 7 :</head><label>7</label><figDesc>Figure 7: (Left)Global accuracy and number of anomalous questions identified on each iteration. (Right) Number of questions used as inputs on each iteration.</figDesc><graphic coords="9,94.30,86.12,204.18,128.89" type="bitmap" /></figure>
<figure xmlns="http://www.tei-c.org/ns/1.0" xml:id="fig_8"><head>Figure 8 :</head><label>8</label><figDesc>Figure 8: Recall results per each target class and number of anomalous items on every iteration.</figDesc><graphic coords="9,151.80,260.40,291.70,179.41" type="bitmap" /></figure>
		</body>
		<back>

			<div type="acknowledgement">
<div xmlns="http://www.tei-c.org/ns/1.0"><head>Acknowledgments</head><p>This research is a result of the Horizon 2020 Future and Emerging Technologies (FET) programme of the European Union through the iSee project (CHIST-ERA-19-XAI-008, PCI2020-120720-2) funded by MCIN/AEI/10.13039/501100011033 and European Union "NextGenerationEU"/PRTR. This work has been also partially supported by the PERXAI project PID2020-114596RB-C21 funded by MCIN/AEI/10.13039/501100011033 and the BOSCH-UCM Honorary Chair on Artificial Intelligence applied to Internet of Things of the Universidad Complutense de Madrid. It is also part of projects 10428.21-P and 13933.22-P of the Tecnológico Nacional de México/IT de Mérida.</p></div>
			</div>

			<div type="references">

				<listBibl>

<biblStruct xml:id="b0">
	<analytic>
		<title level="a" type="main">Awareness, Prevention, Detection, and Therapy Applications for Depression and Anxiety in Serious Games for Children and Adolescents: Systematic Review</title>
		<author>
			<persName><forename type="first">K</forename><surname>Martinez</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><forename type="middle">I</forename><surname>Menéndez-Menéndez</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A</forename><surname>Bustillo</surname></persName>
		</author>
		<idno type="DOI">10.2196/30482</idno>
	</analytic>
	<monogr>
		<title level="j">JMIR Serious Games</title>
		<imprint>
			<biblScope unit="volume">9</biblScope>
			<biblScope unit="page" from="1" to="19" />
			<date type="published" when="2021">2021</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b1">
	<analytic>
		<title level="a" type="main">A deep architecture for depression detection using posting, behavior, and living environment data</title>
		<author>
			<persName><forename type="first">M</forename><forename type="middle">Y</forename><surname>Wu</surname></persName>
		</author>
		<author>
			<persName><forename type="first">C</forename><forename type="middle">Y</forename><surname>Shen</surname></persName>
		</author>
		<author>
			<persName><forename type="first">E</forename><forename type="middle">T</forename><surname>Wang</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A</forename><forename type="middle">L</forename><surname>Chen</surname></persName>
		</author>
		<idno type="DOI">10.1007/s10844-018-0533-4</idno>
	</analytic>
	<monogr>
		<title level="j">Journal of Intelligent Information Systems</title>
		<imprint>
			<biblScope unit="volume">54</biblScope>
			<biblScope unit="page" from="225" to="244" />
			<date type="published" when="2020">2020</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b2">
	<analytic>
		<title level="a" type="main">Context Deep Neural Network Model for Predicting Depression Risk Using Multiple Regression</title>
		<author>
			<persName><forename type="first">J.-W</forename><surname>Baek</surname></persName>
		</author>
		<author>
			<persName><forename type="first">K</forename><surname>Chung</surname></persName>
		</author>
		<idno type="DOI">10.1109/access.2020.2968393</idno>
	</analytic>
	<monogr>
		<title level="j">IEEE Access</title>
		<imprint>
			<biblScope unit="volume">8</biblScope>
			<biblScope unit="page" from="18171" to="18181" />
			<date type="published" when="2020">2020</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b3">
	<analytic>
		<title level="a" type="main">An Inventory for Measuring Clinical Anxiety: Psychometric Properties</title>
		<author>
			<persName><forename type="first">A</forename><forename type="middle">T</forename><surname>Beck</surname></persName>
		</author>
		<author>
			<persName><forename type="first">N</forename><surname>Epstein</surname></persName>
		</author>
		<author>
			<persName><forename type="first">G</forename><surname>Brown</surname></persName>
		</author>
		<author>
			<persName><forename type="first">R</forename><forename type="middle">A</forename><surname>Steer</surname></persName>
		</author>
		<idno type="DOI">10.1037/0022-006X.56.6.893</idno>
	</analytic>
	<monogr>
		<title level="j">Journal of Consulting and Clinical Psychology</title>
		<imprint>
			<biblScope unit="volume">56</biblScope>
			<biblScope unit="page" from="893" to="897" />
			<date type="published" when="1988">1988</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b4">
	<analytic>
		<title level="a" type="main">Low selfawareness of ADHD in adults using a self-report screening questionnaire</title>
		<author>
			<persName><forename type="first">I</forename><surname>Manor</surname></persName>
		</author>
		<author>
			<persName><forename type="first">N</forename><surname>Vurembrandt</surname></persName>
		</author>
		<author>
			<persName><forename type="first">S</forename><surname>Rozen</surname></persName>
		</author>
		<author>
			<persName><forename type="first">D</forename><surname>Gevah</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A</forename><surname>Weizman</surname></persName>
		</author>
		<author>
			<persName><forename type="first">G</forename><surname>Zalsman</surname></persName>
		</author>
		<idno type="DOI">10.1016/j.eurpsy.2010.08.013</idno>
		<ptr target="http://dx.doi.org/10.1016/j.eurpsy.2010.08.013.doi:10.1016/j.eurpsy.2010.08.013" />
	</analytic>
	<monogr>
		<title level="j">European Psychiatry</title>
		<imprint>
			<biblScope unit="volume">27</biblScope>
			<biblScope unit="page" from="314" to="320" />
			<date type="published" when="2012">2012</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b5">
	<analytic>
		<title level="a" type="main">A dark side of the American dream: Correlates of financial success as a central life aspiration</title>
		<author>
			<persName><forename type="first">T</forename><surname>Kasser</surname></persName>
		</author>
		<author>
			<persName><forename type="first">R</forename><forename type="middle">M</forename><surname>Ryan</surname></persName>
		</author>
		<idno type="DOI">10.1037/0022-3514.65.2.410</idno>
		<idno>doi:</idno>
		<ptr target="10.1037/0022-3514.65.2.410" />
	</analytic>
	<monogr>
		<title level="j">Journal of Personality and Social Psychology</title>
		<imprint>
			<biblScope unit="volume">65</biblScope>
			<biblScope unit="page" from="410" to="422" />
			<date type="published" when="1993">1993</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b6">
	<analytic>
		<title level="a" type="main">The BPQ: A scale for the assessment of borderline personality based on DSM-IV criteria</title>
		<author>
			<persName><forename type="first">A</forename><forename type="middle">M</forename><surname>Poreh</surname></persName>
		</author>
		<author>
			<persName><forename type="first">D</forename><surname>Rawlings</surname></persName>
		</author>
		<author>
			<persName><forename type="first">G</forename><surname>Claridge</surname></persName>
		</author>
		<author>
			<persName><forename type="first">J</forename><forename type="middle">L</forename><surname>Freeman</surname></persName>
		</author>
		<author>
			<persName><forename type="first">C</forename><surname>Faulkner</surname></persName>
		</author>
		<author>
			<persName><forename type="first">C</forename><surname>Shelton</surname></persName>
		</author>
		<idno type="DOI">10.1521/pedi.2006.20.3.247</idno>
	</analytic>
	<monogr>
		<title level="j">Journal of Personality Disorders</title>
		<imprint>
			<biblScope unit="volume">20</biblScope>
			<biblScope unit="page" from="247" to="260" />
			<date type="published" when="2006">2006</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b7">
	<analytic>
		<title level="a" type="main">A short form of the common beliefs survey III</title>
		<author>
			<persName><forename type="first">G</forename><forename type="middle">L</forename><surname>Thorpe</surname></persName>
		</author>
		<author>
			<persName><forename type="first">R</forename><forename type="middle">B</forename><surname>Frey</surname></persName>
		</author>
		<idno type="DOI">10.1007/BF02238270</idno>
	</analytic>
	<monogr>
		<title level="j">Journal of Rational -Emotive and Cognitive -Behavior Therapy</title>
		<imprint>
			<biblScope unit="volume">14</biblScope>
			<biblScope unit="page" from="193" to="198" />
			<date type="published" when="1996">1996</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b8">
	<analytic>
		<title level="a" type="main">An Artificial Neural Network for Depression Screening and Questionnaire Refinement in Undergraduate Students</title>
		<author>
			<persName><forename type="first">M</forename><forename type="middle">G</forename><surname>Orozco-Del Castillo</surname></persName>
		</author>
		<author>
			<persName><forename type="first">E</forename><forename type="middle">C</forename><surname>Orozco-Del Castillo</surname></persName>
		</author>
		<author>
			<persName><forename type="first">E</forename><surname>Brito-Borges</surname></persName>
		</author>
		<author>
			<persName><forename type="first">C</forename><surname>Bermejo-Sabbagh</surname></persName>
		</author>
		<author>
			<persName><forename type="first">N</forename><surname>Cuevas-Cuevas</surname></persName>
		</author>
		<idno type="DOI">10.1007/978-3-030-89586-0_1</idno>
		<ptr target="https://link.springer.com/10.1007/978-3-030-89586-0_1.doi:10.1007/978-3-030-89586-0_1" />
	</analytic>
	<monogr>
		<title level="m">Telematics and Computing. WITCOM 2021</title>
		<title level="s">Communications in Computer and Information Science</title>
		<editor>
			<persName><forename type="first">M</forename><forename type="middle">F</forename><surname>Mata-Rivera</surname></persName>
		</editor>
		<editor>
			<persName><forename type="first">R</forename><surname>Zagal-Flores</surname></persName>
		</editor>
		<meeting><address><addrLine>Nature Switzerland AG</addrLine></address></meeting>
		<imprint>
			<publisher>Springer</publisher>
			<date type="published" when="2021">2021. 2021</date>
			<biblScope unit="volume">2</biblScope>
			<biblScope unit="page" from="1" to="13" />
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b9">
	<analytic>
		<title level="a" type="main">A brief measure for assessing generalized anxiety disorder: The GAD-7</title>
		<author>
			<persName><forename type="first">R</forename><forename type="middle">L</forename><surname>Spitzer</surname></persName>
		</author>
		<author>
			<persName><forename type="first">K</forename><surname>Kroenke</surname></persName>
		</author>
		<author>
			<persName><forename type="first">J</forename><forename type="middle">B</forename><surname>Williams</surname></persName>
		</author>
		<author>
			<persName><forename type="first">B</forename><surname>Löwe</surname></persName>
		</author>
		<idno type="DOI">10.1001/archinte.166.10.1092</idno>
		<ptr target="https://jamanetwork.com/.doi:10.1001/archinte.166.10.1092" />
	</analytic>
	<monogr>
		<title level="j">Archives of Internal Medicine</title>
		<imprint>
			<biblScope unit="volume">166</biblScope>
			<biblScope unit="page" from="1092" to="1097" />
			<date type="published" when="2006">2006</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b10">
	<analytic>
		<title level="a" type="main">Horne &amp; Östberg morningness-eveningness questionnaire: A reduced scale</title>
		<author>
			<persName><forename type="first">A</forename><surname>Adan</surname></persName>
		</author>
		<author>
			<persName><forename type="first">H</forename><surname>Almirall</surname></persName>
		</author>
		<idno type="DOI">10.1016/0191-8869(91)90110-W</idno>
	</analytic>
	<monogr>
		<title level="j">Personality and Individual Differences</title>
		<imprint>
			<biblScope unit="volume">12</biblScope>
			<biblScope unit="page" from="241" to="253" />
			<date type="published" when="1991">1991</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b11">
	<monogr>
		<author>
			<persName><forename type="first">M</forename><surname>Rosenberg</surname></persName>
		</author>
		<title level="m">Society and the adolescent self-image</title>
				<meeting><address><addrLine>Middletown, CT</addrLine></address></meeting>
		<imprint>
			<publisher>Wesleyan University Press</publisher>
			<date type="published" when="1989">1989</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b12">
	<monogr>
		<author>
			<persName><forename type="first">C</forename><forename type="middle">D</forename><surname>Spielberger</surname></persName>
		</author>
		<idno type="DOI">10.1016/B978-1-4832-3131-0.50006-8</idno>
		<title level="m">Theory and Research on Anxiety</title>
				<meeting><address><addrLine>New York, NY</addrLine></address></meeting>
		<imprint>
			<publisher>Academic Press</publisher>
			<date type="published" when="1966">1966</date>
			<biblScope unit="page" from="3" to="20" />
		</imprint>
	</monogr>
	<note>Anxiety and Behavior</note>
</biblStruct>

<biblStruct xml:id="b13">
	<analytic>
		<title level="a" type="main">Development of the Spanish Edition of the State-Trait Anxiety Inventory</title>
		<author>
			<persName><forename type="first">C</forename><forename type="middle">D</forename><surname>Spielberger</surname></persName>
		</author>
		<author>
			<persName><forename type="first">F</forename><surname>Gonzalez-Reigosa</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A</forename><surname>Martinez-Urrutia</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="j">Interamerican Journal of Psychology</title>
		<imprint>
			<biblScope unit="volume">5</biblScope>
			<biblScope unit="page" from="3" to="4" />
			<date type="published" when="1971">1971</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b14">
	<analytic>
		<title level="a" type="main">Using self-report assessment methods to explore facets of mindfulness</title>
		<author>
			<persName><forename type="first">R</forename><forename type="middle">A</forename><surname>Baer</surname></persName>
		</author>
		<author>
			<persName><forename type="first">G</forename><forename type="middle">T</forename><surname>Smith</surname></persName>
		</author>
		<author>
			<persName><forename type="first">J</forename><surname>Hopkins</surname></persName>
		</author>
		<author>
			<persName><forename type="first">J</forename><surname>Krietemeyer</surname></persName>
		</author>
		<author>
			<persName><forename type="first">L</forename><surname>Toney</surname></persName>
		</author>
		<idno type="DOI">10.1177/1073191105283504</idno>
	</analytic>
	<monogr>
		<title level="j">Assessment</title>
		<imprint>
			<biblScope unit="volume">13</biblScope>
			<biblScope unit="page" from="27" to="45" />
			<date type="published" when="2006">2006</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b15">
	<monogr>
		<author>
			<persName><forename type="first">R</forename><forename type="middle">L</forename><surname>Greene</surname></persName>
		</author>
		<title level="m">The MMPI-2: An interpretive manual</title>
				<meeting><address><addrLine>Needham Heights, MA, US</addrLine></address></meeting>
		<imprint>
			<publisher>Allyn &amp; Bacon</publisher>
			<date type="published" when="2000">2000</date>
		</imprint>
	</monogr>
	<note>2nd ed</note>
</biblStruct>

<biblStruct xml:id="b16">
	<analytic>
		<title level="a" type="main">Identifying superfluous survey items</title>
		<author>
			<persName><forename type="first">K</forename><surname>Brosnan</surname></persName>
		</author>
		<author>
			<persName><forename type="first">B</forename><surname>Grün</surname></persName>
		</author>
		<author>
			<persName><forename type="first">S</forename><surname>Dolnicar</surname></persName>
		</author>
		<idno type="DOI">10.1016/j.jretconser.2018.02.007</idno>
	</analytic>
	<monogr>
		<title level="j">Journal of Retailing and Consumer Services</title>
		<imprint>
			<biblScope unit="volume">43</biblScope>
			<biblScope unit="page" from="39" to="45" />
			<date type="published" when="2018">2018</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b17">
	<analytic>
		<title level="a" type="main">XAI-Explainable artificial intelligence David</title>
		<author>
			<persName><forename type="first">G.-Z</forename><forename type="middle">Y</forename><surname>David Gunning</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Mark</forename><surname>Stefik</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Jaesik</forename><surname>Choi</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Timothy</forename><surname>Miller</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Simone</forename><surname>Stumpf</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="j">Science Robotics</title>
		<imprint>
			<biblScope unit="volume">1</biblScope>
			<date type="published" when="2019">2019</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b18">
	<analytic>
		<title level="a" type="main">SMOTE: Synthetic minority over-sampling technique</title>
		<author>
			<persName><forename type="first">N</forename><forename type="middle">V</forename><surname>Chawla</surname></persName>
		</author>
		<author>
			<persName><forename type="first">K</forename><forename type="middle">W</forename><surname>Bowyer</surname></persName>
		</author>
		<author>
			<persName><forename type="first">L</forename><forename type="middle">O</forename><surname>Hall</surname></persName>
		</author>
		<author>
			<persName><forename type="first">W</forename><forename type="middle">P</forename><surname>Kegelmeyer</surname></persName>
		</author>
		<idno type="DOI">10.1613/jair.953</idno>
		<idno type="arXiv">arXiv:1106.1813</idno>
	</analytic>
	<monogr>
		<title level="j">Journal of Artificial Intelligence Research</title>
		<imprint>
			<biblScope unit="volume">16</biblScope>
			<biblScope unit="page" from="321" to="357" />
			<date type="published" when="2002">2002</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b19">
	<analytic>
		<title level="a" type="main">A unified approach to interpreting model predictions</title>
		<author>
			<persName><forename type="first">S</forename><forename type="middle">M</forename><surname>Lundberg</surname></persName>
		</author>
		<author>
			<persName><forename type="first">S.-I</forename><surname>Lee</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="m">Advances in Neural Information Processing Systems 30</title>
				<editor>
			<persName><forename type="first">I</forename><surname>Guyon</surname></persName>
		</editor>
		<editor>
			<persName><forename type="first">U</forename><forename type="middle">V</forename><surname>Luxburg</surname></persName>
		</editor>
		<editor>
			<persName><forename type="first">S</forename><surname>Bengio</surname></persName>
		</editor>
		<editor>
			<persName><forename type="first">H</forename><surname>Wallach</surname></persName>
		</editor>
		<editor>
			<persName><forename type="first">R</forename><surname>Fergus</surname></persName>
		</editor>
		<editor>
			<persName><forename type="first">S</forename><surname>Vishwanathan</surname></persName>
		</editor>
		<editor>
			<persName><forename type="first">R</forename><surname>Garnett</surname></persName>
		</editor>
		<imprint>
			<publisher>Curran Associates, Inc</publisher>
			<date type="published" when="2017">2017</date>
			<biblScope unit="page" from="4765" to="4774" />
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b20">
	<analytic>
		<title level="a" type="main">why should i trust you?&quot;: Explaining the predictions of any classifier</title>
		<author>
			<persName><forename type="first">M</forename><forename type="middle">T</forename><surname>Ribeiro</surname></persName>
		</author>
		<author>
			<persName><forename type="first">S</forename><surname>Singh</surname></persName>
		</author>
		<author>
			<persName><forename type="first">C</forename><surname>Guestrin</surname></persName>
		</author>
		<idno type="DOI">10.1145/2939672.2939778</idno>
	</analytic>
	<monogr>
		<title level="m">Proceedings of the 22nd ACM SIGKDD International Conference on Knowledge Discovery and Data Mining</title>
				<meeting>the 22nd ACM SIGKDD International Conference on Knowledge Discovery and Data Mining<address><addrLine>New York, NY, USA</addrLine></address></meeting>
		<imprint>
			<publisher>Association for Computing Machinery</publisher>
			<date type="published" when="2016">2016</date>
			<biblScope unit="page" from="1135" to="1144" />
		</imprint>
	</monogr>
</biblStruct>

				</listBibl>
			</div>
		</back>
	</text>
</TEI>
