<?xml version="1.0" encoding="UTF-8"?>
<TEI xml:space="preserve" xmlns="http://www.tei-c.org/ns/1.0" 
xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" 
xsi:schemaLocation="http://www.tei-c.org/ns/1.0 https://raw.githubusercontent.com/kermitt2/grobid/master/grobid-home/schemas/xsd/Grobid.xsd"
 xmlns:xlink="http://www.w3.org/1999/xlink">
	<teiHeader xml:lang="en">
		<fileDesc>
			<titleStmt>
				<title level="a" type="main">Reliable Central Nervous System Tumor Differentiation on MRI Images with Deep Neural Networks and Conformal Prediction</title>
			</titleStmt>
			<publicationStmt>
				<publisher/>
				<availability status="unknown"><licence/></availability>
				<date type="published" when="2024-10-20">20 October 2024</date>
			</publicationStmt>
			<sourceDesc>
				<biblStruct>
					<analytic>
						<author>
							<persName><forename type="first">Luis</forename><surname>Balderas</surname></persName>
							<affiliation key="aff0">
								<orgName type="department" key="dep1">School of Sciences, Technology and Engineering&apos;s Doctorates. Department of Computer Science and Artificial Intelligence</orgName>
								<orgName type="department" key="dep2">DiCITS</orgName>
							</affiliation>
							<affiliation key="aff1">
								<orgName type="department" key="dep1">DaSCI</orgName>
								<orgName type="department" key="dep2">iMUDS</orgName>
								<orgName type="institution">University of Granada</orgName>
								<address>
									<postCode>18071</postCode>
									<settlement>Granada</settlement>
									<country key="ES">Spain</country>
								</address>
							</affiliation>
						</author>
						<author>
							<persName><forename type="first">María</forename><surname>Moreno De Castro</surname></persName>
							<affiliation key="aff0">
								<orgName type="department" key="dep1">School of Sciences, Technology and Engineering&apos;s Doctorates. Department of Computer Science and Artificial Intelligence</orgName>
								<orgName type="department" key="dep2">DiCITS</orgName>
							</affiliation>
							<affiliation key="aff1">
								<orgName type="department" key="dep1">DaSCI</orgName>
								<orgName type="department" key="dep2">iMUDS</orgName>
								<orgName type="institution">University of Granada</orgName>
								<address>
									<postCode>18071</postCode>
									<settlement>Granada</settlement>
									<country key="ES">Spain</country>
								</address>
							</affiliation>
						</author>
						<author>
							<persName><forename type="first">Miguel</forename><surname>Lastra</surname></persName>
							<affiliation key="aff2">
								<orgName type="department" key="dep1">Department of Software Engineering</orgName>
								<orgName type="department" key="dep2">DiCITS</orgName>
								<orgName type="department" key="dep3">DaSCI</orgName>
								<orgName type="department" key="dep4">iMUDS</orgName>
								<orgName type="institution">University of Granada</orgName>
								<address>
									<postCode>18071</postCode>
									<settlement>Granada</settlement>
									<country key="ES">Spain</country>
								</address>
							</affiliation>
						</author>
						<author>
							<persName><forename type="first">Jose</forename><forename type="middle">P</forename><surname>Martínez</surname></persName>
							<affiliation key="aff3">
								<orgName type="department">Radiodiagnosis Service</orgName>
								<orgName type="institution">Hospital Universitario &quot;Virgen de las Nieves&quot;</orgName>
								<address>
									<settlement>Granada</settlement>
									<country key="ES">Spain</country>
								</address>
							</affiliation>
							<affiliation key="aff4">
								<orgName type="institution" key="instit1">ibs</orgName>
								<orgName type="institution" key="instit2">Granada</orgName>
								<orgName type="institution" key="instit3">Instituto Biosanitario de Granada</orgName>
								<address>
									<settlement>Granada</settlement>
									<country key="ES">Spain</country>
								</address>
							</affiliation>
						</author>
						<author>
							<persName><forename type="first">Francisco</forename><forename type="middle">J</forename><surname>Pérez</surname></persName>
							<affiliation key="aff3">
								<orgName type="department">Radiodiagnosis Service</orgName>
								<orgName type="institution">Hospital Universitario &quot;Virgen de las Nieves&quot;</orgName>
								<address>
									<settlement>Granada</settlement>
									<country key="ES">Spain</country>
								</address>
							</affiliation>
						</author>
						<author>
							<persName><forename type="first">Antonio</forename><surname>Laínez</surname></persName>
							<affiliation key="aff3">
								<orgName type="department">Radiodiagnosis Service</orgName>
								<orgName type="institution">Hospital Universitario &quot;Virgen de las Nieves&quot;</orgName>
								<address>
									<settlement>Granada</settlement>
									<country key="ES">Spain</country>
								</address>
							</affiliation>
							<affiliation key="aff4">
								<orgName type="institution" key="instit1">ibs</orgName>
								<orgName type="institution" key="instit2">Granada</orgName>
								<orgName type="institution" key="instit3">Instituto Biosanitario de Granada</orgName>
								<address>
									<settlement>Granada</settlement>
									<country key="ES">Spain</country>
								</address>
							</affiliation>
						</author>
						<author>
							<persName><forename type="first">Antonio</forename><surname>Arauzo-Azofra</surname></persName>
							<affiliation key="aff5">
								<orgName type="department" key="dep1">Rural Engineering Department</orgName>
								<orgName type="department" key="dep2">DiCITS Lab</orgName>
								<orgName type="institution">University of Córdoba</orgName>
								<address>
									<postCode>14005</postCode>
									<settlement>Córdoba</settlement>
									<country key="ES">Spain</country>
								</address>
							</affiliation>
						</author>
						<author>
							<persName><forename type="first">José</forename><forename type="middle">M</forename><surname>Benítez</surname></persName>
							<affiliation key="aff0">
								<orgName type="department" key="dep1">School of Sciences, Technology and Engineering&apos;s Doctorates. Department of Computer Science and Artificial Intelligence</orgName>
								<orgName type="department" key="dep2">DiCITS</orgName>
							</affiliation>
							<affiliation key="aff1">
								<orgName type="department" key="dep1">DaSCI</orgName>
								<orgName type="department" key="dep2">iMUDS</orgName>
								<orgName type="institution">University of Granada</orgName>
								<address>
									<postCode>18071</postCode>
									<settlement>Granada</settlement>
									<country key="ES">Spain</country>
								</address>
							</affiliation>
							<affiliation key="aff4">
								<orgName type="institution" key="instit1">ibs</orgName>
								<orgName type="institution" key="instit2">Granada</orgName>
								<orgName type="institution" key="instit3">Instituto Biosanitario de Granada</orgName>
								<address>
									<settlement>Granada</settlement>
									<country key="ES">Spain</country>
								</address>
							</affiliation>
						</author>
						<author>
							<affiliation key="aff6">
								<address>
									<settlement>Santiago de Compostela</settlement>
									<country key="ES">Spain</country>
								</address>
							</affiliation>
						</author>
						<title level="a" type="main">Reliable Central Nervous System Tumor Differentiation on MRI Images with Deep Neural Networks and Conformal Prediction</title>
					</analytic>
					<monogr>
						<idno type="ISSN">1613-0073</idno>
						<imprint>
							<date type="published" when="2024-10-20">20 October 2024</date>
						</imprint>
					</monogr>
					<idno type="MD5">A4E79D3136B095CB90A82D253938EF71</idno>
				</biblStruct>
			</sourceDesc>
		</fileDesc>
		<encodingDesc>
			<appInfo>
				<application version="0.7.2" ident="GROBID" when="2025-04-23T18:11+0000">
					<desc>GROBID - A machine learning software for extracting information from scholarly documents</desc>
					<ref target="https://github.com/kermitt2/grobid"/>
				</application>
			</appInfo>
		</encodingDesc>
		<profileDesc>
			<textClass>
				<keywords>
					<term>0000-0002-3845-8848 (L. Balderas)</term>
					<term>0000-0003-0440-0864 (M. Moreno de Castro)</term>
					<term>0000-0002-7278-2668 (M. Lastra)</term>
					<term>0000-0002-0663-2856 (A. Laínez)</term>
					<term>0000-0002-2486-5792 (A. Arauzo-Azofra)</term>
					<term>0000-0002-2346-0793 (J. M. Benítez)</term>
				</keywords>
			</textClass>
			<abstract>
<div xmlns="http://www.tei-c.org/ns/1.0"><p>Central nervous system tumors, particularly gliomas, rank among the top 10 causes of cancer-related deaths worldwide. Thus, precise differentiation of these tumors is crucial for effective treatment, which can reduce patient suffering and lower mortality rates. We propose a deep learning-based technique for glioma differentiation using MRI imaging, which incorporates two novel approaches. First, we represent perfusion sequences as time series, which serve as inputs for a Deep Neural Network (DNN) classifier. This classifier is trained to distinguish the sequences between low-grade glioma (LGG) and high-grade glioma (HGG). Second, we employ Conformal Prediction to calibrate the results, ensuring they include the true category with a 90% probability. This approach has been rigorously tested to evaluate its performance. Our experimental results demonstrate that our deep neural network not only provides accurate but also ensures trustworthy predictions.</p></div>
			</abstract>
		</profileDesc>
	</teiHeader>
	<text xml:lang="en">
		<body>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="1.">Introduction</head><p>Central nervous system (CNS) tumors have traditionally been regarded as a lethal form of cancer, ranking among the top 10 causes of deaths globally. The GLOBOCAN project using nationwide data from 184 countries estimated the annual incidence of malignant-only CNS tumors to be 3.4 per 100,000 individuals <ref type="bibr" target="#b0">[1]</ref>. Within the variety of tumor types, gliomas are the most frequent primary intracerebral tumors in adults. Despite their high fatality rates, the prognosis of CNS tumors has considerably improved over the last decades, possibly because of the prompt detection, the optimization of treatment protocols including the introduction of temozolomide and the advances in neurosurgical procedures.</p><p>Accurate preoperative differentiation of primary CNS tumors is crucial because the treatment strategies differ substantially (e.g. stereotactic biopsy + chemotherapy vs. gross total resection + chemotherapy in lymphoma vs. glioblastoma). Magnetic Resonance Imaging (MRI) is the most important non-invasive technique in the diagnosis and differentiation of CNS tumors. In this context, MRI-perfusion is an imaging technique frequently used to assess the vascularization of brain lesions in a minimally invasive way. There are different approaches for the study of perfusion and lesions of CNS.</p><p>Machine learning has been employed in numerous medical problems as part of expert decision support systems. However, in most instances, these systems do not provide any information regarding the confidence of their predictions. In this paper we propose an innovative approach that treats perfusion curves as time series data and apply Deep Neural Networks (DNN) and Conformal Predictors (CP) to assess the type of glioma a patient suffers, along with measures of confidence.</p><p>In essence, this involves framing the differentiation problem as a classification task using the perfusion curve as input. This requires finding a suitable representation for the series and then identifying a technique that delivers high classification performance. On top of the classifier, a conformal predictor is built to quantify the level of uncertainty inherent in the model's predictions using specific metrics. Our research has resulted in an effective automated procedure to assist radiologists in their work, contributing to the quantification of uncertainty at the patient level, with applications in personalized and precision medicine.</p><p>The structure of the article is as follows: In Section 2, we present state-of-the-art methods that use deep learning and conformal prediction for glioma differentiation, including medical context for a better understanding of the problem. In Section 3 we detail Conformal Predictors. In Section 4, we present our proposal for glioma differentiation. In Section 5, we include the empirical study and discussion of the results. Finally, Section 6 contains the conclusions of the work.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="2.">Related work</head></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="2.1.">Medical contextualization</head><p>As noted in the introduction, gliomas are the most frequent primary intracerebral tumors in adults. The age-adjusted annual incidence of histologic verified glioma has been reported to be 7.3 cases per 100,000 person-years <ref type="bibr" target="#b1">[2]</ref>. Most patients with gliomas have a fatal prognosis, and the disease has considerable impact on patients and their families' physical, psychological, and social status. A recent study on the epidemiology of gliomas found that high-grade gliomas -HGG, grades 3 and 4 according to World Health Organization (WHO)-were present in 85% and low-grade glioma (LGG, WHO 1 and 3 grades) in 15% of the cases, with 5-year overall survival of 82, 54, 22 and 3% for grade 1, 2, 3, and 4, respectively <ref type="bibr" target="#b2">[3]</ref>.</p><p>Accurate preoperative differentiation of primary CNS tumors is essential because the treatment strategies differ substantially. MRI is the most important non-invasive technique in the diagnosis of CNS tumors. In particular, MRI-perfusion is frequently used to assess the vascularization of brain lesions. There are different approaches for the study of perfusion and lesions of CNS. The most widely used MRI-perfusion approach in clinical practice is T2 gradient echo or dynamic susceptibility contrast (DSC) due to its high sensitivity and specificity to differentiate lesions and its short acquisition time. DSC perfusion allows the study of changes in the signal intensity of the tissues derived from the passage of an intravenous gadolinium bolus administered in a peripheral vein. The passage of the contrast bolus leads to specific imaging patterns in different tissues and tumors, with changes in their signal intensity proportional to the amount of gadolinium that passes through or is deposited in them. Changes in signal intensity over time allow a curve to be obtained, from which hemodynamic parameters are inferred.</p><p>At present, pathological anatomy techniques are essential in the diagnosis and genetic and histological differentiation of gliomas. However, in the presence of lesions such as metastases, an adequate diagnostic imaging can avoid a brain biopsy. The procedure of stereotactic brain biopsy entails a considerable risk of complications (e.g., haemorrhage, infection, wound breakdown), which can be as high as 15.3% in tumors located in midline areas, while 28.8% of post-procedural intracranial haemorrhages have been reported <ref type="bibr" target="#b3">[4]</ref>.</p><p>A recent Cochrane review <ref type="bibr" target="#b4">[5]</ref> reported limited available evidence on the ability of perfusion MRI to distinguish HGG from LGG, which precludes reliable estimation of the performance of DSC MRI perfusion-derived parameters (e.g., relative cerebral blood volume or rCBV) for determining the tumor grade, specifically in untreated solid and non-enhancing LGG vs. HGG. MRI-perfusion has also been advocated as a useful tool to differentiate between gliomas and other tumors of the CNS, such as lymphomas or metastases, but with variable diagnostic yields depending on the publications. Furthermore, it demonstrated to be useful in differentiating between tumor recurrence of gliomas and post-treatment changes such as pseudo progression or radionecrosis. However, the available evidence is restricted to isolated non-clinically validated studies.</p><p>Most of these publications have focused on a classical analysis of MRI perfusion data, with special emphasis on the quantification of rCBV (an estimate of tumor perfusion), which is not quantifiable in absolute terms (thus requiring comparison with areas of normal cerebral parenchyma). A number or publications that have applied Artificial Intelligence algorithms to the analysis of brain perfusion can be found. They are discussed in section 2.2.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="2.2.">State-of-art Artificial Intelligence methods</head><p>In this section, we present the most relevant articles in the state of the art related to the topic. To the best of our knowledge, there is no technique in the literature that utilizes the perfusion curve as input for a time series classification model in low-grade gliomas (LGG) and high-grade gliomas (HGG). Moreover, there are numerous approaches in the literature that apply CP to quantify the uncertainty of deep learning models ( <ref type="bibr" target="#b5">[6]</ref>, <ref type="bibr" target="#b6">[7]</ref>). In fact, the combination of deep learning and CP is especially useful in biomedical problems. For example, in skin lesion classification ( <ref type="bibr" target="#b7">[8]</ref>), for the diagnosis and grading of prostate biopsies ( <ref type="bibr" target="#b8">[9]</ref>), for rating breast density in mammography ( <ref type="bibr" target="#b9">[10]</ref>), for grading the severity of spinal stenosis in lumbar spine MRI ( <ref type="bibr" target="#b10">[11]</ref>); among other applications ( <ref type="bibr" target="#b11">[12]</ref>, <ref type="bibr" target="#b12">[13]</ref>, <ref type="bibr" target="#b13">[14]</ref>), we have not encountered in the literature any work that combines DNN and CP methods in the differentiation of central nervous system tumors.</p><p>However, the non-invasive differentiation of gliomas through the application of machine learning, specifically distinguishing between LGG and HGG gliomas, has been extensively investigated in recent years. For instance, in <ref type="bibr" target="#b14">[15]</ref>, a substantial number of radiological features were extracted from MRI sequences, including T1-weighted, T1-weighted contrast-enhanced, T2-weighted, and FLAIR, across a total of 285 cases (210 HGG, 75 LGG). These features were used to train three classifiers (logistic regression, random forest, and support vector machine) to determine the glioma type, achieving an average AUC of 0.9030 for test cohorts.</p><p>In <ref type="bibr" target="#b15">[16]</ref>, a deep multi-scale 3D Convolutional Neural Network (CNN) architecture was proposed to categorize gliomas into LGG and HGG using volumetric T1 contrast-enhanced MRI sequences, achieving an accuracy of 96.49%.</p><p>Recently, some studies advocate mixed approaches incorporating molecular profiling for the differentiation of LGG and HGG ( <ref type="bibr" target="#b16">[17]</ref>). For instance, in the work by authors in <ref type="bibr" target="#b17">[18]</ref>, clinical and laboratory data were integrated to create a tool for predicting the molecular status (ATRX, IDH1/2, MGMT, and 1p19q co-deletion), distinguishing between low-grade and high-grade gliomas. The system achieved an AUC of 0.885 for this specific learning task.</p><p>Finally, other studies such as <ref type="bibr" target="#b18">[19]</ref>, <ref type="bibr" target="#b19">[20]</ref>, <ref type="bibr" target="#b20">[21]</ref>, and <ref type="bibr" target="#b21">[22]</ref> utilized cases of high-grade or low-grade gliomas to conduct specific studies on various features, but did not present tools for classification between these two grades of gliomas.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="3.">Conformal predictors</head><p>In spite of their generally accurate performance, many machine learning models are known to estimate poorly prediction probabilities. To deliver reliable estimates and avoid over or under-confidence predictions, prediction uncertainty must be quantified. This decision aligns with the demand of trustworthy Artificial Intelligence, which, as expressed in recent European Parliament AI regulations <ref type="bibr" target="#b23">[23]</ref>, includes as a requirement the models ability to quantify and communicate their confidence in their outputs ( <ref type="bibr" target="#b24">[24]</ref>, <ref type="bibr" target="#b5">[6]</ref>) with special focus on high-risk applications as AI-supported medicine <ref type="bibr" target="#b25">[25]</ref>.</p><p>Performance metrics, such as accuracy or F1-score, cannot tell about the confidence or uncertainty of the model's predictions. Even for a model that is right most of the time, not all the cases are equally easy to classify. Some of them might even be doubtful (e.g., they belong to a different distribution or their kind was mostly under represented, overlooked, or misclassified). For example, we can think about patients images from a different hospital, taken from a different MRI scanner, or labeled by another team. The model may provide unnoticed overly confident predictions because machine learning algorithms do not include a built-in warning mechanism to prevent well-informed predictions from looking the same as wild guesses <ref type="bibr" target="#b26">[26]</ref> and refers to the alignment between predicted probabilities directly provided by the model and relative frequencies in the actual data. Well-calibrated models are those where the predicted probabilities match the empirical probabilities. Thus, it is about calculating "the probability that the predicted probability is right". For example, given an MRI scan, if the model predicts class A with 80% probability, then class A should occur approximately 80 times out of 100 predictions. More formally, a well-calibrated classifier satisfies the following formula <ref type="bibr" target="#b27">[27]</ref>:</p><formula xml:id="formula_0">𝑃 (actual class is A|predicted probability of A is 𝑝) ≈ 𝑝<label>(1)</label></formula><p>To provide confidence to classification results, calibration models should be applied. Two of the most popular calibration methods are Platt's Scaling and Isotonic Regression. Platt's Scaling <ref type="bibr" target="#b28">[28]</ref> is a very popular method that maps each prediction to its empirical frequency by passing it through a sigmoid. The method is therefore parametric and presupposes normally distributed and heteroscedastic per-class scores, a notably limiting assumption <ref type="bibr" target="#b29">[29]</ref>. On the other hand, Isotonic Regression <ref type="bibr" target="#b30">[30]</ref> is more general because the map is performed with an isotonic (monotonically increasing) function. It assumes that the classifier perfectly ranks objects in the test set, essentially implying an ROC AUC of 1 and it is not recommended for small sets <ref type="bibr" target="#b29">[29]</ref>. A detailed explanation of how both calibration methods can be found in <ref type="bibr" target="#b31">[31]</ref>.</p><p>One step ahead of calibration is conformalization. To conformalize means that each single-point prediction is not only calibrated but also provided with a prediction interval, with statistical guarantees of including the true value at patient-level ( <ref type="bibr" target="#b27">[27]</ref>, <ref type="bibr" target="#b32">[32]</ref>, <ref type="bibr" target="#b29">[29]</ref>). Conformal Prediction (CP) methods conformalize the prediction. CP methods, which are distribution-free and lightweight, have shown some successful application in health-related domains, mostly for cancer prediction ( <ref type="bibr" target="#b33">[33]</ref>, <ref type="bibr" target="#b34">[34]</ref>, <ref type="bibr" target="#b35">[35]</ref>, <ref type="bibr" target="#b32">[32]</ref>, <ref type="bibr" target="#b36">[36]</ref>, <ref type="bibr" target="#b34">[34]</ref>, <ref type="bibr" target="#b37">[37]</ref>, <ref type="bibr" target="#b38">[38]</ref>, <ref type="bibr" target="#b39">[39]</ref>).</p><p>Venn-ABERS methods ( <ref type="bibr" target="#b40">[40]</ref>, <ref type="bibr" target="#b27">[27]</ref>) are members of the CP family <ref type="bibr" target="#b41">[41]</ref>, <ref type="bibr" target="#b42">[42]</ref>, <ref type="bibr" target="#b43">[43]</ref>). They share the skill to evaluate how different is an unseen instance from the training dataset. These methods were created to work on top of binary classifiers (although new implementations work for multi-class problems too <ref type="bibr" target="#b44">[44]</ref>). They conformalize the predicted probability to match the actual frequency of its class, while delivering in the process the upper (𝑝 1 ) and lower (𝑝 0 ) bounds of the probability interval that includes the true class (a property known as coverage or validity) with statistical guarantee. This prediction interval quantifies the uncertainty of predictions at instance level: the larger the interval, the lower the confidence the model has in that prediction. Venn-ABERS are an adaptation of Isotonic Regression (where it is applied twice, to fit the probability of each class) and a special case of Venn Predictors ( <ref type="bibr" target="#b45">[45]</ref>, <ref type="bibr" target="#b46">[46]</ref> , <ref type="bibr" target="#b29">[29]</ref>), from which they inherit guaranteed validity in the form of well-calibrated probability prediction.</p><p>There are two possible implementations of the Venn-ABERS algorithm depending on whether or not an independent calibration set is required separate from the training set. On one hand, an inductive approach, or Inductive Venn-ABERS (I-V-A), where the calibration is trained over a hold-on split of the training set, thus the conformalization is model-agnostic <ref type="bibr" target="#b46">[46]</ref>. On the other hand, Cross Venn-ABERS (C-V-A) where the splits are performed via k-fold, thus there is not need to reserve data just for calibration as in the inductive case and we use all available data to train the classifier but the classifier must be retrained each time we predict and conformalize the probabilitiy of a new patient <ref type="bibr" target="#b33">[33]</ref>.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="4.">Our proposal</head><p>This work presents a novel methodology for the non-invasive differentiation of a specific family of CNS tumors, specifically distinguishing between high-grade (HGG) and low-grade gliomas (LGG). Patient data are 3D MRI scans focused on the T2 sequence. The T2 sequence is designed to measure the evolution of tissue signal intensity as the contrast bolus passes through. From these changes in signal intensity in the image, once processed, we construct the perfusion curve, which serves as input for our machine learning model. Thus, we transform an image processing problem into a time series classification one, which we address by combining two impactful technologies: on one hand, a deep The process initiates with the reception of a new perfusion sequence. After preprocessing the images, we extract the perfusion curve by calculating the mean luminance of the voxels at different time points. Subsequently, a CP-DNN is trained to extract the final prediction and quantify its uncertainty.</p><p>neural network capable of extracting patterns with high precision; and on the other hand, conformal predictors for quantifying the uncertainty of predictions. Consequently, we develop a decision support system with significant generalization capacity, providing valuable and calibrated information to the radiologist. The presented pipeline is divided into three phases: preprocessing of the sequence, generation of the perfusion curve, and finally, glioma differentiation with a machine learning model, specifically, a conformal predictor based on a deep neural network classifier. Below, we provide a detailed description of each phase. Figure <ref type="figure" target="#fig_0">1</ref> show the complete pipeline.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="4.1.">Preprocessing the perfusion MRI sequence</head><p>The differentiation process begins with the arrival of a new perfusion sequence. The first phase, related to preprocessing, involves normalizing the image in both size and grayscale levels using the Statistical Parametric Mapping technique <ref type="bibr" target="#b47">[47]</ref>. Additionally, it is crucial that the image is segmented. Despite numerous initiatives aiming to develop deep learning models for brain segmentation in MRI (as illustrated in <ref type="bibr" target="#b48">[48]</ref> and other reviews), there is, to the best of our knowledge, no automatic technique for segmenting an image in the perfusion sequence. Therefore, in our approach, cases have been segmented by radiologists using the 3D Slicer tool (https://www.slicer.org, <ref type="bibr" target="#b49">[49]</ref>).</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="4.2.">Generating the perfusion curve</head><p>Once the perfusion sequence is normalized and segmented, we generate the curve. The perfusion sequence consists of a series of snapshots taken over a specified period. This procedure generates 𝑛 3D images of the brain and, specifically, the glioma. By processing each of these 𝑛 images, calculating the mean luminance value of each voxel within the image in each snapshot, we generate a time series with as many points as snapshots. This way, a time series is generated out of the perfusion sequence, the perfusion curve. After that, the time series is normalized by subtracting the mean of the points and dividing by their standard deviation.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="4.3.">Characterizing the Glioma with a CP based on DNN</head><p>The differentiation of gliomas into low grade (LGG) and high grade (HGG) requires a machine learning system capable of extracting relevant patterns to distinguish between the two tumor types. Consequently, we constructed a deep dense neural network that takes a perfusion curve as input and classifies it into LGG and HGG. This is an unbalanced classification problem due to the prevalence of the HGG class in the data set over the LGG class. Thus, to evaluate the DNN performance, we calculate the accuracy and F1-score.</p><p>To enhance the trustworthiness of the classifier outputs, its probabilities must be calibrated. We calibrate the predictions of the model applying four independent calibration techniques: Platt's Scaling (PS), Isotonic (IR), Cross Venn-ABERS (C-V-A), and Inductive Venn-ABERS (I-V-A).</p><p>The performance of the calibrators is evaluated with classification and calibration metrics. In this way, physicians have access not only to artificial intelligence-based tools with a high level of accuracy but also to the ability to assess the confidence that these models have in each of the predictions associated with the patients, lending credibility to those predictions in which the model has sufficient confidence. To achieve this, we employ a Conformal Predictor with a specified confidence level, 𝜂, (e.g. 90%) on top of the DNN. Thus, the radiologist will know, with each prediction, whether the model has confidence exceeding 𝜂 in determining whether the tumor is a low-grade or high-grade glioma, what would increase his or her trust on the differentiation model performance.</p><p>To the best of our knowledge, there is no state-of-the-art method that addresses the problem of glioma differentiation by applying explainability and trustworthiness methods, using perfusion sequences as time series and applying DNN and CP in this binary classification context.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="5.">Empirical study</head><p>To demonstrate the ability of our method to differentiate between high-grade and low-grade gliomas satisfactorily, we have conducted a rigorous experimentation. It is detailed in this section along with the results and their analysis.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="5.1.">Dataset</head><p>We have compiled a cohort of 58 patients from the radiology department of the Virgen de las Nieves Hospital in Granada, Spain, selected for their exceptional quality and homogeneity in the MRI scans taken for their diagnosis and treatment.</p><p>Due to the rather small size of the dataset, we have designed a data augmentation strategy to effectively train our machine learning models. For the training partition, we generate perfusion curves not only at the level of the entire volume but also across the different 2D slices that compose it along the Z-axis. All slices of the same sequence inherit the label, either LGG or HGG, from the original sequence. This extends the training set to exceed 700 curves. Besides the anticipated imbalanced character of the problem arises. The distribution of instances between the two classes is 70% (HGG) and 30% (LGG). To address this issue, the models need to be adjusted to weigh the prediction error, making it more costly to make errors in predicting the LGG class than the HGG class.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="5.2.">Deep Neural Network: architecture and hyperparameters</head><p>Taking into account that the patient cohort is not very extensive, the dense neural network to be used cannot be very large, as we might incur in overfitting issues. After different attempts, an architecture with five layers (input, output, and three hidden layers with 70, 30, and 5 neurons) is considered, which yields competitive results.</p><p>For the selection of hyperparameters, a Grid Search Cross Validation is applied to choose the optimization algorithm and the parameters 𝛼 (strength of the L2 regularization term), initial learning rate, 𝛽 1 (exponential decay rate for fist moment vector), 𝛽 2 (exponential decay rate for second moment vector), and 𝜖 (value for numerical stability). The result of this hyperparameter tuning process produced the following value selection:</p><p>• Optimization algorithm: Adam • Initial Learning rate: 0.001</p><p>• 𝛼 : 0.0001</p><p>• 𝛽 1 : 0.9</p><p>• 𝛽 2 : 0.9</p><p>• 𝜖 : 0.000000001</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="5.3.">Metrics</head><p>Our proposal combines deep learning and conformal prediction. We use classic metrics to evaluate the goodness of the prediction and calibration metrics to assess the level of uncertainty in the predictions. For classification metrics, we use accuracy and F1-Score. For calibration metrics, we use Brier Score and Log Loss. The first one is defined as:</p><formula xml:id="formula_1">𝐵𝑆 = 1 𝑛 𝑛 ∑︁ 𝑖=1 (𝑝 𝑖 − 𝑜 𝑖 ) 2 , (<label>2</label></formula><formula xml:id="formula_2">)</formula><p>where 𝑝 is the prediction probability of occurrence of the event 𝑖, and 𝑜 𝑖 is defined as follows:</p><formula xml:id="formula_3">𝑜 𝑖 = {︂ 1 if event 𝑖 ocurred 0 if event 𝑖 not ocurred<label>(3)</label></formula><p>Log Loss is defined as</p><formula xml:id="formula_4">𝐿 𝑙𝑜𝑔 (𝑦, 𝑝) = −(𝑦 log(𝑝) + (1 − 𝑦) log(1 − 𝑝))<label>(4)</label></formula><p>with 𝑦 ∈ {0, 1} and a probability estimate 𝑝 = 𝑃 𝑟(𝑦 = 1).</p><p>For both of them, Brier Score and Log Loss, the smaller the value, the better is the calibration.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="5.4.">Results and analysis</head><p>We calculated the accuracy and F1-score to compare the performance of our novel DNN for time series classification approach with the leading state-of-the-art method for time series classification, which is a 1NN with Dynamic Time Warping ( <ref type="bibr" target="#b50">[50]</ref>, <ref type="bibr" target="#b51">[51]</ref>).</p><p>We have designed a data strategy to ensure the rigor of the study. In all cases, we guarantee the separation between patients is maintained. Firstly, to confirm the reliability of the results, a Stratified 5-fold Cross Validation is used. This involves generating five datasets where patients are split into 80% for training and 20% for testing each time, maintaining class proportions in each fold.</p><p>The values in Tables <ref type="table" target="#tab_1">1 and 2</ref> represent the mean values from the five runs for each metric on the test set, demonstrating that our DNN approach outperforms the state-of-the-art 1NN-DTW in both performance and calibration. These results confirm previous analyses where Inductive Venn-ABERS and other CP methods outperformed Platt's Scaling and Isotonic Regression <ref type="bibr" target="#b46">[46]</ref>.</p><p>In order to unleash the true power of the DNN+CP (actually, Inductive Venn-ABERS) combination, we conduct another experiment where the dataset is partitioned into training and test sets, with 80% of the patients used for training and 20% for testing, again in a stratified manner. We plot in Figure <ref type="figure" target="#fig_2">2</ref> the predicted and conformalized probabilities for the 12 instances (MRI scans) in the test set. On the X-axis, we can see the 12 predictions made by the model. On the Y-axis, we find the probability expressed by the model, with 0 representing a prediction of the LGG class and 1 representing a prediction of the HGG class. The black dots indicate the actual labels of the test examples. As can be seen, there are 3 cases of LGG and 9 cases of HGG, maintaining the stratification of the original dataset. The larger light blue dot corresponds to the predictions made by the dense neural network without conformalization. When the black dot and the blue dot coincide, it indicates that the neural network correctly predicted the class. Conversely, if they do not coincide, the neural network made an incorrect prediction.</p><p>The smaller blue dot (𝑝 0 ) and the red dot (𝑝 1 ) represent the probability interval containing each of the calibrated predictions (𝑝), depicted by the orange dot. This orange dot represents the predictions of our DNN+CP model expressed in terms of probability, where a probability 𝑝 ≥ 0.5 results in a predicted label of 1 (HGG class). Conversely, if 𝑝 &lt; 0.5, the predicted label is 0 (LGG class). The distance between 𝑝 0 and 𝑝 1 (𝑝 1 − 𝑝 0 ) indicates the uncertainty in the model's decision: the greater the distance between them, the higher the uncertainty in the prediction. This uncertainty is represented by the pink curve.</p><p>As observed, the neural network without conformalization makes two errors (the second and the eleventh cases). Thanks to the conformalization of the predictions, the DNN+CP model correctly predicts the second case, as the predicted probability is below 0.5, resulting in an LGG class label. Regarding the eleventh case, the DNN+CP, like the non-conformalized DNN, makes the error of categorizing the case as HGG when it is actually LGG. However, it can be seen that the uncertainty in that prediction is very high, showing confidence of less than 60%. Similarly, predictions with some uncertainty are made in the first (slightly over 60%) and third cases (close to 80%). The rest of predictions are more reliable, showing a confidence ranging from 85% to 99%.</p><p>Therefore, the combination of DNN+CP is not only more accurate, as it corrects errors that an uncalibrated neural network would make, but it also provides very valuable information to doctors about the confidence of the predictions, allowing specialists to assess each case with much more trustworthy information.  </p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="6.">Conclusions</head><p>In this article, we address a global public health issue, ranked among the top 10 causes of cancerrelated mortality worldwide: the detection of central nervous system tumors. Specifically, we focus on differentiating gliomas into their two types: high-grade gliomas (HGG) and low-grade gliomas (LGG). To achieve this, we introduce a novel methodology based on time series classification. By utilizing MRI-perfusion, we transform the image into a time series, called the perfusion curve, which reflects tissue vascularization in a non-invasive manner. To classify these perfusion curves between LGG and HGG, a conformal predictor based on a deep neural network is trained. We have compared our proposal with the state-of-the-art technique in time series classification through rigorous experimentation, based on a dataset of patients from the radiology department of the "Virgen de las Nieves Hospital" in Granada, Spain, obtaining satisfactory results. We demonstrate that our methodology is not only innovative in the way it transforms the image problem into sequences, but also that the combination of deep neural networks and conformal prediction for time series classification generates an ideal tool for radiologists This tool displays exceptional generalization capability and the reduced uncertainty in its predictions, making it useful, reliable and trustworthy. This study contributes to quantifying uncertainty at patient-level with applications in personalized and precision medicine. Besides, by improving the confidence in AI-medical applications, this study also aligns with the requirements of the European Parliament AI regulation to achieve Trustworthy AI.</p></div><figure xmlns="http://www.tei-c.org/ns/1.0" xml:id="fig_0"><head>Figure 1 :</head><label>1</label><figDesc>Figure 1: Complete processing pipeline for glioma differentiation between low-grade and high-grade.The process initiates with the reception of a new perfusion sequence. After preprocessing the images, we extract the perfusion curve by calculating the mean luminance of the voxels at different time points. Subsequently, a CP-DNN is trained to extract the final prediction and quantify its uncertainty.</figDesc></figure>
<figure xmlns="http://www.tei-c.org/ns/1.0" xml:id="fig_2"><head>Figure 2 :</head><label>2</label><figDesc>Figure 2: Probability vs conformal probability for MRI scans in the test set. Only thanks to the conformalization, the misclassified patient (second from the left) is correctly classified as a high glioma case. Large intervals show a low confidence in those predictions.</figDesc></figure>
<figure xmlns="http://www.tei-c.org/ns/1.0" type="table" xml:id="tab_0"><head>Table 1</head><label>1</label><figDesc>Performance metrics include accuracy and F1-score (the higher the better), and calibration metrics include Brier Score and Log Loss (the smaller the better) for the DNN model, which outperforms the state-of-the-art 1NN-DTW model (see Table2). The last four rows correspond to the implementations of the four calibration methods: IR stands for Isotonic Regression, PS stands for Platt's Scaling, C-V-A stands for Cross Venn-ABERS, and I-V-A stands for Inductive Venn-ABERS. All methods improve model performance, with Inductive Venn-ABERS significantly reducing calibration errors. The best results are highlighted in bold.</figDesc><table><row><cell>Method</cell><cell>Acc</cell><cell cols="3">F1-Score Brier Score Log Loss</cell></row><row><cell>DNN</cell><cell cols="2">0.642 0.769</cell><cell>0.289</cell><cell>1.168</cell></row><row><cell>DNN + IR</cell><cell cols="2">0.733 0.842</cell><cell>0.2</cell><cell>1.185</cell></row><row><cell>DNN + PS</cell><cell cols="2">0.733 0.844</cell><cell>0.2</cell><cell>0.612</cell></row><row><cell cols="3">DNN + C-V-A 0.677 0.787</cell><cell>0.249</cell><cell>0.755</cell></row><row><cell>DNN + I-V-A</cell><cell cols="2">0.752 0.857</cell><cell>0.197</cell><cell>0.598</cell></row><row><cell>Method</cell><cell>Acc</cell><cell cols="3">F1-Score Brier Score Log Loss</cell></row><row><cell>1NN-DTW</cell><cell cols="2">0.692 0.769</cell><cell>0.288</cell><cell>10.376</cell></row><row><cell>1NN-DTW + IR</cell><cell cols="2">0.714 0.813</cell><cell>0.233</cell><cell>0.636</cell></row><row><cell>1NN-DTW + PS</cell><cell>0.73</cell><cell>0.844</cell><cell>0.248</cell><cell>0.634</cell></row><row><cell cols="3">1NN-DTW + C-V-A 0.675 0.786</cell><cell>0.27</cell><cell>0.857</cell></row><row><cell>1NN-DTW + I-V-A</cell><cell cols="2">0.746 0.848</cell><cell>0.201</cell><cell>0.62</cell></row></table></figure>
<figure xmlns="http://www.tei-c.org/ns/1.0" type="table" xml:id="tab_1"><head>Table 2</head><label>2</label><figDesc>Similar to Table1, here are the results for the state-of-the-art 1NN-DTW model. The classifier shows lower performance and calibration metrics compared to our approach. IR stands for Isotonic Regression, PS stands for Platt's Scaling, C-V-A stands for Cross Venn-ABERS, and I-V-A stands for Inductive Venn-ABERS. The best results are highlighted in bold.</figDesc><table /></figure>
		</body>
		<back>

			<div type="acknowledgement">
<div xmlns="http://www.tei-c.org/ns/1.0"><head>Acknowledgments</head><p>This research has been partially funded by Spanish Ministry of Economy, Industry and Competitiveness (PID2020-118224RB-100 and PID2023-151336OB-I00), con-financed by the European Union (FEDER).</p></div>
			</div>

			<div type="references">

				<listBibl>

<biblStruct xml:id="b0">
	<analytic>
		<title level="a" type="main">Cancer incidence and mortality worldwide: sources, methods and major patterns in GLOBOCAN 2012</title>
		<author>
			<persName><forename type="first">J</forename><surname>Ferlay</surname></persName>
		</author>
		<author>
			<persName><forename type="first">I</forename><surname>Soerjomataram</surname></persName>
		</author>
		<author>
			<persName><forename type="first">R</forename><surname>Dikshit</surname></persName>
		</author>
		<author>
			<persName><forename type="first">S</forename><surname>Eser</surname></persName>
		</author>
		<author>
			<persName><forename type="first">C</forename><surname>Mathers</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><surname>Rebelo</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="j">Int. J. Cancer</title>
		<imprint>
			<biblScope unit="volume">136</biblScope>
			<biblScope unit="page" from="E359" to="Ee86" />
			<date type="published" when="2015">2015</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b1">
	<analytic>
		<title level="a" type="main">The epidemiology of glioma in adults: a &quot;state of the science&quot; review</title>
		<author>
			<persName><forename type="first">Q</forename><surname>Ostrom</surname></persName>
		</author>
		<author>
			<persName><forename type="first">L</forename><surname>Bauchet</surname></persName>
		</author>
		<author>
			<persName><forename type="first">F</forename><surname>Davis</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="j">Neuro Oncology</title>
		<imprint>
			<biblScope unit="volume">16</biblScope>
			<biblScope unit="page" from="894" to="913" />
			<date type="published" when="2014">2014</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b2">
	<analytic>
		<title level="a" type="main">Epidemiology of glioma: clinical characteristics, symptoms, and predictors of glioma pationes grade I-IV in the danish neuro-oncology registry</title>
		<author>
			<persName><forename type="first">B</forename><surname>Rasmussen</surname></persName>
		</author>
		<author>
			<persName><forename type="first">S</forename><surname>Hansen</surname></persName>
		</author>
		<author>
			<persName><forename type="first">R</forename><surname>Larsen</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><surname>Kosteljanetz</surname></persName>
		</author>
		<author>
			<persName><forename type="first">H</forename><surname>Schultz</surname></persName>
		</author>
		<author>
			<persName><forename type="first">B</forename><surname>Bøgård</surname></persName>
		</author>
		<idno type="DOI">10.1007/s11060-017-2607-5</idno>
	</analytic>
	<monogr>
		<title level="j">Journal of Neuro-Oncology</title>
		<imprint>
			<biblScope unit="volume">135</biblScope>
			<biblScope unit="page" from="571" to="549" />
			<date type="published" when="2017">2017</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b3">
	<analytic>
		<title level="a" type="main">The risk of hemorrhage in steriotactic biopsy for brain tumorus</title>
		<author>
			<persName><forename type="first">Y</forename><surname>Mizobuchi</surname></persName>
		</author>
		<author>
			<persName><forename type="first">K</forename><surname>Nkajima</surname></persName>
		</author>
		<author>
			<persName><forename type="first">T</forename><surname>Fujihara</surname></persName>
		</author>
		<author>
			<persName><forename type="first">K</forename><surname>Matsuzaki</surname></persName>
		</author>
		<author>
			<persName><forename type="first">H</forename><surname>Mure</surname></persName>
		</author>
		<author>
			<persName><forename type="first">S</forename><surname>Nagahiro</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Y</forename><surname>Takagi</surname></persName>
		</author>
		<idno type="DOI">10.2152/jmi.66.314</idno>
	</analytic>
	<monogr>
		<title level="j">J. Medical Investigation</title>
		<imprint>
			<biblScope unit="volume">66</biblScope>
			<biblScope unit="page" from="317" to="318" />
			<date type="published" when="2019">2019</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b4">
	<analytic>
		<title level="a" type="main">Magnetic resonance perfusion for differentiating low-grade frmo high-grade gliomas at first presentation (Review)</title>
		<author>
			<persName><forename type="first">J</forename><surname>Abrigo</surname></persName>
		</author>
		<author>
			<persName><forename type="first">D</forename><surname>Fountain</surname></persName>
		</author>
		<author>
			<persName><forename type="first">J</forename><surname>Provenzale</surname></persName>
		</author>
		<author>
			<persName><forename type="first">E</forename><surname>Law</surname></persName>
		</author>
		<author>
			<persName><forename type="first">J</forename><surname>Kwong</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><surname>Hart</surname></persName>
		</author>
		<author>
			<persName><forename type="first">W</forename><surname>Tam</surname></persName>
		</author>
		<idno type="DOI">10.1002/14651858.CD011551.pub2</idno>
	</analytic>
	<monogr>
		<title level="j">Cochrane Database of Systematic Reviews</title>
		<imprint>
			<date type="published" when="2018">2018</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b5">
	<analytic>
		<title level="a" type="main">A review of uncertainty quantification in deep learning: Techniques, applications and challenges</title>
		<author>
			<persName><forename type="first">M</forename><surname>Abdar</surname></persName>
		</author>
		<author>
			<persName><forename type="first">F</forename><surname>Pourpanah</surname></persName>
		</author>
		<author>
			<persName><forename type="first">S</forename><surname>Hussain</surname></persName>
		</author>
		<author>
			<persName><forename type="first">D</forename><surname>Rezazadegan</surname></persName>
		</author>
		<author>
			<persName><forename type="first">L</forename><surname>Liu</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><surname>Ghavamzadeh</surname></persName>
		</author>
		<author>
			<persName><forename type="first">P</forename><surname>Fieguth</surname></persName>
		</author>
		<author>
			<persName><forename type="first">X</forename><surname>Cao</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A</forename><surname>Khosravi</surname></persName>
		</author>
		<author>
			<persName><forename type="first">U</forename><forename type="middle">R</forename><surname>Acharya</surname></persName>
		</author>
		<author>
			<persName><forename type="first">V</forename><surname>Makarenkov</surname></persName>
		</author>
		<author>
			<persName><forename type="first">S</forename><surname>Nahavandi</surname></persName>
		</author>
		<idno type="DOI">10.1016/j.inffus.2021.05.008</idno>
		<ptr target="https://doi.org/10.1016/j.inffus.2021.05.008" />
	</analytic>
	<monogr>
		<title level="j">Information Fusion</title>
		<imprint>
			<biblScope unit="volume">76</biblScope>
			<biblScope unit="page" from="243" to="297" />
			<date type="published" when="2021">2021</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b6">
	<analytic>
		<title level="a" type="main">Quantifying deep learning model uncertainty in conformal prediction</title>
		<author>
			<persName><forename type="first">H</forename><surname>Karimi</surname></persName>
		</author>
		<author>
			<persName><forename type="first">R</forename><surname>Samavi</surname></persName>
		</author>
		<idno type="DOI">10.1609/aaaiss.v1i1.27492</idno>
		<ptr target="http://dx.doi.org/10.1609/aaaiss.v1i1.27492.doi:10.1609/aaaiss.v1i1.27492" />
	</analytic>
	<monogr>
		<title level="m">Proceedings of the AAAI Symposium Series</title>
				<meeting>the AAAI Symposium Series</meeting>
		<imprint>
			<date type="published" when="2023">2023</date>
			<biblScope unit="volume">1</biblScope>
			<biblScope unit="page" from="142" to="148" />
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b7">
	<analytic>
		<title level="a" type="main">Empirical validation of conformal prediction for trustworthy skin lesions classification</title>
		<author>
			<persName><forename type="first">J</forename><surname>Fayyad</surname></persName>
		</author>
		<author>
			<persName><forename type="first">S</forename><surname>Alijani</surname></persName>
		</author>
		<author>
			<persName><forename type="first">H</forename><surname>Najjaran</surname></persName>
		</author>
		<idno type="DOI">10.1016/j.cmpb.2024.108231</idno>
		<ptr target="https://doi.org/10.1016/j.cmpb.2024.108231" />
	</analytic>
	<monogr>
		<title level="j">Computer Methods and Programs in Biomedicine</title>
		<imprint>
			<biblScope unit="volume">253</biblScope>
			<biblScope unit="page">108231</biblScope>
			<date type="published" when="2024">2024</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b8">
	<analytic>
		<title level="a" type="main">Estimating diagnostic uncertainty in artificial intelligence assisted pathology using conformal prediction</title>
		<author>
			<persName><forename type="first">H</forename><surname>Olsson</surname></persName>
		</author>
		<author>
			<persName><forename type="first">K</forename><surname>Kartasalo</surname></persName>
		</author>
		<author>
			<persName><forename type="first">N</forename><surname>Mulliqi</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><surname>Capuccini</surname></persName>
		</author>
		<author>
			<persName><forename type="first">P</forename><surname>Ruusuvuori</surname></persName>
		</author>
		<author>
			<persName><forename type="first">H</forename><surname>Samaratunga</surname></persName>
		</author>
		<author>
			<persName><forename type="first">B</forename><surname>Delahunt</surname></persName>
		</author>
		<author>
			<persName><forename type="first">C</forename><surname>Lindskog</surname></persName>
		</author>
		<author>
			<persName><forename type="first">E</forename><forename type="middle">A M</forename><surname>Janssen</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A</forename><surname>Blilie</surname></persName>
		</author>
		<author>
			<persName><forename type="first">L</forename><surname>Egevad</surname></persName>
		</author>
		<author>
			<persName><forename type="first">O</forename><surname>Spjuth</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><surname>Eklund</surname></persName>
		</author>
		<author>
			<persName><forename type="first">I</forename><forename type="middle">P I E</forename><surname>Panel</surname></persName>
		</author>
		<idno type="DOI">10.1038/s41467-022-34945-8</idno>
		<ptr target="https://doi.org/10.1038/s41467-022-34945-8.doi:10.1038/s41467-022-34945-8" />
	</analytic>
	<monogr>
		<title level="j">Nature Communications</title>
		<imprint>
			<biblScope unit="volume">13</biblScope>
			<biblScope unit="page">7761</biblScope>
			<date type="published" when="2022">2022</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b9">
	<monogr>
		<title level="m" type="main">Three applications of conformal prediction for rating breast density in mammography</title>
		<author>
			<persName><forename type="first">C</forename><surname>Lu</surname></persName>
		</author>
		<author>
			<persName><forename type="first">K</forename><surname>Chang</surname></persName>
		</author>
		<author>
			<persName><forename type="first">P</forename><surname>Singh</surname></persName>
		</author>
		<author>
			<persName><forename type="first">J</forename><surname>Kalpathy-Cramer</surname></persName>
		</author>
		<ptr target="https://arxiv.org/abs/2206.12008.arXiv:2206.12008" />
		<imprint>
			<date type="published" when="2022">2022</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b10">
	<analytic>
		<title level="a" type="main">Improving trustworthiness of ai disease severity rating in medical imaging with ordinal conformal prediction sets</title>
		<author>
			<persName><forename type="first">C</forename><surname>Lu</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A</forename><forename type="middle">N</forename><surname>Angelopoulos</surname></persName>
		</author>
		<author>
			<persName><forename type="first">S</forename><surname>Pomerantz</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="m">Medical Image Computing and Computer Assisted Intervention -MICCAI 2022</title>
				<editor>
			<persName><forename type="first">L</forename><surname>Wang</surname></persName>
		</editor>
		<editor>
			<persName><forename type="first">Q</forename><surname>Dou</surname></persName>
		</editor>
		<editor>
			<persName><forename type="first">P</forename><forename type="middle">T</forename><surname>Fletcher</surname></persName>
		</editor>
		<editor>
			<persName><forename type="first">S</forename><surname>Speidel</surname></persName>
		</editor>
		<editor>
			<persName><forename type="first">S</forename><surname>Li</surname></persName>
		</editor>
		<meeting><address><addrLine>Nature Switzerland, Cham</addrLine></address></meeting>
		<imprint>
			<publisher>Springer</publisher>
			<date type="published" when="2022">2022</date>
			<biblScope unit="page" from="545" to="554" />
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b11">
	<analytic>
		<title level="a" type="main">Conformal prediction in clinical medical sciences</title>
		<author>
			<persName><forename type="first">J</forename><surname>Vazquez</surname></persName>
		</author>
		<author>
			<persName><forename type="first">J</forename><forename type="middle">C</forename><surname>Facelli</surname></persName>
		</author>
		<idno type="DOI">10.1007/s41666-021-00113-8</idno>
		<ptr target="https://doi.org/10.1007/s41666-021-00113-8.doi:10.1007/s41666-021-00113-8" />
	</analytic>
	<monogr>
		<title level="j">Journal of Healthcare Informatics Research</title>
		<imprint>
			<biblScope unit="volume">6</biblScope>
			<biblScope unit="page" from="241" to="252" />
			<date type="published" when="2022">2022</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b12">
	<analytic>
		<title level="a" type="main">Fair conformal predictors for applications in medical imaging</title>
		<author>
			<persName><forename type="first">C</forename><surname>Lu</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A</forename><surname>Lemay</surname></persName>
		</author>
		<author>
			<persName><forename type="first">K</forename><surname>Chang</surname></persName>
		</author>
		<author>
			<persName><forename type="first">K</forename><surname>Höbel</surname></persName>
		</author>
		<author>
			<persName><forename type="first">J</forename><surname>Kalpathy-Cramer</surname></persName>
		</author>
		<idno type="DOI">10.1609/aaai.v36i11.21459</idno>
		<ptr target="https://ojs.aaai.org/index.php/AAAI/article/view/21459.doi:10.1609/aaai.v36i11.21459" />
	</analytic>
	<monogr>
		<title level="m">Proceedings of the AAAI Conference on Artificial Intelligence</title>
				<meeting>the AAAI Conference on Artificial Intelligence</meeting>
		<imprint>
			<date type="published" when="2022">2022</date>
			<biblScope unit="volume">36</biblScope>
			<biblScope unit="page" from="12008" to="12016" />
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b13">
	<analytic>
		<title level="a" type="main">Deep learning with conformal prediction for hierarchical analysis of large-scale whole-slide tissue images</title>
		<author>
			<persName><forename type="first">H</forename><surname>Wieslander</surname></persName>
		</author>
		<author>
			<persName><forename type="first">P</forename><forename type="middle">J</forename><surname>Harrison</surname></persName>
		</author>
		<author>
			<persName><forename type="first">G</forename><surname>Skogberg</surname></persName>
		</author>
		<author>
			<persName><forename type="first">S</forename><surname>Jackson</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><surname>Fridén</surname></persName>
		</author>
		<author>
			<persName><forename type="first">J</forename><surname>Karlsson</surname></persName>
		</author>
		<author>
			<persName><forename type="first">O</forename><surname>Spjuth</surname></persName>
		</author>
		<author>
			<persName><forename type="first">C</forename><surname>Wählby</surname></persName>
		</author>
		<idno type="DOI">10.1109/JBHI.2020.2996300</idno>
	</analytic>
	<monogr>
		<title level="j">IEEE Journal of Biomedical and Health Informatics</title>
		<imprint>
			<biblScope unit="volume">25</biblScope>
			<biblScope unit="page" from="371" to="380" />
			<date type="published" when="2021">2021</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b14">
	<analytic>
		<title level="a" type="main">Classification of the glioma grading using radiomics analysis</title>
		<author>
			<persName><forename type="first">H.-H</forename><surname>Cho</surname></persName>
		</author>
		<author>
			<persName><forename type="first">S.-H</forename><surname>Lee</surname></persName>
		</author>
		<author>
			<persName><forename type="first">J</forename><surname>Kim</surname></persName>
		</author>
		<author>
			<persName><forename type="first">H</forename><surname>Park</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="j">PeerJ</title>
		<imprint>
			<biblScope unit="volume">6</biblScope>
			<biblScope unit="page">e5982</biblScope>
			<date type="published" when="2018">2018</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b15">
	<analytic>
		<title level="a" type="main">Deep multi-scale 3d convolutional neural network (cnn) for mri gliomas brain tumor classification</title>
		<author>
			<persName><forename type="first">H</forename><surname>Mzoughi</surname></persName>
		</author>
		<author>
			<persName><forename type="first">I</forename><surname>Njeh</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A</forename><surname>Wali</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><forename type="middle">B</forename><surname>Slima</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A</forename><surname>Benhamida</surname></persName>
		</author>
		<author>
			<persName><forename type="first">C</forename><surname>Mhiri</surname></persName>
		</author>
		<author>
			<persName><forename type="first">K</forename><forename type="middle">B</forename><surname>Mahfoudhe</surname></persName>
		</author>
		<idno type="DOI">10.1007/s10278-020-00347-9</idno>
		<ptr target="https://doi.org/10.1007/s10278-020-00347-9.doi:10.1007/s10278-020-00347-9" />
	</analytic>
	<monogr>
		<title level="j">Journal of Digital Imaging</title>
		<imprint>
			<biblScope unit="volume">33</biblScope>
			<biblScope unit="page" from="903" to="915" />
			<date type="published" when="2020">2020</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b16">
	<analytic>
		<title level="a" type="main">Molecular profiling of gliomas: potential therapeutic implications</title>
		<author>
			<persName><forename type="first">S</forename><forename type="middle">C P D E P A I</forename><surname>Agusti Alentorn</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Alberto</forename><surname>Duran-Peña</surname></persName>
		</author>
		<author>
			<persName><forename type="first">S</forename><surname>Kesari</surname></persName>
		</author>
		<idno type="DOI">10.1586/14737140.2015.1062368</idno>
		<idno>arXiv:</idno>
		<ptr target="https://doi.org/10.1586/14737140.2015.1062368" />
	</analytic>
	<monogr>
		<title level="j">Expert Review of Anticancer Therapy</title>
		<imprint>
			<biblScope unit="volume">15</biblScope>
			<biblScope unit="page" from="955" to="962" />
			<date type="published" when="2015">2015</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b17">
	<analytic>
		<title level="a" type="main">Fully automated mr based virtual biopsy of cerebral gliomas</title>
		<author>
			<persName><forename type="first">J</forename><surname>Haubold</surname></persName>
		</author>
		<author>
			<persName><forename type="first">R</forename><surname>Hosch</surname></persName>
		</author>
		<author>
			<persName><forename type="first">V</forename><surname>Parmar</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><surname>Glas</surname></persName>
		</author>
		<author>
			<persName><forename type="first">N</forename><surname>Guberina</surname></persName>
		</author>
		<author>
			<persName><forename type="first">O</forename><forename type="middle">A</forename><surname>Catalano</surname></persName>
		</author>
		<author>
			<persName><forename type="first">D</forename><surname>Pierscianek</surname></persName>
		</author>
		<author>
			<persName><forename type="first">K</forename><surname>Wrede</surname></persName>
		</author>
		<author>
			<persName><forename type="first">C</forename><surname>Deuschl</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><surname>Forsting</surname></persName>
		</author>
		<author>
			<persName><forename type="first">F</forename><surname>Nensa</surname></persName>
		</author>
		<author>
			<persName><forename type="first">N</forename><surname>Flaschel</surname></persName>
		</author>
		<author>
			<persName><forename type="first">L</forename><surname>Umutlu</surname></persName>
		</author>
		<idno type="DOI">10.3390/cancers13246186</idno>
		<ptr target="https://www.mdpi.com/2072-6694/13/24/6186.doi:10.3390/cancers13246186" />
	</analytic>
	<monogr>
		<title level="j">Cancers</title>
		<imprint>
			<biblScope unit="volume">13</biblScope>
			<date type="published" when="2021">2021</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b18">
	<analytic>
		<title level="a" type="main">Diffusion-and perfusion-weighted mri radiomics model may predict isocitrate dehydrogenase (idh) mutation and tumor aggressiveness in diffuse lower grade glioma</title>
		<author>
			<persName><forename type="first">M</forename><surname>Kim</surname></persName>
		</author>
		<author>
			<persName><forename type="first">S</forename><forename type="middle">Y</forename><surname>Jung</surname></persName>
		</author>
		<author>
			<persName><forename type="first">J</forename><forename type="middle">E</forename><surname>Park</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Y</forename><surname>Jo</surname></persName>
		</author>
		<author>
			<persName><forename type="first">S</forename><forename type="middle">Y</forename><surname>Park</surname></persName>
		</author>
		<author>
			<persName><forename type="first">S</forename><forename type="middle">J</forename><surname>Nam</surname></persName>
		</author>
		<author>
			<persName><forename type="first">J</forename><forename type="middle">H</forename><surname>Kim</surname></persName>
		</author>
		<author>
			<persName><forename type="first">H</forename><forename type="middle">S</forename><surname>Kim</surname></persName>
		</author>
		<idno type="DOI">10.1007/s00330-019-06548-3</idno>
		<ptr target="https://doi.org/10.1007/s00330-019-06548-3.doi:10.1007/s00330-019-06548-3" />
	</analytic>
	<monogr>
		<title level="j">European Radiology</title>
		<imprint>
			<biblScope unit="volume">30</biblScope>
			<biblScope unit="page" from="2142" to="2151" />
			<date type="published" when="2020">2020</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b19">
	<analytic>
		<title level="a" type="main">Noninvasive prediction of idh1 mutation and atrx expression loss in low-grade gliomas using multiparametric mr radiomic features</title>
		<author>
			<persName><forename type="first">Y</forename><surname>Ren</surname></persName>
		</author>
		<author>
			<persName><forename type="first">X</forename><surname>Zhang</surname></persName>
		</author>
		<author>
			<persName><forename type="first">W</forename><surname>Rui</surname></persName>
		</author>
		<author>
			<persName><forename type="first">H</forename><surname>Pang</surname></persName>
		</author>
		<author>
			<persName><forename type="first">T</forename><surname>Qiu</surname></persName>
		</author>
		<author>
			<persName><forename type="first">J</forename><surname>Wang</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Q</forename><surname>Xie</surname></persName>
		</author>
		<author>
			<persName><forename type="first">T</forename><surname>Jin</surname></persName>
		</author>
		<author>
			<persName><forename type="first">H</forename><surname>Zhang</surname></persName>
		</author>
		<author>
			<persName><forename type="first">H</forename><surname>Chen</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Y</forename><surname>Zhang</surname></persName>
		</author>
		<author>
			<persName><forename type="first">H</forename><surname>Lu</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Z</forename><surname>Yao</surname></persName>
		</author>
		<author>
			<persName><forename type="first">J</forename><surname>Zhang</surname></persName>
		</author>
		<author>
			<persName><forename type="first">X</forename><surname>Feng</surname></persName>
		</author>
		<idno type="DOI">10.1002/jmri.26240</idno>
		<ptr target="https://onlinelibrary.wiley.com/doi/pdf/10.1002/jmri.26240" />
	</analytic>
	<monogr>
		<title level="j">Journal of Magnetic Resonance Imaging</title>
		<imprint>
			<biblScope unit="volume">49</biblScope>
			<biblScope unit="page" from="808" to="817" />
			<date type="published" when="2019">2019</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b20">
	<analytic>
		<title level="a" type="main">Prediction of molecular mutations in diffuse low-grade gliomas using mr imaging features</title>
		<author>
			<persName><forename type="first">Z</forename><forename type="middle">A</forename><surname>Shboul</surname></persName>
		</author>
		<author>
			<persName><forename type="first">J</forename><surname>Chen</surname></persName>
		</author>
		<author>
			<persName><forename type="first">K</forename><forename type="middle">M</forename><surname>Iftekharuddin</surname></persName>
		</author>
		<idno type="DOI">10.1038/s41598-020-60550-0</idno>
		<ptr target="https://doi.org/10.1038/s41598-020-60550-0.doi:10.1038/s41598-020-60550-0" />
	</analytic>
	<monogr>
		<title level="j">Scientific Reports</title>
		<imprint>
			<biblScope unit="volume">10</biblScope>
			<biblScope unit="page">3711</biblScope>
			<date type="published" when="2020">2020</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b21">
	<analytic>
		<title level="a" type="main">Combining radiomics and deep convolutional neural network features from preoperative MRI for predicting clinically relevant genetic biomarkers in glioblastoma</title>
		<author>
			<persName><forename type="first">E</forename><surname>Calabrese</surname></persName>
		</author>
		<author>
			<persName><forename type="first">J</forename><forename type="middle">D</forename><surname>Rudie</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A</forename><forename type="middle">M</forename><surname>Rauschecker</surname></persName>
		</author>
		<author>
			<persName><forename type="first">J</forename><forename type="middle">E</forename><surname>Villanueva-Meyer</surname></persName>
		</author>
		<author>
			<persName><forename type="first">J</forename><forename type="middle">L</forename><surname>Clarke</surname></persName>
		</author>
		<author>
			<persName><forename type="first">D</forename><forename type="middle">A</forename><surname>Solomon</surname></persName>
		</author>
		<author>
			<persName><forename type="first">S</forename><surname>Cha</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="j">Neuro-Oncology Advances</title>
		<imprint>
			<biblScope unit="volume">4</biblScope>
			<date type="published" when="2022">2022</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b22">
	<monogr>
		<title/>
		<idno type="DOI">10.1093/noajnl/vdac060</idno>
		<ptr target="https://academic.oup.com/noa/article-pdf/4/1/vdac060/43778051/vdac060.pdf" />
		<imprint/>
	</monogr>
</biblStruct>

<biblStruct xml:id="b23">
	<monogr>
		<ptr target="https://digital-strategy.ec.europa.eu/en/policies/regulatory-framework-ai" />
		<title level="m">AI Act -digital-strategy</title>
				<imprint>
			<date type="published" when="2024-04-24">2024. 24-04-2024</date>
		</imprint>
	</monogr>
	<note>ec.europa</note>
</biblStruct>

<biblStruct xml:id="b24">
	<analytic>
		<title level="a" type="main">Connecting the dots in trustworthy artificial intelligence: From ai principles, ethics, and key requirements to responsible ai systems and regulation</title>
		<author>
			<persName><forename type="first">N</forename><surname>Díaz-Rodríguez</surname></persName>
		</author>
		<author>
			<persName><forename type="first">J</forename><surname>Del</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><surname>Ser</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><surname>Coeckelbergh</surname></persName>
		</author>
		<author>
			<persName><forename type="first">E</forename><surname>López De Prado</surname></persName>
		</author>
		<author>
			<persName><forename type="first">F</forename><surname>Herrera-Viedma</surname></persName>
		</author>
		<author>
			<persName><surname>Herrera</surname></persName>
		</author>
		<idno type="DOI">10.1016/j.inffus.2023.101896</idno>
		<ptr target="https://doi.org/10.1016/j.inffus.2023.101896" />
	</analytic>
	<monogr>
		<title level="j">Information Fusion</title>
		<imprint>
			<biblScope unit="volume">99</biblScope>
			<biblScope unit="page">101896</biblScope>
			<date type="published" when="2023">2023</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b25">
	<monogr>
		<ptr target="https://www.coalitionforhealthai.org/" />
		<title level="m">CHAI -coalitionforhealthai</title>
				<imprint>
			<date type="published" when="2024-04-24">2024. Accessed 24-04-2024</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b26">
	<monogr>
		<title level="m" type="main">Introduction to conformal prediction with python</title>
		<author>
			<persName><forename type="first">C</forename><surname>Molnar</surname></persName>
		</author>
		<imprint>
			<date type="published" when="2023">2023</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b27">
	<analytic>
		<title level="a" type="main">Venn-abers predictors</title>
		<author>
			<persName><forename type="first">V</forename><surname>Vovk</surname></persName>
		</author>
		<author>
			<persName><forename type="first">I</forename><surname>Petej</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="m">Proceedings of the Thirtieth Conference on Uncertainty in Artificial Intelligence, UAI&apos;14</title>
				<meeting>the Thirtieth Conference on Uncertainty in Artificial Intelligence, UAI&apos;14<address><addrLine>Arlington, Virginia, USA</addrLine></address></meeting>
		<imprint>
			<publisher>AUAI Press</publisher>
			<date type="published" when="2014">2014</date>
			<biblScope unit="page" from="829" to="838" />
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b28">
	<monogr>
		<title level="m" type="main">Probabilistic outputs for support vector machines and comparisons to regularized likelihood methods</title>
		<author>
			<persName><forename type="first">J</forename><surname>Platt</surname></persName>
		</author>
		<ptr target="https://api.semanticscholar.org/CorpusID:56563878" />
		<imprint>
			<date type="published" when="1999">1999</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b29">
	<monogr>
		<author>
			<persName><forename type="first">V</forename><surname>Manokhin</surname></persName>
		</author>
		<title level="m">Practical guide to applied conformal prediction in python: Learn and apply the best uncertainty frameworks to your industry applications</title>
				<imprint>
			<date type="published" when="2023">2023</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b30">
	<analytic>
		<title level="a" type="main">Transforming classifier scores into accurate multiclass probability estimates</title>
		<author>
			<persName><forename type="first">B</forename><surname>Zadrozny</surname></persName>
		</author>
		<author>
			<persName><forename type="first">C</forename><surname>Elkan</surname></persName>
		</author>
		<idno type="DOI">10.1145/775047.775151</idno>
		<idno>doi:10.1145/775047.775151</idno>
		<ptr target="https://doi.org/10.1145/775047.775151" />
	</analytic>
	<monogr>
		<title level="m">Proceedings of the Eighth ACM SIGKDD International Conference on Knowledge Discovery and Data Mining, KDD &apos;02</title>
				<meeting>the Eighth ACM SIGKDD International Conference on Knowledge Discovery and Data Mining, KDD &apos;02<address><addrLine>New York, NY, USA</addrLine></address></meeting>
		<imprint>
			<publisher>Association for Computing Machinery</publisher>
			<date type="published" when="2002">2002</date>
			<biblScope unit="page" from="694" to="699" />
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b31">
	<analytic>
		<title level="a" type="main">Predicting good probabilities with supervised learning</title>
		<author>
			<persName><forename type="first">A</forename><surname>Niculescu-Mizil</surname></persName>
		</author>
		<author>
			<persName><forename type="first">R</forename><surname>Caruana</surname></persName>
		</author>
		<idno type="DOI">10.1145/1102351.1102430</idno>
		<idno>doi:10.1145/1102351.1102430</idno>
		<ptr target="https://doi.org/10.1145/1102351.1102430" />
	</analytic>
	<monogr>
		<title level="m">Proceedings of the 22nd International Conference on Machine Learning, ICML &apos;05</title>
				<meeting>the 22nd International Conference on Machine Learning, ICML &apos;05<address><addrLine>New York, NY, USA</addrLine></address></meeting>
		<imprint>
			<publisher>Association for Computing Machinery</publisher>
			<date type="published" when="2005">2005</date>
			<biblScope unit="page" from="625" to="632" />
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b32">
	<analytic>
		<title level="a" type="main">Prediction of metabolic transformations using cross Venn-ABERS predictors</title>
		<author>
			<persName><forename type="first">S</forename><surname>Arvidsson</surname></persName>
		</author>
		<author>
			<persName><forename type="first">O</forename><surname>Spjuth</surname></persName>
		</author>
		<author>
			<persName><forename type="first">L</forename><surname>Carlsson</surname></persName>
		</author>
		<author>
			<persName><forename type="first">P</forename><surname>Toccaceli</surname></persName>
		</author>
		<ptr target="https://proceedings.mlr.press/v60/arvidsson17a.html" />
	</analytic>
	<monogr>
		<title level="m">Proceedings of the Sixth Workshop on Conformal and Probabilistic Prediction and Applications</title>
				<editor>
			<persName><forename type="first">A</forename><surname>Gammerman</surname></persName>
		</editor>
		<editor>
			<persName><forename type="first">V</forename><surname>Vovk</surname></persName>
		</editor>
		<editor>
			<persName><forename type="first">Z</forename><surname>Luo</surname></persName>
		</editor>
		<editor>
			<persName><forename type="first">H</forename><surname>Papadopoulos</surname></persName>
		</editor>
		<meeting>the Sixth Workshop on Conformal and Probabilistic Prediction and Applications<address><addrLine>PMLR</addrLine></address></meeting>
		<imprint>
			<date type="published" when="2017">2017</date>
			<biblScope unit="volume">60</biblScope>
			<biblScope unit="page" from="118" to="131" />
		</imprint>
	</monogr>
	<note>Proceedings of Machine Learning Research</note>
</biblStruct>

<biblStruct xml:id="b33">
	<analytic>
		<title level="a" type="main">Machine learning classification with confidence: application of transductive conformal predictors to MRI-based diagnostic and prognostic markers in depression</title>
		<author>
			<persName><forename type="first">I</forename><surname>Nouretdinov</surname></persName>
		</author>
		<author>
			<persName><forename type="first">S</forename><forename type="middle">G</forename><surname>Costafreda</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A</forename><surname>Gammerman</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A</forename><surname>Chervonenkis</surname></persName>
		</author>
		<author>
			<persName><forename type="first">V</forename><surname>Vovk</surname></persName>
		</author>
		<author>
			<persName><forename type="first">V</forename><surname>Vapnik</surname></persName>
		</author>
		<author>
			<persName><forename type="first">C</forename><forename type="middle">H Y</forename><surname>Fu</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="j">Neuroimage</title>
		<imprint>
			<biblScope unit="volume">56</biblScope>
			<biblScope unit="page" from="809" to="813" />
			<date type="published" when="2010">2010</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b34">
	<analytic>
		<title level="a" type="main">Conformal predictors in early diagnostics of ovarian and breast cancers</title>
		<author>
			<persName><forename type="first">D</forename><surname>Devetyarov</surname></persName>
		</author>
		<author>
			<persName><forename type="first">I</forename><surname>Nouretdinov</surname></persName>
		</author>
		<author>
			<persName><forename type="first">B</forename><surname>Burford</surname></persName>
		</author>
		<author>
			<persName><forename type="first">S</forename><surname>Camuzeaux</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A</forename><surname>Gentry-Maharaj</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A</forename><surname>Tiss</surname></persName>
		</author>
		<author>
			<persName><forename type="first">C</forename><surname>Smith</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Z</forename><surname>Luo</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A</forename><surname>Chervonenkis</surname></persName>
		</author>
		<author>
			<persName><forename type="first">R</forename><surname>Hallett</surname></persName>
		</author>
		<author>
			<persName><forename type="first">V</forename><surname>Vovk</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><surname>Waterfield</surname></persName>
		</author>
		<author>
			<persName><forename type="first">R</forename><surname>Cramer</surname></persName>
		</author>
		<author>
			<persName><forename type="first">J</forename><forename type="middle">F</forename><surname>Timms</surname></persName>
		</author>
		<author>
			<persName><forename type="first">J</forename><surname>Sinclair</surname></persName>
		</author>
		<author>
			<persName><forename type="first">U</forename><surname>Menon</surname></persName>
		</author>
		<author>
			<persName><forename type="first">I</forename><surname>Jacobs</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A</forename><surname>Gammerman</surname></persName>
		</author>
		<idno type="DOI">10.1007/s13748-012-0021-y</idno>
		<ptr target="https://doi.org/10.1007/s13748-012-0021-y.doi:10.1007/s13748-012-0021-y" />
	</analytic>
	<monogr>
		<title level="j">Progress in Artificial Intelligence</title>
		<imprint>
			<biblScope unit="volume">1</biblScope>
			<biblScope unit="page" from="245" to="257" />
			<date type="published" when="2012">2012</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b35">
	<analytic>
		<title level="a" type="main">Reliable diagnosis of acute abdominal pain with conformal prediction</title>
		<author>
			<persName><forename type="first">H</forename><surname>Papadopoulos</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A</forename><surname>Gammerman</surname></persName>
		</author>
		<author>
			<persName><forename type="first">V</forename><surname>Vovk</surname></persName>
		</author>
		<ptr target="https://api.semanticscholar.org/CorpusID:18515829" />
	</analytic>
	<monogr>
		<title level="j">International journal of engineering intelligent systems for electrical engineering and communications</title>
		<imprint>
			<biblScope unit="volume">17</biblScope>
			<biblScope unit="page" from="127" to="137" />
			<date type="published" when="2009">2009</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b36">
	<analytic>
		<title level="a" type="main">Evolutionary conformal prediction for breast cancer diagnosis</title>
		<author>
			<persName><forename type="first">A</forename><surname>Lambrou</surname></persName>
		</author>
		<author>
			<persName><forename type="first">H</forename><surname>Papadopoulos</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A</forename><surname>Gammerman</surname></persName>
		</author>
		<idno type="DOI">10.1109/ITAB.2009.5394447</idno>
	</analytic>
	<monogr>
		<title level="m">9th International Conference on Information Technology and Applications in Biomedicine</title>
				<imprint>
			<date type="published" when="2009">2009. 2009</date>
			<biblScope unit="page" from="1" to="4" />
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b37">
	<analytic>
		<title level="a" type="main">Conformal prediction technique to predict breast cancer survivability</title>
		<author>
			<persName><forename type="first">L</forename><surname>Alnemer</surname></persName>
		</author>
		<author>
			<persName><forename type="first">L</forename><surname>Rajab</surname></persName>
		</author>
		<author>
			<persName><forename type="first">I</forename><surname>Aljarah</surname></persName>
		</author>
		<idno type="DOI">10.14257/ijast.2016.96.01</idno>
	</analytic>
	<monogr>
		<title level="j">International journal of advanced science and technology</title>
		<imprint>
			<biblScope unit="volume">96</biblScope>
			<biblScope unit="page" from="1" to="10" />
			<date type="published" when="2016">2016</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b38">
	<monogr>
		<author>
			<persName><forename type="first">A</forename><forename type="middle">S</forename><surname>Millar</surname></persName>
		</author>
		<author>
			<persName><forename type="first">J</forename><surname>Arnn</surname></persName>
		</author>
		<author>
			<persName><forename type="first">S</forename><surname>Himes</surname></persName>
		</author>
		<author>
			<persName><forename type="first">J</forename><forename type="middle">C</forename><surname>Facelli</surname></persName>
		</author>
		<idno type="DOI">10.3233/shti231113</idno>
		<ptr target="http://dx.doi.org/10.3233/SHTI231113.doi:10.3233/shti231113" />
		<title level="m">Uncertainty in breast cancer risk prediction: A conformal prediction study of race stratification</title>
				<imprint>
			<date type="published" when="2024">2024</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b39">
	<monogr>
		<title level="m" type="main">Conformal prediction of molecule-induced cancer cell growth inhibition challenged by strong distribution shifts</title>
		<author>
			<persName><forename type="first">S</forename><surname>Hernandez-Hernandez</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Q</forename><surname>Guo</surname></persName>
		</author>
		<author>
			<persName><forename type="first">P</forename><forename type="middle">J</forename><surname>Ballester</surname></persName>
		</author>
		<idno type="DOI">10.1101/2024.03.15.585269</idno>
		<idno>arXiv:</idno>
		<ptr target="https://www.biorxiv.org/content/early/2024/03/17/2024.03.15.585269.full.pdf" />
		<imprint>
			<date type="published" when="2024">2024</date>
			<pubPlace>bioRxiv</pubPlace>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b40">
	<analytic>
		<title level="a" type="main">An Empirical Distribution Function for Sampling with Incomplete Information</title>
		<author>
			<persName><forename type="first">M</forename><surname>Ayer</surname></persName>
		</author>
		<author>
			<persName><forename type="first">H</forename><forename type="middle">D</forename><surname>Brunk</surname></persName>
		</author>
		<author>
			<persName><forename type="first">G</forename><forename type="middle">M</forename><surname>Ewing</surname></persName>
		</author>
		<author>
			<persName><forename type="first">W</forename><forename type="middle">T</forename><surname>Reid</surname></persName>
		</author>
		<author>
			<persName><forename type="first">E</forename><surname>Silverman</surname></persName>
		</author>
		<idno type="DOI">10.1214/aoms/1177728423</idno>
		<ptr target="https://doi.org/10.1214/aoms/1177728423.doi:10.1214/aoms/1177728423" />
	</analytic>
	<monogr>
		<title level="j">The Annals of Mathematical Statistics</title>
		<imprint>
			<biblScope unit="volume">26</biblScope>
			<biblScope unit="page" from="641" to="647" />
			<date type="published" when="1955">1955</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b41">
	<analytic>
		<title level="a" type="main">Learning by transduction</title>
		<author>
			<persName><forename type="first">A</forename><surname>Gammerman</surname></persName>
		</author>
		<author>
			<persName><forename type="first">V</forename><surname>Vapnik</surname></persName>
		</author>
		<author>
			<persName><forename type="first">V</forename><surname>Vovk</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="m">Proceedings of the Fourteenth Conference on Uncertainty in Articial Intelligence</title>
				<meeting>the Fourteenth Conference on Uncertainty in Articial Intelligence</meeting>
		<imprint>
			<publisher>Morgan Kaufmann</publisher>
			<date type="published" when="1998">1998</date>
			<biblScope unit="page" from="148" to="156" />
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b42">
	<analytic>
		<title level="a" type="main">Transduction with confidence and credibility</title>
		<author>
			<persName><forename type="first">C</forename><surname>Saunders</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A</forename><surname>Gammerman</surname></persName>
		</author>
		<author>
			<persName><forename type="first">V</forename><surname>Vovk</surname></persName>
		</author>
		<ptr target="https://eprints.soton.ac.uk/258961/" />
	</analytic>
	<monogr>
		<title level="m">Sixteenth International Joint Conference on Artificial Intelligence (IJCAI &apos;99)</title>
				<imprint>
			<date type="published" when="1999">01/01/99. 1999</date>
			<biblScope unit="page" from="722" to="726" />
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b43">
	<analytic>
		<title level="a" type="main">Machine-learning applications of algorithmic randomness</title>
		<author>
			<persName><forename type="first">V</forename><surname>Vovk</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A</forename><surname>Gammerman</surname></persName>
		</author>
		<author>
			<persName><forename type="first">C</forename><surname>Saunders</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="m">Proceedings of the Sixteenth International Conference on Machine Learning</title>
				<meeting>the Sixteenth International Conference on Machine Learning</meeting>
		<imprint>
			<publisher>Morgan Kaufmann</publisher>
			<date type="published" when="1999">1999</date>
			<biblScope unit="page" from="444" to="453" />
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b44">
	<monogr>
		<title level="m" type="main">Multi-class probabilistic classification using inductive and cross Venn-Abers predictors</title>
		<author>
			<persName><forename type="first">V</forename><surname>Manokhin</surname></persName>
		</author>
		<ptr target="https://proceedings.mlr.press/v60/manokhin17a.html" />
		<imprint>
			<date type="published" when="2017">2017</date>
			<biblScope unit="volume">60</biblScope>
			<biblScope unit="page" from="228" to="240" />
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b45">
	<monogr>
		<title level="m" type="main">Algorithmic learning in a random world</title>
		<author>
			<persName><forename type="first">V</forename><surname>Vovk</surname></persName>
		</author>
		<imprint>
			<date type="published" when="2023">2023</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b46">
	<analytic>
		<title level="a" type="main">Alzheimer&apos;s Disease Neuroimaging Initiative, Targeting the uncertainty of predictions at patient-level using an ensemble of classifiers coupled with calibration methods, Venn-ABERS, and conformal predictors: A case study in AD</title>
		<author>
			<persName><forename type="first">T</forename><surname>Pereira</surname></persName>
		</author>
		<author>
			<persName><forename type="first">S</forename><surname>Cardoso</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><surname>Guerreiro</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A</forename><surname>Mendonça</surname></persName>
		</author>
		<author>
			<persName><forename type="first">S</forename><forename type="middle">C</forename><surname>De</surname></persName>
		</author>
		<author>
			<persName><surname>Madeira</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="j">J. Biomed. Inform</title>
		<imprint>
			<biblScope unit="volume">101</biblScope>
			<biblScope unit="page">103350</biblScope>
			<date type="published" when="2020">2020</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b47">
	<monogr>
		<title level="m" type="main">Statistical Parametric Mapping</title>
		<author>
			<persName><forename type="first">K</forename><forename type="middle">J</forename><surname>Friston</surname></persName>
		</author>
		<idno type="DOI">10.1007/978-1-4615-1079-6-16</idno>
		<idno>doi:10.1007/978-1-4615-1079-6-16</idno>
		<ptr target="https://doi.org/10.1007/978-1-4615-1079-6-16" />
		<imprint>
			<date type="published" when="2003">2003</date>
			<publisher>Springer US</publisher>
			<biblScope unit="page" from="237" to="250" />
			<pubPlace>Boston, MA</pubPlace>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b48">
	<analytic>
		<title level="a" type="main">Brain tumor segmentation of mri images: A comprehensive review on the application of artificial intelligence tools</title>
		<author>
			<persName><forename type="first">R</forename><surname>Ranjbarzadeh</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A</forename><surname>Caputo</surname></persName>
		</author>
		<author>
			<persName><forename type="first">E</forename><forename type="middle">B</forename><surname>Tirkolaee</surname></persName>
		</author>
		<author>
			<persName><forename type="first">S</forename><surname>Jafarzadeh</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><surname>Ghoushchi</surname></persName>
		</author>
		<author>
			<persName><surname>Bendechache</surname></persName>
		</author>
		<idno type="DOI">10.1016/j.compbiomed.2022.106405</idno>
		<ptr target="https://doi.org/10.1016/j.compbiomed.2022.106405" />
	</analytic>
	<monogr>
		<title level="j">Computers in Biology and Medicine</title>
		<imprint>
			<biblScope unit="volume">152</biblScope>
			<biblScope unit="page">106405</biblScope>
			<date type="published" when="2023">2023</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b49">
	<analytic>
		<title level="a" type="main">3d slicer as an image computing platform for the quantitative imaging network</title>
		<author>
			<persName><forename type="first">A</forename><surname>Fedorov</surname></persName>
		</author>
		<author>
			<persName><forename type="first">R</forename><surname>Beichel</surname></persName>
		</author>
		<author>
			<persName><forename type="first">J</forename><surname>Kalpathy-Cramer</surname></persName>
		</author>
		<author>
			<persName><forename type="first">J</forename><surname>Finet</surname></persName>
		</author>
		<author>
			<persName><forename type="first">J.-C</forename><surname>Fillion-Robin</surname></persName>
		</author>
		<author>
			<persName><forename type="first">S</forename><surname>Pujol</surname></persName>
		</author>
		<author>
			<persName><forename type="first">C</forename><surname>Bauer</surname></persName>
		</author>
		<author>
			<persName><forename type="first">D</forename><surname>Jennings</surname></persName>
		</author>
		<author>
			<persName><forename type="first">F</forename><surname>Fennessy</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><surname>Sonka</surname></persName>
		</author>
		<author>
			<persName><forename type="first">J</forename><surname>Buatti</surname></persName>
		</author>
		<author>
			<persName><forename type="first">S</forename><surname>Aylward</surname></persName>
		</author>
		<author>
			<persName><forename type="first">J</forename><forename type="middle">V</forename><surname>Miller</surname></persName>
		</author>
		<author>
			<persName><forename type="first">S</forename><surname>Pieper</surname></persName>
		</author>
		<author>
			<persName><forename type="first">R</forename><surname>Kikinis</surname></persName>
		</author>
		<idno type="DOI">10.1016/j.mri.2012.05.001</idno>
		<ptr target="https://doi.org/10.1016/j.mri.2012.05.001,quantitativeImaginginCancer" />
	</analytic>
	<monogr>
		<title level="j">Magnetic Resonance Imaging</title>
		<imprint>
			<biblScope unit="volume">30</biblScope>
			<biblScope unit="page" from="1323" to="1341" />
			<date type="published" when="2012">2012</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b50">
	<monogr>
		<author>
			<persName><forename type="first">A</forename><surname>Bagnall</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A</forename><surname>Bostrom</surname></persName>
		</author>
		<author>
			<persName><forename type="first">J</forename><surname>Large</surname></persName>
		</author>
		<author>
			<persName><forename type="first">J</forename><surname>Lines</surname></persName>
		</author>
		<ptr target="https://arxiv.org/abs/1602.01711.arXiv:1602.01711" />
		<title level="m">The great time series classification bake off: An experimental evaluation of recently proposed algorithms</title>
				<imprint>
			<date type="published" when="2016">2016</date>
		</imprint>
	</monogr>
	<note>extended version</note>
</biblStruct>

<biblStruct xml:id="b51">
	<monogr>
		<title level="m" type="main">Back to basics: A sanity check on modern time series classification algorithms</title>
		<author>
			<persName><forename type="first">B</forename><surname>Dhariyal</surname></persName>
		</author>
		<author>
			<persName><forename type="first">T</forename><forename type="middle">L</forename><surname>Nguyen</surname></persName>
		</author>
		<author>
			<persName><forename type="first">G</forename><surname>Ifrim</surname></persName>
		</author>
		<ptr target="https://arxiv.org/abs/2308.07886.arXiv:2308.07886" />
		<imprint>
			<date type="published" when="2023">2023</date>
		</imprint>
	</monogr>
</biblStruct>

				</listBibl>
			</div>
		</back>
	</text>
</TEI>
