<?xml version="1.0" encoding="UTF-8"?>
<TEI xml:space="preserve" xmlns="http://www.tei-c.org/ns/1.0" 
xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" 
xsi:schemaLocation="http://www.tei-c.org/ns/1.0 https://raw.githubusercontent.com/kermitt2/grobid/master/grobid-home/schemas/xsd/Grobid.xsd"
 xmlns:xlink="http://www.w3.org/1999/xlink">
	<teiHeader xml:lang="en">
		<fileDesc>
			<titleStmt>
				<title level="a" type="main">Using Wearable and Environmental Data to Improve the Prediction of Amyotrophic Lateral Sclerosis and Multiple Sclerosis Progression: an Explorative Study Notebook for the iDPP Lab on Intelligent Disease Progression Prediction at CLEF 2024</title>
			</titleStmt>
			<publicationStmt>
				<publisher/>
				<availability status="unknown"><licence/></availability>
			</publicationStmt>
			<sourceDesc>
				<biblStruct>
					<analytic>
						<author>
							<persName><forename type="first">Elena</forename><surname>Marinello</surname></persName>
							<email>elena.marinello@unipd.it</email>
							<affiliation key="aff0">
								<orgName type="department">Department of Information Engineering</orgName>
								<orgName type="institution">University of Padova</orgName>
								<address>
									<settlement>Padova</settlement>
									<country key="IT">Italy</country>
								</address>
							</affiliation>
						</author>
						<author>
							<persName><forename type="first">Alessandro</forename><surname>Guazzo</surname></persName>
							<email>guazzoales@dei.unipd.it</email>
							<affiliation key="aff0">
								<orgName type="department">Department of Information Engineering</orgName>
								<orgName type="institution">University of Padova</orgName>
								<address>
									<settlement>Padova</settlement>
									<country key="IT">Italy</country>
								</address>
							</affiliation>
						</author>
						<author>
							<persName><forename type="first">Enrico</forename><surname>Longato</surname></persName>
							<email>enrico.longato@unipd.it</email>
							<affiliation key="aff0">
								<orgName type="department">Department of Information Engineering</orgName>
								<orgName type="institution">University of Padova</orgName>
								<address>
									<settlement>Padova</settlement>
									<country key="IT">Italy</country>
								</address>
							</affiliation>
						</author>
						<author>
							<persName><forename type="first">Erica</forename><surname>Tavazzi</surname></persName>
							<email>erica.tavazzi@unipd.it</email>
							<affiliation key="aff0">
								<orgName type="department">Department of Information Engineering</orgName>
								<orgName type="institution">University of Padova</orgName>
								<address>
									<settlement>Padova</settlement>
									<country key="IT">Italy</country>
								</address>
							</affiliation>
						</author>
						<author>
							<persName><forename type="first">Isotta</forename><surname>Trescato</surname></persName>
							<email>isotta.trescato@phd.unipd.it</email>
							<affiliation key="aff0">
								<orgName type="department">Department of Information Engineering</orgName>
								<orgName type="institution">University of Padova</orgName>
								<address>
									<settlement>Padova</settlement>
									<country key="IT">Italy</country>
								</address>
							</affiliation>
						</author>
						<author>
							<persName><forename type="first">Martina</forename><surname>Vettoretti</surname></persName>
							<email>martina.vettoretti@unipd.it</email>
							<affiliation key="aff0">
								<orgName type="department">Department of Information Engineering</orgName>
								<orgName type="institution">University of Padova</orgName>
								<address>
									<settlement>Padova</settlement>
									<country key="IT">Italy</country>
								</address>
							</affiliation>
						</author>
						<author>
							<persName><forename type="first">Barbara</forename><forename type="middle">Di</forename><surname>Camillo</surname></persName>
							<email>barbara.dicamillo@unipd.it</email>
							<affiliation key="aff0">
								<orgName type="department">Department of Information Engineering</orgName>
								<orgName type="institution">University of Padova</orgName>
								<address>
									<settlement>Padova</settlement>
									<country key="IT">Italy</country>
								</address>
							</affiliation>
							<affiliation key="aff1">
								<orgName type="department">Department of Comparative Biomedicine and Food Science</orgName>
								<orgName type="institution">University of Padova</orgName>
								<address>
									<settlement>Padova</settlement>
									<country key="IT">Italy</country>
								</address>
							</affiliation>
						</author>
						<title level="a" type="main">Using Wearable and Environmental Data to Improve the Prediction of Amyotrophic Lateral Sclerosis and Multiple Sclerosis Progression: an Explorative Study Notebook for the iDPP Lab on Intelligent Disease Progression Prediction at CLEF 2024</title>
					</analytic>
					<monogr>
						<idno type="ISSN">1613-0073</idno>
					</monogr>
					<idno type="MD5">261DFFD7BC52EF1CEA73DFB41C6DC206</idno>
				</biblStruct>
			</sourceDesc>
		</fileDesc>
		<encodingDesc>
			<appInfo>
				<application version="0.7.2" ident="GROBID" when="2025-04-23T17:57+0000">
					<desc>GROBID - A machine learning software for extracting information from scholarly documents</desc>
					<ref target="https://github.com/kermitt2/grobid"/>
				</application>
			</appInfo>
		</encodingDesc>
		<profileDesc>
			<textClass>
				<keywords>
					<term>Amyotrophic Lateral Sclerosis, Multiple Sclerosis, Logistic Regression, Ridge Regression, Random Forest, Wearable Data, Environmental Data (B. D. Camillo) 0009-0007-2445-5762 (E. Marinello)</term>
					<term>0000-0001-5155-2567 (A. Guazzo)</term>
					<term>0000-0001-5940-645X (E. Longato)</term>
					<term>0000-0001-6188-6413 (E. Tavazzi)</term>
					<term>0000-0003-0625-993X (I. Trescato)</term>
					<term>0000-0002-5020-1818 (M. Vettoretti)</term>
					<term>0000-0001-8415-4688 (B. D. Camillo)</term>
				</keywords>
			</textClass>
			<abstract>
<div xmlns="http://www.tei-c.org/ns/1.0"><p>Amyotrophic Lateral Sclerosis (ALS) and Multiple Sclerosis (MS) are chronic diseases with a severe impact on patients' lives. Both diseases create significant psychological and economic burdens due to alternating acute phases requiring hospital and home care. One possible solution could be the employment of sensor data to develop predictive models that can assist clinicians in making treatment and therapeutic decisions. In the context of the iDPP@CLEF 2024 challenge, this work aims to develop and compare different machine-learning approaches for predicting the Amyotrophic Lateral Sclerosis Functional Rating Scale-Revised (ALSFRS-R) scores in ALS patients, and relapses in MS patients, using wearable and environmental data, respectively. Specifically, the analysis focuses on the impact of these data and seeks to determine whether their incorporation enhances predictive performance. The results showed that there is indeed an improvement in the models' performance when sensor data are considered, in both the disease. In particular, in the case of ALS the Root Mean Square Error (RMSE) range, over the predicted twelve ALSFRS-R score, improved from [0.463-0.733] to [0.286-0.582] when incorporating the wearable data, as well as in the case of MS, where the inclusion of environmental data has improved the prediction of relapse, with the RMSE decreasing from 72.992 to 69.564.</p></div>
			</abstract>
		</profileDesc>
	</teiHeader>
	<text xml:lang="en">
		<body>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="1.">Introduction</head><p>Amyotrophic Lateral Sclerosis (ALS) and Multiple Sclerosis (MS) are chronic neurodegenerative diseases. ALS affects the motor neurons, causing progressive degeneration of nerve cells in the spinal cord and brain, leading to an average life expectancy of three to five years <ref type="bibr" target="#b0">[1]</ref>. ALS symptoms usually are primarily related to weakness in the upper and lower limbs, or slurred speech and difficulty in swallowing <ref type="bibr" target="#b1">[2]</ref>. On the other hand, MS affects the myelinated axons in the central nervous system, causing damage to both the myelin and the axons to varying degrees. The progression of MS is highly variable and unpredictable, with the most common phenotype being relapsing-remitting: a progression pattern characterized by periods of exacerbations of the symptoms, called relapse, alternated with more stable periods <ref type="bibr" target="#b2">[3]</ref>.</p><p>Given the heterogeneous and unpredictable nature of these diseases, patients end up alternating periods in the hospital and at home, while dealing with the uncertainty of how long each acute or stable phase will last <ref type="bibr" target="#b3">[4]</ref>. This can represent a psychological and economic burden for both patients and caregivers. Clinicians, on their part, would welcome tools that can assist them throughout all stages of patient treatment by offering personalized therapeutic recommendations and identifying when urgent interventions are necessary. Predictive tools can indeed be powerful in predicting the progression of ALS disability and the occurrence of relapses in MS.</p><p>In the context of the iDPP@CLEF 2024 challenge, participants were asked to predict the progression of the ALS patients' disability status using prospective data, and predict the occurrence of relapses for MS patients by exploiting environmental and MS-specific retrospective data <ref type="bibr" target="#b4">[5,</ref><ref type="bibr" target="#b5">6]</ref>. The Challenge consisted of three tasks, described in the following sections: Section 1.1 and 1.2 refer to Task 1 and Task 2, respectively, while Section 1.3 refers to Task 3.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="1.1.">Task 1: ALS Disability Score from Wearable Data</head><p>Task 1 focused on using data collected through wearable devices to predict the patient's disability status measured by the twelve scores of the revised ALS functional rating scale (ALSFRS-R) <ref type="bibr" target="#b6">[7]</ref>. These ALSFRS-R scores were assigned by medical doctors during routine visits scheduled every three months. The goal of this task was to determine whether the ALSFRS-R scores assigned by clinical experts could be reliably predicted from wearable data.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="1.2.">Task 2: ALS Patient Self-assessment Score from Wearable Data</head><p>Similarly to Task 1, Task 2 consisted of the use of data collected through wearable devices, to predict the patient's disability status, measured by the ALSFRS-R scores. In this case, the scores were self-assessed by patients via an auto-evaluation questionnaire delivered through an app once a month. The goal was to determine whether the ALSFRS-R scores obtained from self-assessment questionnaires could be reliably predicted from wearable data.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="1.3.">Task 3: Relapse from EDDS Sub-scores and Environmental Data</head><p>Task 3 considered the prediction of an MS relapse using environmental data and Expanded Disability Status Scale subscores (EDSS) <ref type="bibr" target="#b7">[8]</ref>. The goal of this task was to explore whether exposure to different pollutants can be considered a useful variable in predicting the occurrence of relapses in MS patients.</p><p>To address the proposed problems, a broad set of predictive models based on different methodological approaches were trained using different subsets of the variables, provided by the challenge organizers. This study aimed to evaluate whether considering wearable data to predict ALS disability and environmental data to predict MS relapses leads to better performance with respect to models that only consider disease-specific variables collected during routine visits. To ensure consistency, all models were trained using a common framework including feature selection (via backward elimination), and hyperparameter optimization (via random search). The results suggest that collecting data from wearable devices can improve the prediction of ALS disability status. However, patients must be properly trained to use the sensors correctly. Similarly, environmental data can be beneficial for predicting the progression of MS by identifying the occurrence of relapses, focusing mainly on sensor data recorded a few days before the relapse.</p><p>The paper is organized as follows: Section 2 introduces related works and the main methodological approaches implemented until now to address ALS and MS progression prediction. Section 3 describes the methodologies employed in this study in terms of data processing and the machine-learning techniques used. Section 4 discusses the obtained results and, finally, Section 5 summarizes the key take home messages of this work.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="2.">Related Work</head><p>Different approaches have been proposed in the literature to predict the prognosis of ALS and MS patients. For both of the diseases, prediction tasks frequently employ a variety of machine-learning methodologies, with classification and regression being the most common approaches. The choice between these methods typically depends on the specific research question and the chosen outcome <ref type="bibr" target="#b8">[9]</ref>.</p><p>Regarding ALS prognosis, most studies aimed to estimate changes in the ALSFRS-R over time <ref type="bibr" target="#b9">[10,</ref><ref type="bibr" target="#b10">11,</ref><ref type="bibr" target="#b11">12,</ref><ref type="bibr" target="#b12">13,</ref><ref type="bibr" target="#b13">14]</ref>. Different studies classified patients by disease progression rates (e.g., Slow/Fast, Low/High) <ref type="bibr" target="#b14">[15,</ref><ref type="bibr" target="#b15">16,</ref><ref type="bibr" target="#b16">17]</ref>, while others have developed a model to predict when a patient will need Non-Invasive Ventilation (NIV) support within a given time window <ref type="bibr" target="#b17">[18,</ref><ref type="bibr" target="#b18">19,</ref><ref type="bibr" target="#b19">20]</ref>. Relevant biomarkers for prediction include BMI, Forced Vital Capacity (FVC), age at onset, and disease duration, as well as longitudinal data (e.g., slope, minimum, maximum, mean, standard deviation) <ref type="bibr" target="#b9">[10]</ref>. Magnetic resonance imaging (MRI) has also shown a significant impact on prediction, alongside these clinical variables <ref type="bibr" target="#b20">[21]</ref>. Regression models include Random Forest (RF) regressor and generalized boosting models <ref type="bibr" target="#b17">[18,</ref><ref type="bibr" target="#b21">22]</ref>. Recently, also graphical modeling techniques such as Dynamic Bayesian Networks (DBN) have been employed to model ALS disease progression <ref type="bibr" target="#b22">[23]</ref>. Classification models included Support Vector Machine (SVM) <ref type="bibr" target="#b15">[16]</ref>, and RF classifier <ref type="bibr" target="#b14">[15]</ref>.</p><p>On the other hand, most of the models related to MS prognosis considered as outcomes the occurrence of relapses <ref type="bibr" target="#b23">[24,</ref><ref type="bibr" target="#b24">25]</ref> and the evolution over time of the EDSS <ref type="bibr" target="#b25">[26,</ref><ref type="bibr" target="#b26">27,</ref><ref type="bibr" target="#b27">28,</ref><ref type="bibr" target="#b28">29]</ref>. The models most commonly used for classification were Logistic Regression (LR) and SVM <ref type="bibr" target="#b29">[30]</ref>, while for regression, the most popular technique was Linear Regression <ref type="bibr" target="#b30">[31]</ref>. Demographic (including age and sex), clinical, MRI (such as T2 lesion volume or number and brain atrophy), cerebrospinal fluid, and electrophysiology variables were retained as predictors in the models studied in the literature <ref type="bibr" target="#b30">[31]</ref>.</p><p>In general, for both ALS and MS, the inclusion of wearable and environmental data, respectively, in literature models is limited <ref type="bibr" target="#b31">[32,</ref><ref type="bibr" target="#b32">33]</ref>. Typically, studies focus on defining a baseline, where data are collected, and then developing a model based on this baseline to provide predictions for future outcomes <ref type="bibr" target="#b33">[34,</ref><ref type="bibr" target="#b34">35]</ref>. The main limitation of this approach is that it does not thoroughly exploit the dynamic aspect of the disease described by the full temporal evolution of data sequences, conversely to what is extensively investigated within the scope of the Challenge.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="3.">Methodology</head><p>A common data processing was performed for Task 1 and Task 2 involving ALS data, instead, the data processing for Task 3, which considered MS data, was slightly different. Then, a single model-training framework was considered for all methodological approaches across the three tasks. The following sections describe: the data processing steps needed to obtain the final set of input variables for Tasks 1, 2 (Section 3.1.1), and 3 (Section 3.1.2); the training framework used to develop the models (Section 3.2); and the description of the submitted runs (Section 3.4).</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="3.1.">Data Processing</head></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="3.1.1.">ALS Data Processing (Tasks 1 and 2)</head><p>The structure of the datasets provided for Task 1 and 2 was identical. The main difference between the data provided for these tasks lay in how ALSFRS-R scores were collected. In fact, for Task 1 ALSFRS-R scores were assigned by clinicians during routine visits performed more or less every three months. Instead, for Task 2, ALSFRS-R scores were self-assigned by the patients via a questionnaire delivered periodically (∼ once a month) through the BRAINTEASER app. Hence, the same processing pipeline was adopted for these two tasks.</p><p>Six static variables evaluated at the first visit were available, namely: sex, diagnostic delay, age at diagnosis, FVC, weight, and BMI. The only processing performed on these static variables concerned the sex variable which was mapped to a boolean variable equal to 0 for male patients and 1 for female patients.</p><p>All ALSFRS-R measurements collected for each patient were made available to participants despite the Task 1 and 2 goals being only the prediction of the ALSFRS-R subscores following the first visit (Task 1) or of the self-assessment score (Task 2). Hence, all available information was fully exploited to obtain a more rich and robust dataset. Specifically, each pair of consecutive ALSFRS-R subscores was considered as an independent entry characterized by the same static information of the patient they belonged to. The first set of ALSFRS-R subscores of each pair was used as input variables named start_Q*, where * represents the ALSFRS-R question number and ranges from 1 to 12. Instead, the second set of ALSFRS-R subscores of each pair were used as the target variables named end_Q*. The final sample size of data used to train models for the first task was of 131 entries (from 52 unique patients) and the one of data used to train models for the second task was of 163 entries (from 52 unique patients).</p><p>For each patient, 90 variables collected multiple times through wearable sensors were available. The processing of these variables consisted of the extraction of first-order descriptors (such as mean, first and last recorded values, and minimum and maximum values) considering all values recorded within a time window starting from the date of the start ALSFRS-R of the considered entry to the date of the end ALSFRS-R score of the same entry. The window length, expressed in days, was also included in the set of possible predictors. Moreover, the slopes of change of the following variables were also considered: total_calories, total_steps, spo2_av, heart_rate_mean, heart_rate_baseline. The slope of change was obtained as the angular coefficient of a linear fit of all recorded values for each variable within the considered time window.</p><p>To build the training set, it was instrumental to consider ALSFRS-R pairs collected after the first visit, in order to obtain a robust and rich set of variables extracted from wearable data. The richness and quality of such data tend to improve over time as the patient learns how to properly use, and becomes more familiar with, the device provided at the first visit.</p><p>After this first processing step, 487 variables were available for each entry in the dataset. Specifically, one variable for the unique patient identifier, one variable for the window length expressed in days, 12 variables for the start ALSFRS-R scores, 12 target variables for the ALSFRS-R scores to be used as outcomes, 90 * 5 = 450 variables for the first-order descriptors of the 90 wearable sensor variables, 5 variables for the considered slopes of change, and the 6 static variables.</p><p>From this full set of variables, those with more than 50% missing values and those that were almost constant (auto-correlation coefficient &gt; 0.9) were removed. Finally, collinear variables were removed by iteratively excluding those with a correlation coefficient &gt; 0.9. After this step, 131 out of 487 variables were considered for Task 1, and 134 out of 487 variables were considered for Task 2.</p><p>Then, normalization was performed to avoid introducing bias related to the different dynamic ranges of each variable and to promote consistency between the scale of the coefficients that might be estimated during model training. Specifically, min-max scaling was used and the normalization parameters were derived considering only the whole training set and applied to the test set.</p><p>Finally, the imputation of missing values in the processed input variables was performed using the mice R package <ref type="bibr" target="#b35">[36]</ref>. Also for the imputation, parameters were estimated on the whole training set and applied to the test set.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="3.1.2.">MS Data Processing (Task 3)</head><p>The processing concept for Task 3 was similar to the one proposed for Task 1 and 2 but had to be adapted considering the different structure of data available for this task.</p><p>Fifteen static variables evaluated at the first visit were available. Five variables were related to demographic information, five variables were related to MS diagnosis, and five variables were related to symptoms. The sex variable was mapped to a boolean variable equal to 0 if the patient was male and 1 if female. The variable centre was mapped to a boolean variable equal to 0 if the patient was followed at the clinic in Pavia and 1 if at the clinic in Turin. The variable residence classification consisted of three possible levels: cities, towns, and rural area. This variable was mapped to two dummy variables: residence_city and residence_rural_area. The variable ethnicity was excluded as almost all patients were caucasian. Two variables related to diagnosis criteria were excluded as almost all patients were diagnosed according to the same criterion. After these steps, 12 static variables remained.</p><p>Multiple EDSS recordings were also available from the baseline date to the date of the first relapse.</p><p>Hence, first-order descriptors were extracted also for the EDSS value considering all measurements within this time window.</p><p>For each patient, a set of 20 environmental measurements related to pollutant levels and meteorological indicators were available. Such measurements were available both before and after the baseline. Hence, similarly to what was done for wearable sensor data in Tasks 1 and 2, a set of first-order descriptors (such as mean, first and last recorded values, and minimum and maximum values) was extracted for each variable considering all values recorded within two time windows. The first time window started at the date of the first available environmental measure and ended at the baseline date. The second time window, instead, started at the baseline date and ended at the first recorded relapse date.</p><p>After this first processing step, 219 variables were available for each patient in the dataset. Specifically, one variable for the unique patient identifier, one target variable for the relapse week to be used as the outcome, 20*5 = 100 variables for the first-order descriptors of the 20 environmental variables measured before the baseline, 20*5 = 100 variables for the first-order descriptors of the 20 environmental variables measured after the baseline, 5 variables for the first-order descriptors of the EDSS measurements, and the 12 static variables.</p><p>From this full set of variables, those with more than 50% missing values and those that are almost constant (auto-correlation coefficient &gt; 0.9) were removed. Finally, collinear variables were removed by iteratively excluding those with a correlation coefficient &gt; 0.9. After this step, 69 out of 219 variables were considered for Task 3. Two patients were also excluded as almost all their variables were missing, hence, 197 unique patients were considered to train the MS models.</p><p>Following what was done for the previous tasks, normalization was performed via min-max scaling and the imputation of missing values in the processed input variables was performed using the mice R package.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="3.2.">Model Training and Evaluation</head><p>In Tasks 1 and 2, the prediction targets were the 12 ALSFRS-R scores evaluated, respectively by the clinician and the patients themselves. Each score must be predicted independently and it was an integer within the range [0-4]. Intuitively, this problem can be cast as a multiclass classification with five classes. However, it can also be framed as a regression problem by modifying the model output by rounding it to the nearest integer. Instead, in Task 3, the goal was to predict the week of the first relapse occurrence after the baseline, and, as the weeks are not within a finite range, this can only be approached as a regression problem. However, as the challenge submission rules require an integer value also for the predicted relapse week, the output of regression models developed for Task 3 was rounded to the nearest integer as well.</p><p>The core of the model training framework involved the Backward Feature Selection technique <ref type="bibr" target="#b36">[37]</ref> and the model's performances were evaluated through the Root Mean Squared Error score <ref type="bibr" target="#b37">[38]</ref>. The process started with all the features and iteratively they were removed one by one. At each iteration, for every feature combination, hyperparameter tuning was performed via random search over a given hyperparameter grid <ref type="bibr" target="#b38">[39]</ref>, using a 5-fold cross-validation (CV). The subset of features that resulted in the lowest RMSE score, was then chosen to train a final model. Its hyperparameters were optimized again using 5-fold CV and random search within the same hyperparameter space. Ultimately, this optimized model was tested on an independent test set, and the results were submitted to the challenge organizers for performance evaluation.</p><p>This model training framework was designed to be flexibile, allowing its application across the three different tasks with a variety of methodological approaches. The approaches considered in this study included both linear models (LR and ridge regression), as well as non-linear models (RF). For each of these models, different sets of hyperparameters were tested. For the LR, a single hyperparameter needs optimization: the strength of the regularization applied to the model, C. Similarly, for the ridge regression, the only hyperparameter that needs optimization is the strength of the L2 regularisation, 𝛼. Both C and 𝛼 were randomly sampled from 250 values in a log-uniform distribution with support [10 -4  -10 4 ]. Finally, the RF's hyperparameter space consisted of two hyperparameters: the number of trees in each RF, which was uniformly sampled in the interval [50 -500], and the maximum depth of each tree, which was uniformly sampled in the interval <ref type="bibr">[1 -100]</ref>). By default, the square root of the total number of features was evaluated at each node for splitting.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="3.3.">Considered Subsets of Input Variables</head><p>To evaluate whether considering wearable data to predict ALS disability and environmental data to predict MS relapses led to better performance with respect to models that only consider disease-specific variables collected during routine visits, different sets of variables were considered as input for the predictive models. Hence, for Tasks 1 and 2, the target ALSFRS-R value (e.g., end_Q1, see Section 3.1.1) was first predicted by simply holding the corresponding initial ALSFRS-R evaluation (e.g., start_Q1 see Section 3.1.1). The idea behind this approach is to provide a baseline reference point that does not involve any particular prediction model. Then, to provide a slightly more complex benchmark approach, a LR model was trained using only the 12 initial ALSFRS-R scores (e.g., all start_Q*) as possible input variables. The idea behind this second set of considered features is to assess whether considering scores from other ALSFRS-R questions leads to a more accurate prediction of the target ALSFRS-R score with respect to the one obtained by simply holding its initial value. Finally, different models were trained using all available variables (i.e., static, ALSFRS-R, and wearable data) to evaluate whether models developed including also data collected through wearable devices led to better performance with respect to the one developed using only the initial ALSFRS-R scores. The models included LR, ridge regression, RF regressor, and RF classifier.</p><p>Similarly, for Task 3, first, a ridge model was trained considering as possible input only static and EDSS variables. Then, a ridge and an RF regressor were trained after including environmental-derived variables in the pool of possible predictors. The idea behind this approach was to check whether including environmental data could improve the first-relapse-week prediction with respect to models that only consider data collected at the first visit and EDSS evaluations.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="3.4.">Description of Submitted Runs</head><p>The following runs were submitted for Tasks 1 and 2:</p><p>• Logistic regression (logistic): LR model with multiclass outcome. All available variables were considered in the pool of possible predictors. Each question was predicted with its independent model trained specifically for that question. • Logistic regression considering only ALSFRS-R scores (logistic_ALSFRS): LR model with multiclass outcome. Only start_Q* variables were considered in the pool of possible predictors. Each question was predicted with its independent model trained specifically for that question. • Random Forest classifier (rf): RF classifier with multiclass outcome. All available variables were considered in the pool of possible predictors. Each question was predicted with its independent model trained specifically for that question. • Ridge regression (ridge): Ridge regression model. All available variables were considered in the pool of possible predictors. Each question was predicted with its independent model trained specifically for that question. • Random Forest regressor (rf_reg): RF regressor model. All available variables were considered in the pool of possible predictors. Each question was predicted with its independent model trained specifically for that question. • hold: Each question was predicted by holding its starting value (i.e., considering the start_Q* variables as predicted end_Q* targets) • average: Each predicted score was obtained as the average output of the LR, RF classifier, ridge, and RF regressor models rounded to the nearest integer (i.e., column-wise average rounded to the nearest integer of logistic, rf, ridge, and rf_reg runs). • optrun: Each question was predicted with the best-performing model for that question (i.e., the one highlighted in bold in Table <ref type="table" target="#tab_2">1 and 3</ref>).</p><p>The following runs were submitted for Task 3:</p><p>• Ridge regression (ridge): Ridge regression model. All available variables were considered in the pool of possible predictors. • Ridge regression without considering environmental data (ridge_noenv): Ridge regression model. Environmental variables were excluded from the pool of possible predictors. • Random Forest regressor (rf_reg): RF regressor model. All available variables were considered in the pool of possible predictors. • average: Each predicted first relapse week was obtained as the average output of the ridge and RF regressor models rounded to the nearest integer (i.e., column-wise average rounded to the nearest integer of ridge and rf_reg runs).</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="4.">Results</head><p>The results for the three tasks are reported in the sections below. For Tasks 1 and 2, the results for ALSFRS-R scores prediction are reported in Section 4.1 and Section 4.2, respectively. For Task 3, the results for the week of the occurrence of the first relapse are reported in Section 4.3.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="4.1.">Task 1 Results</head><p>Table <ref type="table" target="#tab_0">1</ref> presents the CV results for Task 1. Each column represents one of the predicted ALSFRS-R scores (Q1 -Q12), while the rows indicate the considered models. Each cell displays the average CV RMSE. RMSE values highlighted in bold represent the lowest value of each column, thus indicating the best-performing model for each predicted question. The ridge model was the best-performing one for six out of twelve scores (Q1, Q4, Q6, Q7, Q11, Q12), with RMSE values ranging between 0.228 for Q1 and 0.570 for Q7. The LR model, when considering all available variables, also showed reliable performance, achieving the best prediction for four out of twelve scores (Q2, Q3, Q9, Q10). Its RMSE values ranged from 0.286 for Q2 to 0.582 for Q9. Conversely, the RF regressor yielded the best predictions for Q5 and Q8, with RMSE scores of 0.508 and 0.479, respectively. Finally, the hold approach and RF classifier were the worst-performing among all the models. Additionally, the LR model using only the ALSFRS-R score did not perform well, suggesting that performance improved when wearable data was added. In general, it is possible to observe that adding first all the ASLFRS-R scores, and consequentially all the other sensor variables, increased the performance in the cross-validation phase, leading to lower RMSE values.</p><p>Table <ref type="table" target="#tab_1">2</ref> shows the results of Task 1 submitted runs as evaluated by the challenge organizers. The name of the submitted run is reported in the first column of Table <ref type="table" target="#tab_1">2</ref>. Then, columns two and three of Table <ref type="table" target="#tab_1">2</ref> show the two metrics used by the organizers to evaluate participants' submitted runs on the independent test set: RMSE and Mean Absolute Error (MAE), respectively.</p><p>Results observed in CV were not confirmed on the test set, with the best-performing model being the hold method (RMSE = 0.491, MAE = 0.202) and the LR using all available variables yielding the worst result (RMSE = 0.830, MAE = 0.511). One possible explanation could be that the training set is more robust compared to the test set, since it includes data from later visits, while the test set only contains data from the initial visits. Therefore, these results are likely due to insufficient data collection during the initial visits when patients either have not started using the wearable devices or are still becoming familiar with how to use them. </p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="4.2.">Task 2 Results</head><p>Table <ref type="table" target="#tab_2">3</ref> presents the CV results for Task 2. Each column represents one of the predicted ALSFRS-R scores (Q1 -Q12), while the rows indicate the considered models. Each cell displays the average CV RMSE. RMSE values highlighted in bold represent the lowest value of each column, thus indicating the best-performing model for each predicted question. In this task, the LR model, when considering all available variables, achieved the best results for seven out of twelve scores (Q2, Q3, Q5, Q7, Q10, Q11, Q12), with RMSE values ranging between 0.139 for Q3 and 0.595 for Q10. The ridge regression, also showed good performance compared to other models, achieving the best prediction for four out of twelve scores (Q1, Q4, Q6, Q9). Its RMSE values ranged from 0.292 for Q1 to 0.449 for Q6. Conversely, the RF regressor yielded the best prediction only for Q8 with an RMSE of 0.372. Finally, the hold and RF classifier performed the worst among all the models. In general, it is possible to observe that adding first all the ASLFRS-R scores, and then all the other sensor variables, led to a performance increase in the CV phase, resulting in lower RMSE values.</p><p>Table <ref type="table" target="#tab_1">2</ref> shows the results of Task 2 submitted runs as evaluated by the challenge organizers. The name of the submitted run is reported in the first column of Table <ref type="table" target="#tab_1">2</ref>. Then, columns two and three of Table <ref type="table" target="#tab_1">2</ref> show the two metrics used by the organizers to evaluate participants' submitted runs on the independent test set: RMSE and MAE, respectively.</p><p>Results observed in CV were not confirmed on the test set also for this second task, with the bestperforming model being once again the hold method (RMSE = 0.577, MAE = 0.287) and the LR with wearable data available yielding the worst results on the test set (RMSE = 0.9930, MAE = 0.659). These results are in line with those observed in Task 1. Additionally, the scores assigned during this period are based on self-evaluation, which may further impact the accuracy of the data.</p><p>Overall, in this task, the RMSE values were lower than those obtained in Task 1, especially for the hold method. This improvement may be attributed to the fact that clinicians are able to better assign ALSFRS-R scores during visits, resulting in greater variability which leads to a more challenging prediction task. Instead, patients are typically more conservative and tend to assign similar scores between questionnaires. This leads to less variability, which makes the prediction task slightly easier, especially for the hold method. </p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="4.3.">Task 3 Results</head><p>Table <ref type="table" target="#tab_4">5</ref> reports the CV results for Task 3. Each row shows a considered model and its corresponding CV RMSE. The RMSE value highlighted in bold represents the lowest score, indicating the best-performing approach.</p><p>The ridge regression with environmental data performed best among others, with an RMSE equal to 69.564. However, in the independent test set, the best performance was achieved without including environmental variables as evidenced in Table <ref type="table" target="#tab_5">6</ref>.</p><p>In Task 3, the RMSE is very high, indicating low precision in predicting the relapse week. During the training phase, incorporating environmental data helped achieve better results. However, in the test phase, the performance was better without the environmental data. This discrepancy is likely due to the presence of significant sequences of missing data that needed to be imputed, as there are long intervals between visits in both the MS training and test sets. </p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="5.">Conclusions and Future Work</head><p>This study aimed at addressing the three tasks proposed within the iDPP@CLEF 2024 challenge, while also evaluating whether the inclusion of sensor and environmental data helps in improving prediction of ALS and MS progression. The challenge consisted of three different tasks. In Task 1 and Task 2, the goal was to predict the ALSFRS-R scores, assigned, respectively, by clinicians and by the patients themselves. Instead, Task 3 consisted of predicting the week of the first relapse for MS patients. A flexible training workflow was developed in order to evaluate different methodological approaches and different subsets of input variables under a common, robust training workflow. For Task 1 and Task 2, both classification and regression approaches were explored, namely: LR, ridge regression, RF regressor and RF classifier. In Task 3, only regression models were considered due to the different nature of this task, namely: ridge regression and RF regressor.</p><p>In the first two tasks, classification approaches were able to better capture the ALSFRS-R scores variability among the five classes. Instead, the regression approach tended to frequently predict the mean value within the range [0-4]. Moreover, in these tasks, the best CV results were achieved by the ridge regression and LR when including variables derived from wearable devices. On the contrary, when evaluating the models on the independent test sets, the best results were obtained by the hold method. The robustness of the results during CV can be attributed to the nature of the training set, which includes data from all visits. This results in a richer, more complete, and robust dataset characterized by a more refined wearable data collection process with respect to the test set which included only the first couple of visits when patients are still getting familiar with the data collection process and the BRAINTEASER app. Hence, the test data were more noisy and sparse.</p><p>In Task 3, the best CV results were achieved by the ridge model incorporating the environmental data. On the contrary, in the independent test set the best performance was obtained by the ridge model without considering the environmental data. This weak result for this task could be attributed to the not properly optimized variable creation process which was designed for the first two tasks and directly applied also in the third task. One possible solution could be to consider dynamic variables instead of computing first-order descriptors, given the long periods between visits, and consequently employ models that account for these dynamic data.</p><p>In conclusion, the developed models performed well within the iDPP@CLEF 2024 challenge, while contributing to raise important considerations that go beyond the competition itself. In fact, Tasks 1 and 2 results suggest that collecting wearable data can be a viable path to follow in order to improve the prediction of ALS disability status. However, a key condition that must be respected in order to benefit from the inclusion of these data, is that patients must be properly informed, trained, and followed in order to obtain rich and high-quality data over long periods of time. Otherwise, it might be more effective to rely on data that are commonly collected during routine visits of ALS patients. On the other hand, regarding MS, since the given environmental data and observations have been measured also after the relapse that needed to be predicted, it would be more effective to focus only on the environmental pollutants measured a few days before the relapse, as also confirmed by the literature <ref type="bibr" target="#b39">[40]</ref>.</p></div><figure xmlns="http://www.tei-c.org/ns/1.0" type="table" xml:id="tab_0"><head>Table 1</head><label>1</label><figDesc>CV RMSE values for methods considered in Task 1. Each column represents an ALSFRS-R question. The minimum values of each column are highlighted in bold.</figDesc><table><row><cell>Model</cell><cell>Q1</cell><cell>Q2</cell><cell>Q3</cell><cell>Q4</cell><cell>Q5</cell><cell>Q6</cell><cell>Q7</cell><cell>Q8</cell><cell>Q9</cell><cell>Q10</cell><cell>Q11</cell><cell>Q12</cell></row><row><cell>LR</cell><cell cols="12">0.395 0.286 0.288 0.526 0.522 0.606 0.604 0.568 0.582 0.243 0.393 0.504</cell></row><row><cell cols="13">LR ALSFRS only 0.463 0.456 0.438 0.568 0.583 0.700 0.733 0.640 0.805 0.507 0.470 0.548</cell></row><row><cell>Ridge</cell><cell cols="12">0.228 0.351 0.302 0.495 0.533 0.493 0.570 0.532 0.676 0.318 0.389 0.439</cell></row><row><cell>RF classifier</cell><cell cols="12">0.416 0.379 0.386 0.591 0.564 0.580 0.636 0.589 0.619 0.461 0.471 0.557</cell></row><row><cell>RF regressor</cell><cell cols="12">0.443 0.370 0.397 0.512 0.508 0.561 0.621 0.479 0.648 0.455 0.457 0.511</cell></row><row><cell>Hold</cell><cell cols="12">0.531 0.479 0.471 0.665 0.710 0.796 0.762 0.654 0.856 0.553 0.546 0.630</cell></row></table></figure>
<figure xmlns="http://www.tei-c.org/ns/1.0" type="table" xml:id="tab_1"><head>Table 2</head><label>2</label><figDesc>Runs RMSE and MAE values for methods considered in Task 1. The minimum values are highlighted in bold.</figDesc><table><row><cell>Runs</cell><cell cols="2">RMSE MAE</cell></row><row><cell>logistic</cell><cell>0.830</cell><cell>0.511</cell></row><row><cell>logistic_ALSFRS</cell><cell>0.636</cell><cell>0.341</cell></row><row><cell>ridge</cell><cell>0.687</cell><cell>0.392</cell></row><row><cell>rf</cell><cell>0.650</cell><cell>0.361</cell></row><row><cell>rf_reg</cell><cell>0.636</cell><cell>0.373</cell></row><row><cell>hold</cell><cell cols="2">0.491 0.202</cell></row><row><cell>average</cell><cell>0.596</cell><cell>0.333</cell></row><row><cell>optrun</cell><cell>0.707</cell><cell>0.412</cell></row></table></figure>
<figure xmlns="http://www.tei-c.org/ns/1.0" type="table" xml:id="tab_2"><head>Table 3</head><label>3</label><figDesc>CV RMSE values for methods considered in Task 2. Each column represents an ALSFRS-R question. The minimum values of each column are highlighted in bold.</figDesc><table><row><cell>Model</cell><cell>Q1</cell><cell>Q2</cell><cell>Q3</cell><cell>Q4</cell><cell>Q5</cell><cell>Q6</cell><cell>Q7</cell><cell>Q8</cell><cell>Q9</cell><cell>Q10</cell><cell>Q11</cell><cell>Q12</cell></row><row><cell>LR</cell><cell cols="12">0.360 0.453 0.139 0.466 0.525 0.497 0.412 0.447 0.452 0.595 0.414 0.263</cell></row><row><cell cols="13">LR ALSFRS Only 0.399 0.551 0.291 0.513 0.621 0.620 0.565 0.454 0.606 0.738 0.553 0.309</cell></row><row><cell>Ridge</cell><cell cols="12">0.292 0.500 0.219 0.437 0.535 0.449 0.437 0.378 0.381 0.701 0.702 0.358</cell></row><row><cell>RF classifier</cell><cell cols="12">0.357 0.490 0.223 0.481 0.565 0.531 0.465 0.412 0.418 0.688 0.769 0.347</cell></row><row><cell>RF regressor</cell><cell cols="12">0.367 0.513 0.280 0.497 0.525 0.567 0.488 0.372 0.492 0.638 0.680 0.345</cell></row><row><cell>Hold</cell><cell cols="12">0.384 0.701 0.313 0.514 0.631 0.597 0.612 0.525 0.602 0.821 0.917 0.450</cell></row></table></figure>
<figure xmlns="http://www.tei-c.org/ns/1.0" type="table" xml:id="tab_3"><head>Table 4</head><label>4</label><figDesc>Runs RMSE and MAE values for methods considered in Task 2. The minimum values are highlighted in bold.</figDesc><table><row><cell>Runs</cell><cell cols="2">RMSE MAE</cell></row><row><cell>logistic</cell><cell>0.993</cell><cell>0.659</cell></row><row><cell>logistic_ALSFRS</cell><cell>0.854</cell><cell>0.500</cell></row><row><cell>ridge</cell><cell>0.850</cell><cell>0.545</cell></row><row><cell>rf</cell><cell>0.778</cell><cell>0.515</cell></row><row><cell>rf_reg</cell><cell>0.818</cell><cell>0.515</cell></row><row><cell>hold</cell><cell>0.577</cell><cell>0.287</cell></row><row><cell>average</cell><cell>0.783</cell><cell>0.493</cell></row><row><cell>optrun</cell><cell>0.962</cell><cell>0.606</cell></row></table></figure>
<figure xmlns="http://www.tei-c.org/ns/1.0" type="table" xml:id="tab_4"><head>Table 5</head><label>5</label><figDesc>CV RMSE values for methods considered in Task 3. The minimum value is highlighted in bold.</figDesc><table><row><cell>Model</cell><cell>RMSE</cell></row><row><cell>Ridge</cell><cell>69.564</cell></row><row><cell cols="2">Ridge without environmental data 72.992</cell></row><row><cell>RF regressor</cell><cell>74.972</cell></row><row><cell>Average</cell><cell>82.702</cell></row></table></figure>
<figure xmlns="http://www.tei-c.org/ns/1.0" type="table" xml:id="tab_5"><head>Table 6</head><label>6</label><figDesc>Runs RMSE and MAE values for methods considered in Task 3. The minimum values are highlighted in bold.</figDesc><table><row><cell>Runs</cell><cell cols="2">RMSE MAE</cell></row><row><cell>ridge</cell><cell>89.83</cell><cell>68.59</cell></row><row><cell cols="3">ridge_no_env 78.62 61.37</cell></row><row><cell>rf_reg</cell><cell>79.73</cell><cell>66.63</cell></row><row><cell>average</cell><cell>79.25</cell><cell>65.80</cell></row></table></figure>
		</body>
		<back>
			<div type="references">

				<listBibl>

<biblStruct xml:id="b0">
	<analytic>
		<title level="a" type="main">Amyotrophic lateral sclerosis</title>
		<author>
			<persName><forename type="first">M</forename><forename type="middle">C</forename><surname>Kiernan</surname></persName>
		</author>
		<author>
			<persName><forename type="first">S</forename><surname>Vucic</surname></persName>
		</author>
		<author>
			<persName><forename type="first">B</forename><forename type="middle">C</forename><surname>Cheah</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><forename type="middle">R</forename><surname>Turner</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A</forename><surname>Eisen</surname></persName>
		</author>
		<author>
			<persName><forename type="first">O</forename><surname>Hardiman</surname></persName>
		</author>
		<author>
			<persName><forename type="first">J</forename><forename type="middle">R</forename><surname>Burrell</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><forename type="middle">C</forename><surname>Zoing</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="j">The Lancet</title>
		<imprint>
			<biblScope unit="volume">377</biblScope>
			<biblScope unit="page" from="942" to="955" />
			<date type="published" when="2011">2011</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b1">
	<analytic>
		<title level="a" type="main">Amyotrophic lateral sclerosis</title>
		<author>
			<persName><forename type="first">L</forename><forename type="middle">P</forename><surname>Rowland</surname></persName>
		</author>
		<author>
			<persName><forename type="first">N</forename><forename type="middle">A</forename><surname>Shneider</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="j">New England Journal of Medicine</title>
		<imprint>
			<biblScope unit="volume">344</biblScope>
			<biblScope unit="page" from="1688" to="1700" />
			<date type="published" when="2001">2001</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b2">
	<monogr>
		<title level="m" type="main">Multiple sclerosis review, P &amp; T: a peer-reviewed journal for formulary management</title>
		<author>
			<persName><forename type="first">M</forename><surname>Goldenberg</surname></persName>
		</author>
		<imprint>
			<date type="published" when="2012">2012</date>
			<biblScope unit="volume">37</biblScope>
			<biblScope unit="page" from="175" to="184" />
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b3">
	<analytic>
		<title level="a" type="main">Care management in amyotrophic lateral sclerosis</title>
		<author>
			<persName><forename type="first">M.-H</forename><surname>Soriani</surname></persName>
		</author>
		<author>
			<persName><forename type="first">C</forename><surname>Desnuelle</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="j">Revue Neurologique</title>
		<imprint>
			<biblScope unit="volume">173</biblScope>
			<biblScope unit="page" from="288" to="299" />
			<date type="published" when="2017">2017</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b4">
	<analytic>
		<title level="a" type="main">Overview of idpp@clef 2024: The intelligent disease progression prediction challenge</title>
		<author>
			<persName><forename type="first">G</forename><surname>Birolo</surname></persName>
		</author>
		<author>
			<persName><forename type="first">P</forename><surname>Bosoni</surname></persName>
		</author>
		<author>
			<persName><forename type="first">G</forename><surname>Faggioli</surname></persName>
		</author>
		<author>
			<persName><forename type="first">H</forename><surname>Aidos</surname></persName>
		</author>
		<author>
			<persName><forename type="first">R</forename><surname>Bergamaschi</surname></persName>
		</author>
		<author>
			<persName><forename type="first">P</forename><surname>Cavalla</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A</forename><surname>Chiò</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A</forename><surname>Dagliati</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><surname>Carvalho</surname></persName>
		</author>
		<author>
			<persName><forename type="first">G</forename><forename type="middle">M D</forename><surname>Nunzio</surname></persName>
		</author>
		<author>
			<persName><forename type="first">P</forename><surname>Fariselli</surname></persName>
		</author>
		<author>
			<persName><forename type="first">J</forename><forename type="middle">M G</forename><surname>Dominguez</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><surname>Gromicho</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A</forename><surname>Guazzo</surname></persName>
		</author>
		<author>
			<persName><forename type="first">E</forename><surname>Longato</surname></persName>
		</author>
		<author>
			<persName><forename type="first">S</forename><forename type="middle">C</forename><surname>Madeira</surname></persName>
		</author>
		<author>
			<persName><forename type="first">U</forename><surname>Manera</surname></persName>
		</author>
		<author>
			<persName><forename type="first">S</forename><surname>Marchesin</surname></persName>
		</author>
		<author>
			<persName><forename type="first">L</forename><surname>Menotti</surname></persName>
		</author>
		<author>
			<persName><forename type="first">G</forename><surname>Silvello</surname></persName>
		</author>
		<author>
			<persName><forename type="first">E</forename><surname>Tavazzi</surname></persName>
		</author>
		<author>
			<persName><forename type="first">E</forename><surname>Tavazzi</surname></persName>
		</author>
		<author>
			<persName><forename type="first">I</forename><surname>Trescato</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><surname>Vettoretti</surname></persName>
		</author>
		<author>
			<persName><forename type="first">B</forename><forename type="middle">D</forename><surname>Camillo</surname></persName>
		</author>
		<author>
			<persName><forename type="first">N</forename><surname>Ferro</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="m">Working Notes of the Conference and Labs of the Evaluation Forum (CLEF 2024)</title>
		<title level="s">CEUR Workshop Proceedings</title>
		<meeting><address><addrLine>Grenoble, France</addrLine></address></meeting>
		<imprint>
			<date type="published" when="2024">2024</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b5">
	<analytic>
		<title level="a" type="main">Intelligent disease progression prediction: Overview of idpp@clef 2024</title>
		<author>
			<persName><forename type="first">G</forename><surname>Birolo</surname></persName>
		</author>
		<author>
			<persName><forename type="first">P</forename><surname>Bosoni</surname></persName>
		</author>
		<author>
			<persName><forename type="first">G</forename><surname>Faggioli</surname></persName>
		</author>
		<author>
			<persName><forename type="first">H</forename><surname>Aidos</surname></persName>
		</author>
		<author>
			<persName><forename type="first">R</forename><surname>Bergamaschi</surname></persName>
		</author>
		<author>
			<persName><forename type="first">P</forename><surname>Cavalla</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A</forename><surname>Chiò</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A</forename><surname>Dagliati</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><surname>Carvalho</surname></persName>
		</author>
		<author>
			<persName><forename type="first">G</forename><forename type="middle">M D</forename><surname>Nunzio</surname></persName>
		</author>
		<author>
			<persName><forename type="first">P</forename><surname>Fariselli</surname></persName>
		</author>
		<author>
			<persName><forename type="first">J</forename><forename type="middle">M G</forename><surname>Dominguez</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><surname>Gromicho</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A</forename><surname>Guazzo</surname></persName>
		</author>
		<author>
			<persName><forename type="first">E</forename><surname>Longato</surname></persName>
		</author>
		<author>
			<persName><forename type="first">S</forename><forename type="middle">C</forename><surname>Madeira</surname></persName>
		</author>
		<author>
			<persName><forename type="first">U</forename><surname>Manera</surname></persName>
		</author>
		<author>
			<persName><forename type="first">S</forename><surname>Marchesin</surname></persName>
		</author>
		<author>
			<persName><forename type="first">L</forename><surname>Menotti</surname></persName>
		</author>
		<author>
			<persName><forename type="first">G</forename><surname>Silvello</surname></persName>
		</author>
		<author>
			<persName><forename type="first">E</forename><surname>Tavazzi</surname></persName>
		</author>
		<author>
			<persName><forename type="first">E</forename><surname>Tavazzi</surname></persName>
		</author>
		<author>
			<persName><forename type="first">I</forename><surname>Trescato</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><surname>Vettoretti</surname></persName>
		</author>
		<author>
			<persName><forename type="first">B</forename><forename type="middle">D</forename><surname>Camillo</surname></persName>
		</author>
		<author>
			<persName><forename type="first">N</forename><surname>Ferro</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="m">Experimental IR Meets Multilinguality, Multimodality, and Interaction -15th International Conference of the CLEF Association, CLEF 2024</title>
		<title level="s">Lecture Notes in Computer Science</title>
		<meeting><address><addrLine>Grenoble, France</addrLine></address></meeting>
		<imprint>
			<publisher>Springer</publisher>
			<date type="published" when="2024">September 9th to 12th, 2024. 2024</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b6">
	<analytic>
		<title level="a" type="main">The alsfrs-r: a revised als functional rating scale that incorporates assessments of respiratory function</title>
		<author>
			<persName><forename type="first">J</forename><forename type="middle">M</forename><surname>Cedarbaum</surname></persName>
		</author>
		<author>
			<persName><forename type="first">N</forename><surname>Stambler</surname></persName>
		</author>
		<author>
			<persName><forename type="first">E</forename><surname>Malta</surname></persName>
		</author>
		<author>
			<persName><forename type="first">C</forename><surname>Fuller</surname></persName>
		</author>
		<author>
			<persName><forename type="first">D</forename><surname>Hilt</surname></persName>
		</author>
		<author>
			<persName><forename type="first">B</forename><surname>Thurmond</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A</forename><surname>Nakanishi</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="j">Journal of the Neurological Sciences</title>
		<imprint>
			<biblScope unit="volume">169</biblScope>
			<biblScope unit="page" from="13" to="21" />
			<date type="published" when="1999">1999</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b7">
	<analytic>
		<title level="a" type="main">Disability status and quality of life in multiple sclerosis: non-linearity of the expanded disability status scale (edss)</title>
		<author>
			<persName><forename type="first">S</forename><surname>Twork</surname></persName>
		</author>
		<author>
			<persName><forename type="first">S</forename><surname>Wiesmeth</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><surname>Spindler</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><surname>Wirtz</surname></persName>
		</author>
		<author>
			<persName><forename type="first">S</forename><surname>Schipper</surname></persName>
		</author>
		<author>
			<persName><forename type="first">D</forename><surname>Pöhlau</surname></persName>
		</author>
		<author>
			<persName><forename type="first">J</forename><surname>Klewer</surname></persName>
		</author>
		<author>
			<persName><forename type="first">J</forename><surname>Kugler</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="j">Health and Quality of Life Outcomes</title>
		<imprint>
			<biblScope unit="volume">8</biblScope>
			<date type="published" when="2010">2010</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b8">
	<analytic>
		<title level="a" type="main">Artificial intelligence and statistical methods for stratification and prediction of progression in amyotrophic lateral sclerosis: A systematic review</title>
		<author>
			<persName><forename type="first">E</forename><surname>Tavazzi</surname></persName>
		</author>
		<author>
			<persName><forename type="first">E</forename><surname>Longato</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><surname>Vettoretti</surname></persName>
		</author>
		<author>
			<persName><forename type="first">H</forename><surname>Aidos</surname></persName>
		</author>
		<author>
			<persName><forename type="first">I</forename><surname>Trescato</surname></persName>
		</author>
		<author>
			<persName><forename type="first">C</forename><surname>Roversi</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A</forename><forename type="middle">S</forename><surname>Martins</surname></persName>
		</author>
		<author>
			<persName><forename type="first">E</forename><forename type="middle">N</forename><surname>Castanho</surname></persName>
		</author>
		<author>
			<persName><forename type="first">R</forename><surname>Branco</surname></persName>
		</author>
		<author>
			<persName><forename type="first">D</forename><forename type="middle">F</forename><surname>Soares</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A</forename><surname>Guazzo</surname></persName>
		</author>
		<author>
			<persName><forename type="first">G</forename><surname>Birolo</surname></persName>
		</author>
		<author>
			<persName><forename type="first">D</forename><surname>Pala</surname></persName>
		</author>
		<author>
			<persName><forename type="first">P</forename><surname>Bosoni</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A</forename><surname>Chiò</surname></persName>
		</author>
		<author>
			<persName><forename type="first">U</forename><surname>Manera</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><surname>Carvalho</surname></persName>
		</author>
		<author>
			<persName><forename type="first">B</forename><surname>Miranda</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><surname>Gromicho</surname></persName>
		</author>
		<author>
			<persName><forename type="first">I</forename><surname>Alves</surname></persName>
		</author>
		<author>
			<persName><forename type="first">R</forename><surname>Bellazzi</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A</forename><surname>Dagliati</surname></persName>
		</author>
		<author>
			<persName><forename type="first">P</forename><surname>Fariselli</surname></persName>
		</author>
		<author>
			<persName><forename type="first">S</forename><forename type="middle">C</forename><surname>Madeira</surname></persName>
		</author>
		<author>
			<persName><forename type="first">B</forename><forename type="middle">Di</forename><surname>Camillo</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="j">Artificial Intelligence in Medicine</title>
		<imprint>
			<biblScope unit="volume">142</biblScope>
			<biblScope unit="page">102588</biblScope>
			<date type="published" when="2023">2023</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b9">
	<analytic>
		<title level="a" type="main">Machine learning solutions applied to amyotrophic lateral sclerosis prognosis: A review</title>
		<author>
			<persName><forename type="first">F</forename><surname>Papaiz</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><forename type="middle">E T</forename><surname>Dourado</surname></persName>
		</author>
		<author>
			<persName><forename type="first">R</forename><forename type="middle">A D M</forename><surname>Valentim</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A</forename><forename type="middle">H F</forename><surname>De Morais</surname></persName>
		</author>
		<author>
			<persName><forename type="first">J</forename><forename type="middle">P</forename><surname>Arrais</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="j">Frontiers in Computer Science</title>
		<imprint>
			<biblScope unit="volume">4</biblScope>
			<date type="published" when="2022">2022</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b10">
	<analytic>
		<title level="a" type="main">Randomforest4life: A random forest for predicting als disease progression</title>
		<author>
			<persName><forename type="first">T</forename><surname>Hothorn</surname></persName>
		</author>
		<author>
			<persName><forename type="first">H</forename><forename type="middle">H</forename><surname>Jung</surname></persName>
		</author>
		<idno type="PMID">25141076</idno>
	</analytic>
	<monogr>
		<title level="j">Amyotrophic Lateral Sclerosis and Frontotemporal Degeneration</title>
		<imprint>
			<biblScope unit="volume">15</biblScope>
			<biblScope unit="page" from="444" to="452" />
			<date type="published" when="2014">2014</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b11">
	<analytic>
		<title level="a" type="main">Predicting the severity of motor neuron disease progression using electronic health record data with a cloud computing big data approach</title>
		<author>
			<persName><forename type="first">K</forename><forename type="middle">D</forename><surname>Ko</surname></persName>
		</author>
		<author>
			<persName><forename type="first">T</forename><surname>El-Ghazawi</surname></persName>
		</author>
		<author>
			<persName><forename type="first">D</forename><surname>Kim</surname></persName>
		</author>
		<author>
			<persName><forename type="first">H</forename><surname>Morizono</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="m">IEEE Conference on Computational Intelligence in Bioinformatics and Computational Biology</title>
				<imprint>
			<date type="published" when="2014">2014. 2014</date>
			<biblScope unit="page" from="1" to="6" />
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b12">
	<analytic>
		<title level="a" type="main">Temporal modeling of deterioration patterns and clustering for disease prediction of als patients</title>
		<author>
			<persName><forename type="first">D</forename><surname>Halbersberg</surname></persName>
		</author>
		<author>
			<persName><forename type="first">B</forename><surname>Lerner</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="m">18th IEEE International Conference On Machine Learning And Applications (ICMLA)</title>
				<imprint>
			<date type="published" when="2019">2019. 2019</date>
			<biblScope unit="page" from="62" to="68" />
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b13">
	<analytic>
		<title level="a" type="main">Predicting disease progression in amyotrophic lateral sclerosis</title>
		<author>
			<persName><forename type="first">A</forename><forename type="middle">A</forename><surname>Taylor</surname></persName>
		</author>
		<author>
			<persName><forename type="first">C</forename><surname>Fournier</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><surname>Polak</surname></persName>
		</author>
		<author>
			<persName><forename type="first">L</forename><surname>Wang</surname></persName>
		</author>
		<author>
			<persName><forename type="first">N</forename><surname>Zach</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><surname>Keymer</surname></persName>
		</author>
		<author>
			<persName><forename type="first">J</forename><forename type="middle">D</forename><surname>Glass</surname></persName>
		</author>
		<author>
			<persName><forename type="first">D</forename><forename type="middle">L</forename><surname>Ennist</surname></persName>
		</author>
		<author>
			<persName><forename type="first">T</forename><forename type="middle">P R O</forename></persName>
		</author>
		<author>
			<persName><forename type="first">-A</forename><forename type="middle">A C T</forename><surname>Consortium</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="j">Annals of Clinical and Translational Neurology</title>
		<imprint>
			<biblScope unit="volume">3</biblScope>
			<biblScope unit="page" from="866" to="875" />
			<date type="published" when="2016">2016</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b14">
	<analytic>
		<title level="a" type="main">Stratification of amyotrophic lateral sclerosis patients: a crowdsourcing approach</title>
		<author>
			<persName><forename type="first">R</forename><surname>Kueffner</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Al</forename></persName>
		</author>
	</analytic>
	<monogr>
		<title level="j">Scientific Reports</title>
		<imprint>
			<biblScope unit="volume">9</biblScope>
			<date type="published" when="2019">2019</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b15">
	<analytic>
		<title level="a" type="main">Using blood data for the differential diagnosis and prognosis of motor neuron diseases: a new dataset for machine learning applications</title>
		<author>
			<persName><forename type="first">A</forename><surname>Greco</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><forename type="middle">R</forename><surname>Chiesa</surname></persName>
		</author>
		<author>
			<persName><forename type="first">I</forename><surname>Da Prato</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A</forename><forename type="middle">M</forename><surname>Romanelli</surname></persName>
		</author>
		<author>
			<persName><forename type="first">C</forename><surname>Dolciotti</surname></persName>
		</author>
		<author>
			<persName><forename type="first">G</forename><surname>Cavallini</surname></persName>
		</author>
		<author>
			<persName><forename type="first">S</forename><forename type="middle">M</forename><surname>Masciandaro</surname></persName>
		</author>
		<author>
			<persName><forename type="first">E</forename><forename type="middle">P</forename><surname>Scilingo</surname></persName>
		</author>
		<author>
			<persName><forename type="first">R</forename><surname>Del Carratore</surname></persName>
		</author>
		<author>
			<persName><forename type="first">P</forename><surname>Bongioanni</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="j">Scientific Reports</title>
		<imprint>
			<biblScope unit="volume">11</biblScope>
			<date type="published" when="2021">2021</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b16">
	<analytic>
		<title level="a" type="main">Amyotrophic lateral sclerosis disease progression model</title>
		<author>
			<persName><forename type="first">M</forename><forename type="middle">F A</forename><surname>Roberto Gomeni</surname></persName>
		</author>
		<idno type="PMID">24070404</idno>
	</analytic>
	<monogr>
		<title level="j">Amyotrophic Lateral Sclerosis and Frontotemporal Degeneration</title>
		<imprint>
			<biblScope unit="volume">15</biblScope>
			<biblScope unit="page" from="119" to="129" />
			<date type="published" when="2014">2014</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b17">
	<analytic>
		<title level="a" type="main">Predicting non-invasive ventilation in als patients using stratified disease progression groups</title>
		<author>
			<persName><forename type="first">S</forename><surname>Pires</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><surname>Gromicho</surname></persName>
		</author>
		<author>
			<persName><forename type="first">S</forename><surname>Pinto</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><surname>Carvalho</surname></persName>
		</author>
		<author>
			<persName><forename type="first">S</forename><forename type="middle">C</forename><surname>Madeira</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="m">IEEE International Conference on Data Mining Workshops (ICDMW)</title>
				<imprint>
			<date type="published" when="2018">2018. 2018</date>
			<biblScope unit="page" from="748" to="757" />
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b18">
	<analytic>
		<title level="a" type="main">Learning prognostic models using disease progression patterns: Predicting the need for non-invasive ventilation in amyotrophic lateral sclerosis</title>
		<author>
			<persName><forename type="first">A</forename><forename type="middle">S</forename><surname>Martins</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><surname>Gromicho</surname></persName>
		</author>
		<author>
			<persName><forename type="first">S</forename><surname>Pinto</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><surname>Carvalho</surname></persName>
		</author>
		<author>
			<persName><forename type="first">S</forename><forename type="middle">C</forename><surname>Madeira</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="j">IEEE/ACM Transactions on Computational Biology and Bioinformatics</title>
		<imprint>
			<biblScope unit="volume">19</biblScope>
			<biblScope unit="page" from="2572" to="2583" />
			<date type="published" when="2022">2022</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b19">
	<analytic>
		<title level="a" type="main">Patient stratification using clinical and patient profiles: Targeting personalized prognostic prediction in als</title>
		<author>
			<persName><forename type="first">S</forename><surname>Pires</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><surname>Gromicho</surname></persName>
		</author>
		<author>
			<persName><forename type="first">S</forename><surname>Pinto</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><surname>Carvalho</surname></persName>
		</author>
		<author>
			<persName><forename type="first">S</forename><forename type="middle">C</forename><surname>Madeira</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="m">Bioinformatics and Biomedical Engineering</title>
				<editor>
			<persName><forename type="first">I</forename><surname>Rojas</surname></persName>
		</editor>
		<editor>
			<persName><forename type="first">O</forename><surname>Valenzuela</surname></persName>
		</editor>
		<editor>
			<persName><forename type="first">F</forename><surname>Rojas</surname></persName>
		</editor>
		<editor>
			<persName><forename type="first">L</forename><forename type="middle">J</forename><surname>Herrera</surname></persName>
		</editor>
		<editor>
			<persName><forename type="first">F</forename><surname>Ortuño</surname></persName>
		</editor>
		<meeting><address><addrLine>Cham</addrLine></address></meeting>
		<imprint>
			<publisher>Springer International Publishing</publisher>
			<date type="published" when="2020">2020</date>
			<biblScope unit="page" from="529" to="541" />
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b20">
	<analytic>
		<title level="a" type="main">Deep learning predictions of survival based on mri in amyotrophic lateral sclerosis</title>
		<author>
			<persName><forename type="first">H</forename><forename type="middle">K</forename><surname>Van Der Burgh</surname></persName>
		</author>
		<author>
			<persName><forename type="first">R</forename><surname>Schmidt</surname></persName>
		</author>
		<author>
			<persName><forename type="first">H.-J</forename><surname>Westeneng</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><forename type="middle">A</forename><surname>De Reus</surname></persName>
		</author>
		<author>
			<persName><forename type="first">L</forename><forename type="middle">H</forename><surname>Van Den</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><forename type="middle">P</forename><surname>Berg</surname></persName>
		</author>
		<author>
			<persName><surname>Van Den</surname></persName>
		</author>
		<author>
			<persName><surname>Heuvel</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="j">NeuroImage: Clinical</title>
		<imprint>
			<biblScope unit="volume">13</biblScope>
			<biblScope unit="page" from="361" to="369" />
			<date type="published" when="2017">2017</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b21">
	<analytic>
		<title level="a" type="main">Domain adaptation from clinical trials data to the tertiary care clinic -application to als</title>
		<author>
			<persName><forename type="first">B</forename><surname>Hadad</surname></persName>
		</author>
		<author>
			<persName><forename type="first">B</forename><surname>Lerner</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="m">19th IEEE International Conference on Machine Learning and Applications (ICMLA)</title>
				<imprint>
			<publisher>IEEE</publisher>
			<date type="published" when="2020">2020. 2020</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b22">
	<analytic>
		<title level="a" type="main">Predicting functional impairment trajectories in amyotrophic lateral sclerosis: a probabilistic, multifactorial model of disease progression</title>
		<author>
			<persName><forename type="first">E</forename><surname>Tavazzi</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Al</forename></persName>
		</author>
	</analytic>
	<monogr>
		<title level="j">Journal of Neurology</title>
		<imprint>
			<biblScope unit="volume">269</biblScope>
			<biblScope unit="page" from="3858" to="3878" />
			<date type="published" when="2022">2022</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b23">
	<analytic>
		<title level="a" type="main">A two-stage prediction model for heterogeneous effects of treatments</title>
		<author>
			<persName><forename type="first">K</forename><surname>Chalkou</surname></persName>
		</author>
		<author>
			<persName><forename type="first">E</forename><surname>Steyerberg</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><surname>Egger</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A</forename><surname>Manca</surname></persName>
		</author>
		<author>
			<persName><forename type="first">F</forename><surname>Pellegrini</surname></persName>
		</author>
		<author>
			<persName><forename type="first">G</forename><surname>Salanti</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="j">Statistics in Medicine</title>
		<imprint>
			<biblScope unit="volume">40</biblScope>
			<biblScope unit="page" from="4362" to="4375" />
			<date type="published" when="2021">2021</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b24">
	<analytic>
		<title level="a" type="main">Leveraging electronic health records data to predict multiple sclerosis disease activity</title>
		<author>
			<persName><forename type="first">Y</forename><surname>Ahuja</surname></persName>
		</author>
		<author>
			<persName><forename type="first">N</forename><surname>Kim</surname></persName>
		</author>
		<author>
			<persName><forename type="first">L</forename><surname>Liang</surname></persName>
		</author>
		<author>
			<persName><forename type="first">T</forename><surname>Cai</surname></persName>
		</author>
		<author>
			<persName><forename type="first">K</forename><surname>Dahal</surname></persName>
		</author>
		<author>
			<persName><forename type="first">T</forename><surname>Seyok</surname></persName>
		</author>
		<author>
			<persName><forename type="first">C</forename><surname>Lin</surname></persName>
		</author>
		<author>
			<persName><forename type="first">S</forename><surname>Finan</surname></persName>
		</author>
		<author>
			<persName><forename type="first">K</forename><surname>Liao</surname></persName>
		</author>
		<author>
			<persName><forename type="first">G</forename><surname>Savovoa</surname></persName>
		</author>
		<author>
			<persName><forename type="first">T</forename><surname>Chitnis</surname></persName>
		</author>
		<author>
			<persName><forename type="first">T</forename><surname>Cai</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Z</forename><surname>Xia</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="j">Annals of Clinical and Translational Neurology</title>
		<imprint>
			<biblScope unit="volume">8</biblScope>
			<biblScope unit="page" from="800" to="810" />
			<date type="published" when="2021">2021</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b25">
	<analytic>
		<title level="a" type="main">Prediction of long-term disability in multiple sclerosis</title>
		<author>
			<persName><forename type="first">R</forename><surname>Schlaeger</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><surname>Souza</surname></persName>
		</author>
		<author>
			<persName><forename type="first">C</forename><surname>Schindler</surname></persName>
		</author>
		<author>
			<persName><forename type="first">L</forename><surname>Grize</surname></persName>
		</author>
		<author>
			<persName><forename type="first">S</forename><surname>Dellas</surname></persName>
		</author>
		<author>
			<persName><forename type="first">E</forename><surname>Radue</surname></persName>
		</author>
		<author>
			<persName><forename type="first">L</forename><surname>Kappos</surname></persName>
		</author>
		<author>
			<persName><forename type="first">P</forename><surname>Fuhr</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="j">Multiple Sclerosis Journal</title>
		<imprint>
			<biblScope unit="volume">18</biblScope>
			<biblScope unit="page" from="31" to="38" />
			<date type="published" when="2012">2012</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b26">
	<analytic>
		<title level="a" type="main">Gray matter damage predicts the accumulation of disability 13 years later in ms</title>
		<author>
			<persName><forename type="first">M</forename><surname>Filippi</surname></persName>
		</author>
		<author>
			<persName><forename type="first">P</forename><surname>Preziosa</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><surname>Copetti</surname></persName>
		</author>
		<author>
			<persName><forename type="first">G</forename><surname>Riccitelli</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><forename type="middle">A</forename><surname>Horsfield</surname></persName>
		</author>
		<author>
			<persName><forename type="first">V</forename><surname>Martinelli</surname></persName>
		</author>
		<author>
			<persName><forename type="first">G</forename><surname>Comi</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><forename type="middle">A</forename><surname>Rocca</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="j">Neurology</title>
		<imprint>
			<biblScope unit="volume">81</biblScope>
			<biblScope unit="page" from="1759" to="1767" />
			<date type="published" when="2013">2013</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b27">
	<analytic>
		<title level="a" type="main">MAGNIMS Study Group, Brain atrophy and lesion load predict long term disability in multiple sclerosis</title>
		<author>
			<persName><forename type="first">V</forename><surname>Popescu</surname></persName>
		</author>
		<author>
			<persName><forename type="first">F</forename><surname>Agosta</surname></persName>
		</author>
		<author>
			<persName><forename type="first">H</forename><forename type="middle">E</forename><surname>Hulst</surname></persName>
		</author>
		<author>
			<persName><forename type="first">I</forename><forename type="middle">C</forename><surname>Sluimer</surname></persName>
		</author>
		<author>
			<persName><forename type="first">D</forename><forename type="middle">L</forename><surname>Knol</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><forename type="middle">P</forename><surname>Sormani</surname></persName>
		</author>
		<author>
			<persName><forename type="first">C</forename><surname>Enzinger</surname></persName>
		</author>
		<author>
			<persName><forename type="first">S</forename><surname>Ropele</surname></persName>
		</author>
		<author>
			<persName><forename type="first">J</forename><surname>Alonso</surname></persName>
		</author>
		<author>
			<persName><forename type="first">J</forename><surname>Sastre-Garriga</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A</forename><surname>Rovira</surname></persName>
		</author>
		<author>
			<persName><forename type="first">X</forename><surname>Montalban</surname></persName>
		</author>
		<author>
			<persName><forename type="first">B</forename><surname>Bodini</surname></persName>
		</author>
		<author>
			<persName><forename type="first">O</forename><surname>Ciccarelli</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Z</forename><surname>Khaleeli</surname></persName>
		</author>
		<author>
			<persName><forename type="first">D</forename><forename type="middle">T</forename><surname>Chard</surname></persName>
		</author>
		<author>
			<persName><forename type="first">L</forename><surname>Matthews</surname></persName>
		</author>
		<author>
			<persName><forename type="first">J</forename><surname>Palace</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A</forename><surname>Giorgio</surname></persName>
		</author>
		<author>
			<persName><forename type="first">N</forename><forename type="middle">De</forename><surname>Stefano</surname></persName>
		</author>
		<author>
			<persName><forename type="first">P</forename><surname>Eisele</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A</forename><surname>Gass</surname></persName>
		</author>
		<author>
			<persName><forename type="first">C</forename><forename type="middle">H</forename><surname>Polman</surname></persName>
		</author>
		<author>
			<persName><forename type="first">B</forename><forename type="middle">M J</forename><surname>Uitdehaag</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><forename type="middle">J</forename><surname>Messina</surname></persName>
		</author>
		<author>
			<persName><forename type="first">G</forename><surname>Comi</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><surname>Filippi</surname></persName>
		</author>
		<author>
			<persName><forename type="first">F</forename><surname>Barkhof</surname></persName>
		</author>
		<author>
			<persName><forename type="first">H</forename><surname>Vrenken</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="j">J. Neurol. Neurosurg. Psychiatry</title>
		<imprint>
			<biblScope unit="volume">84</biblScope>
			<biblScope unit="page" from="1082" to="1091" />
			<date type="published" when="2013">2013</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b28">
	<analytic>
		<title level="a" type="main">Prediction of long-term disability in multiple sclerosis</title>
		<author>
			<persName><forename type="first">R</forename><surname>Schlaeger</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><surname>Souza</surname></persName>
		</author>
		<author>
			<persName><forename type="first">C</forename><surname>Schindler</surname></persName>
		</author>
		<author>
			<persName><forename type="first">L</forename><surname>Grize</surname></persName>
		</author>
		<author>
			<persName><forename type="first">S</forename><surname>Dellas</surname></persName>
		</author>
		<author>
			<persName><forename type="first">E</forename><forename type="middle">W</forename><surname>Radue</surname></persName>
		</author>
		<author>
			<persName><forename type="first">L</forename><surname>Kappos</surname></persName>
		</author>
		<author>
			<persName><forename type="first">P</forename><surname>Fuhr</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="j">Mult. Scler</title>
		<imprint>
			<biblScope unit="volume">18</biblScope>
			<biblScope unit="page" from="31" to="38" />
			<date type="published" when="2012">2012</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b29">
	<analytic>
		<title level="a" type="main">Exploration of machine learning techniques in predicting multiple sclerosis disease course</title>
		<author>
			<persName><forename type="first">Y</forename><surname>Zhao</surname></persName>
		</author>
		<author>
			<persName><forename type="first">B</forename><forename type="middle">C</forename><surname>Healy</surname></persName>
		</author>
		<author>
			<persName><forename type="first">D</forename><surname>Rotstein</surname></persName>
		</author>
		<author>
			<persName><forename type="first">C</forename><forename type="middle">R G</forename><surname>Guttmann</surname></persName>
		</author>
		<author>
			<persName><forename type="first">R</forename><surname>Bakshi</surname></persName>
		</author>
		<author>
			<persName><forename type="first">H</forename><forename type="middle">L</forename><surname>Weiner</surname></persName>
		</author>
		<author>
			<persName><forename type="first">C</forename><forename type="middle">E</forename><surname>Brodley</surname></persName>
		</author>
		<author>
			<persName><forename type="first">T</forename><surname>Chitnis</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="j">PLOS ONE</title>
		<imprint>
			<biblScope unit="volume">12</biblScope>
			<biblScope unit="page">e0174866</biblScope>
			<date type="published" when="2017">2017</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b30">
	<analytic>
		<title level="a" type="main">Systematic review of prediction models in relapsing remitting multiple sclerosis</title>
		<author>
			<persName><forename type="first">F</forename><forename type="middle">S</forename><surname>Brown</surname></persName>
		</author>
		<author>
			<persName><forename type="first">S</forename><forename type="middle">A</forename><surname>Glasmacher</surname></persName>
		</author>
		<author>
			<persName><forename type="first">P</forename><forename type="middle">K A</forename><surname>Kearns</surname></persName>
		</author>
		<author>
			<persName><forename type="first">N</forename><surname>Macdougall</surname></persName>
		</author>
		<author>
			<persName><forename type="first">D</forename><surname>Hunt</surname></persName>
		</author>
		<author>
			<persName><forename type="first">P</forename><surname>Connick</surname></persName>
		</author>
		<author>
			<persName><forename type="first">S</forename><surname>Chandran</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="j">PLoS One</title>
		<imprint>
			<biblScope unit="volume">15</biblScope>
			<biblScope unit="page">e0233575</biblScope>
			<date type="published" when="2020">2020</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b31">
	<analytic>
		<title level="a" type="main">Wearable device and smartphone data quantify als progression and may provide novel outcome measures</title>
		<author>
			<persName><forename type="first">S</forename><forename type="middle">A</forename><surname>Johnson</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><surname>Karas</surname></persName>
		</author>
		<author>
			<persName><forename type="first">K</forename><forename type="middle">M</forename><surname>Burke</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><surname>Straczkiewicz</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Z</forename><forename type="middle">A</forename><surname>Scheier</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A</forename><forename type="middle">P</forename><surname>Clark</surname></persName>
		</author>
		<author>
			<persName><forename type="first">S</forename><surname>Iwasaki</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A</forename><surname>Lahav</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A</forename><forename type="middle">S</forename><surname>Iyer</surname></persName>
		</author>
		<author>
			<persName><forename type="first">J.-P</forename><surname>Onnela</surname></persName>
		</author>
		<author>
			<persName><forename type="first">J</forename><forename type="middle">D</forename><surname>Berry</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="j">npj Digital Medicine</title>
		<imprint>
			<biblScope unit="volume">6</biblScope>
			<date type="published" when="2023">2023</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b32">
	<analytic>
		<title level="a" type="main">Developing a clinical-environmental-genotypic prognostic index for relapsing-onset multiple sclerosis and clinically isolated syndrome</title>
		<author>
			<persName><forename type="first">V</forename><surname>Fuh-Ngwa</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Y</forename><surname>Zhou</surname></persName>
		</author>
		<author>
			<persName><forename type="first">J</forename><forename type="middle">C</forename><surname>Charlesworth</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A.-L</forename><surname>Ponsonby</surname></persName>
		</author>
		<author>
			<persName><forename type="first">S</forename><surname>Simpson-Yap</surname></persName>
		</author>
		<author>
			<persName><forename type="first">J</forename><surname>Lechner-Scott</surname></persName>
		</author>
		<author>
			<persName><forename type="first">B</forename><forename type="middle">V</forename><surname>Taylor</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A</forename><forename type="middle">I</forename><surname>Group</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="j">Brain Communications</title>
		<imprint>
			<biblScope unit="volume">3</biblScope>
			<biblScope unit="page">288</biblScope>
			<date type="published" when="2021">2021</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b33">
	<monogr>
		<title level="m" type="main">Baseline machine learning approaches to predict amyotrophic lateral sclerosis disease progression notebook for the idpp lab on intelligent disease progression prediction at clef</title>
		<author>
			<persName><forename type="first">I</forename><surname>Trescato</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A</forename><surname>Guazzo</surname></persName>
		</author>
		<author>
			<persName><forename type="first">E</forename><surname>Longato</surname></persName>
		</author>
		<author>
			<persName><forename type="first">E</forename><surname>Hazizaj</surname></persName>
		</author>
		<author>
			<persName><forename type="first">C</forename><surname>Roversi</surname></persName>
		</author>
		<author>
			<persName><forename type="first">E</forename><surname>Tavazzi</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><surname>Vettoretti</surname></persName>
		</author>
		<author>
			<persName><forename type="first">B</forename><forename type="middle">Di</forename><surname>Camillo</surname></persName>
		</author>
		<imprint>
			<date type="published" when="2022">2022. 2022</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b34">
	<monogr>
		<title level="m" type="main">Baseline machine learning approaches to predict multiple sclerosis disease progression</title>
		<author>
			<persName><forename type="first">A</forename><surname>Guazzo</surname></persName>
		</author>
		<author>
			<persName><forename type="first">I</forename><surname>Trescato</surname></persName>
		</author>
		<author>
			<persName><forename type="first">E</forename><surname>Longato</surname></persName>
		</author>
		<author>
			<persName><forename type="first">E</forename><surname>Tavazzi</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><surname>Vettoretti</surname></persName>
		</author>
		<author>
			<persName><forename type="first">B</forename><surname>Camillo</surname></persName>
		</author>
		<imprint>
			<date type="published" when="2023">2023</date>
			<publisher>CLEF</publisher>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b35">
	<analytic>
		<title level="a" type="main">mice: Multivariate imputation by chained equations in R</title>
		<author>
			<persName><forename type="first">S</forename><surname>Van Buuren</surname></persName>
		</author>
		<author>
			<persName><forename type="first">K</forename><surname>Groothuis-Oudshoorn</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="j">Journal of statistical software</title>
		<imprint>
			<biblScope unit="volume">45</biblScope>
			<biblScope unit="page" from="1" to="67" />
			<date type="published" when="2011">2011</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b36">
	<analytic>
		<title level="a" type="main">An introduction to variable and feature selection</title>
		<author>
			<persName><forename type="first">I</forename><forename type="middle">M</forename><surname>Guyon</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A</forename><surname>Elisseeff</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="j">J. Mach. Learn. Res</title>
		<imprint>
			<biblScope unit="volume">3</biblScope>
			<biblScope unit="page" from="1157" to="1182" />
			<date type="published" when="2003">2003</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b37">
	<analytic>
		<title level="a" type="main">Root-mean-square error (rmse) or mean absolute error (mae): when to use them or not</title>
		<author>
			<persName><forename type="first">T</forename><forename type="middle">O</forename><surname>Hodson</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="j">Geoscientific Model Development</title>
		<imprint>
			<biblScope unit="volume">15</biblScope>
			<biblScope unit="page" from="5481" to="5487" />
			<date type="published" when="2022">2022</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b38">
	<analytic>
		<title level="a" type="main">Random search for hyper-parameter optimization</title>
		<author>
			<persName><forename type="first">J</forename><surname>Bergstra</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Y</forename><surname>Bengio</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="j">J. Mach. Learn. Res</title>
		<imprint>
			<biblScope unit="volume">13</biblScope>
			<biblScope unit="page" from="281" to="305" />
			<date type="published" when="2012">2012</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b39">
	<analytic>
		<title level="a" type="main">Air pollution by particulate matter PM10 may trigger multiple sclerosis relapses</title>
		<author>
			<persName><forename type="first">J</forename><surname>Roux</surname></persName>
		</author>
		<author>
			<persName><forename type="first">D</forename><surname>Bard</surname></persName>
		</author>
		<author>
			<persName><forename type="first">E</forename><surname>Le Pabic</surname></persName>
		</author>
		<author>
			<persName><forename type="first">C</forename><surname>Segala</surname></persName>
		</author>
		<author>
			<persName><forename type="first">J</forename><surname>Reis</surname></persName>
		</author>
		<author>
			<persName><forename type="first">J</forename><forename type="middle">C</forename><surname>Ongagna</surname></persName>
		</author>
		<author>
			<persName><forename type="first">J</forename><surname>Ze</surname></persName>
		</author>
		<author>
			<persName><forename type="first">E</forename><surname>Leray</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="j">Environ Res</title>
		<imprint>
			<biblScope unit="volume">156</biblScope>
			<biblScope unit="page" from="404" to="410" />
			<date type="published" when="2017">2017</date>
		</imprint>
	</monogr>
</biblStruct>

				</listBibl>
			</div>
		</back>
	</text>
</TEI>
