<?xml version="1.0" encoding="UTF-8"?>
<TEI xml:space="preserve" xmlns="http://www.tei-c.org/ns/1.0" 
xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" 
xsi:schemaLocation="http://www.tei-c.org/ns/1.0 https://raw.githubusercontent.com/kermitt2/grobid/master/grobid-home/schemas/xsd/Grobid.xsd"
 xmlns:xlink="http://www.w3.org/1999/xlink">
	<teiHeader xml:lang="en">
		<fileDesc>
			<titleStmt>
				<title level="a" type="main">A geometric XAI approach to protein pocket detection</title>
			</titleStmt>
			<publicationStmt>
				<publisher/>
				<availability status="unknown"><licence/></availability>
			</publicationStmt>
			<sourceDesc>
				<biblStruct>
					<analytic>
						<author>
							<persName><forename type="first">Giovanni</forename><surname>Bocchi</surname></persName>
							<email>giovanni.bocchi1@unimi.it</email>
							<affiliation key="aff0">
								<orgName type="department">Department of Environmental Science and Policy</orgName>
								<orgName type="institution">University of Milan</orgName>
								<address>
									<addrLine>Via Saldini 50</addrLine>
									<postCode>20133</postCode>
									<settlement>Milano</settlement>
									<country key="IT">Italy</country>
								</address>
							</affiliation>
						</author>
						<author>
							<persName><forename type="first">Patrizio</forename><surname>Frosini</surname></persName>
							<email>patrizio.frosini@unibo.it</email>
							<affiliation key="aff1">
								<orgName type="department">Department of Mathematics</orgName>
								<orgName type="institution">University of Bologna</orgName>
								<address>
									<addrLine>Piazza di Porta S.Donato 5</addrLine>
									<postCode>40126</postCode>
									<settlement>Bologna</settlement>
									<country key="IT">Italy</country>
								</address>
							</affiliation>
						</author>
						<author>
							<persName><forename type="first">Alessandra</forename><surname>Micheletti</surname></persName>
							<email>alessandra.micheletti@unimi.it</email>
							<affiliation key="aff0">
								<orgName type="department">Department of Environmental Science and Policy</orgName>
								<orgName type="institution">University of Milan</orgName>
								<address>
									<addrLine>Via Saldini 50</addrLine>
									<postCode>20133</postCode>
									<settlement>Milano</settlement>
									<country key="IT">Italy</country>
								</address>
							</affiliation>
						</author>
						<author>
							<persName><forename type="first">Alessandro</forename><surname>Pedretti</surname></persName>
							<email>alessandro.pedretti@unimi.it</email>
							<affiliation key="aff2">
								<orgName type="department">Department of Pharmaceutical Sciences</orgName>
								<orgName type="institution">University of Milan</orgName>
								<address>
									<addrLine>Via Mangiagalli 25</addrLine>
									<postCode>20133</postCode>
									<settlement>Milano</settlement>
									<country key="IT">Italy</country>
								</address>
							</affiliation>
						</author>
						<author>
							<persName><forename type="first">Gianluca</forename><surname>Palermo</surname></persName>
							<email>gianluca.palermo@polimi.it</email>
							<affiliation key="aff3">
								<orgName type="department">Department of Electronics, Information and Bioengineering</orgName>
								<orgName type="institution">Politecnico of Milano</orgName>
								<address>
									<addrLine>Via Ponzio 34/5</addrLine>
									<postCode>20133</postCode>
									<country key="IT">Italy</country>
								</address>
							</affiliation>
						</author>
						<author>
							<persName><forename type="first">Davide</forename><surname>Gadioli</surname></persName>
							<email>davide.gadioli@polimi.it</email>
							<affiliation key="aff3">
								<orgName type="department">Department of Electronics, Information and Bioengineering</orgName>
								<orgName type="institution">Politecnico of Milano</orgName>
								<address>
									<addrLine>Via Ponzio 34/5</addrLine>
									<postCode>20133</postCode>
									<country key="IT">Italy</country>
								</address>
							</affiliation>
						</author>
						<author>
							<persName><forename type="first">Carmen</forename><surname>Gratteri</surname></persName>
							<email>carmen.gratteri@studenti.unicz.it</email>
							<affiliation key="aff4">
								<orgName type="department">Department of Health Sciences</orgName>
								<orgName type="institution">University Magna Graecia di Catanzaro</orgName>
								<address>
									<addrLine>Viale Europa</addrLine>
									<postCode>88100</postCode>
									<settlement>Catanzaro</settlement>
									<country key="IT">Italy</country>
								</address>
							</affiliation>
						</author>
						<author>
							<persName><forename type="first">Filippo</forename><surname>Lunghini</surname></persName>
							<email>filippo.lunghini@dompe.com</email>
							<affiliation key="aff5">
								<orgName type="institution">Dompé Farmaceutici S.p.A</orgName>
								<address>
									<addrLine>Via Tommaso de Amicis 95</addrLine>
									<postCode>80123</postCode>
									<settlement>Napoli</settlement>
									<country key="IT">Italy</country>
								</address>
							</affiliation>
						</author>
						<author>
							<persName><forename type="first">Andrea</forename><forename type="middle">Rosario</forename><surname>Beccari</surname></persName>
							<email>andrea.beccari@dompe.com</email>
							<affiliation key="aff5">
								<orgName type="institution">Dompé Farmaceutici S.p.A</orgName>
								<address>
									<addrLine>Via Tommaso de Amicis 95</addrLine>
									<postCode>80123</postCode>
									<settlement>Napoli</settlement>
									<country key="IT">Italy</country>
								</address>
							</affiliation>
						</author>
						<author>
							<persName><forename type="first">Anna</forename><surname>Fava</surname></persName>
							<email>anna.fava@dompe.com</email>
							<affiliation key="aff5">
								<orgName type="institution">Dompé Farmaceutici S.p.A</orgName>
								<address>
									<addrLine>Via Tommaso de Amicis 95</addrLine>
									<postCode>80123</postCode>
									<settlement>Napoli</settlement>
									<country key="IT">Italy</country>
								</address>
							</affiliation>
						</author>
						<author>
							<persName><forename type="first">Carmine</forename><surname>Talarico</surname></persName>
							<email>carmine.talarico@dompe.com</email>
							<affiliation key="aff5">
								<orgName type="institution">Dompé Farmaceutici S.p.A</orgName>
								<address>
									<addrLine>Via Tommaso de Amicis 95</addrLine>
									<postCode>80123</postCode>
									<settlement>Napoli</settlement>
									<country key="IT">Italy</country>
								</address>
							</affiliation>
						</author>
						<title level="a" type="main">A geometric XAI approach to protein pocket detection</title>
					</analytic>
					<monogr>
						<idno type="ISSN">1613-0073</idno>
					</monogr>
					<idno type="MD5">96838A8E51D4158004E77F209B5F9559</idno>
				</biblStruct>
			</sourceDesc>
		</fileDesc>
		<encodingDesc>
			<appInfo>
				<application version="0.7.2" ident="GROBID" when="2025-04-23T19:36+0000">
					<desc>GROBID - A machine learning software for extracting information from scholarly documents</desc>
					<ref target="https://github.com/kermitt2/grobid"/>
				</application>
			</appInfo>
		</encodingDesc>
		<profileDesc>
			<textClass>
				<keywords>
					<term>Molecular Docking, Protein Pocket Detection, Equivariance, GENEOs C. Talarico) 0000-0002-4017-8212 (G. Bocchi)</term>
					<term>0000-0001-6711-1926 (P. Frosini)</term>
					<term>0000-0002-5369-5657 (A. Micheletti)</term>
					<term>0000-0001-5916-2029 (A. Pedretti)</term>
					<term>0000-0001-7955-8012 (G. Palermo)</term>
					<term>0000-0002-0143-0737 (D. Gadioli)</term>
					<term>0009-0007-3527-2080 (C. Gratteri)</term>
				</keywords>
			</textClass>
			<abstract>
<div xmlns="http://www.tei-c.org/ns/1.0"><p>Protein pocket detection is an essential step in structure-based virtual screening methods for identifying potential drug targets. To facilitate efficient molecular docking, an accurate determination of target binding sites is indispensable. In this study, we present GENEOnet, an innovative machine learning model based on Group Equivariant Non-Expansive Operators (GENEOs) for protein pocket detection. Our proposed method sets itself apart from other artificial intelligence techniques in the domain due to its reduced number of parameters, increased transparency, and integration of prior knowledge. The experimental assessment validates GENEOnet's efficacy with a limited training dataset, surpassing several established state-of-the-art methods based on multiple critical performance indicators computed using extensive public datasets of ligand-protein complexes. GENEOnet, the result of an ongoing collaborative effort between Italian universities and the pharmaceutical company Dompé Farmaceutici S.p.A., is accessible as a web service at https://geneonet.exscalate.eu to enable the scientific community to evaluate the pre-trained model for pocket detection.</p></div>
			</abstract>
		</profileDesc>
	</teiHeader>
	<text xml:lang="en">
		<body>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="1.">Introduction</head><p>Molecular docking, a critical research area in both pharmaceuticals and academia, is a simulation technique utilized to predict the binding mode of small molecules with respect to specific target proteins based on their three-dimensional structures <ref type="bibr" target="#b0">[1]</ref>. This method plays a crucial role in elucidating molecular interactions and has significant applications, particularly in drug repurposing <ref type="bibr" target="#b1">[2]</ref>. Repurposing existing and approved drugs involves identifying new therapeutic uses and, bypassing the time-consuming and costly drug development process, enables researchers to expedite the delivery of novel therapies to patients in an efficient and affordable manner.</p><p>Blind docking involves the tentative to accommodate the ligand trying anywhere on the protein surface. However, blind docking comes with challenges like false positives, where ligands may score well but have no experimental binding affinity to the target due to limitations in scoring functions.</p><p>To address these concerns, "informed" docking <ref type="bibr" target="#b2">[3]</ref> is an alternative approach that restricts the search only to promising areas of a protein's surface, known as pockets. This method reduces false positives and computational time needed for extensive virtual screening. Protein pocket detection, which is the problem of identifying such pockets on a target protein, in recent years has been addressed through machine learning and AI methods. However, explainability and trustworthiness of these methods have been neglected.</p><p>In this paper, we present some recent findings relative to GENEOnet <ref type="bibr" target="#b3">[4]</ref> a simple and thus quite explainable machine learning method for protein pocket detection which is built using the mathematical theory of Group Equivariant Non-Expansive Operators.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="2.">Methods</head></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="2.1.">GENEOs</head><p>In this study, we further investigate GENEOnet a shallow network composed of Group Equivariant Non-Expansive Operator units, whose architecture is depicted in Figure <ref type="figure" target="#fig_0">1a</ref>. For a comprehensive understanding of GENEOs, we refer the reader to <ref type="bibr" target="#b4">[5,</ref><ref type="bibr" target="#b5">6]</ref>. GENEOs possess good mathematical properties that make them interesting for machine learning applications. Two primary features of GENEOs are equivariance and non-expansivity.</p><p>Equivariance <ref type="bibr" target="#b6">[7]</ref> refers to the method's ability to behave coherently with respect to the action of specific groups of geometrical transformations of the data. The simplest form of equivariance is called invariance: for instance, a rotation-invariant method must assign the same label to an image of an elephant facing upwards as it does to the same image rotated 90 degrees left independently on the correctness of the label.</p><p>Non-expansivity means that the outputs of a GENEO should not be further apart than their respective inputs with respect to an appropriate distance metric. This property can be read as a form of theoretical stability, ensuring that small input perturbations result in minimal output changes.</p><p>In this regard, adversarial attacks <ref type="bibr" target="#b7">[8]</ref> aim to assess deep learning methods' robustness against perturbations, such as rotations and noise perturbations of the inputs, and many others. Regrettably, black box models have often been shown to be susceptible to these forms of deception, which could hardly mislead human observers. Instead, by definition, GENEOs can be made resilient to the two attacks mentioned above, making them an attractive option when seeking robust and trustworthy results.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="2.2.">GENEOnet</head><p>GENEOnet, with a representative output displayed in Figure <ref type="figure" target="#fig_2">2a</ref>, is broken down into six steps:</p><p>1. Data preprocessing: Given an input protein 𝑃 , GENEOnet first computes a voxelization of the space enclosed within a bounding box surrounding the protein surface. Subsequently, eight potential functions are computed on the resulting voxel grid, each one modeling essential aspects of the protein structure from geometrical, physical and chemical viewpoints. 2. GENEO layer: A convolutional rigid motion equivariant operator (mostly based on gaussian kernels), depending on a shape parameter 𝜎, is applied to each potential function.</p><p>The resulting function is normalized between 0 and 1.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="3.">Convex combination:</head><p>The eight GENEO outputs are combined via convex combination with weights 𝛼. The resulting combination output, denoted as 𝜓, is normalized between 0 and 1 and encodes the probability that a voxel belongs to a pocket. 4. Thresholding: The final output is obtained by considering the connected components of the set of voxels where the value of 𝜓 is above a threshold parameter 𝜃. 5. Evaluation: If the ground truth (i.e., the co-crystallized ligand) is accessible, the output can be compared against it using a volumetric accuracy function. 6. Scoring: Each predicted pocket is assigned a score, computed as a weighted average of 𝜓 within the spatial region identified by a pocket, enabling ranking of pockets from the most promising to the least promising.</p><formula xml:id="formula_0">P φ 1 φ 2 . . . φ 7 φ 8 ψ 1 ψ 2</formula><p>. . .  </p><formula xml:id="formula_1">ψ 7 ψ 8 ψ ψ F σ1 1 F σ2 2 F σ7 7 F σ8 8 α 1 α 2 α 7 α 8 θ<label>(</label></formula></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="2.3.">Training, model selection and comparison</head><p>Our study employed PDBbind, a publicly accessible database of curated protein-ligand complexes for binding affinity analysis, as the primary data source (available at http://pdbbind.org.cn/). We retrieved 12330 complexes from the 2020 version for evaluation and analysis.</p><p>Steps 1 through 5 were considered during the training process, with backpropagation used to optimize parameters to optimize accuracy (introduced in Step 5). GENEOnet was trained on a set of 200 molecules extracted from the retrieved complexes. However, this method did not address the challenge of identifying true pockets within high-ranked predictions (as per <ref type="bibr">Step 6)</ref>.</p><p>To tackle this issue, we generated multiple models by repeating the optimization process while maintaining the same initial parameter settings but varying the training sets (each comprising of 200 complexes). The final model was selected based on maximizing its ability to identify true pockets at the highest rank using a Validation set consisting of nearly 3000 complexes.</p><p>Moreover, we compared GENEOnet's performance against other state-of-the-art methods (see <ref type="bibr" target="#b3">[4]</ref> for results) in terms of scoring precision, volumetric matching, and shape similarity on a Test set containing approximately 9000 complexes. In all experiments, GENEOnet outperformed the others, which was unexpected due to its unique transparency, explainability, and robustness features not shared by the other methods. We will further explore some of these properties in the following section.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="3.">Analysis</head><p>In this section, our aim is to provide an additional in-depth analysis that underscores the explainability and robustness characteristics of GENEOnet, many of which can be attributed to the adoption of GENEOs as building blocks.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="3.1.">Prior knowledge</head><p>In the context of developing GENEO-based models, the selection and design of an appropriate pool of operators can be considered as a crucial step of information engineering for the problem at hand.</p><p>In the case of GENEOnet, experts in molecular docking identified lipophilicity, hydrophilicity, hydrogen bond acceptor or donor atoms, etc. (see Table <ref type="table">1b</ref>) as essential features to identify potential pockets. For example, regarding the lipophilicity potential, it was argued that a favorable pocket candidate should exhibit an average high value of this quantity. Thus, a GENEO from the family of convolutional operators with a Gaussian kernel was chosen to process this potential. The tunable shape parameter in this case is linked to the shape of the Gaussian. Analogous considerations were used to select the remaining seven GENEOs for the other potentials.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="3.2.">Parameters investigation</head><p>GENEOnet, as described in Section 2.2, includes a total of seventeen trainable parameters: eight shape coefficients for operator kernels, eight coefficients for the convex combination, and one threshold coefficient.</p><p>We believe that Equivariance is a primary factor contributing to GENEOnet's relatively few trainable parameters versus other CNN-based methods like DeepSite <ref type="bibr" target="#b8">[9]</ref> (844529) and DeepPocket <ref type="bibr" target="#b9">[10]</ref> (665122). Indeed the requirement for equivariance necessitated the adoption of rotation-invariant kernels, limiting the kernel search to radial functions chosen to depend on only one shape parameter. This leads to a greater understanding and interpretability of GENEOnet's kernel parameters as opposed to standard CNNs. Moreover, while not directly responsible for reducing the number of parameters, the convex constraint promotes sparsity in the combination coefficients, akin to Lasso regularisation. This may result in some biologically relevant GENEOs having small coefficients due to their correlation with other operators.</p><p>Indeed, GENEOnet's limited trainable parameters facilitate precise interpretation of each of them: shape parameters influence operator kernels; convex combination coefficients serve as feature importances for potentials (Table <ref type="table">1b</ref>); and the threshold coefficient determines the significance of voxel activation. The convex combination coefficients warrant further exploration. The lipophilic potential, essential for pockets due to their need to exhibit lipophilic properties, receives the highest score. Surprisingly, potentials linked to hydrogen bonds, despite being biologically significant, have very low scores. As already noticed, this may be a result of the convex constraint: indeed, these potentials tend to be more concentrated in small regions surrounding acceptor or donor atoms, and thus other potentials, such as the polar potential, which might be strongly correlated with hydrogen bonds, are preferred. This could be the case with the selected model where the polar operator has a convex combination weight which is the third highest.</p><p>During the model selection process, parameter sensitivity analyses were performed as byproducts when generating 200 models from different training sets (Figure <ref type="figure" target="#fig_2">2b</ref> shows boxplots of the convex combination coefficients). The findings largely confirm the conclusions of the previous paragraphs: on average, hydrogen bonds play a role but are outweighed by other operators, such as lipophilicity, which exhibit a coefficients distribution with a box containing higher values (𝛼 4 ). If this analysis confirms the importance of potentials like those related to hydrogen bonds, it also reveals that the Gravitational and Hydrophilic potentials are given very little importance, a result that was somewhat anticipated given the nature of these potentials in connection to pocket detection.  <ref type="table">1b</ref>. </p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="3.3.">Robustness test</head><p>Here we tested robustness to perturbations. In our context, robustness is strictly related to the Non-Expansivity property of GENEOs, and it is very important for pocket identification since proteins may exhibit extremely dynamic shapes, while in the data, they are frozen until crystallizing to capture an image of the structure. To test robustness, six proteins were selected: two belonging to the set of those whose true pocket was matched by the top-ranked prediction (proteins 2IGV, 4B0C), another two from the set of pockets matched by the second-ranked prediction (proteins 1L83, 3PCB), and the remaining two from those matched by the thirdranked predicted pocket (proteins 1IIH, 4TIM). White noise was introduced by summing i.i.d. Gaussian r.v. 𝒩 (0, 𝑠 2 ) with zero mean and variance 𝑠 2 to every voxel. Although i.i.d. noise is not realistic, as perturbations in the protein conformation are likely correlated because of atom interactions, it serves as a global test for robustness. We conducted multiple experiments by varying the standard deviation 𝑠 in the set {0.01, 0.03, 0.05}, each time generating 200 different perturbations. Figure <ref type="figure" target="#fig_3">3</ref> shows that overlaps and scores distributions of perturbations exhibit great robustness for all values of standard deviation 𝑠. Figure <ref type="figure" target="#fig_4">4</ref> indicates greater robustness for rankings of top and second-ranked pockets while a mildly lower degree of stability is showed for third-ranked pockets. </p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="4.">Discussion</head><p>The analysis presented in the preceding section provides an initial understanding of GENEOnet's explainability and trustworthiness, summarised as follows:</p><p>• GENEOnet can incorporate prior knowledge not only during feature selection but also in operator pool selection. Although feature selection is common in machine learning algorithms, this second step is less frequently considered, making the choice of operators more complex and less stable for methods like Convolutional Neural Networks. • GENEOnet has a smaller number of parameters than other protein pocket detection methods based on deep learning architectures. This attribute allows us to perform sensitivity analysis and provides interpretability by design rather than using post hoc explanation techniques. • GENEOnet's equivariance with respect to rigid motions allows us to overlook the input protein's spatial pose and helps to reduce the number of parameters. • GENEOnet's non-expansivity provides the model with a reasonable degree of robustness against small physiological modifications in the input protein's spatial conformation.</p><p>The model shows great robustness for lower noise standard deviations when analysing the identifications made by the first or second predicted pockets. However, larger input changes may influence the final prediction. We leave this study to subsequent work. • The reduced data requirements for training GENEOnet (200 complexes) compared to deep learning methods help decrease computational costs and processing times. This attribute is not directly related to explainability but makes the model more accessible as fewer resources are needed to reproduce its results or delve deeper into its analysis.</p><p>In conclusion, GENEOs hold promise for building explainable and robust models such as GENEOnet. Future work includes creating more instances of GENEO-based models <ref type="bibr" target="#b10">[11]</ref> and further evaluation of GENEOnet. A promising advancement could be the use of GENEOnet for analyzing molecular dynamics data. In molecular dynamics simulations, tracking the progression of GENEOnet scores for pockets jointly with techniques that identify breakpoints (see e.g. <ref type="bibr" target="#b11">[12]</ref>) may help pinpoint optimal frames for bond formation.</p></div><figure xmlns="http://www.tei-c.org/ns/1.0" xml:id="fig_0"><head>Figure 1 :</head><label>1</label><figDesc>Figure 1: Model architecture and optimal parameters.</figDesc></figure>
<figure xmlns="http://www.tei-c.org/ns/1.0" xml:id="fig_1"><head></head><label></label><figDesc>(a) The input protein is depicted in white, while predicted pockets with colors. A zoom shows the true pocket containing the ligand. (b) Sensitivity analysis of convex combination coefficients. Lines indicate median values, whereas stars represent means. The order is the same as in Table</figDesc></figure>
<figure xmlns="http://www.tei-c.org/ns/1.0" xml:id="fig_2"><head>Figure 2 :</head><label>2</label><figDesc>Figure 2: GENEOnet example (Protein ID 6WIY) and sensitivity analysis.</figDesc><graphic coords="5,50.11,419.18,242.35,121.18" type="bitmap" /></figure>
<figure xmlns="http://www.tei-c.org/ns/1.0" xml:id="fig_3"><head>Figure 3 :</head><label>3</label><figDesc>Figure 3: Box Plots of Overlaps and Scores: For each protein, the upper boxplot illustrates the distribution of overlaps between the predicted pocket having the highest overlap to the true pocket and the true pocket itself, while the lower boxplot depicts the corresponding distribution of scores.</figDesc><graphic coords="6,95.13,285.81,133.35,198.02" type="bitmap" /></figure>
<figure xmlns="http://www.tei-c.org/ns/1.0" xml:id="fig_4"><head>Figure 4 :</head><label>4</label><figDesc>Figure 4: Bar Plots of Rank Positions: Each bar chart depicts the distribution of rankings assigned to the predicted pockets that correspond to the true ones across the perturbed sample set.</figDesc><graphic coords="7,95.13,84.19,133.34,186.16" type="bitmap" /></figure>
		</body>
		<back>

			<div type="acknowledgement">
<div xmlns="http://www.tei-c.org/ns/1.0"><head>Acknowledgments</head><p>This research was financially supported by Dompé Farmaceutici S.p.A. Additional scientific support is acknowledged to the Italian GNAMPA -INDAM group. Computational resources were partially provided by the INDACO core facility for HPC at Università degli Studi di Milano.</p><p>Availability: GENEOnet can be tested at the following URL: https://geneonet.exscalate.eu</p></div>
			</div>

			<div type="references">

				<listBibl>

<biblStruct xml:id="b0">
	<analytic>
		<title level="a" type="main">The process of structure-based drug design</title>
		<author>
			<persName><forename type="first">A</forename><forename type="middle">C</forename><surname>Anderson</surname></persName>
		</author>
		<idno type="DOI">10.1016/j.chembiol.2003.09.002</idno>
	</analytic>
	<monogr>
		<title level="j">Chem. Biol</title>
		<imprint>
			<biblScope unit="volume">10</biblScope>
			<biblScope unit="page" from="787" to="797" />
			<date type="published" when="2003">2003</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b1">
	<analytic>
		<title level="a" type="main">A review of recent developments and progress in computational drug repositioning</title>
		<author>
			<persName><forename type="first">W</forename><surname>Shi</surname></persName>
		</author>
		<author>
			<persName><forename type="first">X</forename><surname>Chen</surname></persName>
		</author>
		<idno type="DOI">10.2174/1381612826666200116145559</idno>
	</analytic>
	<monogr>
		<title level="j">Curr. Pharm. Design</title>
		<imprint>
			<biblScope unit="volume">26</biblScope>
			<biblScope unit="page" from="3059" to="3068" />
			<date type="published" when="2020">2020</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b2">
	<analytic>
		<title level="a" type="main">Improving accuracy and efficiency of blind protein-ligand docking by focusing on predicted binding sites</title>
		<author>
			<persName><forename type="first">D</forename><surname>Ghersi</surname></persName>
		</author>
		<author>
			<persName><forename type="first">R</forename><surname>Sanchez</surname></persName>
		</author>
		<idno type="DOI">10.1002/prot.22154</idno>
	</analytic>
	<monogr>
		<title level="j">Proteins</title>
		<imprint>
			<biblScope unit="volume">74</biblScope>
			<biblScope unit="page" from="417" to="424" />
			<date type="published" when="2009">2009</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b3">
	<monogr>
		<title level="m" type="main">GENEOnet: A new machine learning paradigm based on group equivariant non-expansive operators. an application to protein pocket detection</title>
		<author>
			<persName><forename type="first">G</forename><surname>Bocchi</surname></persName>
		</author>
		<author>
			<persName><forename type="first">P</forename><surname>Frosini</surname></persName>
		</author>
		<idno type="arXiv">arXiv:2202.00451</idno>
		<imprint>
			<date type="published" when="2022">2022</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b4">
	<analytic>
		<title level="a" type="main">Towards a topological-geometrical theory of group equivariant non-expansive operators for data analysis and machine learning</title>
		<author>
			<persName><forename type="first">M</forename><forename type="middle">G</forename><surname>Bergomi</surname></persName>
		</author>
		<author>
			<persName><forename type="first">P</forename><surname>Frosini</surname></persName>
		</author>
		<idno type="DOI">10.1038/s42256-019-0087-3</idno>
	</analytic>
	<monogr>
		<title level="j">Nat. Mach. Intell</title>
		<imprint>
			<biblScope unit="volume">1</biblScope>
			<biblScope unit="page" from="423" to="433" />
			<date type="published" when="2019">2019</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b5">
	<analytic>
		<title level="a" type="main">On the finite representation of linear group equivariant operators via permutant measures</title>
		<author>
			<persName><forename type="first">G</forename><surname>Bocchi</surname></persName>
		</author>
		<author>
			<persName><forename type="first">S</forename><surname>Botteghi</surname></persName>
		</author>
		<idno type="DOI">10.1007/s10472-022-09830-1</idno>
	</analytic>
	<monogr>
		<title level="j">Ann. Math. Artif. Intell</title>
		<imprint>
			<biblScope unit="volume">91</biblScope>
			<biblScope unit="page" from="465" to="487" />
			<date type="published" when="2023">2023</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b6">
	<analytic>
		<title level="a" type="main">Group equivariant convolutional networks</title>
		<author>
			<persName><forename type="first">T</forename><forename type="middle">S</forename><surname>Cohen</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><surname>Welling</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="j">ICML</title>
		<imprint>
			<biblScope unit="volume">48</biblScope>
			<biblScope unit="page" from="2990" to="2999" />
			<date type="published" when="2016">2016. 2016</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b7">
	<analytic>
		<title level="a" type="main">Strike (with) a pose: Neural networks are easily fooled by strange poses of familiar objects</title>
		<author>
			<persName><forename type="first">M</forename><forename type="middle">A</forename><surname>Alcorn</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Q</forename><surname>Li</surname></persName>
		</author>
		<idno type="DOI">10.1109/CVPR.2019.00498</idno>
	</analytic>
	<monogr>
		<title level="m">CVPR 2019</title>
				<imprint>
			<date type="published" when="2019">2019</date>
			<biblScope unit="page" from="4840" to="4849" />
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b8">
	<analytic>
		<title level="a" type="main">Deepsite: protein-binding site predictor using 3d-convolutional neural networks</title>
		<author>
			<persName><forename type="first">J</forename><surname>Jimenez</surname></persName>
		</author>
		<author>
			<persName><forename type="first">S</forename><surname>Doerr</surname></persName>
		</author>
		<idno type="DOI">10.1093/bioinformatics/btx350</idno>
	</analytic>
	<monogr>
		<title level="j">Bioinformatics</title>
		<imprint>
			<biblScope unit="volume">33</biblScope>
			<biblScope unit="page" from="3036" to="3042" />
			<date type="published" when="2017">2017</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b9">
	<analytic>
		<title level="a" type="main">Deeppocket: Ligand binding site detection and segmentation using 3d convolutional neural networks</title>
		<author>
			<persName><forename type="first">R</forename><surname>Aggarwal</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A</forename><surname>Gupta</surname></persName>
		</author>
		<idno type="DOI">10.1021/acs.jcim.1c00799</idno>
	</analytic>
	<monogr>
		<title level="j">J. Chem Inf. Model</title>
		<imprint>
			<biblScope unit="volume">62</biblScope>
			<biblScope unit="page" from="5069" to="5079" />
			<date type="published" when="2022">2022</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b10">
	<monogr>
		<title level="m" type="main">Low-resource white-box semantic segmentation of supporting towers on 3d point clouds via signature shape identification</title>
		<author>
			<persName><forename type="first">D</forename><surname>Lavado</surname></persName>
		</author>
		<author>
			<persName><forename type="first">C</forename><surname>Soares</surname></persName>
		</author>
		<idno type="arXiv">arXiv:2306.07809</idno>
		<imprint>
			<date type="published" when="2023">2023</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b11">
	<analytic>
		<title level="a" type="main">A weighted 𝜒 2 test to detect the presence of a major change point in non-stationary markov chains</title>
		<author>
			<persName><forename type="first">A</forename><surname>Micheletti</surname></persName>
		</author>
		<author>
			<persName><forename type="first">G</forename><surname>Aletti</surname></persName>
		</author>
		<idno type="DOI">10.1007/s10260-020-00510-0</idno>
	</analytic>
	<monogr>
		<title level="j">Stat. Method. Appl</title>
		<imprint>
			<biblScope unit="volume">29</biblScope>
			<biblScope unit="page" from="899" to="912" />
			<date type="published" when="2020">2020</date>
		</imprint>
	</monogr>
</biblStruct>

				</listBibl>
			</div>
		</back>
	</text>
</TEI>
