<?xml version="1.0" encoding="UTF-8"?>
<TEI xml:space="preserve" xmlns="http://www.tei-c.org/ns/1.0" 
xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" 
xsi:schemaLocation="http://www.tei-c.org/ns/1.0 https://raw.githubusercontent.com/kermitt2/grobid/master/grobid-home/schemas/xsd/Grobid.xsd"
 xmlns:xlink="http://www.w3.org/1999/xlink">
	<teiHeader xml:lang="en">
		<fileDesc>
			<titleStmt>
				<title level="a" type="main">A Comparison of Deep Learning with Global Features for Gastrointestinal Disease Detection</title>
			</titleStmt>
			<publicationStmt>
				<publisher/>
				<availability status="unknown"><licence/></availability>
			</publicationStmt>
			<sourceDesc>
				<biblStruct>
					<analytic>
						<author>
							<persName><forename type="first">Konstantin</forename><surname>Pogorelov</surname></persName>
							<email>konstantin@simula.no</email>
							<affiliation key="aff0">
								<orgName type="laboratory">Simula Research Laboratory</orgName>
								<address>
									<country key="NO">Norway</country>
								</address>
							</affiliation>
							<affiliation key="aff1">
								<orgName type="institution">University of Oslo</orgName>
								<address>
									<country key="NO">Norway</country>
								</address>
							</affiliation>
						</author>
						<author>
							<persName><forename type="first">Michael</forename><surname>Riegler</surname></persName>
							<email>michael@simula.no</email>
							<affiliation key="aff0">
								<orgName type="laboratory">Simula Research Laboratory</orgName>
								<address>
									<country key="NO">Norway</country>
								</address>
							</affiliation>
						</author>
						<author>
							<persName><forename type="first">Pål</forename><surname>Halvorsen</surname></persName>
							<affiliation key="aff0">
								<orgName type="laboratory">Simula Research Laboratory</orgName>
								<address>
									<country key="NO">Norway</country>
								</address>
							</affiliation>
							<affiliation key="aff1">
								<orgName type="institution">University of Oslo</orgName>
								<address>
									<country key="NO">Norway</country>
								</address>
							</affiliation>
						</author>
						<author>
							<persName><forename type="first">Carsten</forename><surname>Griwodz</surname></persName>
							<affiliation key="aff0">
								<orgName type="laboratory">Simula Research Laboratory</orgName>
								<address>
									<country key="NO">Norway</country>
								</address>
							</affiliation>
							<affiliation key="aff1">
								<orgName type="institution">University of Oslo</orgName>
								<address>
									<country key="NO">Norway</country>
								</address>
							</affiliation>
						</author>
						<author>
							<persName><forename type="first">Thomas</forename><surname>De Lange</surname></persName>
							<affiliation key="aff2">
								<orgName type="institution">Cancer Registry of Norway</orgName>
								<address>
									<country key="NO">Norway</country>
								</address>
							</affiliation>
						</author>
						<author>
							<persName><forename type="first">Kristin</forename><forename type="middle">Ranheim</forename><surname>Randel</surname></persName>
							<affiliation key="aff1">
								<orgName type="institution">University of Oslo</orgName>
								<address>
									<country key="NO">Norway</country>
								</address>
							</affiliation>
							<affiliation key="aff2">
								<orgName type="institution">Cancer Registry of Norway</orgName>
								<address>
									<country key="NO">Norway</country>
								</address>
							</affiliation>
						</author>
						<author>
							<persName><forename type="first">Sigrun</forename><forename type="middle">Losada</forename><surname>Eskeland</surname></persName>
							<affiliation key="aff3">
								<orgName type="institution">Vestre Viken Hospital Trust</orgName>
								<address>
									<country key="NO">Norway</country>
								</address>
							</affiliation>
						</author>
						<author>
							<persName><forename type="first">Duc-Tien</forename><surname>Dang-Nguyen</surname></persName>
							<affiliation key="aff4">
								<orgName type="institution">Dublin City University</orgName>
								<address>
									<country key="IE">Ireland</country>
								</address>
							</affiliation>
						</author>
						<author>
							<persName><forename type="first">Olga</forename><surname>Ostroukhova</surname></persName>
							<affiliation key="aff7">
								<orgName type="institution">Research Institute of Multiprocessor Computation Systems n.a. A.V. Kalyaev</orgName>
								<address>
									<country key="RU">Russia</country>
								</address>
							</affiliation>
						</author>
						<author>
							<persName><forename type="first">Mathias</forename><surname>Lux</surname></persName>
							<affiliation key="aff5">
								<orgName type="institution">University of Klagenfurt</orgName>
								<address>
									<country key="AT">Austria</country>
								</address>
							</affiliation>
						</author>
						<author>
							<persName><forename type="first">Concetto</forename><surname>Spampinato</surname></persName>
							<affiliation key="aff6">
								<orgName type="institution">University of Catania</orgName>
								<address>
									<country key="IT">Italy</country>
								</address>
							</affiliation>
						</author>
						<title level="a" type="main">A Comparison of Deep Learning with Global Features for Gastrointestinal Disease Detection</title>
					</analytic>
					<monogr>
						<imprint>
							<date/>
						</imprint>
					</monogr>
					<idno type="MD5">E4F61CD64F8DF8F59EE5A1CCAC532A80</idno>
				</biblStruct>
			</sourceDesc>
		</fileDesc>
		<encodingDesc>
			<appInfo>
				<application version="0.7.2" ident="GROBID" when="2023-03-24T04:53+0000">
					<desc>GROBID - A machine learning software for extracting information from scholarly documents</desc>
					<ref target="https://github.com/kermitt2/grobid"/>
				</application>
			</appInfo>
		</encodingDesc>
		<profileDesc>
			<abstract>
<div xmlns="http://www.tei-c.org/ns/1.0"><p>This paper presents our approach for the 2017 Multimedia for Medicine Medico Task of the MediaEval 2017 Benchmark. We propose a system based on global features and deep neural networks, and preliminary results comparing the approaches are presented.</p></div>
			</abstract>
		</profileDesc>
	</teiHeader>
	<text xml:lang="en">
		<body>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="1">INTRODUCTION</head><p>Following the initiative to investigate how multimedia can improve medical systems <ref type="bibr" target="#b14">[15]</ref>, the 2017 Multimedia for Medicine Medico Task <ref type="bibr" target="#b17">[18]</ref> addresses the challenge of detecting diseases based on multimedia data collected in hospitals <ref type="bibr" target="#b12">[13]</ref>, i.e., the task focuses on detecting abnormalities, diseases and anatomical landmarks in images in the gastrointestinal (GI) tract. There do exist some proposals in this area using various approaches <ref type="bibr" target="#b19">[20,</ref><ref type="bibr" target="#b20">21]</ref>, and in this paper, we describe our solutions, based on both our global-featuresbased and neural-network-based EIR prototypes <ref type="bibr" target="#b11">[12,</ref><ref type="bibr" target="#b13">14,</ref><ref type="bibr" target="#b15">16,</ref><ref type="bibr" target="#b16">17]</ref>.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="2">CLASSIFICATION APPROACHES</head><p>The proposed approaches are based on the hypothesis that GI tract diseases and findings can be recognized and classified based on color, shape and texture properties. In this challenge, there is no detailed ground truth ROIs provided for the training dataset, thus, already existing and well performing approaches to objects recognition are not suitable for this particular task. Moreover, a relatively low amount of training data is provided making it difficult to use modern convolutional neural network (CNN) image segmentation and region-based classification approaches. Furthermore, some objects like polyps and resection margins have a compact body and can be easily differentiated from the surrounding tissue, but other findings like ulcerative colitis have only tissue with a slightly different color properties. To address these different detection challenges, we present 17 different approaches that implement our idea of using visual properties of images for performing multi-class classification with the limited training set size. For the final classification step, we use the WEKA machine learning support library <ref type="bibr" target="#b6">[7]</ref> which is an open source collection of algorithms for machine learning and data mining. For all the approaches based on global features (GFs), we use Lucene Image Retrieval (LIRE) <ref type="bibr" target="#b9">[10]</ref>, an open source implementation of global and local features extraction and comparison. For all the deep-learning-based approaches, we use Keras <ref type="bibr" target="#b2">[3]</ref>, an open Copyright held by the owner/author(s). MediaEval'17, 13-15 September 2017, Dublin, Ireland source high-level neural networks API with Google Tensorflow <ref type="bibr" target="#b0">[1]</ref> as a computational back-end.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="2.1">Global-features-based</head><p>For the GF-based approaches, we use features that represent the overall image visual properties, they are easy and fast to calculate, and they can be used for image comparison, distance computing and image collection search. Here, we use the indexes of visual features extracted from training image set. A classifier is used to search the index for the image that is most similar to a given input image. The GFs we use are JCD, Tamura, Color Layout, Edge Histogram, Auto Color Correlogram and Pyramid Histogram of Oriented Gradients <ref type="bibr" target="#b9">[10]</ref>. We decided for these combinations based on our previous findings and experiments in <ref type="bibr" target="#b13">[14,</ref><ref type="bibr" target="#b15">16]</ref>. Multi-class classification is implemented as an additional classification step to determine the final image class based on the the ranked lists of a search-based classifier for each class of findings. We use the random tree (RT), random forest (RF) and logistic model tree (LMT) classifiers <ref type="bibr" target="#b6">[7]</ref> from WEKA.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="2.2">Deep-features-based</head><p>For the deep-features-based approaches, we use a combined method with deep residual networks for image recognition as features extractor and machine-learning classifier with the input of extracted deep-features as a multi-class classifier. We use the Inception v3 <ref type="bibr" target="#b18">[19]</ref> and ResNet50 <ref type="bibr" target="#b7">[8]</ref> models pre-trained on a set of general images. The models were modified in order to produce numerical probability output for all recognized object classes. Then, we use the class (concept) probabilities (1000 values for both networks) directly in the Concepts runs. For the Features runs, we have used the same pre-trained models without including the fully-connected layer at the top of the network, which give us an output of high-level feature probabilities (16384 values for Inception v3 and 2048 for ResNet50). Finally, we combine the probabilities by simple early fusion in one big vector of floating point numbers and use it as an input for the same classifiers we used in the GF-based approaches.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="2.3">CNN-based</head><p>For the CNN-based approach, we created and trained a custom CNN from scratch. Our CNN consist of six convolution layers. As an activation function, we used the rectified linear unit (ReLU) <ref type="bibr" target="#b5">[6]</ref> and maxpooling for pooling. In all the layers, we also included a 0.5 dropout, and the final classification step was performed using two dense layers with first ReLU and then Sigmoid as activation functions. Both networks were trained for 200 epochs using the Adam optimizer <ref type="bibr" target="#b8">[9]</ref>.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="2.4">Transfer-learning-based</head><p>For the transfer-learning-based (TFL) approach, we use the pretrained Inception v3 <ref type="bibr" target="#b18">[19]</ref> model and transfer learning technique <ref type="bibr" target="#b1">[2]</ref> to train the network on our specific training set. We re-trained the base model and fine-tuned the last layers on the training set following the DeCAF approach <ref type="bibr" target="#b4">[5]</ref>. We did not perform complex data augmentation and only relied on transfer learning. We froze all the basic convolutional layers of the network and only retrained the two top dense layers. The dense layers were retrained using the RMSprop <ref type="bibr" target="#b3">[4]</ref> optimizer that allows an adaptive learning rate during the training process. After 1,000 epochs, we stopped the retraining of the dense layers and started fine tuning the convolutional layers. For that step, we did the analysis of the Inception v3 model layers structure and decided to apply the fine-tuning on the top two convolutional layers. For this training step, we used a stochastic gradient descent method with a low learning rate to achieve the best effect in terms of speed and accuracy <ref type="bibr" target="#b10">[11]</ref>.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="3">EXPERIMENTAL RESULTS</head><p>First, we have performed an initial evaluation of the approaches using the development dataset only randomly splitting it into new training and test sets with the equal number of 2, 000 images in each. We assessed 17 different methods executed in 17 internal runs using the new sets generated. An overview of the conducted internal runs can be found in table <ref type="table" target="#tab_0">1</ref> where we provide the measured performance metrics <ref type="bibr" target="#b12">[13]</ref>. We can see that not all our approaches can perform efficiently on the given dataset. In general, we can conclude that for all the machine-learning-based classification approaches, the LMT classifier is performing the best, the RF classifier is slightly worse, and the RT classifier performs the worst. The 6 Layers CNN and Inception v3 TFL approaches performs with the comparable precision, but Inception v3 TFL have slightly better results. The Inception v3 Concepts and ResNet50 Concepts approaches performs with the comparable precision too, but all the ResNet50 Concepts approaches perform slightly better. The Inception v3 Features approaches perform the worst compared to all other features-based approaches even for the efficient LMT classifier, which can be caused by the huge feature values vector generated by the Inception v3 network. Finally, the best performing approach is the ResNet50 Features approach with the LMT classifier showing the performance of 0.828 for R K and 0.856 for F1 score.</p><p>Based on the initial evaluation, we have selected the five different approaches for the official competition submission. The approaches selected (see table <ref type="table" target="#tab_1">2</ref>) are the best performing in the internal runs while keeping as much diversity of the methods as possible. The official evaluation results provided by the organizers is presented in table 2. The best performing approach is again the ResNet50 Features approach with the LMT classifier (run #4) with the R K value of 0.802 and F1 score of 0.826. The confusion matrix of this run is presented in table 3. The often miss-classified classes are Esophagitis and Z-line that is caused by the nature of the used visual features. Both of these classes consist of pictures of Z-Line, but Esophagitis   </p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="4">CONCLUSION</head><p>In this paper, we presented 17 different combined approaches designed for multi-class classification of medical imaging data with the limited training dataset. We presented a novel comparison of the performance of the various visual-features-based methods with traditional custom CNN and Inception v3 with transfer-learningbased approaches. We used modified Inception v3 and ResNet50 networks and the LIRE library for the features extraction, with machine-learning classification algorithms from WEKA. Despite the limited training dataset and a presence of visually similar image classes, we achieved a good multi-class classification performance with the R K value of 0.802 and a classification speed of 46 frames per second. For our future research, we will investigate the combined approach with the fusion of multiple deep-network-based feature extractors for the initial coarse image classification together with the fine-tuned local-feature-based sub-classification for the efficient cross-class detection between visually similar images.</p></div><figure xmlns="http://www.tei-c.org/ns/1.0" xml:id="fig_0"><head>MediaEval' 17</head><label>17</label><figDesc>, 13-15 September 2017, Dublin, Ireland Pogorelov et al.</figDesc></figure>
<figure xmlns="http://www.tei-c.org/ns/1.0" type="table" xml:id="tab_0"><head>Table 1 :</head><label>1</label><figDesc>Initial performance evaluation based on the random split of the task development dataset.</figDesc><table><row><cell>Method</cell><cell>PREC REC SPEC ACC</cell><cell>F1</cell><cell>R K FPS</cell></row><row><cell>6 Layer CNN</cell><cell cols="3">0.659 0.642 0.947 0.900 0.640 0.600 43</cell></row><row><cell>Inception v3 TFL</cell><cell cols="3">0.700 0.695 0.961 0.925 0.704 0.661 53</cell></row><row><cell>Inception v3 Concepts RT</cell><cell cols="3">0.405 0.402 0.915 0.851 0.403 0.318 66</cell></row><row><cell>Inception v3 Concepts RF</cell><cell cols="3">0.704 0.701 0.957 0.925 0.699 0.659 50</cell></row><row><cell cols="4">Inception v3 Concepts LMT 0.771 0.763 0.970 0.940 0.745 0.721 37</cell></row><row><cell>Inception v3 Features RT</cell><cell cols="3">0.287 0.288 0.898 0.822 0.287 0.186 56</cell></row><row><cell>Inception v3 Features RF</cell><cell cols="3">0.436 0.447 0.921 0.862 0.436 0.362 43</cell></row><row><cell cols="4">Inception v3 Features LMT 0.444 0.438 0.920 0.859 0.438 0.360 30</cell></row><row><cell>ResNet50 Concepts RT</cell><cell cols="3">0.507 0.500 0.929 0.875 0.501 0.431 88</cell></row><row><cell>ResNet50 Concepts RF</cell><cell cols="3">0.762 0.753 0.965 0.938 0.751 0.720 78</cell></row><row><cell>ResNet50 Concepts LMT</cell><cell cols="3">0.781 0.799 0.983 0.970 0.797 0.750 53</cell></row><row><cell>ResNet50 Features RT</cell><cell cols="3">0.479 0.478 0.925 0.869 0.477 0.403 79</cell></row><row><cell>ResNet50 Features RF</cell><cell cols="3">0.790 0.782 0.980 0.928 0.769 0.763 70</cell></row><row><cell>ResNet50 Features LMT</cell><cell cols="3">0.841 0.839 0.985 0.972 0.856 0.828 46</cell></row><row><cell>6 Global Features RT</cell><cell cols="3">0.576 0.578 0.940 0.894 0.576 0.516 130</cell></row><row><cell>6 Global Features RF</cell><cell cols="3">0.744 0.734 0.981 0.951 0.784 0.705 105</cell></row><row><cell>6 Global Features LMT</cell><cell cols="3">0.800 0.785 0.980 0.964 0.781 0.748 80</cell></row></table></figure>
<figure xmlns="http://www.tei-c.org/ns/1.0" type="table" xml:id="tab_1"><head>Table 2 :</head><label>2</label><figDesc>The official classification performance evaluation results (provided by the organizers) of the submitted runs.</figDesc><table><row><cell cols="2">Run # Method</cell><cell>PREC REC SPEC ACC</cell><cell>F1</cell><cell>R K FPS</cell></row><row><cell>1</cell><cell>Inception v3 TFL</cell><cell cols="3">0.735 0.715 0.963 0.725 0.725 0.686 53</cell></row><row><cell>2</cell><cell cols="4">Inception v3 Concepts LMT 0.742 0.738 0.963 0.934 0.737 0.701 37</cell></row><row><cell>3</cell><cell>ResNet50 Concepts LMT</cell><cell cols="3">0.766 0.763 0.966 0.941 0.761 0.729 53</cell></row><row><cell>4</cell><cell>ResNet50 Features LMT</cell><cell cols="3">0.829 0.826 0.975 0.957 0.826 0.802 46</cell></row><row><cell>5</cell><cell>6 Global Features LMT</cell><cell cols="3">0.766 0.760 0.966 0.940 0.757 0.727 80</cell></row></table></figure>
<figure xmlns="http://www.tei-c.org/ns/1.0" type="table" xml:id="tab_2"><head>Table 3 :</head><label>3</label><figDesc>Confusion matrix for the ResNet50 Features LMT run #4.</figDesc><table><row><cell></cell><cell></cell><cell></cell><cell></cell><cell></cell><cell cols="2">Detected class</cell><cell></cell><cell></cell><cell></cell></row><row><cell></cell><cell></cell><cell>A</cell><cell>B</cell><cell>C</cell><cell>D</cell><cell>E</cell><cell>F</cell><cell>G</cell><cell>H</cell></row><row><cell></cell><cell>Esophagitis (A)</cell><cell>319</cell><cell>0</cell><cell>4</cell><cell>2</cell><cell>174</cell><cell>0</cell><cell>1</cell><cell>0</cell></row><row><cell></cell><cell>Dyed and Lifted Polyps (B)</cell><cell>0</cell><cell>385</cell><cell>0</cell><cell>6</cell><cell>0</cell><cell>59</cell><cell>47</cell><cell>3</cell></row><row><cell>Actual class</cell><cell>Pylorus (C) Ulcerative colitis (D) Z-line (E) Dyed Resection Margins (F)</cell><cell>6 5 104 0</cell><cell>0 0 0 84</cell><cell>460 1 8 1</cell><cell>7 460 0 5</cell><cell>19 0 385 0</cell><cell>0 2 0 403</cell><cell>7 14 3 5</cell><cell>1 18 0 2</cell></row><row><cell></cell><cell>Polyps (G)</cell><cell>1</cell><cell>3</cell><cell>1</cell><cell>19</cell><cell>1</cell><cell>1</cell><cell cols="2">441 33</cell></row><row><cell></cell><cell>Cecum (H)</cell><cell>0</cell><cell>1</cell><cell>0</cell><cell>29</cell><cell>0</cell><cell>0</cell><cell cols="2">18 452</cell></row></table><note>is the inflammation of Z-Line area, thus local image characteristics should be used to distinguish between these classes more precisely. The same reason can explain some cases of miss-classification with Dyed and Lifted Polyps, Dyed Resection Margins and Polyps classes.</note></figure>
		</body>
		<back>

			<div type="acknowledgement">
<div xmlns="http://www.tei-c.org/ns/1.0"><head>ACKNOWLEDGMENTS</head><p>This work is founded by the FRINATEK project "EONS" #231687.</p></div>
			</div>

			<div type="references">

				<listBibl>

<biblStruct xml:id="b0">
	<monogr>
		<author>
			<persName><forename type="first">Martín</forename><surname>Abadi</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Ashish</forename><surname>Agarwal</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Paul</forename><surname>Barham</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Eugene</forename><surname>Brevdo</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Zhifeng</forename><surname>Chen</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Craig</forename><surname>Citro</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Greg</forename><forename type="middle">S</forename><surname>Corrado</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Andy</forename><surname>Davis</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Jeffrey</forename><surname>Dean</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Matthieu</forename><surname>Devin</surname></persName>
		</author>
		<author>
			<persName><surname>Others</surname></persName>
		</author>
		<idno type="arXiv">arXiv:1603.04467</idno>
		<title level="m">Tensorflow: Large-scale machine learning on heterogeneous distributed systems</title>
				<imprint>
			<date type="published" when="2016">2016. 2016</date>
		</imprint>
	</monogr>
	<note type="report_type">arXiv preprint</note>
</biblStruct>

<biblStruct xml:id="b1">
	<analytic>
		<title level="a" type="main">Transfer learning with deep networks for saliency prediction in natural video</title>
		<author>
			<persName><forename type="first">Souad</forename><surname>Chaabouni</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Jenny</forename><surname>Benois-Pineau</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Chokri</forename><surname>Ben Amar</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="m">Proceedings of the 2016 IEEE International Conference on Image Processing (ICIP)</title>
				<meeting>the 2016 IEEE International Conference on Image Processing (ICIP)</meeting>
		<imprint>
			<date type="published" when="2016">2016</date>
			<biblScope unit="page" from="1604" to="1608" />
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b2">
	<monogr>
		<author>
			<persName><forename type="first">François</forename><surname>Chollet</surname></persName>
		</author>
		<ptr target="https://keras.io/" />
		<title level="m">Keras: Deep learning library for theano and tensorflow</title>
				<imprint>
			<date type="published" when="2015">2015. 2015. 2017-09-01</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b3">
	<monogr>
		<title level="m" type="main">RMSProp and equilibrated adaptive learning rates for non-convex optimization</title>
		<author>
			<persName><forename type="first">, H De</forename><surname>Yn Dauphin</surname></persName>
		</author>
		<author>
			<persName><surname>Vries</surname></persName>
		</author>
		<author>
			<persName><surname>Chung</surname></persName>
		</author>
		<author>
			<persName><surname>Bengio</surname></persName>
		</author>
		<idno type="arXiv">arXiv:1502.04390</idno>
		<imprint>
			<date type="published" when="2015">2015. 2015</date>
		</imprint>
	</monogr>
	<note type="report_type">arXiv preprint</note>
</biblStruct>

<biblStruct xml:id="b4">
	<analytic>
		<title level="a" type="main">DeCAF: A Deep Convolutional Activation Feature for Generic Visual Recognition</title>
		<author>
			<persName><forename type="first">Jeff</forename><surname>Donahue</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Yangqing</forename><surname>Jia</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Oriol</forename><surname>Vinyals</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Judy</forename><surname>Hoffman</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Ning</forename><surname>Zhang</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Eric</forename><surname>Tzeng</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Trevor</forename><surname>Darrell</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="m">Proceedings of the 31st International Conference on Machine Learning (ICML)</title>
				<meeting>the 31st International Conference on Machine Learning (ICML)</meeting>
		<imprint>
			<date type="published" when="2014">2014</date>
			<biblScope unit="volume">32</biblScope>
			<biblScope unit="page" from="647" to="655" />
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b5">
	<analytic>
		<title level="a" type="main">Digital selection and analogue amplification coexist in a cortex-inspired silicon circuit</title>
		<author>
			<persName><forename type="first">Rahul</forename><surname>Richard Hr Hahnloser</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Misha</forename><forename type="middle">A</forename><surname>Sarpeshkar</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Rodney</forename><forename type="middle">J</forename><surname>Mahowald</surname></persName>
		</author>
		<author>
			<persName><surname>Douglas</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Seung</forename><surname>Sebastian</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="j">Nature</title>
		<imprint>
			<biblScope unit="volume">405</biblScope>
			<biblScope unit="page" from="947" to="951" />
			<date type="published" when="2000">2000. 2000</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b6">
	<analytic>
		<title level="a" type="main">The WEKA data mining software: an update</title>
		<author>
			<persName><forename type="first">Mark</forename><surname>Hall</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Eibe</forename><surname>Frank</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Geoffrey</forename><surname>Holmes</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Bernhard</forename><surname>Pfahringer</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Peter</forename><surname>Reutemann</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Ian</forename><forename type="middle">H</forename><surname>Witten</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="j">ACM SIGKDD explorations newsletter</title>
		<imprint>
			<biblScope unit="volume">11</biblScope>
			<biblScope unit="issue">1</biblScope>
			<biblScope unit="page" from="10" to="18" />
			<date type="published" when="2009">2009. 2009</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b7">
	<analytic>
		<title level="a" type="main">Deep residual learning for image recognition</title>
		<author>
			<persName><forename type="first">Kaiming</forename><surname>He</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Xiangyu</forename><surname>Zhang</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Shaoqing</forename><surname>Ren</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Jian</forename><surname>Sun</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="m">Proceedings of the 2016 IEEE Conference on Computer Vision and Pattern Recognition (CVPR)</title>
				<meeting>the 2016 IEEE Conference on Computer Vision and Pattern Recognition (CVPR)</meeting>
		<imprint>
			<date type="published" when="2016">2016</date>
			<biblScope unit="page" from="770" to="778" />
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b8">
	<monogr>
		<title level="m" type="main">Adam: A method for stochastic optimization</title>
		<author>
			<persName><forename type="first">Diederik</forename><surname>Kingma</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Jimmy</forename><surname>Ba</surname></persName>
		</author>
		<idno type="arXiv">arXiv:1412.6980</idno>
		<imprint>
			<date type="published" when="2014">2014. 2014</date>
		</imprint>
	</monogr>
	<note type="report_type">arXiv preprint</note>
</biblStruct>

<biblStruct xml:id="b9">
	<analytic>
		<title level="a" type="main">LIRE: open source visual information retrieval</title>
		<author>
			<persName><forename type="first">Mathias</forename><surname>Lux</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Michael</forename><surname>Riegler</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Pål</forename><surname>Halvorsen</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Konstantin</forename><surname>Pogorelov</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Nektarios</forename><surname>Anagnostopoulos</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="m">Proceedings of the 2016 ACM Conference on Multimedia Systems (MMSys)</title>
				<meeting>the 2016 ACM Conference on Multimedia Systems (MMSys)</meeting>
		<imprint>
			<date type="published" when="2016">2016</date>
		</imprint>
	</monogr>
	<note>Article no. 30</note>
</biblStruct>

<biblStruct xml:id="b10">
	<analytic>
		<title level="a" type="main">On optimization methods for deep learning</title>
		<author>
			<persName><forename type="first">Jiquan</forename><surname>Ngiam</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Adam</forename><surname>Coates</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Ahbik</forename><surname>Lahiri</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Bobby</forename><surname>Prochnow</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Andrew</forename><forename type="middle">Y</forename><surname>Quoc V Le</surname></persName>
		</author>
		<author>
			<persName><surname>Ng</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="m">Proceedings of the 28th International Conference on Machine Learning (ICML)</title>
				<meeting>the 28th International Conference on Machine Learning (ICML)</meeting>
		<imprint>
			<date type="published" when="2011">2011</date>
			<biblScope unit="page" from="265" to="272" />
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b11">
	<analytic>
		<title level="a" type="main">A holistic multimedia system for gastrointestinal tract disease detection</title>
		<author>
			<persName><forename type="first">Konstantin</forename><surname>Pogorelov</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Sigrun</forename><surname>Losada Eskeland</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Thomas</forename><surname>De Lange</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Carsten</forename><surname>Griwodz</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Kristin</forename><forename type="middle">Ranheim</forename><surname>Randel</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Håkon</forename><surname>Kvale Stensland</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Duc-Tien</forename><surname>Dang-Nguyen</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Concetto</forename><surname>Spampinato</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Dag</forename><surname>Johansen</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Michael</forename><surname>Riegler</surname></persName>
		</author>
		<author>
			<persName><surname>Others</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="m">Proceedings of the 8th ACM Conference on Multimedia Systems (MMSys)</title>
				<meeting>the 8th ACM Conference on Multimedia Systems (MMSys)</meeting>
		<imprint>
			<date type="published" when="2017">2017</date>
			<biblScope unit="page" from="112" to="123" />
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b12">
	<analytic>
		<title level="a" type="main">Kvasir: A Multi-Class Image Dataset for Computer Aided Gastrointestinal Disease Detection</title>
		<author>
			<persName><forename type="first">Konstantin</forename><surname>Pogorelov</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Kristin</forename><forename type="middle">Ranheim</forename><surname>Randel</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Carsten</forename><surname>Griwodz</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Sigrun</forename><surname>Losada Eskeland</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Thomas</forename><surname>De Lange</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Dag</forename><surname>Johansen</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Concetto</forename><surname>Spampinato</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Duc-Tien</forename><surname>Dang-Nguyen</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Mathias</forename><surname>Lux</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Peter</forename><forename type="middle">Thelin</forename><surname>Schmidt</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Michael</forename><surname>Riegler</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Pål</forename><surname>Halvorsen</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="m">Proceedings of the 8th ACM on Multimedia Systems Conference (MMSys)</title>
				<meeting>the 8th ACM on Multimedia Systems Conference (MMSys)</meeting>
		<imprint>
			<date type="published" when="2017">2017</date>
			<biblScope unit="page" from="164" to="169" />
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b13">
	<analytic>
		<title level="a" type="main">Efficient disease detection in gastrointestinal videos -global features versus neural networks</title>
		<author>
			<persName><forename type="first">Konstantin</forename><surname>Pogorelov</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Michael</forename><surname>Riegler</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Sigrun</forename><surname>Losada Eskeland</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Thomas</forename><surname>De Lange</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Dag</forename><surname>Johansen</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Carsten</forename><surname>Griwodz</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Peter</forename><forename type="middle">Thelin</forename><surname>Schmidt</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Pål</forename><surname>Halvorsen</surname></persName>
		</author>
		<idno type="DOI">10.1007/s11042-017-4989-y</idno>
		<ptr target="https://doi.org/10.1007/s11042-017-4989-y" />
	</analytic>
	<monogr>
		<title level="j">Multimedia Tools and Applications</title>
		<imprint>
			<biblScope unit="page" from="1" to="33" />
			<date type="published" when="2017">2017. 2017</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b14">
	<analytic>
		<title level="a" type="main">Multimedia and Medicine: Teammates for better disease detection and survival</title>
		<author>
			<persName><forename type="first">Michael</forename><surname>Riegler</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Mathias</forename><surname>Lux</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Carsten</forename><surname>Gridwodz</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Concetto</forename><surname>Spampinato</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Sigrun</forename><forename type="middle">L</forename><surname>Thomas De Lange</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Konstantin</forename><surname>Eskeland</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Wallapak</forename><surname>Pogorelov</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Peter</forename><forename type="middle">T</forename><surname>Tavanapong</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Cathal</forename><surname>Schmidt</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Dag</forename><surname>Gurrin</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Håvard</forename><surname>Johansen</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Pål</forename><surname>Johansen</surname></persName>
		</author>
		<author>
			<persName><surname>Halvorsen</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="m">Proceedings of the 2016 ACM Multimedia Conference (ACM MM)</title>
				<meeting>the 2016 ACM Multimedia Conference (ACM MM)</meeting>
		<imprint>
			<date type="published" when="2016">2016</date>
			<biblScope unit="page" from="968" to="977" />
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b15">
	<analytic>
		<title level="a" type="main">From Annotation to Computer Aided Diagnosis: Detailed Evaluation of a Medical Multimedia System</title>
		<author>
			<persName><forename type="first">Michael</forename><surname>Riegler</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Konstantin</forename><surname>Pogorelov</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Sigrun</forename><surname>Losada Eskeland</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Peter</forename><forename type="middle">Thelin</forename><surname>Schmidt</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Zeno</forename><surname>Albisser</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Dag</forename><surname>Johansen</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Carsten</forename><surname>Griwodz</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Pål</forename><surname>Halvorsen</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Thomas</forename><surname>De Lange</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="j">Transactions on Multimedia Computing, Communications and Applications</title>
		<imprint>
			<biblScope unit="volume">9</biblScope>
			<biblScope unit="page">4</biblScope>
			<date type="published" when="2017">2017. 2017</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b16">
	<analytic>
		<title level="a" type="main">EIR -Efficient Computer Aided Diagnosis Framework for Gastrointestinal endoscopies</title>
		<author>
			<persName><forename type="first">Michael</forename><surname>Riegler</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Konstantin</forename><surname>Pogorelov</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Pål</forename><surname>Halvorsen</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Carsten</forename><surname>Thomas De Lange</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Peter</forename><forename type="middle">Thelin</forename><surname>Griwodz</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Sigrun</forename><surname>Schmidt</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Dag</forename><surname>Losada Eskeland</surname></persName>
		</author>
		<author>
			<persName><surname>Johansen</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="m">Proceedings of the 14th International Workshop on Content-based Multimedia Indexing (CBMI)</title>
				<meeting>the 14th International Workshop on Content-based Multimedia Indexing (CBMI)</meeting>
		<imprint>
			<date type="published" when="2016">2016</date>
			<biblScope unit="page" from="1" to="6" />
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b17">
	<analytic>
		<title level="a" type="main">Multimedia for Medicine: The Medico Task at MediaEval</title>
		<author>
			<persName><forename type="first">Michael</forename><surname>Riegler</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Konstantin</forename><surname>Pogorelov</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Pål</forename><surname>Halvorsen</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Kristin</forename><forename type="middle">Ranheim</forename><surname>Randel</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Sigrun</forename><surname>Losada Eskeland</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Duc-Tien</forename><surname>Dang-Nguyen</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Mathias</forename><surname>Lux</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Carsten</forename><surname>Griwodz</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Concetto</forename><surname>Spampinato</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Thomas</forename><surname>De Lange</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="m">Proceedings of the 2017 MediaEval Benchmarking Initiative for Multimedia Evaluation</title>
				<meeting>the 2017 MediaEval Benchmarking Initiative for Multimedia Evaluation</meeting>
		<imprint>
			<date type="published" when="2017">2017. 2017</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b18">
	<monogr>
		<title level="m" type="main">Rethinking the inception architecture for computer vision</title>
		<author>
			<persName><forename type="first">Christian</forename><surname>Szegedy</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Vincent</forename><surname>Vanhoucke</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Sergey</forename><surname>Ioffe</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Jonathon</forename><surname>Shlens</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Zbigniew</forename><surname>Wojna</surname></persName>
		</author>
		<idno type="arXiv">arXiv:1512.00567</idno>
		<imprint>
			<date type="published" when="2015">2015. 2015</date>
		</imprint>
	</monogr>
	<note type="report_type">arXiv preprint</note>
</biblStruct>

<biblStruct xml:id="b19">
	<analytic>
		<title level="a" type="main">Computer-aided detection of retroflexion in colonoscopy</title>
		<author>
			<persName><forename type="first">Yi</forename><surname>Wang</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Wallapak</forename><surname>Tavanapong</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Johnny</forename><surname>Wong</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Junghwan</forename><surname>Oh</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Piet C De</forename><surname>Groen</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="m">Proceeding of the 24th International Symposium on Computer-Based Medical Systems (CBMS)</title>
				<meeting>eeding of the 24th International Symposium on Computer-Based Medical Systems (CBMS)</meeting>
		<imprint>
			<date type="published" when="2011">2011</date>
			<biblScope unit="page" from="1" to="6" />
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b20">
	<analytic>
		<title level="a" type="main">Polyp-alert: Near real-time feedback during colonoscopy</title>
		<author>
			<persName><forename type="first">Yi</forename><surname>Wang</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Wallapak</forename><surname>Tavanapong</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Johnny</forename><surname>Wong</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Jung</forename><surname>Hwan Oh</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Piet C De</forename><surname>Groen</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="j">Computer methods and programs in biomedicine</title>
		<imprint>
			<biblScope unit="volume">120</biblScope>
			<biblScope unit="issue">3</biblScope>
			<biblScope unit="page" from="164" to="179" />
			<date type="published" when="2015">2015. 2015</date>
		</imprint>
	</monogr>
</biblStruct>

				</listBibl>
			</div>
		</back>
	</text>
</TEI>
