<?xml version="1.0" encoding="UTF-8"?>
<TEI xml:space="preserve" xmlns="http://www.tei-c.org/ns/1.0" 
xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" 
xsi:schemaLocation="http://www.tei-c.org/ns/1.0 https://raw.githubusercontent.com/kermitt2/grobid/master/grobid-home/schemas/xsd/Grobid.xsd"
 xmlns:xlink="http://www.w3.org/1999/xlink">
	<teiHeader xml:lang="en">
		<fileDesc>
			<titleStmt>
				<title level="a" type="main">Supporting Ontology-Based Standardization of Biomedical Metadata in the CEDAR Workbench</title>
			</titleStmt>
			<publicationStmt>
				<publisher/>
				<availability status="unknown"><licence/></availability>
			</publicationStmt>
			<sourceDesc>
				<biblStruct>
					<analytic>
						<author>
							<persName><forename type="first">Marcos</forename><surname>Martínez-Romero</surname></persName>
							<affiliation key="aff0">
								<orgName type="department">Center for Biomedical Informatics Research</orgName>
								<orgName type="institution">Stanford University</orgName>
								<address>
									<addrLine>1265 Welch Rd</addrLine>
									<postCode>94305</postCode>
									<settlement>Stanford</settlement>
									<region>CA</region>
									<country key="US">USA</country>
								</address>
							</affiliation>
						</author>
						<author>
							<persName><forename type="first">Martin</forename><forename type="middle">J</forename><surname>O'connor</surname></persName>
							<affiliation key="aff0">
								<orgName type="department">Center for Biomedical Informatics Research</orgName>
								<orgName type="institution">Stanford University</orgName>
								<address>
									<addrLine>1265 Welch Rd</addrLine>
									<postCode>94305</postCode>
									<settlement>Stanford</settlement>
									<region>CA</region>
									<country key="US">USA</country>
								</address>
							</affiliation>
						</author>
						<author>
							<persName><forename type="first">Michael</forename><surname>Dorf</surname></persName>
							<affiliation key="aff0">
								<orgName type="department">Center for Biomedical Informatics Research</orgName>
								<orgName type="institution">Stanford University</orgName>
								<address>
									<addrLine>1265 Welch Rd</addrLine>
									<postCode>94305</postCode>
									<settlement>Stanford</settlement>
									<region>CA</region>
									<country key="US">USA</country>
								</address>
							</affiliation>
						</author>
						<author>
							<persName><forename type="first">Jennifer</forename><surname>Vendetti</surname></persName>
							<affiliation key="aff0">
								<orgName type="department">Center for Biomedical Informatics Research</orgName>
								<orgName type="institution">Stanford University</orgName>
								<address>
									<addrLine>1265 Welch Rd</addrLine>
									<postCode>94305</postCode>
									<settlement>Stanford</settlement>
									<region>CA</region>
									<country key="US">USA</country>
								</address>
							</affiliation>
						</author>
						<author>
							<persName><forename type="first">Debra</forename><surname>Willrett</surname></persName>
							<affiliation key="aff0">
								<orgName type="department">Center for Biomedical Informatics Research</orgName>
								<orgName type="institution">Stanford University</orgName>
								<address>
									<addrLine>1265 Welch Rd</addrLine>
									<postCode>94305</postCode>
									<settlement>Stanford</settlement>
									<region>CA</region>
									<country key="US">USA</country>
								</address>
							</affiliation>
						</author>
						<author>
							<persName><forename type="first">Attila</forename><forename type="middle">L</forename><surname>Egyedi</surname></persName>
							<affiliation key="aff0">
								<orgName type="department">Center for Biomedical Informatics Research</orgName>
								<orgName type="institution">Stanford University</orgName>
								<address>
									<addrLine>1265 Welch Rd</addrLine>
									<postCode>94305</postCode>
									<settlement>Stanford</settlement>
									<region>CA</region>
									<country key="US">USA</country>
								</address>
							</affiliation>
						</author>
						<author>
							<persName><forename type="first">John</forename><surname>Graybeal</surname></persName>
							<affiliation key="aff0">
								<orgName type="department">Center for Biomedical Informatics Research</orgName>
								<orgName type="institution">Stanford University</orgName>
								<address>
									<addrLine>1265 Welch Rd</addrLine>
									<postCode>94305</postCode>
									<settlement>Stanford</settlement>
									<region>CA</region>
									<country key="US">USA</country>
								</address>
							</affiliation>
						</author>
						<author>
							<persName><forename type="first">Mark</forename><forename type="middle">A</forename><surname>Musen</surname></persName>
							<affiliation key="aff0">
								<orgName type="department">Center for Biomedical Informatics Research</orgName>
								<orgName type="institution">Stanford University</orgName>
								<address>
									<addrLine>1265 Welch Rd</addrLine>
									<postCode>94305</postCode>
									<settlement>Stanford</settlement>
									<region>CA</region>
									<country key="US">USA</country>
								</address>
							</affiliation>
						</author>
						<title level="a" type="main">Supporting Ontology-Based Standardization of Biomedical Metadata in the CEDAR Workbench</title>
					</analytic>
					<monogr>
						<imprint>
							<date/>
						</imprint>
					</monogr>
					<idno type="MD5">BB7775C0561D94F37D57C060C12D47DE</idno>
				</biblStruct>
			</sourceDesc>
		</fileDesc>
		<encodingDesc>
			<appInfo>
				<application version="0.7.2" ident="GROBID" when="2023-03-25T02:13+0000">
					<desc>GROBID - A machine learning software for extracting information from scholarly documents</desc>
					<ref target="https://github.com/kermitt2/grobid"/>
				</application>
			</appInfo>
		</encodingDesc>
		<profileDesc>
			<abstract>
<div xmlns="http://www.tei-c.org/ns/1.0"><p>The availability of associated descriptive metadata for scientific datasets is important for discovering and reproducing scientific experiments. The use of ontologies has become a key focus for increasing the quality of these metadata. Despite the wide availability of biomedical ontologies, scientists wishing to use these ontologies when developing metadata descriptions face a number of practical difficulties. A core difficulty is the lack of tools for developing ontology-linked metadata specifications that can be published and shared. Additional difficulties include the lack of support for defining new terms in cases when no existing terms are found and for creating custom term collections to meet domain-specific needs.</p><p>To address these problems, we developed tools that allow scientists to find terms in ontologies for annotating their data and to dynamically create new terms and value sets. This work has been incorporated into a Web-based platform called the CEDAR Workbench. The resulting integrated environment presents a set of highly interactive interfaces for creating and publishing ontology-rich metadata specifications.</p></div>
			</abstract>
		</profileDesc>
	</teiHeader>
	<text xml:lang="en">
		<body>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="1">INTRODUCTION</head><p>In biomedicine, high-quality, standardized metadata are crucial for facilitating the discovery of scientific datasets and reproducibility of the corresponding experiments. In the last few years, the biomedical community has driven the development of metadata standards and guidelines for a variety of experiment types. Scientists use these specifications to inform their annotation of experimental results <ref type="bibr" target="#b14">(Tenenbaum, Sansone, &amp; Haendel, 2014)</ref>. One of the earliest examples is the MIAME standard <ref type="bibr" target="#b0">(Brazma et al., 2001)</ref>, which is used to describe metadata about microarray experiments. These standards and guidelines underpin metadata submissions to many public metadata repositories <ref type="bibr" target="#b3">(Edgar, Domrachev, &amp; Lash, 2002)</ref>. The BioSharing resource <ref type="bibr" target="#b6">(McQuilton et al., 2016)</ref> catalogs hundreds of these standardization efforts.</p><p>Despite the growing use of standards for defining metadata and the wide availability of biomedical ontologies, metadata submitted to public repositories rarely use standard terms <ref type="bibr" target="#b1">(Bui &amp; Park, 2006)</ref>. As a result, finding or reusing the metadata is a challenge and understanding the underlying experiments can be extremely hard, often requiring significant post-processing of metadata to extract useful content.</p><p>A key problem is that scientists face considerable practical barriers when attempting to link their metadata to ontology terms. Submission mechanisms for biomedical repositories are typically based on spreadsheets, with a variety of ad hoc formats that rarely support inclusion of ontology-based annotations. Even in cases where such annotations can be entered, scientists have no easy way to find and use terms from ontologies to include in their metadata submissions. Other difficulties include poor support for on-the-fly term creation when the necessary terms are not found and for creating custom lists of terms to meet domain-specific needs.</p><p>A variety of tools have been developed to address the challenge of metadata quality. Foremost among these are the ISA Tools <ref type="bibr" target="#b12">(Rocca-Serra et al., 2010)</ref>, which allow curators to create spreadsheet-based submissions for metadata repositories. LinkedISA provides a means to interoperate with Linked Open Data, effectively adding controlled term linkage to templates (González-Beltrán, Maguire, Sansone, &amp; Rocca-Serra, 2014). A similar spreadsheet-based tool called RightField <ref type="bibr" target="#b16">(Wolstencroft et al., 2011)</ref> provides a mechanism for embedding ontology annotation capabilities in Excel or Open Office spreadsheets using ontologies from the BioPortal repository <ref type="bibr" target="#b9">(Noy et al., 2009)</ref>. Annotare <ref type="bibr" target="#b13">(Shankar et al., 2010)</ref>, which is used to submit experimental data to the Ar-rayExpress metadata repository <ref type="bibr" target="#b11">(Parkinson et al., 2005)</ref>, also supports ontology-based suggestions. These tools address specific issues of metadata quality but they do not provide an integrated environment that can support the entire metadata specification and submission process for widely used biomedical repositories.</p><p>The Center for Expanded Data Annotation and Retrieval (CEDAR)<ref type="foot" target="#foot_0">1</ref> is developing a computational ecosystem to overcome the barriers to creating high-quality metadata in biomedicine <ref type="bibr" target="#b7">(Musen et al., 2015)</ref>. CEDAR provides a suite of highly sophisticated tools designed to make the authoring of metadata as natural as possible, while also using ontologies to enrich the generated descriptions with standard terms.</p><p>In this paper, we describe the main features CEDAR developed to make it possible to easily construct Web-based metadata-acquisition forms, enrich those forms with ontology concepts, and then fill out the forms to create ontologyannotated descriptions of scientific experiments.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="2">BACKGROUND</head><p>The CEDAR Workbench<ref type="foot" target="#foot_1">2</ref> is a suite of Web-based tools and REST APIs centered on the use of highly-modular metadata-acquisition forms called metadata templates (or simply templates). These templates define the data attributestermed template fields or fields-needed to describe biomedical experiments. For example, an experiment template may have an organism field containing the name of the organism being studied by the experiment (e.g., Homo sapiens). The templates may specify lists of permissible values for template fields. The central goal when designing a template is to enable the capture of sufficiently precise and complete metadata about experimental data to facilitate data discovery, interpretation, and reuse.</p><p>The CEDAR Workbench provides three core components that form a metadata construction pipeline (Fig. <ref type="figure" target="#fig_0">1):</ref> (1) a Template Designer, which supports interactive template creation; (2) a Metadata Editor, which allows end-users to fill in templates with metadata; and (3) a Metadata Repository for storing both templates and the metadata created using those templates. The CEDAR Workbench also allows scientists to upload the metadata created to public biomedical repositories.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="2.1">Template Designer and Metadata Editor</head><p>In the Template Designer, template authors assemble templates from one or more input fields. There are numerous field types available to template authors (e.g., text, paragraph, e-mail, numeric, and date). Users can also define reusable groups of fields, called elements. For example, the fields that describe a publication (e.g., authors, title, year, publication type, etc.) could be grouped together to form a publication element, which can then be reused in multiple templates. After a template is created, the Metadata Editor can be used to automatically generate a forms-based acquisition interface for entering metadata for that template. Scientists entering metadata using the Metadata Editor are prompted in real time with drop-down lists, auto-completion suggestions, and verification hints, significantly reducing their error rate while speeding metadata entry and repair. These prompts are driven by the value constraints specified in templates.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="2.2">Metadata Repository</head><p>Templates and metadata produced by the Workbench are stored in CEDAR's metadata repository. CEDAR incorporates a standardized model of templates and metadata, together with Web-based services to store, search, and share these resources <ref type="bibr" target="#b10">(O'Connor et al., 2016)</ref>. This model is based on the JSON Schema and JSON-LD specifications. It allows users to publish their metadata as both JSON-LD and RDF, thus facilitating interoperation with Linked Open Data.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="2.3">Support for ontology-based metadata</head><p>The CEDAR tools provide mechanisms for structurally describing templates and publishing metadata created using those templates in an open format. To increase the metadata quality further, we offer the ability to enrich these descriptions with controlled terms from ontologies. We extended the Template Designer and Metadata Editor to let users specify semantic content for templates and to easily enter semantically precise terms in their metadata. These extensions, can help to improve metadata adherence to the FAIR data principles <ref type="bibr" target="#b15">(Wilkinson et al., 2016)</ref> and interoperability with Linked Open Data. </p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="3">IMPLEMENTATION</head><p>We have enhanced the CEDAR Workbench to provide the ability to link ontology terms selected from BioPortal to biomedical metadata. BioPortal, developed by the National Center for Biomedical Ontology (NCBO) <ref type="bibr" target="#b8">(Musen et al., 2012)</ref>, is a popular platform for hosting and sharing biomedical ontologies. It provides access to more than 550 ontologies, and contains over 8 million classes and 64,000 properties. The BioPortal API provides a rich set of operations to access and use ontologies. We extended this API to provide the fine grained, highly interactive class and property lookup features needed by CEDAR's term search and selection features. To facilitate general use of these features, we encapsulated BioPortal's API as a CEDAR service and made it available as a public REST endpoint. 3 We now describe these extensions. 3 The REST endpoints that provide ontology-based services to the CEDAR Workbench are documented at https://terminology.metadatacenter.net/api.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="3.1">Class and Property Search</head><p>CEDAR allows template authors to search for ontology terms to annotate their templates, that is, to add type and property assertions to template elements and fields using ontology classes and properties. Classes and object, data, and annotation properties for performing these annotations can be selected from terms supplied by BioPortal. Fig. <ref type="figure" target="#fig_1">2</ref> shows a screenshot of the ontology lookup user interface of the CEDAR Workbench. In the example shown, the template author entered the search term publication and then selected the Publication class from the National Cancer Institute Thesaurus (NCIT). The interface shows detailed information both for the selected class and the associated ontology, as well as for the position of the class in the class tree of NCIT.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="3.2">Value Set creation</head><p>A value set is a list of possible values for a specific purpose. In the CEDAR Workbench, value sets are a useful mechanism to define pick lists of permissible values for template fields. CEDAR works in conjunction with BioPortal to allow template authors to dynamically create value sets containing the terms in these pick lists. Value sets can contain classes from any combination of BioPortal ontologies. Upon creation, a value set is immediately assigned a unique, provisional IRI. The CEDAR Workbench supports the creation, retrieval, update, and deletion of these value sets.</p><p>For example, suppose that the template author wishes to constrain the values of a Study type field to three specific types of longitudinal studies (prospective study, retrospective study, and hybrid study). The Clinical Trials Ontology (CTO) is a good source of these types since it contains 375 study type classes (represented as descendants of the Study type class). Instead of selecting all these types, the template author can create a value set containing only the desired types. Fig. <ref type="figure" target="#fig_3">3</ref> shows a screenshot of value set creation features for this example presented in the Template Designer. Here, the user creates a value set named Longitudinal study types with three terms selected from CTO.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="3.3">Class creation</head><p>Despite the vast number of classes and properties available in biomedical repositories, ontologies often do not contain the exact term a user requires. To address this problem, CEDAR allows users to dynamically define new classes and immediately to use them. When generating a new class, users can optionally link it to one or several existing classes by means of the RDFS subclassOf relationship and SKOS relationships <ref type="bibr">(closeMatch, exactMatch, broadMatch, nar-rowMatch, relatedMatch)</ref>. Upon creation, a class is immediately assigned a unique, provisional IRI.</p><p>For example, suppose that a user needs to use the anatomical term adductor dorsalis. This term is not available in any BioPortal ontology, though the adductor muscle class in the UBERON ontology is a close conceptual match. In this case, the user decides to create an adductor dorsalis class via the CEDAR Workbench and indicate that the new term is a subclass of the adductor muscle UBERON class. Fig. <ref type="figure" target="#fig_2">4</ref> shows the class creation interface for this example. The adductor dorsalis class is stored in BioPortal as a CEDAR provisional class and is immediately available to all CEDAR users. Eventually, maintainers of UBERON may decide to incorporate the adductor dorsalis class to the ontology or may decide to reject it. If the class is added to UBERON, the permanent identifier for the class will be stored as part of the information of the provisional class. If adductor dorsalis is not included in the next version of the ontology, the subclassOf link will removed, but the class will still be valid in CEDAR.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="3.4">Value Constraints</head><p>With the above functionality, the system can limit the possible values of a template field to a predefined sets of ontology terms or value sets. Some template authors may need to define value constraints that go beyond predefined term  lists. For example, a user may wish to constrain the values of a disorder template field to all subclasses in three specific branches of the DOID ontology rooted at the terms cognitive disorder, sleep disorder, and dissociative disorder.</p><p>To deal with use cases such as this one, the system effectively allows template designers to constrain field values to any combination of (1) all classes in an ontology branch, (2) all classes from a specific ontology, (3) new or existing classes, and (4) new or existing value sets. Multiple constraint types can be specified for the same field.</p><p>Users populating templates using the Metadata Editor are presented in real time with a list of choices driven by these value constraints. Fig. <ref type="figure" target="#fig_4">5</ref> shows an example of choices presented for a disorder field that has had its values constrained to come from the three DOID ontology disease branches described in the earlier example. All terms from these three branches are combined in real time and presented as a single list.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="4">EVALUATION</head><p>CEDAR is working with several biomedical communities to perform an initial evaluation of our ontology-based annotation functionality. This evaluation is being carried out in the context of using CEDAR to develop metadata submission pipelines for three biomedical groups. These groups are (1) the LINCS Consortium,<ref type="foot" target="#foot_2">4</ref> which is developing a catalog of cellular signatures; (2) ImmPort,<ref type="foot" target="#foot_3">5</ref> a portal for immunologyrelated datasets; and (3) the AIRR Community,<ref type="foot" target="#foot_4">6</ref> which is developing standards for describing datasets acquired using advanced sequencing technologies. In all three cases, the workflow is: (1) design metadata templates for each group's relevant datasets; (2) enhance these templates with ontology-based annotations; (3) scientists populate the templates with metadata describing their experiments; and (4) submit the generated metadata to the appropriate repositories.</p><p>Working together with the LINCS, ImmPort, and AIRR teams we first used the Template Designer tool to develop a basic version of the templates required by each group. We then annotated those templates using ontologies. Each project required a slightly different annotation workflow.</p><p>To annotate ImmPort data, members of the Human Immunology Project Consortium (HIPC)<ref type="foot" target="#foot_5">7</ref> performed an analysis of all fields and value constraints in the ImmPort system to identify appropriate controlled-term linkages. They used the Template Designer to comprehensively annotate the ImmPort templates with the controlled terms identified. They also specified value constraints for controlled-value fields to ensure that the generated acquisition interfaces restricted the acquisition of metadata to appropriate terms. In the cases where custom value sets were required for fields, CEDAR used BioPortal's value set features to let users define these resources. The process for the AIRR community was slightly different, since that community already incorporated ontology-based annotations as an integral part of their metadata-specification process. All these annotations were available in spreadsheet format and the only required step was to formalize them using the Template Designer. Finally, the LINCS team identified and encoded controlled term linkage for an initial subset of their templates.</p><p>The system successfully represented all required controlled-term annotations for the three groups. We are now completing the metadata submission pipeline for each group. For the LINCS and ImmPort projects, we are submitting the generated metadata into their community domain repositories. The AIRR submission process involves submitting the generated metadata to the public NCBI Bi-oSample repository. <ref type="foot" target="#foot_6">8</ref> We have completed prototype LINCS and NCBI pipeline submissions and will evaluate the speed, reliability, and completeness of the submission process before releasing each submission pipelines for public use.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="5">DISCUSSION</head><p>Despite the growing number of ontologies in biomedicine, scientists rarely select standard terms for describing their experiments. Consequently, finding scientific datasets and understanding the corresponding experiments can be extremely hard and time-consuming, and often requires considerable post-processing of metadata to extract relevant content. A fundamental problem is the lack of convenient and openly available tools for linking metadata to ontologies. It takes time and effort to create well-specified metadata and scientists often view the task of metadata authoring as a burden that does not bring them any direct benefit. The CEDAR Workbench allows template authors to make extensive use of ontologies from BioPortal to add type and property assertions to template fields and to constrain the values of fields to ontology terms. Once those templates are created, metadata authors can easily use them to generate rich metadata without needing any understanding of ontology structures. The features described in this paper represent a major step toward overcoming the barriers to the creation of high-quality metadata in biomedicine. Through our approach, we hope to make it easier, and even fun, for scientists to annotate their experimental data in ways that ensure their value to the scientific community.</p><p>We are studying a variety of technologies to further ease the work of entering metadata. We developed a recommendation service that identifies common patterns in the metadata repository and that generates real-time suggestions for filling out templates <ref type="bibr" target="#b5">(Martínez-Romero et al., 2017)</ref>. This service is the first of a planned set of intelligent authoring components that will also include the extraction and semantic annotation of templates and metadata from semistructured sources, such as spreadsheets, scientific articles, and Web pages.</p><p>We also plan to develop an ontology enrichment pipeline in which ontology owners receive term requests based on the new classes created from CEDAR, which could be used to refine and extend their ontologies. The TermGenie <ref type="bibr" target="#b2">(Dietze et al., 2014)</ref> tool for requesting new Gene Ontology classes provides a model for the planned functionality.</p></div><figure xmlns="http://www.tei-c.org/ns/1.0" xml:id="fig_0"><head>Fig. 1 .</head><label>1</label><figDesc>Fig. 1. An overview of CEDAR's metadata authoring workflow. Template authors use the Template Designer tool to create metadata templates. The Metadata Editor uses these templates to generate a graphical interface to acquire metadata from scientists. Acquired metadata are saved in CEDAR's Metadata Repository.</figDesc><graphic coords="2,63.12,63.84,485.76,221.52" type="bitmap" /></figure>
<figure xmlns="http://www.tei-c.org/ns/1.0" xml:id="fig_1"><head>Fig. 2 .</head><label>2</label><figDesc>Fig. 2. Screenshot of CEDAR Template Designer's ontology lookup interface. Here, the user entered the search term publication and selected the class Publication from the National Cancer Institute Thesaurus (NCIT). The location of the selected class in the class tree is presented, as well as class and ontology details.</figDesc><graphic coords="3,59.76,80.16,490.56,326.88" type="bitmap" /></figure>
<figure xmlns="http://www.tei-c.org/ns/1.0" xml:id="fig_2"><head>Fig. 4 .</head><label>4</label><figDesc>Fig. 4. Example of class creation in the CEDAR Workbench. The user creates the adductor dorsalis class and links it to the adductor muscle class in the UBERON ontology via the subclassOf relation.</figDesc><graphic coords="4,323.04,386.64,235.68,291.12" type="bitmap" /></figure>
<figure xmlns="http://www.tei-c.org/ns/1.0" xml:id="fig_3"><head>Fig. 3 .</head><label>3</label><figDesc>Fig. 3. Screenshot showing an example of value set creation. The user is building a Longitudinal study types value set with terms from the Clinical Trials Ontology (shown as CTO).</figDesc><graphic coords="4,61.20,77.28,232.56,295.44" type="bitmap" /></figure>
<figure xmlns="http://www.tei-c.org/ns/1.0" xml:id="fig_4"><head>Fig. 5 .</head><label>5</label><figDesc>Fig. 5. Screenshot of the Metadata Editor that shows the possible values of a Disorder field in a Study template. This field has been constrained to accept values from the branches of the DOID ontology with roots cognitive disorder, sleep disorder, and dissociative disorder.</figDesc><graphic coords="5,46.56,301.20,258.96,208.80" type="bitmap" /></figure>
			<note xmlns="http://www.tei-c.org/ns/1.0" place="foot" n="1" xml:id="foot_0">https://metadatacenter.org/</note>
			<note xmlns="http://www.tei-c.org/ns/1.0" place="foot" n="2" xml:id="foot_1">https://cedar.metadatacenter.net</note>
			<note xmlns="http://www.tei-c.org/ns/1.0" place="foot" n="4" xml:id="foot_2">http://www.lincsproject.org</note>
			<note xmlns="http://www.tei-c.org/ns/1.0" place="foot" n="5" xml:id="foot_3">http://www.immport.org</note>
			<note xmlns="http://www.tei-c.org/ns/1.0" place="foot" n="6" xml:id="foot_4">http://airr-community.org</note>
			<note xmlns="http://www.tei-c.org/ns/1.0" place="foot" n="7" xml:id="foot_5">https://www.immuneprofiling.org/hipc</note>
			<note xmlns="http://www.tei-c.org/ns/1.0" place="foot" n="8" xml:id="foot_6">https://www.ncbi.nlm.nih.gov/biosample</note>
		</body>
		<back>

			<div type="acknowledgement">
<div xmlns="http://www.tei-c.org/ns/1.0"><head>ACKNOWLEDGMENTS</head><p>CEDAR is supported by the National Institutes of Health through an NIH Big Data to Knowledge program under grant 1U54AI117925. NCBO is supported by the NIH Common Fund under grant U54HG004028. The CEDAR Workbench is available at https://cedar.metadatacenter.net, and on GitHub (https://github.com/metadatacenter).</p></div>
			</div>

			<div type="references">

				<listBibl>

<biblStruct xml:id="b0">
	<analytic>
		<title level="a" type="main">Minimum information about a microarray experiment (MIAME)-toward standards for microarray data</title>
		<author>
			<persName><forename type="first">A</forename><surname>Brazma</surname></persName>
		</author>
		<author>
			<persName><forename type="first">P</forename><surname>Hingamp</surname></persName>
		</author>
		<author>
			<persName><forename type="first">J</forename><surname>Quackenbush</surname></persName>
		</author>
		<author>
			<persName><forename type="first">G</forename><surname>Sherlock</surname></persName>
		</author>
		<author>
			<persName><forename type="first">P</forename><surname>Spellman</surname></persName>
		</author>
		<author>
			<persName><forename type="first">C</forename><surname>Stoeckert</surname></persName>
		</author>
		<author>
			<persName><forename type="first">J</forename><surname>Aach</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="j">Nat Genet</title>
		<imprint>
			<biblScope unit="volume">29</biblScope>
			<biblScope unit="page" from="365" to="371" />
			<date type="published" when="2001">2001</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b1">
	<analytic>
		<title level="a" type="main">An assessment of metadata quality: A case study of the National Science Digital Library Metadata Repository</title>
		<author>
			<persName><forename type="first">Y</forename><surname>Bui</surname></persName>
		</author>
		<author>
			<persName><forename type="first">J.-R</forename><surname>Park</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="m">Proceedings of CAIS/ACSI</title>
				<meeting>CAIS/ACSI</meeting>
		<imprint>
			<date type="published" when="2006">2006. 2006</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b2">
	<analytic>
		<title level="a" type="main">TermGenie -a webapplication for pattern-based ontology class generation</title>
		<author>
			<persName><forename type="first">H</forename><surname>Dietze</surname></persName>
		</author>
		<author>
			<persName><forename type="first">T</forename><forename type="middle">Z</forename><surname>Berardini</surname></persName>
		</author>
		<author>
			<persName><forename type="first">R</forename><forename type="middle">E</forename><surname>Foulger</surname></persName>
		</author>
		<author>
			<persName><forename type="first">D</forename><forename type="middle">P</forename><surname>Hill</surname></persName>
		</author>
		<author>
			<persName><forename type="first">J</forename><surname>Lomax</surname></persName>
		</author>
		<author>
			<persName><forename type="first">D</forename><surname>Osumi-Sutherland</surname></persName>
		</author>
		<author>
			<persName><forename type="first">P</forename><surname>Roncaglia</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="j">Journal of Biomedical Semantics</title>
		<imprint>
			<biblScope unit="volume">5</biblScope>
			<biblScope unit="issue">1</biblScope>
			<biblScope unit="page">48</biblScope>
			<date type="published" when="2014">2014</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b3">
	<analytic>
		<title level="a" type="main">Gene Expression Omnibus: NCBI gene expression and hybridization array data repository</title>
		<author>
			<persName><forename type="first">R</forename><surname>Edgar</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><surname>Domrachev</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A</forename><forename type="middle">E</forename><surname>Lash</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="j">Nucleic Acids Res</title>
		<imprint>
			<biblScope unit="volume">30</biblScope>
			<biblScope unit="issue">1</biblScope>
			<biblScope unit="page" from="207" to="210" />
			<date type="published" when="2002">2002</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b4">
	<analytic>
		<title level="a" type="main">linkedISA: semantic representation of ISA-Tab experimental metadata</title>
		<author>
			<persName><forename type="first">A</forename><surname>González-Beltrán</surname></persName>
		</author>
		<author>
			<persName><forename type="first">E</forename><surname>Maguire</surname></persName>
		</author>
		<author>
			<persName><forename type="first">S.-A</forename><surname>Sansone</surname></persName>
		</author>
		<author>
			<persName><forename type="first">P</forename><surname>Rocca-Serra</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="j">BMC bioinformatics</title>
		<imprint>
			<biblScope unit="volume">15</biblScope>
			<biblScope unit="page">S4</biblScope>
			<date type="published" when="2014">2014</date>
		</imprint>
	</monogr>
	<note>Suppl 1</note>
</biblStruct>

<biblStruct xml:id="b5">
	<analytic>
		<title level="a" type="main">Fast and accurate metadata authoring using ontology-based recommendations</title>
		<author>
			<persName><forename type="first">M</forename><surname>Martínez-Romero</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><forename type="middle">J</forename><surname>O'connor</surname></persName>
		</author>
		<author>
			<persName><forename type="first">R</forename><surname>Shankar</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><surname>Panahiazar</surname></persName>
		</author>
		<author>
			<persName><forename type="first">D</forename><surname>Willrett</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A</forename><forename type="middle">L</forename><surname>Egyedi</surname></persName>
		</author>
		<author>
			<persName><forename type="first">O</forename><surname>Gevaert</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="m">Proceedings of AMIA 2017 Annual Symposium</title>
				<meeting>AMIA 2017 Annual Symposium</meeting>
		<imprint>
			<date type="published" when="2017">2017</date>
		</imprint>
	</monogr>
	<note>to appear</note>
</biblStruct>

<biblStruct xml:id="b6">
	<monogr>
		<author>
			<persName><forename type="first">P</forename><surname>Mcquilton</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A</forename><surname>Gonzalez-Beltran</surname></persName>
		</author>
		<author>
			<persName><forename type="first">P</forename><surname>Rocca-Serra</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><surname>Thurston</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A</forename><surname>Lister</surname></persName>
		</author>
		<author>
			<persName><forename type="first">E</forename><surname>Maguire</surname></persName>
		</author>
		<author>
			<persName><forename type="first">S.-A</forename><surname>Sansone</surname></persName>
		</author>
		<title level="m">BioSharing: curated and crowd-sourced metadata standards, databases and data policies in the life sciences</title>
				<imprint>
			<date type="published" when="2016">2016. 2016</date>
		</imprint>
	</monogr>
	<note>Database: the journal of biological databases and curation</note>
</biblStruct>

<biblStruct xml:id="b7">
	<analytic>
		<title level="a" type="main">The Center for Expanded Data Annotation and Retrieval</title>
		<author>
			<persName><forename type="first">M</forename><forename type="middle">A</forename><surname>Musen</surname></persName>
		</author>
		<author>
			<persName><forename type="first">C</forename><forename type="middle">A</forename><surname>Bean</surname></persName>
		</author>
		<author>
			<persName><forename type="first">K</forename><forename type="middle">H</forename><surname>Cheung</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><surname>Dumontier</surname></persName>
		</author>
		<author>
			<persName><forename type="first">K</forename><forename type="middle">A</forename><surname>Durante</surname></persName>
		</author>
		<author>
			<persName><forename type="first">O</forename><surname>Gevaert</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A</forename><surname>Gonzalez-Beltran</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="j">Journal of the American Medical Informatics Association</title>
		<imprint>
			<biblScope unit="volume">22</biblScope>
			<biblScope unit="issue">6</biblScope>
			<biblScope unit="page" from="1148" to="1152" />
			<date type="published" when="2015">2015</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b8">
	<analytic>
		<title level="a" type="main">The National Center for Biomedical Ontology</title>
		<author>
			<persName><forename type="first">M</forename><forename type="middle">A</forename><surname>Musen</surname></persName>
		</author>
		<author>
			<persName><forename type="first">N</forename><forename type="middle">F</forename><surname>Noy</surname></persName>
		</author>
		<author>
			<persName><forename type="first">N</forename><forename type="middle">H</forename><surname>Shah</surname></persName>
		</author>
		<author>
			<persName><forename type="first">P</forename><forename type="middle">L</forename><surname>Whetzel</surname></persName>
		</author>
		<author>
			<persName><forename type="first">C</forename><forename type="middle">G</forename><surname>Chute</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M.-A</forename><surname>Story</surname></persName>
		</author>
		<author>
			<persName><forename type="first">B</forename><surname>Smith</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="j">Journal of the American Medical Informatics Association</title>
		<imprint>
			<date type="published" when="2012">2012</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b9">
	<analytic>
		<title level="a" type="main">BioPortal: ontologies and integrated data resources at the click of a mouse</title>
		<author>
			<persName><forename type="first">N</forename><forename type="middle">F</forename><surname>Noy</surname></persName>
		</author>
		<author>
			<persName><forename type="first">N</forename><forename type="middle">H</forename><surname>Shah</surname></persName>
		</author>
		<author>
			<persName><forename type="first">P</forename><forename type="middle">L</forename><surname>Whetzel</surname></persName>
		</author>
		<author>
			<persName><forename type="first">B</forename><surname>Dai</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><surname>Dorf</surname></persName>
		</author>
		<author>
			<persName><forename type="first">N</forename><surname>Griffith</surname></persName>
		</author>
		<author>
			<persName><forename type="first">C</forename><surname>Jonquet</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="j">Nucleic acids research</title>
		<imprint>
			<biblScope unit="volume">37</biblScope>
			<biblScope unit="page" from="W170" to="173" />
			<date type="published" when="2009">2009</date>
		</imprint>
	</monogr>
	<note>Web Server issue</note>
</biblStruct>

<biblStruct xml:id="b10">
	<analytic>
		<title level="a" type="main">An open repository model for acquiring knowledge about scientific experiments</title>
		<author>
			<persName><forename type="first">M</forename><forename type="middle">J</forename><surname>O'connor</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><surname>Martinez-Romero</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A</forename><forename type="middle">L</forename><surname>Egyedi</surname></persName>
		</author>
		<author>
			<persName><forename type="first">D</forename><surname>Willrett</surname></persName>
		</author>
		<author>
			<persName><forename type="first">J</forename><surname>Graybeal</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><forename type="middle">A</forename><surname>Musen</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="m">Proceedings of the 20th International Conference on Knowledge Engineering and Knowledge Management (EKAW2016)</title>
				<meeting>the 20th International Conference on Knowledge Engineering and Knowledge Management (EKAW2016)</meeting>
		<imprint>
			<date type="published" when="2016">2016</date>
			<biblScope unit="volume">10024</biblScope>
			<biblScope unit="page" from="762" to="777" />
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b11">
	<analytic>
		<title level="a" type="main">ArrayExpress--a public repository for microarray gene expression data at the EBI</title>
		<author>
			<persName><forename type="first">H</forename><surname>Parkinson</surname></persName>
		</author>
		<author>
			<persName><forename type="first">U</forename><surname>Sarkans</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><surname>Shojatalab</surname></persName>
		</author>
		<author>
			<persName><forename type="first">N</forename><surname>Abeygunawardena</surname></persName>
		</author>
		<author>
			<persName><forename type="first">S</forename><surname>Contrino</surname></persName>
		</author>
		<author>
			<persName><forename type="first">R</forename><surname>Coulson</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A</forename><surname>Farne</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="j">Nucleic acids research</title>
		<imprint>
			<biblScope unit="volume">33</biblScope>
			<biblScope unit="page" from="D553" to="D555" />
			<date type="published" when="2005">2005</date>
		</imprint>
	</monogr>
	<note>Database issue</note>
</biblStruct>

<biblStruct xml:id="b12">
	<analytic>
		<title level="a" type="main">ISA software suite: Supporting standards-compliant experimental annotation and enabling curation at the community level</title>
		<author>
			<persName><forename type="first">P</forename><surname>Rocca-Serra</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><surname>Brandizi</surname></persName>
		</author>
		<author>
			<persName><forename type="first">E</forename><surname>Maguire</surname></persName>
		</author>
		<author>
			<persName><forename type="first">N</forename><surname>Sklyar</surname></persName>
		</author>
		<author>
			<persName><forename type="first">C</forename><surname>Taylor</surname></persName>
		</author>
		<author>
			<persName><forename type="first">K</forename><surname>Begley</surname></persName>
		</author>
		<author>
			<persName><forename type="first">D</forename><surname>Field</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="j">Bioinformatics</title>
		<imprint>
			<biblScope unit="volume">26</biblScope>
			<biblScope unit="issue">18</biblScope>
			<biblScope unit="page">2354</biblScope>
			<date type="published" when="2010">2010</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b13">
	<analytic>
		<title level="a" type="main">Annotare-a tool for annotating highthroughput biomedical investigations and resulting data</title>
		<author>
			<persName><forename type="first">R</forename><surname>Shankar</surname></persName>
		</author>
		<author>
			<persName><forename type="first">H</forename><surname>Parkinson</surname></persName>
		</author>
		<author>
			<persName><forename type="first">T</forename><surname>Burdett</surname></persName>
		</author>
		<author>
			<persName><forename type="first">E</forename><surname>Hastings</surname></persName>
		</author>
		<author>
			<persName><forename type="first">J</forename><surname>Liu</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><surname>Miller</surname></persName>
		</author>
		<author>
			<persName><forename type="first">R</forename><surname>Srinivasa</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="j">Bioinformatics</title>
		<imprint>
			<biblScope unit="volume">26</biblScope>
			<biblScope unit="issue">19</biblScope>
			<biblScope unit="page" from="2470" to="2471" />
			<date type="published" when="2010">2010</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b14">
	<analytic>
		<title level="a" type="main">A sea of standards for omics data: sink or swim?</title>
		<author>
			<persName><forename type="first">J</forename><forename type="middle">D</forename><surname>Tenenbaum</surname></persName>
		</author>
		<author>
			<persName><forename type="first">S.-A</forename><surname>Sansone</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><surname>Haendel</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="j">Journal of the American Medical Informatics Association</title>
		<imprint>
			<biblScope unit="volume">21</biblScope>
			<biblScope unit="issue">2</biblScope>
			<biblScope unit="page" from="200" to="203" />
			<date type="published" when="2014">2014</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b15">
	<analytic>
		<title level="a" type="main">The FAIR Guiding Principles for scientific data management and stewardship</title>
		<author>
			<persName><forename type="first">M</forename><forename type="middle">D</forename><surname>Wilkinson</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><surname>Dumontier</surname></persName>
		</author>
		<author>
			<persName><forename type="first">Ij</forename><forename type="middle">J</forename><surname>Aalbersberg</surname></persName>
		</author>
		<author>
			<persName><forename type="first">G</forename><surname>Appleton</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><surname>Axton</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A</forename><surname>Baak</surname></persName>
		</author>
		<author>
			<persName><forename type="first">N</forename><surname>Blomberg</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="j">Scientific Data</title>
		<imprint>
			<biblScope unit="volume">3</biblScope>
			<biblScope unit="page">160018</biblScope>
			<date type="published" when="2016">2016</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b16">
	<analytic>
		<title level="a" type="main">RightField: Embedding ontology annotation in spreadsheets</title>
		<author>
			<persName><forename type="first">K</forename><surname>Wolstencroft</surname></persName>
		</author>
		<author>
			<persName><forename type="first">S</forename><surname>Owen</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><surname>Horridge</surname></persName>
		</author>
		<author>
			<persName><forename type="first">O</forename><surname>Krebs</surname></persName>
		</author>
		<author>
			<persName><forename type="first">W</forename><surname>Mueller</surname></persName>
		</author>
		<author>
			<persName><forename type="first">J</forename><forename type="middle">L</forename><surname>Snoep</surname></persName>
		</author>
		<author>
			<persName><forename type="first">F</forename><surname>Du Preez</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="j">Bioinformatics</title>
		<imprint>
			<biblScope unit="volume">27</biblScope>
			<biblScope unit="issue">14</biblScope>
			<biblScope unit="page" from="2021" to="2022" />
			<date type="published" when="2011">2011</date>
		</imprint>
	</monogr>
</biblStruct>

				</listBibl>
			</div>
		</back>
	</text>
</TEI>
