<?xml version="1.0" encoding="UTF-8"?>
<TEI xml:space="preserve" xmlns="http://www.tei-c.org/ns/1.0" 
xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" 
xsi:schemaLocation="http://www.tei-c.org/ns/1.0 https://raw.githubusercontent.com/kermitt2/grobid/master/grobid-home/schemas/xsd/Grobid.xsd"
 xmlns:xlink="http://www.w3.org/1999/xlink">
	<teiHeader xml:lang="en">
		<fileDesc>
			<titleStmt>
				<title level="a" type="main">Let&apos;s Stop Building at the Feet of Giants: Recovering unavailable Requirements Quality Artifacts</title>
			</titleStmt>
			<publicationStmt>
				<publisher/>
				<availability status="unknown"><licence/></availability>
			</publicationStmt>
			<sourceDesc>
				<biblStruct>
					<analytic>
						<author>
							<persName><forename type="first">Julian</forename><surname>Frattini</surname></persName>
							<email>julian.frattini@bth.se</email>
							<affiliation key="aff0">
								<orgName type="institution">Blekinge Institute of Technology</orgName>
								<address>
									<addrLine>Valhallavägen 1</addrLine>
									<postCode>371 41</postCode>
									<settlement>Karlskrona</settlement>
									<country key="SE">Sweden</country>
								</address>
							</affiliation>
						</author>
						<author>
							<persName><forename type="first">Lloyd</forename><surname>Montgomery</surname></persName>
							<email>lloyd.montgomery@uni-hamburg.de</email>
							<affiliation key="aff1">
								<orgName type="institution">University of Hamburg</orgName>
								<address>
									<postCode>20146</postCode>
									<settlement>Hamburg</settlement>
									<country key="DE">Germany</country>
								</address>
							</affiliation>
						</author>
						<author>
							<persName><forename type="first">Davide</forename><surname>Fucci</surname></persName>
							<email>davide.fucci@bth.se</email>
							<affiliation key="aff0">
								<orgName type="institution">Blekinge Institute of Technology</orgName>
								<address>
									<addrLine>Valhallavägen 1</addrLine>
									<postCode>371 41</postCode>
									<settlement>Karlskrona</settlement>
									<country key="SE">Sweden</country>
								</address>
							</affiliation>
						</author>
						<author>
							<persName><forename type="first">Jannik</forename><surname>Fischbach</surname></persName>
							<email>jannik.fischbach@netlight.com</email>
							<affiliation key="aff2">
								<orgName type="institution">Netlight Consulting GmbH</orgName>
								<address>
									<addrLine>Sternstraße 5</addrLine>
									<postCode>80538</postCode>
									<settlement>Munich</settlement>
									<country key="DE">Germany</country>
								</address>
							</affiliation>
							<affiliation key="aff3">
								<orgName type="department">fortiss GmbH</orgName>
								<address>
									<addrLine>Guerickestraße 25</addrLine>
									<postCode>80805</postCode>
									<settlement>Munich</settlement>
									<country key="DE">Germany</country>
								</address>
							</affiliation>
						</author>
						<author>
							<persName><forename type="first">Michael</forename><surname>Unterkalmsteiner</surname></persName>
							<email>michael.unterkalmsteiner@bth.se</email>
							<affiliation key="aff0">
								<orgName type="institution">Blekinge Institute of Technology</orgName>
								<address>
									<addrLine>Valhallavägen 1</addrLine>
									<postCode>371 41</postCode>
									<settlement>Karlskrona</settlement>
									<country key="SE">Sweden</country>
								</address>
							</affiliation>
						</author>
						<author>
							<persName><forename type="first">Daniel</forename><surname>Mendez</surname></persName>
							<email>daniel.mendez@bth.se</email>
							<affiliation key="aff0">
								<orgName type="institution">Blekinge Institute of Technology</orgName>
								<address>
									<addrLine>Valhallavägen 1</addrLine>
									<postCode>371 41</postCode>
									<settlement>Karlskrona</settlement>
									<country key="SE">Sweden</country>
								</address>
							</affiliation>
							<affiliation key="aff3">
								<orgName type="department">fortiss GmbH</orgName>
								<address>
									<addrLine>Guerickestraße 25</addrLine>
									<postCode>80805</postCode>
									<settlement>Munich</settlement>
									<country key="DE">Germany</country>
								</address>
							</affiliation>
						</author>
						<title level="a" type="main">Let&apos;s Stop Building at the Feet of Giants: Recovering unavailable Requirements Quality Artifacts</title>
					</analytic>
					<monogr>
						<idno type="ISSN">1613-0073</idno>
					</monogr>
					<idno type="MD5">4F40BC4F82A31C0C9E35A9FA02C7195A</idno>
					<idno type="DOI">10.5281/zenodo.7708571</idno>
				</biblStruct>
			</sourceDesc>
		</fileDesc>
		<encodingDesc>
			<appInfo>
				<application version="0.7.2" ident="GROBID" when="2023-04-29T06:36+0000">
					<desc>GROBID - A machine learning software for extracting information from scholarly documents</desc>
					<ref target="https://github.com/kermitt2/grobid"/>
				</application>
			</appInfo>
		</encodingDesc>
		<profileDesc>
			<textClass>
				<keywords>
					<term>requirements quality, open science, availability, artifacts, data set Orcid 0000-0003-3995-6125 (J. Frattini)</term>
					<term>0000-0002-8249-1418 (L. Montgomery)</term>
					<term>0000-0002-0679-4361 (D. Fucci)</term>
					<term>0000-0002-4361-6118 (J. Fischbach)</term>
					<term>0000-0003-4118-0952 (M. Unterkalmsteiner)</term>
					<term>0000-0003-0619-6027 (D. Mendez)</term>
				</keywords>
			</textClass>
			<abstract>
<div xmlns="http://www.tei-c.org/ns/1.0"><p>Requirements quality literature abounds with publications presenting artifacts, such as data sets and tools. However, recent systematic studies show that more than 80% of these artifacts have become unavailable or were never made public, limiting reproducibility and reusability. In this work, we report on an attempt to recover those artifacts. To that end, we requested corresponding authors of unavailable artifacts to recover and disclose them according to open science principles. Our results, based on 19 answers from 35 authors (54% response rate), include an assessment of the availability of requirements quality artifacts and a breakdown of authors' reasons for their continued unavailability. Overall, we improved the availability of seven data sets and seven implementations.</p></div>
			</abstract>
		</profileDesc>
	</teiHeader>
	<text xml:lang="en">
		<body>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="1.">Introduction</head><p>Data sets and tools are often reported as important contributions to requirements quality literature <ref type="bibr" target="#b0">[1]</ref>. However, a recent secondary study revealed that out of 57 primary studies, as little as 12% of data sets and 19% of tools are currently publicly available <ref type="bibr" target="#b1">[2]</ref>. The unavailability of those artifacts has two major consequences. Firstly, empirical results are difficult to reproduce, which inhibits the process of strengthening the empirical evidence of scientific contributions. Secondly, the presented artifacts are difficult to reuse, which necessitates scientific progress to restart over and over again instead of evolving from existing contributions. Ultimately, these consequences inhibit the progress of the requirements quality research domain.</p><p>Following open science practices in software engineering improves the accessibility of artifacts and the preservation of future contributions <ref type="bibr" target="#b2">[3]</ref> but it is difficult to apply them in retrospect. Because of this, the accessibility of artifacts in past publications deteriorated over time <ref type="bibr" target="#b0">[1]</ref>. The resulting unavailability of artifacts <ref type="bibr" target="#b1">[2]</ref> poses a significant challenge to artifact-dependent research, like the requirements quality or the larger natural language processing for requirements engineering (NLP4RE) domain. In this work, we set to recover unavailable requirements quality artifacts by requesting authors to disclose them according to open science principles. Our main contribution is the recovery of seven data sets and seven implementations. Nevertheless, 16 out of 35 (46%) requests to authors remained unanswered, indicating that the research community needs to emphasize further the importance of persistently archiving research data.</p><p>The remainder of this manuscript is structured as follows: Section 2 introduces the background both on the topic of open science and requirements quality research. Section 3 describes the process and Section 4 the results of the recovery. We discuss these results in Section 5 before concluding in Section 6.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="2.">Background</head></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="2.1.">Open Science in Software Engineering</head></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="2.2.">Requirements Quality Literature</head><p>Recent advances have established that artifacts produced in requirements engineering (RE) have a significant impact on downstream software development activities <ref type="bibr" target="#b8">[9]</ref>, potentially even causing project failure <ref type="bibr" target="#b9">[10]</ref>. Consequently, requirements artifacts merit quality assurance <ref type="bibr" target="#b0">[1]</ref>. The requirements quality literature is dedicated to providing the understanding as well as the support for measuring and improving the quality of requirements <ref type="bibr" target="#b0">[1]</ref>. One popular approach to this is the proposal of quality factors. Requirements quality publications often formulate one or more quality factors-e.g., the use of coordination ambiguity leading to divergent interpretations <ref type="bibr" target="#b10">[11]</ref>-annotate instances of that quality factor in a data set, and finally present an implementation (i.e., an algorithm or full-fledged tool) to detect these instances automatically.</p><p>These artifacts-both data sets and implementations-represent essential contributions facilitating empirical research and technology transfer. While the (annotated) data sets are the main driver for developing new and improving existing implementations for quality factor detection, implementations are the tools to be deployed in industry for actual integration and improvement of the software engineering process. The NLP4RE research domain, which applies natural language processing (NLP) techniques to RE <ref type="bibr" target="#b11">[12]</ref> and constitutes a large part of the contributions to the requirements quality literature <ref type="bibr" target="#b0">[1]</ref>, is particularly focused on said delivery and improvement of tools. In addition to the dependency of these NLP-powered tools on the availability and reliability of training data, this puts the NLP4RE research domain on the forefront of the open science challenge <ref type="bibr" target="#b11">[12]</ref>. The NLP4RE community is therefore particularly aware of its dependency on the availability of artifacts <ref type="bibr" target="#b12">[13]</ref>.</p><p>However, recent systematic studies revealed that a significant amount of these artifacts are not available<ref type="foot" target="#foot_1">2</ref> anymore or have never been <ref type="bibr" target="#b11">[12,</ref><ref type="bibr" target="#b0">1,</ref><ref type="bibr" target="#b1">2]</ref>. Table <ref type="table">1</ref> reports the availability status of 57 data sets (D) and 36 implementations (I) extracted from the 57 primary studies of our previously-published literature review on requirements quality factors <ref type="bibr" target="#b1">[2]</ref>.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="3.">Recovery Process</head><p>The insight that the availability of requirements quality artifacts is insufficient <ref type="bibr" target="#b0">[1,</ref><ref type="bibr" target="#b1">2]</ref> motivated our objective to improve the state of open science in the requirements quality literature by ensuring the recoverability of data, a necessary prerequisite for the reproducibility of scientific work <ref type="bibr" target="#b13">[14]</ref>.</p><p>In this section, we document the artifact recovery process along the undertaken steps. In Section 3.1, we describe the selection of the sample of primary studies. We detail our approach to contact corresponding authors in Section 3.2 and maintain correspondence with them in Section 3.3. Finally, we document the evaluation of the recovery process and success in Section 3.4. All produced data, scripts, and documentation are disclosed in our replication package <ref type="foot" target="#foot_3">4</ref> .</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head>Table 1</head><p>Availability status of requirements quality artifacts <ref type="bibr" target="#b1">[2]</ref> including data sets (D) and implementations (I)</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head>Status</head></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head>Explanation (D) (I) Open Data</head><p>The artifact is hosted in a service that satisfies the following criteria:</p><p>(1) immutable URL (cannot be altered by the author or someone else), ( <ref type="formula">2</ref>) permanent (the hosting organization has a mission to maintain artifacts for the foreseeable future), ( <ref type="formula">3</ref>) accessible (there is a DOI pointing to the real data source URL), and (4) open-source license (the artifact has a license which grants access and re-use) 1 0</p><p>Open Source 3 [only for implementations] The implementation is available for all to use, and the code base has been disclosed -5</p><p>Available in paper [only for data sets] The data set is small enough that the authors disclose the entire data set in the manuscript</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="5">-</head></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head>Reachable link</head><p>The artifact is reachable now but is missing some of the Open Data aspects (see above) </p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="3.1.">Study sample selection and preparation</head><p>We used convenience sampling since the primary studies on which we base our results were selected based on expediency <ref type="bibr" target="#b14">[15]</ref>. In particular, we recovered artifacts from a set of primary studies used to build an ontology of requirements quality factors <ref type="bibr" target="#b1">[2]</ref>. To develop this ontology, we collected manuscripts reporting quality factors from an original set of publications reported in another secondary study <ref type="bibr" target="#b0">[1]</ref>. Extracting data sets and implementations from such publications revealed the unfortunate state of artifact availability.</p><p>We enhanced the data regarding data sets and implementations from our previous study <ref type="bibr" target="#b1">[2]</ref> with the following information.</p><p>• Corresponding author: each artifact was associated with a corresponding author. • Mention: each artifact was associated with its verbatim mention in the manuscript.</p><p>Additionally, we corrected information about one data set and three implementations that persisted in the previous study <ref type="bibr" target="#b1">[2]</ref>.</p><p>Using a spreadsheet, we collected data about 1. authors (n=35), specifying for each author the name and email address, 2. data sets (n=57), specifying for each data set its containing publication, its verbatim mention, the corresponding author, and its current availability, and 3. implementations (n=36), specifying for each implementation its containing publication, its verbatim mention, the corresponding author, and its current availability.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="3.2.">Approaching authors</head><p>We created a Python script that automatically assembles one email for each corresponding author. This email contained the following elements:</p><p>1. Header: an explanation of our endeavor and a request to contribute to open science (or alternatively explain why this is impossible). 2. Artifact list: a list of artifacts contained in the publications of the authors that were not open access. 3. Instructions: brief how to to properly disclose artifacts according to the open science principles as well as the offer to assist them in the process 4. Contact: a way to reach out to us.</p><p>We approached the authors in a first mail on the 30 th of November 2022, followed by a reminder on the 13 th of December, and a final reminder on the 11 th of January 2023. For authors that did not respond to our request until the final reminder, we additionally contacted their co-authors to increase the likelihood of response. We concluded the recovery process on the 8th of February 2023, yielding a time frame of 70 days.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="3.3.">Correspondence</head><p>We kept close contact with the authors we approached by responding in a window of 24 hours within workdays. During this process, we clarified concerns and offered our help. We processed and recorded the information contained in the authors' answers in a spreadsheet file. We tracked the response status in an additional column, denoting the request as either undeliverable, unanswered, answered, or completed. We labeled a recovery request as completed once the corresponding author, for all their artifacts, either improved their availability or explained the inability to recover or disclose them.</p><p>Furthermore, we documented the dates of the first email sent, the first response received, and the completion of the request alongside the number of emails sent by the author in addition to the updated availability status of the artifacts and, eventually, the author's explanation for not taking the recommended actions. Two authors coded these explanations independently and came to an absolute agreement on the types of reasons for non-recovery. When the corresponding author's email address was no longer used, we reached out via personal contacts or social networks like Twitter and LinkedIn.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="3.4.">Evaluation</head><p>To evaluate the artifact recovery process, we generated statistics of the following data from the documentation in our tables.</p><p>1. Correspondence (author response time and frequency) to evaluate the effort of the recovery process. 2. Recovery request success (change in artifact availability) to evaluate the success of the recovery process.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="3.">Reason for non-recovery (author responses excusing the recovery) to evaluate the reasons inhibiting open access.</head><p>We evaluated the data by generating descriptive statistics from our documentation.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="4.">Results</head></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="4.1.">Correspondence</head><p>Out of the 35 approached corresponding authors, 19 answered the recovery request, and 13 completed it. We could not reach three authors despite searching for a valid contact. The distribution of correspondence status is visualized in Figure <ref type="figure" target="#fig_1">1a</ref>. It took, on average, 14.6 days for a corresponding author to reply to our request and 22.4 additional days to complete the request. On average, a request was resolved in an exchange of 3 emails with the corresponding author. The distributions of these statistics are visualized in Figure <ref type="figure" target="#fig_1">1b</ref> and Figure <ref type="figure" target="#fig_1">1c</ref>, respectively.  </p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="4.2.">Artifact Recovery Success</head><p>The corresponding authors improved the availability of seven data sets (four of which follow open-access principles) and seven implementations (six following open-access principles). This increases the availability of data sets from 12.3% (7/57, 1 open access) to 22.8% (13/57, 5 open access) and the availability of implementations from 19.4% (7/36, 0 open access) to 30.6% (11/36, 6 open access). Authors further confirmed the unavailability of 21 data sets and six implementations and provided reasons for the inability to recover or disclose them.</p><p>Figure <ref type="figure" target="#fig_3">2</ref> visualizes the success of the recovery request. The heatmap considers all artifacts (data sets in Figure <ref type="figure" target="#fig_3">2a</ref> and implementations in Figure <ref type="figure" target="#fig_3">2b</ref>) where the corresponding author completed the recovery request. The number in a cell represents the number of artifacts for which the original availability (on the y-axis) has been updated to the new availability (on the x-axis). The count of artifacts whose availability remained the same (e.g., because an author confirmed that the artifact could not be made more available) is reported on the diagonal (shaded gray). An improvement in the availability of an artifact contributes to cells to the right of the diagonal, a deterioration of the availability to the left.</p><p>For example, one implementation was previously available upon request <ref type="bibr" target="#b15">[16]</ref>. Now that the authors disclosed the implementation following open access principles<ref type="foot" target="#foot_4">5</ref> , the entry moved three cells to the right (see Figure <ref type="figure" target="#fig_3">2b</ref>). Open Access Link Original availability 0 0 0 0 0 0 0 0 0 12 0 0 3 0 0 1 0 0 5 0 0 0 0 0 0 2 2 0 0 0 0 2 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 1 0 0 0 0 0 0 0 0 Open Source Open Access Original availability 1 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 1 1 2 0 0 0 1 3 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 1 0 0 0 0 0 1 0 0 0 0 0 0 0 0 0 2 0 0 0 0 0 0 0 0  The inability to recover or disclose artifacts was reported as follows: among 21 unrecoverable data sets, 15 were lost (i.e., the author could not find them anymore or the contact, whom the author assumed had the data, was unreachable), and six could not be disclosed due to sensitive contents. Among the six unrecoverable implementations, three became proprietary, and three were lost.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="5.">Discussion</head><p>Within the 70-day time frame for the process, authors of requirements quality publications recovered several data sets and implementations that are now available for reproduction of scientific results and reuse in future projects. We referenced the recovered artifacts in the requirements quality factor ontology <ref type="bibr" target="#b1">[2]</ref> <ref type="foot" target="#foot_5">6</ref> as well as our replication package to make them accessible.</p><p>Additionally, the authors confirmed the unavailability of several more artifacts. While this does not actively improve the availability of artifacts for reproduction, it clarifies the ambiguous status of several data sets and implementations. Overall, when authors answered a recovery request, they either recovered their data or reported the inability to do so with helpful explanations. Recovery requests failed due to (1) no response, (2) the artifact being lost, or (3) the artifact containing sensitive information. We did not encounter other reasons for the failure of a recovery request, which corroborates the goodwill of the sampled requirements quality community in its commitment to open science. This stands in contrast to the experience of other artifact recovery attempts, where researchers encountered reasons like requests for reimbursements or not seeing any personal gain in the recovery <ref type="bibr" target="#b7">[8]</ref>.</p><p>We cannot claim that our observations are universally valid for the software (requirements) engineering community due to the limitations of our study. For one, the set of primary studies was obtained via convenience sampling from a previous study <ref type="bibr" target="#b1">[2]</ref>. This sample has known limitations as several primary studies relevant to requirements quality literature are missing. Hence, the results of recovery success and correspondence do not represent the complete requirements quality literature and research community. Furthermore, our conclusion regarding the status of correspondence, especially the status of unanswered and answered requests, is limited by how we decided to approach corresponding authors. Using emails as the mean of communication impedes the response rate since they are often abandoned with a change of affiliation <ref type="bibr" target="#b16">[17]</ref>. The limited success of correspondence is a consequence of the time frame and communication channels used in this study rather than an indicator of the research community's attitude towards open science.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="6.">Conclusion</head><p>Both the credibility and reusability of previous publications in the requirements quality literature have been impeded by the unavailability of data sets and implementations. We requested corresponding authors of 57 publications to disclose their artifacts according to the open science principles. We improved the availability of seven data sets and seven implementations, several of which now follow open science principles.</p><p>With this study, we want to raise awareness about the importance of recovering artifacts associated with older publications. While adherence to the open science principles recently rose thanks to comprehensive guidelines (see <ref type="bibr" target="#b2">[3]</ref>) or community initiatives such as artifact evaluation tracks at conferences, they are rarely applied retroactively to previous publications. Furthermore, we hope that the material we created will support researchers in areas that heavily rely on artifacts, such as NLP4RE, to recover more of them.</p><p>Our agenda, in the scope of the requirements quality factor ontology <ref type="foot" target="#foot_6">7</ref> , includes providing a central repository of updated information on the availability and location of relevant artifacts. We invite researchers to contribute to this cause and strengthen the evidence in our field.</p></div><figure xmlns="http://www.tei-c.org/ns/1.0" xml:id="fig_0"><head>U n d e li v e r a b le U n a n s w e r e</head><label></label><figDesc></figDesc></figure>
<figure xmlns="http://www.tei-c.org/ns/1.0" xml:id="fig_1"><head>Figure 1 :</head><label>1</label><figDesc>Figure 1: Correspondence to the artifact recovery request</figDesc></figure>
<figure xmlns="http://www.tei-c.org/ns/1.0" xml:id="fig_2"><head></head><label></label><figDesc>Change of availability in implementations</figDesc></figure>
<figure xmlns="http://www.tei-c.org/ns/1.0" xml:id="fig_3"><head>Figure 2 :</head><label>2</label><figDesc>Figure 2: Change of artifact availability</figDesc></figure>
			<note xmlns="http://www.tei-c.org/ns/1.0" place="foot" xml:id="foot_0">Scientific work needs to be reproducible<ref type="bibr" target="#b2">[3]</ref> to strengthen the evidence it contributes to a field of research<ref type="bibr" target="#b3">[4]</ref>. Open science is the initiative of ensuring public availability of research artifacts<ref type="bibr" target="#b2">[3]</ref> and, hence, facilitating reproducibility. Within open science, the facets of open access for publications, open data for data sets, and open source for source code are most relevant to software engineering<ref type="bibr" target="#b4">[5]</ref>, where each facet of open science entails different techniques and best practices to disclose its respective type of research artifact. Several governmental research funding agencies, including the European Union, made open access to scientific results (including data, tools, etc.) mandatory<ref type="bibr" target="#b0">1</ref> .In literature, Minocher et al. propose four attributes data recoveribility, data usability, analytical clarity, and agreement of results and explicitly emphasize the sequential dependency of those attributes-e.g., analytical clarity of data is meaningless if the data is not recoverable.Recent endeavors of incentivizing scholars to follow open science principles include open science badges<ref type="bibr" target="#b5">[6]</ref> and the registered reports<ref type="bibr" target="#b6">[7]</ref>. However, the software engineering research community is still in the process of adapting open science principles<ref type="bibr" target="#b2">[3]</ref>, and the unavailability of artifacts is common<ref type="bibr" target="#b0">[1]</ref>. Prominent reasons for the unavailability of artifacts include the sensitivity of data or corresponding authors changing their affiliation and consequently losing access to their artifacts<ref type="bibr" target="#b7">[8]</ref>. While some reasons for the unavailability of artifacts (e.g., the sensitivity of company-owned data) may well require significant effort to cope with, other reasons (e.g., loss of artifact, lack of diligence) can be circumvented easily by following proposed guidelines<ref type="bibr" target="#b2">[3]</ref> and making use of modern tools for artifact sharing. 1 https://research-and-innovation.ec.europa.eu/strategy/strategy-2020-2024/our-digital-future/open-science/ open-access_en</note>
			<note xmlns="http://www.tei-c.org/ns/1.0" place="foot" n="2" xml:id="foot_1">Where available means a status of Upon request (see Table1) or better.</note>
			<note xmlns="http://www.tei-c.org/ns/1.0" place="foot" n="3" xml:id="foot_2">In this context, we are using the term open source as commonly understood, not as used in the open science framework<ref type="bibr" target="#b4">[5]</ref>, which would imply adherence to the properties listed under open data.</note>
			<note xmlns="http://www.tei-c.org/ns/1.0" place="foot" n="4" xml:id="foot_3">Available at https://doi.org/10.5281/zenodo.7708571</note>
			<note xmlns="http://www.tei-c.org/ns/1.0" place="foot" n="5" xml:id="foot_4">Now publicly available at https://doi.org/10.5281/zenodo.7484023</note>
			<note xmlns="http://www.tei-c.org/ns/1.0" place="foot" n="6" xml:id="foot_5">See Content at http://reqfactoront.com/</note>
			<note xmlns="http://www.tei-c.org/ns/1.0" place="foot" n="7" xml:id="foot_6">http://reqfactoront.com</note>
		</body>
		<back>

			<div type="acknowledgement">
<div xmlns="http://www.tei-c.org/ns/1.0"><head>Acknowledgments</head><p>The KKS foundation supported this work through the S.E.R.T. Research Profile project at Blekinge Institute of Technology. We additionally thank the reviewers for their valuable feedback upon which the manuscript was improved.</p></div>
			</div>

			<div type="references">

				<listBibl>

<biblStruct xml:id="b0">
	<analytic>
		<title level="a" type="main">Empirical research on requirements quality: a systematic mapping study</title>
		<author>
			<persName><forename type="first">L</forename><surname>Montgomery</surname></persName>
		</author>
		<author>
			<persName><forename type="first">D</forename><surname>Fucci</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A</forename><surname>Bouraffa</surname></persName>
		</author>
		<author>
			<persName><forename type="first">L</forename><surname>Scholz</surname></persName>
		</author>
		<author>
			<persName><forename type="first">W</forename><surname>Maalej</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="j">Requirements Engineering</title>
		<imprint>
			<biblScope unit="page" from="1" to="27" />
			<date type="published" when="2022">2022</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b1">
	<analytic>
		<title level="a" type="main">A live extensible ontology of quality factors for textual requirements</title>
		<author>
			<persName><forename type="first">J</forename><surname>Frattini</surname></persName>
		</author>
		<author>
			<persName><forename type="first">L</forename><surname>Montgomery</surname></persName>
		</author>
		<author>
			<persName><forename type="first">J</forename><surname>Fischbach</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><surname>Unterkalmsteiner</surname></persName>
		</author>
		<author>
			<persName><forename type="first">D</forename><surname>Mendez</surname></persName>
		</author>
		<author>
			<persName><forename type="first">D</forename><surname>Fucci</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="m">IEEE 30th International Requirements Engineering Conference (RE), IEEE</title>
				<imprint>
			<date type="published" when="2022">2022. 2022</date>
			<biblScope unit="page" from="274" to="280" />
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b2">
	<monogr>
		<author>
			<persName><forename type="first">D</forename><surname>Mendez</surname></persName>
		</author>
		<author>
			<persName><forename type="first">D</forename><surname>Graziotin</surname></persName>
		</author>
		<author>
			<persName><forename type="first">S</forename><surname>Wagner</surname></persName>
		</author>
		<author>
			<persName><forename type="first">H</forename><surname>Seibold</surname></persName>
		</author>
		<title level="m">Contemporary empirical methods in software engineering</title>
				<imprint>
			<publisher>Springer</publisher>
			<date type="published" when="2020">2020</date>
			<biblScope unit="page" from="477" to="501" />
		</imprint>
	</monogr>
	<note>Open science in software engineering</note>
</biblStruct>

<biblStruct xml:id="b3">
	<analytic>
		<title level="a" type="main">Variability and reproducibility in software engineering: A study of four companies that developed the same system</title>
		<author>
			<persName><forename type="first">B</forename><forename type="middle">C</forename><surname>Anda</surname></persName>
		</author>
		<author>
			<persName><forename type="first">D</forename><forename type="middle">I</forename><surname>Sjøberg</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A</forename><surname>Mockus</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="j">TSE</title>
		<imprint>
			<biblScope unit="volume">35</biblScope>
			<biblScope unit="page" from="407" to="429" />
			<date type="published" when="2008">2008</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b4">
	<monogr>
		<author>
			<persName><forename type="first">J</forename><surname>Tennant</surname></persName>
		</author>
		<author>
			<persName><forename type="first">J</forename><surname>Beamer</surname></persName>
		</author>
		<author>
			<persName><forename type="first">J</forename><surname>Bosman</surname></persName>
		</author>
		<author>
			<persName><forename type="first">B</forename><surname>Brembs</surname></persName>
		</author>
		<author>
			<persName><forename type="first">N</forename><forename type="middle">C</forename><surname>Chung</surname></persName>
		</author>
		<author>
			<persName><forename type="first">G</forename><surname>Clement</surname></persName>
		</author>
		<author>
			<persName><forename type="first">T</forename><surname>Crick</surname></persName>
		</author>
		<author>
			<persName><forename type="first">J</forename><surname>Dugan</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A</forename><surname>Dunning</surname></persName>
		</author>
		<title level="m">Foundations for open scholarship strategy development</title>
				<imprint>
			<date type="published" when="2019">2019</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b5">
	<analytic>
		<title level="a" type="main">Badges to acknowledge open practices: A simple, low-cost, effective method for increasing transparency</title>
		<author>
			<persName><forename type="first">M</forename><forename type="middle">C</forename><surname>Kidwell</surname></persName>
		</author>
		<author>
			<persName><forename type="first">L</forename><forename type="middle">B</forename><surname>Lazarević</surname></persName>
		</author>
		<author>
			<persName><forename type="first">E</forename><surname>Baranski</surname></persName>
		</author>
		<author>
			<persName><forename type="first">T</forename><forename type="middle">E</forename><surname>Hardwicke</surname></persName>
		</author>
		<author>
			<persName><forename type="first">S</forename><surname>Piechowski</surname></persName>
		</author>
		<author>
			<persName><forename type="first">L.-S</forename><surname>Falkenberg</surname></persName>
		</author>
		<author>
			<persName><forename type="first">C</forename><surname>Kennett</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A</forename><surname>Slowik</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="j">PLoS biology</title>
		<imprint>
			<biblScope unit="volume">14</biblScope>
			<biblScope unit="page">e1002456</biblScope>
			<date type="published" when="2016">2016</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b6">
	<analytic>
		<title level="a" type="main">The preregistration revolution</title>
		<author>
			<persName><forename type="first">B</forename><forename type="middle">A</forename><surname>Nosek</surname></persName>
		</author>
		<author>
			<persName><forename type="first">C</forename><forename type="middle">R</forename><surname>Ebersole</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A</forename><forename type="middle">C</forename><surname>Dehaven</surname></persName>
		</author>
		<author>
			<persName><forename type="first">D</forename><forename type="middle">T</forename><surname>Mellor</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="j">Proceedings of the National Academy of Sciences</title>
		<imprint>
			<biblScope unit="volume">115</biblScope>
			<biblScope unit="page" from="2600" to="2606" />
			<date type="published" when="2018">2018</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b7">
	<analytic>
		<title level="a" type="main">Many researchers were not compliant with their published data sharing statement: mixed-methods study</title>
		<author>
			<persName><forename type="first">M</forename><surname>Gabelica</surname></persName>
		</author>
		<author>
			<persName><forename type="first">R</forename><surname>Bojčić</surname></persName>
		</author>
		<author>
			<persName><forename type="first">L</forename><surname>Puljak</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="j">Journal of Clinical Epidemiology</title>
		<imprint>
			<date type="published" when="2022">2022</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b8">
	<analytic>
		<title level="a" type="main">Status quo in requirements engineering: A theory and a global family of surveys</title>
		<author>
			<persName><forename type="first">S</forename><surname>Wagner</surname></persName>
		</author>
		<author>
			<persName><forename type="first">D</forename><forename type="middle">M</forename><surname>Fernández</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><surname>Felderer</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A</forename><surname>Vetrò</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><surname>Kalinowski</surname></persName>
		</author>
		<author>
			<persName><forename type="first">R</forename><surname>Wieringa</surname></persName>
		</author>
		<author>
			<persName><forename type="first">D</forename><surname>Pfahl</surname></persName>
		</author>
		<author>
			<persName><forename type="first">T</forename><surname>Conte</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M.-T</forename><surname>Christiansson</surname></persName>
		</author>
		<author>
			<persName><forename type="first">D</forename><surname>Greer</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="j">TOSEM</title>
		<imprint>
			<biblScope unit="volume">28</biblScope>
			<biblScope unit="page" from="1" to="48" />
			<date type="published" when="2019">2019</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b9">
	<analytic>
		<title level="a" type="main">Naming the pain in requirements engineering: Design of a global family of surveys and first results from germany</title>
		<author>
			<persName><forename type="first">D</forename><surname>Mendez</surname></persName>
		</author>
		<author>
			<persName><forename type="first">S</forename><surname>Wagner</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="m">Proceedings of the 17th International Conference on Evaluation and Assessment in Software Engineering</title>
				<meeting>the 17th International Conference on Evaluation and Assessment in Software Engineering</meeting>
		<imprint>
			<date type="published" when="2013">2013</date>
			<biblScope unit="page" from="183" to="194" />
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b10">
	<analytic>
		<title level="a" type="main">Using domain-specific corpora for improved handling of ambiguity in requirements</title>
		<author>
			<persName><forename type="first">S</forename><surname>Ezzini</surname></persName>
		</author>
		<author>
			<persName><forename type="first">S</forename><surname>Abualhaija</surname></persName>
		</author>
		<author>
			<persName><forename type="first">C</forename><surname>Arora</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><surname>Sabetzadeh</surname></persName>
		</author>
		<author>
			<persName><forename type="first">L</forename><forename type="middle">C</forename><surname>Briand</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="m">IEEE/ACM 43rd International Conference on Software Engineering (ICSE), IEEE</title>
				<imprint>
			<date type="published" when="2021">2021. 2021</date>
			<biblScope unit="page" from="1485" to="1497" />
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b11">
	<analytic>
		<title level="a" type="main">Natural language processing for requirements engineering: A systematic mapping study</title>
		<author>
			<persName><forename type="first">L</forename><surname>Zhao</surname></persName>
		</author>
		<author>
			<persName><forename type="first">W</forename><surname>Alhoshan</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A</forename><surname>Ferrari</surname></persName>
		</author>
		<author>
			<persName><forename type="first">K</forename><forename type="middle">J</forename><surname>Letsholo</surname></persName>
		</author>
		<author>
			<persName><forename type="first">M</forename><forename type="middle">A</forename><surname>Ajagbe</surname></persName>
		</author>
		<author>
			<persName><forename type="first">E.-V</forename><surname>Chioasca</surname></persName>
		</author>
		<author>
			<persName><forename type="first">R</forename><forename type="middle">T</forename><surname>Batista-Navarro</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="j">ACM Computing Surveys (CSUR)</title>
		<imprint>
			<biblScope unit="volume">54</biblScope>
			<biblScope unit="page" from="1" to="41" />
			<date type="published" when="2021">2021</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b12">
	<analytic>
		<title level="a" type="main">Natural language processing for requirements engineering: The best is yet to come</title>
		<author>
			<persName><forename type="first">F</forename><surname>Dalpiaz</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A</forename><surname>Ferrari</surname></persName>
		</author>
		<author>
			<persName><forename type="first">X</forename><surname>Franch</surname></persName>
		</author>
		<author>
			<persName><forename type="first">C</forename><surname>Palomares</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="j">IEEE software</title>
		<imprint>
			<biblScope unit="volume">35</biblScope>
			<biblScope unit="page" from="115" to="119" />
			<date type="published" when="2018">2018</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b13">
	<monogr>
		<author>
			<persName><forename type="first">R</forename><surname>Minocher</surname></persName>
		</author>
		<author>
			<persName><forename type="first">S</forename><surname>Atmaca</surname></persName>
		</author>
		<author>
			<persName><forename type="first">C</forename><surname>Bavero</surname></persName>
		</author>
		<author>
			<persName><forename type="first">R</forename><surname>Mcelreath</surname></persName>
		</author>
		<author>
			<persName><forename type="first">B</forename><surname>Beheim</surname></persName>
		</author>
		<title level="m">Reproducibility improves exponentially over 63 years of social learning research</title>
				<imprint>
			<date type="published" when="2020">2020</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b14">
	<analytic>
		<title level="a" type="main">Sampling in software engineering research: A critical review and guidelines</title>
		<author>
			<persName><forename type="first">S</forename><surname>Baltes</surname></persName>
		</author>
		<author>
			<persName><forename type="first">P</forename><surname>Ralph</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="j">Empirical Software Engineering</title>
		<imprint>
			<biblScope unit="volume">27</biblScope>
			<biblScope unit="page" from="1" to="31" />
			<date type="published" when="2022">2022</date>
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b15">
	<analytic>
		<title level="a" type="main">Engineering requirements with desiree: An empirical evaluation</title>
		<author>
			<persName><forename type="first">F.-L</forename><surname>Li</surname></persName>
		</author>
		<author>
			<persName><forename type="first">J</forename><surname>Horkoff</surname></persName>
		</author>
		<author>
			<persName><forename type="first">L</forename><surname>Liu</surname></persName>
		</author>
		<author>
			<persName><forename type="first">A</forename><surname>Borgida</surname></persName>
		</author>
		<author>
			<persName><forename type="first">G</forename><surname>Guizzardi</surname></persName>
		</author>
		<author>
			<persName><forename type="first">J</forename><surname>Mylopoulos</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="m">International Conference on Advanced Information Systems Engineering</title>
				<imprint>
			<publisher>Springer</publisher>
			<date type="published" when="2016">2016</date>
			<biblScope unit="page" from="221" to="238" />
		</imprint>
	</monogr>
</biblStruct>

<biblStruct xml:id="b16">
	<analytic>
		<title level="a" type="main">E-mail decay rates among corresponding authors in medline: The ability to communicate with and request materials from authors is being eroded by the expiration of e-mail addresses</title>
		<author>
			<persName><forename type="first">J</forename><forename type="middle">D</forename><surname>Wren</surname></persName>
		</author>
		<author>
			<persName><forename type="first">J</forename><forename type="middle">E</forename><surname>Grissom</surname></persName>
		</author>
		<author>
			<persName><forename type="first">T</forename><surname>Conway</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="j">EMBO reports</title>
		<imprint>
			<biblScope unit="volume">7</biblScope>
			<biblScope unit="page" from="122" to="127" />
			<date type="published" when="2006">2006</date>
		</imprint>
	</monogr>
</biblStruct>

				</listBibl>
			</div>
		</back>
	</text>
</TEI>
