<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Archiving and Interchange DTD v1.0 20120330//EN" "JATS-archivearticle1.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink">
  <front>
    <journal-meta>
      <journal-title-group>
        <journal-title>Corresponding author.
nEvelop-O alberto.camara-ballesteros@ejprd-project.eu (A. Cámara)
rOcid</journal-title>
      </journal-title-group>
    </journal-meta>
    <article-meta>
      <title-group>
        <article-title>Surveyed common data access policies preferences amongst European Reference Networks</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="author">
          <string-name>Alberto Cámara</string-name>
        </contrib>
        <contrib contrib-type="author">
          <string-name>Nirupama Benis</string-name>
          <xref ref-type="aff" rid="aff0">0</xref>
          <xref ref-type="aff" rid="aff4">4</xref>
        </contrib>
        <contrib contrib-type="author">
          <string-name>César H. Bernabé</string-name>
          <xref ref-type="aff" rid="aff2">2</xref>
        </contrib>
        <contrib contrib-type="author">
          <string-name>Inés D.O. Coelho</string-name>
          <xref ref-type="aff" rid="aff1">1</xref>
          <xref ref-type="aff" rid="aff3">3</xref>
          <xref ref-type="aff" rid="aff5">5</xref>
          <xref ref-type="aff" rid="aff7">7</xref>
        </contrib>
        <contrib contrib-type="author">
          <string-name>Clémence M. A. Le Cornec</string-name>
        </contrib>
        <contrib contrib-type="author">
          <string-name>Aylin Demir</string-name>
        </contrib>
        <contrib contrib-type="author">
          <string-name>Bruna D.S. Vieira</string-name>
        </contrib>
        <contrib contrib-type="author">
          <string-name>Jose A. Ramírez</string-name>
          <xref ref-type="aff" rid="aff0">0</xref>
          <xref ref-type="aff" rid="aff2">2</xref>
          <xref ref-type="aff" rid="aff4">4</xref>
          <xref ref-type="aff" rid="aff6">6</xref>
        </contrib>
        <contrib contrib-type="author">
          <string-name>K. Joeri van der Velde</string-name>
        </contrib>
        <contrib contrib-type="author">
          <string-name>Shuxin Zhang</string-name>
        </contrib>
        <contrib contrib-type="author">
          <string-name>Ronald Cornet</string-name>
        </contrib>
        <contrib contrib-type="author">
          <string-name>Annika Jacobsen</string-name>
          <xref ref-type="aff" rid="aff2">2</xref>
          <xref ref-type="aff" rid="aff5">5</xref>
          <xref ref-type="aff" rid="aff6">6</xref>
        </contrib>
        <contrib contrib-type="author">
          <string-name>Marco Roos</string-name>
        </contrib>
        <contrib contrib-type="author">
          <string-name>Franz Schaefer</string-name>
        </contrib>
        <contrib contrib-type="author">
          <string-name>Morris A. Swertz</string-name>
        </contrib>
        <contrib contrib-type="author">
          <string-name>Mark D. Wilkinson</string-name>
        </contrib>
        <aff id="aff0">
          <label>0</label>
          <institution>Amsterdam Public Health, Digital Health Methodology</institution>
          ,
          <addr-line>Amsterdam</addr-line>
          ,
          <country country="NL">The Netherlands</country>
        </aff>
        <aff id="aff1">
          <label>1</label>
          <institution>Centre for Molecular and Biomolecular Informatics, Radboud University Medical Center</institution>
          ,
          <addr-line>Nijmegen</addr-line>
          ,
          <country country="NL">The Netherlands</country>
        </aff>
        <aff id="aff2">
          <label>2</label>
          <institution>Department of Human Genetics, Leiden University Medical Center</institution>
          ,
          <addr-line>Leiden</addr-line>
          ,
          <country country="NL">The Netherlands</country>
        </aff>
        <aff id="aff3">
          <label>3</label>
          <institution>Department of Medical Imaging, Radboud University Medical Center</institution>
          ,
          <addr-line>Nijmegen</addr-line>
          ,
          <country country="NL">The Netherlands</country>
        </aff>
        <aff id="aff4">
          <label>4</label>
          <institution>Department of Medical Informatics, Amsterdam UMC location University of Amsterdam</institution>
          ,
          <addr-line>Meibergdreef 9, Amsterdam</addr-line>
          ,
          <country country="NL">The Netherlands</country>
        </aff>
        <aff id="aff5">
          <label>5</label>
          <institution>Division of Paediatric Nephrology, Center for Paediatrics and Adolescent Medicine, University of Heidelberg</institution>
          ,
          <addr-line>Heidelberg</addr-line>
          ,
          <country country="DE">Germany</country>
        </aff>
        <aff id="aff6">
          <label>6</label>
          <institution>Genomics Coordination Center, University of Groningen and University Medical Center</institution>
          ,
          <addr-line>Groningen</addr-line>
          ,
          <country country="NL">The Netherlands</country>
        </aff>
        <aff id="aff7">
          <label>7</label>
          <institution>Institute of Medical Informatics, Goethe University Frankfurt, University Hospital Frankfurt</institution>
          ,
          <addr-line>Frankfurt am Main</addr-line>
          ,
          <country country="DE">Germany</country>
        </aff>
      </contrib-group>
      <pub-date>
        <year>2023</year>
      </pub-date>
      <volume>000</volume>
      <fpage>0</fpage>
      <lpage>0001</lpage>
      <abstract>
        <p>Background: Data sharing amongst existing Rare Disease (RD) registries, even though being a process that presents multiple barriers, would enrich and ease research, as well as facilitate interoperability between the registries themselves. Methods: To understand their preferences on sharing data, we surveyed 24 European Reference Networks (ERNs) from the RD Domain. Results: The answers show that most ERNs are willing to share a set of Common Data Elements for free with authenticated users at an aggregated or pseudonymized level the moment the data is collected. The one exception is the industry sector, to which ERNs prefer to ask for a fee. Objective: Our aim is to create a reference for how most RD registries are willing to share their data, improving the ability of other stakeholders to make informed decisions to make their data interoperable.</p>
      </abstract>
      <kwd-group>
        <kwd>Rare diseases</kwd>
        <kwd>patient registries</kwd>
        <kwd>FAIR data sharing</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec id="sec-1">
      <title>1. Introduction</title>
      <p>
        Amongst the clinical domains, the Rare Disease (RD) domain is one of the most convoluted
regarding data sharing. This is the result of numerous factors, such as the intrinsic low prevalence
of RDs that causes data to be siloed, scarce, and heterogeneous (as it ranges from documents
updated by patients or their caretakers to clinical registries operated by data stewards and
managing institutions). Another relevant aspect of RD data is that it usually is highly distributed
[
        <xref ref-type="bibr" rid="ref1">1</xref>
        ], as specialised institutions usually focus on one RD or a group of RDs. Perhaps the most
crucial limitation is that the data from the RD domain is personally identifiable by nature (as a
consequence of the small number of people affected by these diseases) [
        <xref ref-type="bibr" rid="ref2">2</xref>
        ]. These circumstances,
together with general problems related to information sharing, such as the absence of a common
standardised vocabulary to describe it, cause great impediments to research activities [
        <xref ref-type="bibr" rid="ref3">3</xref>
        ].
      </p>
      <p>
        To alleviate some of these issues, the Joint Research Centre1 composed a set of Common
Data Elements (CDEs) [
        <xref ref-type="bibr" rid="ref4">4</xref>
        ] that are considered essential for further research on RDs. This set of
CDEs collects information that is prevalent for all European Registry Networks (ERNs), such as
diagnosis, sex, status, phenotype, etc. The CDEs are modeled by the European Joint Programme
on Rare Diseases (EJP-RD)2 as the CDE Semantic Model, which recommends a collection of
widespread ontologies that serve as a common group of terminologies to represent knowledge.
By implementing the CDE Semantic Model, ERNs can increase their data sharing capabilities
amongst themselves and with external resources. With the help of EJP-RD, most registries are
undergoing a FAIRification process and implementation of the CDEs, which are crucial steps
towards improving interoperability and data sharing within the RD community. [
        <xref ref-type="bibr" rid="ref5">5</xref>
        ] shows the
procedure for applying the CDE Semantic Model to a registry of vascular anomalies, which
entails the use of standardised terms from widespread ontologies, applying a transformation
layer from whatever kind of data existed in the registry to a Resource Description Framework
(RDF), as a way to make the data machine-interpretable and provide semantics amongst other
steps. The EJP RD is currently working on the Virtual Platform (VP), a place where ERNs
and other RD-related resources can connect to become discoverable (requiring the creation
and collection of a Data Catalog Vocabulary (DCAT)-based minimal set of metadata about the
registry and its contents, which is being designed by the experts at the EJP-RD) and share their
data. The objective of this paper is to inventorize the ERNs’ preferences when sharing their
data, such as exactly what data to share, how to share it, whom to give access to it, and its time
of publication.
      </p>
    </sec>
    <sec id="sec-2">
      <title>2. Methods and results</title>
      <p>All 24 ERNs were invited to complete a survey in which they describe which stakeholder is
allowed for which level of data sharing. Nine types of stakeholders were considered: Contributing
researcher (CR), Non-contributing researcher (NCR), Industry (IND), National Health Authority
(NHA), Regulatory authority (RA), Health technology Assessment/Payors (HTA), European
Health Data Space (EHDS). Patient Organisation (PO), and Non-Governmental Organization
1https://joint-research-centre.ec.europa.eu/index_en
2https://www.ejprarediseases.org/
Average
0.0%
0.0%
0.0%
0.0%
0.0%
0.0%
0.0%
0.0%
0.0%
0.0%</p>
      <p>CDEs
21.4%
21.4%
45.5%
63.6%
54.5%
60.0%
60.0%
41.7%
44.4%
45.8%
28.6%
35.7%
45.5%
27.3%
36.4%
30.0%
30.0%
33.3%
44.4%
38.9%
50.0%
42.9%
9.1%
9.1%
9.1%
10.0%
10.0%
25.0%
11.2%
19.6%
(NGO). Five aspects of data sharing are considered: Data to be shared (1), Highest data level to
be shared (2), Access modalities(3), Timing (4), and Need for Data Access Committee (DAC) (5).
The options presented for each aspect, as well as the results from the survey can be found on
their respective tables.</p>
      <p>
        To help with visualisation, the responses were plotted, they can be found here [
        <xref ref-type="bibr" rid="ref6">6</xref>
        ]. You can
find the original responses from the ERNs that agreed to share them here [
        <xref ref-type="bibr" rid="ref7">7</xref>
        ].
      </p>
    </sec>
    <sec id="sec-3">
      <title>3. Discussion</title>
      <p>The results from the survey indicate that the paramount priority for ERNs is to protect their
patient’s privacy, as they all want to share their data, but in a controlled and safe manner. That
is why no ERN answered that they did not want to share any of their data, and most of them are
willing to give access to the CDEs by themselves (45.8% on average) or with some extras (38.9%
on average) to all stakeholders. Most ERNs want to share data that is pseudonymised (37.0% on
average) or aggregated (42.1% on average), as it allows for research to be done without risking
the privacy of their patients. The majority of ERNs want to share their data for free (42.8%
on average), but a considerable amount of them require the user to be authenticated (42.5%
on average). Regarding the data sharing timing, the overwhelming majority are willing to
share it immediately upon collection (72.2% on average), probably because that way it becomes
available for research as soon as possible, and almost all registries require stakeholders trying
to access their data need to submit a request to their DAC - the next point of the survey. This
is no surprise, as that way they can carefully examine exactly who accesses their data, what
data they share and exactly when to share it. Two stakeholders seem to be polar opposites
in the ERNs perspective: researchers and industry. For researchers, ERNs want to share all
their data at pseudonymised patient level (57.1%), and for free (some of them with (50.0%) and
some of them without authentication (42.9%)). These answers further support the point that the
RD community is willing to assist researchers as much as possible while protecting patients’
privacy. This might be the cause for the trend towards industry, one of the stakeholders with
which ERNs have the lowest percentage of willingness to share all available data (9.3%), the
highest willingness to share aggregated data (57.1%), and the highest willingness to have access
with both authentication and fees (53.8%). Remarkably, researchers seem to favor data sharing
with the industry over other stakeholders like patient organisations, which might suggest that
researchers are faced with maintaining balance between protecting their patients and finding in
the industry a source for funding that increases the sustainability of the registry itself.</p>
    </sec>
    <sec id="sec-4">
      <title>Acknowledgments</title>
      <p>This work was supported by the European Joint Programme on Rare Diseases, ERICA and
the following Europen Reference Networks: BOND, ERKNeT, Endo-ERN, ERNICA,
EURACAN, eUROGEN, EURONMD, GUARD-Heart, LUNG, MetabERN, PaedCan, RARE-LIVER, RITA,
VASCERN.</p>
      <p>Average
100.0%
100.0%
100.0%
75.0%
100.0%
75.0%
100.0%
75.0%
75.0%
0.0%
0.0%
0.0%
25.0%
0.0%
25.0%
0.0%
25.0%
25.0%</p>
    </sec>
  </body>
  <back>
    <ref-list>
      <ref id="ref1">
        <mixed-citation>
          [1]
          <string-name>
            <given-names>H. J. S.</given-names>
            <surname>Dawkins</surname>
          </string-name>
          , et al.,
          <source>Progress in rare diseases research</source>
          <year>2010</year>
          -2016:
          <article-title>An irdirc perspective</article-title>
          ,
          <source>Clinical and Translational Science</source>
          <volume>11</volume>
          (
          <year>2018</year>
          )
          <fpage>11</fpage>
          -
          <lpage>20</lpage>
          .
          <source>doi:1 0 . 1 1 1 1 / c t s . 1 2</source>
          <volume>5 0 1 .</volume>
        </mixed-citation>
      </ref>
      <ref id="ref2">
        <mixed-citation>
          [2]
          <string-name>
            <given-names>M. G.</given-names>
            <surname>Hansson</surname>
          </string-name>
          , et al.,
          <article-title>The risk of re-identification versus the need to identify individuals in rare disease research</article-title>
          ,
          <source>European Journal of Human Genetics</source>
          <volume>24</volume>
          (
          <year>2016</year>
          )
          <fpage>1553</fpage>
          -
          <lpage>1558</lpage>
          .
          <source>doi:1 0 . 1 0</source>
          <volume>3 8</volume>
          / e j h
          <source>g . 2 0</source>
          <volume>1 6 . 5</volume>
          <fpage>2</fpage>
          .
        </mixed-citation>
      </ref>
      <ref id="ref3">
        <mixed-citation>
          [3]
          <string-name>
            <given-names>A.</given-names>
            <surname>Schieppati</surname>
          </string-name>
          , et al.,
          <article-title>Why rare diseases are an important medical and social issue, The Lancet (British edition</article-title>
          )
          <volume>371</volume>
          (
          <year>2008</year>
          )
          <fpage>2039</fpage>
          -
          <lpage>2041</lpage>
          .
          <source>doi:1 0 . 1 0 1 6 / S 0 1</source>
          <volume>4 0 - 6 7 3 6 ( 0 8 ) 6 0 8 7 2 - 7</volume>
          .
        </mixed-citation>
      </ref>
      <ref id="ref4">
        <mixed-citation>
          [4]
          <string-name>
            <surname>EJP-RD</surname>
          </string-name>
          , Cde semantic model,
          <year>2020</year>
          . URL: https://github.com
          <article-title>/ejp-rd-vp/ CDE-semantic-model, last accessed: 2 Nov 2022</article-title>
          .
        </mixed-citation>
      </ref>
      <ref id="ref5">
        <mixed-citation>
          [5]
          <string-name>
            <given-names>B. D. S.</given-names>
            <surname>Vieira</surname>
          </string-name>
          , et al.,
          <article-title>Applying the fair data principles to the registry of vascular anomalies (vasca)</article-title>
          ,
          <source>Studies in health technology and informatics 271</source>
          (
          <year>2020</year>
          )
          <fpage>115</fpage>
          -
          <lpage>116</lpage>
          .
          <source>doi:1 0 . 3 2 3 3 / S H T I 2 0</source>
          <volume>0 0 8 5 .</volume>
        </mixed-citation>
      </ref>
      <ref id="ref6">
        <mixed-citation>
          [6]
          <string-name>
            <given-names>A.</given-names>
            <surname>Cámara</surname>
          </string-name>
          ,
          <article-title>Plots for data sharing policies survey</article-title>
          ,
          <source>2022. doi:1 0 . 5 2 8 1 / z e n o d o . 7 2</source>
          <volume>7 4 7 5 2 .</volume>
        </mixed-citation>
      </ref>
      <ref id="ref7">
        <mixed-citation>
          [7]
          <string-name>
            <given-names>A.</given-names>
            <surname>Cámara</surname>
          </string-name>
          ,
          <article-title>Responses to the data access policies survey</article-title>
          ,
          <source>2022. doi:1 0 . 5 2 8 1 / z e n o d o . 7 5</source>
          <volume>3 5 2 9 1 .</volume>
        </mixed-citation>
      </ref>
    </ref-list>
  </back>
</article>