<?xml version="1.0" encoding="utf-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.3 20151215//EN" "http://jats.nlm.nih.gov/publishing/1.3/JATS-journalpublishing1-3.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:mml="http://www.w3.org/1998/Math/MathML" dtd-version="1.1" specific-use="sps-1.9" article-type="research-article" xml:lang="en">
    <front>
        <journal-meta>
            <journal-id journal-id-type="publisher-id">tinf</journal-id>
            <journal-title-group>
                <journal-title>Transinformação</journal-title>
                <abbrev-journal-title abbrev-type="publisher">Transinformação</abbrev-journal-title>
            </journal-title-group>
            <issn pub-type="ppub">0103-3786</issn>
            <issn pub-type="epub">2318-0889</issn>
            <publisher>
                <publisher-name>Pontifícia Universidade Católica de Campinas</publisher-name>
            </publisher>
        </journal-meta>
        <article-meta>
            <article-id pub-id-type="other">00325</article-id>
            <article-id pub-id-type="doi">10.1590/2318-0889202537e2513075</article-id>
            <article-categories>
                <subj-group subj-group-type="heading">
                    <subject>ORIGINAL</subject>
                </subj-group>
            </article-categories>
            <title-group>
                <article-title>Scientific production on data repositories and open science published in the Web of Science database: Methodi Ordinatio and content analysis</article-title>
                <trans-title-group xml:lang="pt">
                    <trans-title>Produção científica sobre repositórios de dados e ciência aberta publicada na base Web of Science: Methodi Ordinatio e análise de conteúdo</trans-title>
                </trans-title-group>
            </title-group>
            <contrib-group>
                <contrib contrib-type="author">
                    <contrib-id contrib-id-type="orcid">0000-0002-4475-1725</contrib-id>
                    <name>
                        <surname>Rodrigues-Junior</surname>
                        <given-names>Sinval Adalberto</given-names>
                    </name>
                    <role content-type="http://credit.niso.org/contributor-roles/conceptualization">Conceptualization</role>
                    <role content-type="http://credit.niso.org/contributor-roles/data-curation">Data curation</role>
                    <role content-type="http://credit.niso.org/contributor-roles/formal-analysis">Formal Analysis</role>
                    <role content-type="http://credit.niso.org/contributor-roles/investigation">Investigation</role>
                    <role content-type="http://credit.niso.org/contributor-roles/methodology">Methodology</role>
                    <role content-type="http://credit.niso.org/contributor-roles/writing-original-draft">Writing – original draft</role>
                    <xref ref-type="aff" rid="aff01">1</xref>
                    <xref ref-type="corresp" rid="c01"/>
                </contrib>
                <contrib contrib-type="author">
                    <contrib-id contrib-id-type="orcid">0000-0003-1636-4151</contrib-id>
                    <name>
                        <surname>Texeira</surname>
                        <given-names>Marcelo Votto</given-names>
                    </name>
                    <role content-type="http://credit.niso.org/contributor-roles/conceptualization">Conceptualization</role>
                    <role content-type="http://credit.niso.org/contributor-roles/supervision">Supervision</role>
                    <role content-type="http://credit.niso.org/contributor-roles/validation">Validation</role>
                    <role content-type="http://credit.niso.org/contributor-roles/writing-review-editing">Writing – review and editing</role>
                    <xref ref-type="aff" rid="aff01">1</xref>
                </contrib>
            </contrib-group>
            <aff id="aff01">
                <label>1</label>
                <institution content-type="orgname">Universidade Comunitária da Região de Chapecó</institution>
                <institution content-type="orgdiv1">Curso de Biblioteconomia</institution>
                <institution content-type="orgdiv2">Departamento de Ensino à Distância</institution>
                <addr-line>
                    <city>Chapecó</city>
                    <state>SC</state>
                </addr-line>
                <country country="BR">Brasil</country>
                <institution content-type="original">Universidade Comunitária da Região de Chapecó, Curso de Biblioteconomia, Departamento de Ensino à Distância. Chapecó, SC, Brasil.</institution>
            </aff>
            <author-notes>
                <corresp id="c01">Correspondence to: S. A. RODRIGUES-JUNIOR. E-mail: <email>rodriguesjunior.sa@unochapeco.edu.br</email>. </corresp>
                <fn fn-type="edited-by">
                    <label>Editor</label>
                    <p>Luisa Angélica Paraguai Donati</p>
                </fn>
                <fn fn-type="coi-statement">
                    <label>Conflict of interest</label>
                    <p>The authors declare that they have no conflicts of interest.</p>
                </fn>
            </author-notes>
            <pub-date publication-format="electronic" date-type="pub">
                <day>0</day>
                <month>0</month>
                <year>2025</year>
            </pub-date>
            <pub-date publication-format="electronic" date-type="collection">
                <year>2025</year>
            </pub-date>
            <volume>37</volume>
            <elocation-id>e2513075</elocation-id>
            <history>
                <date date-type="received">
                    <day>07</day>
                    <month>05</month>
                    <year>2025</year>
                </date>
                <date date-type="accepted">
                    <day>16</day>
                    <month>10</month>
                    <year>2025</year>
                </date>
            </history>
            <permissions>
                <license license-type="open-access" xlink:href="http://creativecommons.org/licenses/by/4.0/" xml:lang="en">
                    <license-p>This is an Open Access article distributed under the terms of the Creative Commons Attribution License, which permits unrestricted use, distribution, and reproduction in any medium, provided the original work is properly cited.</license-p>
                </license>
            </permissions>
            <abstract>
                <title>Abstract</title>
                <p>The opening of scientific data proposed by the Open Science movement presupposes careful planning for data collection, organization, and treatment, aiming at their sharing, accessibility, and reuse. Data repositories have been conceived as structures necessary to enable open access to data. This study aimed to analyze the influence of data repositories on the disclosure and sharing of scientific data proposed by the Open Science movement. The Methodi Ordinatio, developed to organize a portfolio of scientific publications, was adopted to analyze the subject of ‘Data Repositories’ and ‘Open Science’. The studies were ranked using the InOrdinatio index, and the 15 best ranked studies were included and analyzed through Bardin’s content analysis. Most studies describe the structure involved in data repositories within the biological, chemical, and health areas. Other studies addressed data reuse, data organization and analysis processes and tools, as well as data selection and classification algorithms. The units of analysis selected for the content analysis were categorized as open access, information technologies, data processing, and information retrieval. Systems (processes and structures), metadata standards, ontologies, semantic web, data types, and their management were addressed by these studies. It is concluded that open data repositories are growing rapidly. Production with the greatest impact has occurred in the biological and biomedical/health areas, highlighting the structure involved in repositories within these fields. Data repositories provide systems for depositing, managing, searching, accessing, and reusing data based on processes and technologies — often developed as open-source software — in alignment with the proposed Open Science model.</p>
            </abstract>
            <trans-abstract xml:lang="pt">
                <title>Resumo</title>
                <p>A abertura de dados proposta pelo movimento da Ciência Aberta pressupõe um planejamento para a coleta, organização e tratamento desses dados, visando ao compartilhamento, à acessibilidade e a reutilização deles. Os repositórios de dados foram planejados como estruturas que permitem o acesso aberto a esses conteúdos. Este estudo teve como objetivo analisar a influência dos repositórios de dados na abertura e compartilhamento de dados científicos propostos pelo movimento da Ciência Aberta. O Methodi Ordinatio, desenvolvido para organizar um portfólio de publicações, foi adotado para analisar o tema “Repositórios de Dados” e “Ciência Aberta”. Os estudos foram classificados segundo o índice InOrdinatio, e os 15 estudos mais bem classificados foram analisados por meio da análise de conteúdo de Bardin. A maioria dos estudos descreve a estrutura de repositórios de dados nas áreas biológicas, químicas e de saúde. Os demais abordaram a reutilização de dados, processos e ferramentas de organização e análise de dados e algoritmos de seleção e classificação de informações. As unidades de análise selecionadas para a análise de conteúdo foram categorizadas em acesso aberto, tecnologias de informação, processamento de dados e recuperação de informação. Sistemas (processos e estruturas), padrões de metadados, ontologias, web semântica, tipos de dados e seu gerenciamento foram abordados nesses estudos. Conclui-se que os repositórios de dados abertos estão crescendo rapidamente. A produção de maior impacto ocorreu nas áreas biológica e biomédica/de saúde e destaca a estrutura envolvida nesses repositórios. Os repositórios de dados fornecem sistemas de depósito, gerenciamento, busca, acesso e reutilização de dados baseados em processos e tecnologias, em sua maioria desenvolvidos em software de código aberto, alinhando-se ao modelo de Ciência Aberta proposto.</p>
            </trans-abstract>
            <kwd-group xml:lang="en">
                <title>Keywords</title>
                <kwd>Content analysis</kwd>
                <kwd>Data repository</kwd>
                <kwd>Open access</kwd>
                <kwd>Open science</kwd>
            </kwd-group>
            <kwd-group xml:lang="pt">
                <title>Palavras-chave</title>
                <kwd>Análise de conteúdo</kwd>
                <kwd>Repositório de dados</kwd>
                <kwd>Acesso livre</kwd>
                <kwd>Ciência aberta</kwd>
            </kwd-group>
        </article-meta>
    </front>
    <body>
        <sec sec-type="intro">
            <title>Introduction</title>
            <p>The scenario of scientific production has undergone significant changes over the last 20 years with the introduction of the Open Science paradigm. This movement is guided by the understanding that scientific knowledge should be widely and openly shared for the benefit of all people (<xref ref-type="bibr" rid="B40">United Nations Educational, Scientific and Cultural Organization, 2022</xref>). Notably, scientific knowledge is considered a driving force for economic growth and for solving complex problems in an interconnected world (<xref ref-type="bibr" rid="B30">Silva; Silveira, 2019</xref>; <xref ref-type="bibr" rid="B40">United Nations Educational, Scientific and Cultural Organization, 2022</xref>). Hence, the more open and global its production is, the faster these problems can be solved.</p>
            <p>The Open Science model is a contemporary approach that aims to democratize access to scientific knowledge, strengthen the transparency of research processes, and expand the social impact of science. Among its main advantages are free access to publications and data, which reduce economic barriers and promotes greater equity in the dissemination of knowledge (<xref ref-type="bibr" rid="B42">United Nations Educational, Scientific and Cultural Organization, 2021</xref>). Furthermore, interdisciplinary collaboration and information sharing foster innovation and scientific efficiency, avoiding duplication of efforts and optimizing public resources (<xref ref-type="bibr" rid="B09">European Commission, 2016</xref>; <xref ref-type="bibr" rid="B10">Fecher; Friesike, 2014</xref>). Methodological transparency, supported by the openness of protocols, codes, and databases, contributes to the reproducibility and reliability of results (<xref ref-type="bibr" rid="B20">Nosek <italic>et al.</italic>, 2015</xref>). From a social perspective, the model encourages knowledge transfer and the practical application of discoveries, driving public policies and evidence-driven technological solutions (<xref ref-type="bibr" rid="B43">Vicente-Saez; Martinez-Fuentes, 2018</xref>). Finally, by favoring the participation of historically underrepresented countries and groups, Open Science promotes greater inclusion and cognitive justice in the global scientific system (<xref ref-type="bibr" rid="B08">Chan <italic>et al.</italic>, 2020</xref>). Thus, it has consolidated itself as a paradigm that combines scientific rigor, social responsibility, and equity in access to knowledge.</p>
            <p>Despite the undeniable gains of opening the production of scientific knowledge, Open Science faces a series of challenges, including the need to prepare scientists for a necessary change in behavior regarding their activity. Incentives and technical training for data sharing are on the agenda (<xref ref-type="bibr" rid="B44">Walters, 2020</xref>). Additionally, an adequate information infrastructure is required and involves practices from library science, archival science, and data management (<xref ref-type="bibr" rid="B27">Sayão; Sales, 2023</xref>). There is also a demand for technological resources, namely servers, hardware, and software. In this sense, open data repositories are foundational elements of the Open Science ecosystem. <xref ref-type="bibr" rid="B23">Pampel <italic>et al.</italic> (2023)</xref> counted more than 3,000 data repositories registered in re3data, signaling a growing increase in the ecosystem that meets re3data’s quality and openness requirements. Moreover, along with data repositories, data journals have been listed as possible sources of open data and are seen as a response to the need for recognition of data authors (<xref ref-type="bibr" rid="B15">Kindling; Strecker, 2022</xref>; <xref ref-type="bibr" rid="B44">Walters, 2020</xref>).</p>
            <sec>
                <title>The open science paradigm</title>
                <p>One of the first manifestations toward the opening of access to scientific information came from the Budapest Open Access Initiative (BOAI) in December 2001. This group advocated for the acceleration of efforts to make studies freely available to the global public (<xref ref-type="bibr" rid="B06">Budapest Open Access Initiative, 2002</xref>). Their initial approach recommended the practice of self-archiving journal articles in open electronic repositories by authors (green way) and the development of journals committed to open access (gold way) (<xref ref-type="bibr" rid="B06">Budapest Open Access Initiative, 2002</xref>). Therefore, the recommendation stands in opposition to the traditional publishing model established by commercial publishers who, in addition to charging researchers and institutions where the research is developed to publish, also profit from subscribers willing to access the scientific information (<xref ref-type="bibr" rid="B30">Silva; Silveira, 2019</xref>).</p>
                <p>Ever since, Open Science has become a topic of discussion in the scientific community. In 2020, the United Nations Educational, Scientific and Cultural Organization (UNESCO) conducted a global consultation about Open Science, which presented the perceptions of the topic across countries from the five continents. Integration of Open Science through the entire research cycle, including open methodology, open source, open peer review, open software, open education, research evaluation metrics, and citizen science was emphasized (<xref ref-type="bibr" rid="B41">United Nations Educational, Scientific and Cultural Organization, 2020</xref>). It also gave birth to the UNESCO Recommendations on Open Science, which are based on four pillars: open scientific knowledge, open science infrastructures, open involvement of societal actors (scientific communication) and dialogue with other knowledge systems (<xref ref-type="fig" rid="f01">Figure 1</xref>) (<xref ref-type="bibr" rid="B42">United Nations Educational, Scientific and Cultural Organization, 2021</xref>).</p>
                <p>Open scientific knowledge involves scientific publications, open research data, open educational resources, free and open-source software, and open hardware. Open scientific infrastructures refer to virtual and physical infrastructures, equipment, instruments, information sources, files, scientific data, among others, which make scientific work more collaborative. The involvement of societal actors is associated with collaboration between scientists and members of society beyond the scientific community. Crowdfunding, third-party contributions, scientific volunteering, and citizen science are some related concepts. Finally, openness to other knowledge systems, such as local communities, marginalized academies and traditional populations constitutes the fourth foundational pillar of the Open Science movement (<xref ref-type="bibr" rid="B42">United Nations Educational, Scientific and Cultural Organization, 2021</xref>).</p>
                <fig id="f01">
                    <label>Figure 1</label>
                    <caption>
                        <title>Pillars of the UNESCO Recommendation on Open Science.</title>
                    </caption>
                    <graphic xlink:href="2318-0889-tinf-37-e2513075-gf01.jpg"/>
                    <attrib>Source: <xref ref-type="bibr" rid="B42">United Nations Educational, Scientific and Cultural Organization (2021)</xref>.</attrib>
                </fig>
            </sec>
            <sec>
                <title>Open data within the open science paradigm</title>
                <p>Open data is the second dimension of the Open Science Taxonomy described by <xref ref-type="bibr" rid="B25">Pontika <italic>et al.</italic> (2015)</xref> and expanded by <xref ref-type="bibr" rid="B31">Silveira <italic>et al.</italic> (2023)</xref>. It addresses open big data, open data standards, the use and reuse of open data, requirements for opening data, open data visualization, government open data, open administrative data, FAIR principles, and public data (<xref ref-type="bibr" rid="B31">Silveira <italic>et al.</italic>, 2023</xref>). Open data, therefore, is a key dimension of the Open Science paradigm. Importantly, most of these sub-dimensions are interrelated. Open research data include digital and analogical data, raw and processed data, metadata, text records, images and sounds, protocols, analysis codes, and workflows (<xref ref-type="bibr" rid="B31">Silveira <italic>et al.</italic>, 2023</xref>; <xref ref-type="bibr" rid="B41">United Nations Educational, Scientific and Cultural Organization, 2020</xref>).</p>
                <p>When it comes to Open Data in the revised Open Science taxonomy, the first subdivision of the nine refers to Open Big Data (<xref ref-type="bibr" rid="B31">Silveira <italic>et al.</italic>, 2023</xref>). Big data comprises large, complex sets of data with interaction potential that cannot be processed with standard management techniques. Decision-making in several fields, including business, government and public administration, and health care, amongst others, has relied on properly analyzed big data (<xref ref-type="bibr" rid="B01">Acharjya; Kauser, 2016</xref>; <xref ref-type="bibr" rid="B39">Ularu <italic>et al.</italic>, 2012</xref>). Big data is based on four aspects, the so-called 4Vs: veracity, variety, volume, and velocity. Veracity stands for the truthfulness of the information generated with data, so decisions can be made based on it. Volume stands for data gathered, velocity stands for the processing time required to analyze big data, and variety stands for the variability of data types involved in big data (<xref ref-type="bibr" rid="B39">Ularu <italic>et al.</italic>, 2012</xref>). Open data standards are required so that open data may be correctly identified, cited, and reported (<xref ref-type="bibr" rid="B26">Sansone <italic>et al.</italic>, 2019</xref>). Such standards involve guiding principles or checklists that signal the information required to contextualize the object, dictionaries and ontologies to properly and unambiguously define the object, models and formats of structures that include transmission formats to ease the exchange of data between systems, and identifiers of digital objects that confer unique identities to the objects. These standards have been developed by communities under the FAIRsharing flag (<ext-link ext-link-type="uri" xlink:href="https://fairsharing.org/">https://fairsharing.org/</ext-link>) (<xref ref-type="bibr" rid="B26">Sansone <italic>et</italic> al., 2019</xref>).</p>
                <p>FAIRsharing derives from the FAIR principles, an acronym that stands for Findable, Accessible, Interoperable and Reusable open data (<xref ref-type="bibr" rid="B45">Wilkinson <italic>et al.</italic>, 2016</xref>). Findability, in this context is associated with the existence of a globally unique and persistent identifier, data described with rich metadata that includes the identifier of the object being described, and indexation in a searchable source. Accessibility relates to the retrieval of data by the identifier under a standard, open, and free communication protocol, and the maintenance of metadata even when data is no longer available. Interoperability is based on metadata composed by formal, accessible, shared, and widely applicable language, by vocabularies that follow the FAIR principles, and metadata that references other metadata. Finally, reusability relies on richly described metadata, released with a clear and accessible usage license, detailed data provenance, and metadata meeting domain-relevant community standards (<xref ref-type="bibr" rid="B45">Wilkinson <italic>et al</italic>., 2016</xref>).</p>
                <p>According to <xref ref-type="bibr" rid="B45">Wilkinson <italic>et al.</italic> (2016)</xref>, open data is not an aim in itself; rather, it serves to provide open data as a valuable digital resource and an opportunity for the scientific community to pursue new discoveries and innovations. It is expected that data collection efforts will not be duplicated, and that data sharing and reuse will bring the scientific community closer together for collaboration.</p>
                <p>As part of the eScience movement, the open data sharing has been extended beyond science, to government and administrative data. Advocates propose that governments can enhance transparency in stewardship by opening data in public repositories. The Open Government Partnership was launched in 2011 by a group of eight founding countries, including Brazil, and now extends to more than 80 countries (<xref ref-type="bibr" rid="B28">Sena; Segundo; Melo, 2022</xref>). Countries commit to initiatives that promote transparency, access to public information, and citizen participation. Each government elaborates two-year action plans focusing on state commitments to the open government principles − namely transparency, accountability, citizen participation, technology, and innovation. The execution of the proposed activities is monitored during the plan’s implementation and, at the end of the two years, a new plan is implemented (<xref ref-type="bibr" rid="B03">Bertin <italic>et a</italic>l., 2019</xref>).</p>
            </sec>
            <sec>
                <title>Data sharing in open data repositories</title>
                <p>For one to deposit data in an open data repository, data management planning is required prior to the beginning of the research. Tools are available for these data management planning, such as DMPTool and DataUp (<xref ref-type="bibr" rid="B35">Strasser; Cruse, 2013</xref>, <xref ref-type="bibr" rid="B33">Strasser; Abrams; Cruse, 2014</xref>). A successful data management plan would allow others to find, access, understand, and reuse data over a 20-year span (<xref ref-type="bibr" rid="B34">Strasser <italic>et al.</italic>, 2011</xref>). <xref ref-type="fig" rid="f02">Figure 2</xref> depicts the data management life cycle from th e perspective of the researcher.</p>
                <fig id="f02">
                    <label>Figure 2</label>
                    <caption>
                        <title>Data management life cycle.</title>
                    </caption>
                    <graphic xlink:href="2318-0889-tinf-37-e2513075-gf02.jpg"/>
                    <attrib>Source: <xref ref-type="bibr" rid="B34">Strasser et al. (2011)</xref>.</attrib>
                </fig>
                <p>Data collection also corresponds to the creation of the dataset and should explicitly include a sampling plan, the description of data collection and analysis, including the rationale for the methods chosen along with contextual information. The organization of data should consider the file formats used and the contents to be generated. Data management requires the definition of who is responsible for it, as well as the definition of the data version and how it will be handled, the necessary backups, and their frequency. Data description relies on the metadata. How metadata will be recorded, which metadata standard will be adopted, which tool will be used, and where it will be deposited are some of the questions to be asked when considering data description. Data sharing may occur even during the research process, within the research team. After the end of the research, sharing with a broader scientific community may also be planned. Similarly, data preservation may be required during the research execution and after its end. Preservation must consider archival requirements for data, documentation, and metadata (<xref ref-type="bibr" rid="B34">Strasser <italic>et</italic> al., 2011</xref>).</p>
                <p>Although technological issues are required to achieve the best experience in data sharing in science, digital technology keeps evolving to provide researchers with data to analyze (<xref ref-type="bibr" rid="B07">Carlson, 2006</xref>). The speed of development of the required digital infrastructure is high and supports the growing demand of data sharing under the eScience context (<xref ref-type="bibr" rid="B12">Greenberg <italic>et al.</italic>, 2009</xref>). It seems that the challenges to data sharing are more related to established practices adopted by researchers, motivated by different factors, including the perceived value of their time, concerns about misinterpretation and misuse of data, and lack of expertise in data sharing (<xref ref-type="bibr" rid="B38">Tenopir <italic>et al.</italic>, 2011</xref>). Moreover, recognition for data sharing has yet to be fully established, and it seems that the scientific community must be involved, including funders, research societies, universities, and scientific rating organizations. Issues that deserve attention include credit attribution for data sharing, support for education, and community standards for data sharing.</p>
                <p>In light of the existing challenges related to data sharing in open data repositories, this study aimed to identify the most relevant studies on data repositories and open science and to analyze their content.</p>
            </sec>
        </sec>
        <sec sec-type="methods">
            <title>Methodological Procedures</title>
            <p>The study was conceived as a quantitative-qualitative study, based on the context of scientific production on data repositories and open science indexed in the Web of Science (WoS) database. The Methodi Ordinatio, proposed by <xref ref-type="bibr" rid="B22">Pagani, Kovaleski and Resende (2015)</xref> was applied and adapted to achieve the proposed objectives. This method proposes a strategy for building a portfolio of relevant studies to answer the research question, following a systematized review proposal. It adopts a multi-criteria model for evaluating and ranking publications (InOrdinatio) based on the impact factor, year of publication, and number of citations to determine the relevance of studies to the field (<xref ref-type="bibr" rid="B22">Pagani; Kovaleski; Resende, 2015</xref>).</p>
            <p>Methodi Ordinatio is composed of nine phases, as follows: Phase 1) − Establishment of research intention; Phase 2) − Preliminary exploratory research with keywords in the databases; Phase 3) - Definition and combination of keywords and databases; Phase 4) − Final search in databases; Phase 5) − Filtering procedures; Phase 6) − Identification of the impact factor, year of publication and number of citations; Phase 7) − Ranking of articles using InOrdinatio; Phase 8) - Search for full articles; Phase 9) − Final reading and systematic analysis of articles.</p>
            <p>Next, the way in which the nine phases were applied in this study is described.</p>
            <p>Phase 1) − Establishment of research intention: the initial research theme was defined as the requirements for building a data repository.</p>
            <p>Phase 2) − Preliminary exploratory research with keywords in databases: the Web of Science (WoS) database was chosen because it provides the largest number of studies on the topic in an exploratory and comparative search with Scopus. Also, it was chosen because it provides one of the metrics for ranking studies, the impact factor, in addition to the number of citations. At this stage, a preliminary, broader search on the topic was carried out using the following search strategy:</p>
            <disp-quote>
                <p><italic>‘data repository OR data repositories OR open data repository (All fields) AND open science OR open data OR open data repository ecosystem OR open data repository eco-system ( All fields)</italic></p>
                <p><italic>NOT Document types</italic>: <italic>Early access’</italic></p>
            </disp-quote>
            <p>The search was carried out on November 8th 2023. Documents in press (with early access) were removed from the search strategy itself because the publication date was not established.</p>
            <p> Phase 3) − Definition and combination of keywords and databases: Based on the analysis of indexed keywords and authors’ keywords, a thematic focus was defined, considering the frequency of keywords and thematic growth trends. Therefore, it was decided to address the association between the theme “Open Science” and its derivations with data repositories. The question to be answered was: “What is the impact of the Open Science model on the construction of data repositories?”</p>
            <p>Phase 4) − Final search in databases: The final search strategy was structured based on words representing ‘data repositories’ and words that represented the context of Open Science, according to the taxonomy defined in <xref ref-type="bibr" rid="B25">Pontika <italic>et al.</italic> (2015)</xref>. Finally, early access studies were removed, as were conference papers, data articles, and editorial material. Therefore, only published original articles and review articles made up the portfolio.</p>
            <disp-quote>
                <p>‘<italic>”data repository” OR “data repositories” (All fields) AND “open science” OR “open access”</italic></p>
                <p><italic>OR “open data” OR “open science policies” OR “open science tools” OR “open repositories”</italic></p>
                <p><italic>OR “open data repository” OR “open data repository ecosystem” OR “open data repository eco-system” (All fields) NOT Document types: Early access NOT Document types</italic>:</p>
                <p><italic>Conference paper OR Data paper OR Editorial material’</italic></p>
            </disp-quote>
            <p>Phase 5) − Filtering procedures: the complete WoS records database was downloaded in Excel format (.xlsx) and studies were selected considering whether the title represented the topic under study. A single researcher selected the studies, and, in case of doubt, the researcher kept the study among those eligible.</p>
            <p>Phase 6) − Identification of the impact factor, year of publication and number of citations: the metric adopted was the WoS Impact Factor (IF). When the journal did not present an IF, the Journal Citation Indicator (JCI) − also provided in WoS − was considered. The year of publication and the number of citations across all databases were also collected from the database.</p>
            <p>Phase 7) − Ranking of articles using InOrdinatio: the selected articles were ranked using the following formula:</p>
            <disp-formula id="e01">
                <mml:math>
                    <mml:mi>I</mml:mi>
                    <mml:mi>n</mml:mi>
                    <mml:mi>O</mml:mi>
                    <mml:mi>r</mml:mi>
                    <mml:mi>d</mml:mi>
                    <mml:mi>i</mml:mi>
                    <mml:mi>n</mml:mi>
                    <mml:mi>a</mml:mi>
                    <mml:mi>t</mml:mi>
                    <mml:mi>i</mml:mi>
                    <mml:mi>o</mml:mi>
                    <mml:mo>=</mml:mo>
                    <mml:mo>(</mml:mo>
                    <mml:mi>F</mml:mi>
                    <mml:mi>I</mml:mi>
                    <mml:mo>/</mml:mo>
                    <mml:mn>1000</mml:mn>
                    <mml:mo>)</mml:mo>
                    <mml:mo>+</mml:mo>
                    <mml:msup>
                        <mml:mi>&#x3B1;</mml:mi>
                        <mml:mo>&#x2217;</mml:mo>
                    </mml:msup>
                    <mml:mo>[</mml:mo>
                    <mml:mn>10</mml:mn>
                    <mml:mo>&#x2212;</mml:mo>
                    <mml:mo>(</mml:mo>
                    <mml:mi>Y</mml:mi>
                    <mml:mi>e</mml:mi>
                    <mml:mi>a</mml:mi>
                    <mml:mi>r</mml:mi>
                    <mml:mo>&#xA0;</mml:mo>
                    <mml:mi>o</mml:mi>
                    <mml:mi>f</mml:mi>
                    <mml:mo>&#xA0;</mml:mo>
                    <mml:mi>r</mml:mi>
                    <mml:mi>e</mml:mi>
                    <mml:mi>s</mml:mi>
                    <mml:mi>e</mml:mi>
                    <mml:mi>a</mml:mi>
                    <mml:mi>r</mml:mi>
                    <mml:mi>c</mml:mi>
                    <mml:mi>h</mml:mi>
                    <mml:mo>&#x2212;</mml:mo>
                    <mml:mi>Y</mml:mi>
                    <mml:mi>e</mml:mi>
                    <mml:mi>a</mml:mi>
                    <mml:mi>r</mml:mi>
                    <mml:mo>&#xA0;</mml:mo>
                    <mml:mi>o</mml:mi>
                    <mml:mi>f</mml:mi>
                    <mml:mo>&#xA0;</mml:mo>
                    <mml:mi>p</mml:mi>
                    <mml:mi>u</mml:mi>
                    <mml:mi>b</mml:mi>
                    <mml:mi>l</mml:mi>
                    <mml:mi>i</mml:mi>
                    <mml:mi>c</mml:mi>
                    <mml:mi>a</mml:mi>
                    <mml:mi>t</mml:mi>
                    <mml:mi>i</mml:mi>
                    <mml:mi>o</mml:mi>
                    <mml:mi>n</mml:mi>
                    <mml:mo>)</mml:mo>
                    <mml:mo>]</mml:mo>
                    <mml:mo>+</mml:mo>
                    <mml:mo>(</mml:mo>
                    <mml:mi mathvariant="normal">&#x3A3;</mml:mi>
                    <mml:mi>C</mml:mi>
                    <mml:mi>i</mml:mi>
                    <mml:mo>)</mml:mo>
                </mml:math>
            </disp-formula>
            <p>Where FI is the impact factor, α is a weighting factor for the weight of the year of publication, which can vary from 1 to 10; the year of research is the year in which the study is being carried out, the year of publication is the year in which the article was published, and <italic>Σ</italic>Ci is the sum of citations. Regarding the weighting factor of the year of publication, it is considered that topics in which more recent studies are more relevant can adopt weighting factors closer to or equal to 10, while topics in which the date of publication is irrelevant or which tends to consider older studies as more relevant, brings the weighting factor closer to 1. In this study, the weighting factor adopted was 10, considering the current relevance of the studies in the context analyzed.</p>
            <p>Phase 8) − Search for full articles: the 15 studies with the highest InOrdinato index were included in the study.</p>
            <p>Phase 9) − Final reading and systematic analysis of the articles: at this stage, the reading, interpretation, and synthesis of the texts were conducted following the content analysis method proposed by <xref ref-type="bibr" rid="B02">Bardin (2020)</xref>. First, an exploratory reading of the studies was carried out. Then, excerpts (units of analysis) relevant to answering the research question were selected and represented by thematic categories and subcategories.</p>
        </sec>
        <sec sec-type="results">
            <title>Results</title>
            <p>The results of the final search (Phase 4) indicated a total of 545 documents. Filtering these documents by title led to the exclusion of 358 records, resulting in 152 remaining documents. The InOrdinatio index was applied to all 152 documents and <xref ref-type="table" rid="t01">Table 1</xref> presents the 15 studies with the highest InOrdinatio index included in the study.</p>
            <table-wrap id="t01">
                <label>Table 1</label>
                <caption>
                    <title>Included studies based on InOrdinatio ranking.</title>
                </caption>
                <table frame="hsides" rules="groups">
                    <thead>
                        <tr align="center">
                            <th align="left">Ranking of Phase 7</th>
                            <th> Studies<break/>(first author, year, title, and journal)</th>
                            <th>Country</th>
                            <th>Impact factor (Phase 6)</th>
                            <th>Citations (Phase 6)</th>
                            <th> Year<break/>(Phase 6)</th>
                            <th>InOrdinatio (Phase 7)</th>
                        </tr>
                    </thead>
                    <tbody>
                        <tr align="center" valign="top">
                            <td align="left">1</td>
                            <td align="justify"> Smedley (2015). The BioMart community portal: an innovative alternative to large, centralized data repositories. <italic>Nucleic Acids Research</italic></td>
                            <td>Italy</td>
                            <td>14.9</td>
                            <td>475</td>
                            <td>2015</td>
                            <td>495.0149</td>
                        </tr>
                        <tr align="center" valign="top">
                            <td align="left">2</td>
                            <td align="justify"> Bhattacharya (2018). ImmPort, toward repurposing of open access immunological assay data for translational and clinical research. <italic>Scientific Data</italic></td>
                            <td>USA</td>
                            <td>9.8</td>
                            <td>372</td>
                            <td>2018</td>
                            <td>422.0098</td>
                        </tr>
                        <tr align="center" valign="top">
                            <td align="left">3</td>
                            <td align="justify"> Sud (2016). Metabolomics Workbench: An international repository for metabolomics data and metadata, metabolite standards, protocols, tutorials and training, and analysis tools. <italic>Nucleic Acids Research</italic></td>
                            <td>USA</td>
                            <td>14.9</td>
                            <td>376</td>
                            <td>2016</td>
                            <td>406.0149</td>
                        </tr>
                        <tr align="center" valign="top">
                            <td align="left">4</td>
                            <td align="justify"> Okuda (2017). jPOSTrepo: an international standard data repository for proteomes. <italic>Nucleic Acids Research</italic></td>
                            <td>Japan</td>
                            <td>14.9</td>
                            <td>302</td>
                            <td>2017</td>
                            <td>342.0149</td>
                        </tr>
                        <tr align="center" valign="top">
                            <td align="left">5</td>
                            <td align="justify"> <xref ref-type="bibr" rid="B37">Taylor (2017)</xref>. The Cambridge Centre for Ageing and Neuroscience (Cam-CAN) data repository: Structural and functional MRI, MEG, and cognitive data from a cross-sectional adult lifespan sample. <italic>Neuroimage</italic></td>
                            <td>United Kingdom</td>
                            <td>5.7</td>
                            <td>272</td>
                            <td>2017</td>
                            <td>312.0057</td>
                        </tr>
                        <tr align="center" valign="top">
                            <td align="left">6</td>
                            <td align="justify"> Guo (2020). CNSA: a data repository for archiving omics data. <italic>Database</italic></td>
                            <td>China</td>
                            <td>5.8</td>
                            <td>147</td>
                            <td>2020</td>
                            <td>217.0058</td>
                        </tr>
                        <tr align="center" valign="top">
                            <td align="left">7</td>
                            <td align="justify"> Piwowar (2013). Data reuse and the open data citation advantage. <italic>PeerJ</italic></td>
                            <td>USA</td>
                            <td>2.7</td>
                            <td>176</td>
                            <td>2013</td>
                            <td>176.0027</td>
                        </tr>
                        <tr align="center" valign="top">
                            <td align="left">8</td>
                            <td align="justify"> <xref ref-type="bibr" rid="B29">Shi (2022)</xref>. DRAMP 3.0: an enhanced comprehensive data repository of antimicrobial peptides. <italic>Nucleic Acids Research</italic></td>
                            <td>China</td>
                            <td>14.9</td>
                            <td>53</td>
                            <td>2022</td>
                            <td>143.0149</td>
                        </tr>
                        <tr align="center" valign="top">
                            <td align="left">9</td>
                            <td align="justify"> Michener (2015). Ecological data sharing. <italic>Ecological Informatics</italic></td>
                            <td>USA</td>
                            <td>5.1</td>
                            <td>123</td>
                            <td>2015</td>
                            <td>143.0051</td>
                        </tr>
                        <tr align="center" valign="top">
                            <td align="left">10</td>
                            <td align="justify"> Kearnes (2021). The Open Reaction Database. <italic>Journal of the American Chemical Society</italic></td>
                            <td>USA</td>
                            <td>15</td>
                            <td>61</td>
                            <td>2021</td>
                            <td>141.015</td>
                        </tr>
                        <tr align="center" valign="top">
                            <td align="left">11</td>
                            <td align="justify"> Moriya (2019). The jPOST environment: an integrated proteomics data repository and database. <italic>Nucleic Acids Research</italic></td>
                            <td>Japan</td>
                            <td>14.9</td>
                            <td>56</td>
                            <td>2019</td>
                            <td>116.0149</td>
                        </tr>
                        <tr align="center" valign="top">
                            <td align="left">12</td>
                            <td align="justify"> Nargesian (2018). Table Union Search on Open Data. <italic>Proceedings of the VLDB Endowment</italic></td>
                            <td>Canada</td>
                            <td>2.5</td>
                            <td>61</td>
                            <td>2018</td>
                            <td>111.0025</td>
                        </tr>
                        <tr align="center" valign="top">
                            <td align="left">13</td>
                            <td align="justify"> Bishop (2017). Revisiting Qualitative Data Reuse: A Decade On. <italic>SAGE Open</italic></td>
                            <td>United Kingdom and Finland</td>
                            <td>2</td>
                            <td>68</td>
                            <td>2017</td>
                            <td>108.002</td>
                        </tr>
                        <tr align="center" valign="top">
                            <td align="left">14</td>
                            <td align="justify"> Zheng (2021). DrugComb update: a more comprehensive drug sensitivity data repository and analysis portal. <italic>Nucleic Acids Research</italic></td>
                            <td>Finland</td>
                            <td>14.9</td>
                            <td>27</td>
                            <td>2021</td>
                            <td>107.0149</td>
                        </tr>
                        <tr align="center" valign="top">
                            <td align="left">15</td>
                            <td align="justify"> Gad (2022). An improved binary sparrow search algorithm for feature selection in data classification. <italic>Neural Computing and Applications</italic></td>
                            <td>Egipt and Australia</td>
                            <td>6</td>
                            <td>15</td>
                            <td>2022</td>
                            <td>105.006</td>
                        </tr>
                    </tbody>
                </table>
                <table-wrap-foot>
                    <attrib>Source: Prepared by the authors (2023).</attrib>
                </table-wrap-foot>
            </table-wrap>
            <p>Ten out of the 15 studies included (66.7%) described open data repositories, eight of which (53.3%) were from the biological field. The United States was the country with the highest number of studies (<italic>n</italic>=5), followed by Japan and China (<italic>n</italic>=2). Eight of the repositories belonged to the biological field, one of chemistry and one of health. The other five studies addressed data reuse (<xref ref-type="bibr" rid="B24">Piwowar; Vision, 2013</xref>), sharing data on ecology (<xref ref-type="bibr" rid="B17">Michener, 2015</xref>), merging tables of open data from different sources (<xref ref-type="bibr" rid="B19">Nargesian <italic>et al.</italic>, 2018</xref>), reuse of qualitative data (<xref ref-type="bibr" rid="B05">Bishop; Kuula-Luumi, 2017</xref>) and data selection and classification algorithms (<xref ref-type="bibr" rid="B11">Gad <italic>et</italic> al., 2022</xref>).</p>
            <p>The content analysis of the 15 studies resulted in 57 units of analysis representing four distinct categories: “<italic>open access, information technologies, data processing, and information retrieval</italic>” (<xref ref-type="fig" rid="f03">Figure 3</xref>).</p>
            <fig id="f03">
                <label>Figure 3</label>
                <caption>
                    <title>Structure of categories presented by the assessed studies.</title>
                </caption>
                <graphic xlink:href="2318-0889-tinf-37-e2513075-gf03.jpg"/>
                <attrib>Source: Prepared by the authors (2023).</attrib>
            </fig>
            <p>Open data repositories enable open access to data, promoting transparency and accessibility. Twelve units of analysis highlighted this relationship:</p>
            <disp-quote>
                <p>Study 2 (p. 2) − The goal of ImmPort is to ensure that basic and clinical research data are accessible to researchers in ways that allow effective sharing of data and knowledge. In order to facilitate this process, the ImmPort ecosystem includes four major applications: Private Data, Shared Data, Data Analysis, and Resources.</p>
                <p>Study 10 (p. 18824) − Commitment to Open Access. As the name implies, the Open Reaction Database is designed for open access and community contributions.</p>
            </disp-quote>
            <p>Furthermore, repositories provide <italic>information technologies</italic> such as systems, metadata and the data itself. Twelve units of analysis referred to systems including relational data management systems written in open source, graphical and programmatic interfaces (data sets, filters and attributes), databases and data analysis systems written in different open codes and machine learning algorithms aimed at combining data:</p>
            <disp-quote>
                <p>Study 2 (p. 2) − The ImmPort database architecture is designed to support and maintain a variety of multi-modal immunological data such as study method documentation, metadata and standardized data formats and terminologies. Together, these efforts facilitate accurate and efficient secondary analysis of large-scale immunology data.</p>
                <p>Study 6 (p. 2) − Based on the Django framework which is a high-level Python Web framework for web development and maintenance (<ext-link ext-link-type="uri" xlink:href="https://www.djangoproject.com/">https://www.djangoproject.com/</ext-link>), CNSA is developed in Python.</p>
            </disp-quote>
            <p>Another four units of analysis referred to metadata standards, as follows:</p>
            <disp-quote>
                <p>Study 9 (p. 41) − Data products cannot be re-used unless the context, structure, collection and processing methods, and quality of the data are sufficiently documented. Ideally, all aspects of the data are documented throughout the entire project from planning and hypothesis formulation through QA/QC and metadata creation through analysis and dissemination. Creating comprehensive metadata is most effective when researchers are routinely documenting data collection, processing and analysis activities. New tools such as open lab notebooks allow research notes and data to be published online as they are created. Metadata management is facilitated when standards such as ISO 19115 and EML are adopted and comprehensive, user-friendly tools like Morpho are employed to create, manage, and disseminate the project’s metadata.</p>
            </disp-quote>
            <p>Besides, another nineteen units of analysis identified the data itself as a constituent of information technologies. These units present elements related to data analysis, such as open-source technologies and programs, data management tools, incentives and barriers to data sharing, citations and metrics related to data:</p>
            <disp-quote>
                <p>Study 7 (p. 9) − Citations were 9% higher for papers with available data, independent of other variables (p &lt; 0.01, 95% confidence intervals [5% to 13%]).</p>
                <p>Study 9 (p. 36) − Funders, journals and professional societies can each drive sociological change with respect to data sharing. Establishing and enforcing mandates for data archiving greatly increase the likelihood that data will be available for the long-term (Vines <italic>et al.</italic>, 2013). Moreover, funders, publishers and professional societies can all contribute to incentivizing and reducing barriers to data sharing by providing credit, supporting education, establishing community standards for data and data sharing, and streamlining approaches to data submission.</p>
                <p>Study 9 (p. 41) − The DMPTool and DMPonline are tools that make it easy for researchers to create an initial data management plan that meets the requirements for a particular research sponsor in the USA and UK, respectively (see <ext-link ext-link-type="uri" xlink:href="https://dmponline.dcc.ac.uk/">https://dmptool.org/ and https://dmponline.dcc.ac.uk/</ext-link>). The DMPTool also allows one to share a plan with the project team and publish it openly for broader viewing and attribution.</p>
            </disp-quote>
            <p>The <italic>data processing</italic> category was represented by four units of analysis, and addressed data generation and data management, including its curation. The unit below expresses this context:</p>
            <disp-quote>
                <p>Study 9 (p. 41) − Before a project gets underway, researchers should have a plan for how the data will be managed. Plans should cover: (1) data collection and processing methods, organization in tables or databases, and relevant access and use policies; (2) quality assurance and quality control procedures; (3) metadata creation and management; (4) data preservation; (5) integration, analysis, synthesis and dissemination; (6) relevant policies including data sharing plans; and (7) a budget that explicitly details costs (i.e., time and money) for preparing, documenting, and archiving data.</p>
            </disp-quote>
            <p>Finally, six units of analysis expressed the information retrieval category. The category involved the concepts search, semantic web and ontologies, all provided by open repositories to provide accessibility to research data:</p>
            <disp-quote>
                <p>Study 11 (p. D1223) − jPOSTdb is constructed based on the Semantic Web technology that facilitates integration of various databases containing big data (29). The protein sequence and annotation databases, such as UniProt and neXtProt, have released data formatted by the Resource Description Framework (RDF) data model, which supports the Semantic Web technology (21,30). In addition, not only the proteome data, but also other omics and life science-related data have been converted to RDF data and released in the NBDC RDF portal (<ext-link ext-link-type="uri" xlink:href="https://integbio.jp/rdf/">https://integbio.jp/rdf/</ext-link>) and EBI RDF platform (31) and have been incorporated into various life science databases such as TogoGenome, a genomic database based on RefSeq data (<ext-link ext-link-type="uri" xlink:href="http://togogenome.org/">http://togogenome.org/</ext-link>), TogoVar, a database of human genome variants/variations (<ext-link ext-link-type="uri" xlink:href="https://togovar.biosciencedbc.jp/">https://togovar.biosciencedbc.jp/</ext-link>) and GlyTouCan, a glycan structure repository (32).</p>
            </disp-quote>
        </sec>
        <sec sec-type="discussion">
            <title>Discussion</title>
            <p>The quantitative-qualitative study method was based on <xref ref-type="bibr" rid="B22">Pagani, Kovaleski, and Resende’s (2015)</xref> Methodi Ordinatio, adapted to answer the proposed question. The adaptations involved the application of the bibliometric method to analyze the scenario of scientific production regarding data repositories in Phases 2 and 4. The Methodi Ordinatio generated a portfolio of studies, among which the 15 best ranked were analyzed. The analysis of the studies attributed to data repositories the collaboration with the openness of scientific data and its transparency (<xref ref-type="bibr" rid="B04">Bhattacharya <italic>et al.</italic>, 2018</xref>; <xref ref-type="bibr" rid="B14">Kearnes <italic>et al.</italic>, 2021</xref>; <xref ref-type="bibr" rid="B46">Zheng <italic>et al.</italic>, 2021</xref>), as proposed by United Nations Educational, Scientific and Cultural Organization (<xref ref-type="bibr" rid="B41">2020</xref>). Furthermore, our results indicated repositories proposing strategies for processing data, helping to organizing them for sharing and reuse since their generation by researchers, in addition to their curation and management (<xref ref-type="bibr" rid="B04">Bhattacharya <italic>et al.</italic>, 2018</xref>; <xref ref-type="bibr" rid="B17">Michener, 2015</xref>; <xref ref-type="bibr" rid="B46">Zheng <italic>et al.</italic>, 2021</xref>). In addition, repositories provide the necessary information technology structure, such as systems, metadata and the data itself (<xref ref-type="bibr" rid="B04">Bhattacharya <italic>et al.</italic>, 2018</xref>; <xref ref-type="bibr" rid="B13">Guo <italic>et al.</italic>, 2020</xref>; <xref ref-type="bibr" rid="B32">Smedley <italic>et al.</italic>, 2015</xref>; <xref ref-type="bibr" rid="B46">Zheng <italic>et al.</italic>, 2021</xref>), as well as the structure for information retrieval that involves ontologies, semantic web, and the search processes themselves (<xref ref-type="bibr" rid="B04">Bhattacharya <italic>et al.</italic>, 2018</xref>; <xref ref-type="bibr" rid="B11">Gad <italic>et al.</italic>, 2022</xref>; <xref ref-type="bibr" rid="B18">Moriya <italic>et al.</italic>, 2019</xref>; <xref ref-type="bibr" rid="B21">Okuda <italic>et al.</italic>, 2017</xref>). Most studies were not necessarily related to the area of information science but rather described active data repositories in the biological, chemical, and health areas.</p>
            <p>The method adopted in the study, involving InOrdinatio to highlight the most relevant studies, considered the criteria involved in calculating the index (<xref ref-type="bibr" rid="B22">Pagani; Kovaleski; Resende, 2015</xref>). The decision to adopt a weighting factor (α) equal to 10 together with the year of publication was based on the understanding of the relevance of the recent aspect of the study, in contrast to the total number of citations, known to be lower in more recent studies. On the other hand, the adoption of InOrdinatio may have presented studies that did not necessarily associate open data repositories with information science, which may have generated a selection bias due to the impact factor of the journals.</p>
            <p>The studies analyzed revealed the commitment of data repositories to open access to data, in line with what is recommended in the UNESCO Recommendations (<xref ref-type="bibr" rid="B42">United Nations Educational, Scientific and Cultural Organization, 2021</xref>). The Recommendations advocate for “open access to scientific publications, research data, metadata, open educational resources, software, source codes and hardware available in the public domain or under copyright and open licenses”. In this sense, in addition to the openly expressed commitment to open access in some studies (<xref ref-type="bibr" rid="B04">Bhattacharya <italic>et al.</italic>, 2018</xref>; <xref ref-type="bibr" rid="B14">Kearnes <italic>et al.</italic>, 2021</xref>; <xref ref-type="bibr" rid="B46">Zheng <italic>et al.</italic>, 2021</xref>), others observed the construction of repository systems in open source (<xref ref-type="bibr" rid="B04">Bhattacharya <italic>et al.</italic>, 2018</xref>; <xref ref-type="bibr" rid="B32">Smedley <italic>et al.</italic>, 2015</xref>); and the use of open data analysis resources (<xref ref-type="bibr" rid="B36">Sud <italic>et al.</italic>, 2016</xref>; <xref ref-type="bibr" rid="B46">Zheng <italic>et</italic> al., 2021</xref>).</p>
            <p>Importantly, the concept “system”, in the context of information retrieval presupposes − beyond the hard aspect of software or technology − “the set of processes, human skills, techniques and technologies, sources of information united in a systemic way with the purpose of effectively providing Information Retrieval” (<xref ref-type="bibr" rid="B16">Lancaster, 1979</xref>). Thus, it includes all processes and technologies required to guarantee the findability of information and its use or reuse. Regarding data repositories, the FAIR principles (Findability, Accessibility, Interoperability and Reusability) guide this particular information system, including metadata standards (<xref ref-type="bibr" rid="B42">United Nations Educational, Scientific and Cultural Organization, 2021</xref>; <xref ref-type="bibr" rid="B45">Wilkinson <italic>et al.</italic>, 2016</xref>). Based on this, models of good metadata practices for data repositories have focused on components of dataset description in order to align with the semantic web proposal and the linked data perspective, enhancing the automatic synthesis of data and its reuse (<xref ref-type="bibr" rid="B12">Greenberg <italic>et al.</italic>, 2009</xref>). Interestingly, none of the studies analyzed mentioned FAIR principles. Despite this, some of the studies that described the repositories mentioned the use of systems built on open-source software (<xref ref-type="bibr" rid="B36">Sud <italic>et al.</italic>, 2016</xref>), metadata standards based on machine-readable XML and RDF schemas (<xref ref-type="bibr" rid="B21">Okuda <italic>et al.</italic>, 2017</xref>) and open-source data analysis tools (<xref ref-type="bibr" rid="B14">Kearnes <italic>et</italic> al., 2021</xref>).</p>
        </sec>
        <sec sec-type="conclusions">
            <title>Conclusion</title>
            <p>Based on the proposed method, and considering the limitations of the study, it was possible to conclude that the most impactful production has occurred in the biological, biomedical or interdisciplinary fields and highlights the structure involved in existing repositories. Data repositories provide systems for depositing, managing, searching, accessing and reusing data based on processes and technologies, most of which are developed using open-source software, in alignment with the proposed Open Science model.</p>
        </sec>
    </body>
    <back>
        <fn-group>
            <fn fn-type="other">
                <label>How to cite this article</label>
                <p>Rodrigues-Junior, S. A.; Texeira, M. V. Scientific production on data repositories and open science published in the Web of Science database: Methodi Ordinatio and content analysis. <italic>Transinformação</italic>, v. 37, e2513075, 2025. <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1590/2318-0889202537e2513075">https://doi.org/10.1590/2318-0889202537e2513075</ext-link></p>
            </fn>
        </fn-group>
        <sec sec-type="data-availability" specific-use="data-in-article">
            <title>Data Availability</title>
            <p>The research data are available within the body of the document.</p>
        </sec>
        <ref-list>
            <title>References</title>
            <ref id="B01">
                <mixed-citation>Acharjya, D. P.; Kauser, A. P. A survey on big data analytics: challenges, open research issues and tools. <italic>International Journa l of Advanced Computer Science and Applications</italic>, v. 7, n. 2, p. 511-518, 2016. Available from: https://thesai.org/Downloads/Volume7No2/Paper_67-A_Survey_on_Big_Data_Analytics_Challenges.pdf. Cited: Oct. 1st 2023.</mixed-citation>
                <element-citation publication-type="journal">
                    <person-group person-group-type="author">
                        <name>
                            <surname>Acharjya</surname>
                            <given-names>D. P</given-names>
                        </name>
                        <name>
                            <surname>Kauser</surname>
                            <given-names>A. P</given-names>
                        </name>
                    </person-group>
                    <article-title>A survey on big data analytics: challenges, open research issues and tools</article-title>
                    <source>International Journa l of Advanced Computer Science and Applications</source>
                    <volume>7</volume>
                    <issue>2</issue>
                    <fpage>511</fpage>
                    <lpage>518</lpage>
                    <year>2016</year>
                    <comment>Available from: <ext-link ext-link-type="uri" xlink:href="https://thesai.org/Downloads/Volume7No2/Paper_67-A_Survey_on_Big_Data_Analytics_Challenges.pdf">https://thesai.org/Downloads/Volume7No2/Paper_67-A_Survey_on_Big_Data_Analytics_Challenges.pdf</ext-link></comment>
                    <date-in-citation content-type="access-date">Oct. 1st 2023</date-in-citation>
                </element-citation>
            </ref>
            <ref id="B02">
                <mixed-citation>Bardin, L. <italic>Análise de conteúdo</italic>. Lisboa: Edições 70, 2020.</mixed-citation>
                <element-citation publication-type="book">
                    <person-group person-group-type="author">
                        <name>
                            <surname>Bardin</surname>
                            <given-names>L</given-names>
                        </name>
                    </person-group>
                    <source>Análise de conteúdo</source>
                    <publisher-loc>Lisboa</publisher-loc>
                    <publisher-name>Edições 70</publisher-name>
                    <year>2020</year>
                </element-citation>
            </ref>
            <ref id="B03">
                <mixed-citation>Bertin, P. R. B. <italic>et al.</italic> A parceria para Governo Aberto como plataforma para o avanço da Ciência Aberta no Brasil. <italic>Transinformação</italic>, v. 31, e190020, 2019. Doi: http://dx.doi.org/10.1590/2318-0889201931e190020.</mixed-citation>
                <element-citation publication-type="journal">
                    <person-group person-group-type="author">
                        <name>
                            <surname>Bertin</surname>
                            <given-names>P. R. B</given-names>
                        </name>
                        <etal/>
                    </person-group>
                    <article-title>A parceria para Governo Aberto como plataforma para o avanço da Ciência Aberta no Brasil</article-title>
                    <source>Transinformação</source>
                    <volume>31</volume>
                    <elocation-id>e190020</elocation-id>
                    <year>2019</year>
                    <pub-id pub-id-type="doi">10.1590/2318-0889201931e190020</pub-id>
                </element-citation>
            </ref>
            <ref id="B04">
                <mixed-citation>Bhattacharya, S. <italic>et al.</italic> ImmPort, toward repurposing of open access immunological assay data for translational and clinical research. <italic>Scientific Data</italic>, v. 5, e180015, 2018. Doi: https://.doi.org/10.1038/sdata.2018.15.</mixed-citation>
                <element-citation publication-type="journal">
                    <person-group person-group-type="author">
                        <name>
                            <surname>Bhattacharya</surname>
                            <given-names>S.</given-names>
                        </name>
                        <etal/>
                    </person-group>
                    <article-title>ImmPort, toward repurposing of open access immunological assay data for translational and clinical research</article-title>
                    <source>Scientific Data</source>
                    <volume>5</volume>
                    <elocation-id>e180015</elocation-id>
                    <year>2018</year>
                    <pub-id pub-id-type="doi">10.1038/sdata.2018.15</pub-id>
                </element-citation>
            </ref>
            <ref id="B05">
                <mixed-citation>Bishop, L.; Kuula-Luumi, A. Revisiting qualitative data reuse: a decade on. <italic>SAGE Open</italic>, p. 1-15, 2017. Doi: https://.doi.org/10.1177/2158244016685136.</mixed-citation>
                <element-citation publication-type="journal">
                    <person-group person-group-type="author">
                        <name>
                            <surname>Bishop</surname>
                            <given-names>L</given-names>
                        </name>
                        <name>
                            <surname>Kuula-Luumi</surname>
                            <given-names>A</given-names>
                        </name>
                    </person-group>
                    <article-title>Revisiting qualitative data reuse: a decade on</article-title>
                    <source>SAGE Open</source>
                    <fpage>1</fpage>
                    <lpage>15</lpage>
                    <year>2017</year>
                    <pub-id pub-id-type="doi">10.1177/2158244016685136</pub-id>
                </element-citation>
            </ref>
            <ref id="B06">
                <mixed-citation>Budapest Open Access Initiative. <italic>Budapest Open Access Initiative</italic>. Budapeste: BOAI, 2002. Available from: http://www.opensocietyfoundations.org/openaccess/read. Cited: Oct. 1st 2023.</mixed-citation>
                <element-citation publication-type="webpage">
                    <person-group person-group-type="author">
                        <collab>Budapest Open Access Initiative</collab>
                    </person-group>
                    <source>Budapest Open Access Initiative</source>
                    <publisher-loc>Budapeste</publisher-loc>
                    <publisher-name>BOAI</publisher-name>
                    <year>2002</year>
                    <comment>Available from: <ext-link ext-link-type="uri" xlink:href="http://www.opensocietyfoundations.org/openaccess/read">http://www.opensocietyfoundations.org/openaccess/read</ext-link></comment>
                    <date-in-citation content-type="access-date">Oct. 1st 2023</date-in-citation>
                </element-citation>
            </ref>
            <ref id="B07">
                <mixed-citation>Carlson, S. Lost in a sea of science data. <italic>Chronicle of Higher Ed ucation</italic>, v. 52, n. 42, p. A35, 2006.</mixed-citation>
                <element-citation publication-type="journal">
                    <person-group person-group-type="author">
                        <name>
                            <surname>Carlson</surname>
                            <given-names>S.</given-names>
                        </name>
                    </person-group>
                    <article-title>Lost in a sea of science data</article-title>
                    <source>Chronicle of Higher Ed ucation</source>
                    <volume>52</volume>
                    <issue>42</issue>
                    <fpage>A35</fpage>
                    <lpage>A35</lpage>
                    <year>2006</year>
                </element-citation>
            </ref>
            <ref id="B08">
                <mixed-citation>Chan, L. <italic>et al. Open Science Beyond Open Access</italic>: for and with communities. A step towards the decolonization of knowledge. Ottawa: The Canadian Commission for UNESCO’s IdeaLab., 2020.</mixed-citation>
                <element-citation publication-type="book">
                    <person-group person-group-type="author">
                        <name>
                            <surname>Chan</surname>
                            <given-names>L.</given-names>
                        </name>
                        <etal/>
                    </person-group>
                    <source><italic>et al. Open Science Beyond Open Access</italic>: for and with communities. A step towards the decolonization of knowledge</source>
                    <publisher-loc>Ottawa</publisher-loc>
                    <publisher-name>The Canadian Commission for UNESCO’s IdeaLab</publisher-name>
                    <year>2020</year>
                </element-citation>
            </ref>
            <ref id="B09">
                <mixed-citation>European Commission. <italic>Open innovation, open science, open to the world: a vision for Europe</italic>. Publications Office. 2015. Doi: https://doi.org/doi/10.2777/061652.</mixed-citation>
                <element-citation publication-type="book">
                    <person-group person-group-type="author">
                        <collab>European Commission</collab>
                    </person-group>
                    <source>Open innovation, open science, open to the world: a vision for Europe</source>
                    <publisher-name>Publications Office</publisher-name>
                    <year>2015</year>
                    <pub-id pub-id-type="doi">10.2777/061652</pub-id>
                </element-citation>
            </ref>
            <ref id="B10">
                <mixed-citation>Fecher, B.; Friesike, S. Open Science: One term, five schools of thought. <italic>In</italic>: Bartling, S.; Friesike, S. (ed.). <italic>Opening Science</italic>. New York: Springer, 2014. Doi: https://doi.org/10.1007/978-3-319-00026-8_2.</mixed-citation>
                <element-citation publication-type="book">
                    <person-group person-group-type="author">
                        <name>
                            <surname>Fecher</surname>
                            <given-names>B</given-names>
                        </name>
                        <name>
                            <surname>Friesike</surname>
                            <given-names>S</given-names>
                        </name>
                    </person-group>
                    <chapter-title>Open Science: One term, five schools of thought</chapter-title>
                    <person-group person-group-type="editor">
                        <name>
                            <surname>Bartling</surname>
                            <given-names>S</given-names>
                        </name>
                        <name>
                            <surname>Friesike</surname>
                            <given-names>S</given-names>
                        </name>
                    </person-group>
                    <source>Opening Science</source>
                    <publisher-loc>New York</publisher-loc>
                    <publisher-name>Springer</publisher-name>
                    <year>2014</year>
                    <pub-id pub-id-type="doi">10.1007/978-3-319-00026-8_2</pub-id>
                </element-citation>
            </ref>
            <ref id="B11">
                <mixed-citation>Gad, A. G. <italic>et al.</italic> An improved binary sparrow search algorithm for feature selection in data classification. <italic>Neural Computing and Applications</italic>, v. 34, p. 15705-15752, 2022. Doi: https://doi.org/10.1007/s00521-022-07203-7.</mixed-citation>
                <element-citation publication-type="journal">
                    <person-group person-group-type="author">
                        <name>
                            <surname>Gad</surname>
                            <given-names>A. G.</given-names>
                        </name>
                        <etal/>
                    </person-group>
                    <article-title>An improved binary sparrow search algorithm for feature selection in data classification</article-title>
                    <source>Neural Computing and Applications</source>
                    <volume>34</volume>
                    <fpage>15705</fpage>
                    <lpage>15752</lpage>
                    <year>2022</year>
                    <pub-id pub-id-type="doi">10.1007/s00521-022-07203-7</pub-id>
                </element-citation>
            </ref>
            <ref id="B12">
                <mixed-citation>Greenberg, J. <italic>et al.</italic> A metadata best practice for a scientific data repository. <italic>Journal of Library Metadata</italic>, v. 9, n. 3-4, p. 194-212, 2009. Doi: https://doi.org/10.1080/19386380903405090.</mixed-citation>
                <element-citation publication-type="journal">
                    <person-group person-group-type="author">
                        <name>
                            <surname>Greenberg</surname>
                            <given-names>J.</given-names>
                        </name>
                        <etal/>
                    </person-group>
                    <article-title>A metadata best practice for a scientific data repository</article-title>
                    <source>Journal of Library Metadata</source>
                    <volume>9</volume>
                    <issue>3-4</issue>
                    <fpage>194</fpage>
                    <lpage>212</lpage>
                    <year>2009</year>
                    <pub-id pub-id-type="doi">10.1080/19386380903405090</pub-id>
                </element-citation>
            </ref>
            <ref id="B13">
                <mixed-citation>Guo, X. <italic>et al.</italic> CNSA: a data repository for archiving omics data. <italic>Database</italic>, v. 2020, p. 1-6, 2020. Doi: https://doi.org/10.1093/database/baaa055.</mixed-citation>
                <element-citation publication-type="journal">
                    <person-group person-group-type="author">
                        <name>
                            <surname>Guo</surname>
                            <given-names>X</given-names>
                        </name>
                        <etal/>
                    </person-group>
                    <article-title>CNSA: a data repository for archiving omics data</article-title>
                    <source>Database</source>
                    <volume>2020</volume>
                    <fpage>1</fpage>
                    <lpage>6</lpage>
                    <year>2020</year>
                    <pub-id pub-id-type="doi">10.1093/database/baaa055</pub-id>
                </element-citation>
            </ref>
            <ref id="B14">
                <mixed-citation>Kearnes, S. M. <italic>et al.</italic> The open reaction database. <italic>Journal of the American Chemic al Society</italic>, v. 143, p. 18820-18826, 2021. Doi: https://doi.org/10.1021/jacs.1c09820.</mixed-citation>
                <element-citation publication-type="journal">
                    <person-group person-group-type="author">
                        <name>
                            <surname>Kearnes</surname>
                            <given-names>S. M.</given-names>
                        </name>
                        <etal/>
                    </person-group>
                    <article-title>The open reaction database</article-title>
                    <source>Journal of the American Chemic al Society</source>
                    <volume>143</volume>
                    <fpage>18820</fpage>
                    <lpage>18826</lpage>
                    <year>2021</year>
                    <pub-id pub-id-type="doi">10.1021/jacs.1c09820</pub-id>
                </element-citation>
            </ref>
            <ref id="B15">
                <mixed-citation>Kindling, M.; Strecker, D. List of Data Journals. <italic>Zenodo</italic>, Version 1.0., 2022. Doi: https://doi.org/10.5281/zenodo.7082125.</mixed-citation>
                <element-citation publication-type="book">
                    <person-group person-group-type="author">
                        <name>
                            <surname>Kindling</surname>
                            <given-names>M</given-names>
                        </name>
                        <name>
                            <surname>Strecker</surname>
                            <given-names>D</given-names>
                        </name>
                    </person-group>
                    <source>List of Data Journals</source>
                    <publisher-name>Zenodo</publisher-name>
                    <comment>Version 1.0.</comment>
                    <year>2022</year>
                    <pub-id pub-id-type="doi">10.5281/zenodo.7082125</pub-id>
                </element-citation>
            </ref>
            <ref id="B16">
                <mixed-citation>Lancaster, F. W. <italic>Information Retrieval Systems</italic>: Characteristics, Testing and Evaluation. 2. ed. Los Angeles: John Wiley &amp; Sons, 1979. (Information Sciences Series).</mixed-citation>
                <element-citation publication-type="book">
                    <person-group person-group-type="author">
                        <name>
                            <surname>Lancaster</surname>
                            <given-names>F. W.</given-names>
                        </name>
                    </person-group>
                    <source><italic>Information Retrieval Systems</italic>: Characteristics, Testing and Evaluation</source>
                    <edition>2. ed.</edition>
                    <publisher-loc>Los Angeles</publisher-loc>
                    <publisher-name>John Wiley &amp; Sons</publisher-name>
                    <year>1979</year>
                    <comment>Information Sciences Series</comment>
                </element-citation>
            </ref>
            <ref id="B17">
                <mixed-citation>Michener, W. K. Ecological data sharing. <italic>Ecological Informatics</italic>, v. 29, n. 1, p. 33-44, 2015. Doi: https://doi.org/10.1016/j.ecoinf.2015.06.010.</mixed-citation>
                <element-citation publication-type="journal">
                    <person-group person-group-type="author">
                        <name>
                            <surname>Michener</surname>
                            <given-names>W. K.</given-names>
                        </name>
                    </person-group>
                    <article-title>Ecological data sharing</article-title>
                    <source>Ecological Informatics</source>
                    <volume>29</volume>
                    <issue>1</issue>
                    <fpage>33</fpage>
                    <lpage>44</lpage>
                    <year>2015</year>
                    <pub-id pub-id-type="doi">10.1016/j.ecoinf.2015.06.010</pub-id>
                </element-citation>
            </ref>
            <ref id="B18">
                <mixed-citation>Moriya, Y. <italic>et al.</italic> The jPOST environment: an integrated proteomics data repository and database. <italic>Nucleic Acids Research</italic>, v. 47, n. 1, p. D1218-D1224, 2019. Doi: https://doi.org/10.1093/nar/gky899.</mixed-citation>
                <element-citation publication-type="journal">
                    <person-group person-group-type="author">
                        <name>
                            <surname>Moriya</surname>
                            <given-names>Y.</given-names>
                        </name>
                        <etal/>
                    </person-group>
                    <article-title>The jPOST environment: an integrated proteomics data repository and database</article-title>
                    <source>Nucleic Acids Research</source>
                    <volume>47</volume>
                    <issue>1</issue>
                    <fpage>D1218</fpage>
                    <lpage>D1224</lpage>
                    <year>2019</year>
                    <pub-id pub-id-type="doi">10.1093/nar/gky899</pub-id>
                </element-citation>
            </ref>
            <ref id="B19">
                <mixed-citation>Nargesian, F. <italic>et al.</italic> Table union search on open data. <italic>Proceedings of the VLDB Endowment</italic>, v. 11, n. 7, p. 813-825, 2018. Doi: https://doi.org/10.14778/3192965.3192973.</mixed-citation>
                <element-citation publication-type="confproc">
                    <person-group person-group-type="author">
                        <name>
                            <surname>Nargesian</surname>
                            <given-names>F.</given-names>
                        </name>
                        <etal/>
                    </person-group>
                    <conf-name>Table union search on open data</conf-name>
                    <source>Proceedings of the VLDB Endowment</source>
                    <volume>11</volume>
                    <issue>7</issue>
                    <fpage>813</fpage>
                    <lpage>825</lpage>
                    <year>2018</year>
                    <pub-id pub-id-type="doi">10.14778/3192965.3192973</pub-id>
                </element-citation>
            </ref>
            <ref id="B20">
                <mixed-citation>Nosek, B. A. <italic>et al.</italic> Promoting an open research culture. <italic>Science</italic>, v. 348, n. 6242, p. 1422. 2015. Doi: https://doi.org/10.1126/science.aab2374.</mixed-citation>
                <element-citation publication-type="journal">
                    <person-group person-group-type="author">
                        <name>
                            <surname>Nosek</surname>
                            <given-names>B. A.</given-names>
                        </name>
                        <etal/>
                    </person-group>
                    <article-title>Promoting an open research culture</article-title>
                    <source>Science</source>
                    <volume>348</volume>
                    <issue>6242</issue>
                    <fpage>1422</fpage>
                    <lpage>1422</lpage>
                    <year>2015</year>
                    <pub-id pub-id-type="doi">10.1126/science.aab2374</pub-id>
                </element-citation>
            </ref>
            <ref id="B21">
                <mixed-citation>Okuda, S. <italic>et al.</italic> jPOSTrepo: an international standard data repository for proteomes. <italic>Nucleic Acids Research</italic>, v. 45, n. D1, p. D1107-D1111, 2017. Doi: https://doi.org/10.1093/nar/gkw1080.</mixed-citation>
                <element-citation publication-type="journal">
                    <person-group person-group-type="author">
                        <name>
                            <surname>Okuda</surname>
                            <given-names>S.</given-names>
                        </name>
                        <etal/>
                    </person-group>
                    <article-title>jPOSTrepo: an international standard data repository for proteomes</article-title>
                    <source>Nucleic Acids Research</source>
                    <volume>45</volume>
                    <issue>D1</issue>
                    <fpage>D1107</fpage>
                    <lpage>D1111</lpage>
                    <year>2017</year>
                    <pub-id pub-id-type="doi">10.1093/nar/gkw1080</pub-id>
                </element-citation>
            </ref>
            <ref id="B22">
                <mixed-citation>Pagani, R. N.; Kovaleski, J. L.; Resende, L. M. Methodi Ordinatio: a proposed methodology to select and rank relevant scientific papers encompassing the impact factor, number of citation, and year of publication. <italic>Scientometrics</italic>, v. 105, p. 2109-2135, 2015. Doi: https://doi.org/10.1007/s11192-015-1744-x.</mixed-citation>
                <element-citation publication-type="journal">
                    <person-group person-group-type="author">
                        <name>
                            <surname>Pagani</surname>
                            <given-names>R. N.</given-names>
                        </name>
                        <name>
                            <surname>Kovaleski</surname>
                            <given-names>J. L.</given-names>
                        </name>
                        <name>
                            <surname>Resende</surname>
                            <given-names>L. M.</given-names>
                        </name>
                    </person-group>
                    <article-title>Methodi Ordinatio: a proposed methodology to select and rank relevant scientific papers encompassing the impact factor, number of citation, and year of publication</article-title>
                    <source>Scientometrics</source>
                    <volume>105</volume>
                    <fpage>2109</fpage>
                    <lpage>2135</lpage>
                    <year>2015</year>
                    <pub-id pub-id-type="doi">10.1007/s11192-015-1744-x</pub-id>
                </element-citation>
            </ref>
            <ref id="B23">
                <mixed-citation>Pampel, H. <italic>e t al.</italic> Re3data: Indexing the global research data repository landscape since 2012. <italic>Scientific Data</italic>, v. 10, n. 1, p. 571. 2023. Doi: https://doi.org/10.1038/s41597-023-02462-y.</mixed-citation>
                <element-citation publication-type="journal">
                    <person-group person-group-type="author">
                        <name>
                            <surname>Pampel</surname>
                            <given-names>H.</given-names>
                        </name>
                        <etal/>
                    </person-group>
                    <article-title>Re3data: Indexing the global research data repository landscape since 2012</article-title>
                    <source>Scientific Data</source>
                    <volume>10</volume>
                    <issue>1</issue>
                    <fpage>571</fpage>
                    <lpage>571</lpage>
                    <year>2023</year>
                    <pub-id pub-id-type="doi">10.1038/s41597-023-02462-y</pub-id>
                </element-citation>
            </ref>
            <ref id="B24">
                <mixed-citation>Piwowar, H. A.; Vision, T. J. Data reuse and the open data citation advantage. <italic>PeerJ</italic>, v. 1, e175, 2013. Doi: https://doi.org/10.7717/peerj.175.</mixed-citation>
                <element-citation publication-type="journal">
                    <person-group person-group-type="author">
                        <name>
                            <surname>Piwowar</surname>
                            <given-names>H. A.</given-names>
                        </name>
                        <name>
                            <surname>Vision</surname>
                            <given-names>T. J.</given-names>
                        </name>
                    </person-group>
                    <article-title>Data reuse and the open data citation advantage</article-title>
                    <source>PeerJ</source>
                    <volume>1</volume>
                    <elocation-id>e175</elocation-id>
                    <year>2013</year>
                    <pub-id pub-id-type="doi">10.7717/peerj.175</pub-id>
                </element-citation>
            </ref>
            <ref id="B25">
                <mixed-citation>Pontika, N. <italic>et al.</italic> Fostering Open Science to research using a taxonomy and an eLearning Portal. <italic>In</italic>: iKnow: 15th International Conference on Knowledge Technologies and Data Driven Business, 21-22., 2015, Graz, Austria. <italic>Proceedings</italic> […]. New York: Association for Computing Machinery, 2015. p. 1-8. Doi: http://dx.doi.org/doi:10.1145/2809563.2809571.</mixed-citation>
                <element-citation publication-type="confproc">
                    <person-group person-group-type="author">
                        <name>
                            <surname>Pontika</surname>
                            <given-names>N.</given-names>
                        </name>
                        <etal/>
                    </person-group>
                    <comment>Fostering Open Science to research using a taxonomy and an eLearning Portal</comment>
                    <conf-name>iKnow: 15th International Conference on Knowledge Technologies and Data Driven Business</conf-name>
                    <conf-date>21-22., 2015</conf-date>
                    <conf-loc>Graz, Austria</conf-loc>
                    <source>Proceedings</source>
                    <comment>[…]</comment>
                    <publisher-loc>New York</publisher-loc>
                    <publisher-name>Association for Computing Machinery</publisher-name>
                    <year>2015</year>
                    <fpage>1</fpage>
                    <lpage>8</lpage>
                    <pub-id pub-id-type="doi">10.1145/2809563.2809571</pub-id>
                </element-citation>
            </ref>
            <ref id="B26">
                <mixed-citation>Sansone, S. A. <italic>et al.</italic> FAIRsharing as a community approach to standards, repositories and policies. <italic>Nature Biotechnology</italic>, v. 37, n. 4, p. 350-369, 2019. Doi: https://doi.org/10.1038.s41587-019-0080-8.</mixed-citation>
                <element-citation publication-type="journal">
                    <person-group person-group-type="author">
                        <name>
                            <surname>Sansone</surname>
                            <given-names>S. A.</given-names>
                        </name>
                        <etal/>
                    </person-group>
                    <article-title>FAIRsharing as a community approach to standards, repositories and policies</article-title>
                    <source>Nature Biotechnology</source>
                    <volume>37</volume>
                    <issue>4</issue>
                    <fpage>350</fpage>
                    <lpage>369</lpage>
                    <year>2019</year>
                    <pub-id pub-id-type="doi">10.1038.s41587-019-0080-8</pub-id>
                </element-citation>
            </ref>
            <ref id="B27">
                <mixed-citation>Sayão, L. F.; Sales, L. F. Plataformas de gestão de dados de pesquisa: expandindo o conceito de repositórios de dados. <italic>Palabra Clave</italic>, v. 12, n. 1, e171, 2023. Doi: https://doi.org/10.24215/18539912e171.</mixed-citation>
                <element-citation publication-type="journal">
                    <person-group person-group-type="author">
                        <name>
                            <surname>Sayão</surname>
                            <given-names>L. F.</given-names>
                        </name>
                        <name>
                            <surname>Sales</surname>
                            <given-names>L. F.</given-names>
                        </name>
                    </person-group>
                    <article-title>Plataformas de gestão de dados de pesquisa: expandindo o conceito de repositórios de dados</article-title>
                    <source>Palabra Clave</source>
                    <volume>12</volume>
                    <issue>1</issue>
                    <elocation-id>e171</elocation-id>
                    <year>2023</year>
                    <pub-id pub-id-type="doi">10.24215/18539912e171</pub-id>
                </element-citation>
            </ref>
            <ref id="B28">
                <mixed-citation>Sena, P. M. B.; Segundo, W. L. R. C.; Melo, B. A. Ciência Aberta como parceria para Governo Aberto: compromisso por um novo modelo de avaliação. <italic>Informação &amp; Informação</italic>, v. 27, n. 3, p. 14-33, 2022. Doi: https://doi.org/10.5433/1981-8920.2022v27n3p14.</mixed-citation>
                <element-citation publication-type="journal">
                    <person-group person-group-type="author">
                        <name>
                            <surname>Sena</surname>
                            <given-names>P. M. B</given-names>
                        </name>
                        <name>
                            <surname>Segundo</surname>
                            <given-names>W. L. R. C</given-names>
                        </name>
                        <name>
                            <surname>Melo</surname>
                            <given-names>B. A</given-names>
                        </name>
                    </person-group>
                    <article-title>Ciência Aberta como parceria para Governo Aberto: compromisso por um novo modelo de avaliação</article-title>
                    <source>Informação &amp; Informação</source>
                    <volume>27</volume>
                    <issue>3</issue>
                    <fpage>14</fpage>
                    <lpage>33</lpage>
                    <year>2022</year>
                    <pub-id pub-id-type="doi">10.5433/1981-8920.2022v27n3p14</pub-id>
                </element-citation>
            </ref>
            <ref id="B29">
                <mixed-citation>Shi, G. <italic>et al.</italic> DRAMP 3.0: an enhanced comprehensive data repository of antimicrobial peptides. <italic>Nucleic Acids Research</italic>, v. 50, n. D1, p. D488-D496, 2022. Doi: https://doi.org/10.1093/nar/gkab651.</mixed-citation>
                <element-citation publication-type="journal">
                    <person-group person-group-type="author">
                        <name>
                            <surname>Shi</surname>
                            <given-names>G.</given-names>
                        </name>
                        <etal/>
                    </person-group>
                    <article-title>DRAMP 3.0: an enhanced comprehensive data repository of antimicrobial peptides</article-title>
                    <source>Nucleic Acids Research</source>
                    <volume>50</volume>
                    <issue>D1</issue>
                    <fpage>D488</fpage>
                    <lpage>D496</lpage>
                    <year>2022</year>
                    <pub-id pub-id-type="doi">10.1093/nar/gkab651</pub-id>
                </element-citation>
            </ref>
            <ref id="B30">
                <mixed-citation>Silva, F. C. C.; Silveira, L. O ecossistema da Ciência Aberta. <italic>Transinformação</italic>, v. 31, e190001, 2019. http://dx.doi.org/10.1590/2318-0889201931e190001</mixed-citation>
                <element-citation publication-type="journal">
                    <person-group person-group-type="author">
                        <name>
                            <surname>Silva</surname>
                            <given-names>F. C. C</given-names>
                        </name>
                        <name>
                            <surname>Silveira</surname>
                            <given-names>L</given-names>
                        </name>
                    </person-group>
                    <article-title>O ecossistema da Ciência Aberta</article-title>
                    <source>Transinformação</source>
                    <volume>31</volume>
                    <elocation-id>e190001</elocation-id>
                    <year>2019</year>
                    <pub-id pub-id-type="doi">10.1590/2318-0889201931e190001</pub-id>
                </element-citation>
            </ref>
            <ref id="B31">
                <mixed-citation>Silveira, L. <italic>et al.</italic> Taxonomia da Ciência Aberta: revisada e ampliada. <italic>Encontros Bibli</italic>, v. 28, e91712, 2023. Doi: https://doi.org/10.5007/1518-2924.2023.e91712.</mixed-citation>
                <element-citation publication-type="journal">
                    <person-group person-group-type="author">
                        <name>
                            <surname>Silveira</surname>
                            <given-names>L</given-names>
                        </name>
                        <etal/>
                    </person-group>
                    <article-title>Taxonomia da Ciência Aberta: revisada e ampliada</article-title>
                    <source>Encontros Bibli</source>
                    <volume>28</volume>
                    <elocation-id>e91712</elocation-id>
                    <year>2023</year>
                    <pub-id pub-id-type="doi">10.5007/1518-2924.2023.e91712</pub-id>
                </element-citation>
            </ref>
            <ref id="B32">
                <mixed-citation>Smedley, D. <italic>et al.</italic> The BioMart community portal: an innovative alternative to large, centralized data repositories. <italic>Nucleic Acids Research</italic>, v. 43, n. W1, p. W589-W598, 2015. Doi: https://doi.org/10.1093/nar/gkv350.</mixed-citation>
                <element-citation publication-type="journal">
                    <person-group person-group-type="author">
                        <name>
                            <surname>Smedley</surname>
                            <given-names>D.</given-names>
                        </name>
                        <etal/>
                    </person-group>
                    <article-title>The BioMart community portal: an innovative alternative to large, centralized data repositories</article-title>
                    <source>Nucleic Acids Research</source>
                    <volume>43</volume>
                    <issue>W1</issue>
                    <fpage>W589</fpage>
                    <lpage>W598</lpage>
                    <year>2015</year>
                    <pub-id pub-id-type="doi">10.1093/nar/gkv350</pub-id>
                </element-citation>
            </ref>
            <ref id="B33">
                <mixed-citation>Strasser, C.; Abrams, S.; Cruse, P. DMPTool 2: expanding functionality for better data management planning. <italic>International Journal of Digital Curation</italic>, v. 9, n. 1, 2014. Doi: https://doi.org//10.2218/ijdc.v9i1.319.</mixed-citation>
                <element-citation publication-type="journal">
                    <person-group person-group-type="author">
                        <name>
                            <surname>Strasser</surname>
                            <given-names>C</given-names>
                        </name>
                        <name>
                            <surname>Abrams</surname>
                            <given-names>S</given-names>
                        </name>
                        <name>
                            <surname>Cruse</surname>
                            <given-names>P</given-names>
                        </name>
                    </person-group>
                    <article-title>DMPTool 2: expanding functionality for better data management planning</article-title>
                    <source>International Journal of Digital Curation</source>
                    <volume>9</volume>
                    <issue>1</issue>
                    <year>2014</year>
                    <pub-id pub-id-type="doi">10.2218/ijdc.v9i1.319</pub-id>
                </element-citation>
            </ref>
            <ref id="B34">
                <mixed-citation>Strasser, C. <italic>et al.</italic> Promoting data stewardship through best practices. <italic>In</italic>: Jones, M. B.; Gries, C. (ed.). <italic>Proceedings of the environmental information management conference</italic>. Santa Barbara: University of California, 2011. p. 126-131.</mixed-citation>
                <element-citation publication-type="confproc">
                    <person-group person-group-type="author">
                        <name>
                            <surname>Strasser</surname>
                            <given-names>C.</given-names>
                        </name>
                        <etal/>
                    </person-group>
                    <conf-name>Promoting data stewardship through best practices</conf-name>
                    <person-group person-group-type="editor">
                        <name>
                            <surname>Jones</surname>
                            <given-names>M. B.</given-names>
                        </name>
                        <name>
                            <surname>Gries</surname>
                            <given-names>C.</given-names>
                        </name>
                    </person-group>
                    <source>Proceedings of the environmental information management conference</source>
                    <conf-loc>Santa Barbara</conf-loc>
                    <publisher-name>University of California</publisher-name>
                    <year>2011</year>
                    <fpage>126</fpage>
                    <lpage>131</lpage>
                </element-citation>
            </ref>
            <ref id="B35">
                <mixed-citation>Strasser, C.; Cruse, P. The DMPTool and DataUp: helping researchers manage, archive, and share their data. <italic>Research Data Management Implementations Workshop</italic>, v. 13-14, 2013.</mixed-citation>
                <element-citation publication-type="confproc">
                    <person-group person-group-type="author">
                        <name>
                            <surname>Strasser</surname>
                            <given-names>C.</given-names>
                        </name>
                        <name>
                            <surname>Cruse</surname>
                            <given-names>P.</given-names>
                        </name>
                    </person-group>
                    <conf-name>The DMPTool and DataUp: helping researchers manage, archive, and share their data</conf-name>
                    <source>Research Data Management Implementations Workshop</source>
                    <volume>13-14</volume>
                    <year>2013</year>
                </element-citation>
            </ref>
            <ref id="B36">
                <mixed-citation>Sud, M. <italic>et al.</italic> Metabolomics Workbench: an international repository for metabolomics data and metadata, metabolite standards, protocols, tutorials and training, and analysis tools. <italic>Nucleic Acids Research</italic>, v. 44, n. D1, p. D463-D470, 2016. Doi: https://doi.org/10.1093/nar/gkv1042.</mixed-citation>
                <element-citation publication-type="journal">
                    <person-group person-group-type="author">
                        <name>
                            <surname>Sud</surname>
                            <given-names>M.</given-names>
                        </name>
                        <etal/>
                    </person-group>
                    <article-title>Metabolomics Workbench: an international repository for metabolomics data and metadata, metabolite standards, protocols, tutorials and training, and analysis tools</article-title>
                    <source>Nucleic Acids Research</source>
                    <volume>44</volume>
                    <issue>D1</issue>
                    <fpage>D463</fpage>
                    <lpage>D470</lpage>
                    <year>2016</year>
                    <pub-id pub-id-type="doi">10.1093/nar/gkv1042</pub-id>
                </element-citation>
            </ref>
            <ref id="B37">
                <mixed-citation>Taylor, J. R. <italic>et al.</italic> The Cambridge Centre for Ageing and Neuroscience (Cam-CAN) data repository: structural and functional MRI, MEG, and cognitive data from a cross-sectional adult lifespan sample. <italic>Neuroimage</italic>, v. 144, p. 262-269, 2017. Doi: https://doi.org/10.1016/j.neuroimage.2015.09.018.</mixed-citation>
                <element-citation publication-type="journal">
                    <person-group person-group-type="author">
                        <name>
                            <surname>Taylor</surname>
                            <given-names>J. R.</given-names>
                        </name>
                        <etal/>
                    </person-group>
                    <article-title>The Cambridge Centre for Ageing and Neuroscience (Cam-CAN) data repository: structural and functional MRI, MEG, and cognitive data from a cross-sectional adult lifespan sample</article-title>
                    <source>Neuroimage</source>
                    <volume>144</volume>
                    <fpage>262</fpage>
                    <lpage>269</lpage>
                    <year>2017</year>
                    <pub-id pub-id-type="doi">10.1016/j.neuroimage.2015.09.018</pub-id>
                </element-citation>
            </ref>
            <ref id="B38">
                <mixed-citation>Tenopir, C. <italic>et al.</italic> Data sharing by scientists: practices and perceptions. <italic>Plos One</italic>, v. 6, e21101, 2011. Doi: http://dx.doi.org/10.1371/journal.pone.0021101.</mixed-citation>
                <element-citation publication-type="journal">
                    <person-group person-group-type="author">
                        <name>
                            <surname>Tenopir</surname>
                            <given-names>C.</given-names>
                        </name>
                        <etal/>
                    </person-group>
                    <article-title>Data sharing by scientists: practices and perceptions</article-title>
                    <source>Plos One</source>
                    <volume>6</volume>
                    <elocation-id>e21101</elocation-id>
                    <year>2011</year>
                    <pub-id pub-id-type="doi">10.1371/journal.pone.0021101</pub-id>
                </element-citation>
            </ref>
            <ref id="B39">
                <mixed-citation>Ularu, E. G. <italic>et al.</italic> Perspectives on big data and big data analytics. <italic>Database Systems Journal</italic>, v. 3, n. 4, p. 3-14, 2012.</mixed-citation>
                <element-citation publication-type="journal">
                    <person-group person-group-type="author">
                        <name>
                            <surname>Ularu</surname>
                            <given-names>E. G.</given-names>
                        </name>
                        <etal/>
                    </person-group>
                    <article-title>Perspectives on big data and big data analytics</article-title>
                    <source>Database Systems Journal</source>
                    <volume>3</volume>
                    <issue>4</issue>
                    <fpage>3</fpage>
                    <lpage>14</lpage>
                    <year>2012</year>
                </element-citation>
            </ref>
            <ref id="B40">
                <mixed-citation>United Nations Educational, Scientific and Cultural Organization. <italic>An introduction to the UNESCO recommendation on Open Science</italic>. Paris: UNESCO, 2022. Available in: https://www.unesco.org/en/open-science. Cited: October 1st 2023.</mixed-citation>
                <element-citation publication-type="webpage">
                    <person-group person-group-type="author">
                        <collab>United Nations Educational, Scientific and Cultural Organization</collab>
                    </person-group>
                    <source>An introduction to the UNESCO recommendation on Open Science</source>
                    <publisher-loc>Paris</publisher-loc>
                    <publisher-name>UNESCO</publisher-name>
                    <year>2022</year>
                    <comment>Available in: <ext-link ext-link-type="uri" xlink:href="https://www.unesco.org/en/open-science">https://www.unesco.org/en/open-science</ext-link></comment>
                    <date-in-citation content-type="access-date">October 1st 2023</date-in-citation>
                </element-citation>
            </ref>
            <ref id="B41">
                <mixed-citation>United Nations Educational, Scientific and Cultural Organization. <italic>Towards a global consensus on open science</italic>: report on UNESCO´s global online consultation on open science. Paris: UNESCO, 2020. Available in: https://www.unesco.org/en/open-science. Cited: October 1st 2023.</mixed-citation>
                <element-citation publication-type="webpage">
                    <person-group person-group-type="author">
                        <collab>United Nations Educational, Scientific and Cultural Organization</collab>
                    </person-group>
                    <source><italic>Towards a global consensus on open science</italic>: report on UNESCO´s global online consultation on open science</source>
                    <publisher-loc>Paris</publisher-loc>
                    <publisher-name>UNESCO</publisher-name>
                    <year>2020</year>
                    <comment>Available in: <ext-link ext-link-type="uri" xlink:href="https://www.unesco.org/en/open-science">https://www.unesco.org/en/open-science</ext-link></comment>
                    <date-in-citation content-type="access-date">October 1st 2023</date-in-citation>
                </element-citation>
            </ref>
            <ref id="B42">
                <mixed-citation>United Nations Educational, Scientific and Cultural Organization. <italic>Recommendation on Open Science</italic>. Paris: 2021. Available in: https://www.unesco.org/en/open-science. Cited: October 1st 2023.</mixed-citation>
                <element-citation publication-type="webpage">
                    <person-group person-group-type="author">
                        <collab>United Nations Educational, Scientific and Cultural Organization</collab>
                    </person-group>
                    <source>Recommendation on Open Science</source>
                    <publisher-loc>Paris</publisher-loc>
                    <year>2021</year>
                    <comment>Available in: <ext-link ext-link-type="uri" xlink:href="https://www.unesco.org/en/open-science">https://www.unesco.org/en/open-science</ext-link></comment>
                    <date-in-citation content-type="access-date">October 1st 2023</date-in-citation>
                </element-citation>
            </ref>
            <ref id="B43">
                <mixed-citation>Vicente-Saez, R.; Martinez-Fuentes, C. Open Science now: a systematic literature review for an integrated definition. <italic>Journal of Business Research</italic>, v. 88, p. 428, 2018. Doi: https://doi.org/10.1016/j.jbusres.2017.12.043</mixed-citation>
                <element-citation publication-type="journal">
                    <person-group person-group-type="author">
                        <name>
                            <surname>Vicente-Saez</surname>
                            <given-names>R</given-names>
                        </name>
                        <name>
                            <surname>Martinez-Fuentes</surname>
                            <given-names>C</given-names>
                        </name>
                    </person-group>
                    <article-title>Open Science now: a systematic literature review for an integrated definition</article-title>
                    <source>Journal of Business Research</source>
                    <volume>88</volume>
                    <fpage>428</fpage>
                    <lpage>428</lpage>
                    <year>2018</year>
                    <pub-id pub-id-type="doi">10.1016/j.jbusres.2017.12.043</pub-id>
                </element-citation>
            </ref>
            <ref id="B44">
                <mixed-citation>Walters, W. H. Data journals: incentivizing data access and documentation within the scholarly communication system. <italic>Insights</italic>, v. 33, p. 18, 2020. Doi: https://doi.org/10.1629/uksg.510.</mixed-citation>
                <element-citation publication-type="journal">
                    <person-group person-group-type="author">
                        <name>
                            <surname>Walters</surname>
                            <given-names>W. H.</given-names>
                        </name>
                    </person-group>
                    <article-title>Data journals: incentivizing data access and documentation within the scholarly communication system</article-title>
                    <source>Insights</source>
                    <volume>33</volume>
                    <fpage>18</fpage>
                    <lpage>18</lpage>
                    <year>2020</year>
                    <pub-id pub-id-type="doi">10.1629/uksg.510</pub-id>
                </element-citation>
            </ref>
            <ref id="B45">
                <mixed-citation>Wilkinson, M. D. <italic>et al.</italic> The FAIR guiding principles for scientific data management and stewardship. <italic>Scientific Data</italic>, v. 15, n. 3, p. 160018, 2016. Doi: https://doi.org/10.1038/sdata.2016.18.</mixed-citation>
                <element-citation publication-type="journal">
                    <person-group person-group-type="author">
                        <name>
                            <surname>Wilkinson</surname>
                            <given-names>M. D.</given-names>
                        </name>
                        <etal/>
                    </person-group>
                    <article-title>The FAIR guiding principles for scientific data management and stewardship</article-title>
                    <source>Scientific Data</source>
                    <volume>15</volume>
                    <issue>3</issue>
                    <fpage>160018</fpage>
                    <lpage>160018</lpage>
                    <year>2016</year>
                    <pub-id pub-id-type="doi">10.1038/sdata.2016.18</pub-id>
                </element-citation>
            </ref>
            <ref id="B46">
                <mixed-citation>Zheng, S. <italic>et al.</italic> DrugComb update: a more comprehensive drug sensitivity data repository and analysis portal. <italic>Nucleic Acids Research</italic>, v. 49, n. 1, p. 174-184, 2021. Doi: https://doi.org/10.1093/nar/gkab438.</mixed-citation>
                <element-citation publication-type="journal">
                    <person-group person-group-type="author">
                        <name>
                            <surname>Zheng</surname>
                            <given-names>S.</given-names>
                        </name>
                        <etal/>
                    </person-group>
                    <article-title>DrugComb update: a more comprehensive drug sensitivity data repository and analysis portal</article-title>
                    <source>Nucleic Acids Research</source>
                    <volume>49</volume>
                    <issue>1</issue>
                    <fpage>174</fpage>
                    <lpage>184</lpage>
                    <year>2021</year>
                    <pub-id pub-id-type="doi">10.1093/nar/gkab438</pub-id>
                </element-citation>
            </ref>
        </ref-list>
    </back>
</article>
