{ "cells": [ { "cell_type": "code", "execution_count": 1, "metadata": {}, "outputs": [], "source": [ "import ast\n", "import csv\n", "import json\n", "\n", "import numpy as np\n", "import pandas as pd\n", "\n", "pd.set_option('display.max_columns', None)" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "# Loading data from registries" ] }, { "cell_type": "code", "execution_count": 2, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
FAIRsharing_idFAIRsharing_typeFAIRsharing_attributes.created-atFAIRsharing_attributes.updated-atFAIRsharing_attributes.metadata.doiFAIRsharing_attributes.metadata.nameFAIRsharing_attributes.metadata.statusFAIRsharing_attributes.metadata.contactsFAIRsharing_attributes.metadata.homepageFAIRsharing_attributes.metadata.identifierFAIRsharing_attributes.metadata.descriptionFAIRsharing_attributes.metadata.abbreviationFAIRsharing_attributes.metadata.support-linksFAIRsharing_attributes.metadata.year-creationFAIRsharing_attributes.metadata.data-processesFAIRsharing_attributes.metadata.cross-referencesFAIRsharing_attributes.legacy-idsFAIRsharing_attributes.fairsharing-registryFAIRsharing_attributes.record-typeFAIRsharing_attributes.subjectsFAIRsharing_attributes.domainsFAIRsharing_attributes.taxonomiesFAIRsharing_attributes.user-defined-tagsFAIRsharing_attributes.countriesFAIRsharing_attributes.nameFAIRsharing_attributes.abbreviationFAIRsharing_attributes.urlFAIRsharing_attributes.doiFAIRsharing_attributes.fairsharing-licenceFAIRsharing_attributes.descriptionFAIRsharing_attributes.publicationsFAIRsharing_attributes.licence-linksFAIRsharing_attributes.url-for-logoFAIRsharing_attributes.metadata.citationsFAIRsharing_attributes.metadata.associated-toolsFAIRsharing_attributes.metadata.deprecation-reasonFAIRsharing_attributes.metadata.data-access-condition.typeFAIRsharing_attributes.metadata.data-contact-informationFAIRsharing_attributes.metadata.data-deposition-condition.urlFAIRsharing_attributes.metadata.data-deposition-condition.typeFAIRsharing_attributes.metadata.deprecation-dateFAIRsharing_attributes.metadata.access-pointsFAIRsharing_attributes.metadata.data-access-condition.urlFAIRsharing_attributes.metadata.resource-sustainability.urlFAIRsharing_attributes.metadata.resource-sustainability.nameFAIRsharing_attributes.metadata.data-preservation-policy.urlFAIRsharing_attributes.metadata.data-preservation-policy.nameFAIRsharing_attributes.metadata.data-access-for-pre-publication-
reviewFAIRsharing_attributes.metadata.data-versioningFAIRsharing_attributes.metadata.data-curation.typeFAIRsharing_attributes.metadata.data-curation.urlFAIRsharing_attributes.metadata.citation-to-related-publicationsFAIRsharing_attributes.metadata.tombstoneFAIRsharing_unique_id
03226fairsharing-records2020-12-09T11:53:44.000Z2022-02-08T10:42:36.452Z10.25504/FAIRsharing.d6423bWDC Sunspot Index and Long-term Solar Observat...ready[{'contact-name': 'Frédéric Clette', 'contact-...http://sidc.be/silso/home3226The WDC-SILSO is an activity of the Operationa...WDC-SILSO[{'url': 'http://www.sidc.be/silso/taxonomy/te...2013.0[{'url': 'http://www.sidc.be/silso/datafiles',...[{'url': 'https://www.re3data.org/repository/r...[biodbcore-001740, bsg-d001740]Databaserepository[Electromagnetism, Astrophysics and Astronomy,...[Climate, Observation design][Not applicable][Climate change, earth observation, Electromag...[Belgium]FAIRsharing record for: WDC Sunspot Index and ...WDC-SILSOhttps://fairsharing.org/10.25504/FAIRsharing.d...10.25504/FAIRsharing.d6423bhttps://creativecommons.org/licenses/by-sa/4.0...This FAIRsharing record describes: The WDC-SIL...[][{'licence-name': 'SILSO legal notices', 'lice...NoneNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNFAIRsharing_3226
12114fairsharing-records2014-11-04T15:23:40.000Z2022-01-21T14:39:02.195Z10.25504/FAIRsharing.p06nmeBiological Magnetic Resonance Data Bankready[{'contact-name': 'Helpdesk', 'contact-email':...https://bmrb.io/2114BMRB collects, annotates, archives, and dissem...BMRB[{'url': 'https://bmrb.io/bmrb/news/', 'name':...1988.0[{'url': 'https://bmrb.io/data_library/rsync.s...[{'url': 'https://www.re3data.org/repository/r...[biodbcore-000584, bsg-d000584]Databaserepository[Structural Biology][Molecular structure, Protein structure, Pepti...[All][][United States]FAIRsharing record for: Biological Magnetic Re...BMRBhttps://fairsharing.org/10.25504/FAIRsharing.p...10.25504/FAIRsharing.p06nmehttps://creativecommons.org/licenses/by-sa/4.0...This FAIRsharing record describes: BMRB collec...[{'id': 552, 'pubmed_id': 18288446, 'title': '...[{'licence-name': 'wwPDB Privacy and Usage Pol...None[{'doi': '10.1093/nar/gkm957', 'pubmed-id': 17...[{'url': 'https://bmrb.io/validate/', 'name': ...openyeshttps://bmrb.io/deposit/openNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNFAIRsharing_2114
23022fairsharing-records2020-06-17T10:25:30.000Z2022-02-08T10:41:04.073Z10.25504/FAIRsharing.8b7a2fFisheries and Oceans Canada Pacific Region Dat...ready[{'contact-name': 'Peter Chandler', 'contact-e...http://www.pac.dfo-mpo.gc.ca/science/oceans/da...3022The Institute of Ocean Sciences (IOS)/Ocean Sc...None[{'url': 'DFO.PAC.SCI.IOSData-DonneesISO.SCI.P...NaN[{'name': 'Users must contact the Senior Analy...[{'url': 'https://www.re3data.org/repository/r...[biodbcore-001530, bsg-d001530]Databaserepository[Environmental Science, Meteorology, Earth Sci...[Climate][Not applicable][Salinity, Temperature][Canada]FAIRsharing record for: Fisheries and Oceans C...Nonehttps://fairsharing.org/10.25504/FAIRsharing.8...10.25504/FAIRsharing.8b7a2fhttps://creativecommons.org/licenses/by-sa/4.0...This FAIRsharing record describes: The Institu...[][{'licence-name': 'Fisheries and Oceans Canada...NoneNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNFAIRsharing_3022
32998fairsharing-records2020-05-21T07:42:30.000Z2022-02-08T10:40:19.531Z10.25504/FAIRsharing.e08886Climate Prediction Centerready[{'contact-name': 'Jon Hoopingarner', 'contact...https://www.cpc.ncep.noaa.gov/2998The Climate Prediction Center (CPC) produces o...CPC[{'url': 'https://www.cpc.ncep.noaa.gov/commen...1970.0[{'url': 'https://www.cpc.ncep.noaa.gov/', 'na...[{'url': 'https://www.re3data.org/repository/r...[biodbcore-001504, bsg-d001504]Databaserepository[Hydrogeology, Geography, Meteorology, Geodesy...[Climate][Not applicable][Forecasting, weather][United States]FAIRsharing record for: Climate Prediction CenterCPChttps://fairsharing.org/10.25504/FAIRsharing.e...10.25504/FAIRsharing.e08886https://creativecommons.org/licenses/by-sa/4.0...This FAIRsharing record describes: The Climate...[][{'licence-name': 'National Weather Service Di...NoneNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNFAIRsharing_2998
42301fairsharing-records2016-06-03T14:54:08.000Z2021-11-24T13:17:51.201Z10.25504/FAIRsharing.meh9wzAcytostelium Gene Databasedeprecated[{'contact-name': 'Acytostelium genome consort...http://cosmos.bot.kyoto-u.ac.jp/acytodb//cgi-b...2301Genome and transcriptome database of Acytostel...NaNNaN2008.0NaNNaN[biodbcore-000775, bsg-d000775]Databaserepository[Genomics, Life Science, Transcriptomics][DNA sequence data, Gene model annotation][Acytostelium subglobosum][][United Kingdom, Japan]FAIRsharing record for: Acytostelium Gene Data...Nonehttps://fairsharing.org/10.25504/FAIRsharing.m...10.25504/FAIRsharing.meh9wzhttps://creativecommons.org/licenses/by-sa/4.0...This FAIRsharing record describes: Genome and ...[{'id': 1139, 'pubmed_id': 25758444, 'title': ...[]NoneNaNNaNThis resource is no longer available at the st...NaNNaNNaNNaN2021-9-17NaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNFAIRsharing_2301
\n", "
" ], "text/plain": [ " FAIRsharing_id FAIRsharing_type FAIRsharing_attributes.created-at \\\n", "0 3226 fairsharing-records 2020-12-09T11:53:44.000Z \n", "1 2114 fairsharing-records 2014-11-04T15:23:40.000Z \n", "2 3022 fairsharing-records 2020-06-17T10:25:30.000Z \n", "3 2998 fairsharing-records 2020-05-21T07:42:30.000Z \n", "4 2301 fairsharing-records 2016-06-03T14:54:08.000Z \n", "\n", " FAIRsharing_attributes.updated-at FAIRsharing_attributes.metadata.doi \\\n", "0 2022-02-08T10:42:36.452Z 10.25504/FAIRsharing.d6423b \n", "1 2022-01-21T14:39:02.195Z 10.25504/FAIRsharing.p06nme \n", "2 2022-02-08T10:41:04.073Z 10.25504/FAIRsharing.8b7a2f \n", "3 2022-02-08T10:40:19.531Z 10.25504/FAIRsharing.e08886 \n", "4 2021-11-24T13:17:51.201Z 10.25504/FAIRsharing.meh9wz \n", "\n", " FAIRsharing_attributes.metadata.name \\\n", "0 WDC Sunspot Index and Long-term Solar Observat... \n", "1 Biological Magnetic Resonance Data Bank \n", "2 Fisheries and Oceans Canada Pacific Region Dat... \n", "3 Climate Prediction Center \n", "4 Acytostelium Gene Database \n", "\n", " FAIRsharing_attributes.metadata.status \\\n", "0 ready \n", "1 ready \n", "2 ready \n", "3 ready \n", "4 deprecated \n", "\n", " FAIRsharing_attributes.metadata.contacts \\\n", "0 [{'contact-name': 'Frédéric Clette', 'contact-... \n", "1 [{'contact-name': 'Helpdesk', 'contact-email':... \n", "2 [{'contact-name': 'Peter Chandler', 'contact-e... \n", "3 [{'contact-name': 'Jon Hoopingarner', 'contact... \n", "4 [{'contact-name': 'Acytostelium genome consort... \n", "\n", " FAIRsharing_attributes.metadata.homepage \\\n", "0 http://sidc.be/silso/home \n", "1 https://bmrb.io/ \n", "2 http://www.pac.dfo-mpo.gc.ca/science/oceans/da... \n", "3 https://www.cpc.ncep.noaa.gov/ \n", "4 http://cosmos.bot.kyoto-u.ac.jp/acytodb//cgi-b... 
\n", "\n", " FAIRsharing_attributes.metadata.identifier \\\n", "0 3226 \n", "1 2114 \n", "2 3022 \n", "3 2998 \n", "4 2301 \n", "\n", " FAIRsharing_attributes.metadata.description \\\n", "0 The WDC-SILSO is an activity of the Operationa... \n", "1 BMRB collects, annotates, archives, and dissem... \n", "2 The Institute of Ocean Sciences (IOS)/Ocean Sc... \n", "3 The Climate Prediction Center (CPC) produces o... \n", "4 Genome and transcriptome database of Acytostel... \n", "\n", " FAIRsharing_attributes.metadata.abbreviation \\\n", "0 WDC-SILSO \n", "1 BMRB \n", "2 None \n", "3 CPC \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.support-links \\\n", "0 [{'url': 'http://www.sidc.be/silso/taxonomy/te... \n", "1 [{'url': 'https://bmrb.io/bmrb/news/', 'name':... \n", "2 [{'url': 'DFO.PAC.SCI.IOSData-DonneesISO.SCI.P... \n", "3 [{'url': 'https://www.cpc.ncep.noaa.gov/commen... \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.year-creation \\\n", "0 2013.0 \n", "1 1988.0 \n", "2 NaN \n", "3 1970.0 \n", "4 2008.0 \n", "\n", " FAIRsharing_attributes.metadata.data-processes \\\n", "0 [{'url': 'http://www.sidc.be/silso/datafiles',... \n", "1 [{'url': 'https://bmrb.io/data_library/rsync.s... \n", "2 [{'name': 'Users must contact the Senior Analy... \n", "3 [{'url': 'https://www.cpc.ncep.noaa.gov/', 'na... \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.cross-references \\\n", "0 [{'url': 'https://www.re3data.org/repository/r... \n", "1 [{'url': 'https://www.re3data.org/repository/r... \n", "2 [{'url': 'https://www.re3data.org/repository/r... \n", "3 [{'url': 'https://www.re3data.org/repository/r... 
\n", "4 NaN \n", "\n", " FAIRsharing_attributes.legacy-ids \\\n", "0 [biodbcore-001740, bsg-d001740] \n", "1 [biodbcore-000584, bsg-d000584] \n", "2 [biodbcore-001530, bsg-d001530] \n", "3 [biodbcore-001504, bsg-d001504] \n", "4 [biodbcore-000775, bsg-d000775] \n", "\n", " FAIRsharing_attributes.fairsharing-registry \\\n", "0 Database \n", "1 Database \n", "2 Database \n", "3 Database \n", "4 Database \n", "\n", " FAIRsharing_attributes.record-type \\\n", "0 repository \n", "1 repository \n", "2 repository \n", "3 repository \n", "4 repository \n", "\n", " FAIRsharing_attributes.subjects \\\n", "0 [Electromagnetism, Astrophysics and Astronomy,... \n", "1 [Structural Biology] \n", "2 [Environmental Science, Meteorology, Earth Sci... \n", "3 [Hydrogeology, Geography, Meteorology, Geodesy... \n", "4 [Genomics, Life Science, Transcriptomics] \n", "\n", " FAIRsharing_attributes.domains \\\n", "0 [Climate, Observation design] \n", "1 [Molecular structure, Protein structure, Pepti... \n", "2 [Climate] \n", "3 [Climate] \n", "4 [DNA sequence data, Gene model annotation] \n", "\n", " FAIRsharing_attributes.taxonomies \\\n", "0 [Not applicable] \n", "1 [All] \n", "2 [Not applicable] \n", "3 [Not applicable] \n", "4 [Acytostelium subglobosum] \n", "\n", " FAIRsharing_attributes.user-defined-tags \\\n", "0 [Climate change, earth observation, Electromag... \n", "1 [] \n", "2 [Salinity, Temperature] \n", "3 [Forecasting, weather] \n", "4 [] \n", "\n", " FAIRsharing_attributes.countries \\\n", "0 [Belgium] \n", "1 [United States] \n", "2 [Canada] \n", "3 [United States] \n", "4 [United Kingdom, Japan] \n", "\n", " FAIRsharing_attributes.name \\\n", "0 FAIRsharing record for: WDC Sunspot Index and ... \n", "1 FAIRsharing record for: Biological Magnetic Re... \n", "2 FAIRsharing record for: Fisheries and Oceans C... \n", "3 FAIRsharing record for: Climate Prediction Center \n", "4 FAIRsharing record for: Acytostelium Gene Data... 
\n", "\n", " FAIRsharing_attributes.abbreviation \\\n", "0 WDC-SILSO \n", "1 BMRB \n", "2 None \n", "3 CPC \n", "4 None \n", "\n", " FAIRsharing_attributes.url \\\n", "0 https://fairsharing.org/10.25504/FAIRsharing.d... \n", "1 https://fairsharing.org/10.25504/FAIRsharing.p... \n", "2 https://fairsharing.org/10.25504/FAIRsharing.8... \n", "3 https://fairsharing.org/10.25504/FAIRsharing.e... \n", "4 https://fairsharing.org/10.25504/FAIRsharing.m... \n", "\n", " FAIRsharing_attributes.doi \\\n", "0 10.25504/FAIRsharing.d6423b \n", "1 10.25504/FAIRsharing.p06nme \n", "2 10.25504/FAIRsharing.8b7a2f \n", "3 10.25504/FAIRsharing.e08886 \n", "4 10.25504/FAIRsharing.meh9wz \n", "\n", " FAIRsharing_attributes.fairsharing-licence \\\n", "0 https://creativecommons.org/licenses/by-sa/4.0... \n", "1 https://creativecommons.org/licenses/by-sa/4.0... \n", "2 https://creativecommons.org/licenses/by-sa/4.0... \n", "3 https://creativecommons.org/licenses/by-sa/4.0... \n", "4 https://creativecommons.org/licenses/by-sa/4.0... \n", "\n", " FAIRsharing_attributes.description \\\n", "0 This FAIRsharing record describes: The WDC-SIL... \n", "1 This FAIRsharing record describes: BMRB collec... \n", "2 This FAIRsharing record describes: The Institu... \n", "3 This FAIRsharing record describes: The Climate... \n", "4 This FAIRsharing record describes: Genome and ... \n", "\n", " FAIRsharing_attributes.publications \\\n", "0 [] \n", "1 [{'id': 552, 'pubmed_id': 18288446, 'title': '... \n", "2 [] \n", "3 [] \n", "4 [{'id': 1139, 'pubmed_id': 25758444, 'title': ... \n", "\n", " FAIRsharing_attributes.licence-links \\\n", "0 [{'licence-name': 'SILSO legal notices', 'lice... \n", "1 [{'licence-name': 'wwPDB Privacy and Usage Pol... \n", "2 [{'licence-name': 'Fisheries and Oceans Canada... \n", "3 [{'licence-name': 'National Weather Service Di... 
\n", "4 [] \n", "\n", " FAIRsharing_attributes.url-for-logo \\\n", "0 None \n", "1 None \n", "2 None \n", "3 None \n", "4 None \n", "\n", " FAIRsharing_attributes.metadata.citations \\\n", "0 NaN \n", "1 [{'doi': '10.1093/nar/gkm957', 'pubmed-id': 17... \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.associated-tools \\\n", "0 NaN \n", "1 [{'url': 'https://bmrb.io/validate/', 'name': ... \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.deprecation-reason \\\n", "0 NaN \n", "1 \n", "2 NaN \n", "3 NaN \n", "4 This resource is no longer available at the st... \n", "\n", " FAIRsharing_attributes.metadata.data-access-condition.type \\\n", "0 NaN \n", "1 open \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.data-contact-information \\\n", "0 NaN \n", "1 yes \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.data-deposition-condition.url \\\n", "0 NaN \n", "1 https://bmrb.io/deposit/ \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.data-deposition-condition.type \\\n", "0 NaN \n", "1 open \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.deprecation-date \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 2021-9-17 \n", "\n", " FAIRsharing_attributes.metadata.access-points \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.data-access-condition.url \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.resource-sustainability.url \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.resource-sustainability.name \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.data-preservation-policy.url \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " 
# Load the FAIRsharing API dump, which stores one JSON document per line,
# and flatten it into a DataFrame with one row per record.
#
# - The encoding is pinned so that non-ASCII text (e.g. contact names) decodes
#   identically on every platform instead of following the locale default.
#   NOTE(review): assumes the dump was written as UTF-8 (the JSON default) - confirm.
# - Iterating the file handle splits on real newlines only. str.splitlines()
#   additionally splits on characters such as U+2028 / U+2029 / U+0085, which
#   may appear unescaped inside JSON strings and would cut a record in half.
# - Whitespace-only lines (e.g. a trailing blank line) are skipped rather than
#   handed to json.loads, which would raise on them.
with open('../data/raw/fairsharing_dump_api_02_2022.json', encoding='utf-8') as f:
    lines = [line.rstrip('\n') for line in f if line.strip()]

# Parse every record exactly once, then let json_normalize expand nested
# objects into dotted column names (e.g. attributes.metadata.doi).
fairsharing_records = [json.loads(line) for line in lines]
fairsharing_df = pd.json_normalize(fairsharing_records)

# Build the registry-qualified identifier before prefixing, so that it ends up
# as the column 'FAIRsharing_unique_id'. astype(str) keeps the concatenation
# valid even if the ids were ever delivered as numbers instead of strings.
fairsharing_df['unique_id'] = 'FAIRsharing_' + fairsharing_df['id'].astype(str)

# Namespace every column with the registry name.
fairsharing_df = fairsharing_df.add_prefix('FAIRsharing_')
fairsharing_df.head()
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
re3data_orgIdentifierre3data_repositoryNamere3data_repositoryName.languagere3data_additionalNamere3data_repositoryURLre3data_repositoryIdentifierre3data_repositoryContactre3data_descriptionre3data_description.languagere3data_typere3data_sizere3data_startDatere3data_endDatere3data_repositoryLanguagere3data_subjectre3data_missionStatementURLre3data_contentTypere3data_providerTypere3data_keywordre3data_institutionre3data_policyre3data_databaseAccessre3data_databaseLicensere3data_dataAccessre3data_dataLicensere3data_dataUploadTypere3data_dataUploadLicensere3data_softwarere3data_versioningre3data_apire3data_pidSystemre3data_citationGuidelineURLre3data_aidSystemre3data_enhancedPublicationre3data_qualityManagementre3data_certificatere3data_metadataStandardre3data_syndicationre3data_remarksre3data_entryDatere3data_lastUpdatere3data_unique_id
0r3d100000001Odum Institute Archive Dataverseeng[]https://dataverse.unc.edu/dataverse/odum[][\"https://dataverse.unc.edu/dataverse/odum#\", ...The Odum Institute Archive Dataverse contains ...eng[disciplinary]{\"size\": \"13 dataverses; 3.050 datasets\", \"upd...NaNNaN[\"eng\"][{'name': '1 Humanities and Social Sciences', ...NaN[{'name': 'Databases', 'scheme': 'parse'}, {'n...[dataProvider][FAIR, Middle East, crime, demography, economy...[{'institutionName': 'Odum Institute for Resea...[{\"policyName\": \"Collection Development Policy...{\"databaseAccessType\": \"open\", \"databaseAcces...[{\"databaseLicenseName\": \"CC0\", \"databaseLicen...[{\"dataAccessType\": \"embargoed\", \"dataAccessRe...[{\"dataLicenseName\": \"CC\", \"dataLicenseURL\": \"...restricted[][\"DataVerse\"]NaN{}[\"DOI\"]NaN[]unknownyes[\"other\"][{\"metadataStandardName\": \"DDI - Data Document...{}Odum Dataverse is covered by Thomson Reuters D...2013-06-102021-07-06re3data_r3d100000001
1r3d100000002Access to Archival Databaseseng[{'additionalName': 'AAD', 'additionalNameLang...https://aad.archives.gov/aad/[RRID:SCR_010479, RRID:nlx_157752][\"https://www.archives.gov/contact\"]You will find in the Access to Archival Databa...eng[disciplinary]{\"size\": \"\", \"updatedp\": \"\"}1985NaN[\"eng\", \"spa\"][{'name': '1 Humanities and Social Sciences', ...https://www.archives.gov/publications/general-...[{'name': 'Images', 'scheme': 'parse'}, {'name...[dataProvider][US History][{'institutionName': 'The U.S. National Archiv...[{\"policyName\": \"Contribution Policy\", \"policy...{\"databaseAccessType\": \"open\", \"databaseAcces...[][{\"dataAccessType\": \"open\", \"dataAccessRestric...[{\"dataLicenseName\": \"Copyrights\", \"dataLicens...restricted[][\"unknown\"]no{\"api\": \"https://www.archives.gov/developer#to...[\"none\"]https://aad.archives.gov/aad/help/getting-star...[]unknownunknown[][]{\"syndication\": \"http://www.archives.gov/socia...NaN2012-07-042021-05-25re3data_r3d100000002
2r3d100000004Datenbank Gesprochenes Deutschdeu[{'additionalName': 'DGD', 'additionalNameLang...https://dgd.ids-mannheim.de/[][\"dgd@ids-mannheim.de\"]The \"Database for Spoken German (DGD)\" is a co...eng[disciplinary]{\"size\": \"34 corpora\", \"updatedp\": \"2020-02-03\"}2012NaN[\"deu\"][{'name': '1 Humanities and Social Sciences', ...https://dgd.ids-mannheim.de/dgd/pragdb.dgd_ext...[{'name': 'Audiovisual data', 'scheme': 'parse...[dataProvider, serviceProvider][Australian German, FOLK, German dialects, Pfe...[{'institutionName': 'Institut für Deutsche Sp...[{\"policyName\": \"Erfurter Aufruf zur Sicherung...{\"databaseAccessType\": \"restricted\", \"databas...[][{\"dataAccessType\": \"restricted\", \"dataAccessR...[{\"dataLicenseName\": \"other\", \"dataLicenseURL\"...restricted[][\"other\"]yes{}[\"none\"]http://agd.ids-mannheim.de/konditionen.shtml[]unknownunknown[\"RatSWD\"][]{}NaN2012-07-202020-08-27re3data_r3d100000004
3r3d100000005UNC Dataverseeng[{'additionalName': 'University of North Carol...https://dataverse.unc.edu/[FAIRsharing_doi:10.25504/FAIRsharing.pS2p8c][\"https://dataverse.unc.edu/\", \"odumarchive@un...UNC Dataverse is an open-source repository sof...eng[institutional]{\"size\": \"186 dataverses; 25.272 studies; 229....2011NaN[\"eng\"][{'name': '1 Humanities and Social Sciences', ...https://odum.unc.edu/about/mission-vision/[{'name': 'Archived data', 'scheme': 'parse'},...[dataProvider, serviceProvider][FAIR, census, demographic survey, demography,...[{'institutionName': 'Odum Institute for Resea...[{\"policyName\": \"Collection Development Policy...{\"databaseAccessType\": \"open\", \"databaseAcces...[][{\"dataAccessType\": \"open\", \"dataAccessRestric...[{\"dataLicenseName\": \"CC\", \"dataLicenseURL\": \"...restricted[{\"dataUploadLicenseName\": \"Data Deposit Form\"...[\"DataVerse\"]yes{\"api\": \"https://guides.dataverse.org/en/lates...[\"ARK\", \"DOI\", \"PURL\", \"URN\", \"hdl\"]https://dataverse.org/best-practices/data-cita...[]unknownyes[][{\"metadataStandardName\": \"DDI - Data Document...{}UNC Dataverse is covered by Clarivate Data Cit...2012-07-232021-10-25re3data_r3d100000005
4r3d100000006Archaeology Data Serviceeng[{'additionalName': 'ADS', 'additionalNameLang...https://archaeologydataservice.ac.uk/[FAIRsharing_doi:10.25504/FAIRsharing.hm1mfg][\"help@archaeologydataservice.ac.uk\", \"https:/...The ADS is an accredited digital repository fo...eng[disciplinary]{\"size\": \"1837 results\", \"updatedp\": \"2020-05-...1996-10-01NaN[\"eng\"][{'name': '1 Humanities and Social Sciences', ...https://archaeologydataservice.ac.uk/about/our...[{'name': 'Archived data', 'scheme': 'parse'},...[dataProvider, serviceProvider][FAIR, archaeology, cultural heritage, prehist...[{'institutionName': 'Arts and Humanities Rese...[{\"policyName\": \"ADS Guides to good practice\",...{\"databaseAccessType\": \"open\", \"databaseAcces...[{\"databaseLicenseName\": \"CC\", \"databaseLicens...[{\"dataAccessType\": \"open\", \"dataAccessRestric...[{\"dataLicenseName\": \"CC\", \"dataLicenseURL\": \"...restricted[{\"dataUploadLicenseName\": \"Guidelines for Dep...[\"other\"]yes{\"api\": \"https://archaeologydataservice.ac.uk/...[\"DOI\"]https://archaeologydataservice.ac.uk/advice/te...[]unknownyes[\"other\"][{\"metadataStandardName\": \"DataCite Metadata S...{\"syndication\": \"https://archaeologydataservic...ADS is covered by Clarivate Data Citation Inde...2012-07-232021-09-02re3data_r3d100000006
\n", "
" ], "text/plain": [ " re3data_orgIdentifier re3data_repositoryName \\\n", "0 r3d100000001 Odum Institute Archive Dataverse \n", "1 r3d100000002 Access to Archival Databases \n", "2 r3d100000004 Datenbank Gesprochenes Deutsch \n", "3 r3d100000005 UNC Dataverse \n", "4 r3d100000006 Archaeology Data Service \n", "\n", " re3data_repositoryName.language \\\n", "0 eng \n", "1 eng \n", "2 deu \n", "3 eng \n", "4 eng \n", "\n", " re3data_additionalName \\\n", "0 [] \n", "1 [{'additionalName': 'AAD', 'additionalNameLang... \n", "2 [{'additionalName': 'DGD', 'additionalNameLang... \n", "3 [{'additionalName': 'University of North Carol... \n", "4 [{'additionalName': 'ADS', 'additionalNameLang... \n", "\n", " re3data_repositoryURL \\\n", "0 https://dataverse.unc.edu/dataverse/odum \n", "1 https://aad.archives.gov/aad/ \n", "2 https://dgd.ids-mannheim.de/ \n", "3 https://dataverse.unc.edu/ \n", "4 https://archaeologydataservice.ac.uk/ \n", "\n", " re3data_repositoryIdentifier \\\n", "0 [] \n", "1 [RRID:SCR_010479, RRID:nlx_157752] \n", "2 [] \n", "3 [FAIRsharing_doi:10.25504/FAIRsharing.pS2p8c] \n", "4 [FAIRsharing_doi:10.25504/FAIRsharing.hm1mfg] \n", "\n", " re3data_repositoryContact \\\n", "0 [\"https://dataverse.unc.edu/dataverse/odum#\", ... \n", "1 [\"https://www.archives.gov/contact\"] \n", "2 [\"dgd@ids-mannheim.de\"] \n", "3 [\"https://dataverse.unc.edu/\", \"odumarchive@un... \n", "4 [\"help@archaeologydataservice.ac.uk\", \"https:/... \n", "\n", " re3data_description \\\n", "0 The Odum Institute Archive Dataverse contains ... \n", "1 You will find in the Access to Archival Databa... \n", "2 The \"Database for Spoken German (DGD)\" is a co... \n", "3 UNC Dataverse is an open-source repository sof... \n", "4 The ADS is an accredited digital repository fo... 
\n", "\n", " re3data_description.language re3data_type \\\n", "0 eng [disciplinary] \n", "1 eng [disciplinary] \n", "2 eng [disciplinary] \n", "3 eng [institutional] \n", "4 eng [disciplinary] \n", "\n", " re3data_size re3data_startDate \\\n", "0 {\"size\": \"13 dataverses; 3.050 datasets\", \"upd... NaN \n", "1 {\"size\": \"\", \"updatedp\": \"\"} 1985 \n", "2 {\"size\": \"34 corpora\", \"updatedp\": \"2020-02-03\"} 2012 \n", "3 {\"size\": \"186 dataverses; 25.272 studies; 229.... 2011 \n", "4 {\"size\": \"1837 results\", \"updatedp\": \"2020-05-... 1996-10-01 \n", "\n", " re3data_endDate re3data_repositoryLanguage \\\n", "0 NaN [\"eng\"] \n", "1 NaN [\"eng\", \"spa\"] \n", "2 NaN [\"deu\"] \n", "3 NaN [\"eng\"] \n", "4 NaN [\"eng\"] \n", "\n", " re3data_subject \\\n", "0 [{'name': '1 Humanities and Social Sciences', ... \n", "1 [{'name': '1 Humanities and Social Sciences', ... \n", "2 [{'name': '1 Humanities and Social Sciences', ... \n", "3 [{'name': '1 Humanities and Social Sciences', ... \n", "4 [{'name': '1 Humanities and Social Sciences', ... \n", "\n", " re3data_missionStatementURL \\\n", "0 NaN \n", "1 https://www.archives.gov/publications/general-... \n", "2 https://dgd.ids-mannheim.de/dgd/pragdb.dgd_ext... \n", "3 https://odum.unc.edu/about/mission-vision/ \n", "4 https://archaeologydataservice.ac.uk/about/our... \n", "\n", " re3data_contentType \\\n", "0 [{'name': 'Databases', 'scheme': 'parse'}, {'n... \n", "1 [{'name': 'Images', 'scheme': 'parse'}, {'name... \n", "2 [{'name': 'Audiovisual data', 'scheme': 'parse... \n", "3 [{'name': 'Archived data', 'scheme': 'parse'},... \n", "4 [{'name': 'Archived data', 'scheme': 'parse'},... \n", "\n", " re3data_providerType \\\n", "0 [dataProvider] \n", "1 [dataProvider] \n", "2 [dataProvider, serviceProvider] \n", "3 [dataProvider, serviceProvider] \n", "4 [dataProvider, serviceProvider] \n", "\n", " re3data_keyword \\\n", "0 [FAIR, Middle East, crime, demography, economy... 
\n", "1 [US History] \n", "2 [Australian German, FOLK, German dialects, Pfe... \n", "3 [FAIR, census, demographic survey, demography,... \n", "4 [FAIR, archaeology, cultural heritage, prehist... \n", "\n", " re3data_institution \\\n", "0 [{'institutionName': 'Odum Institute for Resea... \n", "1 [{'institutionName': 'The U.S. National Archiv... \n", "2 [{'institutionName': 'Institut für Deutsche Sp... \n", "3 [{'institutionName': 'Odum Institute for Resea... \n", "4 [{'institutionName': 'Arts and Humanities Rese... \n", "\n", " re3data_policy \\\n", "0 [{\"policyName\": \"Collection Development Policy... \n", "1 [{\"policyName\": \"Contribution Policy\", \"policy... \n", "2 [{\"policyName\": \"Erfurter Aufruf zur Sicherung... \n", "3 [{\"policyName\": \"Collection Development Policy... \n", "4 [{\"policyName\": \"ADS Guides to good practice\",... \n", "\n", " re3data_databaseAccess \\\n", "0 {\"databaseAccessType\": \"open\", \"databaseAcces... \n", "1 {\"databaseAccessType\": \"open\", \"databaseAcces... \n", "2 {\"databaseAccessType\": \"restricted\", \"databas... \n", "3 {\"databaseAccessType\": \"open\", \"databaseAcces... \n", "4 {\"databaseAccessType\": \"open\", \"databaseAcces... \n", "\n", " re3data_databaseLicense \\\n", "0 [{\"databaseLicenseName\": \"CC0\", \"databaseLicen... \n", "1 [] \n", "2 [] \n", "3 [] \n", "4 [{\"databaseLicenseName\": \"CC\", \"databaseLicens... \n", "\n", " re3data_dataAccess \\\n", "0 [{\"dataAccessType\": \"embargoed\", \"dataAccessRe... \n", "1 [{\"dataAccessType\": \"open\", \"dataAccessRestric... \n", "2 [{\"dataAccessType\": \"restricted\", \"dataAccessR... \n", "3 [{\"dataAccessType\": \"open\", \"dataAccessRestric... \n", "4 [{\"dataAccessType\": \"open\", \"dataAccessRestric... \n", "\n", " re3data_dataLicense re3data_dataUploadType \\\n", "0 [{\"dataLicenseName\": \"CC\", \"dataLicenseURL\": \"... restricted \n", "1 [{\"dataLicenseName\": \"Copyrights\", \"dataLicens... 
restricted \n", "2 [{\"dataLicenseName\": \"other\", \"dataLicenseURL\"... restricted \n", "3 [{\"dataLicenseName\": \"CC\", \"dataLicenseURL\": \"... restricted \n", "4 [{\"dataLicenseName\": \"CC\", \"dataLicenseURL\": \"... restricted \n", "\n", " re3data_dataUploadLicense re3data_software \\\n", "0 [] [\"DataVerse\"] \n", "1 [] [\"unknown\"] \n", "2 [] [\"other\"] \n", "3 [{\"dataUploadLicenseName\": \"Data Deposit Form\"... [\"DataVerse\"] \n", "4 [{\"dataUploadLicenseName\": \"Guidelines for Dep... [\"other\"] \n", "\n", " re3data_versioning re3data_api \\\n", "0 NaN {} \n", "1 no {\"api\": \"https://www.archives.gov/developer#to... \n", "2 yes {} \n", "3 yes {\"api\": \"https://guides.dataverse.org/en/lates... \n", "4 yes {\"api\": \"https://archaeologydataservice.ac.uk/... \n", "\n", " re3data_pidSystem \\\n", "0 [\"DOI\"] \n", "1 [\"none\"] \n", "2 [\"none\"] \n", "3 [\"ARK\", \"DOI\", \"PURL\", \"URN\", \"hdl\"] \n", "4 [\"DOI\"] \n", "\n", " re3data_citationGuidelineURL re3data_aidSystem \\\n", "0 NaN [] \n", "1 https://aad.archives.gov/aad/help/getting-star... [] \n", "2 http://agd.ids-mannheim.de/konditionen.shtml [] \n", "3 https://dataverse.org/best-practices/data-cita... [] \n", "4 https://archaeologydataservice.ac.uk/advice/te... [] \n", "\n", " re3data_enhancedPublication re3data_qualityManagement re3data_certificate \\\n", "0 unknown yes [\"other\"] \n", "1 unknown unknown [] \n", "2 unknown unknown [\"RatSWD\"] \n", "3 unknown yes [] \n", "4 unknown yes [\"other\"] \n", "\n", " re3data_metadataStandard \\\n", "0 [{\"metadataStandardName\": \"DDI - Data Document... \n", "1 [] \n", "2 [] \n", "3 [{\"metadataStandardName\": \"DDI - Data Document... \n", "4 [{\"metadataStandardName\": \"DataCite Metadata S... \n", "\n", " re3data_syndication \\\n", "0 {} \n", "1 {\"syndication\": \"http://www.archives.gov/socia... \n", "2 {} \n", "3 {} \n", "4 {\"syndication\": \"https://archaeologydataservic... 
\n", "\n", " re3data_remarks re3data_entryDate \\\n", "0 Odum Dataverse is covered by Thomson Reuters D... 2013-06-10 \n", "1 NaN 2012-07-04 \n", "2 NaN 2012-07-20 \n", "3 UNC Dataverse is covered by Clarivate Data Cit... 2012-07-23 \n", "4 ADS is covered by Clarivate Data Citation Inde... 2012-07-23 \n", "\n", " re3data_lastUpdate re3data_unique_id \n", "0 2021-07-06 re3data_r3d100000001 \n", "1 2021-05-25 re3data_r3d100000002 \n", "2 2020-08-27 re3data_r3d100000004 \n", "3 2021-10-25 re3data_r3d100000005 \n", "4 2021-09-02 re3data_r3d100000006 " ] }, "execution_count": 3, "metadata": {}, "output_type": "execute_result" } ], "source": [ "re3data_df = pd.read_csv('../data/raw/re3data.tsv', delimiter='\\t',\n", " converters={'subject': ast.literal_eval,\n", " 'keyword': ast.literal_eval,\n", " 'additionalName': ast.literal_eval,\n", " 'repositoryIdentifier': ast.literal_eval,\n", " 'type': ast.literal_eval,\n", " 'contentType': ast.literal_eval,\n", " 'providerType': ast.literal_eval,\n", " 'institution': ast.literal_eval\n", " })\n", "\n", "re3data_df['unique_id'] = 're3data_' + re3data_df.orgIdentifier\n", "re3data_df = re3data_df.add_prefix('re3data_')\n", "re3data_df.head()" ] }, { "cell_type": "code", "execution_count": 4, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
OpenDOAR_system_metadata.idOpenDOAR_repository_metadata.nameOpenDOAR_repository_metadata.alternativenameOpenDOAR_repository_metadata.urlOpenDOAR_repository_metadata.descriptionOpenDOAR_repository_metadata.typeOpenDOAR_repository_metadata.content_languagesOpenDOAR_system_metadata.date_modifiedOpenDOAR_system_metadata.date_createdOpenDOAR_repository_metadata.content_subjectsOpenDOAR_repository_metadata.content_typesOpenDOAR_organizationOpenDOAR_policy_urlsOpenDOAR_repository_metadata.softwareOpenDOAR_repository_metadata.oai_urlOpenDOAR_system_metadata.publicly_visibleOpenDOAR_repository_metadata.repository_statusOpenDOAR_repository_metadata.fulltext_record_countOpenDOAR_repository_metadata.metadata_record_countOpenDOAR_unique_id
0134{\"name\": \"eldorado - repository of the tu dort...[{'name': 'eldorado - ressourcen aus und für l...https://eldorado.tu-dortmund.deNaNinstitutional[]2022-01-12 15:34:542005-12-19 14:57:52[arts, humanities, science, mathematics, socia...[journal_articles, conference_and_workshop_pap...[{'name': 'technische universität dortmund', '...[]{\"name\": \"dspace\", \"version\": \"\"}https://eldorado.tu-dortmund.de/oai/requestyesNaN9629.020963.0OpenDOAR_134
158{\"name\": \"archive ouverte en sciences de linfo...[{'acronym': '@rchivesic'}]https://archivesic.ccsd.cnrs.frNaNinstitutional[]2022-01-12 15:34:532006-01-13 12:48:32[arts, science, technology, engineering, mathe...[journal_articles, conference_and_workshop_pap...[{'name': 'centre pour la communication scient...[]{\"name\": \"hal\", \"version\": \"\"}https://api.archives-ouvertes.fr/oai/archivesicyesNaN55492.01137498.0OpenDOAR_58
293{\"name\": \"digitalcommons@the texas medical cen...[]http://digitalcommons.library.tmc.edu/NaNinstitutional[]2022-01-12 15:34:532006-02-14 11:16:12[health and medicine][journal_articles, theses_and_dissertations][{'name': 'texas medical center', 'alternative...[]{\"name\": \"other\", \"version\": \"\"}http://digitalcommons.library.tmc.edu/do/oai/yesNaN2658.07268.0OpenDOAR_93
368{\"name\": \"cognitive sciences eprint archive\", ...[{'acronym': 'cogprints'}]http://cogprints.org/NaNdisciplinary[]2022-01-12 15:34:532006-01-04 15:01:23[humanities, health and medicine, science, soc...[journal_articles, conference_and_workshop_pap...[{'name': 'university of southampton', 'altern...[]{\"name\": \"eprints\", \"version\": \"\"}http://cogprints.org/cgi/oai2yesNaN2895.04277.0OpenDOAR_68
484{\"name\": \"digital commons@carleton college\", \"...[]http://digitalcommons.carleton.edu/NaNinstitutional[]2022-01-12 15:34:532006-01-04 16:07:58[humanities, science, social sciences][journal_articles, unpub_reports_and_working_p...[{'name': 'carleton college', 'alternativeName...[]{\"name\": \"other\", \"version\": \"\"}NaNyesNaNNaN42.0OpenDOAR_84
\n", "
" ], "text/plain": [ " OpenDOAR_system_metadata.id \\\n", "0 134 \n", "1 58 \n", "2 93 \n", "3 68 \n", "4 84 \n", "\n", " OpenDOAR_repository_metadata.name \\\n", "0 {\"name\": \"eldorado - repository of the tu dort... \n", "1 {\"name\": \"archive ouverte en sciences de linfo... \n", "2 {\"name\": \"digitalcommons@the texas medical cen... \n", "3 {\"name\": \"cognitive sciences eprint archive\", ... \n", "4 {\"name\": \"digital commons@carleton college\", \"... \n", "\n", " OpenDOAR_repository_metadata.alternativename \\\n", "0 [{'name': 'eldorado - ressourcen aus und für l... \n", "1 [{'acronym': '@rchivesic'}] \n", "2 [] \n", "3 [{'acronym': 'cogprints'}] \n", "4 [] \n", "\n", " OpenDOAR_repository_metadata.url \\\n", "0 https://eldorado.tu-dortmund.de \n", "1 https://archivesic.ccsd.cnrs.fr \n", "2 http://digitalcommons.library.tmc.edu/ \n", "3 http://cogprints.org/ \n", "4 http://digitalcommons.carleton.edu/ \n", "\n", " OpenDOAR_repository_metadata.description OpenDOAR_repository_metadata.type \\\n", "0 NaN institutional \n", "1 NaN institutional \n", "2 NaN institutional \n", "3 NaN disciplinary \n", "4 NaN institutional \n", "\n", " OpenDOAR_repository_metadata.content_languages \\\n", "0 [] \n", "1 [] \n", "2 [] \n", "3 [] \n", "4 [] \n", "\n", " OpenDOAR_system_metadata.date_modified \\\n", "0 2022-01-12 15:34:54 \n", "1 2022-01-12 15:34:53 \n", "2 2022-01-12 15:34:53 \n", "3 2022-01-12 15:34:53 \n", "4 2022-01-12 15:34:53 \n", "\n", " OpenDOAR_system_metadata.date_created \\\n", "0 2005-12-19 14:57:52 \n", "1 2006-01-13 12:48:32 \n", "2 2006-02-14 11:16:12 \n", "3 2006-01-04 15:01:23 \n", "4 2006-01-04 16:07:58 \n", "\n", " OpenDOAR_repository_metadata.content_subjects \\\n", "0 [arts, humanities, science, mathematics, socia... \n", "1 [arts, science, technology, engineering, mathe... \n", "2 [health and medicine] \n", "3 [humanities, health and medicine, science, soc... 
\n", "4 [humanities, science, social sciences] \n", "\n", " OpenDOAR_repository_metadata.content_types \\\n", "0 [journal_articles, conference_and_workshop_pap... \n", "1 [journal_articles, conference_and_workshop_pap... \n", "2 [journal_articles, theses_and_dissertations] \n", "3 [journal_articles, conference_and_workshop_pap... \n", "4 [journal_articles, unpub_reports_and_working_p... \n", "\n", " OpenDOAR_organization OpenDOAR_policy_urls \\\n", "0 [{'name': 'technische universität dortmund', '... [] \n", "1 [{'name': 'centre pour la communication scient... [] \n", "2 [{'name': 'texas medical center', 'alternative... [] \n", "3 [{'name': 'university of southampton', 'altern... [] \n", "4 [{'name': 'carleton college', 'alternativeName... [] \n", "\n", " OpenDOAR_repository_metadata.software \\\n", "0 {\"name\": \"dspace\", \"version\": \"\"} \n", "1 {\"name\": \"hal\", \"version\": \"\"} \n", "2 {\"name\": \"other\", \"version\": \"\"} \n", "3 {\"name\": \"eprints\", \"version\": \"\"} \n", "4 {\"name\": \"other\", \"version\": \"\"} \n", "\n", " OpenDOAR_repository_metadata.oai_url \\\n", "0 https://eldorado.tu-dortmund.de/oai/request \n", "1 https://api.archives-ouvertes.fr/oai/archivesic \n", "2 http://digitalcommons.library.tmc.edu/do/oai/ \n", "3 http://cogprints.org/cgi/oai2 \n", "4 NaN \n", "\n", " OpenDOAR_system_metadata.publicly_visible \\\n", "0 yes \n", "1 yes \n", "2 yes \n", "3 yes \n", "4 yes \n", "\n", " OpenDOAR_repository_metadata.repository_status \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " OpenDOAR_repository_metadata.fulltext_record_count \\\n", "0 9629.0 \n", "1 55492.0 \n", "2 2658.0 \n", "3 2895.0 \n", "4 NaN \n", "\n", " OpenDOAR_repository_metadata.metadata_record_count OpenDOAR_unique_id \n", "0 20963.0 OpenDOAR_134 \n", "1 1137498.0 OpenDOAR_58 \n", "2 7268.0 OpenDOAR_93 \n", "3 4277.0 OpenDOAR_68 \n", "4 42.0 OpenDOAR_84 " ] }, "execution_count": 4, "metadata": {}, "output_type": "execute_result" } ], 
"source": [ "opendoar_df = pd.read_csv('../data/raw/openDoar.tsv', delimiter='\\t',\n", " converters={'repository_metadata.content_subjects': ast.literal_eval,\n", " 'repository_metadata.alternativename': ast.literal_eval,\n", " 'repository_metadata.content_types': ast.literal_eval,\n", " 'organization': ast.literal_eval\n", " },\n", " dtype={'system_metadata.id': str})\n", "\n", "opendoar_df['unique_id'] = 'OpenDOAR_' + opendoar_df['system_metadata.id']\n", "opendoar_df = opendoar_df.add_prefix('OpenDOAR_')\n", "opendoar_df.head()" ] }, { "cell_type": "code", "execution_count": 5, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
roar_eprintidroar_rev_numberroar_eprint_statusroar_useridroar_importidroar_sourceroar_dirroar_datestamproar_lastmodroar_status_changedroar_typeroar_succeedsroar_commentaryroar_metadata_visibilityroar_latituderoar_longituderoar_relation_typeroar_relation_uriroar_item_issues_idroar_item_issues_typeroar_item_issues_descriptionroar_item_issues_timestamproar_item_issues_statusroar_item_issues_reported_byroar_item_issues_resolved_byroar_item_issues_commentroar_item_issues_countroar_sword_depositorroar_sword_slugroar_exemplarroar_home_pageroar_titleroar_oai_pmhroar_sword_endpointroar_rss_feedroar_twitter_feedroar_descriptionroar_fulltextroar_open_accessroar_mandateroar_organisation_titleroar_organisation_home_pageroar_location_countryroar_location_cityroar_location_latituderoar_location_longituderoar_softwareroar_geonameroar_versionroar_subjectsroar_dateroar_noteroar_suggestionsroar_activity_lowroar_activity_mediumroar_activity_highroar_recordcountroar_recordhistoryroar_fulltexts_totalroar_fulltexts_docsroar_fulltexts_rtotalroar_fulltexts_rdocsroar_registry_nameroar_registry_idroar_submit_toroar_submitted_to_nameroar_submitted_to_doneroar_webometrics_rankroar_webometrics_sizeroar_webometrics_visibilityroar_webometrics_rich_filesroar_webometrics_scholarroar_monthly_depositsroar_total_depositsroar_associationroar_unique_id
01633archive1NaNNaNdisk0/00/00/00/012010-01-06 13:43:482011-07-18 05:40:072010-01-06 13:43:48subjectNaNNaNshowNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaN0NaNNaNNaNhttp://archivesic.ccsd.cnrs.fr/@RCHIVESIChttp://archivesic.ccsd.cnrs.fr/oai/oai.phpNaNNaNNaNNaNNaNNaNNaNNaNNaNfrNaNNaNNaNhalgeoname_2_FRotherNaN2002-05-17 19:24:41NaNNaN000250,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,...NaNNaNNaNNaN[celestial, opendoar][58, 669]NaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNroar_1
110511archive1NaNNaNdisk0/00/00/00/102010-01-06 13:43:482011-07-18 05:40:132010-01-06 13:43:48institutionalNaNNaNshowNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaN0NaNNaNNaNhttp://www.diva-portal.org/mdh/Academic Archive On-line (Mälardalen Universit...http://www.diva-portal.org/oai/mdh/OAINaNNaNNaNNaNTRUETRUENaNNaNNaNseUppsala59.866717.6333divageoname_2_SEotherNaN2005-12-08 13:15:22NaNNaN0001000,0,0,0,0,0,0,0,0,0,0,0,0,0,2,8,39,100,100,100...NaNNaNNaNNaN[celestial, opendoar][526, 258]NaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNroar_10
21000274archive1NaNNaNdisk0/00/00/10/002010-01-06 13:45:012011-07-06 08:21:212010-01-06 13:45:01subjectNaNNaNshowNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaN0NaNNaNNaNhttp://pam.pisharp.org/PAM - Portuguese Archive of MathematicsNaNNaNNaNNaNNaNTRUETRUENaNNaNNaNptBellevue, WA47.6034-122.155dspacegeoname_2_PTotherNaN2006-05-04 10:48:14NaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNroar_1000
31000120archive91NaNNaNdisk0/00/01/00/012015-08-08 14:52:112016-03-21 19:44:012015-08-08 14:52:11subjectNaNNaNshowNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNhttp://edoc.sub.uni-hamburg.de/klimawandel/Klimawandel Dokumentenserverhttp://edoc.sub.uni-hamburg.de/klimawandel/oaiNaNNaNNaNThe \"Documentenserver Klimawandel\" (Repository...TRUETRUETRUE[Climate Service Center 2.0, Helmholtz-Zentrum...[http://www.klimzug.de/de/94.php, http://www.c...deHamburg53.55119.9937opusgeoname_2_DEother[HD, S1, GF, GE, G1]2015-07-02 08:08:31NaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaN[celestial, opendoar][3408, 5881]NaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNroar_10001
41000811archive404NaNNaNdisk0/00/01/00/082015-08-08 14:52:262016-03-21 19:43:512015-08-08 14:52:26institutionalNaNNaNshowNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNhttp://creativematter.skidmore.edu/Creative Matter | Skidmore College Researchhttp://creativematter.skidmore.edu/do/oai/NaNhttp://creativematter.skidmore.edu/recent.rssNaNWelcome to Creative Matter, a repository for t...TRUEFALSEFALSESkidmore Collegehttp://www.skidmore.edu/usSaratoga Springs43.0961-73.7818bepressgeoname_2_USotherNaN2015-07-06 17:35:50NaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNcelestial5882NaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNroar_10008
\n", "
" ], "text/plain": [ " roar_eprintid roar_rev_number roar_eprint_status roar_userid roar_importid \\\n", "0 1 633 archive 1 NaN \n", "1 10 511 archive 1 NaN \n", "2 1000 274 archive 1 NaN \n", "3 10001 20 archive 91 NaN \n", "4 10008 11 archive 404 NaN \n", "\n", " roar_source roar_dir roar_datestamp roar_lastmod \\\n", "0 NaN disk0/00/00/00/01 2010-01-06 13:43:48 2011-07-18 05:40:07 \n", "1 NaN disk0/00/00/00/10 2010-01-06 13:43:48 2011-07-18 05:40:13 \n", "2 NaN disk0/00/00/10/00 2010-01-06 13:45:01 2011-07-06 08:21:21 \n", "3 NaN disk0/00/01/00/01 2015-08-08 14:52:11 2016-03-21 19:44:01 \n", "4 NaN disk0/00/01/00/08 2015-08-08 14:52:26 2016-03-21 19:43:51 \n", "\n", " roar_status_changed roar_type roar_succeeds roar_commentary \\\n", "0 2010-01-06 13:43:48 subject NaN NaN \n", "1 2010-01-06 13:43:48 institutional NaN NaN \n", "2 2010-01-06 13:45:01 subject NaN NaN \n", "3 2015-08-08 14:52:11 subject NaN NaN \n", "4 2015-08-08 14:52:26 institutional NaN NaN \n", "\n", " roar_metadata_visibility roar_latitude roar_longitude roar_relation_type \\\n", "0 show NaN NaN NaN \n", "1 show NaN NaN NaN \n", "2 show NaN NaN NaN \n", "3 show NaN NaN NaN \n", "4 show NaN NaN NaN \n", "\n", " roar_relation_uri roar_item_issues_id roar_item_issues_type \\\n", "0 NaN NaN NaN \n", "1 NaN NaN NaN \n", "2 NaN NaN NaN \n", "3 NaN NaN NaN \n", "4 NaN NaN NaN \n", "\n", " roar_item_issues_description roar_item_issues_timestamp \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " roar_item_issues_status roar_item_issues_reported_by \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " roar_item_issues_resolved_by roar_item_issues_comment \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " roar_item_issues_count roar_sword_depositor roar_sword_slug roar_exemplar \\\n", "0 0 NaN NaN NaN \n", "1 0 NaN NaN NaN \n", "2 0 NaN NaN NaN \n", "3 NaN NaN NaN NaN \n", "4 
NaN NaN NaN NaN \n", "\n", " roar_home_page \\\n", "0 http://archivesic.ccsd.cnrs.fr/ \n", "1 http://www.diva-portal.org/mdh/ \n", "2 http://pam.pisharp.org/ \n", "3 http://edoc.sub.uni-hamburg.de/klimawandel/ \n", "4 http://creativematter.skidmore.edu/ \n", "\n", " roar_title \\\n", "0 @RCHIVESIC \n", "1 Academic Archive On-line (Mälardalen Universit... \n", "2 PAM - Portuguese Archive of Mathematics \n", "3 Klimawandel Dokumentenserver \n", "4 Creative Matter | Skidmore College Research \n", "\n", " roar_oai_pmh roar_sword_endpoint \\\n", "0 http://archivesic.ccsd.cnrs.fr/oai/oai.php NaN \n", "1 http://www.diva-portal.org/oai/mdh/OAI NaN \n", "2 NaN NaN \n", "3 http://edoc.sub.uni-hamburg.de/klimawandel/oai NaN \n", "4 http://creativematter.skidmore.edu/do/oai/ NaN \n", "\n", " roar_rss_feed roar_twitter_feed \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 http://creativematter.skidmore.edu/recent.rss NaN \n", "\n", " roar_description roar_fulltext \\\n", "0 NaN NaN \n", "1 NaN TRUE \n", "2 NaN TRUE \n", "3 The \"Documentenserver Klimawandel\" (Repository... TRUE \n", "4 Welcome to Creative Matter, a repository for t... TRUE \n", "\n", " roar_open_access roar_mandate \\\n", "0 NaN NaN \n", "1 TRUE NaN \n", "2 TRUE NaN \n", "3 TRUE TRUE \n", "4 FALSE FALSE \n", "\n", " roar_organisation_title \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 [Climate Service Center 2.0, Helmholtz-Zentrum... \n", "4 Skidmore College \n", "\n", " roar_organisation_home_page roar_location_country \\\n", "0 NaN fr \n", "1 NaN se \n", "2 NaN pt \n", "3 [http://www.klimzug.de/de/94.php, http://www.c... 
de \n", "4 http://www.skidmore.edu/ us \n", "\n", " roar_location_city roar_location_latitude roar_location_longitude \\\n", "0 NaN NaN NaN \n", "1 Uppsala 59.8667 17.6333 \n", "2 Bellevue, WA 47.6034 -122.155 \n", "3 Hamburg 53.5511 9.9937 \n", "4 Saratoga Springs 43.0961 -73.7818 \n", "\n", " roar_software roar_geoname roar_version roar_subjects \\\n", "0 hal geoname_2_FR other NaN \n", "1 diva geoname_2_SE other NaN \n", "2 dspace geoname_2_PT other NaN \n", "3 opus geoname_2_DE other [HD, S1, GF, GE, G1] \n", "4 bepress geoname_2_US other NaN \n", "\n", " roar_date roar_note roar_suggestions roar_activity_low \\\n", "0 2002-05-17 19:24:41 NaN NaN 0 \n", "1 2005-12-08 13:15:22 NaN NaN 0 \n", "2 2006-05-04 10:48:14 NaN NaN NaN \n", "3 2015-07-02 08:08:31 NaN NaN NaN \n", "4 2015-07-06 17:35:50 NaN NaN NaN \n", "\n", " roar_activity_medium roar_activity_high roar_recordcount \\\n", "0 0 0 25 \n", "1 0 0 100 \n", "2 NaN NaN NaN \n", "3 NaN NaN NaN \n", "4 NaN NaN NaN \n", "\n", " roar_recordhistory roar_fulltexts_total \\\n", "0 0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,... NaN \n", "1 0,0,0,0,0,0,0,0,0,0,0,0,0,0,2,8,39,100,100,100... 
NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " roar_fulltexts_docs roar_fulltexts_rtotal roar_fulltexts_rdocs \\\n", "0 NaN NaN NaN \n", "1 NaN NaN NaN \n", "2 NaN NaN NaN \n", "3 NaN NaN NaN \n", "4 NaN NaN NaN \n", "\n", " roar_registry_name roar_registry_id roar_submit_to \\\n", "0 [celestial, opendoar] [58, 669] NaN \n", "1 [celestial, opendoar] [526, 258] NaN \n", "2 NaN NaN NaN \n", "3 [celestial, opendoar] [3408, 5881] NaN \n", "4 celestial 5882 NaN \n", "\n", " roar_submitted_to_name roar_submitted_to_done roar_webometrics_rank \\\n", "0 NaN NaN NaN \n", "1 NaN NaN NaN \n", "2 NaN NaN NaN \n", "3 NaN NaN NaN \n", "4 NaN NaN NaN \n", "\n", " roar_webometrics_size roar_webometrics_visibility \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " roar_webometrics_rich_files roar_webometrics_scholar roar_monthly_deposits \\\n", "0 NaN NaN NaN \n", "1 NaN NaN NaN \n", "2 NaN NaN NaN \n", "3 NaN NaN NaN \n", "4 NaN NaN NaN \n", "\n", " roar_total_deposits roar_association roar_unique_id \n", "0 NaN NaN roar_1 \n", "1 NaN NaN roar_10 \n", "2 NaN NaN roar_1000 \n", "3 NaN NaN roar_10001 \n", "4 NaN NaN roar_10008 " ] }, "execution_count": 5, "metadata": {}, "output_type": "execute_result" } ], "source": [ "roar_df = pd.read_csv('../data/raw/export_roar_CSV.csv', dtype='str')\n", "roar_df = roar_df.groupby('eprintid').aggregate(set)\n", "\n", "def value_or_list(cell_set):\n", " copy = set(cell_set)\n", " copy.discard(np.nan) \n", " if len(copy) == 0:\n", " return np.nan\n", " if len(copy) == 1:\n", " return copy.pop()\n", " return list(copy)\n", " \n", "roar_df = roar_df.applymap(value_or_list)\n", "roar_df.reset_index(inplace=True)\n", "\n", "roar_df['unique_id'] = 'roar_' + roar_df.eprintid\n", "roar_df = roar_df.add_prefix('roar_')\n", "roar_df.head()" ] }, { "cell_type": "code", "execution_count": 6, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
roar_eprintidroar_rev_numberroar_eprint_statusroar_useridroar_importidroar_sourceroar_dirroar_datestamproar_lastmodroar_status_changedroar_typeroar_succeedsroar_commentaryroar_metadata_visibilityroar_latituderoar_longituderoar_relation_typeroar_relation_uriroar_item_issues_idroar_item_issues_typeroar_item_issues_descriptionroar_item_issues_timestamproar_item_issues_statusroar_item_issues_reported_byroar_item_issues_resolved_byroar_item_issues_commentroar_item_issues_countroar_sword_depositorroar_sword_slugroar_exemplarroar_home_pageroar_titleroar_oai_pmhroar_sword_endpointroar_rss_feedroar_twitter_feedroar_descriptionroar_fulltextroar_open_accessroar_mandateroar_organisation_titleroar_organisation_home_pageroar_location_countryroar_location_cityroar_location_latituderoar_location_longituderoar_softwareroar_geonameroar_versionroar_subjectsroar_dateroar_noteroar_suggestionsroar_activity_lowroar_activity_mediumroar_activity_highroar_recordcountroar_recordhistoryroar_fulltexts_totalroar_fulltexts_docsroar_fulltexts_rtotalroar_fulltexts_rdocsroar_registry_nameroar_registry_idroar_submit_toroar_submitted_to_nameroar_submitted_to_doneroar_webometrics_rankroar_webometrics_sizeroar_webometrics_visibilityroar_webometrics_rich_filesroar_webometrics_scholarroar_monthly_depositsroar_total_depositsroar_associationroar_unique_id
71001331archive7104NaNNaNdisk0/00/01/00/132015-08-08 14:53:042016-03-21 19:54:432015-08-08 14:53:04institutionalNaNNaNshowNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNhttp://er.ucu.edu.ua/ErUCU: Electronic repository of the Ukrainian ...http://er.ucu.edu.ua/oai/requesthttp://er.ucu.edu.ua/sword/http://er.ucu.edu.ua/feed/rss_2.0/siteNaNUkrainian Catholic University’s institutional ...TRUETRUETRUEUkrainian Catholic Universityhttp://ucu.edu.ua/eng/uaLvivNaNNaNdspacegeoname_2_UAother[D1, DK, BL, BR, L1, BS, D901, B1, AC, BF, HM,...2015-07-07 12:38:37NaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaN[celestial, opendoar][5883, 3410]NaNNaNNaNNaNNaNNaNNaNNaNNaNNaN[russell_group, ivy_league]roar_10013
\n", "
" ], "text/plain": [ " roar_eprintid roar_rev_number roar_eprint_status roar_userid roar_importid \\\n", "7 10013 31 archive 7104 NaN \n", "\n", " roar_source roar_dir roar_datestamp roar_lastmod \\\n", "7 NaN disk0/00/01/00/13 2015-08-08 14:53:04 2016-03-21 19:54:43 \n", "\n", " roar_status_changed roar_type roar_succeeds roar_commentary \\\n", "7 2015-08-08 14:53:04 institutional NaN NaN \n", "\n", " roar_metadata_visibility roar_latitude roar_longitude roar_relation_type \\\n", "7 show NaN NaN NaN \n", "\n", " roar_relation_uri roar_item_issues_id roar_item_issues_type \\\n", "7 NaN NaN NaN \n", "\n", " roar_item_issues_description roar_item_issues_timestamp \\\n", "7 NaN NaN \n", "\n", " roar_item_issues_status roar_item_issues_reported_by \\\n", "7 NaN NaN \n", "\n", " roar_item_issues_resolved_by roar_item_issues_comment \\\n", "7 NaN NaN \n", "\n", " roar_item_issues_count roar_sword_depositor roar_sword_slug roar_exemplar \\\n", "7 NaN NaN NaN NaN \n", "\n", " roar_home_page roar_title \\\n", "7 http://er.ucu.edu.ua/ ErUCU: Electronic repository of the Ukrainian ... \n", "\n", " roar_oai_pmh roar_sword_endpoint \\\n", "7 http://er.ucu.edu.ua/oai/request http://er.ucu.edu.ua/sword/ \n", "\n", " roar_rss_feed roar_twitter_feed \\\n", "7 http://er.ucu.edu.ua/feed/rss_2.0/site NaN \n", "\n", " roar_description roar_fulltext \\\n", "7 Ukrainian Catholic University’s institutional ... TRUE \n", "\n", " roar_open_access roar_mandate roar_organisation_title \\\n", "7 TRUE TRUE Ukrainian Catholic University \n", "\n", " roar_organisation_home_page roar_location_country roar_location_city \\\n", "7 http://ucu.edu.ua/eng/ ua Lviv \n", "\n", " roar_location_latitude roar_location_longitude roar_software roar_geoname \\\n", "7 NaN NaN dspace geoname_2_UA \n", "\n", " roar_version roar_subjects \\\n", "7 other [D1, DK, BL, BR, L1, BS, D901, B1, AC, BF, HM,... 
\n", "\n", " roar_date roar_note roar_suggestions roar_activity_low \\\n", "7 2015-07-07 12:38:37 NaN NaN NaN \n", "\n", " roar_activity_medium roar_activity_high roar_recordcount roar_recordhistory \\\n", "7 NaN NaN NaN NaN \n", "\n", " roar_fulltexts_total roar_fulltexts_docs roar_fulltexts_rtotal \\\n", "7 NaN NaN NaN \n", "\n", " roar_fulltexts_rdocs roar_registry_name roar_registry_id roar_submit_to \\\n", "7 NaN [celestial, opendoar] [5883, 3410] NaN \n", "\n", " roar_submitted_to_name roar_submitted_to_done roar_webometrics_rank \\\n", "7 NaN NaN NaN \n", "\n", " roar_webometrics_size roar_webometrics_visibility \\\n", "7 NaN NaN \n", "\n", " roar_webometrics_rich_files roar_webometrics_scholar roar_monthly_deposits \\\n", "7 NaN NaN NaN \n", "\n", " roar_total_deposits roar_association roar_unique_id \n", "7 NaN [russell_group, ivy_league] roar_10013 " ] }, "execution_count": 6, "metadata": {}, "output_type": "execute_result" } ], "source": [ "roar_df[roar_df.roar_eprintid == '10013']" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "# Loading dedup results" ] }, { "cell_type": "code", "execution_count": 7, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
dedup_idduplicate_idoriginal_idnamesourceunique_id
0dedup::001e6d882e54c780ce269d3c46997287https://fairsharing.org/10.25504/FAIRsharing.q...2094RESID Database of Protein ModificationsFAIRsharingFAIRsharing_2094
1dedup::001e6d882e54c780ce269d3c46997287re3data::r3d100011306r3d100011306RESID Database of Protein Modificationsre3datare3data_r3d100011306
2dedup::003ab6b40af9b488decea7c582d150a2re3data::r3d100011894r3d100011894Synapsere3datare3data_r3d100011894
3dedup::003ab6b40af9b488decea7c582d150a2https://fairsharing.org/10.25504/FAIRsharing.d...2315SynapseFAIRsharingFAIRsharing_2315
4dedup::0048f2e3aa55ab88aaaac0cfa4153ad5opendoar::45624562erzincan binali yıldırım university institutio...OpenDOAROpenDOAR_4562
\n", "
" ], "text/plain": [ " dedup_id \\\n", "0 dedup::001e6d882e54c780ce269d3c46997287 \n", "1 dedup::001e6d882e54c780ce269d3c46997287 \n", "2 dedup::003ab6b40af9b488decea7c582d150a2 \n", "3 dedup::003ab6b40af9b488decea7c582d150a2 \n", "4 dedup::0048f2e3aa55ab88aaaac0cfa4153ad5 \n", "\n", " duplicate_id original_id \\\n", "0 https://fairsharing.org/10.25504/FAIRsharing.q... 2094 \n", "1 re3data::r3d100011306 r3d100011306 \n", "2 re3data::r3d100011894 r3d100011894 \n", "3 https://fairsharing.org/10.25504/FAIRsharing.d... 2315 \n", "4 opendoar::4562 4562 \n", "\n", " name source \\\n", "0 RESID Database of Protein Modifications FAIRsharing \n", "1 RESID Database of Protein Modifications re3data \n", "2 Synapse re3data \n", "3 Synapse FAIRsharing \n", "4 erzincan binali yıldırım university institutio... OpenDOAR \n", "\n", " unique_id \n", "0 FAIRsharing_2094 \n", "1 re3data_r3d100011306 \n", "2 re3data_r3d100011894 \n", "3 FAIRsharing_2315 \n", "4 OpenDOAR_4562 " ] }, "execution_count": 7, "metadata": {}, "output_type": "execute_result" } ], "source": [ "dup = pd.read_csv('../data/processed/ds_dedup_2022-02-16_13.03.17.csv',\n", " sep=';', quotechar='\"',\n", " header=0, names=['dedup_id', 'duplicate_id', 'original_id', 'name', 'source'])\n", "dup['unique_id'] = dup.source + '_' + dup.original_id\n", "dup.head()" ] }, { "cell_type": "code", "execution_count": 8, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
dedup_idduplicate_idoriginal_idnamesourceunique_id
count471247124712471247124712
unique223947124238401744712
topdedup::67c12a6c3288a49f1db6a2343ec599cahttps://fairsharing.org/10.25504/FAIRsharing.q...3284UPN JATIM REPOSITORYroarFAIRsharing_2094
freq513419811
\n", "
" ], "text/plain": [ " dedup_id \\\n", "count 4712 \n", "unique 2239 \n", "top dedup::67c12a6c3288a49f1db6a2343ec599ca \n", "freq 5 \n", "\n", " duplicate_id original_id \\\n", "count 4712 4712 \n", "unique 4712 4238 \n", "top https://fairsharing.org/10.25504/FAIRsharing.q... 3284 \n", "freq 1 3 \n", "\n", " name source unique_id \n", "count 4712 4712 4712 \n", "unique 4017 4 4712 \n", "top UPN JATIM REPOSITORY roar FAIRsharing_2094 \n", "freq 4 1981 1 " ] }, "execution_count": 8, "metadata": {}, "output_type": "execute_result" } ], "source": [ "dup.describe()" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "# Assessing duplicates distribution across registries" ] }, { "cell_type": "code", "execution_count": 9, "metadata": {}, "outputs": [], "source": [ "dup_grouped = dup.groupby('dedup_id').aggregate(list)\n", "dup_grouped['source_set'] = dup_grouped.source.map(set)" ] }, { "cell_type": "code", "execution_count": 10, "metadata": {}, "outputs": [ { "data": { "text/plain": [ "duplicate_id 6\n", "original_id 6\n", "name 6\n", "source 6\n", "unique_id 6\n", "source_set 6\n", "dtype: int64" ] }, "execution_count": 10, "metadata": {}, "output_type": "execute_result" } ], "source": [ "dup_grouped[dup_grouped.source_set.str.len() == 4].count()" ] }, { "cell_type": "code", "execution_count": 11, "metadata": {}, "outputs": [ { "data": { "text/plain": [ "duplicate_id 61\n", "original_id 61\n", "name 61\n", "source 61\n", "unique_id 61\n", "source_set 61\n", "dtype: int64" ] }, "execution_count": 11, "metadata": {}, "output_type": "execute_result" } ], "source": [ "dup_grouped[dup_grouped.source_set.str.len() == 3].count()" ] }, { "cell_type": "code", "execution_count": 12, "metadata": {}, "outputs": [ { "data": { "text/plain": [ "duplicate_id 2029\n", "original_id 2029\n", "name 2029\n", "source 2029\n", "unique_id 2029\n", "source_set 2029\n", "dtype: int64" ] }, "execution_count": 12, "metadata": {}, "output_type": "execute_result" } ], "source": [ 
"dup_grouped[dup_grouped.source_set.str.len() == 2].count()" ] }, { "cell_type": "code", "execution_count": 13, "metadata": {}, "outputs": [ { "data": { "text/plain": [ "duplicate_id 143\n", "original_id 143\n", "name 143\n", "source 143\n", "unique_id 143\n", "source_set 143\n", "dtype: int64" ] }, "execution_count": 13, "metadata": {}, "output_type": "execute_result" } ], "source": [ "dup_grouped[dup_grouped.source_set.str.len() == 1].count()" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "# Assessing duplicates within registries" ] }, { "cell_type": "code", "execution_count": 14, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
duplicate_idoriginal_idnamesourceunique_id
count249249249249249
sum518518518518518
\n", "
" ], "text/plain": [ " duplicate_id original_id name source unique_id\n", "count 249 249 249 249 249\n", "sum 518 518 518 518 518" ] }, "execution_count": 14, "metadata": {}, "output_type": "execute_result" } ], "source": [ "roar_dup = dup[dup.source == 'roar'].groupby('dedup_id').count()\n", "roar_dup = roar_dup[roar_dup.duplicate_id > 1]\n", "roar_dup.aggregate(['count', 'sum'])" ] }, { "cell_type": "code", "execution_count": 15, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
duplicate_idoriginal_idnamesourceunique_id
count3030303030
sum6262626262
\n", "
" ], "text/plain": [ " duplicate_id original_id name source unique_id\n", "count 30 30 30 30 30\n", "sum 62 62 62 62 62" ] }, "execution_count": 15, "metadata": {}, "output_type": "execute_result" } ], "source": [ "opendoar_dup = dup[dup.source == 'OpenDOAR'].groupby('dedup_id').count()\n", "opendoar_dup = opendoar_dup[opendoar_dup.duplicate_id > 1]\n", "opendoar_dup.aggregate(['count', 'sum'])" ] }, { "cell_type": "code", "execution_count": 16, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
duplicate_idoriginal_idnamesourceunique_id
count33333
sum66666
\n", "
" ], "text/plain": [ " duplicate_id original_id name source unique_id\n", "count 3 3 3 3 3\n", "sum 6 6 6 6 6" ] }, "execution_count": 16, "metadata": {}, "output_type": "execute_result" } ], "source": [ "re3data_dup = dup[dup.source == 're3data'].groupby('dedup_id').count()\n", "re3data_dup = re3data_dup[re3data_dup.duplicate_id > 1]\n", "re3data_dup.aggregate(['count', 'sum'])" ] }, { "cell_type": "code", "execution_count": 17, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
duplicate_idoriginal_idnamesourceunique_id
count00000
sum00000
\n", "
" ], "text/plain": [ " duplicate_id original_id name source unique_id\n", "count 0 0 0 0 0\n", "sum 0 0 0 0 0" ] }, "execution_count": 17, "metadata": {}, "output_type": "execute_result" } ], "source": [ "fairsharing_dup = dup[dup.source == 'FAIRsharing'].groupby('dedup_id').count()\n", "fairsharing_dup = fairsharing_dup[fairsharing_dup.duplicate_id > 1]\n", "fairsharing_dup.aggregate(['count', 'sum'])" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "One dedup group is counted twice, because it appears in both the roar and the OpenDOAR within-registry counts above (see the intersection below). This is expected: the group contains 2 records from roar and 2 from OpenDOAR: ['OpenDOAR_5226', 'roar_14929', 'OpenDOAR_3820', 'roar_16263']" ] }, { "cell_type": "code", "execution_count": 18, "metadata": {}, "outputs": [ { "data": { "text/plain": [ "array(['dedup::6973375bbb56846f0d935bd1cd9e0b98'], dtype=object)" ] }, "execution_count": 18, "metadata": {}, "output_type": "execute_result" } ], "source": [ "np.intersect1d(roar_dup.index, opendoar_dup.index)" ] }, { "cell_type": "code", "execution_count": 19, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
dedup_idduplicate_idoriginal_idnamesourceunique_id
1937dedup::6973375bbb56846f0d935bd1cd9e0b98opendoar::38203820repositorio - universidad de la costaOpenDOAROpenDOAR_3820
1938dedup::6973375bbb56846f0d935bd1cd9e0b98opendoar::52265226repositorio universidad de la costaOpenDOAROpenDOAR_5226
1939dedup::6973375bbb56846f0d935bd1cd9e0b98roar::1492914929Repositorio Universidad de la Costaroarroar_14929
1940dedup::6973375bbb56846f0d935bd1cd9e0b98roar::1626316263Repositorio Universidad de la Costaroarroar_16263
\n", "
" ], "text/plain": [ " dedup_id duplicate_id original_id \\\n", "1937 dedup::6973375bbb56846f0d935bd1cd9e0b98 opendoar::3820 3820 \n", "1938 dedup::6973375bbb56846f0d935bd1cd9e0b98 opendoar::5226 5226 \n", "1939 dedup::6973375bbb56846f0d935bd1cd9e0b98 roar::14929 14929 \n", "1940 dedup::6973375bbb56846f0d935bd1cd9e0b98 roar::16263 16263 \n", "\n", " name source unique_id \n", "1937 repositorio - universidad de la costa OpenDOAR OpenDOAR_3820 \n", "1938 repositorio universidad de la costa OpenDOAR OpenDOAR_5226 \n", "1939 Repositorio Universidad de la Costa roar roar_14929 \n", "1940 Repositorio Universidad de la Costa roar roar_16263 " ] }, "execution_count": 19, "metadata": {}, "output_type": "execute_result" } ], "source": [ "dup[dup.dedup_id == 'dedup::6973375bbb56846f0d935bd1cd9e0b98']" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "# Isolating single-registry duplicates" ] }, { "cell_type": "code", "execution_count": 20, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
duplicate_idoriginal_idnamesourceunique_idsource_set
dedup_id
dedup::07b65089515c8f99812d14bbb01334a6[roar::474, roar::5541][474, 5541][ECNIS Repository (Environmental Cancer Risk, ...[roar, roar][roar_474, roar_5541]{roar}
dedup::0be44aa69610e09805d4002baf7e0b10[roar::16867, roar::2907][16867, 2907][Chung Shan Medical University Institutional R...[roar, roar][roar_16867, roar_2907]{roar}
dedup::0c34770edc42a1d2ac361b64cfabfb63[roar::5432, roar::4030][5432, 4030][Digital Library of Jelenia Góra, Digital Libr...[roar, roar][roar_5432, roar_4030]{roar}
dedup::0c6ed4b110c461d9350bf5c620bc78d7[roar::3020, roar::3401, roar::5252][3020, 3401, 5252][KCE Repository, KCE Repository, KCE Repository][roar, roar, roar][roar_3020, roar_3401, roar_5252]{roar}
dedup::0e3c63baca694032044bbb00c2f1111e[roar::8405, roar::8716][8405, 8716][Content Pro IRX, Content Pro IRX][roar, roar][roar_8405, roar_8716]{roar}
\n", "
" ], "text/plain": [ " duplicate_id \\\n", "dedup_id \n", "dedup::07b65089515c8f99812d14bbb01334a6 [roar::474, roar::5541] \n", "dedup::0be44aa69610e09805d4002baf7e0b10 [roar::16867, roar::2907] \n", "dedup::0c34770edc42a1d2ac361b64cfabfb63 [roar::5432, roar::4030] \n", "dedup::0c6ed4b110c461d9350bf5c620bc78d7 [roar::3020, roar::3401, roar::5252] \n", "dedup::0e3c63baca694032044bbb00c2f1111e [roar::8405, roar::8716] \n", "\n", " original_id \\\n", "dedup_id \n", "dedup::07b65089515c8f99812d14bbb01334a6 [474, 5541] \n", "dedup::0be44aa69610e09805d4002baf7e0b10 [16867, 2907] \n", "dedup::0c34770edc42a1d2ac361b64cfabfb63 [5432, 4030] \n", "dedup::0c6ed4b110c461d9350bf5c620bc78d7 [3020, 3401, 5252] \n", "dedup::0e3c63baca694032044bbb00c2f1111e [8405, 8716] \n", "\n", " name \\\n", "dedup_id \n", "dedup::07b65089515c8f99812d14bbb01334a6 [ECNIS Repository (Environmental Cancer Risk, ... \n", "dedup::0be44aa69610e09805d4002baf7e0b10 [Chung Shan Medical University Institutional R... \n", "dedup::0c34770edc42a1d2ac361b64cfabfb63 [Digital Library of Jelenia Góra, Digital Libr... 
\n", "dedup::0c6ed4b110c461d9350bf5c620bc78d7 [KCE Repository, KCE Repository, KCE Repository] \n", "dedup::0e3c63baca694032044bbb00c2f1111e [Content Pro IRX, Content Pro IRX] \n", "\n", " source \\\n", "dedup_id \n", "dedup::07b65089515c8f99812d14bbb01334a6 [roar, roar] \n", "dedup::0be44aa69610e09805d4002baf7e0b10 [roar, roar] \n", "dedup::0c34770edc42a1d2ac361b64cfabfb63 [roar, roar] \n", "dedup::0c6ed4b110c461d9350bf5c620bc78d7 [roar, roar, roar] \n", "dedup::0e3c63baca694032044bbb00c2f1111e [roar, roar] \n", "\n", " unique_id \\\n", "dedup_id \n", "dedup::07b65089515c8f99812d14bbb01334a6 [roar_474, roar_5541] \n", "dedup::0be44aa69610e09805d4002baf7e0b10 [roar_16867, roar_2907] \n", "dedup::0c34770edc42a1d2ac361b64cfabfb63 [roar_5432, roar_4030] \n", "dedup::0c6ed4b110c461d9350bf5c620bc78d7 [roar_3020, roar_3401, roar_5252] \n", "dedup::0e3c63baca694032044bbb00c2f1111e [roar_8405, roar_8716] \n", "\n", " source_set \n", "dedup_id \n", "dedup::07b65089515c8f99812d14bbb01334a6 {roar} \n", "dedup::0be44aa69610e09805d4002baf7e0b10 {roar} \n", "dedup::0c34770edc42a1d2ac361b64cfabfb63 {roar} \n", "dedup::0c6ed4b110c461d9350bf5c620bc78d7 {roar} \n", "dedup::0e3c63baca694032044bbb00c2f1111e {roar} " ] }, "execution_count": 20, "metadata": {}, "output_type": "execute_result" } ], "source": [ "dup_within = dup.groupby('dedup_id').aggregate(list)\n", "dup_within['source_set'] = dup_within.source.map(set)\n", "dup_within = dup_within[dup_within.source_set.str.len() == 1]\n", "dup_within.head()" ] }, { "cell_type": "code", "execution_count": 21, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
duplicate_idoriginal_idnamesourceunique_idsource_set
dedup_id
dedup::07b65089515c8f99812d14bbb01334a6[roar::474, roar::5541][474, 5541][ECNIS Repository (Environmental Cancer Risk, ...[roar, roar][roar_474, roar_5541]roar
dedup::0be44aa69610e09805d4002baf7e0b10[roar::16867, roar::2907][16867, 2907][Chung Shan Medical University Institutional R...[roar, roar][roar_16867, roar_2907]roar
dedup::0c34770edc42a1d2ac361b64cfabfb63[roar::5432, roar::4030][5432, 4030][Digital Library of Jelenia Góra, Digital Libr...[roar, roar][roar_5432, roar_4030]roar
dedup::0c6ed4b110c461d9350bf5c620bc78d7[roar::3020, roar::3401, roar::5252][3020, 3401, 5252][KCE Repository, KCE Repository, KCE Repository][roar, roar, roar][roar_3020, roar_3401, roar_5252]roar
dedup::0e3c63baca694032044bbb00c2f1111e[roar::8405, roar::8716][8405, 8716][Content Pro IRX, Content Pro IRX][roar, roar][roar_8405, roar_8716]roar
\n", "
" ], "text/plain": [ " duplicate_id \\\n", "dedup_id \n", "dedup::07b65089515c8f99812d14bbb01334a6 [roar::474, roar::5541] \n", "dedup::0be44aa69610e09805d4002baf7e0b10 [roar::16867, roar::2907] \n", "dedup::0c34770edc42a1d2ac361b64cfabfb63 [roar::5432, roar::4030] \n", "dedup::0c6ed4b110c461d9350bf5c620bc78d7 [roar::3020, roar::3401, roar::5252] \n", "dedup::0e3c63baca694032044bbb00c2f1111e [roar::8405, roar::8716] \n", "\n", " original_id \\\n", "dedup_id \n", "dedup::07b65089515c8f99812d14bbb01334a6 [474, 5541] \n", "dedup::0be44aa69610e09805d4002baf7e0b10 [16867, 2907] \n", "dedup::0c34770edc42a1d2ac361b64cfabfb63 [5432, 4030] \n", "dedup::0c6ed4b110c461d9350bf5c620bc78d7 [3020, 3401, 5252] \n", "dedup::0e3c63baca694032044bbb00c2f1111e [8405, 8716] \n", "\n", " name \\\n", "dedup_id \n", "dedup::07b65089515c8f99812d14bbb01334a6 [ECNIS Repository (Environmental Cancer Risk, ... \n", "dedup::0be44aa69610e09805d4002baf7e0b10 [Chung Shan Medical University Institutional R... \n", "dedup::0c34770edc42a1d2ac361b64cfabfb63 [Digital Library of Jelenia Góra, Digital Libr... 
\n", "dedup::0c6ed4b110c461d9350bf5c620bc78d7 [KCE Repository, KCE Repository, KCE Repository] \n", "dedup::0e3c63baca694032044bbb00c2f1111e [Content Pro IRX, Content Pro IRX] \n", "\n", " source \\\n", "dedup_id \n", "dedup::07b65089515c8f99812d14bbb01334a6 [roar, roar] \n", "dedup::0be44aa69610e09805d4002baf7e0b10 [roar, roar] \n", "dedup::0c34770edc42a1d2ac361b64cfabfb63 [roar, roar] \n", "dedup::0c6ed4b110c461d9350bf5c620bc78d7 [roar, roar, roar] \n", "dedup::0e3c63baca694032044bbb00c2f1111e [roar, roar] \n", "\n", " unique_id \\\n", "dedup_id \n", "dedup::07b65089515c8f99812d14bbb01334a6 [roar_474, roar_5541] \n", "dedup::0be44aa69610e09805d4002baf7e0b10 [roar_16867, roar_2907] \n", "dedup::0c34770edc42a1d2ac361b64cfabfb63 [roar_5432, roar_4030] \n", "dedup::0c6ed4b110c461d9350bf5c620bc78d7 [roar_3020, roar_3401, roar_5252] \n", "dedup::0e3c63baca694032044bbb00c2f1111e [roar_8405, roar_8716] \n", "\n", " source_set \n", "dedup_id \n", "dedup::07b65089515c8f99812d14bbb01334a6 roar \n", "dedup::0be44aa69610e09805d4002baf7e0b10 roar \n", "dedup::0c34770edc42a1d2ac361b64cfabfb63 roar \n", "dedup::0c6ed4b110c461d9350bf5c620bc78d7 roar \n", "dedup::0e3c63baca694032044bbb00c2f1111e roar " ] }, "execution_count": 21, "metadata": {}, "output_type": "execute_result" } ], "source": [ "dup_within['source_set'] = dup_within.source_set.map(set.pop)\n", "dup_within.head()" ] }, { "cell_type": "code", "execution_count": 22, "metadata": {}, "outputs": [ { "data": { "text/plain": [ "143" ] }, "execution_count": 22, "metadata": {}, "output_type": "execute_result" } ], "source": [ "dup_within.groupby('dedup_id').ngroups" ] }, { "cell_type": "code", "execution_count": 23, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
duplicate_idoriginal_idnamesourceunique_id
source_set
OpenDOAR1818181818
re3data22222
roar123123123123123
\n", "
" ], "text/plain": [ " duplicate_id original_id name source unique_id\n", "source_set \n", "OpenDOAR 18 18 18 18 18\n", "re3data 2 2 2 2 2\n", "roar 123 123 123 123 123" ] }, "execution_count": 23, "metadata": {}, "output_type": "execute_result" } ], "source": [ "dup_within.groupby('source_set').count()" ] }, { "cell_type": "code", "execution_count": 24, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
dedup_idduplicate_idoriginal_idnamesourceunique_id
122dedup::07b65089515c8f99812d14bbb01334a6roar::474474ECNIS Repository (Environmental Cancer Riskroarroar_474
123dedup::07b65089515c8f99812d14bbb01334a6roar::55415541ECNIS Repository (Environmental Cancer Riskroarroar_5541
184dedup::0be44aa69610e09805d4002baf7e0b10roar::1686716867Chung Shan Medical University Institutional Re...roarroar_16867
185dedup::0be44aa69610e09805d4002baf7e0b10roar::29072907Chung Shan Medical University Institutional Re...roarroar_2907
192dedup::0c34770edc42a1d2ac361b64cfabfb63roar::54325432Digital Library of Jelenia Góraroarroar_5432
.....................
4583dedup::f9293f212c2f13c7cc7a2d2a967ac7d5roar::1313413134Repositorio Universidad de Sucreroarroar_13134
4608dedup::fab2415bf42ac76e4ae00aa68b61a4baroar::54825482Biblioteca Virtual del Centro de Documentaciónroarroar_5482
4609dedup::fab2415bf42ac76e4ae00aa68b61a4baroar::52145214Biblioteca Virtual del Centro de Documentaciónroarroar_5214
4690dedup::fee4180dcb5f2af4d963b6d74d82d8c2roar::39923992York St John University ArchivalWare Digital L...roarroar_3992
4691dedup::fee4180dcb5f2af4d963b6d74d82d8c2roar::51855185York St John University ArchivalWare Digital L...roarroar_5185
\n", "

296 rows × 6 columns

\n", "
" ], "text/plain": [ " dedup_id duplicate_id original_id \\\n", "122 dedup::07b65089515c8f99812d14bbb01334a6 roar::474 474 \n", "123 dedup::07b65089515c8f99812d14bbb01334a6 roar::5541 5541 \n", "184 dedup::0be44aa69610e09805d4002baf7e0b10 roar::16867 16867 \n", "185 dedup::0be44aa69610e09805d4002baf7e0b10 roar::2907 2907 \n", "192 dedup::0c34770edc42a1d2ac361b64cfabfb63 roar::5432 5432 \n", "... ... ... ... \n", "4583 dedup::f9293f212c2f13c7cc7a2d2a967ac7d5 roar::13134 13134 \n", "4608 dedup::fab2415bf42ac76e4ae00aa68b61a4ba roar::5482 5482 \n", "4609 dedup::fab2415bf42ac76e4ae00aa68b61a4ba roar::5214 5214 \n", "4690 dedup::fee4180dcb5f2af4d963b6d74d82d8c2 roar::3992 3992 \n", "4691 dedup::fee4180dcb5f2af4d963b6d74d82d8c2 roar::5185 5185 \n", "\n", " name source unique_id \n", "122 ECNIS Repository (Environmental Cancer Risk roar roar_474 \n", "123 ECNIS Repository (Environmental Cancer Risk roar roar_5541 \n", "184 Chung Shan Medical University Institutional Re... roar roar_16867 \n", "185 Chung Shan Medical University Institutional Re... roar roar_2907 \n", "192 Digital Library of Jelenia Góra roar roar_5432 \n", "... ... ... ... \n", "4583 Repositorio Universidad de Sucre roar roar_13134 \n", "4608 Biblioteca Virtual del Centro de Documentación roar roar_5482 \n", "4609 Biblioteca Virtual del Centro de Documentación roar roar_5214 \n", "4690 York St John University ArchivalWare Digital L... roar roar_3992 \n", "4691 York St John University ArchivalWare Digital L... roar roar_5185 \n", "\n", "[296 rows x 6 columns]" ] }, "execution_count": 24, "metadata": {}, "output_type": "execute_result" } ], "source": [ "dup_within = dup[dup.dedup_id.isin(dup_within.index)]\n", "dup_within" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "# Isolating hybrid duplicates" ] }, { "cell_type": "code", "execution_count": 25, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
dedup_idduplicate_idoriginal_idnamesourceunique_id
53dedup::038ef33e8d3de51d3536d62e6c103be7roar::61676167Institutional Repository UIN Syarif Hidayatull...roarroar_6167
54dedup::038ef33e8d3de51d3536d62e6c103be7opendoar::27172717institutional repository uin syarif hidayatull...OpenDOAROpenDOAR_2717
55dedup::038ef33e8d3de51d3536d62e6c103be7roar::65806580Institutional Repository UIN Syarif Hidayatull...roarroar_6580
72dedup::044edcd1c961b3942a7e0e90d1005e2droar::79027902The University of Arizona Campus Repositoryroarroar_7902
73dedup::044edcd1c961b3942a7e0e90d1005e2dopendoar::24682468university of arizona campus repositoryOpenDOAROpenDOAR_2468
.....................
4596dedup::fa0721f07402e0593da77a46fa687da6opendoar::25452545sanok digital libraryOpenDOAROpenDOAR_2545
4597dedup::fa0721f07402e0593da77a46fa687da6roar::57465746Sanok Digital Libraryroarroar_5746
4610dedup::fab888b1713fb886b13bbd2d569bba60opendoar::25392539publication server of the wuppertal instituteOpenDOAROpenDOAR_2539
4611dedup::fab888b1713fb886b13bbd2d569bba60roar::1121211212Publication Server of the Wuppertal Instituteroarroar_11212
4612dedup::fab888b1713fb886b13bbd2d569bba60roar::58915891Publication Server of the Wuppertal Instituteroarroar_5891
\n", "

434 rows × 6 columns

\n", "
" ], "text/plain": [ " dedup_id duplicate_id original_id \\\n", "53 dedup::038ef33e8d3de51d3536d62e6c103be7 roar::6167 6167 \n", "54 dedup::038ef33e8d3de51d3536d62e6c103be7 opendoar::2717 2717 \n", "55 dedup::038ef33e8d3de51d3536d62e6c103be7 roar::6580 6580 \n", "72 dedup::044edcd1c961b3942a7e0e90d1005e2d roar::7902 7902 \n", "73 dedup::044edcd1c961b3942a7e0e90d1005e2d opendoar::2468 2468 \n", "... ... ... ... \n", "4596 dedup::fa0721f07402e0593da77a46fa687da6 opendoar::2545 2545 \n", "4597 dedup::fa0721f07402e0593da77a46fa687da6 roar::5746 5746 \n", "4610 dedup::fab888b1713fb886b13bbd2d569bba60 opendoar::2539 2539 \n", "4611 dedup::fab888b1713fb886b13bbd2d569bba60 roar::11212 11212 \n", "4612 dedup::fab888b1713fb886b13bbd2d569bba60 roar::5891 5891 \n", "\n", " name source \\\n", "53 Institutional Repository UIN Syarif Hidayatull... roar \n", "54 institutional repository uin syarif hidayatull... OpenDOAR \n", "55 Institutional Repository UIN Syarif Hidayatull... roar \n", "72 The University of Arizona Campus Repository roar \n", "73 university of arizona campus repository OpenDOAR \n", "... ... ... \n", "4596 sanok digital library OpenDOAR \n", "4597 Sanok Digital Library roar \n", "4610 publication server of the wuppertal institute OpenDOAR \n", "4611 Publication Server of the Wuppertal Institute roar \n", "4612 Publication Server of the Wuppertal Institute roar \n", "\n", " unique_id \n", "53 roar_6167 \n", "54 OpenDOAR_2717 \n", "55 roar_6580 \n", "72 roar_7902 \n", "73 OpenDOAR_2468 \n", "... ... 
\n", "4596 OpenDOAR_2545 \n", "4597 roar_5746 \n", "4610 OpenDOAR_2539 \n", "4611 roar_11212 \n", "4612 roar_5891 \n", "\n", "[434 rows x 6 columns]" ] }, "execution_count": 25, "metadata": {}, "output_type": "execute_result" } ], "source": [ "dup_across = dup[~dup.dedup_id.isin(dup_within.dedup_id)]\n", "dup_across = dup_across.groupby('dedup_id').aggregate(list)\n", "dup_across['source_set'] = dup_across.source.map(set)\n", "\n", "dup_hybrid = dup_across[dup_across.source_set.str.len() < dup_across.source.str.len()]\n", "dup_hybrid = dup[dup.dedup_id.isin(dup_hybrid.index)]\n", "dup_hybrid" ] }, { "cell_type": "code", "execution_count": 26, "metadata": {}, "outputs": [ { "data": { "text/plain": [ "138" ] }, "execution_count": 26, "metadata": {}, "output_type": "execute_result" } ], "source": [ "dup_hybrid.groupby('dedup_id').ngroups" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "# Isolating multiple-registry duplicates" ] }, { "cell_type": "code", "execution_count": 27, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
dedup_idduplicate_idoriginal_idnamesourceunique_id
0dedup::001e6d882e54c780ce269d3c46997287https://fairsharing.org/10.25504/FAIRsharing.q...2094RESID Database of Protein ModificationsFAIRsharingFAIRsharing_2094
1dedup::001e6d882e54c780ce269d3c46997287re3data::r3d100011306r3d100011306RESID Database of Protein Modificationsre3datare3data_r3d100011306
2dedup::003ab6b40af9b488decea7c582d150a2re3data::r3d100011894r3d100011894Synapsere3datare3data_r3d100011894
3dedup::003ab6b40af9b488decea7c582d150a2https://fairsharing.org/10.25504/FAIRsharing.d...2315SynapseFAIRsharingFAIRsharing_2315
4dedup::0048f2e3aa55ab88aaaac0cfa4153ad5opendoar::45624562erzincan binali yıldırım university institutio...OpenDOAROpenDOAR_4562
.....................
4707dedup::ff7d2ea87cebddb182db2fb8cf32aa89opendoar::21262126sophiaOpenDOAROpenDOAR_2126
4708dedup::ffb342887a73ec0ead022e0414d765b1roar::668668Infoscience: École polytechnique fédérale de L...roarroar_668
4709dedup::ffb342887a73ec0ead022e0414d765b1opendoar::185185infoscience - école polytechnique fédérale de ...OpenDOAROpenDOAR_185
4710dedup::ffbb6800107747f9224cdde0df95da7copendoar::31223122istanbul bilgi university library open accessOpenDOAROpenDOAR_3122
4711dedup::ffbb6800107747f9224cdde0df95da7croar::1364613646Istanbul Bilgi University Library Open Accessroarroar_13646
\n", "

3982 rows × 6 columns

\n", "
" ], "text/plain": [ " dedup_id \\\n", "0 dedup::001e6d882e54c780ce269d3c46997287 \n", "1 dedup::001e6d882e54c780ce269d3c46997287 \n", "2 dedup::003ab6b40af9b488decea7c582d150a2 \n", "3 dedup::003ab6b40af9b488decea7c582d150a2 \n", "4 dedup::0048f2e3aa55ab88aaaac0cfa4153ad5 \n", "... ... \n", "4707 dedup::ff7d2ea87cebddb182db2fb8cf32aa89 \n", "4708 dedup::ffb342887a73ec0ead022e0414d765b1 \n", "4709 dedup::ffb342887a73ec0ead022e0414d765b1 \n", "4710 dedup::ffbb6800107747f9224cdde0df95da7c \n", "4711 dedup::ffbb6800107747f9224cdde0df95da7c \n", "\n", " duplicate_id original_id \\\n", "0 https://fairsharing.org/10.25504/FAIRsharing.q... 2094 \n", "1 re3data::r3d100011306 r3d100011306 \n", "2 re3data::r3d100011894 r3d100011894 \n", "3 https://fairsharing.org/10.25504/FAIRsharing.d... 2315 \n", "4 opendoar::4562 4562 \n", "... ... ... \n", "4707 opendoar::2126 2126 \n", "4708 roar::668 668 \n", "4709 opendoar::185 185 \n", "4710 opendoar::3122 3122 \n", "4711 roar::13646 13646 \n", "\n", " name source \\\n", "0 RESID Database of Protein Modifications FAIRsharing \n", "1 RESID Database of Protein Modifications re3data \n", "2 Synapse re3data \n", "3 Synapse FAIRsharing \n", "4 erzincan binali yıldırım university institutio... OpenDOAR \n", "... ... ... \n", "4707 sophia OpenDOAR \n", "4708 Infoscience: École polytechnique fédérale de L... roar \n", "4709 infoscience - école polytechnique fédérale de ... OpenDOAR \n", "4710 istanbul bilgi university library open access OpenDOAR \n", "4711 Istanbul Bilgi University Library Open Access roar \n", "\n", " unique_id \n", "0 FAIRsharing_2094 \n", "1 re3data_r3d100011306 \n", "2 re3data_r3d100011894 \n", "3 FAIRsharing_2315 \n", "4 OpenDOAR_4562 \n", "... ... 
\n", "4707 OpenDOAR_2126 \n", "4708 roar_668 \n", "4709 OpenDOAR_185 \n", "4710 OpenDOAR_3122 \n", "4711 roar_13646 \n", "\n", "[3982 rows x 6 columns]" ] }, "execution_count": 27, "metadata": {}, "output_type": "execute_result" } ], "source": [ "# Rebuild the per-group source lists from `dup` rather than filtering the grouped\n", "# `dup_across` frame in place. The previous version reassigned `dup_across` from a\n", "# grouped frame to a row-level frame, so running this cell a second time failed\n", "# (the row-level frame has no `source_set` column).\n", "across_sources = (\n", "    dup[~dup.dedup_id.isin(dup_within.dedup_id)]\n", "    .groupby('dedup_id')['source']\n", "    .aggregate(list)\n", ")\n", "# Keep only the groups in which no source appears more than once.\n", "all_distinct = across_sources.map(set).str.len() == across_sources.str.len()\n", "dup_across = dup[dup.dedup_id.isin(across_sources[all_distinct].index)]\n", "dup_across" ] }, { "cell_type": "code", "execution_count": 28, "metadata": {}, "outputs": [ { "data": { "text/plain": [ "1958" ] }, "execution_count": 28, "metadata": {}, "output_type": "execute_result" } ], "source": [ "dup_across.groupby('dedup_id').ngroups" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "Double check partitions" ] }, { "cell_type": "code", "execution_count": 29, "metadata": {}, "outputs": [ { "data": { "text/plain": [ "dedup_id 4712\n", "duplicate_id 4712\n", "original_id 4712\n", "name 4712\n", "source 4712\n", "unique_id 4712\n", "dtype: int64" ] }, "execution_count": 29, "metadata": {}, "output_type": "execute_result" } ], "source": [ "dup.count()" ] }, { "cell_type": "code", "execution_count": 30, "metadata": {}, "outputs": [ { "data": { "text/plain": [ "dedup_id 4712\n", "duplicate_id 4712\n", "original_id 4712\n", "name 4712\n", "source 4712\n", "unique_id 4712\n", "dtype: int64" ] }, "execution_count": 30, "metadata": {}, "output_type": "execute_result" } ], "source": [ "dup_across.count() + dup_within.count() + dup_hybrid.count()" ] }, { "cell_type": "code", "execution_count": 31, "metadata": { "scrolled": true }, "outputs": [ { "data": { "text/plain": [ "2239" ] }, "execution_count": 31, "metadata": {}, "output_type": "execute_result" } ], "source": [ "dup_within.groupby('dedup_id').ngroups + dup_across.groupby('dedup_id').ngroups + dup_hybrid.groupby('dedup_id').ngroups" ] }, { "cell_type": "code", "execution_count": 32, "metadata": {}, "outputs": [ { "data": { "text/plain": [ "2239" 
] }, "execution_count": 32, "metadata": {}, "output_type": "execute_result" } ], "source": [ "dup.groupby('dedup_id').ngroups" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "# Joining information" ] }, { "cell_type": "code", "execution_count": 33, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
dedup_idduplicate_idoriginal_idnamesourceunique_idFAIRsharing_idFAIRsharing_typeFAIRsharing_attributes.created-atFAIRsharing_attributes.updated-atFAIRsharing_attributes.metadata.doiFAIRsharing_attributes.metadata.nameFAIRsharing_attributes.metadata.statusFAIRsharing_attributes.metadata.contactsFAIRsharing_attributes.metadata.homepageFAIRsharing_attributes.metadata.identifierFAIRsharing_attributes.metadata.descriptionFAIRsharing_attributes.metadata.abbreviationFAIRsharing_attributes.metadata.support-linksFAIRsharing_attributes.metadata.year-creationFAIRsharing_attributes.metadata.data-processesFAIRsharing_attributes.metadata.cross-referencesFAIRsharing_attributes.legacy-idsFAIRsharing_attributes.fairsharing-registryFAIRsharing_attributes.record-typeFAIRsharing_attributes.subjectsFAIRsharing_attributes.domainsFAIRsharing_attributes.taxonomiesFAIRsharing_attributes.user-defined-tagsFAIRsharing_attributes.countriesFAIRsharing_attributes.nameFAIRsharing_attributes.abbreviationFAIRsharing_attributes.urlFAIRsharing_attributes.doiFAIRsharing_attributes.fairsharing-licenceFAIRsharing_attributes.descriptionFAIRsharing_attributes.publicationsFAIRsharing_attributes.licence-linksFAIRsharing_attributes.url-for-logoFAIRsharing_attributes.metadata.citationsFAIRsharing_attributes.metadata.associated-toolsFAIRsharing_attributes.metadata.deprecation-reasonFAIRsharing_attributes.metadata.data-access-condition.typeFAIRsharing_attributes.metadata.data-contact-informationFAIRsharing_attributes.metadata.data-deposition-condition.urlFAIRsharing_attributes.metadata.data-deposition-condition.typeFAIRsharing_attributes.metadata.deprecation-dateFAIRsharing_attributes.metadata.access-pointsFAIRsharing_attributes.metadata.data-access-condition.urlFAIRsharing_attributes.metadata.resource-sustainability.urlFAIRsharing_attributes.metadata.resource-sustainability.nameFAIRsharing_attributes.metadata.data-preservation-policy.urlFAIRsharing_attributes.metadata.data-preservation-policy.nameFAIRsharing_at
tributes.metadata.data-access-for-pre-publication-reviewFAIRsharing_attributes.metadata.data-versioningFAIRsharing_attributes.metadata.data-curation.typeFAIRsharing_attributes.metadata.data-curation.urlFAIRsharing_attributes.metadata.citation-to-related-publicationsFAIRsharing_attributes.metadata.tombstoneFAIRsharing_unique_idre3data_orgIdentifierre3data_repositoryNamere3data_repositoryName.languagere3data_additionalNamere3data_repositoryURLre3data_repositoryIdentifierre3data_repositoryContactre3data_descriptionre3data_description.languagere3data_typere3data_sizere3data_startDatere3data_endDatere3data_repositoryLanguagere3data_subjectre3data_missionStatementURLre3data_contentTypere3data_providerTypere3data_keywordre3data_institutionre3data_policyre3data_databaseAccessre3data_databaseLicensere3data_dataAccessre3data_dataLicensere3data_dataUploadTypere3data_dataUploadLicensere3data_softwarere3data_versioningre3data_apire3data_pidSystemre3data_citationGuidelineURLre3data_aidSystemre3data_enhancedPublicationre3data_qualityManagementre3data_certificatere3data_metadataStandardre3data_syndicationre3data_remarksre3data_entryDatere3data_lastUpdatere3data_unique_idOpenDOAR_system_metadata.idOpenDOAR_repository_metadata.nameOpenDOAR_repository_metadata.alternativenameOpenDOAR_repository_metadata.urlOpenDOAR_repository_metadata.descriptionOpenDOAR_repository_metadata.typeOpenDOAR_repository_metadata.content_languagesOpenDOAR_system_metadata.date_modifiedOpenDOAR_system_metadata.date_createdOpenDOAR_repository_metadata.content_subjectsOpenDOAR_repository_metadata.content_typesOpenDOAR_organizationOpenDOAR_policy_urlsOpenDOAR_repository_metadata.softwareOpenDOAR_repository_metadata.oai_urlOpenDOAR_system_metadata.publicly_visibleOpenDOAR_repository_metadata.repository_statusOpenDOAR_repository_metadata.fulltext_record_countOpenDOAR_repository_metadata.metadata_record_countOpenDOAR_unique_idroar_eprintidroar_rev_numberroar_eprint_statusroar_useridroar_importidroar_sourceroar_dirro
ar_datestamproar_lastmodroar_status_changedroar_typeroar_succeedsroar_commentaryroar_metadata_visibilityroar_latituderoar_longituderoar_relation_typeroar_relation_uriroar_item_issues_idroar_item_issues_typeroar_item_issues_descriptionroar_item_issues_timestamproar_item_issues_statusroar_item_issues_reported_byroar_item_issues_resolved_byroar_item_issues_commentroar_item_issues_countroar_sword_depositorroar_sword_slugroar_exemplarroar_home_pageroar_titleroar_oai_pmhroar_sword_endpointroar_rss_feedroar_twitter_feedroar_descriptionroar_fulltextroar_open_accessroar_mandateroar_organisation_titleroar_organisation_home_pageroar_location_countryroar_location_cityroar_location_latituderoar_location_longituderoar_softwareroar_geonameroar_versionroar_subjectsroar_dateroar_noteroar_suggestionsroar_activity_lowroar_activity_mediumroar_activity_highroar_recordcountroar_recordhistoryroar_fulltexts_totalroar_fulltexts_docsroar_fulltexts_rtotalroar_fulltexts_rdocsroar_registry_nameroar_registry_idroar_submit_toroar_submitted_to_nameroar_submitted_to_doneroar_webometrics_rankroar_webometrics_sizeroar_webometrics_visibilityroar_webometrics_rich_filesroar_webometrics_scholarroar_monthly_depositsroar_total_depositsroar_associationroar_unique_id
0dedup::07b65089515c8f99812d14bbb01334a6roar::474474ECNIS Repository (Environmental Cancer Riskroarroar_474NaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaN474281archive1NaNNaNdisk0/00/00/04/742010-01-06 13:44:222011-07-06 08:19:532010-01-06 13:44:22otherNaNNaNshowNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaN0NaNNaNNaNhttp://ecnis.openrepository.com/ECNIS Repository (Environmental Cancer Risk, N...NaNNaNNaNNaNThis site is a subject specific repository con...TRUETRUENaNECNIS (Environmental Cancer Risk, Nutrition an...http://www.ecnis.orgplLodz51.819.5openrepogeoname_2_PLotherNaN2008-06-03 08:05:43NaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNopendoar1254NaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNroar_474
1dedup::07b65089515c8f99812d14bbb01334a6roar::55415541ECNIS Repository (Environmental Cancer Riskroarroar_5541NaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaN55418archive8NaNNaNdisk0/00/00/55/412012-12-12 01:21:032012-12-15 02:51:352012-12-12 01:21:03institutionalNaNNaNshowNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNhttp://ecnis.openrepository.com/ecnis/ECNIS Repository (Environmental Cancer Risk, N...NaNNaNNaNNaNThis site is a subject specific repository con...NaNNaNNaNECNIS Network of Excellencehttp://www.ecnis.org/plNaN51.819.5NaNgeoname_2_PLotherNaN2012-07-01 15:13:36NaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNopendoar1254NaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNroar_5541
2dedup::0be44aa69610e09805d4002baf7e0b10roar::1686716867Chung Shan Medical University Institutional Re...roarroar_16867NaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaN168673archive360NaNNaNdisk0/00/01/68/672021-02-25 13:06:192021-02-25 13:06:192021-02-25 13:06:19institutional2907NaNshowNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaN0NaNNaNNaNhttps://ir.csmu.edu.tw:8080Chung Shan Medical University Institutional Re...https://ir.csmu.edu.tw:8080/ir-oai/request?ver...NaNNaNNaNNaNTRUETRUEFALSENaNNaNNaNNaNNaNNaNdspaceNaNother[RT, RC0254, RC1200, R1, RK]2009-10-21 00:00:00NaNNaN0001000,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,28...NaNNaNNaNNaNNaNNaNcelestialNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNroar_16867
3dedup::0be44aa69610e09805d4002baf7e0b10roar::29072907Chung Shan Medical University Institutional Re...roarroar_2907NaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaN2907548archive360NaNNaNdisk0/00/00/29/072010-07-29 01:40:552021-02-17 06:33:342010-07-29 01:40:55institutionalNaNNaNno_searchNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaN0NaNNaNNaNhttps://ir.csmu.edu.tw:8080Chung Shan Medical University Institutional Re...https://ir.csmu.edu.tw:8080/ir-oai/request?ver...NaNNaNNaNNaNTRUETRUEFALSENaNNaNNaNNaNNaNNaNdspaceNaNother[RC0321, RT, RC0254, RC1200, R1, RK]2009-10-21 00:00:00NaNNaN0001000,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,28...NaNNaNNaNNaNNaNNaNcelestialNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNroar_2907
4dedup::0c34770edc42a1d2ac361b64cfabfb63roar::54325432Digital Library of Jelenia Góraroarroar_5432NaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaN54329archive8NaNNaNdisk0/00/00/54/322012-11-19 20:28:012012-11-26 06:53:382012-11-19 20:28:01institutionalNaNNaNshowNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNhttp://jbc.jelenia-gora.pl/dlibra.htmlDigital Library of Jelenia Górahttp://jbc.jelenia-gora.pl/dlibra/oai-pmh-repo...NaNNaNNaNUsers may set up RSS feeds to be alerted to ne...NaNNaNNaNJeleniogórskie Centrum Informacji i Edukacji R...http://biblioteka.jelenia-gora.pl/plNaN50.901215.7341NaNgeoname_2_PLotherNaN2012-07-01 15:12:22NaNNaN000200,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,19...NaNNaNNaNNaN[celestial, opendoar][4595, 2211]NaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNroar_5432
\n", "
" ], "text/plain": [ " dedup_id duplicate_id original_id \\\n", "0 dedup::07b65089515c8f99812d14bbb01334a6 roar::474 474 \n", "1 dedup::07b65089515c8f99812d14bbb01334a6 roar::5541 5541 \n", "2 dedup::0be44aa69610e09805d4002baf7e0b10 roar::16867 16867 \n", "3 dedup::0be44aa69610e09805d4002baf7e0b10 roar::2907 2907 \n", "4 dedup::0c34770edc42a1d2ac361b64cfabfb63 roar::5432 5432 \n", "\n", " name source unique_id \\\n", "0 ECNIS Repository (Environmental Cancer Risk roar roar_474 \n", "1 ECNIS Repository (Environmental Cancer Risk roar roar_5541 \n", "2 Chung Shan Medical University Institutional Re... roar roar_16867 \n", "3 Chung Shan Medical University Institutional Re... roar roar_2907 \n", "4 Digital Library of Jelenia Góra roar roar_5432 \n", "\n", " FAIRsharing_id FAIRsharing_type FAIRsharing_attributes.created-at \\\n", "0 NaN NaN NaN \n", "1 NaN NaN NaN \n", "2 NaN NaN NaN \n", "3 NaN NaN NaN \n", "4 NaN NaN NaN \n", "\n", " FAIRsharing_attributes.updated-at FAIRsharing_attributes.metadata.doi \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " FAIRsharing_attributes.metadata.name FAIRsharing_attributes.metadata.status \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " FAIRsharing_attributes.metadata.contacts \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.homepage \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.identifier \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.description \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.abbreviation \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.support-links \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " 
FAIRsharing_attributes.metadata.year-creation \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.data-processes \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.cross-references \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.legacy-ids \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.fairsharing-registry \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.record-type FAIRsharing_attributes.subjects \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " FAIRsharing_attributes.domains FAIRsharing_attributes.taxonomies \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " FAIRsharing_attributes.user-defined-tags FAIRsharing_attributes.countries \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " FAIRsharing_attributes.name FAIRsharing_attributes.abbreviation \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " FAIRsharing_attributes.url FAIRsharing_attributes.doi \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " FAIRsharing_attributes.fairsharing-licence \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.description FAIRsharing_attributes.publications \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " FAIRsharing_attributes.licence-links FAIRsharing_attributes.url-for-logo \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " FAIRsharing_attributes.metadata.citations \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " 
FAIRsharing_attributes.metadata.associated-tools \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.deprecation-reason \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.data-access-condition.type \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.data-contact-information \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.data-deposition-condition.url \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.data-deposition-condition.type \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.deprecation-date \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.access-points \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.data-access-condition.url \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.resource-sustainability.url \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.resource-sustainability.name \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.data-preservation-policy.url \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.data-preservation-policy.name \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.data-access-for-pre-publication-review \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.data-versioning \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " 
FAIRsharing_attributes.metadata.data-curation.type \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.data-curation.url \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.citation-to-related-publications \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.tombstone FAIRsharing_unique_id \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " re3data_orgIdentifier re3data_repositoryName \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " re3data_repositoryName.language re3data_additionalName \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " re3data_repositoryURL re3data_repositoryIdentifier \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " re3data_repositoryContact re3data_description re3data_description.language \\\n", "0 NaN NaN NaN \n", "1 NaN NaN NaN \n", "2 NaN NaN NaN \n", "3 NaN NaN NaN \n", "4 NaN NaN NaN \n", "\n", " re3data_type re3data_size re3data_startDate re3data_endDate \\\n", "0 NaN NaN NaN NaN \n", "1 NaN NaN NaN NaN \n", "2 NaN NaN NaN NaN \n", "3 NaN NaN NaN NaN \n", "4 NaN NaN NaN NaN \n", "\n", " re3data_repositoryLanguage re3data_subject re3data_missionStatementURL \\\n", "0 NaN NaN NaN \n", "1 NaN NaN NaN \n", "2 NaN NaN NaN \n", "3 NaN NaN NaN \n", "4 NaN NaN NaN \n", "\n", " re3data_contentType re3data_providerType re3data_keyword \\\n", "0 NaN NaN NaN \n", "1 NaN NaN NaN \n", "2 NaN NaN NaN \n", "3 NaN NaN NaN \n", "4 NaN NaN NaN \n", "\n", " re3data_institution re3data_policy re3data_databaseAccess \\\n", "0 NaN NaN NaN \n", "1 NaN NaN NaN \n", "2 NaN NaN NaN \n", "3 NaN NaN NaN \n", "4 NaN NaN NaN \n", "\n", " re3data_databaseLicense re3data_dataAccess re3data_dataLicense \\\n", "0 NaN NaN NaN \n", "1 NaN 
NaN NaN \n", "2 NaN NaN NaN \n", "3 NaN NaN NaN \n", "4 NaN NaN NaN \n", "\n", " re3data_dataUploadType re3data_dataUploadLicense re3data_software \\\n", "0 NaN NaN NaN \n", "1 NaN NaN NaN \n", "2 NaN NaN NaN \n", "3 NaN NaN NaN \n", "4 NaN NaN NaN \n", "\n", " re3data_versioning re3data_api re3data_pidSystem \\\n", "0 NaN NaN NaN \n", "1 NaN NaN NaN \n", "2 NaN NaN NaN \n", "3 NaN NaN NaN \n", "4 NaN NaN NaN \n", "\n", " re3data_citationGuidelineURL re3data_aidSystem re3data_enhancedPublication \\\n", "0 NaN NaN NaN \n", "1 NaN NaN NaN \n", "2 NaN NaN NaN \n", "3 NaN NaN NaN \n", "4 NaN NaN NaN \n", "\n", " re3data_qualityManagement re3data_certificate re3data_metadataStandard \\\n", "0 NaN NaN NaN \n", "1 NaN NaN NaN \n", "2 NaN NaN NaN \n", "3 NaN NaN NaN \n", "4 NaN NaN NaN \n", "\n", " re3data_syndication re3data_remarks re3data_entryDate re3data_lastUpdate \\\n", "0 NaN NaN NaN NaN \n", "1 NaN NaN NaN NaN \n", "2 NaN NaN NaN NaN \n", "3 NaN NaN NaN NaN \n", "4 NaN NaN NaN NaN \n", "\n", " re3data_unique_id OpenDOAR_system_metadata.id \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " OpenDOAR_repository_metadata.name \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " OpenDOAR_repository_metadata.alternativename \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " OpenDOAR_repository_metadata.url OpenDOAR_repository_metadata.description \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " OpenDOAR_repository_metadata.type \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " OpenDOAR_repository_metadata.content_languages \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " OpenDOAR_system_metadata.date_modified \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " OpenDOAR_system_metadata.date_created \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", 
"\n", " OpenDOAR_repository_metadata.content_subjects \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " OpenDOAR_repository_metadata.content_types OpenDOAR_organization \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " OpenDOAR_policy_urls OpenDOAR_repository_metadata.software \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " OpenDOAR_repository_metadata.oai_url \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " OpenDOAR_system_metadata.publicly_visible \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " OpenDOAR_repository_metadata.repository_status \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " OpenDOAR_repository_metadata.fulltext_record_count \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " OpenDOAR_repository_metadata.metadata_record_count OpenDOAR_unique_id \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " roar_eprintid roar_rev_number roar_eprint_status roar_userid roar_importid \\\n", "0 474 281 archive 1 NaN \n", "1 5541 8 archive 8 NaN \n", "2 16867 3 archive 360 NaN \n", "3 2907 548 archive 360 NaN \n", "4 5432 9 archive 8 NaN \n", "\n", " roar_source roar_dir roar_datestamp roar_lastmod \\\n", "0 NaN disk0/00/00/04/74 2010-01-06 13:44:22 2011-07-06 08:19:53 \n", "1 NaN disk0/00/00/55/41 2012-12-12 01:21:03 2012-12-15 02:51:35 \n", "2 NaN disk0/00/01/68/67 2021-02-25 13:06:19 2021-02-25 13:06:19 \n", "3 NaN disk0/00/00/29/07 2010-07-29 01:40:55 2021-02-17 06:33:34 \n", "4 NaN disk0/00/00/54/32 2012-11-19 20:28:01 2012-11-26 06:53:38 \n", "\n", " roar_status_changed roar_type roar_succeeds roar_commentary \\\n", "0 2010-01-06 13:44:22 other NaN NaN \n", "1 2012-12-12 01:21:03 institutional NaN NaN \n", "2 2021-02-25 13:06:19 institutional 2907 NaN \n", "3 2010-07-29 01:40:55 institutional NaN NaN 
\n", "4 2012-11-19 20:28:01 institutional NaN NaN \n", "\n", " roar_metadata_visibility roar_latitude roar_longitude roar_relation_type \\\n", "0 show NaN NaN NaN \n", "1 show NaN NaN NaN \n", "2 show NaN NaN NaN \n", "3 no_search NaN NaN NaN \n", "4 show NaN NaN NaN \n", "\n", " roar_relation_uri roar_item_issues_id roar_item_issues_type \\\n", "0 NaN NaN NaN \n", "1 NaN NaN NaN \n", "2 NaN NaN NaN \n", "3 NaN NaN NaN \n", "4 NaN NaN NaN \n", "\n", " roar_item_issues_description roar_item_issues_timestamp \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " roar_item_issues_status roar_item_issues_reported_by \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " roar_item_issues_resolved_by roar_item_issues_comment \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " roar_item_issues_count roar_sword_depositor roar_sword_slug roar_exemplar \\\n", "0 0 NaN NaN NaN \n", "1 NaN NaN NaN NaN \n", "2 0 NaN NaN NaN \n", "3 0 NaN NaN NaN \n", "4 NaN NaN NaN NaN \n", "\n", " roar_home_page \\\n", "0 http://ecnis.openrepository.com/ \n", "1 http://ecnis.openrepository.com/ecnis/ \n", "2 https://ir.csmu.edu.tw:8080 \n", "3 https://ir.csmu.edu.tw:8080 \n", "4 http://jbc.jelenia-gora.pl/dlibra.html \n", "\n", " roar_title \\\n", "0 ECNIS Repository (Environmental Cancer Risk, N... \n", "1 ECNIS Repository (Environmental Cancer Risk, N... \n", "2 Chung Shan Medical University Institutional Re... \n", "3 Chung Shan Medical University Institutional Re... \n", "4 Digital Library of Jelenia Góra \n", "\n", " roar_oai_pmh roar_sword_endpoint \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 https://ir.csmu.edu.tw:8080/ir-oai/request?ver... NaN \n", "3 https://ir.csmu.edu.tw:8080/ir-oai/request?ver... NaN \n", "4 http://jbc.jelenia-gora.pl/dlibra/oai-pmh-repo... 
NaN \n", "\n", " roar_rss_feed roar_twitter_feed \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " roar_description roar_fulltext \\\n", "0 This site is a subject specific repository con... TRUE \n", "1 This site is a subject specific repository con... NaN \n", "2 NaN TRUE \n", "3 NaN TRUE \n", "4 Users may set up RSS feeds to be alerted to ne... NaN \n", "\n", " roar_open_access roar_mandate \\\n", "0 TRUE NaN \n", "1 NaN NaN \n", "2 TRUE FALSE \n", "3 TRUE FALSE \n", "4 NaN NaN \n", "\n", " roar_organisation_title \\\n", "0 ECNIS (Environmental Cancer Risk, Nutrition an... \n", "1 ECNIS Network of Excellence \n", "2 NaN \n", "3 NaN \n", "4 Jeleniogórskie Centrum Informacji i Edukacji R... \n", "\n", " roar_organisation_home_page roar_location_country \\\n", "0 http://www.ecnis.org pl \n", "1 http://www.ecnis.org/ pl \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 http://biblioteka.jelenia-gora.pl/ pl \n", "\n", " roar_location_city roar_location_latitude roar_location_longitude \\\n", "0 Lodz 51.8 19.5 \n", "1 NaN 51.8 19.5 \n", "2 NaN NaN NaN \n", "3 NaN NaN NaN \n", "4 NaN 50.9012 15.7341 \n", "\n", " roar_software roar_geoname roar_version \\\n", "0 openrepo geoname_2_PL other \n", "1 NaN geoname_2_PL other \n", "2 dspace NaN other \n", "3 dspace NaN other \n", "4 NaN geoname_2_PL other \n", "\n", " roar_subjects roar_date roar_note \\\n", "0 NaN 2008-06-03 08:05:43 NaN \n", "1 NaN 2012-07-01 15:13:36 NaN \n", "2 [RT, RC0254, RC1200, R1, RK] 2009-10-21 00:00:00 NaN \n", "3 [RC0321, RT, RC0254, RC1200, R1, RK] 2009-10-21 00:00:00 NaN \n", "4 NaN 2012-07-01 15:12:22 NaN \n", "\n", " roar_suggestions roar_activity_low roar_activity_medium roar_activity_high \\\n", "0 NaN NaN NaN NaN \n", "1 NaN NaN NaN NaN \n", "2 NaN 0 0 0 \n", "3 NaN 0 0 0 \n", "4 NaN 0 0 0 \n", "\n", " roar_recordcount roar_recordhistory \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 100 0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,28... 
\n", "3 100 0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,28... \n", "4 20 0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,19... \n", "\n", " roar_fulltexts_total roar_fulltexts_docs roar_fulltexts_rtotal \\\n", "0 NaN NaN NaN \n", "1 NaN NaN NaN \n", "2 NaN NaN NaN \n", "3 NaN NaN NaN \n", "4 NaN NaN NaN \n", "\n", " roar_fulltexts_rdocs roar_registry_name roar_registry_id roar_submit_to \\\n", "0 NaN opendoar 1254 NaN \n", "1 NaN opendoar 1254 NaN \n", "2 NaN NaN NaN celestial \n", "3 NaN NaN NaN celestial \n", "4 NaN [celestial, opendoar] [4595, 2211] NaN \n", "\n", " roar_submitted_to_name roar_submitted_to_done roar_webometrics_rank \\\n", "0 NaN NaN NaN \n", "1 NaN NaN NaN \n", "2 NaN NaN NaN \n", "3 NaN NaN NaN \n", "4 NaN NaN NaN \n", "\n", " roar_webometrics_size roar_webometrics_visibility \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " roar_webometrics_rich_files roar_webometrics_scholar roar_monthly_deposits \\\n", "0 NaN NaN NaN \n", "1 NaN NaN NaN \n", "2 NaN NaN NaN \n", "3 NaN NaN NaN \n", "4 NaN NaN NaN \n", "\n", " roar_total_deposits roar_association roar_unique_id \n", "0 NaN NaN roar_474 \n", "1 NaN NaN roar_5541 \n", "2 NaN NaN roar_16867 \n", "3 NaN NaN roar_2907 \n", "4 NaN NaN roar_5432 " ] }, "execution_count": 33, "metadata": {}, "output_type": "execute_result" } ], "source": [ "dup_within = dup_within.merge(fairsharing_df, left_on='unique_id', right_on='FAIRsharing_unique_id', how='left')\n", "dup_within = dup_within.merge(re3data_df, left_on='unique_id', right_on='re3data_unique_id', how='left')\n", "dup_within = dup_within.merge(opendoar_df, left_on='unique_id', right_on='OpenDOAR_unique_id', how='left')\n", "dup_within = dup_within.merge(roar_df, left_on='unique_id', right_on='roar_unique_id', how='left')\n", "dup_within.head()" ] }, { "cell_type": "code", "execution_count": 34, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
dedup_idduplicate_idoriginal_idnamesourceunique_idFAIRsharing_idFAIRsharing_typeFAIRsharing_attributes.created-atFAIRsharing_attributes.updated-atFAIRsharing_attributes.metadata.doiFAIRsharing_attributes.metadata.nameFAIRsharing_attributes.metadata.statusFAIRsharing_attributes.metadata.contactsFAIRsharing_attributes.metadata.homepageFAIRsharing_attributes.metadata.identifierFAIRsharing_attributes.metadata.descriptionFAIRsharing_attributes.metadata.abbreviationFAIRsharing_attributes.metadata.support-linksFAIRsharing_attributes.metadata.year-creationFAIRsharing_attributes.metadata.data-processesFAIRsharing_attributes.metadata.cross-referencesFAIRsharing_attributes.legacy-idsFAIRsharing_attributes.fairsharing-registryFAIRsharing_attributes.record-typeFAIRsharing_attributes.subjectsFAIRsharing_attributes.domainsFAIRsharing_attributes.taxonomiesFAIRsharing_attributes.user-defined-tagsFAIRsharing_attributes.countriesFAIRsharing_attributes.nameFAIRsharing_attributes.abbreviationFAIRsharing_attributes.urlFAIRsharing_attributes.doiFAIRsharing_attributes.fairsharing-licenceFAIRsharing_attributes.descriptionFAIRsharing_attributes.publicationsFAIRsharing_attributes.licence-linksFAIRsharing_attributes.url-for-logoFAIRsharing_attributes.metadata.citationsFAIRsharing_attributes.metadata.associated-toolsFAIRsharing_attributes.metadata.deprecation-reasonFAIRsharing_attributes.metadata.data-access-condition.typeFAIRsharing_attributes.metadata.data-contact-informationFAIRsharing_attributes.metadata.data-deposition-condition.urlFAIRsharing_attributes.metadata.data-deposition-condition.typeFAIRsharing_attributes.metadata.deprecation-dateFAIRsharing_attributes.metadata.access-pointsFAIRsharing_attributes.metadata.data-access-condition.urlFAIRsharing_attributes.metadata.resource-sustainability.urlFAIRsharing_attributes.metadata.resource-sustainability.nameFAIRsharing_attributes.metadata.data-preservation-policy.urlFAIRsharing_attributes.metadata.data-preservation-policy.nameFAIRsharing_at
tributes.metadata.data-access-for-pre-publication-reviewFAIRsharing_attributes.metadata.data-versioningFAIRsharing_attributes.metadata.data-curation.typeFAIRsharing_attributes.metadata.data-curation.urlFAIRsharing_attributes.metadata.citation-to-related-publicationsFAIRsharing_attributes.metadata.tombstoneFAIRsharing_unique_idre3data_orgIdentifierre3data_repositoryNamere3data_repositoryName.languagere3data_additionalNamere3data_repositoryURLre3data_repositoryIdentifierre3data_repositoryContactre3data_descriptionre3data_description.languagere3data_typere3data_sizere3data_startDatere3data_endDatere3data_repositoryLanguagere3data_subjectre3data_missionStatementURLre3data_contentTypere3data_providerTypere3data_keywordre3data_institutionre3data_policyre3data_databaseAccessre3data_databaseLicensere3data_dataAccessre3data_dataLicensere3data_dataUploadTypere3data_dataUploadLicensere3data_softwarere3data_versioningre3data_apire3data_pidSystemre3data_citationGuidelineURLre3data_aidSystemre3data_enhancedPublicationre3data_qualityManagementre3data_certificatere3data_metadataStandardre3data_syndicationre3data_remarksre3data_entryDatere3data_lastUpdatere3data_unique_idOpenDOAR_system_metadata.idOpenDOAR_repository_metadata.nameOpenDOAR_repository_metadata.alternativenameOpenDOAR_repository_metadata.urlOpenDOAR_repository_metadata.descriptionOpenDOAR_repository_metadata.typeOpenDOAR_repository_metadata.content_languagesOpenDOAR_system_metadata.date_modifiedOpenDOAR_system_metadata.date_createdOpenDOAR_repository_metadata.content_subjectsOpenDOAR_repository_metadata.content_typesOpenDOAR_organizationOpenDOAR_policy_urlsOpenDOAR_repository_metadata.softwareOpenDOAR_repository_metadata.oai_urlOpenDOAR_system_metadata.publicly_visibleOpenDOAR_repository_metadata.repository_statusOpenDOAR_repository_metadata.fulltext_record_countOpenDOAR_repository_metadata.metadata_record_countOpenDOAR_unique_idroar_eprintidroar_rev_numberroar_eprint_statusroar_useridroar_importidroar_sourceroar_dirro
ar_datestamproar_lastmodroar_status_changedroar_typeroar_succeedsroar_commentaryroar_metadata_visibilityroar_latituderoar_longituderoar_relation_typeroar_relation_uriroar_item_issues_idroar_item_issues_typeroar_item_issues_descriptionroar_item_issues_timestamproar_item_issues_statusroar_item_issues_reported_byroar_item_issues_resolved_byroar_item_issues_commentroar_item_issues_countroar_sword_depositorroar_sword_slugroar_exemplarroar_home_pageroar_titleroar_oai_pmhroar_sword_endpointroar_rss_feedroar_twitter_feedroar_descriptionroar_fulltextroar_open_accessroar_mandateroar_organisation_titleroar_organisation_home_pageroar_location_countryroar_location_cityroar_location_latituderoar_location_longituderoar_softwareroar_geonameroar_versionroar_subjectsroar_dateroar_noteroar_suggestionsroar_activity_lowroar_activity_mediumroar_activity_highroar_recordcountroar_recordhistoryroar_fulltexts_totalroar_fulltexts_docsroar_fulltexts_rtotalroar_fulltexts_rdocsroar_registry_nameroar_registry_idroar_submit_toroar_submitted_to_nameroar_submitted_to_doneroar_webometrics_rankroar_webometrics_sizeroar_webometrics_visibilityroar_webometrics_rich_filesroar_webometrics_scholarroar_monthly_depositsroar_total_depositsroar_associationroar_unique_id
0dedup::038ef33e8d3de51d3536d62e6c103be7roar::61676167Institutional Repository UIN Syarif Hidayatull...roarroar_6167NaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaN616713archive2178NaNNaNdisk0/00/00/61/672012-12-12 05:42:582013-07-14 15:12:122012-12-12 05:42:58institutionalNaNNaNshowNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNhttp://repository.uinjkt.ac.idInstitutional Repository UIN Syarif Hidayatull...[http://repository.uinjkt.ac.id/oai, http://re...http://repository.uinjkt.ac.id/sword/NaNNaNnstitutional Repository UIN Syarif Hidayatulla...TRUETRUEFALSE[UIN Syarif Hidayatullah Jakarta, Pascasarjana...[http://www.uinjkt.ac.id, http://graduate.uinj...idJakartaNaNNaNdspacegeoname_2_IDotherAI2012-11-07 08:11:19NaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaN[celestial, opendoar][5108, 2717, 5109]NaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNroar_6167
1dedup::038ef33e8d3de51d3536d62e6c103be7opendoar::27172717institutional repository uin syarif hidayatull...OpenDOAROpenDOAR_2717NaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaN2717{\"name\": \"institutional repository uin syarif ...[]http://repository.uinjkt.ac.id/dspace/NaNinstitutional[]2022-01-12 15:35:362013-07-11 15:52:01[science, arts, humanities, social sciences, h...[theses_and_dissertations][{'name': 'uin syarif hidayatullah jakarta, st...[]{\"name\": \"dspace\", \"version\": \"\"}http://repository.uinjkt.ac.id/oai/yesNaN0.036862.0OpenDOAR_2717NaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaN
2dedup::038ef33e8d3de51d3536d62e6c103be7roar::65806580Institutional Repository UIN Syarif Hidayatull...roarroar_6580NaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaN658016archive2040NaNNaNdisk0/00/00/65/802013-03-31 16:02:512013-04-06 01:42:142013-03-31 16:02:51institutionalNaNNaNshowNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNhttp://repository.uinjkt.ac.idInstitutional Repository UIN Syarif Hidayatull...NaNNaNNaNNaNNaNFALSEFALSEFALSENaNNaNidJakarta106.756-6.30591dspacegeoname_2_IDother[AC, Z665, Z004, Z719, BP, Q1]2013-03-04 07:20:37NaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNroar_6580
3dedup::044edcd1c961b3942a7e0e90d1005e2droar::79027902The University of Arizona Campus Repositoryroarroar_7902NaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaN790212archive4910NaNNaNdisk0/00/00/79/022014-03-05 11:50:292014-05-08 13:10:292014-03-05 11:50:29institutionalNaNNaNshowNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNhttp://arizona.openrepository.com/arizona/The University of Arizona Campus Repositoryhttp://arizona.openrepository.com/arizona/oai/...NaNhttp://arizona.openrepository.com/arizona/feed...NaNThe UA Campus Repository is an institutional r...TRUETRUEFALSEThe University of Arizonahttp://www.arizona.edu/usTucsonNaNNaNdspacegeoname_2_USotherNaN2014-02-25 20:17:47NaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaN[celestial, opendoar][5404, http://opendoar.org/id/2468/]NaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNroar_7902
4dedup::044edcd1c961b3942a7e0e90d1005e2dopendoar::24682468university of arizona campus repositoryOpenDOAROpenDOAR_2468NaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaN2468{\"name\": \"university of arizona campus reposit...[]http://arizona.openrepository.com/arizona/NaNinstitutional[]2022-01-12 15:35:322012-05-02 09:50:07[science, arts, humanities, health and medicin...[journal_articles, theses_and_dissertations, u...[{'name': 'university of arizona', 'alternativ...[]{\"name\": \"other\", \"version\": \"\"}NaNyesNaNNaN63231.0OpenDOAR_2468NaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaN
\n", "
" ], "text/plain": [ " dedup_id duplicate_id original_id \\\n", "0 dedup::038ef33e8d3de51d3536d62e6c103be7 roar::6167 6167 \n", "1 dedup::038ef33e8d3de51d3536d62e6c103be7 opendoar::2717 2717 \n", "2 dedup::038ef33e8d3de51d3536d62e6c103be7 roar::6580 6580 \n", "3 dedup::044edcd1c961b3942a7e0e90d1005e2d roar::7902 7902 \n", "4 dedup::044edcd1c961b3942a7e0e90d1005e2d opendoar::2468 2468 \n", "\n", " name source unique_id \\\n", "0 Institutional Repository UIN Syarif Hidayatull... roar roar_6167 \n", "1 institutional repository uin syarif hidayatull... OpenDOAR OpenDOAR_2717 \n", "2 Institutional Repository UIN Syarif Hidayatull... roar roar_6580 \n", "3 The University of Arizona Campus Repository roar roar_7902 \n", "4 university of arizona campus repository OpenDOAR OpenDOAR_2468 \n", "\n", " FAIRsharing_id FAIRsharing_type FAIRsharing_attributes.created-at \\\n", "0 NaN NaN NaN \n", "1 NaN NaN NaN \n", "2 NaN NaN NaN \n", "3 NaN NaN NaN \n", "4 NaN NaN NaN \n", "\n", " FAIRsharing_attributes.updated-at FAIRsharing_attributes.metadata.doi \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " FAIRsharing_attributes.metadata.name FAIRsharing_attributes.metadata.status \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " FAIRsharing_attributes.metadata.contacts \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.homepage \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.identifier \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.description \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.abbreviation \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.support-links \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 
NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.year-creation \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.data-processes \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.cross-references \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.legacy-ids \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.fairsharing-registry \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.record-type FAIRsharing_attributes.subjects \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " FAIRsharing_attributes.domains FAIRsharing_attributes.taxonomies \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " FAIRsharing_attributes.user-defined-tags FAIRsharing_attributes.countries \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " FAIRsharing_attributes.name FAIRsharing_attributes.abbreviation \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " FAIRsharing_attributes.url FAIRsharing_attributes.doi \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " FAIRsharing_attributes.fairsharing-licence \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.description FAIRsharing_attributes.publications \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " FAIRsharing_attributes.licence-links FAIRsharing_attributes.url-for-logo \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " FAIRsharing_attributes.metadata.citations \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " 
FAIRsharing_attributes.metadata.associated-tools \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.deprecation-reason \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.data-access-condition.type \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.data-contact-information \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.data-deposition-condition.url \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.data-deposition-condition.type \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.deprecation-date \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.access-points \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.data-access-condition.url \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.resource-sustainability.url \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.resource-sustainability.name \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.data-preservation-policy.url \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.data-preservation-policy.name \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.data-access-for-pre-publication-review \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.data-versioning \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " 
FAIRsharing_attributes.metadata.data-curation.type \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.data-curation.url \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.citation-to-related-publications \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.tombstone FAIRsharing_unique_id \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " re3data_orgIdentifier re3data_repositoryName \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " re3data_repositoryName.language re3data_additionalName \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " re3data_repositoryURL re3data_repositoryIdentifier \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " re3data_repositoryContact re3data_description re3data_description.language \\\n", "0 NaN NaN NaN \n", "1 NaN NaN NaN \n", "2 NaN NaN NaN \n", "3 NaN NaN NaN \n", "4 NaN NaN NaN \n", "\n", " re3data_type re3data_size re3data_startDate re3data_endDate \\\n", "0 NaN NaN NaN NaN \n", "1 NaN NaN NaN NaN \n", "2 NaN NaN NaN NaN \n", "3 NaN NaN NaN NaN \n", "4 NaN NaN NaN NaN \n", "\n", " re3data_repositoryLanguage re3data_subject re3data_missionStatementURL \\\n", "0 NaN NaN NaN \n", "1 NaN NaN NaN \n", "2 NaN NaN NaN \n", "3 NaN NaN NaN \n", "4 NaN NaN NaN \n", "\n", " re3data_contentType re3data_providerType re3data_keyword \\\n", "0 NaN NaN NaN \n", "1 NaN NaN NaN \n", "2 NaN NaN NaN \n", "3 NaN NaN NaN \n", "4 NaN NaN NaN \n", "\n", " re3data_institution re3data_policy re3data_databaseAccess \\\n", "0 NaN NaN NaN \n", "1 NaN NaN NaN \n", "2 NaN NaN NaN \n", "3 NaN NaN NaN \n", "4 NaN NaN NaN \n", "\n", " re3data_databaseLicense re3data_dataAccess re3data_dataLicense \\\n", "0 NaN NaN NaN \n", "1 NaN 
NaN NaN \n", "2 NaN NaN NaN \n", "3 NaN NaN NaN \n", "4 NaN NaN NaN \n", "\n", " re3data_dataUploadType re3data_dataUploadLicense re3data_software \\\n", "0 NaN NaN NaN \n", "1 NaN NaN NaN \n", "2 NaN NaN NaN \n", "3 NaN NaN NaN \n", "4 NaN NaN NaN \n", "\n", " re3data_versioning re3data_api re3data_pidSystem \\\n", "0 NaN NaN NaN \n", "1 NaN NaN NaN \n", "2 NaN NaN NaN \n", "3 NaN NaN NaN \n", "4 NaN NaN NaN \n", "\n", " re3data_citationGuidelineURL re3data_aidSystem re3data_enhancedPublication \\\n", "0 NaN NaN NaN \n", "1 NaN NaN NaN \n", "2 NaN NaN NaN \n", "3 NaN NaN NaN \n", "4 NaN NaN NaN \n", "\n", " re3data_qualityManagement re3data_certificate re3data_metadataStandard \\\n", "0 NaN NaN NaN \n", "1 NaN NaN NaN \n", "2 NaN NaN NaN \n", "3 NaN NaN NaN \n", "4 NaN NaN NaN \n", "\n", " re3data_syndication re3data_remarks re3data_entryDate re3data_lastUpdate \\\n", "0 NaN NaN NaN NaN \n", "1 NaN NaN NaN NaN \n", "2 NaN NaN NaN NaN \n", "3 NaN NaN NaN NaN \n", "4 NaN NaN NaN NaN \n", "\n", " re3data_unique_id OpenDOAR_system_metadata.id \\\n", "0 NaN NaN \n", "1 NaN 2717 \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN 2468 \n", "\n", " OpenDOAR_repository_metadata.name \\\n", "0 NaN \n", "1 {\"name\": \"institutional repository uin syarif ... \n", "2 NaN \n", "3 NaN \n", "4 {\"name\": \"university of arizona campus reposit... 
\n", "\n", " OpenDOAR_repository_metadata.alternativename \\\n", "0 NaN \n", "1 [] \n", "2 NaN \n", "3 NaN \n", "4 [] \n", "\n", " OpenDOAR_repository_metadata.url \\\n", "0 NaN \n", "1 http://repository.uinjkt.ac.id/dspace/ \n", "2 NaN \n", "3 NaN \n", "4 http://arizona.openrepository.com/arizona/ \n", "\n", " OpenDOAR_repository_metadata.description OpenDOAR_repository_metadata.type \\\n", "0 NaN NaN \n", "1 NaN institutional \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN institutional \n", "\n", " OpenDOAR_repository_metadata.content_languages \\\n", "0 NaN \n", "1 [] \n", "2 NaN \n", "3 NaN \n", "4 [] \n", "\n", " OpenDOAR_system_metadata.date_modified \\\n", "0 NaN \n", "1 2022-01-12 15:35:36 \n", "2 NaN \n", "3 NaN \n", "4 2022-01-12 15:35:32 \n", "\n", " OpenDOAR_system_metadata.date_created \\\n", "0 NaN \n", "1 2013-07-11 15:52:01 \n", "2 NaN \n", "3 NaN \n", "4 2012-05-02 09:50:07 \n", "\n", " OpenDOAR_repository_metadata.content_subjects \\\n", "0 NaN \n", "1 [science, arts, humanities, social sciences, h... \n", "2 NaN \n", "3 NaN \n", "4 [science, arts, humanities, health and medicin... \n", "\n", " OpenDOAR_repository_metadata.content_types \\\n", "0 NaN \n", "1 [theses_and_dissertations] \n", "2 NaN \n", "3 NaN \n", "4 [journal_articles, theses_and_dissertations, u... \n", "\n", " OpenDOAR_organization OpenDOAR_policy_urls \\\n", "0 NaN NaN \n", "1 [{'name': 'uin syarif hidayatullah jakarta, st... [] \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 [{'name': 'university of arizona', 'alternativ... 
[] \n", "\n", " OpenDOAR_repository_metadata.software OpenDOAR_repository_metadata.oai_url \\\n", "0 NaN NaN \n", "1 {\"name\": \"dspace\", \"version\": \"\"} http://repository.uinjkt.ac.id/oai/ \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 {\"name\": \"other\", \"version\": \"\"} NaN \n", "\n", " OpenDOAR_system_metadata.publicly_visible \\\n", "0 NaN \n", "1 yes \n", "2 NaN \n", "3 NaN \n", "4 yes \n", "\n", " OpenDOAR_repository_metadata.repository_status \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " OpenDOAR_repository_metadata.fulltext_record_count \\\n", "0 NaN \n", "1 0.0 \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " OpenDOAR_repository_metadata.metadata_record_count OpenDOAR_unique_id \\\n", "0 NaN NaN \n", "1 36862.0 OpenDOAR_2717 \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 63231.0 OpenDOAR_2468 \n", "\n", " roar_eprintid roar_rev_number roar_eprint_status roar_userid roar_importid \\\n", "0 6167 13 archive 2178 NaN \n", "1 NaN NaN NaN NaN NaN \n", "2 6580 16 archive 2040 NaN \n", "3 7902 12 archive 4910 NaN \n", "4 NaN NaN NaN NaN NaN \n", "\n", " roar_source roar_dir roar_datestamp roar_lastmod \\\n", "0 NaN disk0/00/00/61/67 2012-12-12 05:42:58 2013-07-14 15:12:12 \n", "1 NaN NaN NaN NaN \n", "2 NaN disk0/00/00/65/80 2013-03-31 16:02:51 2013-04-06 01:42:14 \n", "3 NaN disk0/00/00/79/02 2014-03-05 11:50:29 2014-05-08 13:10:29 \n", "4 NaN NaN NaN NaN \n", "\n", " roar_status_changed roar_type roar_succeeds roar_commentary \\\n", "0 2012-12-12 05:42:58 institutional NaN NaN \n", "1 NaN NaN NaN NaN \n", "2 2013-03-31 16:02:51 institutional NaN NaN \n", "3 2014-03-05 11:50:29 institutional NaN NaN \n", "4 NaN NaN NaN NaN \n", "\n", " roar_metadata_visibility roar_latitude roar_longitude roar_relation_type \\\n", "0 show NaN NaN NaN \n", "1 NaN NaN NaN NaN \n", "2 show NaN NaN NaN \n", "3 show NaN NaN NaN \n", "4 NaN NaN NaN NaN \n", "\n", " roar_relation_uri roar_item_issues_id roar_item_issues_type \\\n", "0 NaN NaN NaN \n", "1 NaN NaN 
NaN \n", "2 NaN NaN NaN \n", "3 NaN NaN NaN \n", "4 NaN NaN NaN \n", "\n", " roar_item_issues_description roar_item_issues_timestamp \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " roar_item_issues_status roar_item_issues_reported_by \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " roar_item_issues_resolved_by roar_item_issues_comment \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " roar_item_issues_count roar_sword_depositor roar_sword_slug roar_exemplar \\\n", "0 NaN NaN NaN NaN \n", "1 NaN NaN NaN NaN \n", "2 NaN NaN NaN NaN \n", "3 NaN NaN NaN NaN \n", "4 NaN NaN NaN NaN \n", "\n", " roar_home_page \\\n", "0 http://repository.uinjkt.ac.id \n", "1 NaN \n", "2 http://repository.uinjkt.ac.id \n", "3 http://arizona.openrepository.com/arizona/ \n", "4 NaN \n", "\n", " roar_title \\\n", "0 Institutional Repository UIN Syarif Hidayatull... \n", "1 NaN \n", "2 Institutional Repository UIN Syarif Hidayatull... \n", "3 The University of Arizona Campus Repository \n", "4 NaN \n", "\n", " roar_oai_pmh \\\n", "0 [http://repository.uinjkt.ac.id/oai, http://re... \n", "1 NaN \n", "2 NaN \n", "3 http://arizona.openrepository.com/arizona/oai/... \n", "4 NaN \n", "\n", " roar_sword_endpoint \\\n", "0 http://repository.uinjkt.ac.id/sword/ \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " roar_rss_feed roar_twitter_feed \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 http://arizona.openrepository.com/arizona/feed... NaN \n", "4 NaN NaN \n", "\n", " roar_description roar_fulltext \\\n", "0 nstitutional Repository UIN Syarif Hidayatulla... TRUE \n", "1 NaN NaN \n", "2 NaN FALSE \n", "3 The UA Campus Repository is an institutional r... 
TRUE \n", "4 NaN NaN \n", "\n", " roar_open_access roar_mandate \\\n", "0 TRUE FALSE \n", "1 NaN NaN \n", "2 FALSE FALSE \n", "3 TRUE FALSE \n", "4 NaN NaN \n", "\n", " roar_organisation_title \\\n", "0 [UIN Syarif Hidayatullah Jakarta, Pascasarjana... \n", "1 NaN \n", "2 NaN \n", "3 The University of Arizona \n", "4 NaN \n", "\n", " roar_organisation_home_page roar_location_country \\\n", "0 [http://www.uinjkt.ac.id, http://graduate.uinj... id \n", "1 NaN NaN \n", "2 NaN id \n", "3 http://www.arizona.edu/ us \n", "4 NaN NaN \n", "\n", " roar_location_city roar_location_latitude roar_location_longitude \\\n", "0 Jakarta NaN NaN \n", "1 NaN NaN NaN \n", "2 Jakarta 106.756 -6.30591 \n", "3 Tucson NaN NaN \n", "4 NaN NaN NaN \n", "\n", " roar_software roar_geoname roar_version roar_subjects \\\n", "0 dspace geoname_2_ID other AI \n", "1 NaN NaN NaN NaN \n", "2 dspace geoname_2_ID other [AC, Z665, Z004, Z719, BP, Q1] \n", "3 dspace geoname_2_US other NaN \n", "4 NaN NaN NaN NaN \n", "\n", " roar_date roar_note roar_suggestions roar_activity_low \\\n", "0 2012-11-07 08:11:19 NaN NaN NaN \n", "1 NaN NaN NaN NaN \n", "2 2013-03-04 07:20:37 NaN NaN NaN \n", "3 2014-02-25 20:17:47 NaN NaN NaN \n", "4 NaN NaN NaN NaN \n", "\n", " roar_activity_medium roar_activity_high roar_recordcount roar_recordhistory \\\n", "0 NaN NaN NaN NaN \n", "1 NaN NaN NaN NaN \n", "2 NaN NaN NaN NaN \n", "3 NaN NaN NaN NaN \n", "4 NaN NaN NaN NaN \n", "\n", " roar_fulltexts_total roar_fulltexts_docs roar_fulltexts_rtotal \\\n", "0 NaN NaN NaN \n", "1 NaN NaN NaN \n", "2 NaN NaN NaN \n", "3 NaN NaN NaN \n", "4 NaN NaN NaN \n", "\n", " roar_fulltexts_rdocs roar_registry_name \\\n", "0 NaN [celestial, opendoar] \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN [celestial, opendoar] \n", "4 NaN NaN \n", "\n", " roar_registry_id roar_submit_to roar_submitted_to_name \\\n", "0 [5108, 2717, 5109] NaN NaN \n", "1 NaN NaN NaN \n", "2 NaN NaN NaN \n", "3 [5404, http://opendoar.org/id/2468/] NaN NaN \n", "4 NaN 
NaN NaN \n", "\n", " roar_submitted_to_done roar_webometrics_rank roar_webometrics_size \\\n", "0 NaN NaN NaN \n", "1 NaN NaN NaN \n", "2 NaN NaN NaN \n", "3 NaN NaN NaN \n", "4 NaN NaN NaN \n", "\n", " roar_webometrics_visibility roar_webometrics_rich_files \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " roar_webometrics_scholar roar_monthly_deposits roar_total_deposits \\\n", "0 NaN NaN NaN \n", "1 NaN NaN NaN \n", "2 NaN NaN NaN \n", "3 NaN NaN NaN \n", "4 NaN NaN NaN \n", "\n", " roar_association roar_unique_id \n", "0 NaN roar_6167 \n", "1 NaN NaN \n", "2 NaN roar_6580 \n", "3 NaN roar_7902 \n", "4 NaN NaN " ] }, "execution_count": 34, "metadata": {}, "output_type": "execute_result" } ], "source": [ "# Left-join each registry table onto dup_hybrid: unique_id is matched against\n", "# the registry's own prefixed id column, and how='left' keeps every dup_hybrid\n", "# row (columns of registries that do not match a row are filled with NaN).\n", "_registry_joins = [\n", "    (fairsharing_df, 'FAIRsharing_unique_id'),\n", "    (re3data_df, 're3data_unique_id'),\n", "    (opendoar_df, 'OpenDOAR_unique_id'),\n", "    (roar_df, 'roar_unique_id'),\n", "]\n", "for _right_df, _right_key in _registry_joins:\n", "    # Skip a registry whose key column is already present, so re-running this\n", "    # cell does not merge the same table twice (pandas would otherwise duplicate\n", "    # every overlapping column with _x/_y suffixes).\n", "    if _right_key in dup_hybrid.columns:\n", "        continue\n", "    dup_hybrid = dup_hybrid.merge(_right_df, left_on='unique_id', right_on=_right_key, how='left')\n", "dup_hybrid.head()" ] }, { "cell_type": "code", "execution_count": 35, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
dedup_idduplicate_idoriginal_idnamesourceunique_idFAIRsharing_idFAIRsharing_typeFAIRsharing_attributes.created-atFAIRsharing_attributes.updated-atFAIRsharing_attributes.metadata.doiFAIRsharing_attributes.metadata.nameFAIRsharing_attributes.metadata.statusFAIRsharing_attributes.metadata.contactsFAIRsharing_attributes.metadata.homepageFAIRsharing_attributes.metadata.identifierFAIRsharing_attributes.metadata.descriptionFAIRsharing_attributes.metadata.abbreviationFAIRsharing_attributes.metadata.support-linksFAIRsharing_attributes.metadata.year-creationFAIRsharing_attributes.metadata.data-processesFAIRsharing_attributes.metadata.cross-referencesFAIRsharing_attributes.legacy-idsFAIRsharing_attributes.fairsharing-registryFAIRsharing_attributes.record-typeFAIRsharing_attributes.subjectsFAIRsharing_attributes.domainsFAIRsharing_attributes.taxonomiesFAIRsharing_attributes.user-defined-tagsFAIRsharing_attributes.countriesFAIRsharing_attributes.nameFAIRsharing_attributes.abbreviationFAIRsharing_attributes.urlFAIRsharing_attributes.doiFAIRsharing_attributes.fairsharing-licenceFAIRsharing_attributes.descriptionFAIRsharing_attributes.publicationsFAIRsharing_attributes.licence-linksFAIRsharing_attributes.url-for-logoFAIRsharing_attributes.metadata.citationsFAIRsharing_attributes.metadata.associated-toolsFAIRsharing_attributes.metadata.deprecation-reasonFAIRsharing_attributes.metadata.data-access-condition.typeFAIRsharing_attributes.metadata.data-contact-informationFAIRsharing_attributes.metadata.data-deposition-condition.urlFAIRsharing_attributes.metadata.data-deposition-condition.typeFAIRsharing_attributes.metadata.deprecation-dateFAIRsharing_attributes.metadata.access-pointsFAIRsharing_attributes.metadata.data-access-condition.urlFAIRsharing_attributes.metadata.resource-sustainability.urlFAIRsharing_attributes.metadata.resource-sustainability.nameFAIRsharing_attributes.metadata.data-preservation-policy.urlFAIRsharing_attributes.metadata.data-preservation-policy.nameFAIRsharing_at
tributes.metadata.data-access-for-pre-publication-reviewFAIRsharing_attributes.metadata.data-versioningFAIRsharing_attributes.metadata.data-curation.typeFAIRsharing_attributes.metadata.data-curation.urlFAIRsharing_attributes.metadata.citation-to-related-publicationsFAIRsharing_attributes.metadata.tombstoneFAIRsharing_unique_idre3data_orgIdentifierre3data_repositoryNamere3data_repositoryName.languagere3data_additionalNamere3data_repositoryURLre3data_repositoryIdentifierre3data_repositoryContactre3data_descriptionre3data_description.languagere3data_typere3data_sizere3data_startDatere3data_endDatere3data_repositoryLanguagere3data_subjectre3data_missionStatementURLre3data_contentTypere3data_providerTypere3data_keywordre3data_institutionre3data_policyre3data_databaseAccessre3data_databaseLicensere3data_dataAccessre3data_dataLicensere3data_dataUploadTypere3data_dataUploadLicensere3data_softwarere3data_versioningre3data_apire3data_pidSystemre3data_citationGuidelineURLre3data_aidSystemre3data_enhancedPublicationre3data_qualityManagementre3data_certificatere3data_metadataStandardre3data_syndicationre3data_remarksre3data_entryDatere3data_lastUpdatere3data_unique_idOpenDOAR_system_metadata.idOpenDOAR_repository_metadata.nameOpenDOAR_repository_metadata.alternativenameOpenDOAR_repository_metadata.urlOpenDOAR_repository_metadata.descriptionOpenDOAR_repository_metadata.typeOpenDOAR_repository_metadata.content_languagesOpenDOAR_system_metadata.date_modifiedOpenDOAR_system_metadata.date_createdOpenDOAR_repository_metadata.content_subjectsOpenDOAR_repository_metadata.content_typesOpenDOAR_organizationOpenDOAR_policy_urlsOpenDOAR_repository_metadata.softwareOpenDOAR_repository_metadata.oai_urlOpenDOAR_system_metadata.publicly_visibleOpenDOAR_repository_metadata.repository_statusOpenDOAR_repository_metadata.fulltext_record_countOpenDOAR_repository_metadata.metadata_record_countOpenDOAR_unique_idroar_eprintidroar_rev_numberroar_eprint_statusroar_useridroar_importidroar_sourceroar_dirro
ar_datestamproar_lastmodroar_status_changedroar_typeroar_succeedsroar_commentaryroar_metadata_visibilityroar_latituderoar_longituderoar_relation_typeroar_relation_uriroar_item_issues_idroar_item_issues_typeroar_item_issues_descriptionroar_item_issues_timestamproar_item_issues_statusroar_item_issues_reported_byroar_item_issues_resolved_byroar_item_issues_commentroar_item_issues_countroar_sword_depositorroar_sword_slugroar_exemplarroar_home_pageroar_titleroar_oai_pmhroar_sword_endpointroar_rss_feedroar_twitter_feedroar_descriptionroar_fulltextroar_open_accessroar_mandateroar_organisation_titleroar_organisation_home_pageroar_location_countryroar_location_cityroar_location_latituderoar_location_longituderoar_softwareroar_geonameroar_versionroar_subjectsroar_dateroar_noteroar_suggestionsroar_activity_lowroar_activity_mediumroar_activity_highroar_recordcountroar_recordhistoryroar_fulltexts_totalroar_fulltexts_docsroar_fulltexts_rtotalroar_fulltexts_rdocsroar_registry_nameroar_registry_idroar_submit_toroar_submitted_to_nameroar_submitted_to_doneroar_webometrics_rankroar_webometrics_sizeroar_webometrics_visibilityroar_webometrics_rich_filesroar_webometrics_scholarroar_monthly_depositsroar_total_depositsroar_associationroar_unique_id
0dedup::001e6d882e54c780ce269d3c46997287https://fairsharing.org/10.25504/FAIRsharing.q...2094RESID Database of Protein ModificationsFAIRsharingFAIRsharing_20942094fairsharing-records2014-11-04T15:23:40.000Z2021-12-06T10:49:03.952Z10.25504/FAIRsharing.qaszjpRESID Database of Protein Modificationsready[{'contact-name': 'John S Garavelli', 'contact...http://pir.georgetown.edu/resid/2094.0The RESID Database of Protein Modifications is...RESID[{'url': 'http://pir.georgetown.edu/resid/faq....NaN[{'url': 'ftp://ftp.pir.georgetown.edu/pir_dat...[{'url': 'https://www.re3data.org/repository/r...[biodbcore-000563, bsg-d000563]Databaseknowledgebase[Life Science][Molecular structure, Small molecule, Structur...[All][][United Kingdom, European Union, Switzerland]FAIRsharing record for: RESID Database of Prot...RESIDhttps://fairsharing.org/10.25504/FAIRsharing.q...10.25504/FAIRsharing.qaszjphttps://creativecommons.org/licenses/by-sa/4.0...This FAIRsharing record describes: The RESID D...[{'id': 334, 'pubmed_id': 12520062, 'title': '...[{'licence-name': 'Open Data Commons (ODC) Pub...NoneNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNFAIRsharing_2094NaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaN
1dedup::001e6d882e54c780ce269d3c46997287re3data::r3d100011306r3d100011306RESID Database of Protein Modificationsre3datare3data_r3d100011306NaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNr3d100011306RESID Database of Protein Modificationseng[]https://pir.georgetown.edu/resid/resid.shtml[FAIRsharing_doi:10.25504/FAIRsharing.qaszjp, ...[\"pirmail@georgetown.edu\"]The RESID Database of Protein Modifications is...eng[disciplinary]{\"size\": \"\", \"updatedp\": \"\"}2014NaN[\"eng\"][{'name': '2 Life Sciences', 'scheme': 'DFG'},...NaN[{'name': 'Images', 'scheme': 'parse'}, {'name...[dataProvider][genomes, life sciences, proteins, proteomes, ...[{'institutionName': 'Georgetown University, M...[{\"policyName\": \"Terms of Use\", \"policyURL\": \"...{\"databaseAccessType\": \"open\", \"databaseAcces...[][{\"dataAccessType\": \"open\", \"dataAccessRestric...[{\"dataLicenseName\": \"Copyrights\", \"dataLicens...closed[][\"unknown\"]yes{\"api\": \"ftp://ftp.pir.georgetown.edu/database...[\"none\"]NaN[]yesunknown[][]{}RESID is covered by Thomson Reuters Data Citat...2014-12-052019-01-17re3data_r3d100011306NaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaN
2dedup::003ab6b40af9b488decea7c582d150a2re3data::r3d100011894r3d100011894Synapsere3datare3data_r3d100011894NaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNr3d100011894Synapseeng[]https://www.synapse.org[FAIRsharing_DOI:10.25504/FAIRsharing.dnxzmk, ...[\"synapseinfo@sagebase.org\"]Synapse is an open source software platform th...eng[other]{\"size\": \"\", \"updatedp\": \"\"}2012-05-22NaN[\"eng\"][{'name': '2 Life Sciences', 'scheme': 'DFG'},...https://sagebionetworks.org/tools_resources/sy...[{'name': 'Raw data', 'scheme': 'parse'}, {'na...[dataProvider, serviceProvider][AMP-AD Knowledge Portal, DREAM Challenges, Gi...[{'institutionName': 'Alfred P. Sloan Foundati...[{\"policyName\": \"Synapse Commons Governance Ov...{\"databaseAccessType\": \"open\", \"databaseAcces...[][{\"dataAccessType\": \"closed\", \"dataAccessRestr...[{\"dataLicenseName\": \"other\", \"dataLicenseURL\"...restricted[][\"unknown\"]yes{\"api\": \"https://docs.synapse.org/rest/\", \"api...[\"DOI\"]NaN[]yesyes[][]{}NaN2015-12-032021-11-16re3data_r3d100011894NaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaN
3dedup::003ab6b40af9b488decea7c582d150a2https://fairsharing.org/10.25504/FAIRsharing.d...2315SynapseFAIRsharingFAIRsharing_23152315fairsharing-records2016-08-02T13:56:30.000Z2021-12-06T10:48:25.700Z10.25504/FAIRsharing.dnxzmkSynapseready[{'contact-name': 'Meredith Slota', 'contact-e...https://www.synapse.org/2315.0Synapse is a collaborative research platform t...Synapse[{'url': 'SynapseInfo@sagebase.org', 'name': '...2010.0[{'url': 'https://www.synapse.org/', 'name': '...[{'url': 'https://www.re3data.org/repository/r...[biodbcore-000791, bsg-d000791]Databaserepository[Data Integration, Data Management, Biomedical...[Experimental measurement, Protocol, Data stor...[All][][United States]FAIRsharing record for: SynapseSynapsehttps://fairsharing.org/10.25504/FAIRsharing.d...10.25504/FAIRsharing.dnxzmkhttps://creativecommons.org/licenses/by-sa/4.0...This FAIRsharing record describes: Synapse is ...[{'id': 2450, 'pubmed_id': 24071850, 'title': ...[{'licence-name': 'Creative Commons Attributio...NoneNaN[{'url': 'https://sage-bionetworks.github.io/r...NaNNaNNaNNaNNaNNaN[{'url': 'http://rest-docs.synapse.org/rest/',...NaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNFAIRsharing_2315NaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaN
4dedup::0048f2e3aa55ab88aaaac0cfa4153ad5opendoar::45624562erzincan binali yıldırım university institutio...OpenDOAROpenDOAR_4562NaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaN4562{\"name\": \"erzincan binali y\\u0131ld\\u0131r\\u01...[]http://earsiv.erzincan.edu.trNaNinstitutional[]2022-01-12 15:36:062019-04-24 09:06:10[social sciences][journal_articles][{'name': 'erzincan binali yıldırım university...[]{\"name\": \"dspace\", \"version\": \"\"}http://earsiv.erzincan.edu.tr/oaiyesNaNNaNNaNOpenDOAR_4562NaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaN
\n", "
" ], "text/plain": [ " dedup_id \\\n", "0 dedup::001e6d882e54c780ce269d3c46997287 \n", "1 dedup::001e6d882e54c780ce269d3c46997287 \n", "2 dedup::003ab6b40af9b488decea7c582d150a2 \n", "3 dedup::003ab6b40af9b488decea7c582d150a2 \n", "4 dedup::0048f2e3aa55ab88aaaac0cfa4153ad5 \n", "\n", " duplicate_id original_id \\\n", "0 https://fairsharing.org/10.25504/FAIRsharing.q... 2094 \n", "1 re3data::r3d100011306 r3d100011306 \n", "2 re3data::r3d100011894 r3d100011894 \n", "3 https://fairsharing.org/10.25504/FAIRsharing.d... 2315 \n", "4 opendoar::4562 4562 \n", "\n", " name source \\\n", "0 RESID Database of Protein Modifications FAIRsharing \n", "1 RESID Database of Protein Modifications re3data \n", "2 Synapse re3data \n", "3 Synapse FAIRsharing \n", "4 erzincan binali yıldırım university institutio... OpenDOAR \n", "\n", " unique_id FAIRsharing_id FAIRsharing_type \\\n", "0 FAIRsharing_2094 2094 fairsharing-records \n", "1 re3data_r3d100011306 NaN NaN \n", "2 re3data_r3d100011894 NaN NaN \n", "3 FAIRsharing_2315 2315 fairsharing-records \n", "4 OpenDOAR_4562 NaN NaN \n", "\n", " FAIRsharing_attributes.created-at FAIRsharing_attributes.updated-at \\\n", "0 2014-11-04T15:23:40.000Z 2021-12-06T10:49:03.952Z \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 2016-08-02T13:56:30.000Z 2021-12-06T10:48:25.700Z \n", "4 NaN NaN \n", "\n", " FAIRsharing_attributes.metadata.doi \\\n", "0 10.25504/FAIRsharing.qaszjp \n", "1 NaN \n", "2 NaN \n", "3 10.25504/FAIRsharing.dnxzmk \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.name \\\n", "0 RESID Database of Protein Modifications \n", "1 NaN \n", "2 NaN \n", "3 Synapse \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.status \\\n", "0 ready \n", "1 NaN \n", "2 NaN \n", "3 ready \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.contacts \\\n", "0 [{'contact-name': 'John S Garavelli', 'contact... \n", "1 NaN \n", "2 NaN \n", "3 [{'contact-name': 'Meredith Slota', 'contact-e... 
\n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.homepage \\\n", "0 http://pir.georgetown.edu/resid/ \n", "1 NaN \n", "2 NaN \n", "3 https://www.synapse.org/ \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.identifier \\\n", "0 2094.0 \n", "1 NaN \n", "2 NaN \n", "3 2315.0 \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.description \\\n", "0 The RESID Database of Protein Modifications is... \n", "1 NaN \n", "2 NaN \n", "3 Synapse is a collaborative research platform t... \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.abbreviation \\\n", "0 RESID \n", "1 NaN \n", "2 NaN \n", "3 Synapse \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.support-links \\\n", "0 [{'url': 'http://pir.georgetown.edu/resid/faq.... \n", "1 NaN \n", "2 NaN \n", "3 [{'url': 'SynapseInfo@sagebase.org', 'name': '... \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.year-creation \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 2010.0 \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.data-processes \\\n", "0 [{'url': 'ftp://ftp.pir.georgetown.edu/pir_dat... \n", "1 NaN \n", "2 NaN \n", "3 [{'url': 'https://www.synapse.org/', 'name': '... \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.cross-references \\\n", "0 [{'url': 'https://www.re3data.org/repository/r... \n", "1 NaN \n", "2 NaN \n", "3 [{'url': 'https://www.re3data.org/repository/r... \n", "4 NaN \n", "\n", " FAIRsharing_attributes.legacy-ids \\\n", "0 [biodbcore-000563, bsg-d000563] \n", "1 NaN \n", "2 NaN \n", "3 [biodbcore-000791, bsg-d000791] \n", "4 NaN \n", "\n", " FAIRsharing_attributes.fairsharing-registry \\\n", "0 Database \n", "1 NaN \n", "2 NaN \n", "3 Database \n", "4 NaN \n", "\n", " FAIRsharing_attributes.record-type \\\n", "0 knowledgebase \n", "1 NaN \n", "2 NaN \n", "3 repository \n", "4 NaN \n", "\n", " FAIRsharing_attributes.subjects \\\n", "0 [Life Science] \n", "1 NaN \n", "2 NaN \n", "3 [Data Integration, Data Management, Biomedical... 
\n", "4 NaN \n", "\n", " FAIRsharing_attributes.domains \\\n", "0 [Molecular structure, Small molecule, Structur... \n", "1 NaN \n", "2 NaN \n", "3 [Experimental measurement, Protocol, Data stor... \n", "4 NaN \n", "\n", " FAIRsharing_attributes.taxonomies FAIRsharing_attributes.user-defined-tags \\\n", "0 [All] [] \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 [All] [] \n", "4 NaN NaN \n", "\n", " FAIRsharing_attributes.countries \\\n", "0 [United Kingdom, European Union, Switzerland] \n", "1 NaN \n", "2 NaN \n", "3 [United States] \n", "4 NaN \n", "\n", " FAIRsharing_attributes.name \\\n", "0 FAIRsharing record for: RESID Database of Prot... \n", "1 NaN \n", "2 NaN \n", "3 FAIRsharing record for: Synapse \n", "4 NaN \n", "\n", " FAIRsharing_attributes.abbreviation \\\n", "0 RESID \n", "1 NaN \n", "2 NaN \n", "3 Synapse \n", "4 NaN \n", "\n", " FAIRsharing_attributes.url \\\n", "0 https://fairsharing.org/10.25504/FAIRsharing.q... \n", "1 NaN \n", "2 NaN \n", "3 https://fairsharing.org/10.25504/FAIRsharing.d... \n", "4 NaN \n", "\n", " FAIRsharing_attributes.doi \\\n", "0 10.25504/FAIRsharing.qaszjp \n", "1 NaN \n", "2 NaN \n", "3 10.25504/FAIRsharing.dnxzmk \n", "4 NaN \n", "\n", " FAIRsharing_attributes.fairsharing-licence \\\n", "0 https://creativecommons.org/licenses/by-sa/4.0... \n", "1 NaN \n", "2 NaN \n", "3 https://creativecommons.org/licenses/by-sa/4.0... \n", "4 NaN \n", "\n", " FAIRsharing_attributes.description \\\n", "0 This FAIRsharing record describes: The RESID D... \n", "1 NaN \n", "2 NaN \n", "3 This FAIRsharing record describes: Synapse is ... \n", "4 NaN \n", "\n", " FAIRsharing_attributes.publications \\\n", "0 [{'id': 334, 'pubmed_id': 12520062, 'title': '... \n", "1 NaN \n", "2 NaN \n", "3 [{'id': 2450, 'pubmed_id': 24071850, 'title': ... \n", "4 NaN \n", "\n", " FAIRsharing_attributes.licence-links \\\n", "0 [{'licence-name': 'Open Data Commons (ODC) Pub... \n", "1 NaN \n", "2 NaN \n", "3 [{'licence-name': 'Creative Commons Attributio... 
\n", "4 NaN \n", "\n", " FAIRsharing_attributes.url-for-logo \\\n", "0 None \n", "1 NaN \n", "2 NaN \n", "3 None \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.citations \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.associated-tools \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 [{'url': 'https://sage-bionetworks.github.io/r... \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.deprecation-reason \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.data-access-condition.type \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.data-contact-information \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.data-deposition-condition.url \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.data-deposition-condition.type \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.deprecation-date \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.access-points \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 [{'url': 'http://rest-docs.synapse.org/rest/',... 
\n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.data-access-condition.url \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.resource-sustainability.url \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.resource-sustainability.name \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.data-preservation-policy.url \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.data-preservation-policy.name \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.data-access-for-pre-publication-review \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.data-versioning \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.data-curation.type \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.data-curation.url \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.citation-to-related-publications \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.tombstone FAIRsharing_unique_id \\\n", "0 NaN FAIRsharing_2094 \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN FAIRsharing_2315 \n", "4 NaN NaN \n", "\n", " re3data_orgIdentifier re3data_repositoryName \\\n", "0 NaN NaN \n", "1 r3d100011306 RESID Database of Protein Modifications \n", "2 r3d100011894 Synapse \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " re3data_repositoryName.language re3data_additionalName \\\n", "0 NaN NaN \n", "1 eng [] \n", "2 eng [] \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " re3data_repositoryURL \\\n", "0 NaN \n", "1 https://pir.georgetown.edu/resid/resid.shtml \n", "2 
https://www.synapse.org \n", "3 NaN \n", "4 NaN \n", "\n", " re3data_repositoryIdentifier \\\n", "0 NaN \n", "1 [FAIRsharing_doi:10.25504/FAIRsharing.qaszjp, ... \n", "2 [FAIRsharing_DOI:10.25504/FAIRsharing.dnxzmk, ... \n", "3 NaN \n", "4 NaN \n", "\n", " re3data_repositoryContact \\\n", "0 NaN \n", "1 [\"pirmail@georgetown.edu\"] \n", "2 [\"synapseinfo@sagebase.org\"] \n", "3 NaN \n", "4 NaN \n", "\n", " re3data_description \\\n", "0 NaN \n", "1 The RESID Database of Protein Modifications is... \n", "2 Synapse is an open source software platform th... \n", "3 NaN \n", "4 NaN \n", "\n", " re3data_description.language re3data_type re3data_size \\\n", "0 NaN NaN NaN \n", "1 eng [disciplinary] {\"size\": \"\", \"updatedp\": \"\"} \n", "2 eng [other] {\"size\": \"\", \"updatedp\": \"\"} \n", "3 NaN NaN NaN \n", "4 NaN NaN NaN \n", "\n", " re3data_startDate re3data_endDate re3data_repositoryLanguage \\\n", "0 NaN NaN NaN \n", "1 2014 NaN [\"eng\"] \n", "2 2012-05-22 NaN [\"eng\"] \n", "3 NaN NaN NaN \n", "4 NaN NaN NaN \n", "\n", " re3data_subject \\\n", "0 NaN \n", "1 [{'name': '2 Life Sciences', 'scheme': 'DFG'},... \n", "2 [{'name': '2 Life Sciences', 'scheme': 'DFG'},... \n", "3 NaN \n", "4 NaN \n", "\n", " re3data_missionStatementURL \\\n", "0 NaN \n", "1 NaN \n", "2 https://sagebionetworks.org/tools_resources/sy... \n", "3 NaN \n", "4 NaN \n", "\n", " re3data_contentType \\\n", "0 NaN \n", "1 [{'name': 'Images', 'scheme': 'parse'}, {'name... \n", "2 [{'name': 'Raw data', 'scheme': 'parse'}, {'na... \n", "3 NaN \n", "4 NaN \n", "\n", " re3data_providerType \\\n", "0 NaN \n", "1 [dataProvider] \n", "2 [dataProvider, serviceProvider] \n", "3 NaN \n", "4 NaN \n", "\n", " re3data_keyword \\\n", "0 NaN \n", "1 [genomes, life sciences, proteins, proteomes, ... \n", "2 [AMP-AD Knowledge Portal, DREAM Challenges, Gi... \n", "3 NaN \n", "4 NaN \n", "\n", " re3data_institution \\\n", "0 NaN \n", "1 [{'institutionName': 'Georgetown University, M... 
\n", "2 [{'institutionName': 'Alfred P. Sloan Foundati... \n", "3 NaN \n", "4 NaN \n", "\n", " re3data_policy \\\n", "0 NaN \n", "1 [{\"policyName\": \"Terms of Use\", \"policyURL\": \"... \n", "2 [{\"policyName\": \"Synapse Commons Governance Ov... \n", "3 NaN \n", "4 NaN \n", "\n", " re3data_databaseAccess re3data_databaseLicense \\\n", "0 NaN NaN \n", "1 {\"databaseAccessType\": \"open\", \"databaseAcces... [] \n", "2 {\"databaseAccessType\": \"open\", \"databaseAcces... [] \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " re3data_dataAccess \\\n", "0 NaN \n", "1 [{\"dataAccessType\": \"open\", \"dataAccessRestric... \n", "2 [{\"dataAccessType\": \"closed\", \"dataAccessRestr... \n", "3 NaN \n", "4 NaN \n", "\n", " re3data_dataLicense re3data_dataUploadType \\\n", "0 NaN NaN \n", "1 [{\"dataLicenseName\": \"Copyrights\", \"dataLicens... closed \n", "2 [{\"dataLicenseName\": \"other\", \"dataLicenseURL\"... restricted \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " re3data_dataUploadLicense re3data_software re3data_versioning \\\n", "0 NaN NaN NaN \n", "1 [] [\"unknown\"] yes \n", "2 [] [\"unknown\"] yes \n", "3 NaN NaN NaN \n", "4 NaN NaN NaN \n", "\n", " re3data_api re3data_pidSystem \\\n", "0 NaN NaN \n", "1 {\"api\": \"ftp://ftp.pir.georgetown.edu/database... [\"none\"] \n", "2 {\"api\": \"https://docs.synapse.org/rest/\", \"api... [\"DOI\"] \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " re3data_citationGuidelineURL re3data_aidSystem re3data_enhancedPublication \\\n", "0 NaN NaN NaN \n", "1 NaN [] yes \n", "2 NaN [] yes \n", "3 NaN NaN NaN \n", "4 NaN NaN NaN \n", "\n", " re3data_qualityManagement re3data_certificate re3data_metadataStandard \\\n", "0 NaN NaN NaN \n", "1 unknown [] [] \n", "2 yes [] [] \n", "3 NaN NaN NaN \n", "4 NaN NaN NaN \n", "\n", " re3data_syndication re3data_remarks \\\n", "0 NaN NaN \n", "1 {} RESID is covered by Thomson Reuters Data Citat... 
\n", "2 {} NaN \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " re3data_entryDate re3data_lastUpdate re3data_unique_id \\\n", "0 NaN NaN NaN \n", "1 2014-12-05 2019-01-17 re3data_r3d100011306 \n", "2 2015-12-03 2021-11-16 re3data_r3d100011894 \n", "3 NaN NaN NaN \n", "4 NaN NaN NaN \n", "\n", " OpenDOAR_system_metadata.id \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 4562 \n", "\n", " OpenDOAR_repository_metadata.name \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 {\"name\": \"erzincan binali y\\u0131ld\\u0131r\\u01... \n", "\n", " OpenDOAR_repository_metadata.alternativename \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 [] \n", "\n", " OpenDOAR_repository_metadata.url OpenDOAR_repository_metadata.description \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 http://earsiv.erzincan.edu.tr NaN \n", "\n", " OpenDOAR_repository_metadata.type \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 institutional \n", "\n", " OpenDOAR_repository_metadata.content_languages \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 [] \n", "\n", " OpenDOAR_system_metadata.date_modified \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 2022-01-12 15:36:06 \n", "\n", " OpenDOAR_system_metadata.date_created \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 2019-04-24 09:06:10 \n", "\n", " OpenDOAR_repository_metadata.content_subjects \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 [social sciences] \n", "\n", " OpenDOAR_repository_metadata.content_types \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 [journal_articles] \n", "\n", " OpenDOAR_organization OpenDOAR_policy_urls \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 [{'name': 'erzincan binali yıldırım university... 
[] \n", "\n", " OpenDOAR_repository_metadata.software OpenDOAR_repository_metadata.oai_url \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 {\"name\": \"dspace\", \"version\": \"\"} http://earsiv.erzincan.edu.tr/oai \n", "\n", " OpenDOAR_system_metadata.publicly_visible \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 yes \n", "\n", " OpenDOAR_repository_metadata.repository_status \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " OpenDOAR_repository_metadata.fulltext_record_count \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " OpenDOAR_repository_metadata.metadata_record_count OpenDOAR_unique_id \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN OpenDOAR_4562 \n", "\n", " roar_eprintid roar_rev_number roar_eprint_status roar_userid roar_importid \\\n", "0 NaN NaN NaN NaN NaN \n", "1 NaN NaN NaN NaN NaN \n", "2 NaN NaN NaN NaN NaN \n", "3 NaN NaN NaN NaN NaN \n", "4 NaN NaN NaN NaN NaN \n", "\n", " roar_source roar_dir roar_datestamp roar_lastmod roar_status_changed \\\n", "0 NaN NaN NaN NaN NaN \n", "1 NaN NaN NaN NaN NaN \n", "2 NaN NaN NaN NaN NaN \n", "3 NaN NaN NaN NaN NaN \n", "4 NaN NaN NaN NaN NaN \n", "\n", " roar_type roar_succeeds roar_commentary roar_metadata_visibility \\\n", "0 NaN NaN NaN NaN \n", "1 NaN NaN NaN NaN \n", "2 NaN NaN NaN NaN \n", "3 NaN NaN NaN NaN \n", "4 NaN NaN NaN NaN \n", "\n", " roar_latitude roar_longitude roar_relation_type roar_relation_uri \\\n", "0 NaN NaN NaN NaN \n", "1 NaN NaN NaN NaN \n", "2 NaN NaN NaN NaN \n", "3 NaN NaN NaN NaN \n", "4 NaN NaN NaN NaN \n", "\n", " roar_item_issues_id roar_item_issues_type roar_item_issues_description \\\n", "0 NaN NaN NaN \n", "1 NaN NaN NaN \n", "2 NaN NaN NaN \n", "3 NaN NaN NaN \n", "4 NaN NaN NaN \n", "\n", " roar_item_issues_timestamp roar_item_issues_status \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " 
roar_item_issues_reported_by roar_item_issues_resolved_by \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " roar_item_issues_comment roar_item_issues_count roar_sword_depositor \\\n", "0 NaN NaN NaN \n", "1 NaN NaN NaN \n", "2 NaN NaN NaN \n", "3 NaN NaN NaN \n", "4 NaN NaN NaN \n", "\n", " roar_sword_slug roar_exemplar roar_home_page roar_title roar_oai_pmh \\\n", "0 NaN NaN NaN NaN NaN \n", "1 NaN NaN NaN NaN NaN \n", "2 NaN NaN NaN NaN NaN \n", "3 NaN NaN NaN NaN NaN \n", "4 NaN NaN NaN NaN NaN \n", "\n", " roar_sword_endpoint roar_rss_feed roar_twitter_feed roar_description \\\n", "0 NaN NaN NaN NaN \n", "1 NaN NaN NaN NaN \n", "2 NaN NaN NaN NaN \n", "3 NaN NaN NaN NaN \n", "4 NaN NaN NaN NaN \n", "\n", " roar_fulltext roar_open_access roar_mandate roar_organisation_title \\\n", "0 NaN NaN NaN NaN \n", "1 NaN NaN NaN NaN \n", "2 NaN NaN NaN NaN \n", "3 NaN NaN NaN NaN \n", "4 NaN NaN NaN NaN \n", "\n", " roar_organisation_home_page roar_location_country roar_location_city \\\n", "0 NaN NaN NaN \n", "1 NaN NaN NaN \n", "2 NaN NaN NaN \n", "3 NaN NaN NaN \n", "4 NaN NaN NaN \n", "\n", " roar_location_latitude roar_location_longitude roar_software roar_geoname \\\n", "0 NaN NaN NaN NaN \n", "1 NaN NaN NaN NaN \n", "2 NaN NaN NaN NaN \n", "3 NaN NaN NaN NaN \n", "4 NaN NaN NaN NaN \n", "\n", " roar_version roar_subjects roar_date roar_note roar_suggestions \\\n", "0 NaN NaN NaN NaN NaN \n", "1 NaN NaN NaN NaN NaN \n", "2 NaN NaN NaN NaN NaN \n", "3 NaN NaN NaN NaN NaN \n", "4 NaN NaN NaN NaN NaN \n", "\n", " roar_activity_low roar_activity_medium roar_activity_high roar_recordcount \\\n", "0 NaN NaN NaN NaN \n", "1 NaN NaN NaN NaN \n", "2 NaN NaN NaN NaN \n", "3 NaN NaN NaN NaN \n", "4 NaN NaN NaN NaN \n", "\n", " roar_recordhistory roar_fulltexts_total roar_fulltexts_docs \\\n", "0 NaN NaN NaN \n", "1 NaN NaN NaN \n", "2 NaN NaN NaN \n", "3 NaN NaN NaN \n", "4 NaN NaN NaN \n", "\n", " roar_fulltexts_rtotal 
roar_fulltexts_rdocs roar_registry_name \\\n", "0 NaN NaN NaN \n", "1 NaN NaN NaN \n", "2 NaN NaN NaN \n", "3 NaN NaN NaN \n", "4 NaN NaN NaN \n", "\n", " roar_registry_id roar_submit_to roar_submitted_to_name \\\n", "0 NaN NaN NaN \n", "1 NaN NaN NaN \n", "2 NaN NaN NaN \n", "3 NaN NaN NaN \n", "4 NaN NaN NaN \n", "\n", " roar_submitted_to_done roar_webometrics_rank roar_webometrics_size \\\n", "0 NaN NaN NaN \n", "1 NaN NaN NaN \n", "2 NaN NaN NaN \n", "3 NaN NaN NaN \n", "4 NaN NaN NaN \n", "\n", " roar_webometrics_visibility roar_webometrics_rich_files \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " roar_webometrics_scholar roar_monthly_deposits roar_total_deposits \\\n", "0 NaN NaN NaN \n", "1 NaN NaN NaN \n", "2 NaN NaN NaN \n", "3 NaN NaN NaN \n", "4 NaN NaN NaN \n", "\n", " roar_association roar_unique_id \n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN NaN " ] }, "execution_count": 35, "metadata": {}, "output_type": "execute_result" } ], "source": [ "dup_across = dup_across.merge(fairsharing_df, left_on='unique_id', right_on='FAIRsharing_unique_id', how='left')\n", "dup_across = dup_across.merge(re3data_df, left_on='unique_id', right_on='re3data_unique_id', how='left')\n", "dup_across = dup_across.merge(opendoar_df, left_on='unique_id', right_on='OpenDOAR_unique_id', how='left')\n", "dup_across = dup_across.merge(roar_df, left_on='unique_id', right_on='roar_unique_id', how='left')\n", "dup_across.head()" ] }, { "cell_type": "code", "execution_count": 36, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
dedup_idduplicate_idoriginal_idnamesourceunique_idFAIRsharing_idFAIRsharing_typeFAIRsharing_attributes.created-atFAIRsharing_attributes.updated-atFAIRsharing_attributes.metadata.doiFAIRsharing_attributes.metadata.nameFAIRsharing_attributes.metadata.statusFAIRsharing_attributes.metadata.contactsFAIRsharing_attributes.metadata.homepageFAIRsharing_attributes.metadata.identifierFAIRsharing_attributes.metadata.descriptionFAIRsharing_attributes.metadata.abbreviationFAIRsharing_attributes.metadata.support-linksFAIRsharing_attributes.metadata.year-creationFAIRsharing_attributes.metadata.data-processesFAIRsharing_attributes.metadata.cross-referencesFAIRsharing_attributes.legacy-idsFAIRsharing_attributes.fairsharing-registryFAIRsharing_attributes.record-typeFAIRsharing_attributes.subjectsFAIRsharing_attributes.domainsFAIRsharing_attributes.taxonomiesFAIRsharing_attributes.user-defined-tagsFAIRsharing_attributes.countriesFAIRsharing_attributes.nameFAIRsharing_attributes.abbreviationFAIRsharing_attributes.urlFAIRsharing_attributes.doiFAIRsharing_attributes.fairsharing-licenceFAIRsharing_attributes.descriptionFAIRsharing_attributes.publicationsFAIRsharing_attributes.licence-linksFAIRsharing_attributes.url-for-logoFAIRsharing_attributes.metadata.citationsFAIRsharing_attributes.metadata.associated-toolsFAIRsharing_attributes.metadata.deprecation-reasonFAIRsharing_attributes.metadata.data-access-condition.typeFAIRsharing_attributes.metadata.data-contact-informationFAIRsharing_attributes.metadata.data-deposition-condition.urlFAIRsharing_attributes.metadata.data-deposition-condition.typeFAIRsharing_attributes.metadata.deprecation-dateFAIRsharing_attributes.metadata.access-pointsFAIRsharing_attributes.metadata.data-access-condition.urlFAIRsharing_attributes.metadata.resource-sustainability.urlFAIRsharing_attributes.metadata.resource-sustainability.nameFAIRsharing_attributes.metadata.data-preservation-policy.urlFAIRsharing_attributes.metadata.data-preservation-policy.nameFAIRsharing_at
tributes.metadata.data-access-for-pre-publication-reviewFAIRsharing_attributes.metadata.data-versioningFAIRsharing_attributes.metadata.data-curation.typeFAIRsharing_attributes.metadata.data-curation.urlFAIRsharing_attributes.metadata.citation-to-related-publicationsFAIRsharing_attributes.metadata.tombstoneFAIRsharing_unique_idre3data_orgIdentifierre3data_repositoryNamere3data_repositoryName.languagere3data_additionalNamere3data_repositoryURLre3data_repositoryIdentifierre3data_repositoryContactre3data_descriptionre3data_description.languagere3data_typere3data_sizere3data_startDatere3data_endDatere3data_repositoryLanguagere3data_subjectre3data_missionStatementURLre3data_contentTypere3data_providerTypere3data_keywordre3data_institutionre3data_policyre3data_databaseAccessre3data_databaseLicensere3data_dataAccessre3data_dataLicensere3data_dataUploadTypere3data_dataUploadLicensere3data_softwarere3data_versioningre3data_apire3data_pidSystemre3data_citationGuidelineURLre3data_aidSystemre3data_enhancedPublicationre3data_qualityManagementre3data_certificatere3data_metadataStandardre3data_syndicationre3data_remarksre3data_entryDatere3data_lastUpdatere3data_unique_idOpenDOAR_system_metadata.idOpenDOAR_repository_metadata.nameOpenDOAR_repository_metadata.alternativenameOpenDOAR_repository_metadata.urlOpenDOAR_repository_metadata.descriptionOpenDOAR_repository_metadata.typeOpenDOAR_repository_metadata.content_languagesOpenDOAR_system_metadata.date_modifiedOpenDOAR_system_metadata.date_createdOpenDOAR_repository_metadata.content_subjectsOpenDOAR_repository_metadata.content_typesOpenDOAR_organizationOpenDOAR_policy_urlsOpenDOAR_repository_metadata.softwareOpenDOAR_repository_metadata.oai_urlOpenDOAR_system_metadata.publicly_visibleOpenDOAR_repository_metadata.repository_statusOpenDOAR_repository_metadata.fulltext_record_countOpenDOAR_repository_metadata.metadata_record_countOpenDOAR_unique_idroar_eprintidroar_rev_numberroar_eprint_statusroar_useridroar_importidroar_sourceroar_dirro
ar_datestamproar_lastmodroar_status_changedroar_typeroar_succeedsroar_commentaryroar_metadata_visibilityroar_latituderoar_longituderoar_relation_typeroar_relation_uriroar_item_issues_idroar_item_issues_typeroar_item_issues_descriptionroar_item_issues_timestamproar_item_issues_statusroar_item_issues_reported_byroar_item_issues_resolved_byroar_item_issues_commentroar_item_issues_countroar_sword_depositorroar_sword_slugroar_exemplarroar_home_pageroar_titleroar_oai_pmhroar_sword_endpointroar_rss_feedroar_twitter_feedroar_descriptionroar_fulltextroar_open_accessroar_mandateroar_organisation_titleroar_organisation_home_pageroar_location_countryroar_location_cityroar_location_latituderoar_location_longituderoar_softwareroar_geonameroar_versionroar_subjectsroar_dateroar_noteroar_suggestionsroar_activity_lowroar_activity_mediumroar_activity_highroar_recordcountroar_recordhistoryroar_fulltexts_totalroar_fulltexts_docsroar_fulltexts_rtotalroar_fulltexts_rdocsroar_registry_nameroar_registry_idroar_submit_toroar_submitted_to_nameroar_submitted_to_doneroar_webometrics_rankroar_webometrics_sizeroar_webometrics_visibilityroar_webometrics_rich_filesroar_webometrics_scholarroar_monthly_depositsroar_total_depositsroar_associationroar_unique_idsource_set
0dedup::07b65089515c8f99812d14bbb01334a6[roar::474, roar::5541][474, 5541][ECNIS Repository (Environmental Cancer Risk, ...[roar, roar][roar_474, roar_5541][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][474, 5541][281, 8][archive, archive][1, 8][nan, nan][nan, nan][disk0/00/00/04/74, disk0/00/00/55/41][2010-01-06 13:44:22, 2012-12-12 01:21:03][2011-07-06 08:19:53, 2012-12-15 02:51:35][2010-01-06 13:44:22, 2012-12-12 01:21:03][other, institutional][nan, nan][nan, nan][show, show][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][0, nan][nan, nan][nan, nan][nan, nan][http://ecnis.openrepository.com/, http://ecni...[ECNIS Repository (Environmental Cancer Risk, ...[nan, nan][nan, nan][nan, nan][nan, nan][This site is a subject specific repository co...[TRUE, nan][TRUE, nan][nan, nan][ECNIS (Environmental 
Cancer Risk, Nutrition a...[http://www.ecnis.org, http://www.ecnis.org/][pl, pl][Lodz, nan][51.8, 51.8][19.5, 19.5][openrepo, nan][geoname_2_PL, geoname_2_PL][other, other][nan, nan][2008-06-03 08:05:43, 2012-07-01 15:13:36][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][opendoar, opendoar][1254, 1254][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][roar_474, roar_5541]{roar}
1dedup::0be44aa69610e09805d4002baf7e0b10[roar::16867, roar::2907][16867, 2907][Chung Shan Medical University Institutional R...[roar, roar][roar_16867, roar_2907][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][16867, 2907][3, 548][archive, archive][360, 360][nan, nan][nan, nan][disk0/00/01/68/67, disk0/00/00/29/07][2021-02-25 13:06:19, 2010-07-29 01:40:55][2021-02-25 13:06:19, 2021-02-17 06:33:34][2021-02-25 13:06:19, 2010-07-29 01:40:55][institutional, institutional][2907, nan][nan, nan][show, no_search][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][0, 0][nan, nan][nan, nan][nan, nan][https://ir.csmu.edu.tw:8080, https://ir.csmu....[Chung Shan Medical University Institutional R...[https://ir.csmu.edu.tw:8080/ir-oai/request?ve...[nan, nan][nan, nan][nan, nan][nan, nan][TRUE, TRUE][TRUE, TRUE][FALSE, 
FALSE][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][dspace, dspace][nan, nan][other, other][[RT, RC0254, RC1200, R1, RK], [RC0321, RT, RC...[2009-10-21 00:00:00, 2009-10-21 00:00:00][nan, nan][nan, nan][0, 0][0, 0][0, 0][100, 100][0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,2...[nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][celestial, celestial][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][roar_16867, roar_2907]{roar}
2dedup::0c34770edc42a1d2ac361b64cfabfb63[roar::5432, roar::4030][5432, 4030][Digital Library of Jelenia Góra, Digital Libr...[roar, roar][roar_5432, roar_4030][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][5432, 4030][9, 12][archive, archive][8, 8][nan, nan][nan, nan][disk0/00/00/54/32, disk0/00/00/40/30][2012-11-19 20:28:01, 2011-08-02 23:17:15][2012-11-26 06:53:38, 2012-02-06 06:58:00][2012-11-19 20:28:01, 2011-08-02 23:17:15][institutional, institutional][nan, nan][nan, nan][show, show][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][http://jbc.jelenia-gora.pl/dlibra.html, http:...[Digital Library of Jelenia Góra, Digital Libr...[http://jbc.jelenia-gora.pl/dlibra/oai-pmh-rep...[nan, nan][nan, nan][nan, nan][Users may set up RSS feeds to be alerted to n...[nan, 
nan][nan, nan][nan, nan][Jeleniogórskie Centrum Informacji i Edukacji ...[http://biblioteka.jelenia-gora.pl/, http://bi...[pl, pl][nan, nan][50.9012, 50.9012][15.7341, 15.7341][nan, nan][geoname_2_PL, geoname_2_PL][other, other][nan, nan][2012-07-01 15:12:22, 2009-10-21 11:09:50][nan, nan][nan, nan][0, 0][0, 0][0, 0][20, 20][0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1...[nan, nan][nan, nan][nan, nan][nan, nan][[celestial, opendoar], [celestial, opendoar]][[4595, 2211], [4595, 2211]][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][roar_5432, roar_4030]{roar}
3dedup::0c6ed4b110c461d9350bf5c620bc78d7[roar::3020, roar::3401, roar::5252][3020, 3401, 5252][KCE Repository, KCE Repository, KCE Repository][roar, roar, roar][roar_3020, roar_3401, roar_5252][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][3020, 3401, 5252][260, 82, 10][archive, archive, archive][8, 8, 
8][nan, nan, nan][nan, nan, nan][disk0/00/00/30/20, disk0/00/00/34/01, disk0/0...[2010-09-13 09:52:23, 2010-12-20 21:30:30, 201...[2016-04-17 21:53:51, 2016-04-17 21:51:59, 201...[2010-09-13 09:52:22, 2010-12-20 21:30:30, 201...[other, other, other][nan, nan, nan][nan, nan, nan][show, show, show][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][0, 0, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][http://kce.docressources.info/opac/index.php?...[KCE Repository, KCE Repository, KCE Repository][http://kce.docressources.info/ws/PMBWs_2, htt...[nan, nan, nan][nan, nan, nan][nan, nan, nan][This site provides access to the publication ...[nan, nan, nan][nan, nan, nan][nan, nan, nan][Belgian Health Care Knowledge Centre, Belgian...[http://www.kce.fgov.be/, http://www.kce.fgov....[be, be, be][nan, nan, nan][50.8463, 50.8463, 50.8463][4.3547, 4.3547, 4.3547][nan, nan, nan][nan, nan, geoname_2_BE][other, other, other][nan, nan, nan][2009-01-19 09:04:11, 2009-01-19 09:04:11, 201...[nan, nan, nan][nan, nan, nan][0, 0, 0][0, 0, 0][0, 0, 0][250, 250, 250][0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,2...[nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][[celestial, opendoar], [celestial, opendoar],...[[2246, 1879], [2246, 1879], [2246, 1879]][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0...[909, 909, 909][nan, nan, nan][roar_3020, roar_3401, roar_5252]{roar}
4dedup::0e3c63baca694032044bbb00c2f1111e[roar::8405, roar::8716][8405, 8716][Content Pro IRX, Content Pro IRX][roar, roar][roar_8405, roar_8716][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][8405, 8716][17, 12][archive, archive][5386, 5386][nan, nan][nan, nan][disk0/00/00/84/05, disk0/00/00/87/16][2014-06-24 10:13:16, 2014-10-08 18:39:33][2014-06-28 01:36:04, 2014-10-11 01:36:34][2014-06-24 10:13:16, 2014-10-08 18:39:33][institutional, institutional][nan, nan][nan, nan][show, show][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][http://encore.tut.ac.za/iii/cpro, http://enco...[Content Pro IRX, Content Pro IRX][nan, http://encore.tut.ac.za/iii/oairep/OAIRe...[http://encore.tut.ac.za/iii/cpro/, nan][nan, nan][nan, nan][Tshwane University of Technology Digital 
Open...[TRUE, TRUE][TRUE, TRUE][TRUE, FALSE][Tshwane University of Technology, Tshwane Uni...[http://lib.tut.ac.za, http://tut.ac.za][za, za][Pretoria, Pretoria][-25, 25][28, 28][other, nan][geoname_2_ZA, geoname_2_ZA][other, other][nan, nan][2014-05-26 13:47:54, 2014-07-24 06:31:10][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][opendoar, celestial][3078, 5657][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][roar_8405, roar_8716]{roar}
\n", "
" ], "text/plain": [ " dedup_id \\\n", "0 dedup::07b65089515c8f99812d14bbb01334a6 \n", "1 dedup::0be44aa69610e09805d4002baf7e0b10 \n", "2 dedup::0c34770edc42a1d2ac361b64cfabfb63 \n", "3 dedup::0c6ed4b110c461d9350bf5c620bc78d7 \n", "4 dedup::0e3c63baca694032044bbb00c2f1111e \n", "\n", " duplicate_id original_id \\\n", "0 [roar::474, roar::5541] [474, 5541] \n", "1 [roar::16867, roar::2907] [16867, 2907] \n", "2 [roar::5432, roar::4030] [5432, 4030] \n", "3 [roar::3020, roar::3401, roar::5252] [3020, 3401, 5252] \n", "4 [roar::8405, roar::8716] [8405, 8716] \n", "\n", " name source \\\n", "0 [ECNIS Repository (Environmental Cancer Risk, ... [roar, roar] \n", "1 [Chung Shan Medical University Institutional R... [roar, roar] \n", "2 [Digital Library of Jelenia Góra, Digital Libr... [roar, roar] \n", "3 [KCE Repository, KCE Repository, KCE Repository] [roar, roar, roar] \n", "4 [Content Pro IRX, Content Pro IRX] [roar, roar] \n", "\n", " unique_id FAIRsharing_id FAIRsharing_type \\\n", "0 [roar_474, roar_5541] [nan, nan] [nan, nan] \n", "1 [roar_16867, roar_2907] [nan, nan] [nan, nan] \n", "2 [roar_5432, roar_4030] [nan, nan] [nan, nan] \n", "3 [roar_3020, roar_3401, roar_5252] [nan, nan, nan] [nan, nan, nan] \n", "4 [roar_8405, roar_8716] [nan, nan] [nan, nan] \n", "\n", " FAIRsharing_attributes.created-at FAIRsharing_attributes.updated-at \\\n", "0 [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] \n", "2 [nan, nan] [nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan] [nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.doi FAIRsharing_attributes.metadata.name \\\n", "0 [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] \n", "2 [nan, nan] [nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan] [nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.status \\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 [nan, nan] \n", "3 [nan, nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.contacts \\\n", "0 [nan, nan] 
\n", "1 [nan, nan] \n", "2 [nan, nan] \n", "3 [nan, nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.homepage \\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 [nan, nan] \n", "3 [nan, nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.identifier \\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 [nan, nan] \n", "3 [nan, nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.description \\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 [nan, nan] \n", "3 [nan, nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.abbreviation \\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 [nan, nan] \n", "3 [nan, nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.support-links \\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 [nan, nan] \n", "3 [nan, nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.year-creation \\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 [nan, nan] \n", "3 [nan, nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.data-processes \\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 [nan, nan] \n", "3 [nan, nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.cross-references \\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 [nan, nan] \n", "3 [nan, nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.legacy-ids \\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 [nan, nan] \n", "3 [nan, nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.fairsharing-registry \\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 [nan, nan] \n", "3 [nan, nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.record-type FAIRsharing_attributes.subjects \\\n", "0 [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] \n", "2 [nan, nan] [nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan] [nan, nan] \n", "\n", " FAIRsharing_attributes.domains FAIRsharing_attributes.taxonomies \\\n", "0 
[nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] \n", "2 [nan, nan] [nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan] [nan, nan] \n", "\n", " FAIRsharing_attributes.user-defined-tags FAIRsharing_attributes.countries \\\n", "0 [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] \n", "2 [nan, nan] [nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan] [nan, nan] \n", "\n", " FAIRsharing_attributes.name FAIRsharing_attributes.abbreviation \\\n", "0 [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] \n", "2 [nan, nan] [nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan] [nan, nan] \n", "\n", " FAIRsharing_attributes.url FAIRsharing_attributes.doi \\\n", "0 [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] \n", "2 [nan, nan] [nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan] [nan, nan] \n", "\n", " FAIRsharing_attributes.fairsharing-licence \\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 [nan, nan] \n", "3 [nan, nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.description FAIRsharing_attributes.publications \\\n", "0 [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] \n", "2 [nan, nan] [nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan] [nan, nan] \n", "\n", " FAIRsharing_attributes.licence-links FAIRsharing_attributes.url-for-logo \\\n", "0 [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] \n", "2 [nan, nan] [nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan] [nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.citations \\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 [nan, nan] \n", "3 [nan, nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.associated-tools \\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 [nan, nan] \n", "3 [nan, nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.deprecation-reason \\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 [nan, nan] \n", "3 [nan, nan, nan] \n", "4 
[nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.data-access-condition.type \\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 [nan, nan] \n", "3 [nan, nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.data-contact-information \\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 [nan, nan] \n", "3 [nan, nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.data-deposition-condition.url \\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 [nan, nan] \n", "3 [nan, nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.data-deposition-condition.type \\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 [nan, nan] \n", "3 [nan, nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.deprecation-date \\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 [nan, nan] \n", "3 [nan, nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.access-points \\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 [nan, nan] \n", "3 [nan, nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.data-access-condition.url \\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 [nan, nan] \n", "3 [nan, nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.resource-sustainability.url \\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 [nan, nan] \n", "3 [nan, nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.resource-sustainability.name \\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 [nan, nan] \n", "3 [nan, nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.data-preservation-policy.url \\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 [nan, nan] \n", "3 [nan, nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.data-preservation-policy.name \\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 [nan, nan] \n", "3 [nan, nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.data-access-for-pre-publication-review 
\\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 [nan, nan] \n", "3 [nan, nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.data-versioning \\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 [nan, nan] \n", "3 [nan, nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.data-curation.type \\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 [nan, nan] \n", "3 [nan, nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.data-curation.url \\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 [nan, nan] \n", "3 [nan, nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.citation-to-related-publications \\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 [nan, nan] \n", "3 [nan, nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.tombstone FAIRsharing_unique_id \\\n", "0 [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] \n", "2 [nan, nan] [nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan] [nan, nan] \n", "\n", " re3data_orgIdentifier re3data_repositoryName \\\n", "0 [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] \n", "2 [nan, nan] [nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan] [nan, nan] \n", "\n", " re3data_repositoryName.language re3data_additionalName \\\n", "0 [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] \n", "2 [nan, nan] [nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan] [nan, nan] \n", "\n", " re3data_repositoryURL re3data_repositoryIdentifier \\\n", "0 [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] \n", "2 [nan, nan] [nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan] [nan, nan] \n", "\n", " re3data_repositoryContact re3data_description re3data_description.language \\\n", "0 [nan, nan] [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] [nan, nan] \n", "2 [nan, nan] [nan, nan] [nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan] [nan, nan] [nan, 
nan] \n", "\n", " re3data_type re3data_size re3data_startDate re3data_endDate \\\n", "0 [nan, nan] [nan, nan] [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] [nan, nan] [nan, nan] \n", "2 [nan, nan] [nan, nan] [nan, nan] [nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan] [nan, nan] [nan, nan] [nan, nan] \n", "\n", " re3data_repositoryLanguage re3data_subject re3data_missionStatementURL \\\n", "0 [nan, nan] [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] [nan, nan] \n", "2 [nan, nan] [nan, nan] [nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan] [nan, nan] [nan, nan] \n", "\n", " re3data_contentType re3data_providerType re3data_keyword \\\n", "0 [nan, nan] [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] [nan, nan] \n", "2 [nan, nan] [nan, nan] [nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan] [nan, nan] [nan, nan] \n", "\n", " re3data_institution re3data_policy re3data_databaseAccess \\\n", "0 [nan, nan] [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] [nan, nan] \n", "2 [nan, nan] [nan, nan] [nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan] [nan, nan] [nan, nan] \n", "\n", " re3data_databaseLicense re3data_dataAccess re3data_dataLicense \\\n", "0 [nan, nan] [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] [nan, nan] \n", "2 [nan, nan] [nan, nan] [nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan] [nan, nan] [nan, nan] \n", "\n", " re3data_dataUploadType re3data_dataUploadLicense re3data_software \\\n", "0 [nan, nan] [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] [nan, nan] \n", "2 [nan, nan] [nan, nan] [nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan] [nan, nan] [nan, nan] \n", "\n", " re3data_versioning re3data_api re3data_pidSystem \\\n", "0 [nan, nan] [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] [nan, nan] 
\n", "2 [nan, nan] [nan, nan] [nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan] [nan, nan] [nan, nan] \n", "\n", " re3data_citationGuidelineURL re3data_aidSystem re3data_enhancedPublication \\\n", "0 [nan, nan] [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] [nan, nan] \n", "2 [nan, nan] [nan, nan] [nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan] [nan, nan] [nan, nan] \n", "\n", " re3data_qualityManagement re3data_certificate re3data_metadataStandard \\\n", "0 [nan, nan] [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] [nan, nan] \n", "2 [nan, nan] [nan, nan] [nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan] [nan, nan] [nan, nan] \n", "\n", " re3data_syndication re3data_remarks re3data_entryDate re3data_lastUpdate \\\n", "0 [nan, nan] [nan, nan] [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] [nan, nan] [nan, nan] \n", "2 [nan, nan] [nan, nan] [nan, nan] [nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan] [nan, nan] [nan, nan] [nan, nan] \n", "\n", " re3data_unique_id OpenDOAR_system_metadata.id \\\n", "0 [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] \n", "2 [nan, nan] [nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan] [nan, nan] \n", "\n", " OpenDOAR_repository_metadata.name \\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 [nan, nan] \n", "3 [nan, nan, nan] \n", "4 [nan, nan] \n", "\n", " OpenDOAR_repository_metadata.alternativename \\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 [nan, nan] \n", "3 [nan, nan, nan] \n", "4 [nan, nan] \n", "\n", " OpenDOAR_repository_metadata.url OpenDOAR_repository_metadata.description \\\n", "0 [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] \n", "2 [nan, nan] [nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan] [nan, nan] \n", "\n", " OpenDOAR_repository_metadata.type \\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 
[nan, nan] \n", "3 [nan, nan, nan] \n", "4 [nan, nan] \n", "\n", " OpenDOAR_repository_metadata.content_languages \\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 [nan, nan] \n", "3 [nan, nan, nan] \n", "4 [nan, nan] \n", "\n", " OpenDOAR_system_metadata.date_modified \\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 [nan, nan] \n", "3 [nan, nan, nan] \n", "4 [nan, nan] \n", "\n", " OpenDOAR_system_metadata.date_created \\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 [nan, nan] \n", "3 [nan, nan, nan] \n", "4 [nan, nan] \n", "\n", " OpenDOAR_repository_metadata.content_subjects \\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 [nan, nan] \n", "3 [nan, nan, nan] \n", "4 [nan, nan] \n", "\n", " OpenDOAR_repository_metadata.content_types OpenDOAR_organization \\\n", "0 [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] \n", "2 [nan, nan] [nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan] [nan, nan] \n", "\n", " OpenDOAR_policy_urls OpenDOAR_repository_metadata.software \\\n", "0 [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] \n", "2 [nan, nan] [nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan] [nan, nan] \n", "\n", " OpenDOAR_repository_metadata.oai_url \\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 [nan, nan] \n", "3 [nan, nan, nan] \n", "4 [nan, nan] \n", "\n", " OpenDOAR_system_metadata.publicly_visible \\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 [nan, nan] \n", "3 [nan, nan, nan] \n", "4 [nan, nan] \n", "\n", " OpenDOAR_repository_metadata.repository_status \\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 [nan, nan] \n", "3 [nan, nan, nan] \n", "4 [nan, nan] \n", "\n", " OpenDOAR_repository_metadata.fulltext_record_count \\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 [nan, nan] \n", "3 [nan, nan, nan] \n", "4 [nan, nan] \n", "\n", " OpenDOAR_repository_metadata.metadata_record_count OpenDOAR_unique_id \\\n", "0 [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] \n", "2 [nan, nan] [nan, nan] \n", "3 [nan, nan, nan] [nan, 
nan, nan] \n", "4 [nan, nan] [nan, nan] \n", "\n", " roar_eprintid roar_rev_number roar_eprint_status \\\n", "0 [474, 5541] [281, 8] [archive, archive] \n", "1 [16867, 2907] [3, 548] [archive, archive] \n", "2 [5432, 4030] [9, 12] [archive, archive] \n", "3 [3020, 3401, 5252] [260, 82, 10] [archive, archive, archive] \n", "4 [8405, 8716] [17, 12] [archive, archive] \n", "\n", " roar_userid roar_importid roar_source \\\n", "0 [1, 8] [nan, nan] [nan, nan] \n", "1 [360, 360] [nan, nan] [nan, nan] \n", "2 [8, 8] [nan, nan] [nan, nan] \n", "3 [8, 8, 8] [nan, nan, nan] [nan, nan, nan] \n", "4 [5386, 5386] [nan, nan] [nan, nan] \n", "\n", " roar_dir \\\n", "0 [disk0/00/00/04/74, disk0/00/00/55/41] \n", "1 [disk0/00/01/68/67, disk0/00/00/29/07] \n", "2 [disk0/00/00/54/32, disk0/00/00/40/30] \n", "3 [disk0/00/00/30/20, disk0/00/00/34/01, disk0/0... \n", "4 [disk0/00/00/84/05, disk0/00/00/87/16] \n", "\n", " roar_datestamp \\\n", "0 [2010-01-06 13:44:22, 2012-12-12 01:21:03] \n", "1 [2021-02-25 13:06:19, 2010-07-29 01:40:55] \n", "2 [2012-11-19 20:28:01, 2011-08-02 23:17:15] \n", "3 [2010-09-13 09:52:23, 2010-12-20 21:30:30, 201... \n", "4 [2014-06-24 10:13:16, 2014-10-08 18:39:33] \n", "\n", " roar_lastmod \\\n", "0 [2011-07-06 08:19:53, 2012-12-15 02:51:35] \n", "1 [2021-02-25 13:06:19, 2021-02-17 06:33:34] \n", "2 [2012-11-26 06:53:38, 2012-02-06 06:58:00] \n", "3 [2016-04-17 21:53:51, 2016-04-17 21:51:59, 201... \n", "4 [2014-06-28 01:36:04, 2014-10-11 01:36:34] \n", "\n", " roar_status_changed \\\n", "0 [2010-01-06 13:44:22, 2012-12-12 01:21:03] \n", "1 [2021-02-25 13:06:19, 2010-07-29 01:40:55] \n", "2 [2012-11-19 20:28:01, 2011-08-02 23:17:15] \n", "3 [2010-09-13 09:52:22, 2010-12-20 21:30:30, 201... 
\n", "4 [2014-06-24 10:13:16, 2014-10-08 18:39:33] \n", "\n", " roar_type roar_succeeds roar_commentary \\\n", "0 [other, institutional] [nan, nan] [nan, nan] \n", "1 [institutional, institutional] [2907, nan] [nan, nan] \n", "2 [institutional, institutional] [nan, nan] [nan, nan] \n", "3 [other, other, other] [nan, nan, nan] [nan, nan, nan] \n", "4 [institutional, institutional] [nan, nan] [nan, nan] \n", "\n", " roar_metadata_visibility roar_latitude roar_longitude \\\n", "0 [show, show] [nan, nan] [nan, nan] \n", "1 [show, no_search] [nan, nan] [nan, nan] \n", "2 [show, show] [nan, nan] [nan, nan] \n", "3 [show, show, show] [nan, nan, nan] [nan, nan, nan] \n", "4 [show, show] [nan, nan] [nan, nan] \n", "\n", " roar_relation_type roar_relation_uri roar_item_issues_id \\\n", "0 [nan, nan] [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] [nan, nan] \n", "2 [nan, nan] [nan, nan] [nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan] [nan, nan] [nan, nan] \n", "\n", " roar_item_issues_type roar_item_issues_description \\\n", "0 [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] \n", "2 [nan, nan] [nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan] [nan, nan] \n", "\n", " roar_item_issues_timestamp roar_item_issues_status \\\n", "0 [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] \n", "2 [nan, nan] [nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan] [nan, nan] \n", "\n", " roar_item_issues_reported_by roar_item_issues_resolved_by \\\n", "0 [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] \n", "2 [nan, nan] [nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan] [nan, nan] \n", "\n", " roar_item_issues_comment roar_item_issues_count roar_sword_depositor \\\n", "0 [nan, nan] [0, nan] [nan, nan] \n", "1 [nan, nan] [0, 0] [nan, nan] \n", "2 [nan, nan] [nan, nan] [nan, nan] \n", "3 [nan, nan, nan] [0, 0, nan] [nan, nan, nan] \n", "4 [nan, nan] [nan, nan] [nan, nan] \n", "\n", " 
roar_sword_slug roar_exemplar \\\n", "0 [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] \n", "2 [nan, nan] [nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan] [nan, nan] \n", "\n", " roar_home_page \\\n", "0 [http://ecnis.openrepository.com/, http://ecni... \n", "1 [https://ir.csmu.edu.tw:8080, https://ir.csmu.... \n", "2 [http://jbc.jelenia-gora.pl/dlibra.html, http:... \n", "3 [http://kce.docressources.info/opac/index.php?... \n", "4 [http://encore.tut.ac.za/iii/cpro, http://enco... \n", "\n", " roar_title \\\n", "0 [ECNIS Repository (Environmental Cancer Risk, ... \n", "1 [Chung Shan Medical University Institutional R... \n", "2 [Digital Library of Jelenia Góra, Digital Libr... \n", "3 [KCE Repository, KCE Repository, KCE Repository] \n", "4 [Content Pro IRX, Content Pro IRX] \n", "\n", " roar_oai_pmh \\\n", "0 [nan, nan] \n", "1 [https://ir.csmu.edu.tw:8080/ir-oai/request?ve... \n", "2 [http://jbc.jelenia-gora.pl/dlibra/oai-pmh-rep... \n", "3 [http://kce.docressources.info/ws/PMBWs_2, htt... \n", "4 [nan, http://encore.tut.ac.za/iii/oairep/OAIRe... \n", "\n", " roar_sword_endpoint roar_rss_feed \\\n", "0 [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] \n", "2 [nan, nan] [nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] \n", "4 [http://encore.tut.ac.za/iii/cpro/, nan] [nan, nan] \n", "\n", " roar_twitter_feed roar_description \\\n", "0 [nan, nan] [This site is a subject specific repository co... \n", "1 [nan, nan] [nan, nan] \n", "2 [nan, nan] [Users may set up RSS feeds to be alerted to n... \n", "3 [nan, nan, nan] [This site provides access to the publication ... \n", "4 [nan, nan] [Tshwane University of Technology Digital Open... 
\n", "\n", " roar_fulltext roar_open_access roar_mandate \\\n", "0 [TRUE, nan] [TRUE, nan] [nan, nan] \n", "1 [TRUE, TRUE] [TRUE, TRUE] [FALSE, FALSE] \n", "2 [nan, nan] [nan, nan] [nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "4 [TRUE, TRUE] [TRUE, TRUE] [TRUE, FALSE] \n", "\n", " roar_organisation_title \\\n", "0 [ECNIS (Environmental Cancer Risk, Nutrition a... \n", "1 [nan, nan] \n", "2 [Jeleniogórskie Centrum Informacji i Edukacji ... \n", "3 [Belgian Health Care Knowledge Centre, Belgian... \n", "4 [Tshwane University of Technology, Tshwane Uni... \n", "\n", " roar_organisation_home_page roar_location_country \\\n", "0 [http://www.ecnis.org, http://www.ecnis.org/] [pl, pl] \n", "1 [nan, nan] [nan, nan] \n", "2 [http://biblioteka.jelenia-gora.pl/, http://bi... [pl, pl] \n", "3 [http://www.kce.fgov.be/, http://www.kce.fgov.... [be, be, be] \n", "4 [http://lib.tut.ac.za, http://tut.ac.za] [za, za] \n", "\n", " roar_location_city roar_location_latitude \\\n", "0 [Lodz, nan] [51.8, 51.8] \n", "1 [nan, nan] [nan, nan] \n", "2 [nan, nan] [50.9012, 50.9012] \n", "3 [nan, nan, nan] [50.8463, 50.8463, 50.8463] \n", "4 [Pretoria, Pretoria] [-25, 25] \n", "\n", " roar_location_longitude roar_software roar_geoname \\\n", "0 [19.5, 19.5] [openrepo, nan] [geoname_2_PL, geoname_2_PL] \n", "1 [nan, nan] [dspace, dspace] [nan, nan] \n", "2 [15.7341, 15.7341] [nan, nan] [geoname_2_PL, geoname_2_PL] \n", "3 [4.3547, 4.3547, 4.3547] [nan, nan, nan] [nan, nan, geoname_2_BE] \n", "4 [28, 28] [other, nan] [geoname_2_ZA, geoname_2_ZA] \n", "\n", " roar_version roar_subjects \\\n", "0 [other, other] [nan, nan] \n", "1 [other, other] [[RT, RC0254, RC1200, R1, RK], [RC0321, RT, RC... 
\n", "2 [other, other] [nan, nan] \n", "3 [other, other, other] [nan, nan, nan] \n", "4 [other, other] [nan, nan] \n", "\n", " roar_date roar_note \\\n", "0 [2008-06-03 08:05:43, 2012-07-01 15:13:36] [nan, nan] \n", "1 [2009-10-21 00:00:00, 2009-10-21 00:00:00] [nan, nan] \n", "2 [2012-07-01 15:12:22, 2009-10-21 11:09:50] [nan, nan] \n", "3 [2009-01-19 09:04:11, 2009-01-19 09:04:11, 201... [nan, nan, nan] \n", "4 [2014-05-26 13:47:54, 2014-07-24 06:31:10] [nan, nan] \n", "\n", " roar_suggestions roar_activity_low roar_activity_medium roar_activity_high \\\n", "0 [nan, nan] [nan, nan] [nan, nan] [nan, nan] \n", "1 [nan, nan] [0, 0] [0, 0] [0, 0] \n", "2 [nan, nan] [0, 0] [0, 0] [0, 0] \n", "3 [nan, nan, nan] [0, 0, 0] [0, 0, 0] [0, 0, 0] \n", "4 [nan, nan] [nan, nan] [nan, nan] [nan, nan] \n", "\n", " roar_recordcount roar_recordhistory \\\n", "0 [nan, nan] [nan, nan] \n", "1 [100, 100] [0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,2... \n", "2 [20, 20] [0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1... \n", "3 [250, 250, 250] [0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,2... \n", "4 [nan, nan] [nan, nan] \n", "\n", " roar_fulltexts_total roar_fulltexts_docs roar_fulltexts_rtotal \\\n", "0 [nan, nan] [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] [nan, nan] \n", "2 [nan, nan] [nan, nan] [nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan] [nan, nan] [nan, nan] \n", "\n", " roar_fulltexts_rdocs roar_registry_name \\\n", "0 [nan, nan] [opendoar, opendoar] \n", "1 [nan, nan] [nan, nan] \n", "2 [nan, nan] [[celestial, opendoar], [celestial, opendoar]] \n", "3 [nan, nan, nan] [[celestial, opendoar], [celestial, opendoar],... 
\n", "4 [nan, nan] [opendoar, celestial] \n", "\n", " roar_registry_id roar_submit_to \\\n", "0 [1254, 1254] [nan, nan] \n", "1 [nan, nan] [celestial, celestial] \n", "2 [[4595, 2211], [4595, 2211]] [nan, nan] \n", "3 [[2246, 1879], [2246, 1879], [2246, 1879]] [nan, nan, nan] \n", "4 [3078, 5657] [nan, nan] \n", "\n", " roar_submitted_to_name roar_submitted_to_done roar_webometrics_rank \\\n", "0 [nan, nan] [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] [nan, nan] \n", "2 [nan, nan] [nan, nan] [nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan] [nan, nan] [nan, nan] \n", "\n", " roar_webometrics_size roar_webometrics_visibility \\\n", "0 [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] \n", "2 [nan, nan] [nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan] [nan, nan] \n", "\n", " roar_webometrics_rich_files roar_webometrics_scholar \\\n", "0 [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] \n", "2 [nan, nan] [nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan] [nan, nan] \n", "\n", " roar_monthly_deposits roar_total_deposits \\\n", "0 [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] \n", "2 [nan, nan] [nan, nan] \n", "3 [0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0... [909, 909, 909] \n", "4 [nan, nan] [nan, nan] \n", "\n", " roar_association roar_unique_id source_set \n", "0 [nan, nan] [roar_474, roar_5541] {roar} \n", "1 [nan, nan] [roar_16867, roar_2907] {roar} \n", "2 [nan, nan] [roar_5432, roar_4030] {roar} \n", "3 [nan, nan, nan] [roar_3020, roar_3401, roar_5252] {roar} \n", "4 [nan, nan] [roar_8405, roar_8716] {roar} " ] }, "execution_count": 36, "metadata": {}, "output_type": "execute_result" } ], "source": [ "dup_within = dup_within.groupby('dedup_id').aggregate(list).reset_index()\n", "dup_within['source_set'] = dup_within.source.map(set)\n", "dup_within.head()" ] }, { "cell_type": "code", "execution_count": 37, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
dedup_idduplicate_idoriginal_idnamesourceunique_idFAIRsharing_idFAIRsharing_typeFAIRsharing_attributes.created-atFAIRsharing_attributes.updated-atFAIRsharing_attributes.metadata.doiFAIRsharing_attributes.metadata.nameFAIRsharing_attributes.metadata.statusFAIRsharing_attributes.metadata.contactsFAIRsharing_attributes.metadata.homepageFAIRsharing_attributes.metadata.identifierFAIRsharing_attributes.metadata.descriptionFAIRsharing_attributes.metadata.abbreviationFAIRsharing_attributes.metadata.support-linksFAIRsharing_attributes.metadata.year-creationFAIRsharing_attributes.metadata.data-processesFAIRsharing_attributes.metadata.cross-referencesFAIRsharing_attributes.legacy-idsFAIRsharing_attributes.fairsharing-registryFAIRsharing_attributes.record-typeFAIRsharing_attributes.subjectsFAIRsharing_attributes.domainsFAIRsharing_attributes.taxonomiesFAIRsharing_attributes.user-defined-tagsFAIRsharing_attributes.countriesFAIRsharing_attributes.nameFAIRsharing_attributes.abbreviationFAIRsharing_attributes.urlFAIRsharing_attributes.doiFAIRsharing_attributes.fairsharing-licenceFAIRsharing_attributes.descriptionFAIRsharing_attributes.publicationsFAIRsharing_attributes.licence-linksFAIRsharing_attributes.url-for-logoFAIRsharing_attributes.metadata.citationsFAIRsharing_attributes.metadata.associated-toolsFAIRsharing_attributes.metadata.deprecation-reasonFAIRsharing_attributes.metadata.data-access-condition.typeFAIRsharing_attributes.metadata.data-contact-informationFAIRsharing_attributes.metadata.data-deposition-condition.urlFAIRsharing_attributes.metadata.data-deposition-condition.typeFAIRsharing_attributes.metadata.deprecation-dateFAIRsharing_attributes.metadata.access-pointsFAIRsharing_attributes.metadata.data-access-condition.urlFAIRsharing_attributes.metadata.resource-sustainability.urlFAIRsharing_attributes.metadata.resource-sustainability.nameFAIRsharing_attributes.metadata.data-preservation-policy.urlFAIRsharing_attributes.metadata.data-preservation-policy.nameFAIRsharing_at
tributes.metadata.data-access-for-pre-publication-reviewFAIRsharing_attributes.metadata.data-versioningFAIRsharing_attributes.metadata.data-curation.typeFAIRsharing_attributes.metadata.data-curation.urlFAIRsharing_attributes.metadata.citation-to-related-publicationsFAIRsharing_attributes.metadata.tombstoneFAIRsharing_unique_idre3data_orgIdentifierre3data_repositoryNamere3data_repositoryName.languagere3data_additionalNamere3data_repositoryURLre3data_repositoryIdentifierre3data_repositoryContactre3data_descriptionre3data_description.languagere3data_typere3data_sizere3data_startDatere3data_endDatere3data_repositoryLanguagere3data_subjectre3data_missionStatementURLre3data_contentTypere3data_providerTypere3data_keywordre3data_institutionre3data_policyre3data_databaseAccessre3data_databaseLicensere3data_dataAccessre3data_dataLicensere3data_dataUploadTypere3data_dataUploadLicensere3data_softwarere3data_versioningre3data_apire3data_pidSystemre3data_citationGuidelineURLre3data_aidSystemre3data_enhancedPublicationre3data_qualityManagementre3data_certificatere3data_metadataStandardre3data_syndicationre3data_remarksre3data_entryDatere3data_lastUpdatere3data_unique_idOpenDOAR_system_metadata.idOpenDOAR_repository_metadata.nameOpenDOAR_repository_metadata.alternativenameOpenDOAR_repository_metadata.urlOpenDOAR_repository_metadata.descriptionOpenDOAR_repository_metadata.typeOpenDOAR_repository_metadata.content_languagesOpenDOAR_system_metadata.date_modifiedOpenDOAR_system_metadata.date_createdOpenDOAR_repository_metadata.content_subjectsOpenDOAR_repository_metadata.content_typesOpenDOAR_organizationOpenDOAR_policy_urlsOpenDOAR_repository_metadata.softwareOpenDOAR_repository_metadata.oai_urlOpenDOAR_system_metadata.publicly_visibleOpenDOAR_repository_metadata.repository_statusOpenDOAR_repository_metadata.fulltext_record_countOpenDOAR_repository_metadata.metadata_record_countOpenDOAR_unique_idroar_eprintidroar_rev_numberroar_eprint_statusroar_useridroar_importidroar_sourceroar_dirro
ar_datestamproar_lastmodroar_status_changedroar_typeroar_succeedsroar_commentaryroar_metadata_visibilityroar_latituderoar_longituderoar_relation_typeroar_relation_uriroar_item_issues_idroar_item_issues_typeroar_item_issues_descriptionroar_item_issues_timestamproar_item_issues_statusroar_item_issues_reported_byroar_item_issues_resolved_byroar_item_issues_commentroar_item_issues_countroar_sword_depositorroar_sword_slugroar_exemplarroar_home_pageroar_titleroar_oai_pmhroar_sword_endpointroar_rss_feedroar_twitter_feedroar_descriptionroar_fulltextroar_open_accessroar_mandateroar_organisation_titleroar_organisation_home_pageroar_location_countryroar_location_cityroar_location_latituderoar_location_longituderoar_softwareroar_geonameroar_versionroar_subjectsroar_dateroar_noteroar_suggestionsroar_activity_lowroar_activity_mediumroar_activity_highroar_recordcountroar_recordhistoryroar_fulltexts_totalroar_fulltexts_docsroar_fulltexts_rtotalroar_fulltexts_rdocsroar_registry_nameroar_registry_idroar_submit_toroar_submitted_to_nameroar_submitted_to_doneroar_webometrics_rankroar_webometrics_sizeroar_webometrics_visibilityroar_webometrics_rich_filesroar_webometrics_scholarroar_monthly_depositsroar_total_depositsroar_associationroar_unique_idsource_set
0dedup::038ef33e8d3de51d3536d62e6c103be7[roar::6167, opendoar::2717, roar::6580][6167, 2717, 6580][Institutional Repository UIN Syarif Hidayatul...[roar, OpenDOAR, roar][roar_6167, OpenDOAR_2717, roar_6580][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, 2717, nan][nan, {\"name\": \"institutional repository uin s...[nan, [], nan][nan, http://repository.uinjkt.ac.id/dspace/, ...[nan, nan, nan][nan, institutional, nan][nan, [], nan][nan, 2022-01-12 15:35:36, nan][nan, 2013-07-11 15:52:01, nan][nan, [science, arts, humanities, social scien...[nan, [theses_and_dissertations], nan][nan, [{'name': 
'uin syarif hidayatullah jakar...[nan, [], nan][nan, {\"name\": \"dspace\", \"version\": \"\"}, nan][nan, http://repository.uinjkt.ac.id/oai/, nan][nan, yes, nan][nan, nan, nan][nan, 0.0, nan][nan, 36862.0, nan][nan, OpenDOAR_2717, nan][6167, nan, 6580][13, nan, 16][archive, nan, archive][2178, nan, 2040][nan, nan, nan][nan, nan, nan][disk0/00/00/61/67, nan, disk0/00/00/65/80][2012-12-12 05:42:58, nan, 2013-03-31 16:02:51][2013-07-14 15:12:12, nan, 2013-04-06 01:42:14][2012-12-12 05:42:58, nan, 2013-03-31 16:02:51][institutional, nan, institutional][nan, nan, nan][nan, nan, nan][show, nan, show][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][http://repository.uinjkt.ac.id, nan, http://r...[Institutional Repository UIN Syarif Hidayatul...[[http://repository.uinjkt.ac.id/oai, http://r...[http://repository.uinjkt.ac.id/sword/, nan, nan][nan, nan, nan][nan, nan, nan][nstitutional Repository UIN Syarif Hidayatull...[TRUE, nan, FALSE][TRUE, nan, FALSE][FALSE, nan, FALSE][[UIN Syarif Hidayatullah Jakarta, Pascasarjan...[[http://www.uinjkt.ac.id, http://graduate.uin...[id, nan, id][Jakarta, nan, Jakarta][nan, nan, 106.756][nan, nan, -6.30591][dspace, nan, dspace][geoname_2_ID, nan, geoname_2_ID][other, nan, other][AI, nan, [AC, Z665, Z004, Z719, BP, Q1]][2012-11-07 08:11:19, nan, 2013-03-04 07:20:37][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][[celestial, opendoar], nan, nan][[5108, 2717, 5109], nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][roar_6167, nan, roar_6580]{OpenDOAR, roar}
1dedup::044edcd1c961b3942a7e0e90d1005e2d[roar::7902, opendoar::2468, roar::5216][7902, 2468, 5216][The University of Arizona Campus Repository, ...[roar, OpenDOAR, roar][roar_7902, OpenDOAR_2468, roar_5216][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, 2468, nan][nan, {\"name\": \"university of arizona campus r...[nan, [], nan][nan, http://arizona.openrepository.com/arizon...[nan, nan, nan][nan, institutional, nan][nan, [], nan][nan, 2022-01-12 15:35:32, nan][nan, 2012-05-02 09:50:07, nan][nan, [science, arts, humanities, health and m...[nan, [journal_articles, theses_and_dissertati...[nan, 
[{'name': 'university of arizona', 'alte...[nan, [], nan][nan, {\"name\": \"other\", \"version\": \"\"}, nan][nan, nan, nan][nan, yes, nan][nan, nan, nan][nan, nan, nan][nan, 63231.0, nan][nan, OpenDOAR_2468, nan][7902, nan, 5216][12, nan, 8][archive, nan, archive][4910, nan, 8][nan, nan, nan][nan, nan, nan][disk0/00/00/79/02, nan, disk0/00/00/52/16][2014-03-05 11:50:29, nan, 2012-05-16 23:47:28][2014-05-08 13:10:29, nan, 2012-05-19 01:46:06][2014-03-05 11:50:29, nan, 2012-05-16 23:47:28][institutional, nan, institutional][nan, nan, nan][nan, nan, nan][show, nan, show][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][http://arizona.openrepository.com/arizona/, n...[The University of Arizona Campus Repository, ...[http://arizona.openrepository.com/arizona/oai...[nan, nan, nan][http://arizona.openrepository.com/arizona/fee...[nan, nan, nan][The UA Campus Repository is an institutional ...[TRUE, nan, nan][TRUE, nan, nan][FALSE, nan, nan][The University of Arizona, nan, University of...[http://www.arizona.edu/, nan, http://www.ariz...[us, nan, us][Tucson, nan, nan][nan, nan, 32.2531][nan, nan, -110.948][dspace, nan, nan][geoname_2_US, nan, geoname_2_US][other, nan, other][nan, nan, nan][2014-02-25 20:17:47, nan, 2012-05-13 15:12:37][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][[celestial, opendoar], nan, opendoar][[5404, http://opendoar.org/id/2468/], nan, 2468][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][roar_7902, nan, roar_5216]{OpenDOAR, roar}
2dedup::0468c62a26a75be73109e1efa74bee44[roar::12182, opendoar::3096, roar::8677][12182, 3096, 8677][ScholarWorks @ UVM, scholarworks @ uvm, Schol...[roar, OpenDOAR, roar][roar_12182, OpenDOAR_3096, roar_8677][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, 3096, nan][nan, {\"name\": \"scholarworks @ uvm\", \"language...[nan, [], nan][nan, http://scholarworks.uvm.edu/, nan][nan, nan, nan][nan, institutional, nan][nan, [], nan][nan, 2022-01-12 15:35:42, nan][nan, 2014-06-26 16:50:45, nan][nan, [science, technology, engineering, mathe...[nan, [journal_articles, conference_and_worksh...[nan, 
[{'name': 'university of vermont', 'alte...[nan, [{\"policy_url\": \"http://scholarworks.uvm...[nan, {\"name\": \"other\", \"version\": \"\"}, nan][nan, http://scholarworks.uvm.edu/do/oai/, nan][nan, yes, nan][nan, nan, nan][nan, nan, nan][nan, 2871.0, nan][nan, OpenDOAR_3096, nan][12182, nan, 8677][11, nan, 11][archive, nan, archive][404, nan, 5634][nan, nan, nan][nan, nan, nan][disk0/00/01/21/82, nan, disk0/00/00/86/77][2017-03-11 17:50:59, nan, 2014-10-08 18:32:00][2017-03-18 02:36:55, nan, 2014-10-11 01:36:04][2017-03-11 17:50:59, nan, 2014-10-08 18:32:00][institutional, nan, institutional][nan, nan, nan][nan, nan, nan][show, nan, show][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][http://scholarworks.uvm.edu/, nan, http://sch...[ScholarWorks @ UVM, nan, ScholarWorks @ UVM][http://scholarworks.uvm.edu/do/oai/, nan, htt...[nan, nan, nan][http://scholarworks.uvm.edu/recent.rss, nan, ...[nan, nan, nan][ScholarWorks @ UVM collects, preserves, and s...[TRUE, nan, TRUE][TRUE, nan, TRUE][FALSE, nan, FALSE][University of Vermont, nan, University of Ver...[https://www.uvm.edu/, nan, http://www.uvm.edu][us, nan, us][Burlington, VT, nan, Burington][44.4759, nan, 44.4856][-73.2121, nan, -73.2117][bepress, nan, bepress][geoname_2_US, nan, geoname_2_US][other, nan, other][nan, nan, nan][2017-01-13 20:44:06, nan, 2014-07-16 21:08:43][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][celestial, nan, [celestial, opendoar]][5654, nan, [http://opendoar.org/id/3096/, 5654]][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][roar_12182, nan, roar_8677]{OpenDOAR, roar}
3dedup::053eb8ab14c76525fd6f1daeb061f064[opendoar::9528, roar::15805, roar::15765][9528, 15805, 15765][repositorio institucional históricas - unam, ...[OpenDOAR, roar, roar][OpenDOAR_9528, roar_15805, roar_15765][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][9528, nan, nan][{\"name\": \"repositorio institucional hist\\u00f...[[], nan, nan][http://ru.historicas.unam.mx, nan, nan][nan, nan, nan][institutional, nan, nan][[], nan, nan][2022-01-12 15:36:31, nan, nan][2020-02-25 08:36:10, nan, nan][[humanities, technology], nan, nan][[journal_articles, other_special_item_types],...[[{'name': 'unam', 
'alternativeName': 'institu...[[], nan, nan][{\"name\": \"dspace\", \"version\": \"\"}, nan, nan][http://ru.historicas.unam.mx/oai/request, nan...[yes, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][OpenDOAR_9528, nan, nan][nan, 15805, 15765][nan, 5, 19][nan, archive, archive][nan, 12662, 12662][nan, nan, nan][nan, nan, nan][nan, disk0/00/01/58/05, disk0/00/01/57/65][nan, 2020-10-19 15:32:48, 2020-10-19 15:31:52][nan, 2021-01-25 22:20:40, 2021-01-26 20:47:24][nan, 2020-10-19 15:32:48, 2020-10-19 15:31:52][nan, institutional, institutional][nan, 15765, nan][nan, nan, nan][nan, show, no_search][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, http://ru.historicas.unam.mx/, https://r...[nan, Repositorio Institucional Históricas-UNA...[nan, http://ru.historicas.unam.mx/oai/request...[nan, nan, nan][nan, http://ru.historicas.unam.mx/feed/rss_1....[nan, nan, nan][nan, El Repositorio Institucional Históricas-...[nan, TRUE, TRUE][nan, TRUE, TRUE][nan, TRUE, TRUE][nan, Instituto de Investigaciones Históricas,...[nan, http://www.historicas.unam.mx/, http://w...[nan, mx, mx][nan, Ciudad de México, Ciudad de México][nan, nan, nan][nan, nan, nan][nan, dspace, dspace][nan, geoname_2_MX, geoname_2_MX][nan, other, other][nan, [D1, E11, F1201, D111, D901, DP, D204, D...[nan, 2020-02-14 18:36:03, 2020-02-14 18:36:03][nan, ¿Quién puede depositar documentos en el ...[nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, opendoar][nan, nan, 9528][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, [russell_group, ivy_league], [russell_gr...[nan, roar_15805, roar_15765]{OpenDOAR, 
roar}
4dedup::06a4be0dca480e71b823fd599ed221a0[opendoar::2557, roar::5840, roar::5915][2557, 5840, 5915][biblioteka cyfrowa diecezji legnickiej, Bibli...[OpenDOAR, roar, roar][OpenDOAR_2557, roar_5840, roar_5915][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][2557, nan, nan][{\"name\": \"biblioteka cyfrowa diecezji legnick...[[], nan, nan][http://bcdl.pl/dlibra, nan, nan][nan, nan, nan][institutional, nan, nan][[], nan, nan][2022-01-12 15:35:34, nan, nan][2012-08-20 11:35:42, nan, nan][[humanities], nan, nan][[journal_articles, books_chapters_and_section...[[{'name': 'biblioteka wyższego seminarium 
duc...[[], nan, nan][{\"name\": \"dlibra\", \"version\": \"\"}, nan, nan][http://bcdl.pl/dlibra/oai-pmh-repository.xml,...[yes, nan, nan][nan, nan, nan][0.0, nan, nan][368.0, nan, nan][OpenDOAR_2557, nan, nan][nan, 5840, 5915][nan, 9, 9][nan, archive, archive][nan, 8, 8][nan, nan, nan][nan, nan, nan][nan, disk0/00/00/58/40, disk0/00/00/59/15][nan, 2012-12-12 04:59:36, 2012-12-12 05:12:30][nan, 2012-12-17 06:53:45, 2012-12-17 06:53:50][nan, 2012-12-12 04:59:36, 2012-12-12 05:12:30][nan, institutional, institutional][nan, nan, nan][nan, nan, nan][nan, show, show][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, http://bcdl.pl/, http://bcdl.pl/dlibra][nan, Biblioteka Cyfrowa Diecezji Legnickiej, ...[nan, http://bcdl.pl/dlibra/oai-pmh-repository...[nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, This site provides access to the digitis...[nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, Biblioteka Wyższego Seminarium Duchowneg...[nan, http://www.biblioteka.diecezja.legnica.p...[nan, pl, pl][nan, nan, nan][nan, 51.207, 51.207][nan, 16.1553, 16.1553][nan, nan, nan][nan, geoname_2_PL, geoname_2_PL][nan, other, other][nan, nan, nan][nan, 2012-08-26 15:12:13, 2012-09-16 15:12:16][nan, nan, nan][nan, nan, nan][nan, 0, 0][nan, 0, 0][nan, 0, 0][nan, 20, 20][nan, 0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,...[nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, [celestial, opendoar], [celestial, opend...[nan, [2557, 5081], [2557, 5081]][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, roar_5840, roar_5915]{OpenDOAR, roar}
\n", "
" ], "text/plain": [ " dedup_id \\\n", "0 dedup::038ef33e8d3de51d3536d62e6c103be7 \n", "1 dedup::044edcd1c961b3942a7e0e90d1005e2d \n", "2 dedup::0468c62a26a75be73109e1efa74bee44 \n", "3 dedup::053eb8ab14c76525fd6f1daeb061f064 \n", "4 dedup::06a4be0dca480e71b823fd599ed221a0 \n", "\n", " duplicate_id original_id \\\n", "0 [roar::6167, opendoar::2717, roar::6580] [6167, 2717, 6580] \n", "1 [roar::7902, opendoar::2468, roar::5216] [7902, 2468, 5216] \n", "2 [roar::12182, opendoar::3096, roar::8677] [12182, 3096, 8677] \n", "3 [opendoar::9528, roar::15805, roar::15765] [9528, 15805, 15765] \n", "4 [opendoar::2557, roar::5840, roar::5915] [2557, 5840, 5915] \n", "\n", " name source \\\n", "0 [Institutional Repository UIN Syarif Hidayatul... [roar, OpenDOAR, roar] \n", "1 [The University of Arizona Campus Repository, ... [roar, OpenDOAR, roar] \n", "2 [ScholarWorks @ UVM, scholarworks @ uvm, Schol... [roar, OpenDOAR, roar] \n", "3 [repositorio institucional históricas - unam, ... [OpenDOAR, roar, roar] \n", "4 [biblioteka cyfrowa diecezji legnickiej, Bibli... 
[OpenDOAR, roar, roar] \n", "\n", " unique_id FAIRsharing_id FAIRsharing_type \\\n", "0 [roar_6167, OpenDOAR_2717, roar_6580] [nan, nan, nan] [nan, nan, nan] \n", "1 [roar_7902, OpenDOAR_2468, roar_5216] [nan, nan, nan] [nan, nan, nan] \n", "2 [roar_12182, OpenDOAR_3096, roar_8677] [nan, nan, nan] [nan, nan, nan] \n", "3 [OpenDOAR_9528, roar_15805, roar_15765] [nan, nan, nan] [nan, nan, nan] \n", "4 [OpenDOAR_2557, roar_5840, roar_5915] [nan, nan, nan] [nan, nan, nan] \n", "\n", " FAIRsharing_attributes.created-at FAIRsharing_attributes.updated-at \\\n", "0 [nan, nan, nan] [nan, nan, nan] \n", "1 [nan, nan, nan] [nan, nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan, nan] [nan, nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.doi FAIRsharing_attributes.metadata.name \\\n", "0 [nan, nan, nan] [nan, nan, nan] \n", "1 [nan, nan, nan] [nan, nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan, nan] [nan, nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.status \\\n", "0 [nan, nan, nan] \n", "1 [nan, nan, nan] \n", "2 [nan, nan, nan] \n", "3 [nan, nan, nan] \n", "4 [nan, nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.contacts \\\n", "0 [nan, nan, nan] \n", "1 [nan, nan, nan] \n", "2 [nan, nan, nan] \n", "3 [nan, nan, nan] \n", "4 [nan, nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.homepage \\\n", "0 [nan, nan, nan] \n", "1 [nan, nan, nan] \n", "2 [nan, nan, nan] \n", "3 [nan, nan, nan] \n", "4 [nan, nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.identifier \\\n", "0 [nan, nan, nan] \n", "1 [nan, nan, nan] \n", "2 [nan, nan, nan] \n", "3 [nan, nan, nan] \n", "4 [nan, nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.description \\\n", "0 [nan, nan, nan] \n", "1 [nan, nan, nan] \n", "2 [nan, nan, nan] \n", "3 [nan, nan, nan] \n", "4 [nan, nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.abbreviation \\\n", "0 
[nan, nan, nan] \n", "1 [nan, nan, nan] \n", "2 [nan, nan, nan] \n", "3 [nan, nan, nan] \n", "4 [nan, nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.support-links \\\n", "0 [nan, nan, nan] \n", "1 [nan, nan, nan] \n", "2 [nan, nan, nan] \n", "3 [nan, nan, nan] \n", "4 [nan, nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.year-creation \\\n", "0 [nan, nan, nan] \n", "1 [nan, nan, nan] \n", "2 [nan, nan, nan] \n", "3 [nan, nan, nan] \n", "4 [nan, nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.data-processes \\\n", "0 [nan, nan, nan] \n", "1 [nan, nan, nan] \n", "2 [nan, nan, nan] \n", "3 [nan, nan, nan] \n", "4 [nan, nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.cross-references \\\n", "0 [nan, nan, nan] \n", "1 [nan, nan, nan] \n", "2 [nan, nan, nan] \n", "3 [nan, nan, nan] \n", "4 [nan, nan, nan] \n", "\n", " FAIRsharing_attributes.legacy-ids \\\n", "0 [nan, nan, nan] \n", "1 [nan, nan, nan] \n", "2 [nan, nan, nan] \n", "3 [nan, nan, nan] \n", "4 [nan, nan, nan] \n", "\n", " FAIRsharing_attributes.fairsharing-registry \\\n", "0 [nan, nan, nan] \n", "1 [nan, nan, nan] \n", "2 [nan, nan, nan] \n", "3 [nan, nan, nan] \n", "4 [nan, nan, nan] \n", "\n", " FAIRsharing_attributes.record-type FAIRsharing_attributes.subjects \\\n", "0 [nan, nan, nan] [nan, nan, nan] \n", "1 [nan, nan, nan] [nan, nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan, nan] [nan, nan, nan] \n", "\n", " FAIRsharing_attributes.domains FAIRsharing_attributes.taxonomies \\\n", "0 [nan, nan, nan] [nan, nan, nan] \n", "1 [nan, nan, nan] [nan, nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan, nan] [nan, nan, nan] \n", "\n", " FAIRsharing_attributes.user-defined-tags FAIRsharing_attributes.countries \\\n", "0 [nan, nan, nan] [nan, nan, nan] \n", "1 [nan, nan, nan] [nan, nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] 
\n", "4 [nan, nan, nan] [nan, nan, nan] \n", "\n", " FAIRsharing_attributes.name FAIRsharing_attributes.abbreviation \\\n", "0 [nan, nan, nan] [nan, nan, nan] \n", "1 [nan, nan, nan] [nan, nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan, nan] [nan, nan, nan] \n", "\n", " FAIRsharing_attributes.url FAIRsharing_attributes.doi \\\n", "0 [nan, nan, nan] [nan, nan, nan] \n", "1 [nan, nan, nan] [nan, nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan, nan] [nan, nan, nan] \n", "\n", " FAIRsharing_attributes.fairsharing-licence \\\n", "0 [nan, nan, nan] \n", "1 [nan, nan, nan] \n", "2 [nan, nan, nan] \n", "3 [nan, nan, nan] \n", "4 [nan, nan, nan] \n", "\n", " FAIRsharing_attributes.description FAIRsharing_attributes.publications \\\n", "0 [nan, nan, nan] [nan, nan, nan] \n", "1 [nan, nan, nan] [nan, nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan, nan] [nan, nan, nan] \n", "\n", " FAIRsharing_attributes.licence-links FAIRsharing_attributes.url-for-logo \\\n", "0 [nan, nan, nan] [nan, nan, nan] \n", "1 [nan, nan, nan] [nan, nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan, nan] [nan, nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.citations \\\n", "0 [nan, nan, nan] \n", "1 [nan, nan, nan] \n", "2 [nan, nan, nan] \n", "3 [nan, nan, nan] \n", "4 [nan, nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.associated-tools \\\n", "0 [nan, nan, nan] \n", "1 [nan, nan, nan] \n", "2 [nan, nan, nan] \n", "3 [nan, nan, nan] \n", "4 [nan, nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.deprecation-reason \\\n", "0 [nan, nan, nan] \n", "1 [nan, nan, nan] \n", "2 [nan, nan, nan] \n", "3 [nan, nan, nan] \n", "4 [nan, nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.data-access-condition.type \\\n", "0 [nan, nan, nan] \n", "1 [nan, 
nan, nan] \n", "2 [nan, nan, nan] \n", "3 [nan, nan, nan] \n", "4 [nan, nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.data-contact-information \\\n", "0 [nan, nan, nan] \n", "1 [nan, nan, nan] \n", "2 [nan, nan, nan] \n", "3 [nan, nan, nan] \n", "4 [nan, nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.data-deposition-condition.url \\\n", "0 [nan, nan, nan] \n", "1 [nan, nan, nan] \n", "2 [nan, nan, nan] \n", "3 [nan, nan, nan] \n", "4 [nan, nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.data-deposition-condition.type \\\n", "0 [nan, nan, nan] \n", "1 [nan, nan, nan] \n", "2 [nan, nan, nan] \n", "3 [nan, nan, nan] \n", "4 [nan, nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.deprecation-date \\\n", "0 [nan, nan, nan] \n", "1 [nan, nan, nan] \n", "2 [nan, nan, nan] \n", "3 [nan, nan, nan] \n", "4 [nan, nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.access-points \\\n", "0 [nan, nan, nan] \n", "1 [nan, nan, nan] \n", "2 [nan, nan, nan] \n", "3 [nan, nan, nan] \n", "4 [nan, nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.data-access-condition.url \\\n", "0 [nan, nan, nan] \n", "1 [nan, nan, nan] \n", "2 [nan, nan, nan] \n", "3 [nan, nan, nan] \n", "4 [nan, nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.resource-sustainability.url \\\n", "0 [nan, nan, nan] \n", "1 [nan, nan, nan] \n", "2 [nan, nan, nan] \n", "3 [nan, nan, nan] \n", "4 [nan, nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.resource-sustainability.name \\\n", "0 [nan, nan, nan] \n", "1 [nan, nan, nan] \n", "2 [nan, nan, nan] \n", "3 [nan, nan, nan] \n", "4 [nan, nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.data-preservation-policy.url \\\n", "0 [nan, nan, nan] \n", "1 [nan, nan, nan] \n", "2 [nan, nan, nan] \n", "3 [nan, nan, nan] \n", "4 [nan, nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.data-preservation-policy.name \\\n", "0 [nan, nan, nan] \n", "1 [nan, nan, nan] \n", "2 [nan, nan, nan] \n", "3 [nan, nan, nan] \n", "4 
[nan, nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.data-access-for-pre-publication-review \\\n", "0 [nan, nan, nan] \n", "1 [nan, nan, nan] \n", "2 [nan, nan, nan] \n", "3 [nan, nan, nan] \n", "4 [nan, nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.data-versioning \\\n", "0 [nan, nan, nan] \n", "1 [nan, nan, nan] \n", "2 [nan, nan, nan] \n", "3 [nan, nan, nan] \n", "4 [nan, nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.data-curation.type \\\n", "0 [nan, nan, nan] \n", "1 [nan, nan, nan] \n", "2 [nan, nan, nan] \n", "3 [nan, nan, nan] \n", "4 [nan, nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.data-curation.url \\\n", "0 [nan, nan, nan] \n", "1 [nan, nan, nan] \n", "2 [nan, nan, nan] \n", "3 [nan, nan, nan] \n", "4 [nan, nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.citation-to-related-publications \\\n", "0 [nan, nan, nan] \n", "1 [nan, nan, nan] \n", "2 [nan, nan, nan] \n", "3 [nan, nan, nan] \n", "4 [nan, nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.tombstone FAIRsharing_unique_id \\\n", "0 [nan, nan, nan] [nan, nan, nan] \n", "1 [nan, nan, nan] [nan, nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan, nan] [nan, nan, nan] \n", "\n", " re3data_orgIdentifier re3data_repositoryName \\\n", "0 [nan, nan, nan] [nan, nan, nan] \n", "1 [nan, nan, nan] [nan, nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan, nan] [nan, nan, nan] \n", "\n", " re3data_repositoryName.language re3data_additionalName \\\n", "0 [nan, nan, nan] [nan, nan, nan] \n", "1 [nan, nan, nan] [nan, nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan, nan] [nan, nan, nan] \n", "\n", " re3data_repositoryURL re3data_repositoryIdentifier \\\n", "0 [nan, nan, nan] [nan, nan, nan] \n", "1 [nan, nan, nan] [nan, nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan, nan] 
[nan, nan, nan] \n", "4 [nan, nan, nan] [nan, nan, nan] \n", "\n", " re3data_repositoryContact re3data_description re3data_description.language \\\n", "0 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "1 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "\n", " re3data_type re3data_size re3data_startDate re3data_endDate \\\n", "0 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "1 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "\n", " re3data_repositoryLanguage re3data_subject re3data_missionStatementURL \\\n", "0 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "1 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "\n", " re3data_contentType re3data_providerType re3data_keyword \\\n", "0 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "1 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "\n", " re3data_institution re3data_policy re3data_databaseAccess \\\n", "0 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "1 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "\n", " re3data_databaseLicense re3data_dataAccess 
re3data_dataLicense \\\n", "0 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "1 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "\n", " re3data_dataUploadType re3data_dataUploadLicense re3data_software \\\n", "0 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "1 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "\n", " re3data_versioning re3data_api re3data_pidSystem \\\n", "0 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "1 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "\n", " re3data_citationGuidelineURL re3data_aidSystem re3data_enhancedPublication \\\n", "0 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "1 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "\n", " re3data_qualityManagement re3data_certificate re3data_metadataStandard \\\n", "0 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "1 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "\n", " re3data_syndication re3data_remarks re3data_entryDate re3data_lastUpdate \\\n", "0 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "1 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "2 [nan, nan, nan] 
[nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "\n", " re3data_unique_id OpenDOAR_system_metadata.id \\\n", "0 [nan, nan, nan] [nan, 2717, nan] \n", "1 [nan, nan, nan] [nan, 2468, nan] \n", "2 [nan, nan, nan] [nan, 3096, nan] \n", "3 [nan, nan, nan] [9528, nan, nan] \n", "4 [nan, nan, nan] [2557, nan, nan] \n", "\n", " OpenDOAR_repository_metadata.name \\\n", "0 [nan, {\"name\": \"institutional repository uin s... \n", "1 [nan, {\"name\": \"university of arizona campus r... \n", "2 [nan, {\"name\": \"scholarworks @ uvm\", \"language... \n", "3 [{\"name\": \"repositorio institucional hist\\u00f... \n", "4 [{\"name\": \"biblioteka cyfrowa diecezji legnick... \n", "\n", " OpenDOAR_repository_metadata.alternativename \\\n", "0 [nan, [], nan] \n", "1 [nan, [], nan] \n", "2 [nan, [], nan] \n", "3 [[], nan, nan] \n", "4 [[], nan, nan] \n", "\n", " OpenDOAR_repository_metadata.url \\\n", "0 [nan, http://repository.uinjkt.ac.id/dspace/, ... \n", "1 [nan, http://arizona.openrepository.com/arizon... 
\n", "2 [nan, http://scholarworks.uvm.edu/, nan] \n", "3 [http://ru.historicas.unam.mx, nan, nan] \n", "4 [http://bcdl.pl/dlibra, nan, nan] \n", "\n", " OpenDOAR_repository_metadata.description OpenDOAR_repository_metadata.type \\\n", "0 [nan, nan, nan] [nan, institutional, nan] \n", "1 [nan, nan, nan] [nan, institutional, nan] \n", "2 [nan, nan, nan] [nan, institutional, nan] \n", "3 [nan, nan, nan] [institutional, nan, nan] \n", "4 [nan, nan, nan] [institutional, nan, nan] \n", "\n", " OpenDOAR_repository_metadata.content_languages \\\n", "0 [nan, [], nan] \n", "1 [nan, [], nan] \n", "2 [nan, [], nan] \n", "3 [[], nan, nan] \n", "4 [[], nan, nan] \n", "\n", " OpenDOAR_system_metadata.date_modified \\\n", "0 [nan, 2022-01-12 15:35:36, nan] \n", "1 [nan, 2022-01-12 15:35:32, nan] \n", "2 [nan, 2022-01-12 15:35:42, nan] \n", "3 [2022-01-12 15:36:31, nan, nan] \n", "4 [2022-01-12 15:35:34, nan, nan] \n", "\n", " OpenDOAR_system_metadata.date_created \\\n", "0 [nan, 2013-07-11 15:52:01, nan] \n", "1 [nan, 2012-05-02 09:50:07, nan] \n", "2 [nan, 2014-06-26 16:50:45, nan] \n", "3 [2020-02-25 08:36:10, nan, nan] \n", "4 [2012-08-20 11:35:42, nan, nan] \n", "\n", " OpenDOAR_repository_metadata.content_subjects \\\n", "0 [nan, [science, arts, humanities, social scien... \n", "1 [nan, [science, arts, humanities, health and m... \n", "2 [nan, [science, technology, engineering, mathe... \n", "3 [[humanities, technology], nan, nan] \n", "4 [[humanities], nan, nan] \n", "\n", " OpenDOAR_repository_metadata.content_types \\\n", "0 [nan, [theses_and_dissertations], nan] \n", "1 [nan, [journal_articles, theses_and_dissertati... \n", "2 [nan, [journal_articles, conference_and_worksh... \n", "3 [[journal_articles, other_special_item_types],... \n", "4 [[journal_articles, books_chapters_and_section... \n", "\n", " OpenDOAR_organization \\\n", "0 [nan, [{'name': 'uin syarif hidayatullah jakar... \n", "1 [nan, [{'name': 'university of arizona', 'alte... 
\n", "2 [nan, [{'name': 'university of vermont', 'alte... \n", "3 [[{'name': 'unam', 'alternativeName': 'institu... \n", "4 [[{'name': 'biblioteka wyższego seminarium duc... \n", "\n", " OpenDOAR_policy_urls \\\n", "0 [nan, [], nan] \n", "1 [nan, [], nan] \n", "2 [nan, [{\"policy_url\": \"http://scholarworks.uvm... \n", "3 [[], nan, nan] \n", "4 [[], nan, nan] \n", "\n", " OpenDOAR_repository_metadata.software \\\n", "0 [nan, {\"name\": \"dspace\", \"version\": \"\"}, nan] \n", "1 [nan, {\"name\": \"other\", \"version\": \"\"}, nan] \n", "2 [nan, {\"name\": \"other\", \"version\": \"\"}, nan] \n", "3 [{\"name\": \"dspace\", \"version\": \"\"}, nan, nan] \n", "4 [{\"name\": \"dlibra\", \"version\": \"\"}, nan, nan] \n", "\n", " OpenDOAR_repository_metadata.oai_url \\\n", "0 [nan, http://repository.uinjkt.ac.id/oai/, nan] \n", "1 [nan, nan, nan] \n", "2 [nan, http://scholarworks.uvm.edu/do/oai/, nan] \n", "3 [http://ru.historicas.unam.mx/oai/request, nan... \n", "4 [http://bcdl.pl/dlibra/oai-pmh-repository.xml,... 
\n", "\n", " OpenDOAR_system_metadata.publicly_visible \\\n", "0 [nan, yes, nan] \n", "1 [nan, yes, nan] \n", "2 [nan, yes, nan] \n", "3 [yes, nan, nan] \n", "4 [yes, nan, nan] \n", "\n", " OpenDOAR_repository_metadata.repository_status \\\n", "0 [nan, nan, nan] \n", "1 [nan, nan, nan] \n", "2 [nan, nan, nan] \n", "3 [nan, nan, nan] \n", "4 [nan, nan, nan] \n", "\n", " OpenDOAR_repository_metadata.fulltext_record_count \\\n", "0 [nan, 0.0, nan] \n", "1 [nan, nan, nan] \n", "2 [nan, nan, nan] \n", "3 [nan, nan, nan] \n", "4 [0.0, nan, nan] \n", "\n", " OpenDOAR_repository_metadata.metadata_record_count \\\n", "0 [nan, 36862.0, nan] \n", "1 [nan, 63231.0, nan] \n", "2 [nan, 2871.0, nan] \n", "3 [nan, nan, nan] \n", "4 [368.0, nan, nan] \n", "\n", " OpenDOAR_unique_id roar_eprintid roar_rev_number \\\n", "0 [nan, OpenDOAR_2717, nan] [6167, nan, 6580] [13, nan, 16] \n", "1 [nan, OpenDOAR_2468, nan] [7902, nan, 5216] [12, nan, 8] \n", "2 [nan, OpenDOAR_3096, nan] [12182, nan, 8677] [11, nan, 11] \n", "3 [OpenDOAR_9528, nan, nan] [nan, 15805, 15765] [nan, 5, 19] \n", "4 [OpenDOAR_2557, nan, nan] [nan, 5840, 5915] [nan, 9, 9] \n", "\n", " roar_eprint_status roar_userid roar_importid \\\n", "0 [archive, nan, archive] [2178, nan, 2040] [nan, nan, nan] \n", "1 [archive, nan, archive] [4910, nan, 8] [nan, nan, nan] \n", "2 [archive, nan, archive] [404, nan, 5634] [nan, nan, nan] \n", "3 [nan, archive, archive] [nan, 12662, 12662] [nan, nan, nan] \n", "4 [nan, archive, archive] [nan, 8, 8] [nan, nan, nan] \n", "\n", " roar_source roar_dir \\\n", "0 [nan, nan, nan] [disk0/00/00/61/67, nan, disk0/00/00/65/80] \n", "1 [nan, nan, nan] [disk0/00/00/79/02, nan, disk0/00/00/52/16] \n", "2 [nan, nan, nan] [disk0/00/01/21/82, nan, disk0/00/00/86/77] \n", "3 [nan, nan, nan] [nan, disk0/00/01/58/05, disk0/00/01/57/65] \n", "4 [nan, nan, nan] [nan, disk0/00/00/58/40, disk0/00/00/59/15] \n", "\n", " roar_datestamp \\\n", "0 [2012-12-12 05:42:58, nan, 2013-03-31 16:02:51] \n", "1 
[2014-03-05 11:50:29, nan, 2012-05-16 23:47:28] \n", "2 [2017-03-11 17:50:59, nan, 2014-10-08 18:32:00] \n", "3 [nan, 2020-10-19 15:32:48, 2020-10-19 15:31:52] \n", "4 [nan, 2012-12-12 04:59:36, 2012-12-12 05:12:30] \n", "\n", " roar_lastmod \\\n", "0 [2013-07-14 15:12:12, nan, 2013-04-06 01:42:14] \n", "1 [2014-05-08 13:10:29, nan, 2012-05-19 01:46:06] \n", "2 [2017-03-18 02:36:55, nan, 2014-10-11 01:36:04] \n", "3 [nan, 2021-01-25 22:20:40, 2021-01-26 20:47:24] \n", "4 [nan, 2012-12-17 06:53:45, 2012-12-17 06:53:50] \n", "\n", " roar_status_changed \\\n", "0 [2012-12-12 05:42:58, nan, 2013-03-31 16:02:51] \n", "1 [2014-03-05 11:50:29, nan, 2012-05-16 23:47:28] \n", "2 [2017-03-11 17:50:59, nan, 2014-10-08 18:32:00] \n", "3 [nan, 2020-10-19 15:32:48, 2020-10-19 15:31:52] \n", "4 [nan, 2012-12-12 04:59:36, 2012-12-12 05:12:30] \n", "\n", " roar_type roar_succeeds roar_commentary \\\n", "0 [institutional, nan, institutional] [nan, nan, nan] [nan, nan, nan] \n", "1 [institutional, nan, institutional] [nan, nan, nan] [nan, nan, nan] \n", "2 [institutional, nan, institutional] [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, institutional, institutional] [nan, 15765, nan] [nan, nan, nan] \n", "4 [nan, institutional, institutional] [nan, nan, nan] [nan, nan, nan] \n", "\n", " roar_metadata_visibility roar_latitude roar_longitude \\\n", "0 [show, nan, show] [nan, nan, nan] [nan, nan, nan] \n", "1 [show, nan, show] [nan, nan, nan] [nan, nan, nan] \n", "2 [show, nan, show] [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, show, no_search] [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, show, show] [nan, nan, nan] [nan, nan, nan] \n", "\n", " roar_relation_type roar_relation_uri roar_item_issues_id \\\n", "0 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "1 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", 
"\n", " roar_item_issues_type roar_item_issues_description \\\n", "0 [nan, nan, nan] [nan, nan, nan] \n", "1 [nan, nan, nan] [nan, nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan, nan] [nan, nan, nan] \n", "\n", " roar_item_issues_timestamp roar_item_issues_status \\\n", "0 [nan, nan, nan] [nan, nan, nan] \n", "1 [nan, nan, nan] [nan, nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan, nan] [nan, nan, nan] \n", "\n", " roar_item_issues_reported_by roar_item_issues_resolved_by \\\n", "0 [nan, nan, nan] [nan, nan, nan] \n", "1 [nan, nan, nan] [nan, nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan, nan] [nan, nan, nan] \n", "\n", " roar_item_issues_comment roar_item_issues_count roar_sword_depositor \\\n", "0 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "1 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "\n", " roar_sword_slug roar_exemplar \\\n", "0 [nan, nan, nan] [nan, nan, nan] \n", "1 [nan, nan, nan] [nan, nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan, nan] [nan, nan, nan] \n", "\n", " roar_home_page \\\n", "0 [http://repository.uinjkt.ac.id, nan, http://r... \n", "1 [http://arizona.openrepository.com/arizona/, n... \n", "2 [http://scholarworks.uvm.edu/, nan, http://sch... \n", "3 [nan, http://ru.historicas.unam.mx/, https://r... \n", "4 [nan, http://bcdl.pl/, http://bcdl.pl/dlibra] \n", "\n", " roar_title \\\n", "0 [Institutional Repository UIN Syarif Hidayatul... \n", "1 [The University of Arizona Campus Repository, ... \n", "2 [ScholarWorks @ UVM, nan, ScholarWorks @ UVM] \n", "3 [nan, Repositorio Institucional Históricas-UNA... 
\n", "4 [nan, Biblioteka Cyfrowa Diecezji Legnickiej, ... \n", "\n", " roar_oai_pmh \\\n", "0 [[http://repository.uinjkt.ac.id/oai, http://r... \n", "1 [http://arizona.openrepository.com/arizona/oai... \n", "2 [http://scholarworks.uvm.edu/do/oai/, nan, htt... \n", "3 [nan, http://ru.historicas.unam.mx/oai/request... \n", "4 [nan, http://bcdl.pl/dlibra/oai-pmh-repository... \n", "\n", " roar_sword_endpoint \\\n", "0 [http://repository.uinjkt.ac.id/sword/, nan, nan] \n", "1 [nan, nan, nan] \n", "2 [nan, nan, nan] \n", "3 [nan, nan, nan] \n", "4 [nan, nan, nan] \n", "\n", " roar_rss_feed roar_twitter_feed \\\n", "0 [nan, nan, nan] [nan, nan, nan] \n", "1 [http://arizona.openrepository.com/arizona/fee... [nan, nan, nan] \n", "2 [http://scholarworks.uvm.edu/recent.rss, nan, ... [nan, nan, nan] \n", "3 [nan, http://ru.historicas.unam.mx/feed/rss_1.... [nan, nan, nan] \n", "4 [nan, nan, nan] [nan, nan, nan] \n", "\n", " roar_description roar_fulltext \\\n", "0 [nstitutional Repository UIN Syarif Hidayatull... [TRUE, nan, FALSE] \n", "1 [The UA Campus Repository is an institutional ... [TRUE, nan, nan] \n", "2 [ScholarWorks @ UVM collects, preserves, and s... [TRUE, nan, TRUE] \n", "3 [nan, El Repositorio Institucional Históricas-... [nan, TRUE, TRUE] \n", "4 [nan, This site provides access to the digitis... [nan, nan, nan] \n", "\n", " roar_open_access roar_mandate \\\n", "0 [TRUE, nan, FALSE] [FALSE, nan, FALSE] \n", "1 [TRUE, nan, nan] [FALSE, nan, nan] \n", "2 [TRUE, nan, TRUE] [FALSE, nan, FALSE] \n", "3 [nan, TRUE, TRUE] [nan, TRUE, TRUE] \n", "4 [nan, nan, nan] [nan, nan, nan] \n", "\n", " roar_organisation_title \\\n", "0 [[UIN Syarif Hidayatullah Jakarta, Pascasarjan... \n", "1 [The University of Arizona, nan, University of... \n", "2 [University of Vermont, nan, University of Ver... \n", "3 [nan, Instituto de Investigaciones Históricas,... \n", "4 [nan, Biblioteka Wyższego Seminarium Duchowneg... 
\n", "\n", " roar_organisation_home_page roar_location_country \\\n", "0 [[http://www.uinjkt.ac.id, http://graduate.uin... [id, nan, id] \n", "1 [http://www.arizona.edu/, nan, http://www.ariz... [us, nan, us] \n", "2 [https://www.uvm.edu/, nan, http://www.uvm.edu] [us, nan, us] \n", "3 [nan, http://www.historicas.unam.mx/, http://w... [nan, mx, mx] \n", "4 [nan, http://www.biblioteka.diecezja.legnica.p... [nan, pl, pl] \n", "\n", " roar_location_city roar_location_latitude \\\n", "0 [Jakarta, nan, Jakarta] [nan, nan, 106.756] \n", "1 [Tucson, nan, nan] [nan, nan, 32.2531] \n", "2 [Burlington, VT, nan, Burington] [44.4759, nan, 44.4856] \n", "3 [nan, Ciudad de México, Ciudad de México] [nan, nan, nan] \n", "4 [nan, nan, nan] [nan, 51.207, 51.207] \n", "\n", " roar_location_longitude roar_software \\\n", "0 [nan, nan, -6.30591] [dspace, nan, dspace] \n", "1 [nan, nan, -110.948] [dspace, nan, nan] \n", "2 [-73.2121, nan, -73.2117] [bepress, nan, bepress] \n", "3 [nan, nan, nan] [nan, dspace, dspace] \n", "4 [nan, 16.1553, 16.1553] [nan, nan, nan] \n", "\n", " roar_geoname roar_version \\\n", "0 [geoname_2_ID, nan, geoname_2_ID] [other, nan, other] \n", "1 [geoname_2_US, nan, geoname_2_US] [other, nan, other] \n", "2 [geoname_2_US, nan, geoname_2_US] [other, nan, other] \n", "3 [nan, geoname_2_MX, geoname_2_MX] [nan, other, other] \n", "4 [nan, geoname_2_PL, geoname_2_PL] [nan, other, other] \n", "\n", " roar_subjects \\\n", "0 [AI, nan, [AC, Z665, Z004, Z719, BP, Q1]] \n", "1 [nan, nan, nan] \n", "2 [nan, nan, nan] \n", "3 [nan, [D1, E11, F1201, D111, D901, DP, D204, D... 
\n", "4 [nan, nan, nan] \n", "\n", " roar_date \\\n", "0 [2012-11-07 08:11:19, nan, 2013-03-04 07:20:37] \n", "1 [2014-02-25 20:17:47, nan, 2012-05-13 15:12:37] \n", "2 [2017-01-13 20:44:06, nan, 2014-07-16 21:08:43] \n", "3 [nan, 2020-02-14 18:36:03, 2020-02-14 18:36:03] \n", "4 [nan, 2012-08-26 15:12:13, 2012-09-16 15:12:16] \n", "\n", " roar_note roar_suggestions \\\n", "0 [nan, nan, nan] [nan, nan, nan] \n", "1 [nan, nan, nan] [nan, nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, ¿Quién puede depositar documentos en el ... [nan, nan, nan] \n", "4 [nan, nan, nan] [nan, nan, nan] \n", "\n", " roar_activity_low roar_activity_medium roar_activity_high roar_recordcount \\\n", "0 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "1 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, 0, 0] [nan, 0, 0] [nan, 0, 0] [nan, 20, 20] \n", "\n", " roar_recordhistory roar_fulltexts_total \\\n", "0 [nan, nan, nan] [nan, nan, nan] \n", "1 [nan, nan, nan] [nan, nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, 0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,... [nan, nan, nan] \n", "\n", " roar_fulltexts_docs roar_fulltexts_rtotal roar_fulltexts_rdocs \\\n", "0 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "1 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "\n", " roar_registry_name \\\n", "0 [[celestial, opendoar], nan, nan] \n", "1 [[celestial, opendoar], nan, opendoar] \n", "2 [celestial, nan, [celestial, opendoar]] \n", "3 [nan, nan, opendoar] \n", "4 [nan, [celestial, opendoar], [celestial, opend... 
\n", "\n", " roar_registry_id roar_submit_to \\\n", "0 [[5108, 2717, 5109], nan, nan] [nan, nan, nan] \n", "1 [[5404, http://opendoar.org/id/2468/], nan, 2468] [nan, nan, nan] \n", "2 [5654, nan, [http://opendoar.org/id/3096/, 5654]] [nan, nan, nan] \n", "3 [nan, nan, 9528] [nan, nan, nan] \n", "4 [nan, [2557, 5081], [2557, 5081]] [nan, nan, nan] \n", "\n", " roar_submitted_to_name roar_submitted_to_done roar_webometrics_rank \\\n", "0 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "1 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "\n", " roar_webometrics_size roar_webometrics_visibility \\\n", "0 [nan, nan, nan] [nan, nan, nan] \n", "1 [nan, nan, nan] [nan, nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan, nan] [nan, nan, nan] \n", "\n", " roar_webometrics_rich_files roar_webometrics_scholar roar_monthly_deposits \\\n", "0 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "1 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "\n", " roar_total_deposits roar_association \\\n", "0 [nan, nan, nan] [nan, nan, nan] \n", "1 [nan, nan, nan] [nan, nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan, nan] [nan, [russell_group, ivy_league], [russell_gr... 
\n", "4 [nan, nan, nan] [nan, nan, nan] \n", "\n", " roar_unique_id source_set \n", "0 [roar_6167, nan, roar_6580] {OpenDOAR, roar} \n", "1 [roar_7902, nan, roar_5216] {OpenDOAR, roar} \n", "2 [roar_12182, nan, roar_8677] {OpenDOAR, roar} \n", "3 [nan, roar_15805, roar_15765] {OpenDOAR, roar} \n", "4 [nan, roar_5840, roar_5915] {OpenDOAR, roar} " ] }, "execution_count": 37, "metadata": {}, "output_type": "execute_result" } ], "source": [ "dup_hybrid = dup_hybrid.groupby('dedup_id').aggregate(list).reset_index()\n", "dup_hybrid['source_set'] = dup_hybrid.source.map(set)\n", "dup_hybrid.head()" ] }, { "cell_type": "code", "execution_count": 38, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
dedup_idduplicate_idoriginal_idnamesourceunique_idFAIRsharing_idFAIRsharing_typeFAIRsharing_attributes.created-atFAIRsharing_attributes.updated-atFAIRsharing_attributes.metadata.doiFAIRsharing_attributes.metadata.nameFAIRsharing_attributes.metadata.statusFAIRsharing_attributes.metadata.contactsFAIRsharing_attributes.metadata.homepageFAIRsharing_attributes.metadata.identifierFAIRsharing_attributes.metadata.descriptionFAIRsharing_attributes.metadata.abbreviationFAIRsharing_attributes.metadata.support-linksFAIRsharing_attributes.metadata.year-creationFAIRsharing_attributes.metadata.data-processesFAIRsharing_attributes.metadata.cross-referencesFAIRsharing_attributes.legacy-idsFAIRsharing_attributes.fairsharing-registryFAIRsharing_attributes.record-typeFAIRsharing_attributes.subjectsFAIRsharing_attributes.domainsFAIRsharing_attributes.taxonomiesFAIRsharing_attributes.user-defined-tagsFAIRsharing_attributes.countriesFAIRsharing_attributes.nameFAIRsharing_attributes.abbreviationFAIRsharing_attributes.urlFAIRsharing_attributes.doiFAIRsharing_attributes.fairsharing-licenceFAIRsharing_attributes.descriptionFAIRsharing_attributes.publicationsFAIRsharing_attributes.licence-linksFAIRsharing_attributes.url-for-logoFAIRsharing_attributes.metadata.citationsFAIRsharing_attributes.metadata.associated-toolsFAIRsharing_attributes.metadata.deprecation-reasonFAIRsharing_attributes.metadata.data-access-condition.typeFAIRsharing_attributes.metadata.data-contact-informationFAIRsharing_attributes.metadata.data-deposition-condition.urlFAIRsharing_attributes.metadata.data-deposition-condition.typeFAIRsharing_attributes.metadata.deprecation-dateFAIRsharing_attributes.metadata.access-pointsFAIRsharing_attributes.metadata.data-access-condition.urlFAIRsharing_attributes.metadata.resource-sustainability.urlFAIRsharing_attributes.metadata.resource-sustainability.nameFAIRsharing_attributes.metadata.data-preservation-policy.urlFAIRsharing_attributes.metadata.data-preservation-policy.nameFAIRsharing_at
tributes.metadata.data-access-for-pre-publication-reviewFAIRsharing_attributes.metadata.data-versioningFAIRsharing_attributes.metadata.data-curation.typeFAIRsharing_attributes.metadata.data-curation.urlFAIRsharing_attributes.metadata.citation-to-related-publicationsFAIRsharing_attributes.metadata.tombstoneFAIRsharing_unique_idre3data_orgIdentifierre3data_repositoryNamere3data_repositoryName.languagere3data_additionalNamere3data_repositoryURLre3data_repositoryIdentifierre3data_repositoryContactre3data_descriptionre3data_description.languagere3data_typere3data_sizere3data_startDatere3data_endDatere3data_repositoryLanguagere3data_subjectre3data_missionStatementURLre3data_contentTypere3data_providerTypere3data_keywordre3data_institutionre3data_policyre3data_databaseAccessre3data_databaseLicensere3data_dataAccessre3data_dataLicensere3data_dataUploadTypere3data_dataUploadLicensere3data_softwarere3data_versioningre3data_apire3data_pidSystemre3data_citationGuidelineURLre3data_aidSystemre3data_enhancedPublicationre3data_qualityManagementre3data_certificatere3data_metadataStandardre3data_syndicationre3data_remarksre3data_entryDatere3data_lastUpdatere3data_unique_idOpenDOAR_system_metadata.idOpenDOAR_repository_metadata.nameOpenDOAR_repository_metadata.alternativenameOpenDOAR_repository_metadata.urlOpenDOAR_repository_metadata.descriptionOpenDOAR_repository_metadata.typeOpenDOAR_repository_metadata.content_languagesOpenDOAR_system_metadata.date_modifiedOpenDOAR_system_metadata.date_createdOpenDOAR_repository_metadata.content_subjectsOpenDOAR_repository_metadata.content_typesOpenDOAR_organizationOpenDOAR_policy_urlsOpenDOAR_repository_metadata.softwareOpenDOAR_repository_metadata.oai_urlOpenDOAR_system_metadata.publicly_visibleOpenDOAR_repository_metadata.repository_statusOpenDOAR_repository_metadata.fulltext_record_countOpenDOAR_repository_metadata.metadata_record_countOpenDOAR_unique_idroar_eprintidroar_rev_numberroar_eprint_statusroar_useridroar_importidroar_sourceroar_dirro
ar_datestamproar_lastmodroar_status_changedroar_typeroar_succeedsroar_commentaryroar_metadata_visibilityroar_latituderoar_longituderoar_relation_typeroar_relation_uriroar_item_issues_idroar_item_issues_typeroar_item_issues_descriptionroar_item_issues_timestamproar_item_issues_statusroar_item_issues_reported_byroar_item_issues_resolved_byroar_item_issues_commentroar_item_issues_countroar_sword_depositorroar_sword_slugroar_exemplarroar_home_pageroar_titleroar_oai_pmhroar_sword_endpointroar_rss_feedroar_twitter_feedroar_descriptionroar_fulltextroar_open_accessroar_mandateroar_organisation_titleroar_organisation_home_pageroar_location_countryroar_location_cityroar_location_latituderoar_location_longituderoar_softwareroar_geonameroar_versionroar_subjectsroar_dateroar_noteroar_suggestionsroar_activity_lowroar_activity_mediumroar_activity_highroar_recordcountroar_recordhistoryroar_fulltexts_totalroar_fulltexts_docsroar_fulltexts_rtotalroar_fulltexts_rdocsroar_registry_nameroar_registry_idroar_submit_toroar_submitted_to_nameroar_submitted_to_doneroar_webometrics_rankroar_webometrics_sizeroar_webometrics_visibilityroar_webometrics_rich_filesroar_webometrics_scholarroar_monthly_depositsroar_total_depositsroar_associationroar_unique_idsource_set
0dedup::001e6d882e54c780ce269d3c46997287[https://fairsharing.org/10.25504/FAIRsharing....[2094, r3d100011306][RESID Database of Protein Modifications, RESI...[FAIRsharing, re3data][FAIRsharing_2094, re3data_r3d100011306][2094, nan][fairsharing-records, nan][2014-11-04T15:23:40.000Z, nan][2021-12-06T10:49:03.952Z, nan][10.25504/FAIRsharing.qaszjp, nan][RESID Database of Protein Modifications, nan][ready, nan][[{'contact-name': 'John S Garavelli', 'contac...[http://pir.georgetown.edu/resid/, nan][2094.0, nan][The RESID Database of Protein Modifications i...[RESID, nan][[{'url': 'http://pir.georgetown.edu/resid/faq...[nan, nan][[{'url': 'ftp://ftp.pir.georgetown.edu/pir_da...[[{'url': 'https://www.re3data.org/repository/...[[biodbcore-000563, bsg-d000563], nan][Database, nan][knowledgebase, nan][[Life Science], nan][[Molecular structure, Small molecule, Structu...[[All], nan][[], nan][[United Kingdom, European Union, Switzerland]...[FAIRsharing record for: RESID Database of Pro...[RESID, nan][https://fairsharing.org/10.25504/FAIRsharing....[10.25504/FAIRsharing.qaszjp, nan][https://creativecommons.org/licenses/by-sa/4....[This FAIRsharing record describes: The RESID ...[[{'id': 334, 'pubmed_id': 12520062, 'title': ...[[{'licence-name': 'Open Data Commons (ODC) Pu...[None, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][FAIRsharing_2094, nan][nan, r3d100011306][nan, RESID Database of Protein Modifications][nan, eng][nan, []][nan, https://pir.georgetown.edu/resid/resid.s...[nan, [FAIRsharing_doi:10.25504/FAIRsharing.qa...[nan, [\"pirmail@georgetown.edu\"]][nan, The RESID Database of Protein Modificati...[nan, eng][nan, [disciplinary]][nan, {\"size\": \"\", \"updatedp\": \"\"}][nan, 2014][nan, nan][nan, [\"eng\"]][nan, [{'name': '2 Life Sciences', 'scheme': '...[nan, nan][nan, [{'name': 'Images', 'scheme': 'parse'}, 
...[nan, [dataProvider]][nan, [genomes, life sciences, proteins, prote...[nan, [{'institutionName': 'Georgetown Univers...[nan, [{\"policyName\": \"Terms of Use\", \"policyU...[nan, {\"databaseAccessType\": \"open\", \"databas...[nan, []][nan, [{\"dataAccessType\": \"open\", \"dataAccessR...[nan, [{\"dataLicenseName\": \"Copyrights\", \"data...[nan, closed][nan, []][nan, [\"unknown\"]][nan, yes][nan, {\"api\": \"ftp://ftp.pir.georgetown.edu/da...[nan, [\"none\"]][nan, nan][nan, []][nan, yes][nan, unknown][nan, []][nan, []][nan, {}][nan, RESID is covered by Thomson Reuters Data...[nan, 2014-12-05][nan, 2019-01-17][nan, re3data_r3d100011306][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan]{FAIRsharing, re3data}
1dedup::003ab6b40af9b488decea7c582d150a2[re3data::r3d100011894, https://fairsharing.or...[r3d100011894, 2315][Synapse, Synapse][re3data, FAIRsharing][re3data_r3d100011894, FAIRsharing_2315][nan, 2315][nan, fairsharing-records][nan, 2016-08-02T13:56:30.000Z][nan, 2021-12-06T10:48:25.700Z][nan, 10.25504/FAIRsharing.dnxzmk][nan, Synapse][nan, ready][nan, [{'contact-name': 'Meredith Slota', 'con...[nan, https://www.synapse.org/][nan, 2315.0][nan, Synapse is a collaborative research plat...[nan, Synapse][nan, [{'url': 'SynapseInfo@sagebase.org', 'na...[nan, 2010.0][nan, [{'url': 'https://www.synapse.org/', 'na...[nan, [{'url': 'https://www.re3data.org/reposi...[nan, [biodbcore-000791, bsg-d000791]][nan, Database][nan, repository][nan, [Data Integration, Data Management, Biom...[nan, [Experimental measurement, Protocol, Dat...[nan, [All]][nan, []][nan, [United States]][nan, FAIRsharing record for: Synapse][nan, Synapse][nan, https://fairsharing.org/10.25504/FAIRsha...[nan, 10.25504/FAIRsharing.dnxzmk][nan, https://creativecommons.org/licenses/by-...[nan, This FAIRsharing record describes: Synap...[nan, [{'id': 2450, 'pubmed_id': 24071850, 'ti...[nan, [{'licence-name': 'Creative Commons Attr...[nan, None][nan, nan][nan, [{'url': 'https://sage-bionetworks.githu...[nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, [{'url': 'http://rest-docs.synapse.org/r...[nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, FAIRsharing_2315][r3d100011894, nan][Synapse, nan][eng, nan][[], nan][https://www.synapse.org, nan][[FAIRsharing_DOI:10.25504/FAIRsharing.dnxzmk,...[[\"synapseinfo@sagebase.org\"], nan][Synapse is an open source software platform t...[eng, nan][[other], nan][{\"size\": \"\", \"updatedp\": \"\"}, nan][2012-05-22, nan][nan, nan][[\"eng\"], nan][[{'name': '2 Life Sciences', 'scheme': 'DFG'}...[https://sagebionetworks.org/tools_resources/s...[[{'name': 'Raw data', 'scheme': 'parse'}, 
{'n...[[dataProvider, serviceProvider], nan][[AMP-AD Knowledge Portal, DREAM Challenges, G...[[{'institutionName': 'Alfred P. Sloan Foundat...[[{\"policyName\": \"Synapse Commons Governance O...[ {\"databaseAccessType\": \"open\", \"databaseAcce...[[], nan][[{\"dataAccessType\": \"closed\", \"dataAccessRest...[[{\"dataLicenseName\": \"other\", \"dataLicenseURL...[restricted, nan][[], nan][[\"unknown\"], nan][yes, nan][{\"api\": \"https://docs.synapse.org/rest/\", \"ap...[[\"DOI\"], nan][nan, nan][[], nan][yes, nan][yes, nan][[], nan][[], nan][{}, nan][nan, nan][2015-12-03, nan][2021-11-16, nan][re3data_r3d100011894, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan]{FAIRsharing, re3data}
2dedup::0048f2e3aa55ab88aaaac0cfa4153ad5[opendoar::4562, roar::14673][4562, 14673][erzincan binali yıldırım university instituti...[OpenDOAR, roar][OpenDOAR_4562, roar_14673][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][4562, nan][{\"name\": \"erzincan binali y\\u0131ld\\u0131r\\u0...[[], nan][http://earsiv.erzincan.edu.tr, nan][nan, nan][institutional, nan][[], nan][2022-01-12 15:36:06, nan][2019-04-24 09:06:10, nan][[social sciences], nan][[journal_articles], nan][[{'name': 'erzincan binali yıldırım universit...[[], nan][{\"name\": \"dspace\", \"version\": \"\"}, nan][http://earsiv.erzincan.edu.tr/oai, nan][yes, nan][nan, nan][nan, nan][nan, nan][OpenDOAR_4562, nan][nan, 14673][nan, 9][nan, archive][nan, 11738][nan, nan][nan, nan][nan, disk0/00/01/46/73][nan, 2019-07-19 14:26:33][nan, 2019-07-22 08:07:03][nan, 2019-07-19 14:26:33][nan, institutional][nan, nan][nan, nan][nan, show][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, 
http://earsiv.erzincan.edu.tr][nan, Erzincan Binali Yıldırım University Inst...[nan, http://earsiv.erzincan.edu.tr/oai][nan, nan][nan, nan][nan, nan][nan, DSpace@Erzincan is a growing collection ...[nan, TRUE][nan, TRUE][nan, TRUE][nan, Erzincan Binali Yıldırım University][nan, http://www.ebyu.edu.tr][nan, tr][nan, Erzincan][nan, 39.7463][nan, 39.5149][nan, dspace][nan, geoname_2_TR][nan, other][nan, nan][nan, 2019-04-18 19:09:41][nan, DSpace@Erzincan is a growing collection ...[nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, roar_14673]{OpenDOAR, roar}
3dedup::00a35b4a2495a342f5632d18cf5985f6[opendoar::6787, roar::13960][6787, 13960][scholarly commons university of the pacific, ...[OpenDOAR, roar][OpenDOAR_6787, roar_13960][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][6787, nan][{\"name\": \"scholarly commons university of the...[[], nan][https://scholarlycommons.pacific.edu, nan][nan, nan][institutional, nan][[], nan][2022-01-12 15:36:16, nan][2019-09-28 02:20:20, nan][[science, technology, engineering, mathematic...[[journal_articles, theses_and_dissertations, ...[[{'name': 'university of the pacific', 'alter...[[], nan][{\"name\": \"digital_commons\", \"version\": \"\"}, nan][https://scholarlycommons.pacific.edu/do/oai, ...[yes, nan][nan, nan][6534.0, nan][59858.0, nan][OpenDOAR_6787, nan][nan, 13960][nan, 10][nan, archive][nan, 11103][nan, nan][nan, nan][nan, disk0/00/01/39/60][nan, 2018-10-07 12:48:04][nan, 2018-10-13 01:35:50][nan, 2018-10-07 12:48:04][nan, institutional][nan, nan][nan, nan][nan, show][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, 
nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, https://scholarlycommons.pacific.edu/][nan, Scholarly Commons - University of the Pa...[nan, https://scholarlycommons.pacific.edu/do/...[nan, nan][nan, https://scholarlycommons.pacific.edu/rec...[nan, nan][nan, Scholarly Commons is a service of the Un...[nan, TRUE][nan, TRUE][nan, FALSE][nan, University of the Pacific][nan, https://www.pacific.edu/][nan, us][nan, [Sacramento, Stockton, San Francisco]][nan, nan][nan, nan][nan, bepress][nan, geoname_2_US][nan, other][nan, nan][nan, 2018-09-05 23:09:53][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, celestial][nan, 6700][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, roar_13960]{OpenDOAR, roar}
4dedup::00a6af15fba302b272b110ac88924779[roar::755, opendoar::1285][755, 1285][KFUPM ePrints, kfupm eprints][roar, OpenDOAR][roar_755, OpenDOAR_1285][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, 1285][nan, {\"name\": \"kfupm eprints\", \"language\": \"e...[nan, []][nan, http://eprints.kfupm.edu.sa/][nan, nan][nan, institutional][nan, []][nan, 2022-01-12 15:35:13][nan, 2008-07-18 11:11:28][nan, [science, humanities, mathematics, techn...[nan, [journal_articles, conference_and_worksh...[nan, [{'name': 'king fahd university of petro...[nan, []][nan, {\"name\": \"eprints\", \"version\": \"\"}][nan, http://eprints.kfupm.edu.sa/cgi/oai2][nan, yes][nan, nan][nan, 4890.0][nan, 6221.0][nan, OpenDOAR_1285][755, nan][511, nan][archive, nan][1, nan][nan, nan][nan, nan][disk0/00/00/07/55, nan][2010-01-06 13:44:43, nan][2011-07-18 05:50:28, nan][2010-01-06 13:44:43, nan][institutional, nan][nan, nan][nan, nan][show, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][0, nan][nan, nan][nan, nan][nan, 
nan][http://eprints.kfupm.edu.sa/, nan][KFUPM ePrints, nan][http://eprints.kfupm.edu.sa/perl/oai2, nan][nan, nan][http://eprints.kfupm.edu.sa/cgi/latest_tool?o...[nan, nan][nan, nan][TRUE, nan][TRUE, nan][nan, nan][King Fahd University of Petroleum and Mineral...[http://www.kfupm.edu.sa, nan][sa, nan][ DHAHRAN, nan][17.4333, nan][43.2167, nan][eprints, nan][geoname_2_SA, nan][3.2.7, nan][nan, nan][2007-09-10 11:33:13, nan][nan, nan][nan, nan][0, nan][0, nan][0, nan][100, nan][0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,100...[nan, nan][nan, nan][nan, nan][nan, nan][[celestial, opendoar], nan][[1234, 1285], nan][nan, nan][nan, nan][nan, nan][37, nan][26, nan][69, nan][23, nan][203, nan][nan, nan][nan, nan][nan, nan][roar_755, nan]{OpenDOAR, roar}
\n", "
" ], "text/plain": [ " dedup_id \\\n", "0 dedup::001e6d882e54c780ce269d3c46997287 \n", "1 dedup::003ab6b40af9b488decea7c582d150a2 \n", "2 dedup::0048f2e3aa55ab88aaaac0cfa4153ad5 \n", "3 dedup::00a35b4a2495a342f5632d18cf5985f6 \n", "4 dedup::00a6af15fba302b272b110ac88924779 \n", "\n", " duplicate_id original_id \\\n", "0 [https://fairsharing.org/10.25504/FAIRsharing.... [2094, r3d100011306] \n", "1 [re3data::r3d100011894, https://fairsharing.or... [r3d100011894, 2315] \n", "2 [opendoar::4562, roar::14673] [4562, 14673] \n", "3 [opendoar::6787, roar::13960] [6787, 13960] \n", "4 [roar::755, opendoar::1285] [755, 1285] \n", "\n", " name source \\\n", "0 [RESID Database of Protein Modifications, RESI... [FAIRsharing, re3data] \n", "1 [Synapse, Synapse] [re3data, FAIRsharing] \n", "2 [erzincan binali yıldırım university instituti... [OpenDOAR, roar] \n", "3 [scholarly commons university of the pacific, ... [OpenDOAR, roar] \n", "4 [KFUPM ePrints, kfupm eprints] [roar, OpenDOAR] \n", "\n", " unique_id FAIRsharing_id \\\n", "0 [FAIRsharing_2094, re3data_r3d100011306] [2094, nan] \n", "1 [re3data_r3d100011894, FAIRsharing_2315] [nan, 2315] \n", "2 [OpenDOAR_4562, roar_14673] [nan, nan] \n", "3 [OpenDOAR_6787, roar_13960] [nan, nan] \n", "4 [roar_755, OpenDOAR_1285] [nan, nan] \n", "\n", " FAIRsharing_type FAIRsharing_attributes.created-at \\\n", "0 [fairsharing-records, nan] [2014-11-04T15:23:40.000Z, nan] \n", "1 [nan, fairsharing-records] [nan, 2016-08-02T13:56:30.000Z] \n", "2 [nan, nan] [nan, nan] \n", "3 [nan, nan] [nan, nan] \n", "4 [nan, nan] [nan, nan] \n", "\n", " FAIRsharing_attributes.updated-at FAIRsharing_attributes.metadata.doi \\\n", "0 [2021-12-06T10:49:03.952Z, nan] [10.25504/FAIRsharing.qaszjp, nan] \n", "1 [nan, 2021-12-06T10:48:25.700Z] [nan, 10.25504/FAIRsharing.dnxzmk] \n", "2 [nan, nan] [nan, nan] \n", "3 [nan, nan] [nan, nan] \n", "4 [nan, nan] [nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.name \\\n", "0 [RESID Database of Protein 
Modifications, nan] \n", "1 [nan, Synapse] \n", "2 [nan, nan] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.status \\\n", "0 [ready, nan] \n", "1 [nan, ready] \n", "2 [nan, nan] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.contacts \\\n", "0 [[{'contact-name': 'John S Garavelli', 'contac... \n", "1 [nan, [{'contact-name': 'Meredith Slota', 'con... \n", "2 [nan, nan] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.homepage \\\n", "0 [http://pir.georgetown.edu/resid/, nan] \n", "1 [nan, https://www.synapse.org/] \n", "2 [nan, nan] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.identifier \\\n", "0 [2094.0, nan] \n", "1 [nan, 2315.0] \n", "2 [nan, nan] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.description \\\n", "0 [The RESID Database of Protein Modifications i... \n", "1 [nan, Synapse is a collaborative research plat... \n", "2 [nan, nan] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.abbreviation \\\n", "0 [RESID, nan] \n", "1 [nan, Synapse] \n", "2 [nan, nan] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.support-links \\\n", "0 [[{'url': 'http://pir.georgetown.edu/resid/faq... \n", "1 [nan, [{'url': 'SynapseInfo@sagebase.org', 'na... \n", "2 [nan, nan] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.year-creation \\\n", "0 [nan, nan] \n", "1 [nan, 2010.0] \n", "2 [nan, nan] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.data-processes \\\n", "0 [[{'url': 'ftp://ftp.pir.georgetown.edu/pir_da... \n", "1 [nan, [{'url': 'https://www.synapse.org/', 'na... \n", "2 [nan, nan] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.cross-references \\\n", "0 [[{'url': 'https://www.re3data.org/repository/... 
\n", "1 [nan, [{'url': 'https://www.re3data.org/reposi... \n", "2 [nan, nan] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.legacy-ids \\\n", "0 [[biodbcore-000563, bsg-d000563], nan] \n", "1 [nan, [biodbcore-000791, bsg-d000791]] \n", "2 [nan, nan] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.fairsharing-registry \\\n", "0 [Database, nan] \n", "1 [nan, Database] \n", "2 [nan, nan] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.record-type \\\n", "0 [knowledgebase, nan] \n", "1 [nan, repository] \n", "2 [nan, nan] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.subjects \\\n", "0 [[Life Science], nan] \n", "1 [nan, [Data Integration, Data Management, Biom... \n", "2 [nan, nan] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.domains \\\n", "0 [[Molecular structure, Small molecule, Structu... \n", "1 [nan, [Experimental measurement, Protocol, Dat... \n", "2 [nan, nan] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.taxonomies FAIRsharing_attributes.user-defined-tags \\\n", "0 [[All], nan] [[], nan] \n", "1 [nan, [All]] [nan, []] \n", "2 [nan, nan] [nan, nan] \n", "3 [nan, nan] [nan, nan] \n", "4 [nan, nan] [nan, nan] \n", "\n", " FAIRsharing_attributes.countries \\\n", "0 [[United Kingdom, European Union, Switzerland]... \n", "1 [nan, [United States]] \n", "2 [nan, nan] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.name \\\n", "0 [FAIRsharing record for: RESID Database of Pro... \n", "1 [nan, FAIRsharing record for: Synapse] \n", "2 [nan, nan] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.abbreviation \\\n", "0 [RESID, nan] \n", "1 [nan, Synapse] \n", "2 [nan, nan] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.url \\\n", "0 [https://fairsharing.org/10.25504/FAIRsharing.... 
\n", "1 [nan, https://fairsharing.org/10.25504/FAIRsha... \n", "2 [nan, nan] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.doi \\\n", "0 [10.25504/FAIRsharing.qaszjp, nan] \n", "1 [nan, 10.25504/FAIRsharing.dnxzmk] \n", "2 [nan, nan] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.fairsharing-licence \\\n", "0 [https://creativecommons.org/licenses/by-sa/4.... \n", "1 [nan, https://creativecommons.org/licenses/by-... \n", "2 [nan, nan] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.description \\\n", "0 [This FAIRsharing record describes: The RESID ... \n", "1 [nan, This FAIRsharing record describes: Synap... \n", "2 [nan, nan] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.publications \\\n", "0 [[{'id': 334, 'pubmed_id': 12520062, 'title': ... \n", "1 [nan, [{'id': 2450, 'pubmed_id': 24071850, 'ti... \n", "2 [nan, nan] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.licence-links \\\n", "0 [[{'licence-name': 'Open Data Commons (ODC) Pu... \n", "1 [nan, [{'licence-name': 'Creative Commons Attr... \n", "2 [nan, nan] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.url-for-logo \\\n", "0 [None, nan] \n", "1 [nan, None] \n", "2 [nan, nan] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.citations \\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 [nan, nan] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.associated-tools \\\n", "0 [nan, nan] \n", "1 [nan, [{'url': 'https://sage-bionetworks.githu... 
\n", "2 [nan, nan] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.deprecation-reason \\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 [nan, nan] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.data-access-condition.type \\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 [nan, nan] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.data-contact-information \\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 [nan, nan] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.data-deposition-condition.url \\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 [nan, nan] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.data-deposition-condition.type \\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 [nan, nan] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.deprecation-date \\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 [nan, nan] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.access-points \\\n", "0 [nan, nan] \n", "1 [nan, [{'url': 'http://rest-docs.synapse.org/r... 
\n", "2 [nan, nan] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.data-access-condition.url \\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 [nan, nan] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.resource-sustainability.url \\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 [nan, nan] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.resource-sustainability.name \\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 [nan, nan] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.data-preservation-policy.url \\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 [nan, nan] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.data-preservation-policy.name \\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 [nan, nan] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.data-access-for-pre-publication-review \\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 [nan, nan] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.data-versioning \\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 [nan, nan] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.data-curation.type \\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 [nan, nan] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.data-curation.url \\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 [nan, nan] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.citation-to-related-publications \\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 [nan, nan] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.tombstone FAIRsharing_unique_id \\\n", "0 [nan, nan] [FAIRsharing_2094, nan] \n", "1 [nan, nan] [nan, FAIRsharing_2315] \n", "2 [nan, nan] [nan, nan] \n", "3 [nan, nan] [nan, nan] \n", "4 [nan, nan] [nan, nan] 
\n", "\n", " re3data_orgIdentifier re3data_repositoryName \\\n", "0 [nan, r3d100011306] [nan, RESID Database of Protein Modifications] \n", "1 [r3d100011894, nan] [Synapse, nan] \n", "2 [nan, nan] [nan, nan] \n", "3 [nan, nan] [nan, nan] \n", "4 [nan, nan] [nan, nan] \n", "\n", " re3data_repositoryName.language re3data_additionalName \\\n", "0 [nan, eng] [nan, []] \n", "1 [eng, nan] [[], nan] \n", "2 [nan, nan] [nan, nan] \n", "3 [nan, nan] [nan, nan] \n", "4 [nan, nan] [nan, nan] \n", "\n", " re3data_repositoryURL \\\n", "0 [nan, https://pir.georgetown.edu/resid/resid.s... \n", "1 [https://www.synapse.org, nan] \n", "2 [nan, nan] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " re3data_repositoryIdentifier \\\n", "0 [nan, [FAIRsharing_doi:10.25504/FAIRsharing.qa... \n", "1 [[FAIRsharing_DOI:10.25504/FAIRsharing.dnxzmk,... \n", "2 [nan, nan] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " re3data_repositoryContact \\\n", "0 [nan, [\"pirmail@georgetown.edu\"]] \n", "1 [[\"synapseinfo@sagebase.org\"], nan] \n", "2 [nan, nan] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " re3data_description \\\n", "0 [nan, The RESID Database of Protein Modificati... \n", "1 [Synapse is an open source software platform t... 
\n", "2 [nan, nan] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " re3data_description.language re3data_type \\\n", "0 [nan, eng] [nan, [disciplinary]] \n", "1 [eng, nan] [[other], nan] \n", "2 [nan, nan] [nan, nan] \n", "3 [nan, nan] [nan, nan] \n", "4 [nan, nan] [nan, nan] \n", "\n", " re3data_size re3data_startDate re3data_endDate \\\n", "0 [nan, {\"size\": \"\", \"updatedp\": \"\"}] [nan, 2014] [nan, nan] \n", "1 [{\"size\": \"\", \"updatedp\": \"\"}, nan] [2012-05-22, nan] [nan, nan] \n", "2 [nan, nan] [nan, nan] [nan, nan] \n", "3 [nan, nan] [nan, nan] [nan, nan] \n", "4 [nan, nan] [nan, nan] [nan, nan] \n", "\n", " re3data_repositoryLanguage \\\n", "0 [nan, [\"eng\"]] \n", "1 [[\"eng\"], nan] \n", "2 [nan, nan] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " re3data_subject \\\n", "0 [nan, [{'name': '2 Life Sciences', 'scheme': '... \n", "1 [[{'name': '2 Life Sciences', 'scheme': 'DFG'}... \n", "2 [nan, nan] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " re3data_missionStatementURL \\\n", "0 [nan, nan] \n", "1 [https://sagebionetworks.org/tools_resources/s... \n", "2 [nan, nan] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " re3data_contentType \\\n", "0 [nan, [{'name': 'Images', 'scheme': 'parse'}, ... \n", "1 [[{'name': 'Raw data', 'scheme': 'parse'}, {'n... \n", "2 [nan, nan] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " re3data_providerType \\\n", "0 [nan, [dataProvider]] \n", "1 [[dataProvider, serviceProvider], nan] \n", "2 [nan, nan] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " re3data_keyword \\\n", "0 [nan, [genomes, life sciences, proteins, prote... \n", "1 [[AMP-AD Knowledge Portal, DREAM Challenges, G... \n", "2 [nan, nan] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " re3data_institution \\\n", "0 [nan, [{'institutionName': 'Georgetown Univers... \n", "1 [[{'institutionName': 'Alfred P. Sloan Foundat... 
\n", "2 [nan, nan] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " re3data_policy \\\n", "0 [nan, [{\"policyName\": \"Terms of Use\", \"policyU... \n", "1 [[{\"policyName\": \"Synapse Commons Governance O... \n", "2 [nan, nan] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " re3data_databaseAccess re3data_databaseLicense \\\n", "0 [nan, {\"databaseAccessType\": \"open\", \"databas... [nan, []] \n", "1 [ {\"databaseAccessType\": \"open\", \"databaseAcce... [[], nan] \n", "2 [nan, nan] [nan, nan] \n", "3 [nan, nan] [nan, nan] \n", "4 [nan, nan] [nan, nan] \n", "\n", " re3data_dataAccess \\\n", "0 [nan, [{\"dataAccessType\": \"open\", \"dataAccessR... \n", "1 [[{\"dataAccessType\": \"closed\", \"dataAccessRest... \n", "2 [nan, nan] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " re3data_dataLicense re3data_dataUploadType \\\n", "0 [nan, [{\"dataLicenseName\": \"Copyrights\", \"data... [nan, closed] \n", "1 [[{\"dataLicenseName\": \"other\", \"dataLicenseURL... [restricted, nan] \n", "2 [nan, nan] [nan, nan] \n", "3 [nan, nan] [nan, nan] \n", "4 [nan, nan] [nan, nan] \n", "\n", " re3data_dataUploadLicense re3data_software re3data_versioning \\\n", "0 [nan, []] [nan, [\"unknown\"]] [nan, yes] \n", "1 [[], nan] [[\"unknown\"], nan] [yes, nan] \n", "2 [nan, nan] [nan, nan] [nan, nan] \n", "3 [nan, nan] [nan, nan] [nan, nan] \n", "4 [nan, nan] [nan, nan] [nan, nan] \n", "\n", " re3data_api re3data_pidSystem \\\n", "0 [nan, {\"api\": \"ftp://ftp.pir.georgetown.edu/da... [nan, [\"none\"]] \n", "1 [{\"api\": \"https://docs.synapse.org/rest/\", \"ap... 
[[\"DOI\"], nan] \n", "2 [nan, nan] [nan, nan] \n", "3 [nan, nan] [nan, nan] \n", "4 [nan, nan] [nan, nan] \n", "\n", " re3data_citationGuidelineURL re3data_aidSystem re3data_enhancedPublication \\\n", "0 [nan, nan] [nan, []] [nan, yes] \n", "1 [nan, nan] [[], nan] [yes, nan] \n", "2 [nan, nan] [nan, nan] [nan, nan] \n", "3 [nan, nan] [nan, nan] [nan, nan] \n", "4 [nan, nan] [nan, nan] [nan, nan] \n", "\n", " re3data_qualityManagement re3data_certificate re3data_metadataStandard \\\n", "0 [nan, unknown] [nan, []] [nan, []] \n", "1 [yes, nan] [[], nan] [[], nan] \n", "2 [nan, nan] [nan, nan] [nan, nan] \n", "3 [nan, nan] [nan, nan] [nan, nan] \n", "4 [nan, nan] [nan, nan] [nan, nan] \n", "\n", " re3data_syndication re3data_remarks \\\n", "0 [nan, {}] [nan, RESID is covered by Thomson Reuters Data... \n", "1 [{}, nan] [nan, nan] \n", "2 [nan, nan] [nan, nan] \n", "3 [nan, nan] [nan, nan] \n", "4 [nan, nan] [nan, nan] \n", "\n", " re3data_entryDate re3data_lastUpdate re3data_unique_id \\\n", "0 [nan, 2014-12-05] [nan, 2019-01-17] [nan, re3data_r3d100011306] \n", "1 [2015-12-03, nan] [2021-11-16, nan] [re3data_r3d100011894, nan] \n", "2 [nan, nan] [nan, nan] [nan, nan] \n", "3 [nan, nan] [nan, nan] [nan, nan] \n", "4 [nan, nan] [nan, nan] [nan, nan] \n", "\n", " OpenDOAR_system_metadata.id \\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 [4562, nan] \n", "3 [6787, nan] \n", "4 [nan, 1285] \n", "\n", " OpenDOAR_repository_metadata.name \\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 [{\"name\": \"erzincan binali y\\u0131ld\\u0131r\\u0... \n", "3 [{\"name\": \"scholarly commons university of the... \n", "4 [nan, {\"name\": \"kfupm eprints\", \"language\": \"e... 
\n", "\n", " OpenDOAR_repository_metadata.alternativename \\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 [[], nan] \n", "3 [[], nan] \n", "4 [nan, []] \n", "\n", " OpenDOAR_repository_metadata.url \\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 [http://earsiv.erzincan.edu.tr, nan] \n", "3 [https://scholarlycommons.pacific.edu, nan] \n", "4 [nan, http://eprints.kfupm.edu.sa/] \n", "\n", " OpenDOAR_repository_metadata.description OpenDOAR_repository_metadata.type \\\n", "0 [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] \n", "2 [nan, nan] [institutional, nan] \n", "3 [nan, nan] [institutional, nan] \n", "4 [nan, nan] [nan, institutional] \n", "\n", " OpenDOAR_repository_metadata.content_languages \\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 [[], nan] \n", "3 [[], nan] \n", "4 [nan, []] \n", "\n", " OpenDOAR_system_metadata.date_modified \\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 [2022-01-12 15:36:06, nan] \n", "3 [2022-01-12 15:36:16, nan] \n", "4 [nan, 2022-01-12 15:35:13] \n", "\n", " OpenDOAR_system_metadata.date_created \\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 [2019-04-24 09:06:10, nan] \n", "3 [2019-09-28 02:20:20, nan] \n", "4 [nan, 2008-07-18 11:11:28] \n", "\n", " OpenDOAR_repository_metadata.content_subjects \\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 [[social sciences], nan] \n", "3 [[science, technology, engineering, mathematic... \n", "4 [nan, [science, humanities, mathematics, techn... \n", "\n", " OpenDOAR_repository_metadata.content_types \\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 [[journal_articles], nan] \n", "3 [[journal_articles, theses_and_dissertations, ... \n", "4 [nan, [journal_articles, conference_and_worksh... \n", "\n", " OpenDOAR_organization OpenDOAR_policy_urls \\\n", "0 [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] \n", "2 [[{'name': 'erzincan binali yıldırım universit... [[], nan] \n", "3 [[{'name': 'university of the pacific', 'alter... 
[[], nan] \n", "4 [nan, [{'name': 'king fahd university of petro... [nan, []] \n", "\n", " OpenDOAR_repository_metadata.software \\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 [{\"name\": \"dspace\", \"version\": \"\"}, nan] \n", "3 [{\"name\": \"digital_commons\", \"version\": \"\"}, nan] \n", "4 [nan, {\"name\": \"eprints\", \"version\": \"\"}] \n", "\n", " OpenDOAR_repository_metadata.oai_url \\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 [http://earsiv.erzincan.edu.tr/oai, nan] \n", "3 [https://scholarlycommons.pacific.edu/do/oai, ... \n", "4 [nan, http://eprints.kfupm.edu.sa/cgi/oai2] \n", "\n", " OpenDOAR_system_metadata.publicly_visible \\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 [yes, nan] \n", "3 [yes, nan] \n", "4 [nan, yes] \n", "\n", " OpenDOAR_repository_metadata.repository_status \\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 [nan, nan] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " OpenDOAR_repository_metadata.fulltext_record_count \\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 [nan, nan] \n", "3 [6534.0, nan] \n", "4 [nan, 4890.0] \n", "\n", " OpenDOAR_repository_metadata.metadata_record_count OpenDOAR_unique_id \\\n", "0 [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] \n", "2 [nan, nan] [OpenDOAR_4562, nan] \n", "3 [59858.0, nan] [OpenDOAR_6787, nan] \n", "4 [nan, 6221.0] [nan, OpenDOAR_1285] \n", "\n", " roar_eprintid roar_rev_number roar_eprint_status roar_userid \\\n", "0 [nan, nan] [nan, nan] [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] [nan, nan] [nan, nan] \n", "2 [nan, 14673] [nan, 9] [nan, archive] [nan, 11738] \n", "3 [nan, 13960] [nan, 10] [nan, archive] [nan, 11103] \n", "4 [755, nan] [511, nan] [archive, nan] [1, nan] \n", "\n", " roar_importid roar_source roar_dir \\\n", "0 [nan, nan] [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] [nan, nan] \n", "2 [nan, nan] [nan, nan] [nan, disk0/00/01/46/73] \n", "3 [nan, nan] [nan, nan] [nan, disk0/00/01/39/60] \n", "4 [nan, nan] [nan, nan] [disk0/00/00/07/55, nan] \n", 
"\n", " roar_datestamp roar_lastmod \\\n", "0 [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] \n", "2 [nan, 2019-07-19 14:26:33] [nan, 2019-07-22 08:07:03] \n", "3 [nan, 2018-10-07 12:48:04] [nan, 2018-10-13 01:35:50] \n", "4 [2010-01-06 13:44:43, nan] [2011-07-18 05:50:28, nan] \n", "\n", " roar_status_changed roar_type roar_succeeds \\\n", "0 [nan, nan] [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] [nan, nan] \n", "2 [nan, 2019-07-19 14:26:33] [nan, institutional] [nan, nan] \n", "3 [nan, 2018-10-07 12:48:04] [nan, institutional] [nan, nan] \n", "4 [2010-01-06 13:44:43, nan] [institutional, nan] [nan, nan] \n", "\n", " roar_commentary roar_metadata_visibility roar_latitude roar_longitude \\\n", "0 [nan, nan] [nan, nan] [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] [nan, nan] [nan, nan] \n", "2 [nan, nan] [nan, show] [nan, nan] [nan, nan] \n", "3 [nan, nan] [nan, show] [nan, nan] [nan, nan] \n", "4 [nan, nan] [show, nan] [nan, nan] [nan, nan] \n", "\n", " roar_relation_type roar_relation_uri roar_item_issues_id \\\n", "0 [nan, nan] [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] [nan, nan] \n", "2 [nan, nan] [nan, nan] [nan, nan] \n", "3 [nan, nan] [nan, nan] [nan, nan] \n", "4 [nan, nan] [nan, nan] [nan, nan] \n", "\n", " roar_item_issues_type roar_item_issues_description \\\n", "0 [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] \n", "2 [nan, nan] [nan, nan] \n", "3 [nan, nan] [nan, nan] \n", "4 [nan, nan] [nan, nan] \n", "\n", " roar_item_issues_timestamp roar_item_issues_status \\\n", "0 [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] \n", "2 [nan, nan] [nan, nan] \n", "3 [nan, nan] [nan, nan] \n", "4 [nan, nan] [nan, nan] \n", "\n", " roar_item_issues_reported_by roar_item_issues_resolved_by \\\n", "0 [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] \n", "2 [nan, nan] [nan, nan] \n", "3 [nan, nan] [nan, nan] \n", "4 [nan, nan] [nan, nan] \n", "\n", " roar_item_issues_comment roar_item_issues_count roar_sword_depositor \\\n", "0 
[nan, nan] [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] [nan, nan] \n", "2 [nan, nan] [nan, nan] [nan, nan] \n", "3 [nan, nan] [nan, nan] [nan, nan] \n", "4 [nan, nan] [0, nan] [nan, nan] \n", "\n", " roar_sword_slug roar_exemplar roar_home_page \\\n", "0 [nan, nan] [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] [nan, nan] \n", "2 [nan, nan] [nan, nan] [nan, http://earsiv.erzincan.edu.tr] \n", "3 [nan, nan] [nan, nan] [nan, https://scholarlycommons.pacific.edu/] \n", "4 [nan, nan] [nan, nan] [http://eprints.kfupm.edu.sa/, nan] \n", "\n", " roar_title \\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 [nan, Erzincan Binali Yıldırım University Inst... \n", "3 [nan, Scholarly Commons - University of the Pa... \n", "4 [KFUPM ePrints, nan] \n", "\n", " roar_oai_pmh roar_sword_endpoint \\\n", "0 [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] \n", "2 [nan, http://earsiv.erzincan.edu.tr/oai] [nan, nan] \n", "3 [nan, https://scholarlycommons.pacific.edu/do/... [nan, nan] \n", "4 [http://eprints.kfupm.edu.sa/perl/oai2, nan] [nan, nan] \n", "\n", " roar_rss_feed roar_twitter_feed \\\n", "0 [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] \n", "2 [nan, nan] [nan, nan] \n", "3 [nan, https://scholarlycommons.pacific.edu/rec... [nan, nan] \n", "4 [http://eprints.kfupm.edu.sa/cgi/latest_tool?o... [nan, nan] \n", "\n", " roar_description roar_fulltext \\\n", "0 [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] \n", "2 [nan, DSpace@Erzincan is a growing collection ... [nan, TRUE] \n", "3 [nan, Scholarly Commons is a service of the Un... 
[nan, TRUE] \n", "4 [nan, nan] [TRUE, nan] \n", "\n", " roar_open_access roar_mandate \\\n", "0 [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] \n", "2 [nan, TRUE] [nan, TRUE] \n", "3 [nan, TRUE] [nan, FALSE] \n", "4 [TRUE, nan] [nan, nan] \n", "\n", " roar_organisation_title \\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 [nan, Erzincan Binali Yıldırım University] \n", "3 [nan, University of the Pacific] \n", "4 [King Fahd University of Petroleum and Mineral... \n", "\n", " roar_organisation_home_page roar_location_country \\\n", "0 [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] \n", "2 [nan, http://www.ebyu.edu.tr] [nan, tr] \n", "3 [nan, https://www.pacific.edu/] [nan, us] \n", "4 [http://www.kfupm.edu.sa, nan] [sa, nan] \n", "\n", " roar_location_city roar_location_latitude \\\n", "0 [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] \n", "2 [nan, Erzincan] [nan, 39.7463] \n", "3 [nan, [Sacramento, Stockton, San Francisco]] [nan, nan] \n", "4 [ DHAHRAN, nan] [17.4333, nan] \n", "\n", " roar_location_longitude roar_software roar_geoname roar_version \\\n", "0 [nan, nan] [nan, nan] [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] [nan, nan] [nan, nan] \n", "2 [nan, 39.5149] [nan, dspace] [nan, geoname_2_TR] [nan, other] \n", "3 [nan, nan] [nan, bepress] [nan, geoname_2_US] [nan, other] \n", "4 [43.2167, nan] [eprints, nan] [geoname_2_SA, nan] [3.2.7, nan] \n", "\n", " roar_subjects roar_date \\\n", "0 [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] \n", "2 [nan, nan] [nan, 2019-04-18 19:09:41] \n", "3 [nan, nan] [nan, 2018-09-05 23:09:53] \n", "4 [nan, nan] [2007-09-10 11:33:13, nan] \n", "\n", " roar_note roar_suggestions \\\n", "0 [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] \n", "2 [nan, DSpace@Erzincan is a growing collection ... 
[nan, nan] \n", "3 [nan, nan] [nan, nan] \n", "4 [nan, nan] [nan, nan] \n", "\n", " roar_activity_low roar_activity_medium roar_activity_high roar_recordcount \\\n", "0 [nan, nan] [nan, nan] [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] [nan, nan] [nan, nan] \n", "2 [nan, nan] [nan, nan] [nan, nan] [nan, nan] \n", "3 [nan, nan] [nan, nan] [nan, nan] [nan, nan] \n", "4 [0, nan] [0, nan] [0, nan] [100, nan] \n", "\n", " roar_recordhistory roar_fulltexts_total \\\n", "0 [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] \n", "2 [nan, nan] [nan, nan] \n", "3 [nan, nan] [nan, nan] \n", "4 [0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,100... [nan, nan] \n", "\n", " roar_fulltexts_docs roar_fulltexts_rtotal roar_fulltexts_rdocs \\\n", "0 [nan, nan] [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] [nan, nan] \n", "2 [nan, nan] [nan, nan] [nan, nan] \n", "3 [nan, nan] [nan, nan] [nan, nan] \n", "4 [nan, nan] [nan, nan] [nan, nan] \n", "\n", " roar_registry_name roar_registry_id roar_submit_to \\\n", "0 [nan, nan] [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] [nan, nan] \n", "2 [nan, nan] [nan, nan] [nan, nan] \n", "3 [nan, celestial] [nan, 6700] [nan, nan] \n", "4 [[celestial, opendoar], nan] [[1234, 1285], nan] [nan, nan] \n", "\n", " roar_submitted_to_name roar_submitted_to_done roar_webometrics_rank \\\n", "0 [nan, nan] [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] [nan, nan] \n", "2 [nan, nan] [nan, nan] [nan, nan] \n", "3 [nan, nan] [nan, nan] [nan, nan] \n", "4 [nan, nan] [nan, nan] [37, nan] \n", "\n", " roar_webometrics_size roar_webometrics_visibility \\\n", "0 [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] \n", "2 [nan, nan] [nan, nan] \n", "3 [nan, nan] [nan, nan] \n", "4 [26, nan] [69, nan] \n", "\n", " roar_webometrics_rich_files roar_webometrics_scholar roar_monthly_deposits \\\n", "0 [nan, nan] [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] [nan, nan] \n", "2 [nan, nan] [nan, nan] [nan, nan] \n", "3 [nan, nan] [nan, nan] [nan, 
def remove_nan(list_obj):
    """Return ``list_obj`` with every NaN entry dropped.

    Parameters
    ----------
    list_obj : object
        A single DataFrame cell value. Only ``list`` instances are filtered;
        anything else (strings, sets, scalars, NaN itself) is returned as is.

    Returns
    -------
    object
        A new list without NaN entries when ``list_obj`` is a list,
        otherwise ``list_obj`` unchanged.

    Notes
    -----
    * NaN is detected by value (``item != item``), not by identity with
      ``np.nan``. NaN never compares equal to anything, so a membership test
      such as ``np.nan in list_obj`` only matches the ``np.nan`` singleton and
      misses other NaN objects (``float('nan')``, ``np.float64('nan')``).
    * The input list is not mutated, so applying this element-wise to a
      DataFrame leaves the source frame untouched.
    * Nested lists are kept as single elements; they are not filtered
      recursively.
    """
    if not isinstance(list_obj, list):
        return list_obj
    return [
        item
        for item in list_obj
        # The isinstance guard keeps the self-comparison away from nested
        # lists/arrays; only float-like scalars can be NaN.
        if not (isinstance(item, (float, np.floating)) and item != item)
    ]