{ "cells": [ { "cell_type": "code", "execution_count": 1, "metadata": {}, "outputs": [], "source": [ "import ast\n", "import csv\n", "import json\n", "import glom\n", "\n", "import numpy as np\n", "import pandas as pd\n", "\n", "import matplotlib.pyplot as plt\n", "from matplotlib_venn import venn2, venn2_circles\n", "\n", "import plotly\n", "from plotly.offline import iplot, init_notebook_mode\n", "import plotly.graph_objs as go\n", "import plotly.express as px\n", "\n", "pd.set_option('display.max_columns', None)" ] }, { "cell_type": "code", "execution_count": 2, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
FAIRsharing_idFAIRsharing_typeFAIRsharing_attributes.created-atFAIRsharing_attributes.updated-atFAIRsharing_attributes.metadata.doiFAIRsharing_attributes.metadata.nameFAIRsharing_attributes.metadata.statusFAIRsharing_attributes.metadata.contactsFAIRsharing_attributes.metadata.homepageFAIRsharing_attributes.metadata.identifierFAIRsharing_attributes.metadata.descriptionFAIRsharing_attributes.metadata.support-linksFAIRsharing_attributes.metadata.year-creationFAIRsharing_attributes.metadata.data-processesFAIRsharing_attributes.legacy-idsFAIRsharing_attributes.fairsharing-registryFAIRsharing_attributes.record-typeFAIRsharing_attributes.subjectsFAIRsharing_attributes.domainsFAIRsharing_attributes.taxonomiesFAIRsharing_attributes.user-defined-tagsFAIRsharing_attributes.countriesFAIRsharing_attributes.nameFAIRsharing_attributes.abbreviationFAIRsharing_attributes.urlFAIRsharing_attributes.doiFAIRsharing_attributes.fairsharing-licenceFAIRsharing_attributes.descriptionFAIRsharing_attributes.publicationsFAIRsharing_attributes.licence-linksFAIRsharing_attributes.metadata.citationsFAIRsharing_attributes.metadata.abbreviationFAIRsharing_attributes.metadata.access-pointsFAIRsharing_attributes.metadata.associated-toolsFAIRsharing_attributes.metadata.deprecation-dateFAIRsharing_attributes.metadata.deprecation-reasonFAIRsharing_attributes.metadata.tombstoneFAIRsharing_unique_id
01723fairsharing-records2014-11-04T15:23:40.000Z2021-09-30T11:39:06.829Z10.25504/FAIRsharing.8t18teCell Image Libraryready[{'contact-name': 'David Orloff', 'contact-ema...http://www.cellimagelibrary.org1723This library is a public and easily accessible...[{'url': 'http://www.cellimagelibrary.org/page...2010.0[{'name': 'live update', 'type': 'data release...[biodbcore-000180, bsg-d000180]Databaserepository[Cell Biology, Life Science][Cell, Microscopy, Light microscopy, Electron ...[All][][United States]FAIRsharing record for: Cell Image LibraryNonehttps://fairsharing.org/10.25504/FAIRsharing.8...10.25504/FAIRsharing.8t18tehttps://creativecommons.org/licenses/by-sa/4.0...This FAIRsharing record describes: This librar...[{'id': 232, 'pubmed_id': 23203874, 'title': '...[{'licence-name': 'Cell Image Library Data Pol...NaNNaNNaNNaNNaNNaNNaNFAIRsharing_1723
13101fairsharing-records2020-09-16T08:49:13.000Z2021-09-30T11:36:45.452ZNaNWHOI Ship Data-Grabber SystemreadyNaNhttp://4dgeo.whoi.edu/shipdata/SDG_shipdata.html3101The WHOI Ship DataGrabber system provides the ...[{'url': 'http://4dgeo.whoi.edu/shipdata/SDG_o...2004.0[{'url': 'http://4dgeo.whoi.edu/sdg-bin/dv_mai...[biodbcore-001609, bsg-d001609]Databaserepository[Earth Science, Water Research, Oceanography][][Not applicable][subseafloor environments][United States]FAIRsharing record for: WHOI Ship Data-Grabber...Nonehttps://fairsharing.org/fairsharing_records/3101Nonehttps://creativecommons.org/licenses/by-sa/4.0...This FAIRsharing record describes: The WHOI Sh...[][{'licence-name': 'NDSF Data Archive Policy', ...NaNNaNNaNNaNNaNNaNNaNFAIRsharing_3101
22649fairsharing-records2018-08-07T20:23:32.000Z2021-09-30T11:39:07.898ZNaNElectron Microscope Public Image Archiveready[{'contact-name': 'General contact', 'contact-...https://www.ebi.ac.uk/pdbe/emdb/empiar/2649EMPIAR, the Electron Microscopy Public Image A...[{'url': 'https://www.ebi.ac.uk/support/EMPIAR...2015.0[{'url': 'https://www.ebi.ac.uk/pdbe/emdb/empi...[biodbcore-001140, bsg-d001140]Databaserepository[Bioinformatics, Biology][Protein image, Microscopy, Electron microscop...[All][][Greece, Czech Republic, United Kingdom, Icela...FAIRsharing record for: Electron Microscope Pu...EMPIARhttps://fairsharing.org/fairsharing_records/2649Nonehttps://creativecommons.org/licenses/by-sa/4.0...This FAIRsharing record describes: EMPIAR, the...[{'id': 2232, 'pubmed_id': 27067018, 'title': ...[{'licence-name': 'EMBL-EBI Terms of Use', 'li...[{'doi': '10.1038/nmeth.3806', 'pubmed-id': 27...EMPIAR[{'url': 'https://www.ebi.ac.uk/pdbe/emdb/empi...[{'url': 'https://www.ebi.ac.uk/pdbe/emdb/empi...NaNNaNNaNFAIRsharing_2649
32657fairsharing-records2018-08-13T15:12:11.000Z2021-09-30T11:37:28.736Z10.25504/FAIRsharing.tnByoGClinicalStudyDataRequest.comready[{'contact-email': 'support@clinicalstudydatar...https://clinicalstudydatarequest.com/2657ClinicalStudyDataRequest.com (CSDR) is a conso...[{'url': 'https://clinicalstudydatarequest.com...2014.0[{'url': 'https://clinicalstudydatarequest.com...[biodbcore-001149, bsg-d001149]Databaserepository[Preclinical Studies, Biomedical Science][][Homo sapiens][][Worldwide]FAIRsharing record for: ClinicalStudyDataReque...CSDRhttps://fairsharing.org/10.25504/FAIRsharing.t...10.25504/FAIRsharing.tnByoGhttps://creativecommons.org/licenses/by-sa/4.0...This FAIRsharing record describes: ClinicalStu...[][{'licence-name': 'CSDR Data Sharing Agreement...NaNCSDRNaNNaNNaNNaNNaNFAIRsharing_2657
42078fairsharing-records2014-11-04T15:23:40.000Z2021-09-30T11:34:43.129Z10.25504/FAIRsharing.3axym7Germplasm Resources Information Networkready[{'contact-email': 'dbmu@ars-grin.gov'}]https://www.ars-grin.gov/2078GRIN provides National Genetic Resources Progr...[{'url': 'https://www.ars-grin.gov/Pages/Colle...2010.0[{'url': 'https://www.ars-grin.gov/', 'name': ...[biodbcore-000546, bsg-d000546]Databaserepository[Life Science][Cell, Cell culture, Germplasm][Bacteria, Metazoa, Viridiplantae][][United States]FAIRsharing record for: Germplasm Resources In...GRINhttps://fairsharing.org/10.25504/FAIRsharing.3...10.25504/FAIRsharing.3axym7https://creativecommons.org/licenses/by-sa/4.0...This FAIRsharing record describes: GRIN provid...[][]NaNGRINNaNNaNNaNNaNNaNFAIRsharing_2078
\n", "
" ], "text/plain": [ " FAIRsharing_id FAIRsharing_type FAIRsharing_attributes.created-at \\\n", "0 1723 fairsharing-records 2014-11-04T15:23:40.000Z \n", "1 3101 fairsharing-records 2020-09-16T08:49:13.000Z \n", "2 2649 fairsharing-records 2018-08-07T20:23:32.000Z \n", "3 2657 fairsharing-records 2018-08-13T15:12:11.000Z \n", "4 2078 fairsharing-records 2014-11-04T15:23:40.000Z \n", "\n", " FAIRsharing_attributes.updated-at FAIRsharing_attributes.metadata.doi \\\n", "0 2021-09-30T11:39:06.829Z 10.25504/FAIRsharing.8t18te \n", "1 2021-09-30T11:36:45.452Z NaN \n", "2 2021-09-30T11:39:07.898Z NaN \n", "3 2021-09-30T11:37:28.736Z 10.25504/FAIRsharing.tnByoG \n", "4 2021-09-30T11:34:43.129Z 10.25504/FAIRsharing.3axym7 \n", "\n", " FAIRsharing_attributes.metadata.name \\\n", "0 Cell Image Library \n", "1 WHOI Ship Data-Grabber System \n", "2 Electron Microscope Public Image Archive \n", "3 ClinicalStudyDataRequest.com \n", "4 Germplasm Resources Information Network \n", "\n", " FAIRsharing_attributes.metadata.status \\\n", "0 ready \n", "1 ready \n", "2 ready \n", "3 ready \n", "4 ready \n", "\n", " FAIRsharing_attributes.metadata.contacts \\\n", "0 [{'contact-name': 'David Orloff', 'contact-ema... \n", "1 NaN \n", "2 [{'contact-name': 'General contact', 'contact-... \n", "3 [{'contact-email': 'support@clinicalstudydatar... \n", "4 [{'contact-email': 'dbmu@ars-grin.gov'}] \n", "\n", " FAIRsharing_attributes.metadata.homepage \\\n", "0 http://www.cellimagelibrary.org \n", "1 http://4dgeo.whoi.edu/shipdata/SDG_shipdata.html \n", "2 https://www.ebi.ac.uk/pdbe/emdb/empiar/ \n", "3 https://clinicalstudydatarequest.com/ \n", "4 https://www.ars-grin.gov/ \n", "\n", " FAIRsharing_attributes.metadata.identifier \\\n", "0 1723 \n", "1 3101 \n", "2 2649 \n", "3 2657 \n", "4 2078 \n", "\n", " FAIRsharing_attributes.metadata.description \\\n", "0 This library is a public and easily accessible... \n", "1 The WHOI Ship DataGrabber system provides the ... 
\n", "2 EMPIAR, the Electron Microscopy Public Image A... \n", "3 ClinicalStudyDataRequest.com (CSDR) is a conso... \n", "4 GRIN provides National Genetic Resources Progr... \n", "\n", " FAIRsharing_attributes.metadata.support-links \\\n", "0 [{'url': 'http://www.cellimagelibrary.org/page... \n", "1 [{'url': 'http://4dgeo.whoi.edu/shipdata/SDG_o... \n", "2 [{'url': 'https://www.ebi.ac.uk/support/EMPIAR... \n", "3 [{'url': 'https://clinicalstudydatarequest.com... \n", "4 [{'url': 'https://www.ars-grin.gov/Pages/Colle... \n", "\n", " FAIRsharing_attributes.metadata.year-creation \\\n", "0 2010.0 \n", "1 2004.0 \n", "2 2015.0 \n", "3 2014.0 \n", "4 2010.0 \n", "\n", " FAIRsharing_attributes.metadata.data-processes \\\n", "0 [{'name': 'live update', 'type': 'data release... \n", "1 [{'url': 'http://4dgeo.whoi.edu/sdg-bin/dv_mai... \n", "2 [{'url': 'https://www.ebi.ac.uk/pdbe/emdb/empi... \n", "3 [{'url': 'https://clinicalstudydatarequest.com... \n", "4 [{'url': 'https://www.ars-grin.gov/', 'name': ... \n", "\n", " FAIRsharing_attributes.legacy-ids \\\n", "0 [biodbcore-000180, bsg-d000180] \n", "1 [biodbcore-001609, bsg-d001609] \n", "2 [biodbcore-001140, bsg-d001140] \n", "3 [biodbcore-001149, bsg-d001149] \n", "4 [biodbcore-000546, bsg-d000546] \n", "\n", " FAIRsharing_attributes.fairsharing-registry \\\n", "0 Database \n", "1 Database \n", "2 Database \n", "3 Database \n", "4 Database \n", "\n", " FAIRsharing_attributes.record-type \\\n", "0 repository \n", "1 repository \n", "2 repository \n", "3 repository \n", "4 repository \n", "\n", " FAIRsharing_attributes.subjects \\\n", "0 [Cell Biology, Life Science] \n", "1 [Earth Science, Water Research, Oceanography] \n", "2 [Bioinformatics, Biology] \n", "3 [Preclinical Studies, Biomedical Science] \n", "4 [Life Science] \n", "\n", " FAIRsharing_attributes.domains \\\n", "0 [Cell, Microscopy, Light microscopy, Electron ... \n", "1 [] \n", "2 [Protein image, Microscopy, Electron microscop... 
\n", "3 [] \n", "4 [Cell, Cell culture, Germplasm] \n", "\n", " FAIRsharing_attributes.taxonomies \\\n", "0 [All] \n", "1 [Not applicable] \n", "2 [All] \n", "3 [Homo sapiens] \n", "4 [Bacteria, Metazoa, Viridiplantae] \n", "\n", " FAIRsharing_attributes.user-defined-tags \\\n", "0 [] \n", "1 [subseafloor environments] \n", "2 [] \n", "3 [] \n", "4 [] \n", "\n", " FAIRsharing_attributes.countries \\\n", "0 [United States] \n", "1 [United States] \n", "2 [Greece, Czech Republic, United Kingdom, Icela... \n", "3 [Worldwide] \n", "4 [United States] \n", "\n", " FAIRsharing_attributes.name \\\n", "0 FAIRsharing record for: Cell Image Library \n", "1 FAIRsharing record for: WHOI Ship Data-Grabber... \n", "2 FAIRsharing record for: Electron Microscope Pu... \n", "3 FAIRsharing record for: ClinicalStudyDataReque... \n", "4 FAIRsharing record for: Germplasm Resources In... \n", "\n", " FAIRsharing_attributes.abbreviation \\\n", "0 None \n", "1 None \n", "2 EMPIAR \n", "3 CSDR \n", "4 GRIN \n", "\n", " FAIRsharing_attributes.url \\\n", "0 https://fairsharing.org/10.25504/FAIRsharing.8... \n", "1 https://fairsharing.org/fairsharing_records/3101 \n", "2 https://fairsharing.org/fairsharing_records/2649 \n", "3 https://fairsharing.org/10.25504/FAIRsharing.t... \n", "4 https://fairsharing.org/10.25504/FAIRsharing.3... \n", "\n", " FAIRsharing_attributes.doi \\\n", "0 10.25504/FAIRsharing.8t18te \n", "1 None \n", "2 None \n", "3 10.25504/FAIRsharing.tnByoG \n", "4 10.25504/FAIRsharing.3axym7 \n", "\n", " FAIRsharing_attributes.fairsharing-licence \\\n", "0 https://creativecommons.org/licenses/by-sa/4.0... \n", "1 https://creativecommons.org/licenses/by-sa/4.0... \n", "2 https://creativecommons.org/licenses/by-sa/4.0... \n", "3 https://creativecommons.org/licenses/by-sa/4.0... \n", "4 https://creativecommons.org/licenses/by-sa/4.0... \n", "\n", " FAIRsharing_attributes.description \\\n", "0 This FAIRsharing record describes: This librar... 
\n", "1 This FAIRsharing record describes: The WHOI Sh... \n", "2 This FAIRsharing record describes: EMPIAR, the... \n", "3 This FAIRsharing record describes: ClinicalStu... \n", "4 This FAIRsharing record describes: GRIN provid... \n", "\n", " FAIRsharing_attributes.publications \\\n", "0 [{'id': 232, 'pubmed_id': 23203874, 'title': '... \n", "1 [] \n", "2 [{'id': 2232, 'pubmed_id': 27067018, 'title': ... \n", "3 [] \n", "4 [] \n", "\n", " FAIRsharing_attributes.licence-links \\\n", "0 [{'licence-name': 'Cell Image Library Data Pol... \n", "1 [{'licence-name': 'NDSF Data Archive Policy', ... \n", "2 [{'licence-name': 'EMBL-EBI Terms of Use', 'li... \n", "3 [{'licence-name': 'CSDR Data Sharing Agreement... \n", "4 [] \n", "\n", " FAIRsharing_attributes.metadata.citations \\\n", "0 NaN \n", "1 NaN \n", "2 [{'doi': '10.1038/nmeth.3806', 'pubmed-id': 27... \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.abbreviation \\\n", "0 NaN \n", "1 NaN \n", "2 EMPIAR \n", "3 CSDR \n", "4 GRIN \n", "\n", " FAIRsharing_attributes.metadata.access-points \\\n", "0 NaN \n", "1 NaN \n", "2 [{'url': 'https://www.ebi.ac.uk/pdbe/emdb/empi... \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.associated-tools \\\n", "0 NaN \n", "1 NaN \n", "2 [{'url': 'https://www.ebi.ac.uk/pdbe/emdb/empi... 
\n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.deprecation-date \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.deprecation-reason \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.tombstone FAIRsharing_unique_id \n", "0 NaN FAIRsharing_1723 \n", "1 NaN FAIRsharing_3101 \n", "2 NaN FAIRsharing_2649 \n", "3 NaN FAIRsharing_2657 \n", "4 NaN FAIRsharing_2078 " ] }, "execution_count": 2, "metadata": {}, "output_type": "execute_result" } ], "source": [ "# The dump holds one JSON record per line; the raw lines stay available as `lines`.\n", "# The encoding is explicit so decoding does not depend on the platform's locale default.\n", "with open('../data/raw/fairsharing_dump_api_09_2021.json', encoding='utf-8') as f:\n", "    lines = f.read().splitlines()\n", "\n", "# Decode each record exactly once; blank lines are skipped rather than handed to json.loads.\n", "fairsharing_df = pd.json_normalize([json.loads(line) for line in lines if line.strip()])\n", "\n", "# Build a registry-qualified identifier, then namespace every column with the registry name.\n", "fairsharing_df['unique_id'] = 'FAIRsharing_' + fairsharing_df['id']\n", "fairsharing_df = fairsharing_df.add_prefix('FAIRsharing_')\n", "fairsharing_df.head()" ] }, { "cell_type": "code", "execution_count": 3, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
re3data_OpenAIREIDre3data_orgIdentifierre3data_repositoryNamere3data_additionalNamere3data_repositoryURLre3data_repositoryIdentifierre3data_descriptionre3data_typere3data_sizere3data_updateDatere3data_startDatere3data_endDatere3data_subjectre3data_missionStatementre3data_contentTypere3data_providerTypere3data_keywordre3data_institutionre3data_policyre3data_databaseAccessre3data_databaseLicensere3data_dataAccessre3data_dataLicensere3data_dataUploadre3data_dataUploadLicensere3data_softwarere3data_versioningre3data_apire3data_pidSystemre3data_citationGuidelineURLre3data_aidSystemre3data_enhancedPublicationre3data_qualityManagementre3data_certificatere3data_metadataStandardre3data_syndicationre3data_remarksre3data_entryDatere3data_lastUpdatere3data_unique_id
0re3data_____::91780fe96da5ba32f804e43359c154bar3d100000001Odum Institute Archive Dataverse[]https://dataverse.unc.edu/dataverse/odum[]The Odum Institute Archive Dataverse contains ...[disciplinary]13 dataverses; 3.050 datasets2020-12-04NaNNaN[1 Humanities and Social Sciences, 111 Social ...False[Databases, Plain text, Scientific and statist...[dataProvider][FAIR, Middle East, crime, demography, economy...[[Odum Institute for Research in Social Scienc...TruetrueTrueTrueTrueTrueFalseTrueNaNFalseTrueTrueTrueunknownyesTrueTrueFalseOdum Dataverse is covered by Thomson Reuters D...2013-06-102021-07-06re3data_r3d100000001
1re3data_____::cc3ea05c863cd49af75f7f54e0e86f09r3d100000002Access to Archival Databases[AAD]https://aad.archives.gov/aad/[RRID:SCR_010479, RRID:nlx_157752]You will find in the Access to Archival Databa...[disciplinary]NaNNaN1985NaN[1 Humanities and Social Sciences, 102 History...True[Images, Standard office documents, Structured...[dataProvider][US History][[The U.S. National Archives and Records Admin...TruetrueFalseTrueTrueTrueFalseTruenoTrueTrueTrueTrueunknownunknownFalseFalseTrueNaN2012-07-042021-05-25re3data_r3d100000002
2re3data_____::a2f73fbe91311f4356d0d7957c441773r3d100000004Datenbank Gesprochenes Deutsch[DGD, DGD2 (formerly), Database for Spoken Ger...https://dgd.ids-mannheim.de/[]The \"Database for Spoken German (DGD)\" is a co...[disciplinary]34 corpora2020-02-032012NaN[1 Humanities and Social Sciences, 104 Linguis...True[Audiovisual data, Standard office documents, ...[dataProvider, serviceProvider][Australian German, FOLK, German dialects, Pfe...[[Institut für Deutsche Sprache, Archiv für Ge...TruetrueFalseTrueTrueTrueFalseTrueyesFalseTrueTrueTrueunknownunknownTrueFalseFalseNaN2012-07-202020-08-27re3data_r3d100000004
3re3data_____::0394b97eb11f19785cbca1ec830429dar3d100000005UNC Dataverse[University of North Carolina Dataverse]https://dataverse.unc.edu/[]UNC Dataverse is an open-source repository sof...[institutional]186 dataverses; 25.272 studies; 229.442 files2020-11-302011NaN[1 Humanities and Social Sciences, 111 Social ...True[Archived data, Plain text, Raw data, Scientif...[dataProvider, serviceProvider][FAIR, census, demographic survey, demography,...[[Odum Institute for Research in Social Scienc...TruetrueFalseTrueTrueTrueTrueTrueyesTrueTrueTrueTrueunknownyesFalseTrueFalseUNC Dataverse is covered by Clarivate Data Cit...2012-07-232021-08-11re3data_r3d100000005
4re3data_____::a48f09c562b247a9919acfe195549b47r3d100000006Archaeology Data Service[ADS]https://archaeologydataservice.ac.uk/[FAIRsharing_doi:10.25504/FAIRsharing.hm1mfg]The ADS is an accredited digital repository fo...[disciplinary]1837 results2020-05-201996-10-01NaN[1 Humanities and Social Sciences, 101 Ancient...True[Archived data, Audiovisual data, Databases, I...[dataProvider, serviceProvider][FAIR, archaeology, cultural heritage, prehist...[[Arts and Humanities Research Council, [AHRC]...TruetrueTrueTrueTrueTrueTrueTrueyesTrueTrueTrueTrueunknownyesTrueTrueTrueADS is covered by Clarivate Data Citation Inde...2012-07-232021-09-02re3data_r3d100000006
\n", "
" ], "text/plain": [ " re3data_OpenAIREID re3data_orgIdentifier \\\n", "0 re3data_____::91780fe96da5ba32f804e43359c154ba r3d100000001 \n", "1 re3data_____::cc3ea05c863cd49af75f7f54e0e86f09 r3d100000002 \n", "2 re3data_____::a2f73fbe91311f4356d0d7957c441773 r3d100000004 \n", "3 re3data_____::0394b97eb11f19785cbca1ec830429da r3d100000005 \n", "4 re3data_____::a48f09c562b247a9919acfe195549b47 r3d100000006 \n", "\n", " re3data_repositoryName \\\n", "0 Odum Institute Archive Dataverse \n", "1 Access to Archival Databases \n", "2 Datenbank Gesprochenes Deutsch \n", "3 UNC Dataverse \n", "4 Archaeology Data Service \n", "\n", " re3data_additionalName \\\n", "0 [] \n", "1 [AAD] \n", "2 [DGD, DGD2 (formerly), Database for Spoken Ger... \n", "3 [University of North Carolina Dataverse] \n", "4 [ADS] \n", "\n", " re3data_repositoryURL \\\n", "0 https://dataverse.unc.edu/dataverse/odum \n", "1 https://aad.archives.gov/aad/ \n", "2 https://dgd.ids-mannheim.de/ \n", "3 https://dataverse.unc.edu/ \n", "4 https://archaeologydataservice.ac.uk/ \n", "\n", " re3data_repositoryIdentifier \\\n", "0 [] \n", "1 [RRID:SCR_010479, RRID:nlx_157752] \n", "2 [] \n", "3 [] \n", "4 [FAIRsharing_doi:10.25504/FAIRsharing.hm1mfg] \n", "\n", " re3data_description re3data_type \\\n", "0 The Odum Institute Archive Dataverse contains ... [disciplinary] \n", "1 You will find in the Access to Archival Databa... [disciplinary] \n", "2 The \"Database for Spoken German (DGD)\" is a co... [disciplinary] \n", "3 UNC Dataverse is an open-source repository sof... [institutional] \n", "4 The ADS is an accredited digital repository fo... 
[disciplinary] \n", "\n", " re3data_size re3data_updateDate \\\n", "0 13 dataverses; 3.050 datasets 2020-12-04 \n", "1 NaN NaN \n", "2 34 corpora 2020-02-03 \n", "3 186 dataverses; 25.272 studies; 229.442 files 2020-11-30 \n", "4 1837 results 2020-05-20 \n", "\n", " re3data_startDate re3data_endDate \\\n", "0 NaN NaN \n", "1 1985 NaN \n", "2 2012 NaN \n", "3 2011 NaN \n", "4 1996-10-01 NaN \n", "\n", " re3data_subject \\\n", "0 [1 Humanities and Social Sciences, 111 Social ... \n", "1 [1 Humanities and Social Sciences, 102 History... \n", "2 [1 Humanities and Social Sciences, 104 Linguis... \n", "3 [1 Humanities and Social Sciences, 111 Social ... \n", "4 [1 Humanities and Social Sciences, 101 Ancient... \n", "\n", " re3data_missionStatement \\\n", "0 False \n", "1 True \n", "2 True \n", "3 True \n", "4 True \n", "\n", " re3data_contentType \\\n", "0 [Databases, Plain text, Scientific and statist... \n", "1 [Images, Standard office documents, Structured... \n", "2 [Audiovisual data, Standard office documents, ... \n", "3 [Archived data, Plain text, Raw data, Scientif... \n", "4 [Archived data, Audiovisual data, Databases, I... \n", "\n", " re3data_providerType \\\n", "0 [dataProvider] \n", "1 [dataProvider] \n", "2 [dataProvider, serviceProvider] \n", "3 [dataProvider, serviceProvider] \n", "4 [dataProvider, serviceProvider] \n", "\n", " re3data_keyword \\\n", "0 [FAIR, Middle East, crime, demography, economy... \n", "1 [US History] \n", "2 [Australian German, FOLK, German dialects, Pfe... \n", "3 [FAIR, census, demographic survey, demography,... \n", "4 [FAIR, archaeology, cultural heritage, prehist... \n", "\n", " re3data_institution re3data_policy \\\n", "0 [[Odum Institute for Research in Social Scienc... True \n", "1 [[The U.S. National Archives and Records Admin... True \n", "2 [[Institut für Deutsche Sprache, Archiv für Ge... True \n", "3 [[Odum Institute for Research in Social Scienc... True \n", "4 [[Arts and Humanities Research Council, [AHRC]... 
True \n", "\n", " re3data_databaseAccess re3data_databaseLicense re3data_dataAccess \\\n", "0 true True True \n", "1 true False True \n", "2 true False True \n", "3 true False True \n", "4 true True True \n", "\n", " re3data_dataLicense re3data_dataUpload re3data_dataUploadLicense \\\n", "0 True True False \n", "1 True True False \n", "2 True True False \n", "3 True True True \n", "4 True True True \n", "\n", " re3data_software re3data_versioning re3data_api re3data_pidSystem \\\n", "0 True NaN False True \n", "1 True no True True \n", "2 True yes False True \n", "3 True yes True True \n", "4 True yes True True \n", "\n", " re3data_citationGuidelineURL re3data_aidSystem \\\n", "0 True True \n", "1 True True \n", "2 True True \n", "3 True True \n", "4 True True \n", "\n", " re3data_enhancedPublication re3data_qualityManagement re3data_certificate \\\n", "0 unknown yes True \n", "1 unknown unknown False \n", "2 unknown unknown True \n", "3 unknown yes False \n", "4 unknown yes True \n", "\n", " re3data_metadataStandard re3data_syndication \\\n", "0 True False \n", "1 False True \n", "2 False False \n", "3 True False \n", "4 True True \n", "\n", " re3data_remarks re3data_entryDate \\\n", "0 Odum Dataverse is covered by Thomson Reuters D... 2013-06-10 \n", "1 NaN 2012-07-04 \n", "2 NaN 2012-07-20 \n", "3 UNC Dataverse is covered by Clarivate Data Cit... 2012-07-23 \n", "4 ADS is covered by Clarivate Data Citation Inde... 
2012-07-23 \n", "\n", " re3data_lastUpdate re3data_unique_id \n", "0 2021-07-06 re3data_r3d100000001 \n", "1 2021-05-25 re3data_r3d100000002 \n", "2 2020-08-27 re3data_r3d100000004 \n", "3 2021-08-11 re3data_r3d100000005 \n", "4 2021-09-02 re3data_r3d100000006 " ] }, "execution_count": 3, "metadata": {}, "output_type": "execute_result" } ], "source": [ "# Read the tab-separated re3data export; the listed columns are run through\n", "# ast.literal_eval while the file is parsed.\n", "re3data_df = pd.read_csv(\n", "    '../data/raw/re3data.tsv',\n", "    sep='\\t',\n", "    converters={\n", "        column: ast.literal_eval\n", "        for column in ('subject', 'keyword', 'additionalName', 'repositoryIdentifier',\n", "                       'type', 'contentType', 'providerType', 'institution')\n", "    },\n", ")\n", "\n", "# Build a registry-qualified identifier, then namespace every column with the registry name.\n", "re3data_df['unique_id'] = 're3data_' + re3data_df['orgIdentifier']\n", "re3data_df = re3data_df.add_prefix('re3data_')\n", "re3data_df.head()" ] }, { "cell_type": "code", "execution_count": 4, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
OpenDOAR_OpenAIREIDOpenDOAR_orgIdentifierOpenDOAR_repositoryNameOpenDOAR_alternativeNamesOpenDOAR_repositoryURLOpenDOAR_descriptionOpenDOAR_typeOpenDOAR_updateDateOpenDOAR_startDateOpenDOAR_subjectOpenDOAR_contentTypeOpenDOAR_institutionOpenDOAR_metadataPolicyOpenDOAR_dataPolicyOpenDOAR_submissionPolicyOpenDOAR_contentPolicyOpenDOAR_softwareOpenDOAR_apiOpenDOAR_unique_id
0opendoar____::82161242827b703e6acf9c726942a1e4175hku theses online[]http://hub.hku.hk/handle/10722/1057this is an institutional repository providing ...institutional2021-03-25 10:16:182005-12-21 12:44:08[multidisciplinary][bibliographic_references, theses_and_disserta...[[university of hong kong, [香港大學, hku], cn, ht...FalseFalseFalseFalsedspace cris-5.3.1-snapshotfalseOpenDOAR_175
1opendoar____::ea5d2f1c4608232e07d3aa3d998e513564research support scheme - central european uni...[]http://rss.archives.ceu.hu/this is an institutional repository collecting...institutional2021-03-25 09:48:312006-01-04 14:59:30[multidisciplinary][unpub_reports_and_working_papers][[central european university, [ceu], hu, http...FalseFalseFalseFalseeprints 2.2.1trueOpenDOAR_64
2opendoar____::a8f15eda80c50adb0e71943adc8015cf151cadmus, eui research repository[]http://cadmus.eui.eu/cadmus is the name of the eui research reposit...institutional2021-09-13 13:35:362006-01-04 12:07:07[history and archaeology, multidisciplinary, s...[journal_articles, theses_and_dissertations, u...[[european university institute, [eui], it, ht...FalseFalseFalseFalsedspace 5.2trueOpenDOAR_151
3opendoar____::65b9eea6e1cc6bb9f0cd2a47751a186f105document server@uhasselt[]https://doclib.uhasselt.be/dspace/this site is a university repository providing...institutional2021-04-16 15:23:522006-01-24 15:46:44[multidisciplinary][journal_articles, conference_and_workshop_pap...[[hasselt university, [universiteit hasselt, u...FalseFalseFalseFalsedspace 1.7.2trueOpenDOAR_105
4opendoar____::38b3eff8baf56627478ec76a704e9b52101utrecht university repository[]http://dspace.library.uu.nlthis site is a university repository providing...institutional2021-04-16 15:22:032006-01-13 12:55:13[multidisciplinary][journal_articles, conference_and_workshop_pap...[[university of utrecht, [universiteit utrecht...FalseFalseFalseFalsedspacetrueOpenDOAR_101
\n", "
" ], "text/plain": [ " OpenDOAR_OpenAIREID OpenDOAR_orgIdentifier \\\n", "0 opendoar____::82161242827b703e6acf9c726942a1e4 175 \n", "1 opendoar____::ea5d2f1c4608232e07d3aa3d998e5135 64 \n", "2 opendoar____::a8f15eda80c50adb0e71943adc8015cf 151 \n", "3 opendoar____::65b9eea6e1cc6bb9f0cd2a47751a186f 105 \n", "4 opendoar____::38b3eff8baf56627478ec76a704e9b52 101 \n", "\n", " OpenDOAR_repositoryName \\\n", "0 hku theses online \n", "1 research support scheme - central european uni... \n", "2 cadmus, eui research repository \n", "3 document server@uhasselt \n", "4 utrecht university repository \n", "\n", " OpenDOAR_alternativeNames OpenDOAR_repositoryURL \\\n", "0 [] http://hub.hku.hk/handle/10722/1057 \n", "1 [] http://rss.archives.ceu.hu/ \n", "2 [] http://cadmus.eui.eu/ \n", "3 [] https://doclib.uhasselt.be/dspace/ \n", "4 [] http://dspace.library.uu.nl \n", "\n", " OpenDOAR_description OpenDOAR_type \\\n", "0 this is an institutional repository providing ... institutional \n", "1 this is an institutional repository collecting... institutional \n", "2 cadmus is the name of the eui research reposit... institutional \n", "3 this site is a university repository providing... institutional \n", "4 this site is a university repository providing... institutional \n", "\n", " OpenDOAR_updateDate OpenDOAR_startDate \\\n", "0 2021-03-25 10:16:18 2005-12-21 12:44:08 \n", "1 2021-03-25 09:48:31 2006-01-04 14:59:30 \n", "2 2021-09-13 13:35:36 2006-01-04 12:07:07 \n", "3 2021-04-16 15:23:52 2006-01-24 15:46:44 \n", "4 2021-04-16 15:22:03 2006-01-13 12:55:13 \n", "\n", " OpenDOAR_subject \\\n", "0 [multidisciplinary] \n", "1 [multidisciplinary] \n", "2 [history and archaeology, multidisciplinary, s... \n", "3 [multidisciplinary] \n", "4 [multidisciplinary] \n", "\n", " OpenDOAR_contentType \\\n", "0 [bibliographic_references, theses_and_disserta... \n", "1 [unpub_reports_and_working_papers] \n", "2 [journal_articles, theses_and_dissertations, u... 
\n", "3 [journal_articles, conference_and_workshop_pap... \n", "4 [journal_articles, conference_and_workshop_pap... \n", "\n", " OpenDOAR_institution OpenDOAR_metadataPolicy \\\n", "0 [[university of hong kong, [香港大學, hku], cn, ht... False \n", "1 [[central european university, [ceu], hu, http... False \n", "2 [[european university institute, [eui], it, ht... False \n", "3 [[hasselt university, [universiteit hasselt, u... False \n", "4 [[university of utrecht, [universiteit utrecht... False \n", "\n", " OpenDOAR_dataPolicy OpenDOAR_submissionPolicy OpenDOAR_contentPolicy \\\n", "0 False False False \n", "1 False False False \n", "2 False False False \n", "3 False False False \n", "4 False False False \n", "\n", " OpenDOAR_software OpenDOAR_api OpenDOAR_unique_id \n", "0 dspace cris-5.3.1-snapshot false OpenDOAR_175 \n", "1 eprints 2.2.1 true OpenDOAR_64 \n", "2 dspace 5.2 true OpenDOAR_151 \n", "3 dspace 1.7.2 true OpenDOAR_105 \n", "4 dspace true OpenDOAR_101 " ] }, "execution_count": 4, "metadata": {}, "output_type": "execute_result" } ], "source": [ "# Load the OpenDOAR export (TSV). Four columns are parsed with ast.literal_eval,\n", "# and orgIdentifier is kept as a string so it can be concatenated into unique_id.\n", "opendoar_df = (\n", "    pd.read_csv(\n", "        '../data/raw/openDoar.tsv',\n", "        sep='\\t',\n", "        converters=dict.fromkeys(\n", "            ['subject', 'alternativeNames', 'contentType', 'institution'],\n", "            ast.literal_eval,\n", "        ),\n", "        dtype={'orgIdentifier': str},\n", "    )\n", "    .assign(unique_id=lambda frame: 'OpenDOAR_' + frame['orgIdentifier'])\n", "    .add_prefix('OpenDOAR_')\n", ")\n", "opendoar_df.head()" ] }, { "cell_type": "code", "execution_count": 5, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
roar_eprintidroar_rev_numberroar_eprint_statusroar_useridroar_importidroar_sourceroar_dirroar_datestamproar_lastmodroar_status_changedroar_typeroar_succeedsroar_commentaryroar_metadata_visibilityroar_latituderoar_longituderoar_relation_typeroar_relation_uriroar_item_issues_idroar_item_issues_typeroar_item_issues_descriptionroar_item_issues_timestamproar_item_issues_statusroar_item_issues_reported_byroar_item_issues_resolved_byroar_item_issues_commentroar_item_issues_countroar_sword_depositorroar_sword_slugroar_exemplarroar_home_pageroar_titleroar_oai_pmhroar_sword_endpointroar_rss_feedroar_twitter_feedroar_descriptionroar_fulltextroar_open_accessroar_mandateroar_organisation_titleroar_organisation_home_pageroar_location_countryroar_location_cityroar_location_latituderoar_location_longituderoar_softwareroar_geonameroar_versionroar_subjectsroar_dateroar_noteroar_suggestionsroar_activity_lowroar_activity_mediumroar_activity_highroar_recordcountroar_recordhistoryroar_fulltexts_totalroar_fulltexts_docsroar_fulltexts_rtotalroar_fulltexts_rdocsroar_registry_nameroar_registry_idroar_submit_toroar_submitted_to_nameroar_submitted_to_doneroar_webometrics_rankroar_webometrics_sizeroar_webometrics_visibilityroar_webometrics_rich_filesroar_webometrics_scholarroar_monthly_depositsroar_total_depositsroar_associationroar_unique_id
01633archive1NaNNaNdisk0/00/00/00/012010-01-06 13:43:482011-07-18 05:40:072010-01-06 13:43:48subjectNaNNaNshowNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaN0NaNNaNNaNhttp://archivesic.ccsd.cnrs.fr/@RCHIVESIChttp://archivesic.ccsd.cnrs.fr/oai/oai.phpNaNNaNNaNNaNNaNNaNNaNNaNNaNfrNaNNaNNaNhalgeoname_2_FRotherNaN2002-05-17 19:24:41NaNNaN000250,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,...NaNNaNNaNNaN[opendoar, celestial][669, 58]NaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNroar_1
110511archive1NaNNaNdisk0/00/00/00/102010-01-06 13:43:482011-07-18 05:40:132010-01-06 13:43:48institutionalNaNNaNshowNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaN0NaNNaNNaNhttp://www.diva-portal.org/mdh/Academic Archive On-line (Mälardalen Universit...http://www.diva-portal.org/oai/mdh/OAINaNNaNNaNNaNTRUETRUENaNNaNNaNseUppsala59.866717.6333divageoname_2_SEotherNaN2005-12-08 13:15:22NaNNaN0001000,0,0,0,0,0,0,0,0,0,0,0,0,0,2,8,39,100,100,100...NaNNaNNaNNaN[opendoar, celestial][526, 258]NaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNroar_10
21000274archive1NaNNaNdisk0/00/00/10/002010-01-06 13:45:012011-07-06 08:21:212010-01-06 13:45:01subjectNaNNaNshowNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaN0NaNNaNNaNhttp://pam.pisharp.org/PAM - Portuguese Archive of MathematicsNaNNaNNaNNaNNaNTRUETRUENaNNaNNaNptBellevue, WA47.6034-122.155dspacegeoname_2_PTotherNaN2006-05-04 10:48:14NaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNroar_1000
31000120archive91NaNNaNdisk0/00/01/00/012015-08-08 14:52:112016-03-21 19:44:012015-08-08 14:52:11subjectNaNNaNshowNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNhttp://edoc.sub.uni-hamburg.de/klimawandel/Klimawandel Dokumentenserverhttp://edoc.sub.uni-hamburg.de/klimawandel/oaiNaNNaNNaNThe \"Documentenserver Klimawandel\" (Repository...TRUETRUETRUE[Helmholtz-Zentrum Geesthacht, Climate Service...[http://www.climateservicecenter.de/, http://w...deHamburg53.55119.9937opusgeoname_2_DEother[GE, S1, G1, HD, GF]2015-07-02 08:08:31NaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaN[opendoar, celestial][5881, 3408]NaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNroar_10001
41000811archive404NaNNaNdisk0/00/01/00/082015-08-08 14:52:262016-03-21 19:43:512015-08-08 14:52:26institutionalNaNNaNshowNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNhttp://creativematter.skidmore.edu/Creative Matter | Skidmore College Researchhttp://creativematter.skidmore.edu/do/oai/NaNhttp://creativematter.skidmore.edu/recent.rssNaNWelcome to Creative Matter, a repository for t...TRUEFALSEFALSESkidmore Collegehttp://www.skidmore.edu/usSaratoga Springs43.0961-73.7818bepressgeoname_2_USotherNaN2015-07-06 17:35:50NaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNcelestial5882NaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNroar_10008
\n", "
" ], "text/plain": [ " roar_eprintid roar_rev_number roar_eprint_status roar_userid roar_importid \\\n", "0 1 633 archive 1 NaN \n", "1 10 511 archive 1 NaN \n", "2 1000 274 archive 1 NaN \n", "3 10001 20 archive 91 NaN \n", "4 10008 11 archive 404 NaN \n", "\n", " roar_source roar_dir roar_datestamp roar_lastmod \\\n", "0 NaN disk0/00/00/00/01 2010-01-06 13:43:48 2011-07-18 05:40:07 \n", "1 NaN disk0/00/00/00/10 2010-01-06 13:43:48 2011-07-18 05:40:13 \n", "2 NaN disk0/00/00/10/00 2010-01-06 13:45:01 2011-07-06 08:21:21 \n", "3 NaN disk0/00/01/00/01 2015-08-08 14:52:11 2016-03-21 19:44:01 \n", "4 NaN disk0/00/01/00/08 2015-08-08 14:52:26 2016-03-21 19:43:51 \n", "\n", " roar_status_changed roar_type roar_succeeds roar_commentary \\\n", "0 2010-01-06 13:43:48 subject NaN NaN \n", "1 2010-01-06 13:43:48 institutional NaN NaN \n", "2 2010-01-06 13:45:01 subject NaN NaN \n", "3 2015-08-08 14:52:11 subject NaN NaN \n", "4 2015-08-08 14:52:26 institutional NaN NaN \n", "\n", " roar_metadata_visibility roar_latitude roar_longitude roar_relation_type \\\n", "0 show NaN NaN NaN \n", "1 show NaN NaN NaN \n", "2 show NaN NaN NaN \n", "3 show NaN NaN NaN \n", "4 show NaN NaN NaN \n", "\n", " roar_relation_uri roar_item_issues_id roar_item_issues_type \\\n", "0 NaN NaN NaN \n", "1 NaN NaN NaN \n", "2 NaN NaN NaN \n", "3 NaN NaN NaN \n", "4 NaN NaN NaN \n", "\n", " roar_item_issues_description roar_item_issues_timestamp \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " roar_item_issues_status roar_item_issues_reported_by \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " roar_item_issues_resolved_by roar_item_issues_comment \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " roar_item_issues_count roar_sword_depositor roar_sword_slug roar_exemplar \\\n", "0 0 NaN NaN NaN \n", "1 0 NaN NaN NaN \n", "2 0 NaN NaN NaN \n", "3 NaN NaN NaN NaN \n", "4 
NaN NaN NaN NaN \n", "\n", " roar_home_page \\\n", "0 http://archivesic.ccsd.cnrs.fr/ \n", "1 http://www.diva-portal.org/mdh/ \n", "2 http://pam.pisharp.org/ \n", "3 http://edoc.sub.uni-hamburg.de/klimawandel/ \n", "4 http://creativematter.skidmore.edu/ \n", "\n", " roar_title \\\n", "0 @RCHIVESIC \n", "1 Academic Archive On-line (Mälardalen Universit... \n", "2 PAM - Portuguese Archive of Mathematics \n", "3 Klimawandel Dokumentenserver \n", "4 Creative Matter | Skidmore College Research \n", "\n", " roar_oai_pmh roar_sword_endpoint \\\n", "0 http://archivesic.ccsd.cnrs.fr/oai/oai.php NaN \n", "1 http://www.diva-portal.org/oai/mdh/OAI NaN \n", "2 NaN NaN \n", "3 http://edoc.sub.uni-hamburg.de/klimawandel/oai NaN \n", "4 http://creativematter.skidmore.edu/do/oai/ NaN \n", "\n", " roar_rss_feed roar_twitter_feed \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 http://creativematter.skidmore.edu/recent.rss NaN \n", "\n", " roar_description roar_fulltext \\\n", "0 NaN NaN \n", "1 NaN TRUE \n", "2 NaN TRUE \n", "3 The \"Documentenserver Klimawandel\" (Repository... TRUE \n", "4 Welcome to Creative Matter, a repository for t... TRUE \n", "\n", " roar_open_access roar_mandate \\\n", "0 NaN NaN \n", "1 TRUE NaN \n", "2 TRUE NaN \n", "3 TRUE TRUE \n", "4 FALSE FALSE \n", "\n", " roar_organisation_title \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 [Helmholtz-Zentrum Geesthacht, Climate Service... \n", "4 Skidmore College \n", "\n", " roar_organisation_home_page roar_location_country \\\n", "0 NaN fr \n", "1 NaN se \n", "2 NaN pt \n", "3 [http://www.climateservicecenter.de/, http://w... 
de \n", "4 http://www.skidmore.edu/ us \n", "\n", " roar_location_city roar_location_latitude roar_location_longitude \\\n", "0 NaN NaN NaN \n", "1 Uppsala 59.8667 17.6333 \n", "2 Bellevue, WA 47.6034 -122.155 \n", "3 Hamburg 53.5511 9.9937 \n", "4 Saratoga Springs 43.0961 -73.7818 \n", "\n", " roar_software roar_geoname roar_version roar_subjects \\\n", "0 hal geoname_2_FR other NaN \n", "1 diva geoname_2_SE other NaN \n", "2 dspace geoname_2_PT other NaN \n", "3 opus geoname_2_DE other [GE, S1, G1, HD, GF] \n", "4 bepress geoname_2_US other NaN \n", "\n", " roar_date roar_note roar_suggestions roar_activity_low \\\n", "0 2002-05-17 19:24:41 NaN NaN 0 \n", "1 2005-12-08 13:15:22 NaN NaN 0 \n", "2 2006-05-04 10:48:14 NaN NaN NaN \n", "3 2015-07-02 08:08:31 NaN NaN NaN \n", "4 2015-07-06 17:35:50 NaN NaN NaN \n", "\n", " roar_activity_medium roar_activity_high roar_recordcount \\\n", "0 0 0 25 \n", "1 0 0 100 \n", "2 NaN NaN NaN \n", "3 NaN NaN NaN \n", "4 NaN NaN NaN \n", "\n", " roar_recordhistory roar_fulltexts_total \\\n", "0 0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,... NaN \n", "1 0,0,0,0,0,0,0,0,0,0,0,0,0,0,2,8,39,100,100,100... 
NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " roar_fulltexts_docs roar_fulltexts_rtotal roar_fulltexts_rdocs \\\n", "0 NaN NaN NaN \n", "1 NaN NaN NaN \n", "2 NaN NaN NaN \n", "3 NaN NaN NaN \n", "4 NaN NaN NaN \n", "\n", " roar_registry_name roar_registry_id roar_submit_to \\\n", "0 [opendoar, celestial] [669, 58] NaN \n", "1 [opendoar, celestial] [526, 258] NaN \n", "2 NaN NaN NaN \n", "3 [opendoar, celestial] [5881, 3408] NaN \n", "4 celestial 5882 NaN \n", "\n", " roar_submitted_to_name roar_submitted_to_done roar_webometrics_rank \\\n", "0 NaN NaN NaN \n", "1 NaN NaN NaN \n", "2 NaN NaN NaN \n", "3 NaN NaN NaN \n", "4 NaN NaN NaN \n", "\n", " roar_webometrics_size roar_webometrics_visibility \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " roar_webometrics_rich_files roar_webometrics_scholar roar_monthly_deposits \\\n", "0 NaN NaN NaN \n", "1 NaN NaN NaN \n", "2 NaN NaN NaN \n", "3 NaN NaN NaN \n", "4 NaN NaN NaN \n", "\n", " roar_total_deposits roar_association roar_unique_id \n", "0 NaN NaN roar_1 \n", "1 NaN NaN roar_10 \n", "2 NaN NaN roar_1000 \n", "3 NaN NaN roar_10001 \n", "4 NaN NaN roar_10008 " ] }, "execution_count": 5, "metadata": {}, "output_type": "execute_result" } ], "source": [ "def value_or_list(cell_set):\n", "    \"\"\"Collapse the values gathered for one cell of a grouped ROAR record.\n", "\n", "    Missing values are dropped and duplicates are removed, keeping the order\n", "    of first appearance.\n", "\n", "    Returns np.nan when nothing is left, the bare value when exactly one\n", "    distinct value remains, and a list of the distinct values otherwise.\n", "    \"\"\"\n", "    # pd.isna() catches every missing-value marker, not only the np.nan object itself.\n", "    distinct = list(dict.fromkeys(v for v in cell_set if not pd.isna(v)))\n", "    if not distinct:\n", "        return np.nan\n", "    if len(distinct) == 1:\n", "        return distinct[0]\n", "    return distinct\n", "\n", "\n", "roar_df = pd.read_csv('../data/raw/export_roar_CSV.csv', dtype='str')\n", "# Collect each group's values as lists rather than sets: a set has no defined\n", "# order, so multi-valued cells could come out ordered differently between runs.\n", "# NOTE(review): presumably columns such as registry_name / registry_id are\n", "# parallel and should stay aligned - confirm against the ROAR export format.\n", "roar_df = roar_df.groupby('eprintid').aggregate(list)\n", "roar_df = roar_df.applymap(value_or_list).reset_index()\n", "\n", "roar_df['unique_id'] = 'roar_' + roar_df.eprintid\n", "roar_df = roar_df.add_prefix('roar_')\n", "roar_df.head()" ] }, { "cell_type": "code", "execution_count": 6, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
roar_eprintidroar_rev_numberroar_eprint_statusroar_useridroar_importidroar_sourceroar_dirroar_datestamproar_lastmodroar_status_changedroar_typeroar_succeedsroar_commentaryroar_metadata_visibilityroar_latituderoar_longituderoar_relation_typeroar_relation_uriroar_item_issues_idroar_item_issues_typeroar_item_issues_descriptionroar_item_issues_timestamproar_item_issues_statusroar_item_issues_reported_byroar_item_issues_resolved_byroar_item_issues_commentroar_item_issues_countroar_sword_depositorroar_sword_slugroar_exemplarroar_home_pageroar_titleroar_oai_pmhroar_sword_endpointroar_rss_feedroar_twitter_feedroar_descriptionroar_fulltextroar_open_accessroar_mandateroar_organisation_titleroar_organisation_home_pageroar_location_countryroar_location_cityroar_location_latituderoar_location_longituderoar_softwareroar_geonameroar_versionroar_subjectsroar_dateroar_noteroar_suggestionsroar_activity_lowroar_activity_mediumroar_activity_highroar_recordcountroar_recordhistoryroar_fulltexts_totalroar_fulltexts_docsroar_fulltexts_rtotalroar_fulltexts_rdocsroar_registry_nameroar_registry_idroar_submit_toroar_submitted_to_nameroar_submitted_to_doneroar_webometrics_rankroar_webometrics_sizeroar_webometrics_visibilityroar_webometrics_rich_filesroar_webometrics_scholarroar_monthly_depositsroar_total_depositsroar_associationroar_unique_id
71001331archive7104NaNNaNdisk0/00/01/00/132015-08-08 14:53:042016-03-21 19:54:432015-08-08 14:53:04institutionalNaNNaNshowNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNhttp://er.ucu.edu.ua/ErUCU: Electronic repository of the Ukrainian ...http://er.ucu.edu.ua/oai/requesthttp://er.ucu.edu.ua/sword/http://er.ucu.edu.ua/feed/rss_2.0/siteNaNUkrainian Catholic University’s institutional ...TRUETRUETRUEUkrainian Catholic Universityhttp://ucu.edu.ua/eng/uaLvivNaNNaNdspacegeoname_2_UAother[B1, BS, BL, AC, D204, DK, HM, BF, L1, D1, H1,...2015-07-07 12:38:37NaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaN[opendoar, celestial][5883, 3410]NaNNaNNaNNaNNaNNaNNaNNaNNaNNaN[russell_group, ivy_league]roar_10013
\n", "
" ], "text/plain": [ " roar_eprintid roar_rev_number roar_eprint_status roar_userid roar_importid \\\n", "7 10013 31 archive 7104 NaN \n", "\n", " roar_source roar_dir roar_datestamp roar_lastmod \\\n", "7 NaN disk0/00/01/00/13 2015-08-08 14:53:04 2016-03-21 19:54:43 \n", "\n", " roar_status_changed roar_type roar_succeeds roar_commentary \\\n", "7 2015-08-08 14:53:04 institutional NaN NaN \n", "\n", " roar_metadata_visibility roar_latitude roar_longitude roar_relation_type \\\n", "7 show NaN NaN NaN \n", "\n", " roar_relation_uri roar_item_issues_id roar_item_issues_type \\\n", "7 NaN NaN NaN \n", "\n", " roar_item_issues_description roar_item_issues_timestamp \\\n", "7 NaN NaN \n", "\n", " roar_item_issues_status roar_item_issues_reported_by \\\n", "7 NaN NaN \n", "\n", " roar_item_issues_resolved_by roar_item_issues_comment \\\n", "7 NaN NaN \n", "\n", " roar_item_issues_count roar_sword_depositor roar_sword_slug roar_exemplar \\\n", "7 NaN NaN NaN NaN \n", "\n", " roar_home_page roar_title \\\n", "7 http://er.ucu.edu.ua/ ErUCU: Electronic repository of the Ukrainian ... \n", "\n", " roar_oai_pmh roar_sword_endpoint \\\n", "7 http://er.ucu.edu.ua/oai/request http://er.ucu.edu.ua/sword/ \n", "\n", " roar_rss_feed roar_twitter_feed \\\n", "7 http://er.ucu.edu.ua/feed/rss_2.0/site NaN \n", "\n", " roar_description roar_fulltext \\\n", "7 Ukrainian Catholic University’s institutional ... TRUE \n", "\n", " roar_open_access roar_mandate roar_organisation_title \\\n", "7 TRUE TRUE Ukrainian Catholic University \n", "\n", " roar_organisation_home_page roar_location_country roar_location_city \\\n", "7 http://ucu.edu.ua/eng/ ua Lviv \n", "\n", " roar_location_latitude roar_location_longitude roar_software roar_geoname \\\n", "7 NaN NaN dspace geoname_2_UA \n", "\n", " roar_version roar_subjects \\\n", "7 other [B1, BS, BL, AC, D204, DK, HM, BF, L1, D1, H1,... 
\n", "\n", " roar_date roar_note roar_suggestions roar_activity_low \\\n", "7 2015-07-07 12:38:37 NaN NaN NaN \n", "\n", " roar_activity_medium roar_activity_high roar_recordcount roar_recordhistory \\\n", "7 NaN NaN NaN NaN \n", "\n", " roar_fulltexts_total roar_fulltexts_docs roar_fulltexts_rtotal \\\n", "7 NaN NaN NaN \n", "\n", " roar_fulltexts_rdocs roar_registry_name roar_registry_id roar_submit_to \\\n", "7 NaN [opendoar, celestial] [5883, 3410] NaN \n", "\n", " roar_submitted_to_name roar_submitted_to_done roar_webometrics_rank \\\n", "7 NaN NaN NaN \n", "\n", " roar_webometrics_size roar_webometrics_visibility \\\n", "7 NaN NaN \n", "\n", " roar_webometrics_rich_files roar_webometrics_scholar roar_monthly_deposits \\\n", "7 NaN NaN NaN \n", "\n", " roar_total_deposits roar_association roar_unique_id \n", "7 NaN [russell_group, ivy_league] roar_10013 " ] }, "execution_count": 6, "metadata": {}, "output_type": "execute_result" } ], "source": [ "# Look up a single ROAR record by its eprint id.\n", "roar_df.loc[roar_df['roar_eprintid'] == '10013']" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "# Loading dedup results" ] }, { "cell_type": "code", "execution_count": 7, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
dedup_idduplicate_idoriginal_idnamesourceunique_id
0dedup::860320be12a1c050cd7731794e231bd3opendoar____::2290a7385ed77cc5592dc2153229f0821064oxford university research archiveOpenDOAROpenDOAR_1064
1dedup::1aa7a8773e6a7fdacbcedf9999009a38opendoar____::191f8f858acda435ae0daf994e2a72c28648digital commons@georgia southernOpenDOAROpenDOAR_8648
2dedup::31bceb0c3e2a260593e1e36655ebcee4opendoar____::d5776aeecb3c45ab15adce6f5cb355f39713materials data repositoryOpenDOAROpenDOAR_9713
3dedup::e37b08dd3015330dcbb5d6663667b8b8opendoar____::18997733ec258a9fcaf239cc55d53363427digital repository at the university of marylandOpenDOAROpenDOAR_427
4dedup::2841194266115ac1cc04d19630cde46bre3data_____::3afbb2b45a3dd218a5a091ca773cf6c5r3d100011189PRISM: University of Calgary's Digital Repositoryre3datare3data_r3d100011189
\n", "
" ], "text/plain": [ " dedup_id \\\n", "0 dedup::860320be12a1c050cd7731794e231bd3 \n", "1 dedup::1aa7a8773e6a7fdacbcedf9999009a38 \n", "2 dedup::31bceb0c3e2a260593e1e36655ebcee4 \n", "3 dedup::e37b08dd3015330dcbb5d6663667b8b8 \n", "4 dedup::2841194266115ac1cc04d19630cde46b \n", "\n", " duplicate_id original_id \\\n", "0 opendoar____::2290a7385ed77cc5592dc2153229f082 1064 \n", "1 opendoar____::191f8f858acda435ae0daf994e2a72c2 8648 \n", "2 opendoar____::d5776aeecb3c45ab15adce6f5cb355f3 9713 \n", "3 opendoar____::18997733ec258a9fcaf239cc55d53363 427 \n", "4 re3data_____::3afbb2b45a3dd218a5a091ca773cf6c5 r3d100011189 \n", "\n", " name source \\\n", "0 oxford university research archive OpenDOAR \n", "1 digital commons@georgia southern OpenDOAR \n", "2 materials data repository OpenDOAR \n", "3 digital repository at the university of maryland OpenDOAR \n", "4 PRISM: University of Calgary's Digital Repository re3data \n", "\n", " unique_id \n", "0 OpenDOAR_1064 \n", "1 OpenDOAR_8648 \n", "2 OpenDOAR_9713 \n", "3 OpenDOAR_427 \n", "4 re3data_r3d100011189 " ] }, "execution_count": 7, "metadata": {}, "output_type": "execute_result" } ], "source": [ "# The dedup export has no header row, so column names are supplied here.\n", "# Every column is read as a string: original_id mixes numeric-looking ids\n", "# (e.g. 1064) with textual ones (e.g. r3d100011189), and it is concatenated\n", "# into unique_id below, so it must never be inferred as an integer.\n", "dup = pd.read_csv(\n", "    '../data/interim/fairsharing_dedup.csv',\n", "    sep=';',\n", "    quotechar='\"',\n", "    header=None,\n", "    names=['dedup_id', 'duplicate_id', 'original_id', 'name', 'source'],\n", "    dtype=str,\n", ")\n", "dup['unique_id'] = dup.source + '_' + dup.original_id\n", "dup.head()" ] }, { "cell_type": "code", "execution_count": 8, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
dedup_idduplicate_idoriginal_idnamesourceunique_id
count461746174617461746174617
unique219146174159396844617
topdedup::75e33da9b103b7b91dcd8da0abe1354bopendoar____::2290a7385ed77cc5592dc2153229f0822399UPN JATIM REPOSITORYroarOpenDOAR_1064
freq513419771
\n", "
" ], "text/plain": [ " dedup_id \\\n", "count 4617 \n", "unique 2191 \n", "top dedup::75e33da9b103b7b91dcd8da0abe1354b \n", "freq 5 \n", "\n", " duplicate_id original_id \\\n", "count 4617 4617 \n", "unique 4617 4159 \n", "top opendoar____::2290a7385ed77cc5592dc2153229f082 2399 \n", "freq 1 3 \n", "\n", " name source unique_id \n", "count 4617 4617 4617 \n", "unique 3968 4 4617 \n", "top UPN JATIM REPOSITORY roar OpenDOAR_1064 \n", "freq 4 1977 1 " ] }, "execution_count": 8, "metadata": {}, "output_type": "execute_result" } ], "source": [ "# Summary statistics for every column of the dedup table.\n", "dup.describe()" ] }, { "cell_type": "code", "execution_count": 9, "metadata": {}, "outputs": [], "source": [ "# One row per dedup cluster: each column holds the list of its members' values,\n", "# and source_set holds the distinct registries found in the cluster.\n", "dup_grouped = dup.groupby('dedup_id').agg(list)\n", "dup_grouped['source_set'] = dup_grouped['source'].map(set)" ] }, { "cell_type": "code", "execution_count": 10, "metadata": {}, "outputs": [ { "data": { "text/plain": [ "duplicate_id 6\n", "original_id 6\n", "name 6\n", "source 6\n", "unique_id 6\n", "source_set 6\n", "dtype: int64" ] }, "execution_count": 10, "metadata": {}, "output_type": "execute_result" } ], "source": [ "# Clusters whose members span 4 distinct sources.\n", "dup_grouped.loc[dup_grouped['source_set'].map(len) == 4].count()" ] }, { "cell_type": "code", "execution_count": 11, "metadata": {}, "outputs": [ { "data": { "text/plain": [ "duplicate_id 60\n", "original_id 60\n", "name 60\n", "source 60\n", "unique_id 60\n", "source_set 60\n", "dtype: int64" ] }, "execution_count": 11, "metadata": {}, "output_type": "execute_result" } ], "source": [ "# Clusters whose members span 3 distinct sources.\n", "dup_grouped.loc[dup_grouped['source_set'].map(len) == 3].count()" ] }, { "cell_type": "code", "execution_count": 12, "metadata": {}, "outputs": [ { "data": { "text/plain": [ "duplicate_id 1986\n", "original_id 1986\n", "name 1986\n", "source 1986\n", "unique_id 1986\n", "source_set 1986\n", "dtype: int64" ] }, "execution_count": 12, "metadata": {}, "output_type": "execute_result" } ], "source": [ "# Clusters whose members span 2 distinct sources.\n", "dup_grouped.loc[dup_grouped['source_set'].map(len) == 2].count()" ] }, { "cell_type": "code", "execution_count": 13, "metadata": {},
"outputs": [ { "data": { "text/plain": [ "duplicate_id 139\n", "original_id 139\n", "name 139\n", "source 139\n", "unique_id 139\n", "source_set 139\n", "dtype: int64" ] }, "execution_count": 13, "metadata": {}, "output_type": "execute_result" } ], "source": [ "# Clusters whose members all come from a single source.\n", "dup_grouped.loc[dup_grouped['source_set'].map(len) == 1].count()" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "# Isolating duplicates within a registry" ] }, { "cell_type": "code", "execution_count": 14, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
duplicate_idoriginal_idnamesourceunique_idsource_set
dedup_id
dedup::000871c1fc726f0b52dc86a4eeb027de[4612, 4649][4612, 4649][IIT Bombay Institutional Repository, IIT Bomb...[roar, roar][roar_4612, roar_4649]{roar}
dedup::0163cceb20f5ca7b313419c068abd9dc[7943, 8003][7943, 8003][EPrints@NIRT Library Welcomes! - EPrints@NITR...[roar, roar][roar_7943, roar_8003]{roar}
dedup::028ee724157b05d04e7bdcf237d12e60[2670, 2698, 2741][2670, 2698, 2741][HSF Brage Open Research Archive, HSF Brage Op...[roar, roar, roar][roar_2670, roar_2698, roar_2741]{roar}
dedup::03593ce517feac573fdaafa6dcedef61[4393, 4394][4393, 4394][Institutional Repository of Kunming Institute...[roar, roar][roar_4393, roar_4394]{roar}
dedup::03e0704b5690a2dee1861dc3ad3316c9[1019, 5550][1019, 5550][PolyU Institutional Repository, PolyU Institu...[roar, roar][roar_1019, roar_5550]{roar}
\n", "
" ], "text/plain": [ " duplicate_id \\\n", "dedup_id \n", "dedup::000871c1fc726f0b52dc86a4eeb027de [4612, 4649] \n", "dedup::0163cceb20f5ca7b313419c068abd9dc [7943, 8003] \n", "dedup::028ee724157b05d04e7bdcf237d12e60 [2670, 2698, 2741] \n", "dedup::03593ce517feac573fdaafa6dcedef61 [4393, 4394] \n", "dedup::03e0704b5690a2dee1861dc3ad3316c9 [1019, 5550] \n", "\n", " original_id \\\n", "dedup_id \n", "dedup::000871c1fc726f0b52dc86a4eeb027de [4612, 4649] \n", "dedup::0163cceb20f5ca7b313419c068abd9dc [7943, 8003] \n", "dedup::028ee724157b05d04e7bdcf237d12e60 [2670, 2698, 2741] \n", "dedup::03593ce517feac573fdaafa6dcedef61 [4393, 4394] \n", "dedup::03e0704b5690a2dee1861dc3ad3316c9 [1019, 5550] \n", "\n", " name \\\n", "dedup_id \n", "dedup::000871c1fc726f0b52dc86a4eeb027de [IIT Bombay Institutional Repository, IIT Bomb... \n", "dedup::0163cceb20f5ca7b313419c068abd9dc [EPrints@NIRT Library Welcomes! - EPrints@NITR... \n", "dedup::028ee724157b05d04e7bdcf237d12e60 [HSF Brage Open Research Archive, HSF Brage Op... \n", "dedup::03593ce517feac573fdaafa6dcedef61 [Institutional Repository of Kunming Institute... \n", "dedup::03e0704b5690a2dee1861dc3ad3316c9 [PolyU Institutional Repository, PolyU Institu... 
\n", "\n", " source \\\n", "dedup_id \n", "dedup::000871c1fc726f0b52dc86a4eeb027de [roar, roar] \n", "dedup::0163cceb20f5ca7b313419c068abd9dc [roar, roar] \n", "dedup::028ee724157b05d04e7bdcf237d12e60 [roar, roar, roar] \n", "dedup::03593ce517feac573fdaafa6dcedef61 [roar, roar] \n", "dedup::03e0704b5690a2dee1861dc3ad3316c9 [roar, roar] \n", "\n", " unique_id \\\n", "dedup_id \n", "dedup::000871c1fc726f0b52dc86a4eeb027de [roar_4612, roar_4649] \n", "dedup::0163cceb20f5ca7b313419c068abd9dc [roar_7943, roar_8003] \n", "dedup::028ee724157b05d04e7bdcf237d12e60 [roar_2670, roar_2698, roar_2741] \n", "dedup::03593ce517feac573fdaafa6dcedef61 [roar_4393, roar_4394] \n", "dedup::03e0704b5690a2dee1861dc3ad3316c9 [roar_1019, roar_5550] \n", "\n", " source_set \n", "dedup_id \n", "dedup::000871c1fc726f0b52dc86a4eeb027de {roar} \n", "dedup::0163cceb20f5ca7b313419c068abd9dc {roar} \n", "dedup::028ee724157b05d04e7bdcf237d12e60 {roar} \n", "dedup::03593ce517feac573fdaafa6dcedef61 {roar} \n", "dedup::03e0704b5690a2dee1861dc3ad3316c9 {roar} " ] }, "execution_count": 14, "metadata": {}, "output_type": "execute_result" } ], "source": [ "# Clusters whose members all come from one registry, i.e. duplicates inside a\n", "# single source. This reuses dup_grouped (the same groupby over dup) instead of\n", "# recomputing it; .copy() keeps dup_within independent of dup_grouped.\n", "dup_within = dup_grouped[dup_grouped.source_set.map(len) == 1].copy()\n", "dup_within.head()" ] }, { "cell_type": "code", "execution_count": 15, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
duplicate_idoriginal_idnamesourceunique_idsource_set
dedup_id
dedup::000871c1fc726f0b52dc86a4eeb027de[4612, 4649][4612, 4649][IIT Bombay Institutional Repository, IIT Bomb...[roar, roar][roar_4612, roar_4649]roar
dedup::0163cceb20f5ca7b313419c068abd9dc[7943, 8003][7943, 8003][EPrints@NIRT Library Welcomes! - EPrints@NITR...[roar, roar][roar_7943, roar_8003]roar
dedup::028ee724157b05d04e7bdcf237d12e60[2670, 2698, 2741][2670, 2698, 2741][HSF Brage Open Research Archive, HSF Brage Op...[roar, roar, roar][roar_2670, roar_2698, roar_2741]roar
dedup::03593ce517feac573fdaafa6dcedef61[4393, 4394][4393, 4394][Institutional Repository of Kunming Institute...[roar, roar][roar_4393, roar_4394]roar
dedup::03e0704b5690a2dee1861dc3ad3316c9[1019, 5550][1019, 5550][PolyU Institutional Repository, PolyU Institu...[roar, roar][roar_1019, roar_5550]roar
\n", "
" ], "text/plain": [ " duplicate_id \\\n", "dedup_id \n", "dedup::000871c1fc726f0b52dc86a4eeb027de [4612, 4649] \n", "dedup::0163cceb20f5ca7b313419c068abd9dc [7943, 8003] \n", "dedup::028ee724157b05d04e7bdcf237d12e60 [2670, 2698, 2741] \n", "dedup::03593ce517feac573fdaafa6dcedef61 [4393, 4394] \n", "dedup::03e0704b5690a2dee1861dc3ad3316c9 [1019, 5550] \n", "\n", " original_id \\\n", "dedup_id \n", "dedup::000871c1fc726f0b52dc86a4eeb027de [4612, 4649] \n", "dedup::0163cceb20f5ca7b313419c068abd9dc [7943, 8003] \n", "dedup::028ee724157b05d04e7bdcf237d12e60 [2670, 2698, 2741] \n", "dedup::03593ce517feac573fdaafa6dcedef61 [4393, 4394] \n", "dedup::03e0704b5690a2dee1861dc3ad3316c9 [1019, 5550] \n", "\n", " name \\\n", "dedup_id \n", "dedup::000871c1fc726f0b52dc86a4eeb027de [IIT Bombay Institutional Repository, IIT Bomb... \n", "dedup::0163cceb20f5ca7b313419c068abd9dc [EPrints@NIRT Library Welcomes! - EPrints@NITR... \n", "dedup::028ee724157b05d04e7bdcf237d12e60 [HSF Brage Open Research Archive, HSF Brage Op... \n", "dedup::03593ce517feac573fdaafa6dcedef61 [Institutional Repository of Kunming Institute... \n", "dedup::03e0704b5690a2dee1861dc3ad3316c9 [PolyU Institutional Repository, PolyU Institu... 
# Replace the one-element registry set of each group with the registry name itself.
#
# The name is read from the first entry of the group's `source` list instead of
# being popped out of the set: the groups kept at this point have exactly one
# distinct registry, so every entry of `source` is that registry. Unlike
# `set.pop`, this does not empty the set objects in place, and the cell gives the
# same result when it is run again (popping raised a TypeError on a second run,
# because the column then contained strings rather than sets).
dup_within = dup_within.assign(
    source_set=dup_within['source'].map(lambda sources: sources[0])
)
dup_within.head()
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
duplicate_idoriginal_idnamesourceunique_id
source_set
OpenDOAR1616161616
re3data22222
roar121121121121121
# Per registry, count the non-null entries of each column, i.e. how many
# single-registry duplicate groups that registry contributes.
(
    dup_within
    .groupby(by='source_set')
    .count()
)
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
dedup_idduplicate_idoriginal_idnamesourceunique_id
28dedup::d2ddea18f00665ce8623e36bd4e3c7c582378237AIR | Archivio Istituzionale della Ricercaroarroar_8237
31dedup::4c5bcfec8584af0d967f1ab10179ca4b28202820USU Repository: Open Access Repositoryroarroar_2820
46dedup::c2ae5cb2426d96ed19a50b0b7d7c8e1194879487IR at NRF: Homeroarroar_9487
53dedup::1c65cef3dfd1e00c0b03923a1c591db412411241Swansea Metropolitan University Repositoryroarroar_1241
59dedup::4217ec5d78c4bc4e5bd006783482441f1514215142Repositorio Institucionalroarroar_15142
.....................
4560dedup::fc394e9935fbd62c8aedc372464e196571617161Welcome to IR@NPLroarroar_7161
4586dedup::000871c1fc726f0b52dc86a4eeb027de46494649IIT Bombay Institutional Repositoryroarroar_4649
4587dedup::72c288a828485e5b1d4c52910d1067341686716867Chung Shan Medical University Institutional Re...roarroar_16867
4598dedup::0163cceb20f5ca7b313419c068abd9dc80038003EPrints@NIRT Library Welcomes! - EPrints@NIRTroarroar_8003
4608dedup::2aeb1a8f8475cef63900be5d0780e8721547115471Repository STIE Nobel Indonesiaroarroar_15471
\n", "

287 rows × 6 columns

# Switch back from one row per group to one row per record: keep the records of
# `dup` whose dedup_id is one of the groups selected above.
# NOTE: this rebinds `dup_within` from the grouped frame (indexed by dedup_id) to
# a record-level frame, so the cell is meant to run once, right after the grouped
# frame has been built.
dup_within = dup.loc[dup['dedup_id'].isin(dup_within.index)]
dup_within

# %% [markdown]
# # Isolating duplicates across registries (hybrid)
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
dedup_idduplicate_idoriginal_idnamesourceunique_id
12dedup::471c50ad1a156d7256eddfd747d77931opendoar____::6351bf9dce654515bf1ddbd6426dfa971996ehtc repositorio institucionalOpenDOAROpenDOAR_1996
21dedup::69dafe8b58066478aea48f3d0f38482023122312Göteborgs universitets publikationer - e-publi...roarroar_2312
26dedup::8f822ac814829da24a7065b8131bdf47opendoar____::a34bacf839b923770b2c360eefa267481035kitami institute of technology repositoryOpenDOAROpenDOAR_1035
41dedup::63a99723ebb3af94d52b474c3b21dbe157795779Sanok Digital Libraryroarroar_5779
47dedup::82680bfec0fa08346c1b10d30a3e3d4a1121211212Publication Server of the Wuppertal Instituteroarroar_11212
.....................
4601dedup::7810ccd41bf26faaa2c4e1f20db70a7131723172Tesis Electrónicas UAChroarroar_3172
4602dedup::e655c7716a4b3ea67f48c6322fc42ed6opendoar____::52c5189391854c93e8a0e1326e56c14f1637vtext digital repositoryOpenDOAROpenDOAR_1637
4603dedup::5ebe5626b9f1cd89fbb9f665a527591f1622516225Necmettin Erbakan University Institutional Rep...roarroar_16225
4605dedup::ec0bfd000f253eff3acb1043e1c06979opendoar____::aa2a77371374094fe9e0bc1de3f94ed91829npue irOpenDOAROpenDOAR_1829
4610dedup::1c7836dbabd12c458d20e3b35633733a1461614616SOAR@USA: Scholarship and Open Access Repositoryroarroar_14616
\n", "

440 rows × 6 columns

\n", "
" ], "text/plain": [ " dedup_id \\\n", "12 dedup::471c50ad1a156d7256eddfd747d77931 \n", "21 dedup::69dafe8b58066478aea48f3d0f384820 \n", "26 dedup::8f822ac814829da24a7065b8131bdf47 \n", "41 dedup::63a99723ebb3af94d52b474c3b21dbe1 \n", "47 dedup::82680bfec0fa08346c1b10d30a3e3d4a \n", "... ... \n", "4601 dedup::7810ccd41bf26faaa2c4e1f20db70a71 \n", "4602 dedup::e655c7716a4b3ea67f48c6322fc42ed6 \n", "4603 dedup::5ebe5626b9f1cd89fbb9f665a527591f \n", "4605 dedup::ec0bfd000f253eff3acb1043e1c06979 \n", "4610 dedup::1c7836dbabd12c458d20e3b35633733a \n", "\n", " duplicate_id original_id \\\n", "12 opendoar____::6351bf9dce654515bf1ddbd6426dfa97 1996 \n", "21 2312 2312 \n", "26 opendoar____::a34bacf839b923770b2c360eefa26748 1035 \n", "41 5779 5779 \n", "47 11212 11212 \n", "... ... ... \n", "4601 3172 3172 \n", "4602 opendoar____::52c5189391854c93e8a0e1326e56c14f 1637 \n", "4603 16225 16225 \n", "4605 opendoar____::aa2a77371374094fe9e0bc1de3f94ed9 1829 \n", "4610 14616 14616 \n", "\n", " name source \\\n", "12 ehtc repositorio institucional OpenDOAR \n", "21 Göteborgs universitets publikationer - e-publi... roar \n", "26 kitami institute of technology repository OpenDOAR \n", "41 Sanok Digital Library roar \n", "47 Publication Server of the Wuppertal Institute roar \n", "... ... ... \n", "4601 Tesis Electrónicas UACh roar \n", "4602 vtext digital repository OpenDOAR \n", "4603 Necmettin Erbakan University Institutional Rep... roar \n", "4605 npue ir OpenDOAR \n", "4610 SOAR@USA: Scholarship and Open Access Repository roar \n", "\n", " unique_id \n", "12 OpenDOAR_1996 \n", "21 roar_2312 \n", "26 OpenDOAR_1035 \n", "41 roar_5779 \n", "47 roar_11212 \n", "... ... 
# Every record that was not classified as a within-registry duplicate, collapsed
# to one row per dedup group with list-valued columns.
dup_across = (
    dup
    .loc[~dup['dedup_id'].isin(dup_within['dedup_id'])]
    .groupby('dedup_id')
    .agg(list)
)
dup_across['source_set'] = dup_across['source'].map(set)

# "Hybrid" groups have fewer distinct registries than records, i.e. at least one
# registry occurs more than once inside the group.
dup_hybrid = dup_across.loc[
    dup_across['source_set'].map(len) < dup_across['source'].map(len)
]
# Record-level view of the hybrid groups.
dup_hybrid = dup.loc[dup['dedup_id'].isin(dup_hybrid.index)]
dup_hybrid

# %% [markdown]
# # Isolating duplicates across registries (pure)
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
dedup_idduplicate_idoriginal_idnamesourceunique_id
0dedup::860320be12a1c050cd7731794e231bd3opendoar____::2290a7385ed77cc5592dc2153229f0821064oxford university research archiveOpenDOAROpenDOAR_1064
1dedup::1aa7a8773e6a7fdacbcedf9999009a38opendoar____::191f8f858acda435ae0daf994e2a72c28648digital commons@georgia southernOpenDOAROpenDOAR_8648
2dedup::31bceb0c3e2a260593e1e36655ebcee4opendoar____::d5776aeecb3c45ab15adce6f5cb355f39713materials data repositoryOpenDOAROpenDOAR_9713
3dedup::e37b08dd3015330dcbb5d6663667b8b8opendoar____::18997733ec258a9fcaf239cc55d53363427digital repository at the university of marylandOpenDOAROpenDOAR_427
4dedup::2841194266115ac1cc04d19630cde46bre3data_____::3afbb2b45a3dd218a5a091ca773cf6c5r3d100011189PRISM: University of Calgary's Digital Repositoryre3datare3data_r3d100011189
.....................
4612dedup::5ef0b4eba35ab2d6180b0bca7e46b6f9475475Ecological Restoration Institute - Northern Ar...roarroar_475
4613dedup::66e8d052ec2230c66bd11ee6b5a0e3c81419914199Repositori STKIP PGRI Sumeneproarroar_14199
4614dedup::1216a1bca4361c39d1d77965c5d95ee349604960Virtual Archive of Polish Armeniansroarroar_4960
4615dedup::1408358fe6a7f9327dd41a5651ac284c1382413824Digital Commons @ New Jersey Institute of Tech...roarroar_13824
4616dedup::5cc33dfe7e069a757ca0fcbe6b95c89eopendoar____::d8a4e572d866aa45da78418d9d2ff9f94351odu digital commonsOpenDOAROpenDOAR_4351
\n", "

3890 rows × 6 columns

\n", "
" ], "text/plain": [ " dedup_id \\\n", "0 dedup::860320be12a1c050cd7731794e231bd3 \n", "1 dedup::1aa7a8773e6a7fdacbcedf9999009a38 \n", "2 dedup::31bceb0c3e2a260593e1e36655ebcee4 \n", "3 dedup::e37b08dd3015330dcbb5d6663667b8b8 \n", "4 dedup::2841194266115ac1cc04d19630cde46b \n", "... ... \n", "4612 dedup::5ef0b4eba35ab2d6180b0bca7e46b6f9 \n", "4613 dedup::66e8d052ec2230c66bd11ee6b5a0e3c8 \n", "4614 dedup::1216a1bca4361c39d1d77965c5d95ee3 \n", "4615 dedup::1408358fe6a7f9327dd41a5651ac284c \n", "4616 dedup::5cc33dfe7e069a757ca0fcbe6b95c89e \n", "\n", " duplicate_id original_id \\\n", "0 opendoar____::2290a7385ed77cc5592dc2153229f082 1064 \n", "1 opendoar____::191f8f858acda435ae0daf994e2a72c2 8648 \n", "2 opendoar____::d5776aeecb3c45ab15adce6f5cb355f3 9713 \n", "3 opendoar____::18997733ec258a9fcaf239cc55d53363 427 \n", "4 re3data_____::3afbb2b45a3dd218a5a091ca773cf6c5 r3d100011189 \n", "... ... ... \n", "4612 475 475 \n", "4613 14199 14199 \n", "4614 4960 4960 \n", "4615 13824 13824 \n", "4616 opendoar____::d8a4e572d866aa45da78418d9d2ff9f9 4351 \n", "\n", " name source \\\n", "0 oxford university research archive OpenDOAR \n", "1 digital commons@georgia southern OpenDOAR \n", "2 materials data repository OpenDOAR \n", "3 digital repository at the university of maryland OpenDOAR \n", "4 PRISM: University of Calgary's Digital Repository re3data \n", "... ... ... \n", "4612 Ecological Restoration Institute - Northern Ar... roar \n", "4613 Repositori STKIP PGRI Sumenep roar \n", "4614 Virtual Archive of Polish Armenians roar \n", "4615 Digital Commons @ New Jersey Institute of Tech... roar \n", "4616 odu digital commons OpenDOAR \n", "\n", " unique_id \n", "0 OpenDOAR_1064 \n", "1 OpenDOAR_8648 \n", "2 OpenDOAR_9713 \n", "3 OpenDOAR_427 \n", "4 re3data_r3d100011189 \n", "... ... 
# %%
# "Pure" cross-registry groups: as many distinct registries as records, so no
# registry contributes more than one record to the group.
dup_across = dup_across[dup_across.source_set.str.len() == dup_across.source.str.len()]
# Record-level view of the selected groups.
dup_across = dup[dup.dedup_id.isin(dup_across.index)]
dup_across

# %% [markdown]
# Double check partitions

# %%
# Reference: non-null count per column over all duplicate records.
dup.count()

# %%
# The three subsets together must hold as many records as `dup`; fail loudly
# instead of relying on comparing the displayed numbers by eye.
assert len(dup_across) + len(dup_within) + len(dup_hybrid) == len(dup), \
    'within/across/hybrid subsets do not add up to the full set of duplicate records'
dup_across.count() + dup_within.count() + dup_hybrid.count()

# %%
# Same check at group level: the subsets must hold as many dedup groups as `dup`.
partition_groups = (
    dup_within.groupby('dedup_id').ngroups
    + dup_across.groupby('dedup_id').ngroups
    + dup_hybrid.groupby('dedup_id').ngroups
)
assert partition_groups == dup.groupby('dedup_id').ngroups, \
    'within/across/hybrid subsets do not add up to the full set of dedup groups'
partition_groups

# %%
dup.groupby('dedup_id').ngroups

# %% [markdown]
# # Joining information
{}, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
dedup_idduplicate_idoriginal_idnamesourceunique_idFAIRsharing_idFAIRsharing_typeFAIRsharing_attributes.created-atFAIRsharing_attributes.updated-atFAIRsharing_attributes.metadata.doiFAIRsharing_attributes.metadata.nameFAIRsharing_attributes.metadata.statusFAIRsharing_attributes.metadata.contactsFAIRsharing_attributes.metadata.homepageFAIRsharing_attributes.metadata.identifierFAIRsharing_attributes.metadata.descriptionFAIRsharing_attributes.metadata.support-linksFAIRsharing_attributes.metadata.year-creationFAIRsharing_attributes.metadata.data-processesFAIRsharing_attributes.legacy-idsFAIRsharing_attributes.fairsharing-registryFAIRsharing_attributes.record-typeFAIRsharing_attributes.subjectsFAIRsharing_attributes.domainsFAIRsharing_attributes.taxonomiesFAIRsharing_attributes.user-defined-tagsFAIRsharing_attributes.countriesFAIRsharing_attributes.nameFAIRsharing_attributes.abbreviationFAIRsharing_attributes.urlFAIRsharing_attributes.doiFAIRsharing_attributes.fairsharing-licenceFAIRsharing_attributes.descriptionFAIRsharing_attributes.publicationsFAIRsharing_attributes.licence-linksFAIRsharing_attributes.metadata.citationsFAIRsharing_attributes.metadata.abbreviationFAIRsharing_attributes.metadata.access-pointsFAIRsharing_attributes.metadata.associated-toolsFAIRsharing_attributes.metadata.deprecation-dateFAIRsharing_attributes.metadata.deprecation-reasonFAIRsharing_attributes.metadata.tombstoneFAIRsharing_unique_idre3data_OpenAIREIDre3data_orgIdentifierre3data_repositoryNamere3data_additionalNamere3data_repositoryURLre3data_repositoryIdentifierre3data_descriptionre3data_typere3data_sizere3data_updateDatere3data_startDatere3data_endDatere3data_subjectre3data_missionStatementre3data_contentTypere3data_providerTypere3data_keywordre3data_institutionre3data_policyre3data_databaseAccessre3data_databaseLicensere3data_dataAccessre3data_dataLicensere3data_dataUploadre3data_dataUploadLicensere3data_softwarere3data_versioningre3data_apire3data_pidSystemre3data_citationGuidelineURLre3
data_aidSystemre3data_enhancedPublicationre3data_qualityManagementre3data_certificatere3data_metadataStandardre3data_syndicationre3data_remarksre3data_entryDatere3data_lastUpdatere3data_unique_idOpenDOAR_OpenAIREIDOpenDOAR_orgIdentifierOpenDOAR_repositoryNameOpenDOAR_alternativeNamesOpenDOAR_repositoryURLOpenDOAR_descriptionOpenDOAR_typeOpenDOAR_updateDateOpenDOAR_startDateOpenDOAR_subjectOpenDOAR_contentTypeOpenDOAR_institutionOpenDOAR_metadataPolicyOpenDOAR_dataPolicyOpenDOAR_submissionPolicyOpenDOAR_contentPolicyOpenDOAR_softwareOpenDOAR_apiOpenDOAR_unique_idroar_eprintidroar_rev_numberroar_eprint_statusroar_useridroar_importidroar_sourceroar_dirroar_datestamproar_lastmodroar_status_changedroar_typeroar_succeedsroar_commentaryroar_metadata_visibilityroar_latituderoar_longituderoar_relation_typeroar_relation_uriroar_item_issues_idroar_item_issues_typeroar_item_issues_descriptionroar_item_issues_timestamproar_item_issues_statusroar_item_issues_reported_byroar_item_issues_resolved_byroar_item_issues_commentroar_item_issues_countroar_sword_depositorroar_sword_slugroar_exemplarroar_home_pageroar_titleroar_oai_pmhroar_sword_endpointroar_rss_feedroar_twitter_feedroar_descriptionroar_fulltextroar_open_accessroar_mandateroar_organisation_titleroar_organisation_home_pageroar_location_countryroar_location_cityroar_location_latituderoar_location_longituderoar_softwareroar_geonameroar_versionroar_subjectsroar_dateroar_noteroar_suggestionsroar_activity_lowroar_activity_mediumroar_activity_highroar_recordcountroar_recordhistoryroar_fulltexts_totalroar_fulltexts_docsroar_fulltexts_rtotalroar_fulltexts_rdocsroar_registry_nameroar_registry_idroar_submit_toroar_submitted_to_nameroar_submitted_to_doneroar_webometrics_rankroar_webometrics_sizeroar_webometrics_visibilityroar_webometrics_rich_filesroar_webometrics_scholarroar_monthly_depositsroar_total_depositsroar_associationroar_unique_id
0dedup::d2ddea18f00665ce8623e36bd4e3c7c582378237AIR | Archivio Istituzionale della Ricercaroarroar_8237NaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaN823717archive5268NaNNaNdisk0/00/00/82/372014-05-15 11:23:302014-05-19 05:42:472014-05-15 11:23:30institutionalNaNNaNshowNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNhttp://air.unimi.itAIR | Archivio Istituzionale della Ricercahttp://air.unimi.it/dspace-oai/requestNaNNaNNaNAIR (Archivio Istituzionale della ricerca) is ...FALSEFALSETRUEUniversità degli Studi di Milanohttp://www.unimi.ititMilan45.469.1947dspacegeoname_2_ITotherNaN2014-05-04 17:40:53NaNNaN000990,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,19,6...NaNNaNNaNNaNcelestial1596NaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNroar_8237
1dedup::4c5bcfec8584af0d967f1ab10179ca4b28202820USU Repository: Open Access Repositoryroarroar_2820NaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaN2820525archive65NaNNaNdisk0/00/00/28/202010-07-29 01:40:272012-01-19 11:37:492010-07-29 01:40:27institutional2372NaNshowNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaN0NaNNaNNaNhttp://repository.usu.ac.idUSU Repository: Open Access Repositoryhttp://repository.usu.ac.id/oai/requestNaNhttp://repository.usu.ac.id/feed/rss_2.0/siteNaNComprises of works by and/or about the univers...TRUETRUEFALSE[USU Library, University of Sumatera Utara][http://library.usu.ac.id, http://www.usu.ac.id]idMedan3.559598.6572dspacegeoname_2_IDotherNaN2010-01-15 10:09:25NaNNaN0001000,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,51,52,...NaNNaNNaNNaN[opendoar, roarmap, celestial][1717, 2101, 283]NaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNroar_2820
2dedup::c2ae5cb2426d96ed19a50b0b7d7c8e1194879487IR at NRF: Homeroarroar_9487NaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaN948716archive6458NaNNaNdisk0/00/00/94/872015-05-15 14:03:552016-03-21 20:21:022015-05-15 14:03:55multiNaNNaNshowNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNhttp://ir.nrf.ac.za/IR at NRF: HomeNaNNaNNaNNaNThe NRF receives its mandate from the National...TRUETRUEFALSENational Research Foundation of South Africahttp://www.nrf.ac.za/zaPretoriaNaNNaNdspacegeoname_2_ZAother[B1, AI, AS]2015-02-10 06:35:50NaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNroarmapNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNroar_9487
3dedup::1c65cef3dfd1e00c0b03923a1c591db412411241Swansea Metropolitan University Repositoryroarroar_1241NaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaN1241583archive1NaNNaNdisk0/00/00/12/412010-01-06 13:45:322011-07-18 05:57:232010-01-06 13:45:32institutionalNaNNaNshowNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaN0NaNNaNNaNhttp://dspace.smu.ac.uk/dspace/Swansea Metropolitan University Repositoryhttp://dspace.smu.ac.uk/dspace-oai/requestNaNNaNNaNUsers may set up RSS feeds to be alerted to ne...NaNNaNNaNSwansea Metropolitan Universityhttp://www.smu.ac.uk/gbSwansea51.6144-3.8727dspacegeoname_2_GBotherNaN2008-05-15 11:29:17NaNNaN0001350,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,2,3,135,13...0000[opendoar, celestial][1779, 1627]NaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNroar_1241
4dedup::4217ec5d78c4bc4e5bd006783482441f1514215142Repositorio Institucionalroarroar_15142NaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaN1514211archive12132NaNNaNdisk0/00/01/51/422020-08-08 12:35:502021-01-25 22:45:102020-08-08 12:35:50institutionalNaNNaNshowNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNhttp://repositorio.undar.edu.pe/Repositorio Institucionalhttp://repositorio.undar.edu.pe/NaNNaNNaNNaNFALSEFALSEFALSENaNNaNpehuanuco-9.9269-76.2396dspacegeoname_2_PEotherNaN2019-09-02 21:20:31NaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNopendoarhttp://v2.sherpa.ac.uk/id/repository/4422NaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNroar_15142
\n", "
" ], "text/plain": [ " dedup_id duplicate_id original_id \\\n", "0 dedup::d2ddea18f00665ce8623e36bd4e3c7c5 8237 8237 \n", "1 dedup::4c5bcfec8584af0d967f1ab10179ca4b 2820 2820 \n", "2 dedup::c2ae5cb2426d96ed19a50b0b7d7c8e11 9487 9487 \n", "3 dedup::1c65cef3dfd1e00c0b03923a1c591db4 1241 1241 \n", "4 dedup::4217ec5d78c4bc4e5bd006783482441f 15142 15142 \n", "\n", " name source unique_id \\\n", "0 AIR | Archivio Istituzionale della Ricerca roar roar_8237 \n", "1 USU Repository: Open Access Repository roar roar_2820 \n", "2 IR at NRF: Home roar roar_9487 \n", "3 Swansea Metropolitan University Repository roar roar_1241 \n", "4 Repositorio Institucional roar roar_15142 \n", "\n", " FAIRsharing_id FAIRsharing_type FAIRsharing_attributes.created-at \\\n", "0 NaN NaN NaN \n", "1 NaN NaN NaN \n", "2 NaN NaN NaN \n", "3 NaN NaN NaN \n", "4 NaN NaN NaN \n", "\n", " FAIRsharing_attributes.updated-at FAIRsharing_attributes.metadata.doi \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " FAIRsharing_attributes.metadata.name FAIRsharing_attributes.metadata.status \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " FAIRsharing_attributes.metadata.contacts \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.homepage \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.identifier \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.description \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.support-links \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.year-creation \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.data-processes \\\n", "0 NaN \n", "1 NaN \n", "2 NaN 
\n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.legacy-ids \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.fairsharing-registry \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.record-type FAIRsharing_attributes.subjects \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " FAIRsharing_attributes.domains FAIRsharing_attributes.taxonomies \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " FAIRsharing_attributes.user-defined-tags FAIRsharing_attributes.countries \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " FAIRsharing_attributes.name FAIRsharing_attributes.abbreviation \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " FAIRsharing_attributes.url FAIRsharing_attributes.doi \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " FAIRsharing_attributes.fairsharing-licence \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.description FAIRsharing_attributes.publications \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " FAIRsharing_attributes.licence-links \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.citations \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.abbreviation \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.access-points \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.associated-tools \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.deprecation-date \\\n", 
"0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.deprecation-reason \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.tombstone FAIRsharing_unique_id \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " re3data_OpenAIREID re3data_orgIdentifier re3data_repositoryName \\\n", "0 NaN NaN NaN \n", "1 NaN NaN NaN \n", "2 NaN NaN NaN \n", "3 NaN NaN NaN \n", "4 NaN NaN NaN \n", "\n", " re3data_additionalName re3data_repositoryURL re3data_repositoryIdentifier \\\n", "0 NaN NaN NaN \n", "1 NaN NaN NaN \n", "2 NaN NaN NaN \n", "3 NaN NaN NaN \n", "4 NaN NaN NaN \n", "\n", " re3data_description re3data_type re3data_size re3data_updateDate \\\n", "0 NaN NaN NaN NaN \n", "1 NaN NaN NaN NaN \n", "2 NaN NaN NaN NaN \n", "3 NaN NaN NaN NaN \n", "4 NaN NaN NaN NaN \n", "\n", " re3data_startDate re3data_endDate re3data_subject re3data_missionStatement \\\n", "0 NaN NaN NaN NaN \n", "1 NaN NaN NaN NaN \n", "2 NaN NaN NaN NaN \n", "3 NaN NaN NaN NaN \n", "4 NaN NaN NaN NaN \n", "\n", " re3data_contentType re3data_providerType re3data_keyword \\\n", "0 NaN NaN NaN \n", "1 NaN NaN NaN \n", "2 NaN NaN NaN \n", "3 NaN NaN NaN \n", "4 NaN NaN NaN \n", "\n", " re3data_institution re3data_policy re3data_databaseAccess \\\n", "0 NaN NaN NaN \n", "1 NaN NaN NaN \n", "2 NaN NaN NaN \n", "3 NaN NaN NaN \n", "4 NaN NaN NaN \n", "\n", " re3data_databaseLicense re3data_dataAccess re3data_dataLicense \\\n", "0 NaN NaN NaN \n", "1 NaN NaN NaN \n", "2 NaN NaN NaN \n", "3 NaN NaN NaN \n", "4 NaN NaN NaN \n", "\n", " re3data_dataUpload re3data_dataUploadLicense re3data_software \\\n", "0 NaN NaN NaN \n", "1 NaN NaN NaN \n", "2 NaN NaN NaN \n", "3 NaN NaN NaN \n", "4 NaN NaN NaN \n", "\n", " re3data_versioning re3data_api re3data_pidSystem \\\n", "0 NaN NaN NaN \n", "1 NaN NaN NaN \n", "2 NaN NaN NaN \n", "3 NaN NaN NaN \n", "4 NaN NaN NaN \n", "\n", " 
re3data_citationGuidelineURL re3data_aidSystem re3data_enhancedPublication \\\n", "0 NaN NaN NaN \n", "1 NaN NaN NaN \n", "2 NaN NaN NaN \n", "3 NaN NaN NaN \n", "4 NaN NaN NaN \n", "\n", " re3data_qualityManagement re3data_certificate re3data_metadataStandard \\\n", "0 NaN NaN NaN \n", "1 NaN NaN NaN \n", "2 NaN NaN NaN \n", "3 NaN NaN NaN \n", "4 NaN NaN NaN \n", "\n", " re3data_syndication re3data_remarks re3data_entryDate re3data_lastUpdate \\\n", "0 NaN NaN NaN NaN \n", "1 NaN NaN NaN NaN \n", "2 NaN NaN NaN NaN \n", "3 NaN NaN NaN NaN \n", "4 NaN NaN NaN NaN \n", "\n", " re3data_unique_id OpenDOAR_OpenAIREID OpenDOAR_orgIdentifier \\\n", "0 NaN NaN NaN \n", "1 NaN NaN NaN \n", "2 NaN NaN NaN \n", "3 NaN NaN NaN \n", "4 NaN NaN NaN \n", "\n", " OpenDOAR_repositoryName OpenDOAR_alternativeNames OpenDOAR_repositoryURL \\\n", "0 NaN NaN NaN \n", "1 NaN NaN NaN \n", "2 NaN NaN NaN \n", "3 NaN NaN NaN \n", "4 NaN NaN NaN \n", "\n", " OpenDOAR_description OpenDOAR_type OpenDOAR_updateDate OpenDOAR_startDate \\\n", "0 NaN NaN NaN NaN \n", "1 NaN NaN NaN NaN \n", "2 NaN NaN NaN NaN \n", "3 NaN NaN NaN NaN \n", "4 NaN NaN NaN NaN \n", "\n", " OpenDOAR_subject OpenDOAR_contentType OpenDOAR_institution \\\n", "0 NaN NaN NaN \n", "1 NaN NaN NaN \n", "2 NaN NaN NaN \n", "3 NaN NaN NaN \n", "4 NaN NaN NaN \n", "\n", " OpenDOAR_metadataPolicy OpenDOAR_dataPolicy OpenDOAR_submissionPolicy \\\n", "0 NaN NaN NaN \n", "1 NaN NaN NaN \n", "2 NaN NaN NaN \n", "3 NaN NaN NaN \n", "4 NaN NaN NaN \n", "\n", " OpenDOAR_contentPolicy OpenDOAR_software OpenDOAR_api OpenDOAR_unique_id \\\n", "0 NaN NaN NaN NaN \n", "1 NaN NaN NaN NaN \n", "2 NaN NaN NaN NaN \n", "3 NaN NaN NaN NaN \n", "4 NaN NaN NaN NaN \n", "\n", " roar_eprintid roar_rev_number roar_eprint_status roar_userid roar_importid \\\n", "0 8237 17 archive 5268 NaN \n", "1 2820 525 archive 65 NaN \n", "2 9487 16 archive 6458 NaN \n", "3 1241 583 archive 1 NaN \n", "4 15142 11 archive 12132 NaN \n", "\n", " roar_source roar_dir 
roar_datestamp roar_lastmod \\\n", "0 NaN disk0/00/00/82/37 2014-05-15 11:23:30 2014-05-19 05:42:47 \n", "1 NaN disk0/00/00/28/20 2010-07-29 01:40:27 2012-01-19 11:37:49 \n", "2 NaN disk0/00/00/94/87 2015-05-15 14:03:55 2016-03-21 20:21:02 \n", "3 NaN disk0/00/00/12/41 2010-01-06 13:45:32 2011-07-18 05:57:23 \n", "4 NaN disk0/00/01/51/42 2020-08-08 12:35:50 2021-01-25 22:45:10 \n", "\n", " roar_status_changed roar_type roar_succeeds roar_commentary \\\n", "0 2014-05-15 11:23:30 institutional NaN NaN \n", "1 2010-07-29 01:40:27 institutional 2372 NaN \n", "2 2015-05-15 14:03:55 multi NaN NaN \n", "3 2010-01-06 13:45:32 institutional NaN NaN \n", "4 2020-08-08 12:35:50 institutional NaN NaN \n", "\n", " roar_metadata_visibility roar_latitude roar_longitude roar_relation_type \\\n", "0 show NaN NaN NaN \n", "1 show NaN NaN NaN \n", "2 show NaN NaN NaN \n", "3 show NaN NaN NaN \n", "4 show NaN NaN NaN \n", "\n", " roar_relation_uri roar_item_issues_id roar_item_issues_type \\\n", "0 NaN NaN NaN \n", "1 NaN NaN NaN \n", "2 NaN NaN NaN \n", "3 NaN NaN NaN \n", "4 NaN NaN NaN \n", "\n", " roar_item_issues_description roar_item_issues_timestamp \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " roar_item_issues_status roar_item_issues_reported_by \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " roar_item_issues_resolved_by roar_item_issues_comment \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " roar_item_issues_count roar_sword_depositor roar_sword_slug roar_exemplar \\\n", "0 NaN NaN NaN NaN \n", "1 0 NaN NaN NaN \n", "2 NaN NaN NaN NaN \n", "3 0 NaN NaN NaN \n", "4 NaN NaN NaN NaN \n", "\n", " roar_home_page \\\n", "0 http://air.unimi.it \n", "1 http://repository.usu.ac.id \n", "2 http://ir.nrf.ac.za/ \n", "3 http://dspace.smu.ac.uk/dspace/ \n", "4 http://repositorio.undar.edu.pe/ \n", "\n", " roar_title \\\n", "0 AIR | Archivio 
Istituzionale della Ricerca \n", "1 USU Repository: Open Access Repository \n", "2 IR at NRF: Home \n", "3 Swansea Metropolitan University Repository \n", "4 Repositorio Institucional \n", "\n", " roar_oai_pmh roar_sword_endpoint \\\n", "0 http://air.unimi.it/dspace-oai/request NaN \n", "1 http://repository.usu.ac.id/oai/request NaN \n", "2 NaN NaN \n", "3 http://dspace.smu.ac.uk/dspace-oai/request NaN \n", "4 http://repositorio.undar.edu.pe/ NaN \n", "\n", " roar_rss_feed roar_twitter_feed \\\n", "0 NaN NaN \n", "1 http://repository.usu.ac.id/feed/rss_2.0/site NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " roar_description roar_fulltext \\\n", "0 AIR (Archivio Istituzionale della ricerca) is ... FALSE \n", "1 Comprises of works by and/or about the univers... TRUE \n", "2 The NRF receives its mandate from the National... TRUE \n", "3 Users may set up RSS feeds to be alerted to ne... NaN \n", "4 NaN FALSE \n", "\n", " roar_open_access roar_mandate roar_organisation_title \\\n", "0 FALSE TRUE Università degli Studi di Milano \n", "1 TRUE FALSE [USU Library, University of Sumatera Utara] \n", "2 TRUE FALSE National Research Foundation of South Africa \n", "3 NaN NaN Swansea Metropolitan University \n", "4 FALSE FALSE NaN \n", "\n", " roar_organisation_home_page roar_location_country \\\n", "0 http://www.unimi.it it \n", "1 [http://library.usu.ac.id, http://www.usu.ac.id] id \n", "2 http://www.nrf.ac.za/ za \n", "3 http://www.smu.ac.uk/ gb \n", "4 NaN pe \n", "\n", " roar_location_city roar_location_latitude roar_location_longitude \\\n", "0 Milan 45.46 9.1947 \n", "1 Medan 3.5595 98.6572 \n", "2 Pretoria NaN NaN \n", "3 Swansea 51.6144 -3.8727 \n", "4 huanuco -9.9269 -76.2396 \n", "\n", " roar_software roar_geoname roar_version roar_subjects roar_date \\\n", "0 dspace geoname_2_IT other NaN 2014-05-04 17:40:53 \n", "1 dspace geoname_2_ID other NaN 2010-01-15 10:09:25 \n", "2 dspace geoname_2_ZA other [B1, AI, AS] 2015-02-10 06:35:50 \n", "3 dspace 
geoname_2_GB other NaN 2008-05-15 11:29:17 \n", "4 dspace geoname_2_PE other NaN 2019-09-02 21:20:31 \n", "\n", " roar_note roar_suggestions roar_activity_low roar_activity_medium \\\n", "0 NaN NaN 0 0 \n", "1 NaN NaN 0 0 \n", "2 NaN NaN NaN NaN \n", "3 NaN NaN 0 0 \n", "4 NaN NaN NaN NaN \n", "\n", " roar_activity_high roar_recordcount \\\n", "0 0 99 \n", "1 0 100 \n", "2 NaN NaN \n", "3 0 135 \n", "4 NaN NaN \n", "\n", " roar_recordhistory roar_fulltexts_total \\\n", "0 0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,19,6... NaN \n", "1 0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,51,52,... NaN \n", "2 NaN NaN \n", "3 0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,2,3,135,13... 0 \n", "4 NaN NaN \n", "\n", " roar_fulltexts_docs roar_fulltexts_rtotal roar_fulltexts_rdocs \\\n", "0 NaN NaN NaN \n", "1 NaN NaN NaN \n", "2 NaN NaN NaN \n", "3 0 0 0 \n", "4 NaN NaN NaN \n", "\n", " roar_registry_name roar_registry_id \\\n", "0 celestial 1596 \n", "1 [opendoar, roarmap, celestial] [1717, 2101, 283] \n", "2 roarmap NaN \n", "3 [opendoar, celestial] [1779, 1627] \n", "4 opendoar http://v2.sherpa.ac.uk/id/repository/4422 \n", "\n", " roar_submit_to roar_submitted_to_name roar_submitted_to_done \\\n", "0 NaN NaN NaN \n", "1 NaN NaN NaN \n", "2 NaN NaN NaN \n", "3 NaN NaN NaN \n", "4 NaN NaN NaN \n", "\n", " roar_webometrics_rank roar_webometrics_size roar_webometrics_visibility \\\n", "0 NaN NaN NaN \n", "1 NaN NaN NaN \n", "2 NaN NaN NaN \n", "3 NaN NaN NaN \n", "4 NaN NaN NaN \n", "\n", " roar_webometrics_rich_files roar_webometrics_scholar roar_monthly_deposits \\\n", "0 NaN NaN NaN \n", "1 NaN NaN NaN \n", "2 NaN NaN NaN \n", "3 NaN NaN NaN \n", "4 NaN NaN NaN \n", "\n", " roar_total_deposits roar_association roar_unique_id \n", "0 NaN NaN roar_8237 \n", "1 NaN NaN roar_2820 \n", "2 NaN NaN roar_9487 \n", "3 NaN NaN roar_1241 \n", "4 NaN NaN roar_15142 " ] }, "execution_count": 24, "metadata": {}, "output_type": "execute_result" } ], "source": [ "dup_within = 
dup_within.merge(fairsharing_df, left_on='unique_id', right_on='FAIRsharing_unique_id', how='left')\n", "dup_within = dup_within.merge(re3data_df, left_on='unique_id', right_on='re3data_unique_id', how='left')\n", "dup_within = dup_within.merge(opendoar_df, left_on='unique_id', right_on='OpenDOAR_unique_id', how='left')\n", "dup_within = dup_within.merge(roar_df, left_on='unique_id', right_on='roar_unique_id', how='left')\n", "dup_within.head()" ] }, { "cell_type": "code", "execution_count": 25, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
dedup_idduplicate_idoriginal_idnamesourceunique_idFAIRsharing_idFAIRsharing_typeFAIRsharing_attributes.created-atFAIRsharing_attributes.updated-atFAIRsharing_attributes.metadata.doiFAIRsharing_attributes.metadata.nameFAIRsharing_attributes.metadata.statusFAIRsharing_attributes.metadata.contactsFAIRsharing_attributes.metadata.homepageFAIRsharing_attributes.metadata.identifierFAIRsharing_attributes.metadata.descriptionFAIRsharing_attributes.metadata.support-linksFAIRsharing_attributes.metadata.year-creationFAIRsharing_attributes.metadata.data-processesFAIRsharing_attributes.legacy-idsFAIRsharing_attributes.fairsharing-registryFAIRsharing_attributes.record-typeFAIRsharing_attributes.subjectsFAIRsharing_attributes.domainsFAIRsharing_attributes.taxonomiesFAIRsharing_attributes.user-defined-tagsFAIRsharing_attributes.countriesFAIRsharing_attributes.nameFAIRsharing_attributes.abbreviationFAIRsharing_attributes.urlFAIRsharing_attributes.doiFAIRsharing_attributes.fairsharing-licenceFAIRsharing_attributes.descriptionFAIRsharing_attributes.publicationsFAIRsharing_attributes.licence-linksFAIRsharing_attributes.metadata.citationsFAIRsharing_attributes.metadata.abbreviationFAIRsharing_attributes.metadata.access-pointsFAIRsharing_attributes.metadata.associated-toolsFAIRsharing_attributes.metadata.deprecation-dateFAIRsharing_attributes.metadata.deprecation-reasonFAIRsharing_attributes.metadata.tombstoneFAIRsharing_unique_idre3data_OpenAIREIDre3data_orgIdentifierre3data_repositoryNamere3data_additionalNamere3data_repositoryURLre3data_repositoryIdentifierre3data_descriptionre3data_typere3data_sizere3data_updateDatere3data_startDatere3data_endDatere3data_subjectre3data_missionStatementre3data_contentTypere3data_providerTypere3data_keywordre3data_institutionre3data_policyre3data_databaseAccessre3data_databaseLicensere3data_dataAccessre3data_dataLicensere3data_dataUploadre3data_dataUploadLicensere3data_softwarere3data_versioningre3data_apire3data_pidSystemre3data_citationGuidelineURLre3
data_aidSystemre3data_enhancedPublicationre3data_qualityManagementre3data_certificatere3data_metadataStandardre3data_syndicationre3data_remarksre3data_entryDatere3data_lastUpdatere3data_unique_idOpenDOAR_OpenAIREIDOpenDOAR_orgIdentifierOpenDOAR_repositoryNameOpenDOAR_alternativeNamesOpenDOAR_repositoryURLOpenDOAR_descriptionOpenDOAR_typeOpenDOAR_updateDateOpenDOAR_startDateOpenDOAR_subjectOpenDOAR_contentTypeOpenDOAR_institutionOpenDOAR_metadataPolicyOpenDOAR_dataPolicyOpenDOAR_submissionPolicyOpenDOAR_contentPolicyOpenDOAR_softwareOpenDOAR_apiOpenDOAR_unique_idroar_eprintidroar_rev_numberroar_eprint_statusroar_useridroar_importidroar_sourceroar_dirroar_datestamproar_lastmodroar_status_changedroar_typeroar_succeedsroar_commentaryroar_metadata_visibilityroar_latituderoar_longituderoar_relation_typeroar_relation_uriroar_item_issues_idroar_item_issues_typeroar_item_issues_descriptionroar_item_issues_timestamproar_item_issues_statusroar_item_issues_reported_byroar_item_issues_resolved_byroar_item_issues_commentroar_item_issues_countroar_sword_depositorroar_sword_slugroar_exemplarroar_home_pageroar_titleroar_oai_pmhroar_sword_endpointroar_rss_feedroar_twitter_feedroar_descriptionroar_fulltextroar_open_accessroar_mandateroar_organisation_titleroar_organisation_home_pageroar_location_countryroar_location_cityroar_location_latituderoar_location_longituderoar_softwareroar_geonameroar_versionroar_subjectsroar_dateroar_noteroar_suggestionsroar_activity_lowroar_activity_mediumroar_activity_highroar_recordcountroar_recordhistoryroar_fulltexts_totalroar_fulltexts_docsroar_fulltexts_rtotalroar_fulltexts_rdocsroar_registry_nameroar_registry_idroar_submit_toroar_submitted_to_nameroar_submitted_to_doneroar_webometrics_rankroar_webometrics_sizeroar_webometrics_visibilityroar_webometrics_rich_filesroar_webometrics_scholarroar_monthly_depositsroar_total_depositsroar_associationroar_unique_id
0dedup::471c50ad1a156d7256eddfd747d77931opendoar____::6351bf9dce654515bf1ddbd6426dfa971996ehtc repositorio institucionalOpenDOAROpenDOAR_1996NaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNopendoar____::6351bf9dce654515bf1ddbd6426dfa971996ehtc repositorio institucional[]http://www.repositorio.ehtc.cu/jspui/this site provides access to the hospitality a...institutional2019-10-17 14:34:312010-12-01 11:11:57[business and economics, education][journal_articles, conference_and_workshop_pap...[[escuela de hotelería y turismo de camagüey, ...FalseFalseFalseFalsedspace 1.6.2falseOpenDOAR_1996NaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaN
1dedup::69dafe8b58066478aea48f3d0f38482023122312Göteborgs universitets publikationer - e-publi...roarroar_2312NaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaN2312736archive1NaNNaNdisk0/00/00/23/122010-01-14 12:10:062011-07-18 06:01:082010-01-14 12:10:06institutionalNaNNaNshowNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaN0NaNNaNNaNhttp://gupea.ub.gu.se/dspace/index.jspGöteborgs universitets publikationer - e-publi...http://gupea.ub.gu.se/dspace-oai/requestNaNNaNNaNThis is an institutional repository providing ...FALSEFALSEFALSEGöteborgs Universitethttp://www.gu.se/seNaN57.697511.9608dspaceNaNotherNaN2005-06-07 12:57:08NaNNaN000960,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,...NaNNaNNaNNaN[opendoar, celestial][1832, 1149]NaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNroar_2312
2dedup::8f822ac814829da24a7065b8131bdf47opendoar____::a34bacf839b923770b2c360eefa267481035kitami institute of technology repositoryOpenDOAROpenDOAR_1035NaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNopendoar____::a34bacf839b923770b2c360eefa267481035kitami institute of technology repository[北見工業大学学術機関リポジトリ kit-r]https://kitami-it.repo.nii.ac.jp/this site is a university repository providing...institutional2020-09-09 11:57:562007-10-09 09:09:40[technology general][journal_articles, unpub_reports_and_working_p...[[kitami institute of technology, [北見工業大学], jp...FalseFalseFalseFalsewekotrueOpenDOAR_1035NaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaN
3dedup::63a99723ebb3af94d52b474c3b21dbe157795779Sanok Digital Libraryroarroar_5779NaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaN57799archive8NaNNaNdisk0/00/00/57/792012-12-12 04:54:202012-12-15 02:36:202012-12-12 04:54:20otherNaNNaNshowNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNhttp://sanockabibliotekacyfrowa.pl/dlibraSanok Digital Libraryhttp://sanockabibliotekacyfrowa.pl/dlibra/oai-...NaNNaNNaNThis site provides access to the digitised col...NaNNaNNaNDigital-Centerhttp://www.digital-center.pl/plNaN52.487216.8493NaNgeoname_2_PLotherNaN2012-08-05 15:12:12NaNNaN000190,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,19,19,19...NaNNaNNaNNaN[opendoar, celestial][5072, 2545]NaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNroar_5779
4dedup::82680bfec0fa08346c1b10d30a3e3d4a1121211212Publication Server of the Wuppertal Instituteroarroar_11212NaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaN1121212archive5611NaNNaNdisk0/00/01/12/122016-05-04 11:37:142016-05-07 01:37:182016-05-04 11:37:14institutionalNaNNaNshowNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNhttps://epub.wupperinst.org/homePublication Server of the Wuppertal Institute\\...https://epub.wupperinst.org/oaiNaNhttps://epub.wupperinst.org/rssNaN\\n\\nOn this Publication Server of the Wupperta...TRUETRUEFALSEWuppertal Institut für Klima, Umwelt, Energiehttp://wupperinst.org/deWuppertal51.25627.1508opusgeoname_2_DEother[HB, GE, T1]2016-04-28 13:58:38NaNplease delete ID 5891NaNNaNNaNNaNNaNNaNNaNNaNNaN[opendoar, celestial][6112, 2539]NaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNroar_11212
\n", "
" ], "text/plain": [ " dedup_id \\\n", "0 dedup::471c50ad1a156d7256eddfd747d77931 \n", "1 dedup::69dafe8b58066478aea48f3d0f384820 \n", "2 dedup::8f822ac814829da24a7065b8131bdf47 \n", "3 dedup::63a99723ebb3af94d52b474c3b21dbe1 \n", "4 dedup::82680bfec0fa08346c1b10d30a3e3d4a \n", "\n", " duplicate_id original_id \\\n", "0 opendoar____::6351bf9dce654515bf1ddbd6426dfa97 1996 \n", "1 2312 2312 \n", "2 opendoar____::a34bacf839b923770b2c360eefa26748 1035 \n", "3 5779 5779 \n", "4 11212 11212 \n", "\n", " name source unique_id \\\n", "0 ehtc repositorio institucional OpenDOAR OpenDOAR_1996 \n", "1 Göteborgs universitets publikationer - e-publi... roar roar_2312 \n", "2 kitami institute of technology repository OpenDOAR OpenDOAR_1035 \n", "3 Sanok Digital Library roar roar_5779 \n", "4 Publication Server of the Wuppertal Institute roar roar_11212 \n", "\n", " FAIRsharing_id FAIRsharing_type FAIRsharing_attributes.created-at \\\n", "0 NaN NaN NaN \n", "1 NaN NaN NaN \n", "2 NaN NaN NaN \n", "3 NaN NaN NaN \n", "4 NaN NaN NaN \n", "\n", " FAIRsharing_attributes.updated-at FAIRsharing_attributes.metadata.doi \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " FAIRsharing_attributes.metadata.name FAIRsharing_attributes.metadata.status \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " FAIRsharing_attributes.metadata.contacts \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.homepage \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.identifier \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.description \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.support-links \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " 
FAIRsharing_attributes.metadata.year-creation \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.data-processes \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.legacy-ids \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.fairsharing-registry \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.record-type FAIRsharing_attributes.subjects \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " FAIRsharing_attributes.domains FAIRsharing_attributes.taxonomies \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " FAIRsharing_attributes.user-defined-tags FAIRsharing_attributes.countries \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " FAIRsharing_attributes.name FAIRsharing_attributes.abbreviation \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " FAIRsharing_attributes.url FAIRsharing_attributes.doi \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " FAIRsharing_attributes.fairsharing-licence \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.description FAIRsharing_attributes.publications \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " FAIRsharing_attributes.licence-links \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.citations \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.abbreviation \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.access-points \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN 
\n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.associated-tools \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.deprecation-date \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.deprecation-reason \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.tombstone FAIRsharing_unique_id \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " re3data_OpenAIREID re3data_orgIdentifier re3data_repositoryName \\\n", "0 NaN NaN NaN \n", "1 NaN NaN NaN \n", "2 NaN NaN NaN \n", "3 NaN NaN NaN \n", "4 NaN NaN NaN \n", "\n", " re3data_additionalName re3data_repositoryURL re3data_repositoryIdentifier \\\n", "0 NaN NaN NaN \n", "1 NaN NaN NaN \n", "2 NaN NaN NaN \n", "3 NaN NaN NaN \n", "4 NaN NaN NaN \n", "\n", " re3data_description re3data_type re3data_size re3data_updateDate \\\n", "0 NaN NaN NaN NaN \n", "1 NaN NaN NaN NaN \n", "2 NaN NaN NaN NaN \n", "3 NaN NaN NaN NaN \n", "4 NaN NaN NaN NaN \n", "\n", " re3data_startDate re3data_endDate re3data_subject re3data_missionStatement \\\n", "0 NaN NaN NaN NaN \n", "1 NaN NaN NaN NaN \n", "2 NaN NaN NaN NaN \n", "3 NaN NaN NaN NaN \n", "4 NaN NaN NaN NaN \n", "\n", " re3data_contentType re3data_providerType re3data_keyword \\\n", "0 NaN NaN NaN \n", "1 NaN NaN NaN \n", "2 NaN NaN NaN \n", "3 NaN NaN NaN \n", "4 NaN NaN NaN \n", "\n", " re3data_institution re3data_policy re3data_databaseAccess \\\n", "0 NaN NaN NaN \n", "1 NaN NaN NaN \n", "2 NaN NaN NaN \n", "3 NaN NaN NaN \n", "4 NaN NaN NaN \n", "\n", " re3data_databaseLicense re3data_dataAccess re3data_dataLicense \\\n", "0 NaN NaN NaN \n", "1 NaN NaN NaN \n", "2 NaN NaN NaN \n", "3 NaN NaN NaN \n", "4 NaN NaN NaN \n", "\n", " re3data_dataUpload re3data_dataUploadLicense re3data_software \\\n", "0 NaN NaN NaN \n", "1 NaN NaN NaN \n", "2 NaN NaN NaN \n", "3 NaN NaN 
NaN \n", "4 NaN NaN NaN \n", "\n", " re3data_versioning re3data_api re3data_pidSystem \\\n", "0 NaN NaN NaN \n", "1 NaN NaN NaN \n", "2 NaN NaN NaN \n", "3 NaN NaN NaN \n", "4 NaN NaN NaN \n", "\n", " re3data_citationGuidelineURL re3data_aidSystem re3data_enhancedPublication \\\n", "0 NaN NaN NaN \n", "1 NaN NaN NaN \n", "2 NaN NaN NaN \n", "3 NaN NaN NaN \n", "4 NaN NaN NaN \n", "\n", " re3data_qualityManagement re3data_certificate re3data_metadataStandard \\\n", "0 NaN NaN NaN \n", "1 NaN NaN NaN \n", "2 NaN NaN NaN \n", "3 NaN NaN NaN \n", "4 NaN NaN NaN \n", "\n", " re3data_syndication re3data_remarks re3data_entryDate re3data_lastUpdate \\\n", "0 NaN NaN NaN NaN \n", "1 NaN NaN NaN NaN \n", "2 NaN NaN NaN NaN \n", "3 NaN NaN NaN NaN \n", "4 NaN NaN NaN NaN \n", "\n", " re3data_unique_id OpenDOAR_OpenAIREID \\\n", "0 NaN opendoar____::6351bf9dce654515bf1ddbd6426dfa97 \n", "1 NaN NaN \n", "2 NaN opendoar____::a34bacf839b923770b2c360eefa26748 \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " OpenDOAR_orgIdentifier OpenDOAR_repositoryName \\\n", "0 1996 ehtc repositorio institucional \n", "1 NaN NaN \n", "2 1035 kitami institute of technology repository \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " OpenDOAR_alternativeNames OpenDOAR_repositoryURL \\\n", "0 [] http://www.repositorio.ehtc.cu/jspui/ \n", "1 NaN NaN \n", "2 [北見工業大学学術機関リポジトリ kit-r] https://kitami-it.repo.nii.ac.jp/ \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " OpenDOAR_description OpenDOAR_type \\\n", "0 this site provides access to the hospitality a... institutional \n", "1 NaN NaN \n", "2 this site is a university repository providing... 
institutional \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " OpenDOAR_updateDate OpenDOAR_startDate \\\n", "0 2019-10-17 14:34:31 2010-12-01 11:11:57 \n", "1 NaN NaN \n", "2 2020-09-09 11:57:56 2007-10-09 09:09:40 \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " OpenDOAR_subject \\\n", "0 [business and economics, education] \n", "1 NaN \n", "2 [technology general] \n", "3 NaN \n", "4 NaN \n", "\n", " OpenDOAR_contentType \\\n", "0 [journal_articles, conference_and_workshop_pap... \n", "1 NaN \n", "2 [journal_articles, unpub_reports_and_working_p... \n", "3 NaN \n", "4 NaN \n", "\n", " OpenDOAR_institution OpenDOAR_metadataPolicy \\\n", "0 [[escuela de hotelería y turismo de camagüey, ... False \n", "1 NaN NaN \n", "2 [[kitami institute of technology, [北見工業大学], jp... False \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " OpenDOAR_dataPolicy OpenDOAR_submissionPolicy OpenDOAR_contentPolicy \\\n", "0 False False False \n", "1 NaN NaN NaN \n", "2 False False False \n", "3 NaN NaN NaN \n", "4 NaN NaN NaN \n", "\n", " OpenDOAR_software OpenDOAR_api OpenDOAR_unique_id roar_eprintid \\\n", "0 dspace 1.6.2 false OpenDOAR_1996 NaN \n", "1 NaN NaN NaN 2312 \n", "2 weko true OpenDOAR_1035 NaN \n", "3 NaN NaN NaN 5779 \n", "4 NaN NaN NaN 11212 \n", "\n", " roar_rev_number roar_eprint_status roar_userid roar_importid roar_source \\\n", "0 NaN NaN NaN NaN NaN \n", "1 736 archive 1 NaN NaN \n", "2 NaN NaN NaN NaN NaN \n", "3 9 archive 8 NaN NaN \n", "4 12 archive 5611 NaN NaN \n", "\n", " roar_dir roar_datestamp roar_lastmod \\\n", "0 NaN NaN NaN \n", "1 disk0/00/00/23/12 2010-01-14 12:10:06 2011-07-18 06:01:08 \n", "2 NaN NaN NaN \n", "3 disk0/00/00/57/79 2012-12-12 04:54:20 2012-12-15 02:36:20 \n", "4 disk0/00/01/12/12 2016-05-04 11:37:14 2016-05-07 01:37:18 \n", "\n", " roar_status_changed roar_type roar_succeeds roar_commentary \\\n", "0 NaN NaN NaN NaN \n", "1 2010-01-14 12:10:06 institutional NaN NaN \n", "2 NaN NaN NaN NaN \n", "3 2012-12-12 04:54:20 other NaN NaN \n", "4 2016-05-04 
11:37:14 institutional NaN NaN \n", "\n", " roar_metadata_visibility roar_latitude roar_longitude roar_relation_type \\\n", "0 NaN NaN NaN NaN \n", "1 show NaN NaN NaN \n", "2 NaN NaN NaN NaN \n", "3 show NaN NaN NaN \n", "4 show NaN NaN NaN \n", "\n", " roar_relation_uri roar_item_issues_id roar_item_issues_type \\\n", "0 NaN NaN NaN \n", "1 NaN NaN NaN \n", "2 NaN NaN NaN \n", "3 NaN NaN NaN \n", "4 NaN NaN NaN \n", "\n", " roar_item_issues_description roar_item_issues_timestamp \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " roar_item_issues_status roar_item_issues_reported_by \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " roar_item_issues_resolved_by roar_item_issues_comment \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " roar_item_issues_count roar_sword_depositor roar_sword_slug roar_exemplar \\\n", "0 NaN NaN NaN NaN \n", "1 0 NaN NaN NaN \n", "2 NaN NaN NaN NaN \n", "3 NaN NaN NaN NaN \n", "4 NaN NaN NaN NaN \n", "\n", " roar_home_page \\\n", "0 NaN \n", "1 http://gupea.ub.gu.se/dspace/index.jsp \n", "2 NaN \n", "3 http://sanockabibliotekacyfrowa.pl/dlibra \n", "4 https://epub.wupperinst.org/home \n", "\n", " roar_title \\\n", "0 NaN \n", "1 Göteborgs universitets publikationer - e-publi... \n", "2 NaN \n", "3 Sanok Digital Library \n", "4 Publication Server of the Wuppertal Institute\\... \n", "\n", " roar_oai_pmh roar_sword_endpoint \\\n", "0 NaN NaN \n", "1 http://gupea.ub.gu.se/dspace-oai/request NaN \n", "2 NaN NaN \n", "3 http://sanockabibliotekacyfrowa.pl/dlibra/oai-... NaN \n", "4 https://epub.wupperinst.org/oai NaN \n", "\n", " roar_rss_feed roar_twitter_feed \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 https://epub.wupperinst.org/rss NaN \n", "\n", " roar_description roar_fulltext \\\n", "0 NaN NaN \n", "1 This is an institutional repository providing ... 
FALSE \n", "2 NaN NaN \n", "3 This site provides access to the digitised col... NaN \n", "4 \\n\\nOn this Publication Server of the Wupperta... TRUE \n", "\n", " roar_open_access roar_mandate \\\n", "0 NaN NaN \n", "1 FALSE FALSE \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 TRUE FALSE \n", "\n", " roar_organisation_title \\\n", "0 NaN \n", "1 Göteborgs Universitet \n", "2 NaN \n", "3 Digital-Center \n", "4 Wuppertal Institut für Klima, Umwelt, Energie \n", "\n", " roar_organisation_home_page roar_location_country roar_location_city \\\n", "0 NaN NaN NaN \n", "1 http://www.gu.se/ se NaN \n", "2 NaN NaN NaN \n", "3 http://www.digital-center.pl/ pl NaN \n", "4 http://wupperinst.org/ de Wuppertal \n", "\n", " roar_location_latitude roar_location_longitude roar_software roar_geoname \\\n", "0 NaN NaN NaN NaN \n", "1 57.6975 11.9608 dspace NaN \n", "2 NaN NaN NaN NaN \n", "3 52.4872 16.8493 NaN geoname_2_PL \n", "4 51.2562 7.1508 opus geoname_2_DE \n", "\n", " roar_version roar_subjects roar_date roar_note \\\n", "0 NaN NaN NaN NaN \n", "1 other NaN 2005-06-07 12:57:08 NaN \n", "2 NaN NaN NaN NaN \n", "3 other NaN 2012-08-05 15:12:12 NaN \n", "4 other [HB, GE, T1] 2016-04-28 13:58:38 NaN \n", "\n", " roar_suggestions roar_activity_low roar_activity_medium \\\n", "0 NaN NaN NaN \n", "1 NaN 0 0 \n", "2 NaN NaN NaN \n", "3 NaN 0 0 \n", "4 please delete ID 5891 NaN NaN \n", "\n", " roar_activity_high roar_recordcount \\\n", "0 NaN NaN \n", "1 0 96 \n", "2 NaN NaN \n", "3 0 19 \n", "4 NaN NaN \n", "\n", " roar_recordhistory roar_fulltexts_total \\\n", "0 NaN NaN \n", "1 0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,... NaN \n", "2 NaN NaN \n", "3 0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,19,19,19... 
NaN \n", "4 NaN NaN \n", "\n", " roar_fulltexts_docs roar_fulltexts_rtotal roar_fulltexts_rdocs \\\n", "0 NaN NaN NaN \n", "1 NaN NaN NaN \n", "2 NaN NaN NaN \n", "3 NaN NaN NaN \n", "4 NaN NaN NaN \n", "\n", " roar_registry_name roar_registry_id roar_submit_to \\\n", "0 NaN NaN NaN \n", "1 [opendoar, celestial] [1832, 1149] NaN \n", "2 NaN NaN NaN \n", "3 [opendoar, celestial] [5072, 2545] NaN \n", "4 [opendoar, celestial] [6112, 2539] NaN \n", "\n", " roar_submitted_to_name roar_submitted_to_done roar_webometrics_rank \\\n", "0 NaN NaN NaN \n", "1 NaN NaN NaN \n", "2 NaN NaN NaN \n", "3 NaN NaN NaN \n", "4 NaN NaN NaN \n", "\n", " roar_webometrics_size roar_webometrics_visibility \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " roar_webometrics_rich_files roar_webometrics_scholar roar_monthly_deposits \\\n", "0 NaN NaN NaN \n", "1 NaN NaN NaN \n", "2 NaN NaN NaN \n", "3 NaN NaN NaN \n", "4 NaN NaN NaN \n", "\n", " roar_total_deposits roar_association roar_unique_id \n", "0 NaN NaN NaN \n", "1 NaN NaN roar_2312 \n", "2 NaN NaN NaN \n", "3 NaN NaN roar_5779 \n", "4 NaN NaN roar_11212 " ] }, "execution_count": 25, "metadata": {}, "output_type": "execute_result" } ], "source": [ "dup_hybrid = dup_hybrid.merge(fairsharing_df, left_on='unique_id', right_on='FAIRsharing_unique_id', how='left')\n", "dup_hybrid = dup_hybrid.merge(re3data_df, left_on='unique_id', right_on='re3data_unique_id', how='left')\n", "dup_hybrid = dup_hybrid.merge(opendoar_df, left_on='unique_id', right_on='OpenDOAR_unique_id', how='left')\n", "dup_hybrid = dup_hybrid.merge(roar_df, left_on='unique_id', right_on='roar_unique_id', how='left')\n", "dup_hybrid.head()" ] }, { "cell_type": "code", "execution_count": 26, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
dedup_idduplicate_idoriginal_idnamesourceunique_idFAIRsharing_idFAIRsharing_typeFAIRsharing_attributes.created-atFAIRsharing_attributes.updated-atFAIRsharing_attributes.metadata.doiFAIRsharing_attributes.metadata.nameFAIRsharing_attributes.metadata.statusFAIRsharing_attributes.metadata.contactsFAIRsharing_attributes.metadata.homepageFAIRsharing_attributes.metadata.identifierFAIRsharing_attributes.metadata.descriptionFAIRsharing_attributes.metadata.support-linksFAIRsharing_attributes.metadata.year-creationFAIRsharing_attributes.metadata.data-processesFAIRsharing_attributes.legacy-idsFAIRsharing_attributes.fairsharing-registryFAIRsharing_attributes.record-typeFAIRsharing_attributes.subjectsFAIRsharing_attributes.domainsFAIRsharing_attributes.taxonomiesFAIRsharing_attributes.user-defined-tagsFAIRsharing_attributes.countriesFAIRsharing_attributes.nameFAIRsharing_attributes.abbreviationFAIRsharing_attributes.urlFAIRsharing_attributes.doiFAIRsharing_attributes.fairsharing-licenceFAIRsharing_attributes.descriptionFAIRsharing_attributes.publicationsFAIRsharing_attributes.licence-linksFAIRsharing_attributes.metadata.citationsFAIRsharing_attributes.metadata.abbreviationFAIRsharing_attributes.metadata.access-pointsFAIRsharing_attributes.metadata.associated-toolsFAIRsharing_attributes.metadata.deprecation-dateFAIRsharing_attributes.metadata.deprecation-reasonFAIRsharing_attributes.metadata.tombstoneFAIRsharing_unique_idre3data_OpenAIREIDre3data_orgIdentifierre3data_repositoryNamere3data_additionalNamere3data_repositoryURLre3data_repositoryIdentifierre3data_descriptionre3data_typere3data_sizere3data_updateDatere3data_startDatere3data_endDatere3data_subjectre3data_missionStatementre3data_contentTypere3data_providerTypere3data_keywordre3data_institutionre3data_policyre3data_databaseAccessre3data_databaseLicensere3data_dataAccessre3data_dataLicensere3data_dataUploadre3data_dataUploadLicensere3data_softwarere3data_versioningre3data_apire3data_pidSystemre3data_citationGuidelineURLre3
data_aidSystemre3data_enhancedPublicationre3data_qualityManagementre3data_certificatere3data_metadataStandardre3data_syndicationre3data_remarksre3data_entryDatere3data_lastUpdatere3data_unique_idOpenDOAR_OpenAIREIDOpenDOAR_orgIdentifierOpenDOAR_repositoryNameOpenDOAR_alternativeNamesOpenDOAR_repositoryURLOpenDOAR_descriptionOpenDOAR_typeOpenDOAR_updateDateOpenDOAR_startDateOpenDOAR_subjectOpenDOAR_contentTypeOpenDOAR_institutionOpenDOAR_metadataPolicyOpenDOAR_dataPolicyOpenDOAR_submissionPolicyOpenDOAR_contentPolicyOpenDOAR_softwareOpenDOAR_apiOpenDOAR_unique_idroar_eprintidroar_rev_numberroar_eprint_statusroar_useridroar_importidroar_sourceroar_dirroar_datestamproar_lastmodroar_status_changedroar_typeroar_succeedsroar_commentaryroar_metadata_visibilityroar_latituderoar_longituderoar_relation_typeroar_relation_uriroar_item_issues_idroar_item_issues_typeroar_item_issues_descriptionroar_item_issues_timestamproar_item_issues_statusroar_item_issues_reported_byroar_item_issues_resolved_byroar_item_issues_commentroar_item_issues_countroar_sword_depositorroar_sword_slugroar_exemplarroar_home_pageroar_titleroar_oai_pmhroar_sword_endpointroar_rss_feedroar_twitter_feedroar_descriptionroar_fulltextroar_open_accessroar_mandateroar_organisation_titleroar_organisation_home_pageroar_location_countryroar_location_cityroar_location_latituderoar_location_longituderoar_softwareroar_geonameroar_versionroar_subjectsroar_dateroar_noteroar_suggestionsroar_activity_lowroar_activity_mediumroar_activity_highroar_recordcountroar_recordhistoryroar_fulltexts_totalroar_fulltexts_docsroar_fulltexts_rtotalroar_fulltexts_rdocsroar_registry_nameroar_registry_idroar_submit_toroar_submitted_to_nameroar_submitted_to_doneroar_webometrics_rankroar_webometrics_sizeroar_webometrics_visibilityroar_webometrics_rich_filesroar_webometrics_scholarroar_monthly_depositsroar_total_depositsroar_associationroar_unique_id
0dedup::860320be12a1c050cd7731794e231bd3opendoar____::2290a7385ed77cc5592dc2153229f0821064oxford university research archiveOpenDOAROpenDOAR_1064NaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNopendoar____::2290a7385ed77cc5592dc2153229f0821064oxford university research archive[ora]http://ora.ox.ac.ukthis site provides access to the collected res...institutional2021-09-13 13:35:442007-10-10 16:16:02[multidisciplinary][journal_articles, conference_and_workshop_pap...[[university of oxford, [], gb, http://www.ox....FalseFalseFalseFalsefedora 4.6.2trueOpenDOAR_1064NaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaN
1dedup::1aa7a8773e6a7fdacbcedf9999009a38opendoar____::191f8f858acda435ae0daf994e2a72c28648digital commons@georgia southernOpenDOAROpenDOAR_8648NaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNopendoar____::191f8f858acda435ae0daf994e2a72c28648digital commons@georgia southern[]https://digitalcommons.georgiasouthern.eduthis site provides access to the research outp...institutional2021-02-18 18:13:342019-09-28 04:24:47[multidisciplinary][journal_articles, conference_and_workshop_pap...[[georgia southern university, [], us, https:/...FalseFalseFalseFalsedigital_commonstrueOpenDOAR_8648NaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaN
2dedup::31bceb0c3e2a260593e1e36655ebcee4opendoar____::d5776aeecb3c45ab15adce6f5cb355f39713materials data repositoryOpenDOAROpenDOAR_9713NaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNopendoar____::d5776aeecb3c45ab15adce6f5cb355f39713materials data repository[mdr]https://mdr.nims.go.jpmdr : materials data repository is a data repo...institutional2021-05-21 18:04:322020-07-13 10:09:55[science general][journal_articles, conference_and_workshop_pap...[[national institute for materials science, [n...FalseFalseFalseFalsefedoratrueOpenDOAR_9713NaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaN
3dedup::e37b08dd3015330dcbb5d6663667b8b8opendoar____::18997733ec258a9fcaf239cc55d53363427digital repository at the university of marylandOpenDOAROpenDOAR_427NaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNopendoar____::18997733ec258a9fcaf239cc55d53363427digital repository at the university of maryland[drum]http://drum.lib.umd.edu/this site is a university repository providing...institutional2021-09-13 13:35:392006-08-04 09:09:20[multidisciplinary][journal_articles, theses_and_dissertations, u...[[university of maryland, [], us, http://www.u...FalseFalseFalseFalsedspace 4.1.0trueOpenDOAR_427NaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaN
4dedup::2841194266115ac1cc04d19630cde46bre3data_____::3afbb2b45a3dd218a5a091ca773cf6c5r3d100011189PRISM: University of Calgary's Digital Repositoryre3datare3data_r3d100011189NaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNre3data_____::3afbb2b45a3dd218a5a091ca773cf6c5r3d100011189PRISM: University of Calgary's Digital Repository[]https://prism.ucalgary.ca/[OpenDOAR:7771]PRISM is a digital archive of the University o...[institutional]NaNNaNNaNNaN[1 Humanities and Social Sciences, 11 Humaniti...False[Audiovisual data, Images, Standard office doc...[dataProvider][multidisciplinary][[University of Calgary, Libraries and Cultura...TruetrueFalseTrueTrueTrueTrueTrueNaNFalseTrueTrueTruenoyesFalseFalseTrueNaN2014-10-202020-01-09re3data_r3d100011189NaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaNNaN
\n", "
" ], "text/plain": [ " dedup_id \\\n", "0 dedup::860320be12a1c050cd7731794e231bd3 \n", "1 dedup::1aa7a8773e6a7fdacbcedf9999009a38 \n", "2 dedup::31bceb0c3e2a260593e1e36655ebcee4 \n", "3 dedup::e37b08dd3015330dcbb5d6663667b8b8 \n", "4 dedup::2841194266115ac1cc04d19630cde46b \n", "\n", " duplicate_id original_id \\\n", "0 opendoar____::2290a7385ed77cc5592dc2153229f082 1064 \n", "1 opendoar____::191f8f858acda435ae0daf994e2a72c2 8648 \n", "2 opendoar____::d5776aeecb3c45ab15adce6f5cb355f3 9713 \n", "3 opendoar____::18997733ec258a9fcaf239cc55d53363 427 \n", "4 re3data_____::3afbb2b45a3dd218a5a091ca773cf6c5 r3d100011189 \n", "\n", " name source \\\n", "0 oxford university research archive OpenDOAR \n", "1 digital commons@georgia southern OpenDOAR \n", "2 materials data repository OpenDOAR \n", "3 digital repository at the university of maryland OpenDOAR \n", "4 PRISM: University of Calgary's Digital Repository re3data \n", "\n", " unique_id FAIRsharing_id FAIRsharing_type \\\n", "0 OpenDOAR_1064 NaN NaN \n", "1 OpenDOAR_8648 NaN NaN \n", "2 OpenDOAR_9713 NaN NaN \n", "3 OpenDOAR_427 NaN NaN \n", "4 re3data_r3d100011189 NaN NaN \n", "\n", " FAIRsharing_attributes.created-at FAIRsharing_attributes.updated-at \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " FAIRsharing_attributes.metadata.doi FAIRsharing_attributes.metadata.name \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " FAIRsharing_attributes.metadata.status \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.contacts \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.homepage \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.identifier \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.description \\\n", "0 
NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.support-links \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.year-creation \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.data-processes \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.legacy-ids \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.fairsharing-registry \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.record-type FAIRsharing_attributes.subjects \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " FAIRsharing_attributes.domains FAIRsharing_attributes.taxonomies \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " FAIRsharing_attributes.user-defined-tags FAIRsharing_attributes.countries \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " FAIRsharing_attributes.name FAIRsharing_attributes.abbreviation \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " FAIRsharing_attributes.url FAIRsharing_attributes.doi \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " FAIRsharing_attributes.fairsharing-licence \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.description FAIRsharing_attributes.publications \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " FAIRsharing_attributes.licence-links \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.citations \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " 
FAIRsharing_attributes.metadata.abbreviation \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.access-points \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.associated-tools \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.deprecation-date \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.deprecation-reason \\\n", "0 NaN \n", "1 NaN \n", "2 NaN \n", "3 NaN \n", "4 NaN \n", "\n", " FAIRsharing_attributes.metadata.tombstone FAIRsharing_unique_id \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " re3data_OpenAIREID re3data_orgIdentifier \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 re3data_____::3afbb2b45a3dd218a5a091ca773cf6c5 r3d100011189 \n", "\n", " re3data_repositoryName re3data_additionalName \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 PRISM: University of Calgary's Digital Repository [] \n", "\n", " re3data_repositoryURL re3data_repositoryIdentifier \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 https://prism.ucalgary.ca/ [OpenDOAR:7771] \n", "\n", " re3data_description re3data_type \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 PRISM is a digital archive of the University o... [institutional] \n", "\n", " re3data_size re3data_updateDate re3data_startDate re3data_endDate \\\n", "0 NaN NaN NaN NaN \n", "1 NaN NaN NaN NaN \n", "2 NaN NaN NaN NaN \n", "3 NaN NaN NaN NaN \n", "4 NaN NaN NaN NaN \n", "\n", " re3data_subject re3data_missionStatement \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 [1 Humanities and Social Sciences, 11 Humaniti... 
False \n", "\n", " re3data_contentType re3data_providerType \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 [Audiovisual data, Images, Standard office doc... [dataProvider] \n", "\n", " re3data_keyword re3data_institution \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 [multidisciplinary] [[University of Calgary, Libraries and Cultura... \n", "\n", " re3data_policy re3data_databaseAccess re3data_databaseLicense \\\n", "0 NaN NaN NaN \n", "1 NaN NaN NaN \n", "2 NaN NaN NaN \n", "3 NaN NaN NaN \n", "4 True true False \n", "\n", " re3data_dataAccess re3data_dataLicense re3data_dataUpload \\\n", "0 NaN NaN NaN \n", "1 NaN NaN NaN \n", "2 NaN NaN NaN \n", "3 NaN NaN NaN \n", "4 True True True \n", "\n", " re3data_dataUploadLicense re3data_software re3data_versioning re3data_api \\\n", "0 NaN NaN NaN NaN \n", "1 NaN NaN NaN NaN \n", "2 NaN NaN NaN NaN \n", "3 NaN NaN NaN NaN \n", "4 True True NaN False \n", "\n", " re3data_pidSystem re3data_citationGuidelineURL re3data_aidSystem \\\n", "0 NaN NaN NaN \n", "1 NaN NaN NaN \n", "2 NaN NaN NaN \n", "3 NaN NaN NaN \n", "4 True True True \n", "\n", " re3data_enhancedPublication re3data_qualityManagement re3data_certificate \\\n", "0 NaN NaN NaN \n", "1 NaN NaN NaN \n", "2 NaN NaN NaN \n", "3 NaN NaN NaN \n", "4 no yes False \n", "\n", " re3data_metadataStandard re3data_syndication re3data_remarks \\\n", "0 NaN NaN NaN \n", "1 NaN NaN NaN \n", "2 NaN NaN NaN \n", "3 NaN NaN NaN \n", "4 False True NaN \n", "\n", " re3data_entryDate re3data_lastUpdate re3data_unique_id \\\n", "0 NaN NaN NaN \n", "1 NaN NaN NaN \n", "2 NaN NaN NaN \n", "3 NaN NaN NaN \n", "4 2014-10-20 2020-01-09 re3data_r3d100011189 \n", "\n", " OpenDOAR_OpenAIREID OpenDOAR_orgIdentifier \\\n", "0 opendoar____::2290a7385ed77cc5592dc2153229f082 1064 \n", "1 opendoar____::191f8f858acda435ae0daf994e2a72c2 8648 \n", "2 opendoar____::d5776aeecb3c45ab15adce6f5cb355f3 9713 \n", "3 
opendoar____::18997733ec258a9fcaf239cc55d53363 427 \n", "4 NaN NaN \n", "\n", " OpenDOAR_repositoryName OpenDOAR_alternativeNames \\\n", "0 oxford university research archive [ora] \n", "1 digital commons@georgia southern [] \n", "2 materials data repository [mdr] \n", "3 digital repository at the university of maryland [drum] \n", "4 NaN NaN \n", "\n", " OpenDOAR_repositoryURL \\\n", "0 http://ora.ox.ac.uk \n", "1 https://digitalcommons.georgiasouthern.edu \n", "2 https://mdr.nims.go.jp \n", "3 http://drum.lib.umd.edu/ \n", "4 NaN \n", "\n", " OpenDOAR_description OpenDOAR_type \\\n", "0 this site provides access to the collected res... institutional \n", "1 this site provides access to the research outp... institutional \n", "2 mdr : materials data repository is a data repo... institutional \n", "3 this site is a university repository providing... institutional \n", "4 NaN NaN \n", "\n", " OpenDOAR_updateDate OpenDOAR_startDate OpenDOAR_subject \\\n", "0 2021-09-13 13:35:44 2007-10-10 16:16:02 [multidisciplinary] \n", "1 2021-02-18 18:13:34 2019-09-28 04:24:47 [multidisciplinary] \n", "2 2021-05-21 18:04:32 2020-07-13 10:09:55 [science general] \n", "3 2021-09-13 13:35:39 2006-08-04 09:09:20 [multidisciplinary] \n", "4 NaN NaN NaN \n", "\n", " OpenDOAR_contentType \\\n", "0 [journal_articles, conference_and_workshop_pap... \n", "1 [journal_articles, conference_and_workshop_pap... \n", "2 [journal_articles, conference_and_workshop_pap... \n", "3 [journal_articles, theses_and_dissertations, u... \n", "4 NaN \n", "\n", " OpenDOAR_institution OpenDOAR_metadataPolicy \\\n", "0 [[university of oxford, [], gb, http://www.ox.... False \n", "1 [[georgia southern university, [], us, https:/... False \n", "2 [[national institute for materials science, [n... False \n", "3 [[university of maryland, [], us, http://www.u... 
False \n", "4 NaN NaN \n", "\n", " OpenDOAR_dataPolicy OpenDOAR_submissionPolicy OpenDOAR_contentPolicy \\\n", "0 False False False \n", "1 False False False \n", "2 False False False \n", "3 False False False \n", "4 NaN NaN NaN \n", "\n", " OpenDOAR_software OpenDOAR_api OpenDOAR_unique_id roar_eprintid \\\n", "0 fedora 4.6.2 true OpenDOAR_1064 NaN \n", "1 digital_commons true OpenDOAR_8648 NaN \n", "2 fedora true OpenDOAR_9713 NaN \n", "3 dspace 4.1.0 true OpenDOAR_427 NaN \n", "4 NaN NaN NaN NaN \n", "\n", " roar_rev_number roar_eprint_status roar_userid roar_importid roar_source \\\n", "0 NaN NaN NaN NaN NaN \n", "1 NaN NaN NaN NaN NaN \n", "2 NaN NaN NaN NaN NaN \n", "3 NaN NaN NaN NaN NaN \n", "4 NaN NaN NaN NaN NaN \n", "\n", " roar_dir roar_datestamp roar_lastmod roar_status_changed roar_type \\\n", "0 NaN NaN NaN NaN NaN \n", "1 NaN NaN NaN NaN NaN \n", "2 NaN NaN NaN NaN NaN \n", "3 NaN NaN NaN NaN NaN \n", "4 NaN NaN NaN NaN NaN \n", "\n", " roar_succeeds roar_commentary roar_metadata_visibility roar_latitude \\\n", "0 NaN NaN NaN NaN \n", "1 NaN NaN NaN NaN \n", "2 NaN NaN NaN NaN \n", "3 NaN NaN NaN NaN \n", "4 NaN NaN NaN NaN \n", "\n", " roar_longitude roar_relation_type roar_relation_uri roar_item_issues_id \\\n", "0 NaN NaN NaN NaN \n", "1 NaN NaN NaN NaN \n", "2 NaN NaN NaN NaN \n", "3 NaN NaN NaN NaN \n", "4 NaN NaN NaN NaN \n", "\n", " roar_item_issues_type roar_item_issues_description \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " roar_item_issues_timestamp roar_item_issues_status \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " roar_item_issues_reported_by roar_item_issues_resolved_by \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " roar_item_issues_comment roar_item_issues_count roar_sword_depositor \\\n", "0 NaN NaN NaN \n", "1 NaN NaN NaN \n", "2 NaN NaN NaN \n", "3 NaN NaN NaN \n", "4 NaN NaN NaN \n", 
"\n", " roar_sword_slug roar_exemplar roar_home_page roar_title roar_oai_pmh \\\n", "0 NaN NaN NaN NaN NaN \n", "1 NaN NaN NaN NaN NaN \n", "2 NaN NaN NaN NaN NaN \n", "3 NaN NaN NaN NaN NaN \n", "4 NaN NaN NaN NaN NaN \n", "\n", " roar_sword_endpoint roar_rss_feed roar_twitter_feed roar_description \\\n", "0 NaN NaN NaN NaN \n", "1 NaN NaN NaN NaN \n", "2 NaN NaN NaN NaN \n", "3 NaN NaN NaN NaN \n", "4 NaN NaN NaN NaN \n", "\n", " roar_fulltext roar_open_access roar_mandate roar_organisation_title \\\n", "0 NaN NaN NaN NaN \n", "1 NaN NaN NaN NaN \n", "2 NaN NaN NaN NaN \n", "3 NaN NaN NaN NaN \n", "4 NaN NaN NaN NaN \n", "\n", " roar_organisation_home_page roar_location_country roar_location_city \\\n", "0 NaN NaN NaN \n", "1 NaN NaN NaN \n", "2 NaN NaN NaN \n", "3 NaN NaN NaN \n", "4 NaN NaN NaN \n", "\n", " roar_location_latitude roar_location_longitude roar_software roar_geoname \\\n", "0 NaN NaN NaN NaN \n", "1 NaN NaN NaN NaN \n", "2 NaN NaN NaN NaN \n", "3 NaN NaN NaN NaN \n", "4 NaN NaN NaN NaN \n", "\n", " roar_version roar_subjects roar_date roar_note roar_suggestions \\\n", "0 NaN NaN NaN NaN NaN \n", "1 NaN NaN NaN NaN NaN \n", "2 NaN NaN NaN NaN NaN \n", "3 NaN NaN NaN NaN NaN \n", "4 NaN NaN NaN NaN NaN \n", "\n", " roar_activity_low roar_activity_medium roar_activity_high roar_recordcount \\\n", "0 NaN NaN NaN NaN \n", "1 NaN NaN NaN NaN \n", "2 NaN NaN NaN NaN \n", "3 NaN NaN NaN NaN \n", "4 NaN NaN NaN NaN \n", "\n", " roar_recordhistory roar_fulltexts_total roar_fulltexts_docs \\\n", "0 NaN NaN NaN \n", "1 NaN NaN NaN \n", "2 NaN NaN NaN \n", "3 NaN NaN NaN \n", "4 NaN NaN NaN \n", "\n", " roar_fulltexts_rtotal roar_fulltexts_rdocs roar_registry_name \\\n", "0 NaN NaN NaN \n", "1 NaN NaN NaN \n", "2 NaN NaN NaN \n", "3 NaN NaN NaN \n", "4 NaN NaN NaN \n", "\n", " roar_registry_id roar_submit_to roar_submitted_to_name \\\n", "0 NaN NaN NaN \n", "1 NaN NaN NaN \n", "2 NaN NaN NaN \n", "3 NaN NaN NaN \n", "4 NaN NaN NaN \n", "\n", " 
roar_submitted_to_done roar_webometrics_rank roar_webometrics_size \\\n", "0 NaN NaN NaN \n", "1 NaN NaN NaN \n", "2 NaN NaN NaN \n", "3 NaN NaN NaN \n", "4 NaN NaN NaN \n", "\n", " roar_webometrics_visibility roar_webometrics_rich_files \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN NaN \n", "\n", " roar_webometrics_scholar roar_monthly_deposits roar_total_deposits \\\n", "0 NaN NaN NaN \n", "1 NaN NaN NaN \n", "2 NaN NaN NaN \n", "3 NaN NaN NaN \n", "4 NaN NaN NaN \n", "\n", " roar_association roar_unique_id \n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 NaN NaN \n", "4 NaN NaN " ] }, "execution_count": 26, "metadata": {}, "output_type": "execute_result" } ], "source": [ "# Enrich every cross-registry duplicate with the full record of the registry it came from.\n", "# Each registry frame is left-joined on its own prefixed unique-id column, so all rows of\n", "# dup_across are kept and the columns of non-matching registries stay NaN.\n", "registry_frames = [\n", "    (fairsharing_df, 'FAIRsharing_unique_id'),\n", "    (re3data_df, 're3data_unique_id'),\n", "    (opendoar_df, 'OpenDOAR_unique_id'),\n", "    (roar_df, 'roar_unique_id'),\n", "]\n", "for registry_df, registry_key in registry_frames:\n", "    # Skip a registry that is already joined: re-running this cell is then a no-op\n", "    # instead of adding duplicated, suffixed (_x/_y) copies of every registry column.\n", "    if registry_key not in dup_across.columns:\n", "        dup_across = dup_across.merge(registry_df, left_on='unique_id', right_on=registry_key, how='left')\n", "dup_across.head()" ] }, { "cell_type": "code", "execution_count": 27, "metadata": {}, "outputs": [ { "name": "stderr", "output_type": "stream", "text": [ ":1: PerformanceWarning:\n", "\n", "DataFrame is highly fragmented. This is usually the result of calling `frame.insert` many times, which has poor performance. Consider using pd.concat instead. To get a de-fragmented frame, use `newframe = frame.copy()`\n", "\n", ":2: PerformanceWarning:\n", "\n", "DataFrame is highly fragmented. This is usually the result of calling `frame.insert` many times, which has poor performance. Consider using pd.concat instead. To get a de-fragmented frame, use `newframe = frame.copy()`\n", "\n" ] }, { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
dedup_idduplicate_idoriginal_idnamesourceunique_idFAIRsharing_idFAIRsharing_typeFAIRsharing_attributes.created-atFAIRsharing_attributes.updated-atFAIRsharing_attributes.metadata.doiFAIRsharing_attributes.metadata.nameFAIRsharing_attributes.metadata.statusFAIRsharing_attributes.metadata.contactsFAIRsharing_attributes.metadata.homepageFAIRsharing_attributes.metadata.identifierFAIRsharing_attributes.metadata.descriptionFAIRsharing_attributes.metadata.support-linksFAIRsharing_attributes.metadata.year-creationFAIRsharing_attributes.metadata.data-processesFAIRsharing_attributes.legacy-idsFAIRsharing_attributes.fairsharing-registryFAIRsharing_attributes.record-typeFAIRsharing_attributes.subjectsFAIRsharing_attributes.domainsFAIRsharing_attributes.taxonomiesFAIRsharing_attributes.user-defined-tagsFAIRsharing_attributes.countriesFAIRsharing_attributes.nameFAIRsharing_attributes.abbreviationFAIRsharing_attributes.urlFAIRsharing_attributes.doiFAIRsharing_attributes.fairsharing-licenceFAIRsharing_attributes.descriptionFAIRsharing_attributes.publicationsFAIRsharing_attributes.licence-linksFAIRsharing_attributes.metadata.citationsFAIRsharing_attributes.metadata.abbreviationFAIRsharing_attributes.metadata.access-pointsFAIRsharing_attributes.metadata.associated-toolsFAIRsharing_attributes.metadata.deprecation-dateFAIRsharing_attributes.metadata.deprecation-reasonFAIRsharing_attributes.metadata.tombstoneFAIRsharing_unique_idre3data_OpenAIREIDre3data_orgIdentifierre3data_repositoryNamere3data_additionalNamere3data_repositoryURLre3data_repositoryIdentifierre3data_descriptionre3data_typere3data_sizere3data_updateDatere3data_startDatere3data_endDatere3data_subjectre3data_missionStatementre3data_contentTypere3data_providerTypere3data_keywordre3data_institutionre3data_policyre3data_databaseAccessre3data_databaseLicensere3data_dataAccessre3data_dataLicensere3data_dataUploadre3data_dataUploadLicensere3data_softwarere3data_versioningre3data_apire3data_pidSystemre3data_citationGuidelineURLre3
data_aidSystemre3data_enhancedPublicationre3data_qualityManagementre3data_certificatere3data_metadataStandardre3data_syndicationre3data_remarksre3data_entryDatere3data_lastUpdatere3data_unique_idOpenDOAR_OpenAIREIDOpenDOAR_orgIdentifierOpenDOAR_repositoryNameOpenDOAR_alternativeNamesOpenDOAR_repositoryURLOpenDOAR_descriptionOpenDOAR_typeOpenDOAR_updateDateOpenDOAR_startDateOpenDOAR_subjectOpenDOAR_contentTypeOpenDOAR_institutionOpenDOAR_metadataPolicyOpenDOAR_dataPolicyOpenDOAR_submissionPolicyOpenDOAR_contentPolicyOpenDOAR_softwareOpenDOAR_apiOpenDOAR_unique_idroar_eprintidroar_rev_numberroar_eprint_statusroar_useridroar_importidroar_sourceroar_dirroar_datestamproar_lastmodroar_status_changedroar_typeroar_succeedsroar_commentaryroar_metadata_visibilityroar_latituderoar_longituderoar_relation_typeroar_relation_uriroar_item_issues_idroar_item_issues_typeroar_item_issues_descriptionroar_item_issues_timestamproar_item_issues_statusroar_item_issues_reported_byroar_item_issues_resolved_byroar_item_issues_commentroar_item_issues_countroar_sword_depositorroar_sword_slugroar_exemplarroar_home_pageroar_titleroar_oai_pmhroar_sword_endpointroar_rss_feedroar_twitter_feedroar_descriptionroar_fulltextroar_open_accessroar_mandateroar_organisation_titleroar_organisation_home_pageroar_location_countryroar_location_cityroar_location_latituderoar_location_longituderoar_softwareroar_geonameroar_versionroar_subjectsroar_dateroar_noteroar_suggestionsroar_activity_lowroar_activity_mediumroar_activity_highroar_recordcountroar_recordhistoryroar_fulltexts_totalroar_fulltexts_docsroar_fulltexts_rtotalroar_fulltexts_rdocsroar_registry_nameroar_registry_idroar_submit_toroar_submitted_to_nameroar_submitted_to_doneroar_webometrics_rankroar_webometrics_sizeroar_webometrics_visibilityroar_webometrics_rich_filesroar_webometrics_scholarroar_monthly_depositsroar_total_depositsroar_associationroar_unique_idsource_set
0dedup::000871c1fc726f0b52dc86a4eeb027de[4612, 4649][4612, 4649][IIT Bombay Institutional Repository, IIT Bomb...[roar, roar][roar_4612, roar_4649][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][4612, 4649][28, 8][archive, archive][1380, 1380][nan, nan][nan, nan][disk0/00/00/46/12, disk0/00/00/46/49][2012-01-08 03:17:02, 2012-02-05 13:57:01][2012-04-16 10:53:04, 2012-04-16 10:39:58][2012-01-08 03:17:02, 2012-02-05 13:57:01][institutional, institutional][nan, nan][nan, nan][show, show][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][http://dspace.library.iitb.ac.in/jspui/, http...[IIT Bombay Institutional Repository, IIT Bomb...[http://dspace.library.iitb.ac.in/oai/request,...[nan, nan][http://dspace.library.iitb.ac.in/xmlui/feed/a...[nan, nan][nan, nan][TRUE, TRUE][TRUE, TRUE][TRUE, FALSE][IIT Bombay, IIT Bombay][http://www.iitb.ac.in, http://www.iitb.ac.in][in, in][Mumbai, Mumbai][19.133, 19.133][72.9166, 72.9166][dspace, dspace][geoname_2_IN, 
geoname_2_IN][other, other][[TN, TA, TK, TH, TP, TD, TJ], [TA, T1]][2011-12-15 09:01:35, 2012-01-05 12:09:37][nan, nan][nan, nan][0, nan][0, nan][0, nan][99, nan][0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,95,...[nan, nan][nan, nan][nan, nan][nan, nan][celestial, celestial][4790, 4789][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][roar_4612, roar_4649]{roar}
1dedup::0163cceb20f5ca7b313419c068abd9dc[7943, 8003][7943, 8003][EPrints@NIRT Library Welcomes! - EPrints@NITR...[roar, roar][roar_7943, roar_8003][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][7943, 8003][16, 19][archive, archive][4963, 5023][nan, nan][nan, nan][disk0/00/00/79/43, disk0/00/00/80/03][2014-03-11 11:54:06, 2014-03-30 18:13:01][2014-05-08 13:07:12, 2014-05-08 12:55:41][2014-03-11 11:54:06, 2014-03-30 18:13:01][institutional, institutional][nan, nan][nan, nan][show, show][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][http://eprints.nirt.res.in/, http://eprints.n...[EPrints@NIRT Library Welcomes! 
- EPrints@NITR...[http://eprints.nirt.res.in/cgi/oai2, http://e...[nan, nan][http://eprints.nirt.res.in/cgi/latest_tool?ou...[nan, nan][This is the Institutional Repository of the N...[TRUE, FALSE][TRUE, FALSE][FALSE, FALSE][National Institute for Research in Tuberculos...[http://www.nirt.res.in/, http://www.nirt.res.in][in, in][Chennai, Chennai (Madras)][nan, 13][nan, 80][eprints, eprints][geoname_2_IN, geoname_2_IN][3.3.15 eps, 3.3.15 eps][[RM, RB], [R1, RZ]][2014-03-07 15:07:45, 2014-03-19 07:05:04][The National Institute for Research in Tuberc...[nan, Please include \"Tuberculosis\" as a Speci...[nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][[opendoar, celestial], celestial][[5410, 2725], 5430][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][roar_7943, roar_8003]{roar}
2dedup::028ee724157b05d04e7bdcf237d12e60[2670, 2698, 2741][2670, 2698, 2741][HSF Brage Open Research Archive, HSF Brage Op...[roar, roar, roar][roar_2670, roar_2698, roar_2741][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][2670, 2698, 2741][470, 317, 231][archive, archive, archive][235, 8, 8][nan, nan, nan][nan, nan, nan][disk0/00/00/26/70, disk0/00/00/26/98, disk0/0...[2010-05-04 02:19:51, 2010-05-13 11:01:53, 201...[2011-07-18 06:02:42, 2011-07-06 08:24:10, 201...[2010-05-04 02:19:51, 2010-05-13 11:01:53, 201...[institutional, institutional, institutional][nan, nan, nan][nan, nan, 
nan][show, show, show][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][0, 0, 0][nan, nan, nan][nan, nan, nan][nan, nan, nan][http://brage.bibsys.no/hsf/, http://brage.bib...[HSF Brage Open Research Archive, HSF Brage Op...[http://oai.bibsys.no/oai/repository/nora_hsf_...[http://brage.bibsys.no/hsf/?locale=en, nan, nan][nan, nan, nan][nan, nan, nan][This site provides access to the research out...[TRUE, FALSE, FALSE][TRUE, FALSE, FALSE][FALSE, FALSE, FALSE][Sogn og Fjordane University College, Høgskule...[http://www.hisf.no/, http://www.hisf.no/, htt...[no, no, no][Sogndal, nan, nan][61.2174, 61.2174, 60.3904][7.1082, 7.1082, 5.3332][dspace, dspace, dspace][geoname_2_NO, nan, nan][other, other, other][nan, nan, nan][2010-04-06 13:51:52, 2010-05-09 15:12:16, 201...[nan, nan, nan][nan, nan, nan][0, nan, nan][0, nan, nan][0, nan, nan][50, nan, nan][0,0,1,1,1,4,4,6,6,7,8,11,12,14,15,17,18,18,18...[nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][[opendoar, celestial], opendoar, opendoar][[1781, 2426], 1781, 1807][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][roar_2670, roar_2698, roar_2741]{roar}
3dedup::03593ce517feac573fdaafa6dcedef61[4393, 4394][4393, 4394][Institutional Repository of Kunming Institute...[roar, roar][roar_4393, roar_4394][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][4393, 4394][14, 14][archive, archive][986, 986][nan, nan][nan, nan][disk0/00/00/43/93, disk0/00/00/43/94][2011-11-09 23:14:52, 2011-11-09 23:14:46][2012-02-06 06:58:40, 2012-02-06 06:58:41][2011-11-09 23:14:52, 2011-11-09 23:14:46][institutional, institutional][nan, nan][nan, nan][show, show][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][http://159.226.149.42:8088/, http://159.226.1...[Institutional Repository of Kunming Institute...[http://159.226.149.42:8088/casirgrid-oai/requ...[nan, nan][nan, nan][nan, nan][This site provides access to the output of th...[TRUE, TRUE][TRUE, TRUE][FALSE, FALSE][ Kunming Institute of Zoology Chinese Academy...[http://www.kiz.ac.cn/, http://www.kiz.ac.cn/][cn, cn][kunming, kunming][25.0416, 25.0416][102.755, 
102.755][dspace, dspace][geoname_2_CN, geoname_2_CN][other, other][nan, nan][2010-07-22 16:00:13, 2010-07-22 16:00:13][nan, nan][nan, nan][0, 0][0, 0][0, 0][100, 100][0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0...[nan, nan][nan, nan][nan, nan][nan, nan][celestial, celestial][4715, 4715][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][roar_4393, roar_4394]{roar}
4dedup::03e0704b5690a2dee1861dc3ad3316c9[1019, 5550][1019, 5550][PolyU Institutional Repository, PolyU Institu...[roar, roar][roar_1019, roar_5550][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][1019, 5550][526, 9][archive, archive][1, 8][nan, nan][nan, nan][disk0/00/00/10/19, disk0/00/00/55/50][2010-01-06 13:45:03, 2012-12-12 01:25:48][2012-01-19 11:35:09, 2012-12-17 06:53:14][2010-01-06 13:45:03, 2012-12-12 01:25:48][institutional, institutional][nan, nan][nan, nan][show, show][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][0, nan][nan, nan][nan, nan][nan, nan][http://repository.lib.polyu.edu.hk/, http://r...[PolyU Institutional Repository, PolyU Institu...[http://repository.lib.polyu.edu.hk/oai/reques...[nan, nan][nan, nan][nan, nan][nan, This is an Institutional repository prov...[TRUE, nan][TRUE, nan][nan, nan][The Hong Kong Polytechnic University Pao Yue-...[http://www.lib.polyu.edu.hk, http://www.polyu...[hk, cn][Hong Kong, nan][22.25, 22.3964][114.167, 114.109][dspace, 
dspace][geoname_2_HK, geoname_2_CN][other, other][nan, nan][2008-10-30 07:50:38, 2012-07-01 15:13:40][nan, nan][nan, nan][0, 0][0, 0][0, 0][86, 86][0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,54,71,80,...[nan, nan][nan, nan][nan, nan][nan, nan][[opendoar, roarmap, celestial], [opendoar, ce...[[193, 1456, 1441], [1456, 1441]][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][roar_1019, roar_5550]{roar}
\n", "
" ], "text/plain": [ " dedup_id duplicate_id \\\n", "0 dedup::000871c1fc726f0b52dc86a4eeb027de [4612, 4649] \n", "1 dedup::0163cceb20f5ca7b313419c068abd9dc [7943, 8003] \n", "2 dedup::028ee724157b05d04e7bdcf237d12e60 [2670, 2698, 2741] \n", "3 dedup::03593ce517feac573fdaafa6dcedef61 [4393, 4394] \n", "4 dedup::03e0704b5690a2dee1861dc3ad3316c9 [1019, 5550] \n", "\n", " original_id name \\\n", "0 [4612, 4649] [IIT Bombay Institutional Repository, IIT Bomb... \n", "1 [7943, 8003] [EPrints@NIRT Library Welcomes! - EPrints@NITR... \n", "2 [2670, 2698, 2741] [HSF Brage Open Research Archive, HSF Brage Op... \n", "3 [4393, 4394] [Institutional Repository of Kunming Institute... \n", "4 [1019, 5550] [PolyU Institutional Repository, PolyU Institu... \n", "\n", " source unique_id FAIRsharing_id \\\n", "0 [roar, roar] [roar_4612, roar_4649] [nan, nan] \n", "1 [roar, roar] [roar_7943, roar_8003] [nan, nan] \n", "2 [roar, roar, roar] [roar_2670, roar_2698, roar_2741] [nan, nan, nan] \n", "3 [roar, roar] [roar_4393, roar_4394] [nan, nan] \n", "4 [roar, roar] [roar_1019, roar_5550] [nan, nan] \n", "\n", " FAIRsharing_type FAIRsharing_attributes.created-at \\\n", "0 [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan] [nan, nan] \n", "4 [nan, nan] [nan, nan] \n", "\n", " FAIRsharing_attributes.updated-at FAIRsharing_attributes.metadata.doi \\\n", "0 [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan] [nan, nan] \n", "4 [nan, nan] [nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.name FAIRsharing_attributes.metadata.status \\\n", "0 [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan] [nan, nan] \n", "4 [nan, nan] [nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.contacts \\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 [nan, nan, nan] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " 
FAIRsharing_attributes.metadata.homepage \\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 [nan, nan, nan] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.identifier \\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 [nan, nan, nan] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.description \\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 [nan, nan, nan] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.support-links \\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 [nan, nan, nan] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.year-creation \\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 [nan, nan, nan] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.data-processes \\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 [nan, nan, nan] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.legacy-ids \\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 [nan, nan, nan] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.fairsharing-registry \\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 [nan, nan, nan] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.record-type FAIRsharing_attributes.subjects \\\n", "0 [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan] [nan, nan] \n", "4 [nan, nan] [nan, nan] \n", "\n", " FAIRsharing_attributes.domains FAIRsharing_attributes.taxonomies \\\n", "0 [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan] [nan, nan] \n", "4 [nan, nan] [nan, nan] \n", "\n", " FAIRsharing_attributes.user-defined-tags FAIRsharing_attributes.countries \\\n", "0 [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan] [nan, nan] \n", "4 [nan, nan] [nan, nan] \n", "\n", " 
FAIRsharing_attributes.name FAIRsharing_attributes.abbreviation \\\n", "0 [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan] [nan, nan] \n", "4 [nan, nan] [nan, nan] \n", "\n", " FAIRsharing_attributes.url FAIRsharing_attributes.doi \\\n", "0 [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan] [nan, nan] \n", "4 [nan, nan] [nan, nan] \n", "\n", " FAIRsharing_attributes.fairsharing-licence \\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 [nan, nan, nan] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.description FAIRsharing_attributes.publications \\\n", "0 [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan] [nan, nan] \n", "4 [nan, nan] [nan, nan] \n", "\n", " FAIRsharing_attributes.licence-links \\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 [nan, nan, nan] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.citations \\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 [nan, nan, nan] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.abbreviation \\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 [nan, nan, nan] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.access-points \\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 [nan, nan, nan] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.associated-tools \\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 [nan, nan, nan] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.deprecation-date \\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 [nan, nan, nan] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.deprecation-reason \\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 [nan, nan, nan] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " 
FAIRsharing_attributes.metadata.tombstone FAIRsharing_unique_id \\\n", "0 [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan] [nan, nan] \n", "4 [nan, nan] [nan, nan] \n", "\n", " re3data_OpenAIREID re3data_orgIdentifier re3data_repositoryName \\\n", "0 [nan, nan] [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] [nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan] [nan, nan] [nan, nan] \n", "4 [nan, nan] [nan, nan] [nan, nan] \n", "\n", " re3data_additionalName re3data_repositoryURL re3data_repositoryIdentifier \\\n", "0 [nan, nan] [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] [nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan] [nan, nan] [nan, nan] \n", "4 [nan, nan] [nan, nan] [nan, nan] \n", "\n", " re3data_description re3data_type re3data_size re3data_updateDate \\\n", "0 [nan, nan] [nan, nan] [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] [nan, nan] [nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan] [nan, nan] [nan, nan] [nan, nan] \n", "4 [nan, nan] [nan, nan] [nan, nan] [nan, nan] \n", "\n", " re3data_startDate re3data_endDate re3data_subject \\\n", "0 [nan, nan] [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] [nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan] [nan, nan] [nan, nan] \n", "4 [nan, nan] [nan, nan] [nan, nan] \n", "\n", " re3data_missionStatement re3data_contentType re3data_providerType \\\n", "0 [nan, nan] [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] [nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan] [nan, nan] [nan, nan] \n", "4 [nan, nan] [nan, nan] [nan, nan] \n", "\n", " re3data_keyword re3data_institution re3data_policy \\\n", "0 [nan, nan] [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] [nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, 
nan] [nan, nan] [nan, nan] \n", "4 [nan, nan] [nan, nan] [nan, nan] \n", "\n", " re3data_databaseAccess re3data_databaseLicense re3data_dataAccess \\\n", "0 [nan, nan] [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] [nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan] [nan, nan] [nan, nan] \n", "4 [nan, nan] [nan, nan] [nan, nan] \n", "\n", " re3data_dataLicense re3data_dataUpload re3data_dataUploadLicense \\\n", "0 [nan, nan] [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] [nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan] [nan, nan] [nan, nan] \n", "4 [nan, nan] [nan, nan] [nan, nan] \n", "\n", " re3data_software re3data_versioning re3data_api re3data_pidSystem \\\n", "0 [nan, nan] [nan, nan] [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] [nan, nan] [nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan] [nan, nan] [nan, nan] [nan, nan] \n", "4 [nan, nan] [nan, nan] [nan, nan] [nan, nan] \n", "\n", " re3data_citationGuidelineURL re3data_aidSystem re3data_enhancedPublication \\\n", "0 [nan, nan] [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] [nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan] [nan, nan] [nan, nan] \n", "4 [nan, nan] [nan, nan] [nan, nan] \n", "\n", " re3data_qualityManagement re3data_certificate re3data_metadataStandard \\\n", "0 [nan, nan] [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] [nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan] [nan, nan] [nan, nan] \n", "4 [nan, nan] [nan, nan] [nan, nan] \n", "\n", " re3data_syndication re3data_remarks re3data_entryDate re3data_lastUpdate \\\n", "0 [nan, nan] [nan, nan] [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] [nan, nan] [nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan] [nan, nan] [nan, nan] [nan, nan] \n", "4 [nan, nan] [nan, nan] [nan, 
nan] [nan, nan] \n", "\n", " re3data_unique_id OpenDOAR_OpenAIREID OpenDOAR_orgIdentifier \\\n", "0 [nan, nan] [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] [nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan] [nan, nan] [nan, nan] \n", "4 [nan, nan] [nan, nan] [nan, nan] \n", "\n", " OpenDOAR_repositoryName OpenDOAR_alternativeNames OpenDOAR_repositoryURL \\\n", "0 [nan, nan] [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] [nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan] [nan, nan] [nan, nan] \n", "4 [nan, nan] [nan, nan] [nan, nan] \n", "\n", " OpenDOAR_description OpenDOAR_type OpenDOAR_updateDate \\\n", "0 [nan, nan] [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] [nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan] [nan, nan] [nan, nan] \n", "4 [nan, nan] [nan, nan] [nan, nan] \n", "\n", " OpenDOAR_startDate OpenDOAR_subject OpenDOAR_contentType \\\n", "0 [nan, nan] [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] [nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan] [nan, nan] [nan, nan] \n", "4 [nan, nan] [nan, nan] [nan, nan] \n", "\n", " OpenDOAR_institution OpenDOAR_metadataPolicy OpenDOAR_dataPolicy \\\n", "0 [nan, nan] [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] [nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan] [nan, nan] [nan, nan] \n", "4 [nan, nan] [nan, nan] [nan, nan] \n", "\n", " OpenDOAR_submissionPolicy OpenDOAR_contentPolicy OpenDOAR_software \\\n", "0 [nan, nan] [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] [nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan] [nan, nan] [nan, nan] \n", "4 [nan, nan] [nan, nan] [nan, nan] \n", "\n", " OpenDOAR_api OpenDOAR_unique_id roar_eprintid roar_rev_number \\\n", "0 [nan, nan] [nan, nan] [4612, 4649] [28, 8] \n", "1 [nan, nan] [nan, nan] [7943, 8003] [16, 19] \n", "2 [nan, 
nan, nan] [nan, nan, nan] [2670, 2698, 2741] [470, 317, 231] \n", "3 [nan, nan] [nan, nan] [4393, 4394] [14, 14] \n", "4 [nan, nan] [nan, nan] [1019, 5550] [526, 9] \n", "\n", " roar_eprint_status roar_userid roar_importid \\\n", "0 [archive, archive] [1380, 1380] [nan, nan] \n", "1 [archive, archive] [4963, 5023] [nan, nan] \n", "2 [archive, archive, archive] [235, 8, 8] [nan, nan, nan] \n", "3 [archive, archive] [986, 986] [nan, nan] \n", "4 [archive, archive] [1, 8] [nan, nan] \n", "\n", " roar_source roar_dir \\\n", "0 [nan, nan] [disk0/00/00/46/12, disk0/00/00/46/49] \n", "1 [nan, nan] [disk0/00/00/79/43, disk0/00/00/80/03] \n", "2 [nan, nan, nan] [disk0/00/00/26/70, disk0/00/00/26/98, disk0/0... \n", "3 [nan, nan] [disk0/00/00/43/93, disk0/00/00/43/94] \n", "4 [nan, nan] [disk0/00/00/10/19, disk0/00/00/55/50] \n", "\n", " roar_datestamp \\\n", "0 [2012-01-08 03:17:02, 2012-02-05 13:57:01] \n", "1 [2014-03-11 11:54:06, 2014-03-30 18:13:01] \n", "2 [2010-05-04 02:19:51, 2010-05-13 11:01:53, 201... \n", "3 [2011-11-09 23:14:52, 2011-11-09 23:14:46] \n", "4 [2010-01-06 13:45:03, 2012-12-12 01:25:48] \n", "\n", " roar_lastmod \\\n", "0 [2012-04-16 10:53:04, 2012-04-16 10:39:58] \n", "1 [2014-05-08 13:07:12, 2014-05-08 12:55:41] \n", "2 [2011-07-18 06:02:42, 2011-07-06 08:24:10, 201... \n", "3 [2012-02-06 06:58:40, 2012-02-06 06:58:41] \n", "4 [2012-01-19 11:35:09, 2012-12-17 06:53:14] \n", "\n", " roar_status_changed \\\n", "0 [2012-01-08 03:17:02, 2012-02-05 13:57:01] \n", "1 [2014-03-11 11:54:06, 2014-03-30 18:13:01] \n", "2 [2010-05-04 02:19:51, 2010-05-13 11:01:53, 201... 
\n", "3 [2011-11-09 23:14:52, 2011-11-09 23:14:46] \n", "4 [2010-01-06 13:45:03, 2012-12-12 01:25:48] \n", "\n", " roar_type roar_succeeds \\\n", "0 [institutional, institutional] [nan, nan] \n", "1 [institutional, institutional] [nan, nan] \n", "2 [institutional, institutional, institutional] [nan, nan, nan] \n", "3 [institutional, institutional] [nan, nan] \n", "4 [institutional, institutional] [nan, nan] \n", "\n", " roar_commentary roar_metadata_visibility roar_latitude roar_longitude \\\n", "0 [nan, nan] [show, show] [nan, nan] [nan, nan] \n", "1 [nan, nan] [show, show] [nan, nan] [nan, nan] \n", "2 [nan, nan, nan] [show, show, show] [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan] [show, show] [nan, nan] [nan, nan] \n", "4 [nan, nan] [show, show] [nan, nan] [nan, nan] \n", "\n", " roar_relation_type roar_relation_uri roar_item_issues_id \\\n", "0 [nan, nan] [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] [nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan] [nan, nan] [nan, nan] \n", "4 [nan, nan] [nan, nan] [nan, nan] \n", "\n", " roar_item_issues_type roar_item_issues_description \\\n", "0 [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan] [nan, nan] \n", "4 [nan, nan] [nan, nan] \n", "\n", " roar_item_issues_timestamp roar_item_issues_status \\\n", "0 [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan] [nan, nan] \n", "4 [nan, nan] [nan, nan] \n", "\n", " roar_item_issues_reported_by roar_item_issues_resolved_by \\\n", "0 [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan] [nan, nan] \n", "4 [nan, nan] [nan, nan] \n", "\n", " roar_item_issues_comment roar_item_issues_count roar_sword_depositor \\\n", "0 [nan, nan] [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] [nan, nan] \n", "2 [nan, nan, nan] [0, 0, 0] [nan, nan, nan] \n", "3 [nan, nan] 
[nan, nan] [nan, nan] \n", "4 [nan, nan] [0, nan] [nan, nan] \n", "\n", " roar_sword_slug roar_exemplar \\\n", "0 [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan] [nan, nan] \n", "4 [nan, nan] [nan, nan] \n", "\n", " roar_home_page \\\n", "0 [http://dspace.library.iitb.ac.in/jspui/, http... \n", "1 [http://eprints.nirt.res.in/, http://eprints.n... \n", "2 [http://brage.bibsys.no/hsf/, http://brage.bib... \n", "3 [http://159.226.149.42:8088/, http://159.226.1... \n", "4 [http://repository.lib.polyu.edu.hk/, http://r... \n", "\n", " roar_title \\\n", "0 [IIT Bombay Institutional Repository, IIT Bomb... \n", "1 [EPrints@NIRT Library Welcomes! - EPrints@NITR... \n", "2 [HSF Brage Open Research Archive, HSF Brage Op... \n", "3 [Institutional Repository of Kunming Institute... \n", "4 [PolyU Institutional Repository, PolyU Institu... \n", "\n", " roar_oai_pmh \\\n", "0 [http://dspace.library.iitb.ac.in/oai/request,... \n", "1 [http://eprints.nirt.res.in/cgi/oai2, http://e... \n", "2 [http://oai.bibsys.no/oai/repository/nora_hsf_... \n", "3 [http://159.226.149.42:8088/casirgrid-oai/requ... \n", "4 [http://repository.lib.polyu.edu.hk/oai/reques... \n", "\n", " roar_sword_endpoint \\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 [http://brage.bibsys.no/hsf/?locale=en, nan, nan] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " roar_rss_feed roar_twitter_feed \\\n", "0 [http://dspace.library.iitb.ac.in/xmlui/feed/a... [nan, nan] \n", "1 [http://eprints.nirt.res.in/cgi/latest_tool?ou... [nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan] [nan, nan] \n", "4 [nan, nan] [nan, nan] \n", "\n", " roar_description roar_fulltext \\\n", "0 [nan, nan] [TRUE, TRUE] \n", "1 [This is the Institutional Repository of the N... [TRUE, FALSE] \n", "2 [This site provides access to the research out... [TRUE, FALSE, FALSE] \n", "3 [This site provides access to the output of th... 
[TRUE, TRUE] \n", "4 [nan, This is an Institutional repository prov... [TRUE, nan] \n", "\n", " roar_open_access roar_mandate \\\n", "0 [TRUE, TRUE] [TRUE, FALSE] \n", "1 [TRUE, FALSE] [FALSE, FALSE] \n", "2 [TRUE, FALSE, FALSE] [FALSE, FALSE, FALSE] \n", "3 [TRUE, TRUE] [FALSE, FALSE] \n", "4 [TRUE, nan] [nan, nan] \n", "\n", " roar_organisation_title \\\n", "0 [IIT Bombay, IIT Bombay] \n", "1 [National Institute for Research in Tuberculos... \n", "2 [Sogn og Fjordane University College, Høgskule... \n", "3 [ Kunming Institute of Zoology Chinese Academy... \n", "4 [The Hong Kong Polytechnic University Pao Yue-... \n", "\n", " roar_organisation_home_page roar_location_country \\\n", "0 [http://www.iitb.ac.in, http://www.iitb.ac.in] [in, in] \n", "1 [http://www.nirt.res.in/, http://www.nirt.res.in] [in, in] \n", "2 [http://www.hisf.no/, http://www.hisf.no/, htt... [no, no, no] \n", "3 [http://www.kiz.ac.cn/, http://www.kiz.ac.cn/] [cn, cn] \n", "4 [http://www.lib.polyu.edu.hk, http://www.polyu... 
[hk, cn] \n", "\n", " roar_location_city roar_location_latitude \\\n", "0 [Mumbai, Mumbai] [19.133, 19.133] \n", "1 [Chennai, Chennai (Madras)] [nan, 13] \n", "2 [Sogndal, nan, nan] [61.2174, 61.2174, 60.3904] \n", "3 [kunming, kunming] [25.0416, 25.0416] \n", "4 [Hong Kong, nan] [22.25, 22.3964] \n", "\n", " roar_location_longitude roar_software \\\n", "0 [72.9166, 72.9166] [dspace, dspace] \n", "1 [nan, 80] [eprints, eprints] \n", "2 [7.1082, 7.1082, 5.3332] [dspace, dspace, dspace] \n", "3 [102.755, 102.755] [dspace, dspace] \n", "4 [114.167, 114.109] [dspace, dspace] \n", "\n", " roar_geoname roar_version \\\n", "0 [geoname_2_IN, geoname_2_IN] [other, other] \n", "1 [geoname_2_IN, geoname_2_IN] [3.3.15 eps, 3.3.15 eps] \n", "2 [geoname_2_NO, nan, nan] [other, other, other] \n", "3 [geoname_2_CN, geoname_2_CN] [other, other] \n", "4 [geoname_2_HK, geoname_2_CN] [other, other] \n", "\n", " roar_subjects \\\n", "0 [[TN, TA, TK, TH, TP, TD, TJ], [TA, T1]] \n", "1 [[RM, RB], [R1, RZ]] \n", "2 [nan, nan, nan] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " roar_date \\\n", "0 [2011-12-15 09:01:35, 2012-01-05 12:09:37] \n", "1 [2014-03-07 15:07:45, 2014-03-19 07:05:04] \n", "2 [2010-04-06 13:51:52, 2010-05-09 15:12:16, 201... \n", "3 [2010-07-22 16:00:13, 2010-07-22 16:00:13] \n", "4 [2008-10-30 07:50:38, 2012-07-01 15:13:40] \n", "\n", " roar_note \\\n", "0 [nan, nan] \n", "1 [The National Institute for Research in Tuberc... \n", "2 [nan, nan, nan] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " roar_suggestions roar_activity_low \\\n", "0 [nan, nan] [0, nan] \n", "1 [nan, Please include \"Tuberculosis\" as a Speci... 
[nan, nan] \n", "2 [nan, nan, nan] [0, nan, nan] \n", "3 [nan, nan] [0, 0] \n", "4 [nan, nan] [0, 0] \n", "\n", " roar_activity_medium roar_activity_high roar_recordcount \\\n", "0 [0, nan] [0, nan] [99, nan] \n", "1 [nan, nan] [nan, nan] [nan, nan] \n", "2 [0, nan, nan] [0, nan, nan] [50, nan, nan] \n", "3 [0, 0] [0, 0] [100, 100] \n", "4 [0, 0] [0, 0] [86, 86] \n", "\n", " roar_recordhistory roar_fulltexts_total \\\n", "0 [0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,95,... [nan, nan] \n", "1 [nan, nan] [nan, nan] \n", "2 [0,0,1,1,1,4,4,6,6,7,8,11,12,14,15,17,18,18,18... [nan, nan, nan] \n", "3 [0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0... [nan, nan] \n", "4 [0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,54,71,80,... [nan, nan] \n", "\n", " roar_fulltexts_docs roar_fulltexts_rtotal roar_fulltexts_rdocs \\\n", "0 [nan, nan] [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] [nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan] [nan, nan] [nan, nan] \n", "4 [nan, nan] [nan, nan] [nan, nan] \n", "\n", " roar_registry_name \\\n", "0 [celestial, celestial] \n", "1 [[opendoar, celestial], celestial] \n", "2 [[opendoar, celestial], opendoar, opendoar] \n", "3 [celestial, celestial] \n", "4 [[opendoar, roarmap, celestial], [opendoar, ce... 
\n", "\n", " roar_registry_id roar_submit_to roar_submitted_to_name \\\n", "0 [4790, 4789] [nan, nan] [nan, nan] \n", "1 [[5410, 2725], 5430] [nan, nan] [nan, nan] \n", "2 [[1781, 2426], 1781, 1807] [nan, nan, nan] [nan, nan, nan] \n", "3 [4715, 4715] [nan, nan] [nan, nan] \n", "4 [[193, 1456, 1441], [1456, 1441]] [nan, nan] [nan, nan] \n", "\n", " roar_submitted_to_done roar_webometrics_rank roar_webometrics_size \\\n", "0 [nan, nan] [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] [nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan] [nan, nan] [nan, nan] \n", "4 [nan, nan] [nan, nan] [nan, nan] \n", "\n", " roar_webometrics_visibility roar_webometrics_rich_files \\\n", "0 [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan] [nan, nan] \n", "4 [nan, nan] [nan, nan] \n", "\n", " roar_webometrics_scholar roar_monthly_deposits roar_total_deposits \\\n", "0 [nan, nan] [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] [nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan] [nan, nan] [nan, nan] \n", "4 [nan, nan] [nan, nan] [nan, nan] \n", "\n", " roar_association roar_unique_id source_set \n", "0 [nan, nan] [roar_4612, roar_4649] {roar} \n", "1 [nan, nan] [roar_7943, roar_8003] {roar} \n", "2 [nan, nan, nan] [roar_2670, roar_2698, roar_2741] {roar} \n", "3 [nan, nan] [roar_4393, roar_4394] {roar} \n", "4 [nan, nan] [roar_1019, roar_5550] {roar} " ] }, "execution_count": 27, "metadata": {}, "output_type": "execute_result" } ], "source": [ "dup_within = dup_within.groupby('dedup_id').aggregate(list).reset_index()\n", "dup_within['source_set'] = dup_within.source.map(set)\n", "dup_within.head()" ] }, { "cell_type": "code", "execution_count": 28, "metadata": {}, "outputs": [ { "name": "stderr", "output_type": "stream", "text": [ ":1: PerformanceWarning:\n", "\n", "DataFrame is highly fragmented. 
This is usually the result of calling `frame.insert` many times, which has poor performance. Consider using pd.concat instead. To get a de-fragmented frame, use `newframe = frame.copy()`\n", "\n", ":2: PerformanceWarning:\n", "\n", "DataFrame is highly fragmented. This is usually the result of calling `frame.insert` many times, which has poor performance. Consider using pd.concat instead. To get a de-fragmented frame, use `newframe = frame.copy()`\n", "\n" ] }, { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
dedup_idduplicate_idoriginal_idnamesourceunique_idFAIRsharing_idFAIRsharing_typeFAIRsharing_attributes.created-atFAIRsharing_attributes.updated-atFAIRsharing_attributes.metadata.doiFAIRsharing_attributes.metadata.nameFAIRsharing_attributes.metadata.statusFAIRsharing_attributes.metadata.contactsFAIRsharing_attributes.metadata.homepageFAIRsharing_attributes.metadata.identifierFAIRsharing_attributes.metadata.descriptionFAIRsharing_attributes.metadata.support-linksFAIRsharing_attributes.metadata.year-creationFAIRsharing_attributes.metadata.data-processesFAIRsharing_attributes.legacy-idsFAIRsharing_attributes.fairsharing-registryFAIRsharing_attributes.record-typeFAIRsharing_attributes.subjectsFAIRsharing_attributes.domainsFAIRsharing_attributes.taxonomiesFAIRsharing_attributes.user-defined-tagsFAIRsharing_attributes.countriesFAIRsharing_attributes.nameFAIRsharing_attributes.abbreviationFAIRsharing_attributes.urlFAIRsharing_attributes.doiFAIRsharing_attributes.fairsharing-licenceFAIRsharing_attributes.descriptionFAIRsharing_attributes.publicationsFAIRsharing_attributes.licence-linksFAIRsharing_attributes.metadata.citationsFAIRsharing_attributes.metadata.abbreviationFAIRsharing_attributes.metadata.access-pointsFAIRsharing_attributes.metadata.associated-toolsFAIRsharing_attributes.metadata.deprecation-dateFAIRsharing_attributes.metadata.deprecation-reasonFAIRsharing_attributes.metadata.tombstoneFAIRsharing_unique_idre3data_OpenAIREIDre3data_orgIdentifierre3data_repositoryNamere3data_additionalNamere3data_repositoryURLre3data_repositoryIdentifierre3data_descriptionre3data_typere3data_sizere3data_updateDatere3data_startDatere3data_endDatere3data_subjectre3data_missionStatementre3data_contentTypere3data_providerTypere3data_keywordre3data_institutionre3data_policyre3data_databaseAccessre3data_databaseLicensere3data_dataAccessre3data_dataLicensere3data_dataUploadre3data_dataUploadLicensere3data_softwarere3data_versioningre3data_apire3data_pidSystemre3data_citationGuidelineURLre3
data_aidSystemre3data_enhancedPublicationre3data_qualityManagementre3data_certificatere3data_metadataStandardre3data_syndicationre3data_remarksre3data_entryDatere3data_lastUpdatere3data_unique_idOpenDOAR_OpenAIREIDOpenDOAR_orgIdentifierOpenDOAR_repositoryNameOpenDOAR_alternativeNamesOpenDOAR_repositoryURLOpenDOAR_descriptionOpenDOAR_typeOpenDOAR_updateDateOpenDOAR_startDateOpenDOAR_subjectOpenDOAR_contentTypeOpenDOAR_institutionOpenDOAR_metadataPolicyOpenDOAR_dataPolicyOpenDOAR_submissionPolicyOpenDOAR_contentPolicyOpenDOAR_softwareOpenDOAR_apiOpenDOAR_unique_idroar_eprintidroar_rev_numberroar_eprint_statusroar_useridroar_importidroar_sourceroar_dirroar_datestamproar_lastmodroar_status_changedroar_typeroar_succeedsroar_commentaryroar_metadata_visibilityroar_latituderoar_longituderoar_relation_typeroar_relation_uriroar_item_issues_idroar_item_issues_typeroar_item_issues_descriptionroar_item_issues_timestamproar_item_issues_statusroar_item_issues_reported_byroar_item_issues_resolved_byroar_item_issues_commentroar_item_issues_countroar_sword_depositorroar_sword_slugroar_exemplarroar_home_pageroar_titleroar_oai_pmhroar_sword_endpointroar_rss_feedroar_twitter_feedroar_descriptionroar_fulltextroar_open_accessroar_mandateroar_organisation_titleroar_organisation_home_pageroar_location_countryroar_location_cityroar_location_latituderoar_location_longituderoar_softwareroar_geonameroar_versionroar_subjectsroar_dateroar_noteroar_suggestionsroar_activity_lowroar_activity_mediumroar_activity_highroar_recordcountroar_recordhistoryroar_fulltexts_totalroar_fulltexts_docsroar_fulltexts_rtotalroar_fulltexts_rdocsroar_registry_nameroar_registry_idroar_submit_toroar_submitted_to_nameroar_submitted_to_doneroar_webometrics_rankroar_webometrics_sizeroar_webometrics_visibilityroar_webometrics_rich_filesroar_webometrics_scholarroar_monthly_depositsroar_total_depositsroar_associationroar_unique_idsource_set
0dedup::01b6397888c09d84f3dc89d807aa1004[4745, opendoar____::a9365bd906e11324065c35be4...[4745, 2429, 4320][RU-Económicas, ru-económicas, ru económicas][roar, OpenDOAR, OpenDOAR][roar_4745, OpenDOAR_2429, OpenDOAR_4320][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, opendoar____::a9365bd906e11324065c35be47...[nan, 2429, 4320][nan, ru-económicas, ru económicas][nan, [], []][nan, http://ru.iiec.unam.mx/, http://ru.iiec....[nan, this site provides access to the researc...[nan, institutional, institutional][nan, 2021-09-13 13:35:56, 2021-09-13 13:36:17][nan, 2012-02-28 12:12:09, 2019-02-19 10:51:49][nan, [multidisciplinary], [business and econo...[nan, [journal_articles, theses_and_dissertati...[nan, [[universidad nacional autónoma de méxic...[nan, False, False][nan, False, False][nan, False, False][nan, False, False][nan, eprints 3.3.15, eprints ][nan, true , 
false ][nan, OpenDOAR_2429, OpenDOAR_4320][4745, nan, nan][31, nan, nan][archive, nan, nan][1447, nan, nan][nan, nan, nan][nan, nan, nan][disk0/00/00/47/45, nan, nan][2012-02-05 14:27:15, nan, nan][2012-04-16 10:34:36, nan, nan][2012-02-05 14:27:15, nan, nan][institutional, nan, nan][nan, nan, nan][nan, nan, nan][show, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][http://ru.iiec.unam.mx, nan, nan][RU-Económicas, nan, nan][http://ru.iiec.unam.mx/cgi/oai2, nan, nan][nan, nan, nan][http://ru.iiec.unam.mx/cgi/latest_tool?output...[nan, nan, nan][Productos académicos del Instituto de Investi...[TRUE, nan, nan][TRUE, nan, nan][TRUE, nan, nan][Instituto de Investigaciones Económicas UNAM,...[http://www.iiec.unam.mx/, nan, nan][mx, nan, nan][Mexico, nan, nan][19.3162, nan, nan][-99.1799, nan, nan][eprints, nan, nan][geoname_2_MX, nan, nan][3.3.15 eps, nan, nan][[HB, HD, HT, GF, HC, HF, HJ, HN, HX, H1, HG, ...[2012-02-03 05:18:16, nan, nan][nan, nan, nan][nan, nan, nan][0, nan, nan][0, nan, nan][0, nan, nan][94, nan, nan][0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,3,7...[nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][[opendoar, celestial], nan, nan][[4818, 2429], nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][roar_4745, nan, nan]{OpenDOAR, roar}
1dedup::03db60c2331018b18c4166c1787072fe[opendoar____::78bc62d08a9a0b9b0b9c0ad339ef82d...[3087, 4500, 8504][landmark university repository, landmark univ...[OpenDOAR, OpenDOAR, roar][OpenDOAR_3087, OpenDOAR_4500, roar_8504][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][opendoar____::78bc62d08a9a0b9b0b9c0ad339ef82d...[3087, 4500, nan][landmark university repository, landmark univ...[[], [], nan][http://eprints.lmu.edu.ng/, http://eprints.lm...[this site provides access to the multi-discip...[institutional, institutional, nan][2021-09-13 13:36:06, 2021-02-18 18:01:12, nan][2014-06-16 13:36:00, 2019-03-26 14:07:30, nan][[multidisciplinary], [multidisciplinary], nan][[journal_articles], [journal_articles, biblio...[[[landmark university, [], ng, http://lmu.edu...[False, False, nan][False, False, nan][False, False, nan][False, False, nan][eprints 3.3.12, eprints , 
nan][true , false , nan][OpenDOAR_3087, OpenDOAR_4500, nan][nan, nan, 8504][nan, nan, 12][nan, nan, archive][nan, nan, 5459][nan, nan, nan][nan, nan, nan][nan, nan, disk0/00/00/85/04][nan, nan, 2014-06-24 10:14:07][nan, nan, 2014-06-28 01:38:49][nan, nan, 2014-06-24 10:14:07][nan, nan, institutional][nan, nan, nan][nan, nan, nan][nan, nan, show][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, http://eprints.lmu.edu.ng][nan, nan, Landmark University Repository][nan, nan, http://eprints.lmu.edu.ng/cgi/oai][nan, nan, nan][nan, nan, http://eprints.lmu.edu.ng/cgi/lates...[nan, nan, nan][nan, nan, nan][nan, nan, TRUE][nan, nan, TRUE][nan, nan, TRUE][nan, nan, Landmark University][nan, nan, http://lmu.edu.ng][nan, nan, ng][nan, nan, Omu-Aran][nan, nan, 8.12421][nan, nan, 5.09488][nan, nan, eprints][nan, nan, geoname_2_NG][nan, nan, 3.3.16 eps][nan, nan, nan][nan, nan, 2014-06-07 22:16:23][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, [opendoar, celestial]][nan, nan, [3087, 5621]][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, roar_8504]{OpenDOAR, roar}
2dedup::05128e44e27c36bdba71221bfccf735d[opendoar____::426f990b332ef8193a61cc90516c124...[2318, 5503, 4271][iława biblioteka cyrfrowa (iława digital libr...[OpenDOAR, roar, roar][OpenDOAR_2318, roar_5503, roar_4271][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][opendoar____::426f990b332ef8193a61cc90516c124...[2318, nan, nan][iława biblioteka cyrfrowa (iława digital libr...[[], nan, nan][http://ibc.ilawa.pl/dlibra, nan, nan][this site provides access to digitised articl...[governmental, nan, nan][2019-10-17 14:34:36, nan, nan][2011-10-11 13:13:58, nan, nan][[multidisciplinary], nan, nan][[journal_articles], nan, nan][[[iława, [], pl, http://www.ilawa.pl/_portal,...[False, nan, nan][False, nan, nan][False, nan, nan][False, nan, nan][dlibra 4, nan, nan][true , nan, nan][OpenDOAR_2318, nan, nan][nan, 5503, 4271][nan, 9, 11][nan, archive, archive][nan, 8, 8][nan, nan, 
nan][nan, nan, nan][nan, disk0/00/00/55/03, disk0/00/00/42/71][nan, 2012-11-19 20:33:30, 2011-10-27 01:25:14][nan, 2012-11-26 06:53:42, 2011-12-19 07:07:23][nan, 2012-11-19 20:33:30, 2011-10-27 01:25:14][nan, other, other][nan, nan, nan][nan, nan, nan][nan, show, show][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, http://ibc.ilawa.pl/dlibra, http://ibc.i...[nan, Iława Biblioteka Cyrfrowa (Iława Digital...[nan, http://ibc.ilawa.pl/dlibra/oai-pmh-repos...[nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, This site provides access to digitised a...[nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, Iława, Iława][nan, http://www.ilawa.pl/_portal, http://www....[nan, pl, pl][nan, nan, nan][nan, 53.596, 53.596][nan, 19.5684, 19.5684][nan, nan, nan][nan, geoname_2_PL, geoname_2_PL][nan, other, other][nan, nan, nan][nan, 2012-07-01 15:13:09, 2009-10-12 10:46:08][nan, nan, nan][nan, nan, nan][nan, 0, 0][nan, 0, 0][nan, 0, 0][nan, 20, 20][nan, 0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,3,...[nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, [opendoar, celestial], [opendoar, celest...[nan, [2318, 4672], [2318, 4672]][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, roar_5503, roar_4271]{OpenDOAR, roar}
3dedup::069059b7ef840f0c74a814ec9237b6ec[5711, 126, opendoar____::1cd3882394520876dc88...[5711, 126, 1509][Bibioteca Digital Ação Educativa, Biblioteca ...[roar, roar, OpenDOAR][roar_5711, roar_126, OpenDOAR_1509][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, opendoar____::1cd3882394520876dc88d...[nan, nan, 1509][nan, nan, bibioteca digital ação educativa][nan, nan, []][nan, nan, http://www.bdae.org.br/dspace/][nan, nan, this site provides access to the ou...[nan, nan, institutional][nan, nan, 2019-10-17 14:34:23][nan, nan, 2009-05-01 10:10:47][nan, nan, [education]][nan, nan, [theses_and_dissertations, unpub_re...[nan, nan, [[ação educativa, [], br, http://ww...[nan, nan, False][nan, nan, False][nan, nan, False][nan, nan, False][nan, nan, dspace ][nan, nan, true ][nan, nan, OpenDOAR_1509][5711, 126, nan][9, 503, nan][archive, archive, nan][8, 1, 
nan][nan, nan, nan][nan, nan, nan][disk0/00/00/57/11, disk0/00/00/01/26, nan][2012-12-12 04:37:14, 2010-01-06 13:43:56, nan][2012-12-17 06:53:38, 2011-07-18 05:42:07, nan][2012-12-12 04:37:14, 2010-01-06 13:43:56, nan][institutional, other, nan][nan, nan, nan][nan, nan, nan][show, show, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, 0, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][http://www.bdae.org.br/dspace/, http://www.bd...[Bibioteca Digital Ação Educativa, Biblioteca ...[http://www.bdae.org.br/dspace-oai/request, ht...[nan, nan, nan][nan, nan, nan][nan, nan, nan][This site provides access to the output of th...[nan, nan, nan][nan, nan, nan][nan, nan, nan][Ação Educativa, Ação Educativa, nan][http://www.acaoeducativa.org/, http://www.aca...[br, br, nan][nan, São Paulo, nan][-23.5445, -23.5445, nan][-46.6509, -46.6509, nan][dspace, dspace, nan][geoname_2_BR, geoname_2_BR, nan][other, other, nan][nan, nan, nan][2012-07-22 15:12:34, 2008-03-31 20:07:33, nan][nan, nan, nan][nan, nan, nan][0, 0, nan][0, 0, nan][0, 0, nan][100, 100, nan][0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,97,100,...[nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][[opendoar, celestial], [opendoar, celestial],...[[1509, 1430], [1509, 1430], nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][roar_5711, roar_126, nan]{OpenDOAR, roar}
4dedup::0e139b17a92b2df7d6c3c840e51465fe[4379, 4266, opendoar____::f976b57bb9dd27aa2e7...[4379, 4266, 2306][Institutional Repository of Ningbo Institute ...[roar, roar, OpenDOAR][roar_4379, roar_4266, OpenDOAR_2306][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, opendoar____::f976b57bb9dd27aa2e7e7...[nan, nan, 2306][nan, nan, institutional repository of ningbo ...[nan, nan, [nimte openir]][nan, nan, http://ir.nimte.ac.cn/][nan, nan, this site provides access to the ou...[nan, nan, institutional][nan, nan, 2019-10-17 14:34:36][nan, nan, 2011-10-10 13:13:11][nan, nan, [technology general, mechanical eng...[nan, nan, [journal_articles, bibliographic_re...[nan, nan, [[chinese academy of science (中国科学院...[nan, nan, False][nan, nan, False][nan, nan, False][nan, nan, False][nan, nan, dspace ][nan, nan, true ][nan, nan, OpenDOAR_2306][4379, 4266, nan][15, 11, 
nan][archive, archive, nan][986, 8, nan][nan, nan, nan][nan, nan, nan][disk0/00/00/43/79, disk0/00/00/42/66, nan][2011-11-09 23:16:22, 2011-10-27 01:26:05, nan][2011-12-21 15:25:04, 2011-12-19 07:07:21, nan][2011-11-09 23:16:22, 2011-10-27 01:26:05, nan][institutional, institutional, nan][nan, nan, nan][nan, nan, nan][show, show, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][http://ir.nimte.ac.cn/, http://ir.nimte.ac.cn...[Institutional Repository of Ningbo Institute ...[http://ir.nimte.ac.cn/casirgrid-oai/request, ...[nan, nan, nan][nan, nan, nan][nan, nan, nan][This site provides access to the output of th...[TRUE, nan, nan][TRUE, nan, nan][FALSE, nan, nan][Ningbo Institute of Material Technology & Eng...[http://www.nimte.ac.cn/, http://www.cas.cn/, ...[cn, cn, nan][ningbo, nan, nan][29.8807, 29.8807, nan][121.672, 121.672, nan][dspace, dspace, nan][geoname_2_CN, geoname_2_CN, nan][other, other, nan][nan, nan, nan][2009-12-21 02:27:07, 2009-12-21 02:27:07, nan][nan, nan, nan][nan, nan, nan][0, 0, nan][0, 0, nan][0, 0, nan][100, 100, nan][0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0...[nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][celestial, [opendoar, celestial], nan][4668, [4668, 2306], nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][nan, nan, nan][roar_4379, roar_4266, nan]{OpenDOAR, roar}
\n", "
" ], "text/plain": [ " dedup_id \\\n", "0 dedup::01b6397888c09d84f3dc89d807aa1004 \n", "1 dedup::03db60c2331018b18c4166c1787072fe \n", "2 dedup::05128e44e27c36bdba71221bfccf735d \n", "3 dedup::069059b7ef840f0c74a814ec9237b6ec \n", "4 dedup::0e139b17a92b2df7d6c3c840e51465fe \n", "\n", " duplicate_id original_id \\\n", "0 [4745, opendoar____::a9365bd906e11324065c35be4... [4745, 2429, 4320] \n", "1 [opendoar____::78bc62d08a9a0b9b0b9c0ad339ef82d... [3087, 4500, 8504] \n", "2 [opendoar____::426f990b332ef8193a61cc90516c124... [2318, 5503, 4271] \n", "3 [5711, 126, opendoar____::1cd3882394520876dc88... [5711, 126, 1509] \n", "4 [4379, 4266, opendoar____::f976b57bb9dd27aa2e7... [4379, 4266, 2306] \n", "\n", " name \\\n", "0 [RU-Económicas, ru-económicas, ru económicas] \n", "1 [landmark university repository, landmark univ... \n", "2 [iława biblioteka cyrfrowa (iława digital libr... \n", "3 [Bibioteca Digital Ação Educativa, Biblioteca ... \n", "4 [Institutional Repository of Ningbo Institute ... 
\n", "\n", " source unique_id \\\n", "0 [roar, OpenDOAR, OpenDOAR] [roar_4745, OpenDOAR_2429, OpenDOAR_4320] \n", "1 [OpenDOAR, OpenDOAR, roar] [OpenDOAR_3087, OpenDOAR_4500, roar_8504] \n", "2 [OpenDOAR, roar, roar] [OpenDOAR_2318, roar_5503, roar_4271] \n", "3 [roar, roar, OpenDOAR] [roar_5711, roar_126, OpenDOAR_1509] \n", "4 [roar, roar, OpenDOAR] [roar_4379, roar_4266, OpenDOAR_2306] \n", "\n", " FAIRsharing_id FAIRsharing_type FAIRsharing_attributes.created-at \\\n", "0 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "1 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "\n", " FAIRsharing_attributes.updated-at FAIRsharing_attributes.metadata.doi \\\n", "0 [nan, nan, nan] [nan, nan, nan] \n", "1 [nan, nan, nan] [nan, nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan, nan] [nan, nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.name FAIRsharing_attributes.metadata.status \\\n", "0 [nan, nan, nan] [nan, nan, nan] \n", "1 [nan, nan, nan] [nan, nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan, nan] [nan, nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.contacts \\\n", "0 [nan, nan, nan] \n", "1 [nan, nan, nan] \n", "2 [nan, nan, nan] \n", "3 [nan, nan, nan] \n", "4 [nan, nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.homepage \\\n", "0 [nan, nan, nan] \n", "1 [nan, nan, nan] \n", "2 [nan, nan, nan] \n", "3 [nan, nan, nan] \n", "4 [nan, nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.identifier \\\n", "0 [nan, nan, nan] \n", "1 [nan, nan, nan] \n", "2 [nan, nan, nan] \n", "3 [nan, nan, nan] \n", "4 [nan, nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.description \\\n", "0 [nan, nan, nan] \n", "1 [nan, nan, nan] \n", "2 [nan, nan, nan] \n", "3 
[nan, nan, nan] \n", "4 [nan, nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.support-links \\\n", "0 [nan, nan, nan] \n", "1 [nan, nan, nan] \n", "2 [nan, nan, nan] \n", "3 [nan, nan, nan] \n", "4 [nan, nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.year-creation \\\n", "0 [nan, nan, nan] \n", "1 [nan, nan, nan] \n", "2 [nan, nan, nan] \n", "3 [nan, nan, nan] \n", "4 [nan, nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.data-processes \\\n", "0 [nan, nan, nan] \n", "1 [nan, nan, nan] \n", "2 [nan, nan, nan] \n", "3 [nan, nan, nan] \n", "4 [nan, nan, nan] \n", "\n", " FAIRsharing_attributes.legacy-ids \\\n", "0 [nan, nan, nan] \n", "1 [nan, nan, nan] \n", "2 [nan, nan, nan] \n", "3 [nan, nan, nan] \n", "4 [nan, nan, nan] \n", "\n", " FAIRsharing_attributes.fairsharing-registry \\\n", "0 [nan, nan, nan] \n", "1 [nan, nan, nan] \n", "2 [nan, nan, nan] \n", "3 [nan, nan, nan] \n", "4 [nan, nan, nan] \n", "\n", " FAIRsharing_attributes.record-type FAIRsharing_attributes.subjects \\\n", "0 [nan, nan, nan] [nan, nan, nan] \n", "1 [nan, nan, nan] [nan, nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan, nan] [nan, nan, nan] \n", "\n", " FAIRsharing_attributes.domains FAIRsharing_attributes.taxonomies \\\n", "0 [nan, nan, nan] [nan, nan, nan] \n", "1 [nan, nan, nan] [nan, nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan, nan] [nan, nan, nan] \n", "\n", " FAIRsharing_attributes.user-defined-tags FAIRsharing_attributes.countries \\\n", "0 [nan, nan, nan] [nan, nan, nan] \n", "1 [nan, nan, nan] [nan, nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan, nan] [nan, nan, nan] \n", "\n", " FAIRsharing_attributes.name FAIRsharing_attributes.abbreviation \\\n", "0 [nan, nan, nan] [nan, nan, nan] \n", "1 [nan, nan, nan] [nan, nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, 
nan, nan] [nan, nan, nan] \n", "4 [nan, nan, nan] [nan, nan, nan] \n", "\n", " FAIRsharing_attributes.url FAIRsharing_attributes.doi \\\n", "0 [nan, nan, nan] [nan, nan, nan] \n", "1 [nan, nan, nan] [nan, nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan, nan] [nan, nan, nan] \n", "\n", " FAIRsharing_attributes.fairsharing-licence \\\n", "0 [nan, nan, nan] \n", "1 [nan, nan, nan] \n", "2 [nan, nan, nan] \n", "3 [nan, nan, nan] \n", "4 [nan, nan, nan] \n", "\n", " FAIRsharing_attributes.description FAIRsharing_attributes.publications \\\n", "0 [nan, nan, nan] [nan, nan, nan] \n", "1 [nan, nan, nan] [nan, nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan, nan] [nan, nan, nan] \n", "\n", " FAIRsharing_attributes.licence-links \\\n", "0 [nan, nan, nan] \n", "1 [nan, nan, nan] \n", "2 [nan, nan, nan] \n", "3 [nan, nan, nan] \n", "4 [nan, nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.citations \\\n", "0 [nan, nan, nan] \n", "1 [nan, nan, nan] \n", "2 [nan, nan, nan] \n", "3 [nan, nan, nan] \n", "4 [nan, nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.abbreviation \\\n", "0 [nan, nan, nan] \n", "1 [nan, nan, nan] \n", "2 [nan, nan, nan] \n", "3 [nan, nan, nan] \n", "4 [nan, nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.access-points \\\n", "0 [nan, nan, nan] \n", "1 [nan, nan, nan] \n", "2 [nan, nan, nan] \n", "3 [nan, nan, nan] \n", "4 [nan, nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.associated-tools \\\n", "0 [nan, nan, nan] \n", "1 [nan, nan, nan] \n", "2 [nan, nan, nan] \n", "3 [nan, nan, nan] \n", "4 [nan, nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.deprecation-date \\\n", "0 [nan, nan, nan] \n", "1 [nan, nan, nan] \n", "2 [nan, nan, nan] \n", "3 [nan, nan, nan] \n", "4 [nan, nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.deprecation-reason \\\n", "0 [nan, nan, nan] \n", "1 [nan, nan, nan] \n", "2 
[nan, nan, nan] \n", "3 [nan, nan, nan] \n", "4 [nan, nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.tombstone FAIRsharing_unique_id \\\n", "0 [nan, nan, nan] [nan, nan, nan] \n", "1 [nan, nan, nan] [nan, nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan, nan] [nan, nan, nan] \n", "\n", " re3data_OpenAIREID re3data_orgIdentifier re3data_repositoryName \\\n", "0 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "1 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "\n", " re3data_additionalName re3data_repositoryURL re3data_repositoryIdentifier \\\n", "0 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "1 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "\n", " re3data_description re3data_type re3data_size re3data_updateDate \\\n", "0 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "1 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "\n", " re3data_startDate re3data_endDate re3data_subject \\\n", "0 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "1 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "\n", " re3data_missionStatement re3data_contentType re3data_providerType \\\n", "0 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", 
"1 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "\n", " re3data_keyword re3data_institution re3data_policy \\\n", "0 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "1 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "\n", " re3data_databaseAccess re3data_databaseLicense re3data_dataAccess \\\n", "0 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "1 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "\n", " re3data_dataLicense re3data_dataUpload re3data_dataUploadLicense \\\n", "0 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "1 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "\n", " re3data_software re3data_versioning re3data_api re3data_pidSystem \\\n", "0 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "1 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "\n", " re3data_citationGuidelineURL re3data_aidSystem re3data_enhancedPublication \\\n", "0 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "1 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, 
nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "\n", " re3data_qualityManagement re3data_certificate re3data_metadataStandard \\\n", "0 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "1 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "\n", " re3data_syndication re3data_remarks re3data_entryDate re3data_lastUpdate \\\n", "0 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "1 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "\n", " re3data_unique_id OpenDOAR_OpenAIREID \\\n", "0 [nan, nan, nan] [nan, opendoar____::a9365bd906e11324065c35be47... \n", "1 [nan, nan, nan] [opendoar____::78bc62d08a9a0b9b0b9c0ad339ef82d... \n", "2 [nan, nan, nan] [opendoar____::426f990b332ef8193a61cc90516c124... \n", "3 [nan, nan, nan] [nan, nan, opendoar____::1cd3882394520876dc88d... \n", "4 [nan, nan, nan] [nan, nan, opendoar____::f976b57bb9dd27aa2e7e7... \n", "\n", " OpenDOAR_orgIdentifier OpenDOAR_repositoryName \\\n", "0 [nan, 2429, 4320] [nan, ru-económicas, ru económicas] \n", "1 [3087, 4500, nan] [landmark university repository, landmark univ... \n", "2 [2318, nan, nan] [iława biblioteka cyrfrowa (iława digital libr... \n", "3 [nan, nan, 1509] [nan, nan, bibioteca digital ação educativa] \n", "4 [nan, nan, 2306] [nan, nan, institutional repository of ningbo ... 
\n", "\n", " OpenDOAR_alternativeNames \\\n", "0 [nan, [], []] \n", "1 [[], [], nan] \n", "2 [[], nan, nan] \n", "3 [nan, nan, []] \n", "4 [nan, nan, [nimte openir]] \n", "\n", " OpenDOAR_repositoryURL \\\n", "0 [nan, http://ru.iiec.unam.mx/, http://ru.iiec.... \n", "1 [http://eprints.lmu.edu.ng/, http://eprints.lm... \n", "2 [http://ibc.ilawa.pl/dlibra, nan, nan] \n", "3 [nan, nan, http://www.bdae.org.br/dspace/] \n", "4 [nan, nan, http://ir.nimte.ac.cn/] \n", "\n", " OpenDOAR_description \\\n", "0 [nan, this site provides access to the researc... \n", "1 [this site provides access to the multi-discip... \n", "2 [this site provides access to digitised articl... \n", "3 [nan, nan, this site provides access to the ou... \n", "4 [nan, nan, this site provides access to the ou... \n", "\n", " OpenDOAR_type \\\n", "0 [nan, institutional, institutional] \n", "1 [institutional, institutional, nan] \n", "2 [governmental, nan, nan] \n", "3 [nan, nan, institutional] \n", "4 [nan, nan, institutional] \n", "\n", " OpenDOAR_updateDate \\\n", "0 [nan, 2021-09-13 13:35:56, 2021-09-13 13:36:17] \n", "1 [2021-09-13 13:36:06, 2021-02-18 18:01:12, nan] \n", "2 [2019-10-17 14:34:36, nan, nan] \n", "3 [nan, nan, 2019-10-17 14:34:23] \n", "4 [nan, nan, 2019-10-17 14:34:36] \n", "\n", " OpenDOAR_startDate \\\n", "0 [nan, 2012-02-28 12:12:09, 2019-02-19 10:51:49] \n", "1 [2014-06-16 13:36:00, 2019-03-26 14:07:30, nan] \n", "2 [2011-10-11 13:13:58, nan, nan] \n", "3 [nan, nan, 2009-05-01 10:10:47] \n", "4 [nan, nan, 2011-10-10 13:13:11] \n", "\n", " OpenDOAR_subject \\\n", "0 [nan, [multidisciplinary], [business and econo... \n", "1 [[multidisciplinary], [multidisciplinary], nan] \n", "2 [[multidisciplinary], nan, nan] \n", "3 [nan, nan, [education]] \n", "4 [nan, nan, [technology general, mechanical eng... \n", "\n", " OpenDOAR_contentType \\\n", "0 [nan, [journal_articles, theses_and_dissertati... \n", "1 [[journal_articles], [journal_articles, biblio... 
\n", "2 [[journal_articles], nan, nan] \n", "3 [nan, nan, [theses_and_dissertations, unpub_re... \n", "4 [nan, nan, [journal_articles, bibliographic_re... \n", "\n", " OpenDOAR_institution OpenDOAR_metadataPolicy \\\n", "0 [nan, [[universidad nacional autónoma de méxic... [nan, False, False] \n", "1 [[[landmark university, [], ng, http://lmu.edu... [False, False, nan] \n", "2 [[[iława, [], pl, http://www.ilawa.pl/_portal,... [False, nan, nan] \n", "3 [nan, nan, [[ação educativa, [], br, http://ww... [nan, nan, False] \n", "4 [nan, nan, [[chinese academy of science (中国科学院... [nan, nan, False] \n", "\n", " OpenDOAR_dataPolicy OpenDOAR_submissionPolicy OpenDOAR_contentPolicy \\\n", "0 [nan, False, False] [nan, False, False] [nan, False, False] \n", "1 [False, False, nan] [False, False, nan] [False, False, nan] \n", "2 [False, nan, nan] [False, nan, nan] [False, nan, nan] \n", "3 [nan, nan, False] [nan, nan, False] [nan, nan, False] \n", "4 [nan, nan, False] [nan, nan, False] [nan, nan, False] \n", "\n", " OpenDOAR_software OpenDOAR_api \\\n", "0 [nan, eprints 3.3.15, eprints ] [nan, true , false ] \n", "1 [eprints 3.3.12, eprints , nan] [true , false , nan] \n", "2 [dlibra 4, nan, nan] [true , nan, nan] \n", "3 [nan, nan, dspace ] [nan, nan, true ] \n", "4 [nan, nan, dspace ] [nan, nan, true ] \n", "\n", " OpenDOAR_unique_id roar_eprintid roar_rev_number \\\n", "0 [nan, OpenDOAR_2429, OpenDOAR_4320] [4745, nan, nan] [31, nan, nan] \n", "1 [OpenDOAR_3087, OpenDOAR_4500, nan] [nan, nan, 8504] [nan, nan, 12] \n", "2 [OpenDOAR_2318, nan, nan] [nan, 5503, 4271] [nan, 9, 11] \n", "3 [nan, nan, OpenDOAR_1509] [5711, 126, nan] [9, 503, nan] \n", "4 [nan, nan, OpenDOAR_2306] [4379, 4266, nan] [15, 11, nan] \n", "\n", " roar_eprint_status roar_userid roar_importid \\\n", "0 [archive, nan, nan] [1447, nan, nan] [nan, nan, nan] \n", "1 [nan, nan, archive] [nan, nan, 5459] [nan, nan, nan] \n", "2 [nan, archive, archive] [nan, 8, 8] [nan, nan, nan] \n", "3 [archive, archive, nan] 
[8, 1, nan] [nan, nan, nan] \n", "4 [archive, archive, nan] [986, 8, nan] [nan, nan, nan] \n", "\n", " roar_source roar_dir \\\n", "0 [nan, nan, nan] [disk0/00/00/47/45, nan, nan] \n", "1 [nan, nan, nan] [nan, nan, disk0/00/00/85/04] \n", "2 [nan, nan, nan] [nan, disk0/00/00/55/03, disk0/00/00/42/71] \n", "3 [nan, nan, nan] [disk0/00/00/57/11, disk0/00/00/01/26, nan] \n", "4 [nan, nan, nan] [disk0/00/00/43/79, disk0/00/00/42/66, nan] \n", "\n", " roar_datestamp \\\n", "0 [2012-02-05 14:27:15, nan, nan] \n", "1 [nan, nan, 2014-06-24 10:14:07] \n", "2 [nan, 2012-11-19 20:33:30, 2011-10-27 01:25:14] \n", "3 [2012-12-12 04:37:14, 2010-01-06 13:43:56, nan] \n", "4 [2011-11-09 23:16:22, 2011-10-27 01:26:05, nan] \n", "\n", " roar_lastmod \\\n", "0 [2012-04-16 10:34:36, nan, nan] \n", "1 [nan, nan, 2014-06-28 01:38:49] \n", "2 [nan, 2012-11-26 06:53:42, 2011-12-19 07:07:23] \n", "3 [2012-12-17 06:53:38, 2011-07-18 05:42:07, nan] \n", "4 [2011-12-21 15:25:04, 2011-12-19 07:07:21, nan] \n", "\n", " roar_status_changed \\\n", "0 [2012-02-05 14:27:15, nan, nan] \n", "1 [nan, nan, 2014-06-24 10:14:07] \n", "2 [nan, 2012-11-19 20:33:30, 2011-10-27 01:25:14] \n", "3 [2012-12-12 04:37:14, 2010-01-06 13:43:56, nan] \n", "4 [2011-11-09 23:16:22, 2011-10-27 01:26:05, nan] \n", "\n", " roar_type roar_succeeds roar_commentary \\\n", "0 [institutional, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "1 [nan, nan, institutional] [nan, nan, nan] [nan, nan, nan] \n", "2 [nan, other, other] [nan, nan, nan] [nan, nan, nan] \n", "3 [institutional, other, nan] [nan, nan, nan] [nan, nan, nan] \n", "4 [institutional, institutional, nan] [nan, nan, nan] [nan, nan, nan] \n", "\n", " roar_metadata_visibility roar_latitude roar_longitude \\\n", "0 [show, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "1 [nan, nan, show] [nan, nan, nan] [nan, nan, nan] \n", "2 [nan, show, show] [nan, nan, nan] [nan, nan, nan] \n", "3 [show, show, nan] [nan, nan, nan] [nan, nan, nan] \n", "4 [show, show, nan] [nan, 
nan, nan] [nan, nan, nan] \n", "\n", " roar_relation_type roar_relation_uri roar_item_issues_id \\\n", "0 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "1 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "\n", " roar_item_issues_type roar_item_issues_description \\\n", "0 [nan, nan, nan] [nan, nan, nan] \n", "1 [nan, nan, nan] [nan, nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan, nan] [nan, nan, nan] \n", "\n", " roar_item_issues_timestamp roar_item_issues_status \\\n", "0 [nan, nan, nan] [nan, nan, nan] \n", "1 [nan, nan, nan] [nan, nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan, nan] [nan, nan, nan] \n", "\n", " roar_item_issues_reported_by roar_item_issues_resolved_by \\\n", "0 [nan, nan, nan] [nan, nan, nan] \n", "1 [nan, nan, nan] [nan, nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan, nan] [nan, nan, nan] \n", "\n", " roar_item_issues_comment roar_item_issues_count roar_sword_depositor \\\n", "0 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "1 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan, nan] [nan, 0, nan] [nan, nan, nan] \n", "4 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "\n", " roar_sword_slug roar_exemplar \\\n", "0 [nan, nan, nan] [nan, nan, nan] \n", "1 [nan, nan, nan] [nan, nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan, nan] [nan, nan, nan] \n", "\n", " roar_home_page \\\n", "0 [http://ru.iiec.unam.mx, nan, nan] \n", "1 [nan, nan, http://eprints.lmu.edu.ng] \n", "2 [nan, http://ibc.ilawa.pl/dlibra, http://ibc.i... 
\n", "3 [http://www.bdae.org.br/dspace/, http://www.bd... \n", "4 [http://ir.nimte.ac.cn/, http://ir.nimte.ac.cn... \n", "\n", " roar_title \\\n", "0 [RU-Económicas, nan, nan] \n", "1 [nan, nan, Landmark University Repository] \n", "2 [nan, Iława Biblioteka Cyrfrowa (Iława Digital... \n", "3 [Bibioteca Digital Ação Educativa, Biblioteca ... \n", "4 [Institutional Repository of Ningbo Institute ... \n", "\n", " roar_oai_pmh roar_sword_endpoint \\\n", "0 [http://ru.iiec.unam.mx/cgi/oai2, nan, nan] [nan, nan, nan] \n", "1 [nan, nan, http://eprints.lmu.edu.ng/cgi/oai] [nan, nan, nan] \n", "2 [nan, http://ibc.ilawa.pl/dlibra/oai-pmh-repos... [nan, nan, nan] \n", "3 [http://www.bdae.org.br/dspace-oai/request, ht... [nan, nan, nan] \n", "4 [http://ir.nimte.ac.cn/casirgrid-oai/request, ... [nan, nan, nan] \n", "\n", " roar_rss_feed roar_twitter_feed \\\n", "0 [http://ru.iiec.unam.mx/cgi/latest_tool?output... [nan, nan, nan] \n", "1 [nan, nan, http://eprints.lmu.edu.ng/cgi/lates... [nan, nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan, nan] [nan, nan, nan] \n", "\n", " roar_description roar_fulltext \\\n", "0 [Productos académicos del Instituto de Investi... [TRUE, nan, nan] \n", "1 [nan, nan, nan] [nan, nan, TRUE] \n", "2 [nan, This site provides access to digitised a... [nan, nan, nan] \n", "3 [This site provides access to the output of th... [nan, nan, nan] \n", "4 [This site provides access to the output of th... [TRUE, nan, nan] \n", "\n", " roar_open_access roar_mandate \\\n", "0 [TRUE, nan, nan] [TRUE, nan, nan] \n", "1 [nan, nan, TRUE] [nan, nan, TRUE] \n", "2 [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] \n", "4 [TRUE, nan, nan] [FALSE, nan, nan] \n", "\n", " roar_organisation_title \\\n", "0 [Instituto de Investigaciones Económicas UNAM,... 
\n", "1 [nan, nan, Landmark University] \n", "2 [nan, Iława, Iława] \n", "3 [Ação Educativa, Ação Educativa, nan] \n", "4 [Ningbo Institute of Material Technology & Eng... \n", "\n", " roar_organisation_home_page roar_location_country \\\n", "0 [http://www.iiec.unam.mx/, nan, nan] [mx, nan, nan] \n", "1 [nan, nan, http://lmu.edu.ng] [nan, nan, ng] \n", "2 [nan, http://www.ilawa.pl/_portal, http://www.... [nan, pl, pl] \n", "3 [http://www.acaoeducativa.org/, http://www.aca... [br, br, nan] \n", "4 [http://www.nimte.ac.cn/, http://www.cas.cn/, ... [cn, cn, nan] \n", "\n", " roar_location_city roar_location_latitude \\\n", "0 [Mexico, nan, nan] [19.3162, nan, nan] \n", "1 [nan, nan, Omu-Aran] [nan, nan, 8.12421] \n", "2 [nan, nan, nan] [nan, 53.596, 53.596] \n", "3 [nan, São Paulo, nan] [-23.5445, -23.5445, nan] \n", "4 [ningbo, nan, nan] [29.8807, 29.8807, nan] \n", "\n", " roar_location_longitude roar_software \\\n", "0 [-99.1799, nan, nan] [eprints, nan, nan] \n", "1 [nan, nan, 5.09488] [nan, nan, eprints] \n", "2 [nan, 19.5684, 19.5684] [nan, nan, nan] \n", "3 [-46.6509, -46.6509, nan] [dspace, dspace, nan] \n", "4 [121.672, 121.672, nan] [dspace, dspace, nan] \n", "\n", " roar_geoname roar_version \\\n", "0 [geoname_2_MX, nan, nan] [3.3.15 eps, nan, nan] \n", "1 [nan, nan, geoname_2_NG] [nan, nan, 3.3.16 eps] \n", "2 [nan, geoname_2_PL, geoname_2_PL] [nan, other, other] \n", "3 [geoname_2_BR, geoname_2_BR, nan] [other, other, nan] \n", "4 [geoname_2_CN, geoname_2_CN, nan] [other, other, nan] \n", "\n", " roar_subjects \\\n", "0 [[HB, HD, HT, GF, HC, HF, HJ, HN, HX, H1, HG, ... 
\n", "1 [nan, nan, nan] \n", "2 [nan, nan, nan] \n", "3 [nan, nan, nan] \n", "4 [nan, nan, nan] \n", "\n", " roar_date roar_note \\\n", "0 [2012-02-03 05:18:16, nan, nan] [nan, nan, nan] \n", "1 [nan, nan, 2014-06-07 22:16:23] [nan, nan, nan] \n", "2 [nan, 2012-07-01 15:13:09, 2009-10-12 10:46:08] [nan, nan, nan] \n", "3 [2012-07-22 15:12:34, 2008-03-31 20:07:33, nan] [nan, nan, nan] \n", "4 [2009-12-21 02:27:07, 2009-12-21 02:27:07, nan] [nan, nan, nan] \n", "\n", " roar_suggestions roar_activity_low roar_activity_medium roar_activity_high \\\n", "0 [nan, nan, nan] [0, nan, nan] [0, nan, nan] [0, nan, nan] \n", "1 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "2 [nan, nan, nan] [nan, 0, 0] [nan, 0, 0] [nan, 0, 0] \n", "3 [nan, nan, nan] [0, 0, nan] [0, 0, nan] [0, 0, nan] \n", "4 [nan, nan, nan] [0, 0, nan] [0, 0, nan] [0, 0, nan] \n", "\n", " roar_recordcount roar_recordhistory \\\n", "0 [94, nan, nan] [0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,3,7... \n", "1 [nan, nan, nan] [nan, nan, nan] \n", "2 [nan, 20, 20] [nan, 0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,3,... \n", "3 [100, 100, nan] [0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,97,100,... \n", "4 [100, 100, nan] [0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0... \n", "\n", " roar_fulltexts_total roar_fulltexts_docs roar_fulltexts_rtotal \\\n", "0 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "1 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "\n", " roar_fulltexts_rdocs roar_registry_name \\\n", "0 [nan, nan, nan] [[opendoar, celestial], nan, nan] \n", "1 [nan, nan, nan] [nan, nan, [opendoar, celestial]] \n", "2 [nan, nan, nan] [nan, [opendoar, celestial], [opendoar, celest... \n", "3 [nan, nan, nan] [[opendoar, celestial], [opendoar, celestial],... 
\n", "4 [nan, nan, nan] [celestial, [opendoar, celestial], nan] \n", "\n", " roar_registry_id roar_submit_to roar_submitted_to_name \\\n", "0 [[4818, 2429], nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "1 [nan, nan, [3087, 5621]] [nan, nan, nan] [nan, nan, nan] \n", "2 [nan, [2318, 4672], [2318, 4672]] [nan, nan, nan] [nan, nan, nan] \n", "3 [[1509, 1430], [1509, 1430], nan] [nan, nan, nan] [nan, nan, nan] \n", "4 [4668, [4668, 2306], nan] [nan, nan, nan] [nan, nan, nan] \n", "\n", " roar_submitted_to_done roar_webometrics_rank roar_webometrics_size \\\n", "0 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "1 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "\n", " roar_webometrics_visibility roar_webometrics_rich_files \\\n", "0 [nan, nan, nan] [nan, nan, nan] \n", "1 [nan, nan, nan] [nan, nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan, nan] [nan, nan, nan] \n", "\n", " roar_webometrics_scholar roar_monthly_deposits roar_total_deposits \\\n", "0 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "1 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "2 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "3 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "4 [nan, nan, nan] [nan, nan, nan] [nan, nan, nan] \n", "\n", " roar_association roar_unique_id source_set \n", "0 [nan, nan, nan] [roar_4745, nan, nan] {OpenDOAR, roar} \n", "1 [nan, nan, nan] [nan, nan, roar_8504] {OpenDOAR, roar} \n", "2 [nan, nan, nan] [nan, roar_5503, roar_4271] {OpenDOAR, roar} \n", "3 [nan, nan, nan] [roar_5711, roar_126, nan] {OpenDOAR, roar} \n", "4 [nan, nan, nan] [roar_4379, roar_4266, nan] {OpenDOAR, roar} " ] }, "execution_count": 28, "metadata": {}, "output_type": "execute_result" } ], "source": [ "dup_hybrid = 
dup_hybrid.groupby('dedup_id').aggregate(list).reset_index()\n", "dup_hybrid['source_set'] = dup_hybrid.source.map(set)\n", "dup_hybrid.head()" ] }, { "cell_type": "code", "execution_count": 29, "metadata": {}, "outputs": [ { "name": "stderr", "output_type": "stream", "text": [ ":1: PerformanceWarning:\n", "\n", "DataFrame is highly fragmented. This is usually the result of calling `frame.insert` many times, which has poor performance. Consider using pd.concat instead. To get a de-fragmented frame, use `newframe = frame.copy()`\n", "\n", ":2: PerformanceWarning:\n", "\n", "DataFrame is highly fragmented. This is usually the result of calling `frame.insert` many times, which has poor performance. Consider using pd.concat instead. To get a de-fragmented frame, use `newframe = frame.copy()`\n", "\n" ] }, { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
dedup_idduplicate_idoriginal_idnamesourceunique_idFAIRsharing_idFAIRsharing_typeFAIRsharing_attributes.created-atFAIRsharing_attributes.updated-atFAIRsharing_attributes.metadata.doiFAIRsharing_attributes.metadata.nameFAIRsharing_attributes.metadata.statusFAIRsharing_attributes.metadata.contactsFAIRsharing_attributes.metadata.homepageFAIRsharing_attributes.metadata.identifierFAIRsharing_attributes.metadata.descriptionFAIRsharing_attributes.metadata.support-linksFAIRsharing_attributes.metadata.year-creationFAIRsharing_attributes.metadata.data-processesFAIRsharing_attributes.legacy-idsFAIRsharing_attributes.fairsharing-registryFAIRsharing_attributes.record-typeFAIRsharing_attributes.subjectsFAIRsharing_attributes.domainsFAIRsharing_attributes.taxonomiesFAIRsharing_attributes.user-defined-tagsFAIRsharing_attributes.countriesFAIRsharing_attributes.nameFAIRsharing_attributes.abbreviationFAIRsharing_attributes.urlFAIRsharing_attributes.doiFAIRsharing_attributes.fairsharing-licenceFAIRsharing_attributes.descriptionFAIRsharing_attributes.publicationsFAIRsharing_attributes.licence-linksFAIRsharing_attributes.metadata.citationsFAIRsharing_attributes.metadata.abbreviationFAIRsharing_attributes.metadata.access-pointsFAIRsharing_attributes.metadata.associated-toolsFAIRsharing_attributes.metadata.deprecation-dateFAIRsharing_attributes.metadata.deprecation-reasonFAIRsharing_attributes.metadata.tombstoneFAIRsharing_unique_idre3data_OpenAIREIDre3data_orgIdentifierre3data_repositoryNamere3data_additionalNamere3data_repositoryURLre3data_repositoryIdentifierre3data_descriptionre3data_typere3data_sizere3data_updateDatere3data_startDatere3data_endDatere3data_subjectre3data_missionStatementre3data_contentTypere3data_providerTypere3data_keywordre3data_institutionre3data_policyre3data_databaseAccessre3data_databaseLicensere3data_dataAccessre3data_dataLicensere3data_dataUploadre3data_dataUploadLicensere3data_softwarere3data_versioningre3data_apire3data_pidSystemre3data_citationGuidelineURLre3
data_aidSystemre3data_enhancedPublicationre3data_qualityManagementre3data_certificatere3data_metadataStandardre3data_syndicationre3data_remarksre3data_entryDatere3data_lastUpdatere3data_unique_idOpenDOAR_OpenAIREIDOpenDOAR_orgIdentifierOpenDOAR_repositoryNameOpenDOAR_alternativeNamesOpenDOAR_repositoryURLOpenDOAR_descriptionOpenDOAR_typeOpenDOAR_updateDateOpenDOAR_startDateOpenDOAR_subjectOpenDOAR_contentTypeOpenDOAR_institutionOpenDOAR_metadataPolicyOpenDOAR_dataPolicyOpenDOAR_submissionPolicyOpenDOAR_contentPolicyOpenDOAR_softwareOpenDOAR_apiOpenDOAR_unique_idroar_eprintidroar_rev_numberroar_eprint_statusroar_useridroar_importidroar_sourceroar_dirroar_datestamproar_lastmodroar_status_changedroar_typeroar_succeedsroar_commentaryroar_metadata_visibilityroar_latituderoar_longituderoar_relation_typeroar_relation_uriroar_item_issues_idroar_item_issues_typeroar_item_issues_descriptionroar_item_issues_timestamproar_item_issues_statusroar_item_issues_reported_byroar_item_issues_resolved_byroar_item_issues_commentroar_item_issues_countroar_sword_depositorroar_sword_slugroar_exemplarroar_home_pageroar_titleroar_oai_pmhroar_sword_endpointroar_rss_feedroar_twitter_feedroar_descriptionroar_fulltextroar_open_accessroar_mandateroar_organisation_titleroar_organisation_home_pageroar_location_countryroar_location_cityroar_location_latituderoar_location_longituderoar_softwareroar_geonameroar_versionroar_subjectsroar_dateroar_noteroar_suggestionsroar_activity_lowroar_activity_mediumroar_activity_highroar_recordcountroar_recordhistoryroar_fulltexts_totalroar_fulltexts_docsroar_fulltexts_rtotalroar_fulltexts_rdocsroar_registry_nameroar_registry_idroar_submit_toroar_submitted_to_nameroar_submitted_to_doneroar_webometrics_rankroar_webometrics_sizeroar_webometrics_visibilityroar_webometrics_rich_filesroar_webometrics_scholarroar_monthly_depositsroar_total_depositsroar_associationroar_unique_idsource_set
0dedup::001e6d882e54c780ce269d3c46997287[re3data_____::4af9fe2bb93511a5e0f0c39e94d6557...[r3d100011306, 2094][RESID Database of Protein Modifications, RESI...[re3data, FAIRsharing][re3data_r3d100011306, FAIRsharing_2094][nan, 2094][nan, fairsharing-records][nan, 2014-11-04T15:23:40.000Z][nan, 2021-09-30T11:38:37.114Z][nan, 10.25504/FAIRsharing.qaszjp][nan, RESID Database of Protein Modifications][nan, ready][nan, [{'contact-name': 'John S Garavelli', 'c...[nan, http://pir.georgetown.edu/resid/][nan, 2094.0][nan, The RESID Database of Protein Modificati...[nan, [{'url': 'http://pir.georgetown.edu/resi...[nan, nan][nan, [{'url': 'ftp://ftp.pir.georgetown.edu/p...[nan, [biodbcore-000563, bsg-d000563]][nan, Database][nan, knowledgebase][nan, [Life Science]][nan, [Molecular structure, Small molecule, St...[nan, [All]][nan, []][nan, [United Kingdom, European Union, Switzer...[nan, FAIRsharing record for: RESID Database o...[nan, RESID][nan, https://fairsharing.org/10.25504/FAIRsha...[nan, 10.25504/FAIRsharing.qaszjp][nan, https://creativecommons.org/licenses/by-...[nan, This FAIRsharing record describes: The R...[nan, [{'id': 334, 'pubmed_id': 12520062, 'tit...[nan, [{'licence-name': 'Open Data Commons (OD...[nan, nan][nan, RESID][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, FAIRsharing_2094][re3data_____::4af9fe2bb93511a5e0f0c39e94d6557...[r3d100011306, nan][RESID Database of Protein Modifications, nan][[], nan][https://pir.georgetown.edu/resid/resid.shtml,...[[FAIRsharing_doi:10.25504/FAIRsharing.qaszjp,...[The RESID Database of Protein Modifications i...[[disciplinary], nan][nan, nan][nan, nan][2014, nan][nan, nan][[2 Life Sciences, 201 Basic Biological and Me...[False, nan][[Images, Structured text], nan][[dataProvider], nan][[genomes, life sciences, proteins, proteomes,...[[[Georgetown University, Medical Center, ['GU...[True, nan][ true, nan][False, nan][True, nan][True, nan][True, nan][False, nan][True, nan][yes, nan][True, nan][True, nan][True, 
nan][True, nan][yes, nan][unknown, nan][False, nan][False, nan][False, nan][RESID is covered by Thomson Reuters Data Cita...[2014-12-05, nan][2019-01-17, nan][re3data_r3d100011306, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan]{FAIRsharing, re3data}
1dedup::0023a1e3447fdb31836536cc903f1310[opendoar____::c6f798b844366ccd65d99bc7f31e0e0...[3410, 10013][erucu: electronic repository of the ukrainian...[OpenDOAR, roar][OpenDOAR_3410, roar_10013][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][opendoar____::c6f798b844366ccd65d99bc7f31e0e0...[3410, nan][erucu: electronic repository of the ukrainian...[[], nan][http://er.ucu.edu.ua/, nan][ukrainian catholic university’s institutional...[institutional, nan][2019-10-17 14:34:57, nan][2015-07-08 12:43:38, nan][[multidisciplinary], nan][[journal_articles, conference_and_workshop_pa...[[[ukrainian catholic university, ['ucu'], ua,...[False, nan][False, nan][False, nan][False, nan][dspace , nan][false , nan][OpenDOAR_3410, nan][nan, 10013][nan, 31][nan, archive][nan, 7104][nan, nan][nan, nan][nan, disk0/00/01/00/13][nan, 2015-08-08 14:53:04][nan, 2016-03-21 19:54:43][nan, 2015-08-08 14:53:04][nan, institutional][nan, nan][nan, nan][nan, show][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, http://er.ucu.edu.ua/][nan, ErUCU: Electronic repository of the Ukra...[nan, http://er.ucu.edu.ua/oai/request][nan, http://er.ucu.edu.ua/sword/][nan, 
http://er.ucu.edu.ua/feed/rss_2.0/site][nan, nan][nan, Ukrainian Catholic University’s institut...[nan, TRUE][nan, TRUE][nan, TRUE][nan, Ukrainian Catholic University][nan, http://ucu.edu.ua/eng/][nan, ua][nan, Lviv][nan, nan][nan, nan][nan, dspace][nan, geoname_2_UA][nan, other][nan, [B1, BS, BL, AC, D204, DK, HM, BF, L1, D...[nan, 2015-07-07 12:38:37][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, [opendoar, celestial]][nan, [5883, 3410]][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, [russell_group, ivy_league]][nan, roar_10013]{OpenDOAR, roar}
2dedup::003ab6b40af9b488decea7c582d150a2[https://fairsharing.org/10.25504/FAIRsharing....[2315, r3d100011894][Synapse, Synapse][FAIRsharing, re3data][FAIRsharing_2315, re3data_r3d100011894][2315, nan][fairsharing-records, nan][2016-08-02T13:56:30.000Z, nan][2021-09-30T11:38:43.134Z, nan][10.25504/FAIRsharing.dnxzmk, nan][Synapse, nan][ready, nan][[{'contact-name': 'Meredith Slota', 'contact-...[https://www.synapse.org/, nan][2315.0, nan][Synapse is a collaborative research platform ...[[{'url': 'SynapseInfo@sagebase.org', 'name': ...[2010.0, nan][[{'url': 'https://www.synapse.org/', 'name': ...[[biodbcore-000791, bsg-d000791], nan][Database, nan][repository, nan][[Biomedical Science, Data Management, Data In...[[Experimental measurement, Protocol, Data sto...[[All], nan][[], nan][[United States], nan][FAIRsharing record for: Synapse, nan][Synapse, nan][https://fairsharing.org/10.25504/FAIRsharing....[10.25504/FAIRsharing.dnxzmk, nan][https://creativecommons.org/licenses/by-sa/4....[This FAIRsharing record describes: Synapse is...[[{'id': 2450, 'pubmed_id': 24071850, 'title':...[[{'licence-name': 'Creative Commons Attributi...[nan, nan][Synapse, nan][[{'url': 'http://rest-docs.synapse.org/rest/'...[[{'url': 'https://sage-bionetworks.github.io/...[nan, nan][nan, nan][nan, nan][FAIRsharing_2315, nan][nan, re3data_____::cafc5d99b7c187e24b40d958a1...[nan, r3d100011894][nan, Synapse][nan, []][nan, https://www.synapse.org][nan, [RRID:SCR_006307, RRID:nlx_151983]][nan, Synapse is an open source software platf...[nan, [other]][nan, nan][nan, nan][nan, 2012-05-22][nan, nan][nan, [2 Life Sciences, 201 Basic Biological a...[nan, True][nan, [Raw data, Scientific and statistical da...[nan, [dataProvider, serviceProvider]][nan, [AMP-AD Knowledge Portal, DREAM Challeng...[nan, [[Alfred P. 
Sloan Foundation, [], USA, [...[nan, True][nan, true][nan, False][nan, True][nan, True][nan, True][nan, False][nan, True][nan, yes][nan, True][nan, True][nan, True][nan, True][nan, yes][nan, yes][nan, False][nan, False][nan, False][nan, nan][nan, 2015-12-03][nan, 2021-05-17][nan, re3data_r3d100011894][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan]{FAIRsharing, re3data}
3dedup::0064f599ed0adb5870a5b3ffe438e485[16034, opendoar____::d1f157379ea7e51d4a8c07af...[16034, 9647][Giresun University Institutional Repository, ...[roar, OpenDOAR][roar_16034, OpenDOAR_9647][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, opendoar____::d1f157379ea7e51d4a8c07aff1...[nan, 9647][nan, giresun university institutional reposit...[nan, [giresun üniversitesi akademik arşiv sis...[nan, http://acikerisim.giresun.edu.tr][nan, this site provides access to the researc...[nan, institutional][nan, 2021-05-21 18:05:06][nan, 2020-06-02 09:14:18][nan, [multidisciplinary]][nan, [journal_articles]][nan, [[giresun university, ['giresun üniversi...[nan, False][nan, False][nan, False][nan, False][nan, dspace 6.2][nan, true ][nan, OpenDOAR_9647][16034, nan][7, nan][archive, nan][12932, nan][nan, nan][nan, nan][disk0/00/01/60/34, nan][2020-06-01 20:13:50, nan][2020-06-01 20:14:04, nan][2020-06-01 20:13:50, nan][institutional, nan][nan, nan][nan, nan][show, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][https://acikerisim.giresun.edu.tr, nan][Giresun University Institutional Repository, ...[https://acikerisim.giresun.edu.tr/oai, 
nan][nan, nan][nan, nan][nan, nan][DSpace@Giresun is a growing collection of Gir...[TRUE, nan][TRUE, nan][TRUE, nan][Giresun University, nan][https://www.giresun.edu.tr/, nan][tr, nan][Giresun, nan][40.9147, nan][38.323, nan][dspace, nan][geoname_2_TR, nan][other, nan][nan, nan][2020-05-29 18:13:17, nan][DSpace@Giresun is a growing collection of Gir...[nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][roarmap, nan][http://roarmap.eprints.org/1046/, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][roar_16034, nan]{OpenDOAR, roar}
4dedup::00ac8ed3b4327bdd4ebbebcb2ba10a00[610, opendoar____::299fb2142d7de959380f91c01c...[610, 1426][Hedatuz, hedatuz][roar, OpenDOAR][roar_610, OpenDOAR_1426][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, opendoar____::299fb2142d7de959380f91c01c...[nan, 1426][nan, hedatuz][nan, []][nan, http://hedatuz.euskomedia.org/][nan, this site contains works published by eu...[nan, disciplinary][nan, 2019-10-17 14:34:21][nan, 2009-02-02 13:13:26][nan, [multidisciplinary]][nan, [journal_articles, books_chapters_and_se...[nan, [[euskomedia, [], es, http://www.euskome...[nan, False][nan, False][nan, False][nan, False][nan, eprints 3.0.5][nan, true ][nan, OpenDOAR_1426][610, nan][514, nan][archive, nan][1, nan][nan, nan][nan, nan][disk0/00/00/06/10, nan][2010-01-06 13:44:32, nan][2011-07-18 05:48:34, nan][2010-01-06 13:44:32, nan][institutional, nan][nan, nan][nan, nan][show, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][nan, nan][0, nan][nan, nan][nan, nan][nan, nan][http://hedatuz.euskomedia.org/, nan][Hedatuz, nan][http://hedatuz.euskomedia.org/cgi/oai2, nan][nan, nan][http://hedatuz.euskomedia.org/cgi/latest_tool...[nan, nan][Hedatuz, created by the Euskomedia Fundazioa,...[TRUE, 
nan][TRUE, nan][nan, nan][Euskomedia Fundazioa, nan][http://www.euskomedia.org, nan][org, nan][ (Unknown city), nan][nan, nan][nan, nan][eprints, nan][geoname_2_ORG, nan][eprints-3.0.5, nan][nan, nan][2008-10-03 15:36:07, nan][nan, nan][nan, nan][0, nan][0, nan][0, nan][100, nan][0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,90,90,91,...[nan, nan][nan, nan][nan, nan][nan, nan][[opendoar, celestial], nan][[1426, 1294], nan][nan, nan][nan, nan][nan, nan][570, nan][331, nan][519, nan][145, nan][806, nan][nan, nan][nan, nan][nan, nan][roar_610, nan]{OpenDOAR, roar}
\n", "
" ], "text/plain": [ " dedup_id \\\n", "0 dedup::001e6d882e54c780ce269d3c46997287 \n", "1 dedup::0023a1e3447fdb31836536cc903f1310 \n", "2 dedup::003ab6b40af9b488decea7c582d150a2 \n", "3 dedup::0064f599ed0adb5870a5b3ffe438e485 \n", "4 dedup::00ac8ed3b4327bdd4ebbebcb2ba10a00 \n", "\n", " duplicate_id original_id \\\n", "0 [re3data_____::4af9fe2bb93511a5e0f0c39e94d6557... [r3d100011306, 2094] \n", "1 [opendoar____::c6f798b844366ccd65d99bc7f31e0e0... [3410, 10013] \n", "2 [https://fairsharing.org/10.25504/FAIRsharing.... [2315, r3d100011894] \n", "3 [16034, opendoar____::d1f157379ea7e51d4a8c07af... [16034, 9647] \n", "4 [610, opendoar____::299fb2142d7de959380f91c01c... [610, 1426] \n", "\n", " name source \\\n", "0 [RESID Database of Protein Modifications, RESI... [re3data, FAIRsharing] \n", "1 [erucu: electronic repository of the ukrainian... [OpenDOAR, roar] \n", "2 [Synapse, Synapse] [FAIRsharing, re3data] \n", "3 [Giresun University Institutional Repository, ... [roar, OpenDOAR] \n", "4 [Hedatuz, hedatuz] [roar, OpenDOAR] \n", "\n", " unique_id FAIRsharing_id \\\n", "0 [re3data_r3d100011306, FAIRsharing_2094] [nan, 2094] \n", "1 [OpenDOAR_3410, roar_10013] [nan, nan] \n", "2 [FAIRsharing_2315, re3data_r3d100011894] [2315, nan] \n", "3 [roar_16034, OpenDOAR_9647] [nan, nan] \n", "4 [roar_610, OpenDOAR_1426] [nan, nan] \n", "\n", " FAIRsharing_type FAIRsharing_attributes.created-at \\\n", "0 [nan, fairsharing-records] [nan, 2014-11-04T15:23:40.000Z] \n", "1 [nan, nan] [nan, nan] \n", "2 [fairsharing-records, nan] [2016-08-02T13:56:30.000Z, nan] \n", "3 [nan, nan] [nan, nan] \n", "4 [nan, nan] [nan, nan] \n", "\n", " FAIRsharing_attributes.updated-at FAIRsharing_attributes.metadata.doi \\\n", "0 [nan, 2021-09-30T11:38:37.114Z] [nan, 10.25504/FAIRsharing.qaszjp] \n", "1 [nan, nan] [nan, nan] \n", "2 [2021-09-30T11:38:43.134Z, nan] [10.25504/FAIRsharing.dnxzmk, nan] \n", "3 [nan, nan] [nan, nan] \n", "4 [nan, nan] [nan, nan] \n", "\n", " 
FAIRsharing_attributes.metadata.name \\\n", "0 [nan, RESID Database of Protein Modifications] \n", "1 [nan, nan] \n", "2 [Synapse, nan] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.status \\\n", "0 [nan, ready] \n", "1 [nan, nan] \n", "2 [ready, nan] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.contacts \\\n", "0 [nan, [{'contact-name': 'John S Garavelli', 'c... \n", "1 [nan, nan] \n", "2 [[{'contact-name': 'Meredith Slota', 'contact-... \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.homepage \\\n", "0 [nan, http://pir.georgetown.edu/resid/] \n", "1 [nan, nan] \n", "2 [https://www.synapse.org/, nan] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.identifier \\\n", "0 [nan, 2094.0] \n", "1 [nan, nan] \n", "2 [2315.0, nan] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.description \\\n", "0 [nan, The RESID Database of Protein Modificati... \n", "1 [nan, nan] \n", "2 [Synapse is a collaborative research platform ... \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.support-links \\\n", "0 [nan, [{'url': 'http://pir.georgetown.edu/resi... \n", "1 [nan, nan] \n", "2 [[{'url': 'SynapseInfo@sagebase.org', 'name': ... \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.year-creation \\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 [2010.0, nan] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.data-processes \\\n", "0 [nan, [{'url': 'ftp://ftp.pir.georgetown.edu/p... \n", "1 [nan, nan] \n", "2 [[{'url': 'https://www.synapse.org/', 'name': ... 
\n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.legacy-ids \\\n", "0 [nan, [biodbcore-000563, bsg-d000563]] \n", "1 [nan, nan] \n", "2 [[biodbcore-000791, bsg-d000791], nan] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.fairsharing-registry \\\n", "0 [nan, Database] \n", "1 [nan, nan] \n", "2 [Database, nan] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.record-type \\\n", "0 [nan, knowledgebase] \n", "1 [nan, nan] \n", "2 [repository, nan] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.subjects \\\n", "0 [nan, [Life Science]] \n", "1 [nan, nan] \n", "2 [[Biomedical Science, Data Management, Data In... \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.domains \\\n", "0 [nan, [Molecular structure, Small molecule, St... \n", "1 [nan, nan] \n", "2 [[Experimental measurement, Protocol, Data sto... \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.taxonomies FAIRsharing_attributes.user-defined-tags \\\n", "0 [nan, [All]] [nan, []] \n", "1 [nan, nan] [nan, nan] \n", "2 [[All], nan] [[], nan] \n", "3 [nan, nan] [nan, nan] \n", "4 [nan, nan] [nan, nan] \n", "\n", " FAIRsharing_attributes.countries \\\n", "0 [nan, [United Kingdom, European Union, Switzer... \n", "1 [nan, nan] \n", "2 [[United States], nan] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.name \\\n", "0 [nan, FAIRsharing record for: RESID Database o... \n", "1 [nan, nan] \n", "2 [FAIRsharing record for: Synapse, nan] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.abbreviation \\\n", "0 [nan, RESID] \n", "1 [nan, nan] \n", "2 [Synapse, nan] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.url \\\n", "0 [nan, https://fairsharing.org/10.25504/FAIRsha... \n", "1 [nan, nan] \n", "2 [https://fairsharing.org/10.25504/FAIRsharing.... 
\n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.doi \\\n", "0 [nan, 10.25504/FAIRsharing.qaszjp] \n", "1 [nan, nan] \n", "2 [10.25504/FAIRsharing.dnxzmk, nan] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.fairsharing-licence \\\n", "0 [nan, https://creativecommons.org/licenses/by-... \n", "1 [nan, nan] \n", "2 [https://creativecommons.org/licenses/by-sa/4.... \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.description \\\n", "0 [nan, This FAIRsharing record describes: The R... \n", "1 [nan, nan] \n", "2 [This FAIRsharing record describes: Synapse is... \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.publications \\\n", "0 [nan, [{'id': 334, 'pubmed_id': 12520062, 'tit... \n", "1 [nan, nan] \n", "2 [[{'id': 2450, 'pubmed_id': 24071850, 'title':... \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.licence-links \\\n", "0 [nan, [{'licence-name': 'Open Data Commons (OD... \n", "1 [nan, nan] \n", "2 [[{'licence-name': 'Creative Commons Attributi... \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.citations \\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 [nan, nan] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.abbreviation \\\n", "0 [nan, RESID] \n", "1 [nan, nan] \n", "2 [Synapse, nan] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.access-points \\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 [[{'url': 'http://rest-docs.synapse.org/rest/'... \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.associated-tools \\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 [[{'url': 'https://sage-bionetworks.github.io/... 
\n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.deprecation-date \\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 [nan, nan] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.deprecation-reason \\\n", "0 [nan, nan] \n", "1 [nan, nan] \n", "2 [nan, nan] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " FAIRsharing_attributes.metadata.tombstone FAIRsharing_unique_id \\\n", "0 [nan, nan] [nan, FAIRsharing_2094] \n", "1 [nan, nan] [nan, nan] \n", "2 [nan, nan] [FAIRsharing_2315, nan] \n", "3 [nan, nan] [nan, nan] \n", "4 [nan, nan] [nan, nan] \n", "\n", " re3data_OpenAIREID re3data_orgIdentifier \\\n", "0 [re3data_____::4af9fe2bb93511a5e0f0c39e94d6557... [r3d100011306, nan] \n", "1 [nan, nan] [nan, nan] \n", "2 [nan, re3data_____::cafc5d99b7c187e24b40d958a1... [nan, r3d100011894] \n", "3 [nan, nan] [nan, nan] \n", "4 [nan, nan] [nan, nan] \n", "\n", " re3data_repositoryName re3data_additionalName \\\n", "0 [RESID Database of Protein Modifications, nan] [[], nan] \n", "1 [nan, nan] [nan, nan] \n", "2 [nan, Synapse] [nan, []] \n", "3 [nan, nan] [nan, nan] \n", "4 [nan, nan] [nan, nan] \n", "\n", " re3data_repositoryURL \\\n", "0 [https://pir.georgetown.edu/resid/resid.shtml,... \n", "1 [nan, nan] \n", "2 [nan, https://www.synapse.org] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " re3data_repositoryIdentifier \\\n", "0 [[FAIRsharing_doi:10.25504/FAIRsharing.qaszjp,... \n", "1 [nan, nan] \n", "2 [nan, [RRID:SCR_006307, RRID:nlx_151983]] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " re3data_description re3data_type \\\n", "0 [The RESID Database of Protein Modifications i... [[disciplinary], nan] \n", "1 [nan, nan] [nan, nan] \n", "2 [nan, Synapse is an open source software platf... 
[nan, [other]] \n", "3 [nan, nan] [nan, nan] \n", "4 [nan, nan] [nan, nan] \n", "\n", " re3data_size re3data_updateDate re3data_startDate re3data_endDate \\\n", "0 [nan, nan] [nan, nan] [2014, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] [nan, nan] [nan, nan] \n", "2 [nan, nan] [nan, nan] [nan, 2012-05-22] [nan, nan] \n", "3 [nan, nan] [nan, nan] [nan, nan] [nan, nan] \n", "4 [nan, nan] [nan, nan] [nan, nan] [nan, nan] \n", "\n", " re3data_subject re3data_missionStatement \\\n", "0 [[2 Life Sciences, 201 Basic Biological and Me... [False, nan] \n", "1 [nan, nan] [nan, nan] \n", "2 [nan, [2 Life Sciences, 201 Basic Biological a... [nan, True] \n", "3 [nan, nan] [nan, nan] \n", "4 [nan, nan] [nan, nan] \n", "\n", " re3data_contentType \\\n", "0 [[Images, Structured text], nan] \n", "1 [nan, nan] \n", "2 [nan, [Raw data, Scientific and statistical da... \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " re3data_providerType \\\n", "0 [[dataProvider], nan] \n", "1 [nan, nan] \n", "2 [nan, [dataProvider, serviceProvider]] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " re3data_keyword \\\n", "0 [[genomes, life sciences, proteins, proteomes,... \n", "1 [nan, nan] \n", "2 [nan, [AMP-AD Knowledge Portal, DREAM Challeng... \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " re3data_institution re3data_policy \\\n", "0 [[[Georgetown University, Medical Center, ['GU... [True, nan] \n", "1 [nan, nan] [nan, nan] \n", "2 [nan, [[Alfred P. Sloan Foundation, [], USA, [... 
[nan, True] \n", "3 [nan, nan] [nan, nan] \n", "4 [nan, nan] [nan, nan] \n", "\n", " re3data_databaseAccess re3data_databaseLicense re3data_dataAccess \\\n", "0 [ true, nan] [False, nan] [True, nan] \n", "1 [nan, nan] [nan, nan] [nan, nan] \n", "2 [nan, true] [nan, False] [nan, True] \n", "3 [nan, nan] [nan, nan] [nan, nan] \n", "4 [nan, nan] [nan, nan] [nan, nan] \n", "\n", " re3data_dataLicense re3data_dataUpload re3data_dataUploadLicense \\\n", "0 [True, nan] [True, nan] [False, nan] \n", "1 [nan, nan] [nan, nan] [nan, nan] \n", "2 [nan, True] [nan, True] [nan, False] \n", "3 [nan, nan] [nan, nan] [nan, nan] \n", "4 [nan, nan] [nan, nan] [nan, nan] \n", "\n", " re3data_software re3data_versioning re3data_api re3data_pidSystem \\\n", "0 [True, nan] [yes, nan] [True, nan] [True, nan] \n", "1 [nan, nan] [nan, nan] [nan, nan] [nan, nan] \n", "2 [nan, True] [nan, yes] [nan, True] [nan, True] \n", "3 [nan, nan] [nan, nan] [nan, nan] [nan, nan] \n", "4 [nan, nan] [nan, nan] [nan, nan] [nan, nan] \n", "\n", " re3data_citationGuidelineURL re3data_aidSystem re3data_enhancedPublication \\\n", "0 [True, nan] [True, nan] [yes, nan] \n", "1 [nan, nan] [nan, nan] [nan, nan] \n", "2 [nan, True] [nan, True] [nan, yes] \n", "3 [nan, nan] [nan, nan] [nan, nan] \n", "4 [nan, nan] [nan, nan] [nan, nan] \n", "\n", " re3data_qualityManagement re3data_certificate re3data_metadataStandard \\\n", "0 [unknown, nan] [False, nan] [False, nan] \n", "1 [nan, nan] [nan, nan] [nan, nan] \n", "2 [nan, yes] [nan, False] [nan, False] \n", "3 [nan, nan] [nan, nan] [nan, nan] \n", "4 [nan, nan] [nan, nan] [nan, nan] \n", "\n", " re3data_syndication re3data_remarks \\\n", "0 [False, nan] [RESID is covered by Thomson Reuters Data Cita... 
\n", "1 [nan, nan] [nan, nan] \n", "2 [nan, False] [nan, nan] \n", "3 [nan, nan] [nan, nan] \n", "4 [nan, nan] [nan, nan] \n", "\n", " re3data_entryDate re3data_lastUpdate re3data_unique_id \\\n", "0 [2014-12-05, nan] [2019-01-17, nan] [re3data_r3d100011306, nan] \n", "1 [nan, nan] [nan, nan] [nan, nan] \n", "2 [nan, 2015-12-03] [nan, 2021-05-17] [nan, re3data_r3d100011894] \n", "3 [nan, nan] [nan, nan] [nan, nan] \n", "4 [nan, nan] [nan, nan] [nan, nan] \n", "\n", " OpenDOAR_OpenAIREID OpenDOAR_orgIdentifier \\\n", "0 [nan, nan] [nan, nan] \n", "1 [opendoar____::c6f798b844366ccd65d99bc7f31e0e0... [3410, nan] \n", "2 [nan, nan] [nan, nan] \n", "3 [nan, opendoar____::d1f157379ea7e51d4a8c07aff1... [nan, 9647] \n", "4 [nan, opendoar____::299fb2142d7de959380f91c01c... [nan, 1426] \n", "\n", " OpenDOAR_repositoryName \\\n", "0 [nan, nan] \n", "1 [erucu: electronic repository of the ukrainian... \n", "2 [nan, nan] \n", "3 [nan, giresun university institutional reposit... \n", "4 [nan, hedatuz] \n", "\n", " OpenDOAR_alternativeNames \\\n", "0 [nan, nan] \n", "1 [[], nan] \n", "2 [nan, nan] \n", "3 [nan, [giresun üniversitesi akademik arşiv sis... \n", "4 [nan, []] \n", "\n", " OpenDOAR_repositoryURL \\\n", "0 [nan, nan] \n", "1 [http://er.ucu.edu.ua/, nan] \n", "2 [nan, nan] \n", "3 [nan, http://acikerisim.giresun.edu.tr] \n", "4 [nan, http://hedatuz.euskomedia.org/] \n", "\n", " OpenDOAR_description OpenDOAR_type \\\n", "0 [nan, nan] [nan, nan] \n", "1 [ukrainian catholic university’s institutional... [institutional, nan] \n", "2 [nan, nan] [nan, nan] \n", "3 [nan, this site provides access to the researc... [nan, institutional] \n", "4 [nan, this site contains works published by eu... 
[nan, disciplinary] \n", "\n", " OpenDOAR_updateDate OpenDOAR_startDate \\\n", "0 [nan, nan] [nan, nan] \n", "1 [2019-10-17 14:34:57, nan] [2015-07-08 12:43:38, nan] \n", "2 [nan, nan] [nan, nan] \n", "3 [nan, 2021-05-21 18:05:06] [nan, 2020-06-02 09:14:18] \n", "4 [nan, 2019-10-17 14:34:21] [nan, 2009-02-02 13:13:26] \n", "\n", " OpenDOAR_subject \\\n", "0 [nan, nan] \n", "1 [[multidisciplinary], nan] \n", "2 [nan, nan] \n", "3 [nan, [multidisciplinary]] \n", "4 [nan, [multidisciplinary]] \n", "\n", " OpenDOAR_contentType \\\n", "0 [nan, nan] \n", "1 [[journal_articles, conference_and_workshop_pa... \n", "2 [nan, nan] \n", "3 [nan, [journal_articles]] \n", "4 [nan, [journal_articles, books_chapters_and_se... \n", "\n", " OpenDOAR_institution OpenDOAR_metadataPolicy \\\n", "0 [nan, nan] [nan, nan] \n", "1 [[[ukrainian catholic university, ['ucu'], ua,... [False, nan] \n", "2 [nan, nan] [nan, nan] \n", "3 [nan, [[giresun university, ['giresun üniversi... [nan, False] \n", "4 [nan, [[euskomedia, [], es, http://www.euskome... 
[nan, False] \n", "\n", " OpenDOAR_dataPolicy OpenDOAR_submissionPolicy OpenDOAR_contentPolicy \\\n", "0 [nan, nan] [nan, nan] [nan, nan] \n", "1 [False, nan] [False, nan] [False, nan] \n", "2 [nan, nan] [nan, nan] [nan, nan] \n", "3 [nan, False] [nan, False] [nan, False] \n", "4 [nan, False] [nan, False] [nan, False] \n", "\n", " OpenDOAR_software OpenDOAR_api OpenDOAR_unique_id roar_eprintid \\\n", "0 [nan, nan] [nan, nan] [nan, nan] [nan, nan] \n", "1 [dspace , nan] [false , nan] [OpenDOAR_3410, nan] [nan, 10013] \n", "2 [nan, nan] [nan, nan] [nan, nan] [nan, nan] \n", "3 [nan, dspace 6.2] [nan, true ] [nan, OpenDOAR_9647] [16034, nan] \n", "4 [nan, eprints 3.0.5] [nan, true ] [nan, OpenDOAR_1426] [610, nan] \n", "\n", " roar_rev_number roar_eprint_status roar_userid roar_importid roar_source \\\n", "0 [nan, nan] [nan, nan] [nan, nan] [nan, nan] [nan, nan] \n", "1 [nan, 31] [nan, archive] [nan, 7104] [nan, nan] [nan, nan] \n", "2 [nan, nan] [nan, nan] [nan, nan] [nan, nan] [nan, nan] \n", "3 [7, nan] [archive, nan] [12932, nan] [nan, nan] [nan, nan] \n", "4 [514, nan] [archive, nan] [1, nan] [nan, nan] [nan, nan] \n", "\n", " roar_dir roar_datestamp \\\n", "0 [nan, nan] [nan, nan] \n", "1 [nan, disk0/00/01/00/13] [nan, 2015-08-08 14:53:04] \n", "2 [nan, nan] [nan, nan] \n", "3 [disk0/00/01/60/34, nan] [2020-06-01 20:13:50, nan] \n", "4 [disk0/00/00/06/10, nan] [2010-01-06 13:44:32, nan] \n", "\n", " roar_lastmod roar_status_changed \\\n", "0 [nan, nan] [nan, nan] \n", "1 [nan, 2016-03-21 19:54:43] [nan, 2015-08-08 14:53:04] \n", "2 [nan, nan] [nan, nan] \n", "3 [2020-06-01 20:14:04, nan] [2020-06-01 20:13:50, nan] \n", "4 [2011-07-18 05:48:34, nan] [2010-01-06 13:44:32, nan] \n", "\n", " roar_type roar_succeeds roar_commentary \\\n", "0 [nan, nan] [nan, nan] [nan, nan] \n", "1 [nan, institutional] [nan, nan] [nan, nan] \n", "2 [nan, nan] [nan, nan] [nan, nan] \n", "3 [institutional, nan] [nan, nan] [nan, nan] \n", "4 [institutional, nan] [nan, nan] [nan, nan] 
\n", "\n", " roar_metadata_visibility roar_latitude roar_longitude roar_relation_type \\\n", "0 [nan, nan] [nan, nan] [nan, nan] [nan, nan] \n", "1 [nan, show] [nan, nan] [nan, nan] [nan, nan] \n", "2 [nan, nan] [nan, nan] [nan, nan] [nan, nan] \n", "3 [show, nan] [nan, nan] [nan, nan] [nan, nan] \n", "4 [show, nan] [nan, nan] [nan, nan] [nan, nan] \n", "\n", " roar_relation_uri roar_item_issues_id roar_item_issues_type \\\n", "0 [nan, nan] [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] [nan, nan] \n", "2 [nan, nan] [nan, nan] [nan, nan] \n", "3 [nan, nan] [nan, nan] [nan, nan] \n", "4 [nan, nan] [nan, nan] [nan, nan] \n", "\n", " roar_item_issues_description roar_item_issues_timestamp \\\n", "0 [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] \n", "2 [nan, nan] [nan, nan] \n", "3 [nan, nan] [nan, nan] \n", "4 [nan, nan] [nan, nan] \n", "\n", " roar_item_issues_status roar_item_issues_reported_by \\\n", "0 [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] \n", "2 [nan, nan] [nan, nan] \n", "3 [nan, nan] [nan, nan] \n", "4 [nan, nan] [nan, nan] \n", "\n", " roar_item_issues_resolved_by roar_item_issues_comment \\\n", "0 [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] \n", "2 [nan, nan] [nan, nan] \n", "3 [nan, nan] [nan, nan] \n", "4 [nan, nan] [nan, nan] \n", "\n", " roar_item_issues_count roar_sword_depositor roar_sword_slug roar_exemplar \\\n", "0 [nan, nan] [nan, nan] [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] [nan, nan] [nan, nan] \n", "2 [nan, nan] [nan, nan] [nan, nan] [nan, nan] \n", "3 [nan, nan] [nan, nan] [nan, nan] [nan, nan] \n", "4 [0, nan] [nan, nan] [nan, nan] [nan, nan] \n", "\n", " roar_home_page \\\n", "0 [nan, nan] \n", "1 [nan, http://er.ucu.edu.ua/] \n", "2 [nan, nan] \n", "3 [https://acikerisim.giresun.edu.tr, nan] \n", "4 [http://hedatuz.euskomedia.org/, nan] \n", "\n", " roar_title \\\n", "0 [nan, nan] \n", "1 [nan, ErUCU: Electronic repository of the Ukra... 
\n", "2 [nan, nan] \n", "3 [Giresun University Institutional Repository, ... \n", "4 [Hedatuz, nan] \n", "\n", " roar_oai_pmh \\\n", "0 [nan, nan] \n", "1 [nan, http://er.ucu.edu.ua/oai/request] \n", "2 [nan, nan] \n", "3 [https://acikerisim.giresun.edu.tr/oai, nan] \n", "4 [http://hedatuz.euskomedia.org/cgi/oai2, nan] \n", "\n", " roar_sword_endpoint \\\n", "0 [nan, nan] \n", "1 [nan, http://er.ucu.edu.ua/sword/] \n", "2 [nan, nan] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " roar_rss_feed roar_twitter_feed \\\n", "0 [nan, nan] [nan, nan] \n", "1 [nan, http://er.ucu.edu.ua/feed/rss_2.0/site] [nan, nan] \n", "2 [nan, nan] [nan, nan] \n", "3 [nan, nan] [nan, nan] \n", "4 [http://hedatuz.euskomedia.org/cgi/latest_tool... [nan, nan] \n", "\n", " roar_description roar_fulltext \\\n", "0 [nan, nan] [nan, nan] \n", "1 [nan, Ukrainian Catholic University’s institut... [nan, TRUE] \n", "2 [nan, nan] [nan, nan] \n", "3 [DSpace@Giresun is a growing collection of Gir... [TRUE, nan] \n", "4 [Hedatuz, created by the Euskomedia Fundazioa,... 
[TRUE, nan] \n", "\n", " roar_open_access roar_mandate roar_organisation_title \\\n", "0 [nan, nan] [nan, nan] [nan, nan] \n", "1 [nan, TRUE] [nan, TRUE] [nan, Ukrainian Catholic University] \n", "2 [nan, nan] [nan, nan] [nan, nan] \n", "3 [TRUE, nan] [TRUE, nan] [Giresun University, nan] \n", "4 [TRUE, nan] [nan, nan] [Euskomedia Fundazioa, nan] \n", "\n", " roar_organisation_home_page roar_location_country \\\n", "0 [nan, nan] [nan, nan] \n", "1 [nan, http://ucu.edu.ua/eng/] [nan, ua] \n", "2 [nan, nan] [nan, nan] \n", "3 [https://www.giresun.edu.tr/, nan] [tr, nan] \n", "4 [http://www.euskomedia.org, nan] [org, nan] \n", "\n", " roar_location_city roar_location_latitude roar_location_longitude \\\n", "0 [nan, nan] [nan, nan] [nan, nan] \n", "1 [nan, Lviv] [nan, nan] [nan, nan] \n", "2 [nan, nan] [nan, nan] [nan, nan] \n", "3 [Giresun, nan] [40.9147, nan] [38.323, nan] \n", "4 [ (Unknown city), nan] [nan, nan] [nan, nan] \n", "\n", " roar_software roar_geoname roar_version \\\n", "0 [nan, nan] [nan, nan] [nan, nan] \n", "1 [nan, dspace] [nan, geoname_2_UA] [nan, other] \n", "2 [nan, nan] [nan, nan] [nan, nan] \n", "3 [dspace, nan] [geoname_2_TR, nan] [other, nan] \n", "4 [eprints, nan] [geoname_2_ORG, nan] [eprints-3.0.5, nan] \n", "\n", " roar_subjects \\\n", "0 [nan, nan] \n", "1 [nan, [B1, BS, BL, AC, D204, DK, HM, BF, L1, D... \n", "2 [nan, nan] \n", "3 [nan, nan] \n", "4 [nan, nan] \n", "\n", " roar_date \\\n", "0 [nan, nan] \n", "1 [nan, 2015-07-07 12:38:37] \n", "2 [nan, nan] \n", "3 [2020-05-29 18:13:17, nan] \n", "4 [2008-10-03 15:36:07, nan] \n", "\n", " roar_note roar_suggestions \\\n", "0 [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] \n", "2 [nan, nan] [nan, nan] \n", "3 [DSpace@Giresun is a growing collection of Gir... 
[nan, nan] \n", "4 [nan, nan] [nan, nan] \n", "\n", " roar_activity_low roar_activity_medium roar_activity_high roar_recordcount \\\n", "0 [nan, nan] [nan, nan] [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] [nan, nan] [nan, nan] \n", "2 [nan, nan] [nan, nan] [nan, nan] [nan, nan] \n", "3 [nan, nan] [nan, nan] [nan, nan] [nan, nan] \n", "4 [0, nan] [0, nan] [0, nan] [100, nan] \n", "\n", " roar_recordhistory roar_fulltexts_total \\\n", "0 [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] \n", "2 [nan, nan] [nan, nan] \n", "3 [nan, nan] [nan, nan] \n", "4 [0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,90,90,91,... [nan, nan] \n", "\n", " roar_fulltexts_docs roar_fulltexts_rtotal roar_fulltexts_rdocs \\\n", "0 [nan, nan] [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] [nan, nan] \n", "2 [nan, nan] [nan, nan] [nan, nan] \n", "3 [nan, nan] [nan, nan] [nan, nan] \n", "4 [nan, nan] [nan, nan] [nan, nan] \n", "\n", " roar_registry_name roar_registry_id \\\n", "0 [nan, nan] [nan, nan] \n", "1 [nan, [opendoar, celestial]] [nan, [5883, 3410]] \n", "2 [nan, nan] [nan, nan] \n", "3 [roarmap, nan] [http://roarmap.eprints.org/1046/, nan] \n", "4 [[opendoar, celestial], nan] [[1426, 1294], nan] \n", "\n", " roar_submit_to roar_submitted_to_name roar_submitted_to_done \\\n", "0 [nan, nan] [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] [nan, nan] \n", "2 [nan, nan] [nan, nan] [nan, nan] \n", "3 [nan, nan] [nan, nan] [nan, nan] \n", "4 [nan, nan] [nan, nan] [nan, nan] \n", "\n", " roar_webometrics_rank roar_webometrics_size roar_webometrics_visibility \\\n", "0 [nan, nan] [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] [nan, nan] \n", "2 [nan, nan] [nan, nan] [nan, nan] \n", "3 [nan, nan] [nan, nan] [nan, nan] \n", "4 [570, nan] [331, nan] [519, nan] \n", "\n", " roar_webometrics_rich_files roar_webometrics_scholar roar_monthly_deposits \\\n", "0 [nan, nan] [nan, nan] [nan, nan] \n", "1 [nan, nan] [nan, nan] [nan, nan] \n", "2 [nan, nan] [nan, nan] [nan, nan] \n", "3 [nan, 
def remove_nan(list_obj):
    """Return ``list_obj`` with its top-level NaN entries dropped.

    Meant to be applied cell by cell (e.g. through ``DataFrame.applymap``) to
    frames whose cells hold lists.

    Parameters
    ----------
    list_obj : object
        A single cell value. Only ``list`` instances are filtered; any other
        value is passed through untouched.

    Returns
    -------
    object
        For a list: a new list with every float NaN removed and the order of
        the remaining items preserved. For anything else: ``list_obj`` itself.

    Notes
    -----
    * NaN is detected by type and value instead of ``np.nan in list_obj``.
      Membership tests and ``list.remove`` compare by identity first and then
      by equality, and NaN never equals itself, so they only ever find the
      ``np.nan`` singleton and leave behind NaNs that are distinct float
      objects.
    * The input list is not modified; a new list is returned, so the frame the
      function is applied to keeps its original cell contents.
    * Nested lists are kept as they are; only top-level entries are examined.
    """
    if not isinstance(list_obj, list):
        return list_obj
    # The isinstance guard keeps np.isnan away from strings, lists and other
    # non-numeric entries, for which it would raise a TypeError.
    return [
        item
        for item in list_obj
        if not (isinstance(item, (float, np.floating)) and np.isnan(item))
    ]