registries_analysis/notebooks/02-subjects&geographic.ipynb

9945 lines
401 KiB
Plaintext
Raw Normal View History

2021-07-22 11:03:05 +02:00
{
"cells": [
{
"cell_type": "code",
"execution_count": 1,
"metadata": {},
"outputs": [],
"source": [
"import ast\n",
"import csv\n",
"import json\n",
"import reverse_geocoder as rg\n",
"\n",
"import numpy as np\n",
"import pandas as pd\n",
"\n",
"import pycountry_convert\n",
"\n",
"import matplotlib.pyplot as plt\n",
"from matplotlib_venn import venn2, venn2_circles\n",
"\n",
"import plotly\n",
"from plotly.offline import iplot, init_notebook_mode\n",
"import plotly.graph_objs as go\n",
"import plotly.express as px\n",
"\n",
"pd.set_option('display.max_columns', None)"
]
},
{
"cell_type": "code",
"execution_count": 2,
"metadata": {},
"outputs": [],
"source": [
"def country_to_countrycode(country):\n",
"    \"\"\"Convert a country name to its alpha-3 country code.\n",
"\n",
"    Args:\n",
"        country: Country name to look up with ``pycountry_convert``; may be a missing value.\n",
"\n",
"    Returns:\n",
"        The alpha-3 code returned by ``pycountry_convert``, or ``np.nan`` when the\n",
"        input is missing or the lookup fails.\n",
"    \"\"\"\n",
"    if pd.isna(country):\n",
"        return np.nan\n",
"    try:\n",
"        return pycountry_convert.country_name_to_country_alpha3(country)\n",
"    except Exception:\n",
"        # Best effort: a name that cannot be mapped becomes NaN. Catching Exception\n",
"        # (not a bare except) lets KeyboardInterrupt/SystemExit propagate.\n",
"        return np.nan\n",
" \n",
"def countrycode_iso2_to_countrycode_iso3(country):\n",
"    \"\"\"Convert an alpha-2 country code to the matching alpha-3 code.\n",
"\n",
"    The conversion is done in two ``pycountry_convert`` steps: alpha-2 -> country\n",
"    name -> alpha-3.\n",
"\n",
"    Args:\n",
"        country: Alpha-2 country code; may be a missing value.\n",
"            NOTE(review): codes in the raw data appear in lower case (e.g. 'us');\n",
"            confirm whether callers upper-case them before calling this helper.\n",
"\n",
"    Returns:\n",
"        The alpha-3 code, or ``np.nan`` when the input is missing or either lookup fails.\n",
"    \"\"\"\n",
"    if pd.isna(country):\n",
"        return np.nan\n",
"    try:\n",
"        country_name = pycountry_convert.country_alpha2_to_country_name(country)\n",
"        return pycountry_convert.country_name_to_country_alpha3(country_name)\n",
"    except Exception:\n",
"        # Best effort: an unmappable code becomes NaN. Catching Exception\n",
"        # (not a bare except) lets KeyboardInterrupt/SystemExit propagate.\n",
"        return np.nan\n",
"\n",
"def countrycode_to_continent(country_code):\n",
"    \"\"\"Map an alpha-3 country code to a continent code.\n",
"\n",
"    The conversion is done in two ``pycountry_convert`` steps: alpha-3 -> alpha-2 ->\n",
"    continent code.\n",
"\n",
"    Args:\n",
"        country_code: Alpha-3 country code; may be a missing value.\n",
"\n",
"    Returns:\n",
"        The continent code returned by ``pycountry_convert``, or ``np.nan`` when the\n",
"        input is missing or either lookup fails.\n",
"    \"\"\"\n",
"    if pd.isna(country_code):\n",
"        return np.nan\n",
"    try:\n",
"        alpha2_code = pycountry_convert.country_alpha3_to_country_alpha2(country_code)\n",
"        return pycountry_convert.country_alpha2_to_continent_code(alpha2_code)\n",
"    except Exception:\n",
"        # Best effort: an unmappable code becomes NaN. Catching Exception\n",
"        # (not a bare except) lets KeyboardInterrupt/SystemExit propagate.\n",
"        return np.nan"
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"## Loading datasets"
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"**re3data**"
]
},
{
"cell_type": "code",
"execution_count": 3,
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>re3data_id</th>\n",
" <th>repository_name</th>\n",
" <th>type</th>\n",
" <th>subject</th>\n",
" <th>provider_type</th>\n",
" <th>keyword</th>\n",
" <th>institution</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>0</th>\n",
" <td>r3d100000001</td>\n",
" <td>Odum Institute Archive Dataverse</td>\n",
" <td>[disciplinary]</td>\n",
" <td>[1 Humanities and Social Sciences, 111 Social ...</td>\n",
" <td>[dataProvider]</td>\n",
" <td>[FAIR, Middle East, crime, demography, economy...</td>\n",
" <td>[[Odum Institute for Research in Social Scienc...</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1</th>\n",
" <td>r3d100000002</td>\n",
" <td>Access to Archival Databases</td>\n",
" <td>[disciplinary]</td>\n",
" <td>[1 Humanities and Social Sciences, 102 History...</td>\n",
" <td>[dataProvider]</td>\n",
" <td>[US History]</td>\n",
" <td>[[The U.S. National Archives and Records Admin...</td>\n",
" </tr>\n",
" <tr>\n",
" <th>2</th>\n",
" <td>r3d100000004</td>\n",
" <td>Datenbank Gesprochenes Deutsch</td>\n",
" <td>[disciplinary]</td>\n",
" <td>[1 Humanities and Social Sciences, 104 Linguis...</td>\n",
" <td>[dataProvider, serviceProvider]</td>\n",
" <td>[Australian German, FOLK, German dialects, Pfe...</td>\n",
" <td>[[Institut für Deutsche Sprache, Archiv für Ge...</td>\n",
" </tr>\n",
" <tr>\n",
" <th>3</th>\n",
" <td>r3d100000005</td>\n",
" <td>UNC Dataverse</td>\n",
" <td>[institutional]</td>\n",
" <td>[1 Humanities and Social Sciences, 111 Social ...</td>\n",
" <td>[dataProvider, serviceProvider]</td>\n",
" <td>[FAIR, census, demographic survey, demography,...</td>\n",
" <td>[[Odum Institute for Research in Social Scienc...</td>\n",
" </tr>\n",
" <tr>\n",
" <th>4</th>\n",
" <td>r3d100000006</td>\n",
" <td>Archaeology Data Service</td>\n",
" <td>[disciplinary]</td>\n",
" <td>[1 Humanities and Social Sciences, 101 Ancient...</td>\n",
" <td>[dataProvider, serviceProvider]</td>\n",
" <td>[FAIR, archaeology, cultural heritage, prehist...</td>\n",
" <td>[[Arts and Humanities Research Council, [AHRC]...</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"</div>"
],
"text/plain": [
" re3data_id repository_name type \\\n",
"0 r3d100000001 Odum Institute Archive Dataverse [disciplinary] \n",
"1 r3d100000002 Access to Archival Databases [disciplinary] \n",
"2 r3d100000004 Datenbank Gesprochenes Deutsch [disciplinary] \n",
"3 r3d100000005 UNC Dataverse [institutional] \n",
"4 r3d100000006 Archaeology Data Service [disciplinary] \n",
"\n",
" subject \\\n",
"0 [1 Humanities and Social Sciences, 111 Social ... \n",
"1 [1 Humanities and Social Sciences, 102 History... \n",
"2 [1 Humanities and Social Sciences, 104 Linguis... \n",
"3 [1 Humanities and Social Sciences, 111 Social ... \n",
"4 [1 Humanities and Social Sciences, 101 Ancient... \n",
"\n",
" provider_type \\\n",
"0 [dataProvider] \n",
"1 [dataProvider] \n",
"2 [dataProvider, serviceProvider] \n",
"3 [dataProvider, serviceProvider] \n",
"4 [dataProvider, serviceProvider] \n",
"\n",
" keyword \\\n",
"0 [FAIR, Middle East, crime, demography, economy... \n",
"1 [US History] \n",
"2 [Australian German, FOLK, German dialects, Pfe... \n",
"3 [FAIR, census, demographic survey, demography,... \n",
"4 [FAIR, archaeology, cultural heritage, prehist... \n",
"\n",
" institution \n",
"0 [[Odum Institute for Research in Social Scienc... \n",
"1 [[The U.S. National Archives and Records Admin... \n",
"2 [[Institut für Deutsche Sprache, Archiv für Ge... \n",
"3 [[Odum Institute for Research in Social Scienc... \n",
"4 [[Arts and Humanities Research Council, [AHRC]... "
]
},
"execution_count": 3,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"# Load the re3data export. The listed columns are parsed with ast.literal_eval\n",
"# so that their cells become Python objects instead of raw strings.\n",
"re3data_df = pd.read_csv(\n",
"    '../data/raw/re3data.tsv',\n",
"    sep='\\t',\n",
"    usecols=['re3data_id', 'repository_name', 'subject', 'keyword', 'type', 'provider_type', 'institution'],\n",
"    converters=dict.fromkeys(\n",
"        ['subject', 'keyword', 'additional_name', 'repository_id',\n",
"         'type', 'content_type', 'provider_type', 'institution'],\n",
"        ast.literal_eval,\n",
"    ),\n",
")\n",
"re3data_df.head()"
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
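"**Note:** rows whose `provider_type` is `serviceProvider` are filtered out in the next cell; `dataProvider` rows (and rows without a provider type) are kept."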
]
},
{
"cell_type": "code",
"execution_count": 4,
"metadata": {},
"outputs": [],
"source": [
"# Put every provider type on its own row, then keep only the rows that are not 'serviceProvider'.\n",
"re3data_df = (\n",
"    re3data_df\n",
"    .explode('provider_type')\n",
"    .loc[lambda frame: frame['provider_type'].ne('serviceProvider')]\n",
")"
]
},
{
"cell_type": "code",
"execution_count": 5,
"metadata": {
"scrolled": false
},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>re3data_id</th>\n",
" <th>repository_name</th>\n",
" <th>type</th>\n",
" <th>subject</th>\n",
" <th>provider_type</th>\n",
" <th>keyword</th>\n",
" <th>institution</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>count</th>\n",
" <td>2467</td>\n",
" <td>2467</td>\n",
" <td>2467</td>\n",
" <td>2467</td>\n",
" <td>2459</td>\n",
" <td>2467</td>\n",
" <td>2467</td>\n",
" </tr>\n",
" <tr>\n",
" <th>unique</th>\n",
" <td>2466</td>\n",
" <td>2463</td>\n",
" <td>9</td>\n",
" <td>1282</td>\n",
" <td>1</td>\n",
" <td>2248</td>\n",
" <td>2447</td>\n",
" </tr>\n",
" <tr>\n",
" <th>top</th>\n",
" <td>r3d100011987</td>\n",
" <td>Landmap</td>\n",
" <td>[disciplinary]</td>\n",
" <td>[1 Humanities and Social Sciences, 2 Life Scie...</td>\n",
" <td>dataProvider</td>\n",
" <td>[multidisciplinary]</td>\n",
" <td>[[National Center for Biotechnology Informatio...</td>\n",
" </tr>\n",
" <tr>\n",
" <th>freq</th>\n",
" <td>2</td>\n",
" <td>2</td>\n",
" <td>1573</td>\n",
" <td>200</td>\n",
" <td>2459</td>\n",
" <td>181</td>\n",
" <td>6</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"</div>"
],
"text/plain": [
" re3data_id repository_name type \\\n",
"count 2467 2467 2467 \n",
"unique 2466 2463 9 \n",
"top r3d100011987 Landmap [disciplinary] \n",
"freq 2 2 1573 \n",
"\n",
" subject provider_type \\\n",
"count 2467 2459 \n",
"unique 1282 1 \n",
"top [1 Humanities and Social Sciences, 2 Life Scie... dataProvider \n",
"freq 200 2459 \n",
"\n",
" keyword institution \n",
"count 2467 2467 \n",
"unique 2248 2447 \n",
"top [multidisciplinary] [[National Center for Biotechnology Informatio... \n",
"freq 181 6 "
]
},
"execution_count": 5,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"# Summarise every column of re3data_df (include='all' also covers the non-numeric columns).\n",
"re3data_df.describe(include='all')"
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"**openDOAR**"
]
},
{
"cell_type": "code",
"execution_count": 6,
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>opendoar_id</th>\n",
" <th>repository_name</th>\n",
" <th>type</th>\n",
" <th>subject</th>\n",
" <th>institution</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>0</th>\n",
" <td>101</td>\n",
" <td>utrecht university repository</td>\n",
" <td>institutional</td>\n",
" <td>[multidisciplinary]</td>\n",
" <td>[[university of utrecht, [universiteit utrecht...</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1</th>\n",
" <td>115</td>\n",
" <td>dspace at indian institute of management kozhi...</td>\n",
" <td>institutional</td>\n",
" <td>[ecology and environment, social sciences gene...</td>\n",
" <td>[[indian institute of management kozhikode, [i...</td>\n",
" </tr>\n",
" <tr>\n",
" <th>2</th>\n",
" <td>41</td>\n",
" <td>caltech engineering and science online</td>\n",
" <td>institutional</td>\n",
" <td>[biology and biochemistry, chemistry and chemi...</td>\n",
" <td>[[california institute of technology, [caltech...</td>\n",
" </tr>\n",
" <tr>\n",
" <th>3</th>\n",
" <td>119</td>\n",
" <td>dcu online research access service</td>\n",
" <td>institutional</td>\n",
" <td>[multidisciplinary]</td>\n",
" <td>[[dublin city university, [dcu], ie, [], , htt...</td>\n",
" </tr>\n",
" <tr>\n",
" <th>4</th>\n",
" <td>129</td>\n",
" <td>earth-prints repository</td>\n",
" <td>disciplinary</td>\n",
" <td>[earth and planetary sciences]</td>\n",
" <td>[[istituto nazionale di geofisica e vulcanolog...</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"</div>"
],
"text/plain": [
" opendoar_id repository_name \\\n",
"0 101 utrecht university repository \n",
"1 115 dspace at indian institute of management kozhi... \n",
"2 41 caltech engineering and science online \n",
"3 119 dcu online research access service \n",
"4 129 earth-prints repository \n",
"\n",
" type subject \\\n",
"0 institutional [multidisciplinary] \n",
"1 institutional [ecology and environment, social sciences gene... \n",
"2 institutional [biology and biochemistry, chemistry and chemi... \n",
"3 institutional [multidisciplinary] \n",
"4 disciplinary [earth and planetary sciences] \n",
"\n",
" institution \n",
"0 [[university of utrecht, [universiteit utrecht... \n",
"1 [[indian institute of management kozhikode, [i... \n",
"2 [[california institute of technology, [caltech... \n",
"3 [[dublin city university, [dcu], ie, [], , htt... \n",
"4 [[istituto nazionale di geofisica e vulcanolog... "
]
},
"execution_count": 6,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"# Load the openDOAR export. The listed columns are parsed with ast.literal_eval\n",
"# so that their cells become Python objects instead of raw strings.\n",
"opendoar_df = pd.read_csv(\n",
"    '../data/raw/openDoar.tsv',\n",
"    sep='\\t',\n",
"    usecols=['opendoar_id', 'repository_name', 'subject', 'type', 'institution'],\n",
"    converters=dict.fromkeys(\n",
"        ['subject', 'additional_name', 'opendoar_id', 'content_type', 'institution'],\n",
"        ast.literal_eval,\n",
"    ),\n",
")\n",
"opendoar_df.head()"
]
},
{
"cell_type": "code",
"execution_count": 7,
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>opendoar_id</th>\n",
" <th>repository_name</th>\n",
" <th>type</th>\n",
" <th>subject</th>\n",
" <th>institution</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>count</th>\n",
" <td>5707.000000</td>\n",
" <td>5707</td>\n",
" <td>5707</td>\n",
" <td>5707</td>\n",
" <td>5707</td>\n",
" </tr>\n",
" <tr>\n",
" <th>unique</th>\n",
" <td>NaN</td>\n",
" <td>5670</td>\n",
" <td>4</td>\n",
" <td>820</td>\n",
" <td>5098</td>\n",
" </tr>\n",
" <tr>\n",
" <th>top</th>\n",
" <td>NaN</td>\n",
" <td>arch</td>\n",
" <td>institutional</td>\n",
" <td>[multidisciplinary]</td>\n",
" <td>[[rijksuniversiteit groningen, [rug], nl, [], ...</td>\n",
" </tr>\n",
" <tr>\n",
" <th>freq</th>\n",
" <td>NaN</td>\n",
" <td>3</td>\n",
" <td>5067</td>\n",
" <td>3212</td>\n",
" <td>26</td>\n",
" </tr>\n",
" <tr>\n",
" <th>mean</th>\n",
" <td>4008.118801</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" </tr>\n",
" <tr>\n",
" <th>std</th>\n",
" <td>2869.948770</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" </tr>\n",
" <tr>\n",
" <th>min</th>\n",
" <td>2.000000</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" </tr>\n",
" <tr>\n",
" <th>25%</th>\n",
" <td>1823.000000</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" </tr>\n",
" <tr>\n",
" <th>50%</th>\n",
" <td>3361.000000</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" </tr>\n",
" <tr>\n",
" <th>75%</th>\n",
" <td>5095.000000</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" </tr>\n",
" <tr>\n",
" <th>max</th>\n",
" <td>10175.000000</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"</div>"
],
"text/plain": [
" opendoar_id repository_name type subject \\\n",
"count 5707.000000 5707 5707 5707 \n",
"unique NaN 5670 4 820 \n",
"top NaN arch institutional [multidisciplinary] \n",
"freq NaN 3 5067 3212 \n",
"mean 4008.118801 NaN NaN NaN \n",
"std 2869.948770 NaN NaN NaN \n",
"min 2.000000 NaN NaN NaN \n",
"25% 1823.000000 NaN NaN NaN \n",
"50% 3361.000000 NaN NaN NaN \n",
"75% 5095.000000 NaN NaN NaN \n",
"max 10175.000000 NaN NaN NaN \n",
"\n",
" institution \n",
"count 5707 \n",
"unique 5098 \n",
"top [[rijksuniversiteit groningen, [rug], nl, [], ... \n",
"freq 26 \n",
"mean NaN \n",
"std NaN \n",
"min NaN \n",
"25% NaN \n",
"50% NaN \n",
"75% NaN \n",
"max NaN "
]
},
"execution_count": 7,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"# Summarise every column of opendoar_df (include='all' also covers the non-numeric columns).\n",
"opendoar_df.describe(include='all')"
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"**ROAR**"
]
},
{
"cell_type": "code",
"execution_count": 45,
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>eprintid</th>\n",
" <th>home_page</th>\n",
" <th>title</th>\n",
" <th>location_country</th>\n",
" <th>subjects</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>0</th>\n",
" <td>921</td>\n",
" <td>http://alcme.oclc.org/ndltd/index.html</td>\n",
" <td>Networked Digital Library of Theses and Disser...</td>\n",
" <td>us</td>\n",
" <td>NaN</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1</th>\n",
" <td>1489</td>\n",
" <td>http://prensahistorica.mcu.es/prensahistorica/...</td>\n",
" <td>Virtual Library of Historical Press</td>\n",
" <td>es</td>\n",
" <td>NaN</td>\n",
" </tr>\n",
" <tr>\n",
" <th>2</th>\n",
" <td>606</td>\n",
" <td>http://hal.archives-ouvertes.fr/</td>\n",
" <td>HAL: Hyper Article en Ligne</td>\n",
" <td>fr</td>\n",
" <td>NaN</td>\n",
" </tr>\n",
" <tr>\n",
" <th>3</th>\n",
" <td>606</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" </tr>\n",
" <tr>\n",
" <th>4</th>\n",
" <td>606</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"</div>"
],
"text/plain": [
" eprintid home_page \\\n",
"0 921 http://alcme.oclc.org/ndltd/index.html \n",
"1 1489 http://prensahistorica.mcu.es/prensahistorica/... \n",
"2 606 http://hal.archives-ouvertes.fr/ \n",
"3 606 NaN \n",
"4 606 NaN \n",
"\n",
" title location_country subjects \n",
"0 Networked Digital Library of Theses and Disser... us NaN \n",
"1 Virtual Library of Historical Press es NaN \n",
"2 HAL: Hyper Article en Ligne fr NaN \n",
"3 NaN NaN NaN \n",
"4 NaN NaN NaN "
]
},
"execution_count": 45,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"# Load a five-column subset of the ROAR CSV export and preview it.\n",
"roar_df = pd.read_csv(\n",
"    '../data/raw/export_roar_CSV.csv',\n",
"    usecols=['eprintid', 'home_page', 'title', 'location_country', 'subjects'],\n",
")\n",
"roar_df.head()"
]
},
{
"cell_type": "code",
"execution_count": 43,
"metadata": {},
"outputs": [],
"source": [
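"# Left disabled (TODO: confirm the reason, then delete this cell). With keep=False this call would drop\n",
"# every row whose (home_page, title, location_country, subjects) values occur more than once, which\n",
"# includes continuation rows (only `subjects` filled) whenever two repositories share a subject code.\n",
"# roar_df.drop_duplicates(subset=['home_page', 'title' , 'location_country', 'subjects'], keep=False, inplace=True)"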
]
},
{
"cell_type": "code",
"execution_count": 47,
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>eprintid</th>\n",
" <th>home_page</th>\n",
" <th>title</th>\n",
" <th>location_country</th>\n",
" <th>subjects</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>106</th>\n",
" <td>2303</td>\n",
" <td>NaN</td>\n",
" <td>Faculty Scholarship at The Claremont Colleges</td>\n",
" <td>us</td>\n",
" <td>AS</td>\n",
" </tr>\n",
" <tr>\n",
" <th>107</th>\n",
" <td>2303</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>BF</td>\n",
" </tr>\n",
" <tr>\n",
" <th>108</th>\n",
" <td>2303</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>BL</td>\n",
" </tr>\n",
" <tr>\n",
" <th>109</th>\n",
" <td>2303</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>CC</td>\n",
" </tr>\n",
" <tr>\n",
" <th>110</th>\n",
" <td>2303</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>GN</td>\n",
" </tr>\n",
" <tr>\n",
" <th>111</th>\n",
" <td>2303</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>H1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>112</th>\n",
" <td>2303</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>HB</td>\n",
" </tr>\n",
" <tr>\n",
" <th>113</th>\n",
" <td>2303</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>JA</td>\n",
" </tr>\n",
" <tr>\n",
" <th>114</th>\n",
" <td>2303</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>LB</td>\n",
" </tr>\n",
" <tr>\n",
" <th>115</th>\n",
" <td>2303</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NX</td>\n",
" </tr>\n",
" <tr>\n",
" <th>116</th>\n",
" <td>2303</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>PQ</td>\n",
" </tr>\n",
" <tr>\n",
" <th>117</th>\n",
" <td>2303</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>QA</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"</div>"
],
"text/plain": [
" eprintid home_page title \\\n",
"106 2303 NaN Faculty Scholarship at The Claremont Colleges \n",
"107 2303 NaN NaN \n",
"108 2303 NaN NaN \n",
"109 2303 NaN NaN \n",
"110 2303 NaN NaN \n",
"111 2303 NaN NaN \n",
"112 2303 NaN NaN \n",
"113 2303 NaN NaN \n",
"114 2303 NaN NaN \n",
"115 2303 NaN NaN \n",
"116 2303 NaN NaN \n",
"117 2303 NaN NaN \n",
"\n",
" location_country subjects \n",
"106 us AS \n",
"107 NaN BF \n",
"108 NaN BL \n",
"109 NaN CC \n",
"110 NaN GN \n",
"111 NaN H1 \n",
"112 NaN HB \n",
"113 NaN JA \n",
"114 NaN LB \n",
"115 NaN NX \n",
"116 NaN PQ \n",
"117 NaN QA "
]
},
"execution_count": 47,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"# Show all rows of a single ROAR record (eprintid 2303) to see how one record is spread over several rows.\n",
"roar_df[roar_df.eprintid == 2303]"
]
},
{
"cell_type": "code",
"execution_count": 44,
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>eprintid</th>\n",
" <th>home_page</th>\n",
" <th>title</th>\n",
" <th>location_country</th>\n",
" <th>subjects</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>count</th>\n",
" <td>5314.000000</td>\n",
" <td>5263</td>\n",
" <td>5268</td>\n",
" <td>5024</td>\n",
" <td>1225</td>\n",
" </tr>\n",
" <tr>\n",
" <th>unique</th>\n",
" <td>NaN</td>\n",
" <td>5156</td>\n",
" <td>5027</td>\n",
" <td>134</td>\n",
" <td>123</td>\n",
" </tr>\n",
" <tr>\n",
" <th>top</th>\n",
" <td>NaN</td>\n",
" <td>http://ir.lib.isu.edu.tw/</td>\n",
" <td>Repositorio Institucional</td>\n",
" <td>us</td>\n",
" <td>H1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>freq</th>\n",
" <td>NaN</td>\n",
" <td>3</td>\n",
" <td>7</td>\n",
" <td>877</td>\n",
" <td>147</td>\n",
" </tr>\n",
" <tr>\n",
" <th>mean</th>\n",
" <td>6389.464434</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" </tr>\n",
" <tr>\n",
" <th>std</th>\n",
" <td>5159.573937</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" </tr>\n",
" <tr>\n",
" <th>min</th>\n",
" <td>1.000000</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" </tr>\n",
" <tr>\n",
" <th>25%</th>\n",
" <td>1490.250000</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" </tr>\n",
" <tr>\n",
" <th>50%</th>\n",
" <td>4990.500000</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" </tr>\n",
" <tr>\n",
" <th>75%</th>\n",
" <td>10452.750000</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" </tr>\n",
" <tr>\n",
" <th>max</th>\n",
" <td>17302.000000</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"</div>"
],
"text/plain": [
" eprintid home_page title \\\n",
"count 5314.000000 5263 5268 \n",
"unique NaN 5156 5027 \n",
"top NaN http://ir.lib.isu.edu.tw/ Repositorio Institucional \n",
"freq NaN 3 7 \n",
"mean 6389.464434 NaN NaN \n",
"std 5159.573937 NaN NaN \n",
"min 1.000000 NaN NaN \n",
"25% 1490.250000 NaN NaN \n",
"50% 4990.500000 NaN NaN \n",
"75% 10452.750000 NaN NaN \n",
"max 17302.000000 NaN NaN \n",
"\n",
" location_country subjects \n",
"count 5024 1225 \n",
"unique 134 123 \n",
"top us H1 \n",
"freq 877 147 \n",
"mean NaN NaN \n",
"std NaN NaN \n",
"min NaN NaN \n",
"25% NaN NaN \n",
"50% NaN NaN \n",
"75% NaN NaN \n",
"max NaN NaN "
]
},
"execution_count": 44,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"# Summarise every column of roar_df (include='all' also covers the non-numeric columns).\n",
"roar_df.describe(include='all')"
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"**FAIRsharing**"
]
},
{
"cell_type": "code",
"execution_count": 11,
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>full_name</th>\n",
" <th>short_name</th>\n",
" <th>fs_url</th>\n",
" <th>url</th>\n",
" <th>countries</th>\n",
" <th>subjects</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>0</th>\n",
" <td>GenBank</td>\n",
" <td>GenBank</td>\n",
" <td>https://fairsharing.org/10.25504/FAIRsharing.9...</td>\n",
" <td>https://www.ncbi.nlm.nih.gov/genbank/</td>\n",
" <td>European Union,Japan,United States</td>\n",
" <td>Bioinformatics,Data Management,Data Submission...</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1</th>\n",
" <td>GlycoNAVI</td>\n",
" <td>GlycoNAVI</td>\n",
" <td>https://fairsharing.org/10.25504/FAIRsharing.w...</td>\n",
" <td>https://glyconavi.org/</td>\n",
" <td>Japan</td>\n",
" <td>Chemistry,Glycomics,Life Science,Organic Chemi...</td>\n",
" </tr>\n",
" <tr>\n",
" <th>2</th>\n",
" <td>ADHDgene</td>\n",
" <td>ADHDgene</td>\n",
" <td>https://fairsharing.org/10.25504/FAIRsharing.m...</td>\n",
" <td>http://adhd.psych.ac.cn/</td>\n",
" <td>China</td>\n",
" <td>Biomedical Science,Genetics</td>\n",
" </tr>\n",
" <tr>\n",
" <th>3</th>\n",
" <td>Allele frequency resource for research and tea...</td>\n",
" <td>ALFRED</td>\n",
" <td>https://fairsharing.org/10.25504/FAIRsharing.y...</td>\n",
" <td>http://alfred.med.yale.edu</td>\n",
" <td>United States</td>\n",
" <td>Life Science</td>\n",
" </tr>\n",
" <tr>\n",
" <th>4</th>\n",
" <td>Animal Transcription Factor Database</td>\n",
" <td>AnimalTFDB</td>\n",
" <td>https://fairsharing.org/10.25504/FAIRsharing.e...</td>\n",
" <td>http://bioinfo.life.hust.edu.cn/AnimalTFDB/</td>\n",
" <td>China</td>\n",
" <td>Life Science</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"</div>"
],
"text/plain": [
" full_name short_name \\\n",
"0 GenBank GenBank \n",
"1 GlycoNAVI GlycoNAVI \n",
"2 ADHDgene ADHDgene \n",
"3 Allele frequency resource for research and tea... ALFRED \n",
"4 Animal Transcription Factor Database AnimalTFDB \n",
"\n",
" fs_url \\\n",
"0 https://fairsharing.org/10.25504/FAIRsharing.9... \n",
"1 https://fairsharing.org/10.25504/FAIRsharing.w... \n",
"2 https://fairsharing.org/10.25504/FAIRsharing.m... \n",
"3 https://fairsharing.org/10.25504/FAIRsharing.y... \n",
"4 https://fairsharing.org/10.25504/FAIRsharing.e... \n",
"\n",
" url \\\n",
"0 https://www.ncbi.nlm.nih.gov/genbank/ \n",
"1 https://glyconavi.org/ \n",
"2 http://adhd.psych.ac.cn/ \n",
"3 http://alfred.med.yale.edu \n",
"4 http://bioinfo.life.hust.edu.cn/AnimalTFDB/ \n",
"\n",
" countries \\\n",
"0 European Union,Japan,United States \n",
"1 Japan \n",
"2 China \n",
"3 United States \n",
"4 China \n",
"\n",
" subjects \n",
"0 Bioinformatics,Data Management,Data Submission... \n",
"1 Chemistry,Glycomics,Life Science,Organic Chemi... \n",
"2 Biomedical Science,Genetics \n",
"3 Life Science \n",
"4 Life Science "
]
},
"execution_count": 11,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"# Load the pipe-delimited FAIRsharing summary; header=0 together with `names`\n",
"# replaces the file's own header row with the column names given here.\n",
"fairsharing_df = pd.read_csv(\n",
"    '../data/raw/FAIRsharingDBrec_summary20210304.csv',\n",
"    sep='|',\n",
"    header=0,\n",
"    names=['full_name', 'short_name', 'fs_url', 'url', 'countries', 'subjects'],\n",
")\n",
"fairsharing_df.head()"
]
},
{
"cell_type": "code",
"execution_count": 12,
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>full_name</th>\n",
" <th>short_name</th>\n",
" <th>fs_url</th>\n",
" <th>url</th>\n",
" <th>countries</th>\n",
" <th>subjects</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>count</th>\n",
" <td>1752</td>\n",
" <td>1752</td>\n",
" <td>1752</td>\n",
" <td>1752</td>\n",
" <td>1749</td>\n",
" <td>1690</td>\n",
" </tr>\n",
" <tr>\n",
" <th>unique</th>\n",
" <td>1752</td>\n",
" <td>1741</td>\n",
" <td>1752</td>\n",
" <td>1752</td>\n",
" <td>178</td>\n",
" <td>834</td>\n",
" </tr>\n",
" <tr>\n",
" <th>top</th>\n",
" <td>CiteAb</td>\n",
" <td>CGD</td>\n",
" <td>https://fairsharing.org/10.25504/FAIRsharing.1...</td>\n",
" <td>http://www.plexdb.org/</td>\n",
" <td>United States</td>\n",
" <td>Life Science</td>\n",
" </tr>\n",
" <tr>\n",
" <th>freq</th>\n",
" <td>1</td>\n",
" <td>3</td>\n",
" <td>1</td>\n",
" <td>1</td>\n",
" <td>588</td>\n",
" <td>367</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"</div>"
],
"text/plain": [
" full_name short_name \\\n",
"count 1752 1752 \n",
"unique 1752 1741 \n",
"top CiteAb CGD \n",
"freq 1 3 \n",
"\n",
" fs_url \\\n",
"count 1752 \n",
"unique 1752 \n",
"top https://fairsharing.org/10.25504/FAIRsharing.1... \n",
"freq 1 \n",
"\n",
" url countries subjects \n",
"count 1752 1749 1690 \n",
"unique 1752 178 834 \n",
"top http://www.plexdb.org/ United States Life Science \n",
"freq 1 588 367 "
]
},
"execution_count": 12,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"# Summarise every column of fairsharing_df (include='all' also covers the non-numeric columns).\n",
"fairsharing_df.describe(include='all')"
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"## Subjects analysis"
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"**re3data**"
]
},
{
"cell_type": "code",
"execution_count": 13,
"metadata": {},
"outputs": [],
"source": [
"# One row per (repository, subject): explode the list-valued 'subject' column.\n",
"re3data_subjects = re3data_df.explode('subject')"
]
},
{
"cell_type": "code",
"execution_count": 37,
"metadata": {},
"outputs": [
{
"data": {
"application/vnd.plotly.v1+json": {
"config": {
"plotlyServerURL": "https://plot.ly"
},
"data": [
{
"name": "re3data tier 1-digits",
"type": "bar",
"x": [
"2 Life Sciences",
"3 Natural Sciences",
"1 Humanities and Social Sciences",
"4 Engineering Sciences"
],
"y": [
1346,
1216,
894,
468
]
},
{
"name": "re3data tier 2-digits",
"type": "bar",
"x": [
"21 Biology",
"34 Geosciences (including Geography)",
"22 Medicine",
"12 Social and Behavioural Sciences",
"11 Humanities",
"32 Physics",
"31 Chemistry",
"23 Agriculture, Forestry, Horticulture and Veterinary Medicine",
"44 Computer Science, Electrical and System Engineering",
"45 Construction Engineering and Architecture",
"43 Materials Science and Engineering",
"33 Mathematics",
"42 Thermal Engineering/Process Engineering",
"41 Mechanical and industrial Engineering"
],
"y": [
816,
689,
579,
417,
287,
284,
202,
178,
135,
43,
37,
30,
18,
10
]
},
{
"name": "re3data tier 3-digits",
"type": "bar",
"x": [
"201 Basic Biological and Medical Research",
"205 Medicine",
"313 Atmospheric Science and Oceanography",
"111 Social Sciences",
"315 Geophysics and Geodesy",
"203 Zoology",
"204 Microbiology, Virology and Immunology",
"112 Economics",
"202 Plant Sciences",
"311 Astrophysics and Astronomy",
"317 Geography",
"318 Water Research",
"207 Agriculture, Forestry, Horticulture and Veterinary Medicine",
"104 Linguistics",
"102 History",
"316 Geochemistry, Mineralogy and Crystallography",
"409 Computer Science",
"206 Neurosciences",
"308 Optics, Quantum Optics and Physics of Atoms, Molecules and Plasmas",
"314 Geology and Palaeontology",
"103 Fine Arts, Music, Theatre and Media Studies",
"101 Ancient Cultures",
"109 Education Sciences",
"309 Particles, Nuclei and Fields",
"113 Jurisprudence",
"301 Molecular Chemistry",
"106 Non-European Languages and Cultures, Social and Cultural Anthropology, Jewish Studies and Religious Studies",
"110 Psychology",
"410 Construction Engineering and Architecture",
"303 Physical and Theoretical Chemistry",
"105 Literary Studies",
"307 Condensed Matter Physics",
"407 Systems Engineering",
"304 Analytical Chemistry, Method Development (Chemistry)",
"406 Materials Science",
"305 Biological Chemistry and Food Chemistry",
"302 Chemical Solid State and Surface Research",
"107 Theology",
"408 Electrical Engineering",
"403 Process Engineering, Technical Chemistry",
"405 Materials Engineering",
"404 Heat Energy Technology, Thermal Machines, Fluid Mechanics",
"108 Philosophy",
"312 Mathematics",
"402 Mechanics and Constructive Mechanical Engineering",
"310 Statistical Physics, Soft Matter, Biological Physics, Nonlinear Dynamics",
"306 Polymer Research"
],
"y": [
477,
373,
359,
272,
240,
213,
200,
195,
195,
163,
143,
130,
124,
96,
94,
83,
81,
78,
72,
70,
70,
63,
58,
49,
48,
42,
42,
37,
35,
31,
26,
25,
24,
22,
22,
20,
20,
19,
14,
10,
9,
9,
8,
7,
5,
5,
4
]
},
{
"name": "re3data tier 5-digits",
"type": "bar",
"x": [
"20105 General Genetics",
"20107 Bioinformatics and Theoretical Biology",
"31302 Oceanography",
"20502 Public Health, Health Services Research, Social Medicine",
"31301 Atmospheric Science",
"20503 Human Genetics",
"11102 Empirical Social Research",
"31502 Geodesy, Photogrammetry, Remote Sensing, Geoinformatics, Cartogaphy",
"20306 Animal Genetics, Cell and Developmental Biology",
"20103 Cell Biology",
"20303 Animal Ecology, Biodiversity and Ecosystem Research",
"20101 Biochemistry",
"20202 Plant Ecology and Ecosystem Analysis",
"31501 Geophysics",
"11205 Statistics and Econometrics",
"20207 Plant Genetics",
"20501 Epidemiology, Medical Biometry, Medical Informatics",
"11104 Political Science",
"11202 Economic and Social Policy",
"31801 Hydrogeology, Hydrology, Limnology, Urban Water Management, Water Chemistry, Integrated Water Resources Management",
"20104 Structural Biology",
"20401 Metabolism, Biochemistry and Genetics of Microorganisms",
"20704 Ecology of Agricultural Landscapes",
"20701 Soil Sciences",
"31101 Astrophysics and Astronomy",
"31702 Human Geography",
"20710 Basic Forest Research",
"20509 Pharmacology",
"31701 Physical Geography",
"30301 Physical Chemistry of Molecules, Interfaces and Liquids - Spectroscopy, Kinetics",
"40904 Artificial Intelligence, Image and Language Processing",
"30801 Optics, Quantum Optics, Atoms, Molecules, Plasmas",
"20405 Immunology",
"20302 Evolution, Anthropology",
"10601 Social and Cultural Anthropology and Ethnology/Folklore",
"31601 Geochemistry, Mineralogy and Crystallography",
"20708 Agricultural Economics and Sociology",
"10203 Modern and Current History",
"31401 Geology and Palaeontology",
"10302 Musicology",
"10301 Art History",
"20532 Biomedical Technology and Medical Physics",
"20404 Virology",
"41002 Urbanism, Spatial Planning, Transportation and Infrastructure Planning, Landscape Planning",
"20606 Cognitive Neuroscience and Neuroimaging",
"20403 Medical Microbiology, Molecular Infection Biology",
"11204 Business Administration",
"20709 Inventory Control and Use of Forest Resources",
"20514 Hematology, Oncology, Transfusion Medicine",
"11103 Communication Science",
"20201 Plant Systematics and Evolution",
"20301 Systematics and Morphology",
"11203 Public Finance",
"41001 Architecture, Building and Construction History, Sustainable Building Technology, Building Design",
"40704 Traffic and Transport Systems, Logistics",
"20510 Toxicology and Occupational Medicine",
"20508 Pharmacy",
"20108 Anatomy",
"10104 Classical Archaeology",
"20205 Plant Biochemistry and Biophysics",
"20504 Physiology",
"11206 Economic and Social History",
"20102 Biophysics",
"10204 History of Science",
"30901 Particles, Nuclei and Fields",
"10902 Research on Teaching, Learning and Training",
"20305 Biochemistry and Animal Physiology",
"10903 Research on Socialization and Educational Institutions and Professions",
"30102 Organic Molecular Chemistry",
"11301 Legal and Political Philosophy, Legal History, Legal Theory",
"20530 Radiology and Nuclear Medicine",
"20705 Plant Breeding",
"20520 Pediatric and Adolescent Medicine",
"10605 Religious Studies and Jewish Studies",
"20702 Plant Cultivation",
"20604 Systemic Neuroscience, Computational Neuroscience, Behaviour",
"20402 Microbial Ecology and Applied Microbiology",
"10201 Medieval History",
"11303 Public Law",
"10403 Typology, Non-European Languages, Historical Linguistics",
"20707 Agricultural and Food Process Engineering",
"40902 Software Technology",
"20506 Pathology and Forensic Medicine",
"10202 Early Modern History",
"20713 Basic Veterinary Medical Science",
"30202 Physical Chemistry of Solids and Surfaces, Material Characterisation",
"10103 Ancient History",
"10101 Prehistory",
"30203 Theory and Modelling",
"10105 Egyptology and Ancient Near Eastern Studies",
"30101 Inorganic Molecular Chemistry",
"11305 Criminology",
"20515 Gastroenterology, Metabolism",
"20513 Pneumology, Clinical Infectiology Intensive Care Medicine",
"30501 Biological and Biomimetic Chemistry",
"40803 Electrical Energy Generation, Distribution, Application",
"40705 Human Factors, Ergonomics, Human-Machine Systems",
"40204 Acoustics",
"10303 Theatre and Media Studies",
"20601 Molecular Neuroscience and Neurogenetics",
"20531 Radiation Oncology and Radiobiology",
"30201 Solid State and Surface Chemistry, Material Synthesis",
"10402 Individual Linguistics",
"40903 Operating, Communication and Information Systems",
"20517 Endocrinology, Diabetology",
"20521 Gynaecology and Obstetrics",
"20505 Nutritional Sciences",
"20711 Animal Husbandry, Breeding and Hygiene",
"10401 General and Applied Linguistics",
"20714 Basic Research on Pathogenesis, Diagnostics and Therapy and Clinical Veterinary Medicine",
"20304 Sensory and Behavioural Biology",
"10603 African, American and Oceania Studies",
"30401 Analytical Chemistry, Method Development (Chemistry)",
"30302 General Theoretical Chemistry",
"11004 Differential Psychology, Clinical Psychology, Medical Psychology, Methodology",
"20611 Clinical Neurosciences III - Ophthalmology",
"20518 Rheumatology, Clinical Immunology, Allergology",
"20507 Clinical Chemistry and Pathobiochemistry",
"41004 Sructural Engineering, Building Informatics, Construction Operation",
"20524 Gerontology and Geriatric Medicine",
"30701 Experimental Condensed Matter Physics",
"20703 Plant Nutrition",
"10503 European and American Literature",
"20106 Developmental Biology",
"40401 Energy Process Engineering",
"10604 Islamic Studies, Arabian Studies, Semitic Studies",
"10701 Protestant Theology",
"11101 Sociological Theory",
"40802 Communication, High-Frequency and Network Technology, Theoretical Electrical Engineering",
"11003 Social Psychology, Industrial and Organisational Psychology",
"20204 Plant Physiology",
"11002 Developmental and Educational Psychology",
"40503 Composite Materials",
"40502 Sintered Metallic and Ceramic Materials",
"30502 Food Chemistry",
"40601 Thermodynamics and Kinetics of Materials",
"40605 Biomaterials",
"11001 General, Biological and Mathematical Psychology",
"40701 Automation, Control Systems, Robotics, Mechatronics",
"20206 Plant Cell and Developmental Biology",
"41006 Geotechnics, Hydraulic Engineering",
"11201 Economic Theory",
"10901 General Education and History of Education",
"10702 Roman Catholic Theology",
"11304 Criminal Law and Law of Criminal Procedure",
"10602 Asian Studies",
"40304 Biological Process Engineering",
"10504 General and Comparative Literature and Cultural Studies",
"20528 Dentistry, Oral Surgery",
"20519 Dermatology",
"20522 Reproductive Medicine/Biology",
"20512 Cardiology, Angiology",
"30603 Polymer Materials",
"30601 Preparatory and Physical Chemistry of Polymers",
"20609 Biological Psychiatry",
"40901 Theoretical Computer Science",
"41003 Construction Material Sciences, Chemistry, Building Physics",
"30702 Theoretical Condensed Matter Physics",
"20608 Clinical Neurosciences I - Neurology, Neurosurgery",
"20605 Comparative Neurobiology",
"30602 Experimental and Theoretical Physics of Polymers",
"11302 Private Law",
"20203 Inter-organismic Interactions of Plants",
"20603 Developmental Neurobiology",
"31001 Statistical Physics, Soft Matter, Biological Physics, Nonlinear Dynamics",
"10801 History of Philosophy",
"10102 Classical Philology",
"10501 Medieval German Literature",
"40801 Electronic Semiconductors, Components, Circuits, Systems",
"31201 Mathematics",
"20527 Traumatology and Orthopaedics",
"40702 Measurement Systems",
"20526 Cardiothoracic Surgery",
"20523 Urology",
"40603 Microstructural Mechanical Properties of Materials",
"40301 Chemical and Thermal Process Engineering",
"40501 Metallurgical and Thermal Processes, Thermomechanical Treatment of Materials",
"40302 Technical Chemistry",
"40402 Technical Thermodynamics",
"20602 Cellular Neuroscience"
],
"y": [
199,
166,
149,
125,
115,
109,
95,
89,
81,
77,
73,
68,
66,
63,
60,
59,
56,
51,
49,
45,
44,
33,
32,
32,
27,
26,
24,
23,
22,
22,
20,
20,
19,
19,
19,
18,
17,
17,
17,
17,
17,
16,
16,
15,
15,
15,
14,
14,
14,
14,
14,
14,
13,
13,
13,
12,
12,
12,
11,
11,
11,
11,
10,
10,
10,
10,
9,
9,
9,
9,
9,
9,
9,
9,
8,
8,
8,
8,
8,
7,
7,
7,
7,
7,
7,
7,
6,
6,
6,
6,
6,
6,
6,
5,
5,
5,
5,
5,
5,
5,
5,
5,
4,
4,
4,
4,
4,
4,
4,
4,
4,
4,
4,
4,
4,
3,
3,
3,
3,
3,
3,
3,
3,
3,
3,
3,
3,
3,
3,
3,
3,
3,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1
]
}
],
"layout": {
"template": {
"data": {
"bar": [
{
"error_x": {
"color": "#2a3f5f"
},
"error_y": {
"color": "#2a3f5f"
},
"marker": {
"line": {
"color": "#E5ECF6",
"width": 0.5
}
},
"type": "bar"
}
],
"barpolar": [
{
"marker": {
"line": {
"color": "#E5ECF6",
"width": 0.5
}
},
"type": "barpolar"
}
],
"carpet": [
{
"aaxis": {
"endlinecolor": "#2a3f5f",
"gridcolor": "white",
"linecolor": "white",
"minorgridcolor": "white",
"startlinecolor": "#2a3f5f"
},
"baxis": {
"endlinecolor": "#2a3f5f",
"gridcolor": "white",
"linecolor": "white",
"minorgridcolor": "white",
"startlinecolor": "#2a3f5f"
},
"type": "carpet"
}
],
"choropleth": [
{
"colorbar": {
"outlinewidth": 0,
"ticks": ""
},
"type": "choropleth"
}
],
"contour": [
{
"colorbar": {
"outlinewidth": 0,
"ticks": ""
},
"colorscale": [
[
0,
"#0d0887"
],
[
0.1111111111111111,
"#46039f"
],
[
0.2222222222222222,
"#7201a8"
],
[
0.3333333333333333,
"#9c179e"
],
[
0.4444444444444444,
"#bd3786"
],
[
0.5555555555555556,
"#d8576b"
],
[
0.6666666666666666,
"#ed7953"
],
[
0.7777777777777778,
"#fb9f3a"
],
[
0.8888888888888888,
"#fdca26"
],
[
1,
"#f0f921"
]
],
"type": "contour"
}
],
"contourcarpet": [
{
"colorbar": {
"outlinewidth": 0,
"ticks": ""
},
"type": "contourcarpet"
}
],
"heatmap": [
{
"colorbar": {
"outlinewidth": 0,
"ticks": ""
},
"colorscale": [
[
0,
"#0d0887"
],
[
0.1111111111111111,
"#46039f"
],
[
0.2222222222222222,
"#7201a8"
],
[
0.3333333333333333,
"#9c179e"
],
[
0.4444444444444444,
"#bd3786"
],
[
0.5555555555555556,
"#d8576b"
],
[
0.6666666666666666,
"#ed7953"
],
[
0.7777777777777778,
"#fb9f3a"
],
[
0.8888888888888888,
"#fdca26"
],
[
1,
"#f0f921"
]
],
"type": "heatmap"
}
],
"heatmapgl": [
{
"colorbar": {
"outlinewidth": 0,
"ticks": ""
},
"colorscale": [
[
0,
"#0d0887"
],
[
0.1111111111111111,
"#46039f"
],
[
0.2222222222222222,
"#7201a8"
],
[
0.3333333333333333,
"#9c179e"
],
[
0.4444444444444444,
"#bd3786"
],
[
0.5555555555555556,
"#d8576b"
],
[
0.6666666666666666,
"#ed7953"
],
[
0.7777777777777778,
"#fb9f3a"
],
[
0.8888888888888888,
"#fdca26"
],
[
1,
"#f0f921"
]
],
"type": "heatmapgl"
}
],
"histogram": [
{
"marker": {
"colorbar": {
"outlinewidth": 0,
"ticks": ""
}
},
"type": "histogram"
}
],
"histogram2d": [
{
"colorbar": {
"outlinewidth": 0,
"ticks": ""
},
"colorscale": [
[
0,
"#0d0887"
],
[
0.1111111111111111,
"#46039f"
],
[
0.2222222222222222,
"#7201a8"
],
[
0.3333333333333333,
"#9c179e"
],
[
0.4444444444444444,
"#bd3786"
],
[
0.5555555555555556,
"#d8576b"
],
[
0.6666666666666666,
"#ed7953"
],
[
0.7777777777777778,
"#fb9f3a"
],
[
0.8888888888888888,
"#fdca26"
],
[
1,
"#f0f921"
]
],
"type": "histogram2d"
}
],
"histogram2dcontour": [
{
"colorbar": {
"outlinewidth": 0,
"ticks": ""
},
"colorscale": [
[
0,
"#0d0887"
],
[
0.1111111111111111,
"#46039f"
],
[
0.2222222222222222,
"#7201a8"
],
[
0.3333333333333333,
"#9c179e"
],
[
0.4444444444444444,
"#bd3786"
],
[
0.5555555555555556,
"#d8576b"
],
[
0.6666666666666666,
"#ed7953"
],
[
0.7777777777777778,
"#fb9f3a"
],
[
0.8888888888888888,
"#fdca26"
],
[
1,
"#f0f921"
]
],
"type": "histogram2dcontour"
}
],
"mesh3d": [
{
"colorbar": {
"outlinewidth": 0,
"ticks": ""
},
"type": "mesh3d"
}
],
"parcoords": [
{
"line": {
"colorbar": {
"outlinewidth": 0,
"ticks": ""
}
},
"type": "parcoords"
}
],
"pie": [
{
"automargin": true,
"type": "pie"
}
],
"scatter": [
{
"marker": {
"colorbar": {
"outlinewidth": 0,
"ticks": ""
}
},
"type": "scatter"
}
],
"scatter3d": [
{
"line": {
"colorbar": {
"outlinewidth": 0,
"ticks": ""
}
},
"marker": {
"colorbar": {
"outlinewidth": 0,
"ticks": ""
}
},
"type": "scatter3d"
}
],
"scattercarpet": [
{
"marker": {
"colorbar": {
"outlinewidth": 0,
"ticks": ""
}
},
"type": "scattercarpet"
}
],
"scattergeo": [
{
"marker": {
"colorbar": {
"outlinewidth": 0,
"ticks": ""
}
},
"type": "scattergeo"
}
],
"scattergl": [
{
"marker": {
"colorbar": {
"outlinewidth": 0,
"ticks": ""
}
},
"type": "scattergl"
}
],
"scattermapbox": [
{
"marker": {
"colorbar": {
"outlinewidth": 0,
"ticks": ""
}
},
"type": "scattermapbox"
}
],
"scatterpolar": [
{
"marker": {
"colorbar": {
"outlinewidth": 0,
"ticks": ""
}
},
"type": "scatterpolar"
}
],
"scatterpolargl": [
{
"marker": {
"colorbar": {
"outlinewidth": 0,
"ticks": ""
}
},
"type": "scatterpolargl"
}
],
"scatterternary": [
{
"marker": {
"colorbar": {
"outlinewidth": 0,
"ticks": ""
}
},
"type": "scatterternary"
}
],
"surface": [
{
"colorbar": {
"outlinewidth": 0,
"ticks": ""
},
"colorscale": [
[
0,
"#0d0887"
],
[
0.1111111111111111,
"#46039f"
],
[
0.2222222222222222,
"#7201a8"
],
[
0.3333333333333333,
"#9c179e"
],
[
0.4444444444444444,
"#bd3786"
],
[
0.5555555555555556,
"#d8576b"
],
[
0.6666666666666666,
"#ed7953"
],
[
0.7777777777777778,
"#fb9f3a"
],
[
0.8888888888888888,
"#fdca26"
],
[
1,
"#f0f921"
]
],
"type": "surface"
}
],
"table": [
{
"cells": {
"fill": {
"color": "#EBF0F8"
},
"line": {
"color": "white"
}
},
"header": {
"fill": {
"color": "#C8D4E3"
},
"line": {
"color": "white"
}
},
"type": "table"
}
]
},
"layout": {
"annotationdefaults": {
"arrowcolor": "#2a3f5f",
"arrowhead": 0,
"arrowwidth": 1
},
"autotypenumbers": "strict",
"coloraxis": {
"colorbar": {
"outlinewidth": 0,
"ticks": ""
}
},
"colorscale": {
"diverging": [
[
0,
"#8e0152"
],
[
0.1,
"#c51b7d"
],
[
0.2,
"#de77ae"
],
[
0.3,
"#f1b6da"
],
[
0.4,
"#fde0ef"
],
[
0.5,
"#f7f7f7"
],
[
0.6,
"#e6f5d0"
],
[
0.7,
"#b8e186"
],
[
0.8,
"#7fbc41"
],
[
0.9,
"#4d9221"
],
[
1,
"#276419"
]
],
"sequential": [
[
0,
"#0d0887"
],
[
0.1111111111111111,
"#46039f"
],
[
0.2222222222222222,
"#7201a8"
],
[
0.3333333333333333,
"#9c179e"
],
[
0.4444444444444444,
"#bd3786"
],
[
0.5555555555555556,
"#d8576b"
],
[
0.6666666666666666,
"#ed7953"
],
[
0.7777777777777778,
"#fb9f3a"
],
[
0.8888888888888888,
"#fdca26"
],
[
1,
"#f0f921"
]
],
"sequentialminus": [
[
0,
"#0d0887"
],
[
0.1111111111111111,
"#46039f"
],
[
0.2222222222222222,
"#7201a8"
],
[
0.3333333333333333,
"#9c179e"
],
[
0.4444444444444444,
"#bd3786"
],
[
0.5555555555555556,
"#d8576b"
],
[
0.6666666666666666,
"#ed7953"
],
[
0.7777777777777778,
"#fb9f3a"
],
[
0.8888888888888888,
"#fdca26"
],
[
1,
"#f0f921"
]
]
},
"colorway": [
"#636efa",
"#EF553B",
"#00cc96",
"#ab63fa",
"#FFA15A",
"#19d3f3",
"#FF6692",
"#B6E880",
"#FF97FF",
"#FECB52"
],
"font": {
"color": "#2a3f5f"
},
"geo": {
"bgcolor": "white",
"lakecolor": "white",
"landcolor": "#E5ECF6",
"showlakes": true,
"showland": true,
"subunitcolor": "white"
},
"hoverlabel": {
"align": "left"
},
"hovermode": "closest",
"mapbox": {
"style": "light"
},
"paper_bgcolor": "white",
"plot_bgcolor": "#E5ECF6",
"polar": {
"angularaxis": {
"gridcolor": "white",
"linecolor": "white",
"ticks": ""
},
"bgcolor": "#E5ECF6",
"radialaxis": {
"gridcolor": "white",
"linecolor": "white",
"ticks": ""
}
},
"scene": {
"xaxis": {
"backgroundcolor": "#E5ECF6",
"gridcolor": "white",
"gridwidth": 2,
"linecolor": "white",
"showbackground": true,
"ticks": "",
"zerolinecolor": "white"
},
"yaxis": {
"backgroundcolor": "#E5ECF6",
"gridcolor": "white",
"gridwidth": 2,
"linecolor": "white",
"showbackground": true,
"ticks": "",
"zerolinecolor": "white"
},
"zaxis": {
"backgroundcolor": "#E5ECF6",
"gridcolor": "white",
"gridwidth": 2,
"linecolor": "white",
"showbackground": true,
"ticks": "",
"zerolinecolor": "white"
}
},
"shapedefaults": {
"line": {
"color": "#2a3f5f"
}
},
"ternary": {
"aaxis": {
"gridcolor": "white",
"linecolor": "white",
"ticks": ""
},
"baxis": {
"gridcolor": "white",
"linecolor": "white",
"ticks": ""
},
"bgcolor": "#E5ECF6",
"caxis": {
"gridcolor": "white",
"linecolor": "white",
"ticks": ""
}
},
"title": {
"x": 0.05
},
"xaxis": {
"automargin": true,
"gridcolor": "white",
"linecolor": "white",
"ticks": "",
"title": {
"standoff": 15
},
"zerolinecolor": "white",
"zerolinewidth": 2
},
"yaxis": {
"automargin": true,
"gridcolor": "white",
"linecolor": "white",
"ticks": "",
"title": {
"standoff": 15
},
"zerolinecolor": "white",
"zerolinewidth": 2
}
}
},
"title": {
"text": "Subject coverage re3data"
},
"xaxis": {
"tickangle": 45,
"tickfont": {
"size": 12
}
}
}
},
"text/html": [
"<div> <div id=\"1223706d-19c0-49a5-b3ba-d268c6c646b6\" class=\"plotly-graph-div\" style=\"height:525px; width:100%;\"></div> <script type=\"text/javascript\"> require([\"plotly\"], function(Plotly) { window.PLOTLYENV=window.PLOTLYENV || {}; if (document.getElementById(\"1223706d-19c0-49a5-b3ba-d268c6c646b6\")) { Plotly.newPlot( \"1223706d-19c0-49a5-b3ba-d268c6c646b6\", [{\"name\": \"re3data tier 1-digits\", \"type\": \"bar\", \"x\": [\"2 Life Sciences\", \"3 Natural Sciences\", \"1 Humanities and Social Sciences\", \"4 Engineering Sciences\"], \"y\": [1346, 1216, 894, 468]}, {\"name\": \"re3data tier 2-digits\", \"type\": \"bar\", \"x\": [\"21 Biology\", \"34 Geosciences (including Geography)\", \"22 Medicine\", \"12 Social and Behavioural Sciences\", \"11 Humanities\", \"32 Physics\", \"31 Chemistry\", \"23 Agriculture, Forestry, Horticulture and Veterinary Medicine\", \"44 Computer Science, Electrical and System Engineering\", \"45 Construction Engineering and Architecture\", \"43 Materials Science and Engineering\", \"33 Mathematics\", \"42 Thermal Engineering/Process Engineering\", \"41 Mechanical and industrial Engineering\"], \"y\": [816, 689, 579, 417, 287, 284, 202, 178, 135, 43, 37, 30, 18, 10]}, {\"name\": \"re3data tier 3-digits\", \"type\": \"bar\", \"x\": [\"201 Basic Biological and Medical Research\", \"205 Medicine\", \"313 Atmospheric Science and Oceanography\", \"111 Social Sciences\", \"315 Geophysics and Geodesy\", \"203 Zoology\", \"204 Microbiology, Virology and Immunology\", \"112 Economics\", \"202 Plant Sciences\", \"311 Astrophysics and Astronomy\", \"317 Geography\", \"318 Water Research\", \"207 Agriculture, Forestry, Horticulture and Veterinary Medicine\", \"104 Linguistics\", \"102 History\", \"316 Geochemistry, Mineralogy and Crystallography\", \"409 Computer Science\", \"206 Neurosciences\", \"308 Optics, Quantum Optics and Physics of Atoms, Molecules and Plasmas\", \"314 Geology and Palaeontology\", \"103 Fine Arts, Music, Theatre 
and Media Studies\", \"101 Ancient Cultures\", \"109 Education Sciences\", \"309 Particles, Nuclei and Fields\", \"113 Jurisprudence\", \"301 Molecular Chemistry\", \"106 Non-European Languages and Cultures, Social and Cultural Anthropology, Jewish Studies and Religious Studies\", \"110 Psychology\", \"410 Construction Engineering and Architecture\", \"303 Physical and Theoretical Chemistry\", \"105 Literary Studies\", \"307 Condensed Matter Physics\", \"407 Systems Engineering\", \"304 Analytical Chemistry, Method Development (Chemistry)\", \"406 Materials Science\", \"305 Biological Chemistry and Food Chemistry\", \"302 Chemical Solid State and Surface Research\", \"107 Theology\", \"408 Electrical Engineering\", \"403 Process Engineering, Technical Chemistry\", \"405 Materials Engineering\", \"404 Heat Energy Technology, Thermal Machines, Fluid Mechanics\", \"108 Philosophy\", \"312 Mathematics\", \"402 Mechanics and Constructive Mechanical Engineering\", \"310 Statistical Physics, Soft Matter, Biological Physics, Nonlinear Dynamics\", \"306 Polymer Research\"], \"y\": [477, 373, 359, 272, 240, 213, 200, 195, 195, 163, 143, 130, 124, 96, 94, 83, 81, 78, 72, 70, 70, 63, 58, 49, 48, 42, 42, 37, 35, 31, 26, 25, 24, 22, 22, 20, 20, 19, 14, 10, 9, 9, 8, 7, 5, 5, 4]}, {\"name\": \"re3data tier 5-digits\", \"type\": \"bar\", \"x\": [\"20105 General Genetics\", \"20107 Bioinformatics and Theoretical Biology\", \"31302 Oceanography\", \"20502 Public Health, Health Services Research, Social Medicine\", \"31301 Atmospheric Science\", \"20503 Human Genetics\", \"11102 Empirical Social Research\", \"31502 Geodesy, Photogrammetry, Remote Sensing, Geoinformatics, Cartogaphy\", \"20306 Animal Genetics, Cell and Developmental Biology\", \"20103 Cell Biology\", \"20303 Animal Ecology, Biodiversity and Ecosystem Research\", \"20101 Biochemistry\", \"20202 Plant Ecology and Ecosystem Analysis\", \"3150
" \n",
"var gd = document.getElementById('1223706d-19c0-49a5-b3ba-d268c6c646b6');\n",
"var x = new MutationObserver(function (mutations, observer) {{\n",
" var display = window.getComputedStyle(gd).display;\n",
" if (!display || display === 'none') {{\n",
" console.log([gd, 'removed!']);\n",
" Plotly.purge(gd);\n",
" observer.disconnect();\n",
" }}\n",
"}});\n",
"\n",
"// Listen for the removal of the full notebook cells\n",
"var notebookContainer = gd.closest('#notebook-container');\n",
"if (notebookContainer) {{\n",
" x.observe(notebookContainer, {childList: true});\n",
"}}\n",
"\n",
"// Listen for the clearing of the current output cell\n",
"var outputEl = gd.closest('.output');\n",
"if (outputEl) {{\n",
" x.observe(outputEl, {childList: true});\n",
"}}\n",
"\n",
" }) }; }); </script> </div>"
]
},
"metadata": {},
"output_type": "display_data"
}
],
"source": [
"data = re3data_subjects.groupby('subject')[['re3data_id']].count().sort_values('re3data_id', ascending=False)\n",
"plot = [\n",
" go.Bar(\n",
" x=data[data.index.str.contains('^\\d{%s}\\s' % tier, regex=True)].index,\n",
" y=data[data.index.str.contains('^\\d{%s}\\s' % tier, regex=True)]['re3data_id'],\n",
" name='re3data tier %s-digits' % tier\n",
" ) for tier in [1,2,3,5]\n",
"] \n",
"\n",
"layout = go.Layout(\n",
" title='Subject coverage re3data',\n",
" xaxis=dict(tickangle=45, tickfont=dict(size=12))\n",
")\n",
"\n",
"fig = go.Figure(plot, layout).show()"
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"**OpenDOAR**"
]
},
{
"cell_type": "code",
"execution_count": 15,
"metadata": {},
"outputs": [],
"source": [
"opendoar_subjects = opendoar_df.explode('subject')"
]
},
{
"cell_type": "code",
"execution_count": 16,
"metadata": {},
"outputs": [
{
"data": {
"application/vnd.plotly.v1+json": {
"config": {
"plotlyServerURL": "https://plot.ly"
},
"data": [
{
"type": "bar",
"x": [
"multidisciplinary",
"health and medicine",
"science general",
"technology general",
"business and economics",
"social sciences general",
"law and politics",
"history and archaeology",
"arts and humanities general",
"education",
"ecology and environment",
"agriculture, food and veterinary",
"biology and biochemistry",
"computers and it",
"geography and regional studies",
"language and literature",
"philosophy and religion",
"mathematics and statistics",
"library and information science",
"fine and performing arts",
"chemistry and chemical technology",
"physics and astronomy",
"earth and planetary sciences",
"management and planning",
"mechanical engineering and materials",
"psychology",
"electrical and electronic engineering",
"civil engineering",
"architecture"
],
"y": [
3359,
541,
370,
369,
334,
321,
305,
287,
259,
245,
222,
217,
207,
201,
197,
169,
169,
144,
143,
137,
131,
129,
121,
118,
106,
84,
80,
75,
74
]
}
],
"layout": {
"template": {
"data": {
"bar": [
{
"error_x": {
"color": "#2a3f5f"
},
"error_y": {
"color": "#2a3f5f"
},
"marker": {
"line": {
"color": "#E5ECF6",
"width": 0.5
}
},
"type": "bar"
}
],
"barpolar": [
{
"marker": {
"line": {
"color": "#E5ECF6",
"width": 0.5
}
},
"type": "barpolar"
}
],
"carpet": [
{
"aaxis": {
"endlinecolor": "#2a3f5f",
"gridcolor": "white",
"linecolor": "white",
"minorgridcolor": "white",
"startlinecolor": "#2a3f5f"
},
"baxis": {
"endlinecolor": "#2a3f5f",
"gridcolor": "white",
"linecolor": "white",
"minorgridcolor": "white",
"startlinecolor": "#2a3f5f"
},
"type": "carpet"
}
],
"choropleth": [
{
"colorbar": {
"outlinewidth": 0,
"ticks": ""
},
"type": "choropleth"
}
],
"contour": [
{
"colorbar": {
"outlinewidth": 0,
"ticks": ""
},
"colorscale": [
[
0,
"#0d0887"
],
[
0.1111111111111111,
"#46039f"
],
[
0.2222222222222222,
"#7201a8"
],
[
0.3333333333333333,
"#9c179e"
],
[
0.4444444444444444,
"#bd3786"
],
[
0.5555555555555556,
"#d8576b"
],
[
0.6666666666666666,
"#ed7953"
],
[
0.7777777777777778,
"#fb9f3a"
],
[
0.8888888888888888,
"#fdca26"
],
[
1,
"#f0f921"
]
],
"type": "contour"
}
],
"contourcarpet": [
{
"colorbar": {
"outlinewidth": 0,
"ticks": ""
},
"type": "contourcarpet"
}
],
"heatmap": [
{
"colorbar": {
"outlinewidth": 0,
"ticks": ""
},
"colorscale": [
[
0,
"#0d0887"
],
[
0.1111111111111111,
"#46039f"
],
[
0.2222222222222222,
"#7201a8"
],
[
0.3333333333333333,
"#9c179e"
],
[
0.4444444444444444,
"#bd3786"
],
[
0.5555555555555556,
"#d8576b"
],
[
0.6666666666666666,
"#ed7953"
],
[
0.7777777777777778,
"#fb9f3a"
],
[
0.8888888888888888,
"#fdca26"
],
[
1,
"#f0f921"
]
],
"type": "heatmap"
}
],
"heatmapgl": [
{
"colorbar": {
"outlinewidth": 0,
"ticks": ""
},
"colorscale": [
[
0,
"#0d0887"
],
[
0.1111111111111111,
"#46039f"
],
[
0.2222222222222222,
"#7201a8"
],
[
0.3333333333333333,
"#9c179e"
],
[
0.4444444444444444,
"#bd3786"
],
[
0.5555555555555556,
"#d8576b"
],
[
0.6666666666666666,
"#ed7953"
],
[
0.7777777777777778,
"#fb9f3a"
],
[
0.8888888888888888,
"#fdca26"
],
[
1,
"#f0f921"
]
],
"type": "heatmapgl"
}
],
"histogram": [
{
"marker": {
"colorbar": {
"outlinewidth": 0,
"ticks": ""
}
},
"type": "histogram"
}
],
"histogram2d": [
{
"colorbar": {
"outlinewidth": 0,
"ticks": ""
},
"colorscale": [
[
0,
"#0d0887"
],
[
0.1111111111111111,
"#46039f"
],
[
0.2222222222222222,
"#7201a8"
],
[
0.3333333333333333,
"#9c179e"
],
[
0.4444444444444444,
"#bd3786"
],
[
0.5555555555555556,
"#d8576b"
],
[
0.6666666666666666,
"#ed7953"
],
[
0.7777777777777778,
"#fb9f3a"
],
[
0.8888888888888888,
"#fdca26"
],
[
1,
"#f0f921"
]
],
"type": "histogram2d"
}
],
"histogram2dcontour": [
{
"colorbar": {
"outlinewidth": 0,
"ticks": ""
},
"colorscale": [
[
0,
"#0d0887"
],
[
0.1111111111111111,
"#46039f"
],
[
0.2222222222222222,
"#7201a8"
],
[
0.3333333333333333,
"#9c179e"
],
[
0.4444444444444444,
"#bd3786"
],
[
0.5555555555555556,
"#d8576b"
],
[
0.6666666666666666,
"#ed7953"
],
[
0.7777777777777778,
"#fb9f3a"
],
[
0.8888888888888888,
"#fdca26"
],
[
1,
"#f0f921"
]
],
"type": "histogram2dcontour"
}
],
"mesh3d": [
{
"colorbar": {
"outlinewidth": 0,
"ticks": ""
},
"type": "mesh3d"
}
],
"parcoords": [
{
"line": {
"colorbar": {
"outlinewidth": 0,
"ticks": ""
}
},
"type": "parcoords"
}
],
"pie": [
{
"automargin": true,
"type": "pie"
}
],
"scatter": [
{
"marker": {
"colorbar": {
"outlinewidth": 0,
"ticks": ""
}
},
"type": "scatter"
}
],
"scatter3d": [
{
"line": {
"colorbar": {
"outlinewidth": 0,
"ticks": ""
}
},
"marker": {
"colorbar": {
"outlinewidth": 0,
"ticks": ""
}
},
"type": "scatter3d"
}
],
"scattercarpet": [
{
"marker": {
"colorbar": {
"outlinewidth": 0,
"ticks": ""
}
},
"type": "scattercarpet"
}
],
"scattergeo": [
{
"marker": {
"colorbar": {
"outlinewidth": 0,
"ticks": ""
}
},
"type": "scattergeo"
}
],
"scattergl": [
{
"marker": {
"colorbar": {
"outlinewidth": 0,
"ticks": ""
}
},
"type": "scattergl"
}
],
"scattermapbox": [
{
"marker": {
"colorbar": {
"outlinewidth": 0,
"ticks": ""
}
},
"type": "scattermapbox"
}
],
"scatterpolar": [
{
"marker": {
"colorbar": {
"outlinewidth": 0,
"ticks": ""
}
},
"type": "scatterpolar"
}
],
"scatterpolargl": [
{
"marker": {
"colorbar": {
"outlinewidth": 0,
"ticks": ""
}
},
"type": "scatterpolargl"
}
],
"scatterternary": [
{
"marker": {
"colorbar": {
"outlinewidth": 0,
"ticks": ""
}
},
"type": "scatterternary"
}
],
"surface": [
{
"colorbar": {
"outlinewidth": 0,
"ticks": ""
},
"colorscale": [
[
0,
"#0d0887"
],
[
0.1111111111111111,
"#46039f"
],
[
0.2222222222222222,
"#7201a8"
],
[
0.3333333333333333,
"#9c179e"
],
[
0.4444444444444444,
"#bd3786"
],
[
0.5555555555555556,
"#d8576b"
],
[
0.6666666666666666,
"#ed7953"
],
[
0.7777777777777778,
"#fb9f3a"
],
[
0.8888888888888888,
"#fdca26"
],
[
1,
"#f0f921"
]
],
"type": "surface"
}
],
"table": [
{
"cells": {
"fill": {
"color": "#EBF0F8"
},
"line": {
"color": "white"
}
},
"header": {
"fill": {
"color": "#C8D4E3"
},
"line": {
"color": "white"
}
},
"type": "table"
}
]
},
"layout": {
"annotationdefaults": {
"arrowcolor": "#2a3f5f",
"arrowhead": 0,
"arrowwidth": 1
},
"autotypenumbers": "strict",
"coloraxis": {
"colorbar": {
"outlinewidth": 0,
"ticks": ""
}
},
"colorscale": {
"diverging": [
[
0,
"#8e0152"
],
[
0.1,
"#c51b7d"
],
[
0.2,
"#de77ae"
],
[
0.3,
"#f1b6da"
],
[
0.4,
"#fde0ef"
],
[
0.5,
"#f7f7f7"
],
[
0.6,
"#e6f5d0"
],
[
0.7,
"#b8e186"
],
[
0.8,
"#7fbc41"
],
[
0.9,
"#4d9221"
],
[
1,
"#276419"
]
],
"sequential": [
[
0,
"#0d0887"
],
[
0.1111111111111111,
"#46039f"
],
[
0.2222222222222222,
"#7201a8"
],
[
0.3333333333333333,
"#9c179e"
],
[
0.4444444444444444,
"#bd3786"
],
[
0.5555555555555556,
"#d8576b"
],
[
0.6666666666666666,
"#ed7953"
],
[
0.7777777777777778,
"#fb9f3a"
],
[
0.8888888888888888,
"#fdca26"
],
[
1,
"#f0f921"
]
],
"sequentialminus": [
[
0,
"#0d0887"
],
[
0.1111111111111111,
"#46039f"
],
[
0.2222222222222222,
"#7201a8"
],
[
0.3333333333333333,
"#9c179e"
],
[
0.4444444444444444,
"#bd3786"
],
[
0.5555555555555556,
"#d8576b"
],
[
0.6666666666666666,
"#ed7953"
],
[
0.7777777777777778,
"#fb9f3a"
],
[
0.8888888888888888,
"#fdca26"
],
[
1,
"#f0f921"
]
]
},
"colorway": [
"#636efa",
"#EF553B",
"#00cc96",
"#ab63fa",
"#FFA15A",
"#19d3f3",
"#FF6692",
"#B6E880",
"#FF97FF",
"#FECB52"
],
"font": {
"color": "#2a3f5f"
},
"geo": {
"bgcolor": "white",
"lakecolor": "white",
"landcolor": "#E5ECF6",
"showlakes": true,
"showland": true,
"subunitcolor": "white"
},
"hoverlabel": {
"align": "left"
},
"hovermode": "closest",
"mapbox": {
"style": "light"
},
"paper_bgcolor": "white",
"plot_bgcolor": "#E5ECF6",
"polar": {
"angularaxis": {
"gridcolor": "white",
"linecolor": "white",
"ticks": ""
},
"bgcolor": "#E5ECF6",
"radialaxis": {
"gridcolor": "white",
"linecolor": "white",
"ticks": ""
}
},
"scene": {
"xaxis": {
"backgroundcolor": "#E5ECF6",
"gridcolor": "white",
"gridwidth": 2,
"linecolor": "white",
"showbackground": true,
"ticks": "",
"zerolinecolor": "white"
},
"yaxis": {
"backgroundcolor": "#E5ECF6",
"gridcolor": "white",
"gridwidth": 2,
"linecolor": "white",
"showbackground": true,
"ticks": "",
"zerolinecolor": "white"
},
"zaxis": {
"backgroundcolor": "#E5ECF6",
"gridcolor": "white",
"gridwidth": 2,
"linecolor": "white",
"showbackground": true,
"ticks": "",
"zerolinecolor": "white"
}
},
"shapedefaults": {
"line": {
"color": "#2a3f5f"
}
},
"ternary": {
"aaxis": {
"gridcolor": "white",
"linecolor": "white",
"ticks": ""
},
"baxis": {
"gridcolor": "white",
"linecolor": "white",
"ticks": ""
},
"bgcolor": "#E5ECF6",
"caxis": {
"gridcolor": "white",
"linecolor": "white",
"ticks": ""
}
},
"title": {
"x": 0.05
},
"xaxis": {
"automargin": true,
"gridcolor": "white",
"linecolor": "white",
"ticks": "",
"title": {
"standoff": 15
},
"zerolinecolor": "white",
"zerolinewidth": 2
},
"yaxis": {
"automargin": true,
"gridcolor": "white",
"linecolor": "white",
"ticks": "",
"title": {
"standoff": 15
},
"zerolinecolor": "white",
"zerolinewidth": 2
}
}
},
"title": {
"text": "Subject coverage OpenDOAR"
},
"xaxis": {
"tickangle": 45,
"tickfont": {
"size": 12
}
}
}
},
"text/html": [
"<div> <div id=\"4eae2fe2-9946-4be7-9629-6c7eea715428\" class=\"plotly-graph-div\" style=\"height:525px; width:100%;\"></div> <script type=\"text/javascript\"> require([\"plotly\"], function(Plotly) { window.PLOTLYENV=window.PLOTLYENV || {}; if (document.getElementById(\"4eae2fe2-9946-4be7-9629-6c7eea715428\")) { Plotly.newPlot( \"4eae2fe2-9946-4be7-9629-6c7eea715428\", [{\"type\": \"bar\", \"x\": [\"multidisciplinary\", \"health and medicine\", \"science general\", \"technology general\", \"business and economics\", \"social sciences general\", \"law and politics\", \"history and archaeology\", \"arts and humanities general\", \"education\", \"ecology and environment\", \"agriculture, food and veterinary\", \"biology and biochemistry\", \"computers and it\", \"geography and regional studies\", \"language and literature\", \"philosophy and religion\", \"mathematics and statistics\", \"library and information science\", \"fine and performing arts\", \"chemistry and chemical technology\", \"physics and astronomy\", \"earth and planetary sciences\", \"management and planning\", \"mechanical engineering and materials\", \"psychology\", \"electrical and electronic engineering\", \"civil engineering\", \"architecture\"], \"y\": [3359, 541, 370, 369, 334, 321, 305, 287, 259, 245, 222, 217, 207, 201, 197, 169, 169, 144, 143, 137, 131, 129, 121, 118, 106, 84, 80, 75, 74]}], {\"template\": {\"data\": {\"bar\": [{\"error_x\": {\"color\": \"#2a3f5f\"}, \"error_y\": {\"color\": \"#2a3f5f\"}, \"marker\": {\"line\": {\"color\": \"#E5ECF6\", \"width\": 0.5}}, \"type\": \"bar\"}], \"barpolar\": [{\"marker\": {\"line\": {\"color\": \"#E5ECF6\", \"width\": 0.5}}, \"type\": \"barpolar\"}], \"carpet\": [{\"aaxis\": {\"endlinecolor\": \"#2a3f5f\", \"gridcolor\": \"white\", \"linecolor\": \"white\", \"minorgridcolor\": \"white\", \"startlinecolor\": \"#2a3f5f\"}, \"baxis\": {\"endlinecolor\": \"#2a3f5f\", \"gridcolor\": \"white\", \"linecolor\": \"white\", \"minorgridcolor\": \"white\", 
\"startlinecolor\": \"#2a3f5f\"}, \"type\": \"carpet\"}], \"choropleth\": [{\"colorbar\": {\"outlinewidth\": 0, \"ticks\": \"\"}, \"type\": \"choropleth\"}], \"contour\": [{\"colorbar\": {\"outlinewidth\": 0, \"ticks\": \"\"}, \"colorscale\": [[0.0, \"#0d0887\"], [0.1111111111111111, \"#46039f\"], [0.2222222222222222, \"#7201a8\"], [0.3333333333333333, \"#9c179e\"], [0.4444444444444444, \"#bd3786\"], [0.5555555555555556, \"#d8576b\"], [0.6666666666666666, \"#ed7953\"], [0.7777777777777778, \"#fb9f3a\"], [0.8888888888888888, \"#fdca26\"], [1.0, \"#f0f921\"]], \"type\": \"contour\"}], \"contourcarpet\": [{\"colorbar\": {\"outlinewidth\": 0, \"ticks\": \"\"}, \"type\": \"contourcarpet\"}], \"heatmap\": [{\"colorbar\": {\"outlinewidth\": 0, \"ticks\": \"\"}, \"colorscale\": [[0.0, \"#0d0887\"], [0.1111111111111111, \"#46039f\"], [0.2222222222222222, \"#7201a8\"], [0.3333333333333333, \"#9c179e\"], [0.4444444444444444, \"#bd3786\"], [0.5555555555555556, \"#d8576b\"], [0.6666666666666666, \"#ed7953\"], [0.7777777777777778, \"#fb9f3a\"], [0.8888888888888888, \"#fdca26\"], [1.0, \"#f0f921\"]], \"type\": \"heatmap\"}], \"heatmapgl\": [{\"colorbar\": {\"outlinewidth\": 0, \"ticks\": \"\"}, \"colorscale\": [[0.0, \"#0d0887\"], [0.1111111111111111, \"#46039f\"], [0.2222222222222222, \"#7201a8\"], [0.3333333333333333, \"#9c179e\"], [0.4444444444444444, \"#bd3786\"], [0.5555555555555556, \"#d8576b\"], [0.6666666666666666, \"#ed7953\"], [0.7777777777777778, \"#fb9f3a\"], [0.8888888888888888, \"#fdca26\"], [1.0, \"#f0f921\"]], \"type\": \"heatmapgl\"}], \"histogram\": [{\"marker\": {\"colorbar\": {\"outlinewidth\": 0, \"ticks\": \"\"}}, \"type\": \"histogram\"}], \"histogram2d\": [{\"colorbar\": {\"outlinewidth\": 0, \"ticks\": \"\"}, \"colorscale\": [[0.0, \"#0d0887\"], [0.1111111111111111, \"#46039f\"], [0.2222222222222222, \"#7201a8\"], [0.3333333333333333, \"#9c179e\"], [0.
" \n",
"var gd = document.getElementById('4eae2fe2-9946-4be7-9629-6c7eea715428');\n",
"var x = new MutationObserver(function (mutations, observer) {{\n",
" var display = window.getComputedStyle(gd).display;\n",
" if (!display || display === 'none') {{\n",
" console.log([gd, 'removed!']);\n",
" Plotly.purge(gd);\n",
" observer.disconnect();\n",
" }}\n",
"}});\n",
"\n",
"// Listen for the removal of the full notebook cells\n",
"var notebookContainer = gd.closest('#notebook-container');\n",
"if (notebookContainer) {{\n",
" x.observe(notebookContainer, {childList: true});\n",
"}}\n",
"\n",
"// Listen for the clearing of the current output cell\n",
"var outputEl = gd.closest('.output');\n",
"if (outputEl) {{\n",
" x.observe(outputEl, {childList: true});\n",
"}}\n",
"\n",
" }) }; }); </script> </div>"
]
},
"metadata": {},
"output_type": "display_data"
}
],
"source": [
"data = opendoar_subjects.groupby('subject')[['opendoar_id']].count().sort_values('opendoar_id', ascending=False)\n",
"plot = [\n",
" go.Bar(\n",
" x=data.index,\n",
" y=data['opendoar_id'],\n",
" ) \n",
"] \n",
"\n",
"layout = go.Layout(\n",
" title='Subject coverage OpenDOAR',\n",
" xaxis=dict(tickangle=45, tickfont=dict(size=12))\n",
")\n",
"\n",
"fig = go.Figure(plot, layout).show()"
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"**ROAR**"
]
},
{
"cell_type": "code",
"execution_count": 17,
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"array([nan, 'DP', 'Q1', 'AS', 'AC', 'AM', 'H1', 'L1', 'AI', 'GC', 'HD28',\n",
" 'F1201', 'R1', 'QM', 'BF', 'Z665', 'B1', 'DS', 'NX', 'K1', 'G1',\n",
" 'HA', 'D051', 'T1', 'QA', 'E151', 'D901', 'BP', 'QK', 'D1', 'HB',\n",
" 'GE', 'QE', 'QA76', 'QC', 'LB', 'RT', 'N1', 'BQ', 'QD', 'RA0421',\n",
" 'S1', 'LG', 'SH', 'ZA', 'LE', 'HV', 'DAW', 'C1', 'JA', 'AZ', 'QR',\n",
" 'F001', 'QH301', 'QB', 'QL', 'TJ', 'RZ', 'RS', 'GV', 'LB2300',\n",
" 'RF', 'RG', 'LA', 'Z004', 'HM', 'GA', 'M1', 'PI', 'BJ', 'BH', 'BC',\n",
" 'JL', 'J1', 'RK', 'TP', 'PE', 'TL', 'P1', 'HD61', 'BL', 'RM', 'RB',\n",
" 'QA75', 'SD', 'E11', 'HF5601', 'TA', 'D839', 'LF', 'CB', 'PG',\n",
" 'QH', 'HC', 'Z719', 'HE', 'TK', 'HT', 'CC', 'PL', 'HF', 'ZA4050',\n",
" 'NB', 'CT', 'HJ', 'HG', 'PD', 'JN', 'LD', 'DE', 'DF', 'DK', 'GN',\n",
" 'JX', 'QP', 'LC', 'TC'], dtype=object)"
]
},
"execution_count": 17,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"roar_df.subjects.unique()"
]
},
{
"cell_type": "code",
"execution_count": 39,
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>eprintid</th>\n",
" <th>home_page</th>\n",
" <th>title</th>\n",
" <th>location_country</th>\n",
" <th>subjects</th>\n",
" <th>continent</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>352</th>\n",
" <td>6412</td>\n",
" <td>https://dspace.cvut.cz/</td>\n",
" <td>Digital Library of the Czech Technical Univers...</td>\n",
" <td>CZE</td>\n",
" <td>HD28</td>\n",
" <td>EU</td>\n",
" </tr>\n",
" <tr>\n",
" <th>8164</th>\n",
" <td>14592</td>\n",
" <td>http://repository.stie-aub.ac.id</td>\n",
" <td>Welcome to Repository STIE AUB Surakarta - Rep...</td>\n",
" <td>IDN</td>\n",
" <td>HD28</td>\n",
" <td>AS</td>\n",
" </tr>\n",
" <tr>\n",
" <th>9402</th>\n",
" <td>13418</td>\n",
" <td>http://repositorio.gerens.edu.pe/</td>\n",
" <td>Repositorio de la Escuela de Postgrado Gerens</td>\n",
" <td>PER</td>\n",
" <td>HD28</td>\n",
" <td>SA</td>\n",
" </tr>\n",
" <tr>\n",
" <th>10929</th>\n",
" <td>11743</td>\n",
" <td>http://publikaciotar.repozitorium.uni-bge.hu/</td>\n",
" <td>BORY: Budapest Business School Repository</td>\n",
" <td>HUN</td>\n",
" <td>HD28</td>\n",
" <td>EU</td>\n",
" </tr>\n",
" <tr>\n",
" <th>11428</th>\n",
" <td>11134</td>\n",
" <td>https://eduq.info</td>\n",
" <td>ÉDUQ: Archive ouverte du réseau collégial du Q...</td>\n",
" <td>CAN</td>\n",
" <td>HD28</td>\n",
" <td>NA</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"</div>"
],
"text/plain": [
" eprintid home_page \\\n",
"352 6412 https://dspace.cvut.cz/ \n",
"8164 14592 http://repository.stie-aub.ac.id \n",
"9402 13418 http://repositorio.gerens.edu.pe/ \n",
"10929 11743 http://publikaciotar.repozitorium.uni-bge.hu/ \n",
"11428 11134 https://eduq.info \n",
"\n",
" title location_country \\\n",
"352 Digital Library of the Czech Technical Univers... CZE \n",
"8164 Welcome to Repository STIE AUB Surakarta - Rep... IDN \n",
"9402 Repositorio de la Escuela de Postgrado Gerens PER \n",
"10929 BORY: Budapest Business School Repository HUN \n",
"11428 ÉDUQ: Archive ouverte du réseau collégial du Q... CAN \n",
"\n",
" subjects continent \n",
"352 HD28 EU \n",
"8164 HD28 AS \n",
"9402 HD28 SA \n",
"10929 HD28 EU \n",
"11428 HD28 NA "
]
},
"execution_count": 39,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"roar_df[roar_df.subjects == 'HD28']"
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"**FAIRsharing**"
]
},
{
"cell_type": "code",
"execution_count": 19,
"metadata": {},
"outputs": [],
"source": [
"fairsharing_subjects = fairsharing_df.explode('subjects')"
]
},
{
"cell_type": "code",
"execution_count": 20,
"metadata": {},
"outputs": [
{
"data": {
"application/vnd.plotly.v1+json": {
"config": {
"plotlyServerURL": "https://plot.ly"
},
"data": [
{
"name": "FAIRsharing",
"type": "bar",
"x": [
"Life Science",
"Biomedical Science,Life Science",
"Genomics,Life Science",
"Biodiversity,Life Science",
"Biomedical Science",
"Earth Science,Environmental Science",
"Data Management",
"Life Science,Proteomics",
"Genomics",
"Comparative Genomics,Life Science",
"Earth Science",
"Life Science,Metabolomics",
"Biology",
"Epidemiology,Life Science,Virology",
"Biomedical Science,Preclinical Studies",
"Life Science,Ontology and Terminology",
"Engineering Science,Humanities and Social Sciences,Natural Science",
"Life Science,Phylogenetics",
"Knowledge and Information Systems,Software Engineering",
"Atmospheric Science,Earth Science,Oceanography",
"Anatomy,Life Science",
"Clinical Studies,Critical Care Medicine,Health Science,Infectious Disease Medicine,Medical Virology,Medicine",
"Glycomics,Life Science",
"Functional Genomics,Life Science",
"Biology,Life Science",
"Structural Biology",
"Atmospheric Science,Earth Science",
"Bioinformatics",
"Earth Science,Meteorology",
"Genetics,Life Science",
"Astrophysics and Astronomy",
"Bioinformatics,Biology",
"Comparative Genomics,Genomics,Life Science",
"Biomedical Science,Immunogenetics,Immunology",
"Earth Science,Environmental Science,Oceanography",
"Biochemistry,Life Science",
"Life Science,Neurobiology",
"Earth Science,Geology,Geophysics",
"Oceanography",
"Environmental Science",
"Biomedical Science,Life Science,Neurobiology",
"Biomedical Science,Genetics,Life Science",
"Comparative Genomics,Genomics",
"Life Science,Transcriptomics",
"Genetics,Genomics,Life Science",
"Developmental Biology,Life Science",
"Genetics",
"Computational Biology,Life Science",
"Atmospheric Science,Earth Science,Environmental Science,Geology",
"Biomedical Science,Genomics,Life Science",
"Epigenetics,Epigenomics",
"Atmospheric Science,Earth Science,Meteorology",
"Epigenetics,Life Science",
"Functional Genomics,Genomics,Life Science",
"Biomedical Science,Drug Development,Drug Discovery,Epidemiology,Virology",
"Biomedical Science,Health Science",
"Transcriptomics",
"Earth Science,Geophysics",
"Earth Science,Environmental Science,Geology",
"Agriculture,Genomics,Life Science,Plant Breeding",
"Environmental Science,Oceanography",
"Earth Science,Geology",
"Environmental Science,Marine Biology",
"Data Submission, Annotation and Curation,Life Science",
"Proteomics",
"Life Science,Systems Biology",
"Atmospheric Science,Remote Sensing",
"Computer Science",
"Earth Science,Geology,Hydrogeology,Mineralogy",
"Earth Science,Geology,Geophysics,Geotechnics",
"Earth Science,Geography,Remote Sensing",
"Earth Science,Geography,Geology,Oceanography",
"Earth Science,Geodesy,Geophysics",
"Bioinformatics,Computational Neuroscience,Neuroscience",
"Bioinformatics,Data Management,Data Submission, Annotation and Curation,Functional Genomics,Genomics,Metagenomics,Transcriptomics",
"Computational Biology,Systems Biology",
"Atmospheric Science,Earth Science,Environmental Science",
"Astrophysics and Astronomy,Earth Science,Geophysics",
"Biomedical Science,Glycomics",
"Bioinformatics,Structural Biology",
"Earth Science,Environmental Science,Geophysics",
"Biology,Genomics,Life Science",
"Earth Science,Oceanography,Water Research",
"Earth Science,Oceanography",
"Biomedical Science,Epidemiology,Virology",
"Atmospheric Science,Meteorology,Oceanography,Remote Sensing",
"Data Mining,Life Science",
"Biomedical Science,Health Science,Life Science",
"Atmospheric Science,Environmental Science",
"Epidemiology,Virology",
"Biomedical Science,Data Submission, Annotation and Curation,Epidemiology,Life Science,Virology",
"Biochemistry,Enzymology",
"Data Visualization,Life Science",
"Critical Care Medicine,Gastroenterology,Health Science,Infectious Disease Medicine,Medical Virology",
"Biomedical Science,Genomics",
"Functional Genomics",
"Biomedical Science,Genetics",
"Biomedical Science,Genetics,Genomics",
"Biomedical Science,Clinical Studies,Epidemiology,Virology",
"Biodiversity,Botany,Ontology and Terminology",
"Biomedical Science,Clinical Studies,Epidemiology,Preclinical Studies,Virology",
"Biomedical Science,Genetics,Preclinical Studies",
"Data Management,Engineering Science,Humanities and Social Sciences,Natural Science",
"Chemistry",
"Bioinformatics,Life Science",
"Genomics,Life Science,Transcriptomics",
"Biomedical Science,Pharmacology",
"Comparative Genomics",
"Immunogenetics,Immunology",
"Immunology,Life Science",
"Chemistry,Materials Science",
"Clinical Studies,Medicine",
"Life Science,Metabolomics,Systems Biology",
"Botany,Genomics,Life Science",
"Life Science,Molecular biology",
"Biomedical Science,Life Science,Proteomics",
"Agriculture,Life Science",
"Clinical Studies,Epidemiology,Preclinical Studies,Virology",
"Agriculture,Genetics,Genomics,Life Science",
"Botany",
"Life Science,Phylogeny",
"Life Science,Statistics",
"Life Science,Preclinical Studies",
"Hydrology,Meteorology",
"Chemistry,Natural Science,Physics",
"Biomedical Science,Health Science,Preclinical Studies",
"Systems Biology",
"Biomedical Science,Human Genetics,Life Science",
"Comparative Genomics,Population Genetics",
"Social Science",
"Chemistry,Computational Chemistry,Drug Discovery,Life Science,Medicinal Chemistry",
"Demographics,Population Genetics",
"Developmental Biology",
"Clinical Chemistry,Metabolomics,Metagenomics,Systems Biology",
"Developmental Biology,Life Science,Proteomics",
"Chemistry,Earth Science,Mineralogy,Physics",
"Developmental Biology,Life Science,Transcriptomics",
"Demographics,Epidemiology,Social Science,Virology",
"Digital Image Processing,Earth Science,Geology,Geophysics,Oceanography",
"Earth Science,Environmental Science,Geography,Oceanography",
"Drug Development,Drug Discovery,Drug Repositioning,Life Science",
"Drug Development,Epidemiology,Life Science,Virology",
"Demographics,Geography",
"Earth Science,Environmental Science,Geography,Oceanography,Water Management",
"Demographics,Economics,Humanities and Social Sciences,Public Health,Social Psychology,Social and Behavioural Science",
"Demographics,Economics,Geography,Humanities and Social Sciences",
"Classical Archaeology,Earth Science,Economics,Humanities,Life Science,Social Science,Social and Behavioural Science",
"Demographics,Economic and Social History,Economics,Social Science",
"Database Management",
"Clinical Studies,Clinical Veterinary Medicine,Life Science,Personalized Medicine,Pharmacogenomics,Pharmacology,Preclinical Studies",
"Clinical Studies,Critical Care Medicine,Health Science,Infectious Disease Medicine,Medical Virology,Medicine,Oncology",
"Data Visualization,Life Science,Proteomics",
"Data Visualization,Life Science,Ontology and Terminology",
"Data Visualization,Life Science,Metabolomics,Proteomics,Systems Biology,Transcriptomics",
"Data Visualization,Life Science,Metabolomics",
"Earth Science,Environmental Science,Geology,Oceanography",
"Classical Archaeology,History,Humanities,Natural Science,Prehistory",
"Chemistry,Earth Science",
"Chemistry,Environmental Science",
"Classical Archaeology,Earth Science",
"Chemistry,Environmental Science,Toxicology",
"Earth Science,Engineering Science,Mineralogy",
"Earth Science,Economics,Meteorology",
"Chemistry,Genomics,Metabolomics,Proteomics",
"Earth Science,Ecology,Geography,Life Science,Natural History,Natural Science,Paleontology",
"Earth Science,Ecology,Environmental Science,Geoinformatics,Hydrology,Oceanography",
"Chemistry,Glycomics,Life Science,Organic Chemistry",
"Chemistry,Earth Science,Mineralogy",
"Chemistry,Earth Science,Environmental Science,Geochemistry,Natural Science",
"Chemistry,Health Science",
"Earth Science,Environmental Science,Fisheries Science,Hydrology,Water Management",
"Chemistry,Inorganic Molecular Chemistry",
"Earth Science,Environmental Science,Freshwater Science,Geology,Oceanography,Water Research",
"Chemistry,Inorganic Molecular Chemistry,Organic Chemistry",
"Earth Science,Ecology,Environmental Science,Freshwater Science,Hydrology",
"Chemistry,Life Science",
"Earth Science,Ecology,Environmental Science,Freshwater Science",
"Chemistry,Life Science,Physics",
"Earth Science,Environmental Science,Geodesy,Geology,Geophysics,Hydrology",
"Chemistry,Nanotechnology,Physics",
"Clinical Studies,Critical Care Medicine,Health Science,Infectious Disease Medicine,Medical Virology,Medicine,Respiratory Medicine",
"Earth Science,Ecology,Environmental Science,Forest Management,Hydrology,Natural Science,Soil Science",
"Earth Science,Ecology,Environmental Science",
"Earth Science,Ecology,Energy Engineering",
"Chemistry,Ontology and Terminology",
"Earth Science,Environmental Science,Geography,Geology,Oceanography",
"Civil Engineering,Construction Engineering,Materials Science,Transportation Planning,Urban Planning",
"Drug Discovery,Life Science",
"Chemistry,Earth Science,Engineering Science,Environmental Science,Health Science,Life Science,Social Science",
"Data Visualization,Epigenetics,Oncology",
"Clinical Studies,Data Integration,Genomics,Oncology",
"Data Visualization",
"Community Care,Health Science,Primary Health Care,Public Health",
"Comparative Genomics,Epigenomics,Functional Genomics,Genomics,Life Science,Ontology and Terminology,Phylogenomics,Plant Genetics,Structural Genomics",
"Earth Science,Environmental Science,Geophysics,Meteorology,Oceanography",
"Comparative Genomics,Developmental Biology,Life Science",
"Computer Science,Informatics,Knowledge and Information Systems",
"Comparative Genomics,Data Integration,Molecular Infection Biology,Phylogenomics",
"Computer Science,Software Engineering",
"Computer Science,Software Engineering,Statistics",
"Data Submission, Annotation and Curation,Omics",
"Criminal Law,Criminology,Demographics,Social and Behavioural Science",
"Criminology,Humanities,Jurisprudence,Political Science,Social Science,Social and Behavioural Science",
"Communication Science,Evolutionary Biology,Functional Genomics,Genomics,Life Science,Phylogenetics",
"Critical Care Medicine,Health Science,Hematology,Infectious Disease Medicine,Medical Virology",
"Cultural Studies,Culture,Education Science,Engineering Science,History,Humanities and Social Sciences,Natural Science",
"Communication Science,Education Science,Media Studies,Political Science,Psychology,Social Psychology,Social Science,Social and Behavioural Science",
"Comparative Genomics,Functional Genomics,Genomics,Phylogenetics,Proteomics",
"Comparative Genomics,Functional Genomics,Genomics,Population Dynamics,Population Genetics",
"Comparative Genomics,Genetics,Genomics",
"Comparative Genomics,Genomics,Infectious Disease Medicine",
"Computer Science,Data Management",
"Comparative Genomics,Genomics,Metagenomics",
"Comparative Genomics,Genomics,Microbial Ecology,Microbial Genetics,Phenomics,Taxonomy",
"Computational Neuroscience,Neuroscience,Systemic Neuroscience,Systems Biology",
"Computational Neuroscience,Neuroscience",
"Comparative Genomics,Genomics,Population Genetics",
"Comparative Genomics,Immunology,Life Science,Microbiology,Proteomics,Transcriptomics",
"Computational Biology,Mathematics,Statistics,Systems Biology",
"Computational Biology,Life Science,Neurobiology",
"Comparative Genomics,Phylogenomics,Phylogeny",
"Computational Biology,Genetics,Life Science,Virology",
"Computational Biology,Ecology,Genetics,Life Science",
"Computational Biology,Genetics,Genomics,Life Science,Proteomics",
"Culture,Data Visualization,History,Humanities,Natural Science",
"Cognitive Neuroscience,Developmental Neurobiology,Pediatrics",
"Data Governance",
"Data Management,Earth Science,Environmental Science,Humanities and Social Sciences,Life Science",
"Data Submission, Annotation and Curation,Metabolomics,Structural Biology",
"Data Submission, Annotation and Curation,Life Science,Transcriptomics",
"Clinical Studies,Critical Care Medicine,Health Science,Infectious Disease Medicine,Medical Virology,Medicine,Rheumatology",
"Data Submission, Annotation and Curation,Life Science,Metabolomics",
"Computational Biology,Genetics,Life Science",
"Clinical Studies,Dermatology,Health Science,Infectious Disease Medicine,Medical Virology,Medicine",
"Data Submission, Annotation and Curation,Functional Genomics,Proteomics,Structural Biology,Systems Biology",
"Clinical Studies,Epidemiology,Health Science,Public Health",
"Data Submission, Annotation and Curation,Education Science,Health Science,Humanities and Social Sciences,Social Science,Social and Behavioural Science",
"Data Submission, Annotation and Curation",
"Data Management,Humanities and Social Sciences",
"Data Management,Environmental Science,Oceanography",
"Clinical Studies,Epidemiology,Virology",
"Data Management,Earth Science,Environmental Science,Marine Biology,Oceanography,Ontology and Terminology",
"Data Management,Data Visualization",
"Data Governance,Data Submission, Annotation and Curation",
"Data Management,Data Submission, Annotation and Curation,Demographics,Population Dynamics,Social Science",
"Clinical Studies,Genomics,Human Genetics,Life Science,Medicine,Pharmacy,Proteomics,Public Health,Reproductive Health",
"Data Management,Data Submission, Annotation and Curation",
"Data Management,Data Quality,Data Submission, Annotation and Curation",
"Clinical Studies,Health Science,Infectious Disease Medicine,Medical Virology",
"Clinical Studies,Health Science,Life Science,Medicine",
"Data Integration,Genomics,Life Science,Microbiology",
"Data Integration,Genomics,Life Science,Metabolomics,Proteomics,Transcriptomics",
"Data Integration,Data Management,Database Management,Knowledge and Information Systems",
"Data Integration,Data Management,Data Submission, Annotation and Curation,Life Science",
"Clinical Studies,Health Science,Medical Informatics",
"Data Integration,Data Management,Data Quality,Data Visualization,Life Science,Microbiology,Virology",
"Clinical Studies,Virology",
"Data Governance,Data Submission, Annotation and Curation,Humanities and Social Sciences",
"Computer Science,Education Science,Research on Teaching, Learning and Training",
"Acoustics,Biodiversity,Earth Science,Oceanography,Remote Sensing,Transportation Planning,Water Management",
"Earth Science,Environmental Science,Hydrogeology",
"Genomics,Systems Biology",
"Geochemistry,Geology",
"Geochemistry,Microbial Ecology,Mineralogy,Thermodynamics",
"Geochemistry,Oceanography",
"Geodesy,Geology,Oceanography",
"Geography,Hydrogeology,Transportation Planning",
"Geology,Hydrogeology,Life Science,Oceanography",
"Geology,Mineralogy,Paleontology,Soil Science",
"Geology,Oceanography",
"Geriatric Medicine,Life Science",
"Glycomics,Life Science,Proteomics",
"Glycomics,Structural Biology",
"Health Science,Human Biology,Life Science",
"Health Science,Human Biology,Life Science,Oncology,Pathology",
"Health Science,Social Policy",
"Hydrology,Limnology",
"Hydrology,Marine Biology,Oceanography",
"Hydrology,Social and Behavioural Science",
"Immunogenetics",
"Immunology,Life Science,Pharmacology",
"Genomics,Virology",
"Genomics,Structural Biology",
"Informatics",
"Genomics,Population Genetics",
"Genetics,Genomics",
"Genetics,Genomics,Life Science,Systems Biology",
"Genetics,Genomics,Life Science,Virology",
"Genetics,Human Genetics",
"Genetics,Immunogenetics,Immunology",
"Genetics,Immunogenetics,Immunology,Life Science",
"Genetics,Life Science,Phylogenomics",
"Genetics,Life Science,Population Dynamics,Population Genetics",
"Genetics,Life Science,Transcriptomics",
"Genetics,Pathology,Physiology",
"Genetics,Preclinical Studies,Translational Medicine",
"Genetics,Proteomics",
"Genomics,Life Science,Phenomics",
"Genomics,Life Science,Proteomics,Transcriptomics",
"Genomics,Life Science,Systems Biology",
"Genomics,Marine Biology,Metagenomics",
"Genomics,Metabolomics,Metagenomics,Phylogenetics",
"Genomics,Microbiology,Virology",
"Genomics,Phenomics,Proteomics",
"Immunology,Molecular biology",
"Informatics,Knowledge and Information Systems,Life Science,Ontology and Terminology",
"Functional Genomics,Phenomics",
"Materials Science,Natural Science",
"Materials Science,Physics",
"Medical Informatics",
"Metagenomics,Microbial Ecology,Virology",
"Molecular biology,Proteomics",
"Nanotechnology,Organic Chemistry",
"Neurology,Neurophysiology,Neuroscience",
"Neurophysiology,Neuroscience",
"Neuroscience,Phenomics",
"Omics,Transcriptomics",
"Oncology",
"Oncology,Proteogenomics,Proteomics",
"Ontology and Terminology",
"Phylogenetics,Phylogenomics",
"Phylogenetics,Phylogenomics,Phylogeny,Proteogenomics,Proteomics",
"Population Genetics",
"Preclinical Studies",
"Primary Health Care,Public Health",
"Proteomics,Transcriptomics",
"Public Health",
"Materials Science,Natural Science,Physics",
"Materials Science,Nanotechnology",
"Knowledge and Information Systems,Ontology and Terminology",
"Materials Informatics,Materials Science,Physics",
"Life Science,Metabolomics,Proteomics",
"Life Science,Microbiology",
"Life Science,Microbiology,Molecular Infection Biology",
"Life Science,Microbiology,Molecular Microbiology,Virology",
"Life Science,Neurophysiology",
"Life Science,Neurophysiology,Statistics,Synthetic Biology",
"Life Science,Oceanography",
"Life Science,Oncology",
"Life Science,Phylogenetics,Phylogenomics",
"Life Science,Phylogenetics,Phylogeny",
"Life Science,Phylogenomics",
"Life Science,Population Dynamics,Transcriptomics",
"Life Science,Proteomics,Transcriptomics",
"Life Science,Structural Biology",
"Life Science,Systems Biology,Virology",
"Life Science,Thermodynamics",
"Life Science,Translational Medicine",
"Marine Biology",
"Marine Biology,Oceanography,Ontology and Terminology",
"Functional Genomics,Transcriptomics",
"Functional Genomics,Life Science,Transcriptomics",
"Earth Science,Environmental Science,Hydrology",
"Earth Science,Knowledge and Information Systems,Ontology and Terminology",
"Earth Science,Meteorology,Oceanography",
"Earth Science,Meteorology,Remote Sensing",
"Earth Science,Social Science,Urban Planning",
"Earth Science,Soil Science",
"Ecology,Ecosystem Science,Environmental Science",
"Ecology,Ecosystem Science,Life Science",
"Ecology,Environmental Science,Paleontology",
"Economic Policy,Economics,Empirical Social Research,Humanities and Social Sciences,Political Science,Social Science,Social and Behavioural Science",
"Economic and Social History,Epidemiology,Health Science,Humanities and Social Sciences,Virology",
"Economic and Social History,Epidemiology,Humanities and Social Sciences,Virology",
"Economics,Ecosystem Science,Environmental Science,Freshwater Science,Global Health,Health Science,Human Geography,Physical Geography",
"Economics,Engineering Science,Life Science,Natural Science,Social Science,Social and Behavioural Science",
"Economics,Geography,Humanities and Social Sciences,Social and Behavioural Science",
"Economics,Humanities,Political Science,Social Science",
"Economics,Humanities,Social Science",
"Economics,Social Science",
"Economics,Social Science,Statistics",
"Ecosystem Science,Forest Management,Plant Ecology",
"Ecosystem Science,Freshwater Science,Hydrology",
"Cheminformatics,Life Science,Pharmacology",
"Earth Science,Hydrogeology,Meteorology,Oceanography",
"Embryology,Life Science",
"Earth Science,Humanities and Social Sciences",
"Earth Science,Environmental Science,Hydrology,Oceanography",
"Earth Science,Environmental Science,Marine Biology",
"Earth Science,Environmental Science,Marine Biology,Oceanography",
"Earth Science,Environmental Science,Meteorology,Oceanography",
"Earth Science,Environmental Science,Natural Science,Oceanography",
"Earth Science,Environmental Science,Social Science",
"Earth Science,Environmental Science,Soil Science",
"Earth Science,Epidemiology,Humanities and Social Sciences,Virology",
"Earth Science,Freshwater Science,Water Management,Water Research",
"Earth Science,Geochemistry,Geography,Geology,Mineralogy,Paleontology",
"Earth Science,Geography,Geology",
"Earth Science,Geography,Geology,Oceanography,Physical Geography",
"Earth Science,Geography,Geology,Physical Geography",
"Earth Science,Geoinformatics",
"Earth Science,Geoinformatics,Geology",
"Earth Science,Geology,Hydrology",
"Earth Science,Geology,Oceanography,Paleontology",
"Earth Science,Geophysics,Hydrogeology,Water Research",
"Earth Science,Health Science,Humanities,Life Science,Medicine,Natural Science,Social Science,Social and Behavioural Science",
"Electrophysiology",
"Endocrinology,Life Science,Systems Biology",
"Functional Genomics,Genomics,Parasitology",
"Epidemiology,Life Science,Proteomics,Virology",
"Epidemiology,Medicine",
"Epidemiology,Meteorology,Statistics",
"Epidemiology,Public Health",
"Epidemiology,Social Science",
"Epigenetics",
"Epigenetics,Epigenomics,Life Science,Toxicology",
"Epigenetics,Functional Genomics,Life Science",
"Epigenetics,Genomics,Life Science,Metabolomics,Metagenomics,Proteomics,Systems Biology,Transcriptomics",
"Epigenetics,Life Science,Proteomics,Transcriptomics",
"Evolutionary Biology,Functional Genomics,Genomics,Life Science",
"Evolutionary Biology,Genomics,Life Science,Transcriptomics",
"Evolutionary Biology,Life Science",
"Fisheries Science,Life Science",
"Freshwater Science,Hydrogeology,Hydrology,Water Management,Water Research",
"Freshwater Science,Marine Biology",
"Functional Genomics,Genetics,Molecular Genetics,Systems Biology",
"Functional Genomics,Genetics,Transcriptomics",
"Functional Genomics,Genomics",
"Functional Genomics,Genomics,Life Science,Transcriptomics",
"Epidemiology,Life Science,Statistics",
"Epidemiology,Life Science,Phylogenetics,Virology",
"Energy Engineering,Geochemistry,Geology",
"Epidemiology,Life Science,Molecular biology,Virology",
"Engineering Science,Humanities and Social Sciences,Informatics,Knowledge and Information Systems,Natural Science,Ontology and Terminology",
"Engineering Science,Humanities,Natural Science,Social Science",
"Engineering Science,Materials Science",
"Environmental Science,Geochemistry,Geophysics,Oceanography",
"Environmental Science,Geology,Geophysics,Hydrogeology,Meteorology,Oceanography",
"Environmental Science,Geophysics,Meteorology,Oceanography",
"Environmental Science,Geophysics,Oceanography,Physical Geography",
"Environmental Science,Maritime Engineering,Meteorology,Oceanography,Transportation Planning",
"Environmental Science,Meteorology,Oceanography,Remote Sensing",
"Enzymology",
"Epidemiology,Genomics,Life Science,Taxonomy,Virology",
"Epidemiology,Genomics,Life Science,Virology",
"Epidemiology,Global Health,Health Science,Health Services Research,Medical Informatics,Primary Health Care,Public Health,Virology",
"Epidemiology,Health Science,Humanities and Social Sciences,Microbiology,Tropical Medicine",
"Epidemiology,Health Science,Humanities and Social Sciences,Virology",
"Epidemiology,Human Genetics,Quantitative Genetics",
"Epidemiology,Immunogenetics,Immunology,Life Science,Virology",
"Epidemiology,Life Science,Microbiology",
"Epidemiology,Life Science,Molecular biology,Systems Biology,Virology",
"Earth Science,Marine Biology,Meteorology,Oceanography",
"Botany,Functional Genomics,Genomics,Life Science,Plant Genetics",
"Cheminformatics,Life Science,Pharmacogenomics,Pharmacology",
"Atmospheric Science,Ecosystem Science,Environmental Science",
"Atmospheric Science,Earth Science,Environmental Science,Remote Sensing",
"Atmospheric Science,Earth Science,Environmental Science,Water Research",
"Atmospheric Science,Earth Science,Geochemistry",
"Atmospheric Science,Earth Science,Geochemistry,Geophysics",
"Atmospheric Science,Earth Science,Geodesy,Geography,Hydrogeology,Meteorology",
"Atmospheric Science,Earth Science,Geodesy,Geophysics",
"Atmospheric Science,Earth Science,Geodesy,Geophysics,Meteorology",
"Atmospheric Science,Earth Science,Geodesy,Marine Biology,Oceanography",
"Atmospheric Science,Earth Science,Geography,Hydrogeology,Hydrology,Meteorology,Water Management",
"Atmospheric Science,Earth Science,Geography,Meteorology,Oceanography",
"Atmospheric Science,Earth Science,Geology,Geophysics,Hydrology,Oceanography",
"Atmospheric Science,Earth Science,Geology,Natural Science,Oceanography",
"Atmospheric Science,Earth Science,Geology,Oceanography,Paleontology",
"Atmospheric Science,Earth Science,Geology,Oceanography,Physical Geography",
"Atmospheric Science,Earth Science,Geophysics",
"Atmospheric Science,Earth Science,Geophysics,Hydrology,Meteorology,Oceanography,Water Research",
"Atmospheric Science,Earth Science,Health Science",
"Atmospheric Science,Earth Science,Hydrogeology,Oceanography",
"Atmospheric Science,Earth Science,Meteorology,Oceanography",
"Atmospheric Science,Earth Science,Meteorology,Oceanography,Remote Sensing,Social Science",
"Atmospheric Science,Earth Science,Meteorology,Soil Science",
"Atmospheric Science,Earth Science,Environmental Science,Meteorology,Oceanography",
"Atmospheric Science,Earth Science,Environmental Science,Hydrology,Oceanography",
"Atmospheric Science,Earth Science,Environmental Science,Hydrology",
"Astrophysics and Astronomy,Geochemistry",
"Astrophysics and Astronomy,Biology,Demographics,Ecosystem Science,Humanities and Social Sciences,Marine Biology,Materials Science,Tropical Medicine,Urban Planning",
"Astrophysics and Astronomy,Biomedical Science,Chemistry,Humanities,Life Science,Medicine,Natural Science,Physics,Social Science,Social and Behavioural Science",
"Astrophysics and Astronomy,Cartography,Earth Science,Geodesy",
"Astrophysics and Astronomy,Chemistry,Nanotechnology,Pharmacology",
"Astrophysics and Astronomy,Computer Science,Culture,Data Submission, Annotation and Curation,Earth Science,Engineering Science,Environmental Science,Health Science,Life Science,Physics,Social Science",
"Astrophysics and Astronomy,Data Management,Earth Science,Humanities and Social Sciences,Life Science",
"Astrophysics and Astronomy,Earth Science",
"Astrophysics and Astronomy,Earth Science,Geodesy",
"Astrophysics and Astronomy,Earth Science,Natural Science,Physics",
"Astrophysics and Astronomy,Natural Science,Physics",
"Atmospheric Science,Earth Science,Environmental Science,Hydrogeology,Oceanography",
"Atmospheric Science,Biochemistry,Biodiversity,Biology,Ecology,Genomics,Geography,Life Science,Limnology,Microbiology,Oceanography,Proteomics",
"Atmospheric Science,Biodiversity,Earth Science,Environmental Science,Geology,Geophysics,Oceanography,Remote Sensing",
"Atmospheric Science,Biology,Earth Science,Environmental Science,Geology,Geophysics,Life Science,Natural Science,Oceanography",
"Atmospheric Science,Biology,Earth Science,Geophysics,Oceanography,Physics",
"Atmospheric Science,Chemistry,Earth Science",
"Atmospheric Science,Data Management,Engineering Science,Humanities and Social Sciences,Natural Science",
"Atmospheric Science,Earth Science,Ecology,Geography,Geology,Geophysics,Hydrology,Water Research",
"Atmospheric Science,Earth Science,Environmental Science,Geology,Oceanography",
"Atmospheric Science,Earth Science,Environmental Science,Health Science,Meteorology",
"Atmospheric Science,Earth Science,Remote Sensing",
"Atmospheric Science,Ecosystem Science,Environmental Science,Forest Management",
"Astrophysics and Astronomy,Atmospheric Science,Earth Science,Environmental Science,Geology",
"Atmospheric Science,Energy Engineering",
"Biodiversity,Bioinformatics,Life Science",
"Biodiversity,Biology,Earth Science,Environmental Science,Forest Management,Landscape Planning,Plant Genetics,Population Dynamics",
"Biodiversity,Biology,Ecology,Taxonomy",
"Biodiversity,Biomedical Science,Data Submission, Annotation and Curation,Environmental Science,Life Science,Phylogenomics,Phylogeny,Taxonomy",
"Biodiversity,Botany,Cartography,Earth Science,Ecology,Environmental Science,Geoinformatics,Life Science,Zoology",
"Biodiversity,Botany,Earth Science,Ecology,Forest Management,Life Science,Meteorology,Plant Ecology,Soil Science,Water Management",
"Biodiversity,Botany,Ecology,Ecosystem Science,Forest Management,Plant Breeding",
"Biodiversity,Botany,Ecology,Soil Science,Zoology",
"Biodiversity,Botany,Life Science,Natural History,Paleontology",
"Biodiversity,Botany,Natural History,Paleontology,Zoology",
"Biodiversity,Chemistry,Earth Science,Environmental Science,Geography,Geophysics,Marine Biology,Oceanography,Taxonomy",
"Biodiversity,Earth Science,Ecology,Economics,Ecosystem Science,Environmental Science,Marine Biology,Oceanography,Zoology",
"Biodiversity,Earth Science,Economics,Meteorology,Water Management",
"Biodiversity,Earth Science,Ecosystem Science,Life Science,Marine Biology,Oceanography",
"Biodiversity,Earth Science,Environmental Science,Geography,Geophysics,Marine Biology,Oceanography,Physical Geography",
"Biodiversity,Earth Science,Environmental Science,Geography,Marine Biology,Oceanography",
"Biodiversity,Earth Science,Environmental Science,Geography,Marine Biology,Oceanography,Taxonomy",
"Biodiversity,Earth Science,Environmental Science,Marine Biology,Oceanography",
"Biodiversity,Earth Science,Environmental Science,Marine Biology,Oceanography,Taxonomy",
"Biodiversity,Ecology",
"Biodiversity,Ecology,Ecosystem Science,Environmental Science",
"Biodiversity",
"Biochemistry,Life Science,Proteomics",
"Biochemistry,Life Science,Metabolomics,Molecular biology",
"Biochemistry,Bioinformatics,Cheminformatics,Computational Biology,Life Science",
"Atmospheric Science,Environmental Science,Geology,Marine Biology,Oceanography",
"Atmospheric Science,Geology,Marine Biology,Meteorology,Remote Sensing",
"Atmospheric Science,Geophysics,Hydrology,Meteorology,Soil Science",
"Atmospheric Science,Meteorology",
"Atomic, Molecular, Optical and Plasma Physics,Materials Science,Medical Physics,Physical Chemistry",
"Biochemistry",
"Biochemistry,Biodiversity,Bioinformatics,Biology,Earth Science,Ecology,Environmental Science,Evolutionary Biology,Geochemistry,Geography,Geology,Geophysics,Life Science,Marine Biology,Microbial Ecology,Oceanography,Population Dynamics,Population Genetics",
"Biochemistry,Bioinformatics,Biology,Biomaterials,Biophysics,Computational Biology,Structural Biology",
"Biochemistry,Bioinformatics,Chemical Biology,Cheminformatics,Life Science,Proteomics,Systems Biology",
"Biochemistry,Biology,Enzymology",
"Biochemistry,Genetics,Life Science",
"Biochemistry,Biomedical Science,Life Science",
"Biochemistry,Biomedical Science,Life Science,Preclinical Studies,Systems Biology",
"Biochemistry,Cheminformatics,Chemistry,Computational Chemistry,Molecular Chemistry,Molecular Dynamics,Molecular Physical Chemistry,Molecular biology",
"Biochemistry,Cheminformatics,Systems Biology",
"Biochemistry,Chemistry,Organic Chemistry,Organic Molecular Chemistry",
"Biochemistry,Data Integration,Genomics,Metabolomics,Molecular biology,Omics,Systems Biology",
"Biochemistry,Data Integration,Life Science",
"Biochemistry,Data Submission, Annotation and Curation,Life Science",
"Biochemistry,Drug Discovery,Genomics,Medicinal Chemistry",
"Astrophysics and Astronomy,Atmospheric Science,Earth Science,Geophysics",
"Astrophysics and Astronomy,Atmospheric Science,Earth Science,Energy Engineering,Geodesy,Geophysics,Oceanography,Remote Sensing,Water Research",
"Cheminformatics,Life Science",
"Agriculture,Genomics,Life Science",
"Agriculture,Botany,Forest Management",
"Agriculture,Botany,Genomics,Life Science,Plant Breeding",
"Agriculture,Botany,Genomics,Life Science,Plant Breeding,Plant Genetics",
"Agriculture,Botany,Genomics,Plant Genetics",
"Agriculture,Botany,Life Science",
"Agriculture,Botany,Life Science,Plant Genetics",
"Agriculture,Comparative Genomics,Genomics",
"Agriculture,Comparative Genomics,Life Science,Plant Breeding",
"Agriculture,Computer Science,Earth Science,Engineering Science,Humanities,Humanities and Social Sciences,Life Science,Medicine,Natural Science,Social Science",
"Agriculture,Criminology,Demographics,Developmental Biology,Energy Engineering,Environmental Science,Global Health,Health Science,Public Finance",
"Agriculture,Demographics,Earth Science,Ecology,Energy Engineering,Environmental Science,Global Health,Public Health,Public Law,Water Management",
"Agriculture,Demographics,Earth Science,Economics,Energy Engineering,Global Health,Public Health,Social Science",
"Agriculture,Earth Science,Ecology,Environmental Science,Hydrology",
"Agriculture,Earth Science,Energy Engineering,Geriatric Medicine,Health Science,Maritime Engineering,Oceanography",
"Agriculture,Earth Science,Engineering Science,Environmental Science,Health Science,Humanities and Social Sciences,Natural Science",
"Agriculture,Earth Science,Food Security,Forest Management,Soil Science",
"Agriculture,Ecology,Population Dynamics,Remote Sensing",
"Agriculture,Environmental Science,Social Science",
"Agriculture,Food Security,Nutritional Science",
"Agriculture,Forest Management,Health Science,Health Services Research,Meteorology",
"Agriculture,Genetics,Genomics,Life Science,Plant Breeding,Plant Genetics",
"Agriculture,Botany,Comparative Genomics,Genomics",
"Agriculture,Biotechnology,Life Science,Nutritional Science",
"Agriculture,Biomedical Science,Earth Science,Environmental Science,Humanities,Life Science,Natural Science",
"Agriculture,Animal Genetics,Animal Husbandry,Animal Physiology,Aquaculture,Biology,Biomedical Science,Botany,Economics,Food Security,Genomics,Horticulture,Life Science,Nutritional Science,Plant Genetics,Soil Science,Veterinary Medicine",
"Aerospace Engineering,Astrophysics and Astronomy",
"Aerospace Engineering,Biology,Chemical Engineering,Data Management,Earth Science,Life Science,Mechanics",
"Agricultural Economics,Agriculture,Business Administration,Earth Science",
"Agricultural Economics,Economic Theory,Economic and Social History,Social Policy",
"Agricultural Engineering,Agricultural Law,Agriculture,Animal Husbandry,Aquaculture,Biodiversity,Botany,Ecology,Entomology,Farming Systems Research,Fisheries Science,Food Security,Health Science,Nutritional Science,Pathology,Physics,Plant Anatomy,Plant Breeding,Plant Cell Biology,Rural and Agricultural Sociology",
"Agricultural Engineering,Agriculture,Agroecology,Agronomy,Animal Husbandry,Biology,Botany,Data Management,Data Visualization,Economics,Engineering Science,Entomology,Environmental Science,Farming Systems Research,Genomics,Health Science,Hydrology,Jurisprudence,Life Science,Nutritional Science,Pathology,Physics,Rural and Agricultural Sociology,Soil Science",
"Agriculture,Agroecology,Biodiversity,Biology,Botany,Ecosystem Science,Life Science,Taxonomy",
"Agriculture,Agronomy,Biotechnology",
"Agriculture,Animal Breeding,Animal Husbandry,Environmental Science,Food Security,Forest Management",
"Agriculture,Animal Husbandry,Biodiversity,Earth Science,Economics,Energy Engineering,Environmental Science,Forest Management,Health Science,Water Research",
"Agriculture,Biology,Life Science",
"Agriculture,Art,Biodiversity,Biology,Chemistry,Ecology,Engineering Science,Environmental Science,Humanities,Humanities and Social Sciences,Life Science,Physics,Social Science,Veterinary Medicine",
"Agriculture,Art,Biotechnology,Culture,Demographics,Economics,Energy Engineering,Forest Management,Global Health,Humanities and Social Sciences,Life Science,Telecommunication Engineering,Urban Planning,Water Management",
"Agriculture,Art,Communication Science,Culture,Economics,Education Science,Environmental Science,Forest Management,Health Science,Humanities and Social Sciences,Industrial Engineering,Public Finance,Water Management",
"Agriculture,Atmospheric Science,Biodiversity,Biology,Chemistry,Earth Science,Ecology,Environmental Science,Fisheries Science,Freshwater Science,Geophysics,Life Science,Oceanography,Paleontology",
"Agriculture,Atmospheric Science,Biology,Botany,Chemistry,Earth Science,Environmental Science,Geochemistry,Geography,Humanities,Humanities and Social Sciences,Hydrogeology,Life Science,Mineralogy,Natural Science,Oceanography,Physics,Soil Science,Zoology",
"Agriculture,Atmospheric Science,Biology,Botany,Earth Science,Ecology,Ecosystem Science,Environmental Science,Geophysics,Life Science,Microbial Ecology,Microbiology,Natural Science,Oceanography,Plant Ecology,Zoology",
"Agriculture,Biodiversity,Biotechnology,Life Science,Nutritional Science,Phylogenetics",
"Agriculture,Biodiversity,Food Security",
"Agriculture,Biology,Genetics,Genomics,Life Science,Plant Genetics",
"Agriculture,Genetics,Genomics,Life Science,Transcriptomics",
"Agriculture,Genomics,Life Science,Plant Breeding,Plant Genetics",
"Astrophysics and Astronomy,Atmospheric Science,Earth Science",
"Agriculture,Knowledge and Information Systems,Life Science",
"Ancient Cultures,Cartography,Earth Science,Geoinformatics,Humanities",
"Animal Genetics",
"Animal Genetics,Bioinformatics,Biology,Cell Biology,Cheminformatics,Database Management,Drug Metabolism,Endocrinology,Genetics,Human Genetics,Medical Informatics,Metabolomics,Microbiology,Molecular Microbiology,Molecular biology,Plant Genetics,Proteomics,Systems Biology,Transcriptomics",
"Animal Genetics,Genetics,Genomics,Life Science",
"Animal Genetics,Genetics,Life Science",
"Animal Genetics,Genetics,Life Science,Systems Biology",
"Animal Genetics,Life Science",
"Animal Genetics,Pathology",
"Anthropology,Classical Archaeology,Data Integration,Data Management",
"Anthropology,Criminology,Data Governance,Data Management,Data Submission, Annotation and Curation,Demographics,Economics,Political Science,Psychology,Public Health,Social Science,Social and Behavioural Science",
"Anthropology,Cultural Studies,Culture,Historical Linguistics,Human Geography,Linguistics",
"Anthropology,Fine Arts,Geography,History,Humanities and Social Sciences,Life Science,Literary Studies,Political Science,Psychology,Social Science",
"Applied Linguistics,Classical Philology,Historical Linguistics,Linguistics",
"Applied Mathematics,Biology,Biotechnology,Communication Science,Computer Science,Data Management,Earth Science,Economics,Education Science,Environmental Science,Humanities and Social Sciences,Materials Science,Medicine,Physics,Psychology,Statistics,Surgery",
"Applied Microbiology,Data Integration,Data Management,Data Quality,Data Submission, Annotation and Curation,Microbial Ecology,Microbial Physiology,Proteomics,Transcriptomics",
"Aquaculture,Earth Science,Geography,Maritime Engineering",
"Architecture,Bioengineering,Civil Engineering,Computer Science,Earth Science,Economics,Environmental Science,Health Science,Humanities and Social Sciences,Life Science,Mathematics,Physics,Political Science",
"Architecture,Building Engineering Physics,Chemistry,Construction Engineering,Earth Science,Economics,Energy Engineering,Engineering Science,Environmental Science,Geography,Physics,Power Engineering",
"Art,Art History,Culture,Economics,Fine Arts,Humanities,Social Science",
"Artificial Intelligence,Biomedical Science,Digital Image Processing,Oncology,Radiology",
"Astrophysics and Astronomy,Atmospheric Science,Chemistry",
"Ancient Cultures,Architecture,Art History,Astrophysics and Astronomy,Chemistry,Classical Archaeology,Earth Science,History of Science,Humanities,Linguistics,Philosophy,Prehistory,Religious Studies",
"Anatomy,Endocrinology,Genetics,Life Science",
"Anatomy,Developmental Biology,Embryology,Life Science",
"Analytical Chemistry,Biology,Chemistry,Engineering Science,Life Science,Physics,Synthetic Chemistry",
"Agriculture,Life Science,Ontology and Terminology",
"Agriculture,Plant Breeding,Plant Cultivation",
"Agriculture,Soil Science",
"Agriculture,Soil Science,Urban Planning",
"Agroecology,Biodiversity,Ecology,Genomics,Metagenomics,Microbial Ecology,Phylogenomics",
"Agronomy,Bioinformatics,Botany,Genetics,Genomics,Life Science",
"Agronomy,Botany,Genetics,Life Science,Plant Genetics",
"Analytical Chemistry",
"Analytical Chemistry,Biology,Chemistry,Composite Materials,Materials Engineering,Materials Informatics,Nanotechnology,Occupational Medicine,Safety Science,Toxicogenomics,Toxicology",
"Analytical Chemistry,Biomimetic Chemistry,Chemistry,Inorganic Molecular Chemistry,Medicinal Chemistry,Molecular Chemistry,Organic Chemistry,Synthesis Chemistry,Synthetic Chemistry,Technical Chemistry",
"Anatomy,Comparative Genomics,Life Science",
"Analytical Chemistry,Drug Metabolism,Environmental Science,Metabolomics",
"Anatomy",
"Anatomy,Behavioural Biology,Biodiversity,Biology,Evolutionary Biology,Paleontology,Phylogenetics,Phylogeny",
"Anatomy,Bioinformatics,Comparative Genomics,Data Submission, Annotation and Curation,Functional Genomics,Genetics,Genomics,Life Science,Molecular Genetics,Molecular biology",
"Anatomy,Biomedical Science,Comparative Genomics,Environmental Science,Systems Biology,Toxicogenomics,Toxicology",
"Anatomy,Biomedical Science,Life Science",
"Anatomy,Cell Biology,Developmental Biology,Functional Genomics,Genetics,Genomics,Proteomics",
"Anatomy,Comparative Genomics,Developmental Biology,Embryology,Epigenomics,Functional Genomics,Genomics,Life Science,Ontology and Terminology,Phylogenomics,Transcriptomics",
"Anatomy,Comparative Genomics,Functional Genomics,Life Science",
"Biodiversity,Ecology,Evolutionary Biology,Genetics,Oceanography",
"Biodiversity,Environmental Science",
"Biodiversity,Environmental Science,Marine Biology",
"Biomedical Science,Life Science,Transcriptomics",
"Biomedical Science,Genomics,Life Science,Proteomics,Transcriptomics",
"Biomedical Science,Genomics,Medicine,Phenomics",
"Biomedical Science,Genomics,Preclinical Studies",
"Biomedical Science,Genomics,Preclinical Studies,Proteomics",
"Biomedical Science,Genomics,Structural Biology,Structural Genomics",
"Biomedical Science,Glycomics,Health Science",
"Biomedical Science,Glycomics,Life Science",
"Biomedical Science,Health Science,Humanities,Life Science,Social Science,Social and Behavioural Science",
"Biomedical Science,Health Science,Life Science,Medicine",
"Biomedical Science,Health Science,Medicine,Preclinical Studies",
"Biomedical Science,Health Science,Oncology",
"Biomedical Science,Human Genetics,Medicine,Ophthalmology,Preclinical Studies",
"Biomedical Science,Immunology",
"Biomedical Science,Immunology,Life Science",
"Biomedical Science,Immunology,Life Science,Preclinical Studies",
"Biomedical Science,Life Science,Mathematics,Physiology,Systems Biology",
"Biomedical Science,Life Science,Neurobiology,Neuroscience",
"Biomedical Science,Life Science,Oncology",
"Biomedical Science,Life Science,Population Genetics",
"Biomedical Science,Life Science,Preclinical Studies",
"Biomedical Science,Life Science,Preclinical Studies,Proteomics",
"Biomedical Science,Genomics,Life Science,Proteomics",
"Biomedical Science,Genomics,Geriatric Medicine",
"Biomedical Science,Genetics,Preclinical Studies,Proteomics",
"Biomedical Science,Epidemiology,Life Science,Molecular biology",
"Biomedical Science,Ecology,Epidemiology,Life Science,Preclinical Studies",
"Biomedical Science,Endocrinology,Life Science,Systems Biology",
"Biomedical Science,Epidemiology,Genomics",
"Biomedical Science,Epidemiology,Genomics,Life Science,Proteomics,Virology",
"Biomedical Science,Epidemiology,Genomics,Medicine,Preclinical Studies",
"Biomedical Science,Epidemiology,Genomics,Proteomics,Virology",
"Biomedical Science,Epidemiology,Global Health,Health Science,Medicine",
"Biomedical Science,Epidemiology,Health Science,Virology",
"Biomedical Science,Epidemiology,Life Science",
"Biomedical Science,Epidemiology,Life Science,Virology",
"Biomedical Science,Genetics,Life Science,Oncology,Preclinical Studies",
"Biomedical Science,Epidemiology,Preclinical Studies",
"Biomedical Science,Epidemiology,Translational Medicine,Virology",
"Biomedical Science,Epigenetics,Functional Genomics,Life Science",
"Biomedical Science,Epigenetics,Genetics",
"Biomedical Science,Epigenetics,Life Science",
"Biomedical Science,Epigenetics,Life Science,Population Genetics,Transcriptomics",
"Biomedical Science,Evolutionary Biology",
"Biomedical Science,Functional Genomics,Genomics,Life Science",
"Biomedical Science,Genetics,Life Science,Medicine",
"Biomedical Science,Life Science,Systems Biology",
"Biomedical Science,Medical Informatics,Medicine",
"Biodiversity,Environmental Science,Marine Biology,Oceanography",
"Biomedical Science,Medicine",
"Botany,Genetics,Life Science",
"Botany,Life Science,Ontology and Terminology,Plant Anatomy",
"Botany,Life Science,Plant Anatomy",
"Botany,Life Science,Plant Breeding,Population Genetics",
"Botany,Life Science,Plant Genetics",
"Botany,Paleontology,Plant Anatomy",
"Botany,Plant Genetics",
"Botany,Plant Genetics,Transcriptomics",
"Botany,Taxonomy",
"Business Administration,Chemistry,Clinical Psychology,Computer Science,Education Science,Engineering Science,Geography,History,Life Science,Medicine,Physics,Policy,Psychology,Research on Teaching, Learning and Training",
"Cardiology,Clinical Studies,Community Care,Epidemiology,Genomics,Global Health,Health Science,Health Services Research,Medical Virology,Occupational Medicine,Primary Health Care,Public Health,Reproductive Health,Respiratory Medicine,Virology",
"Cardiology,Clinical Studies,Critical Care Medicine,Health Science,Infectious Disease Medicine,Medical Virology,Medicine,Respiratory Medicine",
"Cardiology,Clinical Studies,Health Science,Infectious Disease Medicine,Medical Virology,Medicine",
"Cardiology,Genetics",
"Cartography,Earth Science,Environmental Science,Photogrammetry,Physical Geography,Remote Sensing",
"Cartography,Earth Science,Geography,Remote Sensing",
"Cell Biology,Developmental Biology,Molecular Dynamics",
"Cell Biology,Life Science",
"Cell Biology,Life Science,Transcriptomics",
"Cellular Neuroscience,Comparative Neurobiology,Molecular Neuroscience,Neurobiology,Neurophysiology",
"Chemical Engineering,Chemistry,Thermodynamics",
"Botany,Genetics,Genomics,Life Science,Plant Breeding,Plant Genetics",
"Aerospace Engineering,Agricultural Engineering,Agriculture,Architecture,Atmospheric Science,Bioengineering,Biological Process Engineering,Biology,Building Design,Building Engineering Physics,Business Administration,Chemical Engineering,Chemistry,Civil Engineering,Component Engineering,Computer Science,Construction Engineering,Earth Science,Electrical Engineering,Energy Engineering,Engineering Science,Environmental Science,Food Process Engineering,Geography,Health Science,Human-Machine Systems Engineering,Hydraulic Engineering,Hydrology,Industrial Engineering,Informatics,Life Science,Logistics Engineering,Maritime Engineering,Materials Engineering,Mathematics,Mechanical Engineering,Mechanical Process Engineering,Metal-Cutting Manufacturing Engineering,Nanotechnology,Physics,Plastics Engineering,Power Engineering,Process Engineering,Water Research",
"Botany,Entomology,Geochemistry,Life Science,Natural History,Paleontology,Zoology",
"Biomedical Science,Oncology",
"Biomedical Science,Medicine,Neurobiology,Translational Medicine",
"Biomedical Science,Medicine,Preclinical Studies",
"Biomedical Science,Medicine,Translational Medicine",
"Biomedical Science,Molecular biology",
"Biomedical Science,Nanotechnology",
"Biomedical Science,Neurobiology,Neurophysiology",
"Biomedical Science,Neurobiology,Neuroscience",
"Biomedical Science,Neurobiology,Preclinical Studies",
"Biomedical Science,Neuroscience",
"Biomedical Science,Pathology,Toxicogenomics",
"Botany,Data Visualization,Genomics,Life Science",
"Biomedical Science,Physiology",
"Biomedical Science,Physiology,Preclinical Studies",
"Biomedical Science,Preclinical Studies,Psychology,Social and Behavioural Science",
"Biomedical Science,Proteomics",
"Biomedical Science,Public Health,Social Science,Social and Behavioural Science",
"Biomedical Science,Social Science",
"Biomedical Science,Translational Medicine",
"Biotherapeutics,Structural Biology",
"Botany,Data Management",
"Biomedical Science,Earth Science,Environmental Science,Life Science,Traditional Medicine",
"Biomedical Science,Earth Science,Environmental Science,Epidemiology,Life Science,Virology",
"Biomedical Science,Drug Repositioning,Epidemiology,Life Science,Virology",
"Biomedical Science,Drug Metabolism,Medical Informatics,Medicine",
"Bioinformatics,Data Management,Data Submission, Annotation and Curation,Epidemiology,Functional Genomics,Genomics,Metagenomics,Transcriptomics,Virology",
"Bioinformatics,Data Management,Epidemiology,Functional Genomics,Genomics,Life Science,Metagenomics,Virology",
"Bioinformatics,Data Submission, Annotation and Curation,Epigenomics,Genetics,Genomics,Knowledge and Information Systems,Life Science,Metagenomics,Omics,Transcriptomics",
"Bioinformatics,Data Visualization,Functional Genomics,Genomics,Life Science,Phylogenetics",
"Bioinformatics,Data Visualization,Functional Genomics,Life Science",
"Bioinformatics,Enzymology",
"Bioinformatics,Epigenetics,Genomics,Life Science",
"Bioinformatics,Epigenomics",
"Bioinformatics,Functional Genomics,Life Science",
"Bioinformatics,Functional Genomics,Transcriptomics",
"Bioinformatics,Genetics,Transcriptomics",
"Bioinformatics,Genomics",
"Bioinformatics,Genomics,Life Science,Ontology and Terminology",
"Bioinformatics,Immunology,Life Science",
"Bioinformatics,Life Science,Microbiology,Phylogenetics",
"Bioinformatics,Microbiology",
"Bioinformatics,Molecular Genetics,Molecular biology",
"Bioinformatics,Proteomics",
"Bioinformatics,Proteomics,Transcriptomics",
"Bioinformatics,Software Engineering",
"Bioinformatics,Systems Biology",
"Bioinformatics,Computational Biology,Life Science,Systems Biology",
"Bioinformatics,Computational Biology,Life Science,Metabolomics,Proteomics,Transcriptomics",
"Bioinformatics,Computational Biology,Genomics",
"Bioengineering,Biomedical Science,Computational Biology,Computer Science,Neurobiology,Neuroscience",
"Biodiversity,Freshwater Science,Life Science",
"Biodiversity,Life Science,Microbiology",
"Biodiversity,Life Science,Natural History",
"Biodiversity,Life Science,Oceanography",
"Biodiversity,Life Science,Phylogeny",
"Biodiversity,Life Science,Tropical Medicine",
"Biodiversity,Natural History",
"Biodiversity,Population Genetics",
"Biodiversity,Taxonomy",
"Bioengineering,Genetics",
"Bioinformatics,Comparative Genomics,Oncology,Translational Medicine",
"Bioengineering,Synthetic Biology",
"Bioinformatics,Biological Psychology,Computational Neuroscience,Epigenomics,Life Science,Neuroscience",
"Bioinformatics,Biology,Data Integration,Data Submission, Annotation and Curation,Genetics,Life Science,Molecular Genetics",
"Bioinformatics,Biomedical Science,Genomics,Life Science",
"Bioinformatics,Biomedical Science,Health Science,Immunogenetics,Medicine",
"Bioinformatics,Biomedical Science,Life Science",
"Bioinformatics,Biotechnology,Data Management,Life Science,Metabolomics,Microbiology,Molecular biology,Proteomics,Systems Biology,Transcriptomics",
"Bioinformatics,Botany,Genetics,Plant Anatomy,Plant Genetics",
"Bioinformatics,Cell Biology,Developmental Biology,Life Science",
"Biology,Biomedical Science",
"Biology,Biomedical Science,Genetics,Life Science,Molecular biology",
"Biology,Biomedical Science,Life Science",
"Biomedical Science,Computer Science,Humanities,Mathematics,Physics,Social Science",
"Biomedical Science,Clinical Studies,Epidemiology,Medical Informatics,Preclinical Studies",
"Biomedical Science,Clinical Studies,Epidemiology,Preclinical Studies",
"Biomedical Science,Clinical Studies,Epidemiology,Public Health,Virology",
"Biomedical Science,Clinical Studies,Genomics,Preclinical Studies",
"Biomedical Science,Clinical Studies,Health Science,Medicine,Preclinical Studies,Virology",
"Biomedical Science,Clinical Studies,Medical Informatics,Medicine",
"Biomedical Science,Clinical Studies,Preclinical Studies",
"Biomedical Science,Comparative Genomics,Genomics",
"Biomedical Science,Computational Neuroscience,Neuroscience",
"Biomedical Science,Data Integration,Data Management",
"Biomedical Science,Clinical Studies,Epidemiology,Health Science,Medical Informatics,Preclinical Studies,Public Health,Virology",
"Biomedical Science,Data Integration,Epidemiology,Virology",
"Biomedical Science,Data Mining,Life Science",
"Biomedical Science,Data Security",
"Biomedical Science,Developmental Biology,Neurobiology",
"Biomedical Science,Drug Development,Drug Discovery",
"Biomedical Science,Drug Development,Drug Discovery,Drug Repositioning,Pharmacology,Pharmacy",
"Biomedical Science,Drug Discovery,Drug Metabolism",
"Biomedical Science,Drug Discovery,Epigenetics,Genetics,Genomics,Human Genetics,Molecular biology,Transcriptomics",
"Biomedical Science,Drug Discovery,Life Science",
"Biomedical Science,Clinical Studies,Epidemiology,Life Science,Virology",
"Biomedical Science,Clinical Studies,Drug Discovery,Epidemiology,Virology",
"Biology,Botany",
"Biology,Taxonomy",
"Biology,Cell Biology,Life Science",
"Biology,Chemistry,Clinical Studies,Computer Science,Health Science,Informatics,Materials Engineering,Mathematics,Physics,Psychology,Public Health",
"Biology,Chemistry,Computer Science,Engineering Science,Life Science,Mathematics,Natural Science,Physics",
"Biology,Chemistry,Life Science,Metabolomics",
"Biology,Data Submission, Annotation and Curation,Database Management,Genetics,Life Science,Quantitative Genetics",
"Biology,Earth Science,Environmental Science,Geochemistry,Geology,Mineralogy",
"Biology,Epidemiology,Virology",
"Biology,Life Science,Oncology",
"Biology,Life Science,Transcriptomics",
"Biology,Thermodynamics",
"Biomedical Science,Clinical Studies,Data Security,Demographics,Epidemiology,Health Science,Medicine,Preclinical Studies",
"Biomaterials,Composite Materials,Functional Materials Research,Materials Engineering,Materials Informatics,Materials Science,Materials Structuring and Functionalisation,Mechanical Behaviour of Construction Materials,Microstructural Mechanical Properties of Materials",
"Biomedical Science,Botany",
"Biomedical Science,Cell Biology,Clinical Studies,Life Science,Molecular biology,Preclinical Studies",
"Biomedical Science,Cell Biology,Life Science,Pediatrics",
"Biomedical Science,Cell Biology,Life Science,Transcriptomics",
"Biomedical Science,Cell Biology,Medicine,Medicines Research and Development,Oncology",
"Biomedical Science,Chemistry",
"Biomedical Science,Chemistry,Health Science,Pharmacology",
"Biomedical Science,Clinical Studies,Critical Care Medicine,Data Governance,Data Management,Data Submission, Annotation and Curation,Demographics,Gynecology,Life Science,Medicine,Musculoskeletal Medicine,Obstetrics,Pediatrics,Pharmacology,Reproductive Health,Social Science",
"Water Management,Water Research"
],
"y": [
367,
44,
33,
30,
30,
16,
15,
15,
12,
12,
11,
11,
10,
10,
10,
9,
9,
8,
8,
7,
7,
7,
7,
7,
7,
7,
6,
6,
5,
5,
5,
5,
4,
4,
4,
4,
4,
4,
4,
4,
4,
4,
4,
4,
4,
4,
4,
3,
3,
3,
3,
3,
3,
3,
3,
3,
3,
3,
3,
3,
3,
3,
3,
3,
3,
3,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1
]
}
],
"layout": {
"template": {
"data": {
"bar": [
{
"error_x": {
"color": "#2a3f5f"
},
"error_y": {
"color": "#2a3f5f"
},
"marker": {
"line": {
"color": "#E5ECF6",
"width": 0.5
}
},
"type": "bar"
}
],
"barpolar": [
{
"marker": {
"line": {
"color": "#E5ECF6",
"width": 0.5
}
},
"type": "barpolar"
}
],
"carpet": [
{
"aaxis": {
"endlinecolor": "#2a3f5f",
"gridcolor": "white",
"linecolor": "white",
"minorgridcolor": "white",
"startlinecolor": "#2a3f5f"
},
"baxis": {
"endlinecolor": "#2a3f5f",
"gridcolor": "white",
"linecolor": "white",
"minorgridcolor": "white",
"startlinecolor": "#2a3f5f"
},
"type": "carpet"
}
],
"choropleth": [
{
"colorbar": {
"outlinewidth": 0,
"ticks": ""
},
"type": "choropleth"
}
],
"contour": [
{
"colorbar": {
"outlinewidth": 0,
"ticks": ""
},
"colorscale": [
[
0,
"#0d0887"
],
[
0.1111111111111111,
"#46039f"
],
[
0.2222222222222222,
"#7201a8"
],
[
0.3333333333333333,
"#9c179e"
],
[
0.4444444444444444,
"#bd3786"
],
[
0.5555555555555556,
"#d8576b"
],
[
0.6666666666666666,
"#ed7953"
],
[
0.7777777777777778,
"#fb9f3a"
],
[
0.8888888888888888,
"#fdca26"
],
[
1,
"#f0f921"
]
],
"type": "contour"
}
],
"contourcarpet": [
{
"colorbar": {
"outlinewidth": 0,
"ticks": ""
},
"type": "contourcarpet"
}
],
"heatmap": [
{
"colorbar": {
"outlinewidth": 0,
"ticks": ""
},
"colorscale": [
[
0,
"#0d0887"
],
[
0.1111111111111111,
"#46039f"
],
[
0.2222222222222222,
"#7201a8"
],
[
0.3333333333333333,
"#9c179e"
],
[
0.4444444444444444,
"#bd3786"
],
[
0.5555555555555556,
"#d8576b"
],
[
0.6666666666666666,
"#ed7953"
],
[
0.7777777777777778,
"#fb9f3a"
],
[
0.8888888888888888,
"#fdca26"
],
[
1,
"#f0f921"
]
],
"type": "heatmap"
}
],
"heatmapgl": [
{
"colorbar": {
"outlinewidth": 0,
"ticks": ""
},
"colorscale": [
[
0,
"#0d0887"
],
[
0.1111111111111111,
"#46039f"
],
[
0.2222222222222222,
"#7201a8"
],
[
0.3333333333333333,
"#9c179e"
],
[
0.4444444444444444,
"#bd3786"
],
[
0.5555555555555556,
"#d8576b"
],
[
0.6666666666666666,
"#ed7953"
],
[
0.7777777777777778,
"#fb9f3a"
],
[
0.8888888888888888,
"#fdca26"
],
[
1,
"#f0f921"
]
],
"type": "heatmapgl"
}
],
"histogram": [
{
"marker": {
"colorbar": {
"outlinewidth": 0,
"ticks": ""
}
},
"type": "histogram"
}
],
"histogram2d": [
{
"colorbar": {
"outlinewidth": 0,
"ticks": ""
},
"colorscale": [
[
0,
"#0d0887"
],
[
0.1111111111111111,
"#46039f"
],
[
0.2222222222222222,
"#7201a8"
],
[
0.3333333333333333,
"#9c179e"
],
[
0.4444444444444444,
"#bd3786"
],
[
0.5555555555555556,
"#d8576b"
],
[
0.6666666666666666,
"#ed7953"
],
[
0.7777777777777778,
"#fb9f3a"
],
[
0.8888888888888888,
"#fdca26"
],
[
1,
"#f0f921"
]
],
"type": "histogram2d"
}
],
"histogram2dcontour": [
{
"colorbar": {
"outlinewidth": 0,
"ticks": ""
},
"colorscale": [
[
0,
"#0d0887"
],
[
0.1111111111111111,
"#46039f"
],
[
0.2222222222222222,
"#7201a8"
],
[
0.3333333333333333,
"#9c179e"
],
[
0.4444444444444444,
"#bd3786"
],
[
0.5555555555555556,
"#d8576b"
],
[
0.6666666666666666,
"#ed7953"
],
[
0.7777777777777778,
"#fb9f3a"
],
[
0.8888888888888888,
"#fdca26"
],
[
1,
"#f0f921"
]
],
"type": "histogram2dcontour"
}
],
"mesh3d": [
{
"colorbar": {
"outlinewidth": 0,
"ticks": ""
},
"type": "mesh3d"
}
],
"parcoords": [
{
"line": {
"colorbar": {
"outlinewidth": 0,
"ticks": ""
}
},
"type": "parcoords"
}
],
"pie": [
{
"automargin": true,
"type": "pie"
}
],
"scatter": [
{
"marker": {
"colorbar": {
"outlinewidth": 0,
"ticks": ""
}
},
"type": "scatter"
}
],
"scatter3d": [
{
"line": {
"colorbar": {
"outlinewidth": 0,
"ticks": ""
}
},
"marker": {
"colorbar": {
"outlinewidth": 0,
"ticks": ""
}
},
"type": "scatter3d"
}
],
"scattercarpet": [
{
"marker": {
"colorbar": {
"outlinewidth": 0,
"ticks": ""
}
},
"type": "scattercarpet"
}
],
"scattergeo": [
{
"marker": {
"colorbar": {
"outlinewidth": 0,
"ticks": ""
}
},
"type": "scattergeo"
}
],
"scattergl": [
{
"marker": {
"colorbar": {
"outlinewidth": 0,
"ticks": ""
}
},
"type": "scattergl"
}
],
"scattermapbox": [
{
"marker": {
"colorbar": {
"outlinewidth": 0,
"ticks": ""
}
},
"type": "scattermapbox"
}
],
"scatterpolar": [
{
"marker": {
"colorbar": {
"outlinewidth": 0,
"ticks": ""
}
},
"type": "scatterpolar"
}
],
"scatterpolargl": [
{
"marker": {
"colorbar": {
"outlinewidth": 0,
"ticks": ""
}
},
"type": "scatterpolargl"
}
],
"scatterternary": [
{
"marker": {
"colorbar": {
"outlinewidth": 0,
"ticks": ""
}
},
"type": "scatterternary"
}
],
"surface": [
{
"colorbar": {
"outlinewidth": 0,
"ticks": ""
},
"colorscale": [
[
0,
"#0d0887"
],
[
0.1111111111111111,
"#46039f"
],
[
0.2222222222222222,
"#7201a8"
],
[
0.3333333333333333,
"#9c179e"
],
[
0.4444444444444444,
"#bd3786"
],
[
0.5555555555555556,
"#d8576b"
],
[
0.6666666666666666,
"#ed7953"
],
[
0.7777777777777778,
"#fb9f3a"
],
[
0.8888888888888888,
"#fdca26"
],
[
1,
"#f0f921"
]
],
"type": "surface"
}
],
"table": [
{
"cells": {
"fill": {
"color": "#EBF0F8"
},
"line": {
"color": "white"
}
},
"header": {
"fill": {
"color": "#C8D4E3"
},
"line": {
"color": "white"
}
},
"type": "table"
}
]
},
"layout": {
"annotationdefaults": {
"arrowcolor": "#2a3f5f",
"arrowhead": 0,
"arrowwidth": 1
},
"autotypenumbers": "strict",
"coloraxis": {
"colorbar": {
"outlinewidth": 0,
"ticks": ""
}
},
"colorscale": {
"diverging": [
[
0,
"#8e0152"
],
[
0.1,
"#c51b7d"
],
[
0.2,
"#de77ae"
],
[
0.3,
"#f1b6da"
],
[
0.4,
"#fde0ef"
],
[
0.5,
"#f7f7f7"
],
[
0.6,
"#e6f5d0"
],
[
0.7,
"#b8e186"
],
[
0.8,
"#7fbc41"
],
[
0.9,
"#4d9221"
],
[
1,
"#276419"
]
],
"sequential": [
[
0,
"#0d0887"
],
[
0.1111111111111111,
"#46039f"
],
[
0.2222222222222222,
"#7201a8"
],
[
0.3333333333333333,
"#9c179e"
],
[
0.4444444444444444,
"#bd3786"
],
[
0.5555555555555556,
"#d8576b"
],
[
0.6666666666666666,
"#ed7953"
],
[
0.7777777777777778,
"#fb9f3a"
],
[
0.8888888888888888,
"#fdca26"
],
[
1,
"#f0f921"
]
],
"sequentialminus": [
[
0,
"#0d0887"
],
[
0.1111111111111111,
"#46039f"
],
[
0.2222222222222222,
"#7201a8"
],
[
0.3333333333333333,
"#9c179e"
],
[
0.4444444444444444,
"#bd3786"
],
[
0.5555555555555556,
"#d8576b"
],
[
0.6666666666666666,
"#ed7953"
],
[
0.7777777777777778,
"#fb9f3a"
],
[
0.8888888888888888,
"#fdca26"
],
[
1,
"#f0f921"
]
]
},
"colorway": [
"#636efa",
"#EF553B",
"#00cc96",
"#ab63fa",
"#FFA15A",
"#19d3f3",
"#FF6692",
"#B6E880",
"#FF97FF",
"#FECB52"
],
"font": {
"color": "#2a3f5f"
},
"geo": {
"bgcolor": "white",
"lakecolor": "white",
"landcolor": "#E5ECF6",
"showlakes": true,
"showland": true,
"subunitcolor": "white"
},
"hoverlabel": {
"align": "left"
},
"hovermode": "closest",
"mapbox": {
"style": "light"
},
"paper_bgcolor": "white",
"plot_bgcolor": "#E5ECF6",
"polar": {
"angularaxis": {
"gridcolor": "white",
"linecolor": "white",
"ticks": ""
},
"bgcolor": "#E5ECF6",
"radialaxis": {
"gridcolor": "white",
"linecolor": "white",
"ticks": ""
}
},
"scene": {
"xaxis": {
"backgroundcolor": "#E5ECF6",
"gridcolor": "white",
"gridwidth": 2,
"linecolor": "white",
"showbackground": true,
"ticks": "",
"zerolinecolor": "white"
},
"yaxis": {
"backgroundcolor": "#E5ECF6",
"gridcolor": "white",
"gridwidth": 2,
"linecolor": "white",
"showbackground": true,
"ticks": "",
"zerolinecolor": "white"
},
"zaxis": {
"backgroundcolor": "#E5ECF6",
"gridcolor": "white",
"gridwidth": 2,
"linecolor": "white",
"showbackground": true,
"ticks": "",
"zerolinecolor": "white"
}
},
"shapedefaults": {
"line": {
"color": "#2a3f5f"
}
},
"ternary": {
"aaxis": {
"gridcolor": "white",
"linecolor": "white",
"ticks": ""
},
"baxis": {
"gridcolor": "white",
"linecolor": "white",
"ticks": ""
},
"bgcolor": "#E5ECF6",
"caxis": {
"gridcolor": "white",
"linecolor": "white",
"ticks": ""
}
},
"title": {
"x": 0.05
},
"xaxis": {
"automargin": true,
"gridcolor": "white",
"linecolor": "white",
"ticks": "",
"title": {
"standoff": 15
},
"zerolinecolor": "white",
"zerolinewidth": 2
},
"yaxis": {
"automargin": true,
"gridcolor": "white",
"linecolor": "white",
"ticks": "",
"title": {
"standoff": 15
},
"zerolinecolor": "white",
"zerolinewidth": 2
}
}
},
"title": {
"text": "Subject coverage FAIRsharing"
},
"xaxis": {
"tickangle": 45,
"tickfont": {
"size": 12
}
}
}
},
"text/html": [
"<div> <div id=\"2cda32ef-3158-4505-8c17-b37ad66f7d04\" class=\"plotly-graph-div\" style=\"height:525px; width:100%;\"></div> <script type=\"text/javascript\"> require([\"plotly\"], function(Plotly) { window.PLOTLYENV=window.PLOTLYENV || {}; if (document.getElementById(\"2cda32ef-3158-4505-8c17-b37ad66f7d04\")) { Plotly.newPlot( \"2cda32ef-3158-4505-8c17-b37ad66f7d04\", [{\"name\": \"FAIRsharing\", \"type\": \"bar\", \"x\": [\"Life Science\", \"Biomedical Science,Life Science\", \"Genomics,Life Science\", \"Biodiversity,Life Science\", \"Biomedical Science\", \"Earth Science,Environmental Science\", \"Data Management\", \"Life Science,Proteomics\", \"Genomics\", \"Comparative Genomics,Life Science\", \"Earth Science\", \"Life Science,Metabolomics\", \"Biology\", \"Epidemiology,Life Science,Virology\", \"Biomedical Science,Preclinical Studies\", \"Life Science,Ontology and Terminology\", \"Engineering Science,Humanities and Social Sciences,Natural Science\", \"Life Science,Phylogenetics\", \"Knowledge and Information Systems,Software Engineering\", \"Atmospheric Science,Earth Science,Oceanography\", \"Anatomy,Life Science\", \"Clinical Studies,Critical Care Medicine,Health Science,Infectious Disease Medicine,Medical Virology,Medicine\", \"Glycomics,Life Science\", \"Functional Genomics,Life Science\", \"Biology,Life Science\", \"Structural Biology\", \"Atmospheric Science,Earth Science\", \"Bioinformatics\", \"Earth Science,Meteorology\", \"Genetics,Life Science\", \"Astrophysics and Astronomy\", \"Bioinformatics,Biology\", \"Comparative Genomics,Genomics,Life Science\", \"Biomedical Science,Immunogenetics,Immunology\", \"Earth Science,Environmental Science,Oceanography\", \"Biochemistry,Life Science\", \"Life Science,Neurobiology\", \"Earth Science,Geology,Geophysics\", \"Oceanography\", \"Environmental Science\", \"Biomedical Science,Life Science,Neurobiology\", \"Biomedical Science,Genetics,Life Science\", \"Comparative Genomics,Genomics\", \"Life 
Science,Transcriptomics\", \"Genetics,Genomics,Life Science\", \"Developmental Biology,Life Science\", \"Genetics\", \"Computational Biology,Life Science\", \"Atmospheric Science,Earth Science,Environmental Science,Geology\", \"Biomedical Science,Genomics,Life Science\", \"Epigenetics,Epigenomics\", \"Atmospheric Science,Earth Science,Meteorology\", \"Epigenetics,Life Science\", \"Functional Genomics,Genomics,Life Science\", \"Biomedical Science,Drug Development,Drug Discovery,Epidemiology,Virology\", \"Biomedical Science,Health Science\", \"Transcriptomics\", \"Earth Science,Geophysics\", \"Earth Science,Environmental Science,Geology\", \"Agriculture,Genomics,Life Science,Plant Breeding\", \"Environmental Science,Oceanography\", \"Earth Science,Geology\", \"Environmental Science,Marine Biology\", \"Data Submission, Annotation and Curation,Life Science\", \"Proteomics\", \"Life Science,Systems Biology\", \"Atmospheric Science,Remote Sensing\", \"Computer Science\", \"Earth Science,Geology,Hydrogeology,Mineralogy\", \"Earth Science,Geology,Geophysics,Geotechnics\", \"Earth Science,Geography,Remote Sensing\", \"Earth Science,Geography,Geology,Oceanography\", \"Earth Science,Geodesy,Geophysics\", \"Bioinformatics,Computational Neuroscience,Neuroscience\", \"Bioinformatics,Data Management,Data Submission, Annotation and Curation,Functional Genomics,Genomics,Metagenomics,Transcriptomics\", \"Computational Biology,Systems Biology\", \"Atmospheric Science,Earth Science,Environmental Science\", \"Astrophysics and Astronomy,Earth Science,Geophysics\", \"Biomedical Science,Glycomics\", \"Bioinformatics,Structural Biology\", \"Earth Science,Environmental Science,Geophysics\", \"Biology,Genomics,Life Science\", \"Earth Science,Oceanography,Water Research\", \"Earth Science,Oceanography\", \"Biomedical Science,Epidemiology,Virology\", \"Atmospheric Science,Meteorology,Oceanography,Remote Sensing\", \"Data Mining
" \n",
"var gd = document.getElementById('2cda32ef-3158-4505-8c17-b37ad66f7d04');\n",
"var x = new MutationObserver(function (mutations, observer) {{\n",
" var display = window.getComputedStyle(gd).display;\n",
" if (!display || display === 'none') {{\n",
" console.log([gd, 'removed!']);\n",
" Plotly.purge(gd);\n",
" observer.disconnect();\n",
" }}\n",
"}});\n",
"\n",
"// Listen for the removal of the full notebook cells\n",
"var notebookContainer = gd.closest('#notebook-container');\n",
"if (notebookContainer) {{\n",
" x.observe(notebookContainer, {childList: true});\n",
"}}\n",
"\n",
"// Listen for the clearing of the current output cell\n",
"var outputEl = gd.closest('.output');\n",
"if (outputEl) {{\n",
" x.observe(outputEl, {childList: true});\n",
"}}\n",
"\n",
" }) }; }); </script> </div>"
]
},
"metadata": {},
"output_type": "display_data"
}
],
"source": [
"# Count non-null `url` values per distinct `subjects` value, most frequent first.\n",
"data = fairsharing_subjects.groupby('subjects')[['url']].count().sort_values('url', ascending=False)\n",
"plot = [\n",
"    go.Bar(\n",
"        x=data.index,\n",
"        y=data['url'],\n",
"        name='FAIRsharing'\n",
"    )\n",
"]\n",
"\n",
"layout = go.Layout(\n",
"    title='Subject coverage FAIRsharing',\n",
"    xaxis=dict(tickangle=45, tickfont=dict(size=12))\n",
")\n",
"\n",
"# Keep the Figure object in `fig`: Figure.show() returns None, so chaining it\n",
"# onto the constructor would leave `fig` empty.\n",
"fig = go.Figure(plot, layout)\n",
"fig.show()"
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"## Geographic analysis"
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"**re3data**"
]
},
{
"cell_type": "code",
"execution_count": 21,
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>re3data_id</th>\n",
" <th>institution</th>\n",
" <th>org_name</th>\n",
" <th>org_other_names</th>\n",
" <th>org_country</th>\n",
" <th>org_3</th>\n",
" <th>org_noprofit</th>\n",
" <th>org_url</th>\n",
" <th>org_ids</th>\n",
" <th>org_date1</th>\n",
" <th>org_date2</th>\n",
" <th>org_contact</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>0</th>\n",
" <td>r3d100000001</td>\n",
" <td>[Odum Institute for Research in Social Science...</td>\n",
" <td>Odum Institute for Research in Social Science</td>\n",
" <td>[]</td>\n",
" <td>USA</td>\n",
" <td>[general]</td>\n",
" <td>non-profit</td>\n",
" <td>https://odum.unc.edu/archive/</td>\n",
" <td>[]</td>\n",
" <td></td>\n",
" <td></td>\n",
" <td>[]</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1</th>\n",
" <td>r3d100000002</td>\n",
" <td>[The U.S. National Archives and Records Admini...</td>\n",
" <td>The U.S. National Archives and Records Adminis...</td>\n",
" <td>[NARA, National Archives]</td>\n",
" <td>USA</td>\n",
" <td>[general]</td>\n",
" <td>non-profit</td>\n",
" <td>http://www.archives.gov/</td>\n",
" <td>[]</td>\n",
" <td></td>\n",
" <td></td>\n",
" <td>[http://www.archives.gov/contact/]</td>\n",
" </tr>\n",
" <tr>\n",
" <th>2</th>\n",
" <td>r3d100000002</td>\n",
" <td>[The USA.gov, [], USA, [general], non-profit, ...</td>\n",
" <td>The USA.gov</td>\n",
" <td>[]</td>\n",
" <td>USA</td>\n",
" <td>[general]</td>\n",
" <td>non-profit</td>\n",
" <td>http://www.usa.gov/</td>\n",
" <td>[]</td>\n",
" <td></td>\n",
" <td></td>\n",
" <td>[http://www.usa.gov/Contact.shtml]</td>\n",
" </tr>\n",
" <tr>\n",
" <th>3</th>\n",
" <td>r3d100000004</td>\n",
" <td>[Institut für Deutsche Sprache, Archiv für Ges...</td>\n",
" <td>Institut für Deutsche Sprache, Archiv für Gesp...</td>\n",
" <td>[AGD]</td>\n",
" <td>DEU</td>\n",
" <td>[funding, general]</td>\n",
" <td>non-profit</td>\n",
" <td>http://agd.ids-mannheim.de/index.shtml</td>\n",
" <td>[]</td>\n",
" <td>2004</td>\n",
" <td></td>\n",
" <td>[agd@ids-mannheim.de]</td>\n",
" </tr>\n",
" <tr>\n",
" <th>4</th>\n",
" <td>r3d100000005</td>\n",
" <td>[Odum Institute for Research in Social Science...</td>\n",
" <td>Odum Institute for Research in Social Science</td>\n",
" <td>[]</td>\n",
" <td>USA</td>\n",
" <td>[technical]</td>\n",
" <td>non-profit</td>\n",
" <td>https://odum.unc.edu/</td>\n",
" <td>[]</td>\n",
" <td></td>\n",
" <td></td>\n",
" <td>[https://odum.unc.edu/contact/contact-form/, o...</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"</div>"
],
"text/plain": [
" re3data_id institution \\\n",
"0 r3d100000001 [Odum Institute for Research in Social Science... \n",
"1 r3d100000002 [The U.S. National Archives and Records Admini... \n",
"2 r3d100000002 [The USA.gov, [], USA, [general], non-profit, ... \n",
"3 r3d100000004 [Institut für Deutsche Sprache, Archiv für Ges... \n",
"4 r3d100000005 [Odum Institute for Research in Social Science... \n",
"\n",
" org_name \\\n",
"0 Odum Institute for Research in Social Science \n",
"1 The U.S. National Archives and Records Adminis... \n",
"2 The USA.gov \n",
"3 Institut für Deutsche Sprache, Archiv für Gesp... \n",
"4 Odum Institute for Research in Social Science \n",
"\n",
" org_other_names org_country org_3 org_noprofit \\\n",
"0 [] USA [general] non-profit \n",
"1 [NARA, National Archives] USA [general] non-profit \n",
"2 [] USA [general] non-profit \n",
"3 [AGD] DEU [funding, general] non-profit \n",
"4 [] USA [technical] non-profit \n",
"\n",
" org_url org_ids org_date1 org_date2 \\\n",
"0 https://odum.unc.edu/archive/ [] \n",
"1 http://www.archives.gov/ [] \n",
"2 http://www.usa.gov/ [] \n",
"3 http://agd.ids-mannheim.de/index.shtml [] 2004 \n",
"4 https://odum.unc.edu/ [] \n",
"\n",
" org_contact \n",
"0 [] \n",
"1 [http://www.archives.gov/contact/] \n",
"2 [http://www.usa.gov/Contact.shtml] \n",
"3 [agd@ids-mannheim.de] \n",
"4 [https://odum.unc.edu/contact/contact-form/, o... "
]
},
"execution_count": 21,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"# One row per (repository, institution) pair; rows whose institution is missing are dropped.\n",
"re3data_institutions = (\n",
"    re3data_df\n",
"    .explode('institution')[['re3data_id', 'institution']]\n",
"    .loc[lambda df: df['institution'].notna()]\n",
"    .reset_index(drop=True)\n",
")\n",
"\n",
"# Spread the positional fields of each institution record into named org_* columns.\n",
"# The join is index-based, hence the reset_index above.\n",
"re3data_institutions = re3data_institutions.join(\n",
"    pd.DataFrame(\n",
"        re3data_institutions['institution'].to_list(),\n",
"        columns=[\n",
"            'org_name', 'org_other_names', 'org_country', 'org_3', 'org_noprofit',\n",
"            'org_url', 'org_ids', 'org_date1', 'org_date2', 'org_contact',\n",
"        ],\n",
"    )\n",
")\n",
"re3data_institutions.head()"
]
},
{
"cell_type": "code",
"execution_count": 22,
"metadata": {},
"outputs": [],
"source": [
"# Derive a continent code from each alpha-3 country code; codes that cannot be mapped become NaN.\n",
"re3data_institutions['org_continent'] = re3data_institutions['org_country'].map(countrycode_to_continent)"
]
},
{
"cell_type": "code",
"execution_count": 23,
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"array(['AAA', 'EEC'], dtype=object)"
]
},
"execution_count": 23,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"# Country codes for which no continent could be derived.\n",
"re3data_institutions.loc[re3data_institutions['org_continent'].isna(), 'org_country'].unique()"
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"AAA is used for international collaborations; we skip this.\n",
"EEC is used for the EU commission; we fix the continent manually."
]
},
{
"cell_type": "code",
"execution_count": 24,
"metadata": {},
"outputs": [],
"source": [
"# 'EEC' is not a real country code; assign its continent ('EU') by hand.\n",
"re3data_institutions.loc[re3data_institutions['org_country'].eq('EEC'), 'org_continent'] = 'EU'"
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"**OpenDOAR**"
]
},
{
"cell_type": "code",
"execution_count": 25,
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>opendoar_id</th>\n",
" <th>institution</th>\n",
" <th>org_name</th>\n",
" <th>org_other_names</th>\n",
" <th>org_country</th>\n",
" <th>org_3</th>\n",
" <th>org_noprofit</th>\n",
" <th>org_url</th>\n",
" <th>org_ids</th>\n",
" <th>org_date1</th>\n",
" <th>org_date2</th>\n",
" <th>org_contact</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>0</th>\n",
" <td>101</td>\n",
" <td>[university of utrecht, [universiteit utrecht]...</td>\n",
" <td>university of utrecht</td>\n",
" <td>[universiteit utrecht]</td>\n",
" <td>NLD</td>\n",
" <td>[]</td>\n",
" <td></td>\n",
" <td>https://www.uu.nl</td>\n",
" <td>[https://ror.org/04pp8hn57]</td>\n",
" <td></td>\n",
" <td></td>\n",
" <td>[]</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1</th>\n",
" <td>115</td>\n",
" <td>[indian institute of management kozhikode, [ii...</td>\n",
" <td>indian institute of management kozhikode</td>\n",
" <td>[iimk]</td>\n",
" <td>IND</td>\n",
" <td>[]</td>\n",
" <td></td>\n",
" <td>http://www.iimk.ac.in/</td>\n",
" <td>[https://ror.org/03m1xdc36]</td>\n",
" <td></td>\n",
" <td></td>\n",
" <td>[]</td>\n",
" </tr>\n",
" <tr>\n",
" <th>2</th>\n",
" <td>41</td>\n",
" <td>[california institute of technology, [caltech]...</td>\n",
" <td>california institute of technology</td>\n",
" <td>[caltech]</td>\n",
" <td>USA</td>\n",
" <td>[]</td>\n",
" <td></td>\n",
" <td>http://www.caltech.edu/</td>\n",
" <td>[https://ror.org/05dxps055]</td>\n",
" <td></td>\n",
" <td></td>\n",
" <td>[]</td>\n",
" </tr>\n",
" <tr>\n",
" <th>3</th>\n",
" <td>119</td>\n",
" <td>[dublin city university, [dcu], ie, [], , http...</td>\n",
" <td>dublin city university</td>\n",
" <td>[dcu]</td>\n",
" <td>IRL</td>\n",
" <td>[]</td>\n",
" <td></td>\n",
" <td>http://www.dcu.ie/</td>\n",
" <td>[https://ror.org/04a1a1e81]</td>\n",
" <td></td>\n",
" <td></td>\n",
" <td>[]</td>\n",
" </tr>\n",
" <tr>\n",
" <th>4</th>\n",
" <td>129</td>\n",
" <td>[istituto nazionale di geofisica e vulcanologi...</td>\n",
" <td>istituto nazionale di geofisica e vulcanologia</td>\n",
" <td>[ingv]</td>\n",
" <td>ITA</td>\n",
" <td>[]</td>\n",
" <td></td>\n",
" <td>http://www.ingv.it</td>\n",
" <td>[https://ror.org/00qps9a02]</td>\n",
" <td></td>\n",
" <td></td>\n",
" <td>[]</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"</div>"
],
"text/plain": [
" opendoar_id institution \\\n",
"0 101 [university of utrecht, [universiteit utrecht]... \n",
"1 115 [indian institute of management kozhikode, [ii... \n",
"2 41 [california institute of technology, [caltech]... \n",
"3 119 [dublin city university, [dcu], ie, [], , http... \n",
"4 129 [istituto nazionale di geofisica e vulcanologi... \n",
"\n",
" org_name org_other_names \\\n",
"0 university of utrecht [universiteit utrecht] \n",
"1 indian institute of management kozhikode [iimk] \n",
"2 california institute of technology [caltech] \n",
"3 dublin city university [dcu] \n",
"4 istituto nazionale di geofisica e vulcanologia [ingv] \n",
"\n",
" org_country org_3 org_noprofit org_url \\\n",
"0 NLD [] https://www.uu.nl \n",
"1 IND [] http://www.iimk.ac.in/ \n",
"2 USA [] http://www.caltech.edu/ \n",
"3 IRL [] http://www.dcu.ie/ \n",
"4 ITA [] http://www.ingv.it \n",
"\n",
" org_ids org_date1 org_date2 org_contact \n",
"0 [https://ror.org/04pp8hn57] [] \n",
"1 [https://ror.org/03m1xdc36] [] \n",
"2 [https://ror.org/05dxps055] [] \n",
"3 [https://ror.org/04a1a1e81] [] \n",
"4 [https://ror.org/00qps9a02] [] "
]
},
"execution_count": 25,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"# One row per (repository, institution) pair; rows whose institution is missing are dropped.\n",
"opendoar_institutions = (\n",
"    opendoar_df\n",
"    .explode('institution')[['opendoar_id', 'institution']]\n",
"    .loc[lambda df: df['institution'].notna()]\n",
"    .reset_index(drop=True)\n",
")\n",
"\n",
"# Spread the positional fields of each institution record into named org_* columns.\n",
"# The join is index-based, hence the reset_index above.\n",
"opendoar_institutions = opendoar_institutions.join(\n",
"    pd.DataFrame(\n",
"        opendoar_institutions['institution'].to_list(),\n",
"        columns=[\n",
"            'org_name', 'org_other_names', 'org_country', 'org_3', 'org_noprofit',\n",
"            'org_url', 'org_ids', 'org_date1', 'org_date2', 'org_contact',\n",
"        ],\n",
"    )\n",
")\n",
"\n",
"# Upper-case the country codes, then convert them from ISO alpha-2 to alpha-3; missing values are skipped.\n",
"opendoar_institutions['org_country'] = (\n",
"    opendoar_institutions['org_country']\n",
"    .map(str.upper, na_action='ignore')\n",
"    .map(countrycode_iso2_to_countrycode_iso3, na_action='ignore')\n",
")\n",
"opendoar_institutions.head()"
]
},
{
"cell_type": "code",
"execution_count": 26,
"metadata": {},
"outputs": [],
"source": [
"# Derive a continent code from each alpha-3 country code; codes that cannot be mapped become NaN.\n",
"opendoar_institutions['org_continent'] = opendoar_institutions['org_country'].map(countrycode_to_continent)"
]
},
{
"cell_type": "code",
"execution_count": 27,
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"array([nan, 'UMI'], dtype=object)"
]
},
"execution_count": 27,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"# Country codes for which no continent could be derived.\n",
"opendoar_institutions.loc[opendoar_institutions['org_continent'].isna(), 'org_country'].unique()"
]
},
{
"cell_type": "code",
"execution_count": 28,
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>opendoar_id</th>\n",
" <th>institution</th>\n",
" <th>org_name</th>\n",
" <th>org_other_names</th>\n",
" <th>org_country</th>\n",
" <th>org_3</th>\n",
" <th>org_noprofit</th>\n",
" <th>org_url</th>\n",
" <th>org_ids</th>\n",
" <th>org_date1</th>\n",
" <th>org_date2</th>\n",
" <th>org_contact</th>\n",
" <th>org_continent</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>4349</th>\n",
" <td>5379</td>\n",
" <td>[kettering university, [], um, [], , https://w...</td>\n",
" <td>kettering university</td>\n",
" <td>[]</td>\n",
" <td>UMI</td>\n",
" <td>[]</td>\n",
" <td></td>\n",
" <td>https://www.kettering.edu</td>\n",
" <td>[https://ror.org/03rcspa57]</td>\n",
" <td></td>\n",
" <td></td>\n",
" <td>[]</td>\n",
" <td>NA</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"</div>"
],
"text/plain": [
" opendoar_id institution \\\n",
"4349 5379 [kettering university, [], um, [], , https://w... \n",
"\n",
" org_name org_other_names org_country org_3 org_noprofit \\\n",
"4349 kettering university [] UMI [] \n",
"\n",
" org_url org_ids org_date1 \\\n",
"4349 https://www.kettering.edu [https://ror.org/03rcspa57] \n",
"\n",
" org_date2 org_contact org_continent \n",
"4349 [] NA "
]
},
"execution_count": 28,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"# No continent was derived for 'UMI' (see the previous cell's output); assign 'NA' by hand and show the affected rows.\n",
"opendoar_institutions.loc[opendoar_institutions['org_country'].eq('UMI'), 'org_continent'] = 'NA'\n",
"opendoar_institutions.loc[opendoar_institutions['org_country'].eq('UMI')]"
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"**ROAR**"
]
},
{
"cell_type": "code",
"execution_count": 29,
"metadata": {},
"outputs": [],
"source": [
"# Normalise ROAR country codes: upper-case them, convert ISO alpha-2 to alpha-3, then derive the continent.\n",
"# NOTE(review): location_country is overwritten in place, so re-running this cell on the converted\n",
"# column would presumably turn every code into NaN - reload roar_df before re-executing.\n",
"roar_df['location_country'] = (\n",
"    roar_df['location_country']\n",
"    .map(str.upper, na_action='ignore')\n",
"    .map(countrycode_iso2_to_countrycode_iso3)\n",
")\n",
"roar_df['continent'] = roar_df['location_country'].map(countrycode_to_continent)"
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"**FAIRsharing**"
]
},
{
"cell_type": "code",
"execution_count": 30,
"metadata": {},
"outputs": [],
"source": [
"# Turn the comma-separated subject and country strings into lists.\n",
"# NOTE(review): some subject names themselves contain a comma (e.g. 'Data Submission, Annotation and Curation'),\n",
"# so a plain split on ',' presumably breaks them apart - confirm.\n",
"fairsharing_df['subjects'] = fairsharing_df['subjects'].str.split(pat=',')\n",
"fairsharing_df['countries'] = fairsharing_df['countries'].str.split(pat=',')\n",
"\n",
"# One row per (entry, country); country names are resolved to ISO alpha-3 codes and then to continent codes.\n",
"fairsharing_countries = (\n",
"    fairsharing_df\n",
"    .explode('countries')\n",
"    .assign(countrycode=lambda df: df['countries'].map(country_to_countrycode))\n",
"    .assign(continent=lambda df: df['countrycode'].map(countrycode_to_continent))\n",
")"
]
},
{
"cell_type": "code",
"execution_count": 31,
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"array(['European Union', 'Republic of Ireland', 'Worldwide', nan],\n",
" dtype=object)"
]
},
"execution_count": 31,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"# Country names that could not be resolved to a country code.\n",
"fairsharing_countries.loc[fairsharing_countries['countrycode'].isna(), 'countries'].unique()"
]
},
{
"cell_type": "code",
"execution_count": 32,
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"array(['European Union', 'Republic of Ireland', 'Worldwide', 'Antarctica',\n",
" nan], dtype=object)"
]
},
"execution_count": 32,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"# Country names for which no continent could be derived.\n",
"fairsharing_countries.loc[fairsharing_countries['continent'].isna(), 'countries'].unique()"
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"Manually fix some rows"
]
},
{
"cell_type": "code",
"execution_count": 33,
"metadata": {},
"outputs": [],
"source": [
"# Country names that country_to_countrycode could not resolve are patched by hand.\n",
"# 'Republic of Ireland' gets the ISO alpha-3 code 'IRL' so that it matches the alpha-3 codes\n",
"# country_to_countrycode produces for the other rows (the alpha-2 code 'IE' would be\n",
"# counted as a separate country).\n",
"fairsharing_countries.loc[fairsharing_countries.countries == 'Republic of Ireland', ['countries', 'countrycode', 'continent']] = ['Ireland', 'IRL', 'EU']\n",
"# 'European Union' is not a country: it keeps the pseudo-code 'EU' and is placed in Europe.\n",
"# NOTE(review): re3data uses 'EEC' for the EU commission - confirm whether the two codes should be aligned.\n",
"fairsharing_countries.loc[fairsharing_countries.countries == 'European Union', ['countrycode', 'continent']] = ['EU', 'EU']"
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"Make Antarctica disappear (only one repo)"
]
},
{
"cell_type": "code",
"execution_count": 34,
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>full_name</th>\n",
" <th>short_name</th>\n",
" <th>fs_url</th>\n",
" <th>url</th>\n",
" <th>countries</th>\n",
" <th>subjects</th>\n",
" <th>countrycode</th>\n",
" <th>continent</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>915</th>\n",
" <td>Antabif IPT - AntOBIS IPT - GBIF Belgium</td>\n",
" <td>Antabif IPT - AntOBIS IPT - GBIF Belgium</td>\n",
" <td>https://fairsharing.org/10.25504/FAIRsharing.e...</td>\n",
" <td>http://ipt.biodiversity.aq/</td>\n",
" <td>Antarctica</td>\n",
" <td>[Biodiversity, Life Science]</td>\n",
" <td>AQ</td>\n",
" <td>NaN</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"</div>"
],
"text/plain": [
" full_name \\\n",
"915 Antabif IPT - AntOBIS IPT - GBIF Belgium \n",
"\n",
" short_name \\\n",
"915 Antabif IPT - AntOBIS IPT - GBIF Belgium \n",
"\n",
" fs_url \\\n",
"915 https://fairsharing.org/10.25504/FAIRsharing.e... \n",
"\n",
" url countries subjects \\\n",
"915 http://ipt.biodiversity.aq/ Antarctica [Biodiversity, Life Science] \n",
"\n",
" countrycode continent \n",
"915 AQ NaN "
]
},
"execution_count": 34,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"# Antarctica's continent is left as NaN so that the continental groupby drops it.\n",
"# The country code stays in ISO 3166-1 alpha-3 form ('ATA', not the alpha-2 'AQ'),\n",
"# consistent with the codes used for every other row.\n",
"fairsharing_countries.loc[fairsharing_countries.countries == 'Antarctica', ['countrycode', 'continent']] = ['ATA', np.nan]\n",
"fairsharing_countries[fairsharing_countries.countrycode == 'ATA']"
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"### Country coverage"
]
},
{
"cell_type": "code",
"execution_count": 35,
"metadata": {},
"outputs": [
{
"data": {
"application/vnd.plotly.v1+json": {
"config": {
"plotlyServerURL": "https://plot.ly"
},
"data": [
{
"name": "re3data",
"type": "bar",
"x": [
"USA",
"DEU",
"CAN",
"GBR",
"EEC",
"AAA",
"FRA",
"AUS",
"CHE",
"JPN",
"NLD",
"ESP",
"IND",
"CHN",
"ITA",
"AUT",
"NOR",
"SWE",
"BEL",
"DNK",
"POL",
"RUS",
"GRC",
"ZAF",
"CZE",
"IRL",
"MEX",
"BRA",
"TWN",
"FIN",
"PRT",
"NZL",
"EST",
"KOR",
"COL",
"SRB",
"LTU",
"ARG",
"SGP",
"HUN",
"ISR",
"TUR",
"SVN",
"ISL",
"KEN",
"UKR",
"ROU",
"IDN",
"LUX",
"SVK",
"HKG",
"PER",
"PAK",
"LVA",
"GRL",
"THA",
"CHL",
"BEN",
"PAN",
"CMR",
"CYP",
"MKD",
"SDN",
"HRV",
"BFA",
"TUN",
"CIV",
"GHA",
"SEN",
"PYF",
"PHL",
"NCL",
"NAM",
"LBN",
"KAZ",
"FJI",
"AZE",
"LKA"
],
"y": [
2690,
1040,
573,
514,
349,
294,
233,
215,
118,
113,
111,
88,
79,
74,
62,
54,
52,
39,
39,
38,
33,
33,
31,
22,
21,
21,
18,
17,
16,
15,
15,
15,
14,
14,
13,
11,
11,
9,
9,
9,
8,
7,
7,
6,
6,
4,
4,
4,
4,
4,
4,
3,
3,
3,
3,
3,
3,
2,
2,
2,
2,
2,
2,
2,
2,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1
]
},
{
"name": "openDOAR",
"type": "bar",
"visible": "legendonly",
"x": [
"USA",
"JPN",
"GBR",
"DEU",
"ESP",
"PER",
"TUR",
"IDN",
"FRA",
"BRA",
"HRV",
"ITA",
"POL",
"UKR",
"CAN",
"IND",
"COL",
"AUS",
"NLD",
"ARG",
"NOR",
"CHN",
"PRT",
"TWN",
"MEX",
"SWE",
"RUS",
"AUT",
"HUN",
"ZAF",
"SRB",
"KEN",
"KOR",
"GRC",
"ECU",
"BLR",
"CHE",
"BEL",
"NGA",
"IRL",
"CHL",
"CZE",
"MYS",
"FIN",
"DZA",
"NZL",
"LTU",
"IRN",
"THA",
"VEN",
"LKA",
"DNK",
"BGD",
"TZA",
"CUB",
"KAZ",
"SVN",
"MDA",
"SDN",
"UGA",
"SAU",
"NIC",
"ZWE",
"BGR",
"CRI",
"HKG",
"SLV",
"PHL",
"URY",
"EST",
"EGY",
"SGP",
"PSE",
"CYP",
"JAM",
"GHA",
"ROU",
"PAN",
"LVA",
"MKD",
"ETH",
"PAK",
"SVK",
"SEN",
"HND",
"ISL",
"DOM",
"LUX",
"MMR",
"ARE",
"MAR",
"BWA",
"LBY",
"GEO",
"LBN",
"ZMB",
"IRQ",
"ARM",
"AZE",
"RWA",
"LSO",
"MOZ",
"PRY",
"BIH",
"TUN",
"BOL",
"FJI",
"NAM",
"CPV",
"UMI",
"VNM",
"TTO",
"AFG",
"SOM",
"QAT",
"PRI",
"NPL",
"NCL",
"MWI",
"MLT",
"LAO",
"ALA",
"KGZ",
"GTM",
"GLP",
"CMR",
"AND",
"ALB",
"KWT"
],
"y": [
910,
682,
315,
280,
175,
162,
161,
156,
154,
151,
148,
141,
124,
105,
99,
98,
97,
91,
75,
72,
67,
60,
60,
60,
50,
50,
48,
46,
44,
44,
44,
43,
41,
38,
37,
37,
35,
33,
30,
30,
27,
26,
25,
22,
20,
19,
18,
18,
17,
16,
16,
15,
15,
14,
14,
12,
12,
12,
12,
11,
11,
11,
11,
11,
10,
9,
9,
9,
9,
8,
8,
7,
7,
6,
6,
6,
6,
6,
5,
5,
5,
4,
4,
4,
4,
4,
4,
4,
3,
3,
3,
3,
3,
3,
3,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1
]
},
{
"name": "ROAR",
"type": "bar",
"visible": "legendonly",
"x": [
"USA",
"GBR",
"DEU",
"JPN",
"ESP",
"BRA",
"TUR",
"IDN",
"PER",
"POL",
"IND",
"COL",
"UKR",
"FRA",
"CAN",
"ITA",
"CHN",
"AUS",
"TWN",
"SWE",
"RUS",
"ARG",
"PRT",
"NOR",
"KOR",
"MEX",
"ZAF",
"NLD",
"HUN",
"MYS",
"GRC",
"SRB",
"BEL",
"BLR",
"ECU",
"CHE",
"KEN",
"CHL",
"IRL",
"AUT",
"VEN",
"FIN",
"NZL",
"ROU",
"DNK",
"CZE",
"IRN",
"MDA",
"NGA",
"DZA",
"CUB",
"THA",
"SLV",
"SDN",
"PHL",
"ZWE",
"EGY",
"LTU",
"BGD",
"BGR",
"KAZ",
"SVN",
"HKG",
"CRI",
"SAU",
"TZA",
"CYP",
"URY",
"NIC",
"UGA",
"SGP",
"HRV",
"PSE",
"GHA",
"PAK",
"EST",
"AZE",
"LVA",
"DOM",
"MAR",
"BWA",
"KGZ",
"PAN",
"JAM",
"ETH",
"BIH",
"BOL",
"LBN",
"NPL",
"MKD",
"IRQ",
"FJI",
"SEN",
"SVK",
"LBY",
"LKA",
"LSO",
"LUX",
"ISL",
"TUN",
"DMA",
"ARM",
"MOZ",
"NAM",
"GEO",
"UMI",
"WSM",
"ARE",
"PRI",
"SYR",
"CMR",
"SOM",
"RWA",
"QAT",
"PRK",
"HND",
"MTQ",
"MLT",
"ALB",
"ISR",
"AFG"
],
"y": [
873,
258,
258,
234,
195,
181,
158,
151,
149,
126,
122,
119,
111,
101,
97,
96,
91,
82,
80,
76,
68,
65,
59,
56,
53,
48,
48,
46,
45,
41,
39,
38,
37,
35,
29,
29,
29,
27,
26,
26,
23,
23,
22,
17,
17,
16,
16,
16,
15,
14,
14,
13,
13,
13,
13,
12,
12,
11,
11,
11,
10,
10,
10,
9,
9,
8,
7,
7,
7,
7,
7,
7,
7,
6,
6,
5,
5,
5,
4,
4,
4,
4,
4,
4,
3,
3,
3,
3,
3,
3,
3,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1
]
},
{
"name": "FAIRsharing",
"type": "bar",
"visible": "legendonly",
"x": [
"USA",
"GBR",
"DEU",
"FRA",
"CHE",
"CHN",
"NLD",
"ITA",
"CAN",
"BEL",
"ESP",
"JPN",
"SWE",
"CZE",
"NOR",
"DNK",
"EU",
"AUT",
"FIN",
"IE",
"AUS",
"ISR",
"PRT",
"HUN",
"GRC",
"MLT",
"LTU",
"ISL",
"LUX",
"SVK",
"MNE",
"HRV",
"IND",
"POL",
"KOR",
"SGP",
"ZAF",
"RUS",
"NZL",
"TWN",
"MEX",
"BRA",
"SAU",
"HKG",
"ARG",
"TUR",
"BGR",
"EST",
"MAR",
"ROU",
"UGA",
"CYP",
"PAK",
"THA",
"CRI",
"SLV",
"TGO",
"URY",
"PAN",
"AQ",
"NIC",
"NGA",
"BEN",
"CHL",
"CMR",
"COL",
"EGY",
"ETH",
"FRO",
"GRL",
"HND",
"IDN",
"ARE",
"KEN",
"LVA",
"MDG",
"MLI",
"MOZ",
"MRT",
"MWI",
"NER",
"ZWE"
],
"y": [
686,
248,
192,
162,
114,
99,
96,
91,
86,
83,
83,
80,
76,
71,
69,
67,
66,
64,
63,
62,
62,
61,
60,
59,
58,
53,
52,
52,
52,
52,
51,
51,
32,
11,
10,
10,
9,
9,
8,
8,
8,
8,
6,
3,
3,
3,
3,
2,
2,
2,
2,
2,
2,
2,
2,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1
]
}
],
"layout": {
"template": {
"data": {
"bar": [
{
"error_x": {
"color": "#2a3f5f"
},
"error_y": {
"color": "#2a3f5f"
},
"marker": {
"line": {
"color": "#E5ECF6",
"width": 0.5
}
},
"type": "bar"
}
],
"barpolar": [
{
"marker": {
"line": {
"color": "#E5ECF6",
"width": 0.5
}
},
"type": "barpolar"
}
],
"carpet": [
{
"aaxis": {
"endlinecolor": "#2a3f5f",
"gridcolor": "white",
"linecolor": "white",
"minorgridcolor": "white",
"startlinecolor": "#2a3f5f"
},
"baxis": {
"endlinecolor": "#2a3f5f",
"gridcolor": "white",
"linecolor": "white",
"minorgridcolor": "white",
"startlinecolor": "#2a3f5f"
},
"type": "carpet"
}
],
"choropleth": [
{
"colorbar": {
"outlinewidth": 0,
"ticks": ""
},
"type": "choropleth"
}
],
"contour": [
{
"colorbar": {
"outlinewidth": 0,
"ticks": ""
},
"colorscale": [
[
0,
"#0d0887"
],
[
0.1111111111111111,
"#46039f"
],
[
0.2222222222222222,
"#7201a8"
],
[
0.3333333333333333,
"#9c179e"
],
[
0.4444444444444444,
"#bd3786"
],
[
0.5555555555555556,
"#d8576b"
],
[
0.6666666666666666,
"#ed7953"
],
[
0.7777777777777778,
"#fb9f3a"
],
[
0.8888888888888888,
"#fdca26"
],
[
1,
"#f0f921"
]
],
"type": "contour"
}
],
"contourcarpet": [
{
"colorbar": {
"outlinewidth": 0,
"ticks": ""
},
"type": "contourcarpet"
}
],
"heatmap": [
{
"colorbar": {
"outlinewidth": 0,
"ticks": ""
},
"colorscale": [
[
0,
"#0d0887"
],
[
0.1111111111111111,
"#46039f"
],
[
0.2222222222222222,
"#7201a8"
],
[
0.3333333333333333,
"#9c179e"
],
[
0.4444444444444444,
"#bd3786"
],
[
0.5555555555555556,
"#d8576b"
],
[
0.6666666666666666,
"#ed7953"
],
[
0.7777777777777778,
"#fb9f3a"
],
[
0.8888888888888888,
"#fdca26"
],
[
1,
"#f0f921"
]
],
"type": "heatmap"
}
],
"heatmapgl": [
{
"colorbar": {
"outlinewidth": 0,
"ticks": ""
},
"colorscale": [
[
0,
"#0d0887"
],
[
0.1111111111111111,
"#46039f"
],
[
0.2222222222222222,
"#7201a8"
],
[
0.3333333333333333,
"#9c179e"
],
[
0.4444444444444444,
"#bd3786"
],
[
0.5555555555555556,
"#d8576b"
],
[
0.6666666666666666,
"#ed7953"
],
[
0.7777777777777778,
"#fb9f3a"
],
[
0.8888888888888888,
"#fdca26"
],
[
1,
"#f0f921"
]
],
"type": "heatmapgl"
}
],
"histogram": [
{
"marker": {
"colorbar": {
"outlinewidth": 0,
"ticks": ""
}
},
"type": "histogram"
}
],
"histogram2d": [
{
"colorbar": {
"outlinewidth": 0,
"ticks": ""
},
"colorscale": [
[
0,
"#0d0887"
],
[
0.1111111111111111,
"#46039f"
],
[
0.2222222222222222,
"#7201a8"
],
[
0.3333333333333333,
"#9c179e"
],
[
0.4444444444444444,
"#bd3786"
],
[
0.5555555555555556,
"#d8576b"
],
[
0.6666666666666666,
"#ed7953"
],
[
0.7777777777777778,
"#fb9f3a"
],
[
0.8888888888888888,
"#fdca26"
],
[
1,
"#f0f921"
]
],
"type": "histogram2d"
}
],
"histogram2dcontour": [
{
"colorbar": {
"outlinewidth": 0,
"ticks": ""
},
"colorscale": [
[
0,
"#0d0887"
],
[
0.1111111111111111,
"#46039f"
],
[
0.2222222222222222,
"#7201a8"
],
[
0.3333333333333333,
"#9c179e"
],
[
0.4444444444444444,
"#bd3786"
],
[
0.5555555555555556,
"#d8576b"
],
[
0.6666666666666666,
"#ed7953"
],
[
0.7777777777777778,
"#fb9f3a"
],
[
0.8888888888888888,
"#fdca26"
],
[
1,
"#f0f921"
]
],
"type": "histogram2dcontour"
}
],
"mesh3d": [
{
"colorbar": {
"outlinewidth": 0,
"ticks": ""
},
"type": "mesh3d"
}
],
"parcoords": [
{
"line": {
"colorbar": {
"outlinewidth": 0,
"ticks": ""
}
},
"type": "parcoords"
}
],
"pie": [
{
"automargin": true,
"type": "pie"
}
],
"scatter": [
{
"marker": {
"colorbar": {
"outlinewidth": 0,
"ticks": ""
}
},
"type": "scatter"
}
],
"scatter3d": [
{
"line": {
"colorbar": {
"outlinewidth": 0,
"ticks": ""
}
},
"marker": {
"colorbar": {
"outlinewidth": 0,
"ticks": ""
}
},
"type": "scatter3d"
}
],
"scattercarpet": [
{
"marker": {
"colorbar": {
"outlinewidth": 0,
"ticks": ""
}
},
"type": "scattercarpet"
}
],
"scattergeo": [
{
"marker": {
"colorbar": {
"outlinewidth": 0,
"ticks": ""
}
},
"type": "scattergeo"
}
],
"scattergl": [
{
"marker": {
"colorbar": {
"outlinewidth": 0,
"ticks": ""
}
},
"type": "scattergl"
}
],
"scattermapbox": [
{
"marker": {
"colorbar": {
"outlinewidth": 0,
"ticks": ""
}
},
"type": "scattermapbox"
}
],
"scatterpolar": [
{
"marker": {
"colorbar": {
"outlinewidth": 0,
"ticks": ""
}
},
"type": "scatterpolar"
}
],
"scatterpolargl": [
{
"marker": {
"colorbar": {
"outlinewidth": 0,
"ticks": ""
}
},
"type": "scatterpolargl"
}
],
"scatterternary": [
{
"marker": {
"colorbar": {
"outlinewidth": 0,
"ticks": ""
}
},
"type": "scatterternary"
}
],
"surface": [
{
"colorbar": {
"outlinewidth": 0,
"ticks": ""
},
"colorscale": [
[
0,
"#0d0887"
],
[
0.1111111111111111,
"#46039f"
],
[
0.2222222222222222,
"#7201a8"
],
[
0.3333333333333333,
"#9c179e"
],
[
0.4444444444444444,
"#bd3786"
],
[
0.5555555555555556,
"#d8576b"
],
[
0.6666666666666666,
"#ed7953"
],
[
0.7777777777777778,
"#fb9f3a"
],
[
0.8888888888888888,
"#fdca26"
],
[
1,
"#f0f921"
]
],
"type": "surface"
}
],
"table": [
{
"cells": {
"fill": {
"color": "#EBF0F8"
},
"line": {
"color": "white"
}
},
"header": {
"fill": {
"color": "#C8D4E3"
},
"line": {
"color": "white"
}
},
"type": "table"
}
]
},
"layout": {
"annotationdefaults": {
"arrowcolor": "#2a3f5f",
"arrowhead": 0,
"arrowwidth": 1
},
"autotypenumbers": "strict",
"coloraxis": {
"colorbar": {
"outlinewidth": 0,
"ticks": ""
}
},
"colorscale": {
"diverging": [
[
0,
"#8e0152"
],
[
0.1,
"#c51b7d"
],
[
0.2,
"#de77ae"
],
[
0.3,
"#f1b6da"
],
[
0.4,
"#fde0ef"
],
[
0.5,
"#f7f7f7"
],
[
0.6,
"#e6f5d0"
],
[
0.7,
"#b8e186"
],
[
0.8,
"#7fbc41"
],
[
0.9,
"#4d9221"
],
[
1,
"#276419"
]
],
"sequential": [
[
0,
"#0d0887"
],
[
0.1111111111111111,
"#46039f"
],
[
0.2222222222222222,
"#7201a8"
],
[
0.3333333333333333,
"#9c179e"
],
[
0.4444444444444444,
"#bd3786"
],
[
0.5555555555555556,
"#d8576b"
],
[
0.6666666666666666,
"#ed7953"
],
[
0.7777777777777778,
"#fb9f3a"
],
[
0.8888888888888888,
"#fdca26"
],
[
1,
"#f0f921"
]
],
"sequentialminus": [
[
0,
"#0d0887"
],
[
0.1111111111111111,
"#46039f"
],
[
0.2222222222222222,
"#7201a8"
],
[
0.3333333333333333,
"#9c179e"
],
[
0.4444444444444444,
"#bd3786"
],
[
0.5555555555555556,
"#d8576b"
],
[
0.6666666666666666,
"#ed7953"
],
[
0.7777777777777778,
"#fb9f3a"
],
[
0.8888888888888888,
"#fdca26"
],
[
1,
"#f0f921"
]
]
},
"colorway": [
"#636efa",
"#EF553B",
"#00cc96",
"#ab63fa",
"#FFA15A",
"#19d3f3",
"#FF6692",
"#B6E880",
"#FF97FF",
"#FECB52"
],
"font": {
"color": "#2a3f5f"
},
"geo": {
"bgcolor": "white",
"lakecolor": "white",
"landcolor": "#E5ECF6",
"showlakes": true,
"showland": true,
"subunitcolor": "white"
},
"hoverlabel": {
"align": "left"
},
"hovermode": "closest",
"mapbox": {
"style": "light"
},
"paper_bgcolor": "white",
"plot_bgcolor": "#E5ECF6",
"polar": {
"angularaxis": {
"gridcolor": "white",
"linecolor": "white",
"ticks": ""
},
"bgcolor": "#E5ECF6",
"radialaxis": {
"gridcolor": "white",
"linecolor": "white",
"ticks": ""
}
},
"scene": {
"xaxis": {
"backgroundcolor": "#E5ECF6",
"gridcolor": "white",
"gridwidth": 2,
"linecolor": "white",
"showbackground": true,
"ticks": "",
"zerolinecolor": "white"
},
"yaxis": {
"backgroundcolor": "#E5ECF6",
"gridcolor": "white",
"gridwidth": 2,
"linecolor": "white",
"showbackground": true,
"ticks": "",
"zerolinecolor": "white"
},
"zaxis": {
"backgroundcolor": "#E5ECF6",
"gridcolor": "white",
"gridwidth": 2,
"linecolor": "white",
"showbackground": true,
"ticks": "",
"zerolinecolor": "white"
}
},
"shapedefaults": {
"line": {
"color": "#2a3f5f"
}
},
"ternary": {
"aaxis": {
"gridcolor": "white",
"linecolor": "white",
"ticks": ""
},
"baxis": {
"gridcolor": "white",
"linecolor": "white",
"ticks": ""
},
"bgcolor": "#E5ECF6",
"caxis": {
"gridcolor": "white",
"linecolor": "white",
"ticks": ""
}
},
"title": {
"x": 0.05
},
"xaxis": {
"automargin": true,
"gridcolor": "white",
"linecolor": "white",
"ticks": "",
"title": {
"standoff": 15
},
"zerolinecolor": "white",
"zerolinewidth": 2
},
"yaxis": {
"automargin": true,
"gridcolor": "white",
"linecolor": "white",
"ticks": "",
"title": {
"standoff": 15
},
"zerolinecolor": "white",
"zerolinewidth": 2
}
}
},
"title": {
"text": "Country coverage"
},
"xaxis": {
"tickangle": 45,
"tickfont": {
"size": 12
}
}
}
},
"text/html": [
"<div> <div id=\"3e2361db-b571-4e06-aad9-b7257a0b43f2\" class=\"plotly-graph-div\" style=\"height:525px; width:100%;\"></div> <script type=\"text/javascript\"> require([\"plotly\"], function(Plotly) { window.PLOTLYENV=window.PLOTLYENV || {}; if (document.getElementById(\"3e2361db-b571-4e06-aad9-b7257a0b43f2\")) { Plotly.newPlot( \"3e2361db-b571-4e06-aad9-b7257a0b43f2\", [{\"name\": \"re3data\", \"type\": \"bar\", \"x\": [\"USA\", \"DEU\", \"CAN\", \"GBR\", \"EEC\", \"AAA\", \"FRA\", \"AUS\", \"CHE\", \"JPN\", \"NLD\", \"ESP\", \"IND\", \"CHN\", \"ITA\", \"AUT\", \"NOR\", \"SWE\", \"BEL\", \"DNK\", \"POL\", \"RUS\", \"GRC\", \"ZAF\", \"CZE\", \"IRL\", \"MEX\", \"BRA\", \"TWN\", \"FIN\", \"PRT\", \"NZL\", \"EST\", \"KOR\", \"COL\", \"SRB\", \"LTU\", \"ARG\", \"SGP\", \"HUN\", \"ISR\", \"TUR\", \"SVN\", \"ISL\", \"KEN\", \"UKR\", \"ROU\", \"IDN\", \"LUX\", \"SVK\", \"HKG\", \"PER\", \"PAK\", \"LVA\", \"GRL\", \"THA\", \"CHL\", \"BEN\", \"PAN\", \"CMR\", \"CYP\", \"MKD\", \"SDN\", \"HRV\", \"BFA\", \"TUN\", \"CIV\", \"GHA\", \"SEN\", \"PYF\", \"PHL\", \"NCL\", \"NAM\", \"LBN\", \"KAZ\", \"FJI\", \"AZE\", \"LKA\"], \"y\": [2690, 1040, 573, 514, 349, 294, 233, 215, 118, 113, 111, 88, 79, 74, 62, 54, 52, 39, 39, 38, 33, 33, 31, 22, 21, 21, 18, 17, 16, 15, 15, 15, 14, 14, 13, 11, 11, 9, 9, 9, 8, 7, 7, 6, 6, 4, 4, 4, 4, 4, 4, 3, 3, 3, 3, 3, 3, 2, 2, 2, 2, 2, 2, 2, 2, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1]}, {\"name\": \"openDOAR\", \"type\": \"bar\", \"visible\": \"legendonly\", \"x\": [\"USA\", \"JPN\", \"GBR\", \"DEU\", \"ESP\", \"PER\", \"TUR\", \"IDN\", \"FRA\", \"BRA\", \"HRV\", \"ITA\", \"POL\", \"UKR\", \"CAN\", \"IND\", \"COL\", \"AUS\", \"NLD\", \"ARG\", \"NOR\", \"CHN\", \"PRT\", \"TWN\", \"MEX\", \"SWE\", \"RUS\", \"AUT\", \"HUN\", \"ZAF\", \"SRB\", \"KEN\", \"KOR\", \"GRC\", \"ECU\", \"BLR\", \"CHE\", \"BEL\", \"NGA\", \"IRL\", \"CHL\", \"CZE\", \"MYS\", \"FIN\", \"DZA\", \"NZL\", \"LTU\", \"IRN\", \"THA\", \"VEN\", \"LKA\", \"DNK\", \"BGD\", \"TZA\", \"CUB\", 
\"KAZ\", \"SVN\", \"MDA\", \"SDN\", \"UGA\", \"SAU\", \"NIC\", \"ZWE\", \"BGR\", \"CRI\", \"HKG\", \"SLV\", \"PHL\", \"URY\", \"EST\", \"EGY\", \"SGP\", \"PSE\", \"CYP\", \"JAM\", \"GHA\", \"ROU\", \"PAN\", \"LVA\", \"MKD\", \"ETH\", \"PAK\", \"SVK\", \"SEN\", \"HND\", \"ISL\", \"DOM\", \"LUX\", \"MMR\", \"ARE\", \"MAR\", \"BWA\", \"LBY\", \"GEO\", \"LBN\", \"ZMB\", \"IRQ\", \"ARM\", \"AZE\", \"RWA\", \"LSO\", \"MOZ\", \"PRY\", \"BIH\", \"TUN\", \"BOL\", \"FJI\", \"NAM\", \"CPV\", \"UMI\", \"VNM\", \"TTO\", \"AFG\", \"SOM\", \"QAT\", \"PRI\", \"NPL\", \"NCL\", \"MWI\", \"MLT\", \"LAO\", \"ALA\", \"KGZ\", \"GTM\", \"GLP\", \"CMR\", \"AND\", \"ALB\", \"KWT\"], \"y\": [910, 682, 315, 280, 175, 162, 161, 156, 154, 151, 148, 141, 124, 105, 99, 98, 97, 91, 75, 72, 67, 60, 60, 60, 50, 50, 48, 46, 44, 44, 44, 43, 41, 38, 37, 37, 35, 33, 30, 30, 27, 26, 25, 22, 20, 19, 18, 18, 17, 16, 16, 15, 15, 14, 14, 12, 12, 12, 12, 11, 11, 11, 11, 11, 10, 9, 9, 9, 9, 8, 8, 7, 7, 6, 6, 6, 6, 6, 5, 5, 5, 4, 4, 4, 4, 4, 4, 4, 3, 3, 3, 3, 3, 3, 3, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1]}, {\"name\": \"ROAR\", \"type\": \"bar\", \"visible\": \"legendonly\", \"x\": [\"USA\", \"GBR\", \"DEU\", \"JPN\", \"ESP\", \"BRA\", \"TUR\", \"IDN\", \"PER\", \"POL\", \"IND\", \"COL\", \"UKR\", \"FRA\", \"CAN\", \"ITA\", \"CHN\", \"AUS\", \"TWN\", \"SWE\", \"RUS\", \"ARG\", \"PRT\", \"NOR\", \"KOR\", \"MEX\", \"ZAF\", \"NLD\", \"HUN\", \"MYS\", \"GRC\", \"SRB\", \"BEL\", \"BLR\", \"ECU\", \"CHE\", \"KEN\", \"CHL\", \"IRL\", \"AUT\", \"VEN\", \"FIN\", \"NZL\", \"ROU\", \"DNK\", \"CZE\", \"IRN\", \"MDA\", \"NGA\", \"DZA\", \"CUB\", \"THA\", \"SLV\", \"SDN\", \"PHL\", \"ZWE\", \"EGY\", \"LTU\", \"BGD\", \"BGR\", \"KAZ\", \"SVN\", \"HKG\", \"CRI\", \"SAU\", \"TZA\", \"CYP\", \"URY\", \"NIC\", \"UGA\", \"SGP\", \"HRV\", \"PSE\", \"GHA\", \"PAK\", \"EST\", \"AZE\", \"LVA
" \n",
"var gd = document.getElementById('3e2361db-b571-4e06-aad9-b7257a0b43f2');\n",
"var x = new MutationObserver(function (mutations, observer) {{\n",
" var display = window.getComputedStyle(gd).display;\n",
" if (!display || display === 'none') {{\n",
" console.log([gd, 'removed!']);\n",
" Plotly.purge(gd);\n",
" observer.disconnect();\n",
" }}\n",
"}});\n",
"\n",
"// Listen for the removal of the full notebook cells\n",
"var notebookContainer = gd.closest('#notebook-container');\n",
"if (notebookContainer) {{\n",
" x.observe(notebookContainer, {childList: true});\n",
"}}\n",
"\n",
"// Listen for the clearing of the current output cell\n",
"var outputEl = gd.closest('.output');\n",
"if (outputEl) {{\n",
" x.observe(outputEl, {childList: true});\n",
"}}\n",
"\n",
" }) }; }); </script> </div>"
]
},
"metadata": {},
"output_type": "display_data"
}
],
"source": [
"# One entry per registry: (legend label, frame, country column, id column).\n",
"country_sources = [\n",
"    ('re3data', re3data_institutions, 'org_country', 're3data_id'),\n",
"    ('openDOAR', opendoar_institutions, 'org_country', 'opendoar_id'),\n",
"    ('ROAR', roar_df, 'location_country', 'eprintid'),\n",
"    ('FAIRsharing', fairsharing_countries, 'countrycode', 'url'),\n",
"]\n",
"\n",
"plot = []\n",
"for position, (label, frame, country_col, id_col) in enumerate(country_sources):\n",
"    # Number of non-null ids per country, largest first.\n",
"    counts = frame.groupby(country_col)[[id_col]].count().sort_values(id_col, ascending=False)\n",
"    trace_options = dict(x=counts.index, y=counts[id_col], name=label)\n",
"    if position > 0:\n",
"        # Only the first registry is drawn initially; the others are toggled from the legend.\n",
"        trace_options['visible'] = 'legendonly'\n",
"    plot.append(go.Bar(**trace_options))\n",
"\n",
"layout = go.Layout(\n",
"    title='Country coverage',\n",
"    xaxis=dict(tickangle=45, tickfont=dict(size=12))\n",
")\n",
"\n",
"go.Figure(plot, layout).show()"
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"### Continental coverage"
]
},
{
"cell_type": "code",
"execution_count": 36,
"metadata": {},
"outputs": [
{
"data": {
"application/vnd.plotly.v1+json": {
"config": {
"plotlyServerURL": "https://plot.ly"
},
"data": [
{
"fill": "toself",
"name": "re3data",
"r": [
41,
341,
2987,
3286,
233,
45
],
"theta": [
"AF",
"AS",
"EU",
"NA",
"OC",
"SA"
],
"type": "scatterpolar"
},
{
"fill": "toself",
"name": "OpenDOAR",
"r": [
234,
1439,
2207,
1128,
113,
575
],
"theta": [
"AF",
"AS",
"EU",
"NA",
"OC",
"SA"
],
"type": "scatterpolar"
},
{
"fill": "toself",
"name": "ROAR",
"r": [
190,
1069,
1877,
1078,
107,
603
],
"theta": [
"AF",
"AS",
"EU",
"NA",
"OC",
"SA"
],
"type": "scatterpolar"
},
{
"fill": "toself",
"name": "FAIRsharing",
"r": [
27,
320,
2176,
787,
70,
14
],
"theta": [
"AF",
"AS",
"EU",
"NA",
"OC",
"SA"
],
"type": "scatterpolar"
}
],
"layout": {
"polar": {
"radialaxis": {
"visible": true
}
},
"template": {
"data": {
"bar": [
{
"error_x": {
"color": "#2a3f5f"
},
"error_y": {
"color": "#2a3f5f"
},
"marker": {
"line": {
"color": "#E5ECF6",
"width": 0.5
}
},
"type": "bar"
}
],
"barpolar": [
{
"marker": {
"line": {
"color": "#E5ECF6",
"width": 0.5
}
},
"type": "barpolar"
}
],
"carpet": [
{
"aaxis": {
"endlinecolor": "#2a3f5f",
"gridcolor": "white",
"linecolor": "white",
"minorgridcolor": "white",
"startlinecolor": "#2a3f5f"
},
"baxis": {
"endlinecolor": "#2a3f5f",
"gridcolor": "white",
"linecolor": "white",
"minorgridcolor": "white",
"startlinecolor": "#2a3f5f"
},
"type": "carpet"
}
],
"choropleth": [
{
"colorbar": {
"outlinewidth": 0,
"ticks": ""
},
"type": "choropleth"
}
],
"contour": [
{
"colorbar": {
"outlinewidth": 0,
"ticks": ""
},
"colorscale": [
[
0,
"#0d0887"
],
[
0.1111111111111111,
"#46039f"
],
[
0.2222222222222222,
"#7201a8"
],
[
0.3333333333333333,
"#9c179e"
],
[
0.4444444444444444,
"#bd3786"
],
[
0.5555555555555556,
"#d8576b"
],
[
0.6666666666666666,
"#ed7953"
],
[
0.7777777777777778,
"#fb9f3a"
],
[
0.8888888888888888,
"#fdca26"
],
[
1,
"#f0f921"
]
],
"type": "contour"
}
],
"contourcarpet": [
{
"colorbar": {
"outlinewidth": 0,
"ticks": ""
},
"type": "contourcarpet"
}
],
"heatmap": [
{
"colorbar": {
"outlinewidth": 0,
"ticks": ""
},
"colorscale": [
[
0,
"#0d0887"
],
[
0.1111111111111111,
"#46039f"
],
[
0.2222222222222222,
"#7201a8"
],
[
0.3333333333333333,
"#9c179e"
],
[
0.4444444444444444,
"#bd3786"
],
[
0.5555555555555556,
"#d8576b"
],
[
0.6666666666666666,
"#ed7953"
],
[
0.7777777777777778,
"#fb9f3a"
],
[
0.8888888888888888,
"#fdca26"
],
[
1,
"#f0f921"
]
],
"type": "heatmap"
}
],
"heatmapgl": [
{
"colorbar": {
"outlinewidth": 0,
"ticks": ""
},
"colorscale": [
[
0,
"#0d0887"
],
[
0.1111111111111111,
"#46039f"
],
[
0.2222222222222222,
"#7201a8"
],
[
0.3333333333333333,
"#9c179e"
],
[
0.4444444444444444,
"#bd3786"
],
[
0.5555555555555556,
"#d8576b"
],
[
0.6666666666666666,
"#ed7953"
],
[
0.7777777777777778,
"#fb9f3a"
],
[
0.8888888888888888,
"#fdca26"
],
[
1,
"#f0f921"
]
],
"type": "heatmapgl"
}
],
"histogram": [
{
"marker": {
"colorbar": {
"outlinewidth": 0,
"ticks": ""
}
},
"type": "histogram"
}
],
"histogram2d": [
{
"colorbar": {
"outlinewidth": 0,
"ticks": ""
},
"colorscale": [
[
0,
"#0d0887"
],
[
0.1111111111111111,
"#46039f"
],
[
0.2222222222222222,
"#7201a8"
],
[
0.3333333333333333,
"#9c179e"
],
[
0.4444444444444444,
"#bd3786"
],
[
0.5555555555555556,
"#d8576b"
],
[
0.6666666666666666,
"#ed7953"
],
[
0.7777777777777778,
"#fb9f3a"
],
[
0.8888888888888888,
"#fdca26"
],
[
1,
"#f0f921"
]
],
"type": "histogram2d"
}
],
"histogram2dcontour": [
{
"colorbar": {
"outlinewidth": 0,
"ticks": ""
},
"colorscale": [
[
0,
"#0d0887"
],
[
0.1111111111111111,
"#46039f"
],
[
0.2222222222222222,
"#7201a8"
],
[
0.3333333333333333,
"#9c179e"
],
[
0.4444444444444444,
"#bd3786"
],
[
0.5555555555555556,
"#d8576b"
],
[
0.6666666666666666,
"#ed7953"
],
[
0.7777777777777778,
"#fb9f3a"
],
[
0.8888888888888888,
"#fdca26"
],
[
1,
"#f0f921"
]
],
"type": "histogram2dcontour"
}
],
"mesh3d": [
{
"colorbar": {
"outlinewidth": 0,
"ticks": ""
},
"type": "mesh3d"
}
],
"parcoords": [
{
"line": {
"colorbar": {
"outlinewidth": 0,
"ticks": ""
}
},
"type": "parcoords"
}
],
"pie": [
{
"automargin": true,
"type": "pie"
}
],
"scatter": [
{
"marker": {
"colorbar": {
"outlinewidth": 0,
"ticks": ""
}
},
"type": "scatter"
}
],
"scatter3d": [
{
"line": {
"colorbar": {
"outlinewidth": 0,
"ticks": ""
}
},
"marker": {
"colorbar": {
"outlinewidth": 0,
"ticks": ""
}
},
"type": "scatter3d"
}
],
"scattercarpet": [
{
"marker": {
"colorbar": {
"outlinewidth": 0,
"ticks": ""
}
},
"type": "scattercarpet"
}
],
"scattergeo": [
{
"marker": {
"colorbar": {
"outlinewidth": 0,
"ticks": ""
}
},
"type": "scattergeo"
}
],
"scattergl": [
{
"marker": {
"colorbar": {
"outlinewidth": 0,
"ticks": ""
}
},
"type": "scattergl"
}
],
"scattermapbox": [
{
"marker": {
"colorbar": {
"outlinewidth": 0,
"ticks": ""
}
},
"type": "scattermapbox"
}
],
"scatterpolar": [
{
"marker": {
"colorbar": {
"outlinewidth": 0,
"ticks": ""
}
},
"type": "scatterpolar"
}
],
"scatterpolargl": [
{
"marker": {
"colorbar": {
"outlinewidth": 0,
"ticks": ""
}
},
"type": "scatterpolargl"
}
],
"scatterternary": [
{
"marker": {
"colorbar": {
"outlinewidth": 0,
"ticks": ""
}
},
"type": "scatterternary"
}
],
"surface": [
{
"colorbar": {
"outlinewidth": 0,
"ticks": ""
},
"colorscale": [
[
0,
"#0d0887"
],
[
0.1111111111111111,
"#46039f"
],
[
0.2222222222222222,
"#7201a8"
],
[
0.3333333333333333,
"#9c179e"
],
[
0.4444444444444444,
"#bd3786"
],
[
0.5555555555555556,
"#d8576b"
],
[
0.6666666666666666,
"#ed7953"
],
[
0.7777777777777778,
"#fb9f3a"
],
[
0.8888888888888888,
"#fdca26"
],
[
1,
"#f0f921"
]
],
"type": "surface"
}
],
"table": [
{
"cells": {
"fill": {
"color": "#EBF0F8"
},
"line": {
"color": "white"
}
},
"header": {
"fill": {
"color": "#C8D4E3"
},
"line": {
"color": "white"
}
},
"type": "table"
}
]
},
"layout": {
"annotationdefaults": {
"arrowcolor": "#2a3f5f",
"arrowhead": 0,
"arrowwidth": 1
},
"autotypenumbers": "strict",
"coloraxis": {
"colorbar": {
"outlinewidth": 0,
"ticks": ""
}
},
"colorscale": {
"diverging": [
[
0,
"#8e0152"
],
[
0.1,
"#c51b7d"
],
[
0.2,
"#de77ae"
],
[
0.3,
"#f1b6da"
],
[
0.4,
"#fde0ef"
],
[
0.5,
"#f7f7f7"
],
[
0.6,
"#e6f5d0"
],
[
0.7,
"#b8e186"
],
[
0.8,
"#7fbc41"
],
[
0.9,
"#4d9221"
],
[
1,
"#276419"
]
],
"sequential": [
[
0,
"#0d0887"
],
[
0.1111111111111111,
"#46039f"
],
[
0.2222222222222222,
"#7201a8"
],
[
0.3333333333333333,
"#9c179e"
],
[
0.4444444444444444,
"#bd3786"
],
[
0.5555555555555556,
"#d8576b"
],
[
0.6666666666666666,
"#ed7953"
],
[
0.7777777777777778,
"#fb9f3a"
],
[
0.8888888888888888,
"#fdca26"
],
[
1,
"#f0f921"
]
],
"sequentialminus": [
[
0,
"#0d0887"
],
[
0.1111111111111111,
"#46039f"
],
[
0.2222222222222222,
"#7201a8"
],
[
0.3333333333333333,
"#9c179e"
],
[
0.4444444444444444,
"#bd3786"
],
[
0.5555555555555556,
"#d8576b"
],
[
0.6666666666666666,
"#ed7953"
],
[
0.7777777777777778,
"#fb9f3a"
],
[
0.8888888888888888,
"#fdca26"
],
[
1,
"#f0f921"
]
]
},
"colorway": [
"#636efa",
"#EF553B",
"#00cc96",
"#ab63fa",
"#FFA15A",
"#19d3f3",
"#FF6692",
"#B6E880",
"#FF97FF",
"#FECB52"
],
"font": {
"color": "#2a3f5f"
},
"geo": {
"bgcolor": "white",
"lakecolor": "white",
"landcolor": "#E5ECF6",
"showlakes": true,
"showland": true,
"subunitcolor": "white"
},
"hoverlabel": {
"align": "left"
},
"hovermode": "closest",
"mapbox": {
"style": "light"
},
"paper_bgcolor": "white",
"plot_bgcolor": "#E5ECF6",
"polar": {
"angularaxis": {
"gridcolor": "white",
"linecolor": "white",
"ticks": ""
},
"bgcolor": "#E5ECF6",
"radialaxis": {
"gridcolor": "white",
"linecolor": "white",
"ticks": ""
}
},
"scene": {
"xaxis": {
"backgroundcolor": "#E5ECF6",
"gridcolor": "white",
"gridwidth": 2,
"linecolor": "white",
"showbackground": true,
"ticks": "",
"zerolinecolor": "white"
},
"yaxis": {
"backgroundcolor": "#E5ECF6",
"gridcolor": "white",
"gridwidth": 2,
"linecolor": "white",
"showbackground": true,
"ticks": "",
"zerolinecolor": "white"
},
"zaxis": {
"backgroundcolor": "#E5ECF6",
"gridcolor": "white",
"gridwidth": 2,
"linecolor": "white",
"showbackground": true,
"ticks": "",
"zerolinecolor": "white"
}
},
"shapedefaults": {
"line": {
"color": "#2a3f5f"
}
},
"ternary": {
"aaxis": {
"gridcolor": "white",
"linecolor": "white",
"ticks": ""
},
"baxis": {
"gridcolor": "white",
"linecolor": "white",
"ticks": ""
},
"bgcolor": "#E5ECF6",
"caxis": {
"gridcolor": "white",
"linecolor": "white",
"ticks": ""
}
},
"title": {
"x": 0.05
},
"xaxis": {
"automargin": true,
"gridcolor": "white",
"linecolor": "white",
"ticks": "",
"title": {
"standoff": 15
},
"zerolinecolor": "white",
"zerolinewidth": 2
},
"yaxis": {
"automargin": true,
"gridcolor": "white",
"linecolor": "white",
"ticks": "",
"title": {
"standoff": 15
},
"zerolinecolor": "white",
"zerolinewidth": 2
}
}
}
}
},
"text/html": [
"<div> <div id=\"9cbcf419-3870-4cb7-8136-03297410e899\" class=\"plotly-graph-div\" style=\"height:525px; width:100%;\"></div> <script type=\"text/javascript\"> require([\"plotly\"], function(Plotly) { window.PLOTLYENV=window.PLOTLYENV || {}; if (document.getElementById(\"9cbcf419-3870-4cb7-8136-03297410e899\")) { Plotly.newPlot( \"9cbcf419-3870-4cb7-8136-03297410e899\", [{\"fill\": \"toself\", \"name\": \"re3data\", \"r\": [41, 341, 2987, 3286, 233, 45], \"theta\": [\"AF\", \"AS\", \"EU\", \"NA\", \"OC\", \"SA\"], \"type\": \"scatterpolar\"}, {\"fill\": \"toself\", \"name\": \"OpenDOAR\", \"r\": [234, 1439, 2207, 1128, 113, 575], \"theta\": [\"AF\", \"AS\", \"EU\", \"NA\", \"OC\", \"SA\"], \"type\": \"scatterpolar\"}, {\"fill\": \"toself\", \"name\": \"ROAR\", \"r\": [190, 1069, 1877, 1078, 107, 603], \"theta\": [\"AF\", \"AS\", \"EU\", \"NA\", \"OC\", \"SA\"], \"type\": \"scatterpolar\"}, {\"fill\": \"toself\", \"name\": \"FAIRsharing\", \"r\": [27, 320, 2176, 787, 70, 14], \"theta\": [\"AF\", \"AS\", \"EU\", \"NA\", \"OC\", \"SA\"], \"type\": \"scatterpolar\"}], {\"polar\": {\"radialaxis\": {\"visible\": true}}, \"template\": {\"data\": {\"bar\": [{\"error_x\": {\"color\": \"#2a3f5f\"}, \"error_y\": {\"color\": \"#2a3f5f\"}, \"marker\": {\"line\": {\"color\": \"#E5ECF6\", \"width\": 0.5}}, \"type\": \"bar\"}], \"barpolar\": [{\"marker\": {\"line\": {\"color\": \"#E5ECF6\", \"width\": 0.5}}, \"type\": \"barpolar\"}], \"carpet\": [{\"aaxis\": {\"endlinecolor\": \"#2a3f5f\", \"gridcolor\": \"white\", \"linecolor\": \"white\", \"minorgridcolor\": \"white\", \"startlinecolor\": \"#2a3f5f\"}, \"baxis\": {\"endlinecolor\": \"#2a3f5f\", \"gridcolor\": \"white\", \"linecolor\": \"white\", \"minorgridcolor\": \"white\", \"startlinecolor\": \"#2a3f5f\"}, \"type\": \"carpet\"}], \"choropleth\": [{\"colorbar\": {\"outlinewidth\": 0, \"ticks\": \"\"}, \"type\": \"choropleth\"}], \"contour\": [{\"colorbar\": {\"outlinewidth\": 0, \"ticks\": \"\"}, \"colorscale\": [[0.0, 
\"#0d0887\"], [0.1111111111111111, \"#46039f\"], [0.2222222222222222, \"#7201a8\"], [0.3333333333333333, \"#9c179e\"], [0.4444444444444444, \"#bd3786\"], [0.5555555555555556, \"#d8576b\"], [0.6666666666666666, \"#ed7953\"], [0.7777777777777778, \"#fb9f3a\"], [0.8888888888888888, \"#fdca26\"], [1.0, \"#f0f921\"]], \"type\": \"contour\"}], \"contourcarpet\": [{\"colorbar\": {\"outlinewidth\": 0, \"ticks\": \"\"}, \"type\": \"contourcarpet\"}], \"heatmap\": [{\"colorbar\": {\"outlinewidth\": 0, \"ticks\": \"\"}, \"colorscale\": [[0.0, \"#0d0887\"], [0.1111111111111111, \"#46039f\"], [0.2222222222222222, \"#7201a8\"], [0.3333333333333333, \"#9c179e\"], [0.4444444444444444, \"#bd3786\"], [0.5555555555555556, \"#d8576b\"], [0.6666666666666666, \"#ed7953\"], [0.7777777777777778, \"#fb9f3a\"], [0.8888888888888888, \"#fdca26\"], [1.0, \"#f0f921\"]], \"type\": \"heatmap\"}], \"heatmapgl\": [{\"colorbar\": {\"outlinewidth\": 0, \"ticks\": \"\"}, \"colorscale\": [[0.0, \"#0d0887\"], [0.1111111111111111, \"#46039f\"], [0.2222222222222222, \"#7201a8\"], [0.3333333333333333, \"#9c179e\"], [0.4444444444444444, \"#bd3786\"], [0.5555555555555556, \"#d8576b\"], [0.6666666666666666, \"#ed7953\"], [0.7777777777777778, \"#fb9f3a\"], [0.8888888888888888, \"#fdca26\"], [1.0, \"#f0f921\"]], \"type\": \"heatmapgl\"}], \"histogram\": [{\"marker\": {\"colorbar\": {\"outlinewidth\": 0, \"ticks\": \"\"}}, \"type\": \"histogram\"}], \"histogram2d\": [{\"colorbar\": {\"outlinewidth\": 0, \"ticks\": \"\"}, \"colorscale\": [[0.0, \"#0d0887\"], [0.1111111111111111, \"#46039f\"], [0.2222222222222222, \"#7201a8\"], [0.3333333333333333, \"#9c179e\"], [0.4444444444444444, \"#bd3786\"], [0.5555555555555556, \"#d8576b\"], [0.6666666666666666, \"#ed7953\"], [0.7777777777777778, \"#fb9f3a\"], [0.8888888888888888, \"#fdca26\"], [1.0, \"#f0f921\"]], \"type\": \"histogram2d\"}], \"histogram2dcontour\": [{\"colorba
" \n",
"var gd = document.getElementById('9cbcf419-3870-4cb7-8136-03297410e899');\n",
"var x = new MutationObserver(function (mutations, observer) {{\n",
" var display = window.getComputedStyle(gd).display;\n",
" if (!display || display === 'none') {{\n",
" console.log([gd, 'removed!']);\n",
" Plotly.purge(gd);\n",
" observer.disconnect();\n",
" }}\n",
"}});\n",
"\n",
"// Listen for the removal of the full notebook cells\n",
"var notebookContainer = gd.closest('#notebook-container');\n",
"if (notebookContainer) {{\n",
" x.observe(notebookContainer, {childList: true});\n",
"}}\n",
"\n",
"// Listen for the clearing of the current output cell\n",
"var outputEl = gd.closest('.output');\n",
"if (outputEl) {{\n",
" x.observe(outputEl, {childList: true});\n",
"}}\n",
"\n",
" }) }; }); </script> </div>"
]
},
"metadata": {},
"output_type": "display_data"
}
],
"source": [
"# Radar chart: number of entries per continent, one filled polygon per registry.\n",
"# Each tuple is (legend name, table, continent column, identifier column to count).\n",
"registry_sources = [\n",
"    ('re3data', re3data_institutions, 'org_continent', 're3data_id'),\n",
"    ('OpenDOAR', opendoar_institutions, 'org_continent', 'opendoar_id'),\n",
"    ('ROAR', roar_df, 'continent', 'eprintid'),\n",
"    ('FAIRsharing', fairsharing_countries, 'continent', 'url'),\n",
"]\n",
"\n",
"continent_traces = []\n",
"for registry_name, table, continent_col, id_col in registry_sources:\n",
"    # Non-null identifiers per continent; the continent codes become the index.\n",
"    per_continent = table.groupby(continent_col)[id_col].count()\n",
"    continent_traces.append(\n",
"        go.Scatterpolar(\n",
"            r=per_continent,\n",
"            theta=per_continent.index,\n",
"            fill='toself',\n",
"            name=registry_name,\n",
"        )\n",
"    )\n",
"\n",
"# Keep the radial axis (count scale) visible.\n",
"radar_layout = go.Layout(polar={'radialaxis': {'visible': True}})\n",
"\n",
"go.Figure(data=continent_traces, layout=radar_layout).show()"
]
},
{
"cell_type": "code",
"execution_count": null,
"metadata": {},
"outputs": [],
"source": []
}
],
"metadata": {
"kernelspec": {
"display_name": "Python 3",
"language": "python",
"name": "python3"
},
"language_info": {
"codemirror_mode": {
"name": "ipython",
"version": 3
},
"file_extension": ".py",
"mimetype": "text/x-python",
"name": "python",
"nbconvert_exporter": "python",
"pygments_lexer": "ipython3",
"version": "3.8.3"
}
},
"nbformat": 4,
"nbformat_minor": 4
}