{ "cells": [ { "cell_type": "code", "execution_count": 1, "metadata": {}, "outputs": [], "source": [ "import json\n", "import requests\n", "import ast\n", "\n", "import numpy as np\n", "import pandas as pd\n" ] }, { "cell_type": "code", "execution_count": 2, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", " | url | \n", "head_final_code | \n", "head_url | \n", "head_chain | \n", "head_codes | \n", "head_elapsed | \n", "head_error | \n", "get_final_code | \n", "get_url | \n", "get_chain | \n", "get_codes | \n", "get_elapsed | \n", "get_error | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", "http://sidc.be/silso/home | \n", "200.0 | \n", "https://www.sidc.be/silso/home | \n", "['http://sidc.be/silso/home'] | \n", "[302] | \n", "0.151548 | \n", "NaN | \n", "200.0 | \n", "https://www.sidc.be/silso/home | \n", "['http://sidc.be/silso/home'] | \n", "[302] | \n", "0.145799 | \n", "NaN | \n", "
1 | \n", "https://bmrb.io/ | \n", "200.0 | \n", "https://bmrb.io/ | \n", "[] | \n", "[] | \n", "0.527131 | \n", "NaN | \n", "200.0 | \n", "https://bmrb.io/ | \n", "[] | \n", "[] | \n", "0.487402 | \n", "NaN | \n", "
2 | \n", "http://www.pac.dfo-mpo.gc.ca/science/oceans/da... | \n", "200.0 | \n", "https://www.pac.dfo-mpo.gc.ca/science/oceans/d... | \n", "['http://www.pac.dfo-mpo.gc.ca/science/oceans/... | \n", "[307] | \n", "0.530466 | \n", "NaN | \n", "200.0 | \n", "https://www.pac.dfo-mpo.gc.ca/science/oceans/d... | \n", "['http://www.pac.dfo-mpo.gc.ca/science/oceans/... | \n", "[307] | \n", "0.510097 | \n", "NaN | \n", "
3 | \n", "https://www.cpc.ncep.noaa.gov/ | \n", "200.0 | \n", "https://www.cpc.ncep.noaa.gov/ | \n", "[] | \n", "[] | \n", "0.507708 | \n", "NaN | \n", "200.0 | \n", "https://www.cpc.ncep.noaa.gov/ | \n", "[] | \n", "[] | \n", "0.492151 | \n", "NaN | \n", "
4 | \n", "http://cosmos.bot.kyoto-u.ac.jp/acytodb//cgi-b... | \n", "404.0 | \n", "http://cosmos.bot.kyoto-u.ac.jp/acytodb//cgi-b... | \n", "[] | \n", "[] | \n", "0.586088 | \n", "NaN | \n", "404.0 | \n", "http://cosmos.bot.kyoto-u.ac.jp/acytodb//cgi-b... | \n", "[] | \n", "[] | \n", "0.542670 | \n", "NaN | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
13352 | \n", "http://radar.brookes.ac.uk/radar/access/home.do | \n", "200.0 | \n", "https://radar.brookes.ac.uk/radar/home.do | \n", "['http://radar.brookes.ac.uk/radar/access/home... | \n", "[302, 302, 302] | \n", "0.082406 | \n", "NaN | \n", "200.0 | \n", "https://radar.brookes.ac.uk/radar/home.do | \n", "['http://radar.brookes.ac.uk/radar/access/home... | \n", "[302, 302, 302] | \n", "0.088766 | \n", "NaN | \n", "
13353 | \n", "http://www.ub.uni-siegen.de/opus | \n", "200.0 | \n", "https://www.ub.uni-siegen.de/opus/ | \n", "['http://www.ub.uni-siegen.de/opus', 'https://... | \n", "[301, 301] | \n", "0.056328 | \n", "NaN | \n", "200.0 | \n", "https://www.ub.uni-siegen.de/opus/ | \n", "['http://www.ub.uni-siegen.de/opus', 'https://... | \n", "[301, 301] | \n", "0.039649 | \n", "NaN | \n", "
13354 | \n", "http://numerique.bibliotheque.toulouse.fr/cgi-... | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "HTTPConnectionPool(host='numerique.bibliothequ... | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "HTTPConnectionPool(host='numerique.bibliothequ... | \n", "
13355 | \n", "https://www.utas.edu.au/library | \n", "200.0 | \n", "https://www.utas.edu.au/library | \n", "[] | \n", "[] | \n", "0.223856 | \n", "NaN | \n", "200.0 | \n", "https://www.utas.edu.au/library | \n", "[] | \n", "[] | \n", "0.595001 | \n", "NaN | \n", "
13356 | \n", "http://204.232.200.153:8080/jspui/ | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "HTTPConnectionPool(host='204.232.200.153', por... | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "HTTPConnectionPool(host='204.232.200.153', por... | \n", "
13356 rows × 13 columns
\n", "\n", " | url | \n", "head_final_code | \n", "head_url | \n", "head_chain | \n", "head_codes | \n", "head_elapsed | \n", "head_error | \n", "get_final_code | \n", "get_url | \n", "get_chain | \n", "get_codes | \n", "get_elapsed | \n", "get_error | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|
count | \n", "13356 | \n", "10926.000000 | \n", "10926 | \n", "10926 | \n", "10926 | \n", "10926.000000 | \n", "2430 | \n", "10954.00000 | \n", "10954 | \n", "10954 | \n", "10954 | \n", "10954.000000 | \n", "2402 | \n", "
unique | \n", "13356 | \n", "NaN | \n", "9331 | \n", "4056 | \n", "59 | \n", "NaN | \n", "2299 | \n", "NaN | \n", "9353 | \n", "4082 | \n", "57 | \n", "NaN | \n", "2301 | \n", "
top | \n", "http://sidc.be/silso/home | \n", "NaN | \n", "https://www.unit.no/ugyldig-lenke-til-dokument... | \n", "[] | \n", "[] | \n", "NaN | \n", "('Connection aborted.', RemoteDisconnected('Re... | \n", "NaN | \n", "https://www.unit.no/ugyldig-lenke-til-dokument... | \n", "[] | \n", "[] | \n", "NaN | \n", "('Connection aborted.', RemoteDisconnected('Re... | \n", "
freq | \n", "1 | \n", "NaN | \n", "16 | \n", "6596 | \n", "6596 | \n", "NaN | \n", "34 | \n", "NaN | \n", "16 | \n", "6595 | \n", "6595 | \n", "NaN | \n", "22 | \n", "
mean | \n", "NaN | \n", "218.406736 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "1.124777 | \n", "NaN | \n", "215.73407 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "1.125515 | \n", "NaN | \n", "
std | \n", "NaN | \n", "61.035428 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "3.103610 | \n", "NaN | \n", "56.89142 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "3.184153 | \n", "NaN | \n", "
min | \n", "NaN | \n", "200.000000 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "0.013261 | \n", "NaN | \n", "200.00000 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "0.013800 | \n", "NaN | \n", "
25% | \n", "NaN | \n", "200.000000 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "0.276535 | \n", "NaN | \n", "200.00000 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "0.254967 | \n", "NaN | \n", "
50% | \n", "NaN | \n", "200.000000 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "0.583665 | \n", "NaN | \n", "200.00000 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "0.527238 | \n", "NaN | \n", "
75% | \n", "NaN | \n", "200.000000 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "1.059370 | \n", "NaN | \n", "200.00000 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "0.944213 | \n", "NaN | \n", "
max | \n", "NaN | \n", "504.000000 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "61.235589 | \n", "NaN | \n", "504.00000 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "61.500941 | \n", "NaN | \n", "
\n", " | url | \n", "
---|---|
head_final_code | \n", "\n", " |
200.0 | \n", "9976 | \n", "
201.0 | \n", "19 | \n", "
400.0 | \n", "19 | \n", "
401.0 | \n", "14 | \n", "
403.0 | \n", "205 | \n", "
404.0 | \n", "489 | \n", "
405.0 | \n", "50 | \n", "
406.0 | \n", "20 | \n", "
410.0 | \n", "15 | \n", "
412.0 | \n", "1 | \n", "
419.0 | \n", "1 | \n", "
429.0 | \n", "1 | \n", "
444.0 | \n", "1 | \n", "
500.0 | \n", "47 | \n", "
501.0 | \n", "3 | \n", "
502.0 | \n", "15 | \n", "
503.0 | \n", "49 | \n", "
504.0 | \n", "1 | \n", "
\n", " | url | \n", "head_final_code | \n", "
---|---|---|
class | \n", "\n", " | \n", " |
200.0 | \n", "9995 | \n", "9995 | \n", "
400.0 | \n", "816 | \n", "816 | \n", "
500.0 | \n", "115 | \n", "115 | \n", "
\n", " | url | \n", "head_final_code | \n", "
---|---|---|
class | \n", "\n", " | \n", " |
200.0 | \n", "74.835280 | \n", "74.835280 | \n", "
400.0 | \n", "6.109614 | \n", "6.109614 | \n", "
500.0 | \n", "0.861036 | \n", "0.861036 | \n", "
\n", " | url | \n", "
---|---|
get_final_code | \n", "\n", " |
200.0 | \n", "10139 | \n", "
201.0 | \n", "19 | \n", "
400.0 | \n", "8 | \n", "
401.0 | \n", "13 | \n", "
403.0 | \n", "168 | \n", "
404.0 | \n", "464 | \n", "
405.0 | \n", "1 | \n", "
406.0 | \n", "21 | \n", "
410.0 | \n", "15 | \n", "
412.0 | \n", "1 | \n", "
419.0 | \n", "1 | \n", "
429.0 | \n", "1 | \n", "
444.0 | \n", "1 | \n", "
500.0 | \n", "40 | \n", "
502.0 | \n", "13 | \n", "
503.0 | \n", "48 | \n", "
504.0 | \n", "1 | \n", "
\n", " | url | \n", "get_final_code | \n", "
---|---|---|
class | \n", "\n", " | \n", " |
200.0 | \n", "10158 | \n", "10158 | \n", "
400.0 | \n", "694 | \n", "694 | \n", "
500.0 | \n", "102 | \n", "102 | \n", "
\n", " | url | \n", "get_final_code | \n", "
---|---|---|
class | \n", "\n", " | \n", " |
200.0 | \n", "76.055705 | \n", "76.055705 | \n", "
400.0 | \n", "5.196167 | \n", "5.196167 | \n", "
500.0 | \n", "0.763702 | \n", "0.763702 | \n", "
\n", " | url | \n", "head_error | \n", "
---|---|---|
10 | \n", "https://isoarch.eu/ | \n", "HTTPSConnectionPool(host='isoarch.eu', port=44... | \n", "
13 | \n", "https://www.chinare.org.cn/en/ | \n", "HTTPSConnectionPool(host='www.chinare.org.cn',... | \n", "
26 | \n", "http://www.flyrnai.org/ | \n", "HTTPSConnectionPool(host='www.flyrnai.org', po... | \n", "
71 | \n", "http://alternaria.vbi.vt.edu/index.html | \n", "HTTPConnectionPool(host='alternaria.vbi.vt.edu... | \n", "
83 | \n", "http://www.pazar.info/ | \n", "HTTPConnectionPool(host='www.pazar.info', port... | \n", "
... | \n", "... | \n", "... | \n", "
13344 | \n", "http://intranet.thomasdanby.ac.uk/dspace/ | \n", "HTTPConnectionPool(host='intranet.thomasdanby.... | \n", "
13345 | \n", "http://dspace.dgsca.unam.mx:8080/dspace/ | \n", "HTTPConnectionPool(host='dspace.dgsca.unam.mx'... | \n", "
13347 | \n", "https://library.for.nau.edu:8443/ | \n", "HTTPSConnectionPool(host='library.for.nau.edu'... | \n", "
13354 | \n", "http://numerique.bibliotheque.toulouse.fr/cgi-... | \n", "HTTPConnectionPool(host='numerique.bibliothequ... | \n", "
13356 | \n", "http://204.232.200.153:8080/jspui/ | \n", "HTTPConnectionPool(host='204.232.200.153', por... | \n", "
2242 rows × 2 columns
\n", "\n", " | url | \n", "get_error | \n", "
---|---|---|
10 | \n", "https://isoarch.eu/ | \n", "HTTPSConnectionPool(host='isoarch.eu', port=44... | \n", "
13 | \n", "https://www.chinare.org.cn/en/ | \n", "HTTPSConnectionPool(host='www.chinare.org.cn',... | \n", "
26 | \n", "http://www.flyrnai.org/ | \n", "HTTPSConnectionPool(host='www.flyrnai.org', po... | \n", "
57 | \n", "http://stellabase.org | \n", "HTTPConnectionPool(host='cnidarians.bu.edu', p... | \n", "
71 | \n", "http://alternaria.vbi.vt.edu/index.html | \n", "HTTPConnectionPool(host='alternaria.vbi.vt.edu... | \n", "
... | \n", "... | \n", "... | \n", "
13344 | \n", "http://intranet.thomasdanby.ac.uk/dspace/ | \n", "HTTPConnectionPool(host='intranet.thomasdanby.... | \n", "
13345 | \n", "http://dspace.dgsca.unam.mx:8080/dspace/ | \n", "HTTPConnectionPool(host='dspace.dgsca.unam.mx'... | \n", "
13347 | \n", "https://library.for.nau.edu:8443/ | \n", "HTTPSConnectionPool(host='library.for.nau.edu'... | \n", "
13354 | \n", "http://numerique.bibliotheque.toulouse.fr/cgi-... | \n", "HTTPConnectionPool(host='numerique.bibliothequ... | \n", "
13356 | \n", "http://204.232.200.153:8080/jspui/ | \n", "HTTPConnectionPool(host='204.232.200.153', por... | \n", "
2256 rows × 2 columns
\n", "\n", " | url | \n", "head_error | \n", "
---|---|---|
485 | \n", "https://idr.openmicroscopy.org | \n", "Exceeded 30 redirects. | \n", "
1191 | \n", "http://hgtree.snu.ac.kr | \n", "Exceeded 30 redirects. | \n", "
1462 | \n", "http://cfgp.snu.ac.kr | \n", "Exceeded 30 redirects. | \n", "
2526 | \n", "https://incois.gov.in/tropflux/index.jsp | \n", "Exceeded 30 redirects. | \n", "
2550 | \n", "https://odis.incois.gov.in/ | \n", "Exceeded 30 redirects. | \n", "
3872 | \n", "https://www.projectdatasphere.org/projectdatas... | \n", "Exceeded 30 redirects. | \n", "
6141 | \n", "http://repository.poligran.edu.co/ | \n", "Exceeded 30 redirects. | \n", "
10841 | \n", "http://library.wur.nl/way/ | \n", "Exceeded 30 redirects. | \n", "
\n", " | url | \n", "get_error | \n", "
---|---|---|
6141 | \n", "http://repository.poligran.edu.co/ | \n", "Exceeded 30 redirects. | \n", "
\n", " | url | \n", "get_error | \n", "
---|---|---|
4892 | \n", "http://eprints.isofts.kiev.ua/ | \n", "('Connection aborted.', ConnectionResetError(5... | \n", "
4943 | \n", "http://www.library.ukma.kiev.ua/dspace/ | \n", "HTTPConnectionPool(host='www.library.ukma.kiev... | \n", "
4983 | \n", "http://repository.ibss.org.ua/dspace/ | \n", "HTTPConnectionPool(host='repository.ibss.org.u... | \n", "
5147 | \n", "http://www.rarelib.undp.org.ua/eng/index.php3 | \n", "HTTPConnectionPool(host='www.rarelib.undp.org.... | \n", "
5817 | \n", "http://openarchive.nure.ua/ | \n", "HTTPSConnectionPool(host='openarchive.nure.ua'... | \n", "
5827 | \n", "http://dspace.uabs.edu.ua/jspui/ | \n", "HTTPConnectionPool(host='dspace.uabs.edu.ua', ... | \n", "
6135 | \n", "http://kgmtu.edu.ua/jspui/ | \n", "HTTPConnectionPool(host='kgmtu.edu.ua', port=8... | \n", "
6231 | \n", "http://dspace.uccu.org.ua/ | \n", "HTTPConnectionPool(host='dspace.uccu.org.ua', ... | \n", "
6474 | \n", "http://repo.uipa.edu.ua/jspui/ | \n", "HTTPConnectionPool(host='repo.uipa.edu.ua', po... | \n", "
7067 | \n", "http://ir.asta.edu.ua/jspui/ | \n", "HTTPConnectionPool(host='ir.asta.edu.ua', port... | \n", "
7490 | \n", "http://dspace.hnpu.edu.ua/ | \n", "HTTPConnectionPool(host='dspace.hnpu.edu.ua', ... | \n", "
7989 | \n", "http://repository.mdu.in.ua/jspui/ | \n", "HTTPConnectionPool(host='repository.mdu.in.ua'... | \n", "
8085 | \n", "http://elar.tsatu.edu.ua/ | \n", "HTTPConnectionPool(host='elar.tsatu.edu.ua', p... | \n", "
8105 | \n", "http://dspace.zsea.edu.ua/ | \n", "HTTPSConnectionPool(host='dspace.znu.edu.ua', ... | \n", "
8197 | \n", "http://dspace.knau.kharkov.ua/jspui/ | \n", "HTTPConnectionPool(host='dspace.knau.kharkov.u... | \n", "
8199 | \n", "http://rep.btsau.edu.ua | \n", "HTTPConnectionPool(host='rep.btsau.edu.ua', po... | \n", "
8206 | \n", "https://biblio.onat.edu.ua/ | \n", "HTTPSConnectionPool(host='biblio.onat.edu.ua',... | \n", "
8419 | \n", "https://rep.ksma.ks.ua | \n", "HTTPSConnectionPool(host='rep.ksma.ks.ua', por... | \n", "
10016 | \n", "http://eprints.ksame.kharkov.ua/ | \n", "HTTPConnectionPool(host='eprints.ksame.kharkov... | \n", "
10107 | \n", "http://dspace.uabs.edu.ua/ | \n", "HTTPConnectionPool(host='dspace.uabs.edu.ua', ... | \n", "
10799 | \n", "http://repository.ibss.org.ua/dspace | \n", "HTTPConnectionPool(host='repository.ibss.org.u... | \n", "
10906 | \n", "http://repo.sau.sumy.ua/ | \n", "HTTPConnectionPool(host='repo.sau.sumy.ua', po... | \n", "
10976 | \n", "http://www.dspace.humanities.org.ua/dspace/ | \n", "HTTPConnectionPool(host='www.dspace.humanities... | \n", "
11616 | \n", "http:// visnykagro.knau.kharkov.ua | \n", "HTTPConnectionPool(host='%20visnykagro.knau.kh... | \n", "
11803 | \n", "http://repository.mdu.in.ua/ | \n", "HTTPConnectionPool(host='repository.mdu.in.ua'... | \n", "
11831 | \n", "http://sj-dstu.dp.ua/ | \n", "HTTPConnectionPool(host='sj-dstu.dp.ua', port=... | \n", "
12107 | \n", "http://www.hups.mil.gov.ua/periodic-app/journal | \n", "HTTPConnectionPool(host='www.hups.mil.gov.ua',... | \n", "
12746 | \n", "http://www.e-archive.org.ua/ | \n", "HTTPConnectionPool(host='www.e-archive.org.ua'... | \n", "
12753 | \n", "http://library.khnu.km.ua/jspui/ | \n", "HTTPConnectionPool(host='library.khnu.km.ua', ... | \n", "
12916 | \n", "http://dspace.ukrfa.kharkov.ua/ | \n", "HTTPConnectionPool(host='dspace.ukrfa.kharkov.... | \n", "
12922 | \n", "http://dspace.ukrfa.kharkov.ua | \n", "HTTPConnectionPool(host='dspace.ukrfa.kharkov.... | \n", "
12970 | \n", "http://evrica.org.ua | \n", "HTTPConnectionPool(host='evrica.org.ua', port=... | \n", "
12992 | \n", "http://dspace.academy.sumy.ua/ | \n", "HTTPConnectionPool(host='dspace.academy.sumy.u... | \n", "
13017 | \n", "http://open-archive.kture.kharkov.ua/ | \n", "HTTPConnectionPool(host='open-archive.kture.kh... | \n", "
13034 | \n", "http://dspace.onu.edu.ua/ | \n", "HTTPConnectionPool(host='192.168.30.200', port... | \n", "
13052 | \n", "http://open-arhive.kture.kharkov.ua | \n", "HTTPConnectionPool(host='open-arhive.kture.kha... | \n", "
\n", " | url | \n", "head_final_code | \n", "head_url | \n", "head_chain | \n", "head_codes | \n", "head_elapsed | \n", "head_error | \n", "get_final_code | \n", "get_url | \n", "get_chain | \n", "get_codes | \n", "get_elapsed | \n", "get_error | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|
2185 | \n", "http://inform.ikd.kiev.ua/index.php?path=/en/i... | \n", "200.0 | \n", "http://inform.ikd.kiev.ua/?path=/en/index | \n", "['http://inform.ikd.kiev.ua/index.php?path=/en... | \n", "[301] | \n", "0.402488 | \n", "NaN | \n", "200.0 | \n", "http://inform.ikd.kiev.ua/?path=/en/index | \n", "['http://inform.ikd.kiev.ua/index.php?path=/en... | \n", "[301] | \n", "0.452971 | \n", "NaN | \n", "
2286 | \n", "http://wdc.org.ua/ | \n", "200.0 | \n", "http://wdc.org.ua/ | \n", "[] | \n", "[] | \n", "0.905063 | \n", "NaN | \n", "200.0 | \n", "http://wdc.org.ua/ | \n", "[] | \n", "[] | \n", "0.816887 | \n", "NaN | \n", "
4892 | \n", "http://eprints.isofts.kiev.ua/ | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "('Connection aborted.', ConnectionResetError(5... | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "('Connection aborted.', ConnectionResetError(5... | \n", "
4943 | \n", "http://www.library.ukma.kiev.ua/dspace/ | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "HTTPConnectionPool(host='www.library.ukma.kiev... | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "HTTPConnectionPool(host='www.library.ukma.kiev... | \n", "
4950 | \n", "http://www.dspace.ucu.edu.ua/dspace/ | \n", "403.0 | \n", "http://www.dspace.ucu.edu.ua/dspace/ | \n", "[] | \n", "[] | \n", "0.073373 | \n", "NaN | \n", "403.0 | \n", "http://www.dspace.ucu.edu.ua/dspace/ | \n", "[] | \n", "[] | \n", "0.073223 | \n", "NaN | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
13015 | \n", "http://ir.kneu.edu.ua | \n", "200.0 | \n", "http://ir.kneu.edu.ua/ | \n", "[] | \n", "[] | \n", "1.609602 | \n", "NaN | \n", "200.0 | \n", "http://ir.kneu.edu.ua/ | \n", "[] | \n", "[] | \n", "1.508854 | \n", "NaN | \n", "
13017 | \n", "http://open-archive.kture.kharkov.ua/ | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "HTTPConnectionPool(host='open-archive.kture.kh... | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "HTTPConnectionPool(host='open-archive.kture.kh... | \n", "
13034 | \n", "http://dspace.onu.edu.ua/ | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "HTTPConnectionPool(host='192.168.30.200', port... | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "HTTPConnectionPool(host='192.168.30.200', port... | \n", "
13052 | \n", "http://open-arhive.kture.kharkov.ua | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "HTTPConnectionPool(host='open-arhive.kture.kha... | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "HTTPConnectionPool(host='open-arhive.kture.kha... | \n", "
13248 | \n", "http://www.ekmair.ukma.edu.ua | \n", "200.0 | \n", "http://ekmair.ukma.edu.ua/ | \n", "['http://www.ekmair.ukma.edu.ua/'] | \n", "[301] | \n", "0.661039 | \n", "NaN | \n", "200.0 | \n", "http://ekmair.ukma.edu.ua/ | \n", "['http://www.ekmair.ukma.edu.ua/'] | \n", "[301] | \n", "0.755170 | \n", "NaN | \n", "
146 rows × 13 columns
\n", "\n", " | url | \n", "head_url | \n", "head_final_code | \n", "head_codes | \n", "
---|---|---|---|---|
len | \n", "\n", " | \n", " | \n", " | \n", " |
0 | \n", "6596 | \n", "6596 | \n", "6596 | \n", "6596 | \n", "
1 | \n", "3364 | \n", "3364 | \n", "3364 | \n", "3364 | \n", "
2 | \n", "686 | \n", "686 | \n", "686 | \n", "686 | \n", "
3 | \n", "233 | \n", "233 | \n", "233 | \n", "233 | \n", "
4 | \n", "37 | \n", "37 | \n", "37 | \n", "37 | \n", "
5 | \n", "10 | \n", "10 | \n", "10 | \n", "10 | \n", "
\n", " | url | \n", "get_url | \n", "get_final_code | \n", "get_codes | \n", "
---|---|---|---|---|
len | \n", "\n", " | \n", " | \n", " | \n", " |
0 | \n", "6595 | \n", "6595 | \n", "6595 | \n", "6595 | \n", "
1 | \n", "3376 | \n", "3376 | \n", "3376 | \n", "3376 | \n", "
2 | \n", "699 | \n", "699 | \n", "699 | \n", "699 | \n", "
3 | \n", "229 | \n", "229 | \n", "229 | \n", "229 | \n", "
4 | \n", "43 | \n", "43 | \n", "43 | \n", "43 | \n", "
5 | \n", "12 | \n", "12 | \n", "12 | \n", "12 | \n", "
\n", " | url | \n", "head_url | \n", "head_final_code | \n", "head_codes | \n", "len | \n", "class | \n", "
---|---|---|---|---|---|---|
11 | \n", "http://epi.minsal.cl/bases-de-datos/ | \n", "http://epi.minsal.cl/bases-de-datos/ | \n", "403.0 | \n", "[302] | \n", "1 | \n", "400.0 | \n", "
84 | \n", "https://protocols.io/welcome | \n", "https://www.protocols.io:443/welcome | \n", "400.0 | \n", "[301] | \n", "1 | \n", "400.0 | \n", "
177 | \n", "http://agris.fao.org/agris-search/index.do | \n", "https://agris.fao.org:443/agris-search/index.do | \n", "404.0 | \n", "[301] | \n", "1 | \n", "400.0 | \n", "
228 | \n", "http://oryzatagline.cirad.fr/ | \n", "https://oryzatagline.cirad.fr/ | \n", "403.0 | \n", "[301] | \n", "1 | \n", "400.0 | \n", "
243 | \n", "http://www.ncbi.nlm.nih.gov/unists | \n", "https://www.ncbi.nlm.nih.gov/unists | \n", "410.0 | \n", "[301] | \n", "1 | \n", "400.0 | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
13262 | \n", "http://www.kumc.edu/archie | \n", "https://www.kumc.edu/archie | \n", "404.0 | \n", "[302] | \n", "1 | \n", "400.0 | \n", "
13320 | \n", "http://trinity.cdmhost.com/index.php | \n", "https://www.oclc.org/url/?404;http://trinity.c... | \n", "404.0 | \n", "[302] | \n", "1 | \n", "400.0 | \n", "
13340 | \n", "http://calvados.c3sl.ufpr.br/ojs2/index.php/ve... | \n", "https://revistas.ufpr.br/index.php/veterinary/... | \n", "404.0 | \n", "[301] | \n", "1 | \n", "400.0 | \n", "
13346 | \n", "http://www4.furg.br/ojs/biblos/ojs/index.php | \n", "https://sistemas.furg.br/ojs/biblos/ojs/index.php | \n", "404.0 | \n", "[302] | \n", "1 | \n", "400.0 | \n", "
13348 | \n", "http://lss.fnal.gov/ird/fermilab_spires.html | \n", "https://lss.fnal.gov/ird/fermilab_spires.html | \n", "404.0 | \n", "[302] | \n", "1 | \n", "400.0 | \n", "
378 rows × 6 columns
\n", "\n", " | url | \n", "head_url | \n", "head_final_code | \n", "head_codes | \n", "len | \n", "
---|---|---|---|---|---|
class | \n", "\n", " | \n", " | \n", " | \n", " | \n", " |
400.0 | \n", "338 | \n", "338 | \n", "338 | \n", "338 | \n", "338 | \n", "
500.0 | \n", "40 | \n", "40 | \n", "40 | \n", "40 | \n", "40 | \n", "
\n", " | url | \n", "get_url | \n", "get_final_code | \n", "get_codes | \n", "len | \n", "class | \n", "
---|---|---|---|---|---|---|
11 | \n", "http://epi.minsal.cl/bases-de-datos/ | \n", "http://epi.minsal.cl/bases-de-datos/ | \n", "403.0 | \n", "[302] | \n", "1 | \n", "400.0 | \n", "
177 | \n", "http://agris.fao.org/agris-search/index.do | \n", "https://agris.fao.org:443/agris-search/index.do | \n", "404.0 | \n", "[301] | \n", "1 | \n", "400.0 | \n", "
228 | \n", "http://oryzatagline.cirad.fr/ | \n", "https://oryzatagline.cirad.fr/ | \n", "403.0 | \n", "[301] | \n", "1 | \n", "400.0 | \n", "
243 | \n", "http://www.ncbi.nlm.nih.gov/unists | \n", "https://www.ncbi.nlm.nih.gov/unists | \n", "410.0 | \n", "[301] | \n", "1 | \n", "400.0 | \n", "
288 | \n", "http://www.ncbi.nlm.nih.gov/dbSTS/index.html | \n", "https://www.ncbi.nlm.nih.gov/dbSTS/index.html | \n", "403.0 | \n", "[301] | \n", "1 | \n", "400.0 | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
13262 | \n", "http://www.kumc.edu/archie | \n", "https://www.kumc.edu/archie | \n", "404.0 | \n", "[302] | \n", "1 | \n", "400.0 | \n", "
13320 | \n", "http://trinity.cdmhost.com/index.php | \n", "https://www.oclc.org/url/notfound | \n", "404.0 | \n", "[302, 302] | \n", "2 | \n", "400.0 | \n", "
13340 | \n", "http://calvados.c3sl.ufpr.br/ojs2/index.php/ve... | \n", "https://revistas.ufpr.br/index.php/veterinary/... | \n", "404.0 | \n", "[301] | \n", "1 | \n", "400.0 | \n", "
13346 | \n", "http://www4.furg.br/ojs/biblos/ojs/index.php | \n", "https://sistemas.furg.br/ojs/biblos/ojs/index.php | \n", "404.0 | \n", "[302] | \n", "1 | \n", "400.0 | \n", "
13348 | \n", "http://lss.fnal.gov/ird/fermilab_spires.html | \n", "https://lss.fnal.gov/ird/fermilab_spires.html | \n", "404.0 | \n", "[302] | \n", "1 | \n", "400.0 | \n", "
344 rows × 6 columns
\n", "\n", " | url | \n", "get_url | \n", "get_final_code | \n", "get_codes | \n", "len | \n", "
---|---|---|---|---|---|
class | \n", "\n", " | \n", " | \n", " | \n", " | \n", " |
400.0 | \n", "307 | \n", "307 | \n", "307 | \n", "307 | \n", "307 | \n", "
500.0 | \n", "37 | \n", "37 | \n", "37 | \n", "37 | \n", "37 | \n", "
\n", " | url | \n", "head_url | \n", "head_final_code | \n", "head_codes | \n", "len | \n", "class | \n", "
---|---|---|---|---|---|---|
0 | \n", "http://sidc.be/silso/home | \n", "https://www.sidc.be/silso/home | \n", "200.0 | \n", "[302] | \n", "1 | \n", "200.0 | \n", "
2 | \n", "http://www.pac.dfo-mpo.gc.ca/science/oceans/da... | \n", "https://www.pac.dfo-mpo.gc.ca/science/oceans/d... | \n", "200.0 | \n", "[307] | \n", "1 | \n", "200.0 | \n", "
6 | \n", "http://ipt.taibif.tw/ | \n", "https://ipt.taibif.tw/ | \n", "200.0 | \n", "[301] | \n", "1 | \n", "200.0 | \n", "
9 | \n", "http://arabidopsis.info | \n", "https://arabidopsis.info/ | \n", "200.0 | \n", "[301] | \n", "1 | \n", "200.0 | \n", "
11 | \n", "http://epi.minsal.cl/bases-de-datos/ | \n", "http://epi.minsal.cl/bases-de-datos/ | \n", "403.0 | \n", "[302] | \n", "1 | \n", "400.0 | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
13341 | \n", "http://calvados.c3sl.ufpr.br/ojs2/index.php/acta/ | \n", "https://revistas.ufpr.br/index.php/acta/ | \n", "200.0 | \n", "[301] | \n", "1 | \n", "200.0 | \n", "
13346 | \n", "http://www4.furg.br/ojs/biblos/ojs/index.php | \n", "https://sistemas.furg.br/ojs/biblos/ojs/index.php | \n", "404.0 | \n", "[302] | \n", "1 | \n", "400.0 | \n", "
13348 | \n", "http://lss.fnal.gov/ird/fermilab_spires.html | \n", "https://lss.fnal.gov/ird/fermilab_spires.html | \n", "404.0 | \n", "[302] | \n", "1 | \n", "400.0 | \n", "
13350 | \n", "http://cloud.ncl.edu.tw/chna/ | \n", "https://cloud.ncl.edu.tw/chna/ | \n", "200.0 | \n", "[302] | \n", "1 | \n", "200.0 | \n", "
13351 | \n", "http://www.myopenarchive.org/ | \n", "https://www.myopenarchive.org/ | \n", "200.0 | \n", "[301] | \n", "1 | \n", "200.0 | \n", "
3364 rows × 6 columns
\n", "\n", " | url | \n", "head_url | \n", "head_final_code | \n", "head_codes | \n", "len | \n", "class | \n", "
---|---|---|---|---|---|---|
2 | \n", "http://www.pac.dfo-mpo.gc.ca/science/oceans/da... | \n", "https://www.pac.dfo-mpo.gc.ca/science/oceans/d... | \n", "200.0 | \n", "[307] | \n", "1 | \n", "200.0 | \n", "
6 | \n", "http://ipt.taibif.tw/ | \n", "https://ipt.taibif.tw/ | \n", "200.0 | \n", "[301] | \n", "1 | \n", "200.0 | \n", "
27 | \n", "http://www.hgvd.genome.med.kyoto-u.ac.jp/ | \n", "https://www.hgvd.genome.med.kyoto-u.ac.jp/ | \n", "200.0 | \n", "[301] | \n", "1 | \n", "200.0 | \n", "
30 | \n", "http://archive.researchdata.leeds.ac.uk/ | \n", "https://archive.researchdata.leeds.ac.uk/ | \n", "200.0 | \n", "[302] | \n", "1 | \n", "200.0 | \n", "
33 | \n", "http://biodb.swu.edu.cn/qprimerdb/ | \n", "https://biodb.swu.edu.cn/qprimerdb/ | \n", "200.0 | \n", "[301] | \n", "1 | \n", "200.0 | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
13288 | \n", "http://dspace.sunyconnect.suny.edu/ | \n", "https://dspace.sunyconnect.suny.edu/ | \n", "200.0 | \n", "[301] | \n", "1 | \n", "200.0 | \n", "
13295 | \n", "http://scholar.google.com/ | \n", "https://scholar.google.com/ | \n", "200.0 | \n", "[302] | \n", "1 | \n", "200.0 | \n", "
13348 | \n", "http://lss.fnal.gov/ird/fermilab_spires.html | \n", "https://lss.fnal.gov/ird/fermilab_spires.html | \n", "404.0 | \n", "[302] | \n", "1 | \n", "400.0 | \n", "
13350 | \n", "http://cloud.ncl.edu.tw/chna/ | \n", "https://cloud.ncl.edu.tw/chna/ | \n", "200.0 | \n", "[302] | \n", "1 | \n", "200.0 | \n", "
13351 | \n", "http://www.myopenarchive.org/ | \n", "https://www.myopenarchive.org/ | \n", "200.0 | \n", "[301] | \n", "1 | \n", "200.0 | \n", "
1665 rows × 6 columns
\n", "\n", " | url | \n", "head_url | \n", "head_final_code | \n", "head_codes | \n", "len | \n", "class | \n", "
---|---|---|---|---|---|---|
119 | \n", "https://www.biosino.org/node | \n", "https://www.biosino.org/node/ | \n", "200.0 | \n", "[302] | \n", "1 | \n", "200.0 | \n", "
314 | \n", "http://metacat.tfri.gov.tw/tfri | \n", "http://metacat.tfri.gov.tw/tfri/ | \n", "200.0 | \n", "[301] | \n", "1 | \n", "200.0 | \n", "
463 | \n", "https://nda.nih.gov/abcd | \n", "https://nda.nih.gov/abcd/ | \n", "200.0 | \n", "[302] | \n", "1 | \n", "200.0 | \n", "
551 | \n", "https://www1.usgs.gov/obis-usa/ipt | \n", "https://www1.usgs.gov/obis-usa/ipt/ | \n", "200.0 | \n", "[301] | \n", "1 | \n", "200.0 | \n", "
559 | \n", "https://www.arm.gov/data | \n", "https://www.arm.gov/data/ | \n", "200.0 | \n", "[301] | \n", "1 | \n", "200.0 | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
12642 | \n", "http://repositorio.utec.edu.sv:8080/jspui | \n", "http://repositorio.utec.edu.sv:8080/jspui/ | \n", "200.0 | \n", "[302] | \n", "1 | \n", "200.0 | \n", "
12706 | \n", "http://adudspace.adu.edu.tr:8080/jspui | \n", "http://adudspace.adu.edu.tr:8080/jspui/ | \n", "200.0 | \n", "[302] | \n", "1 | \n", "200.0 | \n", "
12874 | \n", "http://160.97.80.9:8080/jspui | \n", "http://160.97.80.9:8080/jspui/ | \n", "404.0 | \n", "[302] | \n", "1 | \n", "400.0 | \n", "
13030 | \n", "http://library.pdpu.ac.in:8080/xmlui | \n", "http://library.pdpu.ac.in:8080/xmlui/ | \n", "200.0 | \n", "[302] | \n", "1 | \n", "200.0 | \n", "
13267 | \n", "http://cab.unime.it/mus | \n", "http://cab.unime.it/mus/ | \n", "200.0 | \n", "[302] | \n", "1 | \n", "200.0 | \n", "
134 rows × 6 columns
\n", "\n", " | url | \n", "head_url | \n", "head_final_code | \n", "head_codes | \n", "len | \n", "class | \n", "
---|---|---|---|---|---|---|
9 | \n", "http://arabidopsis.info | \n", "https://arabidopsis.info/ | \n", "200.0 | \n", "[301] | \n", "1 | \n", "200.0 | \n", "
46 | \n", "http://pcddb.cryst.bbk.ac.uk | \n", "https://pcddb.cryst.bbk.ac.uk/ | \n", "200.0 | \n", "[302] | \n", "1 | \n", "200.0 | \n", "
113 | \n", "http://www.marinedataarchive.eu | \n", "https://www.marinedataarchive.eu/ | \n", "200.0 | \n", "[301] | \n", "1 | \n", "200.0 | \n", "
119 | \n", "https://www.biosino.org/node | \n", "https://www.biosino.org/node/ | \n", "200.0 | \n", "[302] | \n", "1 | \n", "200.0 | \n", "
200 | \n", "http://www.hydroshare.org | \n", "https://www.hydroshare.org/ | \n", "200.0 | \n", "[301] | \n", "1 | \n", "200.0 | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
13032 | \n", "http://repositorio.ipsantarem.pt | \n", "https://repositorio.ipsantarem.pt/ | \n", "200.0 | \n", "[302] | \n", "1 | \n", "200.0 | \n", "
13077 | \n", "http://bibliotecadigital.ipb.pt | \n", "https://bibliotecadigital.ipb.pt/ | \n", "200.0 | \n", "[302] | \n", "1 | \n", "200.0 | \n", "
13091 | \n", "http://eprints.nmlindia.org | \n", "https://eprints.nmlindia.org/ | \n", "200.0 | \n", "[301] | \n", "1 | \n", "200.0 | \n", "
13124 | \n", "http://www.ju.edu.et | \n", "https://www.ju.edu.et/ | \n", "200.0 | \n", "[301] | \n", "1 | \n", "200.0 | \n", "
13137 | \n", "http://scholarship.rollins.edu | \n", "https://scholarship.rollins.edu/ | \n", "200.0 | \n", "[301] | \n", "1 | \n", "200.0 | \n", "
487 rows × 6 columns
\n", "\n", " | url | \n", "get_url | \n", "get_final_code | \n", "get_codes | \n", "len | \n", "class | \n", "
---|---|---|---|---|---|---|
0 | \n", "http://sidc.be/silso/home | \n", "https://www.sidc.be/silso/home | \n", "200.0 | \n", "[302] | \n", "1 | \n", "200.0 | \n", "
2 | \n", "http://www.pac.dfo-mpo.gc.ca/science/oceans/da... | \n", "https://www.pac.dfo-mpo.gc.ca/science/oceans/d... | \n", "200.0 | \n", "[307] | \n", "1 | \n", "200.0 | \n", "
6 | \n", "http://ipt.taibif.tw/ | \n", "https://ipt.taibif.tw/ | \n", "200.0 | \n", "[301] | \n", "1 | \n", "200.0 | \n", "
9 | \n", "http://arabidopsis.info | \n", "https://arabidopsis.info/ | \n", "200.0 | \n", "[301] | \n", "1 | \n", "200.0 | \n", "
11 | \n", "http://epi.minsal.cl/bases-de-datos/ | \n", "http://epi.minsal.cl/bases-de-datos/ | \n", "403.0 | \n", "[302] | \n", "1 | \n", "400.0 | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
13341 | \n", "http://calvados.c3sl.ufpr.br/ojs2/index.php/acta/ | \n", "https://revistas.ufpr.br/index.php/acta/ | \n", "200.0 | \n", "[301] | \n", "1 | \n", "200.0 | \n", "
13346 | \n", "http://www4.furg.br/ojs/biblos/ojs/index.php | \n", "https://sistemas.furg.br/ojs/biblos/ojs/index.php | \n", "404.0 | \n", "[302] | \n", "1 | \n", "400.0 | \n", "
13348 | \n", "http://lss.fnal.gov/ird/fermilab_spires.html | \n", "https://lss.fnal.gov/ird/fermilab_spires.html | \n", "404.0 | \n", "[302] | \n", "1 | \n", "400.0 | \n", "
13350 | \n", "http://cloud.ncl.edu.tw/chna/ | \n", "https://cloud.ncl.edu.tw/chna/ | \n", "200.0 | \n", "[302] | \n", "1 | \n", "200.0 | \n", "
13351 | \n", "http://www.myopenarchive.org/ | \n", "https://www.myopenarchive.org/ | \n", "200.0 | \n", "[301] | \n", "1 | \n", "200.0 | \n", "
3376 rows × 6 columns
\n", "\n", " | url | \n", "get_url | \n", "get_final_code | \n", "get_codes | \n", "len | \n", "class | \n", "
---|---|---|---|---|---|---|
2 | \n", "http://www.pac.dfo-mpo.gc.ca/science/oceans/da... | \n", "https://www.pac.dfo-mpo.gc.ca/science/oceans/d... | \n", "200.0 | \n", "[307] | \n", "1 | \n", "200.0 | \n", "
6 | \n", "http://ipt.taibif.tw/ | \n", "https://ipt.taibif.tw/ | \n", "200.0 | \n", "[301] | \n", "1 | \n", "200.0 | \n", "
27 | \n", "http://www.hgvd.genome.med.kyoto-u.ac.jp/ | \n", "https://www.hgvd.genome.med.kyoto-u.ac.jp/ | \n", "200.0 | \n", "[301] | \n", "1 | \n", "200.0 | \n", "
30 | \n", "http://archive.researchdata.leeds.ac.uk/ | \n", "https://archive.researchdata.leeds.ac.uk/ | \n", "200.0 | \n", "[302] | \n", "1 | \n", "200.0 | \n", "
33 | \n", "http://biodb.swu.edu.cn/qprimerdb/ | \n", "https://biodb.swu.edu.cn/qprimerdb/ | \n", "200.0 | \n", "[301] | \n", "1 | \n", "200.0 | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
13288 | \n", "http://dspace.sunyconnect.suny.edu/ | \n", "https://dspace.sunyconnect.suny.edu/ | \n", "200.0 | \n", "[301] | \n", "1 | \n", "200.0 | \n", "
13295 | \n", "http://scholar.google.com/ | \n", "https://scholar.google.com/ | \n", "200.0 | \n", "[302] | \n", "1 | \n", "200.0 | \n", "
13348 | \n", "http://lss.fnal.gov/ird/fermilab_spires.html | \n", "https://lss.fnal.gov/ird/fermilab_spires.html | \n", "404.0 | \n", "[302] | \n", "1 | \n", "400.0 | \n", "
13350 | \n", "http://cloud.ncl.edu.tw/chna/ | \n", "https://cloud.ncl.edu.tw/chna/ | \n", "200.0 | \n", "[302] | \n", "1 | \n", "200.0 | \n", "
13351 | \n", "http://www.myopenarchive.org/ | \n", "https://www.myopenarchive.org/ | \n", "200.0 | \n", "[301] | \n", "1 | \n", "200.0 | \n", "
1668 rows × 6 columns
\n", "\n", " | url | \n", "get_url | \n", "get_final_code | \n", "get_codes | \n", "len | \n", "class | \n", "
---|---|---|---|---|---|---|
119 | \n", "https://www.biosino.org/node | \n", "https://www.biosino.org/node/ | \n", "200.0 | \n", "[302] | \n", "1 | \n", "200.0 | \n", "
314 | \n", "http://metacat.tfri.gov.tw/tfri | \n", "http://metacat.tfri.gov.tw/tfri/ | \n", "200.0 | \n", "[301] | \n", "1 | \n", "200.0 | \n", "
463 | \n", "https://nda.nih.gov/abcd | \n", "https://nda.nih.gov/abcd/ | \n", "200.0 | \n", "[302] | \n", "1 | \n", "200.0 | \n", "
551 | \n", "https://www1.usgs.gov/obis-usa/ipt | \n", "https://www1.usgs.gov/obis-usa/ipt/ | \n", "200.0 | \n", "[301] | \n", "1 | \n", "200.0 | \n", "
559 | \n", "https://www.arm.gov/data | \n", "https://www.arm.gov/data/ | \n", "200.0 | \n", "[301] | \n", "1 | \n", "200.0 | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
12642 | \n", "http://repositorio.utec.edu.sv:8080/jspui | \n", "http://repositorio.utec.edu.sv:8080/jspui/ | \n", "200.0 | \n", "[302] | \n", "1 | \n", "200.0 | \n", "
12706 | \n", "http://adudspace.adu.edu.tr:8080/jspui | \n", "http://adudspace.adu.edu.tr:8080/jspui/ | \n", "200.0 | \n", "[302] | \n", "1 | \n", "200.0 | \n", "
12874 | \n", "http://160.97.80.9:8080/jspui | \n", "http://160.97.80.9:8080/jspui/ | \n", "404.0 | \n", "[302] | \n", "1 | \n", "400.0 | \n", "
13030 | \n", "http://library.pdpu.ac.in:8080/xmlui | \n", "http://library.pdpu.ac.in:8080/xmlui/ | \n", "200.0 | \n", "[302] | \n", "1 | \n", "200.0 | \n", "
13267 | \n", "http://cab.unime.it/mus | \n", "http://cab.unime.it/mus/ | \n", "200.0 | \n", "[302] | \n", "1 | \n", "200.0 | \n", "
134 rows × 6 columns
\n", "\n", " | url | \n", "get_url | \n", "get_final_code | \n", "get_codes | \n", "len | \n", "class | \n", "
---|---|---|---|---|---|---|
9 | \n", "http://arabidopsis.info | \n", "https://arabidopsis.info/ | \n", "200.0 | \n", "[301] | \n", "1 | \n", "200.0 | \n", "
46 | \n", "http://pcddb.cryst.bbk.ac.uk | \n", "https://pcddb.cryst.bbk.ac.uk/ | \n", "200.0 | \n", "[302] | \n", "1 | \n", "200.0 | \n", "
113 | \n", "http://www.marinedataarchive.eu | \n", "https://www.marinedataarchive.eu/ | \n", "200.0 | \n", "[301] | \n", "1 | \n", "200.0 | \n", "
119 | \n", "https://www.biosino.org/node | \n", "https://www.biosino.org/node/ | \n", "200.0 | \n", "[302] | \n", "1 | \n", "200.0 | \n", "
200 | \n", "http://www.hydroshare.org | \n", "https://www.hydroshare.org/ | \n", "200.0 | \n", "[301] | \n", "1 | \n", "200.0 | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
13032 | \n", "http://repositorio.ipsantarem.pt | \n", "https://repositorio.ipsantarem.pt/ | \n", "200.0 | \n", "[302] | \n", "1 | \n", "200.0 | \n", "
13077 | \n", "http://bibliotecadigital.ipb.pt | \n", "https://bibliotecadigital.ipb.pt/ | \n", "200.0 | \n", "[302] | \n", "1 | \n", "200.0 | \n", "
13091 | \n", "http://eprints.nmlindia.org | \n", "https://eprints.nmlindia.org/ | \n", "200.0 | \n", "[301] | \n", "1 | \n", "200.0 | \n", "
13124 | \n", "http://www.ju.edu.et | \n", "https://www.ju.edu.et/ | \n", "200.0 | \n", "[301] | \n", "1 | \n", "200.0 | \n", "
13137 | \n", "http://scholarship.rollins.edu | \n", "https://scholarship.rollins.edu/ | \n", "200.0 | \n", "[301] | \n", "1 | \n", "200.0 | \n", "
490 rows × 6 columns
\n", "\n", " | url | \n", "head_final_code | \n", "head_url | \n", "head_chain | \n", "head_codes | \n", "head_elapsed | \n", "head_error | \n", "get_final_code | \n", "get_url | \n", "get_chain | \n", "get_codes | \n", "get_elapsed | \n", "get_error | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|
127 | \n", "https://models.physiomeproject.org | \n", "200.0 | \n", "https://models.physiomeproject.org/ | \n", "[] | \n", "[] | \n", "0.658525 | \n", "NaN | \n", "200.0 | \n", "https://models.physiomeproject.org/welcome | \n", "['https://models.physiomeproject.org/'] | \n", "[302] | \n", "0.575681 | \n", "NaN | \n", "
371 | \n", "https://rdp.utas.edu.au | \n", "200.0 | \n", "https://login.microsoftonline.com/15eb5d55-199... | \n", "['https://rdp.utas.edu.au/'] | \n", "[302] | \n", "0.297592 | \n", "NaN | \n", "200.0 | \n", "https://login.microsoftonline.com/15eb5d55-199... | \n", "['https://rdp.utas.edu.au/'] | \n", "[302] | \n", "0.285739 | \n", "NaN | \n", "
479 | \n", "https://sciflection.com | \n", "200.0 | \n", "https://sciflection.com/ | \n", "[] | \n", "[] | \n", "0.176450 | \n", "NaN | \n", "200.0 | \n", "https://sciflection.com/main | \n", "['https://sciflection.com/', 'http://sciflecti... | \n", "[302, 301] | \n", "0.391234 | \n", "NaN | \n", "
684 | \n", "http://www.ntrr-nti.org/ | \n", "405.0 | \n", "http://www.ntrr-nti.org/ | \n", "[] | \n", "[] | \n", "1.133437 | \n", "NaN | \n", "200.0 | \n", "https://www.nattrauma.org/research/ntrr/ | \n", "['http://www.ntrr-nti.org/'] | \n", "[301] | \n", "2.539869 | \n", "NaN | \n", "
697 | \n", "http://www.jcm.riken.go.jp/ | \n", "200.0 | \n", "https://jcm.brc.riken.jp/en/ | \n", "['http://www.jcm.riken.go.jp/', 'https://www.j... | \n", "[301, 301, 301, 301] | \n", "0.506354 | \n", "NaN | \n", "200.0 | \n", "https://jcm.brc.riken.jp/en/?doing_wp_cron=165... | \n", "['http://www.jcm.riken.go.jp/', 'https://www.j... | \n", "[301, 301, 301, 301, 302] | \n", "0.630979 | \n", "NaN | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
13132 | \n", "http://hik.diva-portal.org/smash/search.jsf | \n", "200.0 | \n", "http://lnu.diva-portal.org/smash/search.jsf?ds... | \n", "['http://hik.diva-portal.org/smash/search.jsf'... | \n", "[301, 302] | \n", "0.287171 | \n", "NaN | \n", "200.0 | \n", "http://lnu.diva-portal.org/smash/search.jsf?ds... | \n", "['http://hik.diva-portal.org/smash/search.jsf'... | \n", "[301, 302] | \n", "0.291231 | \n", "NaN | \n", "
13133 | \n", "http://hgo.diva-portal.org/smash/search.jsf | \n", "200.0 | \n", "http://uu.diva-portal.org/smash/search.jsf?dsw... | \n", "['http://hgo.diva-portal.org/smash/search.jsf'... | \n", "[301, 302] | \n", "0.292740 | \n", "NaN | \n", "200.0 | \n", "http://uu.diva-portal.org/smash/search.jsf?dsw... | \n", "['http://hgo.diva-portal.org/smash/search.jsf'... | \n", "[301, 302] | \n", "0.289726 | \n", "NaN | \n", "
13266 | \n", "http://www.diva-portal.org/gih/ | \n", "200.0 | \n", "http://gih.diva-portal.org/smash/search.jsf?ds... | \n", "['http://www.diva-portal.org/gih/', 'http://gi... | \n", "[301, 302] | \n", "0.301519 | \n", "NaN | \n", "200.0 | \n", "http://gih.diva-portal.org/smash/search.jsf?ds... | \n", "['http://www.diva-portal.org/gih/', 'http://gi... | \n", "[301, 302] | \n", "2.143105 | \n", "NaN | \n", "
13283 | \n", "http://www.compscipreprints.com/ | \n", "200.0 | \n", "http://survey-smiles.com | \n", "['http://www.compscipreprints.com/'] | \n", "[302] | \n", "0.257651 | \n", "NaN | \n", "200.0 | \n", "http://www.compscipreprints.com/ | \n", "[] | \n", "[] | \n", "0.093911 | \n", "NaN | \n", "
13320 | \n", "http://trinity.cdmhost.com/index.php | \n", "404.0 | \n", "https://www.oclc.org/url/?404;http://trinity.c... | \n", "['http://trinity.cdmhost.com/index.php'] | \n", "[302] | \n", "0.589119 | \n", "NaN | \n", "404.0 | \n", "https://www.oclc.org/url/notfound | \n", "['http://trinity.cdmhost.com/index.php', 'http... | \n", "[302, 302] | \n", "0.139563 | \n", "NaN | \n", "
146 rows × 13 columns
\n", "\n", " | url | \n", "head_url | \n", "head_final_code | \n", "head_codes | \n", "len | \n", "class | \n", "
---|---|---|---|---|---|---|
0 | \n", "http://sidc.be/silso/home | \n", "https://www.sidc.be/silso/home | \n", "200.0 | \n", "[302] | \n", "1 | \n", "200.0 | \n", "
1 | \n", "https://bmrb.io/ | \n", "https://bmrb.io/ | \n", "200.0 | \n", "[] | \n", "0 | \n", "200.0 | \n", "
2 | \n", "http://www.pac.dfo-mpo.gc.ca/science/oceans/da... | \n", "https://www.pac.dfo-mpo.gc.ca/science/oceans/d... | \n", "200.0 | \n", "[307] | \n", "1 | \n", "200.0 | \n", "
3 | \n", "https://www.cpc.ncep.noaa.gov/ | \n", "https://www.cpc.ncep.noaa.gov/ | \n", "200.0 | \n", "[] | \n", "0 | \n", "200.0 | \n", "
4 | \n", "http://cosmos.bot.kyoto-u.ac.jp/acytodb//cgi-b... | \n", "http://cosmos.bot.kyoto-u.ac.jp/acytodb//cgi-b... | \n", "404.0 | \n", "[] | \n", "0 | \n", "400.0 | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
13350 | \n", "http://cloud.ncl.edu.tw/chna/ | \n", "https://cloud.ncl.edu.tw/chna/ | \n", "200.0 | \n", "[302] | \n", "1 | \n", "200.0 | \n", "
13351 | \n", "http://www.myopenarchive.org/ | \n", "https://www.myopenarchive.org/ | \n", "200.0 | \n", "[301] | \n", "1 | \n", "200.0 | \n", "
13352 | \n", "http://radar.brookes.ac.uk/radar/access/home.do | \n", "https://radar.brookes.ac.uk/radar/home.do | \n", "200.0 | \n", "[302, 302, 302] | \n", "3 | \n", "200.0 | \n", "
13353 | \n", "http://www.ub.uni-siegen.de/opus | \n", "https://www.ub.uni-siegen.de/opus/ | \n", "200.0 | \n", "[301, 301] | \n", "2 | \n", "200.0 | \n", "
13355 | \n", "https://www.utas.edu.au/library | \n", "https://www.utas.edu.au/library | \n", "200.0 | \n", "[] | \n", "0 | \n", "200.0 | \n", "
10926 rows × 6 columns
\n", "\n", " | url | \n", "head_url | \n", "head_final_code | \n", "head_codes | \n", "len | \n", "class | \n", "
---|---|---|---|---|---|---|
count | \n", "10926 | \n", "10926 | \n", "10926.000000 | \n", "10926 | \n", "10926.000000 | \n", "10926.000000 | \n", "
unique | \n", "10926 | \n", "9331 | \n", "NaN | \n", "59 | \n", "NaN | \n", "NaN | \n", "
top | \n", "http://sidc.be/silso/home | \n", "https://www.unit.no/ugyldig-lenke-til-dokument... | \n", "NaN | \n", "[] | \n", "NaN | \n", "NaN | \n", "
freq | \n", "1 | \n", "16 | \n", "NaN | \n", "6596 | \n", "NaN | \n", "NaN | \n", "
mean | \n", "NaN | \n", "NaN | \n", "218.406736 | \n", "NaN | \n", "0.515559 | \n", "218.094454 | \n", "
std | \n", "NaN | \n", "NaN | \n", "61.035428 | \n", "NaN | \n", "0.749850 | \n", "60.063069 | \n", "
min | \n", "NaN | \n", "NaN | \n", "200.000000 | \n", "NaN | \n", "0.000000 | \n", "200.000000 | \n", "
25% | \n", "NaN | \n", "NaN | \n", "200.000000 | \n", "NaN | \n", "0.000000 | \n", "200.000000 | \n", "
50% | \n", "NaN | \n", "NaN | \n", "200.000000 | \n", "NaN | \n", "0.000000 | \n", "200.000000 | \n", "
75% | \n", "NaN | \n", "NaN | \n", "200.000000 | \n", "NaN | \n", "1.000000 | \n", "200.000000 | \n", "
max | \n", "NaN | \n", "NaN | \n", "504.000000 | \n", "NaN | \n", "5.000000 | \n", "500.000000 | \n", "
\n", " | url | \n", "head_final_code | \n", "head_codes | \n", "len | \n", "class | \n", "
---|---|---|---|---|---|
head_url | \n", "\n", " | \n", " | \n", " | \n", " | \n", " |
https://www.unit.no/ugyldig-lenke-til-dokument-i-vitenarkiv | \n", "16 | \n", "16 | \n", "16 | \n", "16 | \n", "16 | \n", "
https://www.nlm.nih.gov/toxnet/index.html | \n", "6 | \n", "6 | \n", "6 | \n", "6 | \n", "6 | \n", "
http://survey-smiles.com | \n", "6 | \n", "6 | \n", "6 | \n", "6 | \n", "6 | \n", "
https://nda.nih.gov/ | \n", "5 | \n", "5 | \n", "5 | \n", "5 | \n", "5 | \n", "
https://digitalrepository.unm.edu/ | \n", "4 | \n", "4 | \n", "4 | \n", "4 | \n", "4 | \n", "
https://ir.vanderbilt.edu/ | \n", "4 | \n", "4 | \n", "4 | \n", "4 | \n", "4 | \n", "
https://ddd.uab.cat/ | \n", "4 | \n", "4 | \n", "4 | \n", "4 | \n", "4 | \n", "
https://intellectum.unisabana.edu.co/ | \n", "4 | \n", "4 | \n", "4 | \n", "4 | \n", "4 | \n", "
https://opus.bibliothek.uni-augsburg.de/opus4/home | \n", "4 | \n", "4 | \n", "4 | \n", "4 | \n", "4 | \n", "
https://pure.iiasa.ac.at/ | \n", "4 | \n", "4 | \n", "4 | \n", "4 | \n", "4 | \n", "
http://eprints.nottingham.ac.uk/ | \n", "4 | \n", "4 | \n", "4 | \n", "4 | \n", "4 | \n", "
https://research.usc.edu.au/esploro/ | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "
https://dataverse.harvard.edu/ | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "
https://epub.wupperinst.org/home | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "
https://pure.mpg.de/ | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "
https://dlib.york.ac.uk/yodl/app/home/index | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "
https://archiv.ub.uni-marburg.de/ubfind/ | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "
https://eprints.unife.it/ | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "
https://dataspace.princeton.edu/ | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "
https://eprints.lib.hokudai.ac.jp/ | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "
https://pub.uni-bielefeld.de/ | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "
https://aquadocs.org/ | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "
https://dataverse.tdl.org/ | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "
https://uwspace.uwaterloo.ca/ | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "
https://research.utwente.nl/ | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "
https://datadryad.org/stash | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "
https://er.knutd.edu.ua/ | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "
https://esango.cput.ac.za/ | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "
https://repositorio.fucsalud.edu.co/ | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "
https://repository.up.ac.za/ | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "
https://repository.usta.edu.co/ | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "
https://repositori.upf.edu/ | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "
https://bibliotecadigital.exactas.uba.ar/ | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "
https://repo.odmu.edu.ua/xmlui/ | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "
https://bcnroc.ajuntament.barcelona.cat/jspui/ | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "
https://data.gov.uk/ | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "
https://mru.arcabc.ca/ | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "
https://munin.uit.no/ | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "
https://red.uao.edu.co/ | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "
https://research-repository.st-andrews.ac.uk/ | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "
https://research-repository.uwa.edu.au/ | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "
https://research.cbs.dk/ | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "
https://webext.pasteur.fr/genolist/ | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "
https://prism.ucalgary.ca/ | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "
https://air.unimi.it/ | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "
http://rua.ua.es/dspace/ | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "
https://dial.uclouvain.be/ | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "
https://sc.lib.miamioh.edu/ | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "
https://dspace.ankara.edu.tr/xmlui/ | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "
https://scholar.smu.edu/ | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "
\n", " | url | \n", "get_final_code | \n", "get_codes | \n", "len | \n", "class | \n", "
---|---|---|---|---|---|
get_url | \n", "\n", " | \n", " | \n", " | \n", " | \n", " |
https://www.unit.no/ugyldig-lenke-til-dokument-i-vitenarkiv | \n", "16 | \n", "16 | \n", "16 | \n", "16 | \n", "16 | \n", "
https://www.oclc.org/url/notfound | \n", "7 | \n", "7 | \n", "7 | \n", "7 | \n", "7 | \n", "
https://www.nlm.nih.gov/toxnet/index.html | \n", "6 | \n", "6 | \n", "6 | \n", "6 | \n", "6 | \n", "
https://nda.nih.gov/ | \n", "5 | \n", "5 | \n", "5 | \n", "5 | \n", "5 | \n", "
https://digitalrepository.unm.edu/ | \n", "4 | \n", "4 | \n", "4 | \n", "4 | \n", "4 | \n", "
https://opus.bibliothek.uni-augsburg.de/opus4/home | \n", "4 | \n", "4 | \n", "4 | \n", "4 | \n", "4 | \n", "
https://intellectum.unisabana.edu.co/ | \n", "4 | \n", "4 | \n", "4 | \n", "4 | \n", "4 | \n", "
https://pure.iiasa.ac.at/ | \n", "4 | \n", "4 | \n", "4 | \n", "4 | \n", "4 | \n", "
https://ir.vanderbilt.edu/ | \n", "4 | \n", "4 | \n", "4 | \n", "4 | \n", "4 | \n", "
http://eprints.nottingham.ac.uk/ | \n", "4 | \n", "4 | \n", "4 | \n", "4 | \n", "4 | \n", "
https://ddd.uab.cat/ | \n", "4 | \n", "4 | \n", "4 | \n", "4 | \n", "4 | \n", "
https://mru.arcabc.ca/ | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "
https://research.usc.edu.au/esploro/ | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "
https://aquadocs.org/ | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "
https://uwspace.uwaterloo.ca/ | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "
https://pub.uni-bielefeld.de/ | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "
https://dataverse.tdl.org/ | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "
https://eprints.lib.hokudai.ac.jp/ | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "
https://archiv.ub.uni-marburg.de/ubfind/ | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "
https://eprints.unife.it/ | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "
https://repositorio.fucsalud.edu.co/ | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "
https://research.utwente.nl/ | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "
https://repository.up.ac.za/ | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "
https://pure.mpg.de/ | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "
https://epub.wupperinst.org/home | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "
https://archive.researchdata.leeds.ac.uk/ | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "
https://repository.usta.edu.co/ | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "
https://dataverse.harvard.edu/ | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "
https://bcnroc.ajuntament.barcelona.cat/jspui/ | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "
https://er.knutd.edu.ua/ | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "
https://dataspace.princeton.edu/ | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "
https://repositori.upf.edu/ | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "
https://bibliotecadigital.exactas.uba.ar/ | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "
https://prism.ucalgary.ca/ | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "
https://research.cbs.dk/ | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "
https://webext.pasteur.fr/genolist/ | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "
https://ngdc.cncb.ac.cn/idog/ | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "
https://research-repository.uwa.edu.au/ | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "
https://research-repository.st-andrews.ac.uk/ | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "
https://repo.odmu.edu.ua/xmlui/ | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "
https://red.uao.edu.co/ | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "
https://data.gov.uk/ | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "
https://munin.uit.no/ | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "
https://datadryad.org/stash | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "
http://rua.ua.es/dspace/ | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "
http://dspace.uevora.pt/rdpc/ | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "
https://sc.lib.miamioh.edu/ | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "
https://papyrus.bib.umontreal.ca/xmlui/ | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "
https://scholar.smu.edu/ | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "
https://dro.deakin.edu.au/ | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "3 | \n", "
\n", " | url | \n", "head_final_code | \n", "head_codes | \n", "len | \n", "class | \n", "
---|---|---|---|---|---|
head_url | \n", "\n", " | \n", " | \n", " | \n", " | \n", " |
http://103.82.172.44:8080/xmlui/ | \n", "[http://103.82.172.44:8080/xmlui/] | \n", "[200.0] | \n", "[[]] | \n", "[0] | \n", "[200.0] | \n", "
http://109.185.200.51/ | \n", "[http://109.185.200.51/] | \n", "[200.0] | \n", "[[]] | \n", "[0] | \n", "[200.0] | \n", "
http://119.3.41.228/dnmivd/ | \n", "[http://www.unimd.org/dnmivd/] | \n", "[200.0] | \n", "[[302]] | \n", "[1] | \n", "[200.0] | \n", "
http://119.78.100.183/ | \n", "[http://119.78.100.183] | \n", "[403.0] | \n", "[[]] | \n", "[0] | \n", "[400.0] | \n", "
http://125.99.47.158:8090/jspui/ | \n", "[http://125.99.47.158:8090/jspui, http://125.9... | \n", "[200.0, 200.0] | \n", "[[302], []] | \n", "[1, 0] | \n", "[200.0, 200.0] | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
https://zks.uni-koeln.de/index.php?s=studien&c=studien_klinische-studien | \n", "[http://zks.uni-koeln.de/index.php?s=studien&c... | \n", "[200.0] | \n", "[[301]] | \n", "[1] | \n", "[200.0] | \n", "
https://zokei.repo.nii.ac.jp/ | \n", "[https://zokei.repo.nii.ac.jp/] | \n", "[200.0] | \n", "[[]] | \n", "[0] | \n", "[200.0] | \n", "
https://zoltardata.com/ | \n", "[https://zoltardata.com/] | \n", "[200.0] | \n", "[[]] | \n", "[0] | \n", "[200.0] | \n", "
https://zone.biblio.laurentian.ca/ | \n", "[https://zone.biblio.laurentian.ca, https://zo... | \n", "[200.0, 200.0] | \n", "[[], []] | \n", "[0, 0] | \n", "[200.0, 200.0] | \n", "
https://zuscholars.zu.ac.ae/ | \n", "[https://zuscholars.zu.ac.ae, https://zuschola... | \n", "[200.0, 200.0] | \n", "[[], []] | \n", "[0, 0] | \n", "[200.0, 200.0] | \n", "
9331 rows × 5 columns
\n", "\n", " | url | \n", "head_final_code | \n", "head_codes | \n", "len | \n", "class | \n", "
---|---|---|---|---|---|
head_url | \n", "\n", " | \n", " | \n", " | \n", " | \n", " |
http://125.99.47.158:8090/jspui/ | \n", "[http://125.99.47.158:8090/jspui, http://125.9... | \n", "[200.0, 200.0] | \n", "[[302], []] | \n", "[1, 0] | \n", "[200.0, 200.0] | \n", "
http://160.97.80.9:8080/jspui/ | \n", "[http://160.97.80.9:8080/jspui/, http://160.97... | \n", "[404.0, 404.0] | \n", "[[], [302]] | \n", "[0, 1] | \n", "[400.0, 400.0] | \n", "
http://acikarsiv.atauni.edu.tr/ | \n", "[http://acikarsiv.atauni.edu.tr/, http://acika... | \n", "[200.0, 200.0] | \n", "[[], []] | \n", "[0, 0] | \n", "[200.0, 200.0] | \n", "
http://acikarsiv.atilim.edu.tr/ | \n", "[http://acikarsiv.atilim.edu.tr/, http://acika... | \n", "[200.0, 200.0] | \n", "[[], []] | \n", "[0, 0] | \n", "[200.0, 200.0] | \n", "
http://acikerisim.afsu.edu.tr/xmlui/ | \n", "[http://acikerisim.afsu.edu.tr, http://acikeri... | \n", "[200.0, 200.0] | \n", "[[302, 302], [302, 302]] | \n", "[2, 2] | \n", "[200.0, 200.0] | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
https://zaguan.unizar.es/ | \n", "[http://zaguan.unizar.es/, http://zaguan.uniza... | \n", "[200.0, 200.0] | \n", "[[301], [301]] | \n", "[1, 1] | \n", "[200.0, 200.0] | \n", "
https://zbc.ksiaznica.szczecin.pl/dlibra | \n", "[http://zbc.ksiaznica.szczecin.pl/dlibra, http... | \n", "[200.0, 200.0] | \n", "[[302], [302, 302]] | \n", "[1, 2] | \n", "[200.0, 200.0] | \n", "
https://zenodo.org/ | \n", "[https://zenodo.org/, http://zenodo.org/] | \n", "[200.0, 200.0] | \n", "[[], [301]] | \n", "[0, 1] | \n", "[200.0, 200.0] | \n", "
https://zone.biblio.laurentian.ca/ | \n", "[https://zone.biblio.laurentian.ca, https://zo... | \n", "[200.0, 200.0] | \n", "[[], []] | \n", "[0, 0] | \n", "[200.0, 200.0] | \n", "
https://zuscholars.zu.ac.ae/ | \n", "[https://zuscholars.zu.ac.ae, https://zuschola... | \n", "[200.0, 200.0] | \n", "[[], []] | \n", "[0, 0] | \n", "[200.0, 200.0] | \n", "
1456 rows × 5 columns
\n", "\n", " | url | \n", "get_final_code | \n", "get_codes | \n", "len | \n", "class | \n", "
---|---|---|---|---|---|
get_url | \n", "\n", " | \n", " | \n", " | \n", " | \n", " |
http://103.82.172.44:8080/xmlui/ | \n", "[http://103.82.172.44:8080/xmlui/] | \n", "[200.0] | \n", "[[]] | \n", "[0] | \n", "[200.0] | \n", "
http://109.185.200.51/ | \n", "[http://109.185.200.51/] | \n", "[200.0] | \n", "[[]] | \n", "[0] | \n", "[200.0] | \n", "
http://119.3.41.228/dnmivd/ | \n", "[http://www.unimd.org/dnmivd/] | \n", "[200.0] | \n", "[[302]] | \n", "[1] | \n", "[200.0] | \n", "
http://119.78.100.183/ | \n", "[http://119.78.100.183] | \n", "[200.0] | \n", "[[]] | \n", "[0] | \n", "[200.0] | \n", "
http://125.99.47.158:8090/jspui/ | \n", "[http://125.99.47.158:8090/jspui, http://125.9... | \n", "[200.0, 200.0] | \n", "[[302], []] | \n", "[1, 0] | \n", "[200.0, 200.0] | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
https://zks.uni-koeln.de/index.php?s=studien&c=studien_klinische-studien | \n", "[http://zks.uni-koeln.de/index.php?s=studien&c... | \n", "[200.0] | \n", "[[301]] | \n", "[1] | \n", "[200.0] | \n", "
https://zokei.repo.nii.ac.jp/ | \n", "[https://zokei.repo.nii.ac.jp/] | \n", "[200.0] | \n", "[[]] | \n", "[0] | \n", "[200.0] | \n", "
https://zoltardata.com/ | \n", "[https://zoltardata.com/] | \n", "[200.0] | \n", "[[]] | \n", "[0] | \n", "[200.0] | \n", "
https://zone.biblio.laurentian.ca/ | \n", "[https://zone.biblio.laurentian.ca, https://zo... | \n", "[200.0, 200.0] | \n", "[[], []] | \n", "[0, 0] | \n", "[200.0, 200.0] | \n", "
https://zuscholars.zu.ac.ae/ | \n", "[https://zuscholars.zu.ac.ae, https://zuschola... | \n", "[200.0, 200.0] | \n", "[[], []] | \n", "[0, 0] | \n", "[200.0, 200.0] | \n", "
9353 rows × 5 columns
\n", "\n", " | url | \n", "get_final_code | \n", "get_codes | \n", "len | \n", "class | \n", "
---|---|---|---|---|---|
get_url | \n", "\n", " | \n", " | \n", " | \n", " | \n", " |
http://125.99.47.158:8090/jspui/ | \n", "[http://125.99.47.158:8090/jspui, http://125.9... | \n", "[200.0, 200.0] | \n", "[[302], []] | \n", "[1, 0] | \n", "[200.0, 200.0] | \n", "
http://160.97.80.9:8080/jspui/ | \n", "[http://160.97.80.9:8080/jspui/, http://160.97... | \n", "[404.0, 404.0] | \n", "[[], [302]] | \n", "[0, 1] | \n", "[400.0, 400.0] | \n", "
http://acikarsiv.atauni.edu.tr/ | \n", "[http://acikarsiv.atauni.edu.tr/, http://acika... | \n", "[200.0, 200.0] | \n", "[[], []] | \n", "[0, 0] | \n", "[200.0, 200.0] | \n", "
http://acikarsiv.atilim.edu.tr/ | \n", "[http://acikarsiv.atilim.edu.tr/, http://acika... | \n", "[200.0, 200.0] | \n", "[[], []] | \n", "[0, 0] | \n", "[200.0, 200.0] | \n", "
http://acikerisim.afsu.edu.tr/xmlui/ | \n", "[http://acikerisim.afsu.edu.tr, http://acikeri... | \n", "[200.0, 200.0] | \n", "[[302, 302], [302, 302]] | \n", "[2, 2] | \n", "[200.0, 200.0] | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
https://zaguan.unizar.es/ | \n", "[http://zaguan.unizar.es/, http://zaguan.uniza... | \n", "[200.0, 200.0] | \n", "[[301], [301]] | \n", "[1, 1] | \n", "[200.0, 200.0] | \n", "
https://zbc.ksiaznica.szczecin.pl/dlibra | \n", "[http://zbc.ksiaznica.szczecin.pl/dlibra, http... | \n", "[200.0, 200.0] | \n", "[[302], [302, 302]] | \n", "[1, 2] | \n", "[200.0, 200.0] | \n", "
https://zenodo.org/ | \n", "[https://zenodo.org/, http://zenodo.org/] | \n", "[200.0, 200.0] | \n", "[[], [301]] | \n", "[0, 1] | \n", "[200.0, 200.0] | \n", "
https://zone.biblio.laurentian.ca/ | \n", "[https://zone.biblio.laurentian.ca, https://zo... | \n", "[200.0, 200.0] | \n", "[[], []] | \n", "[0, 0] | \n", "[200.0, 200.0] | \n", "
https://zuscholars.zu.ac.ae/ | \n", "[https://zuscholars.zu.ac.ae, https://zuschola... | \n", "[200.0, 200.0] | \n", "[[], []] | \n", "[0, 0] | \n", "[200.0, 200.0] | \n", "
1459 rows × 5 columns
\n", "