added cc_licences and abstracts in observatory db
This commit is contained in:
parent
9b1936701c
commit
de9bf3a161
|
@ -23,6 +23,11 @@ CREATE OR REPLACE VIEW ${stats_db_name}.rndexpediture AS
|
||||||
SELECT *
|
SELECT *
|
||||||
FROM ${external_stats_db_name}.rndexpediture;
|
FROM ${external_stats_db_name}.rndexpediture;
|
||||||
|
|
||||||
|
CREATE OR REPLACE VIEW ${stats_db_name}.licenses_normalized AS
|
||||||
|
SELECT *
|
||||||
|
FROM ${external_stats_db_name}.licenses_normalized;
|
||||||
|
|
||||||
|
|
||||||
------------------------------------------------------------------------------------------------
|
------------------------------------------------------------------------------------------------
|
||||||
------------------------------------------------------------------------------------------------
|
------------------------------------------------------------------------------------------------
|
||||||
-- Creation date of the database
|
-- Creation date of the database
|
||||||
|
|
|
@ -1,41 +1,44 @@
|
||||||
create table TARGET.result_affiliated_country stored as parquet as
|
create table TARGET.result_affiliated_country stored as parquet as
|
||||||
select count(distinct r.id) as total, r.green, r.gold, case when rl.type is not null then true else false end as licence,
|
select count(distinct r.id) as total, r.green, r.gold, case when rl.type is not null then true else false end as licence,
|
||||||
case when pids.pid is not null then true else false end as pid, case when r.access_mode in ('Open Access', 'Open Source') then true else false end as oa,
|
case when pids.pid is not null then true else false end as pid, case when r.access_mode in ('Open Access', 'Open Source') then true else false end as oa,
|
||||||
r.peer_reviewed, r.type, c.code as ccode, c.name as cname
|
r.peer_reviewed, case when lower(rln.normalized) like 'cc-%' then true else false end as cc_licence, r.abstract as abstract, r.type, c.code as ccode, c.name as cname
|
||||||
from SOURCE.result r
|
from SOURCE.result r
|
||||||
join SOURCE.result_organization ro on ro.id=r.id
|
join SOURCE.result_organization ro on ro.id=r.id
|
||||||
join SOURCE.organization o on o.id=ro.organization
|
join SOURCE.organization o on o.id=ro.organization
|
||||||
join SOURCE.country c on c.code=o.country and c.continent_name='Europe'
|
join SOURCE.country c on c.code=o.country and c.continent_name='Europe'
|
||||||
left outer join SOURCE.result_licenses rl on rl.id=r.id
|
left outer join SOURCE.result_licenses rl on rl.id=r.id
|
||||||
left outer join SOURCE.result_pids pids on pids.id=r.id
|
left outer join SOURCE.result_pids pids on pids.id=r.id
|
||||||
group by r.green, r.gold, licence, pid, oa, r.peer_reviewed, r.type, c.code, c.name;
|
left outer join SOURCE.licenses_normalized rln on rln.license=rl.type
|
||||||
|
group by r.green, r.gold, licence, pid, oa, r.peer_reviewed, r.type, cc_licence, abstract, c.code, c.name;
|
||||||
|
|
||||||
create table TARGET.result_affiliated_year stored as parquet as
|
create table TARGET.result_affiliated_year stored as parquet as
|
||||||
select count(distinct r.id) as total, r.green, r.gold, case when rl.type is not null then true else false end as licence,
|
select count(distinct r.id) as total, r.green, r.gold, case when rl.type is not null then true else false end as licence,
|
||||||
case when pids.pid is not null then true else false end as pid, case when r.access_mode in ('Open Access', 'Open Source') then true else false end as oa, r.peer_reviewed, r.type, r.year
|
case when pids.pid is not null then true else false end as pid, case when r.access_mode in ('Open Access', 'Open Source') then true else false end as oa, r.peer_reviewed, case when lower(rln.normalized) like 'cc-%' then true else false end as cc_licence, r.abstract as abstract, r.type, r.year
|
||||||
from SOURCE.result r
|
from SOURCE.result r
|
||||||
join SOURCE.result_organization ro on ro.id=r.id
|
join SOURCE.result_organization ro on ro.id=r.id
|
||||||
join SOURCE.organization o on o.id=ro.organization
|
join SOURCE.organization o on o.id=ro.organization
|
||||||
join SOURCE.country c on c.code=o.country and c.continent_name='Europe'
|
join SOURCE.country c on c.code=o.country and c.continent_name='Europe'
|
||||||
left outer join SOURCE.result_licenses rl on rl.id=r.id
|
left outer join SOURCE.result_licenses rl on rl.id=r.id
|
||||||
left outer join SOURCE.result_pids pids on pids.id=r.id
|
left outer join SOURCE.result_pids pids on pids.id=r.id
|
||||||
group by r.green, r.gold, licence, pid, oa, r.peer_reviewed, r.type, r.year;
|
left outer join SOURCE.licenses_normalized rln on rln.license=rl.type
|
||||||
|
group by r.green, r.gold, licence, pid, oa, r.peer_reviewed, r.type, cc_licence, abstract, r.year;
|
||||||
|
|
||||||
create table TARGET.result_affiliated_year_country stored as parquet as
|
create table TARGET.result_affiliated_year_country stored as parquet as
|
||||||
select count(distinct r.id) as total, r.green, r.gold, case when rl.type is not null then true else false end as licence,
|
select count(distinct r.id) as total, r.green, r.gold, case when rl.type is not null then true else false end as licence,
|
||||||
case when pids.pid is not null then true else false end as pid, case when r.access_mode in ('Open Access', 'Open Source') then true else false end as oa,
|
case when pids.pid is not null then true else false end as pid, case when r.access_mode in ('Open Access', 'Open Source') then true else false end as oa,
|
||||||
r.peer_reviewed, r.type, r.year, c.code as ccode, c.name as cname
|
r.peer_reviewed, case when lower(rln.normalized) like 'cc-%' then true else false end as cc_licence, r.abstract as abstract, r.type, r.year, c.code as ccode, c.name as cname
|
||||||
from SOURCE.result r
|
from SOURCE.result r
|
||||||
join SOURCE.result_organization ro on ro.id=r.id
|
join SOURCE.result_organization ro on ro.id=r.id
|
||||||
join SOURCE.organization o on o.id=ro.organization
|
join SOURCE.organization o on o.id=ro.organization
|
||||||
join SOURCE.country c on c.code=o.country and c.continent_name='Europe'
|
join SOURCE.country c on c.code=o.country and c.continent_name='Europe'
|
||||||
left outer join SOURCE.result_licenses rl on rl.id=r.id
|
left outer join SOURCE.result_licenses rl on rl.id=r.id
|
||||||
left outer join SOURCE.result_pids pids on pids.id=r.id
|
left outer join SOURCE.result_pids pids on pids.id=r.id
|
||||||
group by r.green, r.gold, licence, pid, oa, r.peer_reviewed, r.type, r.year, c.code, c.name;
|
left outer join SOURCE.licenses_normalized rln on rln.license=rl.type
|
||||||
|
group by r.green, r.gold, licence, pid, oa, r.peer_reviewed, r.type, cc_licence, abstract, r.year, c.code, c.name;
|
||||||
|
|
||||||
create table TARGET.result_affiliated_datasource stored as parquet as
|
create table TARGET.result_affiliated_datasource stored as parquet as
|
||||||
select count(distinct r.id) as total, r.green, r.gold, case when rl.type is not null then true else false end as licence,
|
select count(distinct r.id) as total, r.green, r.gold, case when rl.type is not null then true else false end as licence,
|
||||||
case when pids.pid is not null then true else false end as pid, case when r.access_mode in ('Open Access', 'Open Source') then true else false end as oa, r.peer_reviewed, r.type, d.name as dname
|
case when pids.pid is not null then true else false end as pid, case when r.access_mode in ('Open Access', 'Open Source') then true else false end as oa, r.peer_reviewed, case when lower(rln.normalized) like 'cc-%' then true else false end as cc_licence, r.abstract as abstract, r.type, d.name as dname
|
||||||
from SOURCE.result r
|
from SOURCE.result r
|
||||||
join SOURCE.result_organization ro on ro.id=r.id
|
join SOURCE.result_organization ro on ro.id=r.id
|
||||||
join SOURCE.organization o on o.id=ro.organization
|
join SOURCE.organization o on o.id=ro.organization
|
||||||
|
@ -44,12 +47,13 @@ left outer join SOURCE.result_datasources rd on rd.id=r.id
|
||||||
left outer join SOURCE.datasource d on d.id=rd.datasource
|
left outer join SOURCE.datasource d on d.id=rd.datasource
|
||||||
left outer join SOURCE.result_licenses rl on rl.id=r.id
|
left outer join SOURCE.result_licenses rl on rl.id=r.id
|
||||||
left outer join SOURCE.result_pids pids on pids.id=r.id
|
left outer join SOURCE.result_pids pids on pids.id=r.id
|
||||||
group by r.green, r.gold, licence, pid, oa, r.peer_reviewed, r.type, d.name;
|
left outer join SOURCE.licenses_normalized rln on rln.license=rl.type
|
||||||
|
group by r.green, r.gold, licence, pid, oa, r.peer_reviewed, r.type, cc_licence, abstract, d.name;
|
||||||
|
|
||||||
create table TARGET.result_affiliated_datasource_country stored as parquet as
|
create table TARGET.result_affiliated_datasource_country stored as parquet as
|
||||||
select count(distinct r.id) as total, r.green, r.gold, case when rl.type is not null then true else false end as licence,
|
select count(distinct r.id) as total, r.green, r.gold, case when rl.type is not null then true else false end as licence,
|
||||||
case when pids.pid is not null then true else false end as pid, case when r.access_mode in ('Open Access', 'Open Source') then true else false end as oa,
|
case when pids.pid is not null then true else false end as pid, case when r.access_mode in ('Open Access', 'Open Source') then true else false end as oa,
|
||||||
r.peer_reviewed, r.type, d.name as dname, c.code as ccode, c.name as cname
|
r.peer_reviewed, case when lower(rln.normalized) like 'cc-%' then true else false end as cc_licence, r.abstract as abstract, r.type, d.name as dname, c.code as ccode, c.name as cname
|
||||||
from SOURCE.result r
|
from SOURCE.result r
|
||||||
join SOURCE.result_organization ro on ro.id=r.id
|
join SOURCE.result_organization ro on ro.id=r.id
|
||||||
join SOURCE.organization o on o.id=ro.organization
|
join SOURCE.organization o on o.id=ro.organization
|
||||||
|
@ -58,35 +62,38 @@ left outer join SOURCE.result_datasources rd on rd.id=r.id
|
||||||
left outer join SOURCE.datasource d on d.id=rd.datasource
|
left outer join SOURCE.datasource d on d.id=rd.datasource
|
||||||
left outer join SOURCE.result_licenses rl on rl.id=r.id
|
left outer join SOURCE.result_licenses rl on rl.id=r.id
|
||||||
left outer join SOURCE.result_pids pids on pids.id=r.id
|
left outer join SOURCE.result_pids pids on pids.id=r.id
|
||||||
group by r.green, r.gold, licence, pid, oa, r.peer_reviewed, r.type, d.name, c.code, c.name;
|
left outer join SOURCE.licenses_normalized rln on rln.license=rl.type
|
||||||
|
group by r.green, r.gold, licence, pid, oa, r.peer_reviewed, r.type, cc_licence, abstract, d.name, c.code, c.name;
|
||||||
|
|
||||||
create table TARGET.result_affiliated_organization stored as parquet as
|
create table TARGET.result_affiliated_organization stored as parquet as
|
||||||
select count(distinct r.id) as total, r.green, r.gold, case when rl.type is not null then true else false end as licence,
|
select count(distinct r.id) as total, r.green, r.gold, case when rl.type is not null then true else false end as licence,
|
||||||
case when pids.pid is not null then true else false end as pid, case when r.access_mode in ('Open Access', 'Open Source') then true else false end as oa,
|
case when pids.pid is not null then true else false end as pid, case when r.access_mode in ('Open Access', 'Open Source') then true else false end as oa,
|
||||||
r.peer_reviewed, r.type, o.name as oname
|
r.peer_reviewed, case when lower(rln.normalized) like 'cc-%' then true else false end as cc_licence, r.abstract as abstract, r.type, o.name as oname
|
||||||
from SOURCE.result r
|
from SOURCE.result r
|
||||||
join SOURCE.result_organization ro on ro.id=r.id
|
join SOURCE.result_organization ro on ro.id=r.id
|
||||||
join SOURCE.organization o on o.id=ro.organization
|
join SOURCE.organization o on o.id=ro.organization
|
||||||
join SOURCE.country c on c.code=o.country and c.continent_name='Europe'
|
join SOURCE.country c on c.code=o.country and c.continent_name='Europe'
|
||||||
left outer join SOURCE.result_licenses rl on rl.id=r.id
|
left outer join SOURCE.result_licenses rl on rl.id=r.id
|
||||||
left outer join SOURCE.result_pids pids on pids.id=r.id
|
left outer join SOURCE.result_pids pids on pids.id=r.id
|
||||||
group by r.green, r.gold, licence, pid, oa, r.peer_reviewed, r.type, o.name;
|
left outer join SOURCE.licenses_normalized rln on rln.license=rl.type
|
||||||
|
group by r.green, r.gold, licence, pid, oa, r.peer_reviewed, r.type, cc_licence, abstract, o.name;
|
||||||
|
|
||||||
create table TARGET.result_affiliated_organization_country stored as parquet as
|
create table TARGET.result_affiliated_organization_country stored as parquet as
|
||||||
select count(distinct r.id) as total, r.green, r.gold, case when rl.type is not null then true else false end as licence,
|
select count(distinct r.id) as total, r.green, r.gold, case when rl.type is not null then true else false end as licence,
|
||||||
case when pids.pid is not null then true else false end as pid, case when r.access_mode in ('Open Access', 'Open Source') then true else false end as oa,
|
case when pids.pid is not null then true else false end as pid, case when r.access_mode in ('Open Access', 'Open Source') then true else false end as oa,
|
||||||
r.peer_reviewed, r.type, o.name as oname, c.code as ccode, c.name as cname
|
r.peer_reviewed, case when lower(rln.normalized) like 'cc-%' then true else false end as cc_licence, r.abstract as abstract, r.type, o.name as oname, c.code as ccode, c.name as cname
|
||||||
from SOURCE.result r
|
from SOURCE.result r
|
||||||
join SOURCE.result_organization ro on ro.id=r.id
|
join SOURCE.result_organization ro on ro.id=r.id
|
||||||
join SOURCE.organization o on o.id=ro.organization
|
join SOURCE.organization o on o.id=ro.organization
|
||||||
join SOURCE.country c on c.code=o.country and c.continent_name='Europe'
|
join SOURCE.country c on c.code=o.country and c.continent_name='Europe'
|
||||||
left outer join SOURCE.result_licenses rl on rl.id=r.id
|
left outer join SOURCE.result_licenses rl on rl.id=r.id
|
||||||
left outer join SOURCE.result_pids pids on pids.id=r.id
|
left outer join SOURCE.result_pids pids on pids.id=r.id
|
||||||
group by r.green, r.gold, licence, pid, oa, r.peer_reviewed, r.type, o.name, c.code, c.name;
|
left outer join SOURCE.licenses_normalized rln on rln.license=rl.type
|
||||||
|
group by r.green, r.gold, licence, pid, oa, r.peer_reviewed, r.type, cc_licence, abstract, o.name, c.code, c.name;
|
||||||
|
|
||||||
create table TARGET.result_affiliated_funder stored as parquet as
|
create table TARGET.result_affiliated_funder stored as parquet as
|
||||||
select count(distinct r.id) as total, r.green, r.gold, case when rl.type is not null then true else false end as licence,
|
select count(distinct r.id) as total, r.green, r.gold, case when rl.type is not null then true else false end as licence,
|
||||||
case when pids.pid is not null then true else false end as pid, case when r.access_mode in ('Open Access', 'Open Source') then true else false end as oa, r.peer_reviewed, r.type, p.funder as pfunder
|
case when pids.pid is not null then true else false end as pid, case when r.access_mode in ('Open Access', 'Open Source') then true else false end as oa, r.peer_reviewed, case when lower(rln.normalized) like 'cc-%' then true else false end as cc_licence, r.abstract as abstract, r.type, p.funder as pfunder
|
||||||
from SOURCE.result r
|
from SOURCE.result r
|
||||||
join SOURCE.result_organization ro on ro.id=r.id
|
join SOURCE.result_organization ro on ro.id=r.id
|
||||||
join SOURCE.organization o on o.id=ro.organization
|
join SOURCE.organization o on o.id=ro.organization
|
||||||
|
@ -95,12 +102,13 @@ join SOURCE.result_projects rp on rp.id=r.id
|
||||||
join SOURCE.project p on p.id=rp.project
|
join SOURCE.project p on p.id=rp.project
|
||||||
left outer join SOURCE.result_licenses rl on rl.id=r.id
|
left outer join SOURCE.result_licenses rl on rl.id=r.id
|
||||||
left outer join SOURCE.result_pids pids on pids.id=r.id
|
left outer join SOURCE.result_pids pids on pids.id=r.id
|
||||||
group by r.green, r.gold, licence, pid, oa, r.peer_reviewed, r.type, p.funder;
|
left outer join SOURCE.licenses_normalized rln on rln.license=rl.type
|
||||||
|
group by r.green, r.gold, licence, pid, oa, r.peer_reviewed, r.type, cc_licence, abstract, p.funder;
|
||||||
|
|
||||||
create table TARGET.result_affiliated_funder_country stored as parquet as
|
create table TARGET.result_affiliated_funder_country stored as parquet as
|
||||||
select count(distinct r.id) as total, r.green, r.gold, case when rl.type is not null then true else false end as licence,
|
select count(distinct r.id) as total, r.green, r.gold, case when rl.type is not null then true else false end as licence,
|
||||||
case when pids.pid is not null then true else false end as pid, case when r.access_mode in ('Open Access', 'Open Source') then true else false end as oa,
|
case when pids.pid is not null then true else false end as pid, case when r.access_mode in ('Open Access', 'Open Source') then true else false end as oa,
|
||||||
r.peer_reviewed, r.type, p.funder as pfunder, c.code as ccode, c.name as cname
|
r.peer_reviewed, case when lower(rln.normalized) like 'cc-%' then true else false end as cc_licence, r.abstract as abstract, r.type, p.funder as pfunder, c.code as ccode, c.name as cname
|
||||||
from SOURCE.result r
|
from SOURCE.result r
|
||||||
join SOURCE.result_organization ro on ro.id=r.id
|
join SOURCE.result_organization ro on ro.id=r.id
|
||||||
join SOURCE.organization o on o.id=ro.organization
|
join SOURCE.organization o on o.id=ro.organization
|
||||||
|
@ -109,12 +117,13 @@ join SOURCE.result_projects rp on rp.id=r.id
|
||||||
join SOURCE.project p on p.id=rp.project
|
join SOURCE.project p on p.id=rp.project
|
||||||
left outer join SOURCE.result_licenses rl on rl.id=r.id
|
left outer join SOURCE.result_licenses rl on rl.id=r.id
|
||||||
left outer join SOURCE.result_pids pids on pids.id=r.id
|
left outer join SOURCE.result_pids pids on pids.id=r.id
|
||||||
group by r.green, r.gold, licence, pid, oa, r.peer_reviewed, r.type, p.funder, c.code, c.name;
|
left outer join SOURCE.licenses_normalized rln on rln.license=rl.type
|
||||||
|
group by r.green, r.gold, licence, pid, oa, r.peer_reviewed, r.type, cc_licence, abstract, p.funder, c.code, c.name;
|
||||||
|
|
||||||
create table TARGET.result_deposited_country stored as parquet as
|
create table TARGET.result_deposited_country stored as parquet as
|
||||||
select count(distinct r.id) as total, r.green, r.gold, case when rl.type is not null then true else false end as licence,
|
select count(distinct r.id) as total, r.green, r.gold, case when rl.type is not null then true else false end as licence,
|
||||||
case when pids.pid is not null then true else false end as pid, case when r.access_mode in ('Open Access', 'Open Source') then true else false end as oa,
|
case when pids.pid is not null then true else false end as pid, case when r.access_mode in ('Open Access', 'Open Source') then true else false end as oa,
|
||||||
r.peer_reviewed, r.type, c.code as ccode, c.name as cname
|
r.peer_reviewed, case when lower(rln.normalized) like 'cc-%' then true else false end as cc_licence, r.abstract as abstract, r.type, c.code as ccode, c.name as cname
|
||||||
from SOURCE.result r
|
from SOURCE.result r
|
||||||
join SOURCE.result_datasources rd on rd.id=r.id
|
join SOURCE.result_datasources rd on rd.id=r.id
|
||||||
join SOURCE.datasource d on d.id=rd.datasource and d.type in ('Institutional Repository','Data Repository', 'Repository', 'Publication Repository')
|
join SOURCE.datasource d on d.id=rd.datasource and d.type in ('Institutional Repository','Data Repository', 'Repository', 'Publication Repository')
|
||||||
|
@ -123,11 +132,12 @@ join SOURCE.organization o on o.id=dor.organization
|
||||||
join SOURCE.country c on c.code=o.country and c.continent_name='Europe'
|
join SOURCE.country c on c.code=o.country and c.continent_name='Europe'
|
||||||
left outer join SOURCE.result_licenses rl on rl.id=r.id
|
left outer join SOURCE.result_licenses rl on rl.id=r.id
|
||||||
left outer join SOURCE.result_pids pids on pids.id=r.id
|
left outer join SOURCE.result_pids pids on pids.id=r.id
|
||||||
group by r.green, r.gold, licence, pid, oa, r.peer_reviewed, r.type, c.code, c.name;
|
left outer join SOURCE.licenses_normalized rln on rln.license=rl.type
|
||||||
|
group by r.green, r.gold, licence, pid, oa, r.peer_reviewed, r.type, cc_licence, abstract, c.code, c.name;
|
||||||
|
|
||||||
create table TARGET.result_deposited_year stored as parquet as
|
create table TARGET.result_deposited_year stored as parquet as
|
||||||
select count(distinct r.id) as total, r.green, r.gold, case when rl.type is not null then true else false end as licence,
|
select count(distinct r.id) as total, r.green, r.gold, case when rl.type is not null then true else false end as licence,
|
||||||
case when pids.pid is not null then true else false end as pid, case when r.access_mode in ('Open Access', 'Open Source') then true else false end as oa, r.peer_reviewed, r.type, r.year
|
case when pids.pid is not null then true else false end as pid, case when r.access_mode in ('Open Access', 'Open Source') then true else false end as oa, r.peer_reviewed, case when lower(rln.normalized) like 'cc-%' then true else false end as cc_licence, r.abstract as abstract, r.type, r.year
|
||||||
from SOURCE.result r
|
from SOURCE.result r
|
||||||
join SOURCE.result_datasources rd on rd.id=r.id
|
join SOURCE.result_datasources rd on rd.id=r.id
|
||||||
join SOURCE.datasource d on d.id=rd.datasource and d.type in ('Institutional Repository','Data Repository', 'Repository', 'Publication Repository')
|
join SOURCE.datasource d on d.id=rd.datasource and d.type in ('Institutional Repository','Data Repository', 'Repository', 'Publication Repository')
|
||||||
|
@ -136,12 +146,13 @@ join SOURCE.organization o on o.id=dor.organization
|
||||||
join SOURCE.country c on c.code=o.country and c.continent_name='Europe'
|
join SOURCE.country c on c.code=o.country and c.continent_name='Europe'
|
||||||
left outer join SOURCE.result_licenses rl on rl.id=r.id
|
left outer join SOURCE.result_licenses rl on rl.id=r.id
|
||||||
left outer join SOURCE.result_pids pids on pids.id=r.id
|
left outer join SOURCE.result_pids pids on pids.id=r.id
|
||||||
group by r.green, r.gold, licence, pid, oa, r.peer_reviewed, r.type, r.year;
|
left outer join SOURCE.licenses_normalized rln on rln.license=rl.type
|
||||||
|
group by r.green, r.gold, licence, pid, oa, r.peer_reviewed, r.type, cc_licence, abstract, r.year;
|
||||||
|
|
||||||
create table TARGET.result_deposited_year_country stored as parquet as
|
create table TARGET.result_deposited_year_country stored as parquet as
|
||||||
select count(distinct r.id) as total, r.green, r.gold, case when rl.type is not null then true else false end as licence,
|
select count(distinct r.id) as total, r.green, r.gold, case when rl.type is not null then true else false end as licence,
|
||||||
case when pids.pid is not null then true else false end as pid, case when r.access_mode in ('Open Access', 'Open Source') then true else false end as oa,
|
case when pids.pid is not null then true else false end as pid, case when r.access_mode in ('Open Access', 'Open Source') then true else false end as oa,
|
||||||
r.peer_reviewed, r.type, r.year, c.code as ccode, c.name as cname
|
r.peer_reviewed, case when lower(rln.normalized) like 'cc-%' then true else false end as cc_licence, r.abstract as abstract, r.type, r.year, c.code as ccode, c.name as cname
|
||||||
from SOURCE.result r
|
from SOURCE.result r
|
||||||
join SOURCE.result_datasources rd on rd.id=r.id
|
join SOURCE.result_datasources rd on rd.id=r.id
|
||||||
join SOURCE.datasource d on d.id=rd.datasource and d.type in ('Institutional Repository','Data Repository', 'Repository', 'Publication Repository')
|
join SOURCE.datasource d on d.id=rd.datasource and d.type in ('Institutional Repository','Data Repository', 'Repository', 'Publication Repository')
|
||||||
|
@ -150,12 +161,13 @@ join SOURCE.organization o on o.id=dor.organization
|
||||||
join SOURCE.country c on c.code=o.country and c.continent_name='Europe'
|
join SOURCE.country c on c.code=o.country and c.continent_name='Europe'
|
||||||
left outer join SOURCE.result_licenses rl on rl.id=r.id
|
left outer join SOURCE.result_licenses rl on rl.id=r.id
|
||||||
left outer join SOURCE.result_pids pids on pids.id=r.id
|
left outer join SOURCE.result_pids pids on pids.id=r.id
|
||||||
group by r.green, r.gold, licence, pid, oa, r.peer_reviewed, r.type, r.year, c.code, c.name;
|
left outer join SOURCE.licenses_normalized rln on rln.license=rl.type
|
||||||
|
group by r.green, r.gold, licence, pid, oa, r.peer_reviewed, r.type, cc_licence, abstract, r.year, c.code, c.name;
|
||||||
|
|
||||||
create table TARGET.result_deposited_datasource stored as parquet as
|
create table TARGET.result_deposited_datasource stored as parquet as
|
||||||
select count(distinct r.id) as total, r.green, r.gold, case when rl.type is not null then true else false end as licence,
|
select count(distinct r.id) as total, r.green, r.gold, case when rl.type is not null then true else false end as licence,
|
||||||
case when pids.pid is not null then true else false end as pid, case when r.access_mode in ('Open Access', 'Open Source') then true else false end as oa,
|
case when pids.pid is not null then true else false end as pid, case when r.access_mode in ('Open Access', 'Open Source') then true else false end as oa,
|
||||||
r.peer_reviewed, r.type, d.name as dname
|
r.peer_reviewed, case when lower(rln.normalized) like 'cc-%' then true else false end as cc_licence, r.abstract as abstract, r.type, d.name as dname
|
||||||
from SOURCE.result r
|
from SOURCE.result r
|
||||||
join SOURCE.result_datasources rd on rd.id=r.id
|
join SOURCE.result_datasources rd on rd.id=r.id
|
||||||
join SOURCE.datasource d on d.id=rd.datasource and d.type in ('Institutional Repository','Data Repository', 'Repository', 'Publication Repository')
|
join SOURCE.datasource d on d.id=rd.datasource and d.type in ('Institutional Repository','Data Repository', 'Repository', 'Publication Repository')
|
||||||
|
@ -164,12 +176,13 @@ join SOURCE.organization o on o.id=dor.organization
|
||||||
join SOURCE.country c on c.code=o.country and c.continent_name='Europe'
|
join SOURCE.country c on c.code=o.country and c.continent_name='Europe'
|
||||||
left outer join SOURCE.result_licenses rl on rl.id=r.id
|
left outer join SOURCE.result_licenses rl on rl.id=r.id
|
||||||
left outer join SOURCE.result_pids pids on pids.id=r.id
|
left outer join SOURCE.result_pids pids on pids.id=r.id
|
||||||
group by r.green, r.gold, licence, pid, oa, r.peer_reviewed, r.type, d.name;
|
left outer join SOURCE.licenses_normalized rln on rln.license=rl.type
|
||||||
|
group by r.green, r.gold, licence, pid, oa, r.peer_reviewed, r.type, cc_licence, abstract, d.name;
|
||||||
|
|
||||||
create table TARGET.result_deposited_datasource_country stored as parquet as
|
create table TARGET.result_deposited_datasource_country stored as parquet as
|
||||||
select count(distinct r.id) as total, r.green, r.gold, case when rl.type is not null then true else false end as licence,
|
select count(distinct r.id) as total, r.green, r.gold, case when rl.type is not null then true else false end as licence,
|
||||||
case when pids.pid is not null then true else false end as pid, case when r.access_mode in ('Open Access', 'Open Source') then true else false end as oa,
|
case when pids.pid is not null then true else false end as pid, case when r.access_mode in ('Open Access', 'Open Source') then true else false end as oa,
|
||||||
r.peer_reviewed, r.type, d.name as dname, c.code as ccode, c.name as cname
|
r.peer_reviewed, case when lower(rln.normalized) like 'cc-%' then true else false end as cc_licence, r.abstract as abstract, r.type, d.name as dname, c.code as ccode, c.name as cname
|
||||||
from SOURCE.result r
|
from SOURCE.result r
|
||||||
join SOURCE.result_datasources rd on rd.id=r.id
|
join SOURCE.result_datasources rd on rd.id=r.id
|
||||||
join SOURCE.datasource d on d.id=rd.datasource and d.type in ('Institutional Repository','Data Repository', 'Repository', 'Publication Repository')
|
join SOURCE.datasource d on d.id=rd.datasource and d.type in ('Institutional Repository','Data Repository', 'Repository', 'Publication Repository')
|
||||||
|
@ -178,11 +191,12 @@ join SOURCE.organization o on o.id=dor.organization
|
||||||
join SOURCE.country c on c.code=o.country and c.continent_name='Europe'
|
join SOURCE.country c on c.code=o.country and c.continent_name='Europe'
|
||||||
left outer join SOURCE.result_licenses rl on rl.id=r.id
|
left outer join SOURCE.result_licenses rl on rl.id=r.id
|
||||||
left outer join SOURCE.result_pids pids on pids.id=r.id
|
left outer join SOURCE.result_pids pids on pids.id=r.id
|
||||||
group by r.green, r.gold, licence, pid, oa, r.peer_reviewed, r.type, d.name, c.code, c.name;
|
left outer join SOURCE.licenses_normalized rln on rln.license=rl.type
|
||||||
|
group by r.green, r.gold, licence, pid, oa, r.peer_reviewed, r.type, cc_licence, abstract, d.name, c.code, c.name;
|
||||||
|
|
||||||
create table TARGET.result_deposited_organization stored as parquet as
|
create table TARGET.result_deposited_organization stored as parquet as
|
||||||
select count(distinct r.id) as total, r.green, r.gold, case when rl.type is not null then true else false end as licence,
|
select count(distinct r.id) as total, r.green, r.gold, case when rl.type is not null then true else false end as licence,
|
||||||
case when pids.pid is not null then true else false end as pid, case when r.access_mode in ('Open Access', 'Open Source') then true else false end as oa, r.peer_reviewed, r.type, o.name as oname
|
case when pids.pid is not null then true else false end as pid, case when r.access_mode in ('Open Access', 'Open Source') then true else false end as oa, r.peer_reviewed, case when lower(rln.normalized) like 'cc-%' then true else false end as cc_licence, r.abstract as abstract, r.type, o.name as oname
|
||||||
from SOURCE.result r
|
from SOURCE.result r
|
||||||
join SOURCE.result_datasources rd on rd.id=r.id
|
join SOURCE.result_datasources rd on rd.id=r.id
|
||||||
join SOURCE.datasource d on d.id=rd.datasource and d.type in ('Institutional Repository','Data Repository', 'Repository', 'Publication Repository')
|
join SOURCE.datasource d on d.id=rd.datasource and d.type in ('Institutional Repository','Data Repository', 'Repository', 'Publication Repository')
|
||||||
|
@ -191,12 +205,13 @@ join SOURCE.organization o on o.id=dor.organization
|
||||||
join SOURCE.country c on c.code=o.country and c.continent_name='Europe'
|
join SOURCE.country c on c.code=o.country and c.continent_name='Europe'
|
||||||
left outer join SOURCE.result_licenses rl on rl.id=r.id
|
left outer join SOURCE.result_licenses rl on rl.id=r.id
|
||||||
left outer join SOURCE.result_pids pids on pids.id=r.id
|
left outer join SOURCE.result_pids pids on pids.id=r.id
|
||||||
group by r.green, r.gold, licence, pid, oa, r.peer_reviewed, r.type, o.name;
|
left outer join SOURCE.licenses_normalized rln on rln.license=rl.type
|
||||||
|
group by r.green, r.gold, licence, pid, oa, r.peer_reviewed, r.type, cc_licence, abstract, o.name;
|
||||||
|
|
||||||
create table TARGET.result_deposited_organization_country stored as parquet as
|
create table TARGET.result_deposited_organization_country stored as parquet as
|
||||||
select count(distinct r.id) as total, r.green, r.gold, case when rl.type is not null then true else false end as licence,
|
select count(distinct r.id) as total, r.green, r.gold, case when rl.type is not null then true else false end as licence,
|
||||||
case when pids.pid is not null then true else false end as pid, case when r.access_mode in ('Open Access', 'Open Source') then true else false end as oa,
|
case when pids.pid is not null then true else false end as pid, case when r.access_mode in ('Open Access', 'Open Source') then true else false end as oa,
|
||||||
r.peer_reviewed, r.type, o.name as oname, c.code as ccode, c.name as cname
|
r.peer_reviewed, case when lower(rln.normalized) like 'cc-%' then true else false end as cc_licence, r.abstract as abstract, r.type, o.name as oname, c.code as ccode, c.name as cname
|
||||||
from SOURCE.result r
|
from SOURCE.result r
|
||||||
join SOURCE.result_datasources rd on rd.id=r.id
|
join SOURCE.result_datasources rd on rd.id=r.id
|
||||||
join SOURCE.datasource d on d.id=rd.datasource and d.type in ('Institutional Repository','Data Repository', 'Repository', 'Publication Repository')
|
join SOURCE.datasource d on d.id=rd.datasource and d.type in ('Institutional Repository','Data Repository', 'Repository', 'Publication Repository')
|
||||||
|
@ -205,12 +220,13 @@ join SOURCE.organization o on o.id=dor.organization
|
||||||
join SOURCE.country c on c.code=o.country and c.continent_name='Europe'
|
join SOURCE.country c on c.code=o.country and c.continent_name='Europe'
|
||||||
left outer join SOURCE.result_licenses rl on rl.id=r.id
|
left outer join SOURCE.result_licenses rl on rl.id=r.id
|
||||||
left outer join SOURCE.result_pids pids on pids.id=r.id
|
left outer join SOURCE.result_pids pids on pids.id=r.id
|
||||||
group by r.green, r.gold, licence, pid, oa, r.peer_reviewed, r.type, o.name, c.code, c.name;
|
left outer join SOURCE.licenses_normalized rln on rln.license=rl.type
|
||||||
|
group by r.green, r.gold, licence, pid, oa, r.peer_reviewed, r.type, cc_licence, abstract, o.name, c.code, c.name;
|
||||||
|
|
||||||
create table TARGET.result_deposited_funder stored as parquet as
|
create table TARGET.result_deposited_funder stored as parquet as
|
||||||
select count(distinct r.id) as total, r.green, r.gold, case when rl.type is not null then true else false end as licence,
|
select count(distinct r.id) as total, r.green, r.gold, case when rl.type is not null then true else false end as licence,
|
||||||
case when pids.pid is not null then true else false end as pid, case when r.access_mode in ('Open Access', 'Open Source') then true else false end as oa,
|
case when pids.pid is not null then true else false end as pid, case when r.access_mode in ('Open Access', 'Open Source') then true else false end as oa,
|
||||||
r.peer_reviewed, r.type, p.funder as pfunder
|
r.peer_reviewed, case when lower(rln.normalized) like 'cc-%' then true else false end as cc_licence, r.abstract as abstract, r.type, p.funder as pfunder
|
||||||
from SOURCE.result r
|
from SOURCE.result r
|
||||||
join SOURCE.result_datasources rd on rd.id=r.id
|
join SOURCE.result_datasources rd on rd.id=r.id
|
||||||
join SOURCE.datasource d on d.id=rd.datasource and d.type in ('Institutional Repository','Data Repository', 'Repository', 'Publication Repository')
|
join SOURCE.datasource d on d.id=rd.datasource and d.type in ('Institutional Repository','Data Repository', 'Repository', 'Publication Repository')
|
||||||
|
@ -221,12 +237,13 @@ join SOURCE.result_projects rp on rp.id=r.id
|
||||||
join SOURCE.project p on p.id=rp.project
|
join SOURCE.project p on p.id=rp.project
|
||||||
left outer join SOURCE.result_licenses rl on rl.id=r.id
|
left outer join SOURCE.result_licenses rl on rl.id=r.id
|
||||||
left outer join SOURCE.result_pids pids on pids.id=r.id
|
left outer join SOURCE.result_pids pids on pids.id=r.id
|
||||||
group by r.green, r.gold, licence, pid, oa, r.peer_reviewed, r.type, p.funder;
|
left outer join SOURCE.licenses_normalized rln on rln.license=rl.type
|
||||||
|
group by r.green, r.gold, licence, pid, oa, r.peer_reviewed, r.type, cc_licence, abstract, p.funder;
|
||||||
|
|
||||||
create table TARGET.result_deposited_funder_country stored as parquet as
|
create table TARGET.result_deposited_funder_country stored as parquet as
|
||||||
select count(distinct r.id) as total, r.green, r.gold, case when rl.type is not null then true else false end as licence,
|
select count(distinct r.id) as total, r.green, r.gold, case when rl.type is not null then true else false end as licence,
|
||||||
case when pids.pid is not null then true else false end as pid, case when r.access_mode in ('Open Access', 'Open Source') then true else false end as oa,
|
case when pids.pid is not null then true else false end as pid, case when r.access_mode in ('Open Access', 'Open Source') then true else false end as oa,
|
||||||
r.peer_reviewed, r.type, p.funder as pfunder, c.code as ccode, c.name as cname
|
r.peer_reviewed, case when lower(rln.normalized) like 'cc-%' then true else false end as cc_licence, r.abstract as abstract, r.type, p.funder as pfunder, c.code as ccode, c.name as cname
|
||||||
from SOURCE.result r
|
from SOURCE.result r
|
||||||
join SOURCE.result_datasources rd on rd.id=r.id
|
join SOURCE.result_datasources rd on rd.id=r.id
|
||||||
join SOURCE.datasource d on d.id=rd.datasource and d.type in ('Institutional Repository','Data Repository', 'Repository', 'Publication Repository')
|
join SOURCE.datasource d on d.id=rd.datasource and d.type in ('Institutional Repository','Data Repository', 'Repository', 'Publication Repository')
|
||||||
|
@ -237,7 +254,8 @@ join SOURCE.result_projects rp on rp.id=r.id
|
||||||
join SOURCE.project p on p.id=rp.project
|
join SOURCE.project p on p.id=rp.project
|
||||||
left outer join SOURCE.result_licenses rl on rl.id=r.id
|
left outer join SOURCE.result_licenses rl on rl.id=r.id
|
||||||
left outer join SOURCE.result_pids pids on pids.id=r.id
|
left outer join SOURCE.result_pids pids on pids.id=r.id
|
||||||
group by r.green, r.gold, licence, pid, oa, r.peer_reviewed, r.type, p.funder, c.code, c.name;
|
left outer join SOURCE.licenses_normalized rln on rln.license=rl.type
|
||||||
|
group by r.green, r.gold, licence, pid, oa, r.peer_reviewed, r.type, cc_licence, abstract, p.funder, c.code, c.name;
|
||||||
|
|
||||||
compute stats TARGET.result_affiliated_country;
|
compute stats TARGET.result_affiliated_country;
|
||||||
compute stats TARGET.result_affiliated_year;
|
compute stats TARGET.result_affiliated_year;
|
||||||
|
|
Loading…
Reference in New Issue