From de89887e7e1758a5906ce2ad018a001418c6045c Mon Sep 17 00:00:00 2001 From: Serafeim Chatzopoulos Date: Wed, 15 Mar 2023 20:19:49 +0200 Subject: [PATCH] Update url path for graph-production-workflow; add more details in indictors ingestion page --- docs/changelog.md | 4 +- docs/data-model/entities/other.md | 12 ++-- docs/data-model/entities/result.md | 2 +- docs/data-model/pids-and-identifiers.md | 2 +- docs/data-provision/_category_.json | 8 --- .../graph-production-workflow/_category_.json | 8 +++ .../aggregation/aggregation.md | 0 .../aggregation/compatible-sources.md | 0 .../non-compatible-sources/datacite.md | 0 .../non-compatible-sources/doiboost.md | 0 .../aggregation/non-compatible-sources/ebi.md | 0 .../non-compatible-sources/pubmed.md | 0 .../non-compatible-sources/uniprot.md | 0 .../cleaning.md | 0 .../deduction-and-propagation/bulk-tagging.md | 0 .../deduction-and-propagation/propagation.md | 0 .../deduplication/_category_.json | 0 .../deduplication/clustering-functions.md | 0 .../deduplication/deduplication.md | 0 .../deduplication/organizations.md | 0 .../deduplication/research-products.md | 0 .../enrichment-by-mining/_category_.json | 0 .../enrichment-by-mining/acks.md | 0 .../affiliation_matching.md | 0 .../enrichment-by-mining/citation_matching.md | 0 .../enrichment-by-mining/cites.md | 0 .../enrichment-by-mining/classifies.md | 0 .../documents_similarity.md | 0 .../enrichment-by-mining/img.png | Bin .../metadata_extraction.md | 0 .../finalisation.md | 2 +- .../graph-production-workflow.md} | 0 .../indexing.md | 0 .../indicators-ingestion/impact-indicators.md | 3 +- .../indicators-ingestion.md | 8 +++ .../indicators-ingestion/usage-counts.md | 4 +- .../merge-by-id.md | 0 .../stats.md | 0 sidebars.js | 59 +++++++++--------- versioned_docs/version-5.2.0/changelog.md | 4 +- .../data-model/entities/other.md | 12 ++-- .../data-model/entities/result.md | 2 +- .../data-model/pids-and-identifiers.md | 2 +- .../data-provision/_category_.json | 8 --- 
.../version-5.2.0/downloads/subgraphs.md | 2 +- .../graph-production-workflow/_category_.json | 8 +++ .../aggregation/aggregation.md | 0 .../aggregation/compatible-sources.md | 0 .../non-compatible-sources/datacite.md | 0 .../non-compatible-sources/doiboost.md | 0 .../aggregation/non-compatible-sources/ebi.md | 0 .../non-compatible-sources/pubmed.md | 0 .../non-compatible-sources/uniprot.md | 0 .../cleaning.md | 0 .../deduction-and-propagation/bulk-tagging.md | 0 .../deduction-and-propagation/propagation.md | 0 .../deduplication/_category_.json | 0 .../deduplication/clustering-functions.md | 0 .../deduplication/deduplication.md | 0 .../deduplication/organizations.md | 0 .../deduplication/research-products.md | 0 .../enrichment-by-mining/_category_.json | 0 .../enrichment-by-mining/acks.md | 0 .../affiliation_matching.md | 0 .../enrichment-by-mining/citation_matching.md | 0 .../enrichment-by-mining/cites.md | 0 .../enrichment-by-mining/classifies.md | 0 .../documents_similarity.md | 0 .../enrichment-by-mining/img.png | Bin .../metadata_extraction.md | 0 .../finalisation.md | 2 +- .../graph-production-workflow.md} | 0 .../indexing.md | 0 .../indicators-ingestion/impact-indicators.md | 3 +- .../indicators-ingestion.md | 8 +++ .../indicators-ingestion/usage-counts.md | 4 +- .../merge-by-id.md | 0 .../stats.md | 0 .../version-5.2.0-sidebars.json | 58 ++++++++--------- 79 files changed, 120 insertions(+), 105 deletions(-) delete mode 100644 docs/data-provision/_category_.json create mode 100644 docs/graph-production-workflow/_category_.json rename docs/{data-provision => graph-production-workflow}/aggregation/aggregation.md (100%) rename docs/{data-provision => graph-production-workflow}/aggregation/compatible-sources.md (100%) rename docs/{data-provision => graph-production-workflow}/aggregation/non-compatible-sources/datacite.md (100%) rename docs/{data-provision => graph-production-workflow}/aggregation/non-compatible-sources/doiboost.md (100%) rename 
docs/{data-provision => graph-production-workflow}/aggregation/non-compatible-sources/ebi.md (100%) rename docs/{data-provision => graph-production-workflow}/aggregation/non-compatible-sources/pubmed.md (100%) rename docs/{data-provision => graph-production-workflow}/aggregation/non-compatible-sources/uniprot.md (100%) rename docs/{data-provision => graph-production-workflow}/cleaning.md (100%) rename docs/{data-provision => graph-production-workflow}/deduction-and-propagation/bulk-tagging.md (100%) rename docs/{data-provision => graph-production-workflow}/deduction-and-propagation/propagation.md (100%) rename docs/{data-provision => graph-production-workflow}/deduplication/_category_.json (100%) rename docs/{data-provision => graph-production-workflow}/deduplication/clustering-functions.md (100%) rename docs/{data-provision => graph-production-workflow}/deduplication/deduplication.md (100%) rename docs/{data-provision => graph-production-workflow}/deduplication/organizations.md (100%) rename docs/{data-provision => graph-production-workflow}/deduplication/research-products.md (100%) rename docs/{data-provision => graph-production-workflow}/enrichment-by-mining/_category_.json (100%) rename docs/{data-provision => graph-production-workflow}/enrichment-by-mining/acks.md (100%) rename docs/{data-provision => graph-production-workflow}/enrichment-by-mining/affiliation_matching.md (100%) rename docs/{data-provision => graph-production-workflow}/enrichment-by-mining/citation_matching.md (100%) rename docs/{data-provision => graph-production-workflow}/enrichment-by-mining/cites.md (100%) rename docs/{data-provision => graph-production-workflow}/enrichment-by-mining/classifies.md (100%) rename docs/{data-provision => graph-production-workflow}/enrichment-by-mining/documents_similarity.md (100%) rename docs/{data-provision => graph-production-workflow}/enrichment-by-mining/img.png (100%) rename docs/{data-provision => 
graph-production-workflow}/enrichment-by-mining/metadata_extraction.md (100%) rename docs/{data-provision => graph-production-workflow}/finalisation.md (89%) rename docs/{data-provision/data-provision.md => graph-production-workflow/graph-production-workflow.md} (100%) rename docs/{data-provision => graph-production-workflow}/indexing.md (100%) rename versioned_docs/version-5.2.0/data-provision/indicators-ingestion/impact-scores.md => docs/graph-production-workflow/indicators-ingestion/impact-indicators.md (96%) create mode 100644 docs/graph-production-workflow/indicators-ingestion/indicators-ingestion.md rename {versioned_docs/version-5.2.0/data-provision => docs/graph-production-workflow}/indicators-ingestion/usage-counts.md (88%) rename docs/{data-provision => graph-production-workflow}/merge-by-id.md (100%) rename docs/{data-provision => graph-production-workflow}/stats.md (100%) delete mode 100644 versioned_docs/version-5.2.0/data-provision/_category_.json create mode 100644 versioned_docs/version-5.2.0/graph-production-workflow/_category_.json rename versioned_docs/version-5.2.0/{data-provision => graph-production-workflow}/aggregation/aggregation.md (100%) rename versioned_docs/version-5.2.0/{data-provision => graph-production-workflow}/aggregation/compatible-sources.md (100%) rename versioned_docs/version-5.2.0/{data-provision => graph-production-workflow}/aggregation/non-compatible-sources/datacite.md (100%) rename versioned_docs/version-5.2.0/{data-provision => graph-production-workflow}/aggregation/non-compatible-sources/doiboost.md (100%) rename versioned_docs/version-5.2.0/{data-provision => graph-production-workflow}/aggregation/non-compatible-sources/ebi.md (100%) rename versioned_docs/version-5.2.0/{data-provision => graph-production-workflow}/aggregation/non-compatible-sources/pubmed.md (100%) rename versioned_docs/version-5.2.0/{data-provision => graph-production-workflow}/aggregation/non-compatible-sources/uniprot.md (100%) rename 
versioned_docs/version-5.2.0/{data-provision => graph-production-workflow}/cleaning.md (100%) rename versioned_docs/version-5.2.0/{data-provision => graph-production-workflow}/deduction-and-propagation/bulk-tagging.md (100%) rename versioned_docs/version-5.2.0/{data-provision => graph-production-workflow}/deduction-and-propagation/propagation.md (100%) rename versioned_docs/version-5.2.0/{data-provision => graph-production-workflow}/deduplication/_category_.json (100%) rename versioned_docs/version-5.2.0/{data-provision => graph-production-workflow}/deduplication/clustering-functions.md (100%) rename versioned_docs/version-5.2.0/{data-provision => graph-production-workflow}/deduplication/deduplication.md (100%) rename versioned_docs/version-5.2.0/{data-provision => graph-production-workflow}/deduplication/organizations.md (100%) rename versioned_docs/version-5.2.0/{data-provision => graph-production-workflow}/deduplication/research-products.md (100%) rename versioned_docs/version-5.2.0/{data-provision => graph-production-workflow}/enrichment-by-mining/_category_.json (100%) rename versioned_docs/version-5.2.0/{data-provision => graph-production-workflow}/enrichment-by-mining/acks.md (100%) rename versioned_docs/version-5.2.0/{data-provision => graph-production-workflow}/enrichment-by-mining/affiliation_matching.md (100%) rename versioned_docs/version-5.2.0/{data-provision => graph-production-workflow}/enrichment-by-mining/citation_matching.md (100%) rename versioned_docs/version-5.2.0/{data-provision => graph-production-workflow}/enrichment-by-mining/cites.md (100%) rename versioned_docs/version-5.2.0/{data-provision => graph-production-workflow}/enrichment-by-mining/classifies.md (100%) rename versioned_docs/version-5.2.0/{data-provision => graph-production-workflow}/enrichment-by-mining/documents_similarity.md (100%) rename versioned_docs/version-5.2.0/{data-provision => graph-production-workflow}/enrichment-by-mining/img.png (100%) rename 
versioned_docs/version-5.2.0/{data-provision => graph-production-workflow}/enrichment-by-mining/metadata_extraction.md (100%) rename versioned_docs/version-5.2.0/{data-provision => graph-production-workflow}/finalisation.md (89%) rename versioned_docs/version-5.2.0/{data-provision/data-provision.md => graph-production-workflow/graph-production-workflow.md} (100%) rename versioned_docs/version-5.2.0/{data-provision => graph-production-workflow}/indexing.md (100%) rename docs/data-provision/indicators-ingestion/impact-scores.md => versioned_docs/version-5.2.0/graph-production-workflow/indicators-ingestion/impact-indicators.md (96%) create mode 100644 versioned_docs/version-5.2.0/graph-production-workflow/indicators-ingestion/indicators-ingestion.md rename {docs/data-provision => versioned_docs/version-5.2.0/graph-production-workflow}/indicators-ingestion/usage-counts.md (88%) rename versioned_docs/version-5.2.0/{data-provision => graph-production-workflow}/merge-by-id.md (100%) rename versioned_docs/version-5.2.0/{data-provision => graph-production-workflow}/stats.md (100%) diff --git a/docs/changelog.md b/docs/changelog.md index c874cb7..c0ca8be 100644 --- a/docs/changelog.md +++ b/docs/changelog.md @@ -27,8 +27,8 @@ _Start Date: 2023-02-13 • Release Date: 2023-03-01 • Dump release: **n - Revised SDG classification: improved coverage (+600K classified DOIs) - General increase of the funded scientific outputs, thanks to the full text mining scanning new OpenAccess publications - Integrated contents from - - [EMBL-EBIs Protein Data Bank in Europe](/data-provision/aggregation/non-compatible-sources/ebi) - - [UniProtKB/Swiss-Prot](/data-provision/aggregation/non-compatible-sources/uniprot) + - [EMBL-EBIs Protein Data Bank in Europe](/graph-production-workflow/aggregation/non-compatible-sources/ebi) + - [UniProtKB/Swiss-Prot](/graph-production-workflow/aggregation/non-compatible-sources/uniprot) #### Changed diff --git a/docs/data-model/entities/other.md
b/docs/data-model/entities/other.md index e066b5b..18c585a 100644 --- a/docs/data-model/entities/other.md +++ b/docs/data-model/entities/other.md @@ -615,7 +615,7 @@ _Type: [ImpactMeasures](#impactmeasures-1) • Cardinality: ONE_ These impact-based indicators, provided by [BIP!](https://bip.imsi.athenarc.gr/), estimate the impact of a result. -For details about their calculation, please refer [here](/data-provision/indicators-ingestion/impact-scores). +For details about their calculation, please refer [here](/graph-production-workflow/indicators-ingestion/impact-indicators). ```json "impactMeasures": { @@ -682,7 +682,7 @@ The different impact-based indicators as computed by [BIP!](https://bip.imsi.ath _Type: [Score](#score) • Cardinality: ONE_ This indicator reflects the overall/total impact of an article in the research community at large, based on the underlying citation network (diachronically). -For more details please refer [here](/data-provision/indicators-ingestion/impact-scores#pagerank-pr). +For more details please refer [here](/graph-production-workflow/indicators-ingestion/impact-indicators#pagerank-pr). ```json "influence": { @@ -695,7 +695,7 @@ For more details please refer [here](/data-provision/indicators-ingestion/impact _Type: [Score](#score) • Cardinality: ONE_ This is an alternative to the "Influence" indicator, which also reflects the overall/total impact of an article in the research community at large, based on the underlying citation network (diachronically). -For more details please refer [here](/data-provision/indicators-ingestion/impact-scores#citation-count-cc). +For more details please refer [here](/graph-production-workflow/indicators-ingestion/impact-indicators#citation-count-cc).
```json "influence_alt" :{ @@ -708,7 +708,7 @@ For more details please refer [here](/data-provision/indicators-ingestion/impact _Type: [Score](#score) • Cardinality: ONE_ This indicator reflects the "current" impact/attention (the "hype") of an article in the research community at large, based on the underlying citation network. -For more details please refer [here](/data-provision/indicators-ingestion/impact-scores#attrank). +For more details please refer [here](/graph-production-workflow/indicators-ingestion/impact-indicators#attrank). ```json "popularity":{ @@ -722,7 +722,7 @@ For more details please refer [here](/data-provision/indicators-ingestion/impact _Type: [Score](#score) • Cardinality: ONE_ This is an alternative to the "Popularity" indicator, which also reflects the "current" impact/attention (the "hype") of an article in the research community at large, based on the underlying citation network. -For more details please refer [here](/data-provision/indicators-ingestion/impact-scores#ram). +For more details please refer [here](/graph-production-workflow/indicators-ingestion/impact-indicators#ram). ```json "popularity_alt":{ @@ -736,7 +736,7 @@ For more details please refer [here](/data-provision/indicators-ingestion/impact _Type: [Score](#score) • Cardinality: ONE_ This indicator reflects the initial momentum of an article directly after its publication, based on the underlying citation network. -For more details please refer [here](/data-provision/indicators-ingestion/impact-scores#incubation-citation-count-icc). +For more details please refer [here](/graph-production-workflow/indicators-ingestion/impact-indicators#incubation-citation-count-icc). ```json "impulse":{ diff --git a/docs/data-model/entities/result.md b/docs/data-model/entities/result.md index f0abfcc..4b1a321 100644 --- a/docs/data-model/entities/result.md +++ b/docs/data-model/entities/result.md @@ -187,7 +187,7 @@ Date when the embargo ends and this result turns Open Access.
_Type: [Indicator](other#indicator) • Cardinality: ONE_ The indicators computed for this result; -currently, the following two types of indicators are supported: [impact indicators](/data-provision/indicators-ingestion/impact-scores) and [usage statistics indicators](/data-provision/indicators-ingestion/usage-counts). +currently, the following two types of indicators are supported: [impact indicators](/graph-production-workflow/indicators-ingestion/impact-indicators) and [usage statistics indicators](/graph-production-workflow/indicators-ingestion/usage-counts). ```json "indicators": { diff --git a/docs/data-model/pids-and-identifiers.md b/docs/data-model/pids-and-identifiers.md index de31912..c613366 100644 --- a/docs/data-model/pids-and-identifiers.md +++ b/docs/data-model/pids-and-identifiers.md @@ -77,5 +77,5 @@ Currently, the following data sources are used as "PID authorities": | pdb | `pdb_________` | EMBL-EBI | | uniprot | `uniprot_____` | EMBL-EBI | -OpenAIRE also perform duplicate identification (see the [dedicated section for details](/data-provision/deduplication)). +OpenAIRE also perform duplicate identification (see the [dedicated section for details](/graph-production-workflow/deduplication)). All duplicates are **merged** together in a **representative record** which must be assigned a dedicated OpenAIRE identifier (i.e. it cannot have the identifier of one of the aggregated record).
diff --git a/docs/data-provision/_category_.json b/docs/data-provision/_category_.json deleted file mode 100644 index 80915c5..0000000 --- a/docs/data-provision/_category_.json +++ /dev/null @@ -1,8 +0,0 @@ -{ - "label": "Data provision", - "position": 6, - "link": { - "type": "doc", - "id": "data-provision" - } -} \ No newline at end of file diff --git a/docs/graph-production-workflow/_category_.json b/docs/graph-production-workflow/_category_.json new file mode 100644 index 0000000..8da8ce0 --- /dev/null +++ b/docs/graph-production-workflow/_category_.json @@ -0,0 +1,8 @@ +{ + "label": "Graph production workflow", + "position": 6, + "link": { + "type": "doc", + "id": "graph-production-workflow" + } +} \ No newline at end of file diff --git a/docs/data-provision/aggregation/aggregation.md b/docs/graph-production-workflow/aggregation/aggregation.md similarity index 100% rename from docs/data-provision/aggregation/aggregation.md rename to docs/graph-production-workflow/aggregation/aggregation.md diff --git a/docs/data-provision/aggregation/compatible-sources.md b/docs/graph-production-workflow/aggregation/compatible-sources.md similarity index 100% rename from docs/data-provision/aggregation/compatible-sources.md rename to docs/graph-production-workflow/aggregation/compatible-sources.md diff --git a/docs/data-provision/aggregation/non-compatible-sources/datacite.md b/docs/graph-production-workflow/aggregation/non-compatible-sources/datacite.md similarity index 100% rename from docs/data-provision/aggregation/non-compatible-sources/datacite.md rename to docs/graph-production-workflow/aggregation/non-compatible-sources/datacite.md diff --git a/docs/data-provision/aggregation/non-compatible-sources/doiboost.md b/docs/graph-production-workflow/aggregation/non-compatible-sources/doiboost.md similarity index 100% rename from docs/data-provision/aggregation/non-compatible-sources/doiboost.md rename to 
docs/graph-production-workflow/aggregation/non-compatible-sources/doiboost.md diff --git a/docs/data-provision/aggregation/non-compatible-sources/ebi.md b/docs/graph-production-workflow/aggregation/non-compatible-sources/ebi.md similarity index 100% rename from docs/data-provision/aggregation/non-compatible-sources/ebi.md rename to docs/graph-production-workflow/aggregation/non-compatible-sources/ebi.md diff --git a/docs/data-provision/aggregation/non-compatible-sources/pubmed.md b/docs/graph-production-workflow/aggregation/non-compatible-sources/pubmed.md similarity index 100% rename from docs/data-provision/aggregation/non-compatible-sources/pubmed.md rename to docs/graph-production-workflow/aggregation/non-compatible-sources/pubmed.md diff --git a/docs/data-provision/aggregation/non-compatible-sources/uniprot.md b/docs/graph-production-workflow/aggregation/non-compatible-sources/uniprot.md similarity index 100% rename from docs/data-provision/aggregation/non-compatible-sources/uniprot.md rename to docs/graph-production-workflow/aggregation/non-compatible-sources/uniprot.md diff --git a/docs/data-provision/cleaning.md b/docs/graph-production-workflow/cleaning.md similarity index 100% rename from docs/data-provision/cleaning.md rename to docs/graph-production-workflow/cleaning.md diff --git a/docs/data-provision/deduction-and-propagation/bulk-tagging.md b/docs/graph-production-workflow/deduction-and-propagation/bulk-tagging.md similarity index 100% rename from docs/data-provision/deduction-and-propagation/bulk-tagging.md rename to docs/graph-production-workflow/deduction-and-propagation/bulk-tagging.md diff --git a/docs/data-provision/deduction-and-propagation/propagation.md b/docs/graph-production-workflow/deduction-and-propagation/propagation.md similarity index 100% rename from docs/data-provision/deduction-and-propagation/propagation.md rename to docs/graph-production-workflow/deduction-and-propagation/propagation.md diff --git 
a/docs/data-provision/deduplication/_category_.json b/docs/graph-production-workflow/deduplication/_category_.json similarity index 100% rename from docs/data-provision/deduplication/_category_.json rename to docs/graph-production-workflow/deduplication/_category_.json diff --git a/docs/data-provision/deduplication/clustering-functions.md b/docs/graph-production-workflow/deduplication/clustering-functions.md similarity index 100% rename from docs/data-provision/deduplication/clustering-functions.md rename to docs/graph-production-workflow/deduplication/clustering-functions.md diff --git a/docs/data-provision/deduplication/deduplication.md b/docs/graph-production-workflow/deduplication/deduplication.md similarity index 100% rename from docs/data-provision/deduplication/deduplication.md rename to docs/graph-production-workflow/deduplication/deduplication.md diff --git a/docs/data-provision/deduplication/organizations.md b/docs/graph-production-workflow/deduplication/organizations.md similarity index 100% rename from docs/data-provision/deduplication/organizations.md rename to docs/graph-production-workflow/deduplication/organizations.md diff --git a/docs/data-provision/deduplication/research-products.md b/docs/graph-production-workflow/deduplication/research-products.md similarity index 100% rename from docs/data-provision/deduplication/research-products.md rename to docs/graph-production-workflow/deduplication/research-products.md diff --git a/docs/data-provision/enrichment-by-mining/_category_.json b/docs/graph-production-workflow/enrichment-by-mining/_category_.json similarity index 100% rename from docs/data-provision/enrichment-by-mining/_category_.json rename to docs/graph-production-workflow/enrichment-by-mining/_category_.json diff --git a/docs/data-provision/enrichment-by-mining/acks.md b/docs/graph-production-workflow/enrichment-by-mining/acks.md similarity index 100% rename from docs/data-provision/enrichment-by-mining/acks.md rename to 
docs/graph-production-workflow/enrichment-by-mining/acks.md diff --git a/docs/data-provision/enrichment-by-mining/affiliation_matching.md b/docs/graph-production-workflow/enrichment-by-mining/affiliation_matching.md similarity index 100% rename from docs/data-provision/enrichment-by-mining/affiliation_matching.md rename to docs/graph-production-workflow/enrichment-by-mining/affiliation_matching.md diff --git a/docs/data-provision/enrichment-by-mining/citation_matching.md b/docs/graph-production-workflow/enrichment-by-mining/citation_matching.md similarity index 100% rename from docs/data-provision/enrichment-by-mining/citation_matching.md rename to docs/graph-production-workflow/enrichment-by-mining/citation_matching.md diff --git a/docs/data-provision/enrichment-by-mining/cites.md b/docs/graph-production-workflow/enrichment-by-mining/cites.md similarity index 100% rename from docs/data-provision/enrichment-by-mining/cites.md rename to docs/graph-production-workflow/enrichment-by-mining/cites.md diff --git a/docs/data-provision/enrichment-by-mining/classifies.md b/docs/graph-production-workflow/enrichment-by-mining/classifies.md similarity index 100% rename from docs/data-provision/enrichment-by-mining/classifies.md rename to docs/graph-production-workflow/enrichment-by-mining/classifies.md diff --git a/docs/data-provision/enrichment-by-mining/documents_similarity.md b/docs/graph-production-workflow/enrichment-by-mining/documents_similarity.md similarity index 100% rename from docs/data-provision/enrichment-by-mining/documents_similarity.md rename to docs/graph-production-workflow/enrichment-by-mining/documents_similarity.md diff --git a/docs/data-provision/enrichment-by-mining/img.png b/docs/graph-production-workflow/enrichment-by-mining/img.png similarity index 100% rename from docs/data-provision/enrichment-by-mining/img.png rename to docs/graph-production-workflow/enrichment-by-mining/img.png diff --git 
a/docs/data-provision/enrichment-by-mining/metadata_extraction.md b/docs/graph-production-workflow/enrichment-by-mining/metadata_extraction.md similarity index 100% rename from docs/data-provision/enrichment-by-mining/metadata_extraction.md rename to docs/graph-production-workflow/enrichment-by-mining/metadata_extraction.md diff --git a/docs/data-provision/finalisation.md b/docs/graph-production-workflow/finalisation.md similarity index 89% rename from docs/data-provision/finalisation.md rename to docs/graph-production-workflow/finalisation.md index 22e5ca9..06548dc 100644 --- a/docs/data-provision/finalisation.md +++ b/docs/graph-production-workflow/finalisation.md @@ -10,7 +10,7 @@ Bibliographic records that do not meet minimal requirements for being part of th Currently, the only criteria applied horizontally to the entire graph aims at excluding scientific results whose title is not meaningful for citation purposes. Then, different criteria are applied in the pre-processing of specific sub-collections: -* [Crossref filtering](/data-provision/aggregation/non-compatible-sources/doiboost#crossref-filtering) +* [Crossref filtering](/graph-production-workflow/aggregation/non-compatible-sources/doiboost#crossref-filtering) ## Country cleaning diff --git a/docs/data-provision/data-provision.md b/docs/graph-production-workflow/graph-production-workflow.md similarity index 100% rename from docs/data-provision/data-provision.md rename to docs/graph-production-workflow/graph-production-workflow.md diff --git a/docs/data-provision/indexing.md b/docs/graph-production-workflow/indexing.md similarity index 100% rename from docs/data-provision/indexing.md rename to docs/graph-production-workflow/indexing.md diff --git a/versioned_docs/version-5.2.0/data-provision/indicators-ingestion/impact-scores.md b/docs/graph-production-workflow/indicators-ingestion/impact-indicators.md similarity index 96% rename from 
versioned_docs/version-5.2.0/data-provision/indicators-ingestion/impact-scores.md rename to docs/graph-production-workflow/indicators-ingestion/impact-indicators.md index b5d9bcd..6c90186 100644 --- a/versioned_docs/version-5.2.0/data-provision/indicators-ingestion/impact-scores.md +++ b/docs/graph-production-workflow/indicators-ingestion/impact-indicators.md @@ -1,6 +1,7 @@ # Impact indicators -This page summarises all calculated impact indicators, which are included in the [impactMeasures](/data-model/entities/other#impactmeasures) property which is part of the [indicators](/data-model/entities/result#indicators) property of the result. +This page summarises all calculated impact indicators, provided by [BIP!](https://bip.imsi.athenarc.gr/), which are included in the [impactMeasures](/data-model/entities/other#impactmeasures) property (found under the [indicators](/data-model/entities/result#indicators) property of the result). + It should be noted that the impact indicators are being calculated on the level of the research output. Below we explain their main intuition, the way they are calculated, and their most important limitations, in an attempt help avoiding common pitfalls and misuses. diff --git a/docs/graph-production-workflow/indicators-ingestion/indicators-ingestion.md b/docs/graph-production-workflow/indicators-ingestion/indicators-ingestion.md new file mode 100644 index 0000000..4402287 --- /dev/null +++ b/docs/graph-production-workflow/indicators-ingestion/indicators-ingestion.md @@ -0,0 +1,8 @@ +import DocCardList from '@theme/DocCardList'; + +# Indicators ingestion + +In this step, results are enriched with Impact and Usage Statistics indicators. +The former are provided by [BIP!](https://bip.imsi.athenarc.gr/) while the latter are computed by OpenAIRE's [UsageCounts service](https://usagecounts.openaire.eu/). 
+ + \ No newline at end of file diff --git a/versioned_docs/version-5.2.0/data-provision/indicators-ingestion/usage-counts.md b/docs/graph-production-workflow/indicators-ingestion/usage-counts.md similarity index 88% rename from versioned_docs/version-5.2.0/data-provision/indicators-ingestion/usage-counts.md rename to docs/graph-production-workflow/indicators-ingestion/usage-counts.md index fd98a43..b1a86bd 100644 --- a/versioned_docs/version-5.2.0/data-provision/indicators-ingestion/usage-counts.md +++ b/docs/graph-production-workflow/indicators-ingestion/usage-counts.md @@ -1,7 +1,7 @@ -# Usage Statistics Indicators +# Usage Statistics indicators Usage Statistics indicators for research products, like publications, datasets,etc., are an important complement to other (traditional and alternative) bibliometric indicators to provide a comprehensive and recent view of the impact of such resources but also about their authors, institutions and the platforms themselves. They are taking into account different levels of information: the usage of data sources, the usage of individual items in the context of their resource type and the usage of individual web resources or files. -Usage Statistics Indicators are built by the OpenAIRE's UsageCounts Service. The service collects usage data and consolidated usage statistics reports respectively, from its distributed network of data providers (repositories, e-journals, CRIS) by utilizing open standards and protocols and delivers reliable, consolidated and comparable usage metrics like counts of item downloads and metadata views conformant to COUNTER Code of Practice. +Usage Statistics Indicators are built by the OpenAIRE's UsageCounts service. 
The service collects usage data and consolidated usage statistics reports respectively, from its distributed network of data providers (repositories, e-journals, CRIS) by utilizing open standards and protocols and delivers reliable, consolidated and comparable usage metrics like counts of item downloads and metadata views conformant to COUNTER Code of Practice. You can find more information about the UsageCounts service [here](https://usagecounts.openaire.eu/). \ No newline at end of file diff --git a/docs/data-provision/merge-by-id.md b/docs/graph-production-workflow/merge-by-id.md similarity index 100% rename from docs/data-provision/merge-by-id.md rename to docs/graph-production-workflow/merge-by-id.md diff --git a/docs/data-provision/stats.md b/docs/graph-production-workflow/stats.md similarity index 100% rename from docs/data-provision/stats.md rename to docs/graph-production-workflow/stats.md diff --git a/sidebars.js b/sidebars.js index a5c625c..3f99733 100644 --- a/sidebars.js +++ b/sidebars.js @@ -67,35 +67,35 @@ const sidebars = { { type: 'category', label: "Graph production workflow", - link: {type: 'doc', id: 'data-provision/data-provision'}, + link: {type: 'doc', id: 'graph-production-workflow/graph-production-workflow'}, items: [ { type: 'category', label: "Aggregation", - link: {type: 'doc', id: 'data-provision/aggregation/aggregation'}, + link: {type: 'doc', id: 'graph-production-workflow/aggregation/aggregation'}, items: [ { type: 'doc', label: "OpenAIRE compatible sources", - id: 'data-provision/aggregation/compatible-sources', + id: 'graph-production-workflow/aggregation/compatible-sources', }, { type: 'category', label: "Non-compatible sources", link: { type: 'generated-index' }, items: [ - { type: 'doc', id: 'data-provision/aggregation/non-compatible-sources/doiboost', label: 'DOIBoost' }, - { type: 'doc', id: 'data-provision/aggregation/non-compatible-sources/pubmed' }, - { type: 'doc', id: 
'data-provision/aggregation/non-compatible-sources/datacite' }, - { type: 'doc', id: 'data-provision/aggregation/non-compatible-sources/ebi', label: 'EMBL-EBI' }, - { type: 'doc', id: 'data-provision/aggregation/non-compatible-sources/uniprot', label: 'UniProtKB/Swiss-Prot' } + { type: 'doc', id: 'graph-production-workflow/aggregation/non-compatible-sources/doiboost', label: 'DOIBoost' }, + { type: 'doc', id: 'graph-production-workflow/aggregation/non-compatible-sources/pubmed' }, + { type: 'doc', id: 'graph-production-workflow/aggregation/non-compatible-sources/datacite' }, + { type: 'doc', id: 'graph-production-workflow/aggregation/non-compatible-sources/ebi', label: 'EMBL-EBI' }, + { type: 'doc', id: 'graph-production-workflow/aggregation/non-compatible-sources/uniprot', label: 'UniProtKB/Swiss-Prot' } ] } ] }, { type: 'doc', - id: 'data-provision/merge-by-id' + id: 'graph-production-workflow/merge-by-id' }, { type: 'category', @@ -105,23 +105,23 @@ const sidebars = { description: 'The OpenAIRE Graph is enriched using the different Text and Data Mining (TDM) algorithms that are grouped in the following categories.' 
}, items: [ - { type: 'doc', id: 'data-provision/enrichment-by-mining/affiliation_matching' }, - { type: 'doc', id: 'data-provision/enrichment-by-mining/citation_matching' }, - { type: 'doc', id: 'data-provision/enrichment-by-mining/classifies' }, - { type: 'doc', id: 'data-provision/enrichment-by-mining/documents_similarity' }, - { type: 'doc', id: 'data-provision/enrichment-by-mining/acks' }, - { type: 'doc', id: 'data-provision/enrichment-by-mining/cites' }, - { type: 'doc', id: 'data-provision/enrichment-by-mining/metadata_extraction' }, + { type: 'doc', id: 'graph-production-workflow/enrichment-by-mining/affiliation_matching' }, + { type: 'doc', id: 'graph-production-workflow/enrichment-by-mining/citation_matching' }, + { type: 'doc', id: 'graph-production-workflow/enrichment-by-mining/classifies' }, + { type: 'doc', id: 'graph-production-workflow/enrichment-by-mining/documents_similarity' }, + { type: 'doc', id: 'graph-production-workflow/enrichment-by-mining/acks' }, + { type: 'doc', id: 'graph-production-workflow/enrichment-by-mining/cites' }, + { type: 'doc', id: 'graph-production-workflow/enrichment-by-mining/metadata_extraction' }, ] }, - { type: 'doc', id: 'data-provision/cleaning' }, + { type: 'doc', id: 'graph-production-workflow/cleaning' }, { type: 'category', label: "Deduplication", - link: {type: 'doc', id: 'data-provision/deduplication/deduplication'}, + link: {type: 'doc', id: 'graph-production-workflow/deduplication/deduplication'}, items: [ - { type: 'doc', id: 'data-provision/deduplication/research-products' }, - { type: 'doc', id: 'data-provision/deduplication/organizations' }, + { type: 'doc', id: 'graph-production-workflow/deduplication/research-products' }, + { type: 'doc', id: 'graph-production-workflow/deduplication/organizations' }, ] }, { @@ -133,26 +133,23 @@ const sidebars = { }, items: [ - { type: 'doc', id: 'data-provision/deduction-and-propagation/bulk-tagging' }, - { type: 'doc', id: 
'data-provision/deduction-and-propagation/propagation' }, + { type: 'doc', id: 'graph-production-workflow/deduction-and-propagation/bulk-tagging' }, + { type: 'doc', id: 'graph-production-workflow/deduction-and-propagation/propagation' }, ] }, { type: 'category', label: "Indicators ingestion", - link: { - type: 'generated-index' , - description: 'In this step, the following types of indicators are ingested in the OpenAIRE Graph.' + link: {type: 'doc', id: 'graph-production-workflow/indicators-ingestion/indicators-ingestion'}, - }, items: [ - { type: 'doc', id: 'data-provision/indicators-ingestion/impact-scores' }, - { type: 'doc', id: 'data-provision/indicators-ingestion/usage-counts' }, + { type: 'doc', id: 'graph-production-workflow/indicators-ingestion/impact-indicators' }, + { type: 'doc', id: 'graph-production-workflow/indicators-ingestion/usage-counts' }, ] }, - { type: 'doc', id: 'data-provision/finalisation' }, - { type: 'doc', id: 'data-provision/indexing' }, - { type: 'doc', id: 'data-provision/stats' } + { type: 'doc', id: 'graph-production-workflow/finalisation' }, + { type: 'doc', id: 'graph-production-workflow/indexing' }, + { type: 'doc', id: 'graph-production-workflow/stats' } ] }, { diff --git a/versioned_docs/version-5.2.0/changelog.md b/versioned_docs/version-5.2.0/changelog.md index c874cb7..c0ca8be 100644 --- a/versioned_docs/version-5.2.0/changelog.md +++ b/versioned_docs/version-5.2.0/changelog.md @@ -27,8 +27,8 @@ _Start Date: 2023-02-13 • Release Date: 2023-03-01 • Dump release: **n - Revised SDG classification: improved coverage (+600K classified DOIs) - General increase of the funded scientific outputs, thanks to the full text mining scanning new OpenAccess publications - Integrated contents from - - [EMBL-EBIs Protein Data Bank in Europe](/data-provision/aggregation/non-compatible-sources/ebi) - - [UniProtKB/Swiss-Prot](/data-provision/aggregation/non-compatible-sources/uniprot) + - [EMBL-EBIs Protein Data Bank in 
Europe](/graph-production-workflow/aggregation/non-compatible-sources/ebi) + - [UniProtKB/Swiss-Prot](/graph-production-workflow/aggregation/non-compatible-sources/uniprot) #### Changed diff --git a/versioned_docs/version-5.2.0/data-model/entities/other.md b/versioned_docs/version-5.2.0/data-model/entities/other.md index e066b5b..18c585a 100644 --- a/versioned_docs/version-5.2.0/data-model/entities/other.md +++ b/versioned_docs/version-5.2.0/data-model/entities/other.md @@ -615,7 +615,7 @@ _Type: [ImpactMeasures](#impactmeasures-1) &bull; Cardinality: ONE_ These impact-based indicators, provided by [BIP!](https://bip.imsi.athenarc.gr/), estimate the impact of a result. -For details about their calculation, please refer [here](/data-provision/indicators-ingestion/impact-scores). +For details about their calculation, please refer [here](/graph-production-workflow/indicators-ingestion/impact-indicators). ```json "impactMeasures": { @@ -682,7 +682,7 @@ The different impact-based indicators as computed by [BIP!](https://bip.imsi.ath _Type: [Score](#score) &bull; Cardinality: ONE_ This indicator reflects the overall/total impact of an article in the research community at large, based on the underlying citation network (diachronically). -For more details please refer [here](/data-provision/indicators-ingestion/impact-scores#pagerank-pr). +For more details please refer [here](/graph-production-workflow/indicators-ingestion/impact-indicators#pagerank-pr). ```json "influence": { @@ -695,7 +695,7 @@ For more details please refer [here](/data-provision/indicators-ingestion/impact _Type: [Score](#score) &bull; Cardinality: ONE_ This is an alternative to the "Influence" indicator, which also reflects the overall/total impact of an article in the research community at large, based on the underlying citation network (diachronically). -For more details please refer [here](/data-provision/indicators-ingestion/impact-scores#citation-count-cc).
+For more details please refer [here](/graph-production-workflow/indicators-ingestion/impact-indicators#citation-count-cc). ```json "influence_alt" :{ @@ -708,7 +708,7 @@ For more details please refer [here](/data-provision/indicators-ingestion/impact _Type: [Score](#score) &bull; Cardinality: ONE_ This indicator reflects the "current" impact/attention (the "hype") of an article in the research community at large, based on the underlying citation network. -For more details please refer [here](/data-provision/indicators-ingestion/impact-scores#attrank). +For more details please refer [here](/graph-production-workflow/indicators-ingestion/impact-indicators#attrank). ```json "popularity":{ @@ -722,7 +722,7 @@ For more details please refer [here](/data-provision/indicators-ingestion/impact _Type: [Score](#score) &bull; Cardinality: ONE_ This is an alternative to the "Popularity" indicator, which also reflects the "current" impact/attention (the "hype") of an article in the research community at large, based on the underlying citation network. -For more details please refer [here](/data-provision/indicators-ingestion/impact-scores#ram). +For more details please refer [here](/graph-production-workflow/indicators-ingestion/impact-indicators#ram). ```json "popularity_alt":{ @@ -736,7 +736,7 @@ For more details please refer [here](/data-provision/indicators-ingestion/impact _Type: [Score](#score) &bull; Cardinality: ONE_ This indicator reflects the initial momentum of an article directly after its publication, based on the underlying citation network. -For more details please refer [here](/data-provision/indicators-ingestion/impact-scores#incubation-citation-count-icc). +For more details please refer [here](/graph-production-workflow/indicators-ingestion/impact-indicators#incubation-citation-count-icc).
```json "impulse":{ diff --git a/versioned_docs/version-5.2.0/data-model/entities/result.md b/versioned_docs/version-5.2.0/data-model/entities/result.md index f0abfcc..4b1a321 100644 --- a/versioned_docs/version-5.2.0/data-model/entities/result.md +++ b/versioned_docs/version-5.2.0/data-model/entities/result.md @@ -187,7 +187,7 @@ Date when the embargo ends and this result turns Open Access. _Type: [Indicator](other#indicator) &bull; Cardinality: ONE_ The indicators computed for this result; -currently, the following two types of indicators are supported: [impact indicators](/data-provision/indicators-ingestion/impact-scores) and [usage statistics indicators](/data-provision/indicators-ingestion/usage-counts). +currently, the following two types of indicators are supported: [impact indicators](/graph-production-workflow/indicators-ingestion/impact-indicators) and [usage statistics indicators](/graph-production-workflow/indicators-ingestion/usage-counts). ```json "indicators": { diff --git a/versioned_docs/version-5.2.0/data-model/pids-and-identifiers.md b/versioned_docs/version-5.2.0/data-model/pids-and-identifiers.md index de31912..c613366 100644 --- a/versioned_docs/version-5.2.0/data-model/pids-and-identifiers.md +++ b/versioned_docs/version-5.2.0/data-model/pids-and-identifiers.md @@ -77,5 +77,5 @@ Currently, the following data sources are used as "PID authorities": | pdb | `pdb_________` | EMBL-EBI | | uniprot | `uniprot_____` | EMBL-EBI | -OpenAIRE also perform duplicate identification (see the [dedicated section for details](/data-provision/deduplication)). +OpenAIRE also performs duplicate identification (see the [dedicated section for details](/graph-production-workflow/deduplication)). All duplicates are **merged** together in a **representative record** which must be assigned a dedicated OpenAIRE identifier (i.e. it cannot have the identifier of one of the aggregated record).
diff --git a/versioned_docs/version-5.2.0/data-provision/_category_.json b/versioned_docs/version-5.2.0/data-provision/_category_.json deleted file mode 100644 index 80915c5..0000000 --- a/versioned_docs/version-5.2.0/data-provision/_category_.json +++ /dev/null @@ -1,8 +0,0 @@ -{ - "label": "Data provision", - "position": 6, - "link": { - "type": "doc", - "id": "data-provision" - } -} \ No newline at end of file diff --git a/versioned_docs/version-5.2.0/downloads/subgraphs.md b/versioned_docs/version-5.2.0/downloads/subgraphs.md index 2c91970..7fd5e97 100644 --- a/versioned_docs/version-5.2.0/downloads/subgraphs.md +++ b/versioned_docs/version-5.2.0/downloads/subgraphs.md @@ -5,7 +5,7 @@ sidebar_position: 3 # Sub-graph dumps :::caution -This version is not accompanied with public dump files, hence the files in this section are based on [v5.0.0](/docs/5.0.0/) of the Graph. The data of v.5.1.0 are only exposed via the [OpenAIRE Graph API](https://graph.openaire.eu/develop/) and added-value services that are built on top of this version of the Graph (e.g., the [OpenAIRE Explore](https://explore.openaire.eu/)). If you would be interested to get bulk access to Graph v5.1.0 data, please contact us via our [helpdesk](https://graph.openaire.eu/support). +This version is not accompanied with public dump files, hence the files in this section are based on [v5.0.0](/docs/5.0.0/) of the Graph. More recent versions of the data are only exposed via the [OpenAIRE Graph API](https://graph.openaire.eu/develop/) and added-value services that are built on top of this version of the Graph (e.g., the [OpenAIRE Explore](https://explore.openaire.eu/)). If you would be interested to get bulk access to more recent versions of the Graph data, please contact us via our [helpdesk](https://graph.openaire.eu/support). ::: In order to facilitate users, different dumps are available under the Zenodo community called [OpenAIRE Graph](https://zenodo.org/communities/openaire-research-graph). 
diff --git a/versioned_docs/version-5.2.0/graph-production-workflow/_category_.json b/versioned_docs/version-5.2.0/graph-production-workflow/_category_.json new file mode 100644 index 0000000..8da8ce0 --- /dev/null +++ b/versioned_docs/version-5.2.0/graph-production-workflow/_category_.json @@ -0,0 +1,8 @@ +{ + "label": "Graph production workflow", + "position": 6, + "link": { + "type": "doc", + "id": "graph-production-workflow" + } +} \ No newline at end of file diff --git a/versioned_docs/version-5.2.0/data-provision/aggregation/aggregation.md b/versioned_docs/version-5.2.0/graph-production-workflow/aggregation/aggregation.md similarity index 100% rename from versioned_docs/version-5.2.0/data-provision/aggregation/aggregation.md rename to versioned_docs/version-5.2.0/graph-production-workflow/aggregation/aggregation.md diff --git a/versioned_docs/version-5.2.0/data-provision/aggregation/compatible-sources.md b/versioned_docs/version-5.2.0/graph-production-workflow/aggregation/compatible-sources.md similarity index 100% rename from versioned_docs/version-5.2.0/data-provision/aggregation/compatible-sources.md rename to versioned_docs/version-5.2.0/graph-production-workflow/aggregation/compatible-sources.md diff --git a/versioned_docs/version-5.2.0/data-provision/aggregation/non-compatible-sources/datacite.md b/versioned_docs/version-5.2.0/graph-production-workflow/aggregation/non-compatible-sources/datacite.md similarity index 100% rename from versioned_docs/version-5.2.0/data-provision/aggregation/non-compatible-sources/datacite.md rename to versioned_docs/version-5.2.0/graph-production-workflow/aggregation/non-compatible-sources/datacite.md diff --git a/versioned_docs/version-5.2.0/data-provision/aggregation/non-compatible-sources/doiboost.md b/versioned_docs/version-5.2.0/graph-production-workflow/aggregation/non-compatible-sources/doiboost.md similarity index 100% rename from 
versioned_docs/version-5.2.0/data-provision/aggregation/non-compatible-sources/doiboost.md rename to versioned_docs/version-5.2.0/graph-production-workflow/aggregation/non-compatible-sources/doiboost.md diff --git a/versioned_docs/version-5.2.0/data-provision/aggregation/non-compatible-sources/ebi.md b/versioned_docs/version-5.2.0/graph-production-workflow/aggregation/non-compatible-sources/ebi.md similarity index 100% rename from versioned_docs/version-5.2.0/data-provision/aggregation/non-compatible-sources/ebi.md rename to versioned_docs/version-5.2.0/graph-production-workflow/aggregation/non-compatible-sources/ebi.md diff --git a/versioned_docs/version-5.2.0/data-provision/aggregation/non-compatible-sources/pubmed.md b/versioned_docs/version-5.2.0/graph-production-workflow/aggregation/non-compatible-sources/pubmed.md similarity index 100% rename from versioned_docs/version-5.2.0/data-provision/aggregation/non-compatible-sources/pubmed.md rename to versioned_docs/version-5.2.0/graph-production-workflow/aggregation/non-compatible-sources/pubmed.md diff --git a/versioned_docs/version-5.2.0/data-provision/aggregation/non-compatible-sources/uniprot.md b/versioned_docs/version-5.2.0/graph-production-workflow/aggregation/non-compatible-sources/uniprot.md similarity index 100% rename from versioned_docs/version-5.2.0/data-provision/aggregation/non-compatible-sources/uniprot.md rename to versioned_docs/version-5.2.0/graph-production-workflow/aggregation/non-compatible-sources/uniprot.md diff --git a/versioned_docs/version-5.2.0/data-provision/cleaning.md b/versioned_docs/version-5.2.0/graph-production-workflow/cleaning.md similarity index 100% rename from versioned_docs/version-5.2.0/data-provision/cleaning.md rename to versioned_docs/version-5.2.0/graph-production-workflow/cleaning.md diff --git a/versioned_docs/version-5.2.0/data-provision/deduction-and-propagation/bulk-tagging.md 
b/versioned_docs/version-5.2.0/graph-production-workflow/deduction-and-propagation/bulk-tagging.md similarity index 100% rename from versioned_docs/version-5.2.0/data-provision/deduction-and-propagation/bulk-tagging.md rename to versioned_docs/version-5.2.0/graph-production-workflow/deduction-and-propagation/bulk-tagging.md diff --git a/versioned_docs/version-5.2.0/data-provision/deduction-and-propagation/propagation.md b/versioned_docs/version-5.2.0/graph-production-workflow/deduction-and-propagation/propagation.md similarity index 100% rename from versioned_docs/version-5.2.0/data-provision/deduction-and-propagation/propagation.md rename to versioned_docs/version-5.2.0/graph-production-workflow/deduction-and-propagation/propagation.md diff --git a/versioned_docs/version-5.2.0/data-provision/deduplication/_category_.json b/versioned_docs/version-5.2.0/graph-production-workflow/deduplication/_category_.json similarity index 100% rename from versioned_docs/version-5.2.0/data-provision/deduplication/_category_.json rename to versioned_docs/version-5.2.0/graph-production-workflow/deduplication/_category_.json diff --git a/versioned_docs/version-5.2.0/data-provision/deduplication/clustering-functions.md b/versioned_docs/version-5.2.0/graph-production-workflow/deduplication/clustering-functions.md similarity index 100% rename from versioned_docs/version-5.2.0/data-provision/deduplication/clustering-functions.md rename to versioned_docs/version-5.2.0/graph-production-workflow/deduplication/clustering-functions.md diff --git a/versioned_docs/version-5.2.0/data-provision/deduplication/deduplication.md b/versioned_docs/version-5.2.0/graph-production-workflow/deduplication/deduplication.md similarity index 100% rename from versioned_docs/version-5.2.0/data-provision/deduplication/deduplication.md rename to versioned_docs/version-5.2.0/graph-production-workflow/deduplication/deduplication.md diff --git 
a/versioned_docs/version-5.2.0/data-provision/deduplication/organizations.md b/versioned_docs/version-5.2.0/graph-production-workflow/deduplication/organizations.md similarity index 100% rename from versioned_docs/version-5.2.0/data-provision/deduplication/organizations.md rename to versioned_docs/version-5.2.0/graph-production-workflow/deduplication/organizations.md diff --git a/versioned_docs/version-5.2.0/data-provision/deduplication/research-products.md b/versioned_docs/version-5.2.0/graph-production-workflow/deduplication/research-products.md similarity index 100% rename from versioned_docs/version-5.2.0/data-provision/deduplication/research-products.md rename to versioned_docs/version-5.2.0/graph-production-workflow/deduplication/research-products.md diff --git a/versioned_docs/version-5.2.0/data-provision/enrichment-by-mining/_category_.json b/versioned_docs/version-5.2.0/graph-production-workflow/enrichment-by-mining/_category_.json similarity index 100% rename from versioned_docs/version-5.2.0/data-provision/enrichment-by-mining/_category_.json rename to versioned_docs/version-5.2.0/graph-production-workflow/enrichment-by-mining/_category_.json diff --git a/versioned_docs/version-5.2.0/data-provision/enrichment-by-mining/acks.md b/versioned_docs/version-5.2.0/graph-production-workflow/enrichment-by-mining/acks.md similarity index 100% rename from versioned_docs/version-5.2.0/data-provision/enrichment-by-mining/acks.md rename to versioned_docs/version-5.2.0/graph-production-workflow/enrichment-by-mining/acks.md diff --git a/versioned_docs/version-5.2.0/data-provision/enrichment-by-mining/affiliation_matching.md b/versioned_docs/version-5.2.0/graph-production-workflow/enrichment-by-mining/affiliation_matching.md similarity index 100% rename from versioned_docs/version-5.2.0/data-provision/enrichment-by-mining/affiliation_matching.md rename to versioned_docs/version-5.2.0/graph-production-workflow/enrichment-by-mining/affiliation_matching.md diff --git 
a/versioned_docs/version-5.2.0/data-provision/enrichment-by-mining/citation_matching.md b/versioned_docs/version-5.2.0/graph-production-workflow/enrichment-by-mining/citation_matching.md similarity index 100% rename from versioned_docs/version-5.2.0/data-provision/enrichment-by-mining/citation_matching.md rename to versioned_docs/version-5.2.0/graph-production-workflow/enrichment-by-mining/citation_matching.md diff --git a/versioned_docs/version-5.2.0/data-provision/enrichment-by-mining/cites.md b/versioned_docs/version-5.2.0/graph-production-workflow/enrichment-by-mining/cites.md similarity index 100% rename from versioned_docs/version-5.2.0/data-provision/enrichment-by-mining/cites.md rename to versioned_docs/version-5.2.0/graph-production-workflow/enrichment-by-mining/cites.md diff --git a/versioned_docs/version-5.2.0/data-provision/enrichment-by-mining/classifies.md b/versioned_docs/version-5.2.0/graph-production-workflow/enrichment-by-mining/classifies.md similarity index 100% rename from versioned_docs/version-5.2.0/data-provision/enrichment-by-mining/classifies.md rename to versioned_docs/version-5.2.0/graph-production-workflow/enrichment-by-mining/classifies.md diff --git a/versioned_docs/version-5.2.0/data-provision/enrichment-by-mining/documents_similarity.md b/versioned_docs/version-5.2.0/graph-production-workflow/enrichment-by-mining/documents_similarity.md similarity index 100% rename from versioned_docs/version-5.2.0/data-provision/enrichment-by-mining/documents_similarity.md rename to versioned_docs/version-5.2.0/graph-production-workflow/enrichment-by-mining/documents_similarity.md diff --git a/versioned_docs/version-5.2.0/data-provision/enrichment-by-mining/img.png b/versioned_docs/version-5.2.0/graph-production-workflow/enrichment-by-mining/img.png similarity index 100% rename from versioned_docs/version-5.2.0/data-provision/enrichment-by-mining/img.png rename to versioned_docs/version-5.2.0/graph-production-workflow/enrichment-by-mining/img.png 
diff --git a/versioned_docs/version-5.2.0/data-provision/enrichment-by-mining/metadata_extraction.md b/versioned_docs/version-5.2.0/graph-production-workflow/enrichment-by-mining/metadata_extraction.md similarity index 100% rename from versioned_docs/version-5.2.0/data-provision/enrichment-by-mining/metadata_extraction.md rename to versioned_docs/version-5.2.0/graph-production-workflow/enrichment-by-mining/metadata_extraction.md diff --git a/versioned_docs/version-5.2.0/data-provision/finalisation.md b/versioned_docs/version-5.2.0/graph-production-workflow/finalisation.md similarity index 89% rename from versioned_docs/version-5.2.0/data-provision/finalisation.md rename to versioned_docs/version-5.2.0/graph-production-workflow/finalisation.md index 22e5ca9..06548dc 100644 --- a/versioned_docs/version-5.2.0/data-provision/finalisation.md +++ b/versioned_docs/version-5.2.0/graph-production-workflow/finalisation.md @@ -10,7 +10,7 @@ Bibliographic records that do not meet minimal requirements for being part of th Currently, the only criteria applied horizontally to the entire graph aims at excluding scientific results whose title is not meaningful for citation purposes. 
Then, different criteria are applied in the pre-processing of specific sub-collections: -* [Crossref filtering](/data-provision/aggregation/non-compatible-sources/doiboost#crossref-filtering) +* [Crossref filtering](/graph-production-workflow/aggregation/non-compatible-sources/doiboost#crossref-filtering) ## Country cleaning diff --git a/versioned_docs/version-5.2.0/data-provision/data-provision.md b/versioned_docs/version-5.2.0/graph-production-workflow/graph-production-workflow.md similarity index 100% rename from versioned_docs/version-5.2.0/data-provision/data-provision.md rename to versioned_docs/version-5.2.0/graph-production-workflow/graph-production-workflow.md diff --git a/versioned_docs/version-5.2.0/data-provision/indexing.md b/versioned_docs/version-5.2.0/graph-production-workflow/indexing.md similarity index 100% rename from versioned_docs/version-5.2.0/data-provision/indexing.md rename to versioned_docs/version-5.2.0/graph-production-workflow/indexing.md diff --git a/docs/data-provision/indicators-ingestion/impact-scores.md b/versioned_docs/version-5.2.0/graph-production-workflow/indicators-ingestion/impact-indicators.md similarity index 96% rename from docs/data-provision/indicators-ingestion/impact-scores.md rename to versioned_docs/version-5.2.0/graph-production-workflow/indicators-ingestion/impact-indicators.md index b5d9bcd..6c90186 100644 --- a/docs/data-provision/indicators-ingestion/impact-scores.md +++ b/versioned_docs/version-5.2.0/graph-production-workflow/indicators-ingestion/impact-indicators.md @@ -1,6 +1,7 @@ # Impact indicators -This page summarises all calculated impact indicators, which are included in the [impactMeasures](/data-model/entities/other#impactmeasures) property which is part of the [indicators](/data-model/entities/result#indicators) property of the result. 
+This page summarises all calculated impact indicators, provided by [BIP!](https://bip.imsi.athenarc.gr/), which are included in the [impactMeasures](/data-model/entities/other#impactmeasures) property (found under the [indicators](/data-model/entities/result#indicators) property of the result). + It should be noted that the impact indicators are being calculated on the level of the research output. Below we explain their main intuition, the way they are calculated, and their most important limitations, in an attempt help avoiding common pitfalls and misuses. diff --git a/versioned_docs/version-5.2.0/graph-production-workflow/indicators-ingestion/indicators-ingestion.md b/versioned_docs/version-5.2.0/graph-production-workflow/indicators-ingestion/indicators-ingestion.md new file mode 100644 index 0000000..4402287 --- /dev/null +++ b/versioned_docs/version-5.2.0/graph-production-workflow/indicators-ingestion/indicators-ingestion.md @@ -0,0 +1,8 @@ +import DocCardList from '@theme/DocCardList'; + +# Indicators ingestion + +In this step, results are enriched with Impact and Usage Statistics indicators. +The former are provided by [BIP!](https://bip.imsi.athenarc.gr/) while the latter are computed by OpenAIRE's [UsageCounts service](https://usagecounts.openaire.eu/). 
+ + \ No newline at end of file diff --git a/docs/data-provision/indicators-ingestion/usage-counts.md b/versioned_docs/version-5.2.0/graph-production-workflow/indicators-ingestion/usage-counts.md similarity index 88% rename from docs/data-provision/indicators-ingestion/usage-counts.md rename to versioned_docs/version-5.2.0/graph-production-workflow/indicators-ingestion/usage-counts.md index fd98a43..b1a86bd 100644 --- a/docs/data-provision/indicators-ingestion/usage-counts.md +++ b/versioned_docs/version-5.2.0/graph-production-workflow/indicators-ingestion/usage-counts.md @@ -1,7 +1,7 @@ -# Usage Statistics Indicators +# Usage Statistics indicators Usage Statistics indicators for research products, like publications, datasets,etc., are an important complement to other (traditional and alternative) bibliometric indicators to provide a comprehensive and recent view of the impact of such resources but also about their authors, institutions and the platforms themselves. They are taking into account different levels of information: the usage of data sources, the usage of individual items in the context of their resource type and the usage of individual web resources or files. -Usage Statistics Indicators are built by the OpenAIRE's UsageCounts Service. The service collects usage data and consolidated usage statistics reports respectively, from its distributed network of data providers (repositories, e-journals, CRIS) by utilizing open standards and protocols and delivers reliable, consolidated and comparable usage metrics like counts of item downloads and metadata views conformant to COUNTER Code of Practice. +Usage Statistics Indicators are built by the OpenAIRE's UsageCounts service. 
The service collects usage data and consolidated usage statistics reports respectively, from its distributed network of data providers (repositories, e-journals, CRIS) by utilizing open standards and protocols and delivers reliable, consolidated and comparable usage metrics like counts of item downloads and metadata views conformant to COUNTER Code of Practice. You can find more information about the UsageCounts service [here](https://usagecounts.openaire.eu/). \ No newline at end of file diff --git a/versioned_docs/version-5.2.0/data-provision/merge-by-id.md b/versioned_docs/version-5.2.0/graph-production-workflow/merge-by-id.md similarity index 100% rename from versioned_docs/version-5.2.0/data-provision/merge-by-id.md rename to versioned_docs/version-5.2.0/graph-production-workflow/merge-by-id.md diff --git a/versioned_docs/version-5.2.0/data-provision/stats.md b/versioned_docs/version-5.2.0/graph-production-workflow/stats.md similarity index 100% rename from versioned_docs/version-5.2.0/data-provision/stats.md rename to versioned_docs/version-5.2.0/graph-production-workflow/stats.md diff --git a/versioned_sidebars/version-5.2.0-sidebars.json b/versioned_sidebars/version-5.2.0-sidebars.json index 382912b..3188c4d 100644 --- a/versioned_sidebars/version-5.2.0-sidebars.json +++ b/versioned_sidebars/version-5.2.0-sidebars.json @@ -88,7 +88,7 @@ "label": "Graph production workflow", "link": { "type": "doc", - "id": "data-provision/data-provision" + "id": "graph-production-workflow/graph-production-workflow" }, "items": [ { @@ -96,13 +96,13 @@ "label": "Aggregation", "link": { "type": "doc", - "id": "data-provision/aggregation/aggregation" + "id": "graph-production-workflow/aggregation/aggregation" }, "items": [ { "type": "doc", "label": "OpenAIRE compatible sources", - "id": "data-provision/aggregation/compatible-sources" + "id": "graph-production-workflow/aggregation/compatible-sources" }, { "type": "category", @@ -113,25 +113,25 @@ "items": [ { "type": "doc", - 
"id": "data-provision/aggregation/non-compatible-sources/doiboost", + "id": "graph-production-workflow/aggregation/non-compatible-sources/doiboost", "label": "DOIBoost" }, { "type": "doc", - "id": "data-provision/aggregation/non-compatible-sources/pubmed" + "id": "graph-production-workflow/aggregation/non-compatible-sources/pubmed" }, { "type": "doc", - "id": "data-provision/aggregation/non-compatible-sources/datacite" + "id": "graph-production-workflow/aggregation/non-compatible-sources/datacite" }, { "type": "doc", - "id": "data-provision/aggregation/non-compatible-sources/ebi", + "id": "graph-production-workflow/aggregation/non-compatible-sources/ebi", "label": "EMBL-EBI" }, { "type": "doc", - "id": "data-provision/aggregation/non-compatible-sources/uniprot", + "id": "graph-production-workflow/aggregation/non-compatible-sources/uniprot", "label": "UniProtKB/Swiss-Prot" } ] @@ -140,7 +140,7 @@ }, { "type": "doc", - "id": "data-provision/merge-by-id" + "id": "graph-production-workflow/merge-by-id" }, { "type": "category", @@ -152,53 +152,53 @@ "items": [ { "type": "doc", - "id": "data-provision/enrichment-by-mining/affiliation_matching" + "id": "graph-production-workflow/enrichment-by-mining/affiliation_matching" }, { "type": "doc", - "id": "data-provision/enrichment-by-mining/citation_matching" + "id": "graph-production-workflow/enrichment-by-mining/citation_matching" }, { "type": "doc", - "id": "data-provision/enrichment-by-mining/classifies" + "id": "graph-production-workflow/enrichment-by-mining/classifies" }, { "type": "doc", - "id": "data-provision/enrichment-by-mining/documents_similarity" + "id": "graph-production-workflow/enrichment-by-mining/documents_similarity" }, { "type": "doc", - "id": "data-provision/enrichment-by-mining/acks" + "id": "graph-production-workflow/enrichment-by-mining/acks" }, { "type": "doc", - "id": "data-provision/enrichment-by-mining/cites" + "id": "graph-production-workflow/enrichment-by-mining/cites" }, { "type": "doc", - "id": 
"data-provision/enrichment-by-mining/metadata_extraction" + "id": "graph-production-workflow/enrichment-by-mining/metadata_extraction" } ] }, { "type": "doc", - "id": "data-provision/cleaning" + "id": "graph-production-workflow/cleaning" }, { "type": "category", "label": "Deduplication", "link": { "type": "doc", - "id": "data-provision/deduplication/deduplication" + "id": "graph-production-workflow/deduplication/deduplication" }, "items": [ { "type": "doc", - "id": "data-provision/deduplication/research-products" + "id": "graph-production-workflow/deduplication/research-products" }, { "type": "doc", - "id": "data-provision/deduplication/organizations" + "id": "graph-production-workflow/deduplication/organizations" } ] }, @@ -212,11 +212,11 @@ "items": [ { "type": "doc", - "id": "data-provision/deduction-and-propagation/bulk-tagging" + "id": "graph-production-workflow/deduction-and-propagation/bulk-tagging" }, { "type": "doc", - "id": "data-provision/deduction-and-propagation/propagation" + "id": "graph-production-workflow/deduction-and-propagation/propagation" } ] }, @@ -224,31 +224,31 @@ "type": "category", "label": "Indicators ingestion", "link": { - "type": "generated-index", - "description": "In this step, the following types of indicators are ingested in the OpenAIRE Graph." 
+ "type": "doc", + "id": "graph-production-workflow/indicators-ingestion/indicators-ingestion" }, "items": [ { "type": "doc", - "id": "data-provision/indicators-ingestion/impact-scores" + "id": "graph-production-workflow/indicators-ingestion/impact-indicators" }, { "type": "doc", - "id": "data-provision/indicators-ingestion/usage-counts" + "id": "graph-production-workflow/indicators-ingestion/usage-counts" } ] }, { "type": "doc", - "id": "data-provision/finalisation" + "id": "graph-production-workflow/finalisation" }, { "type": "doc", - "id": "data-provision/indexing" + "id": "graph-production-workflow/indexing" }, { "type": "doc", - "id": "data-provision/stats" + "id": "graph-production-workflow/stats" } ] },