diff --git a/dhp-workflows/dhp-worfklow-profiles/src/main/resources/eu/dnetlib/dhp/wf/profiles/graph_construction.xml b/dhp-workflows/dhp-worfklow-profiles/src/main/resources/eu/dnetlib/dhp/wf/profiles/graph_construction.xml
index 819b3e12d..4d77883b4 100644
--- a/dhp-workflows/dhp-worfklow-profiles/src/main/resources/eu/dnetlib/dhp/wf/profiles/graph_construction.xml
+++ b/dhp-workflows/dhp-worfklow-profiles/src/main/resources/eu/dnetlib/dhp/wf/profiles/graph_construction.xml
@@ -11,6 +11,29 @@
Data Provision
30
+
+
+ reuse cached content from the aggregation system
+
+ reuseContent
+ true
+
+
+
+
+
+
+
+ set the aggregator content path
+
+ contentPath
+ /tmp/beta_aggregator
+
+
+
+
+
+
Set the path containing the AGGREGATOR graph
@@ -62,87 +85,94 @@
-
- Set the target path to store the CLEANED graph
+
+ Set the target path to store the ORCID enriched graph
- cleanedGraphPath
- /tmp/beta_provision/graph/05_graph_cleaned
+ orcidGraphPath
+ /tmp/beta_provision/graph/05_graph_orcid
-
- Set the target path to store the ORCID enriched graph
-
- orcidGraphPath
- /tmp/beta_provision/graph/06_graph_orcid
-
-
-
-
-
Set the target path to store the BULK TAGGED graph
bulkTaggingGraphPath
- /tmp/beta_provision/graph/07_graph_bulktagging
+ /tmp/beta_provision/graph/06_graph_bulktagging
+
Set the target path to store the AFFILIATION from INSTITUTIONAL REPOS graph
affiliationGraphPath
- /tmp/beta_provision/graph/08_graph_affiliation
+ /tmp/beta_provision/graph/07_graph_affiliation
+
Set the target path to store the COMMUNITY from SELECTED SOURCES graph
communityOrganizationGraphPath
- /tmp/beta_provision/graph/09_graph_comunity_organization
+ /tmp/beta_provision/graph/08_graph_comunity_organization
+
Set the target path to store the FUNDING from SEMANTIC RELATION graph
fundingGraphPath
- /tmp/beta_provision/graph/10_graph_funding
+ /tmp/beta_provision/graph/09_graph_funding
+
Set the target path to store the COMMUNITY from SEMANTIC RELATION graph
communitySemRelGraphPath
- /tmp/beta_provision/graph/11_graph_comunity_sem_rel
+ /tmp/beta_provision/graph/10_graph_comunity_sem_rel
+
Set the target path to store the COUNTRY enriched graph
countryGraphPath
- /tmp/beta_provision/graph/12_graph_country
+ /tmp/beta_provision/graph/11_graph_country
+
+
+ Set the target path to store the CLEANED graph
+
+ cleanedGraphPath
+ /tmp/beta_provision/graph/12_graph_cleaned
+
+
+
+
+
+
Set the target path to store the blacklisted graph
@@ -153,6 +183,7 @@
+
Set the lookup address
@@ -163,6 +194,7 @@
+
Set the map of paths for the Bulk Tagging
@@ -173,6 +205,7 @@
+
Set the map of associations organization, community list for the propagation of community to result through organization
@@ -185,6 +218,7 @@
+
Set the dedup orchestrator name
@@ -195,6 +229,7 @@
+
declares the ActionSet ids to promote in the RAW graph
@@ -205,6 +240,7 @@
+
declares the ActionSet ids to promote in the INFERRED graph
@@ -215,6 +251,7 @@
+
wait configurations
@@ -222,6 +259,7 @@
+
create the AGGREGATOR graph
@@ -230,7 +268,9 @@
{
'graphOutputPath' : 'aggregatorGraphPath',
- 'isLookupUrl' : 'isLookUpUrl'
+ 'isLookupUrl' : 'isLookUpUrl',
+ 'reuseContent' : 'reuseContent',
+ 'contentPath' : 'contentPath'
}
@@ -241,8 +281,6 @@
'postgresURL' : 'jdbc:postgresql://beta.services.openaire.eu:5432/dnet_openaireplus',
'postgresUser' : 'dnet',
'postgresPassword' : '',
- 'reuseContent' : 'false',
- 'contentPath' : '/tmp/beta_provision/aggregator',
'workingDir' : '/tmp/beta_provision/working_dir/aggregator'
}
@@ -252,6 +290,7 @@
+
create the RAW graph
@@ -289,6 +328,7 @@
+
search for duplicates in the raw graph
@@ -314,6 +354,7 @@
+
create the INFERRED graph
@@ -351,6 +392,7 @@
+
mark duplicates as deleted and redistribute the relationships
@@ -375,41 +417,6 @@
-
- clean the properties in the graph typed as Qualifier according to the vocabulary indicated in schemeid
-
- executeOozieJob
- IIS
-
- {
- 'graphInputPath' : 'consistentGraphPath',
- 'graphOutputPath': 'cleanedGraphPath',
- 'isLookupUrl': 'isLookUpUrl'
- }
-
-
- {
- 'oozie.wf.application.path' : '/lib/dnet/oa/graph/clean/oozie_app',
- 'workingPath' : '/tmp/beta_provision/working_dir/clean'
- }
-
- build-report
-
-
-
-
-
-
-
- Do we skip the graph enrichment steps? (Yes to prepare the graph for the IIS)
-
- NO
-
-
-
-
-
-
propagates ORCID among results linked by allowedsemrels semantic relationships
@@ -417,7 +424,7 @@
IIS
{
- 'sourcePath' : 'cleanedGraphPath',
+ 'sourcePath' : 'consistentGraphPath',
'outputPath': 'orcidGraphPath'
}
@@ -435,6 +442,7 @@
+
mark results respecting some rules as belonging to communities
@@ -460,6 +468,7 @@
+
creates relationships between results and organizations when the organizations are associated to institutional repositories
@@ -484,6 +493,7 @@
+
marks as belonging to communities the result collected from datasources related to the organizations specified in the organizationCommunityMap
@@ -509,6 +519,7 @@
+
creates relations between projects and results linked to other results through allowedsemrel semantic relations linked to projects
@@ -534,6 +545,7 @@
+
tags as belonging to communities the results in allowedsemrels relation with other results already linked to communities
@@ -560,6 +572,7 @@
+
associates to results collected from allowedtypes and those in the whitelist the country of the organization(s) handling the datasource they are collected from
@@ -584,10 +597,36 @@
build-report
+
+
+
+
+
+
+ clean the properties in the graph typed as Qualifier according to the vocabulary indicated in schemeid
+
+ executeOozieJob
+ IIS
+
+ {
+ 'graphInputPath' : 'countryGraphPath',
+ 'graphOutputPath': 'cleanedGraphPath',
+ 'isLookupUrl': 'isLookUpUrl'
+ }
+
+
+ {
+ 'oozie.wf.application.path' : '/lib/dnet/oa/graph/clean/oozie_app',
+ 'workingPath' : '/tmp/beta_provision/working_dir/clean'
+ }
+
+ build-report
+
+
removes blacklisted relations
@@ -595,7 +634,7 @@
IIS
{
- 'sourcePath' : 'countryGraphPath',
+ 'sourcePath' : 'cleanedGraphPath',
'outputPath': 'blacklistedGraphPath'
}