diff --git a/dhp-build/dhp-build-assembly-resources/pom.xml b/dhp-build/dhp-build-assembly-resources/pom.xml
index 0c4637def4..c837cd5386 100644
--- a/dhp-build/dhp-build-assembly-resources/pom.xml
+++ b/dhp-build/dhp-build-assembly-resources/pom.xml
@@ -6,7 +6,7 @@
eu.dnetlib.dhp
dhp-build
- 1.1.6-SNAPSHOT
+ 1.1.7-SNAPSHOT
dhp-build-assembly-resources
diff --git a/dhp-build/dhp-build-properties-maven-plugin/pom.xml b/dhp-build/dhp-build-properties-maven-plugin/pom.xml
index 308d787157..df5045fcb6 100644
--- a/dhp-build/dhp-build-properties-maven-plugin/pom.xml
+++ b/dhp-build/dhp-build-properties-maven-plugin/pom.xml
@@ -6,7 +6,7 @@
eu.dnetlib.dhp
dhp-build
- 1.1.6-SNAPSHOT
+ 1.1.7-SNAPSHOT
dhp-build-properties-maven-plugin
@@ -102,7 +102,7 @@
-
+
diff --git a/dhp-build/pom.xml b/dhp-build/pom.xml
index e471af76d5..3b54b4e61a 100644
--- a/dhp-build/pom.xml
+++ b/dhp-build/pom.xml
@@ -4,7 +4,7 @@
eu.dnetlib.dhp
dhp
- 1.1.6-SNAPSHOT
+ 1.1.7-SNAPSHOT
dhp-build
pom
diff --git a/dhp-common/pom.xml b/dhp-common/pom.xml
index f6283d450c..1268afa3a1 100644
--- a/dhp-common/pom.xml
+++ b/dhp-common/pom.xml
@@ -5,7 +5,7 @@
eu.dnetlib.dhp
dhp
- 1.1.6-SNAPSHOT
+ 1.1.7-SNAPSHOT
../
diff --git a/dhp-schemas/pom.xml b/dhp-schemas/pom.xml
index a85c0dd230..8deb2eab23 100644
--- a/dhp-schemas/pom.xml
+++ b/dhp-schemas/pom.xml
@@ -5,7 +5,7 @@
eu.dnetlib.dhp
dhp
- 1.1.6-SNAPSHOT
+ 1.1.7-SNAPSHOT
../
diff --git a/dhp-workflows/dhp-aggregation/pom.xml b/dhp-workflows/dhp-aggregation/pom.xml
index 95e9578478..8d4d880b3f 100644
--- a/dhp-workflows/dhp-aggregation/pom.xml
+++ b/dhp-workflows/dhp-aggregation/pom.xml
@@ -4,7 +4,7 @@
eu.dnetlib.dhp
dhp-workflows
- 1.1.6-SNAPSHOT
+ 1.1.7-SNAPSHOT
dhp-aggregation
diff --git a/dhp-workflows/dhp-dedup-openaire/pom.xml b/dhp-workflows/dhp-dedup-openaire/pom.xml
index a4793da897..e7f2a926f4 100644
--- a/dhp-workflows/dhp-dedup-openaire/pom.xml
+++ b/dhp-workflows/dhp-dedup-openaire/pom.xml
@@ -3,7 +3,7 @@
dhp-workflows
eu.dnetlib.dhp
- 1.1.6-SNAPSHOT
+ 1.1.7-SNAPSHOT
4.0.0
dhp-dedup-openaire
diff --git a/dhp-workflows/dhp-dedup-scholexplorer/pom.xml b/dhp-workflows/dhp-dedup-scholexplorer/pom.xml
index 387952e338..e87811cd5d 100644
--- a/dhp-workflows/dhp-dedup-scholexplorer/pom.xml
+++ b/dhp-workflows/dhp-dedup-scholexplorer/pom.xml
@@ -1,10 +1,9 @@
-
+
dhp-workflows
eu.dnetlib.dhp
- 1.1.6-SNAPSHOT
+ 1.1.7-SNAPSHOT
4.0.0
diff --git a/dhp-workflows/dhp-distcp/pom.xml b/dhp-workflows/dhp-distcp/pom.xml
index c3f09b42c1..d013dd1d98 100644
--- a/dhp-workflows/dhp-distcp/pom.xml
+++ b/dhp-workflows/dhp-distcp/pom.xml
@@ -3,7 +3,7 @@
dhp-workflows
eu.dnetlib.dhp
- 1.1.6-SNAPSHOT
+ 1.1.7-SNAPSHOT
4.0.0
diff --git a/dhp-workflows/dhp-graph-mapper/derby.log b/dhp-workflows/dhp-graph-mapper/derby.log
deleted file mode 100644
index 0c6791d965..0000000000
--- a/dhp-workflows/dhp-graph-mapper/derby.log
+++ /dev/null
@@ -1,13 +0,0 @@
-----------------------------------------------------------------
-Thu Mar 26 19:43:00 CET 2020:
-Booting Derby version The Apache Software Foundation - Apache Derby - 10.12.1.1 - (1704137): instance a816c00e-0171-1827-9724-000012c70f40
-on database directory /private/var/folders/xn/nr5vdk8n1572rvrnx5890_d80000gn/T/junit3871072562876431144/junit_metastore_db with class loader org.apache.spark.sql.hive.client.IsolatedClientLoader$$anon$1@4e6b5ed4
-Loaded from file:/Users/claudio/.m2/repository/org/apache/derby/derby/10.12.1.1/derby-10.12.1.1.jar
-java.vendor=Oracle Corporation
-java.runtime.version=1.8.0_181-b13
-user.dir=/Users/claudio/workspace/git/dnet-hadoop/dhp-workflows/dhp-graph-mapper
-os.name=Mac OS X
-os.arch=x86_64
-os.version=10.15.3
-derby.system.home=null
-Database Class Loader started - derby.database.classpath=''
diff --git a/dhp-workflows/dhp-graph-mapper/pom.xml b/dhp-workflows/dhp-graph-mapper/pom.xml
index 03b6d00524..9876edc16a 100644
--- a/dhp-workflows/dhp-graph-mapper/pom.xml
+++ b/dhp-workflows/dhp-graph-mapper/pom.xml
@@ -1,10 +1,9 @@
-
+
dhp-workflows
eu.dnetlib.dhp
- 1.1.6-SNAPSHOT
+ 1.1.7-SNAPSHOT
4.0.0
diff --git a/dhp-workflows/dhp-graph-provision-scholexplorer/pom.xml b/dhp-workflows/dhp-graph-provision-scholexplorer/pom.xml
index bb41858a6f..de38a01b3f 100644
--- a/dhp-workflows/dhp-graph-provision-scholexplorer/pom.xml
+++ b/dhp-workflows/dhp-graph-provision-scholexplorer/pom.xml
@@ -1,10 +1,9 @@
-
+
dhp-workflows
eu.dnetlib.dhp
- 1.1.6-SNAPSHOT
+ 1.1.7-SNAPSHOT
4.0.0
diff --git a/dhp-workflows/dhp-graph-provision/job-override.properties b/dhp-workflows/dhp-graph-provision/job-override.properties
deleted file mode 100644
index 8230dfc18f..0000000000
--- a/dhp-workflows/dhp-graph-provision/job-override.properties
+++ /dev/null
@@ -1,14 +0,0 @@
-sparkExecutorCoresForJoining=1
-sparkDriverMemoryForJoining=10G
-sparkExecutorMemoryForJoining=15G
-sparkExecutorCoresForIndexing=64
-sparkDriverMemoryForIndexing=3G
-sparkExecutorMemoryForIndexing=2G
-#isLookupUrl=http://services.openaire.eu:8280/is/services/isLookUp
-isLookupUrl=http://beta.services.openaire.eu:8280/is/services/isLookUp?wsdl
-sourcePath=/tmp/db_openaireplus_services.export_dhp.2020.02.03
-outputPath=/tmp/openaire_provision
-format=TMF
-batchSize=2000
-reuseRecords=false
-otherDsTypeId=scholarcomminfra, infospace, pubsrepository::mock, entityregistry, entityregistry::projects, entityregistry::repositories, websource
\ No newline at end of file
diff --git a/dhp-workflows/dhp-graph-provision/pom.xml b/dhp-workflows/dhp-graph-provision/pom.xml
index ac4e01d218..baac163d27 100644
--- a/dhp-workflows/dhp-graph-provision/pom.xml
+++ b/dhp-workflows/dhp-graph-provision/pom.xml
@@ -3,7 +3,7 @@
dhp-workflows
eu.dnetlib.dhp
- 1.1.6-SNAPSHOT
+ 1.1.7-SNAPSHOT
4.0.0
diff --git a/dhp-workflows/dhp-graph-provision/src/main/java/eu/dnetlib/dhp/oa/provision/SparkXmlRecordBuilderJob.java b/dhp-workflows/dhp-graph-provision/src/main/java/eu/dnetlib/dhp/oa/provision/SparkXmlRecordBuilderJob.java
index a84cda53a6..0a898c0fcc 100644
--- a/dhp-workflows/dhp-graph-provision/src/main/java/eu/dnetlib/dhp/oa/provision/SparkXmlRecordBuilderJob.java
+++ b/dhp-workflows/dhp-graph-provision/src/main/java/eu/dnetlib/dhp/oa/provision/SparkXmlRecordBuilderJob.java
@@ -29,14 +29,9 @@ public class SparkXmlRecordBuilderJob {
final String otherDsTypeId = parser.get("otherDsTypeId");
final FileSystem fs = FileSystem.get(spark.sparkContext().hadoopConfiguration());
- if (fs.exists(new Path(outputPath))) {
- fs.delete(new Path(outputPath), true);
- fs.mkdirs(new Path(outputPath));
- }
new GraphJoiner(spark, ContextMapper.fromIS(isLookupUrl), otherDsTypeId, inputPath, outputPath)
.adjacencyLists();
- //.asXML();
}
}
diff --git a/dhp-workflows/dhp-graph-provision/src/main/java/eu/dnetlib/dhp/oa/provision/utils/TemplateResources.java b/dhp-workflows/dhp-graph-provision/src/main/java/eu/dnetlib/dhp/oa/provision/utils/TemplateResources.java
index a9086f7bc9..b22e083ce3 100644
--- a/dhp-workflows/dhp-graph-provision/src/main/java/eu/dnetlib/dhp/oa/provision/utils/TemplateResources.java
+++ b/dhp-workflows/dhp-graph-provision/src/main/java/eu/dnetlib/dhp/oa/provision/utils/TemplateResources.java
@@ -7,17 +7,17 @@ import java.nio.charset.StandardCharsets;
public class TemplateResources {
- private String record = read("eu/dnetlib/dhp/graph/template/record.st");
+ private String record = read("eu/dnetlib/dhp/oa/provision/template/record.st");
- private String instance = read("eu/dnetlib/dhp/graph/template/instance.st");
+ private String instance = read("eu/dnetlib/dhp/oa/provision/template/instance.st");
- private String rel = read("eu/dnetlib/dhp/graph/template/rel.st");
+ private String rel = read("eu/dnetlib/dhp/oa/provision/template/rel.st");
- private String webresource = read("eu/dnetlib/dhp/graph/template/webresource.st");
+ private String webresource = read("eu/dnetlib/dhp/oa/provision/template/webresource.st");
- private String child = read("eu/dnetlib/dhp/graph/template/child.st");
+ private String child = read("eu/dnetlib/dhp/oa/provision/template/child.st");
- private String entity = read("eu/dnetlib/dhp/graph/template/entity.st");
+ private String entity = read("eu/dnetlib/dhp/oa/provision/template/entity.st");
private static String read(final String classpathResource) throws IOException {
return Resources.toString(Resources.getResource(classpathResource), StandardCharsets.UTF_8);
diff --git a/dhp-workflows/dhp-graph-provision/src/main/resources/eu/dnetlib/dhp/oa/provision/oozie_app/workflow.xml b/dhp-workflows/dhp-graph-provision/src/main/resources/eu/dnetlib/dhp/oa/provision/oozie_app/workflow.xml
index 1d99831e45..a28174cce2 100644
--- a/dhp-workflows/dhp-graph-provision/src/main/resources/eu/dnetlib/dhp/oa/provision/oozie_app/workflow.xml
+++ b/dhp-workflows/dhp-graph-provision/src/main/resources/eu/dnetlib/dhp/oa/provision/oozie_app/workflow.xml
@@ -58,6 +58,10 @@
+
+
+
+
yarn
cluster
build_adjacency_lists
@@ -67,7 +71,6 @@
--executor-cores ${sparkExecutorCoresForJoining}
--executor-memory ${sparkExecutorMemoryForJoining}
--driver-memory=${sparkDriverMemoryForJoining}
- --conf spark.dynamicAllocation.maxExecutors=${sparkExecutorCoresForJoining}
--conf spark.extraListeners="com.cloudera.spark.lineage.NavigatorAppListener"
--conf spark.sql.queryExecutionListeners="com.cloudera.spark.lineage.NavigatorQueryListener"
--conf spark.yarn.historyServer.address=${spark2YarnHistoryServerAddress}
diff --git a/dhp-workflows/pom.xml b/dhp-workflows/pom.xml
index 433cf1fa9d..4b5fb4b4f6 100644
--- a/dhp-workflows/pom.xml
+++ b/dhp-workflows/pom.xml
@@ -6,7 +6,7 @@
eu.dnetlib.dhp
dhp
- 1.1.6-SNAPSHOT
+ 1.1.7-SNAPSHOT
../
diff --git a/pom.xml b/pom.xml
index 99e40b9b53..ae19ddbe51 100644
--- a/pom.xml
+++ b/pom.xml
@@ -1,11 +1,9 @@
-
+
4.0.0
eu.dnetlib.dhp
dhp
- 1.1.6-SNAPSHOT
+ 1.1.7-SNAPSHOT
pom
http://www.d-net.research-infrastructures.eu