From 6f43acda5e64ae8c87128e6612c5a4fa5e1c195f Mon Sep 17 00:00:00 2001 From: "miriam.baglioni" Date: Tue, 11 Aug 2020 15:38:20 +0200 Subject: [PATCH] added the maketar and send to zenodo step. Adjusted wf parameters --- .../graph/dump_whole/oozie_app/workflow.xml | 108 ++++++++++++------ 1 file changed, 75 insertions(+), 33 deletions(-) diff --git a/dhp-workflows/dhp-graph-mapper/src/main/resources/eu/dnetlib/dhp/oa/graph/dump_whole/oozie_app/workflow.xml b/dhp-workflows/dhp-graph-mapper/src/main/resources/eu/dnetlib/dhp/oa/graph/dump_whole/oozie_app/workflow.xml index 00d75e897..a1b984f9c 100644 --- a/dhp-workflows/dhp-graph-mapper/src/main/resources/eu/dnetlib/dhp/oa/graph/dump_whole/oozie_app/workflow.xml +++ b/dhp-workflows/dhp-graph-mapper/src/main/resources/eu/dnetlib/dhp/oa/graph/dump_whole/oozie_app/workflow.xml @@ -13,6 +13,26 @@ outputPath the output path + + accessToken + the access token used for the deposition in Zenodo + + + connectionUrl + the connection url for Zenodo + + + metadata + the metadata associated to the deposition + + + newDeposition + true if it is a brand new deposition. 
false for new version of an old deposition + + + conceptRecordId + for new version, the id of the record for the old deposition + organizationCommunityMap the organization community map @@ -97,13 +117,13 @@ - + - eu.dnetlib.dhp.oa.graph.dump.community.SaveCommunityMap + eu.dnetlib.dhp.oa.graph.dump.SaveCommunityMap --outputPath${workingDir}/communityMap --nameNode${nameNode} --isLookUpUrl${isLookUpUrl} @@ -143,8 +163,7 @@ --sourcePath${sourcePath}/publication --resultTableNameeu.dnetlib.dhp.schema.oaf.Publication --outputPath${workingDir}/result/publication - - --isLookUpUrl${isLookUpUrl} + --communityMapPath${workingDir}/communityMap @@ -170,8 +189,7 @@ --sourcePath${sourcePath}/dataset --resultTableNameeu.dnetlib.dhp.schema.oaf.Dataset --outputPath${workingDir}/result/dataset - - --isLookUpUrl${isLookUpUrl} + --communityMapPath${workingDir}/communityMap @@ -197,8 +215,7 @@ --sourcePath${sourcePath}/otherresearchproduct --resultTableNameeu.dnetlib.dhp.schema.oaf.OtherResearchProduct --outputPath${workingDir}/result/otherresearchproduct - - --isLookUpUrl${isLookUpUrl} + --communityMapPath${workingDir}/communityMap @@ -224,8 +241,7 @@ --sourcePath${sourcePath}/software --resultTableNameeu.dnetlib.dhp.schema.oaf.Software --outputPath${workingDir}/result/software - - --isLookUpUrl${isLookUpUrl} + --communityMapPath${workingDir}/communityMap @@ -250,9 +266,9 @@ --sourcePath${sourcePath}/organization --resultTableNameeu.dnetlib.dhp.schema.oaf.Organization - --outputPath${outputPath}/organization - - --isLookUpUrl${isLookUpUrl} + --outputPath${workingDir}/collect/organization + --communityMapPath${workingDir}/communityMap + @@ -277,9 +293,9 @@ --sourcePath${sourcePath}/project --resultTableNameeu.dnetlib.dhp.schema.oaf.Project - --outputPath${outputPath}/project - - --isLookUpUrl${isLookUpUrl} + --outputPath${workingDir}/collect/project + --communityMapPath${workingDir}/communityMap + @@ -304,9 +320,9 @@ --sourcePath${sourcePath}/datasource 
--resultTableNameeu.dnetlib.dhp.schema.oaf.Datasource - --outputPath${outputPath}/datasource - - --isLookUpUrl${isLookUpUrl} + --outputPath${workingDir}/collect/datasource + --communityMapPath${workingDir}/communityMap + @@ -330,7 +346,7 @@ --conf spark.sql.warehouse.dir=${sparkSqlWarehouseDir} --sourcePath${sourcePath}/relation - --outputPath${outputPath}/relation + --outputPath${workingDir}/relation/relation @@ -349,8 +365,8 @@ eu.dnetlib.dhp.oa.graph.dump.graph.CreateContextEntities - --hdfsPath${outputPath}/context - --hdfsNameNode${nameNode} + --hdfsPath${workingDir}/collect/context + --nameNode${nameNode} --isLookUpUrl${isLookUpUrl} @@ -361,7 +377,7 @@ eu.dnetlib.dhp.oa.graph.dump.graph.CreateContextRelation --hdfsPath${workingDir}/relation/context - --hdfsNameNode${nameNode} + --nameNode${nameNode} --isLookUpUrl${isLookUpUrl} @@ -424,8 +440,8 @@ --sourcePath${sourcePath}/publication --resultTableNameeu.dnetlib.dhp.schema.oaf.Publication --outputPath${workingDir}/relation/publication - - --isLookUpUrl${isLookUpUrl} + --communityMapPath${workingDir}/communityMap + @@ -451,8 +467,8 @@ --sourcePath${sourcePath}/dataset --resultTableNameeu.dnetlib.dhp.schema.oaf.Dataset --outputPath${workingDir}/relation/dataset - - --isLookUpUrl${isLookUpUrl} + --communityMapPath${workingDir}/communityMap + @@ -478,8 +494,8 @@ --sourcePath${sourcePath}/otherresearchproduct --resultTableNameeu.dnetlib.dhp.schema.oaf.OtherResearchProduct --outputPath${workingDir}/relation/orp - - --isLookUpUrl${isLookUpUrl} + --communityMapPath${workingDir}/communityMap + @@ -505,8 +521,8 @@ --sourcePath${sourcePath}/software --resultTableNameeu.dnetlib.dhp.schema.oaf.Software --outputPath${workingDir}/relation/software - - --isLookUpUrl${isLookUpUrl} + --communityMapPath${workingDir}/communityMap + @@ -533,13 +549,39 @@ --conf spark.sql.warehouse.dir=${sparkSqlWarehouseDir} --sourcePath${workingDir} - --outputPath${outputPath} + --outputPath${workingDir}/collect - + + + + + + + 
eu.dnetlib.dhp.oa.graph.dump.MakeTar + --hdfsPath${outputPath} + --nameNode${nameNode} + --sourcePath${workingDir}/collect + + + + + eu.dnetlib.dhp.oa.graph.dump.SendToZenodoHDFS + --hdfsPath${outputPath} + --nameNode${nameNode} + --accessToken${accessToken} + --connectionUrl${connectionUrl} + --metadata${metadata} + --communityMapPath${workingDir}/communityMap + --conceptRecordId${conceptRecordId} + --newDeposition${newDeposition} + + + +