sourcePath
the source path
outputPath
sets the outputPath
${jobTracker}
${nameNode}
oozie.action.sharelib.for.spark
${oozieActionShareLibForSpark2}
Action failed, error message[${wf:errorMessage(wf:lastErrorNode())}]
${nameNode}/${sourcePath}/relation
${nameNode}/${outputPath}/relation
${nameNode}/${sourcePath}/publication
${nameNode}/${outputPath}/publication
${nameNode}/${sourcePath}/dataset
${nameNode}/${outputPath}/dataset
${nameNode}/${sourcePath}/otherresearchproduct
${nameNode}/${outputPath}/otherresearchproduct
${nameNode}/${sourcePath}/software
${nameNode}/${outputPath}/software
${nameNode}/${sourcePath}/organization
${nameNode}/${outputPath}/organization
${nameNode}/${sourcePath}/project
${nameNode}/${outputPath}/project
${nameNode}/${sourcePath}/datasource
${nameNode}/${outputPath}/datasource
yarn
cluster
PrepareResultOrganizationAssociation
eu.dnetlib.dhp.resulttoorganizationfrominstrepo.PrepareResultInstRepoAssociation
dhp-enrichment-${projectVersion}.jar
--executor-cores=${sparkExecutorCores}
--executor-memory=${sparkExecutorMemory}
--driver-memory=${sparkDriverMemory}
--conf spark.extraListeners=${spark2ExtraListeners}
--conf spark.sql.queryExecutionListeners=${spark2SqlQueryExecutionListeners}
--conf spark.yarn.historyServer.address=${spark2YarnHistoryServerAddress}
--conf spark.eventLog.dir=${nameNode}${spark2EventLogDir}
--sourcePath${sourcePath}
--hive_metastore_uris${hive_metastore_uris}
--datasourceOrganizationPath${workingDir}/preparedInfo/datasourceOrganization
--alreadyLinkedPath${workingDir}/preparedInfo/alreadyLinked
--blacklist${blacklist}
yarn
cluster
resultToOrganizationFromInstRepoPropagationForPublications
eu.dnetlib.dhp.resulttoorganizationfrominstrepo.SparkResultToOrganizationFromIstRepoJob
dhp-enrichment-${projectVersion}.jar
--executor-cores=${sparkExecutorCores}
--executor-memory=${sparkExecutorMemory}
--driver-memory=${sparkDriverMemory}
--conf spark.extraListeners=${spark2ExtraListeners}
--conf spark.sql.queryExecutionListeners=${spark2SqlQueryExecutionListeners}
--conf spark.yarn.historyServer.address=${spark2YarnHistoryServerAddress}
--conf spark.eventLog.dir=${nameNode}${spark2EventLogDir}
--conf spark.dynamicAllocation.enabled=true
--conf spark.dynamicAllocation.maxExecutors=${spark2MaxExecutors}
--sourcePath${sourcePath}/publication
--outputPath${outputPath}/relation
--datasourceOrganizationPath${workingDir}/preparedInfo/datasourceOrganization
--alreadyLinkedPath${workingDir}/preparedInfo/alreadyLinked
--hive_metastore_uris${hive_metastore_uris}
--resultTableNameeu.dnetlib.dhp.schema.oaf.Publication
yarn
cluster
resultToOrganizationFromInstRepoPropagationForDataset
eu.dnetlib.dhp.resulttoorganizationfrominstrepo.SparkResultToOrganizationFromIstRepoJob
dhp-enrichment-${projectVersion}.jar
--executor-cores=${sparkExecutorCores}
--executor-memory=${sparkExecutorMemory}
--driver-memory=${sparkDriverMemory}
--conf spark.extraListeners=${spark2ExtraListeners}
--conf spark.sql.queryExecutionListeners=${spark2SqlQueryExecutionListeners}
--conf spark.yarn.historyServer.address=${spark2YarnHistoryServerAddress}
--conf spark.eventLog.dir=${nameNode}${spark2EventLogDir}
--conf spark.dynamicAllocation.enabled=true
--conf spark.dynamicAllocation.maxExecutors=${spark2MaxExecutors}
--sourcePath${sourcePath}/dataset
--outputPath${outputPath}/relation
--datasourceOrganizationPath${workingDir}/preparedInfo/datasourceOrganization
--alreadyLinkedPath${workingDir}/preparedInfo/alreadyLinked
--hive_metastore_uris${hive_metastore_uris}
--resultTableNameeu.dnetlib.dhp.schema.oaf.Dataset
yarn
cluster
resultToOrganizationFromInstRepoPropagationForORP
eu.dnetlib.dhp.resulttoorganizationfrominstrepo.SparkResultToOrganizationFromIstRepoJob
dhp-enrichment-${projectVersion}.jar
--executor-cores=${sparkExecutorCores}
--executor-memory=${sparkExecutorMemory}
--driver-memory=${sparkDriverMemory}
--conf spark.extraListeners=${spark2ExtraListeners}
--conf spark.sql.queryExecutionListeners=${spark2SqlQueryExecutionListeners}
--conf spark.yarn.historyServer.address=${spark2YarnHistoryServerAddress}
--conf spark.eventLog.dir=${nameNode}${spark2EventLogDir}
--conf spark.dynamicAllocation.enabled=true
--conf spark.dynamicAllocation.maxExecutors=${spark2MaxExecutors}
--sourcePath${sourcePath}/otherresearchproduct
--outputPath${outputPath}/relation
--datasourceOrganizationPath${workingDir}/preparedInfo/datasourceOrganization
--alreadyLinkedPath${workingDir}/preparedInfo/alreadyLinked
--hive_metastore_uris${hive_metastore_uris}
--resultTableNameeu.dnetlib.dhp.schema.oaf.OtherResearchProduct
yarn
cluster
resultToOrganizationFromInstRepoPropagationForSoftware
eu.dnetlib.dhp.resulttoorganizationfrominstrepo.SparkResultToOrganizationFromIstRepoJob
dhp-enrichment-${projectVersion}.jar
--executor-cores=${sparkExecutorCores}
--executor-memory=${sparkExecutorMemory}
--driver-memory=${sparkDriverMemory}
--conf spark.extraListeners=${spark2ExtraListeners}
--conf spark.sql.queryExecutionListeners=${spark2SqlQueryExecutionListeners}
--conf spark.yarn.historyServer.address=${spark2YarnHistoryServerAddress}
--conf spark.eventLog.dir=${nameNode}${spark2EventLogDir}
--conf spark.dynamicAllocation.enabled=true
--conf spark.dynamicAllocation.maxExecutors=${spark2MaxExecutors}
--sourcePath${sourcePath}/software
--outputPath${outputPath}/relation
--datasourceOrganizationPath${workingDir}/preparedInfo/datasourceOrganization
--alreadyLinkedPath${workingDir}/preparedInfo/alreadyLinked
--hive_metastore_uris${hive_metastore_uris}
--resultTableNameeu.dnetlib.dhp.schema.oaf.Software