magBasePath
The base path of MAG DUMP CSV Tables
mdStoreOutputId
the identifier of the cleaned MDStore
mdStoreManagerURI
the URI of the MDStore Manager
resume_from
generateOAF
the node from which the workflow starts (e.g. generateTable or generateOAF)
Action failed, error message[${wf:errorMessage(wf:lastErrorNode())}]
${wf:conf('resume_from') eq 'generateTable'}
yarn
cluster
Generate MAG Table
eu.dnetlib.dhp.collection.mag.SparkCreateMagDenormalizedTable
dhp-aggregation-${projectVersion}.jar
--executor-memory=${sparkExecutorMemory}
--executor-cores=${sparkExecutorCores}
--driver-memory=${sparkDriverMemory}
--conf spark.executor.memoryOverhead=2g
--conf spark.sql.shuffle.partitions=3000
--conf spark.extraListeners=${spark2ExtraListeners}
--conf spark.sql.queryExecutionListeners=${spark2SqlQueryExecutionListeners}
--conf spark.yarn.historyServer.address=${spark2YarnHistoryServerAddress}
--conf spark.eventLog.dir=${nameNode}${spark2EventLogDir}
--magBasePath${magBasePath}
--masteryarn
oozie.launcher.mapreduce.user.classpath.first
true
eu.dnetlib.dhp.aggregation.mdstore.MDStoreActionNode
--actionNEW_VERSION
--mdStoreID${mdStoreOutputId}
--mdStoreManagerURI${mdStoreManagerURI}
yarn
cluster
MAG TO OAF
eu.dnetlib.dhp.collection.mag.SparkMAGtoOAF
dhp-aggregation-${projectVersion}.jar
--executor-memory=${sparkExecutorMemory}
--executor-cores=${sparkExecutorCores}
--driver-memory=${sparkDriverMemory}
--conf spark.executor.memoryOverhead=2g
--conf spark.sql.shuffle.partitions=3000
--conf spark.extraListeners=${spark2ExtraListeners}
--conf spark.sql.queryExecutionListeners=${spark2SqlQueryExecutionListeners}
--conf spark.yarn.historyServer.address=${spark2YarnHistoryServerAddress}
--conf spark.eventLog.dir=${nameNode}${spark2EventLogDir}
--mdstoreOutputVersion${wf:actionData('StartTransaction')['mdStoreVersion']}
--magBasePath${magBasePath}
--masteryarn
oozie.launcher.mapreduce.user.classpath.first
true
eu.dnetlib.dhp.aggregation.mdstore.MDStoreActionNode
--actionCOMMIT
--namenode${nameNode}
--mdStoreVersion${wf:actionData('StartTransaction')['mdStoreVersion']}
--mdStoreManagerURI${mdStoreManagerURI}
oozie.launcher.mapreduce.user.classpath.first
true
eu.dnetlib.dhp.aggregation.mdstore.MDStoreActionNode
--actionREAD_UNLOCK
--mdStoreManagerURI${mdStoreManagerURI}
--readMDStoreId${wf:actionData('BeginRead')['mdStoreReadLockVersion']}
oozie.launcher.mapreduce.user.classpath.first
true
eu.dnetlib.dhp.aggregation.mdstore.MDStoreActionNode
--actionROLLBACK
--mdStoreVersion${wf:actionData('StartTransaction')['mdStoreVersion']}
--mdStoreManagerURI${mdStoreManagerURI}