Merge branch 'beta' of https://code-repo.d4science.org/D-Net/dnet-hadoop into index_records

This commit is contained in:
Claudio Atzori 2024-02-28 10:27:28 +01:00
commit 6fcf872daa
20 changed files with 8309 additions and 51 deletions

View File

@ -0,0 +1,244 @@
package eu.dnetlib.dhp.collection.orcid;
import java.io.IOException;
import java.io.InputStream;
import java.net.HttpURLConnection;
import java.net.URL;
import java.util.concurrent.BlockingQueue;
import javax.swing.*;
import org.apache.commons.io.IOUtils;
import org.apache.commons.lang3.StringUtils;
import org.apache.hadoop.io.SequenceFile;
import org.apache.hadoop.io.Text;
import org.apache.http.HttpHeaders;
import org.jetbrains.annotations.NotNull;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
import eu.dnetlib.dhp.common.collection.HttpClientParams;
public class ORCIDWorker extends Thread {
final static Logger log = LoggerFactory.getLogger(ORCIDWorker.class);
public static String JOB_COMPLETE = "JOB_COMPLETE";
private static final String userAgent = "Mozilla/5.0 (compatible; OAI; +http://www.openaire.eu)";
private final BlockingQueue<String> queue;
private boolean hasComplete = false;
private final SequenceFile.Writer employments;
private final SequenceFile.Writer summary;
private final SequenceFile.Writer works;
private final String token;
private final String id;
public static ORCIDWorkerBuilder builder() {
return new ORCIDWorkerBuilder();
}
public ORCIDWorker(String id, BlockingQueue<String> myqueue, SequenceFile.Writer employments,
SequenceFile.Writer summary, SequenceFile.Writer works, String token) {
this.id = id;
this.queue = myqueue;
this.employments = employments;
this.summary = summary;
this.works = works;
this.token = token;
}
public static String retrieveURL(final String id, final String apiUrl, String token) {
try {
final HttpURLConnection urlConn = getHttpURLConnection(apiUrl, token);
if (urlConn.getResponseCode() > 199 && urlConn.getResponseCode() < 300) {
InputStream input = urlConn.getInputStream();
return IOUtils.toString(input);
} else {
log
.error(
"Thread {} UNABLE TO DOWNLOAD FROM THIS URL {} , status code {}", id, apiUrl,
urlConn.getResponseCode());
}
} catch (Exception e) {
log.error("Thread {} Error on retrieving URL {} {}", id, apiUrl, e);
}
return null;
}
@NotNull
private static HttpURLConnection getHttpURLConnection(String apiUrl, String token) throws IOException {
final HttpURLConnection urlConn = (HttpURLConnection) new URL(apiUrl).openConnection();
final HttpClientParams clientParams = new HttpClientParams();
urlConn.setInstanceFollowRedirects(false);
urlConn.setReadTimeout(clientParams.getReadTimeOut() * 1000);
urlConn.setConnectTimeout(clientParams.getConnectTimeOut() * 1000);
urlConn.addRequestProperty(HttpHeaders.USER_AGENT, userAgent);
urlConn.addRequestProperty(HttpHeaders.AUTHORIZATION, String.format("Bearer %s", token));
return urlConn;
}
private static String generateSummaryURL(final String orcidId) {
return "https://api.orcid.org/v3.0/" + orcidId + "/record";
}
private static String generateWorksURL(final String orcidId) {
return "https://api.orcid.org/v3.0/" + orcidId + "/works";
}
private static String generateEmploymentsURL(final String orcidId) {
return "https://api.orcid.org/v3.0/" + orcidId + "/employments";
}
private static void writeResultToSequenceFile(String id, String url, String token, String orcidId,
SequenceFile.Writer file) throws IOException {
final String response = retrieveURL(id, url, token);
if (response != null) {
if (orcidId == null) {
log.error("Thread {} {} {}", id, orcidId, response);
throw new RuntimeException("null items ");
}
if (file == null) {
log.error("Thread {} file is null for {} URL:{}", id, url, orcidId);
} else {
file.append(new Text(orcidId), new Text(response));
file.hflush();
}
} else
log.error("Thread {} response is null for {} URL:{}", id, url, orcidId);
}
@Override
public void run() {
final Text key = new Text();
final Text value = new Text();
long start;
long total_time;
String orcidId = "";
int requests = 0;
if (summary == null || employments == null || works == null)
throw new RuntimeException("Null files");
while (!hasComplete) {
try {
orcidId = queue.take();
if (orcidId.equalsIgnoreCase(JOB_COMPLETE)) {
hasComplete = true;
} else {
start = System.currentTimeMillis();
writeResultToSequenceFile(id, generateSummaryURL(orcidId), token, orcidId, summary);
total_time = System.currentTimeMillis() - start;
requests++;
if (total_time < 1000) {
// I know making a sleep on a thread is bad, but we need to stay to 24 requests per seconds,
// hence
// the time between two http request in a thread must be 1 second
Thread.sleep(1000L - total_time);
}
start = System.currentTimeMillis();
writeResultToSequenceFile(id, generateWorksURL(orcidId), token, orcidId, works);
total_time = System.currentTimeMillis() - start;
requests++;
if (total_time < 1000) {
// I know making a sleep on a thread is bad, but we need to stay to 24 requests per seconds,
// hence
// the time between two http request in a thread must be 1 second
Thread.sleep(1000L - total_time);
}
start = System.currentTimeMillis();
writeResultToSequenceFile(id, generateEmploymentsURL(orcidId), token, orcidId, employments);
total_time = System.currentTimeMillis() - start;
requests++;
if (total_time < 1000) {
// I know making a sleep on a thread is bad, but we need to stay to 24 requests per seconds,
// hence
// the time between two http request in a thread must be 1 second
Thread.sleep(1000L - total_time);
}
if (requests % 30 == 0) {
log.info("Thread {} Downloaded {}", id, requests);
}
}
} catch (Throwable e) {
log.error("Thread {} Unable to save ORICD: {} item error", id, orcidId, e);
}
}
try {
works.close();
summary.close();
employments.close();
} catch (Throwable e) {
throw new RuntimeException(e);
}
log.info("Thread {} COMPLETE ", id);
log.info("Thread {} Downloaded {}", id, requests);
}
public static class ORCIDWorkerBuilder {
private String id;
private SequenceFile.Writer employments;
private SequenceFile.Writer summary;
private SequenceFile.Writer works;
private BlockingQueue<String> queue;
private String token;
public ORCIDWorkerBuilder withId(final String id) {
this.id = id;
return this;
}
public ORCIDWorkerBuilder withEmployments(final SequenceFile.Writer sequenceFile) {
this.employments = sequenceFile;
return this;
}
public ORCIDWorkerBuilder withSummary(final SequenceFile.Writer sequenceFile) {
this.summary = sequenceFile;
return this;
}
public ORCIDWorkerBuilder withWorks(final SequenceFile.Writer sequenceFile) {
this.works = sequenceFile;
return this;
}
public ORCIDWorkerBuilder withAccessToken(final String accessToken) {
this.token = accessToken;
return this;
}
public ORCIDWorkerBuilder withBlockingQueue(final BlockingQueue<String> queue) {
this.queue = queue;
return this;
}
public ORCIDWorker build() {
if (this.summary == null || this.works == null || this.employments == null || StringUtils.isEmpty(token)
|| queue == null)
throw new RuntimeException("Unable to build missing required params");
return new ORCIDWorker(id, queue, employments, summary, works, token);
}
}
}

View File

@ -0,0 +1,171 @@
package eu.dnetlib.dhp.collection.orcid;
import static eu.dnetlib.dhp.utils.DHPUtils.getHadoopConfiguration;
import java.io.*;
import java.net.HttpURLConnection;
import java.net.URL;
import java.util.ArrayList;
import java.util.List;
import java.util.Objects;
import java.util.concurrent.ArrayBlockingQueue;
import java.util.concurrent.BlockingQueue;
import org.apache.commons.compress.archivers.tar.TarArchiveEntry;
import org.apache.commons.compress.archivers.tar.TarArchiveInputStream;
import org.apache.commons.compress.compressors.gzip.GzipCompressorInputStream;
import org.apache.commons.io.IOUtils;
import org.apache.commons.lang3.StringUtils;
import org.apache.hadoop.fs.FSDataInputStream;
import org.apache.hadoop.fs.FSDataOutputStream;
import org.apache.hadoop.fs.FileSystem;
import org.apache.hadoop.fs.Path;
import org.apache.hadoop.io.SequenceFile;
import org.apache.hadoop.io.Text;
import org.apache.spark.sql.SparkSession;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
import eu.dnetlib.dhp.application.ArgumentApplicationParser;
import eu.dnetlib.dhp.common.collection.HttpClientParams;
public class OrcidGetUpdatesFile {
private static Logger log = LoggerFactory.getLogger(OrcidGetUpdatesFile.class);
public static void main(String[] args) throws Exception {
ArgumentApplicationParser parser = new ArgumentApplicationParser(
IOUtils
.toString(
Objects
.requireNonNull(
OrcidGetUpdatesFile.class
.getResourceAsStream(
"/eu/dnetlib/dhp/collection/orcid/download_orcid_update_parameter.json")))
);
parser.parseArgument(args);
final String namenode = parser.get("namenode");
log.info("got variable namenode: {}", namenode);
final String master = parser.get("master");
log.info("got variable master: {}", master);
final String targetPath = parser.get("targetPath");
log.info("got variable targetPath: {}", targetPath);
final String apiURL = parser.get("apiURL");
log.info("got variable apiURL: {}", apiURL);
final String accessToken = parser.get("accessToken");
log.info("got variable accessToken: {}", accessToken);
final String graphPath = parser.get("graphPath");
log.info("got variable graphPath: {}", graphPath);
final SparkSession spark = SparkSession
.builder()
.appName(OrcidGetUpdatesFile.class.getName())
.master(master)
.getOrCreate();
final String latestDate = spark
.read()
.load(graphPath + "/Authors")
.selectExpr("max(lastModifiedDate)")
.first()
.getString(0);
log.info("latest date is {}", latestDate);
final FileSystem fileSystem = FileSystem.get(getHadoopConfiguration(namenode));
new OrcidGetUpdatesFile().readTar(fileSystem, accessToken, apiURL, targetPath, latestDate);
}
private SequenceFile.Writer createFile(Path aPath, FileSystem fileSystem) throws IOException {
return SequenceFile
.createWriter(
fileSystem.getConf(),
SequenceFile.Writer.file(aPath),
SequenceFile.Writer.keyClass(Text.class),
SequenceFile.Writer.valueClass(Text.class));
}
private ORCIDWorker createWorker(final String id, final String targetPath, final BlockingQueue<String> queue,
final String accessToken, FileSystem fileSystem) throws Exception {
return ORCIDWorker
.builder()
.withId(id)
.withEmployments(createFile(new Path(String.format("%s/employments_%s", targetPath, id)), fileSystem))
.withSummary(createFile(new Path(String.format("%s/summary_%s", targetPath, id)), fileSystem))
.withWorks(createFile(new Path(String.format("%s/works_%s", targetPath, id)), fileSystem))
.withAccessToken(accessToken)
.withBlockingQueue(queue)
.build();
}
public void readTar(FileSystem fileSystem, final String accessToken, final String apiURL, final String targetPath,
final String startDate) throws Exception {
final HttpURLConnection urlConn = (HttpURLConnection) new URL(apiURL).openConnection();
final HttpClientParams clientParams = new HttpClientParams();
urlConn.setInstanceFollowRedirects(false);
urlConn.setReadTimeout(clientParams.getReadTimeOut() * 1000);
urlConn.setConnectTimeout(clientParams.getConnectTimeOut() * 1000);
if (urlConn.getResponseCode() > 199 && urlConn.getResponseCode() < 300) {
InputStream input = urlConn.getInputStream();
Path hdfsWritePath = new Path("/tmp/orcid_updates.tar.gz");
final FSDataOutputStream fsDataOutputStream = fileSystem.create(hdfsWritePath, true);
IOUtils.copy(input, fsDataOutputStream);
fsDataOutputStream.flush();
fsDataOutputStream.close();
FSDataInputStream updateFile = fileSystem.open(hdfsWritePath);
TarArchiveInputStream tais = new TarArchiveInputStream(new GzipCompressorInputStream(
new BufferedInputStream(
updateFile.getWrappedStream())));
TarArchiveEntry entry;
BlockingQueue<String> queue = new ArrayBlockingQueue<String>(3000);
final List<ORCIDWorker> workers = new ArrayList<>();
for (int i = 0; i < 22; i++) {
workers.add(createWorker("" + i, targetPath, queue, accessToken, fileSystem));
}
workers.forEach(Thread::start);
while ((entry = tais.getNextTarEntry()) != null) {
if (entry.isFile()) {
BufferedReader br = new BufferedReader(new InputStreamReader(tais));
System.out.println(br.readLine());
br
.lines()
.map(l -> l.split(","))
.filter(s -> StringUtils.compare(s[3].substring(0, 10), startDate) > 0)
.map(s -> s[0])
.forEach(s -> {
try {
queue.put(s);
} catch (InterruptedException e) {
throw new RuntimeException(e);
}
});
}
}
for (int i = 0; i < 22; i++) {
queue.put(ORCIDWorker.JOB_COMPLETE);
}
for (ORCIDWorker worker : workers) {
worker.join();
}
}
}
}

View File

@ -1,11 +1,15 @@
package eu.dnetlib.dhp.collection.orcid;
import java.util.Arrays;
import java.util.Collections;
import java.util.List;
import java.util.*;
import java.util.stream.Collectors;
import org.apache.commons.lang3.StringUtils;
import org.dom4j.Document;
import org.dom4j.DocumentFactory;
import org.dom4j.DocumentHelper;
import org.dom4j.Node;
import org.jetbrains.annotations.NotNull;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
@ -40,8 +44,8 @@ public class OrcidParser {
private static final String NS_ERROR = "error";
private static final String NS_HISTORY = "history";
private static final String NS_HISTORY_URL = "http://www.orcid.org/ns/history";
private static final String NS_BULK_URL = "http://www.orcid.org/ns/bulk";
private static final String NS_BULK = "bulk";
private static final String NS_EMPLOYMENT = "employment";
private static final String NS_EMPLOYMENT_URL = "http://www.orcid.org/ns/employment";
private static final String NS_EXTERNAL = "external-identifier";
private static final String NS_EXTERNAL_URL = "http://www.orcid.org/ns/external-identifier";
@ -61,6 +65,7 @@ public class OrcidParser {
ap.declareXPathNameSpace(NS_WORK, NS_WORK_URL);
ap.declareXPathNameSpace(NS_EXTERNAL, NS_EXTERNAL_URL);
ap.declareXPathNameSpace(NS_ACTIVITIES, NS_ACTIVITIES_URL);
ap.declareXPathNameSpace(NS_EMPLOYMENT, NS_EMPLOYMENT_URL);
}
public Author parseSummary(final String xml) {
@ -70,13 +75,15 @@ public class OrcidParser {
generateParsedDocument(xml);
List<VtdUtilityParser.Node> recordNodes = VtdUtilityParser
.getTextValuesWithAttributes(
ap, vn, "//record:record", Arrays.asList("path"));
ap, vn, "//record:record", Collections.singletonList("path"));
if (!recordNodes.isEmpty()) {
final String oid = (recordNodes.get(0).getAttributes().get("path")).substring(1);
author.setOrcid(oid);
} else {
return null;
}
final String ltm = VtdUtilityParser.getSingleValue(ap, vn, "//common:last-modified-date");
author.setLastModifiedDate(ltm);
List<VtdUtilityParser.Node> personNodes = VtdUtilityParser
.getTextValuesWithAttributes(
ap, vn, "//person:name", Arrays.asList("visibility"));
@ -129,6 +136,64 @@ public class OrcidParser {
}
}
public List<Work> parseWorks(final String xml) {
try {
String oid;
generateParsedDocument(xml);
List<VtdUtilityParser.Node> workNodes = VtdUtilityParser
.getTextValuesWithAttributes(ap, vn, "//activities:works", Arrays.asList("path", "visibility"));
if (!workNodes.isEmpty()) {
oid = (workNodes.get(0).getAttributes().get("path")).split("/")[1];
} else {
return null;
}
final List<Work> works = new ArrayList<>();
ap.selectXPath("//work:work-summary");
while (ap.evalXPath() != -1) {
final Work work = new Work();
work.setOrcid(oid);
final AutoPilot ap1 = new AutoPilot(ap.getNav());
ap1.selectXPath("./work:title/common:title");
while (ap1.evalXPath() != -1) {
int it = vn.getText();
work.setTitle(vn.toNormalizedString(it));
}
ap1.selectXPath(".//common:external-id");
while (ap1.evalXPath() != -1) {
final Pid pid = new Pid();
final AutoPilot ap2 = new AutoPilot(ap1.getNav());
ap2.selectXPath("./common:external-id-type");
while (ap2.evalXPath() != -1) {
int it = vn.getText();
pid.setSchema(vn.toNormalizedString(it));
}
ap2.selectXPath("./common:external-id-value");
while (ap2.evalXPath() != -1) {
int it = vn.getText();
pid.setValue(vn.toNormalizedString(it));
}
work.addPid(pid);
}
works.add(work);
}
return works;
} catch (Throwable e) {
log.error("Error on parsing {}", xml);
log.error(e.getMessage());
return null;
}
}
public Work parseWork(final String xml) {
try {
@ -176,11 +241,15 @@ public class OrcidParser {
}
private String extractEmploymentDate(final String xpath) throws Exception {
return extractEmploymentDate(xpath, ap);
}
ap.selectXPath(xpath);
private String extractEmploymentDate(final String xpath, AutoPilot pp) throws Exception {
pp.selectXPath(xpath);
StringBuilder sb = new StringBuilder();
while (ap.evalXPath() != -1) {
final AutoPilot ap1 = new AutoPilot(ap.getNav());
while (pp.evalXPath() != -1) {
final AutoPilot ap1 = new AutoPilot(pp.getNav());
ap1.selectXPath("./common:year");
while (ap1.evalXPath() != -1) {
int it = vn.getText();
@ -203,6 +272,104 @@ public class OrcidParser {
}
public List<Employment> parseEmployments(final String xml) {
try {
String oid;
Map<String, String> nsContext = getNameSpaceMap();
DocumentFactory.getInstance().setXPathNamespaceURIs(nsContext);
Document doc = DocumentHelper.parseText(xml);
oid = doc.valueOf("//activities:employments/@path");
if (oid == null || StringUtils.isEmpty(oid))
return null;
final String orcid = oid.split("/")[1];
List<Node> nodes = doc.selectNodes("//employment:employment-summary");
return nodes.stream().map(n -> {
final Employment e = new Employment();
e.setOrcid(orcid);
final String depName = n.valueOf(".//common:department-name");
if (StringUtils.isNotBlank(depName))
e.setDepartmentName(depName);
final String roleTitle = n.valueOf(".//common:role-title");
e.setRoleTitle(roleTitle);
final String organizationName = n.valueOf(".//common:organization/common:name");
if (StringUtils.isEmpty(e.getDepartmentName()))
e.setDepartmentName(organizationName);
final Pid p = new Pid();
final String pid = n
.valueOf(
"./common:organization/common:disambiguated-organization/common:disambiguated-organization-identifier");
p.setValue(pid);
final String pidType = n
.valueOf("./common:organization/common:disambiguated-organization/common:disambiguation-source");
p.setSchema(pidType);
e.setAffiliationId(p);
final StringBuilder aDate = new StringBuilder();
final String sy = n.valueOf("./common:start-date/common:year");
if (StringUtils.isNotBlank(sy)) {
aDate.append(sy);
final String sm = n.valueOf("./common:start-date/common:month");
final String sd = n.valueOf("./common:start-date/common:day");
aDate.append("-");
if (StringUtils.isNotBlank(sm))
aDate.append(sm);
else
aDate.append("01");
aDate.append("-");
if (StringUtils.isNotBlank(sd))
aDate.append(sd);
else
aDate.append("01");
e.setEndDate(aDate.toString());
}
final String ey = n.valueOf("./common:end-date/common:year");
if (StringUtils.isNotBlank(ey)) {
aDate.append(ey);
final String em = n.valueOf("./common:end-date/common:month");
final String ed = n.valueOf("./common:end-date/common:day");
aDate.append("-");
if (StringUtils.isNotBlank(em))
aDate.append(em);
else
aDate.append("01");
aDate.append("-");
if (StringUtils.isNotBlank(ed))
aDate.append(ed);
else
aDate.append("01");
e.setEndDate(aDate.toString());
}
return e;
}).collect(Collectors.toList());
} catch (Throwable e) {
log.error("Error on parsing {}", xml);
log.error(e.getMessage());
return null;
}
}
@NotNull
private static Map<String, String> getNameSpaceMap() {
Map<String, String> nsContext = new HashMap<>();
nsContext.put(NS_COMMON, NS_COMMON_URL);
nsContext.put(NS_PERSON, NS_PERSON_URL);
nsContext.put(NS_DETAILS, NS_DETAILS_URL);
nsContext.put(NS_OTHER, NS_OTHER_URL);
nsContext.put(NS_RECORD, NS_RECORD_URL);
nsContext.put(NS_ERROR, NS_ERROR_URL);
nsContext.put(NS_HISTORY, NS_HISTORY_URL);
nsContext.put(NS_WORK, NS_WORK_URL);
nsContext.put(NS_EXTERNAL, NS_EXTERNAL_URL);
nsContext.put(NS_ACTIVITIES, NS_ACTIVITIES_URL);
nsContext.put(NS_EMPLOYMENT, NS_EMPLOYMENT_URL);
return nsContext;
}
public Employment parseEmployment(final String xml) {
try {
final Employment employment = new Employment();

View File

@ -18,6 +18,8 @@ public class Author extends ORCIDItem {
private String biography;
private String lastModifiedDate;
public String getBiography() {
return biography;
}
@ -74,6 +76,14 @@ public class Author extends ORCIDItem {
this.otherPids = otherPids;
}
public String getLastModifiedDate() {
return lastModifiedDate;
}
public void setLastModifiedDate(String lastModifiedDate) {
this.lastModifiedDate = lastModifiedDate;
}
public void addOtherPid(final Pid pid) {
if (otherPids == null)

View File

@ -0,0 +1,26 @@
[
{
"paramName": "m",
"paramLongName": "master",
"paramDescription": "the master name",
"paramRequired": true
},
{
"paramName": "t",
"paramLongName": "targetPath",
"paramDescription": "the target PATH of the DF tables",
"paramRequired": true
},
{
"paramName": "g",
"paramLongName": "graphPath",
"paramDescription": "the PATH of the current graph path",
"paramRequired": true
},
{
"paramName": "u",
"paramLongName": "updatePath",
"paramDescription": "the PATH of the current graph update path",
"paramRequired": true
}
]

View File

@ -0,0 +1,37 @@
[ {
"paramName": "n",
"paramLongName": "namenode",
"paramDescription": "the Name Node URI",
"paramRequired": true
},
{
"paramName": "m",
"paramLongName": "master",
"paramDescription": "the master name",
"paramRequired": true
},
{
"paramName": "t",
"paramLongName": "targetPath",
"paramDescription": "the target PATH where download the files",
"paramRequired": true
},
{
"paramName": "a",
"paramLongName": "apiURL",
"paramDescription": "the URL to download the tar file",
"paramRequired": true
},
{
"paramName": "g",
"paramLongName": "graphPath",
"paramDescription": "the path of the input graph",
"paramRequired": true
},
{
"paramName": "at",
"paramLongName": "accessToken",
"paramDescription": "the accessToken to contact API",
"paramRequired": true
}
]

View File

@ -16,6 +16,12 @@
"paramLongName": "sourcePath",
"paramDescription": "the PATH of the ORCID sequence file",
"paramRequired": true
},
{
"paramName": "fu",
"paramLongName": "fromUpdate",
"paramDescription": "whether we have to generate table from dump or from update",
"paramRequired": false
}
]

View File

@ -0,0 +1,23 @@
<configuration>
<property>
<name>jobTracker</name>
<value>yarnRM</value>
</property>
<property>
<name>nameNode</name>
<value>hdfs://nameservice1</value>
</property>
<property>
<name>oozie.use.system.libpath</name>
<value>true</value>
</property>
<property>
<name>oozie.action.sharelib.for.spark</name>
<value>spark2</value>
</property>
<property>
<name>oozie.launcher.mapreduce.user.classpath.first</name>
<value>true</value>
</property>
</configuration>

View File

@ -0,0 +1,114 @@
<workflow-app name="download_Update_ORCID" xmlns="uri:oozie:workflow:0.5">
<parameters>
<property>
<name>graphPath</name>
<description>the path to store the original ORCID dump</description>
</property>
<property>
<name>targetPath</name>
<description>the path to store the original ORCID dump</description>
</property>
<property>
<name>apiURL</name>
<value>http://74804fb637bd8e2fba5b-e0a029c2f87486cddec3b416996a6057.r3.cf1.rackcdn.com/last_modified.csv.tar</value>
<description>The URL of the update CSV list </description>
</property>
<property>
<name>accessToken</name>
<description>The access token</description>
</property>
</parameters>
<start to="startUpdate"/>
<kill name="Kill">
<message>Action failed, error message[${wf:errorMessage(wf:lastErrorNode())}]</message>
</kill>
<action name="startUpdate">
<spark xmlns="uri:oozie:spark-action:0.2">
<master>yarn</master>
<mode>cluster</mode>
<name>Check Latest Orcid and Download updates</name>
<class>eu.dnetlib.dhp.collection.orcid.OrcidGetUpdatesFile</class>
<jar>dhp-aggregation-${projectVersion}.jar</jar>
<spark-opts>
--executor-memory=${sparkExecutorMemory}
--executor-cores=${sparkExecutorCores}
--driver-memory=${sparkDriverMemory}
--conf spark.executor.memoryOverhead=2g
--conf spark.sql.shuffle.partitions=3000
--conf spark.extraListeners=${spark2ExtraListeners}
--conf spark.sql.queryExecutionListeners=${spark2SqlQueryExecutionListeners}
--conf spark.yarn.historyServer.address=${spark2YarnHistoryServerAddress}
--conf spark.eventLog.dir=${nameNode}${spark2EventLogDir}
</spark-opts>
<arg>--master</arg><arg>yarn</arg>
<arg>--namenode</arg><arg>${nameNode}</arg>
<arg>--graphPath</arg><arg>${graphPath}</arg>
<arg>--targetPath</arg><arg>${targetPath}</arg>
<arg>--apiURL</arg><arg>${apiURL}</arg>
<arg>--accessToken</arg><arg>${accessToken}</arg>
</spark>
<ok to="generateTables"/>
<error to="Kill"/>
</action>
<action name="generateTables">
<spark xmlns="uri:oozie:spark-action:0.2">
<master>yarn</master>
<mode>cluster</mode>
<name>Generate ORCID Tables</name>
<class>eu.dnetlib.dhp.collection.orcid.SparkGenerateORCIDTable</class>
<jar>dhp-aggregation-${projectVersion}.jar</jar>
<spark-opts>
--executor-memory=${sparkExecutorMemory}
--executor-cores=${sparkExecutorCores}
--driver-memory=${sparkDriverMemory}
--conf spark.executor.memoryOverhead=2g
--conf spark.sql.shuffle.partitions=3000
--conf spark.extraListeners=${spark2ExtraListeners}
--conf spark.sql.queryExecutionListeners=${spark2SqlQueryExecutionListeners}
--conf spark.yarn.historyServer.address=${spark2YarnHistoryServerAddress}
--conf spark.eventLog.dir=${nameNode}${spark2EventLogDir}
</spark-opts>
<arg>--sourcePath</arg><arg>${targetPath}</arg>
<arg>--targetPath</arg><arg>${targetPath}/updateTable</arg>
<arg>--fromUpdate</arg><arg>true</arg>
<arg>--master</arg><arg>yarn</arg>
</spark>
<ok to="updateTable"/>
<error to="Kill"/>
</action>
<action name="updateTable">
<spark xmlns="uri:oozie:spark-action:0.2">
<master>yarn</master>
<mode>cluster</mode>
<name>Update ORCID Tables</name>
<class>eu.dnetlib.dhp.collection.orcid.SparkApplyUpdate</class>
<jar>dhp-aggregation-${projectVersion}.jar</jar>
<spark-opts>
--executor-memory=${sparkExecutorMemory}
--executor-cores=${sparkExecutorCores}
--driver-memory=${sparkDriverMemory}
--conf spark.executor.memoryOverhead=2g
--conf spark.sql.shuffle.partitions=3000
--conf spark.extraListeners=${spark2ExtraListeners}
--conf spark.sql.queryExecutionListeners=${spark2SqlQueryExecutionListeners}
--conf spark.yarn.historyServer.address=${spark2YarnHistoryServerAddress}
--conf spark.eventLog.dir=${nameNode}${spark2EventLogDir}
</spark-opts>
<arg>--graphPath</arg><arg>${graphPath}</arg>
<arg>--updatePath</arg><arg>${targetPath}/updateTable</arg>
<arg>--targetPath</arg><arg>${targetPath}/newTable</arg>
<arg>--master</arg><arg>yarn</arg>
</spark>
<ok to="End"/>
<error to="Kill"/>
</action>
<end name="End"/>
</workflow-app>

View File

@ -0,0 +1,120 @@
package eu.dnetlib.dhp.collection.orcid
import eu.dnetlib.dhp.application.AbstractScalaApplication
import org.apache.spark.sql.{DataFrame, SaveMode, SparkSession}
import org.slf4j.{Logger, LoggerFactory}
class SparkApplyUpdate(propertyPath: String, args: Array[String], log: Logger)
extends AbstractScalaApplication(propertyPath, args, log: Logger) {
/** Here all the spark applications runs this method
* where the whole logic of the spark node is defined
*/
override def run(): Unit = {
val graphPath: String = parser.get("graphPath")
log.info("found parameters graphPath: {}", graphPath)
val updatePath: String = parser.get("updatePath")
log.info("found parameters updatePath: {}", updatePath)
val targetPath: String = parser.get("targetPath")
log.info("found parameters targetPath: {}", targetPath)
applyTableUpdate(spark, graphPath, updatePath, targetPath)
checkUpdate(spark, graphPath, targetPath)
moveTable(spark, graphPath, targetPath)
}
private def moveTable(spark: SparkSession, graphPath: String, updatePath: String): Unit = {
spark.read
.load(s"$updatePath/Authors")
.repartition(1000)
.write
.mode(SaveMode.Overwrite)
.save(s"$graphPath/Authors")
spark.read
.load(s"$updatePath/Works")
.repartition(1000)
.write
.mode(SaveMode.Overwrite)
.save(s"$graphPath/Works")
spark.read
.load(s"$updatePath/Employments")
.repartition(1000)
.write
.mode(SaveMode.Overwrite)
.save(s"$graphPath/Employments")
}
private def updateDataset(
inputDataset: DataFrame,
idUpdate: DataFrame,
updateDataframe: DataFrame,
targetPath: String
): Unit = {
inputDataset
.join(idUpdate, inputDataset("orcid").equalTo(idUpdate("orcid")), "leftanti")
.select(inputDataset("*"))
.unionByName(updateDataframe)
.write
.mode(SaveMode.Overwrite)
.save(targetPath)
}
private def checkUpdate(spark: SparkSession, graphPath: String, updatePath: String): Unit = {
val totalOriginalAuthors = spark.read.load(s"$graphPath/Authors").count
val totalOriginalWorks = spark.read.load(s"$graphPath/Works").count
val totalOriginalEmployments = spark.read.load(s"$graphPath/Employments").count
val totalUpdateAuthors = spark.read.load(s"$updatePath/Authors").count
val totalUpdateWorks = spark.read.load(s"$updatePath/Works").count
val totalUpdateEmployments = spark.read.load(s"$updatePath/Employments").count
log.info("totalOriginalAuthors: {}", totalOriginalAuthors)
log.info("totalOriginalWorks: {}", totalOriginalWorks)
log.info("totalOriginalEmployments: {}", totalOriginalEmployments)
log.info("totalUpdateAuthors: {}", totalUpdateAuthors)
log.info("totalUpdateWorks: {}", totalUpdateWorks)
log.info("totalUpdateEmployments: {}", totalUpdateEmployments)
if (
totalUpdateAuthors < totalOriginalAuthors || totalUpdateEmployments < totalOriginalEmployments || totalUpdateWorks < totalOriginalWorks
)
throw new RuntimeException("The updated Graph contains less elements of the original one")
}
private def applyTableUpdate(spark: SparkSession, graphPath: String, updatePath: String, targetPath: String): Unit = {
val orcidIDUpdate = spark.read.load(s"$updatePath/Authors").select("orcid")
updateDataset(
spark.read.load(s"$graphPath/Authors"),
orcidIDUpdate,
spark.read.load(s"$updatePath/Authors"),
s"$targetPath/Authors"
)
updateDataset(
spark.read.load(s"$graphPath/Employments"),
orcidIDUpdate,
spark.read.load(s"$updatePath/Employments"),
s"$targetPath/Employments"
)
updateDataset(
spark.read.load(s"$graphPath/Works"),
orcidIDUpdate,
spark.read.load(s"$updatePath/Works"),
s"$targetPath/Works"
)
}
}
object SparkApplyUpdate {
val log: Logger = LoggerFactory.getLogger(SparkGenerateORCIDTable.getClass)
def main(args: Array[String]): Unit = {
new SparkApplyUpdate("/eu/dnetlib/dhp/collection/orcid/apply_orcid_table_parameter.json", args, log)
.initialize()
.run()
}
}

View File

@ -6,6 +6,7 @@ import org.apache.hadoop.io.Text
import org.apache.spark.SparkContext
import org.apache.spark.sql.{Encoder, Encoders, SaveMode, SparkSession}
import org.slf4j.{Logger, LoggerFactory}
import scala.collection.JavaConverters._
class SparkGenerateORCIDTable(propertyPath: String, args: Array[String], log: Logger)
extends AbstractScalaApplication(propertyPath, args, log: Logger) {
@ -18,12 +19,16 @@ class SparkGenerateORCIDTable(propertyPath: String, args: Array[String], log: Lo
log.info("found parameters sourcePath: {}", sourcePath)
val targetPath: String = parser.get("targetPath")
log.info("found parameters targetPath: {}", targetPath)
extractORCIDTable(spark, sourcePath, targetPath)
extractORCIDEmploymentsTable(spark, sourcePath, targetPath)
extractORCIDWorksTable(spark, sourcePath, targetPath)
val fromUpdate = "true".equals(parser.get("fromUpdate"))
val sourceSummaryPath = if (fromUpdate) s"$sourcePath/summary*" else sourcePath
val sourceEmploymentsPath = if (fromUpdate) s"$sourcePath/employments*" else sourcePath
val sourceWorksPath = if (fromUpdate) s"$sourcePath/works*" else sourcePath
extractORCIDTable(spark, sourceSummaryPath, targetPath, fromUpdate)
extractORCIDEmploymentsTable(spark, sourceEmploymentsPath, targetPath, fromUpdate)
extractORCIDWorksTable(spark, sourceWorksPath, targetPath, fromUpdate)
}
def extractORCIDTable(spark: SparkSession, sourcePath: String, targetPath: String): Unit = {
def extractORCIDTable(spark: SparkSession, sourcePath: String, targetPath: String, skipFilterByKey: Boolean): Unit = {
val sc: SparkContext = spark.sparkContext
import spark.implicits._
val df = sc
@ -32,8 +37,8 @@ class SparkGenerateORCIDTable(propertyPath: String, args: Array[String], log: Lo
.toDF
.as[(String, String)]
implicit val orcidAuthor: Encoder[Author] = Encoders.bean(classOf[Author])
// implicit val orcidPID:Encoder[Pid] = Encoders.bean(classOf[Pid])
df.filter(r => r._1.contains("summaries"))
val newDf = if (!skipFilterByKey) df.filter(r => r._1.contains("summaries")) else df
newDf
.map { r =>
val p = new OrcidParser
p.parseSummary(r._2)
@ -44,7 +49,12 @@ class SparkGenerateORCIDTable(propertyPath: String, args: Array[String], log: Lo
.save(s"$targetPath/Authors")
}
def extractORCIDWorksTable(spark: SparkSession, sourcePath: String, targetPath: String): Unit = {
def extractORCIDWorksTable(
spark: SparkSession,
sourcePath: String,
targetPath: String,
skipFilterByKey: Boolean
): Unit = {
val sc: SparkContext = spark.sparkContext
import spark.implicits._
val df = sc
@ -53,7 +63,19 @@ class SparkGenerateORCIDTable(propertyPath: String, args: Array[String], log: Lo
.toDF
.as[(String, String)]
implicit val orcidWorkAuthor: Encoder[Work] = Encoders.bean(classOf[Work])
implicit val orcidPID: Encoder[Pid] = Encoders.bean(classOf[Pid])
//We are in the case of parsing ORCID UPDATE
if (skipFilterByKey) {
df.flatMap { r =>
val p = new OrcidParser
p.parseWorks(r._2).asScala
}.filter(p => p != null)
.write
.mode(SaveMode.Overwrite)
.save(s"$targetPath/Works")
}
//We are in the case of parsing ORCID DUMP
else {
df.filter(r => r._1.contains("works"))
.map { r =>
val p = new OrcidParser
@ -64,8 +86,14 @@ class SparkGenerateORCIDTable(propertyPath: String, args: Array[String], log: Lo
.mode(SaveMode.Overwrite)
.save(s"$targetPath/Works")
}
}
def extractORCIDEmploymentsTable(spark: SparkSession, sourcePath: String, targetPath: String): Unit = {
def extractORCIDEmploymentsTable(
spark: SparkSession,
sourcePath: String,
targetPath: String,
skipFilterByKey: Boolean
): Unit = {
val sc: SparkContext = spark.sparkContext
import spark.implicits._
val df = sc
@ -74,7 +102,17 @@ class SparkGenerateORCIDTable(propertyPath: String, args: Array[String], log: Lo
.toDF
.as[(String, String)]
implicit val orcidEmploymentAuthor: Encoder[Employment] = Encoders.bean(classOf[Employment])
implicit val orcidPID: Encoder[Pid] = Encoders.bean(classOf[Pid])
if (skipFilterByKey) {
df.flatMap { r =>
val p = new OrcidParser
p.parseEmployments(r._2).asScala
}.filter(p => p != null)
.write
.mode(SaveMode.Overwrite)
.save(s"$targetPath/Employments")
}
//We are in the case of parsing ORCID DUMP
else {
df.filter(r => r._1.contains("employments"))
.map { r =>
val p = new OrcidParser
@ -85,6 +123,7 @@ class SparkGenerateORCIDTable(propertyPath: String, args: Array[String], log: Lo
.mode(SaveMode.Overwrite)
.save(s"$targetPath/Employments")
}
}
}
object SparkGenerateORCIDTable {

View File

@ -2,6 +2,7 @@
package eu.dnetlib.dhp.collection.orcid;
import java.io.IOException;
import java.net.URI;
import java.util.Arrays;
import java.util.List;
import java.util.Objects;
@ -9,7 +10,12 @@ import java.util.Objects;
import org.apache.commons.io.IOUtils;
import org.apache.hadoop.conf.Configuration;
import org.apache.hadoop.fs.FileSystem;
import org.apache.hadoop.fs.LocalFileSystem;
import org.apache.hadoop.fs.Path;
import org.apache.hadoop.io.SequenceFile;
import org.apache.hadoop.io.Text;
import org.apache.hadoop.io.compress.CompressionCodec;
import org.apache.hadoop.io.compress.CompressionCodecFactory;
import org.apache.spark.SparkContext;
import org.apache.spark.api.java.JavaSparkContext;
import org.apache.spark.sql.Encoders;
@ -27,6 +33,7 @@ import com.ximpleware.XPathParseException;
import eu.dnetlib.dhp.collection.orcid.model.Author;
import eu.dnetlib.dhp.collection.orcid.model.ORCIDItem;
import eu.dnetlib.dhp.collection.orcid.model.Work;
import eu.dnetlib.dhp.parser.utility.VtdException;
public class DownloadORCIDTest {
@ -82,6 +89,34 @@ public class DownloadORCIDTest {
});
}
@Test
public void testParsingOrcidUpdateEmployments() throws Exception {
final String xml = IOUtils
.toString(
Objects
.requireNonNull(
getClass().getResourceAsStream("/eu/dnetlib/dhp/collection/orcid/update_employments.xml")));
final OrcidParser parser = new OrcidParser();
final ObjectMapper mapper = new ObjectMapper();
System.out.println(mapper.writeValueAsString(parser.parseEmployments(xml)));
}
@Test
public void testParsingOrcidUpdateWorks() throws Exception {
final String xml = IOUtils
.toString(
Objects
.requireNonNull(
getClass().getResourceAsStream("/eu/dnetlib/dhp/collection/orcid/update_work.xml")));
final OrcidParser parser = new OrcidParser();
final List<Work> works = parser.parseWorks(xml);
final ObjectMapper mapper = new ObjectMapper();
System.out.println(mapper.writeValueAsString(works));
}
@Test
public void testParsingEmployments() throws Exception {

View File

@ -0,0 +1,966 @@
<record:record path="/0000-0001-6816-8350" xmlns:internal="http://www.orcid.org/ns/internal" xmlns:education="http://www.orcid.org/ns/education" xmlns:distinction="http://www.orcid.org/ns/distinction" xmlns:deprecated="http://www.orcid.org/ns/deprecated" xmlns:other-name="http://www.orcid.org/ns/other-name" xmlns:membership="http://www.orcid.org/ns/membership" xmlns:error="http://www.orcid.org/ns/error" xmlns:common="http://www.orcid.org/ns/common" xmlns:record="http://www.orcid.org/ns/record" xmlns:personal-details="http://www.orcid.org/ns/personal-details" xmlns:keyword="http://www.orcid.org/ns/keyword" xmlns:email="http://www.orcid.org/ns/email" xmlns:external-identifier="http://www.orcid.org/ns/external-identifier" xmlns:funding="http://www.orcid.org/ns/funding" xmlns:preferences="http://www.orcid.org/ns/preferences" xmlns:address="http://www.orcid.org/ns/address" xmlns:invited-position="http://www.orcid.org/ns/invited-position" xmlns:work="http://www.orcid.org/ns/work" xmlns:history="http://www.orcid.org/ns/history" xmlns:employment="http://www.orcid.org/ns/employment" xmlns:qualification="http://www.orcid.org/ns/qualification" xmlns:service="http://www.orcid.org/ns/service" xmlns:person="http://www.orcid.org/ns/person" xmlns:activities="http://www.orcid.org/ns/activities" xmlns:researcher-url="http://www.orcid.org/ns/researcher-url" xmlns:peer-review="http://www.orcid.org/ns/peer-review" xmlns:bulk="http://www.orcid.org/ns/bulk" xmlns:research-resource="http://www.orcid.org/ns/research-resource">
<common:orcid-identifier>
<common:uri>https://orcid.org/0000-0001-6816-8350</common:uri>
<common:path>0000-0001-6816-8350</common:path>
<common:host>orcid.org</common:host>
</common:orcid-identifier>
<preferences:preferences>
<preferences:locale>en</preferences:locale>
</preferences:preferences>
<history:history>
<history:creation-method>Direct</history:creation-method>
<history:submission-date>2016-01-06T05:08:45.720Z</history:submission-date>
<common:last-modified-date>2024-01-02T20:07:05.186Z</common:last-modified-date>
<history:claimed>true</history:claimed>
<history:verified-email>true</history:verified-email>
<history:verified-primary-email>true</history:verified-primary-email>
</history:history>
<person:person path="/0000-0001-6816-8350/person">
<common:last-modified-date>2023-12-02T13:32:05.269Z</common:last-modified-date>
<other-name:other-names path="/0000-0001-6816-8350/other-names"/>
<researcher-url:researcher-urls path="/0000-0001-6816-8350/researcher-urls">
<common:last-modified-date>2016-02-09T09:18:18.417Z</common:last-modified-date>
<researcher-url:researcher-url put-code="633431" visibility="public" path="/0000-0001-6816-8350/researcher-urls/633431" display-index="0">
<common:created-date>2016-02-09T09:18:18.416Z</common:created-date>
<common:last-modified-date>2016-02-09T09:18:18.417Z</common:last-modified-date>
<common:source>
<common:source-orcid>
<common:uri>https://orcid.org/0000-0001-6816-8350</common:uri>
<common:path>0000-0001-6816-8350</common:path>
<common:host>orcid.org</common:host>
</common:source-orcid>
</common:source>
<researcher-url:url-name>Dr Michael Muchiri</researcher-url:url-name>
<researcher-url:url>http://www.rmit.edu.au/contact/staff-contacts/academic-staff/m/muchiri-dr-michael</researcher-url:url>
</researcher-url:researcher-url>
</researcher-url:researcher-urls>
<email:emails path="/0000-0001-6816-8350/email"/>
<address:addresses path="/0000-0001-6816-8350/address">
<common:last-modified-date>2023-12-02T13:32:05.269Z</common:last-modified-date>
<address:address put-code="897528" visibility="public" path="/0000-0001-6816-8350/address/897528" display-index="2">
<common:created-date>2018-02-13T02:32:04.094Z</common:created-date>
<common:last-modified-date>2023-12-02T13:32:05.269Z</common:last-modified-date>
<common:source>
<common:source-orcid>
<common:uri>https://orcid.org/0000-0001-6816-8350</common:uri>
<common:path>0000-0001-6816-8350</common:path>
<common:host>orcid.org</common:host>
</common:source-orcid>
</common:source>
<address:country>AU</address:country>
</address:address>
<address:address put-code="3191142" visibility="public" path="/0000-0001-6816-8350/address/3191142" display-index="1">
<common:created-date>2023-12-02T13:32:05.260Z</common:created-date>
<common:last-modified-date>2023-12-02T13:32:05.260Z</common:last-modified-date>
<common:source>
<common:source-orcid>
<common:uri>https://orcid.org/0000-0001-6816-8350</common:uri>
<common:path>0000-0001-6816-8350</common:path>
<common:host>orcid.org</common:host>
</common:source-orcid>
</common:source>
<address:country>SA</address:country>
</address:address>
</address:addresses>
<keyword:keywords path="/0000-0001-6816-8350/keywords">
<common:last-modified-date>2023-12-02T13:31:16.269Z</common:last-modified-date>
<keyword:keyword put-code="368304" visibility="public" path="/0000-0001-6816-8350/keywords/368304" display-index="4">
<common:created-date>2016-02-09T09:16:44.001Z</common:created-date>
<common:last-modified-date>2023-12-02T13:31:16.269Z</common:last-modified-date>
<common:source>
<common:source-orcid>
<common:uri>https://orcid.org/0000-0001-6816-8350</common:uri>
<common:path>0000-0001-6816-8350</common:path>
<common:host>orcid.org</common:host>
</common:source-orcid>
</common:source>
<keyword:content>Organizational Behavior</keyword:content>
</keyword:keyword>
<keyword:keyword put-code="368303" visibility="public" path="/0000-0001-6816-8350/keywords/368303" display-index="3">
<common:created-date>2016-02-09T09:16:27.374Z</common:created-date>
<common:last-modified-date>2023-12-02T13:31:16.269Z</common:last-modified-date>
<common:source>
<common:source-orcid>
<common:uri>https://orcid.org/0000-0001-6816-8350</common:uri>
<common:path>0000-0001-6816-8350</common:path>
<common:host>orcid.org</common:host>
</common:source-orcid>
</common:source>
<keyword:content>Organizational Leadership</keyword:content>
</keyword:keyword>
<keyword:keyword put-code="368306" visibility="public" path="/0000-0001-6816-8350/keywords/368306" display-index="2">
<common:created-date>2016-02-09T09:17:08.998Z</common:created-date>
<common:last-modified-date>2023-12-02T13:31:16.269Z</common:last-modified-date>
<common:source>
<common:source-orcid>
<common:uri>https://orcid.org/0000-0001-6816-8350</common:uri>
<common:path>0000-0001-6816-8350</common:path>
<common:host>orcid.org</common:host>
</common:source-orcid>
</common:source>
<keyword:content>Organizational performance</keyword:content>
</keyword:keyword>
<keyword:keyword put-code="3590814" visibility="public" path="/0000-0001-6816-8350/keywords/3590814" display-index="1">
<common:created-date>2023-12-02T13:31:16.259Z</common:created-date>
<common:last-modified-date>2023-12-02T13:31:16.259Z</common:last-modified-date>
<common:source>
<common:source-orcid>
<common:uri>https://orcid.org/0000-0001-6816-8350</common:uri>
<common:path>0000-0001-6816-8350</common:path>
<common:host>orcid.org</common:host>
</common:source-orcid>
</common:source>
<keyword:content>Thriving at work</keyword:content>
</keyword:keyword>
</keyword:keywords>
<external-identifier:external-identifiers path="/0000-0001-6816-8350/external-identifiers">
<common:last-modified-date>2018-04-10T00:49:55.386Z</common:last-modified-date>
<external-identifier:external-identifier put-code="998076" visibility="public" path="/0000-0001-6816-8350/external-identifiers/998076" display-index="0">
<common:created-date>2018-04-10T00:49:55.385Z</common:created-date>
<common:last-modified-date>2018-04-10T00:49:55.386Z</common:last-modified-date>
<common:source>
<common:source-client-id>
<common:uri>https://orcid.org/client/0000-0003-1377-5676</common:uri>
<common:path>0000-0003-1377-5676</common:path>
<common:host>orcid.org</common:host>
</common:source-client-id>
<common:source-name>ResearcherID</common:source-name>
<common:assertion-origin-orcid>
<common:uri>https://orcid.org/0000-0001-6816-8350</common:uri>
<common:path>0000-0001-6816-8350</common:path>
<common:host>orcid.org</common:host>
</common:assertion-origin-orcid>
</common:source>
<common:external-id-type>ResearcherID</common:external-id-type>
<common:external-id-value>D-1929-2018</common:external-id-value>
<common:external-id-url>http://www.researcherid.com/rid/D-1929-2018</common:external-id-url>
<common:external-id-relationship>self</common:external-id-relationship>
</external-identifier:external-identifier>
</external-identifier:external-identifiers>
</person:person>
<activities:activities-summary path="/0000-0001-6816-8350/activities">
<common:last-modified-date>2023-12-02T13:28:26.051Z</common:last-modified-date>
<activities:distinctions path="/0000-0001-6816-8350/distinctions"/>
<activities:educations path="/0000-0001-6816-8350/educations">
<common:last-modified-date>2018-02-13T02:33:38.225Z</common:last-modified-date>
<activities:affiliation-group>
<common:last-modified-date>2016-02-09T06:55:21.838Z</common:last-modified-date>
<common:external-ids/>
<education:education-summary put-code="1549986" display-index="0" path="/0000-0001-6816-8350/education/1549986" visibility="public">
<common:created-date>2016-02-09T06:54:39.199Z</common:created-date>
<common:last-modified-date>2016-02-09T06:55:21.838Z</common:last-modified-date>
<common:source>
<common:source-orcid>
<common:uri>https://orcid.org/0000-0001-6816-8350</common:uri>
<common:path>0000-0001-6816-8350</common:path>
<common:host>orcid.org</common:host>
</common:source-orcid>
</common:source>
<common:department-name>Management</common:department-name>
<common:role-title>PhD</common:role-title>
<common:start-date>
<common:year>2021</common:year>
</common:start-date>
<common:end-date>
<common:year>2022</common:year>
<common:month>02</common:month>
<common:day>12</common:day>
</common:end-date>
<common:start-date>
<common:year>2003</common:year>
<common:month>03</common:month>
</common:start-date>
<common:end-date>
<common:year>2007</common:year>
<common:month>03</common:month>
</common:end-date>
<common:organization>
<common:name>University of New England</common:name>
<common:address>
<common:city>Armidale</common:city>
<common:region>NSW</common:region>
<common:country>AU</common:country>
</common:address>
<common:disambiguated-organization>
<common:disambiguated-organization-identifier>1319</common:disambiguated-organization-identifier>
<common:disambiguation-source>RINGGOLD</common:disambiguation-source>
</common:disambiguated-organization>
</common:organization>
</education:education-summary>
</activities:affiliation-group>
<activities:affiliation-group>
<common:last-modified-date>2018-02-13T02:33:38.225Z</common:last-modified-date>
<common:external-ids/>
<education:education-summary put-code="1549990" display-index="0" path="/0000-0001-6816-8350/education/1549990" visibility="public">
<common:created-date>2016-02-09T06:57:04.181Z</common:created-date>
<common:last-modified-date>2018-02-13T02:33:38.225Z</common:last-modified-date>
<common:source>
<common:source-orcid>
<common:uri>https://orcid.org/0000-0001-6816-8350</common:uri>
<common:path>0000-0001-6816-8350</common:path>
<common:host>orcid.org</common:host>
</common:source-orcid>
</common:source>
<common:department-name>Psychology</common:department-name>
<common:role-title>Master of Science (Industrial and Organizational) Psychology</common:role-title>
<common:start-date>
<common:year>1998</common:year>
<common:month>01</common:month>
</common:start-date>
<common:end-date>
<common:year>2000</common:year>
<common:month>01</common:month>
</common:end-date>
<common:organization>
<common:name>Universitas Gadjah Mada</common:name>
<common:address>
<common:city>Yogyakarta</common:city>
<common:region>Daerah Istimewa Yogyakart</common:region>
<common:country>ID</common:country>
</common:address>
<common:disambiguated-organization>
<common:disambiguated-organization-identifier>59166</common:disambiguated-organization-identifier>
<common:disambiguation-source>RINGGOLD</common:disambiguation-source>
</common:disambiguated-organization>
</common:organization>
</education:education-summary>
</activities:affiliation-group>
<activities:affiliation-group>
<common:last-modified-date>2018-02-13T02:33:35.821Z</common:last-modified-date>
<common:external-ids/>
<education:education-summary put-code="1549998" display-index="0" path="/0000-0001-6816-8350/education/1549998" visibility="public">
<common:created-date>2016-02-09T06:58:59.869Z</common:created-date>
<common:last-modified-date>2018-02-13T02:33:35.821Z</common:last-modified-date>
<common:source>
<common:source-orcid>
<common:uri>https://orcid.org/0000-0001-6816-8350</common:uri>
<common:path>0000-0001-6816-8350</common:path>
<common:host>orcid.org</common:host>
</common:source-orcid>
</common:source>
<common:department-name>Education</common:department-name>
<common:role-title>Bachelor of Education (Honors)</common:role-title>
<common:start-date>
<common:year>1988</common:year>
<common:month>03</common:month>
</common:start-date>
<common:end-date>
<common:year>1991</common:year>
<common:month>03</common:month>
</common:end-date>
<common:organization>
<common:name>Kenyatta University</common:name>
<common:address>
<common:city>Nairobi</common:city>
<common:region>Nairobi</common:region>
<common:country>KE</common:country>
</common:address>
<common:disambiguated-organization>
<common:disambiguated-organization-identifier>107864</common:disambiguated-organization-identifier>
<common:disambiguation-source>RINGGOLD</common:disambiguation-source>
</common:disambiguated-organization>
</common:organization>
</education:education-summary>
</activities:affiliation-group>
</activities:educations>
<activities:employments path="/0000-0001-6816-8350/employments">
<common:last-modified-date>2023-12-02T13:28:26.051Z</common:last-modified-date>
<activities:affiliation-group>
<common:last-modified-date>2023-12-02T13:28:26.051Z</common:last-modified-date>
<common:external-ids/>
<employment:employment-summary put-code="21884863" display-index="1" path="/0000-0001-6816-8350/employment/21884863" visibility="public">
<common:created-date>2023-12-02T13:28:26.051Z</common:created-date>
<common:last-modified-date>2023-12-02T13:28:26.051Z</common:last-modified-date>
<common:source>
<common:source-orcid>
<common:uri>https://orcid.org/0000-0001-6816-8350</common:uri>
<common:path>0000-0001-6816-8350</common:path>
<common:host>orcid.org</common:host>
</common:source-orcid>
</common:source>
<common:department-name>Management</common:department-name>
<common:role-title>Associate Professor in Management</common:role-title>
<common:start-date>
<common:year>2023</common:year>
<common:month>08</common:month>
<common:day>20</common:day>
</common:start-date>
<common:organization>
<common:name>Alfaisal University</common:name>
<common:address>
<common:city>Riyadh</common:city>
<common:country>SA</common:country>
</common:address>
<common:disambiguated-organization>
<common:disambiguated-organization-identifier>https://ror.org/00cdrtq48</common:disambiguated-organization-identifier>
<common:disambiguation-source>ROR</common:disambiguation-source>
</common:disambiguated-organization>
</common:organization>
<common:url>https://faculty.alfaisal.edu/user/mmuchiri</common:url>
</employment:employment-summary>
</activities:affiliation-group>
<activities:affiliation-group>
<common:last-modified-date>2016-02-09T07:00:06.052Z</common:last-modified-date>
<common:external-ids/>
<employment:employment-summary put-code="1550002" display-index="0" path="/0000-0001-6816-8350/employment/1550002" visibility="public">
<common:created-date>2016-02-09T07:00:06.052Z</common:created-date>
<common:last-modified-date>2016-02-09T07:00:06.052Z</common:last-modified-date>
<common:source>
<common:source-orcid>
<common:uri>https://orcid.org/0000-0001-6816-8350</common:uri>
<common:path>0000-0001-6816-8350</common:path>
<common:host>orcid.org</common:host>
</common:source-orcid>
</common:source>
<common:department-name>Management</common:department-name>
<common:role-title>Senior Lecturer</common:role-title>
<common:start-date>
<common:year>2014</common:year>
<common:month>02</common:month>
</common:start-date>
<common:organization>
<common:name>RMIT University</common:name>
<common:address>
<common:city>Melbourne</common:city>
<common:region>VIC</common:region>
<common:country>AU</common:country>
</common:address>
<common:disambiguated-organization>
<common:disambiguated-organization-identifier>5376</common:disambiguated-organization-identifier>
<common:disambiguation-source>RINGGOLD</common:disambiguation-source>
</common:disambiguated-organization>
</common:organization>
</employment:employment-summary>
</activities:affiliation-group>
<activities:affiliation-group>
<common:last-modified-date>2016-02-09T07:01:08.398Z</common:last-modified-date>
<common:external-ids/>
<employment:employment-summary put-code="1550007" display-index="0" path="/0000-0001-6816-8350/employment/1550007" visibility="public">
<common:created-date>2016-02-09T07:01:08.398Z</common:created-date>
<common:last-modified-date>2016-02-09T07:01:08.398Z</common:last-modified-date>
<common:source>
<common:source-orcid>
<common:uri>https://orcid.org/0000-0001-6816-8350</common:uri>
<common:path>0000-0001-6816-8350</common:path>
<common:host>orcid.org</common:host>
</common:source-orcid>
</common:source>
<common:department-name>Management</common:department-name>
<common:role-title>Senior Lecturer in Human Resource Management</common:role-title>
<common:start-date>
<common:year>2010</common:year>
<common:month>01</common:month>
</common:start-date>
<common:end-date>
<common:year>2014</common:year>
<common:month>02</common:month>
</common:end-date>
<common:organization>
<common:name>Central Queensland University</common:name>
<common:address>
<common:city>Rockhampton</common:city>
<common:region>QLD</common:region>
<common:country>AU</common:country>
</common:address>
<common:disambiguated-organization>
<common:disambiguated-organization-identifier>273488</common:disambiguated-organization-identifier>
<common:disambiguation-source>RINGGOLD</common:disambiguation-source>
</common:disambiguated-organization>
</common:organization>
</employment:employment-summary>
</activities:affiliation-group>
<activities:affiliation-group>
<common:last-modified-date>2016-02-09T07:01:47.814Z</common:last-modified-date>
<common:external-ids/>
<employment:employment-summary put-code="1550010" display-index="0" path="/0000-0001-6816-8350/employment/1550010" visibility="public">
<common:created-date>2016-02-09T07:01:47.814Z</common:created-date>
<common:last-modified-date>2016-02-09T07:01:47.814Z</common:last-modified-date>
<common:source>
<common:source-orcid>
<common:uri>https://orcid.org/0000-0001-6816-8350</common:uri>
<common:path>0000-0001-6816-8350</common:path>
<common:host>orcid.org</common:host>
</common:source-orcid>
</common:source>
<common:department-name>Management</common:department-name>
<common:role-title>Lecturer in Management</common:role-title>
<common:start-date>
<common:year>2007</common:year>
<common:month>01</common:month>
</common:start-date>
<common:end-date>
<common:year>2010</common:year>
<common:month>01</common:month>
</common:end-date>
<common:organization>
<common:name>Central Queensland University</common:name>
<common:address>
<common:city>Rockhampton</common:city>
<common:region>QLD</common:region>
<common:country>AU</common:country>
</common:address>
<common:disambiguated-organization>
<common:disambiguated-organization-identifier>273488</common:disambiguated-organization-identifier>
<common:disambiguation-source>RINGGOLD</common:disambiguation-source>
</common:disambiguated-organization>
</common:organization>
</employment:employment-summary>
</activities:affiliation-group>
<activities:affiliation-group>
<common:last-modified-date>2018-02-13T02:33:13.213Z</common:last-modified-date>
<common:external-ids/>
<employment:employment-summary put-code="1550017" display-index="0" path="/0000-0001-6816-8350/employment/1550017" visibility="public">
<common:created-date>2016-02-09T07:03:42.180Z</common:created-date>
<common:last-modified-date>2018-02-13T02:33:13.213Z</common:last-modified-date>
<common:source>
<common:source-orcid>
<common:uri>https://orcid.org/0000-0001-6816-8350</common:uri>
<common:path>0000-0001-6816-8350</common:path>
<common:host>orcid.org</common:host>
</common:source-orcid>
</common:source>
<common:department-name>Human Resource Development Division</common:department-name>
<common:role-title>Chief Human Resource Development Officer</common:role-title>
<common:start-date>
<common:year>2005</common:year>
<common:month>01</common:month>
</common:start-date>
<common:end-date>
<common:year>2007</common:year>
<common:month>01</common:month>
</common:end-date>
<common:organization>
<common:name>Government of Kenya Directorate of Personnel Management</common:name>
<common:address>
<common:city>Nairobi</common:city>
<common:region>Nairobi</common:region>
<common:country>KE</common:country>
</common:address>
<common:disambiguated-organization>
<common:disambiguated-organization-identifier>360256</common:disambiguated-organization-identifier>
<common:disambiguation-source>RINGGOLD</common:disambiguation-source>
</common:disambiguated-organization>
</common:organization>
</employment:employment-summary>
</activities:affiliation-group>
<activities:affiliation-group>
<common:last-modified-date>2016-02-09T07:05:02.300Z</common:last-modified-date>
<common:external-ids/>
<employment:employment-summary put-code="1550020" display-index="0" path="/0000-0001-6816-8350/employment/1550020" visibility="public">
<common:created-date>2016-02-09T07:05:02.300Z</common:created-date>
<common:last-modified-date>2016-02-09T07:05:02.300Z</common:last-modified-date>
<common:source>
<common:source-orcid>
<common:uri>https://orcid.org/0000-0001-6816-8350</common:uri>
<common:path>0000-0001-6816-8350</common:path>
<common:host>orcid.org</common:host>
</common:source-orcid>
</common:source>
<common:department-name>Human Resource Development Division</common:department-name>
<common:role-title>Human Resource Development Officer</common:role-title>
<common:start-date>
<common:year>2001</common:year>
<common:month>01</common:month>
</common:start-date>
<common:end-date>
<common:year>2005</common:year>
<common:month>01</common:month>
</common:end-date>
<common:organization>
<common:name>Government of Kenya Directorate of Personnel Management</common:name>
<common:address>
<common:city>Nairobi</common:city>
<common:region>Nairobi</common:region>
<common:country>KE</common:country>
</common:address>
<common:disambiguated-organization>
<common:disambiguated-organization-identifier>360256</common:disambiguated-organization-identifier>
<common:disambiguation-source>RINGGOLD</common:disambiguation-source>
</common:disambiguated-organization>
</common:organization>
</employment:employment-summary>
</activities:affiliation-group>
<activities:affiliation-group>
<common:last-modified-date>2016-02-09T07:36:52.398Z</common:last-modified-date>
<common:external-ids/>
<employment:employment-summary put-code="1550050" display-index="0" path="/0000-0001-6816-8350/employment/1550050" visibility="public">
<common:created-date>2016-02-09T07:36:52.398Z</common:created-date>
<common:last-modified-date>2016-02-09T07:36:52.398Z</common:last-modified-date>
<common:source>
<common:source-orcid>
<common:uri>https://orcid.org/0000-0001-6816-8350</common:uri>
<common:path>0000-0001-6816-8350</common:path>
<common:host>orcid.org</common:host>
</common:source-orcid>
</common:source>
<common:department-name>Public Sector Management Technical Assistance Project</common:department-name>
<common:role-title>Project Coordinator for Development Learning Centre</common:role-title>
<common:start-date>
<common:year>2002</common:year>
<common:month>08</common:month>
</common:start-date>
<common:end-date>
<common:year>2003</common:year>
<common:month>03</common:month>
</common:end-date>
<common:organization>
<common:name>Government of Kenya Directorate of Personnel Management</common:name>
<common:address>
<common:city>Nairobi</common:city>
<common:region>Nairobi</common:region>
<common:country>KE</common:country>
</common:address>
<common:disambiguated-organization>
<common:disambiguated-organization-identifier>360256</common:disambiguated-organization-identifier>
<common:disambiguation-source>RINGGOLD</common:disambiguation-source>
</common:disambiguated-organization>
</common:organization>
</employment:employment-summary>
</activities:affiliation-group>
</activities:employments>
<activities:fundings path="/0000-0001-6816-8350/fundings">
<common:last-modified-date>2016-02-09T09:05:27.100Z</common:last-modified-date>
<activities:group>
<common:last-modified-date>2016-02-09T09:05:27.100Z</common:last-modified-date>
<common:external-ids/>
<funding:funding-summary put-code="150520" path="/0000-0001-6816-8350/funding/150520" visibility="public" display-index="6">
<common:created-date>2016-02-09T09:05:27.100Z</common:created-date>
<common:last-modified-date>2016-02-09T09:05:27.100Z</common:last-modified-date>
<common:source>
<common:source-orcid>
<common:uri>https://orcid.org/0000-0001-6816-8350</common:uri>
<common:path>0000-0001-6816-8350</common:path>
<common:host>orcid.org</common:host>
</common:source-orcid>
</common:source>
<funding:title>
<common:title>A cross-country examination of Employee Wellbeing, Leadership, High Performance Work Systems and Innovative Behaviours</common:title>
</funding:title>
<funding:type>grant</funding:type>
<common:start-date>
<common:year>2016</common:year>
<common:month>01</common:month>
</common:start-date>
<common:end-date>
<common:year>2016</common:year>
<common:month>12</common:month>
</common:end-date>
<common:organization>
<common:name>RMIT University</common:name>
<common:address>
<common:city>VIC</common:city>
<common:region>VIC</common:region>
<common:country>AU</common:country>
</common:address>
<common:disambiguated-organization>
<common:disambiguated-organization-identifier>http://dx.doi.org/10.13039/501100001780</common:disambiguated-organization-identifier>
<common:disambiguation-source>FUNDREF</common:disambiguation-source>
</common:disambiguated-organization>
</common:organization>
</funding:funding-summary>
</activities:group>
<activities:group>
<common:last-modified-date>2016-02-09T09:03:51.641Z</common:last-modified-date>
<common:external-ids/>
<funding:funding-summary put-code="150518" path="/0000-0001-6816-8350/funding/150518" visibility="public" display-index="5">
<common:created-date>2016-02-09T09:03:51.641Z</common:created-date>
<common:last-modified-date>2016-02-09T09:03:51.641Z</common:last-modified-date>
<common:source>
<common:source-orcid>
<common:uri>https://orcid.org/0000-0001-6816-8350</common:uri>
<common:path>0000-0001-6816-8350</common:path>
<common:host>orcid.org</common:host>
</common:source-orcid>
</common:source>
<funding:title>
<common:title>Leading Safe and Thriving Organisations: An Investigation of the Relationships between Leadership, Thriving Behaviour, Authentic Followership and Safety Climate in an Australian Multinational Enterprise</common:title>
</funding:title>
<funding:type>grant</funding:type>
<common:start-date>
<common:year>2015</common:year>
<common:month>01</common:month>
</common:start-date>
<common:end-date>
<common:year>2015</common:year>
<common:month>12</common:month>
</common:end-date>
<common:organization>
<common:name>RMIT University</common:name>
<common:address>
<common:city>VIC</common:city>
<common:region>VIC</common:region>
<common:country>AU</common:country>
</common:address>
<common:disambiguated-organization>
<common:disambiguated-organization-identifier>http://dx.doi.org/10.13039/501100001780</common:disambiguated-organization-identifier>
<common:disambiguation-source>FUNDREF</common:disambiguation-source>
</common:disambiguated-organization>
</common:organization>
</funding:funding-summary>
</activities:group>
<activities:group>
<common:last-modified-date>2016-02-09T09:02:28.297Z</common:last-modified-date>
<common:external-ids/>
<funding:funding-summary put-code="150516" path="/0000-0001-6816-8350/funding/150516" visibility="public" display-index="4">
<common:created-date>2016-02-09T09:02:28.297Z</common:created-date>
<common:last-modified-date>2016-02-09T09:02:28.297Z</common:last-modified-date>
<common:source>
<common:source-orcid>
<common:uri>https://orcid.org/0000-0001-6816-8350</common:uri>
<common:path>0000-0001-6816-8350</common:path>
<common:host>orcid.org</common:host>
</common:source-orcid>
</common:source>
<funding:title>
<common:title>A multilevel, cross-country examination of leadership, followership and innovative behaviours in Australia and Indonesia. </common:title>
</funding:title>
<funding:type>grant</funding:type>
<common:start-date>
<common:year>2015</common:year>
<common:month>01</common:month>
</common:start-date>
<common:end-date>
<common:year>2015</common:year>
<common:month>12</common:month>
</common:end-date>
<common:organization>
<common:name>RMIT University</common:name>
<common:address>
<common:city>VIC</common:city>
<common:region>VIC</common:region>
<common:country>AU</common:country>
</common:address>
<common:disambiguated-organization>
<common:disambiguated-organization-identifier>http://dx.doi.org/10.13039/501100001780</common:disambiguated-organization-identifier>
<common:disambiguation-source>FUNDREF</common:disambiguation-source>
</common:disambiguated-organization>
</common:organization>
</funding:funding-summary>
</activities:group>
<activities:group>
<common:last-modified-date>2016-02-09T09:00:51.749Z</common:last-modified-date>
<common:external-ids/>
<funding:funding-summary put-code="150514" path="/0000-0001-6816-8350/funding/150514" visibility="public" display-index="3">
<common:created-date>2016-02-09T09:00:51.749Z</common:created-date>
<common:last-modified-date>2016-02-09T09:00:51.749Z</common:last-modified-date>
<common:source>
<common:source-orcid>
<common:uri>https://orcid.org/0000-0001-6816-8350</common:uri>
<common:path>0000-0001-6816-8350</common:path>
<common:host>orcid.org</common:host>
</common:source-orcid>
</common:source>
<funding:title>
<common:title>Workplace safety and positive leadership: Exploring relationships between leader behaviours, organisational climate, safety climate, safety citizenship behaviours and innovative behaviours within city councils in Victoria </common:title>
</funding:title>
<funding:type>grant</funding:type>
<common:start-date>
<common:year>2014</common:year>
<common:month>01</common:month>
</common:start-date>
<common:end-date>
<common:year>2014</common:year>
<common:month>12</common:month>
</common:end-date>
<common:organization>
<common:name>RMIT University</common:name>
<common:address>
<common:city>VIC</common:city>
<common:region>VIC</common:region>
<common:country>AU</common:country>
</common:address>
<common:disambiguated-organization>
<common:disambiguated-organization-identifier>http://dx.doi.org/10.13039/501100001780</common:disambiguated-organization-identifier>
<common:disambiguation-source>FUNDREF</common:disambiguation-source>
</common:disambiguated-organization>
</common:organization>
</funding:funding-summary>
</activities:group>
<activities:group>
<common:last-modified-date>2016-02-09T07:46:44.919Z</common:last-modified-date>
<common:external-ids/>
<funding:funding-summary put-code="150485" path="/0000-0001-6816-8350/funding/150485" visibility="public" display-index="0">
<common:created-date>2016-02-09T07:46:44.919Z</common:created-date>
<common:last-modified-date>2016-02-09T07:46:44.919Z</common:last-modified-date>
<common:source>
<common:source-orcid>
<common:uri>https://orcid.org/0000-0001-6816-8350</common:uri>
<common:path>0000-0001-6816-8350</common:path>
<common:host>orcid.org</common:host>
</common:source-orcid>
</common:source>
<funding:title>
<common:title>Sustainable Business Model for Central Queensland Regional Information Systems.</common:title>
</funding:title>
<funding:type>grant</funding:type>
<common:start-date>
<common:year>2008</common:year>
<common:month>01</common:month>
</common:start-date>
<common:end-date>
<common:year>2008</common:year>
<common:month>12</common:month>
</common:end-date>
<common:organization>
<common:name>Department of Local Government, Planning, Sport and Recreation, Queensland, Australia </common:name>
<common:address>
<common:city>Rockhampton</common:city>
<common:region>Central Queensland</common:region>
<common:country>AU</common:country>
</common:address>
</common:organization>
</funding:funding-summary>
</activities:group>
</activities:fundings>
<activities:invited-positions path="/0000-0001-6816-8350/invited-positions"/>
<activities:memberships path="/0000-0001-6816-8350/memberships"/>
<activities:peer-reviews path="/0000-0001-6816-8350/peer-reviews">
<common:last-modified-date>2023-05-31T05:53:44.542Z</common:last-modified-date>
<activities:group>
<common:last-modified-date>2023-05-31T05:53:44.542Z</common:last-modified-date>
<common:external-ids>
<common:external-id>
<common:external-id-type>peer-review</common:external-id-type>
<common:external-id-value>issn:0167-4544</common:external-id-value>
</common:external-id>
</common:external-ids>
<activities:peer-review-group>
<common:last-modified-date>2023-02-28T06:51:52.426Z</common:last-modified-date>
<common:external-ids>
<common:external-id>
<common:external-id-type>source-work-id</common:external-id-type>
<common:external-id-value>c9bdf086-cfee-4cd9-bcfb-268cc5423248</common:external-id-value>
<common:external-id-normalized transient="true">c9bdf086-cfee-4cd9-bcfb-268cc5423248</common:external-id-normalized>
<common:external-id-url></common:external-id-url>
<common:external-id-relationship>self</common:external-id-relationship>
</common:external-id>
</common:external-ids>
<peer-review:peer-review-summary put-code="8741329" path="/0000-0001-6816-8350/peer-review/8741329" visibility="public" display-index="0">
<common:created-date>2023-02-28T06:51:52.426Z</common:created-date>
<common:last-modified-date>2023-02-28T06:51:52.426Z</common:last-modified-date>
<common:source>
<common:source-client-id>
<common:uri>https://orcid.org/client/APP-945VYTN20C7BZXYT</common:uri>
<common:path>APP-945VYTN20C7BZXYT</common:path>
<common:host>orcid.org</common:host>
</common:source-client-id>
<common:source-name>Springer Nature @ Editorial Manager</common:source-name>
</common:source>
<peer-review:reviewer-role>reviewer</peer-review:reviewer-role>
<common:external-ids>
<common:external-id>
<common:external-id-type>source-work-id</common:external-id-type>
<common:external-id-value>c9bdf086-cfee-4cd9-bcfb-268cc5423248</common:external-id-value>
<common:external-id-normalized transient="true">c9bdf086-cfee-4cd9-bcfb-268cc5423248</common:external-id-normalized>
<common:external-id-url></common:external-id-url>
<common:external-id-relationship>self</common:external-id-relationship>
</common:external-id>
</common:external-ids>
<peer-review:review-type>review</peer-review:review-type>
<peer-review:completion-date>
<common:year>2023</common:year>
</peer-review:completion-date>
<peer-review:review-group-id>issn:0167-4544</peer-review:review-group-id>
<peer-review:convening-organization>
<common:name>Springer Nature</common:name>
<common:address>
<common:city>New York</common:city>
<common:country>US</common:country>
</common:address>
<common:disambiguated-organization>
<common:disambiguated-organization-identifier>grid.467660.5</common:disambiguated-organization-identifier>
<common:disambiguation-source>GRID</common:disambiguation-source>
</common:disambiguated-organization>
</peer-review:convening-organization>
</peer-review:peer-review-summary>
</activities:peer-review-group>
<activities:peer-review-group>
<common:last-modified-date>2023-05-31T05:53:44.542Z</common:last-modified-date>
<common:external-ids>
<common:external-id>
<common:external-id-type>source-work-id</common:external-id-type>
<common:external-id-value>c442840b-5807-459d-802a-303d8ba4e25e</common:external-id-value>
<common:external-id-normalized transient="true">c442840b-5807-459d-802a-303d8ba4e25e</common:external-id-normalized>
<common:external-id-url></common:external-id-url>
<common:external-id-relationship>self</common:external-id-relationship>
</common:external-id>
</common:external-ids>
<peer-review:peer-review-summary put-code="9680570" path="/0000-0001-6816-8350/peer-review/9680570" visibility="public" display-index="0">
<common:created-date>2023-05-31T05:53:44.542Z</common:created-date>
<common:last-modified-date>2023-05-31T05:53:44.542Z</common:last-modified-date>
<common:source>
<common:source-client-id>
<common:uri>https://orcid.org/client/APP-945VYTN20C7BZXYT</common:uri>
<common:path>APP-945VYTN20C7BZXYT</common:path>
<common:host>orcid.org</common:host>
</common:source-client-id>
<common:source-name>Springer Nature @ Editorial Manager</common:source-name>
</common:source>
<peer-review:reviewer-role>reviewer</peer-review:reviewer-role>
<common:external-ids>
<common:external-id>
<common:external-id-type>source-work-id</common:external-id-type>
<common:external-id-value>c442840b-5807-459d-802a-303d8ba4e25e</common:external-id-value>
<common:external-id-normalized transient="true">c442840b-5807-459d-802a-303d8ba4e25e</common:external-id-normalized>
<common:external-id-url></common:external-id-url>
<common:external-id-relationship>self</common:external-id-relationship>
</common:external-id>
</common:external-ids>
<peer-review:review-type>review</peer-review:review-type>
<peer-review:completion-date>
<common:year>2023</common:year>
</peer-review:completion-date>
<peer-review:review-group-id>issn:0167-4544</peer-review:review-group-id>
<peer-review:convening-organization>
<common:name>Springer Nature</common:name>
<common:address>
<common:city>New York</common:city>
<common:country>US</common:country>
</common:address>
<common:disambiguated-organization>
<common:disambiguated-organization-identifier>grid.467660.5</common:disambiguated-organization-identifier>
<common:disambiguation-source>GRID</common:disambiguation-source>
</common:disambiguated-organization>
</peer-review:convening-organization>
</peer-review:peer-review-summary>
</activities:peer-review-group>
</activities:group>
</activities:peer-reviews>
<activities:qualifications path="/0000-0001-6816-8350/qualifications"/>
<activities:research-resources path="/0000-0001-6816-8350/research-resources"/>
<activities:services path="/0000-0001-6816-8350/services"/>
<activities:works path="/0000-0001-6816-8350/works">
<common:last-modified-date>2023-06-02T20:12:00.338Z</common:last-modified-date>
<activities:group>
<common:last-modified-date>2023-06-02T20:12:00.338Z</common:last-modified-date>
<common:external-ids>
<common:external-id>
<common:external-id-type>doi</common:external-id-type>
<common:external-id-value>10.4337/9781800881945.00020</common:external-id-value>
<common:external-id-normalized transient="true">10.4337/9781800881945.00020</common:external-id-normalized>
<common:external-id-url>https://doi.org/10.4337/9781800881945.00020</common:external-id-url>
<common:external-id-relationship>self</common:external-id-relationship>
</common:external-id>
</common:external-ids>
<work:work-summary put-code="134891279" path="/0000-0001-6816-8350/work/134891279" visibility="public" display-index="0">
<common:created-date>2023-05-11T21:05:54.188Z</common:created-date>
<common:last-modified-date>2023-06-02T20:12:00.338Z</common:last-modified-date>
<common:source>
<common:source-client-id>
<common:uri>https://orcid.org/client/0000-0001-9884-1913</common:uri>
<common:path>0000-0001-9884-1913</common:path>
<common:host>orcid.org</common:host>
</common:source-client-id>
<common:source-name>Crossref</common:source-name>
</common:source>
<work:title>
<common:title>Ethical leadership as workplace innovation and enabler for employee commitment and innovative work behaviours in Vietnam</common:title>
</work:title>
<common:external-ids>
<common:external-id>
<common:external-id-type>doi</common:external-id-type>
<common:external-id-value>10.4337/9781800881945.00020</common:external-id-value>
<common:external-id-normalized transient="true">10.4337/9781800881945.00020</common:external-id-normalized>
<common:external-id-url>https://doi.org/10.4337/9781800881945.00020</common:external-id-url>
<common:external-id-relationship>self</common:external-id-relationship>
</common:external-id>
</common:external-ids>
<common:url>https://doi.org/10.4337/9781800881945.00020</common:url>
<work:type>book-chapter</work:type>
<common:publication-date>
<common:year>2023</common:year>
<common:month>05</common:month>
<common:day>26</common:day>
</common:publication-date>
</work:work-summary>
</activities:group>
<activities:group>
<common:last-modified-date>2023-03-01T11:30:31.972Z</common:last-modified-date>
<common:external-ids>
<common:external-id>
<common:external-id-type>doi</common:external-id-type>
<common:external-id-value>10.1007/s10551-022-05081-6</common:external-id-value>
<common:external-id-normalized transient="true">10.1007/s10551-022-05081-6</common:external-id-normalized>
<common:external-id-url>https://doi.org/10.1007/s10551-022-05081-6</common:external-id-url>
<common:external-id-relationship>self</common:external-id-relationship>
</common:external-id>
</common:external-ids>
<work:work-summary put-code="110048777" path="/0000-0001-6816-8350/work/110048777" visibility="public" display-index="0">
<common:created-date>2022-03-18T03:36:55.927Z</common:created-date>
<common:last-modified-date>2023-03-01T11:30:31.972Z</common:last-modified-date>
<common:source>
<common:source-client-id>
<common:uri>https://orcid.org/client/0000-0001-9884-1913</common:uri>
<common:path>0000-0001-9884-1913</common:path>
<common:host>orcid.org</common:host>
</common:source-client-id>
<common:source-name>Crossref</common:source-name>
</common:source>
<work:title>
<common:title>Unethical Leadership: Review, Synthesis and Directions for Future Research</common:title>
</work:title>
<common:external-ids>
<common:external-id>
<common:external-id-type>doi</common:external-id-type>
<common:external-id-value>10.1007/s10551-022-05081-6</common:external-id-value>
<common:external-id-normalized transient="true">10.1007/s10551-022-05081-6</common:external-id-normalized>
<common:external-id-url>https://doi.org/10.1007/s10551-022-05081-6</common:external-id-url>
<common:external-id-relationship>self</common:external-id-relationship>
</common:external-id>
</common:external-ids>
<common:url>https://doi.org/10.1007/s10551-022-05081-6</common:url>
<work:type>journal-article</work:type>
<common:publication-date>
<common:year>2023</common:year>
<common:month>03</common:month>
</common:publication-date>
<work:journal-title>Journal of Business Ethics</work:journal-title>
</work:work-summary>
</activities:group>
<activities:group>
<common:last-modified-date>2022-05-28T18:16:16.575Z</common:last-modified-date>
<common:external-ids>
<common:external-id>
<common:external-id-type>doi</common:external-id-type>
<common:external-id-value>10.1017/jmo.2019.33</common:external-id-value>
<common:external-id-normalized transient="true">10.1017/jmo.2019.33</common:external-id-normalized>
<common:external-id-url>https://doi.org/10.1017/jmo.2019.33</common:external-id-url>
<common:external-id-relationship>self</common:external-id-relationship>
</common:external-id>
</common:external-ids>
<work:work-summary put-code="57272180" path="/0000-0001-6816-8350/work/57272180" visibility="public" display-index="0">
<common:created-date>2019-05-10T07:23:14.608Z</common:created-date>
<common:last-modified-date>2022-05-28T18:16:16.575Z</common:last-modified-date>
<common:source>
<common:source-client-id>
<common:uri>https://orcid.org/client/0000-0001-9884-1913</common:uri>
<common:path>0000-0001-9884-1913</common:path>
<common:host>orcid.org</common:host>
</common:source-client-id>
<common:source-name>Crossref</common:source-name>
</common:source>
<work:title>
<common:title>And now for something completely different: Reframing social processes of leadership theory using positive organisational behaviour</common:title>
</work:title>
<common:external-ids>
<common:external-id>
<common:external-id-type>doi</common:external-id-type>
<common:external-id-value>10.1017/jmo.2019.33</common:external-id-value>
<common:external-id-normalized transient="true">10.1017/jmo.2019.33</common:external-id-normalized>
<common:external-id-url>https://doi.org/10.1017/jmo.2019.33</common:external-id-url>
<common:external-id-relationship>self</common:external-id-relationship>
</common:external-id>
</common:external-ids>
<common:url>https://doi.org/10.1017/jmo.2019.33</common:url>
<work:type>journal-article</work:type>
<common:publication-date>
<common:year>2019</common:year>
<common:month>05</common:month>
<common:day>09</common:day>
</common:publication-date>
<work:journal-title>Journal of Management &amp; Organization</work:journal-title>
</work:work-summary>
</activities:group>
</activities:works>
</activities:activities-summary>
</record:record>

View File

@ -0,0 +1,60 @@
<?xml version="1.0" encoding="UTF-8" standalone="yes"?>
<activities:employments path="/0000-0002-0456-1185/employments" xmlns:internal="http://www.orcid.org/ns/internal" xmlns:education="http://www.orcid.org/ns/education" xmlns:distinction="http://www.orcid.org/ns/distinction" xmlns:deprecated="http://www.orcid.org/ns/deprecated" xmlns:other-name="http://www.orcid.org/ns/other-name" xmlns:membership="http://www.orcid.org/ns/membership" xmlns:error="http://www.orcid.org/ns/error" xmlns:common="http://www.orcid.org/ns/common" xmlns:record="http://www.orcid.org/ns/record" xmlns:personal-details="http://www.orcid.org/ns/personal-details" xmlns:keyword="http://www.orcid.org/ns/keyword" xmlns:email="http://www.orcid.org/ns/email" xmlns:external-identifier="http://www.orcid.org/ns/external-identifier" xmlns:funding="http://www.orcid.org/ns/funding" xmlns:preferences="http://www.orcid.org/ns/preferences" xmlns:address="http://www.orcid.org/ns/address" xmlns:invited-position="http://www.orcid.org/ns/invited-position" xmlns:work="http://www.orcid.org/ns/work" xmlns:history="http://www.orcid.org/ns/history" xmlns:employment="http://www.orcid.org/ns/employment" xmlns:qualification="http://www.orcid.org/ns/qualification" xmlns:service="http://www.orcid.org/ns/service" xmlns:person="http://www.orcid.org/ns/person" xmlns:activities="http://www.orcid.org/ns/activities" xmlns:researcher-url="http://www.orcid.org/ns/researcher-url" xmlns:peer-review="http://www.orcid.org/ns/peer-review" xmlns:bulk="http://www.orcid.org/ns/bulk" xmlns:research-resource="http://www.orcid.org/ns/research-resource">
<common:last-modified-date>2024-01-07T23:59:38.869Z</common:last-modified-date>
<activities:affiliation-group>
<common:last-modified-date>2024-01-07T23:59:38.869Z</common:last-modified-date>
<common:external-ids/>
<employment:employment-summary put-code="22127142" display-index="0" path="/0000-0002-0456-1185/employment/22127142" visibility="public">
<common:created-date>2024-01-07T23:59:38.869Z</common:created-date>
<common:last-modified-date>2024-01-07T23:59:38.869Z</common:last-modified-date>
<common:source>
<common:source-client-id>
<common:uri>https://orcid.org/client/APP-N0TAO4G9BBK9PWHT</common:uri>
<common:path>APP-N0TAO4G9BBK9PWHT</common:path>
<common:host>orcid.org</common:host>
</common:source-client-id>
<common:source-name>Tampere University</common:source-name>
</common:source>
<common:organization>
<common:name>Tampere University</common:name>
<common:address>
<common:city>Tampere</common:city>
<common:country>FI</common:country>
</common:address>
<common:disambiguated-organization>
<common:disambiguated-organization-identifier>https://ror.org/033003e23</common:disambiguated-organization-identifier>
<common:disambiguation-source>ROR</common:disambiguation-source>
</common:disambiguated-organization>
</common:organization>
</employment:employment-summary>
</activities:affiliation-group>
<activities:affiliation-group>
<common:last-modified-date>2019-01-03T17:00:05.658Z</common:last-modified-date>
<common:external-ids/>
<employment:employment-summary put-code="3291239" display-index="1" path="/0000-0002-0456-1185/employment/3291239" visibility="public">
<common:created-date>2017-02-26T04:46:20.917Z</common:created-date>
<common:last-modified-date>2019-01-03T17:00:05.658Z</common:last-modified-date>
<common:source>
<common:source-orcid>
<common:uri>https://orcid.org/0000-0002-0456-1185</common:uri>
<common:path>0000-0002-0456-1185</common:path>
<common:host>orcid.org</common:host>
</common:source-orcid>
<common:source-name>Tiina Manninen</common:source-name>
</common:source>
<common:department-name> Faculty of Medicine and Health Technology</common:department-name>
<common:role-title>Academy Research Fellow</common:role-title>
<common:organization>
<common:name>Tampere University</common:name>
<common:address>
<common:city>Tampere</common:city>
<common:country>FI</common:country>
</common:address>
<common:disambiguated-organization>
<common:disambiguated-organization-identifier>7839</common:disambiguated-organization-identifier>
<common:disambiguation-source>RINGGOLD</common:disambiguation-source>
</common:disambiguated-organization>
</common:organization>
</employment:employment-summary>
</activities:affiliation-group>
</activities:employments>

View File

@ -23,10 +23,15 @@ class CrossrefMappingTest {
val mapper = new ObjectMapper()
@Test
def testMissingAuthorParser():Unit = {
val json: String = Source.fromInputStream(getClass.getResourceAsStream("/eu/dnetlib/doiboost/crossref/s41567-022-01757-y.json")).mkString
def testMissingAuthorParser(): Unit = {
val json: String = Source
.fromInputStream(getClass.getResourceAsStream("/eu/dnetlib/doiboost/crossref/s41567-022-01757-y.json"))
.mkString
val result = Crossref2Oaf.convert(json)
result.filter(o => o.isInstanceOf[Publication]).map(p=> p.asInstanceOf[Publication]).foreach(p =>assertTrue(p.getAuthor.size()>0))
result
.filter(o => o.isInstanceOf[Publication])
.map(p => p.asInstanceOf[Publication])
.foreach(p => assertTrue(p.getAuthor.size() > 0))
}
@Test

View File

@ -1293,6 +1293,7 @@ class MappersTest {
p.getInstance().get(0).getAlternateIdentifier().forEach(x -> System.out.println(x.getValue()));
}
@Test
void testNotWellFormed() throws IOException {
final String xml = IOUtils