762 lines
32 KiB
Java
762 lines
32 KiB
Java
package eu.dnetlib.dhp.schema.oaf.utils;
|
|
|
|
import com.google.common.base.Preconditions;
|
|
import eu.dnetlib.dhp.common.api.zenodo.File;
|
|
import eu.dnetlib.dhp.schema.common.AccessRightComparator;
|
|
import eu.dnetlib.dhp.schema.common.ModelConstants;
|
|
import eu.dnetlib.dhp.schema.common.ModelSupport;
|
|
import eu.dnetlib.dhp.schema.oaf.*;
|
|
import org.apache.commons.lang3.StringUtils;
|
|
import org.apache.commons.lang3.tuple.ImmutablePair;
|
|
import org.apache.commons.lang3.tuple.Pair;
|
|
import static com.google.common.base.Preconditions.checkArgument;
|
|
import static com.ibm.icu.text.PluralRules.Operand.e;
|
|
|
|
import java.text.ParseException;
|
|
import java.util.*;
|
|
import java.util.stream.Collectors;
|
|
import java.util.stream.Stream;
|
|
|
|
/**
|
|
* The type Oaf utils class groups all
|
|
* the utilities method used for OAF Generation
|
|
*/
|
|
public class OafUtils {
|
|
|
|
/**
|
|
* Normalize pid string.
|
|
*
|
|
* @param pid the pid
|
|
* @return the string
|
|
*/
|
|
public static String extractKeyFromPid(final StructuredProperty pid) {
|
|
if (pid == null)
|
|
return null;
|
|
final StructuredProperty normalizedPid = CleaningFunctions.normalizePidValue(pid);
|
|
|
|
return String.format("%s::%s", normalizedPid.getQualifier().getClassid(), normalizedPid.getValue());
|
|
}
|
|
|
|
|
|
/**
|
|
* This method converts the list of instance enrichments
|
|
* into a Map where the key is the normalized identifier
|
|
* and the value is the instance itself
|
|
*
|
|
* @param ri the list of enrichment instances
|
|
* @return the result map
|
|
*/
|
|
public static Map<String, Instance> toInstanceMap(final List<Instance> ri) {
|
|
|
|
|
|
return ri
|
|
.stream()
|
|
.filter(i -> i.getPid() != null || i.getAlternateIdentifier() != null)
|
|
.flatMap(i -> {
|
|
final List<Pair<String, Instance>> result = new ArrayList<>();
|
|
if (i.getPid() != null)
|
|
i.getPid().stream().filter(OafUtils::validPid).forEach(p -> result.add(new ImmutablePair<>(extractKeyFromPid(p), i)));
|
|
if (i.getAlternateIdentifier() != null)
|
|
i.getAlternateIdentifier().stream().filter(OafUtils::validPid).forEach(p -> result.add(new ImmutablePair<>(extractKeyFromPid(p), i)));
|
|
return result.stream();
|
|
}).collect(Collectors.toMap(
|
|
Pair::getLeft,
|
|
Pair::getRight,
|
|
(a, b) -> a
|
|
));
|
|
}
|
|
|
|
/**
|
|
* Valid pid boolean.
|
|
*
|
|
* @param p the p
|
|
* @return the boolean
|
|
*/
|
|
private static boolean validPid(final StructuredProperty p) {
|
|
return p.getValue()!= null && p.getQualifier()!= null && p.getQualifier().getClassid()!=null;
|
|
}
|
|
|
|
|
|
|
|
/**
|
|
* This utility method finds the list of enrichment instances
|
|
* that match one or more PIDs in the input list
|
|
*
|
|
* @param pids the list of PIDs
|
|
* @param enrichments the List of enrichment instances having the same pid
|
|
* @return the list
|
|
*/
|
|
private static List<Instance> findEnrichmentsByPID(final List<StructuredProperty> pids, final Map<String,Instance> enrichments) {
|
|
if (pids == null || enrichments == null)
|
|
return null;
|
|
return pids
|
|
.stream()
|
|
.map(OafUtils::extractKeyFromPid)
|
|
.map(enrichments::get)
|
|
.filter(Objects::nonNull)
|
|
.collect(Collectors.toList());
|
|
}
|
|
|
|
/**
|
|
* Is an enrichment boolean.
|
|
*
|
|
* @param e the e
|
|
* @return the boolean
|
|
*/
|
|
public static boolean isAnEnrichment(OafEntity e) {
|
|
return e.getDataInfo()!= null &&
|
|
e.getDataInfo().getProvenanceaction()!= null
|
|
&& ModelConstants.PROVENANCE_ENRICH.equalsIgnoreCase(e.getDataInfo().getProvenanceaction().getClassid());
|
|
}
|
|
|
|
|
|
/**
|
|
* This method apply enrichment on a single instance
|
|
* The enrichment consists of replacing values on
|
|
* single attribute only if in the current instance is missing
|
|
* The only repeatable field enriched is measures
|
|
*
|
|
* @param currentInstance the current instance
|
|
* @param enrichment the enrichment instance
|
|
*/
|
|
private static void applyEnrichment(final Instance currentInstance, final Instance enrichment) {
|
|
if (currentInstance == null || enrichment == null)
|
|
return;
|
|
|
|
//ENRICH accessright
|
|
if (enrichment.getAccessright()!=null && currentInstance.getAccessright() == null)
|
|
currentInstance.setAccessright(enrichment.getAccessright());
|
|
|
|
//ENRICH license
|
|
if (enrichment.getLicense()!=null && currentInstance.getLicense() == null)
|
|
currentInstance.setLicense(enrichment.getLicense());
|
|
|
|
//ENRICH instanceType
|
|
if (enrichment.getInstancetype()!=null && currentInstance.getInstancetype() == null)
|
|
currentInstance.setInstancetype(enrichment.getInstancetype());
|
|
|
|
//ENRICH hostedby
|
|
if (enrichment.getHostedby()!=null && currentInstance.getHostedby() == null)
|
|
currentInstance.setHostedby(enrichment.getHostedby());
|
|
|
|
//ENRICH distributionlocation
|
|
if (enrichment.getDistributionlocation()!=null && currentInstance.getDistributionlocation() == null)
|
|
currentInstance.setDistributionlocation(enrichment.getDistributionlocation());
|
|
|
|
//ENRICH collectedfrom
|
|
if (enrichment.getCollectedfrom()!=null && currentInstance.getCollectedfrom() == null)
|
|
currentInstance.setCollectedfrom(enrichment.getCollectedfrom());
|
|
|
|
//ENRICH dateofacceptance
|
|
if (enrichment.getDateofacceptance()!=null && currentInstance.getDateofacceptance() == null)
|
|
currentInstance.setDateofacceptance(enrichment.getDateofacceptance());
|
|
|
|
//ENRICH processingchargeamount
|
|
if (enrichment.getProcessingchargeamount()!=null && currentInstance.getProcessingchargeamount() == null)
|
|
currentInstance.setProcessingchargeamount(enrichment.getProcessingchargeamount());
|
|
|
|
//ENRICH refereed
|
|
if (enrichment.getRefereed()!=null && currentInstance.getRefereed() == null)
|
|
currentInstance.setRefereed(enrichment.getRefereed());
|
|
|
|
//ENRICH measures
|
|
if (enrichment.getMeasures()!=null)
|
|
if (currentInstance.getMeasures() == null)
|
|
currentInstance.setMeasures(enrichment.getMeasures());
|
|
else
|
|
enrichment.getMeasures().forEach(currentInstance.getMeasures()::add);
|
|
|
|
}
|
|
|
|
|
|
/**
|
|
* This main method apply the enrichment of the instances
|
|
*
|
|
* @param toEnrichInstances the instances that could be enriched
|
|
* @param enrichmentInstances the enrichment instances
|
|
* @return list of instances possibly enriched
|
|
*/
|
|
private static List<Instance> enrichInstances(final List<Instance> toEnrichInstances,final List<Instance> enrichmentInstances) {
|
|
final List<Instance> enrichmentResult = new ArrayList<>();
|
|
|
|
if (toEnrichInstances == null) {
|
|
return enrichmentResult;
|
|
}
|
|
if (enrichmentInstances == null) {
|
|
return enrichmentResult;
|
|
}
|
|
Map<String, Instance> ri = toInstanceMap(enrichmentInstances);
|
|
|
|
toEnrichInstances.forEach(i -> {
|
|
final List<Instance> e = findEnrichmentsByPID(i.getPid(), ri);
|
|
if (e!= null && e.size()> 0) {
|
|
e.forEach(enr -> applyEnrichment(i, enr));
|
|
} else {
|
|
final List<Instance> a = findEnrichmentsByPID(i.getAlternateIdentifier(), ri);
|
|
if (a!= null && a.size()> 0) {
|
|
a.forEach(enr -> applyEnrichment(i, enr));
|
|
}
|
|
}
|
|
enrichmentResult.add(i);
|
|
});
|
|
return enrichmentResult;
|
|
}
|
|
|
|
/**
|
|
* Longest lists list.
|
|
*
|
|
* @param a the a
|
|
* @param b the b
|
|
* @return the list
|
|
*/
|
|
public static List<Field<String>> longestLists(List<Field<String>> a, List<Field<String>> b) {
|
|
if (a == null || b == null)
|
|
return a == null ? b : a;
|
|
if (a.size() == b.size()) {
|
|
int msa = a
|
|
.stream()
|
|
.filter(i -> i != null && i.getValue() != null)
|
|
.map(i -> i.getValue().length())
|
|
.max(Comparator.naturalOrder())
|
|
.orElse(0);
|
|
int msb = b
|
|
.stream()
|
|
.filter(i -> i != null && i.getValue() != null)
|
|
.map(i -> i.getValue().length())
|
|
.max(Comparator.naturalOrder())
|
|
.orElse(0);
|
|
return msa > msb ? a : b;
|
|
}
|
|
return a.size() > b.size() ? a : b;
|
|
}
|
|
|
|
|
|
/**
|
|
* This method merge two oaf object of the same type
|
|
* It should replace the mergeFrom utility inside the oaf
|
|
* class.
|
|
*
|
|
* @param original First object
|
|
* @param enrich second object
|
|
* @return the merged object
|
|
*/
|
|
public static <T extends Oaf> T mergeOAF(T original, T enrich) {
|
|
if (original == null)
|
|
return enrich;
|
|
if (enrich == null)
|
|
return original;
|
|
|
|
if (original.getClass() != enrich.getClass())
|
|
throw new RuntimeException(String.format("Trying to merge different types of object %s, and %s",
|
|
original.getClass().getCanonicalName(),
|
|
enrich.getClass().getCanonicalName()));
|
|
|
|
Oaf result ;
|
|
|
|
switch (original.getClass().getSimpleName().toLowerCase()) {
|
|
case "relation":
|
|
result = mergeOAFRelation((Relation) original, (Relation) enrich);
|
|
break;
|
|
case "publication":
|
|
result = mergeOAFPublication((Publication) original, (Publication) enrich);
|
|
break;
|
|
case "dataset":
|
|
result = mergeOAFDataset((Dataset) original, (Dataset) enrich);
|
|
break;
|
|
case "software":
|
|
result = mergeOAFSoftware((Software) original, (Software) enrich);
|
|
break;
|
|
case "otherresearchproduct":
|
|
result = mergeOAFOtherResearchProduct((OtherResearchProduct) original, (OtherResearchProduct) enrich);
|
|
break;
|
|
case "project":
|
|
result = mergeOAFProject((Project) original, (Project)enrich);
|
|
break;
|
|
case "organization":
|
|
result = mergeOAFOrganization((Organization) original, (Organization)enrich);
|
|
break;
|
|
default:
|
|
throw new RuntimeException("Trying to merge an unsupported class");
|
|
|
|
|
|
}
|
|
result.setCollectedfrom(
|
|
Stream
|
|
.concat(
|
|
Optional
|
|
.ofNullable(original.getCollectedfrom())
|
|
.map(Collection::stream)
|
|
.orElse(Stream.empty()),
|
|
Optional
|
|
.ofNullable(enrich.getCollectedfrom())
|
|
.map(Collection::stream)
|
|
.orElse(Stream.empty()))
|
|
.distinct() // relies on KeyValue.equals
|
|
.collect(Collectors.toList()));
|
|
|
|
result.setLastupdatetimestamp(
|
|
Math
|
|
.max(
|
|
Optional.ofNullable(original.getLastupdatetimestamp()).orElse(0L),
|
|
Optional.ofNullable(enrich.getLastupdatetimestamp()).orElse(0L)));
|
|
|
|
return (T) result;
|
|
|
|
}
|
|
|
|
|
|
@SafeVarargs
|
|
public static <T> List<T> mergeLists(final List<T>... lists) {
|
|
|
|
return Arrays
|
|
.stream(lists)
|
|
.filter(Objects::nonNull)
|
|
.flatMap(List::stream)
|
|
.filter(Objects::nonNull)
|
|
.distinct()
|
|
.collect(Collectors.toList());
|
|
}
|
|
|
|
|
|
private static int compareTrust(Oaf a, Oaf b) {
|
|
return extractTrust(a).compareTo(extractTrust(b));
|
|
}
|
|
|
|
private static String extractTrust(Oaf e) {
|
|
if (e == null || e.getDataInfo() == null || e.getDataInfo().getTrust() == null)
|
|
return "0.0";
|
|
return e.getDataInfo().getTrust();
|
|
}
|
|
|
|
|
|
private static void mergeOAFDataInfo(Oaf from, Oaf to) {
|
|
Optional.ofNullable(to)
|
|
.ifPresent(other -> Optional.ofNullable(other.getDataInfo())
|
|
.ifPresent(otherDataInfo -> Optional.ofNullable(from.getDataInfo())
|
|
.ifPresent(thisDataInfo -> {
|
|
if (compareTrust(from, other) < 0 || thisDataInfo.getInvisible()) {
|
|
from.setDataInfo(otherDataInfo);
|
|
}
|
|
})));
|
|
}
|
|
|
|
|
|
/**
|
|
* Gets main title.
|
|
*
|
|
* @param titles the titles
|
|
* @return the main title
|
|
*/
|
|
private static StructuredProperty getMainTitle(final List<StructuredProperty> titles) {
|
|
// need to check if the list of titles contains more than 1 main title? (in that case, we should chose which
|
|
// main title select in the list)
|
|
for (StructuredProperty t : titles) {
|
|
if (t.getQualifier() != null && t.getQualifier().getClassid() != null)
|
|
if (t.getQualifier().getClassid().equals("main title"))
|
|
return t;
|
|
}
|
|
return null;
|
|
}
|
|
|
|
|
|
private static OafEntity mergeEntity(final OafEntity original,final OafEntity enrich) {
|
|
|
|
final OafEntity mergedEntity = original;
|
|
|
|
|
|
mergedEntity.setOriginalId(mergeLists(mergedEntity.getOriginalId(), enrich.getOriginalId()));
|
|
|
|
mergedEntity.setPid(mergeLists(mergedEntity.getPid(), enrich.getPid()));
|
|
|
|
|
|
if (enrich.getDateofcollection() != null && compareTrust(mergedEntity, enrich) < 0)
|
|
mergedEntity.setDateofcollection(enrich.getDateofcollection());
|
|
|
|
if (enrich.getDateoftransformation() != null && compareTrust(mergedEntity, enrich) < 0)
|
|
mergedEntity.setDateoftransformation(enrich.getDateoftransformation());
|
|
|
|
mergedEntity.setExtraInfo(mergeLists(mergedEntity.getExtraInfo(), enrich.getExtraInfo()));
|
|
|
|
if (enrich.getOaiprovenance() != null && compareTrust(mergedEntity, enrich) < 0)
|
|
mergedEntity.setOaiprovenance(enrich.getOaiprovenance());
|
|
|
|
return mergedEntity;
|
|
|
|
|
|
}
|
|
|
|
private static Result mergeOAFResult(final Result original,final Result enrich) {
|
|
|
|
|
|
final Result mergedResult = (Result) mergeEntity(original, enrich);
|
|
|
|
if(mergedResult.getProcessingchargeamount() == null || StringUtils.isBlank(mergedResult.getProcessingchargeamount().getValue() )){
|
|
mergedResult.setProcessingchargeamount(enrich.getProcessingchargeamount());
|
|
mergedResult.setProcessingchargecurrency(enrich.getProcessingchargecurrency());
|
|
}
|
|
|
|
mergedResult.setMeasures(mergeLists(mergedResult.getMeasures(), enrich.getMeasures()));
|
|
|
|
if( !isAnEnrichment(mergedResult) && !isAnEnrichment(enrich))
|
|
mergedResult.setInstance(mergeLists(mergedResult.getInstance(), enrich.getInstance()));
|
|
else {
|
|
final List<Instance> enrichmentInstances = isAnEnrichment(mergedResult) ? mergedResult.getInstance() : enrich.getInstance();
|
|
final List<Instance> enrichedInstances= isAnEnrichment(mergedResult) ? enrich.getInstance(): mergedResult.getInstance();
|
|
if (isAnEnrichment(mergedResult))
|
|
mergedResult.setDataInfo(enrich.getDataInfo());
|
|
mergedResult.setInstance(enrichInstances(enrichedInstances,enrichmentInstances));
|
|
}
|
|
|
|
if (enrich.getBestaccessright() != null
|
|
&& new AccessRightComparator().compare(enrich.getBestaccessright(), mergedResult.getBestaccessright()) < 0)
|
|
mergedResult.setBestaccessright(enrich.getBestaccessright());
|
|
|
|
if (enrich.getResulttype() != null && compareTrust(mergedResult, enrich) < 0)
|
|
mergedResult.setResulttype(enrich.getResulttype());
|
|
|
|
if (enrich.getLanguage() != null && compareTrust(mergedResult, enrich) < 0)
|
|
mergedResult.setLanguage(enrich.getLanguage());
|
|
|
|
if (Objects.nonNull(enrich.getDateofacceptance())) {
|
|
if (Objects.isNull(mergedResult.getDateofacceptance())) {
|
|
mergedResult.setDateofacceptance(enrich.getDateofacceptance());
|
|
} else if (compareTrust(mergedResult, enrich) < 0) {
|
|
mergedResult.setDateofacceptance(enrich.getDateofacceptance());
|
|
}
|
|
}
|
|
|
|
mergedResult.setCountry(mergeLists(mergedResult.getCountry(), enrich.getCountry()));
|
|
|
|
mergedResult.setSubject(mergeLists(mergedResult.getSubject(), enrich.getSubject()));
|
|
|
|
// merge title lists: main title with higher trust and distinct between the others
|
|
StructuredProperty baseMainTitle = null;
|
|
if (mergedResult.getTitle() != null) {
|
|
baseMainTitle = getMainTitle(mergedResult.getTitle());
|
|
if (baseMainTitle != null) {
|
|
final StructuredProperty p = baseMainTitle;
|
|
mergedResult.setTitle(mergedResult.getTitle().stream().filter(t -> t != p).collect(Collectors.toList()));
|
|
}
|
|
}
|
|
|
|
StructuredProperty newMainTitle = null;
|
|
if (enrich.getTitle() != null) {
|
|
newMainTitle = getMainTitle(enrich.getTitle());
|
|
if (newMainTitle != null) {
|
|
final StructuredProperty p = newMainTitle;
|
|
enrich.setTitle(enrich.getTitle().stream().filter(t -> t != p).collect(Collectors.toList()));
|
|
}
|
|
}
|
|
|
|
if (newMainTitle != null && compareTrust(mergedResult, enrich) < 0) {
|
|
baseMainTitle = newMainTitle;
|
|
}
|
|
|
|
mergedResult.setTitle(mergeLists(mergedResult.getTitle(), enrich.getTitle()));
|
|
if (mergedResult.getTitle() != null && baseMainTitle != null) {
|
|
mergedResult.getTitle().add(baseMainTitle);
|
|
}
|
|
|
|
mergedResult.setRelevantdate (mergeLists(mergedResult.getRelevantdate(), enrich.getRelevantdate()));
|
|
|
|
mergedResult.setDescription( longestLists(mergedResult.getDescription(), enrich.getDescription()));
|
|
|
|
if (enrich.getPublisher() != null && compareTrust(mergedResult, enrich) < 0)
|
|
mergedResult.setPublisher(enrich.getPublisher());
|
|
|
|
if (enrich.getEmbargoenddate() != null && compareTrust(mergedResult, enrich) < 0)
|
|
mergedResult.setEmbargoenddate(enrich.getEmbargoenddate());
|
|
|
|
mergedResult.setSource(mergeLists(mergedResult.getSource(), enrich.getSource()));
|
|
|
|
mergedResult.setFulltext(mergeLists(mergedResult.getFulltext(), enrich.getFulltext()));
|
|
|
|
mergedResult.setFormat(mergeLists(mergedResult.getFormat(), enrich.getFormat()));
|
|
|
|
mergedResult.setContributor(mergeLists(mergedResult.getContributor(), enrich.getContributor()));
|
|
|
|
if (enrich.getResourcetype() != null)
|
|
mergedResult.setResourcetype(enrich.getResourcetype());
|
|
|
|
mergedResult.setCoverage(mergeLists(mergedResult.getCoverage(), enrich.getCoverage()));
|
|
|
|
mergedResult.setContext(mergeLists(mergedResult.getContext(), enrich.getContext()));
|
|
|
|
mergedResult.setExternalReference(mergeLists(mergedResult.getExternalReference(), enrich.getExternalReference()));
|
|
|
|
return mergedResult;
|
|
}
|
|
|
|
private static OtherResearchProduct mergeOAFOtherResearchProduct(final OtherResearchProduct original,final OtherResearchProduct enrich) {
|
|
final OtherResearchProduct mergedORP = (OtherResearchProduct) mergeOAFResult(original, enrich);
|
|
|
|
|
|
mergedORP.setContactperson(mergeLists(mergedORP.getContactperson(), enrich.getContactperson()));
|
|
mergedORP.setContactgroup(mergeLists(mergedORP.getContactgroup(), enrich.getContactgroup()));
|
|
mergedORP.setTool(mergeLists(mergedORP.getTool(), enrich.getTool()));
|
|
mergeOAFDataInfo(mergedORP, enrich);
|
|
|
|
return mergedORP;
|
|
}
|
|
|
|
private static Software mergeOAFSoftware(final Software original, final Software enrich) {
|
|
final Software mergedSoftware = (Software) mergeOAFResult(original, enrich);
|
|
|
|
mergedSoftware.setDocumentationUrl(mergeLists(mergedSoftware.getDocumentationUrl(), enrich.getDocumentationUrl()));
|
|
|
|
mergedSoftware.setLicense(mergeLists(mergedSoftware.getLicense(), enrich.getLicense()));
|
|
|
|
mergedSoftware.setCodeRepositoryUrl(enrich.getCodeRepositoryUrl() != null && compareTrust(mergedSoftware,enrich) < 0
|
|
? enrich.getCodeRepositoryUrl()
|
|
: mergedSoftware.getCodeRepositoryUrl());
|
|
|
|
mergedSoftware.setProgrammingLanguage(enrich.getProgrammingLanguage() != null && compareTrust(mergedSoftware, enrich) < 0
|
|
? enrich.getProgrammingLanguage()
|
|
: mergedSoftware.getProgrammingLanguage());
|
|
|
|
mergeOAFDataInfo(mergedSoftware, enrich);
|
|
return mergedSoftware;
|
|
}
|
|
|
|
private static Dataset mergeOAFDataset(Dataset original, Dataset enrich) {
|
|
|
|
final Dataset mergedDataset = (Dataset) mergeOAFResult(original, enrich);
|
|
|
|
mergedDataset.setStoragedate(enrich.getStoragedate() != null && compareTrust(mergedDataset, enrich) < 0 ? enrich.getStoragedate() : mergedDataset.getStoragedate());
|
|
|
|
mergedDataset.setDevice(enrich.getDevice() != null && compareTrust(mergedDataset, enrich) < 0 ? enrich.getDevice() : mergedDataset.getDevice());
|
|
|
|
mergedDataset.setSize(enrich.getSize() != null && compareTrust(mergedDataset, enrich) < 0 ? enrich.getSize() : mergedDataset.getSize());
|
|
|
|
mergedDataset.setVersion(enrich.getVersion() != null && compareTrust(mergedDataset, enrich) < 0 ? enrich.getVersion() : mergedDataset.getVersion());
|
|
|
|
mergedDataset.setLastmetadataupdate(
|
|
enrich.getLastmetadataupdate() != null && compareTrust(mergedDataset,enrich) < 0
|
|
? enrich.getLastmetadataupdate()
|
|
: mergedDataset.getLastmetadataupdate());
|
|
|
|
mergedDataset.setMetadataversionnumber(
|
|
enrich.getMetadataversionnumber() != null && compareTrust(mergedDataset, enrich) < 0
|
|
? enrich.getMetadataversionnumber()
|
|
: mergedDataset.getMetadataversionnumber());
|
|
|
|
mergedDataset.setGeolocation(mergeLists(mergedDataset.getGeolocation(), enrich.getGeolocation()));
|
|
|
|
mergeOAFDataInfo(mergedDataset, enrich);
|
|
|
|
return mergedDataset;
|
|
}
|
|
|
|
private static Publication mergeOAFPublication(Publication original, Publication enrich) {
|
|
|
|
final Publication mergedPublication = (Publication) mergeOAFResult(original, enrich);
|
|
|
|
if (enrich.getJournal() != null && compareTrust(mergedPublication, enrich) < 0)
|
|
mergedPublication.setJournal(enrich.getJournal());
|
|
mergeOAFDataInfo(mergedPublication, enrich);
|
|
return mergedPublication;
|
|
}
|
|
|
|
|
|
private static Relation mergeOAFRelation(Relation from, Relation to) {
|
|
|
|
checkArgument(Objects.equals(from.getSource(), to.getSource()), "source ids must be equal");
|
|
checkArgument(Objects.equals(from.getTarget(), to.getTarget()), "target ids must be equal");
|
|
checkArgument(Objects.equals(from.getRelType(), to.getRelType()), "relType(s) must be equal");
|
|
checkArgument(
|
|
Objects.equals(from.getSubRelType(), to.getSubRelType()), "subRelType(s) must be equal");
|
|
checkArgument(Objects.equals(from.getRelClass(), to.getRelClass()), "relClass(es) must be equal");
|
|
|
|
from.setValidated(from.getValidated() || to.getValidated());
|
|
try {
|
|
from.setValidationDate(ModelSupport.oldest(from.getValidationDate(), to.getValidationDate()));
|
|
} catch (ParseException e) {
|
|
throw new IllegalArgumentException(String
|
|
.format(
|
|
"invalid validation date format in relation [s:%s, t:%s]: %s", from.getSource(), from.getTarget(),
|
|
from.getValidationDate()));
|
|
}
|
|
|
|
return from;
|
|
}
|
|
|
|
|
|
private static Oaf mergeOAFOrganization(Organization original, Organization enrich) {
|
|
|
|
final Organization mergedOrganization = (Organization) mergeEntity(original, enrich);
|
|
|
|
int ct = compareTrust(mergedOrganization, enrich);
|
|
mergedOrganization.setLegalshortname(enrich.getLegalshortname() != null && ct < 0
|
|
? enrich.getLegalshortname()
|
|
: mergedOrganization.getLegalname());
|
|
|
|
|
|
mergedOrganization.setLegalname(enrich.getLegalname() != null && ct < 0 ?
|
|
enrich.getLegalname()
|
|
: mergedOrganization.getLegalname());
|
|
|
|
mergedOrganization.setAlternativeNames(mergeLists(enrich.getAlternativeNames(), mergedOrganization.getAlternativeNames()));
|
|
|
|
|
|
mergedOrganization.setWebsiteurl(enrich.getWebsiteurl() != null && ct < 0
|
|
? enrich.getWebsiteurl()
|
|
: mergedOrganization.getWebsiteurl());
|
|
|
|
mergedOrganization.setLogourl(enrich.getLogourl() != null && ct < 0
|
|
? enrich.getLogourl()
|
|
: mergedOrganization.getLogourl());
|
|
|
|
mergedOrganization.setEclegalbody(enrich.getEclegalbody() != null && ct < 0
|
|
? enrich.getEclegalbody()
|
|
: mergedOrganization.getEclegalbody());
|
|
|
|
mergedOrganization.setEclegalperson(enrich.getEclegalperson() != null && ct < 0
|
|
? enrich.getEclegalperson()
|
|
: mergedOrganization.getEclegalperson());
|
|
|
|
mergedOrganization.setEcnonprofit (enrich.getEcnonprofit() != null && ct< 0
|
|
? enrich.getEcnonprofit()
|
|
: mergedOrganization.getEcnonprofit());
|
|
|
|
mergedOrganization.setEcresearchorganization (enrich.getEcresearchorganization() != null && ct < 0
|
|
? enrich.getEcresearchorganization()
|
|
: mergedOrganization.getEcresearchorganization());
|
|
|
|
mergedOrganization.setEchighereducation (enrich.getEchighereducation() != null && ct < 0
|
|
? enrich.getEchighereducation()
|
|
: mergedOrganization.getEchighereducation());
|
|
|
|
mergedOrganization.setEcinternationalorganizationeurinterests (enrich.getEcinternationalorganizationeurinterests() != null && ct< 0
|
|
? enrich.getEcinternationalorganizationeurinterests()
|
|
: mergedOrganization.getEcinternationalorganizationeurinterests());
|
|
|
|
mergedOrganization.setEcinternationalorganization (enrich.getEcinternationalorganization() != null && ct < 0
|
|
? enrich.getEcinternationalorganization()
|
|
: mergedOrganization.getEcinternationalorganization());
|
|
|
|
mergedOrganization.setEcenterprise (enrich.getEcenterprise() != null && ct < 0
|
|
? enrich.getEcenterprise()
|
|
: mergedOrganization.getEcenterprise());
|
|
|
|
mergedOrganization.setEcsmevalidated (enrich.getEcsmevalidated() != null && ct < 0
|
|
? enrich.getEcsmevalidated()
|
|
: mergedOrganization.getEcsmevalidated());
|
|
mergedOrganization.setEcnutscode( enrich.getEcnutscode() != null && ct < 0
|
|
? enrich.getEcnutscode()
|
|
: mergedOrganization.getEcnutscode());
|
|
|
|
mergedOrganization.setCountry (enrich.getCountry() != null && ct < 0 ?
|
|
enrich.getCountry()
|
|
:mergedOrganization.getCountry());
|
|
|
|
mergeOAFDataInfo(mergedOrganization, enrich);
|
|
|
|
return mergedOrganization;
|
|
}
|
|
|
|
private static Oaf mergeOAFProject(Project original, Project enrich) {
|
|
|
|
final Project mergedProject = (Project) mergeEntity(original, enrich);
|
|
|
|
int ct = compareTrust(mergedProject, enrich);
|
|
|
|
|
|
mergedProject.setWebsiteurl (enrich.getWebsiteurl() != null && ct < 0
|
|
? enrich.getWebsiteurl()
|
|
: mergedProject.getWebsiteurl());
|
|
|
|
mergedProject.setCode(enrich.getCode() != null && ct < 0 ?
|
|
enrich.getCode() :
|
|
mergedProject.getCode());
|
|
|
|
mergedProject.setAcronym(enrich.getAcronym() != null && ct < 0
|
|
? enrich.getAcronym()
|
|
: mergedProject.getAcronym());
|
|
|
|
mergedProject.setTitle (enrich.getTitle() != null && ct < 0
|
|
? enrich.getTitle()
|
|
: mergedProject.getTitle());
|
|
mergedProject.setStartdate (enrich.getStartdate() != null && ct < 0
|
|
? enrich.getStartdate()
|
|
: mergedProject.getStartdate());
|
|
mergedProject.setEnddate (enrich.getEnddate() != null && ct < 0
|
|
? enrich.getEnddate()
|
|
: mergedProject.getEnddate());
|
|
mergedProject.setCallidentifier ( enrich.getCallidentifier() != null && ct < 0
|
|
? enrich.getCallidentifier()
|
|
: mergedProject.getCallidentifier());
|
|
mergedProject.setKeywords ( enrich.getKeywords() != null && ct < 0
|
|
? enrich.getKeywords()
|
|
: mergedProject.getKeywords());
|
|
|
|
mergedProject.setDuration ( enrich.getDuration() != null && ct < 0
|
|
? enrich.getDuration()
|
|
: mergedProject.getDuration());
|
|
mergedProject.setEcsc39 ( enrich.getEcsc39() != null && ct < 0
|
|
? enrich.getEcsc39() :
|
|
mergedProject.getEcsc39());
|
|
mergedProject.setOamandatepublications ( enrich.getOamandatepublications() != null && ct < 0
|
|
? enrich.getOamandatepublications()
|
|
: mergedProject.getOamandatepublications());
|
|
mergedProject.setEcarticle29_3 (enrich.getEcarticle29_3() != null && ct < 0
|
|
? enrich.getEcarticle29_3()
|
|
: mergedProject.getEcarticle29_3());
|
|
|
|
mergedProject.setSubjects (mergeLists(mergedProject.getSubjects(), enrich.getSubjects()));
|
|
mergedProject.setFundingtree (mergeLists(mergedProject.getFundingtree(), enrich.getFundingtree()));
|
|
mergedProject.setContracttype (enrich.getContracttype() != null && ct < 0
|
|
? enrich.getContracttype()
|
|
: mergedProject.getContracttype());
|
|
mergedProject.setOptional1 ( enrich.getOptional1() != null && ct < 0
|
|
? enrich.getOptional1()
|
|
: mergedProject.getOptional1());
|
|
mergedProject.setOptional2 (enrich.getOptional2() != null && ct < 0
|
|
? enrich.getOptional2()
|
|
: mergedProject.getOptional2());
|
|
|
|
mergedProject.setJsonextrainfo ( enrich.getJsonextrainfo() != null && ct < 0
|
|
? enrich.getJsonextrainfo()
|
|
: mergedProject.getJsonextrainfo());
|
|
|
|
mergedProject.setContactfullname ( enrich.getContactfullname() != null && ct < 0
|
|
? enrich.getContactfullname()
|
|
: mergedProject.getContactfullname());
|
|
|
|
mergedProject.setContactfax ( enrich.getContactfax() != null && ct < 0
|
|
? enrich.getContactfax()
|
|
: mergedProject.getContactfax());
|
|
|
|
mergedProject.setContactphone (enrich.getContactphone() != null && ct < 0
|
|
? enrich.getContactphone()
|
|
: mergedProject.getContactphone());
|
|
|
|
mergedProject.setContactemail ( enrich.getContactemail() != null && ct < 0
|
|
? enrich.getContactemail()
|
|
: mergedProject.getContactemail());
|
|
|
|
mergedProject.setSummary ( enrich.getSummary() != null && ct < 0
|
|
? enrich.getSummary()
|
|
: mergedProject.getSummary());
|
|
|
|
mergedProject.setCurrency( enrich.getCurrency() != null && ct < 0
|
|
? enrich.getCurrency()
|
|
: mergedProject.getCurrency());
|
|
|
|
if (enrich.getH2020topiccode() != null && StringUtils.isEmpty(mergedProject.getH2020topiccode())){
|
|
mergedProject.setH2020topiccode(enrich.getH2020topiccode());
|
|
mergedProject.setH2020topicdescription(enrich.getH2020topicdescription());
|
|
}
|
|
|
|
mergedProject.setH2020classification (mergeLists(mergedProject.getH2020classification(), enrich.getH2020classification()));
|
|
|
|
mergeOAFDataInfo(mergedProject, enrich);
|
|
|
|
return mergedProject;
|
|
|
|
|
|
|
|
}
|
|
|
|
|
|
}
|