Merge branch 'master' of https://code-repo.d4science.org/D-Net/dnet-hadoop into islookup_timeout
This commit is contained in:
commit
74da8a08cf
|
@ -2,7 +2,6 @@
|
||||||
package eu.dnetlib.dhp.broker.model;
|
package eu.dnetlib.dhp.broker.model;
|
||||||
|
|
||||||
import java.io.Serializable;
|
import java.io.Serializable;
|
||||||
import java.util.Map;
|
|
||||||
|
|
||||||
public class Event implements Serializable {
|
public class Event implements Serializable {
|
||||||
|
|
||||||
|
@ -25,7 +24,7 @@ public class Event implements Serializable {
|
||||||
|
|
||||||
private boolean instantMessage;
|
private boolean instantMessage;
|
||||||
|
|
||||||
private Map<String, Object> map;
|
private MappedFields map;
|
||||||
|
|
||||||
public Event() {
|
public Event() {
|
||||||
}
|
}
|
||||||
|
@ -33,7 +32,7 @@ public class Event implements Serializable {
|
||||||
public Event(final String producerId, final String eventId, final String topic, final String payload,
|
public Event(final String producerId, final String eventId, final String topic, final String payload,
|
||||||
final Long creationDate, final Long expiryDate,
|
final Long creationDate, final Long expiryDate,
|
||||||
final boolean instantMessage,
|
final boolean instantMessage,
|
||||||
final Map<String, Object> map) {
|
final MappedFields map) {
|
||||||
this.producerId = producerId;
|
this.producerId = producerId;
|
||||||
this.eventId = eventId;
|
this.eventId = eventId;
|
||||||
this.topic = topic;
|
this.topic = topic;
|
||||||
|
@ -100,11 +99,11 @@ public class Event implements Serializable {
|
||||||
this.instantMessage = instantMessage;
|
this.instantMessage = instantMessage;
|
||||||
}
|
}
|
||||||
|
|
||||||
public Map<String, Object> getMap() {
|
public MappedFields getMap() {
|
||||||
return this.map;
|
return this.map;
|
||||||
}
|
}
|
||||||
|
|
||||||
public void setMap(final Map<String, Object> map) {
|
public void setMap(final MappedFields map) {
|
||||||
this.map = map;
|
this.map = map;
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
|
@ -3,9 +3,8 @@ package eu.dnetlib.dhp.broker.model;
|
||||||
|
|
||||||
import java.text.ParseException;
|
import java.text.ParseException;
|
||||||
import java.util.Date;
|
import java.util.Date;
|
||||||
import java.util.HashMap;
|
|
||||||
import java.util.List;
|
import java.util.List;
|
||||||
import java.util.Map;
|
import java.util.stream.Collectors;
|
||||||
|
|
||||||
import org.apache.commons.codec.digest.DigestUtils;
|
import org.apache.commons.codec.digest.DigestUtils;
|
||||||
import org.apache.commons.lang3.StringUtils;
|
import org.apache.commons.lang3.StringUtils;
|
||||||
|
@ -30,7 +29,7 @@ public class EventFactory {
|
||||||
|
|
||||||
final Event res = new Event();
|
final Event res = new Event();
|
||||||
|
|
||||||
final Map<String, Object> map = createMapFromResult(updateInfo);
|
final MappedFields map = createMapFromResult(updateInfo);
|
||||||
|
|
||||||
final String eventId = calculateEventId(
|
final String eventId = calculateEventId(
|
||||||
updateInfo.getTopicPath(), updateInfo.getTarget().getOpenaireId(), updateInfo.getHighlightValueAsString());
|
updateInfo.getTopicPath(), updateInfo.getTarget().getOpenaireId(), updateInfo.getHighlightValueAsString());
|
||||||
|
@ -46,35 +45,35 @@ public class EventFactory {
|
||||||
return res;
|
return res;
|
||||||
}
|
}
|
||||||
|
|
||||||
private static Map<String, Object> createMapFromResult(final UpdateInfo<?> updateInfo) {
|
private static MappedFields createMapFromResult(final UpdateInfo<?> updateInfo) {
|
||||||
final Map<String, Object> map = new HashMap<>();
|
final MappedFields map = new MappedFields();
|
||||||
|
|
||||||
final OaBrokerMainEntity source = updateInfo.getSource();
|
final OaBrokerMainEntity source = updateInfo.getSource();
|
||||||
final OaBrokerMainEntity target = updateInfo.getTarget();
|
final OaBrokerMainEntity target = updateInfo.getTarget();
|
||||||
|
|
||||||
map.put("target_datasource_id", target.getCollectedFromId());
|
map.setTargetDatasourceId(target.getCollectedFromId());
|
||||||
map.put("target_datasource_name", target.getCollectedFromName());
|
map.setTargetDatasourceName(target.getCollectedFromName());
|
||||||
|
|
||||||
map.put("target_publication_id", target.getOpenaireId());
|
map.setTargetResultId(target.getOpenaireId());
|
||||||
|
|
||||||
final List<String> titles = target.getTitles();
|
final List<String> titles = target.getTitles();
|
||||||
if (titles.size() > 0) {
|
if (titles.size() > 0) {
|
||||||
map.put("target_publication_title", titles.get(0));
|
map.setTargetResultTitle(titles.get(0));
|
||||||
}
|
}
|
||||||
|
|
||||||
final long date = parseDateTolong(target.getPublicationdate());
|
final long date = parseDateTolong(target.getPublicationdate());
|
||||||
if (date > 0) {
|
if (date > 0) {
|
||||||
map.put("target_dateofacceptance", date);
|
map.setTargetDateofacceptance(date);
|
||||||
}
|
}
|
||||||
|
|
||||||
map.put("target_publication_subject_list", target.getSubjects());
|
map.setTargetSubjects(target.getSubjects().stream().map(s -> s.getValue()).collect(Collectors.toList()));
|
||||||
map.put("target_publication_author_list", target.getCreators());
|
map.setTargetAuthors(target.getCreators().stream().map(a -> a.getFullname()).collect(Collectors.toList()));
|
||||||
|
|
||||||
// PROVENANCE INFO
|
// PROVENANCE INFO
|
||||||
map.put("trust", updateInfo.getTrust());
|
map.setTrust(updateInfo.getTrust());
|
||||||
map.put("provenance_datasource_id", source.getCollectedFromId());
|
map.setProvenanceDatasourceId(source.getCollectedFromId());
|
||||||
map.put("provenance_datasource_name", source.getCollectedFromName());
|
map.setProvenanceDatasourceName(source.getCollectedFromName());
|
||||||
map.put("provenance_publication_id_list", source.getOpenaireId());
|
map.setProvenanceResultId(source.getOpenaireId());
|
||||||
|
|
||||||
return map;
|
return map;
|
||||||
}
|
}
|
||||||
|
|
|
@ -0,0 +1,114 @@
|
||||||
|
|
||||||
|
package eu.dnetlib.dhp.broker.model;
|
||||||
|
|
||||||
|
import java.io.Serializable;
|
||||||
|
import java.util.List;
|
||||||
|
|
||||||
|
public class MappedFields implements Serializable {
|
||||||
|
|
||||||
|
/**
|
||||||
|
*
|
||||||
|
*/
|
||||||
|
private static final long serialVersionUID = -7999704113195802008L;
|
||||||
|
|
||||||
|
private String targetDatasourceId;
|
||||||
|
private String targetDatasourceName;
|
||||||
|
private String targetResultId;
|
||||||
|
private String targetResultTitle;
|
||||||
|
private long targetDateofacceptance;
|
||||||
|
private List<String> targetSubjects;
|
||||||
|
private List<String> targetAuthors;
|
||||||
|
private float trust;
|
||||||
|
private String provenanceDatasourceId;
|
||||||
|
private String provenanceDatasourceName;
|
||||||
|
private String provenanceResultId;
|
||||||
|
|
||||||
|
public String getTargetDatasourceId() {
|
||||||
|
return targetDatasourceId;
|
||||||
|
}
|
||||||
|
|
||||||
|
public void setTargetDatasourceId(final String targetDatasourceId) {
|
||||||
|
this.targetDatasourceId = targetDatasourceId;
|
||||||
|
}
|
||||||
|
|
||||||
|
public String getTargetDatasourceName() {
|
||||||
|
return targetDatasourceName;
|
||||||
|
}
|
||||||
|
|
||||||
|
public void setTargetDatasourceName(final String targetDatasourceName) {
|
||||||
|
this.targetDatasourceName = targetDatasourceName;
|
||||||
|
}
|
||||||
|
|
||||||
|
public String getTargetResultId() {
|
||||||
|
return targetResultId;
|
||||||
|
}
|
||||||
|
|
||||||
|
public void setTargetResultId(final String targetResultId) {
|
||||||
|
this.targetResultId = targetResultId;
|
||||||
|
}
|
||||||
|
|
||||||
|
public String getTargetResultTitle() {
|
||||||
|
return targetResultTitle;
|
||||||
|
}
|
||||||
|
|
||||||
|
public void setTargetResultTitle(final String targetResultTitle) {
|
||||||
|
this.targetResultTitle = targetResultTitle;
|
||||||
|
}
|
||||||
|
|
||||||
|
public long getTargetDateofacceptance() {
|
||||||
|
return targetDateofacceptance;
|
||||||
|
}
|
||||||
|
|
||||||
|
public void setTargetDateofacceptance(final long targetDateofacceptance) {
|
||||||
|
this.targetDateofacceptance = targetDateofacceptance;
|
||||||
|
}
|
||||||
|
|
||||||
|
public List<String> getTargetSubjects() {
|
||||||
|
return targetSubjects;
|
||||||
|
}
|
||||||
|
|
||||||
|
public void setTargetSubjects(final List<String> targetSubjects) {
|
||||||
|
this.targetSubjects = targetSubjects;
|
||||||
|
}
|
||||||
|
|
||||||
|
public List<String> getTargetAuthors() {
|
||||||
|
return targetAuthors;
|
||||||
|
}
|
||||||
|
|
||||||
|
public void setTargetAuthors(final List<String> targetAuthors) {
|
||||||
|
this.targetAuthors = targetAuthors;
|
||||||
|
}
|
||||||
|
|
||||||
|
public float getTrust() {
|
||||||
|
return trust;
|
||||||
|
}
|
||||||
|
|
||||||
|
public void setTrust(final float trust) {
|
||||||
|
this.trust = trust;
|
||||||
|
}
|
||||||
|
|
||||||
|
public String getProvenanceDatasourceId() {
|
||||||
|
return provenanceDatasourceId;
|
||||||
|
}
|
||||||
|
|
||||||
|
public void setProvenanceDatasourceId(final String provenanceDatasourceId) {
|
||||||
|
this.provenanceDatasourceId = provenanceDatasourceId;
|
||||||
|
}
|
||||||
|
|
||||||
|
public String getProvenanceDatasourceName() {
|
||||||
|
return provenanceDatasourceName;
|
||||||
|
}
|
||||||
|
|
||||||
|
public void setProvenanceDatasourceName(final String provenanceDatasourceName) {
|
||||||
|
this.provenanceDatasourceName = provenanceDatasourceName;
|
||||||
|
}
|
||||||
|
|
||||||
|
public String getProvenanceResultId() {
|
||||||
|
return provenanceResultId;
|
||||||
|
}
|
||||||
|
|
||||||
|
public void setProvenanceResultId(final String provenanceResultId) {
|
||||||
|
this.provenanceResultId = provenanceResultId;
|
||||||
|
}
|
||||||
|
|
||||||
|
}
|
|
@ -1,13 +1,14 @@
|
||||||
|
|
||||||
package eu.dnetlib.dhp.broker.oa.matchers;
|
package eu.dnetlib.dhp.broker.oa.matchers;
|
||||||
|
|
||||||
import java.util.Arrays;
|
import java.util.ArrayList;
|
||||||
import java.util.Collection;
|
import java.util.Collection;
|
||||||
import java.util.HashMap;
|
import java.util.HashMap;
|
||||||
import java.util.List;
|
import java.util.List;
|
||||||
import java.util.Map;
|
import java.util.Map;
|
||||||
import java.util.function.BiConsumer;
|
import java.util.function.BiConsumer;
|
||||||
import java.util.function.Function;
|
import java.util.function.Function;
|
||||||
|
import java.util.stream.Collectors;
|
||||||
|
|
||||||
import org.apache.commons.codec.digest.DigestUtils;
|
import org.apache.commons.codec.digest.DigestUtils;
|
||||||
import org.apache.commons.lang3.StringUtils;
|
import org.apache.commons.lang3.StringUtils;
|
||||||
|
@ -19,15 +20,15 @@ import eu.dnetlib.pace.config.DedupConfig;
|
||||||
|
|
||||||
public abstract class UpdateMatcher<T> {
|
public abstract class UpdateMatcher<T> {
|
||||||
|
|
||||||
private final boolean multipleUpdate;
|
private final int maxNumber;
|
||||||
private final Function<T, Topic> topicFunction;
|
private final Function<T, Topic> topicFunction;
|
||||||
private final BiConsumer<OaBrokerMainEntity, T> compileHighlightFunction;
|
private final BiConsumer<OaBrokerMainEntity, T> compileHighlightFunction;
|
||||||
private final Function<T, String> highlightToStringFunction;
|
private final Function<T, String> highlightToStringFunction;
|
||||||
|
|
||||||
public UpdateMatcher(final boolean multipleUpdate, final Function<T, Topic> topicFunction,
|
public UpdateMatcher(final int maxNumber, final Function<T, Topic> topicFunction,
|
||||||
final BiConsumer<OaBrokerMainEntity, T> compileHighlightFunction,
|
final BiConsumer<OaBrokerMainEntity, T> compileHighlightFunction,
|
||||||
final Function<T, String> highlightToStringFunction) {
|
final Function<T, String> highlightToStringFunction) {
|
||||||
this.multipleUpdate = multipleUpdate;
|
this.maxNumber = maxNumber;
|
||||||
this.topicFunction = topicFunction;
|
this.topicFunction = topicFunction;
|
||||||
this.compileHighlightFunction = compileHighlightFunction;
|
this.compileHighlightFunction = compileHighlightFunction;
|
||||||
this.highlightToStringFunction = highlightToStringFunction;
|
this.highlightToStringFunction = highlightToStringFunction;
|
||||||
|
@ -57,17 +58,19 @@ public abstract class UpdateMatcher<T> {
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
final Collection<UpdateInfo<T>> values = infoMap.values();
|
final List<UpdateInfo<T>> values = infoMap
|
||||||
|
.values()
|
||||||
|
.stream()
|
||||||
|
.sorted((o1, o2) -> Float.compare(o2.getTrust(), o1.getTrust())) // DESCENDING
|
||||||
|
.collect(Collectors.toList());
|
||||||
|
|
||||||
if (values.isEmpty() || multipleUpdate) {
|
if (values.isEmpty()) {
|
||||||
return values;
|
return new ArrayList<>();
|
||||||
|
} else if (values.size() > maxNumber) {
|
||||||
|
System.err.println("Too many events (" + values.size() + ") matched by " + getClass().getSimpleName());
|
||||||
|
return values.subList(0, maxNumber);
|
||||||
} else {
|
} else {
|
||||||
final UpdateInfo<T> v = values
|
return values;
|
||||||
.stream()
|
|
||||||
.sorted((o1, o2) -> Float.compare(o1.getTrust(), o2.getTrust()))
|
|
||||||
.findFirst()
|
|
||||||
.get();
|
|
||||||
return Arrays.asList(v);
|
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@ -81,8 +84,8 @@ public abstract class UpdateMatcher<T> {
|
||||||
return StringUtils.isBlank(field);
|
return StringUtils.isBlank(field);
|
||||||
}
|
}
|
||||||
|
|
||||||
public boolean isMultipleUpdate() {
|
public int getMaxNumber() {
|
||||||
return multipleUpdate;
|
return maxNumber;
|
||||||
}
|
}
|
||||||
|
|
||||||
public Function<T, Topic> getTopicFunction() {
|
public Function<T, Topic> getTopicFunction() {
|
||||||
|
|
|
@ -13,7 +13,7 @@ import eu.dnetlib.dhp.broker.oa.matchers.UpdateMatcher;
|
||||||
public abstract class AbstractEnrichMissingDataset extends UpdateMatcher<OaBrokerRelatedDataset> {
|
public abstract class AbstractEnrichMissingDataset extends UpdateMatcher<OaBrokerRelatedDataset> {
|
||||||
|
|
||||||
public AbstractEnrichMissingDataset(final Topic topic) {
|
public AbstractEnrichMissingDataset(final Topic topic) {
|
||||||
super(true,
|
super(10,
|
||||||
rel -> topic,
|
rel -> topic,
|
||||||
(p, rel) -> p.getDatasets().add(rel),
|
(p, rel) -> p.getDatasets().add(rel),
|
||||||
rel -> rel.getOpenaireId());
|
rel -> rel.getOpenaireId());
|
||||||
|
|
|
@ -12,7 +12,7 @@ import eu.dnetlib.dhp.broker.oa.matchers.UpdateMatcher;
|
||||||
public class EnrichMissingProject extends UpdateMatcher<OaBrokerProject> {
|
public class EnrichMissingProject extends UpdateMatcher<OaBrokerProject> {
|
||||||
|
|
||||||
public EnrichMissingProject() {
|
public EnrichMissingProject() {
|
||||||
super(true,
|
super(20,
|
||||||
prj -> Topic.ENRICH_MISSING_PROJECT,
|
prj -> Topic.ENRICH_MISSING_PROJECT,
|
||||||
(p, prj) -> p.getProjects().add(prj),
|
(p, prj) -> p.getProjects().add(prj),
|
||||||
prj -> prj.getFunder() + "::" + prj.getFundingProgram() + prj.getCode());
|
prj -> prj.getFunder() + "::" + prj.getFundingProgram() + prj.getCode());
|
||||||
|
|
|
@ -13,7 +13,7 @@ import eu.dnetlib.dhp.broker.oa.matchers.UpdateMatcher;
|
||||||
public class EnrichMoreProject extends UpdateMatcher<OaBrokerProject> {
|
public class EnrichMoreProject extends UpdateMatcher<OaBrokerProject> {
|
||||||
|
|
||||||
public EnrichMoreProject() {
|
public EnrichMoreProject() {
|
||||||
super(true,
|
super(20,
|
||||||
prj -> Topic.ENRICH_MORE_PROJECT,
|
prj -> Topic.ENRICH_MORE_PROJECT,
|
||||||
(p, prj) -> p.getProjects().add(prj),
|
(p, prj) -> p.getProjects().add(prj),
|
||||||
prj -> projectAsString(prj));
|
prj -> projectAsString(prj));
|
||||||
|
|
|
@ -13,7 +13,7 @@ import eu.dnetlib.dhp.broker.oa.matchers.UpdateMatcher;
|
||||||
public abstract class AbstractEnrichMissingPublication extends UpdateMatcher<OaBrokerRelatedPublication> {
|
public abstract class AbstractEnrichMissingPublication extends UpdateMatcher<OaBrokerRelatedPublication> {
|
||||||
|
|
||||||
public AbstractEnrichMissingPublication(final Topic topic) {
|
public AbstractEnrichMissingPublication(final Topic topic) {
|
||||||
super(true,
|
super(10,
|
||||||
rel -> topic,
|
rel -> topic,
|
||||||
(p, rel) -> p.getPublications().add(rel),
|
(p, rel) -> p.getPublications().add(rel),
|
||||||
rel -> rel.getOpenaireId());
|
rel -> rel.getOpenaireId());
|
||||||
|
|
|
@ -13,7 +13,7 @@ public class EnrichMissingSoftware
|
||||||
extends UpdateMatcher<OaBrokerRelatedSoftware> {
|
extends UpdateMatcher<OaBrokerRelatedSoftware> {
|
||||||
|
|
||||||
public EnrichMissingSoftware() {
|
public EnrichMissingSoftware() {
|
||||||
super(true,
|
super(10,
|
||||||
s -> Topic.ENRICH_MISSING_SOFTWARE,
|
s -> Topic.ENRICH_MISSING_SOFTWARE,
|
||||||
(p, s) -> p.getSoftwares().add(s),
|
(p, s) -> p.getSoftwares().add(s),
|
||||||
s -> s.getOpenaireId());
|
s -> s.getOpenaireId());
|
||||||
|
|
|
@ -13,7 +13,7 @@ import eu.dnetlib.dhp.broker.oa.matchers.UpdateMatcher;
|
||||||
public class EnrichMoreSoftware extends UpdateMatcher<OaBrokerRelatedSoftware> {
|
public class EnrichMoreSoftware extends UpdateMatcher<OaBrokerRelatedSoftware> {
|
||||||
|
|
||||||
public EnrichMoreSoftware() {
|
public EnrichMoreSoftware() {
|
||||||
super(true,
|
super(10,
|
||||||
s -> Topic.ENRICH_MORE_SOFTWARE,
|
s -> Topic.ENRICH_MORE_SOFTWARE,
|
||||||
(p, s) -> p.getSoftwares().add(s),
|
(p, s) -> p.getSoftwares().add(s),
|
||||||
s -> s.getOpenaireId());
|
s -> s.getOpenaireId());
|
||||||
|
|
|
@ -12,7 +12,7 @@ import eu.dnetlib.dhp.broker.oa.matchers.UpdateMatcher;
|
||||||
public class EnrichMissingAbstract extends UpdateMatcher<String> {
|
public class EnrichMissingAbstract extends UpdateMatcher<String> {
|
||||||
|
|
||||||
public EnrichMissingAbstract() {
|
public EnrichMissingAbstract() {
|
||||||
super(false,
|
super(1,
|
||||||
s -> Topic.ENRICH_MISSING_ABSTRACT,
|
s -> Topic.ENRICH_MISSING_ABSTRACT,
|
||||||
(p, s) -> p.getAbstracts().add(s),
|
(p, s) -> p.getAbstracts().add(s),
|
||||||
s -> s);
|
s -> s);
|
||||||
|
|
|
@ -15,7 +15,7 @@ import eu.dnetlib.dhp.broker.oa.matchers.UpdateMatcher;
|
||||||
public class EnrichMissingAuthorOrcid extends UpdateMatcher<OaBrokerAuthor> {
|
public class EnrichMissingAuthorOrcid extends UpdateMatcher<OaBrokerAuthor> {
|
||||||
|
|
||||||
public EnrichMissingAuthorOrcid() {
|
public EnrichMissingAuthorOrcid() {
|
||||||
super(true,
|
super(40,
|
||||||
aut -> Topic.ENRICH_MISSING_AUTHOR_ORCID,
|
aut -> Topic.ENRICH_MISSING_AUTHOR_ORCID,
|
||||||
(p, aut) -> p.getCreators().add(aut),
|
(p, aut) -> p.getCreators().add(aut),
|
||||||
aut -> aut.getOrcid());
|
aut -> aut.getOrcid());
|
||||||
|
|
|
@ -14,7 +14,7 @@ import eu.dnetlib.dhp.broker.oa.util.BrokerConstants;
|
||||||
public class EnrichMissingOpenAccess extends UpdateMatcher<OaBrokerInstance> {
|
public class EnrichMissingOpenAccess extends UpdateMatcher<OaBrokerInstance> {
|
||||||
|
|
||||||
public EnrichMissingOpenAccess() {
|
public EnrichMissingOpenAccess() {
|
||||||
super(true,
|
super(20,
|
||||||
i -> Topic.ENRICH_MISSING_OA_VERSION,
|
i -> Topic.ENRICH_MISSING_OA_VERSION,
|
||||||
(p, i) -> p.getInstances().add(i),
|
(p, i) -> p.getInstances().add(i),
|
||||||
OaBrokerInstance::getUrl);
|
OaBrokerInstance::getUrl);
|
||||||
|
|
|
@ -13,7 +13,7 @@ import eu.dnetlib.dhp.broker.oa.matchers.UpdateMatcher;
|
||||||
public class EnrichMissingPid extends UpdateMatcher<OaBrokerTypedValue> {
|
public class EnrichMissingPid extends UpdateMatcher<OaBrokerTypedValue> {
|
||||||
|
|
||||||
public EnrichMissingPid() {
|
public EnrichMissingPid() {
|
||||||
super(true,
|
super(10,
|
||||||
pid -> Topic.ENRICH_MISSING_PID,
|
pid -> Topic.ENRICH_MISSING_PID,
|
||||||
(p, pid) -> p.getPids().add(pid),
|
(p, pid) -> p.getPids().add(pid),
|
||||||
pid -> pid.getType() + "::" + pid.getValue());
|
pid -> pid.getType() + "::" + pid.getValue());
|
||||||
|
|
|
@ -12,7 +12,7 @@ import eu.dnetlib.dhp.broker.oa.matchers.UpdateMatcher;
|
||||||
public class EnrichMissingPublicationDate extends UpdateMatcher<String> {
|
public class EnrichMissingPublicationDate extends UpdateMatcher<String> {
|
||||||
|
|
||||||
public EnrichMissingPublicationDate() {
|
public EnrichMissingPublicationDate() {
|
||||||
super(false,
|
super(1,
|
||||||
date -> Topic.ENRICH_MISSING_PUBLICATION_DATE,
|
date -> Topic.ENRICH_MISSING_PUBLICATION_DATE,
|
||||||
(p, date) -> p.setPublicationdate(date),
|
(p, date) -> p.setPublicationdate(date),
|
||||||
s -> s);
|
s -> s);
|
||||||
|
|
|
@ -13,7 +13,7 @@ import eu.dnetlib.dhp.broker.oa.matchers.UpdateMatcher;
|
||||||
public class EnrichMissingSubject extends UpdateMatcher<OaBrokerTypedValue> {
|
public class EnrichMissingSubject extends UpdateMatcher<OaBrokerTypedValue> {
|
||||||
|
|
||||||
public EnrichMissingSubject() {
|
public EnrichMissingSubject() {
|
||||||
super(true,
|
super(20,
|
||||||
s -> Topic.fromPath("ENRICH/MISSING/SUBJECT/" + s.getType()),
|
s -> Topic.fromPath("ENRICH/MISSING/SUBJECT/" + s.getType()),
|
||||||
(p, s) -> p.getSubjects().add(s),
|
(p, s) -> p.getSubjects().add(s),
|
||||||
s -> subjectAsString(s));
|
s -> subjectAsString(s));
|
||||||
|
|
|
@ -14,7 +14,7 @@ import eu.dnetlib.dhp.broker.oa.util.BrokerConstants;
|
||||||
public class EnrichMoreOpenAccess extends UpdateMatcher<OaBrokerInstance> {
|
public class EnrichMoreOpenAccess extends UpdateMatcher<OaBrokerInstance> {
|
||||||
|
|
||||||
public EnrichMoreOpenAccess() {
|
public EnrichMoreOpenAccess() {
|
||||||
super(true,
|
super(20,
|
||||||
i -> Topic.ENRICH_MORE_OA_VERSION,
|
i -> Topic.ENRICH_MORE_OA_VERSION,
|
||||||
(p, i) -> p.getInstances().add(i),
|
(p, i) -> p.getInstances().add(i),
|
||||||
OaBrokerInstance::getUrl);
|
OaBrokerInstance::getUrl);
|
||||||
|
|
|
@ -13,7 +13,7 @@ import eu.dnetlib.dhp.broker.oa.matchers.UpdateMatcher;
|
||||||
public class EnrichMorePid extends UpdateMatcher<OaBrokerTypedValue> {
|
public class EnrichMorePid extends UpdateMatcher<OaBrokerTypedValue> {
|
||||||
|
|
||||||
public EnrichMorePid() {
|
public EnrichMorePid() {
|
||||||
super(true,
|
super(20,
|
||||||
pid -> Topic.ENRICH_MORE_PID,
|
pid -> Topic.ENRICH_MORE_PID,
|
||||||
(p, pid) -> p.getPids().add(pid),
|
(p, pid) -> p.getPids().add(pid),
|
||||||
pid -> pidAsString(pid));
|
pid -> pidAsString(pid));
|
||||||
|
|
|
@ -13,7 +13,7 @@ import eu.dnetlib.dhp.broker.oa.matchers.UpdateMatcher;
|
||||||
public class EnrichMoreSubject extends UpdateMatcher<OaBrokerTypedValue> {
|
public class EnrichMoreSubject extends UpdateMatcher<OaBrokerTypedValue> {
|
||||||
|
|
||||||
public EnrichMoreSubject() {
|
public EnrichMoreSubject() {
|
||||||
super(true,
|
super(20,
|
||||||
s -> Topic.fromPath("ENRICH/MORE/SUBJECT/" + s.getType()),
|
s -> Topic.fromPath("ENRICH/MORE/SUBJECT/" + s.getType()),
|
||||||
(p, s) -> p.getSubjects().add(s),
|
(p, s) -> p.getSubjects().add(s),
|
||||||
s -> subjectAsString(s));
|
s -> subjectAsString(s));
|
||||||
|
|
|
@ -7,20 +7,7 @@ import java.util.List;
|
||||||
import eu.dnetlib.broker.objects.OaBrokerMainEntity;
|
import eu.dnetlib.broker.objects.OaBrokerMainEntity;
|
||||||
import eu.dnetlib.dhp.broker.model.EventFactory;
|
import eu.dnetlib.dhp.broker.model.EventFactory;
|
||||||
import eu.dnetlib.dhp.broker.oa.matchers.UpdateMatcher;
|
import eu.dnetlib.dhp.broker.oa.matchers.UpdateMatcher;
|
||||||
import eu.dnetlib.dhp.broker.oa.matchers.relatedDatasets.EnrichMissingDatasetIsReferencedBy;
|
|
||||||
import eu.dnetlib.dhp.broker.oa.matchers.relatedDatasets.EnrichMissingDatasetIsRelatedTo;
|
|
||||||
import eu.dnetlib.dhp.broker.oa.matchers.relatedDatasets.EnrichMissingDatasetIsSupplementedBy;
|
|
||||||
import eu.dnetlib.dhp.broker.oa.matchers.relatedDatasets.EnrichMissingDatasetIsSupplementedTo;
|
|
||||||
import eu.dnetlib.dhp.broker.oa.matchers.relatedDatasets.EnrichMissingDatasetReferences;
|
|
||||||
import eu.dnetlib.dhp.broker.oa.matchers.relatedProjects.EnrichMissingProject;
|
import eu.dnetlib.dhp.broker.oa.matchers.relatedProjects.EnrichMissingProject;
|
||||||
import eu.dnetlib.dhp.broker.oa.matchers.relatedProjects.EnrichMoreProject;
|
|
||||||
import eu.dnetlib.dhp.broker.oa.matchers.relatedPublications.EnrichMissingPublicationIsReferencedBy;
|
|
||||||
import eu.dnetlib.dhp.broker.oa.matchers.relatedPublications.EnrichMissingPublicationIsRelatedTo;
|
|
||||||
import eu.dnetlib.dhp.broker.oa.matchers.relatedPublications.EnrichMissingPublicationIsSupplementedBy;
|
|
||||||
import eu.dnetlib.dhp.broker.oa.matchers.relatedPublications.EnrichMissingPublicationIsSupplementedTo;
|
|
||||||
import eu.dnetlib.dhp.broker.oa.matchers.relatedPublications.EnrichMissingPublicationReferences;
|
|
||||||
import eu.dnetlib.dhp.broker.oa.matchers.relatedSoftware.EnrichMissingSoftware;
|
|
||||||
import eu.dnetlib.dhp.broker.oa.matchers.relatedSoftware.EnrichMoreSoftware;
|
|
||||||
import eu.dnetlib.dhp.broker.oa.matchers.simple.EnrichMissingAbstract;
|
import eu.dnetlib.dhp.broker.oa.matchers.simple.EnrichMissingAbstract;
|
||||||
import eu.dnetlib.dhp.broker.oa.matchers.simple.EnrichMissingAuthorOrcid;
|
import eu.dnetlib.dhp.broker.oa.matchers.simple.EnrichMissingAuthorOrcid;
|
||||||
import eu.dnetlib.dhp.broker.oa.matchers.simple.EnrichMissingOpenAccess;
|
import eu.dnetlib.dhp.broker.oa.matchers.simple.EnrichMissingOpenAccess;
|
||||||
|
@ -47,22 +34,22 @@ public class EventFinder {
|
||||||
matchers.add(new EnrichMorePid());
|
matchers.add(new EnrichMorePid());
|
||||||
matchers.add(new EnrichMoreSubject());
|
matchers.add(new EnrichMoreSubject());
|
||||||
|
|
||||||
// Advanced matchers
|
// // Advanced matchers
|
||||||
matchers.add(new EnrichMissingProject());
|
matchers.add(new EnrichMissingProject());
|
||||||
matchers.add(new EnrichMoreProject());
|
// matchers.add(new EnrichMoreProject());
|
||||||
matchers.add(new EnrichMissingSoftware());
|
// matchers.add(new EnrichMissingSoftware());
|
||||||
matchers.add(new EnrichMoreSoftware());
|
// matchers.add(new EnrichMoreSoftware());
|
||||||
matchers.add(new EnrichMissingPublicationIsRelatedTo());
|
// matchers.add(new EnrichMissingPublicationIsRelatedTo());
|
||||||
matchers.add(new EnrichMissingPublicationIsReferencedBy());
|
// matchers.add(new EnrichMissingPublicationIsReferencedBy());
|
||||||
matchers.add(new EnrichMissingPublicationReferences());
|
// matchers.add(new EnrichMissingPublicationReferences());
|
||||||
matchers.add(new EnrichMissingPublicationIsSupplementedTo());
|
// matchers.add(new EnrichMissingPublicationIsSupplementedTo());
|
||||||
matchers.add(new EnrichMissingPublicationIsSupplementedBy());
|
// matchers.add(new EnrichMissingPublicationIsSupplementedBy());
|
||||||
matchers.add(new EnrichMissingDatasetIsRelatedTo());
|
// matchers.add(new EnrichMissingDatasetIsRelatedTo());
|
||||||
matchers.add(new EnrichMissingDatasetIsReferencedBy());
|
// matchers.add(new EnrichMissingDatasetIsReferencedBy());
|
||||||
matchers.add(new EnrichMissingDatasetReferences());
|
// matchers.add(new EnrichMissingDatasetReferences());
|
||||||
matchers.add(new EnrichMissingDatasetIsSupplementedTo());
|
// matchers.add(new EnrichMissingDatasetIsSupplementedTo());
|
||||||
matchers.add(new EnrichMissingDatasetIsSupplementedBy());
|
// matchers.add(new EnrichMissingDatasetIsSupplementedBy());
|
||||||
matchers.add(new EnrichMissingAbstract());
|
// matchers.add(new EnrichMissingAbstract());
|
||||||
}
|
}
|
||||||
|
|
||||||
public static EventGroup generateEvents(final ResultGroup results, final DedupConfig dedupConfig) {
|
public static EventGroup generateEvents(final ResultGroup results, final DedupConfig dedupConfig) {
|
||||||
|
|
Loading…
Reference in New Issue