dnet-hadoop/dhp-workflows/dhp-broker-events/src/main/java/eu/dnetlib/dhp/broker/oa/matchers/relatedDatasets/AbstractEnrichMissingDatase...

46 lines
1.1 KiB
Java
Raw Normal View History

package eu.dnetlib.dhp.broker.oa.matchers.relatedDatasets;
import java.util.List;
import java.util.Set;
import java.util.stream.Collectors;
2020-06-16 12:34:13 +02:00
import eu.dnetlib.broker.objects.Dataset;
import eu.dnetlib.broker.objects.OpenaireBrokerResult;
import eu.dnetlib.dhp.broker.model.Topic;
import eu.dnetlib.dhp.broker.oa.matchers.UpdateMatcher;
public abstract class AbstractEnrichMissingDataset
2020-06-16 12:34:13 +02:00
extends UpdateMatcher<Dataset> {
public AbstractEnrichMissingDataset(final Topic topic) {
2020-06-12 09:47:55 +02:00
super(true,
rel -> topic,
(p, rel) -> p.getDatasets().add(rel),
2020-06-16 12:34:13 +02:00
rel -> rel.getOriginalId());
}
2020-06-11 11:25:18 +02:00
protected abstract boolean filterByType(String relType);
@Override
2020-06-16 12:34:13 +02:00
protected final List<Dataset> findDifferences(final OpenaireBrokerResult source,
final OpenaireBrokerResult target) {
final Set<String> existingDatasets = target
2020-06-11 11:25:18 +02:00
.getDatasets()
.stream()
2020-06-11 11:25:18 +02:00
.filter(rel -> filterByType(rel.getRelType()))
2020-06-16 12:34:13 +02:00
.map(Dataset::getOriginalId)
.collect(Collectors.toSet());
return source
2020-06-11 11:25:18 +02:00
.getDatasets()
.stream()
2020-06-11 11:25:18 +02:00
.filter(rel -> filterByType(rel.getRelType()))
2020-06-16 12:34:13 +02:00
.filter(d -> !existingDatasets.contains(d.getOriginalId()))
.collect(Collectors.toList());
}
}