forked from D-Net/dnet-hadoop
[Cleaning] drop alternate identifiers with empty values
This commit is contained in:
parent
827e7e37db
commit
b5b7dc2104
|
@@ -152,7 +152,12 @@ public class CleaningFunctions {
|
||||||
Optional
|
Optional
|
||||||
.ofNullable(i.getPid())
|
.ofNullable(i.getPid())
|
||||||
.ifPresent(pid -> {
|
.ifPresent(pid -> {
|
||||||
final Set<StructuredProperty> pids = Sets.newHashSet(pid);
|
final Set<StructuredProperty> pids = Sets
|
||||||
|
.newHashSet(
|
||||||
|
pid
|
||||||
|
.stream()
|
||||||
|
.filter(p -> StringUtils.isBlank(p.getValue()))
|
||||||
|
.collect(Collectors.toList()));
|
||||||
final Set<StructuredProperty> altIds = Sets.newHashSet(i.getAlternateIdentifier());
|
final Set<StructuredProperty> altIds = Sets.newHashSet(i.getAlternateIdentifier());
|
||||||
i.setAlternateIdentifier(Lists.newArrayList(Sets.difference(altIds, pids)));
|
i.setAlternateIdentifier(Lists.newArrayList(Sets.difference(altIds, pids)));
|
||||||
});
|
});
|
||||||
|
|
Loading…
Reference in New Issue