forked from D-Net/dnet-hadoop
[Cleaning] filter out authors whose fullname contains no word characters
This commit is contained in:
parent
2890511613
commit
885e0dd926
|
@@ -206,7 +206,8 @@ public class CleaningFunctions {
|
||||||
.getAuthor()
|
.getAuthor()
|
||||||
.stream()
|
.stream()
|
||||||
.filter(a -> Objects.nonNull(a))
|
.filter(a -> Objects.nonNull(a))
|
||||||
.filter(a -> StringUtils.isNotBlank(StringUtils.trim(a.getFullname())))
|
.filter(a -> StringUtils.isNotBlank(a.getFullname()))
|
||||||
|
.filter(a -> StringUtils.isNotBlank(a.getFullname().replaceAll("[\\W]", "")))
|
||||||
.collect(Collectors.toList()));
|
.collect(Collectors.toList()));
|
||||||
|
|
||||||
boolean nullRank = r
|
boolean nullRank = r
|
||||||
|
|
Loading…
Reference in New Issue