forked from D-Net/dnet-hadoop
[cleaning] allow enriched orcids to pass the cleaning, rule out non-orcid author pids
This commit is contained in:
parent
aba95ed1d1
commit
84d54643cf
|
@ -689,6 +689,7 @@ public class GraphCleaningFunctions extends CleaningFunctions {
|
||||||
.filter(Objects::nonNull)
|
.filter(Objects::nonNull)
|
||||||
.filter(p -> Objects.nonNull(p.getQualifier()))
|
.filter(p -> Objects.nonNull(p.getQualifier()))
|
||||||
.filter(p -> StringUtils.isNotBlank(p.getValue()))
|
.filter(p -> StringUtils.isNotBlank(p.getValue()))
|
||||||
|
.filter(p -> StringUtils.contains(StringUtils.lowerCase(p.getQualifier().getClassid()), ORCID))
|
||||||
.map(p -> {
|
.map(p -> {
|
||||||
// hack to distinguish orcid from orcid_pending
|
// hack to distinguish orcid from orcid_pending
|
||||||
String pidProvenance = getProvenance(p.getDataInfo());
|
String pidProvenance = getProvenance(p.getDataInfo());
|
||||||
|
@ -698,7 +699,8 @@ public class GraphCleaningFunctions extends CleaningFunctions {
|
||||||
.toLowerCase()
|
.toLowerCase()
|
||||||
.contains(ModelConstants.ORCID)) {
|
.contains(ModelConstants.ORCID)) {
|
||||||
if (pidProvenance
|
if (pidProvenance
|
||||||
.equals(ModelConstants.SYSIMPORT_CROSSWALK_ENTITYREGISTRY)) {
|
.equals(ModelConstants.SYSIMPORT_CROSSWALK_ENTITYREGISTRY) ||
|
||||||
|
pidProvenance.equals("ORCID_ENRICHMENT")) {
|
||||||
p.getQualifier().setClassid(ModelConstants.ORCID);
|
p.getQualifier().setClassid(ModelConstants.ORCID);
|
||||||
} else {
|
} else {
|
||||||
p.getQualifier().setClassid(ModelConstants.ORCID_PENDING);
|
p.getQualifier().setClassid(ModelConstants.ORCID_PENDING);
|
||||||
|
|
Loading…
Reference in New Issue