forked from D-Net/dnet-hadoop
defaults fixed in the cleaning workflow: forces result.publisher to NULL when result.publisher.value is empty
This commit is contained in:
parent
4bbfcf1ac6
commit
cd631bb5bc
|
@ -173,6 +173,9 @@ public class CleanGraphSparkJob {
|
||||||
} else if (value instanceof Result) {
|
} else if (value instanceof Result) {
|
||||||
|
|
||||||
Result r = (Result) value;
|
Result r = (Result) value;
|
||||||
|
if (Objects.nonNull(r.getPublisher()) && StringUtils.isBlank(r.getPublisher().getValue())) {
|
||||||
|
r.setPublisher(null);
|
||||||
|
}
|
||||||
if (Objects.isNull(r.getLanguage()) || StringUtils.isBlank(r.getLanguage().getClassid())) {
|
if (Objects.isNull(r.getLanguage()) || StringUtils.isBlank(r.getLanguage().getClassid())) {
|
||||||
r
|
r
|
||||||
.setLanguage(
|
.setLanguage(
|
||||||
|
|
|
@ -66,6 +66,8 @@ public class CleaningFunctionTest {
|
||||||
|
|
||||||
assertNotNull(p_out);
|
assertNotNull(p_out);
|
||||||
|
|
||||||
|
assertNotNull(p_out.getPublisher());
|
||||||
|
assertNull(p_out.getPublisher().getValue());
|
||||||
assertEquals("und", p_out.getLanguage().getClassid());
|
assertEquals("und", p_out.getLanguage().getClassid());
|
||||||
assertEquals("Undetermined", p_out.getLanguage().getClassname());
|
assertEquals("Undetermined", p_out.getLanguage().getClassname());
|
||||||
|
|
||||||
|
@ -88,6 +90,7 @@ public class CleaningFunctionTest {
|
||||||
|
|
||||||
Publication p_defaults = CleanGraphSparkJob.fixDefaults(p_out);
|
Publication p_defaults = CleanGraphSparkJob.fixDefaults(p_out);
|
||||||
assertEquals("CLOSED", p_defaults.getBestaccessright().getClassid());
|
assertEquals("CLOSED", p_defaults.getBestaccessright().getClassid());
|
||||||
|
assertNull(p_out.getPublisher());
|
||||||
|
|
||||||
getAuthorPids(p_defaults).forEach(pid -> {
|
getAuthorPids(p_defaults).forEach(pid -> {
|
||||||
System.out
|
System.out
|
||||||
|
|
|
@ -208,6 +208,9 @@
|
||||||
}
|
}
|
||||||
],
|
],
|
||||||
"bestaccessright": null,
|
"bestaccessright": null,
|
||||||
|
"publisher": {
|
||||||
|
"value": null
|
||||||
|
},
|
||||||
"collectedfrom": [
|
"collectedfrom": [
|
||||||
{
|
{
|
||||||
"key": "10|CSC_________::a2b9ce8435390bcbfc05f3cae3948747",
|
"key": "10|CSC_________::a2b9ce8435390bcbfc05f3cae3948747",
|
||||||
|
|
Loading…
Reference in New Issue