forked from D-Net/dnet-hadoop
defaults fixed in the cleaning workflow forces result.publisher to NULL when result.publisher.value in empty
This commit is contained in:
parent
4bbfcf1ac6
commit
cd631bb5bc
|
@ -173,6 +173,9 @@ public class CleanGraphSparkJob {
|
|||
} else if (value instanceof Result) {
|
||||
|
||||
Result r = (Result) value;
|
||||
if (Objects.nonNull(r.getPublisher()) && StringUtils.isBlank(r.getPublisher().getValue())) {
|
||||
r.setPublisher(null);
|
||||
}
|
||||
if (Objects.isNull(r.getLanguage()) || StringUtils.isBlank(r.getLanguage().getClassid())) {
|
||||
r
|
||||
.setLanguage(
|
||||
|
|
|
@ -66,6 +66,8 @@ public class CleaningFunctionTest {
|
|||
|
||||
assertNotNull(p_out);
|
||||
|
||||
assertNotNull(p_out.getPublisher());
|
||||
assertNull(p_out.getPublisher().getValue());
|
||||
assertEquals("und", p_out.getLanguage().getClassid());
|
||||
assertEquals("Undetermined", p_out.getLanguage().getClassname());
|
||||
|
||||
|
@ -88,6 +90,7 @@ public class CleaningFunctionTest {
|
|||
|
||||
Publication p_defaults = CleanGraphSparkJob.fixDefaults(p_out);
|
||||
assertEquals("CLOSED", p_defaults.getBestaccessright().getClassid());
|
||||
assertNull(p_out.getPublisher());
|
||||
|
||||
getAuthorPids(p_defaults).forEach(pid -> {
|
||||
System.out
|
||||
|
|
|
@ -208,6 +208,9 @@
|
|||
}
|
||||
],
|
||||
"bestaccessright": null,
|
||||
"publisher": {
|
||||
"value": null
|
||||
},
|
||||
"collectedfrom": [
|
||||
{
|
||||
"key": "10|CSC_________::a2b9ce8435390bcbfc05f3cae3948747",
|
||||
|
|
Loading…
Reference in New Issue