Master branch updates from beta September 2023 #337
|
@ -5,6 +5,7 @@ import static eu.dnetlib.dhp.PropagationConstant.removeOutputDir;
|
||||||
import static eu.dnetlib.dhp.common.SparkSessionSupport.runWithSparkSession;
|
import static eu.dnetlib.dhp.common.SparkSessionSupport.runWithSparkSession;
|
||||||
|
|
||||||
import java.util.ArrayList;
|
import java.util.ArrayList;
|
||||||
|
import java.util.Objects;
|
||||||
import java.util.Optional;
|
import java.util.Optional;
|
||||||
|
|
||||||
import org.apache.commons.io.IOUtils;
|
import org.apache.commons.io.IOUtils;
|
||||||
|
@ -102,6 +103,7 @@ public class SparkBulkTagJob {
|
||||||
ResultTagger resultTagger = new ResultTagger();
|
ResultTagger resultTagger = new ResultTagger();
|
||||||
readPath(spark, inputPath, resultClazz)
|
readPath(spark, inputPath, resultClazz)
|
||||||
.map(patchResult(), Encoders.bean(resultClazz))
|
.map(patchResult(), Encoders.bean(resultClazz))
|
||||||
|
.filter(Objects::nonNull)
|
||||||
.map(
|
.map(
|
||||||
(MapFunction<R, R>) value -> resultTagger
|
(MapFunction<R, R>) value -> resultTagger
|
||||||
.enrichContextCriteria(
|
.enrichContextCriteria(
|
||||||
|
@ -124,6 +126,9 @@ public class SparkBulkTagJob {
|
||||||
// TODO remove this hack as soon as the values fixed by this method will be provided as NON null
|
// TODO remove this hack as soon as the values fixed by this method will be provided as NON null
|
||||||
private static <R extends Result> MapFunction<R, R> patchResult() {
|
private static <R extends Result> MapFunction<R, R> patchResult() {
|
||||||
return r -> {
|
return r -> {
|
||||||
|
if(r.getDataInfo() == null){
|
||||||
|
return null;
|
||||||
|
}
|
||||||
if (r.getDataInfo().getDeletedbyinference() == null) {
|
if (r.getDataInfo().getDeletedbyinference() == null) {
|
||||||
r.getDataInfo().setDeletedbyinference(false);
|
r.getDataInfo().setDeletedbyinference(false);
|
||||||
}
|
}
|
||||||
|
|
Loading…
Reference in New Issue