From 7400cd019d88cda9e094f37300bc15f344589459 Mon Sep 17 00:00:00 2001 From: "miriam.baglioni" Date: Wed, 12 Aug 2020 10:03:33 +0200 Subject: [PATCH] removed not needed variable --- .../dump/graph/SparkOrganizationRelation.java | 24 ++++++++++++------- 1 file changed, 15 insertions(+), 9 deletions(-) diff --git a/dhp-workflows/dhp-graph-mapper/src/main/java/eu/dnetlib/dhp/oa/graph/dump/graph/SparkOrganizationRelation.java b/dhp-workflows/dhp-graph-mapper/src/main/java/eu/dnetlib/dhp/oa/graph/dump/graph/SparkOrganizationRelation.java index db9fb85453..6a92db25cd 100644 --- a/dhp-workflows/dhp-graph-mapper/src/main/java/eu/dnetlib/dhp/oa/graph/dump/graph/SparkOrganizationRelation.java +++ b/dhp-workflows/dhp-graph-mapper/src/main/java/eu/dnetlib/dhp/oa/graph/dump/graph/SparkOrganizationRelation.java @@ -8,11 +8,13 @@ import static eu.dnetlib.dhp.common.SparkSessionSupport.runWithSparkSession; import java.io.Serializable; import java.util.*; +import java.util.function.Consumer; import org.apache.commons.io.IOUtils; import org.apache.spark.SparkConf; import org.apache.spark.api.java.function.MapFunction; import org.apache.spark.sql.*; +import org.jetbrains.annotations.NotNull; import org.slf4j.Logger; import org.slf4j.LoggerFactory; @@ -74,7 +76,6 @@ public class SparkOrganizationRelation implements Serializable { Dataset relationDataset = Utils.readPath(spark, inputPath, Relation.class); relationDataset.createOrReplaceTempView("relation"); - Set organizationSet = organizationMap.keySet(); List relList = new ArrayList<>(); @@ -95,15 +96,9 @@ public class SparkOrganizationRelation implements Serializable { }, Encoders.bean(MergedRels.class)) .filter(Objects::nonNull) .collectAsList() - .forEach(mergedRels -> { - String oId = mergedRels.getOrganizationId(); - organizationSet.remove(oId); - organizationMap - .get(oId) - .forEach(community -> addRelations(relList, community, mergedRels.getRepresentativeId())); - }); + .forEach(getMergedRelsConsumer(organizationMap, relList)); - organizationSet + organizationMap.keySet() .forEach( oId -> organizationMap .get(oId) @@ -118,6 +113,17 @@ public class SparkOrganizationRelation implements Serializable { } + @NotNull + private static Consumer getMergedRelsConsumer(OrganizationMap organizationMap, List relList) { + return mergedRels -> { + String oId = mergedRels.getOrganizationId(); + organizationMap + .get(oId) + .forEach(community -> addRelations(relList, community, mergedRels.getRepresentativeId())); + organizationMap.remove(oId); + }; + } + private static void addRelations(List relList, String community, String organization) {