Merge pull request 'Dump per Country' (#3) from dumpSubset into master

Reviewed-on: #3
Miriam Baglioni 2023-07-15 11:13:28 +02:00
commit 7ccd4e7866
20 changed files with 1480 additions and 33 deletions


@@ -90,9 +90,9 @@ public class SendToZenodoHDFS implements Serializable {
 zenodoApiClient.sendMretadata(metadata);
 }
-if (Boolean.TRUE.equals(publish)) {
-zenodoApiClient.publish();
-}
+// if (Boolean.TRUE.equals(publish)) {
+// zenodoApiClient.publish();
+// }
 }
 }


@@ -8,6 +8,7 @@ import java.util.*;
 import java.util.stream.Collectors;
 import org.apache.commons.io.IOUtils;
+import org.apache.commons.lang.StringUtils;
 import org.apache.spark.SparkConf;
 import org.apache.spark.api.java.function.FilterFunction;
 import org.apache.spark.api.java.function.MapFunction;
@@ -65,21 +66,25 @@ public class SparkDumpCommunityProducts implements Serializable {
 final String resultClassName = parser.get("resultTableName");
 log.info("resultTableName: {}", resultClassName);
-String communityMapPath = parser.get("communityMapPath");
+String communityMapPath = Optional
+	.ofNullable(parser.get("communityMapPath"))
+	.orElse(null);
+String dumpType = Optional
+	.ofNullable(parser.get("dumpType"))
+	.orElse(null);
 Class<? extends Result> inputClazz = (Class<? extends Result>) Class.forName(resultClassName);
 SparkConf conf = new SparkConf();
-String finalCommunityMapPath = communityMapPath;
 runWithSparkSession(
 	conf,
 	isSparkSessionManaged,
 	spark -> {
 		Utils.removeOutputDir(spark, outputPath);
 		resultDump(
-			spark, inputPath, outputPath, finalCommunityMapPath, inputClazz);
+			spark, inputPath, outputPath, communityMapPath, inputClazz, dumpType);
 	});
 }
@@ -89,14 +94,18 @@ public class SparkDumpCommunityProducts implements Serializable {
 String inputPath,
 String outputPath,
 String communityMapPath,
-Class<I> inputClazz) {
+Class<I> inputClazz,
+String dumpType) {
-CommunityMap communityMap = Utils.getCommunityMap(spark, communityMapPath);
+CommunityMap communityMap = null;
+if (!StringUtils.isEmpty(communityMapPath))
+	communityMap = Utils.getCommunityMap(spark, communityMapPath);
+CommunityMap finalCommunityMap = communityMap;
 Utils
 	.readPath(spark, inputPath, inputClazz)
 	.map(
-		(MapFunction<I, CommunityResult>) value -> execMap(value, communityMap),
+		(MapFunction<I, CommunityResult>) value -> execMap(value, finalCommunityMap, dumpType),
 		Encoders.bean(CommunityResult.class))
 	.filter((FilterFunction<CommunityResult>) value -> value != null)
 	.map(
@@ -109,7 +118,7 @@ public class SparkDumpCommunityProducts implements Serializable {
 }
 private static <I extends OafEntity, O extends eu.dnetlib.dhp.oa.model.Result> O execMap(I value,
-	CommunityMap communityMap) throws NoAvailableEntityTypeException, CardinalityTooHighException {
+	CommunityMap communityMap, String dumpType) throws NoAvailableEntityTypeException, CardinalityTooHighException {
 Optional<DataInfo> odInfo = Optional.ofNullable(value.getDataInfo());
 if (Boolean.FALSE.equals(odInfo.isPresent())) {
@@ -119,26 +128,27 @@
 || Boolean.TRUE.equals(odInfo.get().getInvisible())) {
 	return null;
 }
-Set<String> communities = communityMap.keySet();
-Optional<List<Context>> inputContext = Optional
-	.ofNullable(((eu.dnetlib.dhp.schema.oaf.Result) value).getContext());
-if (!inputContext.isPresent()) {
-	return null;
-}
-List<String> toDumpFor = inputContext.get().stream().map(c -> {
-	if (communities.contains(c.getId())) {
-		return c.getId();
-	}
-	if (c.getId().contains("::") && communities.contains(c.getId().substring(0, c.getId().indexOf("::")))) {
-		return c.getId().substring(0, c.getId().indexOf("::"));
-	}
-	return null;
-}).filter(Objects::nonNull).collect(Collectors.toList());
-if (toDumpFor.isEmpty()) {
-	return null;
-}
+if (StringUtils.isEmpty(dumpType)) {
+	Set<String> communities = communityMap.keySet();
+	Optional<List<Context>> inputContext = Optional
+		.ofNullable(((eu.dnetlib.dhp.schema.oaf.Result) value).getContext());
+	if (!inputContext.isPresent()) {
+		return null;
+	}
+	List<String> toDumpFor = inputContext.get().stream().map(c -> {
+		if (communities.contains(c.getId())) {
+			return c.getId();
+		}
+		if (c.getId().contains("::") && communities.contains(c.getId().substring(0, c.getId().indexOf("::")))) {
+			return c.getId().substring(0, c.getId().indexOf("::"));
+		}
+		return null;
+	}).filter(Objects::nonNull).collect(Collectors.toList());
+	if (toDumpFor.isEmpty()) {
+		return null;
+	}
+}
 return (O) ResultMapper.map(value, communityMap, Constants.DUMPTYPE.COMMUNITY.getType());
 }
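The net effect of the new dumpType parameter: when it is empty (plain community dump) the community-membership filter still applies; when it is set (the country workflow below passes --dumpType country) every visible, non-deleted result is mapped. A simplified sketch of the resulting control flow, where belongsToConfiguredCommunity is a hypothetical helper standing in for the inputContext/toDumpFor block above, not the committed code:

// Simplified sketch; belongsToConfiguredCommunity is a hypothetical stand-in
// for the context-matching logic shown in the hunk above.
private static <I extends OafEntity, O extends eu.dnetlib.dhp.oa.model.Result> O execMapSketch(
	I value, CommunityMap communityMap, String dumpType)
	throws NoAvailableEntityTypeException, CardinalityTooHighException {
	if (StringUtils.isEmpty(dumpType)) {
		// community dump: keep the result only if it matches at least one configured community
		if (!belongsToConfiguredCommunity(value, communityMap)) {
			return null;
		}
	}
	// dumpType set (e.g. "country"): skip the community filter and map every result
	// that survived the visibility/deletedbyinference checks
	return (O) ResultMapper.map(value, communityMap, Constants.DUMPTYPE.COMMUNITY.getType());
}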


@@ -0,0 +1,136 @@
package eu.dnetlib.dhp.oa.graph.dump.country;
import static eu.dnetlib.dhp.common.SparkSessionSupport.runWithSparkSession;
import java.io.Serializable;
import java.util.*;
import org.apache.commons.io.IOUtils;
import org.apache.spark.SparkConf;
import org.apache.spark.api.java.function.FilterFunction;
import org.apache.spark.api.java.function.MapFunction;
import org.apache.spark.sql.Dataset;
import org.apache.spark.sql.Encoders;
import org.apache.spark.sql.SaveMode;
import org.apache.spark.sql.SparkSession;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
import com.fasterxml.jackson.databind.ObjectMapper;
import com.google.gson.Gson;
import com.jayway.jsonpath.DocumentContext;
import com.jayway.jsonpath.JsonPath;
import eu.dnetlib.dhp.application.ArgumentApplicationParser;
import eu.dnetlib.dhp.oa.graph.dump.Constants;
import eu.dnetlib.dhp.oa.graph.dump.ResultMapper;
import eu.dnetlib.dhp.oa.graph.dump.Utils;
import eu.dnetlib.dhp.oa.graph.dump.subset.MasterDuplicate;
import eu.dnetlib.dhp.oa.graph.dump.subset.SparkDumpResult;
import eu.dnetlib.dhp.oa.graph.dump.subset.criteria.VerbResolver;
import eu.dnetlib.dhp.oa.graph.dump.subset.criteria.VerbResolverFactory;
import eu.dnetlib.dhp.oa.graph.dump.subset.selectionconstraints.Param;
import eu.dnetlib.dhp.oa.graph.dump.subset.selectionconstraints.SelectionConstraints;
import eu.dnetlib.dhp.oa.model.graph.GraphResult;
import eu.dnetlib.dhp.schema.oaf.DataInfo;
import eu.dnetlib.dhp.schema.oaf.KeyValue;
import scala.Tuple2;
/**
* @author miriam.baglioni
* @Date 27/04/23
* Selects the results associated with the given country
*/
public class SparkFindResultWithCountry implements Serializable {
private static final Logger log = LoggerFactory.getLogger(SparkFindResultWithCountry.class);
public static final String COMPRESSION = "compression";
public static final String GZIP = "gzip";
public static void main(String[] args) throws Exception {
String jsonConfiguration = IOUtils
.toString(
SparkFindResultWithCountry.class
.getResourceAsStream(
"/eu/dnetlib/dhp/oa/graph/dump/result_country_parameters.json"));
final ArgumentApplicationParser parser = new ArgumentApplicationParser(jsonConfiguration);
parser.parseArgument(args);
Boolean isSparkSessionManaged = Optional
.ofNullable(parser.get("isSparkSessionManaged"))
.map(Boolean::valueOf)
.orElse(Boolean.TRUE);
log.info("isSparkSessionManaged: {}", isSparkSessionManaged);
final String inputPath = parser.get("sourcePath");
log.info("inputPath: {}", inputPath);
final String outputPath = parser.get("outputPath");
log.info("outputPath: {}", outputPath);
final String resultType = parser.get("resultType");
log.info("resultType: {}", resultType);
final String resultClassName = parser.get("resultTableName");
log.info("resultTableName: {}", resultClassName);
final String preparedInfoPath = parser.get("resultWithCountry");
Class<? extends eu.dnetlib.dhp.schema.oaf.Result> inputClazz = (Class<? extends eu.dnetlib.dhp.schema.oaf.Result>) Class
.forName(resultClassName);
run(
isSparkSessionManaged, inputPath, outputPath, inputClazz,
resultType, preparedInfoPath);
}
private static void run(Boolean isSparkSessionManaged, String inputPath, String outputPath,
Class<? extends eu.dnetlib.dhp.schema.oaf.Result> inputClazz, String resultType, String preparedInfoPath) {
SparkConf conf = new SparkConf();
runWithSparkSession(
conf,
isSparkSessionManaged,
spark -> {
Utils.removeOutputDir(spark, outputPath + "/original/" + resultType);
resultDump(
spark, inputPath, outputPath, inputClazz, resultType, preparedInfoPath);
});
}
public static <I extends eu.dnetlib.dhp.schema.oaf.Result> void resultDump(
SparkSession spark,
String inputPath,
String outputPath,
Class<I> inputClazz,
String resultType,
String preparedInfoPath) {
Dataset<String> resultsWithCountry = spark.read().textFile(preparedInfoPath).distinct();
Dataset<I> result = Utils
.readPath(spark, inputPath, inputClazz)
.filter(
(FilterFunction<I>) r -> !r.getDataInfo().getInvisible() && !r.getDataInfo().getDeletedbyinference());
resultsWithCountry
.joinWith(result, resultsWithCountry.col("value").equalTo(result.col("id")))
.map((MapFunction<Tuple2<String, I>, I>) t2 -> t2._2(), Encoders.bean(inputClazz))
.write()
.mode(SaveMode.Overwrite)
.option("compression", "gzip")
.json(outputPath + "/original/" + resultType);
}
}
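The selection is a plain inner join between the distinct id list produced by SparkFindResultsRelatedToCountry and the filtered result table, so any record whose id never appears in resultWithCountry is silently dropped. A toy illustration of the same pattern, assuming a local SparkSession, imports for java.util.Arrays and org.apache.spark.sql.Row, and a placeholder JSON input with an "id" column:

// Illustrative only: the inner-join subsetting pattern used by resultDump above.
Dataset<String> ids = spark.createDataset(Arrays.asList("id-1", "id-2"), Encoders.STRING());
Dataset<Row> results = spark.read().json("/path/to/results.json"); // rows with an "id" column
results
	.join(ids, results.col("id").equalTo(ids.col("value"))) // inner join: unmatched rows are dropped
	.drop("value")
	.show();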


@@ -0,0 +1,171 @@
package eu.dnetlib.dhp.oa.graph.dump.country;
import static eu.dnetlib.dhp.common.SparkSessionSupport.runWithSparkSession;
import java.io.Serializable;
import java.io.StringReader;
import java.util.*;
import org.apache.commons.io.IOUtils;
import org.apache.spark.SparkConf;
import org.apache.spark.api.java.function.FilterFunction;
import org.apache.spark.api.java.function.MapFunction;
import org.apache.spark.sql.Dataset;
import org.apache.spark.sql.Encoders;
import org.apache.spark.sql.SaveMode;
import org.apache.spark.sql.SparkSession;
import org.dom4j.Document;
import org.dom4j.DocumentException;
import org.dom4j.Node;
import org.dom4j.io.SAXReader;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
import org.xml.sax.SAXException;
import eu.dnetlib.dhp.application.ArgumentApplicationParser;
import eu.dnetlib.dhp.oa.graph.dump.Utils;
import eu.dnetlib.dhp.schema.common.ModelConstants;
import eu.dnetlib.dhp.schema.oaf.*;
import scala.Tuple2;
/**
* @author miriam.baglioni
* @Date 27/04/23
* Finds the ids of the results that are in relation with another entity having the given country,
* or that have that country in their country list
*/
public class SparkFindResultsRelatedToCountry implements Serializable {
private static final Logger log = LoggerFactory.getLogger(SparkFindResultsRelatedToCountry.class);
public static final String COMPRESSION = "compression";
public static final String GZIP = "gzip";
public static void main(String[] args) throws Exception {
String jsonConfiguration = IOUtils
.toString(
SparkFindResultsRelatedToCountry.class
.getResourceAsStream(
"/eu/dnetlib/dhp/oa/graph/dump/result_related_country_parameters.json"));
final ArgumentApplicationParser parser = new ArgumentApplicationParser(jsonConfiguration);
parser.parseArgument(args);
Boolean isSparkSessionManaged = Optional
.ofNullable(parser.get("isSparkSessionManaged"))
.map(Boolean::valueOf)
.orElse(Boolean.TRUE);
log.info("isSparkSessionManaged: {}", isSparkSessionManaged);
final String inputPath = parser.get("sourcePath");
log.info("inputPath: {}", inputPath);
final String outputPath = parser.get("outputPath");
log.info("outputPath: {}", outputPath);
final String country = parser.get("country");
run(
isSparkSessionManaged, inputPath, outputPath, country);
}
private static void run(Boolean isSparkSessionManaged, String inputPath, String outputPath,
String country) {
SparkConf conf = new SparkConf();
runWithSparkSession(
conf,
isSparkSessionManaged,
spark -> {
findRelatedEntities(
spark, inputPath, outputPath, country);
});
}
public static <I extends eu.dnetlib.dhp.schema.oaf.Result> void findRelatedEntities(
SparkSession spark,
String inputPath,
String outputPath,
String country) {
Dataset<Project> projectsInCountry = Utils
.readPath(spark, inputPath + "/project", Project.class)
.filter((FilterFunction<Project>) p -> isCountryInFunderJurisdiction(p.getFundingtree(), country));
Dataset<Relation> relsProjectResults = Utils
.readPath(spark, inputPath + "/relation", Relation.class)
.filter(
(FilterFunction<Relation>) r -> !r.getDataInfo().getDeletedbyinference() &&
r.getRelClass().equals(ModelConstants.PRODUCES));
projectsInCountry
.joinWith(relsProjectResults, projectsInCountry.col("id").equalTo(relsProjectResults.col("source")))
.map((MapFunction<Tuple2<Project, Relation>, String>) t2 -> t2._2().getTarget(), Encoders.STRING())
.write()
.option(COMPRESSION, GZIP)
.mode(SaveMode.Overwrite)
.text(outputPath);
Dataset<Organization> organizationsInCountry = Utils
.readPath(spark, inputPath + "/organization", Organization.class)
.filter((FilterFunction<Organization>) o -> o.getCountry().getClassid().equals(country));
Dataset<Relation> relsOrganizationResults = Utils
.readPath(spark, inputPath + "/relation", Relation.class)
.filter(
(FilterFunction<Relation>) r -> !r.getDataInfo().getDeletedbyinference() &&
r.getRelClass().equals(ModelConstants.IS_AUTHOR_INSTITUTION_OF));
organizationsInCountry
.joinWith(
relsOrganizationResults,
organizationsInCountry.col("id").equalTo(relsOrganizationResults.col("source")))
.map((MapFunction<Tuple2<Organization, Relation>, String>) t2 -> t2._2().getTarget(), Encoders.STRING())
.write()
.option(COMPRESSION, GZIP)
.mode(SaveMode.Append)
.text(outputPath);
selectResultWithCountry(spark, inputPath, outputPath, country, "publication", Publication.class);
selectResultWithCountry(
spark, inputPath, outputPath, country, "dataset", eu.dnetlib.dhp.schema.oaf.Dataset.class);
selectResultWithCountry(spark, inputPath, outputPath, country, "software", Software.class);
selectResultWithCountry(
spark, inputPath, outputPath, country, "otherresearchproduct", OtherResearchProduct.class);
}
private static <R extends Result> void selectResultWithCountry(SparkSession spark, String inputPath,
String outputPath, String country, String type, Class<R> inputClazz) {
Utils
.readPath(spark, inputPath + "/" + type, inputClazz)
.filter(
(FilterFunction<R>) p -> !p.getDataInfo().getDeletedbyinference() && !p.getDataInfo().getInvisible() &&
p.getCountry() != null &&
p.getCountry().stream().anyMatch(c -> c.getClassid().equals(country)))
.map((MapFunction<R, String>) p -> p.getId(), Encoders.STRING())
.write()
.option(COMPRESSION, GZIP)
.mode(SaveMode.Append)
.text(outputPath);
}
private static boolean isCountryInFunderJurisdiction(List<Field<String>> fundingtrees, String country) {
try {
final SAXReader reader = new SAXReader();
reader.setFeature("http://apache.org/xml/features/disallow-doctype-decl", true);
for (Field<String> fundingtree : fundingtrees) {
final Document doc = reader.read(new StringReader(fundingtree.getValue()));
if (((Node) (doc.selectNodes("//funder/jurisdiction").get(0))).getText().equals(country)) {
return true;
}
}
return false;
} catch (DocumentException | SAXException e) {
throw new IllegalArgumentException(e);
}
}
}
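For reference, isCountryInFunderJurisdiction parses each funding tree with dom4j and compares the text of the first //funder/jurisdiction node with the requested country. A minimal standalone check against a made-up funding tree of the shape the XPath expects:

import java.io.StringReader;

import org.dom4j.Document;
import org.dom4j.Node;
import org.dom4j.io.SAXReader;

public class JurisdictionCheckSketch {
	public static void main(String[] args) throws Exception {
		// made-up minimal funding tree: only the jurisdiction element matters for the check
		String fundingtree = "<fundingtree><funder><jurisdiction>PT</jurisdiction></funder></fundingtree>";
		SAXReader reader = new SAXReader();
		Document doc = reader.read(new StringReader(fundingtree));
		String jurisdiction = ((Node) doc.selectNodes("//funder/jurisdiction").get(0)).getText();
		System.out.println(jurisdiction.equals("PT")); // true: the funder is in the requested country
	}
}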


@@ -0,0 +1,30 @@
<configuration>
<property>
<name>jobTracker</name>
<value>yarnRM</value>
</property>
<property>
<name>nameNode</name>
<value>hdfs://nameservice1</value>
</property>
<property>
<name>oozie.use.system.libpath</name>
<value>true</value>
</property>
<property>
<name>hiveMetastoreUris</name>
<value>thrift://iis-cdh5-test-m3.ocean.icm.edu.pl:9083</value>
</property>
<property>
<name>hiveJdbcUrl</name>
<value>jdbc:hive2://iis-cdh5-test-m3.ocean.icm.edu.pl:10000</value>
</property>
<property>
<name>hiveDbName</name>
<value>openaire</value>
</property>
<property>
<name>oozie.launcher.mapreduce.user.classpath.first</name>
<value>true</value>
</property>
</configuration>


@@ -0,0 +1,540 @@
<workflow-app name="sub-dump_subset" xmlns="uri:oozie:workflow:0.5">
<parameters>
<property>
<name>sourcePath</name>
<description>the source path</description>
</property>
<property>
<name>outputPath</name>
<description>the output path</description>
</property>
<property>
<name>country</name>
<description>the country for which to produce the dump</description>
</property>
<property>
<name>hiveDbName</name>
<description>the target hive database name</description>
</property>
<property>
<name>hiveJdbcUrl</name>
<description>hive server jdbc url</description>
</property>
<property>
<name>hiveMetastoreUris</name>
<description>hive server metastore URIs</description>
</property>
<property>
<name>sparkDriverMemory</name>
<description>memory for driver process</description>
</property>
<property>
<name>sparkExecutorMemory</name>
<description>memory for individual executor</description>
</property>
<property>
<name>sparkExecutorCores</name>
<description>number of cores used by single executor</description>
</property>
<property>
<name>oozieActionShareLibForSpark2</name>
<description>oozie action sharelib for spark 2.*</description>
</property>
<property>
<name>spark2ExtraListeners</name>
<value>com.cloudera.spark.lineage.NavigatorAppListener</value>
<description>spark 2.* extra listeners classname</description>
</property>
<property>
<name>spark2SqlQueryExecutionListeners</name>
<value>com.cloudera.spark.lineage.NavigatorQueryListener</value>
<description>spark 2.* sql query execution listeners classname</description>
</property>
<property>
<name>spark2YarnHistoryServerAddress</name>
<description>spark 2.* yarn history server address</description>
</property>
<property>
<name>spark2EventLogDir</name>
<description>spark 2.* event log dir location</description>
</property>
</parameters>
<global>
<job-tracker>${jobTracker}</job-tracker>
<name-node>${nameNode}</name-node>
<configuration>
<property>
<name>mapreduce.job.queuename</name>
<value>${queueName}</value>
</property>
<property>
<name>oozie.launcher.mapred.job.queue.name</name>
<value>${oozieLauncherQueueName}</value>
</property>
<property>
<name>oozie.action.sharelib.for.spark</name>
<value>${oozieActionShareLibForSpark2}</value>
</property>
</configuration>
</global>
<!-- <start to="save_community_map" />-->
<start to="make_archive" />
<action name="save_community_map">
<java>
<main-class>eu.dnetlib.dhp.oa.graph.dump.SaveCommunityMap</main-class>
<arg>--outputPath</arg><arg>${workingDir}/communityMap</arg>
<arg>--nameNode</arg><arg>${nameNode}</arg>
<arg>--isLookUpUrl</arg><arg>${isLookUpUrl}</arg>
</java>
<ok to="find_results_for_country"/>
<error to="Kill"/>
</action>
<action name="find_results_for_country">
<spark xmlns="uri:oozie:spark-action:0.2">
<master>yarn</master>
<mode>cluster</mode>
<name>Find results related to the given country</name>
<class>eu.dnetlib.dhp.oa.graph.dump.country.SparkFindResultsRelatedToCountry</class>
<jar>dump-${projectVersion}.jar</jar>
<spark-opts>
--executor-memory=${sparkExecutorMemory}
--executor-cores=${sparkExecutorCores}
--driver-memory=${sparkDriverMemory}
--conf spark.extraListeners=${spark2ExtraListeners}
--conf spark.sql.queryExecutionListeners=${spark2SqlQueryExecutionListeners}
--conf spark.yarn.historyServer.address=${spark2YarnHistoryServerAddress}
--conf spark.eventLog.dir=${nameNode}${spark2EventLogDir}
--conf spark.sql.warehouse.dir=${sparkSqlWarehouseDir}
</spark-opts>
<arg>--sourcePath</arg><arg>${sourcePath}</arg>
<arg>--outputPath</arg><arg>${workingDir}/resultsInCountry</arg>
<arg>--country</arg><arg>${country}</arg>
</spark>
<ok to="fork_select"/>
<error to="Kill"/>
</action>
<fork name="fork_select">
<path start="select_publication"/>
<path start="select_dataset"/>
<path start="select_orp"/>
<path start="select_software"/>
</fork>
<action name="select_publication">
<spark xmlns="uri:oozie:spark-action:0.2">
<master>yarn</master>
<mode>cluster</mode>
<name>Dump table publication </name>
<class>eu.dnetlib.dhp.oa.graph.dump.country.SparkFindResultWithCountry</class>
<jar>dump-${projectVersion}.jar</jar>
<spark-opts>
--executor-memory=7G
--executor-cores=2
--driver-memory=7G
--conf spark.sql.shuffle.partitions=3840
--conf spark.extraListeners=${spark2ExtraListeners}
--conf spark.sql.queryExecutionListeners=${spark2SqlQueryExecutionListeners}
--conf spark.yarn.historyServer.address=${spark2YarnHistoryServerAddress}
--conf spark.eventLog.dir=${nameNode}${spark2EventLogDir}
--conf spark.sql.warehouse.dir=${sparkSqlWarehouseDir}
</spark-opts>
<arg>--sourcePath</arg><arg>${sourcePath}/publication</arg>
<arg>--resultTableName</arg><arg>eu.dnetlib.dhp.schema.oaf.Publication</arg>
<arg>--outputPath</arg><arg>${outputPath}</arg>
<arg>--resultWithCountry</arg><arg>${workingDir}/resultsInCountry</arg>
<arg>--resultType</arg><arg>publication</arg>
</spark>
<ok to="join_dump"/>
<error to="Kill"/>
</action>
<action name="select_dataset">
<spark xmlns="uri:oozie:spark-action:0.2">
<master>yarn</master>
<mode>cluster</mode>
<name>Dump table dataset </name>
<class>eu.dnetlib.dhp.oa.graph.dump.country.SparkFindResultWithCountry</class>
<jar>dump-${projectVersion}.jar</jar>
<spark-opts>
--executor-memory=${sparkExecutorMemory}
--executor-cores=${sparkExecutorCores}
--driver-memory=${sparkDriverMemory}
--conf spark.extraListeners=${spark2ExtraListeners}
--conf spark.sql.queryExecutionListeners=${spark2SqlQueryExecutionListeners}
--conf spark.yarn.historyServer.address=${spark2YarnHistoryServerAddress}
--conf spark.eventLog.dir=${nameNode}${spark2EventLogDir}
--conf spark.sql.warehouse.dir=${sparkSqlWarehouseDir}
</spark-opts>
<arg>--sourcePath</arg><arg>${sourcePath}/dataset</arg>
<arg>--resultTableName</arg><arg>eu.dnetlib.dhp.schema.oaf.Dataset</arg>
<arg>--outputPath</arg><arg>${outputPath}</arg>
<arg>--resultType</arg><arg>dataset</arg>
<arg>--resultWithCountry</arg><arg>${workingDir}/resultsInCountry</arg>
</spark>
<ok to="join_dump"/>
<error to="Kill"/>
</action>
<action name="select_orp">
<spark xmlns="uri:oozie:spark-action:0.2">
<master>yarn</master>
<mode>cluster</mode>
<name>Dump table ORP </name>
<class>eu.dnetlib.dhp.oa.graph.dump.country.SparkFindResultWithCountry</class>
<jar>dump-${projectVersion}.jar</jar>
<spark-opts>
--executor-memory=${sparkExecutorMemory}
--executor-cores=${sparkExecutorCores}
--driver-memory=${sparkDriverMemory}
--conf spark.extraListeners=${spark2ExtraListeners}
--conf spark.sql.queryExecutionListeners=${spark2SqlQueryExecutionListeners}
--conf spark.yarn.historyServer.address=${spark2YarnHistoryServerAddress}
--conf spark.eventLog.dir=${nameNode}${spark2EventLogDir}
--conf spark.sql.warehouse.dir=${sparkSqlWarehouseDir}
</spark-opts>
<arg>--sourcePath</arg><arg>${sourcePath}/otherresearchproduct</arg>
<arg>--resultTableName</arg><arg>eu.dnetlib.dhp.schema.oaf.OtherResearchProduct</arg>
<arg>--outputPath</arg><arg>${outputPath}</arg>
<arg>--resultType</arg><arg>otherresearchproduct</arg>
<arg>--resultWithCountry</arg><arg>${workingDir}/resultsInCountry</arg>
</spark>
<ok to="join_dump"/>
<error to="Kill"/>
</action>
<action name="select_software">
<spark xmlns="uri:oozie:spark-action:0.2">
<master>yarn</master>
<mode>cluster</mode>
<name>Dump table software </name>
<class>eu.dnetlib.dhp.oa.graph.dump.country.SparkFindResultWithCountry</class>
<jar>dump-${projectVersion}.jar</jar>
<spark-opts>
--executor-memory=${sparkExecutorMemory}
--executor-cores=${sparkExecutorCores}
--driver-memory=${sparkDriverMemory}
--conf spark.extraListeners=${spark2ExtraListeners}
--conf spark.sql.queryExecutionListeners=${spark2SqlQueryExecutionListeners}
--conf spark.yarn.historyServer.address=${spark2YarnHistoryServerAddress}
--conf spark.eventLog.dir=${nameNode}${spark2EventLogDir}
--conf spark.sql.warehouse.dir=${sparkSqlWarehouseDir}
</spark-opts>
<arg>--sourcePath</arg><arg>${sourcePath}/software</arg>
<arg>--resultTableName</arg><arg>eu.dnetlib.dhp.schema.oaf.Software</arg>
<arg>--outputPath</arg><arg>${outputPath}</arg>
<arg>--resultType</arg><arg>software</arg>
<arg>--resultWithCountry</arg><arg>${workingDir}/resultsInCountry</arg>
</spark>
<ok to="join_dump"/>
<error to="Kill"/>
</action>
<join name="join_dump" to="fork_dump_community"/>
<action name="select_subset">
<spark xmlns="uri:oozie:spark-action:0.2">
<master>yarn</master>
<mode>cluster</mode>
<name>Select valid table relation </name>
<class>eu.dnetlib.dhp.oa.graph.dump.subset.SparkSelectSubset</class>
<jar>dump-${projectVersion}.jar</jar>
<spark-opts>
--executor-memory=${sparkExecutorMemory}
--executor-cores=${sparkExecutorCores}
--driver-memory=${sparkDriverMemory}
--conf spark.extraListeners=${spark2ExtraListeners}
--conf spark.sql.queryExecutionListeners=${spark2SqlQueryExecutionListeners}
--conf spark.yarn.historyServer.address=${spark2YarnHistoryServerAddress}
--conf spark.eventLog.dir=${nameNode}${spark2EventLogDir}
--conf spark.sql.warehouse.dir=${sparkSqlWarehouseDir}
--conf spark.sql.shuffle.partitions=3840
</spark-opts>
<arg>--sourcePath</arg><arg>${sourcePath}</arg>
<arg>--outputPath</arg><arg>${outputPath}</arg>
<arg>--removeSet</arg><arg>${removeSet}</arg>
</spark>
<ok to="fork_dump_community"/>
<error to="Kill"/>
</action>
<fork name="fork_dump_community">
<path start="dump_publication"/>
<path start="dump_dataset"/>
<path start="dump_orp"/>
<path start="dump_software"/>
</fork>
<action name="dump_publication">
<spark xmlns="uri:oozie:spark-action:0.2">
<master>yarn</master>
<mode>cluster</mode>
<name>Dump table publication for community/funder related products</name>
<class>eu.dnetlib.dhp.oa.graph.dump.community.SparkDumpCommunityProducts</class>
<jar>dump-${projectVersion}.jar</jar>
<spark-opts>
--executor-memory=${sparkExecutorMemory}
--executor-cores=${sparkExecutorCores}
--driver-memory=${sparkDriverMemory}
--conf spark.extraListeners=${spark2ExtraListeners}
--conf spark.sql.queryExecutionListeners=${spark2SqlQueryExecutionListeners}
--conf spark.yarn.historyServer.address=${spark2YarnHistoryServerAddress}
--conf spark.eventLog.dir=${nameNode}${spark2EventLogDir}
--conf spark.sql.warehouse.dir=${sparkSqlWarehouseDir}
</spark-opts>
<arg>--sourcePath</arg><arg>${outputPath}/original/publication</arg>
<arg>--resultTableName</arg><arg>eu.dnetlib.dhp.schema.oaf.Publication</arg>
<arg>--outputPath</arg><arg>${workingDir}/dump/publication</arg>
<arg>--communityMapPath</arg><arg>${workingDir}/communityMap</arg>
<arg>--dumpType</arg><arg>country</arg>
</spark>
<ok to="join_dump_comm"/>
<error to="Kill"/>
</action>
<action name="dump_dataset">
<spark xmlns="uri:oozie:spark-action:0.2">
<master>yarn</master>
<mode>cluster</mode>
<name>Dump table dataset for community/funder related products</name>
<class>eu.dnetlib.dhp.oa.graph.dump.community.SparkDumpCommunityProducts</class>
<jar>dump-${projectVersion}.jar</jar>
<spark-opts>
--executor-memory=${sparkExecutorMemory}
--executor-cores=${sparkExecutorCores}
--driver-memory=${sparkDriverMemory}
--conf spark.extraListeners=${spark2ExtraListeners}
--conf spark.sql.queryExecutionListeners=${spark2SqlQueryExecutionListeners}
--conf spark.yarn.historyServer.address=${spark2YarnHistoryServerAddress}
--conf spark.eventLog.dir=${nameNode}${spark2EventLogDir}
--conf spark.sql.warehouse.dir=${sparkSqlWarehouseDir}
</spark-opts>
<arg>--sourcePath</arg><arg>${outputPath}/original/dataset</arg>
<arg>--resultTableName</arg><arg>eu.dnetlib.dhp.schema.oaf.Dataset</arg>
<arg>--outputPath</arg><arg>${workingDir}/dump/dataset</arg>
<arg>--communityMapPath</arg><arg>${workingDir}/communityMap</arg>
<arg>--dumpType</arg><arg>country</arg>
</spark>
<ok to="join_dump_comm"/>
<error to="Kill"/>
</action>
<action name="dump_orp">
<spark xmlns="uri:oozie:spark-action:0.2">
<master>yarn</master>
<mode>cluster</mode>
<name>Dump table ORP for community related products</name>
<class>eu.dnetlib.dhp.oa.graph.dump.community.SparkDumpCommunityProducts</class>
<jar>dump-${projectVersion}.jar</jar>
<spark-opts>
--executor-memory=${sparkExecutorMemory}
--executor-cores=${sparkExecutorCores}
--driver-memory=${sparkDriverMemory}
--conf spark.extraListeners=${spark2ExtraListeners}
--conf spark.sql.queryExecutionListeners=${spark2SqlQueryExecutionListeners}
--conf spark.yarn.historyServer.address=${spark2YarnHistoryServerAddress}
--conf spark.eventLog.dir=${nameNode}${spark2EventLogDir}
--conf spark.sql.warehouse.dir=${sparkSqlWarehouseDir}
</spark-opts>
<arg>--sourcePath</arg><arg>${outputPath}/original/otherresearchproduct</arg>
<arg>--resultTableName</arg><arg>eu.dnetlib.dhp.schema.oaf.OtherResearchProduct</arg>
<arg>--outputPath</arg><arg>${workingDir}/dump/otherresearchproduct</arg>
<arg>--communityMapPath</arg><arg>${workingDir}/communityMap</arg>
<arg>--dumpType</arg><arg>country</arg>
</spark>
<ok to="join_dump_comm"/>
<error to="Kill"/>
</action>
<action name="dump_software">
<spark xmlns="uri:oozie:spark-action:0.2">
<master>yarn</master>
<mode>cluster</mode>
<name>Dump table software for community related products</name>
<class>eu.dnetlib.dhp.oa.graph.dump.community.SparkDumpCommunityProducts</class>
<jar>dump-${projectVersion}.jar</jar>
<spark-opts>
--executor-memory=${sparkExecutorMemory}
--executor-cores=${sparkExecutorCores}
--driver-memory=${sparkDriverMemory}
--conf spark.extraListeners=${spark2ExtraListeners}
--conf spark.sql.queryExecutionListeners=${spark2SqlQueryExecutionListeners}
--conf spark.yarn.historyServer.address=${spark2YarnHistoryServerAddress}
--conf spark.eventLog.dir=${nameNode}${spark2EventLogDir}
--conf spark.sql.warehouse.dir=${sparkSqlWarehouseDir}
</spark-opts>
<arg>--sourcePath</arg><arg>${outputPath}/original/software</arg>
<arg>--resultTableName</arg><arg>eu.dnetlib.dhp.schema.oaf.Software</arg>
<arg>--outputPath</arg><arg>${workingDir}/dump/software</arg>
<arg>--communityMapPath</arg><arg>${workingDir}/communityMap</arg>
<arg>--dumpType</arg><arg>country</arg>
</spark>
<ok to="join_dump_comm"/>
<error to="Kill"/>
</action>
<join name="join_dump_comm" to="prepareResultProject"/>
<action name="prepareResultProject">
<spark xmlns="uri:oozie:spark-action:0.2">
<master>yarn</master>
<mode>cluster</mode>
<name>Prepare association result subset of project info</name>
<class>eu.dnetlib.dhp.oa.graph.dump.community.SparkPrepareResultProject</class>
<jar>dump-${projectVersion}.jar</jar>
<spark-opts>
--executor-memory=${sparkExecutorMemory}
--executor-cores=${sparkExecutorCores}
--driver-memory=${sparkDriverMemory}
--conf spark.extraListeners=${spark2ExtraListeners}
--conf spark.sql.queryExecutionListeners=${spark2SqlQueryExecutionListeners}
--conf spark.yarn.historyServer.address=${spark2YarnHistoryServerAddress}
--conf spark.eventLog.dir=${nameNode}${spark2EventLogDir}
--conf spark.sql.warehouse.dir=${sparkSqlWarehouseDir}
</spark-opts>
<arg>--sourcePath</arg><arg>${sourcePath}</arg>
<arg>--outputPath</arg><arg>${workingDir}/preparedInfo</arg>
</spark>
<ok to="fork_extendWithProject"/>
<error to="Kill"/>
</action>
<fork name="fork_extendWithProject">
<path start="extend_publication"/>
<path start="extend_dataset"/>
<path start="extend_orp"/>
<path start="extend_software"/>
</fork>
<action name="extend_publication">
<spark xmlns="uri:oozie:spark-action:0.2">
<master>yarn</master>
<mode>cluster</mode>
<name>Extend dumped publications with information about project</name>
<class>eu.dnetlib.dhp.oa.graph.dump.community.SparkUpdateProjectInfo</class>
<jar>dump-${projectVersion}.jar</jar>
<spark-opts>
--executor-memory=${sparkExecutorMemory}
--executor-cores=${sparkExecutorCores}
--driver-memory=${sparkDriverMemory}
--conf spark.extraListeners=${spark2ExtraListeners}
--conf spark.sql.queryExecutionListeners=${spark2SqlQueryExecutionListeners}
--conf spark.yarn.historyServer.address=${spark2YarnHistoryServerAddress}
--conf spark.eventLog.dir=${nameNode}${spark2EventLogDir}
--conf spark.sql.warehouse.dir=${sparkSqlWarehouseDir}
</spark-opts>
<arg>--sourcePath</arg><arg>${workingDir}/dump/publication</arg>
<arg>--outputPath</arg><arg>${outputPath}/dump/publication</arg>
<arg>--preparedInfoPath</arg><arg>${workingDir}/preparedInfo</arg>
</spark>
<ok to="join_extend"/>
<error to="Kill"/>
</action>
<action name="extend_dataset">
<spark xmlns="uri:oozie:spark-action:0.2">
<master>yarn</master>
<mode>cluster</mode>
<name>Extend dumped dataset with information about project</name>
<class>eu.dnetlib.dhp.oa.graph.dump.community.SparkUpdateProjectInfo</class>
<jar>dump-${projectVersion}.jar</jar>
<spark-opts>
--executor-memory=${sparkExecutorMemory}
--executor-cores=${sparkExecutorCores}
--driver-memory=${sparkDriverMemory}
--conf spark.extraListeners=${spark2ExtraListeners}
--conf spark.sql.queryExecutionListeners=${spark2SqlQueryExecutionListeners}
--conf spark.yarn.historyServer.address=${spark2YarnHistoryServerAddress}
--conf spark.eventLog.dir=${nameNode}${spark2EventLogDir}
--conf spark.sql.warehouse.dir=${sparkSqlWarehouseDir}
</spark-opts>
<arg>--sourcePath</arg><arg>${workingDir}/dump/dataset</arg>
<arg>--outputPath</arg><arg>${outputPath}/dump/dataset</arg>
<arg>--preparedInfoPath</arg><arg>${workingDir}/preparedInfo</arg>
</spark>
<ok to="join_extend"/>
<error to="Kill"/>
</action>
<action name="extend_orp">
<spark xmlns="uri:oozie:spark-action:0.2">
<master>yarn</master>
<mode>cluster</mode>
<name>Extend dumped ORP with information about project</name>
<class>eu.dnetlib.dhp.oa.graph.dump.community.SparkUpdateProjectInfo</class>
<jar>dump-${projectVersion}.jar</jar>
<spark-opts>
--executor-memory=${sparkExecutorMemory}
--executor-cores=${sparkExecutorCores}
--driver-memory=${sparkDriverMemory}
--conf spark.extraListeners=${spark2ExtraListeners}
--conf spark.sql.queryExecutionListeners=${spark2SqlQueryExecutionListeners}
--conf spark.yarn.historyServer.address=${spark2YarnHistoryServerAddress}
--conf spark.eventLog.dir=${nameNode}${spark2EventLogDir}
--conf spark.sql.warehouse.dir=${sparkSqlWarehouseDir}
</spark-opts>
<arg>--sourcePath</arg><arg>${workingDir}/dump/otherresearchproduct</arg>
<arg>--outputPath</arg><arg>${outputPath}/dump/otherresearchproduct</arg>
<arg>--preparedInfoPath</arg><arg>${workingDir}/preparedInfo</arg>
</spark>
<ok to="join_extend"/>
<error to="Kill"/>
</action>
<action name="extend_software">
<spark xmlns="uri:oozie:spark-action:0.2">
<master>yarn</master>
<mode>cluster</mode>
<name>Extend dumped software with information about project</name>
<class>eu.dnetlib.dhp.oa.graph.dump.community.SparkUpdateProjectInfo</class>
<jar>dump-${projectVersion}.jar</jar>
<spark-opts>
--executor-memory=${sparkExecutorMemory}
--executor-cores=${sparkExecutorCores}
--driver-memory=${sparkDriverMemory}
--conf spark.extraListeners=${spark2ExtraListeners}
--conf spark.sql.queryExecutionListeners=${spark2SqlQueryExecutionListeners}
--conf spark.yarn.historyServer.address=${spark2YarnHistoryServerAddress}
--conf spark.eventLog.dir=${nameNode}${spark2EventLogDir}
--conf spark.sql.warehouse.dir=${sparkSqlWarehouseDir}
</spark-opts>
<arg>--sourcePath</arg><arg>${workingDir}/dump/software</arg>
<arg>--outputPath</arg><arg>${outputPath}/dump/software</arg>
<arg>--preparedInfoPath</arg><arg>${workingDir}/preparedInfo</arg>
</spark>
<ok to="join_extend"/>
<error to="Kill"/>
</action>
<join name="join_extend" to="make_archive"/>
<action name="make_archive">
<java>
<main-class>eu.dnetlib.dhp.oa.graph.dump.MakeTar</main-class>
<arg>--hdfsPath</arg><arg>${outputPath}/tar</arg>
<arg>--nameNode</arg><arg>${nameNode}</arg>
<arg>--sourcePath</arg><arg>${outputPath}/dump</arg>
</java>
<ok to="End"/>
<error to="Kill"/>
</action>
<kill name="Kill">
<message>Sub-workflow dump failed with error message ${wf:errorMessage()}
</message>
</kill>
<end name="End" />
</workflow-app>
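Like the other dump workflows, this one is submitted through the Oozie CLI: the jobTracker, nameNode and Hive endpoints come from the config-default.xml above, while the workflow parameters are supplied in a job.properties file. A hypothetical sketch, with every value a placeholder rather than something taken from the commit:

# job.properties (hypothetical values)
oozie.wf.application.path=hdfs://nameservice1/<deployment path of this workflow>
sourcePath=<HDFS path of the input graph>
outputPath=<HDFS path for the country dump>
country=PT
sparkDriverMemory=8G
sparkExecutorMemory=8G
sparkExecutorCores=4

oozie job -oozie http://<oozie-server>:11000/oozie -config job.properties -run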


@@ -23,13 +23,13 @@
 "paramName": "sd",
 "paramLongName": "singleDeposition",
 "paramDescription": "true if the dump should be created for a single community",
-"paramRequired": true
+"paramRequired": false
 },
 {
 "paramName": "ci",
 "paramLongName": "communityId",
 "paramDescription": "the id of the community for which to create the dump",
-"paramRequired": true
+"paramRequired": false
 }
]


@@ -0,0 +1,42 @@
[
{
"paramName":"s",
"paramLongName":"sourcePath",
"paramDescription": "the path of the sequencial file to read",
"paramRequired": true
},
{
"paramName": "out",
"paramLongName": "outputPath",
"paramDescription": "the path used to store temporary output files",
"paramRequired": true
},
{
"paramName": "ssm",
"paramLongName": "isSparkSessionManaged",
"paramDescription": "true if the spark session is managed, false otherwise",
"paramRequired": false
},
{
"paramName": "c",
"paramLongName": "resultWithCountry",
"paramDescription": "the path of the id of results associated to a given country",
"paramRequired": true
},
{
"paramName":"tn",
"paramLongName":"resultTableName",
"paramDescription": "the name of the result table we are currently working on",
"paramRequired": true
},
{
"paramName":"rt",
"paramLongName":"resultType",
"paramDescription": "",
"paramRequired": true
}
]


@@ -0,0 +1,29 @@
[
{
"paramName":"s",
"paramLongName":"sourcePath",
"paramDescription": "the path of the sequencial file to read",
"paramRequired": true
},
{
"paramName": "out",
"paramLongName": "outputPath",
"paramDescription": "the path used to store temporary output files",
"paramRequired": true
},
{
"paramName": "ssm",
"paramLongName": "isSparkSessionManaged",
"paramDescription": "true if the spark session is managed, false otherwise",
"paramRequired": false
},
{
"paramName": "c",
"paramLongName": "country",
"paramDescription": "the path of the association result projectlist",
"paramRequired": true
}
]


@@ -20,7 +20,10 @@
 <name>selectionCriteria</name>
 <description>the selection criteria used to select the results</description>
 </property>
+<property>
+<name>mapAs</name>
+<description>it specifies the type of model for the dump (community or complete)</description>
+</property>
 <property>
 <name>hiveDbName</name>
 <description>the target hive database name</description>
@@ -231,8 +234,6 @@
<join name="join_dump" to="select_subset"/>
<action name="select_subset">
<spark xmlns="uri:oozie:spark-action:0.2">
<master>yarn</master>
@@ -256,10 +257,267 @@
 <arg>--removeSet</arg><arg>${removeSet}</arg>
 </spark>
-<ok to="fork_dump_otherentities"/>
+<ok to="dumpModel"/>
 <error to="Kill"/>
 </action>
<decision name="dumpModel">
<switch>
<case to="fork_dump_community">${wf:conf('mapAs') eq "community"}</case>
<default to="fork_dump_otherentities"/>
</switch>
</decision>
<fork name="fork_dump_community">
<path start="dump_publication"/>
<path start="dump_dataset"/>
<path start="dump_orp"/>
<path start="dump_software"/>
</fork>
<action name="dump_publication">
<spark xmlns="uri:oozie:spark-action:0.2">
<master>yarn</master>
<mode>cluster</mode>
<name>Dump table publication for community/funder related products</name>
<class>eu.dnetlib.dhp.oa.graph.dump.community.SparkDumpCommunityProducts</class>
<jar>dump-${projectVersion}.jar</jar>
<spark-opts>
--executor-memory=${sparkExecutorMemory}
--executor-cores=${sparkExecutorCores}
--driver-memory=${sparkDriverMemory}
--conf spark.extraListeners=${spark2ExtraListeners}
--conf spark.sql.queryExecutionListeners=${spark2SqlQueryExecutionListeners}
--conf spark.yarn.historyServer.address=${spark2YarnHistoryServerAddress}
--conf spark.eventLog.dir=${nameNode}${spark2EventLogDir}
--conf spark.sql.warehouse.dir=${sparkSqlWarehouseDir}
</spark-opts>
<arg>--sourcePath</arg><arg>${outputPath}/original/publication</arg>
<arg>--resultTableName</arg><arg>eu.dnetlib.dhp.schema.oaf.Publication</arg>
<arg>--outputPath</arg><arg>${workingDir}/dump/publication</arg>
<arg>--communityMapPath</arg><arg>${communityMapPath}</arg>
</spark>
<ok to="join_dump_comm"/>
<error to="Kill"/>
</action>
<action name="dump_dataset">
<spark xmlns="uri:oozie:spark-action:0.2">
<master>yarn</master>
<mode>cluster</mode>
<name>Dump table dataset for community/funder related products</name>
<class>eu.dnetlib.dhp.oa.graph.dump.community.SparkDumpCommunityProducts</class>
<jar>dump-${projectVersion}.jar</jar>
<spark-opts>
--executor-memory=${sparkExecutorMemory}
--executor-cores=${sparkExecutorCores}
--driver-memory=${sparkDriverMemory}
--conf spark.extraListeners=${spark2ExtraListeners}
--conf spark.sql.queryExecutionListeners=${spark2SqlQueryExecutionListeners}
--conf spark.yarn.historyServer.address=${spark2YarnHistoryServerAddress}
--conf spark.eventLog.dir=${nameNode}${spark2EventLogDir}
--conf spark.sql.warehouse.dir=${sparkSqlWarehouseDir}
</spark-opts>
<arg>--sourcePath</arg><arg>${outputPath}/original/dataset</arg>
<arg>--resultTableName</arg><arg>eu.dnetlib.dhp.schema.oaf.Dataset</arg>
<arg>--outputPath</arg><arg>${workingDir}/dump/dataset</arg>
<arg>--communityMapPath</arg><arg>${communityMapPath}</arg>
</spark>
<ok to="join_dump_comm"/>
<error to="Kill"/>
</action>
<action name="dump_orp">
<spark xmlns="uri:oozie:spark-action:0.2">
<master>yarn</master>
<mode>cluster</mode>
<name>Dump table ORP for community related products</name>
<class>eu.dnetlib.dhp.oa.graph.dump.community.SparkDumpCommunityProducts</class>
<jar>dump-${projectVersion}.jar</jar>
<spark-opts>
--executor-memory=${sparkExecutorMemory}
--executor-cores=${sparkExecutorCores}
--driver-memory=${sparkDriverMemory}
--conf spark.extraListeners=${spark2ExtraListeners}
--conf spark.sql.queryExecutionListeners=${spark2SqlQueryExecutionListeners}
--conf spark.yarn.historyServer.address=${spark2YarnHistoryServerAddress}
--conf spark.eventLog.dir=${nameNode}${spark2EventLogDir}
--conf spark.sql.warehouse.dir=${sparkSqlWarehouseDir}
</spark-opts>
<arg>--sourcePath</arg><arg>${outputPath}/original/otherresearchproduct</arg>
<arg>--resultTableName</arg><arg>eu.dnetlib.dhp.schema.oaf.OtherResearchProduct</arg>
<arg>--outputPath</arg><arg>${workingDir}/dump/otherresearchproduct</arg>
<arg>--communityMapPath</arg><arg>${communityMapPath}</arg>
</spark>
<ok to="join_dump_comm"/>
<error to="Kill"/>
</action>
<action name="dump_software">
<spark xmlns="uri:oozie:spark-action:0.2">
<master>yarn</master>
<mode>cluster</mode>
<name>Dump table software for community related products</name>
<class>eu.dnetlib.dhp.oa.graph.dump.community.SparkDumpCommunityProducts</class>
<jar>dump-${projectVersion}.jar</jar>
<spark-opts>
--executor-memory=${sparkExecutorMemory}
--executor-cores=${sparkExecutorCores}
--driver-memory=${sparkDriverMemory}
--conf spark.extraListeners=${spark2ExtraListeners}
--conf spark.sql.queryExecutionListeners=${spark2SqlQueryExecutionListeners}
--conf spark.yarn.historyServer.address=${spark2YarnHistoryServerAddress}
--conf spark.eventLog.dir=${nameNode}${spark2EventLogDir}
--conf spark.sql.warehouse.dir=${sparkSqlWarehouseDir}
</spark-opts>
<arg>--sourcePath</arg><arg>${outputPath}/original/software</arg>
<arg>--resultTableName</arg><arg>eu.dnetlib.dhp.schema.oaf.Software</arg>
<arg>--outputPath</arg><arg>${workingDir}/dump/software</arg>
<arg>--communityMapPath</arg><arg>${communityMapPath}</arg>
</spark>
<ok to="join_dump_comm"/>
<error to="Kill"/>
</action>
<join name="join_dump_comm" to="prepareResultProject"/>
<action name="prepareResultProject">
<spark xmlns="uri:oozie:spark-action:0.2">
<master>yarn</master>
<mode>cluster</mode>
<name>Prepare association result subset of project info</name>
<class>eu.dnetlib.dhp.oa.graph.dump.community.SparkPrepareResultProject</class>
<jar>dump-${projectVersion}.jar</jar>
<spark-opts>
--executor-memory=${sparkExecutorMemory}
--executor-cores=${sparkExecutorCores}
--driver-memory=${sparkDriverMemory}
--conf spark.extraListeners=${spark2ExtraListeners}
--conf spark.sql.queryExecutionListeners=${spark2SqlQueryExecutionListeners}
--conf spark.yarn.historyServer.address=${spark2YarnHistoryServerAddress}
--conf spark.eventLog.dir=${nameNode}${spark2EventLogDir}
--conf spark.sql.warehouse.dir=${sparkSqlWarehouseDir}
</spark-opts>
<arg>--sourcePath</arg><arg>${outputPath}/original</arg>
<arg>--outputPath</arg><arg>${workingDir}/preparedInfo</arg>
</spark>
<ok to="fork_extendWithProject"/>
<error to="Kill"/>
</action>
<fork name="fork_extendWithProject">
<path start="extend_publication"/>
<path start="extend_dataset"/>
<path start="extend_orp"/>
<path start="extend_software"/>
</fork>
<action name="extend_publication">
<spark xmlns="uri:oozie:spark-action:0.2">
<master>yarn</master>
<mode>cluster</mode>
<name>Extend dumped publications with information about project</name>
<class>eu.dnetlib.dhp.oa.graph.dump.community.SparkUpdateProjectInfo</class>
<jar>dump-${projectVersion}.jar</jar>
<spark-opts>
--executor-memory=${sparkExecutorMemory}
--executor-cores=${sparkExecutorCores}
--driver-memory=${sparkDriverMemory}
--conf spark.extraListeners=${spark2ExtraListeners}
--conf spark.sql.queryExecutionListeners=${spark2SqlQueryExecutionListeners}
--conf spark.yarn.historyServer.address=${spark2YarnHistoryServerAddress}
--conf spark.eventLog.dir=${nameNode}${spark2EventLogDir}
--conf spark.sql.warehouse.dir=${sparkSqlWarehouseDir}
</spark-opts>
<arg>--sourcePath</arg><arg>${workingDir}/dump/publication</arg>
<arg>--outputPath</arg><arg>${outputPath}/dump/publication</arg>
<arg>--preparedInfoPath</arg><arg>${workingDir}/preparedInfo</arg>
</spark>
<ok to="join_extend"/>
<error to="Kill"/>
</action>
<action name="extend_dataset">
<spark xmlns="uri:oozie:spark-action:0.2">
<master>yarn</master>
<mode>cluster</mode>
<name>Extend dumped dataset with information about project</name>
<class>eu.dnetlib.dhp.oa.graph.dump.community.SparkUpdateProjectInfo</class>
<jar>dump-${projectVersion}.jar</jar>
<spark-opts>
--executor-memory=${sparkExecutorMemory}
--executor-cores=${sparkExecutorCores}
--driver-memory=${sparkDriverMemory}
--conf spark.extraListeners=${spark2ExtraListeners}
--conf spark.sql.queryExecutionListeners=${spark2SqlQueryExecutionListeners}
--conf spark.yarn.historyServer.address=${spark2YarnHistoryServerAddress}
--conf spark.eventLog.dir=${nameNode}${spark2EventLogDir}
--conf spark.sql.warehouse.dir=${sparkSqlWarehouseDir}
</spark-opts>
<arg>--sourcePath</arg><arg>${workingDir}/dump/dataset</arg>
<arg>--outputPath</arg><arg>${outputPath}/dump/dataset</arg>
<arg>--preparedInfoPath</arg><arg>${workingDir}/preparedInfo</arg>
</spark>
<ok to="join_extend"/>
<error to="Kill"/>
</action>
<action name="extend_orp">
<spark xmlns="uri:oozie:spark-action:0.2">
<master>yarn</master>
<mode>cluster</mode>
<name>Extend dumped ORP with information about project</name>
<class>eu.dnetlib.dhp.oa.graph.dump.community.SparkUpdateProjectInfo</class>
<jar>dump-${projectVersion}.jar</jar>
<spark-opts>
--executor-memory=${sparkExecutorMemory}
--executor-cores=${sparkExecutorCores}
--driver-memory=${sparkDriverMemory}
--conf spark.extraListeners=${spark2ExtraListeners}
--conf spark.sql.queryExecutionListeners=${spark2SqlQueryExecutionListeners}
--conf spark.yarn.historyServer.address=${spark2YarnHistoryServerAddress}
--conf spark.eventLog.dir=${nameNode}${spark2EventLogDir}
--conf spark.sql.warehouse.dir=${sparkSqlWarehouseDir}
</spark-opts>
<arg>--sourcePath</arg><arg>${workingDir}/dump/otherresearchproduct</arg>
<arg>--outputPath</arg><arg>${outputPath}/dump/otherresearchproduct</arg>
<arg>--preparedInfoPath</arg><arg>${workingDir}/preparedInfo</arg>
</spark>
<ok to="join_extend"/>
<error to="Kill"/>
</action>
<action name="extend_software">
<spark xmlns="uri:oozie:spark-action:0.2">
<master>yarn</master>
<mode>cluster</mode>
<name>Extend dumped software with information about project</name>
<class>eu.dnetlib.dhp.oa.graph.dump.community.SparkUpdateProjectInfo</class>
<jar>dump-${projectVersion}.jar</jar>
<spark-opts>
--executor-memory=${sparkExecutorMemory}
--executor-cores=${sparkExecutorCores}
--driver-memory=${sparkDriverMemory}
--conf spark.extraListeners=${spark2ExtraListeners}
--conf spark.sql.queryExecutionListeners=${spark2SqlQueryExecutionListeners}
--conf spark.yarn.historyServer.address=${spark2YarnHistoryServerAddress}
--conf spark.eventLog.dir=${nameNode}${spark2EventLogDir}
--conf spark.sql.warehouse.dir=${sparkSqlWarehouseDir}
</spark-opts>
<arg>--sourcePath</arg><arg>${workingDir}/dump/software</arg>
<arg>--outputPath</arg><arg>${outputPath}/dump/software</arg>
<arg>--preparedInfoPath</arg><arg>${workingDir}/preparedInfo</arg>
</spark>
<ok to="join_extend"/>
<error to="Kill"/>
</action>
<join name="join_extend" to="End"/>
<fork name="fork_dump_otherentities">
<path start="dump_organization"/>
<path start="dump_project"/>


@@ -0,0 +1,96 @@
package eu.dnetlib.dhp.oa.graph.dump.country;
import java.io.IOException;
import java.nio.file.Files;
import java.nio.file.Path;
import java.util.HashMap;
import org.apache.commons.io.FileUtils;
import org.apache.spark.SparkConf;
import org.apache.spark.api.java.JavaRDD;
import org.apache.spark.api.java.JavaSparkContext;
import org.apache.spark.api.java.function.FilterFunction;
import org.apache.spark.sql.Encoders;
import org.apache.spark.sql.SparkSession;
import org.junit.jupiter.api.AfterAll;
import org.junit.jupiter.api.Assertions;
import org.junit.jupiter.api.BeforeAll;
import org.junit.jupiter.api.Test;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
import com.fasterxml.jackson.databind.ObjectMapper;
/**
* @author miriam.baglioni
* @Date 02/05/23
*/
public class FindResultRelatedToCountryTest {
private static SparkSession spark;
private static Path workingDir;
private static final Logger log = LoggerFactory
.getLogger(FindResultRelatedToCountryTest.class);
private static final HashMap<String, String> map = new HashMap<>();
@BeforeAll
public static void beforeAll() throws IOException {
workingDir = Files
.createTempDirectory(FindResultRelatedToCountryTest.class.getSimpleName());
log.info("using work dir {}", workingDir);
SparkConf conf = new SparkConf();
conf.setAppName(FindResultRelatedToCountryTest.class.getSimpleName());
conf.setMaster("local[*]");
conf.set("spark.driver.host", "localhost");
conf.set("hive.metastore.local", "true");
conf.set("spark.ui.enabled", "false");
conf.set("spark.sql.warehouse.dir", workingDir.toString());
conf.set("hive.metastore.warehouse.dir", workingDir.resolve("warehouse").toString());
spark = SparkSession
.builder()
.appName(FindResultRelatedToCountryTest.class.getSimpleName())
.config(conf)
.getOrCreate();
}
@AfterAll
public static void afterAll() throws IOException {
FileUtils.deleteDirectory(workingDir.toFile());
spark.stop();
}
@Test
void test1() throws Exception {
final String sourcePath = getClass()
.getResource("/eu/dnetlib/dhp/oa/graph/dump/country/graph")
.getPath();
SparkFindResultsRelatedToCountry.main(new String[] {
"-isSparkSessionManaged", Boolean.FALSE.toString(),
"-outputPath", workingDir.toString() + "/resultWithCountry",
"-sourcePath", sourcePath,
"-country", "PT"
});
final JavaSparkContext sc = JavaSparkContext.fromSparkContext(spark.sparkContext());
JavaRDD<String> tmp = sc
.textFile(workingDir.toString() + "/resultWithCountry");
Assertions.assertEquals(3, tmp.count());
Assertions.assertTrue(tmp.collect().contains("50|06cdd3ff4700::136eb030ccb020e170df9627fa1a70af"));
Assertions.assertTrue(tmp.collect().contains("50|06cdd3ff4700::93859bd27121c3ee7c6ee4bfb1790cbb"));
Assertions.assertTrue(tmp.collect().contains("50|06cdd3ff4700::136eb030ccb020e170df9627fa1a70ag"));
}
}


@@ -0,0 +1,115 @@
package eu.dnetlib.dhp.oa.graph.dump.country;
import java.io.IOException;
import java.nio.file.Files;
import java.nio.file.Path;
import java.util.HashMap;
import org.apache.commons.io.FileUtils;
import org.apache.spark.SparkConf;
import org.apache.spark.api.java.JavaRDD;
import org.apache.spark.api.java.JavaSparkContext;
import org.apache.spark.api.java.function.MapFunction;
import org.apache.spark.sql.Encoders;
import org.apache.spark.sql.SparkSession;
import org.junit.jupiter.api.AfterAll;
import org.junit.jupiter.api.Assertions;
import org.junit.jupiter.api.BeforeAll;
import org.junit.jupiter.api.Test;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
import com.fasterxml.jackson.databind.ObjectMapper;
import eu.dnetlib.dhp.oa.graph.dump.Utils;
import eu.dnetlib.dhp.oa.model.graph.Relation;
import eu.dnetlib.dhp.schema.oaf.Publication;
/**
* @author miriam.baglioni
* @Date 02/05/23
*/
public class FindResultWithCountryTest {
private static final ObjectMapper OBJECT_MAPPER = new ObjectMapper();
private static SparkSession spark;
private static Path workingDir;
private static final Logger log = LoggerFactory
.getLogger(FindResultWithCountryTest.class);
private static final HashMap<String, String> map = new HashMap<>();
@BeforeAll
public static void beforeAll() throws IOException {
workingDir = Files
.createTempDirectory(FindResultWithCountryTest.class.getSimpleName());
log.info("using work dir {}", workingDir);
SparkConf conf = new SparkConf();
conf.setAppName(FindResultWithCountryTest.class.getSimpleName());
conf.setMaster("local[*]");
conf.set("spark.driver.host", "localhost");
conf.set("hive.metastore.local", "true");
conf.set("spark.ui.enabled", "false");
conf.set("spark.sql.warehouse.dir", workingDir.toString());
conf.set("hive.metastore.warehouse.dir", workingDir.resolve("warehouse").toString());
spark = SparkSession
.builder()
.appName(FindResultWithCountryTest.class.getSimpleName())
.config(conf)
.getOrCreate();
}
@AfterAll
public static void afterAll() throws IOException {
FileUtils.deleteDirectory(workingDir.toFile());
spark.stop();
}
@Test
void test1() throws Exception {
final String sourcePath = getClass()
.getResource("/eu/dnetlib/dhp/oa/graph/dump/country/graph/publication")
.getPath();
spark
.read()
.textFile(
getClass()
.getResource("/eu/dnetlib/dhp/oa/graph/dump/country/resultWithCountry")
.getPath())
.write()
.text(workingDir.toString() + "/resWithCountry");
SparkFindResultWithCountry.main(new String[] {
"-isSparkSessionManaged", Boolean.FALSE.toString(),
"-outputPath", workingDir.toString() + "/out",
"-sourcePath", sourcePath,
"-resultType", "publication",
"-resultTableName", "eu.dnetlib.dhp.schema.oaf.Publication",
"-resultWithCountry", workingDir.toString() + "/resWithCountry"
});
final JavaSparkContext sc = JavaSparkContext.fromSparkContext(spark.sparkContext());
JavaRDD<Publication> tmp = sc
.textFile(workingDir.toString() + "/out/original/publication")
.map(item -> OBJECT_MAPPER.readValue(item, Publication.class));
Assertions.assertEquals(2, tmp.count());
Assertions
.assertTrue(
tmp.map(p -> p.getId()).collect().contains("50|06cdd3ff4700::136eb030ccb020e170df9627fa1a70af"));
Assertions
.assertTrue(
tmp.map(p -> p.getId()).collect().contains("50|06cdd3ff4700::136eb030ccb020e170df9627fa1a70ag"));
}
}

File diff suppressed because one or more lines are too long

File diff suppressed because one or more lines are too long

File diff suppressed because one or more lines are too long


@@ -0,0 +1,8 @@
{"collectedfrom":[{"key":"10|driver______::bee53aa31dc2cbb538c10c2b65fa5824","value":"DOAJ-Articles"}],"dataInfo":{"deletedbyinference":false,"inferred":false,"invisible":false,"provenanceaction":{"classid":"sysimport:crosswalk:entityregistry","classname":"Harvested","schemeid":"dnet:provenanceActions","schemename":"dnet:provenanceActions"},"trust":"0.900"},"lastupdatetimestamp":1680789947124,"properties":[],"relClass":"produces","relType":"datasourceOrganization","source":"40|fct_________::037de16e31bf518b1b2a836ee37ce983","subRelType":"provision","target":"50|06cdd3ff4700::136eb030ccb020e170df9627fa1a70ag","validated":false}
{"collectedfrom":[{"key":"10|driver______::bee53aa31dc2cbb538c10c2b65fa5824","value":"DOAJ-Articles"}],"dataInfo":{"deletedbyinference":false,"inferred":false,"invisible":false,"provenanceaction":{"classid":"sysimport:crosswalk:entityregistry","classname":"Harvested","schemeid":"dnet:provenanceActions","schemename":"dnet:provenanceActions"},"trust":"0.900"},"lastupdatetimestamp":1680789947124,"properties":[],"relClass":"isAuthorInstitutionOf","relType":"datasourceOrganization","source":"20|anr_________::17811d09a4f30a15d4fe207d46861b53","subRelType":"provision","target":"50|06cdd3ff4700::93859bd27121c3ee7c6ee4bfb1790cbb","validated":false}
{"collectedfrom":[{"key":"10|driver______::bee53aa31dc2cbb538c10c2b65fa5824","value":"DOAJ-Articles"}],"dataInfo":{"deletedbyinference":false,"inferred":false,"invisible":false,"provenanceaction":{"classid":"sysimport:crosswalk:entityregistry","classname":"Harvested","schemeid":"dnet:provenanceActions","schemename":"dnet:provenanceActions"},"trust":"0.900"},"lastupdatetimestamp":1680789947124,"properties":[],"relClass":"isAuthorInstitutionOf","relType":"datasourceOrganization","source":"20|corda_______::810928466bdce1665c4f1838ca9e2844","subRelType":"provision","target":"50|06cdd3ff4700::93859bd27121c3ee7c6ee4bfb1790cba","validated":false}
{"collectedfrom":[{"key":"10|driver______::bee53aa31dc2cbb538c10c2b65fa5824","value":"DOAJ-Articles"}],"dataInfo":{"deletedbyinference":false,"inferred":false,"invisible":false,"provenanceaction":{"classid":"sysimport:crosswalk:entityregistry","classname":"Harvested","schemeid":"dnet:provenanceActions","schemename":"dnet:provenanceActions"},"trust":"0.900"},"lastupdatetimestamp":1680789947124,"properties":[],"relClass":"produces","relType":"datasourceOrganization","source":"40|anr_________::658a5d80c4b3e1175781fe2e2294cffa","subRelType":"provision","target":"50|____EGIAppDB::ce6d2420f693a96a29d1400970393969","validated":false}
{"collectedfrom":[{"key":"10|driver______::bee53aa31dc2cbb538c10c2b65fa5824","value":"DOAJ-Articles"}],"dataInfo":{"deletedbyinference":true,"inferred":false,"invisible":false,"provenanceaction":{"classid":"sysimport:crosswalk:entityregistry","classname":"Harvested","schemeid":"dnet:provenanceActions","schemename":"dnet:provenanceActions"},"trust":"0.900"},"lastupdatetimestamp":1680789947124,"properties":[],"relClass":"isProvidedBy","relType":"datasourceOrganization","source":"10|doajarticles::690b3aaf177a4c70b81bacd8d023cbdc","subRelType":"provision","target":"20|doajarticles::396262ee936f3d3e26ff0e60bea6cae0","validated":false}
{"collectedfrom":[{"key":"10|driver______::bee53aa31dc2cbb538c10c2b65fa5824","value":"DOAJ-Articles"}],"dataInfo":{"deletedbyinference":true,"inferred":false,"invisible":false,"provenanceaction":{"classid":"sysimport:crosswalk:entityregistry","classname":"Harvested","schemeid":"dnet:provenanceActions","schemename":"dnet:provenanceActions"},"trust":"0.900"},"lastupdatetimestamp":1680789947124,"properties":[],"relClass":"isProvidedBy","relType":"datasourceOrganization","source":"10|doajarticles::7a71f278237d1ab35088efda03fa007a","subRelType":"provision","target":"20|doajarticles::03748bcb5d754c951efec9700e18a56d","validated":false}
{"collectedfrom":[{"key":"10|driver______::bee53aa31dc2cbb538c10c2b65fa5824","value":"DOAJ-Articles"}],"dataInfo":{"deletedbyinference":false,"inferred":false,"invisible":false,"provenanceaction":{"classid":"sysimport:crosswalk:entityregistry","classname":"Harvested","schemeid":"dnet:provenanceActions","schemename":"dnet:provenanceActions"},"trust":"0.900"},"lastupdatetimestamp":1680789947124,"properties":[],"relClass":"isProvidedBy","relType":"datasourceOrganization","source":"10|doajarticles::8b75543067b50076e70764917e188178","subRelType":"provision","target":"20|doajarticles::50cb15ff7a6a3f8531f063770179e346","validated":false}
{"collectedfrom":[{"key":"10|driver______::bee53aa31dc2cbb538c10c2b65fa5824","value":"DOAJ-Articles"}],"dataInfo":{"deletedbyinference":true,"inferred":false,"invisible":false,"provenanceaction":{"classid":"sysimport:crosswalk:entityregistry","classname":"Harvested","schemeid":"dnet:provenanceActions","schemename":"dnet:provenanceActions"},"trust":"0.900"},"lastupdatetimestamp":1680789947124,"properties":[],"relClass":"isProvidedBy","relType":"datasourceOrganization","source":"10|doajarticles::9f3ff882f023209d9ffb4dc32b77d376","subRelType":"provision","target":"20|doajarticles::ffc1811633b3222e4764c7b0517f83e8","validated":false}

File diff suppressed because one or more lines are too long


@@ -0,0 +1,3 @@
50|06cdd3ff4700::136eb030ccb020e170df9627fa1a70af
50|06cdd3ff4700::93859bd27121c3ee7c6ee4bfb1790cbb
50|06cdd3ff4700::136eb030ccb020e170df9627fa1a70ag