This commit is contained in:
Miriam Baglioni 2024-01-08 11:59:36 +01:00
parent 9435c6756e
commit 231ed85aa1
2 changed files with 14 additions and 0 deletions

View File

@@ -78,6 +78,17 @@ public class SelectEoscResultsJobStep1 implements Serializable {
String inputPath, String outputPath,
Class<R> inputClazz, String communityMapPath, String eoscDatasourceIdsPath) {
// final StructType structureSchema = new StructType()
// .add("eoscId", DataTypes.StringType)
// .add("graphId", DataTypes.StringType)
// .add("graphName", DataTypes.StringType);
//
// // .fromDDL("`graphId`: STRING, `eoscId`:STRING");
// org.apache.spark.sql.Dataset<Row> df = spark
// .read()
// .schema(structureSchema)
// .json(eoscDatasourceIdsPath);
List<MasterDuplicate> df = Utils
.readPath(spark, eoscDatasourceIdsPath, MasterDuplicate.class)
.collectAsList();

View File

@@ -0,0 +1,3 @@
sourcePath=/tmp/prod_provision/graph/20_graph_blacklisted
outputPath=/tmp/miriam/graph_dumps/country_PT
country=PT