master #11
|
@ -55,8 +55,8 @@ public class PrepareProjectResultsAssociation {
|
||||||
|
|
||||||
runWithSparkHiveSession(conf, isSparkSessionManaged,
|
runWithSparkHiveSession(conf, isSparkSessionManaged,
|
||||||
spark -> {
|
spark -> {
|
||||||
removeOutputDir(spark, potentialUpdatePath);
|
// removeOutputDir(spark, potentialUpdatePath);
|
||||||
removeOutputDir(spark, alreadyLinkedPath);
|
// removeOutputDir(spark, alreadyLinkedPath);
|
||||||
prepareResultProjProjectResults(spark, inputPath, potentialUpdatePath, alreadyLinkedPath, allowedsemrel);
|
prepareResultProjProjectResults(spark, inputPath, potentialUpdatePath, alreadyLinkedPath, allowedsemrel);
|
||||||
|
|
||||||
});
|
});
|
||||||
|
@ -91,9 +91,14 @@ public class PrepareProjectResultsAssociation {
|
||||||
"GROUP BY projectId ";
|
"GROUP BY projectId ";
|
||||||
|
|
||||||
spark.sql(query).as(Encoders.bean(ProjectResultSet.class))
|
spark.sql(query).as(Encoders.bean(ProjectResultSet.class))
|
||||||
.toJavaRDD()
|
.toJSON()
|
||||||
.map(r -> OBJECT_MAPPER.writeValueAsString(r))
|
.write()
|
||||||
.saveAsTextFile(potentialUpdatePath, GzipCodec.class);
|
.mode(SaveMode.Overwrite)
|
||||||
|
.option("compression","gzip")
|
||||||
|
.text(potentialUpdatePath);
|
||||||
|
// .toJavaRDD()
|
||||||
|
// .map(r -> OBJECT_MAPPER.writeValueAsString(r))
|
||||||
|
// .saveAsTextFile(potentialUpdatePath, GzipCodec.class);
|
||||||
|
|
||||||
|
|
||||||
query = "SELECT target projectId, collect_set(source) resultSet " +
|
query = "SELECT target projectId, collect_set(source) resultSet " +
|
||||||
|
@ -102,9 +107,14 @@ public class PrepareProjectResultsAssociation {
|
||||||
|
|
||||||
spark.sql(query)
|
spark.sql(query)
|
||||||
.as(Encoders.bean(ProjectResultSet.class))
|
.as(Encoders.bean(ProjectResultSet.class))
|
||||||
.toJavaRDD()
|
.toJSON()
|
||||||
.map(r -> OBJECT_MAPPER.writeValueAsString(r))
|
.write()
|
||||||
.saveAsTextFile(alreadyLinkedPath, GzipCodec.class);
|
.mode(SaveMode.Overwrite)
|
||||||
|
.option("compression","gzip")
|
||||||
|
.text(alreadyLinkedPath);
|
||||||
|
// .toJavaRDD()
|
||||||
|
// .map(r -> OBJECT_MAPPER.writeValueAsString(r))
|
||||||
|
// .saveAsTextFile(alreadyLinkedPath, GzipCodec.class);
|
||||||
|
|
||||||
|
|
||||||
}
|
}
|
||||||
|
|
Loading…
Reference in New Issue