Implemented Oozie workflow to generate the Scholix dump, filtering by relClass semantics #229

Merged
claudio.atzori merged 2 commits from opencitation_enrichments into beta 2022-07-21 10:12:18 +02:00
1 changed file with 1 addition and 3 deletions
Showing only changes of commit 5f651f2316 - Show all commits

View File

@@ -112,13 +112,11 @@ object SparkConvertRDDtoDataset {
"opencitations".equalsIgnoreCase(k.getValue)
)
)
.filter(r => r.getRelClass != null && r.getRelClass.equalsIgnoreCase(filterRelation))
.filter(r => r.getSubRelType != null && r.getSubRelType.equalsIgnoreCase(filterRelation))
spark.createDataset(rddRelation).as[Relation].write.mode(SaveMode.Overwrite).save(s"$relPath")
} else {
val relationSemanticFilter = List(
// "cites",
// "iscitedby",
"merges",
"ismergedin",
"HasAmongTopNSimilarDocuments",