package eu.dnetlib.dhp.oa.graph.resolution

import com.fasterxml.jackson.databind.ObjectMapper
import eu.dnetlib.dhp.schema.oaf.common.EntityType
import eu.dnetlib.dhp.schema.oaf.utils.{MergeUtils, OafMapperUtils}
import eu.dnetlib.dhp.schema.oaf.{Publication, Result, StructuredProperty}
import org.apache.commons.io.FileUtils
import org.apache.spark.SparkConf
import org.apache.spark.sql._
import org.junit.jupiter.api.Assertions._
import org.junit.jupiter.api.TestInstance.Lifecycle
import org.junit.jupiter.api.{AfterAll, BeforeAll, Test, TestInstance}

import java.nio.file.{Files, Path}
import scala.collection.JavaConverters._
import scala.io.Source

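/** Tests for the graph entity-resolution step: a small test graph and a set of "update"
  * Result records carrying a fake title and subject are materialised in a temporary
  * working directory, and SparkResolveEntities is exercised against them.
  */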
@TestInstance(Lifecycle.PER_CLASS)
class ResolveEntitiesTest extends Serializable {

  var workingDir: Path = null

  val FAKE_TITLE = "FAKETITLE"
  val FAKE_SUBJECT = "FAKESUBJECT"

  var sparkSession: Option[SparkSession] = None

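  // Creates a temporary working directory and a local SparkSession, then seeds the
  // test graph and generates the update records used by the tests below.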
  @BeforeAll
  def setUp(): Unit = {
    workingDir = Files.createTempDirectory(getClass.getSimpleName)

    val conf = new SparkConf()
    sparkSession = Some(
      SparkSession
        .builder()
        .config(conf)
        .appName(getClass.getSimpleName)
        .master("local[*]")
        .getOrCreate()
    )
    populateDatasets(sparkSession.get)
    generateUpdates(sparkSession.get)
  }

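  // Deletes the temporary working directory and stops the local SparkSession.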
  @AfterAll
  def tearDown(): Unit = {
    FileUtils.deleteDirectory(workingDir.toFile)
    sparkSession.get.stop()
  }

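  /** Builds one Result per line of the "updates" test resource, each carrying the fake
    * subject and title, writes them as gzip-compressed JSON text under
    * s"$workingDir/updates" and verifies the Jackson round trip.
    */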
  def generateUpdates(spark: SparkSession): Unit = {
    val template = Source.fromInputStream(this.getClass.getResourceAsStream("updates")).mkString

    val pids: List[String] = template.linesWithSeparators
      .map(l => l.stripLineEnd)
      .map { id =>
        val r = new Result
        r.setId(id.toLowerCase.trim)
        r.setSubject(
          List(
            OafMapperUtils.subject(
              FAKE_SUBJECT,
              OafMapperUtils.qualifier("fos", "fosCS", "fossSchema"),
              null
            )
          ).asJava
        )
        r.setTitle(
          List(
            OafMapperUtils.structuredProperty(
              FAKE_TITLE,
              OafMapperUtils.qualifier("fos", "fosCS", "fossSchema")
            )
          ).asJava
        )
        r
      }
      .map { r =>
        val mapper = new ObjectMapper()
        mapper.writeValueAsString(r)
      }
      .toList

    val sc = spark.sparkContext

    println(sc.parallelize(pids).count())

    spark
      .createDataset(sc.parallelize(pids))(Encoders.STRING)
      .write
      .mode(SaveMode.Overwrite)
      .option("compression", "gzip")
      .text(s"$workingDir/updates")

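    // Read the updates back and check that the serialization round trip preserved the
    // fake subject and title on every record.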
    import spark.implicits._
    implicit val resEncoder: Encoder[Result] = Encoders.bean(classOf[Result])
    val ds = spark.read
      .text(s"$workingDir/updates")
      .as[String]
      .map { s =>
        val mapper = new ObjectMapper()
        mapper.readValue(s, classOf[Result])
      }
      .collect()

    assertEquals(4, ds.length)
    ds.foreach { r => assertNotNull(r.getSubject) }
    ds.foreach { r => assertEquals(1, r.getSubject.size()) }
    ds.foreach { r => assertNotNull(r.getTitle) }
    ds.foreach { r => assertEquals(1, r.getTitle.size()) }

    ds.flatMap(r => r.getTitle.asScala.map(t => t.getValue))
      .foreach(t => assertEquals(FAKE_TITLE, t))
    ds.flatMap(r => r.getSubject.asScala.map(t => t.getValue))
      .foreach(t => assertEquals(FAKE_SUBJECT, t))

    println("generated Updates")
  }

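  /** Copies each entity type listed in SparkResolveEntities.entities from the test
    * resources into s"$workingDir/graph/$e" (one folder per type), then extracts the
    * PID-resolution table into s"$workingDir/work".
    */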
  def populateDatasets(spark: SparkSession): Unit = {
    import spark.implicits._
    val entities = SparkResolveEntities.entities

    entities.foreach { e =>
      val template = Source.fromInputStream(this.getClass.getResourceAsStream(s"$e")).mkString
      spark
        .createDataset(
          spark.sparkContext.parallelize(template.linesWithSeparators.map(l => l.stripLineEnd).toList)
        )
        .as[String]
        .write
        .option("compression", "gzip")
        .text(s"$workingDir/graph/$e")
      println(s"Created Dataset $e")
    }
    SparkResolveRelation.extractPidResolvedTableFromJsonRDD(
      spark,
      s"$workingDir/graph",
      s"$workingDir/work"
    )
  }

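  // Resolves the update records against the PID table and expects exactly three
  // resolved entities, all with identifiers starting with "50".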
  @Test
  def testResolution(): Unit = {
    val spark: SparkSession = sparkSession.get
    implicit val resEncoder: Encoder[Result] = Encoders.kryo(classOf[Result])
    SparkResolveEntities.resolveEntities(spark, s"$workingDir/work", s"$workingDir/updates")

    val ds = spark.read.load(s"$workingDir/work/resolvedEntities").as[Result]

    assertEquals(3, ds.count())

    ds.collect().foreach { r =>
      assertTrue(r.getId.startsWith("50"))
    }
  }

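  // Helper: true when any StructuredProperty in the list matches the expected value
  // (case-insensitive), ignoring null values.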
  private def structuredPContainsValue(
    l: java.util.List[StructuredProperty],
    expectedValue: String
  ): Boolean = {
    l.asScala.exists(p => p.getValue != null && p.getValue.equalsIgnoreCase(expectedValue))
  }

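  /** Runs entity resolution followed by generateResolvedEntities and, for each result
    * type written under s"$workingDir/target", checks that no record lost its titles
    * and counts how many records carry the fake title.
    */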
  @Test
  def testUpdate(): Unit = {
    val spark: SparkSession = sparkSession.get
    import spark.implicits._
    implicit val resEncoder: Encoder[Result] = Encoders.kryo(classOf[Result])
    val m = new ObjectMapper()
    SparkResolveEntities.resolveEntities(spark, s"$workingDir/work", s"$workingDir/updates")
    SparkResolveEntities.generateResolvedEntities(
      spark,
      s"$workingDir/work",
      s"$workingDir/graph",
      s"$workingDir/target"
    )

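    // Publications: count the records enriched with the fake title and make sure every
    // record still carries non-empty titles after the merge.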
    val pubDS: Dataset[Result] = spark.read
      .text(s"$workingDir/target/publication")
      .as[String]
      .map(s => SparkResolveEntities.deserializeObject(s, EntityType.publication))
    val t = pubDS
      .filter(p => p.getTitle != null && p.getSubject != null)
      .filter(p => p.getTitle.asScala.exists(t => t.getValue.equalsIgnoreCase("FAKETITLE")))
      .count()

    var ct = pubDS.count()
    var et = pubDS
      .filter(p => p.getTitle != null && p.getTitle.asScala.forall(t => t.getValue != null && t.getValue.nonEmpty))
      .count()

    assertEquals(ct, et)

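    // Datasets: same consistency check.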
    val datDS: Dataset[Result] = spark.read
      .text(s"$workingDir/target/dataset")
      .as[String]
      .map(s => SparkResolveEntities.deserializeObject(s, EntityType.dataset))
    val td = datDS
      .filter(p => p.getTitle != null && p.getSubject != null)
      .filter(p => p.getTitle.asScala.exists(t => t.getValue.equalsIgnoreCase("FAKETITLE")))
      .count()

    ct = datDS.count()
    et = datDS
      .filter(p => p.getTitle != null && p.getTitle.asScala.forall(t => t.getValue != null && t.getValue.nonEmpty))
      .count()
    assertEquals(ct, et)

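    // Software records: same consistency check.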
    val softDS: Dataset[Result] = spark.read
      .text(s"$workingDir/target/software")
      .as[String]
      .map(s => SparkResolveEntities.deserializeObject(s, EntityType.software))
    val ts = softDS
      .filter(p => p.getTitle != null && p.getSubject != null)
      .filter(p => p.getTitle.asScala.exists(t => t.getValue.equalsIgnoreCase("FAKETITLE")))
      .count()

    ct = softDS.count()
    et = softDS
      .filter(p => p.getTitle != null && p.getTitle.asScala.forall(t => t.getValue != null && t.getValue.nonEmpty))
      .count()
    assertEquals(ct, et)

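    // Other research products: same consistency check.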
    val orpDS: Dataset[Result] = spark.read
      .text(s"$workingDir/target/otherresearchproduct")
      .as[String]
      .map(s => SparkResolveEntities.deserializeObject(s, EntityType.otherresearchproduct))
    val to = orpDS
      .filter(p => p.getTitle != null && p.getSubject != null)
      .filter(p => p.getTitle.asScala.exists(t => t.getValue.equalsIgnoreCase("FAKETITLE")))
      .count()

    ct = orpDS.count()
    et = orpDS
      .filter(p => p.getTitle != null && p.getTitle.asScala.forall(t => t.getValue != null && t.getValue.nonEmpty))
      .count()
    assertEquals(ct, et)

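    // Expected number of records per type that picked up the fake title.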
    assertEquals(0, t)
    assertEquals(2, td)
    assertEquals(1, ts)
    assertEquals(0, to)
  }

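  // Smoke test: merges a Result carrying only the fake subject with a Publication read
  // from the test resources and prints the merged record.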
  @Test
  def testMerge(): Unit = {
    var r = new Result
    r.setSubject(
      List(
        OafMapperUtils.subject(
          FAKE_SUBJECT,
          OafMapperUtils.qualifier("fos", "fosCS", "fossSchema"),
          null
        )
      ).asJava
    )

    val mapper = new ObjectMapper()

    val p = mapper.readValue(
      Source
        .fromInputStream(this.getClass.getResourceAsStream(s"publication"))
        .mkString
        .linesWithSeparators
        .map(l => l.stripLineEnd)
        .next(),
      classOf[Publication]
    )

    r = MergeUtils.mergeResult(r, p)

    println(mapper.writeValueAsString(r))
  }
}