diff --git a/dhp-workflows/dhp-graph-mapper/src/main/java/eu/dnetlib/dhp/sx/bio/BioDBToOAF.scala b/dhp-workflows/dhp-graph-mapper/src/main/java/eu/dnetlib/dhp/sx/bio/BioDBToOAF.scala
index 3a3c2f94dd..2422a25dbe 100644
--- a/dhp-workflows/dhp-graph-mapper/src/main/java/eu/dnetlib/dhp/sx/bio/BioDBToOAF.scala
+++ b/dhp-workflows/dhp-graph-mapper/src/main/java/eu/dnetlib/dhp/sx/bio/BioDBToOAF.scala
@@ -66,6 +66,21 @@ object BioDBToOAF {
     )
   }
 
+  /** Maps one crossref_links JSON record to an OAF relation: the "Source" identifier is wrapped by
+    * generate_unresolved_id and passed as sourceId, the "Target" identifier as pid/pidType, and
+    * "RelationshipType"."Name" as relClass, collected from collectedFromMap("elsevier"). Ids and schemes
+    * are lower-cased with Locale.ROOT so the output does not depend on the JVM default locale. */
+  def crossrefLinksToOaf(input:String):Oaf = {
+    implicit val formats: DefaultFormats.type = org.json4s.DefaultFormats
+    val json = parse(input)
+    val source_pid = (json \ "Source" \ "Identifier" \ "ID").extract[String].toLowerCase(java.util.Locale.ROOT)
+    val source_pid_type = (json \ "Source" \ "Identifier" \ "IDScheme").extract[String].toLowerCase(java.util.Locale.ROOT)
+    val target_pid = (json \ "Target" \ "Identifier" \ "ID").extract[String].toLowerCase(java.util.Locale.ROOT)
+    val target_pid_type = (json \ "Target" \ "Identifier" \ "IDScheme").extract[String].toLowerCase(java.util.Locale.ROOT)
+    val relation_semantic = (json \ "RelationshipType" \ "Name").extract[String]
+    createRelation(target_pid, target_pid_type, generate_unresolved_id(source_pid, source_pid_type), collectedFromMap("elsevier"), "relationship", relation_semantic)
+  }
+
   def scholixResolvedToOAF(input:ScholixResolved):Oaf = {
 
 
@@ -213,11 +228,11 @@ object BioDBToOAF {
 
 
 
-
-  def crossrefLinkToRelation(input:String):Oaf = {
-    null
+  /** Formats a pid and its type as the id string "unresolved::<pid>::<pidType>". */
+  def generate_unresolved_id(pid:String, pidType:String) :String = {
+    s"unresolved::$pid::$pidType"
   }
 
   def createRelation(pid: String, pidType: String, sourceId: String, collectedFrom: KeyValue, subRelType:String, relClass:String):Relation = {
 
     val rel = new Relation
diff --git a/dhp-workflows/dhp-graph-mapper/src/main/java/eu/dnetlib/dhp/sx/bio/SparkTransformBioDatabaseToOAF.scala b/dhp-workflows/dhp-graph-mapper/src/main/java/eu/dnetlib/dhp/sx/bio/SparkTransformBioDatabaseToOAF.scala
index 3f81ec3a8e..1bca02a730 100644
--- 
a/dhp-workflows/dhp-graph-mapper/src/main/java/eu/dnetlib/dhp/sx/bio/SparkTransformBioDatabaseToOAF.scala +++ b/dhp-workflows/dhp-graph-mapper/src/main/java/eu/dnetlib/dhp/sx/bio/SparkTransformBioDatabaseToOAF.scala @@ -41,6 +41,8 @@ object SparkTransformBioDatabaseToOAF { spark.createDataset(sc.textFile(dbPath).flatMap(i => BioDBToOAF.pdbTOOaf(i))).write.mode(SaveMode.Overwrite).save(targetPath) case "SCHOLIX" => spark.read.load(dbPath).as[ScholixResolved].map(i => BioDBToOAF.scholixResolvedToOAF(i)).write.mode(SaveMode.Overwrite).save(targetPath) + case "CROSSREF_LINKS"=> + spark.createDataset(sc.textFile(dbPath).map(i => BioDBToOAF.crossrefLinksToOaf(i))).write.mode(SaveMode.Overwrite).save(targetPath) } } diff --git a/dhp-workflows/dhp-graph-mapper/src/main/resources/eu/dnetlib/dhp/sx/bio/oozie_app/workflow.xml b/dhp-workflows/dhp-graph-mapper/src/main/resources/eu/dnetlib/dhp/sx/bio/oozie_app/workflow.xml index d7f6538db4..90e2ae34f7 100644 --- a/dhp-workflows/dhp-graph-mapper/src/main/resources/eu/dnetlib/dhp/sx/bio/oozie_app/workflow.xml +++ b/dhp-workflows/dhp-graph-mapper/src/main/resources/eu/dnetlib/dhp/sx/bio/oozie_app/workflow.xml @@ -20,6 +20,10 @@ the Scholix Resolved Dataset Path + + CrossrefLinksPath + the CrossrefLinks Path + targetPath the Target Working dir path @@ -134,9 +138,40 @@ --databaseSCHOLIX --targetPath${targetPath}/scholix_resolved_OAF + + + + + + + + yarn + cluster + Convert Crossref Links to OAF Dataset + eu.dnetlib.dhp.sx.bio.SparkTransformBioDatabaseToOAF + dhp-graph-mapper-${projectVersion}.jar + + --executor-memory=${sparkExecutorMemory} + --executor-cores=${sparkExecutorCores} + --driver-memory=${sparkDriverMemory} + --conf spark.extraListeners=${spark2ExtraListeners} + --conf spark.sql.shuffle.partitions=2000 + --conf spark.sql.queryExecutionListeners=${spark2SqlQueryExecutionListeners} + --conf spark.yarn.historyServer.address=${spark2YarnHistoryServerAddress} + --conf spark.eventLog.dir=${nameNode}${spark2EventLogDir} + + 
--masteryarn --dbPath${CrossrefLinksPath} --databaseCROSSREF_LINKS --targetPath${targetPath}/crossref_unresolved_relation_OAF + + + + + \ No newline at end of file
diff --git a/dhp-workflows/dhp-graph-mapper/src/test/java/eu/dnetlib/dhp/sx/bio/pubmed/BioScholixTest.scala b/dhp-workflows/dhp-graph-mapper/src/test/java/eu/dnetlib/dhp/sx/bio/pubmed/BioScholixTest.scala
index f1c6b9e136..a23c6530f0 100644
--- a/dhp-workflows/dhp-graph-mapper/src/test/java/eu/dnetlib/dhp/sx/bio/pubmed/BioScholixTest.scala
+++ b/dhp-workflows/dhp-graph-mapper/src/test/java/eu/dnetlib/dhp/sx/bio/pubmed/BioScholixTest.scala
@@ -131,6 +131,22 @@ class BioScholixTest extends AbstractVocabularyTest{
 
   }
 
+  /** Checks that every line of the crossref_links fixture is non-empty and is accepted by BioDBToOAF.crossrefLinksToOaf. */
+  @Test
+  def testCrossrefLinksToOAF():Unit = {
+    // Read lines from the Source itself: on JDK 11+ `String.lines` resolves to java.lang.String#lines
+    // (a java.util.stream.Stream), which has no Scala foreach/map; this also lets us close the stream.
+    val source = Source.fromInputStream(getClass.getResourceAsStream("/eu/dnetlib/dhp/sx/bio/crossref_links"))
+    val records:List[String] = try source.getLines().toList finally source.close()
+    records.foreach(s => assertTrue(s.nonEmpty))
+
+    val result:List[Oaf] = records.map(s => BioDBToOAF.crossrefLinksToOaf(s))
+    assertNotNull(result)
+    assertTrue(result.nonEmpty)
+
+    println(mapper.writeValueAsString(result.head))
+  }
+
   @Test
   def testEBILinksToOAF():Unit = {
     val iterator = GzFileIterator(getClass.getResourceAsStream("/eu/dnetlib/dhp/sx/bio/ebi_links.gz"), "UTF-8")
diff --git a/dhp-workflows/dhp-graph-mapper/src/test/resources/eu/dnetlib/dhp/sx/bio/crossref_links b/dhp-workflows/dhp-graph-mapper/src/test/resources/eu/dnetlib/dhp/sx/bio/crossref_links
index 5eded83907..53f45f7d25 100644
--- a/dhp-workflows/dhp-graph-mapper/src/test/resources/eu/dnetlib/dhp/sx/bio/crossref_links
+++ b/dhp-workflows/dhp-graph-mapper/src/test/resources/eu/dnetlib/dhp/sx/bio/crossref_links
@@ -1,10 +1,16 @@
-{"LinkProvider": {"Name": "Elsevier"}, "Target": {"Identifier": {"ID": "P29964", "IDScheme": "ncbi-p", "IDURL": "https://www.ncbi.nlm.nih.gov/entrez/query.fcgi?cmd=search&db=protein&doptcmdl=genbank&term=P29964[accn]"}, "Type": {"Name": "dataset"}}, "Source": {"Publisher": {"Identifier": {"ID": 
"0141-8130", "IDScheme": "ISNI", "IDURL": "http://www.isni.org/isni/0141-8130"}, "Name": "International Journal of Biological Macromolecules"}, "Identifier": {"ID": "10.1016/j.ijbiomac.2017.09.060", "IDScheme": "DOI", "IDURL": "https://doi.org/10.1016/j.ijbiomac.2017.09.060"}, "Type": {"SubType": "journal article", "Name": "literature"}, "PublicationDate": "2018", "Title": "Molecular structure of cyclomaltodextrinase derived from amylolytic lactic acid bacterium "}, "LinkedPublicationDate": "2018", "LicenseURL": "https://creativecommons.org/licenses/by/4.0/", "RelationshipType": {"Name": "IsReferencedBy"}} -{"LinkProvider": {"Name": "Elsevier"}, "Target": {"Identifier": {"ID": "P56942", "IDScheme": "ncbi-p", "IDURL": "https://www.ncbi.nlm.nih.gov/entrez/query.fcgi?cmd=search&db=protein&doptcmdl=genbank&term=P56942[accn]"}, "Type": {"Name": "dataset"}}, "Source": {"Publisher": {"Identifier": {"ID": "0091-3022", "IDScheme": "ISNI", "IDURL": "http://www.isni.org/isni/0091-3022"}, "Name": "Frontiers in Neuroendocrinology"}, "Identifier": {"ID": "10.1016/j.yfrne.2010.09.001", "IDScheme": "DOI", "IDURL": "https://doi.org/10.1016/j.yfrne.2010.09.001"}, "Type": {"SubType": "journal article", "Name": "literature"}, "PublicationDate": "2011", "Title": "New aspects of melanocortin signaling: A role for PRCP in \u03b1-MSH degradation"}, "LinkedPublicationDate": "2018", "LicenseURL": "https://creativecommons.org/licenses/by/4.0/", "RelationshipType": {"Name": "IsReferencedBy"}} -{"LinkProvider": {"Name": "Elsevier"}, "Target": {"Identifier": {"ID": "Q9R0R4", "IDScheme": "ncbi-p", "IDURL": "https://www.ncbi.nlm.nih.gov/entrez/query.fcgi?cmd=search&db=protein&doptcmdl=genbank&term=Q9R0R4[accn]"}, "Type": {"Name": "dataset"}}, "Source": {"Publisher": {"Identifier": {"ID": "0091-3022", "IDScheme": "ISNI", "IDURL": "http://www.isni.org/isni/0091-3022"}, "Name": "Frontiers in Neuroendocrinology"}, "Identifier": {"ID": "10.1016/j.yfrne.2010.09.001", "IDScheme": "DOI", "IDURL": 
"https://doi.org/10.1016/j.yfrne.2010.09.001"}, "Type": {"SubType": "journal article", "Name": "literature"}, "PublicationDate": "2011", "Title": "New aspects of melanocortin signaling: A role for PRCP in \u03b1-MSH degradation"}, "LinkedPublicationDate": "2018", "LicenseURL": "https://creativecommons.org/licenses/by/4.0/", "RelationshipType": {"Name": "IsReferencedBy"}} -{"LinkProvider": {"Name": "Elsevier"}, "Target": {"Identifier": {"ID": "Q9EQX0", "IDScheme": "ncbi-p", "IDURL": "https://www.ncbi.nlm.nih.gov/entrez/query.fcgi?cmd=search&db=protein&doptcmdl=genbank&term=Q9EQX0[accn]"}, "Type": {"Name": "dataset"}}, "Source": {"Publisher": {"Identifier": {"ID": "0091-3022", "IDScheme": "ISNI", "IDURL": "http://www.isni.org/isni/0091-3022"}, "Name": "Frontiers in Neuroendocrinology"}, "Identifier": {"ID": "10.1016/j.yfrne.2010.09.001", "IDScheme": "DOI", "IDURL": "https://doi.org/10.1016/j.yfrne.2010.09.001"}, "Type": {"SubType": "journal article", "Name": "literature"}, "PublicationDate": "2011", "Title": "New aspects of melanocortin signaling: A role for PRCP in \u03b1-MSH degradation"}, "LinkedPublicationDate": "2018", "LicenseURL": "https://creativecommons.org/licenses/by/4.0/", "RelationshipType": {"Name": "IsReferencedBy"}} -{"LinkProvider": {"Name": "Elsevier"}, "Target": {"Identifier": {"ID": "NP_060522.3", "IDScheme": "ncbi-p", "IDURL": "https://www.ncbi.nlm.nih.gov/entrez/query.fcgi?cmd=search&db=protein&doptcmdl=genbank&term=NP_060522.3[accn]"}, "Type": {"Name": "dataset"}}, "Source": {"Publisher": {"Identifier": {"ID": "0002-9297", "IDScheme": "ISNI", "IDURL": "http://www.isni.org/isni/0002-9297"}, "Name": "The American Journal of Human Genetics"}, "Identifier": {"ID": "10.1016/j.ajhg.2016.05.008", "IDScheme": "DOI", "IDURL": "https://doi.org/10.1016/j.ajhg.2016.05.008"}, "Type": {"SubType": "journal article", "Name": "literature"}, "PublicationDate": "2016", "Title": "Biallelic Mutations of "}, "LinkedPublicationDate": "2018", "LicenseURL": 
"https://creativecommons.org/licenses/by/4.0/", "RelationshipType": {"Name": "IsReferencedBy"}} -{"LinkProvider": {"Name": "Elsevier"}, "Target": {"Identifier": {"ID": "NP_666328.2", "IDScheme": "ncbi-p", "IDURL": "https://www.ncbi.nlm.nih.gov/entrez/query.fcgi?cmd=search&db=protein&doptcmdl=genbank&term=NP_666328.2[accn]"}, "Type": {"Name": "dataset"}}, "Source": {"Publisher": {"Identifier": {"ID": "0002-9297", "IDScheme": "ISNI", "IDURL": "http://www.isni.org/isni/0002-9297"}, "Name": "The American Journal of Human Genetics"}, "Identifier": {"ID": "10.1016/j.ajhg.2016.05.008", "IDScheme": "DOI", "IDURL": "https://doi.org/10.1016/j.ajhg.2016.05.008"}, "Type": {"SubType": "journal article", "Name": "literature"}, "PublicationDate": "2016", "Title": "Biallelic Mutations of "}, "LinkedPublicationDate": "2018", "LicenseURL": "https://creativecommons.org/licenses/by/4.0/", "RelationshipType": {"Name": "IsReferencedBy"}} -{"LinkProvider": {"Name": "Elsevier"}, "Target": {"Identifier": {"ID": "NP_001025735.1", "IDScheme": "ncbi-p", "IDURL": "https://www.ncbi.nlm.nih.gov/entrez/query.fcgi?cmd=search&db=protein&doptcmdl=genbank&term=NP_001025735.1[accn]"}, "Type": {"Name": "dataset"}}, "Source": {"Publisher": {"Identifier": {"ID": "0002-9297", "IDScheme": "ISNI", "IDURL": "http://www.isni.org/isni/0002-9297"}, "Name": "The American Journal of Human Genetics"}, "Identifier": {"ID": "10.1016/j.ajhg.2016.05.008", "IDScheme": "DOI", "IDURL": "https://doi.org/10.1016/j.ajhg.2016.05.008"}, "Type": {"SubType": "journal article", "Name": "literature"}, "PublicationDate": "2016", "Title": "Biallelic Mutations of "}, "LinkedPublicationDate": "2018", "LicenseURL": "https://creativecommons.org/licenses/by/4.0/", "RelationshipType": {"Name": "IsReferencedBy"}} -{"LinkProvider": {"Name": "Elsevier"}, "Target": {"Identifier": {"ID": "XP_008119452.1", "IDScheme": "ncbi-p", "IDURL": 
"https://www.ncbi.nlm.nih.gov/entrez/query.fcgi?cmd=search&db=protein&doptcmdl=genbank&term=XP_008119452.1[accn]"}, "Type": {"Name": "dataset"}}, "Source": {"Publisher": {"Identifier": {"ID": "0002-9297", "IDScheme": "ISNI", "IDURL": "http://www.isni.org/isni/0002-9297"}, "Name": "The American Journal of Human Genetics"}, "Identifier": {"ID": "10.1016/j.ajhg.2016.05.008", "IDScheme": "DOI", "IDURL": "https://doi.org/10.1016/j.ajhg.2016.05.008"}, "Type": {"SubType": "journal article", "Name": "literature"}, "PublicationDate": "2016", "Title": "Biallelic Mutations of "}, "LinkedPublicationDate": "2018", "LicenseURL": "https://creativecommons.org/licenses/by/4.0/", "RelationshipType": {"Name": "IsReferencedBy"}} -{"LinkProvider": {"Name": "Elsevier"}, "Target": {"Identifier": {"ID": "XP_003964762.1", "IDScheme": "ncbi-p", "IDURL": "https://www.ncbi.nlm.nih.gov/entrez/query.fcgi?cmd=search&db=protein&doptcmdl=genbank&term=XP_003964762.1[accn]"}, "Type": {"Name": "dataset"}}, "Source": {"Publisher": {"Identifier": {"ID": "0002-9297", "IDScheme": "ISNI", "IDURL": "http://www.isni.org/isni/0002-9297"}, "Name": "The American Journal of Human Genetics"}, "Identifier": {"ID": "10.1016/j.ajhg.2016.05.008", "IDScheme": "DOI", "IDURL": "https://doi.org/10.1016/j.ajhg.2016.05.008"}, "Type": {"SubType": "journal article", "Name": "literature"}, "PublicationDate": "2016", "Title": "Biallelic Mutations of "}, "LinkedPublicationDate": "2018", "LicenseURL": "https://creativecommons.org/licenses/by/4.0/", "RelationshipType": {"Name": "IsReferencedBy"}} -{"LinkProvider": {"Name": "Elsevier"}, "Target": {"Identifier": {"ID": "XP_004208946.2", "IDScheme": "ncbi-p", "IDURL": "https://www.ncbi.nlm.nih.gov/entrez/query.fcgi?cmd=search&db=protein&doptcmdl=genbank&term=XP_004208946.2[accn]"}, "Type": {"Name": "dataset"}}, "Source": {"Publisher": {"Identifier": {"ID": "0002-9297", "IDScheme": "ISNI", "IDURL": "http://www.isni.org/isni/0002-9297"}, "Name": "The American Journal of Human 
Genetics"}, "Identifier": {"ID": "10.1016/j.ajhg.2016.05.008", "IDScheme": "DOI", "IDURL": "https://doi.org/10.1016/j.ajhg.2016.05.008"}, "Type": {"SubType": "journal article", "Name": "literature"}, "PublicationDate": "2016", "Title": "Biallelic Mutations of "}, "LinkedPublicationDate": "2018", "LicenseURL": "https://creativecommons.org/licenses/by/4.0/", "RelationshipType": {"Name": "IsReferencedBy"}} \ No newline at end of file +{"LinkProvider": {"Name": "Elsevier"}, "Target": {"Identifier": {"ID": "AEB31277", "IDScheme": "ncbi-p", "IDURL": "https://www.ncbi.nlm.nih.gov/entrez/query.fcgi?cmd=search&db=protein&doptcmdl=genbank&term=AEB31277[accn]"}, "Type": {"Name": "dataset"}}, "Source": {"Publisher": {"Identifier": {"ID": "0303-7207", "IDScheme": "ISNI", "IDURL": "http://www.isni.org/isni/0303-7207"}, "Name": "Molecular and Cellular Endocrinology"}, "Identifier": {"ID": "10.1016/j.mce.2012.11.015", "IDScheme": "DOI", "IDURL": "https://doi.org/10.1016/j.mce.2012.11.015"}, "Type": {"SubType": "journal article", "Name": "literature"}, "PublicationDate": "2013", "Title": "Identification of ovarian genes regulated by follicle-stimulating hormone (Fsh) in vitro during early secondary oocyte growth in coho salmon"}, "LinkedPublicationDate": "2018", "LicenseURL": "https://creativecommons.org/licenses/by/4.0/", "RelationshipType": {"Name": "IsReferencedBy"}} +{"LinkProvider": {"Name": "Elsevier"}, "Target": {"Identifier": {"ID": "CAG38743", "IDScheme": "ncbi-p", "IDURL": "https://www.ncbi.nlm.nih.gov/entrez/query.fcgi?cmd=search&db=protein&doptcmdl=genbank&term=CAG38743[accn]"}, "Type": {"Name": "dataset"}}, "Source": {"Publisher": {"Identifier": {"ID": "1095-6433", "IDScheme": "ISNI", "IDURL": "http://www.isni.org/isni/1095-6433"}, "Name": "Comparative Biochemistry and Physiology Part A: Molecular & Integrative Physiology"}, "Identifier": {"ID": "10.1016/j.cbpa.2012.04.025", "IDScheme": "DOI", "IDURL": "https://doi.org/10.1016/j.cbpa.2012.04.025"}, "Type": {"SubType": 
"journal article", "Name": "literature"}, "PublicationDate": "2012", "Title": "Mitogen activated protein kinase 14\u20101 regulates serum glucocorticoid kinase 1 during seawater acclimation in Atlantic killifish, "}, "LinkedPublicationDate": "2018", "LicenseURL": "https://creativecommons.org/licenses/by/4.0/", "RelationshipType": {"Name": "IsReferencedBy"}} +{"LinkProvider": {"Name": "Elsevier"}, "Target": {"Identifier": {"ID": "NP_031982", "IDScheme": "ncbi-p", "IDURL": "https://www.ncbi.nlm.nih.gov/entrez/query.fcgi?cmd=search&db=protein&doptcmdl=genbank&term=NP_031982[accn]"}, "Type": {"Name": "dataset"}}, "Source": {"Publisher": {"Identifier": {"ID": "0016-6480", "IDScheme": "ISNI", "IDURL": "http://www.isni.org/isni/0016-6480"}, "Name": "General and Comparative Endocrinology"}, "Identifier": {"ID": "10.1016/j.ygcen.2010.02.015", "IDScheme": "DOI", "IDURL": "https://doi.org/10.1016/j.ygcen.2010.02.015"}, "Type": {"SubType": "journal article", "Name": "literature"}, "PublicationDate": "2010", "Title": "Nucleotide sequence, tissue expression patterns and phylogenetic analysis of estrogen receptor one mRNA in the Murray rainbowfish ("}, "LinkedPublicationDate": "2018", "LicenseURL": "https://creativecommons.org/licenses/by/4.0/", "RelationshipType": {"Name": "IsReferencedBy"}} +{"LinkProvider": {"Name": "Elsevier"}, "Target": {"Identifier": {"ID": "CAD43599", "IDScheme": "ncbi-p", "IDURL": "https://www.ncbi.nlm.nih.gov/entrez/query.fcgi?cmd=search&db=protein&doptcmdl=genbank&term=CAD43599[accn]"}, "Type": {"Name": "dataset"}}, "Source": {"Publisher": {"Identifier": {"ID": "0016-6480", "IDScheme": "ISNI", "IDURL": "http://www.isni.org/isni/0016-6480"}, "Name": "General and Comparative Endocrinology"}, "Identifier": {"ID": "10.1016/j.ygcen.2010.02.015", "IDScheme": "DOI", "IDURL": "https://doi.org/10.1016/j.ygcen.2010.02.015"}, "Type": {"SubType": "journal article", "Name": "literature"}, "PublicationDate": "2010", "Title": "Nucleotide sequence, tissue expression 
patterns and phylogenetic analysis of estrogen receptor one mRNA in the Murray rainbowfish ("}, "LinkedPublicationDate": "2018", "LicenseURL": "https://creativecommons.org/licenses/by/4.0/", "RelationshipType": {"Name": "IsReferencedBy"}} +{"LinkProvider": {"Name": "Elsevier"}, "Target": {"Identifier": {"ID": "CAB45139", "IDScheme": "ncbi-p", "IDURL": "https://www.ncbi.nlm.nih.gov/entrez/query.fcgi?cmd=search&db=protein&doptcmdl=genbank&term=CAB45139[accn]"}, "Type": {"Name": "dataset"}}, "Source": {"Publisher": {"Identifier": {"ID": "0016-6480", "IDScheme": "ISNI", "IDURL": "http://www.isni.org/isni/0016-6480"}, "Name": "General and Comparative Endocrinology"}, "Identifier": {"ID": "10.1016/j.ygcen.2010.02.015", "IDScheme": "DOI", "IDURL": "https://doi.org/10.1016/j.ygcen.2010.02.015"}, "Type": {"SubType": "journal article", "Name": "literature"}, "PublicationDate": "2010", "Title": "Nucleotide sequence, tissue expression patterns and phylogenetic analysis of estrogen receptor one mRNA in the Murray rainbowfish ("}, "LinkedPublicationDate": "2018", "LicenseURL": "https://creativecommons.org/licenses/by/4.0/", "RelationshipType": {"Name": "IsReferencedBy"}} +{"LinkProvider": {"Name": "Elsevier"}, "Target": {"Identifier": {"ID": "NP_001117738", "IDScheme": "ncbi-p", "IDURL": "https://www.ncbi.nlm.nih.gov/entrez/query.fcgi?cmd=search&db=protein&doptcmdl=genbank&term=NP_001117738[accn]"}, "Type": {"Name": "dataset"}}, "Source": {"Publisher": {"Identifier": {"ID": "0143-4179", "IDScheme": "ISNI", "IDURL": "http://www.isni.org/isni/0143-4179"}, "Name": "Neuropeptides"}, "Identifier": {"ID": "10.1016/j.npep.2012.09.006", "IDScheme": "DOI", "IDURL": "https://doi.org/10.1016/j.npep.2012.09.006"}, "Type": {"SubType": "journal article", "Name": "literature"}, "PublicationDate": "2012", "Title": "Neuroendocrine control of feeding behavior and psychomotor activity by neuropeptideY in fish"}, "LinkedPublicationDate": "2018", "LicenseURL": 
"https://creativecommons.org/licenses/by/4.0/", "RelationshipType": {"Name": "IsReferencedBy"}} +{"LinkProvider": {"Name": "Elsevier"}, "Target": {"Identifier": {"ID": "P60709", "IDScheme": "ncbi-p", "IDURL": "https://www.ncbi.nlm.nih.gov/entrez/query.fcgi?cmd=search&db=protein&doptcmdl=genbank&term=P60709[accn]"}, "Type": {"Name": "dataset"}}, "Source": {"Publisher": {"Identifier": {"ID": "0006-291X", "IDScheme": "ISNI", "IDURL": "http://www.isni.org/isni/0006-291X"}, "Name": "Biochemical and Biophysical Research Communications"}, "Identifier": {"ID": "10.1016/j.bbrc.2010.05.079", "IDScheme": "DOI", "IDURL": "https://doi.org/10.1016/j.bbrc.2010.05.079"}, "Type": {"SubType": "journal article", "Name": "literature"}, "PublicationDate": "2010", "Title": "Proteomic analysis of ACTN4-interacting proteins reveals it\u2019s a putative involvement in mRNA metabolism"}, "LinkedPublicationDate": "2018", "LicenseURL": "https://creativecommons.org/licenses/by/4.0/", "RelationshipType": {"Name": "IsReferencedBy"}} +{"LinkProvider": {"Name": "Elsevier"}, "Target": {"Identifier": {"ID": "BAJ11577", "IDScheme": "ncbi-p", "IDURL": "https://www.ncbi.nlm.nih.gov/entrez/query.fcgi?cmd=search&db=protein&doptcmdl=genbank&term=BAJ11577[accn]"}, "Type": {"Name": "dataset"}}, "Source": {"Publisher": {"Identifier": {"ID": "0378-1119", "IDScheme": "ISNI", "IDURL": "http://www.isni.org/isni/0378-1119"}, "Name": "Gene"}, "Identifier": {"ID": "10.1016/j.gene.2012.06.011", "IDScheme": "DOI", "IDURL": "https://doi.org/10.1016/j.gene.2012.06.011"}, "Type": {"SubType": "journal article", "Name": "literature"}, "PublicationDate": "2012", "Title": "Isolation and characterization of a "}, "LinkedPublicationDate": "2018", "LicenseURL": "https://creativecommons.org/licenses/by/4.0/", "RelationshipType": {"Name": "IsReferencedBy"}} +{"LinkProvider": {"Name": "Elsevier"}, "Target": {"Identifier": {"ID": "BAI49900", "IDScheme": "ncbi-p", "IDURL": 
"https://www.ncbi.nlm.nih.gov/entrez/query.fcgi?cmd=search&db=protein&doptcmdl=genbank&term=BAI49900[accn]"}, "Type": {"Name": "dataset"}}, "Source": {"Publisher": {"Identifier": {"ID": "0378-1119", "IDScheme": "ISNI", "IDURL": "http://www.isni.org/isni/0378-1119"}, "Name": "Gene"}, "Identifier": {"ID": "10.1016/j.gene.2012.06.011", "IDScheme": "DOI", "IDURL": "https://doi.org/10.1016/j.gene.2012.06.011"}, "Type": {"SubType": "journal article", "Name": "literature"}, "PublicationDate": "2012", "Title": "Isolation and characterization of a "}, "LinkedPublicationDate": "2018", "LicenseURL": "https://creativecommons.org/licenses/by/4.0/", "RelationshipType": {"Name": "IsReferencedBy"}} +{"LinkProvider": {"Name": "Elsevier"}, "Target": {"Identifier": {"ID": "P06733", "IDScheme": "ncbi-p", "IDURL": "https://www.ncbi.nlm.nih.gov/entrez/query.fcgi?cmd=search&db=protein&doptcmdl=genbank&term=P06733[accn]"}, "Type": {"Name": "dataset"}}, "Source": {"Publisher": {"Identifier": {"ID": "0303-7207", "IDScheme": "ISNI", "IDURL": "http://www.isni.org/isni/0303-7207"}, "Name": "Molecular and Cellular Endocrinology"}, "Identifier": {"ID": "10.1016/j.mce.2010.05.022", "IDScheme": "DOI", "IDURL": "https://doi.org/10.1016/j.mce.2010.05.022"}, "Type": {"SubType": "journal article", "Name": "literature"}, "PublicationDate": "2010", "Title": "Proteomic approach reveals novel targets for retinoic acid-mediated therapy of thyroid carcinoma"}, "LinkedPublicationDate": "2018", "LicenseURL": "https://creativecommons.org/licenses/by/4.0/", "RelationshipType": {"Name": "IsReferencedBy"}} +{"LinkProvider": {"Name": "Elsevier"}, "Target": {"Identifier": {"ID": "Q15782", "IDScheme": "ncbi-p", "IDURL": "https://www.ncbi.nlm.nih.gov/entrez/query.fcgi?cmd=search&db=protein&doptcmdl=genbank&term=Q15782[accn]"}, "Type": {"Name": "dataset"}}, "Source": {"Publisher": {"Identifier": {"ID": "1570-9639", "IDScheme": "ISNI", "IDURL": "http://www.isni.org/isni/1570-9639"}, "Name": "Biochimica et Biophysica 
Acta (BBA) - Proteins and Proteomics"}, "Identifier": {"ID": "10.1016/j.bbapap.2012.01.011", "IDScheme": "DOI", "IDURL": "https://doi.org/10.1016/j.bbapap.2012.01.011"}, "Type": {"SubType": "journal article", "Name": "literature"}, "PublicationDate": "2012", "Title": "Proteomic analysis of secretion from human transplanted submandibular gland replacing lacrimal gland with severe keratoconjunctivitis sicca"}, "LinkedPublicationDate": "2018", "LicenseURL": "https://creativecommons.org/licenses/by/4.0/", "RelationshipType": {"Name": "IsReferencedBy"}} +{"LinkProvider": {"Name": "Elsevier"}, "Target": {"Identifier": {"ID": "P15515", "IDScheme": "ncbi-p", "IDURL": "https://www.ncbi.nlm.nih.gov/entrez/query.fcgi?cmd=search&db=protein&doptcmdl=genbank&term=P15515[accn]"}, "Type": {"Name": "dataset"}}, "Source": {"Publisher": {"Identifier": {"ID": "1570-9639", "IDScheme": "ISNI", "IDURL": "http://www.isni.org/isni/1570-9639"}, "Name": "Biochimica et Biophysica Acta (BBA) - Proteins and Proteomics"}, "Identifier": {"ID": "10.1016/j.bbapap.2012.01.011", "IDScheme": "DOI", "IDURL": "https://doi.org/10.1016/j.bbapap.2012.01.011"}, "Type": {"SubType": "journal article", "Name": "literature"}, "PublicationDate": "2012", "Title": "Proteomic analysis of secretion from human transplanted submandibular gland replacing lacrimal gland with severe keratoconjunctivitis sicca"}, "LinkedPublicationDate": "2018", "LicenseURL": "https://creativecommons.org/licenses/by/4.0/", "RelationshipType": {"Name": "IsReferencedBy"}} +{"LinkProvider": {"Name": "Elsevier"}, "Target": {"Identifier": {"ID": "P12273", "IDScheme": "ncbi-p", "IDURL": "https://www.ncbi.nlm.nih.gov/entrez/query.fcgi?cmd=search&db=protein&doptcmdl=genbank&term=P12273[accn]"}, "Type": {"Name": "dataset"}}, "Source": {"Publisher": {"Identifier": {"ID": "1570-9639", "IDScheme": "ISNI", "IDURL": "http://www.isni.org/isni/1570-9639"}, "Name": "Biochimica et Biophysica Acta (BBA) - Proteins and Proteomics"}, "Identifier": {"ID": 
"10.1016/j.bbapap.2012.01.011", "IDScheme": "DOI", "IDURL": "https://doi.org/10.1016/j.bbapap.2012.01.011"}, "Type": {"SubType": "journal article", "Name": "literature"}, "PublicationDate": "2012", "Title": "Proteomic analysis of secretion from human transplanted submandibular gland replacing lacrimal gland with severe keratoconjunctivitis sicca"}, "LinkedPublicationDate": "2018", "LicenseURL": "https://creativecommons.org/licenses/by/4.0/", "RelationshipType": {"Name": "IsReferencedBy"}} +{"LinkProvider": {"Name": "Elsevier"}, "Target": {"Identifier": {"ID": "FLJ21865", "IDScheme": "ncbi-p", "IDURL": "https://www.ncbi.nlm.nih.gov/entrez/query.fcgi?cmd=search&db=protein&doptcmdl=genbank&term=FLJ21865[accn]"}, "Type": {"Name": "dataset"}}, "Source": {"Publisher": {"Identifier": {"ID": "1368-8375", "IDScheme": "ISNI", "IDURL": "http://www.isni.org/isni/1368-8375"}, "Name": "Oral Oncology"}, "Identifier": {"ID": "10.1016/j.oraloncology.2011.11.010", "IDScheme": "DOI", "IDURL": "https://doi.org/10.1016/j.oraloncology.2011.11.010"}, "Type": {"SubType": "journal article", "Name": "literature"}, "PublicationDate": "2012", "Title": "Biomarker detection for the diagnosis of lymph node metastasis from oral squamous cell carcinoma"}, "LinkedPublicationDate": "2018", "LicenseURL": "https://creativecommons.org/licenses/by/4.0/", "RelationshipType": {"Name": "IsReferencedBy"}} +{"LinkProvider": {"Name": "Elsevier"}, "Target": {"Identifier": {"ID": "AAT74587", "IDScheme": "ncbi-p", "IDURL": "https://www.ncbi.nlm.nih.gov/entrez/query.fcgi?cmd=search&db=protein&doptcmdl=genbank&term=AAT74587[accn]"}, "Type": {"Name": "dataset"}}, "Source": {"Publisher": {"Identifier": {"ID": "0378-1119", "IDScheme": "ISNI", "IDURL": "http://www.isni.org/isni/0378-1119"}, "Name": "Gene"}, "Identifier": {"ID": "10.1016/j.gene.2014.06.013", "IDScheme": "DOI", "IDURL": "https://doi.org/10.1016/j.gene.2014.06.013"}, "Type": {"SubType": "journal article", "Name": "literature"}, "PublicationDate": "2014", 
"Title": "Molecular characterization of "}, "LinkedPublicationDate": "2018", "LicenseURL": "https://creativecommons.org/licenses/by/4.0/", "RelationshipType": {"Name": "IsReferencedBy"}} +{"LinkProvider": {"Name": "Elsevier"}, "Target": {"Identifier": {"ID": "P00746", "IDScheme": "ncbi-p", "IDURL": "https://www.ncbi.nlm.nih.gov/entrez/query.fcgi?cmd=search&db=protein&doptcmdl=genbank&term=P00746[accn]"}, "Type": {"Name": "dataset"}}, "Source": {"Publisher": {"Identifier": {"ID": "0002-9440", "IDScheme": "ISNI", "IDURL": "http://www.isni.org/isni/0002-9440"}, "Name": "The American Journal of Pathology"}, "Identifier": {"ID": "10.1016/j.ajpath.2011.10.024", "IDScheme": "DOI", "IDURL": "https://doi.org/10.1016/j.ajpath.2011.10.024"}, "Type": {"SubType": "journal article", "Name": "literature"}, "PublicationDate": "2012", "Title": "Age-Dependent Changes in the Cerebrospinal Fluid Proteome by Slow Off-Rate Modified Aptamer Array"}, "LinkedPublicationDate": "2018", "LicenseURL": "https://creativecommons.org/licenses/by/4.0/", "RelationshipType": {"Name": "IsReferencedBy"}} \ No newline at end of file diff --git a/dhp-workflows/dhp-graph-mapper/src/test/resources/eu/dnetlib/dhp/sx/bio/ebi_links.gz b/dhp-workflows/dhp-graph-mapper/src/test/resources/eu/dnetlib/dhp/sx/bio/ebi_links.gz index 0da111c144..9baef7de61 100644 Binary files a/dhp-workflows/dhp-graph-mapper/src/test/resources/eu/dnetlib/dhp/sx/bio/ebi_links.gz and b/dhp-workflows/dhp-graph-mapper/src/test/resources/eu/dnetlib/dhp/sx/bio/ebi_links.gz differ