Compare commits

...

36 Commits

Author SHA1 Message Date
Enrico Ottonello 64bc955444 new script to nquads download from scraping service 2022-07-19 12:12:01 +02:00
Enrico Ottonello 18c9b95cb1 removed duplicated subjects 2022-06-28 13:07:53 +02:00
Enrico Ottonello 33dcf9964c fixed alternate identifier 2022-05-18 12:02:27 +02:00
Enrico Ottonello 792e78e848 fixed alternate identifier redundant 2022-05-18 10:44:31 +02:00
Enrico Ottonello aef88f9e5c added accessrights and hostedby 2022-05-18 10:07:50 +02:00
Enrico Ottonello f6c37656c9 instance type set to 0046 - Bioentity 2022-05-18 09:46:43 +02:00
Enrico Ottonello 41de8fb785 added ped test with doi citation; fix pmid pid type 2022-05-13 12:27:40 +02:00
Enrico Ottonello 6d4235bd00 removed bmuse workflow module 2022-05-11 11:22:01 +02:00
Enrico Ottonello baa312f256 updated dhp-rdfconverter version to 1.2.5-SNAPSHOT 2022-05-11 11:20:16 +02:00
Enrico Ottonello 6fa9624c29 merge with beta for bioschemas
Merge branch 'beta' of https://code-repo.d4science.org/D-Net/dnet-hadoop into beta_bioschema
2022-05-11 10:56:03 +02:00
Enrico Ottonello 0703e0c65f converter input taken from textfile on hdfs with base64 gzipped rows 2022-05-11 10:43:13 +02:00
Enrico Ottonello 9a0ca0296a added mobidb constants configuration and test 2022-04-07 13:17:50 +02:00
Enrico Ottonello d0df02062c raised runtimeexception on record without title or url 2022-04-06 13:19:58 +02:00
Enrico Ottonello 7fc5b97871 skipped record without title or url 2022-04-06 13:08:48 +02:00
Enrico Ottonello a203c33693 added disprot constants configuration 2022-04-06 12:48:24 +02:00
Enrico Ottonello afb46d71f7 added subjects to disprot output 2022-04-06 12:22:10 +02:00
Enrico Ottonello 98178b3165 custom deserializer for property value type working for both ped and disprot 2022-04-05 10:47:17 +02:00
Enrico Ottonello f11dfc51f7 fix resolved url format, added alternate identifier from original pid 2022-03-22 16:39:21 +01:00
Enrico Ottonello afe84c4244 added subjects to oaf generation 2022-03-18 18:10:39 +01:00
Enrico Ottonello db831e6f43 removed dynamic allocation on wf 2022-03-18 17:43:53 +01:00
Enrico Ottonello 861f2a3306 added titles merging title page and protein identifier 2022-03-18 14:51:57 +01:00
Enrico Ottonello f43bfdb594 added subjects 2022-03-17 19:24:07 +01:00
Enrico Ottonello 3ef5eec3a6 added bmuse and rdfconverter modules - added repository for bmuse jars 2022-03-16 12:07:36 +01:00
Enrico Ottonello 41284ec2f9 retrieving vocabulary terms from nquads 2022-03-16 11:26:50 +01:00
Enrico Ottonello e53a606afc added date of collection, resource type as workflow parameter 2022-03-15 17:36:48 +01:00
Enrico Ottonello bd37f14941 added working ocean configuration 2022-03-03 14:38:21 +01:00
Enrico Ottonello 29ee1b9d82 added datasource key to workflow parameter to properly choose collected from and id values 2022-03-03 12:31:29 +01:00
Enrico Ottonello e57216a1fa added oozie workflow to generate bioschema dataset on hdfs 2022-03-02 16:58:10 +01:00
Enrico Ottonello f28d7e3b9d added spark dataset creation 2022-03-02 12:12:37 +01:00
Enrico Ottonello 8f281846a4 update test file 2022-02-28 13:37:53 +01:00
Enrico Ottonello f833de8a75 added relatedIdentifierType, fix IsCitedBy value 2022-02-28 13:37:28 +01:00
Enrico Ottonello 7f9636ef00 added alternateIdentifiers to oaf 2022-02-25 14:42:08 +01:00
Enrico Ottonello 2f5caef77b resolution of generated relations url to uniprot and pubmed datasources 2022-02-24 16:59:50 +01:00
Enrico Ottonello 4975278558 added modules for downloading data with bmuse and converting to datacite json format 2022-02-22 12:53:19 +01:00
Enrico Ottonello 2bc79c50f8 mapping bioschema to oaf 2022-02-22 11:46:29 +01:00
Enrico Ottonello 446f81ee60 wf to generate oaf from bioschema json datacite 2022-02-22 11:42:57 +01:00
32 changed files with 3469 additions and 0 deletions

View File

@ -0,0 +1,50 @@
[
{
"paramName": "s",
"paramLongName": "sourcePath",
"paramDescription": "the source mdstore path",
"paramRequired": false
},
{
"paramName": "t",
"paramLongName": "targetPath",
"paramDescription": "the path where the final dataset is stored",
"paramRequired": false
},
{
"paramName": "mo",
"paramLongName": "mdstoreOutputVersion",
"paramDescription": "the target mdstore path",
"paramRequired": false
},
{
"paramName": "m",
"paramLongName": "master",
"paramDescription": "the master name",
"paramRequired": true
},
{
"paramName": "i",
"paramLongName": "isLookupUrl",
"paramDescription": "the isLookup URL",
"paramRequired": false
},
{
"paramName": "l",
"paramLongName": "exportLinks",
"paramDescription": "whether links should also be exported",
"paramRequired": false
},
{
"paramName": "k",
"paramLongName": "datasourceKey",
"paramDescription": "the key that identifies the datasource",
"paramRequired": true
},
{
"paramName": "p",
"paramLongName": "profile",
"paramDescription": "resource profile",
"paramRequired": true
}
]

View File

@ -0,0 +1,84 @@
<configuration>
<!-- OCEAN -->
<!-- <property>-->
<!-- <name>jobTracker</name>-->
<!-- <value>yarnRM</value>-->
<!-- </property>-->
<!-- <property>-->
<!-- <name>nameNode</name>-->
<!-- <value>hdfs://nameservice1</value>-->
<!-- </property>-->
<!-- <property>-->
<!-- <name>oozie.use.system.libpath</name>-->
<!-- <value>true</value>-->
<!-- </property>-->
<!-- <property>-->
<!-- <name>oozie.action.sharelib.for.spark</name>-->
<!-- <value>spark2</value>-->
<!-- </property>-->
<!-- <property>-->
<!-- <name>oozie.launcher.mapreduce.user.classpath.first</name>-->
<!-- <value>true</value>-->
<!-- </property>-->
<!-- <property>-->
<!-- <name>spark2YarnHistoryServerAddress</name>-->
<!-- <value>http://hadoop-rm2.garr-pa1.d4science.org:19888</value>-->
<!-- </property>-->
<!-- <property>-->
<!-- <name>spark2EventLogDir</name>-->
<!-- <value>/user/spark/spark2ApplicationHistory</value>-->
<!-- </property>-->
<!-- <property>-->
<!-- <name>spark2ExtraListeners</name>-->
<!-- <value>"com.cloudera.spark.lineage.NavigatorAppListener"</value>-->
<!-- </property>-->
<!-- <property>-->
<!-- <name>spark2SqlQueryExecutionListeners</name>-->
<!-- <value>"com.cloudera.spark.lineage.NavigatorQueryListener"</value>-->
<!-- </property>-->
<!-- GARR -->
<property>
<name>jobTracker</name>
<value>hadoop-rm3.garr-pa1.d4science.org:8032</value>
</property>
<property>
<name>nameNode</name>
<value>hdfs://hadoop-rm1.garr-pa1.d4science.org:8020</value>
</property>
<property>
<name>hive_metastore_uris</name>
<value>thrift://hadoop-edge3.garr-pa1.d4science.org:9083</value>
</property>
<property>
<name>spark2YarnHistoryServerAddress</name>
<value>http://hadoop-rm2.garr-pa1.d4science.org:19888</value>
</property>
<property>
<name>oozie.launcher.mapreduce.user.classpath.first</name>
<value>true</value>
</property>
<property>
<name>oozie.use.system.libpath</name>
<value>true</value>
</property>
<property>
<name>oozie.action.sharelib.for.spark</name>
<value>spark2</value>
</property>
<property>
<name>spark2EventLogDir</name>
<value>/user/spark/spark2ApplicationHistory</value>
</property>
<property>
<name>spark2ExtraListeners</name>
<value>"com.cloudera.spark.lineage.NavigatorAppListener"</value>
</property>
<property>
<name>spark2SqlQueryExecutionListeners</name>
<value>"com.cloudera.spark.lineage.NavigatorQueryListener"</value>
</property>
</configuration>

View File

@ -0,0 +1,134 @@
<workflow-app name="generate_bioschema" xmlns="uri:oozie:workflow:0.5">
<!--
Oozie workflow that clears ${mainPath}/dataset and then runs the Spark job
GenerateBioschemaDatasetSpark, reading ${mainPath}/json-datacite and writing ${mainPath}/dataset.
Path followed from the start node as written: ResetDataset, then TransformJob, then End.
-->
<parameters>
<property>
<name>mainPath</name>
<value>/data/bioschema/mobidb</value>
<description>the working path of Bioschema stores</description>
</property>
<property>
<name>datasourceKey</name>
<value>mobidb</value>
<description>the key that identifies the datasource (eg ped, disprot, mobidb)</description>
</property>
<property>
<name>profile</name>
<value>protein</value>
<description>resource profile (eg protein, gene)</description>
</property>
</parameters>
<start to="ResetDataset"/>
<kill name="Kill">
<message>Action failed, error message[${wf:errorMessage(wf:lastErrorNode())}]</message>
</kill>
<!-- Removes the content of the previous run's output directory before transforming again. -->
<action name="ResetDataset">
<fs>
<delete path='${mainPath}/dataset/*'/>
</fs>
<ok to="TransformJob"/>
<error to="Kill"/>
</action>
<!--
NOTE(review): no transition reachable from the start node targets StartTransaction
(ResetDataset goes straight to TransformJob), so this action and the MDStore actions
CommitVersion, EndReadRollBack and RollBack below are never executed as written.
They also use mdStoreOutputId and mdStoreManagerURI, which are not declared in the
parameters section above. Confirm whether the MDStore transaction should be wired in or removed.
-->
<action name="StartTransaction">
<java>
<configuration>
<property>
<name>oozie.launcher.mapreduce.user.classpath.first</name>
<value>true</value>
</property>
</configuration>
<main-class>eu.dnetlib.dhp.aggregation.mdstore.MDStoreActionNode</main-class>
<arg>--action</arg><arg>NEW_VERSION</arg>
<arg>--mdStoreID</arg><arg>${mdStoreOutputId}</arg>
<arg>--mdStoreManagerURI</arg><arg>${mdStoreManagerURI}</arg>
<capture-output/>
</java>
<ok to="TransformJob"/>
<error to="EndReadRollBack"/>
</action>
<!--
Spark job mapping the JSON/Datacite records to OAF. exportLinks is fixed to true here;
datasourceKey and profile come from the workflow parameters. On success the workflow ends,
it does not continue to CommitVersion.
-->
<action name="TransformJob">
<spark xmlns="uri:oozie:spark-action:0.2">
<master>yarn-cluster</master>
<mode>cluster</mode>
<name>TransformJob</name>
<class>eu.dnetlib.dhp.bioschema.GenerateBioschemaDatasetSpark</class>
<jar>dhp-aggregation-${projectVersion}.jar</jar>
<spark-opts>
--executor-memory=${sparkExecutorMemory}
--executor-cores=${sparkExecutorCores}
--driver-memory=${sparkDriverMemory}
--conf spark.sql.shuffle.partitions=3840
--conf spark.extraListeners=${spark2ExtraListeners}
--conf spark.sql.queryExecutionListeners=${spark2SqlQueryExecutionListeners}
--conf spark.yarn.historyServer.address=${spark2YarnHistoryServerAddress}
--conf spark.eventLog.dir=${nameNode}${spark2EventLogDir}
</spark-opts>
<arg>--sourcePath</arg><arg>${mainPath}/json-datacite</arg>
<arg>--targetPath</arg><arg>${mainPath}/dataset</arg>
<arg>--exportLinks</arg><arg>true</arg>
<arg>--datasourceKey</arg><arg>${datasourceKey}</arg>
<arg>--profile</arg><arg>${profile}</arg>
<arg>--master</arg><arg>yarn-cluster</arg>
</spark>
<ok to="End"/>
<error to="Kill"/>
</action>
<!-- NOTE(review): not targeted by any transition in this workflow; reads the output of StartTransaction. -->
<action name="CommitVersion">
<java>
<configuration>
<property>
<name>oozie.launcher.mapreduce.user.classpath.first</name>
<value>true</value>
</property>
</configuration>
<main-class>eu.dnetlib.dhp.aggregation.mdstore.MDStoreActionNode</main-class>
<arg>--action</arg><arg>COMMIT</arg>
<arg>--namenode</arg><arg>${nameNode}</arg>
<arg>--mdStoreVersion</arg><arg>${wf:actionData('StartTransaction')['mdStoreVersion']}</arg>
<arg>--mdStoreManagerURI</arg><arg>${mdStoreManagerURI}</arg>
</java>
<ok to="End"/>
<error to="Kill"/>
</action>
<!--
NOTE(review): the readMDStoreId argument reads wf:actionData('BeginRead'), but this workflow
defines no action named BeginRead. Only the error transition of StartTransaction leads here.
-->
<action name="EndReadRollBack">
<java>
<configuration>
<property>
<name>oozie.launcher.mapreduce.user.classpath.first</name>
<value>true</value>
</property>
</configuration>
<main-class>eu.dnetlib.dhp.aggregation.mdstore.MDStoreActionNode</main-class>
<arg>--action</arg><arg>READ_UNLOCK</arg>
<arg>--mdStoreManagerURI</arg><arg>${mdStoreManagerURI}</arg>
<arg>--readMDStoreId</arg><arg>${wf:actionData('BeginRead')['mdStoreReadLockVersion']}</arg>
<capture-output/>
</java>
<ok to="RollBack"/>
<error to="Kill"/>
</action>
<!-- Rolls back the MDStore version opened by StartTransaction; both outcomes end in Kill. -->
<action name="RollBack">
<java>
<configuration>
<property>
<name>oozie.launcher.mapreduce.user.classpath.first</name>
<value>true</value>
</property>
</configuration>
<main-class>eu.dnetlib.dhp.aggregation.mdstore.MDStoreActionNode</main-class>
<arg>--action</arg><arg>ROLLBACK</arg>
<arg>--mdStoreVersion</arg><arg>${wf:actionData('StartTransaction')['mdStoreVersion']}</arg>
<arg>--mdStoreManagerURI</arg><arg>${mdStoreManagerURI}</arg>
</java>
<ok to="Kill"/>
<error to="Kill"/>
</action>
<end name="End"/>
</workflow-app>

View File

@ -0,0 +1,308 @@
package eu.dnetlib.dhp.bioschema
import eu.dnetlib.dhp.schema.common.ModelConstants
import eu.dnetlib.dhp.schema.oaf.{DataInfo, KeyValue, Qualifier}
import eu.dnetlib.dhp.schema.oaf.utils.OafMapperUtils
import java.time.format.DateTimeFormatter
import java.util.Locale
import java.util.regex.Pattern
/*
The following classes are utility classes used for mapping
bioschema JSON (Datacite format) to the OAF schema
*/
/** One `relatedIdentifiers` entry: the relation type, the related identifier and its type. */
case class RelatedIdentifierType(relationType: String, relatedIdentifier: String, relatedIdentifierType: String)

/** One `alternateIdentifiers` entry. */
case class AlternateIdentifierType(alternateIdentifier: String)

/** One `identifiers` entry: the identifier value and its type. */
case class IdentifierType(identifier: String, identifierType: String)

/** Name identifier of a creator; every field is optional. */
case class NameIdentifiersType(
  nameIdentifierScheme: Option[String],
  schemeUri: Option[String],
  nameIdentifier: Option[String]
)

/** Creator description; every field is optional. */
case class CreatorType(
  nameType: Option[String],
  nameIdentifiers: Option[List[NameIdentifiersType]],
  name: Option[String],
  familyName: Option[String],
  givenName: Option[String],
  affiliation: Option[List[String]]
)

/** One `titles` entry. */
case class TitleType(
  title: Option[String],
  titleType: Option[String],
  lang: Option[String]
)

/** One `subjects` entry: the subject value with its scheme and scheme URI. */
case class SubjectType(schemeURI: Option[String], value: Option[String], subjectScheme: Option[String])

/** One `descriptions` entry. */
case class DescriptionType(
  descriptionType: Option[String],
  description: Option[String]
)

/** One `dates` entry: the raw date string and its date type. */
case class DateType(
  date: Option[String],
  dateType: Option[String]
)

/** A relation name together with its inverse relation name and its sub-relation type. */
case class OAFRelations(
  relation: String,
  inverse: String,
  relType: String
)
/** Serializable class sharing its name with the constants object below. */
class BioschemaModelConstants extends Serializable {}

/** Constants and lookup tables used when mapping bioschema JSON/Datacite records to OAF. */
object BioschemaModelConstants {

  /** Qualifier (class id "0046", class name "Bioentity") used for protein records. */
  val PROTEIN_RESOURCETYPE: Qualifier =
    qualifier("0046", "Bioentity", ModelConstants.DNET_PUBLICATION_RESOURCE, ModelConstants.DNET_PUBLICATION_RESOURCE)

  /** DataInfo with trust "0.9"; a distinct instance from [[dataInfo]] but built the same way. */
  val DATA_INFO: DataInfo = bioschemaDataInfo("0.9")

  val PED_PREFIX: String = "fsh_____3595"
  val DISPROT_PREFIX: String = "fsh_____1904"
  val MOBIDB_PREFIX: String = "fsh_____2176"

  /** URL prefix -> pid type assigned to the identifier that follows the prefix. */
  val resolvedURLPattern: Map[String, String] = Map(
    "https://identifiers.org/pubmed:"  -> "pmid",
    "http://purl.uniprot.org/uniprot/" -> "uniprot",
    "https://identifiers.org/uniprot:" -> "uniprot",
    "https://identifiers.org/disprot:" -> "disprot",
    "https://identifiers.org/mobidb:"  -> "mobidb",
    "https://doi.org/"                 -> "doi"
  )

  /** Datasource key -> "collected from" KeyValue (datasource id and name) carrying [[DATA_INFO]]. */
  val collectedFromMap: Map[String, KeyValue] = {
    def datasource(id: String, name: String): KeyValue = {
      val collectedFrom = OafMapperUtils.keyValue(id, name)
      collectedFrom.setDataInfo(DATA_INFO)
      collectedFrom
    }
    Map(
      "ped"     -> datasource("10|fairsharing_::c0e8517b1fe0b5270f3f41d4b56d6118", "Protein Ensemble Database"),
      "disprot" -> datasource("10|fairsharing_::c91591a8d461c2869b9f535ded3e213e", "Database of Protein Disorder"),
      "mobidb"  -> datasource("10|fairsharing_::0234c510bc6d908b28c70ff313743079", "MobiDB")
    )
  }

  /** Datasource key -> namespace prefix of that datasource. */
  val datasourceKeyPrefix: Map[String, String] = Map(
    "ped"     -> PED_PREFIX,
    "disprot" -> DISPROT_PREFIX,
    "mobidb"  -> MOBIDB_PREFIX
  )

  val REL_TYPE_VALUE: String = "resultResult"
  val DATE_RELATION_KEY = "RelationDate"
  val dataInfo: DataInfo = bioschemaDataInfo("0.9")

  /** Relation name -> (relation, inverse relation, sub-relation type).
    *
    * Each key is declared exactly once; the original listing repeated the
    * DOCUMENTS / IS_DOCUMENTED_BY pair with identical values.
    */
  val subRelTypeMapping: Map[String, OAFRelations] = {
    def entry(relation: String, inverse: String, subRelType: String): (String, OAFRelations) =
      relation -> OAFRelations(relation, inverse, subRelType)

    Map(
      entry(ModelConstants.REFERENCES, ModelConstants.IS_REFERENCED_BY, ModelConstants.RELATIONSHIP),
      entry(ModelConstants.IS_REFERENCED_BY, ModelConstants.REFERENCES, ModelConstants.RELATIONSHIP),
      entry(ModelConstants.IS_SUPPLEMENTED_BY, ModelConstants.IS_SUPPLEMENT_TO, ModelConstants.SUPPLEMENT),
      entry(ModelConstants.IS_SUPPLEMENT_TO, ModelConstants.IS_SUPPLEMENTED_BY, ModelConstants.SUPPLEMENT),
      entry(ModelConstants.HAS_PART, ModelConstants.IS_PART_OF, ModelConstants.PART),
      entry(ModelConstants.IS_PART_OF, ModelConstants.HAS_PART, ModelConstants.PART),
      entry(ModelConstants.IS_VERSION_OF, ModelConstants.HAS_VERSION, ModelConstants.VERSION),
      entry(ModelConstants.HAS_VERSION, ModelConstants.IS_VERSION_OF, ModelConstants.VERSION),
      entry(ModelConstants.IS_IDENTICAL_TO, ModelConstants.IS_IDENTICAL_TO, ModelConstants.RELATIONSHIP),
      entry(ModelConstants.IS_CONTINUED_BY, ModelConstants.CONTINUES, ModelConstants.RELATIONSHIP),
      entry(ModelConstants.CONTINUES, ModelConstants.IS_CONTINUED_BY, ModelConstants.RELATIONSHIP),
      entry(ModelConstants.IS_NEW_VERSION_OF, ModelConstants.IS_PREVIOUS_VERSION_OF, ModelConstants.VERSION),
      entry(ModelConstants.IS_PREVIOUS_VERSION_OF, ModelConstants.IS_NEW_VERSION_OF, ModelConstants.VERSION),
      entry(ModelConstants.IS_DOCUMENTED_BY, ModelConstants.DOCUMENTS, ModelConstants.RELATIONSHIP),
      entry(ModelConstants.DOCUMENTS, ModelConstants.IS_DOCUMENTED_BY, ModelConstants.RELATIONSHIP),
      entry(ModelConstants.IS_SOURCE_OF, ModelConstants.IS_DERIVED_FROM, ModelConstants.VERSION),
      entry(ModelConstants.IS_DERIVED_FROM, ModelConstants.IS_SOURCE_OF, ModelConstants.VERSION),
      entry(ModelConstants.CITES, ModelConstants.IS_CITED_BY, ModelConstants.CITATION),
      entry(ModelConstants.IS_CITED_BY, ModelConstants.CITES, ModelConstants.CITATION),
      entry(ModelConstants.IS_VARIANT_FORM_OF, ModelConstants.IS_DERIVED_FROM, ModelConstants.VERSION),
      entry(ModelConstants.IS_OBSOLETED_BY, ModelConstants.IS_NEW_VERSION_OF, ModelConstants.VERSION),
      entry(ModelConstants.REVIEWS, ModelConstants.IS_REVIEWED_BY, ModelConstants.REVIEW),
      entry(ModelConstants.IS_REVIEWED_BY, ModelConstants.REVIEWS, ModelConstants.REVIEW),
      entry(ModelConstants.COMPILES, ModelConstants.IS_COMPILED_BY, ModelConstants.RELATIONSHIP),
      entry(ModelConstants.IS_COMPILED_BY, ModelConstants.COMPILES, ModelConstants.RELATIONSHIP)
    )
  }

  /** Builds the DataInfo attached to generated records.
    *
    * @param trust trust value passed as the last argument of `OafMapperUtils.dataInfo`
    * @return a new DataInfo using the PROVENANCE_ACTION_SET_QUALIFIER provenance action
    */
  def bioschemaDataInfo(trust: String): DataInfo = OafMapperUtils.dataInfo(
    false,
    null,
    false,
    false,
    ModelConstants.PROVENANCE_ACTION_SET_QUALIFIER,
    trust
  )

  /** Date formatter made of optional sections, using the English locale. */
  val df_en: DateTimeFormatter = DateTimeFormatter.ofPattern(
    "[MM-dd-yyyy][MM/dd/yyyy][dd-MM-yy][dd-MMM-yyyy][dd/MMM/yyyy][dd-MMM-yy][dd/MMM/yy][dd-MM-yy][dd/MM/yy][dd-MM-yyyy][dd/MM/yyyy][yyyy-MM-dd][yyyy/MM/dd]",
    Locale.ENGLISH
  )

  /** Date formatter for day-month-year dates, using the Italian locale. */
  val df_it: DateTimeFormatter =
    DateTimeFormatter.ofPattern("[dd-MM-yyyy][dd/MM/yyyy]", Locale.ITALIAN)

  /** Patterns used to locate a date inside free text, listed in the order they are tried. */
  val Date_regex: List[Pattern] = List(
    //Y-M-D
    Pattern.compile(
      "(18|19|20)\\d\\d([- /.])(0[1-9]|1[012])\\2(0[1-9]|[12][0-9]|3[01])",
      Pattern.MULTILINE
    ),
    //M-D-Y
    Pattern.compile(
      "((0[1-9]|1[012])|([1-9]))([- /.])(0[1-9]|[12][0-9]|3[01])([- /.])(18|19|20)?\\d\\d",
      Pattern.MULTILINE
    ),
    //D-M-Y
    Pattern.compile(
      "(?:(?:31(/|-|\\.)(?:0?[13578]|1[02]|(?:Jan|Mar|May|Jul|Aug|Oct|Dec)))\\1|(?:(?:29|30)(/|-|\\.)(?:0?[1,3-9]|1[0-2]|(?:Jan|Mar|Apr|May|Jun|Jul|Aug|Sep|Oct|Nov|Dec))\\2))(?:(?:1[6-9]|[2-9]\\d)?\\d{2})|(?:29(/|-|\\.)(?:0?2|(?:Feb))\\3(?:(?:(?:1[6-9]|[2-9]\\d)?(?:0[48]|[2468][048]|[13579][26])|(?:(?:16|[2468][048]|[3579][26])00))))|(?:0?[1-9]|1\\d|2[0-8])(/|-|\\.)(?:(?:0?[1-9]|(?:Jan|Feb|Mar|Apr|May|Jun|Jul|Aug|Sep))|(?:1[0-2]|(?:Oct|Nov|Dec)))\\4(?:(?:1[6-9]|[2-9]\\d)?\\d{2})",
      Pattern.MULTILINE
    ),
    //Y
    Pattern.compile("(19|20)\\d\\d", Pattern.MULTILINE)
  )

  /** Creates a Qualifier with the given class id/name and scheme id/name. */
  private def qualifier(classid: String, classname: String, schemeid: String, schemename: String) = {
    val q = new Qualifier
    q.setClassid(classid)
    q.setClassname(classname)
    q.setSchemeid(schemeid)
    q.setSchemename(schemename)
    q
  }
}

View File

@ -0,0 +1,308 @@
package eu.dnetlib.dhp.bioschema
import com.fasterxml.jackson.databind.ObjectMapper
import eu.dnetlib.dhp.bioschema.BioschemaModelConstants._
import eu.dnetlib.dhp.schema.common.ModelConstants
import eu.dnetlib.dhp.schema.oaf.utils.{IdentifierFactory, OafMapperUtils}
import eu.dnetlib.dhp.schema.oaf.{Dataset => OafDataset, _}
import eu.dnetlib.dhp.utils.DHPUtils
import org.apache.commons.lang3.StringUtils
import org.json4s.DefaultFormats
import org.json4s.JsonAST.{JField, JObject, JString}
import org.json4s.jackson.JsonMethods.parse
import java.time.LocalDate
import scala.collection.JavaConverters._
/** Maps one bioschema JSON/Datacite record to OAF entities (a result plus, optionally, its relations). */
object BioschemaToOAFTransformation {

  import scala.util.Try

  val mapper = new ObjectMapper()

  /** Finds the first date-like substring of `input` and normalises it to ISO format (yyyy-MM-dd).
    *
    * The patterns of `Date_regex` are tried in order. A bare year is expanded to
    * "01-01-<year>" before parsing. Parsing is attempted with `df_en` first, then `df_it`.
    *
    * @param input free text possibly containing a date
    * @return the ISO date, or None when input is null, no pattern matches, or no formatter can parse the match
    */
  def extract_date(input: String): Option[String] = {
    if (input == null)
      return None
    Date_regex.iterator
      .map(pattern => pattern.matcher(input))
      .find(matcher => matcher.find())
      .map(matcher => matcher.group(0))
      .flatMap { found =>
        val candidate = if (found.length == 4) s"01-01-$found" else found
        // Try only intercepts non-fatal errors, unlike the previous catch of Throwable.
        Try(LocalDate.parse(candidate, df_en))
          .orElse(Try(LocalDate.parse(candidate, df_it)))
          .toOption
          .map(date => date.toString)
      }
  }

  /** Creates the empty OAF result for the given resource class.
    *
    * @param resourceClassName resource profile name, compared case-insensitively
    * @return a Dataset with one Instance typed as PROTEIN_RESOURCETYPE for "protein";
    *         null for any other profile (previously a MatchError was thrown instead)
    */
  def getResult(resourceClassName: String): Result = {
    // Locale.ROOT keeps the comparison independent of the JVM default locale.
    resourceClassName.toUpperCase(java.util.Locale.ROOT) match {
      case "PROTEIN" =>
        val instance = new Instance
        instance.setInstancetype(PROTEIN_RESOURCETYPE)
        val dataset = new OafDataset
        dataset.setInstance(List(instance).asJava)
        dataset.setResourcetype(PROTEIN_RESOURCETYPE)
        dataset
      case _ => null
    }
  }

  /** Wraps a date string and its qualifier into a StructuredProperty (without DataInfo). */
  def generateOAFDate(dt: String, q: Qualifier): StructuredProperty = {
    OafMapperUtils.structuredProperty(dt, q, null)
  }

  /** Transforms one JSON/Datacite record into OAF objects.
    *
    * @param input             the JSON record
    * @param exportLinks       when true, relations are generated from `relatedIdentifiers`
    * @param datasourceKey     key into `collectedFromMap` / `datasourceKeyPrefix` (an unknown key throws)
    * @param resourceClassName resource profile, see [[getResult]]
    * @return the result followed by its relations; an empty list when the profile is not
    *         supported or no identifier could be created for the result
    * @throws RuntimeException when the record has no title or no url
    */
  def generateOAF(
    input: String,
    exportLinks: Boolean,
    datasourceKey: String,
    resourceClassName: String
  ): List[Oaf] = {
    implicit lazy val formats: DefaultFormats.type = org.json4s.DefaultFormats
    // Lazy: records of an unsupported profile are discarded without being parsed.
    lazy val json = parse(input)

    val result = getResult(resourceClassName)
    if (result == null)
      return List()

    val pid = (json \ "id").extract[String]
    result.setPid(
      List(
        OafMapperUtils.structuredProperty(
          pid,
          datasourceKey,
          datasourceKey,
          ModelConstants.DNET_PID_TYPES,
          ModelConstants.DNET_PID_TYPES,
          DATA_INFO
        )
      ).asJava
    )
    result.setId(OafMapperUtils.createOpenaireId(50, s"${datasourceKeyPrefix(datasourceKey)}::$pid", true))
    result.setOriginalId(List(pid).asJava)
    result.setDataInfo(dataInfo)

    val titles: List[TitleType] = (json \\ "titles").extractOrElse[List[TitleType]](List())
    if (titles.isEmpty) {
      throw new RuntimeException("Title not found")
    }
    result.setTitle(
      titles
        .filter(t => t.title.nonEmpty)
        .map(t => OafMapperUtils.structuredProperty(t.title.get, ModelConstants.MAIN_TITLE_QUALIFIER, dataInfo))
        .asJava
    )

    val dates = (json \\ "dates").extract[List[DateType]]
    // Only the first complete date entry of type "collected" is considered.
    val collectedDate = dates
      .collectFirst {
        case DateType(Some(rawDate), Some(dateType)) if dateType.equalsIgnoreCase("collected") => rawDate
      }
      .flatMap(rawDate => extract_date(rawDate))
    collectedDate.foreach(date => result.setDateofcollection(date))

    result.setRelevantdate(
      dates.flatMap {
        case DateType(Some(rawDate), Some(dateType)) =>
          for {
            parsed <- extract_date(rawDate).toList
            dateQualifier <- Option(
              OafMapperUtils.qualifier(
                dateType.toLowerCase(),
                dateType.toLowerCase(),
                ModelConstants.DNET_DATACITE_DATE,
                ModelConstants.DNET_DATACITE_DATE
              )
            ).toList
          } yield generateOAFDate(parsed, dateQualifier)
        case _ => Nil
      }.asJava
    )

    result.setCollectedfrom(List(collectedFromMap(datasourceKey)).asJava)

    val descriptions = (json \\ "descriptions").extract[List[DescriptionType]]
    result.setDescription(
      descriptions
        .filter(d => d.description.isDefined)
        .map(d => OafMapperUtils.field(d.description.get, null))
        .filter(s => s != null)
        .asJava
    )

    val subjects = (json \\ "subjects").extract[List[SubjectType]]
    result.setSubject(
      subjects
        .filter(s => s.value.nonEmpty && s.subjectScheme.nonEmpty && s.schemeURI.nonEmpty)
        .map(s =>
          OafMapperUtils.structuredProperty(
            s.value.get,
            s.subjectScheme.get,
            s.schemeURI.get,
            ModelConstants.DNET_SUBJECT_TYPOLOGIES,
            ModelConstants.DNET_SUBJECT_TYPOLOGIES,
            null
          )
        )
        .asJava
    )

    val instance = result.getInstance().get(0)
    val ids: List[IdentifierType] = for {
      JObject(identifiers)                              <- json \\ "identifiers"
      JField("identifier", JString(identifier))         <- identifiers
      JField("identifierType", JString(identifierType)) <- identifiers
    } yield IdentifierType(identifier, identifierType)
    instance.setUrl(ids.map(id => id.identifier).asJava)
    if (instance.getUrl.isEmpty) {
      throw new RuntimeException("Url not found")
    }
    instance.setCollectedfrom(collectedFromMap(datasourceKey))
    instance.setHostedby(collectedFromMap(datasourceKey))
    instance.setPid(result.getPid)

    result.setId(IdentifierFactory.createIdentifier(result))
    if (result.getId == null)
      return List()

    val alternativeIdentifierUrls: List[AlternateIdentifierType] = for {
      JObject(alternateIdentifiers)                               <- json \\ "alternateIdentifiers"
      JField("alternateIdentifier", JString(alternateIdentifier)) <- alternateIdentifiers
    } yield AlternateIdentifierType(alternateIdentifier)
    // headOption: a record without alternate identifiers no longer fails with
    // IndexOutOfBoundsException, it simply gets no alternate identifier.
    val alternateIdentifier = alternativeIdentifierUrls.headOption.flatMap { alternative =>
      val url = alternative.alternateIdentifier
      resolvedURLPattern.collectFirst {
        // prefixes that mention the record's own datasource are not alternate identifiers
        case (prefix, pidType) if !prefix.contains(datasourceKey) && url.startsWith(prefix) =>
          OafMapperUtils.structuredProperty(
            StringUtils.substringAfter(url, prefix),
            pidType,
            pidType,
            ModelConstants.DNET_PID_TYPES,
            ModelConstants.DNET_PID_TYPES,
            dataInfo
          )
      }
    }
    alternateIdentifier.foreach(identifier => instance.setAlternateIdentifier(List(identifier).asJava))

    instance.setAccessright(
      OafMapperUtils.accessRight(
        ModelConstants.UNKNOWN,
        ModelConstants.NOT_AVAILABLE,
        ModelConstants.DNET_ACCESS_MODES,
        ModelConstants.DNET_ACCESS_MODES
      )
    )

    val relations: List[Relation] =
      if (exportLinks) {
        val rels: List[RelatedIdentifierType] = for {
          JObject(relIdentifier)                                          <- json \\ "relatedIdentifiers"
          JField("relationType", JString(relationType))                   <- relIdentifier
          JField("relatedIdentifierType", JString(relatedIdentifierType)) <- relIdentifier
          JField("relatedIdentifier", JString(relatedIdentifier))         <- relIdentifier
        } yield RelatedIdentifierType(relationType, relatedIdentifier, relatedIdentifierType)
        generateRelations(rels, result.getId, null, pid, datasourceKey)
      } else
        List()

    result :: relations
  }

  /** Turns a related identifier URL into an unresolved target id, when its prefix is known. */
  private def resolveTarget(relatedIdentifier: String): Option[String] =
    resolvedURLPattern.collectFirst {
      case (prefix, pidType) if relatedIdentifier.startsWith(prefix) =>
        DHPUtils.generateUnresolvedIdentifier(StringUtils.substringAfter(relatedIdentifier, prefix), pidType)
    }

  /** Builds one Relation per related identifier whose URL prefix is listed in `resolvedURLPattern`.
    *
    * Related identifiers with an unknown prefix are skipped; previously they produced a
    * Relation whose target was left null. A relation type missing from `subRelTypeMapping`
    * still raises NoSuchElementException.
    *
    * @param rels          related identifiers read from the record
    * @param id            identifier of the source result
    * @param date          value stored under DATE_RELATION_KEY in the relation properties (may be null)
    * @param pid           original pid of the record (currently unused)
    * @param datasourceKey key into `collectedFromMap`
    */
  private def generateRelations(
    rels: List[RelatedIdentifierType],
    id: String,
    date: String,
    pid: String,
    datasourceKey: String
  ): List[Relation] = {
    rels.flatMap { r =>
      resolveTarget(r.relatedIdentifier).map { target =>
        val rel = new Relation
        rel.setCollectedfrom(List(collectedFromMap(datasourceKey)).asJava)
        rel.setDataInfo(dataInfo)
        rel.setRelType(REL_TYPE_VALUE)
        rel.setSubRelType(subRelTypeMapping(r.relationType).relType)
        rel.setRelClass(r.relationType)
        rel.setProperties(List(OafMapperUtils.keyValue(DATE_RELATION_KEY, date)).asJava)
        rel.setSource(id)
        rel.setTarget(target)
        rel
      }.toList
    }
  }
}

View File

@ -0,0 +1,99 @@
package eu.dnetlib.dhp.bioschema
import com.fasterxml.jackson.databind.ObjectMapper
import eu.dnetlib.dhp.application.AbstractScalaApplication
import eu.dnetlib.dhp.collection.CollectionUtils
import eu.dnetlib.dhp.common.Constants.{MDSTORE_DATA_PATH, MDSTORE_SIZE_PATH}
import eu.dnetlib.dhp.schema.mdstore.MDStoreVersion
import eu.dnetlib.dhp.schema.oaf.Oaf
import eu.dnetlib.dhp.utils.DHPUtils.writeHdfsFile
import org.apache.spark.sql.{Encoder, Encoders, SparkSession}
import org.slf4j.{Logger, LoggerFactory}
class GenerateBioschemaDatasetSpark(propertyPath: String, args: Array[String], log: Logger)
    extends AbstractScalaApplication(propertyPath, args, log: Logger) {

  /** Body of the Spark application: reads the job arguments, logs them and
    * generates the OAF dataset.
    *
    * The MDStore-based variant is disabled: the target path is taken from the
    * `targetPath` argument instead of being derived from `mdstoreOutputVersion`,
    * and [[reportTotalSize]] is not invoked.
    */
  override def run(): Unit = {
    // Logs "<label> is '<value>'" and hands the value back.
    def announce[T](label: String, value: T): T = {
      log.info(s"$label is '$value'")
      value
    }

    val source = announce("SourcePath", parser.get("sourcePath"))
    val withLinks = announce("exportLinks", "true".equalsIgnoreCase(parser.get("exportLinks")))
    val dsKey = announce("datasourceKey", parser.get("datasourceKey").toLowerCase)
    val resourceProfile = announce("profile", parser.get("profile").toLowerCase)
    val target = parser.get("targetPath")

    generateBioschemaDataset(source, withLinks, target, dsKey, resourceProfile, spark)
  }

  /** Counts the rows stored under `targetPath` and writes that number to the
    * MDSTORE_SIZE_PATH file below `outputBasePath` (needed when working with MDStore).
    *
    * @param targetPath path of the generated dataset
    * @param outputBasePath base path the size file is written under
    */
  def reportTotalSize(targetPath: String, outputBasePath: String): Unit = {
    val rowCount = spark.read.text(targetPath).count()
    val sizeFile = outputBasePath + MDSTORE_SIZE_PATH
    writeHdfsFile(spark.sparkContext.hadoopConfiguration, s"$rowCount", sizeFile)
  }

  /** Generates the OAF dataset from the native JSON/Datacite one.
    *
    * @param sourcePath path of the native dataset, read as text lines
    * @param exportLinks when true, unresolved links are generated too
    * @param targetPath path the resulting dataset is saved to
    * @param datasourceKey key identifying the datasource
    * @param profile resource profile of the records
    * @param spark the Spark session, must not be null
    */
  def generateBioschemaDataset(
    sourcePath: String,
    exportLinks: Boolean,
    targetPath: String,
    datasourceKey: String,
    profile: String,
    spark: SparkSession
  ): Unit = {
    require(spark != null)
    implicit val resultEncoder: Encoder[Oaf] = Encoders.kryo(classOf[Oaf])

    val oafRecords = spark.sparkContext
      .textFile(sourcePath)
      .flatMap(line => BioschemaToOAFTransformation.generateOAF(line, exportLinks, datasourceKey, profile))

    CollectionUtils.saveDataset(spark.createDataset(oafRecords), targetPath)
  }
}
/** Command-line entry point of the bioschema dataset generation job. */
object GenerateBioschemaDatasetSpark {

  val log: Logger = LoggerFactory.getLogger(GenerateBioschemaDatasetSpark.getClass)

  /** Creates the application with the bundled argument specification, initializes it and runs it. */
  def main(args: Array[String]): Unit = {
    val application =
      new GenerateBioschemaDatasetSpark("/eu/dnetlib/dhp/bioschema/generate_dataset_params.json", args, log)
    application.initialize().run()
  }
}

View File

@ -0,0 +1,45 @@
{
"id": "DP01454",
"types": {
"resourceType": "Protein",
"resourceTypeGeneral": "Dataset"
},
"creators": [],
"identifiers": [
{
"identifier": "https://disprot.org/DP01454",
"identifierType": "URL"
}
],
"relatedIdentifiers": [
{
"relationType": "IsIdenticalTo",
"relatedIdentifier": "http://purl.uniprot.org/uniprot/P60006",
"relatedIdentifierType": "URL"
}
],
"alternateIdentifiers": [
{
"alternateIdentifier": "https://identifiers.org/disprot:DP01454"
}
],
"descriptions": [],
"titles": [
{
"title": "DP01454 - Anaphase-promoting complex subunit 15 "
}
],
"dates": [
{
"date": "2021-11-25T12:23:57",
"dateType": "Collected"
}
],
"subjects": [
{
"schemeURI": "https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00076",
"value": "disorder",
"subjectScheme": "IDPO:00076"
}
]
}

View File

@ -0,0 +1,75 @@
{
"id": "Q9UPN6",
"types": {
"resourceType": "Protein",
"resourceTypeGeneral": "Dataset"
},
"creators": [],
"identifiers": [
{
"identifier": "https://mobidb.org/Q9UPN6",
"identifierType": "URL"
}
],
"relatedIdentifiers": [
{
"relationType": "IsIdenticalTo",
"relatedIdentifier": "http://purl.uniprot.org/uniprot/Q9UPN6",
"relatedIdentifierType": "URL"
}
],
"alternateIdentifiers": [
{
"alternateIdentifier": "https://identifiers.org/mobidb:Q9UPN6"
}
],
"descriptions": [],
"titles": [
{
"title": "Q9UPN6 - SR-related and CTD-associated factor 8 "
}
],
"dates": [
{
"date": "2021-12-06T14:49:15",
"dateType": "Collected"
}
],
"subjects": [
{
"schemeURI": "https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00076",
"value": "Disorder",
"subjectScheme": "IDPO:00076"
},
{
"schemeURI": "https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00076",
"value": "Disorder",
"subjectScheme": "IDPO:00076"
},
{
"schemeURI": "https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00076",
"value": "Disorder",
"subjectScheme": "IDPO:00076"
},
{
"schemeURI": "https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00076",
"value": "Disorder",
"subjectScheme": "IDPO:00076"
},
{
"schemeURI": "https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00076",
"value": "Disorder",
"subjectScheme": "IDPO:00076"
},
{
"schemeURI": "https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00076",
"value": "Disorder",
"subjectScheme": "IDPO:00076"
},
{
"schemeURI": "https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00076",
"value": "Disorder",
"subjectScheme": "IDPO:00076"
}
]
}

View File

@ -0,0 +1,80 @@
{
"id": "PED00180#Q9KPH3_A_0",
"types": {
"resourceType": "Protein",
"resourceTypeGeneral": "Dataset"
},
"creators": [],
"identifiers": [
{
"identifier": "https://proteinensemble.org/PED00180#Q9KPH3_A_0",
"identifierType": "URL"
}
],
"relatedIdentifiers": [
{
"relationType": "IsCitedBy",
"relatedIdentifier": "https://doi.org/10.1016/j.jsb.2020.107573",
"relatedIdentifierType": "URL"
},
{
"relationType": "IsIdenticalTo",
"relatedIdentifier": "http://purl.uniprot.org/uniprot/Q9KPH3",
"relatedIdentifierType": "URL"
}
],
"alternateIdentifiers": [
{
"alternateIdentifier": "https://identifiers.org/uniprot:Q9KPH3"
}
],
"descriptions": [],
"titles": [
{
"title": "PED00180#Q9KPH3_A_0 - Structural ensemble of protein DciA from Vibrio cholerae (1-157) "
}
],
"dates": [
{
"date": "2022-05-10T18:03:43",
"dateType": "Collected"
}
],
"subjects": [
{
"schemeURI": "https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00120",
"value": "NMR",
"subjectScheme": "IDPO:00120"
},
{
"schemeURI": "https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00125",
"value": "SAXS",
"subjectScheme": "IDPO:00125"
},
{
"schemeURI": "https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00224",
"value": "GROMACS",
"subjectScheme": "IDPO:00224"
},
{
"schemeURI": "https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00228",
"value": "AMBER",
"subjectScheme": "IDPO:00228"
},
{
"schemeURI": "https://disprot.org/assets/data/IDPO_v0.2.owl:00185",
"value": "FM",
"subjectScheme": "IDPO:00185"
},
{
"schemeURI": "https://disprot.org/assets/data/IDPO_v0.2.owl:00213",
"value": "EOM",
"subjectScheme": "IDPO:00213"
},
{
"schemeURI": "https://disprot.org/assets/data/IDPO_v0.2.owl:00214",
"value": "GAJOE",
"subjectScheme": "IDPO:00214"
}
]
}

View File

@ -0,0 +1,5 @@
{"id":"PED00111#O75880_A_1","types":{"resourceType":"Protein","resourceTypeGeneral":"Dataset"},"creators":[],"identifiers":[{"identifier":"https://proteinensemble.org/PED00111#O75880_A_1","identifierType":"URL"}],"relatedIdentifiers":[{"relationType":"IsCitedBy","relatedIdentifier":"https://identifiers.org/pubmed:16735468","relatedIdentifierType":"URL"},{"relationType":"IsIdenticalTo","relatedIdentifier":"http://purl.uniprot.org/uniprot/O75880","relatedIdentifierType":"URL"}],"alternateIdentifiers":[{"alternateIdentifier":"https://identifiers.org/uniprot:O75880"}],"descriptions":[],"titles":[{"title":"PED00111#O75880_A_1 - Structural ensemble of the C-terminal region of Sco1 (132-301), apo structure."}],"dates":[{"date":"2021-12-10T11:17:16","dateType":"Collected"}],"subjects":[{"schemeURI":"https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00120","value":"NMR","subjectScheme":"IDPO:00120"},{"schemeURI":"https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00141","value":"TOCSY","subjectScheme":"IDPO:00141"},{"schemeURI":"https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00143","value":"NOESY","subjectScheme":"IDPO:00143"},{"schemeURI":"https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00147","value":"HSQC","subjectScheme":"IDPO:00147"},{"schemeURI":"https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00153","value":"HNHA","subjectScheme":"IDPO:00153"},{"schemeURI":"https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00154","value":"HNCO","subjectScheme":"IDPO:00154"},{"schemeURI":"https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00155","value":"HNCA","subjectScheme":"IDPO:00155"},{"schemeURI":"https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00156","value":"HNCACO","subjectScheme":"IDPO:00156"},{"schemeURI":"https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00157","value":"HNCOCA","subjectScheme":"IDPO:00157"},{"schemeURI":"https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00158","value":"HNCACB","subjectScheme":"IDPO:00158"},{"schemeURI":"https://disprot.org/
assets/data/IDPO_v0.2.owl#IDPO:00160","value":"CBCACONH","subjectScheme":"IDPO:00160"},{"schemeURI":"https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00164","value":"CBCANH","subjectScheme":"IDPO:00164"},{"schemeURI":"https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00175","value":"NOE","subjectScheme":"IDPO:00175"},{"schemeURI":"https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00228","value":"AMBER","subjectScheme":"IDPO:00228"},{"schemeURI":"https://disprot.org/assets/data/IDPO_v0.2.owl:00190","value":"DYANA","subjectScheme":"IDPO:00190"}]}
{"id":"PED00112#P19634_A_1","types":{"resourceType":"Protein","resourceTypeGeneral":"Dataset"},"creators":[],"identifiers":[{"identifier":"https://proteinensemble.org/PED00112#P19634_A_1","identifierType":"URL"}],"relatedIdentifiers":[{"relationType":"IsCitedBy","relatedIdentifier":"https://identifiers.org/pubmed:24840010","relatedIdentifierType":"URL"},{"relationType":"IsIdenticalTo","relatedIdentifier":"http://purl.uniprot.org/uniprot/P19634","relatedIdentifierType":"URL"}],"alternateIdentifiers":[{"alternateIdentifier":"https://identifiers.org/uniprot:P19634"}],"descriptions":[],"titles":[{"title":"PED00112#P19634_A_1 - Structural ensemble of the TM VI-VII of the nhe1 isoform of the sodium/hydrogen exchanger (226-274)"}],"dates":[{"date":"2021-12-10T11:17:20","dateType":"Collected"}],"subjects":[{"schemeURI":"https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00120","value":"NMR","subjectScheme":"IDPO:00120"},{"schemeURI":"https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00141","value":"TOCSY","subjectScheme":"IDPO:00141"},{"schemeURI":"https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00143","value":"NOESY","subjectScheme":"IDPO:00143"},{"schemeURI":"https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00147","value":"HSQC","subjectScheme":"IDPO:00147"},{"schemeURI":"https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00167","value":"chemical shift","subjectScheme":"IDPO:00167"},{"schemeURI":"https://disprot.org/assets/data/IDPO_v0.2.owl:00188","value":"Structure calculation","subjectScheme":"IDPO:00188"},{"schemeURI":"https://disprot.org/assets/data/IDPO_v0.2.owl:00202","value":"NMRpipe","subjectScheme":"IDPO:00202"}]}
{"id":"PED00113#P04156_A_0","types":{"resourceType":"Protein","resourceTypeGeneral":"Dataset"},"creators":[],"identifiers":[{"identifier":"https://proteinensemble.org/PED00113#P04156_A_0","identifierType":"URL"}],"relatedIdentifiers":[{"relationType":"IsIdenticalTo","relatedIdentifier":"http://purl.uniprot.org/uniprot/P04156","relatedIdentifierType":"URL"}],"alternateIdentifiers":[{"alternateIdentifier":"https://identifiers.org/uniprot:P04156"}],"descriptions":[],"titles":[{"title":"PED00113#P04156_A_0 - Structural ensemble of major prion protein (173-195)"}],"dates":[{"date":"2021-12-10T11:17:24","dateType":"Collected"}],"subjects":[{"schemeURI":"https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00120","value":"NMR","subjectScheme":"IDPO:00120"}]}
{"id":"PED00114#P27958_A_0","types":{"resourceType":"Protein","resourceTypeGeneral":"Dataset"},"creators":[],"identifiers":[{"identifier":"https://proteinensemble.org/PED00114#P27958_A_0","identifierType":"URL"}],"relatedIdentifiers":[{"relationType":"IsCitedBy","relatedIdentifier":"https://identifiers.org/pubmed:15247283","relatedIdentifierType":"URL"},{"relationType":"IsIdenticalTo","relatedIdentifier":"http://purl.uniprot.org/uniprot/P27958","relatedIdentifierType":"URL"}],"alternateIdentifiers":[{"alternateIdentifier":"https://identifiers.org/uniprot:P27958"}],"descriptions":[],"titles":[{"title":"PED00114#P27958_A_0 - Structural ensemble of the membrane anchor domain of the nonstructural protein 5A (NS5A) of hepatitis C virus (1973-2003), in 50% tfe"}],"dates":[{"date":"2021-12-10T11:17:27","dateType":"Collected"}],"subjects":[{"schemeURI":"https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00120","value":"NMR","subjectScheme":"IDPO:00120"},{"schemeURI":"https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00141","value":"TOCSY","subjectScheme":"IDPO:00141"},{"schemeURI":"https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00143","value":"NOESY","subjectScheme":"IDPO:00143"},{"schemeURI":"https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00147","value":"HSQC","subjectScheme":"IDPO:00147"},{"schemeURI":"https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00175","value":"NOE","subjectScheme":"IDPO:00175"},{"schemeURI":"https://disprot.org/assets/data/IDPO_v0.2.owl:00194","value":"X-PLOR","subjectScheme":"IDPO:00194"}]}
{"id":"PED00115#P04156_A_0","types":{"resourceType":"Protein","resourceTypeGeneral":"Dataset"},"creators":[],"identifiers":[{"identifier":"https://proteinensemble.org/PED00115#P04156_A_0","identifierType":"URL"}],"relatedIdentifiers":[{"relationType":"IsIdenticalTo","relatedIdentifier":"http://purl.uniprot.org/uniprot/P04156","relatedIdentifierType":"URL"}],"alternateIdentifiers":[{"alternateIdentifier":"https://identifiers.org/uniprot:P04156"}],"descriptions":[],"titles":[{"title":"PED00115#P04156_A_0 - Structural ensemble of major prion protein (173-195), mutant D178N"}],"dates":[{"date":"2021-12-10T11:17:30","dateType":"Collected"}],"subjects":[{"schemeURI":"https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00120","value":"NMR","subjectScheme":"IDPO:00120"}]}

View File

@ -0,0 +1,120 @@
{
"id": "PED00111#O75880_A_1",
"types": {
"resourceType": "Protein",
"resourceTypeGeneral": "Dataset"
},
"creators": [],
"identifiers": [
{
"identifier": "https://proteinensemble.org/PED00111#O75880_A_1",
"identifierType": "URL"
}
],
"relatedIdentifiers": [
{
"relationType": "IsCitedBy",
"relatedIdentifier": "https://identifiers.org/pubmed:16735468",
"relatedIdentifierType": "URL"
},
{
"relationType": "IsIdenticalTo",
"relatedIdentifier": "http://purl.uniprot.org/uniprot/O75880",
"relatedIdentifierType": "URL"
}
],
"alternateIdentifiers": [
{
"alternateIdentifier": "https://identifiers.org/uniprot:O75880"
}
],
"descriptions": [],
"titles": [
{
"title": "PED00111#O75880_A_1 - Structural ensemble of the C-terminal region of Sco1 (132-301), apo structure."
}
],
"dates": [
{
"date": "2021-12-10T11:17:16",
"dateType": "Collected"
}
],
"subjects": [
{
"schemeURI": "https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00120",
"value": "NMR",
"subjectScheme": "IDPO:00120"
},
{
"schemeURI": "https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00141",
"value": "TOCSY",
"subjectScheme": "IDPO:00141"
},
{
"schemeURI": "https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00143",
"value": "NOESY",
"subjectScheme": "IDPO:00143"
},
{
"schemeURI": "https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00147",
"value": "HSQC",
"subjectScheme": "IDPO:00147"
},
{
"schemeURI": "https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00153",
"value": "HNHA",
"subjectScheme": "IDPO:00153"
},
{
"schemeURI": "https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00154",
"value": "HNCO",
"subjectScheme": "IDPO:00154"
},
{
"schemeURI": "https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00155",
"value": "HNCA",
"subjectScheme": "IDPO:00155"
},
{
"schemeURI": "https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00156",
"value": "HNCACO",
"subjectScheme": "IDPO:00156"
},
{
"schemeURI": "https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00157",
"value": "HNCOCA",
"subjectScheme": "IDPO:00157"
},
{
"schemeURI": "https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00158",
"value": "HNCACB",
"subjectScheme": "IDPO:00158"
},
{
"schemeURI": "https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00160",
"value": "CBCACONH",
"subjectScheme": "IDPO:00160"
},
{
"schemeURI": "https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00164",
"value": "CBCANH",
"subjectScheme": "IDPO:00164"
},
{
"schemeURI": "https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00175",
"value": "NOE",
"subjectScheme": "IDPO:00175"
},
{
"schemeURI": "https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00228",
"value": "AMBER",
"subjectScheme": "IDPO:00228"
},
{
"schemeURI": "https://disprot.org/assets/data/IDPO_v0.2.owl:00190",
"value": "DYANA",
"subjectScheme": "IDPO:00190"
}
]
}

View File

@ -0,0 +1,115 @@
package eu.dnetlib.dhp.bioschema
import com.fasterxml.jackson.databind.{ObjectMapper, SerializationFeature}
import eu.dnetlib.dhp.aggregation.AbstractVocabularyTest
import eu.dnetlib.dhp.schema.oaf.Oaf
import org.apache.commons.io.FileUtils
import org.apache.spark.SparkConf
import org.apache.spark.sql.{Encoder, Encoders, SparkSession}
import org.junit.jupiter.api.Assertions._
import org.junit.jupiter.api.extension.ExtendWith
import org.junit.jupiter.api.{AfterEach, BeforeEach, Test}
import org.mockito.junit.jupiter.MockitoExtension
import org.slf4j.{Logger, LoggerFactory}
import java.nio.file.{Files, Path}
import scala.io.Source
/** Tests for the transformation of Bioschema records (in Datacite JSON form) into OAF entities.
  *
  * Each test works on resources under /eu/dnetlib/dhp/bioschema/; the Spark based test writes
  * into a temporary directory that is created before and removed after every test.
  */
@ExtendWith(Array(classOf[MockitoExtension]))
class BioschemaDataciteToOAFTest {

  private var workingDir: Path = null
  val log: Logger = LoggerFactory.getLogger(getClass)

  @BeforeEach
  def setUp(): Unit = {
    workingDir = Files.createTempDirectory(getClass.getSimpleName)
  }

  @AfterEach
  def tearDown(): Unit = {
    FileUtils.deleteDirectory(workingDir.toFile)
  }

  /** Runs the whole dataset generation on the PED dump, with and without link export,
    * and checks the number of records written in both cases.
    */
  @Test
  def testGeneratePED(): Unit = {
    val path = getClass.getResource("/eu/dnetlib/dhp/bioschema/ped_dump").getPath
    val conf = new SparkConf()
    val spark: SparkSession = SparkSession
      .builder()
      .config(conf)
      .appName(getClass.getSimpleName)
      .master("local[*]")
      .getOrCreate()

    // stop the session even when an assertion fails, so that it does not leak into other tests
    try {
      implicit val oafEncoder: Encoder[Oaf] = Encoders.kryo[Oaf]
      val instance = new GenerateBioschemaDatasetSpark(null, null, log)
      val targetPath = s"$workingDir/result"

      instance.generateBioschemaDataset(path, exportLinks = true, targetPath, "ped", "protein", spark)
      val total_items = spark.read.text(targetPath).count()
      println(s"total_items: $total_items")
      // assertEquals reports expected and actual values on failure
      assertEquals(21L, total_items)

      instance.generateBioschemaDataset(path, exportLinks = false, targetPath, "ped", "protein", spark)
      val total_datasets = spark.read.text(targetPath).count()
      println(s"total_datasets: $total_datasets")
      assertEquals(5L, total_datasets)
    } finally {
      spark.stop()
    }
  }

  @Test
  def testPEDMapping(): Unit = {
    transformAndPrint("/eu/dnetlib/dhp/bioschema/ped_record.json", "ped")
  }

  @Test
  def testDISPROTMapping(): Unit = {
    transformAndPrint("/eu/dnetlib/dhp/bioschema/disprot_record.json", "disprot")
  }

  @Test
  def testMOBIDBMapping(): Unit = {
    transformAndPrint("/eu/dnetlib/dhp/bioschema/mobidb_record.json", "mobidb")
  }

  @Test
  def testPEDDoiCitationMapping(): Unit = {
    transformAndPrint("/eu/dnetlib/dhp/bioschema/ped_doi_citation.json", "ped")
  }

  /** Loads a single record from the classpath, transforms it with link export enabled and the
    * "protein" profile, and prints every generated OAF entity as indented JSON.
    *
    * @param resourcePath  classpath location of the JSON record
    * @param datasourceKey datasource key handed to the transformation
    * @return the entities produced by the transformation
    */
  private def transformAndPrint(resourcePath: String, datasourceKey: String): List[Oaf] = {
    val source = Source.fromInputStream(getClass.getResourceAsStream(resourcePath))
    // release the underlying stream once the content has been read
    val record =
      try source.mkString
      finally source.close()

    val mapper = new ObjectMapper().enable(SerializationFeature.INDENT_OUTPUT)
    val res: List[Oaf] = BioschemaToOAFTransformation.generateOAF(record, true, datasourceKey, "protein")
    assertNotNull(res)
    res.foreach(r => {
      println(mapper.writeValueAsString(r))
      println("----------------------------")
    })
    res
  }
}

View File

@ -0,0 +1,42 @@
<?xml version="1.0" encoding="UTF-8"?>
<project xmlns="http://maven.apache.org/POM/4.0.0" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xsi:schemaLocation="http://maven.apache.org/POM/4.0.0 http://maven.apache.org/xsd/maven-4.0.0.xsd">
<!-- Maven descriptor of the dhp-rdfconverter module, a child of dhp-workflows. -->
<modelVersion>4.0.0</modelVersion>
<parent>
<groupId>eu.dnetlib.dhp</groupId>
<artifactId>dhp-workflows</artifactId>
<version>1.2.5-SNAPSHOT</version>
</parent>
<artifactId>dhp-rdfconverter</artifactId>
<dependencies>
<!-- Spark (Scala 2.11 builds): no version or scope declared here; presumably both are
     managed by the parent's dependencyManagement (TODO confirm). -->
<dependency>
<groupId>org.apache.spark</groupId>
<artifactId>spark-core_2.11</artifactId>
</dependency>
<dependency>
<groupId>org.apache.spark</groupId>
<artifactId>spark-sql_2.11</artifactId>
</dependency>
<!-- Shared project utilities, always aligned with this module's own version. -->
<dependency>
<groupId>eu.dnetlib.dhp</groupId>
<artifactId>dhp-common</artifactId>
<version>${project.version}</version>
</dependency>
<!-- RDF libraries; their versions are pinned locally in this module. -->
<dependency>
<groupId>org.apache.any23</groupId>
<artifactId>apache-any23-core</artifactId>
<version>2.3</version>
</dependency>
<!-- The two rdf4j artifacts share the same version (2.5.4) and should be upgraded together. -->
<dependency>
<groupId>org.eclipse.rdf4j</groupId>
<artifactId>rdf4j-rio-rdfxml</artifactId>
<version>2.5.4</version>
</dependency>
<dependency>
<groupId>org.eclipse.rdf4j</groupId>
<artifactId>rdf4j-model</artifactId>
<version>2.5.4</version>
</dependency>
</dependencies>
</project>

View File

@ -0,0 +1,82 @@
package eu.dnetlib.dhp.rdfconverter.bioschema;
import static eu.dnetlib.dhp.common.SparkSessionSupport.runWithSparkSession;
import java.util.ArrayList;
import java.util.Arrays;
import java.util.Objects;
import java.util.Optional;
import org.apache.commons.io.IOUtils;
import org.apache.hadoop.io.Text;
import org.apache.hadoop.io.compress.GzipCodec;
import org.apache.spark.SparkConf;
import org.apache.spark.api.java.JavaPairRDD;
import org.apache.spark.api.java.JavaRDD;
import org.apache.spark.api.java.JavaSparkContext;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
import eu.dnetlib.dhp.application.ArgumentApplicationParser;
import eu.dnetlib.dhp.rdfconverter.utils.CompressorUtil;
import eu.dnetlib.dhp.rdfconverter.utils.RDFConverter;
import ucar.nc2.stream.NcStreamProto;
/**
 * Spark job that converts RDF n-quads records into Datacite JSON records.
 * <p>
 * The input is a text file holding one record per line; every line is decompressed through
 * {@link CompressorUtil#decompressValue} (the rows are presumably base64 encoded and gzipped, as the
 * variable names suggest) and handed to {@link RDFConverter#nQuadsFile2DataciteJson}. The non-empty,
 * distinct JSON records are saved as a gzip-compressed text file.
 * <p>
 * Parameters read from the command line: {@code isSparkSessionManaged} (optional, defaults to true),
 * {@code workingPath}, {@code rdfInput}, {@code output} and {@code profile}. Input and output
 * locations are obtained by appending {@code rdfInput} / {@code output} to {@code workingPath}.
 */
public class SparkRdfToDatacite {

	static Logger logger = LoggerFactory.getLogger(SparkRdfToDatacite.class);

	/**
	 * Parses the job arguments and runs the conversion inside a Spark session.
	 *
	 * @param args the command line arguments of the job
	 * @throws Exception if the arguments cannot be parsed or the Spark job fails
	 */
	public static void main(String[] args) throws Exception {
		final ArgumentApplicationParser parser = new ArgumentApplicationParser(
			IOUtils
				.toString(
					SparkRdfToDatacite.class
						.getResourceAsStream(
							"/eu/dnetlib/dhp/rdfconverter/bioschema/generate_dataset.json")));
		parser.parseArgument(args);

		Boolean isSparkSessionManaged = Optional
			.ofNullable(parser.get("isSparkSessionManaged"))
			.map(Boolean::valueOf)
			.orElse(Boolean.TRUE);
		final String workingPath = parser.get("workingPath");
		final String rdfNquadsRecords = parser.get("rdfInput");
		final String output = parser.get("output");
		final String profile = parser.get("profile");

		SparkConf conf = new SparkConf();
		runWithSparkSession(
			conf,
			isSparkSessionManaged,
			spark -> {
				JavaSparkContext sc = JavaSparkContext.fromSparkContext(spark.sparkContext());
				String base64GzippedNquadsPath = workingPath.concat(rdfNquadsRecords);
				JavaRDD<String> base64GzippedNquadsRDD = sc
					.textFile(base64GzippedNquadsPath);
				logger.info("Rdf nquads records retrieved: {}", base64GzippedNquadsRDD.count());

				// Cached: this RDD feeds both the count below and the filtering pipeline; without
				// caching every record would be decompressed and converted once per action.
				JavaRDD<String> proteins2 = base64GzippedNquadsRDD
					.flatMap(nquads -> {
						RDFConverter converter = new RDFConverter();
						ArrayList<String> jsonlds;
						try {
							jsonlds = converter
								.nQuadsFile2DataciteJson(CompressorUtil.decompressValue(nquads), profile);
						} catch (Exception e) {
							logger.error("converting: " + nquads, e);
							// An empty placeholder keeps the failed record visible in the
							// "non filtered" count; it is dropped by the isEmpty filter below.
							return Arrays.asList(new String()).iterator();
						}
						if (jsonlds == null) {
							// Defensive: a converter returning null must not fail the whole task.
							return new ArrayList<String>().iterator();
						}
						return jsonlds.iterator();
					})
					.cache();
				logger.info("json datacite non filtered: {}", proteins2.count());

				// Cached as well: counted first and then written out. Strings are cached (rather
				// than Hadoop Text, which is not java.io.Serializable) to stay on the safe side.
				JavaRDD<String> distinctJsonlds = proteins2
					.filter(Objects::nonNull)
					.filter(jsonld -> !jsonld.isEmpty())
					.distinct()
					.cache();
				logger.info("json datacite generated: {}", distinctJsonlds.count());

				// The distinct records are materialized now, the intermediate cache can be released.
				proteins2.unpersist();

				JavaRDD<Text> proteins = distinctJsonlds.map(jsonld -> new Text(jsonld));
				proteins.saveAsTextFile(workingPath.concat(output), GzipCodec.class);
			});
	}
}

View File

@ -0,0 +1,489 @@
package eu.dnetlib.dhp.rdfconverter.bioschema.model;
import java.util.List;
import com.fasterxml.jackson.annotation.JsonIgnoreProperties;
import com.fasterxml.jackson.annotation.JsonProperty;
import com.fasterxml.jackson.databind.annotation.JsonDeserialize;
import eu.dnetlib.dhp.rdfconverter.utils.CustomPropertyValueDeserializer;
/**
 * Jackson binding of a Bioschemas protein document in JSON-LD form: the document {@code @id}, the
 * entries of its {@code @graph} and the {@code http://purl.org/pav/retrievedOn} timestamp.
 * <p>
 * Unknown JSON properties are ignored on this top-level class through {@link JsonIgnoreProperties};
 * the nested classes do not carry that annotation themselves.
 */
@JsonIgnoreProperties(ignoreUnknown = true)
public class BioSchemaProtein {

	@JsonProperty("@id")
	private String id;

	@JsonProperty("@graph")
	private List<Entry> entryList;

	@JsonProperty("http://purl.org/pav/retrievedOn")
	private DateTimeType retrievedOn;

	public String getId() {
		return id;
	}

	public void setId(final String id) {
		this.id = id;
	}

	public List<Entry> getEntryList() {
		return entryList;
	}

	public void setEntryList(final List<Entry> entryList) {
		this.entryList = entryList;
	}

	public DateTimeType getRetrievedOn() {
		return retrievedOn;
	}

	public void setRetrievedOn(final DateTimeType retrievedOn) {
		this.retrievedOn = retrievedOn;
	}

	/** A single node of the {@code @graph} array. */
	public static class Entry {

		@JsonProperty("@id")
		private String id;

		// bound as a single string; the list variant is kept for reference:
		// private List<String> type;
		@JsonProperty("@type")
		private String type;

		@JsonProperty("https://schema.org/identifier")
		private String identifier;

		@JsonProperty("https://schema.org/name")
		private String name;

		@JsonProperty("associatedDisease")
		private List<AssociatedDisease> associatedDisease;

		@JsonProperty("description")
		private String description;

		@JsonProperty("isEncodedByBioChemEntity")
		private String isEncodedByBioChemEntity;

		@JsonProperty("url")
		private String url;

		@JsonProperty("alternateName")
		private String alternateName;

		@JsonProperty("bioChemInteraction")
		private List<Link> bioChemInteraction;

		@JsonProperty("bioChemSimilarity")
		private List<Link> bioChemSimilarity;

		@JsonProperty("hasMolecularFunction")
		private String hasMolecularFunction;

		@JsonProperty("image")
		private String image;

		@JsonProperty("isInvolvedInBiologicalProcess")
		private String isInvolvedInBiologicalProcess;

		@JsonProperty("isPartOfBioChemEntity")
		private IsPartOfBioChemEntity isPartOfBioChemEntity;

		@JsonProperty("mainEntityOfPage")
		private Link mainEntityOfPage;

		@JsonProperty("https://schema.org/citation")
		private Citation citation;

		@JsonProperty("https://schema.org/sameAs")
		private List<Link> sameAs;

		@JsonProperty("https://schema.org/hasSequenceAnnotation")
		private List<Link> hasSequenceAnnotation;

		@JsonProperty("https://schema.org/additionalProperty")
		private List<Link> sequenceAnnotation;

		// read through a dedicated deserializer instead of the default bean binding
		@JsonProperty("https://schema.org/value")
		@JsonDeserialize(using = CustomPropertyValueDeserializer.class)
		private Link propertyValue;

		@JsonProperty("https://schema.org/termCode")
		private String termCode;

		public String getId() {
			return id;
		}

		public void setId(final String id) {
			this.id = id;
		}

		public String getType() {
			return type;
		}

		public void setType(final String type) {
			this.type = type;
		}

		public String getIdentifier() {
			return identifier;
		}

		public void setIdentifier(final String identifier) {
			this.identifier = identifier;
		}

		public String getName() {
			return name;
		}

		public void setName(final String name) {
			this.name = name;
		}

		public List<AssociatedDisease> getAssociatedDisease() {
			return associatedDisease;
		}

		public void setAssociatedDisease(final List<AssociatedDisease> associatedDisease) {
			this.associatedDisease = associatedDisease;
		}

		public String getDescription() {
			return description;
		}

		public void setDescription(final String description) {
			this.description = description;
		}

		public String getIsEncodedByBioChemEntity() {
			return isEncodedByBioChemEntity;
		}

		public void setIsEncodedByBioChemEntity(final String isEncodedByBioChemEntity) {
			this.isEncodedByBioChemEntity = isEncodedByBioChemEntity;
		}

		public String getUrl() {
			return url;
		}

		public void setUrl(final String url) {
			this.url = url;
		}

		public String getAlternateName() {
			return alternateName;
		}

		public void setAlternateName(final String alternateName) {
			this.alternateName = alternateName;
		}

		public List<Link> getBioChemInteraction() {
			return bioChemInteraction;
		}

		public void setBioChemInteraction(final List<Link> bioChemInteraction) {
			this.bioChemInteraction = bioChemInteraction;
		}

		public List<Link> getBioChemSimilarity() {
			return bioChemSimilarity;
		}

		public void setBioChemSimilarity(final List<Link> bioChemSimilarity) {
			this.bioChemSimilarity = bioChemSimilarity;
		}

		public String getHasMolecularFunction() {
			return hasMolecularFunction;
		}

		public void setHasMolecularFunction(final String hasMolecularFunction) {
			this.hasMolecularFunction = hasMolecularFunction;
		}

		public String getImage() {
			return image;
		}

		public void setImage(final String image) {
			this.image = image;
		}

		public String getIsInvolvedInBiologicalProcess() {
			return isInvolvedInBiologicalProcess;
		}

		public void setIsInvolvedInBiologicalProcess(final String isInvolvedInBiologicalProcess) {
			this.isInvolvedInBiologicalProcess = isInvolvedInBiologicalProcess;
		}

		public IsPartOfBioChemEntity getIsPartOfBioChemEntity() {
			return isPartOfBioChemEntity;
		}

		public void setIsPartOfBioChemEntity(final IsPartOfBioChemEntity isPartOfBioChemEntity) {
			this.isPartOfBioChemEntity = isPartOfBioChemEntity;
		}

		public Link getMainEntityOfPage() {
			return mainEntityOfPage;
		}

		public void setMainEntityOfPage(final Link mainEntityOfPage) {
			this.mainEntityOfPage = mainEntityOfPage;
		}

		public Citation getCitation() {
			return citation;
		}

		public void setCitation(final Citation citation) {
			this.citation = citation;
		}

		public List<Link> getSameAs() {
			return sameAs;
		}

		public void setSameAs(final List<Link> sameAs) {
			this.sameAs = sameAs;
		}

		public List<Link> getHasSequenceAnnotation() {
			return hasSequenceAnnotation;
		}

		public void setHasSequenceAnnotation(final List<Link> hasSequenceAnnotation) {
			this.hasSequenceAnnotation = hasSequenceAnnotation;
		}

		public List<Link> getSequenceAnnotation() {
			return sequenceAnnotation;
		}

		public void setSequenceAnnotation(final List<Link> sequenceAnnotation) {
			this.sequenceAnnotation = sequenceAnnotation;
		}

		public Link getPropertyValue() {
			return propertyValue;
		}

		public void setPropertyValue(final Link propertyValue) {
			this.propertyValue = propertyValue;
		}

		public String getTermCode() {
			return termCode;
		}

		public void setTermCode(final String termCode) {
			this.termCode = termCode;
		}
	}

	/** Value of the {@code isPartOfBioChemEntity} property: a typed reference with a URL. */
	public static class IsPartOfBioChemEntity {

		@JsonProperty("@type")
		private String type;

		@JsonProperty("url")
		private String url;

		public String getType() {
			return type;
		}

		public void setType(final String type) {
			this.type = type;
		}

		public String getUrl() {
			return url;
		}

		public void setUrl(final String url) {
			this.url = url;
		}
	}

	/** Element of the {@code associatedDisease} list. */
	public static class AssociatedDisease {

		@JsonProperty("@type")
		private String type;

		@JsonProperty("name")
		private String name;

		@JsonProperty("code")
		private DeseaseCode code;

		@JsonProperty("id")
		private String id;

		public String getType() {
			return type;
		}

		public void setType(final String type) {
			this.type = type;
		}

		public String getName() {
			return name;
		}

		public void setName(final String name) {
			this.name = name;
		}

		public DeseaseCode getCode() {
			return code;
		}

		public void setCode(final DeseaseCode code) {
			this.code = code;
		}

		public String getId() {
			return id;
		}

		public void setId(final String id) {
			this.id = id;
		}
	}

	/** Code of an associated disease: a value together with the coding system it belongs to. */
	public static class DeseaseCode {

		@JsonProperty("@type")
		private String type;

		@JsonProperty("codeValue")
		private String codeValue;

		@JsonProperty("codingSystem")
		private String codingSystem;

		public String getType() {
			return type;
		}

		public void setType(final String type) {
			this.type = type;
		}

		public String getCodeValue() {
			return codeValue;
		}

		public void setCodeValue(final String codeValue) {
			this.codeValue = codeValue;
		}

		public String getCodingSystem() {
			return codingSystem;
		}

		public void setCodingSystem(final String codingSystem) {
			this.codingSystem = codingSystem;
		}
	}

	/** Reference to another node, carrying only its {@code @id}. */
	public static class Link {

		@JsonProperty("@id")
		private String id;

		public String getId() {
			return id;
		}

		public void setId(final String id) {
			this.id = id;
		}
	}

	/** Typed literal made of a {@code @type} and a {@code @value}. */
	public static class DateTimeType {

		@JsonProperty("@type")
		private String type;

		@JsonProperty("@value")
		private String value;

		public String getType() {
			return type;
		}

		public void setType(final String type) {
			this.type = type;
		}

		public String getValue() {
			return value;
		}

		public void setValue(final String value) {
			this.value = value;
		}
	}

	/** Value of {@code https://schema.org/citation}, carrying only its {@code @id}. */
	public static class Citation {

		@JsonProperty("@id")
		private String id;

		public String getId() {
			return id;
		}

		public void setId(final String id) {
			this.id = id;
		}
	}

	/** Holder of the {@code @id} of a sequence annotation. */
	public static class SequenceAnnotationId {

		@JsonProperty("@id")
		private String id;

		public String getId() {
			return id;
		}

		public void setId(final String id) {
			this.id = id;
		}
	}

	/** Sequence annotation exposing its {@code https://schema.org/additionalProperty} values. */
	public static class SequenceAnnotation {

		@JsonProperty("https://schema.org/additionalProperty")
		private List<PropertyValue> additionalProperty;

		public List<PropertyValue> getAdditionalProperty() {
			return additionalProperty;
		}

		public void setAdditionalProperty(final List<PropertyValue> additionalProperty) {
			this.additionalProperty = additionalProperty;
		}
	}

	/** Property value whose {@code https://schema.org/value} is a {@link DefinedTerm}. */
	public static class PropertyValue {

		@JsonProperty("https://schema.org/value")
		private DefinedTerm definedTerm;

		public DefinedTerm getDefinedTerm() {
			return definedTerm;
		}

		public void setDefinedTerm(final DefinedTerm definedTerm) {
			this.definedTerm = definedTerm;
		}
	}

	/** Defined term identified by its {@code @id}, with a term code and a name. */
	public static class DefinedTerm {

		@JsonProperty("@id")
		private String id;

		@JsonProperty("https://schema.org/termCode")
		private String termCode;

		@JsonProperty("https://schema.org/name")
		private String name;

		public String getId() {
			return id;
		}

		public void setId(final String id) {
			this.id = id;
		}

		public String getTermCode() {
			return termCode;
		}

		public void setTermCode(final String termCode) {
			this.termCode = termCode;
		}

		public String getName() {
			return name;
		}

		public void setName(final String name) {
			this.name = name;
		}
	}
}

View File

@ -0,0 +1,331 @@
package eu.dnetlib.dhp.rdfconverter.bioschema.model;
import java.util.ArrayList;
import java.util.List;
import com.fasterxml.jackson.annotation.JsonInclude;
@JsonInclude(JsonInclude.Include.NON_NULL)
/**
 * Plain bean describing one protein record in a DataCite-like layout.
 *
 * <p>The class and every nested bean are annotated with {@code JsonInclude.Include.NON_NULL}.
 * All list-valued fields are initialised to empty, mutable lists so that callers can append
 * through the getters without a null check.
 */
public class DataciteProtein {

    private String id;
    private String doi;
    private Types types;
    List<Creators> creators = new ArrayList<>();
    private String publisher;
    private String publicationYear;
    private static final String schemaVersion = "http://datacite.org/schema/kernel-4";
    List<Identifier> identifiers = new ArrayList<>();
    List<RelatedIdentifier> relatedIdentifiers = new ArrayList<>();
    List<AlternateIdentifier> alternateIdentifiers = new ArrayList<>();
    List<Description> descriptions = new ArrayList<>();
    List<Title> titles = new ArrayList<>();
    private List<DataciteDate> dates = new ArrayList<>();
    private List<Subject> subjects = new ArrayList<>();

    /** Resource type pair: a free-text type plus its general category. */
    @JsonInclude(JsonInclude.Include.NON_NULL)
    public static class Types {

        private String resourceType;
        private String resourceTypeGeneral;

        public String getResourceType() {
            return resourceType;
        }

        public void setResourceType(String resourceType) {
            this.resourceType = resourceType;
        }

        public String getResourceTypeGeneral() {
            return resourceTypeGeneral;
        }

        public void setResourceTypeGeneral(String resourceTypeGeneral) {
            this.resourceTypeGeneral = resourceTypeGeneral;
        }
    }

    /** Placeholder bean for creators; it currently declares no properties. */
    @JsonInclude(JsonInclude.Include.NON_NULL)
    public static class Creators {
    }

    /** Primary identifier value together with its type label. */
    @JsonInclude(JsonInclude.Include.NON_NULL)
    public static class Identifier {

        private String identifier;
        private String identifierType;

        public String getIdentifier() {
            return identifier;
        }

        public void setIdentifier(String identifier) {
            this.identifier = identifier;
        }

        public String getIdentifierType() {
            return identifierType;
        }

        public void setIdentifierType(String identifierType) {
            this.identifierType = identifierType;
        }
    }

    /** Identifier of a related resource, with the relation and the identifier type. */
    @JsonInclude(JsonInclude.Include.NON_NULL)
    public static class RelatedIdentifier {

        private String relationType;
        private String relatedIdentifier;
        private String relatedIdentifierType;

        public String getRelationType() {
            return relationType;
        }

        public void setRelationType(String relationType) {
            this.relationType = relationType;
        }

        public String getRelatedIdentifier() {
            return relatedIdentifier;
        }

        public void setRelatedIdentifier(String relatedIdentifier) {
            this.relatedIdentifier = relatedIdentifier;
        }

        public String getRelatedIdentifierType() {
            return relatedIdentifierType;
        }

        public void setRelatedIdentifierType(String relatedIdentifierType) {
            this.relatedIdentifierType = relatedIdentifierType;
        }
    }

    /** Additional identifier of the same record, with an optional type label. */
    @JsonInclude(JsonInclude.Include.NON_NULL)
    public static class AlternateIdentifier {

        private String alternateIdentifier;
        private String alternateIdentifierType;

        public String getAlternateIdentifier() {
            return alternateIdentifier;
        }

        public void setAlternateIdentifier(String alternateIdentifier) {
            this.alternateIdentifier = alternateIdentifier;
        }

        public String getAlternateIdentifierType() {
            return alternateIdentifierType;
        }

        public void setAlternateIdentifierType(String alternateIdentifierType) {
            this.alternateIdentifierType = alternateIdentifierType;
        }
    }

    /** Free-text description with an optional type label. */
    @JsonInclude(JsonInclude.Include.NON_NULL)
    public static class Description {

        private String description;
        private String descriptionType;

        public String getDescription() {
            return description;
        }

        public void setDescription(String description) {
            this.description = description;
        }

        public String getDescriptionType() {
            return descriptionType;
        }

        public void setDescriptionType(String descriptionType) {
            this.descriptionType = descriptionType;
        }
    }

    /** Title text with an optional type label. */
    @JsonInclude(JsonInclude.Include.NON_NULL)
    public static class Title {

        private String title;
        private String titleType;

        public String getTitle() {
            return title;
        }

        public void setTitle(String title) {
            this.title = title;
        }

        public String getTitleType() {
            return titleType;
        }

        public void setTitleType(String titleType) {
            this.titleType = titleType;
        }
    }

    /** Date value (kept as a string) with its type label. */
    @JsonInclude(JsonInclude.Include.NON_NULL)
    public static class DataciteDate {

        private String date;
        private String dateType;

        public String getDate() {
            return date;
        }

        public void setDate(String date) {
            this.date = date;
        }

        public String getDateType() {
            return dateType;
        }

        public void setDateType(String dateType) {
            this.dateType = dateType;
        }
    }

    /** Subject entry: a value plus the scheme name and scheme URI it belongs to. */
    @JsonInclude(JsonInclude.Include.NON_NULL)
    public static class Subject {

        private String schemeURI;
        private String value;
        private String subjectScheme;

        public String getSchemeURI() {
            return schemeURI;
        }

        public void setSchemeURI(String schemeURI) {
            this.schemeURI = schemeURI;
        }

        public String getValue() {
            return value;
        }

        public void setValue(String value) {
            this.value = value;
        }

        public String getSubjectScheme() {
            return subjectScheme;
        }

        public void setSubjectScheme(String subjectScheme) {
            this.subjectScheme = subjectScheme;
        }
    }

    public String getId() {
        return id;
    }

    public void setId(String id) {
        this.id = id;
    }

    public String getDoi() {
        return doi;
    }

    public void setDoi(String doi) {
        this.doi = doi;
    }

    public Types getTypes() {
        return types;
    }

    public void setTypes(Types types) {
        this.types = types;
    }

    public List<Creators> getCreators() {
        return creators;
    }

    public void setCreators(List<Creators> creators) {
        this.creators = creators;
    }

    public String getPublisher() {
        return publisher;
    }

    public void setPublisher(String publisher) {
        this.publisher = publisher;
    }

    public String getPublicationYear() {
        return publicationYear;
    }

    public void setPublicationYear(String publicationYear) {
        this.publicationYear = publicationYear;
    }

    /**
     * Returns the constant schema version URI.
     *
     * <p>NOTE(review): this accessor is static and there is no instance-level counterpart, so it is
     * presumably not exposed as a bean property when the object is serialized - confirm whether
     * {@code schemaVersion} is expected in the generated JSON.
     */
    public static String getSchemaVersion() {
        return schemaVersion;
    }

    public List<RelatedIdentifier> getRelatedIdentifiers() {
        return relatedIdentifiers;
    }

    public void setRelatedIdentifiers(List<RelatedIdentifier> relatedIdentifiers) {
        this.relatedIdentifiers = relatedIdentifiers;
    }

    public List<AlternateIdentifier> getAlternateIdentifiers() {
        return alternateIdentifiers;
    }

    public void setAlternateIdentifiers(List<AlternateIdentifier> alternateIdentifiers) {
        this.alternateIdentifiers = alternateIdentifiers;
    }

    public List<Description> getDescriptions() {
        return descriptions;
    }

    public void setDescriptions(List<Description> descriptions) {
        this.descriptions = descriptions;
    }

    public List<Title> getTitles() {
        return titles;
    }

    public void setTitles(List<Title> titles) {
        this.titles = titles;
    }

    public List<Identifier> getIdentifiers() {
        return identifiers;
    }

    public void setIdentifiers(List<Identifier> identifiers) {
        this.identifiers = identifiers;
    }

    public List<DataciteDate> getDates() {
        return dates;
    }

    public void setDates(List<DataciteDate> dates) {
        this.dates = dates;
    }

    public List<Subject> getSubjects() {
        return subjects;
    }

    public void setSubjects(List<Subject> subjects) {
        this.subjects = subjects;
    }
}

View File

@ -0,0 +1,35 @@
package eu.dnetlib.dhp.rdfconverter.utils;
import java.io.ByteArrayInputStream;
import java.io.ByteArrayOutputStream;
import java.io.IOException;
import java.io.StringWriter;
import java.util.zip.GZIPInputStream;
import java.util.zip.GZIPOutputStream;
import org.apache.commons.codec.binary.Base64;
import org.apache.commons.io.IOUtils;
/**
 * Helpers to move text through a "gzip, then Base64" envelope and back.
 *
 * <p>Text is always converted to and from bytes as UTF-8, so the result does not depend on the
 * default charset of the JVM that happens to run the code.
 */
public class CompressorUtil {

    /**
     * Decodes a Base64 string, gunzips the decoded bytes and returns the content as text.
     *
     * @param abstractCompressed Base64 representation of gzip-compressed UTF-8 text
     * @return the decompressed text
     * @throws IllegalArgumentException if the decoded bytes cannot be read as a gzip stream
     */
    public static String decompressValue(final String abstractCompressed) {
        final byte[] byteArray = Base64
            .decodeBase64(abstractCompressed.getBytes(java.nio.charset.StandardCharsets.UTF_8));
        // try-with-resources: the gzip stream is released even when decoding fails half way
        try (GZIPInputStream gis = new GZIPInputStream(new ByteArrayInputStream(byteArray))) {
            return IOUtils.toString(gis, "UTF-8");
        } catch (IOException e) {
            throw new IllegalArgumentException(e);
        }
    }

    /**
     * Gzips the UTF-8 bytes of the given text and returns them Base64-encoded.
     *
     * @param value the text to compress
     * @return Base64 representation of the gzip-compressed text
     * @throws IOException if the compression fails
     */
    public static String compressValue(final String value) throws IOException {
        final ByteArrayOutputStream out = new ByteArrayOutputStream();
        // closing the gzip stream writes the trailer; it must happen before the bytes are read
        try (GZIPOutputStream gzip = new GZIPOutputStream(out)) {
            gzip.write(value.getBytes(java.nio.charset.StandardCharsets.UTF_8));
        }
        return java.util.Base64.getEncoder().encodeToString(out.toByteArray());
    }
}

View File

@ -0,0 +1,43 @@
package eu.dnetlib.dhp.rdfconverter.utils;
import java.io.IOException;
import com.fasterxml.jackson.core.JsonParser;
import com.fasterxml.jackson.core.ObjectCodec;
import com.fasterxml.jackson.databind.DeserializationContext;
import com.fasterxml.jackson.databind.JsonNode;
import com.fasterxml.jackson.databind.deser.std.StdDeserializer;
import eu.dnetlib.dhp.rdfconverter.bioschema.model.BioSchemaProtein;
/**
 * Jackson deserializer that builds a {@link BioSchemaProtein.Link} from either of two JSON shapes:
 * a node exposing an {@code "@id"} member, or any other node, whose text value is used instead.
 */
public class CustomPropertyValueDeserializer
    extends StdDeserializer<BioSchemaProtein.Link> {

    public CustomPropertyValueDeserializer() {
        this(null);
    }

    public CustomPropertyValueDeserializer(Class<?> vc) {
        super(vc);
    }

    /**
     * Reads the current value as a tree and copies its identifier into a new link.
     *
     * @return a link whose id is the text of the {@code "@id"} member when present, otherwise the
     *         text of the node itself
     */
    @Override
    public BioSchemaProtein.Link deserialize(
        JsonParser jsonparser, DeserializationContext context)
        throws IOException {
        final JsonNode node = jsonparser.getCodec().readTree(jsonparser);
        final JsonNode idNode = node.get("@id");
        final BioSchemaProtein.Link link = new BioSchemaProtein.Link();
        link.setId(idNode != null ? idNode.asText() : node.asText());
        return link;
    }
}

View File

@ -0,0 +1,309 @@
package eu.dnetlib.dhp.rdfconverter.utils;
import java.io.IOException;
import java.io.StringReader;
import java.io.StringWriter;
import java.util.*;
import java.util.stream.Collectors;
import org.eclipse.rdf4j.model.Model;
import org.eclipse.rdf4j.rio.RDFFormat;
import org.eclipse.rdf4j.rio.RDFWriter;
import org.eclipse.rdf4j.rio.Rio;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
import com.fasterxml.jackson.databind.DeserializationFeature;
import com.fasterxml.jackson.databind.ObjectMapper;
import com.fasterxml.jackson.databind.module.SimpleModule;
import com.github.jsonldjava.core.JsonLdOptions;
import com.github.jsonldjava.core.JsonLdProcessor;
import com.github.jsonldjava.utils.JsonUtils;
import eu.dnetlib.dhp.rdfconverter.bioschema.model.BioSchemaProtein;
import eu.dnetlib.dhp.rdfconverter.bioschema.model.DataciteProtein;
/**
 * Converts Bioschemas records serialized as N-Quads into DataCite-like JSON documents.
 *
 * <p>The N-Quads text is parsed, rewritten as compacted JSON-LD, bound to {@link BioSchemaProtein}
 * and every entry typed {@code https://schema.org/Protein} is turned into one
 * {@link DataciteProtein}, which is finally serialized to a JSON string.
 */
public class RDFConverter {

    private static final Logger log = LoggerFactory.getLogger(RDFConverter.class);

    private static final String PROTEIN_PROFILE = "Protein";

    private static final String TYPE_PROTEIN = "https://schema.org/Protein";
    private static final String TYPE_SEQUENCE_ANNOTATION = "https://schema.org/SequenceAnnotation";
    private static final String TYPE_PROPERTY_VALUE = "https://schema.org/PropertyValue";
    private static final String TYPE_DEFINED_TERM = "https://schema.org/DefinedTerm";
    private static final String TYPE_COLLECTION_PAGE = "https://schema.org/CollectionPage";

    // Mappers are built once and shared: the configuration never changes after construction.
    private static final ObjectMapper JSONLD_MAPPER = createJsonLdMapper();
    private static final ObjectMapper DATACITE_MAPPER = new ObjectMapper();

    /**
     * Converts one N-Quads document using the given profile.
     *
     * @param nquads  the N-Quads text of one scraped record
     * @param profile the profile name; only {@code "Protein"} is handled
     * @return one JSON string per protein found in the input (possibly empty)
     * @throws RuntimeException if the profile is not {@code "Protein"} (including {@code null})
     * @throws Exception        if parsing or JSON-LD processing fails
     */
    public ArrayList<String> nQuadsFile2DataciteJson(String nquads, String profile) throws Exception {
        // constant-first comparison: a null profile is reported as unsupported instead of an NPE
        if (PROTEIN_PROFILE.equals(profile)) {
            return nQuadsFile2DataciteJson(nquads);
        }
        throw new RuntimeException("Profile not supported");
    }

    /** Runs the Protein conversion: parse, collect lookup tables, attach subjects, serialize. */
    private ArrayList<String> nQuadsFile2DataciteJson(String nquads) throws Exception {
        String compactContent = toCompactJsonLd(nquads);
        log.debug("jsonld: {}", compactContent);

        BioSchemaProtein bioSchemaProtein = JSONLD_MAPPER.readValue(compactContent, BioSchemaProtein.class);
        BioSchemaProtein.DateTimeType retrievedOnType = bioSchemaProtein.getRetrievedOn();
        List<BioSchemaProtein.Entry> entries = bioSchemaProtein.getEntryList() != null
            ? bioSchemaProtein.getEntryList()
            : new ArrayList<>();

        // every citation found anywhere in the document is attached to every protein
        List<String> citations = entries
            .stream()
            .map(BioSchemaProtein.Entry::getCitation)
            .filter(Objects::nonNull)
            .map(BioSchemaProtein.Citation::getId)
            .filter(Objects::nonNull)
            .collect(Collectors.toList());

        ArrayList<String> results = new ArrayList<>();
        final List<DataciteProtein> dataciteProteins = new ArrayList<>();
        final Map<String, List<BioSchemaProtein.Link>> sequenceAnnotations = new HashMap<>();
        final Map<String, String> propertyValues = new HashMap<>();
        final Map<String, BioSchemaProtein.DefinedTerm> definedTerms = new HashMap<>();
        // insertion-ordered so that proteins are processed in document order
        final Map<String, BioSchemaProtein.Entry> bioschemaProteins = new LinkedHashMap<>();
        final List<String> mainTitles = new ArrayList<>();

        for (BioSchemaProtein.Entry entry : entries) {
            if (hasType(entry, TYPE_PROTEIN)) {
                dataciteProteins.add(buildDataciteProtein(entry, citations, retrievedOnType));
                bioschemaProteins.put(entry.getId(), entry);
                mainTitles.add(" " + entry.getName() + " ");
            } else if (hasType(entry, TYPE_SEQUENCE_ANNOTATION)) {
                if (entry.getSequenceAnnotation() != null) {
                    sequenceAnnotations.put(entry.getId(), entry.getSequenceAnnotation());
                }
            } else if (hasType(entry, TYPE_PROPERTY_VALUE)) {
                if (entry.getPropertyValue() != null) {
                    propertyValues.put(entry.getId(), entry.getPropertyValue().getId());
                }
            } else if (hasType(entry, TYPE_DEFINED_TERM)) {
                BioSchemaProtein.DefinedTerm term = new BioSchemaProtein.DefinedTerm();
                term.setId(entry.getId());
                term.setTermCode(entry.getTermCode());
                term.setName(entry.getName());
                definedTerms.put(term.getId(), term);
            } else if (hasType(entry, TYPE_COLLECTION_PAGE)) {
                mainTitles.add(entry.getName());
            }
        }

        attachSubjects(bioschemaProteins, dataciteProteins, sequenceAnnotations, propertyValues, definedTerms);
        removeDuplicatedSubjects(dataciteProteins);

        for (DataciteProtein d : dataciteProteins) {
            // NOTE(review): every protein receives the first collected title, i.e. the name of the
            // first Protein/CollectionPage entry of the document - confirm this is intended when a
            // document holds more than one protein.
            DataciteProtein.Title title = new DataciteProtein.Title();
            title.setTitle(d.getId() + " - ".concat(mainTitles.get(0)));
            d.getTitles().add(title);
        }
        for (DataciteProtein d : dataciteProteins) {
            try {
                results.add(DATACITE_MAPPER.writeValueAsString(d));
            } catch (IOException e) {
                throw new RuntimeException(e);
            }
        }

        if (dataciteProteins.isEmpty()) {
            log.error("No Protein data found: {}", nquads);
        }
        return results;
    }

    /** Builds the mapper used to bind compacted JSON-LD; it is lenient about unknown/missing data. */
    private static ObjectMapper createJsonLdMapper() {
        ObjectMapper objectMapper = new ObjectMapper();
        objectMapper.enable(DeserializationFeature.ACCEPT_SINGLE_VALUE_AS_ARRAY);
        objectMapper.enable(DeserializationFeature.ACCEPT_EMPTY_STRING_AS_NULL_OBJECT);
        objectMapper.configure(DeserializationFeature.FAIL_ON_UNKNOWN_PROPERTIES, false);
        objectMapper.configure(DeserializationFeature.FAIL_ON_INVALID_SUBTYPE, false);
        objectMapper.configure(DeserializationFeature.FAIL_ON_MISSING_CREATOR_PROPERTIES, false);
        return objectMapper;
    }

    /** Parses N-Quads text and returns the same data as a compacted JSON-LD string. */
    private static String toCompactJsonLd(String nquads) throws Exception {
        Model model = Rio.parse(new StringReader(nquads), "", RDFFormat.NQUADS);
        StringWriter jsonLDWriter = new StringWriter();
        RDFWriter rdfRecordWriter = Rio.createWriter(RDFFormat.JSONLD, jsonLDWriter);
        Rio.write(model, rdfRecordWriter);
        Object jsonObject = JsonUtils.fromString(jsonLDWriter.toString());
        Object compact = JsonLdProcessor.compact(jsonObject, new HashMap<>(), new JsonLdOptions());
        return JsonUtils.toString(compact);
    }

    /** Tells whether the entry declares exactly the given type; entries without a type never match. */
    private static boolean hasType(BioSchemaProtein.Entry entry, String schemaType) {
        return schemaType.equals(entry.getType());
    }

    /** Maps one Protein entry to its DataCite representation (subjects and main title excluded). */
    private DataciteProtein buildDataciteProtein(BioSchemaProtein.Entry entry, List<String> citations,
        BioSchemaProtein.DateTimeType retrievedOn) {
        DataciteProtein dataciteProtein = new DataciteProtein();

        citations.forEach(citation -> addRelatedIdentifier(dataciteProtein, citation, "IsCitedBy"));

        DataciteProtein.Types types = new DataciteProtein.Types();
        types.setResourceType("Protein");
        types.setResourceTypeGeneral("Dataset");
        dataciteProtein.setTypes(types);

        if (retrievedOn != null) {
            DataciteProtein.DataciteDate dataciteDate = new DataciteProtein.DataciteDate();
            dataciteDate.setDate(retrievedOn.getValue());
            dataciteDate.setDateType("Collected");
            dataciteProtein.getDates().add(dataciteDate);
        } else {
            log.warn("Retrieval date not found for {}", entry.getId());
        }

        DataciteProtein.Identifier identifier = new DataciteProtein.Identifier();
        identifier.setIdentifier(entry.getId());
        identifier.setIdentifierType("URL");
        dataciteProtein.getIdentifiers().add(identifier);

        addAlternateIdentifier(dataciteProtein, entry.getIdentifier());
        if (entry.getDescription() != null) {
            DataciteProtein.Description description = new DataciteProtein.Description();
            description.setDescription(entry.getDescription());
            dataciteProtein.getDescriptions().add(description);
        }
        // added exactly once: a second, identical addition further down used to duplicate it
        addRelatedIdentifier(dataciteProtein, entry.getIsEncodedByBioChemEntity(), "");
        addAlternateIdentifier(dataciteProtein, entry.getUrl());
        if (entry.getAlternateName() != null) {
            DataciteProtein.Title title = new DataciteProtein.Title();
            title.setTitle(entry.getAlternateName());
            title.setTitleType("AlternativeTitle");
            dataciteProtein.getTitles().add(title);
        }
        if (entry.getBioChemInteraction() != null) {
            entry
                .getBioChemInteraction()
                .stream()
                .filter(Objects::nonNull)
                .forEach(bc -> addRelatedIdentifier(dataciteProtein, bc.getId(), ""));
        }
        if (entry.getBioChemSimilarity() != null) {
            entry
                .getBioChemSimilarity()
                .stream()
                .filter(Objects::nonNull)
                .forEach(bc -> addRelatedIdentifier(dataciteProtein, bc.getId(), ""));
        }
        addRelatedIdentifier(dataciteProtein, entry.getHasMolecularFunction(), "");
        addRelatedIdentifier(dataciteProtein, entry.getIsInvolvedInBiologicalProcess(), "");
        if (entry.getIsPartOfBioChemEntity() != null) {
            addRelatedIdentifier(dataciteProtein, entry.getIsPartOfBioChemEntity().getUrl(), "");
        }
        if (entry.getSameAs() != null) {
            entry
                .getSameAs()
                .stream()
                .filter(Objects::nonNull)
                .forEach(sameAs -> addRelatedIdentifier(dataciteProtein, sameAs.getId(), "IsIdenticalTo"));
        }
        if (entry.getAssociatedDisease() != null) {
            entry
                .getAssociatedDisease()
                .stream()
                .filter(Objects::nonNull)
                .forEach(ad -> addRelatedIdentifier(dataciteProtein, ad.getName(), "IsIdenticalTo"));
        }

        // the record id is the last path segment of the entry URL; it stays empty when unavailable
        String proteinId = "";
        try {
            String[] identifierParts = entry.getId().split("/");
            proteinId = identifierParts[identifierParts.length - 1];
        } catch (Exception e) {
            log.error("Identifier not found", e);
        }
        dataciteProtein.setId(proteinId);
        return dataciteProtein;
    }

    /**
     * Follows protein -> sequence annotation -> property value -> defined term and adds one
     * subject per reachable term to the DataCite records whose first identifier equals the
     * protein id. Links that cannot be resolved are silently skipped.
     */
    private static void attachSubjects(Map<String, BioSchemaProtein.Entry> bioschemaProteins,
        List<DataciteProtein> dataciteProteins,
        Map<String, List<BioSchemaProtein.Link>> sequenceAnnotations,
        Map<String, String> propertyValues,
        Map<String, BioSchemaProtein.DefinedTerm> definedTerms) {
        for (Map.Entry<String, BioSchemaProtein.Entry> bioProtein : bioschemaProteins.entrySet()) {
            if (bioProtein.getValue().getHasSequenceAnnotation() == null) {
                continue;
            }
            List<DataciteProtein> targets = dataciteProteins
                .stream()
                .filter(dc -> Objects.equals(dc.getIdentifiers().get(0).getIdentifier(), bioProtein.getKey()))
                .collect(Collectors.toList());
            bioProtein
                .getValue()
                .getHasSequenceAnnotation()
                .stream()
                .filter(Objects::nonNull)
                .map(annotation -> annotation.getId())
                .filter(Objects::nonNull)
                .distinct()
                .map(sequenceAnnotations::get)
                .filter(Objects::nonNull)
                .flatMap(Collection::stream)
                .filter(Objects::nonNull)
                .map(link -> propertyValues.get(link.getId()))
                .filter(Objects::nonNull)
                .map(definedTerms::get)
                .filter(Objects::nonNull)
                .forEach(term -> targets.forEach(d -> d.getSubjects().add(toSubject(term))));
        }
    }

    /** Creates a subject from a defined term (id -> scheme URI, name -> value, code -> scheme). */
    private static DataciteProtein.Subject toSubject(BioSchemaProtein.DefinedTerm term) {
        DataciteProtein.Subject subject = new DataciteProtein.Subject();
        subject.setSchemeURI(term.getId());
        subject.setValue(term.getName());
        subject.setSubjectScheme(term.getTermCode());
        return subject;
    }

    /** Keeps, for every record, only the first subject seen for each subject value. */
    private static void removeDuplicatedSubjects(List<DataciteProtein> dataciteProteins) {
        for (DataciteProtein d : dataciteProteins) {
            if (d.getSubjects() == null || d.getSubjects().isEmpty()) {
                continue;
            }
            // LinkedHashMap: survivors keep the order in which they were first added
            Map<String, DataciteProtein.Subject> cleanedSubjects = new LinkedHashMap<>();
            d.getSubjects().forEach(s -> cleanedSubjects.putIfAbsent(s.getValue(), s));
            d.setSubjects(new ArrayList<>(cleanedSubjects.values()));
        }
    }

    /**
     * Appends a related identifier to the record; a {@code null} value is ignored.
     *
     * @param dataciteProtein        the record to extend
     * @param relatedIdentifierValue the identifier; typed "URL" when it contains an http(s) prefix
     * @param relationType           the relation name; left unset when {@code null} or empty
     */
    private void addRelatedIdentifier(DataciteProtein dataciteProtein, String relatedIdentifierValue,
        String relationType) {
        if (relatedIdentifierValue == null) {
            return;
        }
        DataciteProtein.RelatedIdentifier relatedIdentifier = new DataciteProtein.RelatedIdentifier();
        relatedIdentifier.setRelatedIdentifier(relatedIdentifierValue);
        if (relationType != null && !relationType.isEmpty()) {
            relatedIdentifier.setRelationType(relationType);
        }
        if (relatedIdentifierValue.contains("http://") || relatedIdentifierValue.contains("https://")) {
            relatedIdentifier.setRelatedIdentifierType("URL");
        }
        dataciteProtein.getRelatedIdentifiers().add(relatedIdentifier);
    }

    /** Appends an alternate identifier to the record; a {@code null} value is ignored. */
    private void addAlternateIdentifier(DataciteProtein dataciteProtein, String alternateIdentifierValue) {
        if (alternateIdentifierValue == null) {
            return;
        }
        DataciteProtein.AlternateIdentifier alternateIdentifier = new DataciteProtein.AlternateIdentifier();
        alternateIdentifier.setAlternateIdentifier(alternateIdentifierValue);
        dataciteProtein.getAlternateIdentifiers().add(alternateIdentifier);
    }
}

View File

@ -0,0 +1,32 @@
[
{
"paramName": "n",
"paramLongName": "nameNode",
"paramDescription": "the Name Node URI",
"paramRequired": true
},
{
"paramName": "w",
"paramLongName": "workingPath",
"paramDescription": "the working path",
"paramRequired": true
},
{
"paramName": "i",
"paramLongName": "rdfInput",
"paramDescription": "text file inside working path that contains base64-encoded gzipped rdf (N-Quads) records",
"paramRequired": true
},
{
"paramName": "o",
"paramLongName": "output",
"paramDescription": "relative path inside workingpath where bioschema dataset in datacite format will be stored",
"paramRequired": true
},
{
"paramName": "p",
"paramLongName": "profile",
"paramDescription": "the input data profile that has to be used for conversion (https://bioschemas.org/profiles/)",
"paramRequired": true
}
]

View File

@ -0,0 +1,65 @@
<configuration>
<!-- OCEAN -->
<!-- <property>-->
<!-- <name>jobTracker</name>-->
<!-- <value>yarnRM</value>-->
<!-- </property>-->
<!-- <property>-->
<!-- <name>nameNode</name>-->
<!-- <value>hdfs://nameservice1</value>-->
<!-- </property>-->
<!-- <property>-->
<!-- <name>hive_metastore_uris</name>-->
<!-- <value>thrift://iis-cdh5-test-m3.ocean.icm.edu.pl:9083</value>-->
<!-- </property>-->
<!-- <property>-->
<!-- <name>spark2YarnHistoryServerAddress</name>-->
<!-- <value>http://iis-cdh5-test-gw.ocean.icm.edu.pl:18089</value>-->
<!-- </property>-->
<!-- GARR -->
<property>
<name>jobTracker</name>
<value>hadoop-rm3.garr-pa1.d4science.org:8032</value>
</property>
<property>
<name>nameNode</name>
<value>hdfs://hadoop-rm1.garr-pa1.d4science.org:8020</value>
</property>
<property>
<name>hive_metastore_uris</name>
<value>thrift://hadoop-edge3.garr-pa1.d4science.org:9083</value>
</property>
<property>
<name>spark2YarnHistoryServerAddress</name>
<value>http://hadoop-rm2.garr-pa1.d4science.org:19888</value>
</property>
<property>
<name>oozie.launcher.mapreduce.user.classpath.first</name>
<value>true</value>
</property>
<property>
<name>oozie.use.system.libpath</name>
<value>true</value>
</property>
<property>
<name>oozie.action.sharelib.for.spark</name>
<value>spark2</value>
</property>
<property>
<name>spark2EventLogDir</name>
<value>/user/spark/spark2ApplicationHistory</value>
</property>
<property>
<name>spark2ExtraListeners</name>
<value>"com.cloudera.spark.lineage.NavigatorAppListener"</value>
</property>
<property>
<name>spark2SqlQueryExecutionListeners</name>
<value>"com.cloudera.spark.lineage.NavigatorQueryListener"</value>
</property>
</configuration>

View File

@ -0,0 +1,3 @@
#!/bin/bash
# Downloads the base64/gzipped N-Quads dump of one bioschemas datasource from the scraping
# service and stores it on HDFS as <target dir>/base64_gzipped_nquads.txt.
#
# Usage: download_nquads.sh <datasourceKey> [hdfsTargetDir]
#   datasourceKey  key passed to the getNQuads endpoint
#   hdfsTargetDir  HDFS directory receiving the file (default: /data/bioschema/mobidb)
#
# The script stops at the first failing command and returns its exit status, so a failed
# download or a failed HDFS copy is reported to the caller instead of being hidden.
set -euo pipefail

if [ "$#" -lt 1 ] || [ -z "$1" ]; then
    echo "usage: $0 <datasourceKey> [hdfsTargetDir]" >&2
    exit 1
fi

datasource_key="$1"
target_dir="${2:-/data/bioschema/mobidb}"
target_dir="${target_dir%/}"

# unique local file: concurrent runs must not overwrite each other's download
local_file="$(mktemp /tmp/base64_gzipped_nquads.XXXXXX)"
trap 'rm -f "$local_file"' EXIT

# the URL is quoted because it contains '?', which the shell would otherwise treat as a glob
wget -O "$local_file" "https://hadoop-bioschemas-ds.garr-pa1.d4science.org/bioschemas-api/api/getNQuads?datasourceKey=${datasource_key}"

hdfs dfs -mkdir -p "${target_dir}"
# -f replaces the file left by a previous run; without it the copy fails when the file exists
hdfs dfs -copyFromLocal -f "$local_file" "${target_dir}/base64_gzipped_nquads.txt"

View File

@ -0,0 +1,118 @@
<workflow-app name="RdfConverter" xmlns="uri:oozie:workflow:0.5">
<parameters>
<property>
<name>bioschemas_datasource_key</name>
<value>mobidb</value>
<description>bioschemas datasource key (i.e. mobidb, ped, disprot)</description>
</property>
<property>
<name>workingPath</name>
<value>/data/bioschema/mobidb/</value>
<description>the working path</description>
</property>
<property>
<name>rdfInput</name>
<value>base64_gzipped_nquads.txt</value>
<description>rdf output of scraping workflow</description>
</property>
<property>
<name>output</name>
<value>json-datacite/</value>
</property>
<property>
<name>profile</name>
<value>Protein</value>
<description>the input data profile that has to be used for conversion (https://bioschemas.org/profiles/)</description>
</property>
<property>
<name>oozie.launcher.mapreduce.map.java.opts</name>
<value>-Xmx4g</value>
</property>
<property>
<name>spark2RdfConversionMaxExecutors</name>
<value>50</value>
</property>
<property>
<name>sparkDriverMemory</name>
<value>7G</value>
<description>memory for driver process</description>
</property>
<property>
<name>sparkExecutorMemory</name>
<value>2G</value>
<description>memory for individual executor</description>
</property>
<property>
<name>sparkExecutorCores</name>
<value>4</value>
<description>number of cores used by single executor</description>
</property>
<property>
<name>spark2ExtraListeners</name>
<value>com.cloudera.spark.lineage.NavigatorAppListener</value>
<description>spark 2.* extra listeners classname</description>
</property>
<property>
<name>spark2YarnHistoryServerAddress</name>
<description>spark 2.* yarn history server address</description>
</property>
<property>
<name>spark2EventLogDir</name>
<description>spark 2.* event log dir location</description>
</property>
</parameters>
<start to="DownloadNQuads"/>
<kill name="Kill">
<message>Action failed, error message[${wf:errorMessage(wf:lastErrorNode())}]</message>
</kill>
<action name="DownloadNQuads">
<shell xmlns="uri:oozie:shell-action:0.1">
<job-tracker>${jobTracker}</job-tracker>
<name-node>${nameNode}</name-node>
<exec>download_nquads.sh</exec>
<argument>${bioschemas_datasource_key}</argument>
<file>download_nquads.sh</file>
<capture-output/>
</shell>
<ok to="ResetWorkingPath"/>
<error to="Kill"/>
</action>
<action name="ResetWorkingPath">
<fs>
<delete path='${workingPath}${output}'/>
</fs>
<ok to="NquadsToDataciteJson"/>
<error to="Kill"/>
</action>
<action name="NquadsToDataciteJson">
    <!-- Spark job converting the downloaded N-Quads into DataCite JSON under ${workingPath}${output} -->
    <spark xmlns="uri:oozie:spark-action:0.2">
        <master>yarn-cluster</master>
        <mode>cluster</mode>
        <name>NquadsToDataciteJson</name>
        <class>eu.dnetlib.dhp.rdfconverter.bioschema.SparkRdfToDatacite</class>
        <jar>dhp-rdfconverter-${projectVersion}.jar</jar>
        <!-- NOTE(review): the workflow parameter spark2RdfConversionMaxExecutors is declared but not
             referenced by these options; confirm whether an executor limit was meant to be set here. -->
        <spark-opts>
            --executor-cores=${sparkExecutorCores}
            --executor-memory=${sparkExecutorMemory}
            --driver-memory=${sparkDriverMemory}
            --conf spark.extraListeners=${spark2ExtraListeners}
            --conf spark.yarn.historyServer.address=${spark2YarnHistoryServerAddress}
            --conf spark.eventLog.dir=${nameNode}${spark2EventLogDir}
        </spark-opts>
        <arg>--nameNode</arg><arg>${nameNode}</arg>
        <arg>--workingPath</arg><arg>${workingPath}</arg>
        <arg>--rdfInput</arg><arg>${rdfInput}</arg>
        <arg>--output</arg><arg>${output}</arg>
        <arg>--profile</arg><arg>${profile}</arg>
    </spark>
    <ok to="End"/>
    <error to="Kill"/>
</action>
<end name="End"/>
</workflow-app>

View File

@ -0,0 +1,9 @@
# Set root logger level to INFO and its only appender to A1.
log4j.rootLogger=INFO, A1
# A1 is set to be a ConsoleAppender.
log4j.appender.A1=org.apache.log4j.ConsoleAppender
# A1 uses PatternLayout.
log4j.appender.A1.layout=org.apache.log4j.PatternLayout
log4j.appender.A1.layout.ConversionPattern=%-4r [%t] %-5p %c %x - %m%n

View File

@ -0,0 +1,64 @@
package eu.dnetlib.dhp.rdfconverter.bioschema;
import java.io.InputStream;
import java.util.ArrayList;
import org.apache.commons.io.IOUtils;
import org.junit.jupiter.api.Test;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
import eu.dnetlib.dhp.rdfconverter.utils.CompressorUtil;
import eu.dnetlib.dhp.rdfconverter.utils.RDFConverter;
public class ConverterTest {
static Logger logger = LoggerFactory.getLogger(ConverterTest.class);
@Test
public void disprotToDataciteTest() throws Exception {
InputStream is = ConverterTest.class.getResourceAsStream("/eu/dnetlib/dhp/rdfconverter/bioschema/disprot.nq");
String nq = IOUtils.toString(is);
RDFConverter converter = new RDFConverter();
ArrayList<String> results = converter.nQuadsFile2DataciteJson(nq, "Protein");
results.stream().forEach(r -> {
logger.info("JSON DATACITE >> " + r);
});
}
@Test
public void pedCitationTest() throws Exception {
InputStream is = ConverterTest.class.getResourceAsStream("/eu/dnetlib/dhp/rdfconverter/bioschema/ped.nq");
String nq = IOUtils.toString(is);
RDFConverter converter = new RDFConverter();
ArrayList<String> results = converter.nQuadsFile2DataciteJson(nq, "Protein");
results.stream().forEach(r -> {
logger.info("JSON DATACITE >> " + r);
});
}
@Test
public void mobidbToDataciteTest() throws Exception {
InputStream is = ConverterTest.class.getResourceAsStream("/eu/dnetlib/dhp/rdfconverter/bioschema/mobidb.nq");
String nq = IOUtils.toString(is);
RDFConverter converter = new RDFConverter();
ArrayList<String> results = converter.nQuadsFile2DataciteJson(nq, "Protein");
results.stream().forEach(r -> {
logger.info("JSON DATACITE >> " + r);
});
}
@Test
public void decompressTest() throws Exception {
InputStream is = ConverterTest.class
.getResourceAsStream("/eu/dnetlib/dhp/rdfconverter/bioschema/base64_gzipped_nquads.txt");
String base64_gzipped_nquads = IOUtils.toString(is);
String nq = CompressorUtil.decompressValue(base64_gzipped_nquads);
RDFConverter converter = new RDFConverter();
ArrayList<String> results = converter.nQuadsFile2DataciteJson(nq, "Protein");
results.stream().forEach(r -> {
logger.info("JSON DATACITE >> " + r);
});
}
}

View File

@ -0,0 +1 @@
H4sIAAAAAAAAANVY23KjOBB9369wOc+2uNhJ7EqlipiLVQgGkBbGL7OFQbZVayMv4Hj89yOMk2GSSc3O+FLJG0Kt0+d0S92Cu0VZroshAFPGi2RBV3HR5fkcJHm8XYJHGaz4lKVT4Em9a1UGiqQoUk9WgXTfuquWipXrTb7cr1nHjyCnZc7oI03NnK8ONhV8DbM3q6HuW92/7s7l/FN232pX5h2p15FVIitDRR325faXL08Lt9ttd6vulyqSJIPPDsJ7CldpXFLCVvQcDJOcCvQ0YuWiEZy5GG6m3YSvwDjq4Igi8OD8jQ0haEnjghagjOdA6va7yg+kGkH1ZUW9bXhtyJMHgwGQFCCikaezTrHLyvhrJyuuyt2aNljU+uoU5bykLGtM/r7+/8fzOTppAkqarwqQ8GzGxQPhb7tf53zGliIuB6IiNrLcCQxkaNg4N+sXsVrExQPjHl/uVjTH9L8NzRIR1rbj6tD2EYpcy0BuiEIMdQ+byLEt7AUG1EIUwCAUj2SCQnfieAhGrg1tYYNN3UNEx4Y9MSPTGLs28aAXuRMvtEJk6iOkWTbWiEkINg3XD209RMQUgGMUOpaOkecRCD2oYWwTXzNsATP2I9sPRyZEriVea9DBCIeuoQVi1sIhJIFr+roJDYgFD4xx4AVjKGhBn+CAYIuYAcS+QMYOsULXI8jWoWHpEOmhbVjQtVw9dEI48i0B4kVjB6GJjibYRoGQZJloAgkKPWhblm4LbgZqXzZZLKVZyWaM5iJDT/PfX9aea6xhjXNpglmy3KQ0hZkel+Lolw2eDYgr4UXqSIMLs8viqiy2tU3J14t4vmut6/PX6l+YSCGIaMWLMrLJWMVnb3B4fg1yCXaivvKMr1gSxNmcHuH8ddsEfeXmWr3t9W5OpekPSuvR/WVUtUH2SCOe/3smHaeI7dE6dTpjGU2JaGzvWOarEtSgjasKdErn8uCmr6rXN/3bjxORX1abw4HfgX5/oAyUD6rsZ73wSdnwQyt7vmhO+ZJN8zjf7W3EELijB0gqkf98NIXVdXnE06oh19RP1YPPT13k4kVmhE+elXzJ54fUHAZ1frTPn9z3d7ZelbJT9ovjCu/Zpf78Ylglq7UvGe9oL/6K+/fNeHC45nkZv7klmbgbPW/KM1wsn36PvP2FXLJyuf/CFIv0hyMj/Q0PBaE5ARIAAA==

View File

@ -0,0 +1,52 @@
<https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> <http://purl.org/pav/retrievedFrom> <https://disprot.org/DP01454> .
<https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> <http://purl.org/pav/retrievedOn> "2021-11-25T12:23:57"^^<http://www.w3.org/2001/XMLSchema#dateTime> .
<https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> <http://purl.org/pav/createdWith> <https://github.com/HW-SWeL/BMUSE/releases/tag/0.5.2> .
<https://disprot.org/DP01454> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/Protein> <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> .
<https://disprot.org/DP01454> <http://purl.org/dc/terms/conformsTo> <https://bioschemas.org/profiles/Protein/0.11-RELEASE> <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> .
<https://disprot.org/DP01454> <https://schema.org/hasBioPolymerSequence> "MSTLFPSLFPRVTETLWFNLDRPCVEETELQQQEQQHQAWLQSIAEKDNNLVPIGKPASEHYDDEEEEDDEDDEDSEEDSEDDEDMQDMDEMNDYNESPDDGEVNEVDMEGNEQDQDQWMI" <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> .
<https://disprot.org/DP01454> <https://schema.org/hasSequenceAnnotation> <https://disprot.org/DP01454#disorder-content> <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> .
<https://disprot.org/DP01454> <https://schema.org/hasSequenceAnnotation> <https://disprot.org/DP01454r001> <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> .
<https://disprot.org/DP01454> <https://schema.org/identifier> "https://identifiers.org/disprot:DP01454" <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> .
<https://disprot.org/DP01454> <https://schema.org/includedInDataset> "https://disprot.org/#2021-08" <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> .
<https://disprot.org/DP01454> <https://schema.org/name> "Anaphase-promoting complex subunit 15" <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> .
<https://disprot.org/DP01454> <https://schema.org/sameAs> <http://purl.uniprot.org/uniprot/P60006> <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> .
<https://disprot.org/DP01454> <https://schema.org/taxonomicRange> <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0/disprot.org/DP01454/200140588> <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> .
<https://bioschemas.org/profiles/Protein/0.11-RELEASE> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/CreativeWork> <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> .
<https://disprot.org/DP01454#disorder-content> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/SequenceAnnotation> <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> .
<https://disprot.org/DP01454#disorder-content> <https://schema.org/additionalProperty> <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0/disprot.org/DP01454/159543474> <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> .
<https://disprot.org/DP01454#disorder-content> <https://schema.org/sequenceLocation> <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0/disprot.org/DP01454/77094838> <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> .
<https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0/disprot.org/DP01454/159543474> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/PropertyValue> <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> .
<https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0/disprot.org/DP01454/159543474> <https://schema.org/name> "Protein disorder content" <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> .
<https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0/disprot.org/DP01454/159543474> <https://schema.org/propertyID> <https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00499> <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> .
<https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0/disprot.org/DP01454/159543474> <https://schema.org/value> "5.371900826446281E-1" <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> .
<https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0/disprot.org/DP01454/77094838> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/SequenceRange> <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> .
<https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0/disprot.org/DP01454/77094838> <https://schema.org/rangeEnd> "121" <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> .
<https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0/disprot.org/DP01454/77094838> <https://schema.org/rangeStart> "1" <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> .
<https://disprot.org/DP01454r001> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/SequenceAnnotation> <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> .
<https://disprot.org/DP01454r001> <https://schema.org/additionalProperty> <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0/disprot.org/DP01454/1595402293> <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> .
<https://disprot.org/DP01454r001> <https://schema.org/sequenceLocation> <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0/disprot.org/DP01454/1951282934> <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> .
<https://disprot.org/DP01454r001> <https://schema.org/subjectOf> <https://identifiers.org/pubmed:26083744> <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> .
<https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0/disprot.org/DP01454/1595402293> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/PropertyValue> <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> .
<https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0/disprot.org/DP01454/1595402293> <https://schema.org/name> "Term" <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> .
<https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0/disprot.org/DP01454/1595402293> <https://schema.org/value> <https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00076> <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> .
<https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00076> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/DefinedTerm> <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> .
<https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00076> <https://schema.org/inDefinedTermSet> <https://disprot.org/assets/data/IDPO_v0.2.owl> <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> .
<https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00076> <https://schema.org/name> "disorder" <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> .
<https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00076> <https://schema.org/termCode> "IDPO:00076" <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> .
<https://disprot.org/assets/data/IDPO_v0.2.owl> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/DefinedTermSet> <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> .
<https://disprot.org/assets/data/IDPO_v0.2.owl> <https://schema.org/name> "IDP ontology" <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> .
<https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0/disprot.org/DP01454/1951282934> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/SequenceRange> <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> .
<https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0/disprot.org/DP01454/1951282934> <https://schema.org/rangeEnd> "121" <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> .
<https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0/disprot.org/DP01454/1951282934> <https://schema.org/rangeStart> "57" <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> .
<https://identifiers.org/pubmed:26083744> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/ScholarlyArticle> <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> .
<https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0/disprot.org/DP01454/200140588> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/DefinedTerm> <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> .
<https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0/disprot.org/DP01454/200140588> <https://schema.org/inDefinedTermSet> <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0/disprot.org/DP01454/827138196> <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> .
<https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0/disprot.org/DP01454/200140588> <https://schema.org/sameAs> <http://purl.uniprot.org/taxonomy/9606> <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> .
<https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0/disprot.org/DP01454/200140588> <https://schema.org/sameAs> <https://identifiers.org/taxonomy:9606> <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> .
<https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0/disprot.org/DP01454/200140588> <https://schema.org/sameAs> <http://purl.obolibrary.org/obo/NCBITaxon_9606> <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> .
<https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0/disprot.org/DP01454/200140588> <https://schema.org/termCode> "9606" <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> .
<https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0/disprot.org/DP01454/200140588> <https://schema.org/url> <http://purl.bioontology.org/ontology/NCBITAXON/9606> <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> .
<https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0/disprot.org/DP01454/827138196> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/DefinedTermSet> <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> .
<https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0/disprot.org/DP01454/827138196> <https://schema.org/name> "NCBI taxon" <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> .
<https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0/disprot.org/DP01454/827138196> <https://schema.org/url> <https://bioportal.bioontology.org/ontologies/NCBITAXON> <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> .
<https://disprot.org/DP01454> <http://purl.org/dc/terms/title> "DisProt" <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> .

View File

@ -0,0 +1,118 @@
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> <http://purl.org/pav/retrievedFrom> <https://mobidb.org/Q9UPN6> .
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> <http://purl.org/pav/retrievedOn> "2021-12-06T14:49:15"^^<http://www.w3.org/2001/XMLSchema#dateTime> .
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> <http://purl.org/pav/createdWith> <https://github.com/HW-SWeL/BMUSE/releases/tag/0.5.2> .
<https://mobidb.org/Q9UPN6> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/Protein> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://mobidb.org/Q9UPN6> <http://purl.org/dc/terms/conformsTo> <https://bioschemas.org/profiles/Protein/0.11-RELEASE> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://mobidb.org/Q9UPN6> <https://schema.org/hasBioPolymerSequence> "MEAVKTFNSELYSLNDYKPPISKAKMTQITKAAIKAIKFYKHVVQSVEKFIQKCKPEYKVPGLYVIDSIVRQSRHQFGQEKDVFAPRFSNNIISTFQNLYRCPGDDKSKIVRVLNLWQKNNVFKSEIIQPLLDMAAGIPPPVVTPVLASTTTAMSNTPGTPVTPVTPANVVQGLPDPWVSQITNTDTLAAVAQILQSPQGQQLQQLIQTLQIQQQKPQPSILQALDAGLVVQLQALTAQLTAAAAAANTLTPLEQGVSFNKKLMDRFDFGEDSEHSEEPKKEIPASQLSHVSESVNNSIFHQIAEQLQQQNLEHLRQQLLEQQQPQKATPQDSQEGTFGSEHSASPSQGSSQQHFLEPEVNLDDSIDIQQQDMDIDEGQDGVEEEVFEQEAKKVAVRSRSRTHSRSRSRSPRKRRSRSRSGSRKRKHRKRSRSRSRERKRKSSRSYSSERRAREREKERQKKGLPPIRSKTLSVCSTTLWVGQVDKKATQQDLTNLFEEFGQIESINMIPPRGCAYVCMVHRQDAFRALQKLSSGSYKIGSKVIKIAWALNKGVKTEYKQFWDVDLGVTYIPWEKVKVDDLEGFAEGGMIDQETVNTEWETVKSSEPVKETVQTTQSPTPVEKETVVTTQAEVFPPPVAMLQIPVAPAVPTVSLVPPAFPVSMPVPPPGFSPIPPPPFLRASFNPSQPPPGFMPPPVPPPVVPPPTIPPVVPTSLVQPSLSMTPETVKDVGFGSLVIPGGSVASNLATSALPAGNVFNAPTKQAEPEEKVPHLIDHQISSGENTRSVIPNDISSNAAILGGQPPNVTSNSGILGVQRPNVSSNSEILGVRPSNVSSSSGIIAAQPPNILNNSGILGIQPPSVSNSSGLLGVLPPNIPNNSGLVGVQPPNVPNTPGLLGTQPPAGPQNLPPLSIPNQRMPTMPMLDIRPGLIPQAPGPRFPLIQPGIPPQRGIPPPSVLDSALHPPPRGPFPPGDIFSQPERPFLAPGRQSVDNVTNPEKRIPLGNDNIQQEGDRDYRFPPIETRESISRPPPVDVRDVVGRPIDPREGPGRPPLDGRDHFGRPPVDIRENLVRPGIDHLGRRDHFGFNPEKPWGHRGDFDEREHRVLPVYGGPKGLHEERGRFRSGNYRFDPRSGPWNRGFGQEVHRDFDDRRRPWERQRDRDDRDFDFCREMNGNRLGRDRIQNTWVPPPHARVFDYFEGATSQRKGDNVPQVNGENTERHAQPPPIPVQNDPELYEKLTSSNEINKEKSDTVADIESEPVVESTETEGT" <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://mobidb.org/Q9UPN6> <https://schema.org/hasSequenceAnnotation> <https://mobidb.org/Q9UPN6#prediction-disorder-content-mobidb_lite> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://mobidb.org/Q9UPN6> <https://schema.org/hasSequenceAnnotation> <https://mobidb.org/Q9UPN6#prediction-disorder-mobidb_lite.270_289> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://mobidb.org/Q9UPN6> <https://schema.org/hasSequenceAnnotation> <https://mobidb.org/Q9UPN6#prediction-disorder-mobidb_lite.322_354> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://mobidb.org/Q9UPN6> <https://schema.org/hasSequenceAnnotation> <https://mobidb.org/Q9UPN6#prediction-disorder-mobidb_lite.384_468> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://mobidb.org/Q9UPN6> <https://schema.org/hasSequenceAnnotation> <https://mobidb.org/Q9UPN6#prediction-disorder-mobidb_lite.808_827> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://mobidb.org/Q9UPN6> <https://schema.org/hasSequenceAnnotation> <https://mobidb.org/Q9UPN6#prediction-disorder-mobidb_lite.899_918> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://mobidb.org/Q9UPN6> <https://schema.org/hasSequenceAnnotation> <https://mobidb.org/Q9UPN6#prediction-disorder-mobidb_lite.945_1064> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://mobidb.org/Q9UPN6> <https://schema.org/hasSequenceAnnotation> <https://mobidb.org/Q9UPN6#prediction-disorder-mobidb_lite.1198_1271> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://mobidb.org/Q9UPN6> <https://schema.org/identifier> "https://identifiers.org/mobidb:Q9UPN6" <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://mobidb.org/Q9UPN6> <https://schema.org/includedInDataset> "https://mobidb.org/#2020-09" <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://mobidb.org/Q9UPN6> <https://schema.org/name> "SR-related and CTD-associated factor 8" <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://mobidb.org/Q9UPN6> <https://schema.org/sameAs> <http://purl.uniprot.org/uniprot/Q9UPN6> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://mobidb.org/Q9UPN6> <https://schema.org/taxonomicRange> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/1444334161> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://bioschemas.org/profiles/Protein/0.11-RELEASE> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/CreativeWork> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://mobidb.org/Q9UPN6#prediction-disorder-content-mobidb_lite> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/SequenceAnnotation> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://mobidb.org/Q9UPN6#prediction-disorder-content-mobidb_lite> <https://schema.org/additionalProperty> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/1018653369> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://mobidb.org/Q9UPN6#prediction-disorder-content-mobidb_lite> <https://schema.org/description> "Protein disorder content predicted by MobiDB-lite" <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://mobidb.org/Q9UPN6#prediction-disorder-content-mobidb_lite> <https://schema.org/sequenceLocation> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/1799426988> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/1018653369> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/PropertyValue> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/1018653369> <https://schema.org/name> "Protein disorder content" <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/1018653369> <https://schema.org/propertyID> <https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00499> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/1018653369> <https://schema.org/value> "2.93E-1" <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/1799426988> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/SequenceRange> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/1799426988> <https://schema.org/rangeEnd> "1271" <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/1799426988> <https://schema.org/rangeStart> "1" <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://mobidb.org/Q9UPN6#prediction-disorder-mobidb_lite.270_289> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/SequenceAnnotation> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://mobidb.org/Q9UPN6#prediction-disorder-mobidb_lite.270_289> <https://schema.org/additionalProperty> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/1828683> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://mobidb.org/Q9UPN6#prediction-disorder-mobidb_lite.270_289> <https://schema.org/description> "Protein disordered region predicted by MobiDB-lite" <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://mobidb.org/Q9UPN6#prediction-disorder-mobidb_lite.270_289> <https://schema.org/sequenceLocation> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/432948463> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/1828683> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/PropertyValue> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/1828683> <https://schema.org/name> "Term" <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/1828683> <https://schema.org/value> <https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00076> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00076> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/DefinedTerm> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00076> <https://schema.org/inDefinedTermSet> <https://disprot.org/assets/data/IDPO_v0.2.owl> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00076> <https://schema.org/name> "Disorder" <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00076> <https://schema.org/termCode> "IDPO:00076" <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://disprot.org/assets/data/IDPO_v0.2.owl> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/DefinedTermSet> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://disprot.org/assets/data/IDPO_v0.2.owl> <https://schema.org/name> "IDP ontology" <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/432948463> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/SequenceRange> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/432948463> <https://schema.org/rangeEnd> "289" <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/432948463> <https://schema.org/rangeStart> "270" <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://mobidb.org/Q9UPN6#prediction-disorder-mobidb_lite.322_354> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/SequenceAnnotation> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://mobidb.org/Q9UPN6#prediction-disorder-mobidb_lite.322_354> <https://schema.org/additionalProperty> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/75870383> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://mobidb.org/Q9UPN6#prediction-disorder-mobidb_lite.322_354> <https://schema.org/description> "Protein disordered region predicted by MobiDB-lite" <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://mobidb.org/Q9UPN6#prediction-disorder-mobidb_lite.322_354> <https://schema.org/sequenceLocation> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/985831280> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/75870383> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/PropertyValue> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/75870383> <https://schema.org/name> "Term" <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/75870383> <https://schema.org/value> <https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00076> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/985831280> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/SequenceRange> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/985831280> <https://schema.org/rangeEnd> "354" <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/985831280> <https://schema.org/rangeStart> "322" <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://mobidb.org/Q9UPN6#prediction-disorder-mobidb_lite.384_468> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/SequenceAnnotation> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://mobidb.org/Q9UPN6#prediction-disorder-mobidb_lite.384_468> <https://schema.org/additionalProperty> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/2027294569> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://mobidb.org/Q9UPN6#prediction-disorder-mobidb_lite.384_468> <https://schema.org/description> "Protein disordered region predicted by MobiDB-lite" <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://mobidb.org/Q9UPN6#prediction-disorder-mobidb_lite.384_468> <https://schema.org/sequenceLocation> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/1332124339> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/2027294569> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/PropertyValue> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/2027294569> <https://schema.org/name> "Term" <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/2027294569> <https://schema.org/value> <https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00076> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/1332124339> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/SequenceRange> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/1332124339> <https://schema.org/rangeEnd> "468" <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/1332124339> <https://schema.org/rangeStart> "384" <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://mobidb.org/Q9UPN6#prediction-disorder-mobidb_lite.808_827> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/SequenceAnnotation> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://mobidb.org/Q9UPN6#prediction-disorder-mobidb_lite.808_827> <https://schema.org/additionalProperty> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/1437016135> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://mobidb.org/Q9UPN6#prediction-disorder-mobidb_lite.808_827> <https://schema.org/description> "Protein disordered region predicted by MobiDB-lite" <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://mobidb.org/Q9UPN6#prediction-disorder-mobidb_lite.808_827> <https://schema.org/sequenceLocation> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/839471977> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/1437016135> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/PropertyValue> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/1437016135> <https://schema.org/name> "Term" <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/1437016135> <https://schema.org/value> <https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00076> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/839471977> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/SequenceRange> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/839471977> <https://schema.org/rangeEnd> "827" <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/839471977> <https://schema.org/rangeStart> "808" <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://mobidb.org/Q9UPN6#prediction-disorder-mobidb_lite.899_918> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/SequenceAnnotation> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://mobidb.org/Q9UPN6#prediction-disorder-mobidb_lite.899_918> <https://schema.org/additionalProperty> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/144111614> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://mobidb.org/Q9UPN6#prediction-disorder-mobidb_lite.899_918> <https://schema.org/description> "Protein disordered region predicted by MobiDB-lite" <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://mobidb.org/Q9UPN6#prediction-disorder-mobidb_lite.899_918> <https://schema.org/sequenceLocation> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/781835543> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/144111614> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/PropertyValue> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/144111614> <https://schema.org/name> "Term" <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/144111614> <https://schema.org/value> <https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00076> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/781835543> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/SequenceRange> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/781835543> <https://schema.org/rangeEnd> "918" <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/781835543> <https://schema.org/rangeStart> "899" <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://mobidb.org/Q9UPN6#prediction-disorder-mobidb_lite.945_1064> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/SequenceAnnotation> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://mobidb.org/Q9UPN6#prediction-disorder-mobidb_lite.945_1064> <https://schema.org/additionalProperty> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/902536730> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://mobidb.org/Q9UPN6#prediction-disorder-mobidb_lite.945_1064> <https://schema.org/description> "Protein disordered region predicted by MobiDB-lite" <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://mobidb.org/Q9UPN6#prediction-disorder-mobidb_lite.945_1064> <https://schema.org/sequenceLocation> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/518954157> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/902536730> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/PropertyValue> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/902536730> <https://schema.org/name> "Term" <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/902536730> <https://schema.org/value> <https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00076> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/518954157> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/SequenceRange> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/518954157> <https://schema.org/rangeEnd> "1064" <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/518954157> <https://schema.org/rangeStart> "945" <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://mobidb.org/Q9UPN6#prediction-disorder-mobidb_lite.1198_1271> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/SequenceAnnotation> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://mobidb.org/Q9UPN6#prediction-disorder-mobidb_lite.1198_1271> <https://schema.org/additionalProperty> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/322445788> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://mobidb.org/Q9UPN6#prediction-disorder-mobidb_lite.1198_1271> <https://schema.org/description> "Protein disordered region predicted by MobiDB-lite" <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://mobidb.org/Q9UPN6#prediction-disorder-mobidb_lite.1198_1271> <https://schema.org/sequenceLocation> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/5118922> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/322445788> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/PropertyValue> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/322445788> <https://schema.org/name> "Term" <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/322445788> <https://schema.org/value> <https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00076> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/5118922> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/SequenceRange> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/5118922> <https://schema.org/rangeEnd> "1271" <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/5118922> <https://schema.org/rangeStart> "1198" <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/1444334161> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/DefinedTerm> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/1444334161> <https://schema.org/inDefinedTermSet> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/569363713> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/1444334161> <https://schema.org/sameAs> <http://purl.uniprot.org/taxonomy/9606> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/1444334161> <https://schema.org/sameAs> <https://identifiers.org/taxonomy:9606> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/1444334161> <https://schema.org/sameAs> <http://purl.obolibrary.org/obo/NCBITaxon_9606> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/1444334161> <https://schema.org/termCode> "9606" <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/1444334161> <https://schema.org/url> <http://purl.bioontology.org/ontology/NCBITAXON/9606> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/569363713> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/DefinedTermSet> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/569363713> <https://schema.org/name> "NCBI taxon" <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/569363713> <https://schema.org/url> <https://bioportal.bioontology.org/ontologies/NCBITAXON> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
<https://mobidb.org/Q9UPN6> <http://purl.org/dc/terms/title> "MobiDB" <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .

View File

@ -0,0 +1,229 @@
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> <http://purl.org/pav/retrievedFrom> <https://proteinensemble.org/PED00014> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> <http://purl.org/pav/retrievedOn> "2021-12-06T11:52:22"^^<http://www.w3.org/2001/XMLSchema#dateTime> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> <http://purl.org/pav/createdWith> <https://github.com/HW-SWeL/BMUSE/releases/tag/0.5.2> .
<https://proteinensemble.org/PED00014> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/CollectionPage> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://proteinensemble.org/PED00014> <https://schema.org/citation> <https://identifiers.org/pubmed:20399186> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://proteinensemble.org/PED00014> <https://schema.org/identifier> "https://identifiers.org/ped:PED00014" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://proteinensemble.org/PED00014> <https://schema.org/includedInDataset> "https://proteinensemble.org/#2021-02-12" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://proteinensemble.org/PED00014> <https://schema.org/mainEntity> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/23786852> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://proteinensemble.org/PED00014> <https://schema.org/name> "Structural ensemble of pSic1 (1-90) phosphorylated at Thr5, Thr33, Thr45, Ser69, Ser76 and Ser80, in complex with SKP1 (4-186) and CDC4 (270-744)" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://identifiers.org/pubmed:20399186> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/ScholarlyArticle> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/23786852> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/ItemList> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/23786852> <https://schema.org/itemListElement> <https://proteinensemble.org/PED00014#P07834_D_0> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/23786852> <https://schema.org/itemListElement> <https://proteinensemble.org/PED00014#P52286_C_0> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/23786852> <https://schema.org/itemListElement> <https://proteinensemble.org/PED00014#P38634_A_1> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/23786852> <https://schema.org/numberOfItems> "3" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://proteinensemble.org/PED00014#P07834_D_0> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/Protein> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://proteinensemble.org/PED00014#P07834_D_0> <http://purl.org/dc/terms/conformsTo> <https://bioschemas.org/profiles/Protein/0.11-RELEASE> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://proteinensemble.org/PED00014#P07834_D_0> <https://schema.org/hasBioPolymerSequence> "LKRDLITSLPFEISLKIFNYLQFEDIINSLGVSQNWNKIIRKSTSLWKKLLISENFVSPKGFNSLNLKLSQKYPKLSQQDRLRLSFLENIFILKNWYNPKFVPQRTTLRGHMTSVITCLQFEDNYVITGADDKMIRVYDSINKKFLLQLSGHDGGVWALKYAHGGILVSGSTDRTVRVWDIKKGCCTHVFKGHNSTVRCLDIVEYKNIKYIVTGSRDNTLHVWKLPKESSVPDHGEEHDYPLVFHTPEENPYFVGVLRGHMASVRTVSGHGNIVVSGSYDNTLIVWDVAQMKCLYILSGHTDRIYSTIYDHERKRCISASMDTTIRIWDLENIWNNGECSYATNSASPCAKILGAMYTLQGHTALVGLLRLSDKFLVSAAADGSIRGWDANDYSRKFSYHHTNLSAITTFYVSDNILVSGSENQFNIYNLRSGKLVHANILKDADQIWSVNFKGKTLVAAVEKDGQSFLEILDFS" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://proteinensemble.org/PED00014#P07834_D_0> <https://schema.org/hasSequenceAnnotation> <https://proteinensemble.org/PED00014#P07834_D_0_270_744> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://proteinensemble.org/PED00014#P07834_D_0> <https://schema.org/identifier> "https://identifiers.org/uniprot:P07834" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://proteinensemble.org/PED00014#P07834_D_0> <https://schema.org/name> "Cell division control protein 4" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://proteinensemble.org/PED00014#P07834_D_0> <https://schema.org/sameAs> <http://purl.uniprot.org/uniprot/P07834> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/profiles/Protein/0.11-RELEASE> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/CreativeWork> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://proteinensemble.org/PED00014#P07834_D_0_270_744> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/SequenceAnnotation> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://proteinensemble.org/PED00014#P07834_D_0_270_744> <https://schema.org/additionalProperty> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/368314152> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://proteinensemble.org/PED00014#P07834_D_0_270_744> <https://schema.org/additionalProperty> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/2096895906> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://proteinensemble.org/PED00014#P07834_D_0_270_744> <https://schema.org/additionalProperty> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1073956941> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://proteinensemble.org/PED00014#P07834_D_0_270_744> <https://schema.org/additionalProperty> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/367565188> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://proteinensemble.org/PED00014#P07834_D_0_270_744> <https://schema.org/additionalProperty> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1109163979> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://proteinensemble.org/PED00014#P07834_D_0_270_744> <https://schema.org/additionalProperty> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/639913980> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://proteinensemble.org/PED00014#P07834_D_0_270_744> <https://schema.org/additionalProperty> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/107821945> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://proteinensemble.org/PED00014#P07834_D_0_270_744> <https://schema.org/additionalProperty> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/2059079389> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://proteinensemble.org/PED00014#P07834_D_0_270_744> <https://schema.org/additionalProperty> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1901071107> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://proteinensemble.org/PED00014#P07834_D_0_270_744> <https://schema.org/additionalProperty> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/274002240> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://proteinensemble.org/PED00014#P07834_D_0_270_744> <https://schema.org/additionalProperty> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/502163975> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://proteinensemble.org/PED00014#P07834_D_0_270_744> <https://schema.org/sequenceLocation> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1565361539> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/368314152> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/PropertyValue> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/368314152> <https://schema.org/name> "Term" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/368314152> <https://schema.org/value> <https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00120> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00120> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/DefinedTerm> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00120> <https://schema.org/inDefinedTermSet> <https://disprot.org/assets/data/IDPO_v0.2.owl> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00120> <https://schema.org/name> "NMR" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00120> <https://schema.org/termCode> "IDPO:00120" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://disprot.org/assets/data/IDPO_v0.2.owl> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/DefinedTermSet> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://disprot.org/assets/data/IDPO_v0.2.owl> <https://schema.org/name> "IDP ontology" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/2096895906> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/PropertyValue> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/2096895906> <https://schema.org/name> "Term" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/2096895906> <https://schema.org/value> <https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00166> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00166> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/DefinedTerm> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00166> <https://schema.org/inDefinedTermSet> <https://disprot.org/assets/data/IDPO_v0.2.owl> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00166> <https://schema.org/name> "RDC" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00166> <https://schema.org/termCode> "IDPO:00166" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1073956941> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/PropertyValue> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1073956941> <https://schema.org/name> "Term" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1073956941> <https://schema.org/value> <https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00167> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00167> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/DefinedTerm> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00167> <https://schema.org/inDefinedTermSet> <https://disprot.org/assets/data/IDPO_v0.2.owl> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00167> <https://schema.org/name> "chemical shift" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00167> <https://schema.org/termCode> "IDPO:00167" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/367565188> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/PropertyValue> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/367565188> <https://schema.org/name> "Term" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/367565188> <https://schema.org/value> <https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00168> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00168> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/DefinedTerm> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00168> <https://schema.org/inDefinedTermSet> <https://disprot.org/assets/data/IDPO_v0.2.owl> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00168> <https://schema.org/name> "relaxation" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00168> <https://schema.org/termCode> "IDPO:00168" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1109163979> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/PropertyValue> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1109163979> <https://schema.org/name> "Term" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1109163979> <https://schema.org/value> <https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00169> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00169> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/DefinedTerm> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00169> <https://schema.org/inDefinedTermSet> <https://disprot.org/assets/data/IDPO_v0.2.owl> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00169> <https://schema.org/name> "T2 relaxation" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00169> <https://schema.org/termCode> "IDPO:00169" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/639913980> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/PropertyValue> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/639913980> <https://schema.org/name> "Term" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/639913980> <https://schema.org/value> <https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00125> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00125> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/DefinedTerm> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00125> <https://schema.org/inDefinedTermSet> <https://disprot.org/assets/data/IDPO_v0.2.owl> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00125> <https://schema.org/name> "SAXS" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00125> <https://schema.org/termCode> "IDPO:00125" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/107821945> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/PropertyValue> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/107821945> <https://schema.org/name> "Term" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/107821945> <https://schema.org/value> <https://disprot.org/assets/data/IDPO_v0.2.owl:00186> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://disprot.org/assets/data/IDPO_v0.2.owl:00186> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/DefinedTerm> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://disprot.org/assets/data/IDPO_v0.2.owl:00186> <https://schema.org/inDefinedTermSet> <https://disprot.org/assets/data/IDPO_v0.2.owl> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://disprot.org/assets/data/IDPO_v0.2.owl:00186> <https://schema.org/name> "TraDES" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://disprot.org/assets/data/IDPO_v0.2.owl:00186> <https://schema.org/termCode> "IDPO:00186" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/2059079389> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/PropertyValue> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/2059079389> <https://schema.org/name> "Term" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/2059079389> <https://schema.org/value> <https://disprot.org/assets/data/IDPO_v0.2.owl:00192> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://disprot.org/assets/data/IDPO_v0.2.owl:00192> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/DefinedTerm> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://disprot.org/assets/data/IDPO_v0.2.owl:00192> <https://schema.org/inDefinedTermSet> <https://disprot.org/assets/data/IDPO_v0.2.owl> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://disprot.org/assets/data/IDPO_v0.2.owl:00192> <https://schema.org/name> "CNS" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://disprot.org/assets/data/IDPO_v0.2.owl:00192> <https://schema.org/termCode> "IDPO:00192" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1901071107> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/PropertyValue> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1901071107> <https://schema.org/name> "Term" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1901071107> <https://schema.org/value> <https://disprot.org/assets/data/IDPO_v0.2.owl:00208> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://disprot.org/assets/data/IDPO_v0.2.owl:00208> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/DefinedTerm> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://disprot.org/assets/data/IDPO_v0.2.owl:00208> <https://schema.org/inDefinedTermSet> <https://disprot.org/assets/data/IDPO_v0.2.owl> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://disprot.org/assets/data/IDPO_v0.2.owl:00208> <https://schema.org/name> "CRYSOL" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://disprot.org/assets/data/IDPO_v0.2.owl:00208> <https://schema.org/termCode> "IDPO:00208" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/274002240> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/PropertyValue> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/274002240> <https://schema.org/name> "Term" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/274002240> <https://schema.org/value> <https://disprot.org/assets/data/IDPO_v0.2.owl:00210> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://disprot.org/assets/data/IDPO_v0.2.owl:00210> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/DefinedTerm> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://disprot.org/assets/data/IDPO_v0.2.owl:00210> <https://schema.org/inDefinedTermSet> <https://disprot.org/assets/data/IDPO_v0.2.owl> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://disprot.org/assets/data/IDPO_v0.2.owl:00210> <https://schema.org/name> "ShiftX" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://disprot.org/assets/data/IDPO_v0.2.owl:00210> <https://schema.org/termCode> "IDPO:00210" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/502163975> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/PropertyValue> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/502163975> <https://schema.org/name> "Term" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/502163975> <https://schema.org/value> <https://disprot.org/assets/data/IDPO_v0.2.owl:00216> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://disprot.org/assets/data/IDPO_v0.2.owl:00216> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/DefinedTerm> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://disprot.org/assets/data/IDPO_v0.2.owl:00216> <https://schema.org/inDefinedTermSet> <https://disprot.org/assets/data/IDPO_v0.2.owl> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://disprot.org/assets/data/IDPO_v0.2.owl:00216> <https://schema.org/name> "ENSEMBLE" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://disprot.org/assets/data/IDPO_v0.2.owl:00216> <https://schema.org/termCode> "IDPO:00216" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1565361539> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/SequenceRange> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1565361539> <https://schema.org/rangeEnd> "744" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1565361539> <https://schema.org/rangeStart> "270" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://proteinensemble.org/PED00014#P52286_C_0> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/Protein> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://proteinensemble.org/PED00014#P52286_C_0> <http://purl.org/dc/terms/conformsTo> <https://bioschemas.org/profiles/Protein/0.11-RELEASE> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://proteinensemble.org/PED00014#P52286_C_0> <https://schema.org/hasBioPolymerSequence> "SNVVLVSGEGERFTVDKKIAERSLLLKNYLNDMHDSNLQNNSDSESDSDSETNHKSKDNNNGDDDDEDDDEIVMPVPNVRSSVLQKVIEWAEHHRDSNFPDEDDDDSRKSAPVDSWDREFLKVDQEMLYEIILAANYLNIKPLLDAGCKVVAEMIRGRSPEEIRRTFNIVNDFTPEEEAAIRR" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://proteinensemble.org/PED00014#P52286_C_0> <https://schema.org/hasSequenceAnnotation> <https://proteinensemble.org/PED00014#P52286_C_0_4_186> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://proteinensemble.org/PED00014#P52286_C_0> <https://schema.org/identifier> "https://identifiers.org/uniprot:P52286" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://proteinensemble.org/PED00014#P52286_C_0> <https://schema.org/sameAs> <http://purl.uniprot.org/uniprot/P52286> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://proteinensemble.org/PED00014#P52286_C_0_4_186> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/SequenceAnnotation> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://proteinensemble.org/PED00014#P52286_C_0_4_186> <https://schema.org/additionalProperty> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/400036188> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://proteinensemble.org/PED00014#P52286_C_0_4_186> <https://schema.org/additionalProperty> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1958752721> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://proteinensemble.org/PED00014#P52286_C_0_4_186> <https://schema.org/additionalProperty> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1896099201> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://proteinensemble.org/PED00014#P52286_C_0_4_186> <https://schema.org/additionalProperty> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1858414809> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://proteinensemble.org/PED00014#P52286_C_0_4_186> <https://schema.org/additionalProperty> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/569393342> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://proteinensemble.org/PED00014#P52286_C_0_4_186> <https://schema.org/additionalProperty> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/946591913> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://proteinensemble.org/PED00014#P52286_C_0_4_186> <https://schema.org/additionalProperty> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/892712429> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://proteinensemble.org/PED00014#P52286_C_0_4_186> <https://schema.org/additionalProperty> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/561273240> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://proteinensemble.org/PED00014#P52286_C_0_4_186> <https://schema.org/additionalProperty> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/649186691> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://proteinensemble.org/PED00014#P52286_C_0_4_186> <https://schema.org/additionalProperty> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1894898714> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://proteinensemble.org/PED00014#P52286_C_0_4_186> <https://schema.org/additionalProperty> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1015020144> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://proteinensemble.org/PED00014#P52286_C_0_4_186> <https://schema.org/sequenceLocation> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/240836288> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/400036188> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/PropertyValue> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/400036188> <https://schema.org/name> "Term" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/400036188> <https://schema.org/value> <https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00120> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1958752721> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/PropertyValue> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1958752721> <https://schema.org/name> "Term" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1958752721> <https://schema.org/value> <https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00166> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1896099201> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/PropertyValue> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1896099201> <https://schema.org/name> "Term" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1896099201> <https://schema.org/value> <https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00167> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1858414809> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/PropertyValue> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1858414809> <https://schema.org/name> "Term" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1858414809> <https://schema.org/value> <https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00168> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/569393342> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/PropertyValue> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/569393342> <https://schema.org/name> "Term" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/569393342> <https://schema.org/value> <https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00169> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/946591913> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/PropertyValue> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/946591913> <https://schema.org/name> "Term" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/946591913> <https://schema.org/value> <https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00125> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/892712429> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/PropertyValue> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/892712429> <https://schema.org/name> "Term" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/892712429> <https://schema.org/value> <https://disprot.org/assets/data/IDPO_v0.2.owl:00186> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/561273240> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/PropertyValue> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/561273240> <https://schema.org/name> "Term" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/561273240> <https://schema.org/value> <https://disprot.org/assets/data/IDPO_v0.2.owl:00192> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/649186691> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/PropertyValue> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/649186691> <https://schema.org/name> "Term" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/649186691> <https://schema.org/value> <https://disprot.org/assets/data/IDPO_v0.2.owl:00208> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1894898714> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/PropertyValue> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1894898714> <https://schema.org/name> "Term" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1894898714> <https://schema.org/value> <https://disprot.org/assets/data/IDPO_v0.2.owl:00210> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1015020144> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/PropertyValue> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1015020144> <https://schema.org/name> "Term" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1015020144> <https://schema.org/value> <https://disprot.org/assets/data/IDPO_v0.2.owl:00216> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/240836288> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/SequenceRange> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/240836288> <https://schema.org/rangeEnd> "186" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/240836288> <https://schema.org/rangeStart> "4" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://proteinensemble.org/PED00014#P38634_A_1> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/Protein> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://proteinensemble.org/PED00014#P38634_A_1> <http://purl.org/dc/terms/conformsTo> <https://bioschemas.org/profiles/Protein/0.11-RELEASE> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://proteinensemble.org/PED00014#P38634_A_1> <https://schema.org/hasBioPolymerSequence> "MTPSTPPRSRGTRYLAQPSGNTSSSALMQGQKTPQKPSQNLVPVTPSTTKSFKNAPLLAPPNSNMGMTSPFNGLTSPQRSPFPKSSVKRT" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://proteinensemble.org/PED00014#P38634_A_1> <https://schema.org/hasSequenceAnnotation> <https://proteinensemble.org/PED00014#P38634_A_1_1_90> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://proteinensemble.org/PED00014#P38634_A_1> <https://schema.org/identifier> "https://identifiers.org/uniprot:P38634" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://proteinensemble.org/PED00014#P38634_A_1> <https://schema.org/sameAs> <http://purl.uniprot.org/uniprot/P38634> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://proteinensemble.org/PED00014#P38634_A_1_1_90> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/SequenceAnnotation> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://proteinensemble.org/PED00014#P38634_A_1_1_90> <https://schema.org/additionalProperty> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/420904342> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://proteinensemble.org/PED00014#P38634_A_1_1_90> <https://schema.org/additionalProperty> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1005499560> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://proteinensemble.org/PED00014#P38634_A_1_1_90> <https://schema.org/additionalProperty> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/803096160> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://proteinensemble.org/PED00014#P38634_A_1_1_90> <https://schema.org/additionalProperty> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1785075011> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://proteinensemble.org/PED00014#P38634_A_1_1_90> <https://schema.org/additionalProperty> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/943606610> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://proteinensemble.org/PED00014#P38634_A_1_1_90> <https://schema.org/additionalProperty> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/696555349> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://proteinensemble.org/PED00014#P38634_A_1_1_90> <https://schema.org/additionalProperty> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1412437827> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://proteinensemble.org/PED00014#P38634_A_1_1_90> <https://schema.org/additionalProperty> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/837490728> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://proteinensemble.org/PED00014#P38634_A_1_1_90> <https://schema.org/additionalProperty> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1021447597> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://proteinensemble.org/PED00014#P38634_A_1_1_90> <https://schema.org/additionalProperty> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/725322807> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://proteinensemble.org/PED00014#P38634_A_1_1_90> <https://schema.org/additionalProperty> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/2067319117> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://proteinensemble.org/PED00014#P38634_A_1_1_90> <https://schema.org/sequenceLocation> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1503093711> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/420904342> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/PropertyValue> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/420904342> <https://schema.org/name> "Term" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/420904342> <https://schema.org/value> <https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00120> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1005499560> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/PropertyValue> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1005499560> <https://schema.org/name> "Term" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1005499560> <https://schema.org/value> <https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00166> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/803096160> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/PropertyValue> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/803096160> <https://schema.org/name> "Term" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/803096160> <https://schema.org/value> <https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00167> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1785075011> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/PropertyValue> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1785075011> <https://schema.org/name> "Term" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1785075011> <https://schema.org/value> <https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00168> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/943606610> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/PropertyValue> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/943606610> <https://schema.org/name> "Term" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/943606610> <https://schema.org/value> <https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00169> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/696555349> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/PropertyValue> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/696555349> <https://schema.org/name> "Term" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/696555349> <https://schema.org/value> <https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00125> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1412437827> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/PropertyValue> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1412437827> <https://schema.org/name> "Term" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1412437827> <https://schema.org/value> <https://disprot.org/assets/data/IDPO_v0.2.owl:00186> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/837490728> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/PropertyValue> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/837490728> <https://schema.org/name> "Term" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/837490728> <https://schema.org/value> <https://disprot.org/assets/data/IDPO_v0.2.owl:00192> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1021447597> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/PropertyValue> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1021447597> <https://schema.org/name> "Term" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1021447597> <https://schema.org/value> <https://disprot.org/assets/data/IDPO_v0.2.owl:00208> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/725322807> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/PropertyValue> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/725322807> <https://schema.org/name> "Term" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/725322807> <https://schema.org/value> <https://disprot.org/assets/data/IDPO_v0.2.owl:00210> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/2067319117> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/PropertyValue> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/2067319117> <https://schema.org/name> "Term" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/2067319117> <https://schema.org/value> <https://disprot.org/assets/data/IDPO_v0.2.owl:00216> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1503093711> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/SequenceRange> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1503093711> <https://schema.org/rangeEnd> "90" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1503093711> <https://schema.org/rangeStart> "1" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
<https://proteinensemble.org/PED00014> <http://purl.org/dc/terms/title> "PED" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .

View File

@ -0,0 +1,11 @@
# Set root logger level to INFO and its only appender to A1.
log4j.rootLogger=INFO, A1
# A1 is set to be a ConsoleAppender.
log4j.appender.A1=org.apache.log4j.ConsoleAppender
# Per-package logger levels, followed by the PatternLayout used by A1.
log4j.logger.org = ERROR
log4j.logger.eu.dnetlib = DEBUG
log4j.appender.A1.layout=org.apache.log4j.PatternLayout
log4j.appender.A1.layout.ConversionPattern=%-4r [%t] %-5p %c %x - %m%n

View File

@ -38,6 +38,7 @@
<module>dhp-usage-raw-data-update</module>
<module>dhp-broker-events</module>
<module>dhp-doiboost</module>
<module>dhp-rdfconverter</module>
</modules>
<pluginRepositories>

12
pom.xml
View File

@ -105,6 +105,18 @@
<enabled>false</enabled>
</snapshots>
</repository>
<repository>
<id>dnet-deps</id>
<name>D-Net Dependencies</name>
<url>https://maven.d4science.org/nexus/content/repositories/dnet-deps/</url>
<releases>
<enabled>true</enabled>
</releases>
<snapshots>
<enabled>false</enabled>
</snapshots>
<layout>default</layout>
</repository>
</repositories>
<dependencies>