Compare commits
36 Commits
main
...
beta_biosc
Author | SHA1 | Date |
---|---|---|
Enrico Ottonello | 64bc955444 | |
Enrico Ottonello | 18c9b95cb1 | |
Enrico Ottonello | 33dcf9964c | |
Enrico Ottonello | 792e78e848 | |
Enrico Ottonello | aef88f9e5c | |
Enrico Ottonello | f6c37656c9 | |
Enrico Ottonello | 41de8fb785 | |
Enrico Ottonello | 6d4235bd00 | |
Enrico Ottonello | baa312f256 | |
Enrico Ottonello | 6fa9624c29 | |
Enrico Ottonello | 0703e0c65f | |
Enrico Ottonello | 9a0ca0296a | |
Enrico Ottonello | d0df02062c | |
Enrico Ottonello | 7fc5b97871 | |
Enrico Ottonello | a203c33693 | |
Enrico Ottonello | afb46d71f7 | |
Enrico Ottonello | 98178b3165 | |
Enrico Ottonello | f11dfc51f7 | |
Enrico Ottonello | afe84c4244 | |
Enrico Ottonello | db831e6f43 | |
Enrico Ottonello | 861f2a3306 | |
Enrico Ottonello | f43bfdb594 | |
Enrico Ottonello | 3ef5eec3a6 | |
Enrico Ottonello | 41284ec2f9 | |
Enrico Ottonello | e53a606afc | |
Enrico Ottonello | bd37f14941 | |
Enrico Ottonello | 29ee1b9d82 | |
Enrico Ottonello | e57216a1fa | |
Enrico Ottonello | f28d7e3b9d | |
Enrico Ottonello | 8f281846a4 | |
Enrico Ottonello | f833de8a75 | |
Enrico Ottonello | 7f9636ef00 | |
Enrico Ottonello | 2f5caef77b | |
Enrico Ottonello | 4975278558 | |
Enrico Ottonello | 2bc79c50f8 | |
Enrico Ottonello | 446f81ee60 |
|
@ -0,0 +1,50 @@
|
||||||
|
[
|
||||||
|
{
|
||||||
|
"paramName": "s",
|
||||||
|
"paramLongName": "sourcePath",
|
||||||
|
"paramDescription": "the source mdstore path",
|
||||||
|
"paramRequired": false
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"paramName": "t",
|
||||||
|
"paramLongName": "targetPath",
|
||||||
|
"paramDescription": "the path where the final dataset is stored",
|
||||||
|
"paramRequired": false
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"paramName": "mo",
|
||||||
|
"paramLongName": "mdstoreOutputVersion",
|
||||||
|
"paramDescription": "the target mdstore path",
|
||||||
|
"paramRequired": false
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"paramName": "m",
|
||||||
|
"paramLongName": "master",
|
||||||
|
"paramDescription": "the master name",
|
||||||
|
"paramRequired": true
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"paramName": "i",
|
||||||
|
"paramLongName": "isLookupUrl",
|
||||||
|
"paramDescription": "the isLookup URL",
|
||||||
|
"paramRequired": false
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"paramName": "l",
|
||||||
|
"paramLongName": "exportLinks",
|
||||||
|
"paramDescription": "whether links should also be exported",
|
||||||
|
"paramRequired": false
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"paramName": "k",
|
||||||
|
"paramLongName": "datasourceKey",
|
||||||
|
"paramDescription": "the key that identifies the datasource",
|
||||||
|
"paramRequired": true
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"paramName": "p",
|
||||||
|
"paramLongName": "profile",
|
||||||
|
"paramDescription": "resource profile",
|
||||||
|
"paramRequired": true
|
||||||
|
}
|
||||||
|
]
|
|
@ -0,0 +1,84 @@
|
||||||
|
<configuration>
|
||||||
|
|
||||||
|
<!-- OCEAN -->
|
||||||
|
|
||||||
|
<!-- <property>-->
|
||||||
|
<!-- <name>jobTracker</name>-->
|
||||||
|
<!-- <value>yarnRM</value>-->
|
||||||
|
<!-- </property>-->
|
||||||
|
<!-- <property>-->
|
||||||
|
<!-- <name>nameNode</name>-->
|
||||||
|
<!-- <value>hdfs://nameservice1</value>-->
|
||||||
|
<!-- </property>-->
|
||||||
|
<!-- <property>-->
|
||||||
|
<!-- <name>oozie.use.system.libpath</name>-->
|
||||||
|
<!-- <value>true</value>-->
|
||||||
|
<!-- </property>-->
|
||||||
|
<!-- <property>-->
|
||||||
|
<!-- <name>oozie.action.sharelib.for.spark</name>-->
|
||||||
|
<!-- <value>spark2</value>-->
|
||||||
|
<!-- </property>-->
|
||||||
|
<!-- <property>-->
|
||||||
|
<!-- <name>oozie.launcher.mapreduce.user.classpath.first</name>-->
|
||||||
|
<!-- <value>true</value>-->
|
||||||
|
<!-- </property>-->
|
||||||
|
<!-- <property>-->
|
||||||
|
<!-- <name>spark2YarnHistoryServerAddress</name>-->
|
||||||
|
<!-- <value>http://hadoop-rm2.garr-pa1.d4science.org:19888</value>-->
|
||||||
|
<!-- </property>-->
|
||||||
|
<!-- <property>-->
|
||||||
|
<!-- <name>spark2EventLogDir</name>-->
|
||||||
|
<!-- <value>/user/spark/spark2ApplicationHistory</value>-->
|
||||||
|
<!-- </property>-->
|
||||||
|
<!-- <property>-->
|
||||||
|
<!-- <name>spark2ExtraListeners</name>-->
|
||||||
|
<!-- <value>"com.cloudera.spark.lineage.NavigatorAppListener"</value>-->
|
||||||
|
<!-- </property>-->
|
||||||
|
<!-- <property>-->
|
||||||
|
<!-- <name>spark2SqlQueryExecutionListeners</name>-->
|
||||||
|
<!-- <value>"com.cloudera.spark.lineage.NavigatorQueryListener"</value>-->
|
||||||
|
<!-- </property>-->
|
||||||
|
|
||||||
|
<!-- GARR -->
|
||||||
|
|
||||||
|
<property>
|
||||||
|
<name>jobTracker</name>
|
||||||
|
<value>hadoop-rm3.garr-pa1.d4science.org:8032</value>
|
||||||
|
</property>
|
||||||
|
<property>
|
||||||
|
<name>nameNode</name>
|
||||||
|
<value>hdfs://hadoop-rm1.garr-pa1.d4science.org:8020</value>
|
||||||
|
</property>
|
||||||
|
<property>
|
||||||
|
<name>hive_metastore_uris</name>
|
||||||
|
<value>thrift://hadoop-edge3.garr-pa1.d4science.org:9083</value>
|
||||||
|
</property>
|
||||||
|
<property>
|
||||||
|
<name>spark2YarnHistoryServerAddress</name>
|
||||||
|
<value>http://hadoop-rm2.garr-pa1.d4science.org:19888</value>
|
||||||
|
</property>
|
||||||
|
<property>
|
||||||
|
<name>oozie.launcher.mapreduce.user.classpath.first</name>
|
||||||
|
<value>true</value>
|
||||||
|
</property>
|
||||||
|
<property>
|
||||||
|
<name>oozie.use.system.libpath</name>
|
||||||
|
<value>true</value>
|
||||||
|
</property>
|
||||||
|
<property>
|
||||||
|
<name>oozie.action.sharelib.for.spark</name>
|
||||||
|
<value>spark2</value>
|
||||||
|
</property>
|
||||||
|
<property>
|
||||||
|
<name>spark2EventLogDir</name>
|
||||||
|
<value>/user/spark/spark2ApplicationHistory</value>
|
||||||
|
</property>
|
||||||
|
<property>
|
||||||
|
<name>spark2ExtraListeners</name>
|
||||||
|
<value>"com.cloudera.spark.lineage.NavigatorAppListener"</value>
|
||||||
|
</property>
|
||||||
|
<property>
|
||||||
|
<name>spark2SqlQueryExecutionListeners</name>
|
||||||
|
<value>"com.cloudera.spark.lineage.NavigatorQueryListener"</value>
|
||||||
|
</property>
|
||||||
|
</configuration>
|
|
@ -0,0 +1,134 @@
|
||||||
|
<workflow-app name="generate_bioschema" xmlns="uri:oozie:workflow:0.5">
|
||||||
|
<parameters>
|
||||||
|
<property>
|
||||||
|
<name>mainPath</name>
|
||||||
|
<value>/data/bioschema/mobidb</value>
|
||||||
|
<description>the working path of Bioschema stores</description>
|
||||||
|
</property>
|
||||||
|
<property>
|
||||||
|
<name>datasourceKey</name>
|
||||||
|
<value>mobidb</value>
|
||||||
|
<description>the key that identifies the datasource (eg ped, disprot, mobidb)</description>
|
||||||
|
</property>
|
||||||
|
<property>
|
||||||
|
<name>profile</name>
|
||||||
|
<value>protein</value>
|
||||||
|
<description>resource profile (eg protein, gene)</description>
|
||||||
|
</property>
|
||||||
|
</parameters>
|
||||||
|
|
||||||
|
<start to="ResetDataset"/>
|
||||||
|
|
||||||
|
<kill name="Kill">
|
||||||
|
<message>Action failed, error message[${wf:errorMessage(wf:lastErrorNode())}]</message>
|
||||||
|
</kill>
|
||||||
|
|
||||||
|
<action name="ResetDataset">
|
||||||
|
<fs>
|
||||||
|
<delete path='${mainPath}/dataset/*'/>
|
||||||
|
</fs>
|
||||||
|
<ok to="TransformJob"/>
|
||||||
|
<error to="Kill"/>
|
||||||
|
</action>
|
||||||
|
|
||||||
|
<action name="StartTransaction">
|
||||||
|
<java>
|
||||||
|
<configuration>
|
||||||
|
<property>
|
||||||
|
<name>oozie.launcher.mapreduce.user.classpath.first</name>
|
||||||
|
<value>true</value>
|
||||||
|
</property>
|
||||||
|
</configuration>
|
||||||
|
<main-class>eu.dnetlib.dhp.aggregation.mdstore.MDStoreActionNode</main-class>
|
||||||
|
<arg>--action</arg><arg>NEW_VERSION</arg>
|
||||||
|
<arg>--mdStoreID</arg><arg>${mdStoreOutputId}</arg>
|
||||||
|
<arg>--mdStoreManagerURI</arg><arg>${mdStoreManagerURI}</arg>
|
||||||
|
<capture-output/>
|
||||||
|
</java>
|
||||||
|
<ok to="TransformJob"/>
|
||||||
|
<error to="EndReadRollBack"/>
|
||||||
|
</action>
|
||||||
|
|
||||||
|
<action name="TransformJob">
|
||||||
|
<spark xmlns="uri:oozie:spark-action:0.2">
|
||||||
|
<master>yarn-cluster</master>
|
||||||
|
<mode>cluster</mode>
|
||||||
|
<name>TransformJob</name>
|
||||||
|
<class>eu.dnetlib.dhp.bioschema.GenerateBioschemaDatasetSpark</class>
|
||||||
|
<jar>dhp-aggregation-${projectVersion}.jar</jar>
|
||||||
|
<spark-opts>
|
||||||
|
--executor-memory=${sparkExecutorMemory}
|
||||||
|
--executor-cores=${sparkExecutorCores}
|
||||||
|
--driver-memory=${sparkDriverMemory}
|
||||||
|
--conf spark.sql.shuffle.partitions=3840
|
||||||
|
--conf spark.extraListeners=${spark2ExtraListeners}
|
||||||
|
--conf spark.sql.queryExecutionListeners=${spark2SqlQueryExecutionListeners}
|
||||||
|
--conf spark.yarn.historyServer.address=${spark2YarnHistoryServerAddress}
|
||||||
|
--conf spark.eventLog.dir=${nameNode}${spark2EventLogDir}
|
||||||
|
</spark-opts>
|
||||||
|
<arg>--sourcePath</arg><arg>${mainPath}/json-datacite</arg>
|
||||||
|
<arg>--targetPath</arg><arg>${mainPath}/dataset</arg>
|
||||||
|
<arg>--exportLinks</arg><arg>true</arg>
|
||||||
|
<arg>--datasourceKey</arg><arg>${datasourceKey}</arg>
|
||||||
|
<arg>--profile</arg><arg>${profile}</arg>
|
||||||
|
<arg>--master</arg><arg>yarn-cluster</arg>
|
||||||
|
</spark>
|
||||||
|
<ok to="End"/>
|
||||||
|
<error to="Kill"/>
|
||||||
|
</action>
|
||||||
|
|
||||||
|
<action name="CommitVersion">
|
||||||
|
<java>
|
||||||
|
<configuration>
|
||||||
|
<property>
|
||||||
|
<name>oozie.launcher.mapreduce.user.classpath.first</name>
|
||||||
|
<value>true</value>
|
||||||
|
</property>
|
||||||
|
</configuration>
|
||||||
|
<main-class>eu.dnetlib.dhp.aggregation.mdstore.MDStoreActionNode</main-class>
|
||||||
|
<arg>--action</arg><arg>COMMIT</arg>
|
||||||
|
<arg>--namenode</arg><arg>${nameNode}</arg>
|
||||||
|
<arg>--mdStoreVersion</arg><arg>${wf:actionData('StartTransaction')['mdStoreVersion']}</arg>
|
||||||
|
<arg>--mdStoreManagerURI</arg><arg>${mdStoreManagerURI}</arg>
|
||||||
|
</java>
|
||||||
|
<ok to="End"/>
|
||||||
|
<error to="Kill"/>
|
||||||
|
</action>
|
||||||
|
|
||||||
|
<action name="EndReadRollBack">
|
||||||
|
<java>
|
||||||
|
<configuration>
|
||||||
|
<property>
|
||||||
|
<name>oozie.launcher.mapreduce.user.classpath.first</name>
|
||||||
|
<value>true</value>
|
||||||
|
</property>
|
||||||
|
</configuration>
|
||||||
|
<main-class>eu.dnetlib.dhp.aggregation.mdstore.MDStoreActionNode</main-class>
|
||||||
|
<arg>--action</arg><arg>READ_UNLOCK</arg>
|
||||||
|
<arg>--mdStoreManagerURI</arg><arg>${mdStoreManagerURI}</arg>
|
||||||
|
<arg>--readMDStoreId</arg><arg>${wf:actionData('BeginRead')['mdStoreReadLockVersion']}</arg>
|
||||||
|
<capture-output/>
|
||||||
|
</java>
|
||||||
|
<ok to="RollBack"/>
|
||||||
|
<error to="Kill"/>
|
||||||
|
</action>
|
||||||
|
|
||||||
|
<action name="RollBack">
|
||||||
|
<java>
|
||||||
|
<configuration>
|
||||||
|
<property>
|
||||||
|
<name>oozie.launcher.mapreduce.user.classpath.first</name>
|
||||||
|
<value>true</value>
|
||||||
|
</property>
|
||||||
|
</configuration>
|
||||||
|
<main-class>eu.dnetlib.dhp.aggregation.mdstore.MDStoreActionNode</main-class>
|
||||||
|
<arg>--action</arg><arg>ROLLBACK</arg>
|
||||||
|
<arg>--mdStoreVersion</arg><arg>${wf:actionData('StartTransaction')['mdStoreVersion']}</arg>
|
||||||
|
<arg>--mdStoreManagerURI</arg><arg>${mdStoreManagerURI}</arg>
|
||||||
|
</java>
|
||||||
|
<ok to="Kill"/>
|
||||||
|
<error to="Kill"/>
|
||||||
|
</action>
|
||||||
|
|
||||||
|
<end name="End"/>
|
||||||
|
</workflow-app>
|
|
@ -0,0 +1,308 @@
|
||||||
|
package eu.dnetlib.dhp.bioschema
|
||||||
|
|
||||||
|
import eu.dnetlib.dhp.schema.common.ModelConstants
|
||||||
|
import eu.dnetlib.dhp.schema.oaf.{DataInfo, KeyValue, Qualifier}
|
||||||
|
import eu.dnetlib.dhp.schema.oaf.utils.OafMapperUtils
|
||||||
|
|
||||||
|
import java.time.format.DateTimeFormatter
|
||||||
|
import java.util.Locale
|
||||||
|
import java.util.regex.Pattern
|
||||||
|
|
||||||
|
/*
|
||||||
|
The following classes are utility classes used for the mapping from
|
||||||
|
bioschema json datacite to OAF Schema
|
||||||
|
*/
|
||||||
|
|
||||||
|
case class RelatedIdentifierType(
|
||||||
|
relationType: String,
|
||||||
|
relatedIdentifier: String,
|
||||||
|
relatedIdentifierType: String
|
||||||
|
) {}
|
||||||
|
|
||||||
|
case class AlternateIdentifierType(
|
||||||
|
alternateIdentifier: String
|
||||||
|
) {}
|
||||||
|
|
||||||
|
case class IdentifierType(
|
||||||
|
identifier: String,
|
||||||
|
identifierType: String
|
||||||
|
) {}
|
||||||
|
|
||||||
|
case class NameIdentifiersType(
|
||||||
|
nameIdentifierScheme: Option[String],
|
||||||
|
schemeUri: Option[String],
|
||||||
|
nameIdentifier: Option[String]
|
||||||
|
) {}
|
||||||
|
|
||||||
|
case class CreatorType(
|
||||||
|
nameType: Option[String],
|
||||||
|
nameIdentifiers: Option[List[NameIdentifiersType]],
|
||||||
|
name: Option[String],
|
||||||
|
familyName: Option[String],
|
||||||
|
givenName: Option[String],
|
||||||
|
affiliation: Option[List[String]]
|
||||||
|
) {}
|
||||||
|
|
||||||
|
case class TitleType(title: Option[String], titleType: Option[String], lang: Option[String]) {}
|
||||||
|
|
||||||
|
case class SubjectType(
|
||||||
|
schemeURI: Option[String],
|
||||||
|
value: Option[String],
|
||||||
|
subjectScheme: Option[String]
|
||||||
|
) {}
|
||||||
|
|
||||||
|
case class DescriptionType(descriptionType: Option[String], description: Option[String]) {}
|
||||||
|
|
||||||
|
case class DateType(date: Option[String], dateType: Option[String]) {}
|
||||||
|
|
||||||
|
case class OAFRelations(relation: String, inverse: String, relType: String)
|
||||||
|
|
||||||
|
class BioschemaModelConstants extends Serializable {}
|
||||||
|
|
||||||
|
object BioschemaModelConstants {
|
||||||
|
|
||||||
|
val PROTEIN_RESOURCETYPE: Qualifier =
|
||||||
|
qualifier("0046", "Bioentity", ModelConstants.DNET_PUBLICATION_RESOURCE, ModelConstants.DNET_PUBLICATION_RESOURCE)
|
||||||
|
|
||||||
|
val DATA_INFO: DataInfo = OafMapperUtils.dataInfo(
|
||||||
|
false,
|
||||||
|
null,
|
||||||
|
false,
|
||||||
|
false,
|
||||||
|
ModelConstants.PROVENANCE_ACTION_SET_QUALIFIER,
|
||||||
|
"0.9"
|
||||||
|
)
|
||||||
|
|
||||||
|
val PED_PREFIX: String = "fsh_____3595"
|
||||||
|
val DISPROT_PREFIX: String = "fsh_____1904"
|
||||||
|
val MOBIDB_PREFIX: String = "fsh_____2176"
|
||||||
|
|
||||||
|
val resolvedURLPattern: Map[String, String] = Map(
|
||||||
|
"https://identifiers.org/pubmed:" -> "pmid",
|
||||||
|
"http://purl.uniprot.org/uniprot/" -> "uniprot",
|
||||||
|
"https://identifiers.org/uniprot:" -> "uniprot",
|
||||||
|
"https://identifiers.org/disprot:" -> "disprot",
|
||||||
|
"https://identifiers.org/mobidb:" -> "mobidb",
|
||||||
|
"https://doi.org/" -> "doi"
|
||||||
|
)
|
||||||
|
|
||||||
|
val collectedFromMap: Map[String, KeyValue] = {
|
||||||
|
val PEDCollectedFrom: KeyValue = OafMapperUtils.keyValue(
|
||||||
|
"10|fairsharing_::c0e8517b1fe0b5270f3f41d4b56d6118",
|
||||||
|
"Protein Ensemble Database"
|
||||||
|
)
|
||||||
|
PEDCollectedFrom.setDataInfo(DATA_INFO)
|
||||||
|
|
||||||
|
val DISPROTCollectedFrom: KeyValue = OafMapperUtils.keyValue(
|
||||||
|
"10|fairsharing_::c91591a8d461c2869b9f535ded3e213e",
|
||||||
|
"Database of Protein Disorder"
|
||||||
|
)
|
||||||
|
DISPROTCollectedFrom.setDataInfo(DATA_INFO)
|
||||||
|
|
||||||
|
val MOBIDBCollectedFrom: KeyValue = OafMapperUtils.keyValue(
|
||||||
|
"10|fairsharing_::0234c510bc6d908b28c70ff313743079",
|
||||||
|
"MobiDB"
|
||||||
|
)
|
||||||
|
MOBIDBCollectedFrom.setDataInfo(DATA_INFO)
|
||||||
|
|
||||||
|
Map(
|
||||||
|
"ped" -> PEDCollectedFrom,
|
||||||
|
"disprot" -> DISPROTCollectedFrom,
|
||||||
|
"mobidb" -> MOBIDBCollectedFrom
|
||||||
|
)
|
||||||
|
}
|
||||||
|
|
||||||
|
val datasourceKeyPrefix: Map[String, String] = Map(
|
||||||
|
"ped" -> PED_PREFIX,
|
||||||
|
"disprot" -> DISPROT_PREFIX,
|
||||||
|
"mobidb" -> MOBIDB_PREFIX
|
||||||
|
)
|
||||||
|
|
||||||
|
val REL_TYPE_VALUE: String = "resultResult"
|
||||||
|
val DATE_RELATION_KEY = "RelationDate"
|
||||||
|
val dataInfo: DataInfo = bioschemaDataInfo("0.9")
|
||||||
|
|
||||||
|
/** Lookup table from a relation name to its descriptor.
  *
  * Each value carries the relation name itself, the name of its inverse and the
  * sub-relation type. Every key is declared exactly once: the previous version listed
  * DOCUMENTS and IS_DOCUMENTED_BY twice (with identical values), so the later entries
  * silently replaced the earlier ones.
  */
val subRelTypeMapping: Map[String, OAFRelations] = Map(
  ModelConstants.REFERENCES ->
    OAFRelations(ModelConstants.REFERENCES, ModelConstants.IS_REFERENCED_BY, ModelConstants.RELATIONSHIP),
  ModelConstants.IS_REFERENCED_BY ->
    OAFRelations(ModelConstants.IS_REFERENCED_BY, ModelConstants.REFERENCES, ModelConstants.RELATIONSHIP),
  ModelConstants.IS_SUPPLEMENTED_BY ->
    OAFRelations(ModelConstants.IS_SUPPLEMENTED_BY, ModelConstants.IS_SUPPLEMENT_TO, ModelConstants.SUPPLEMENT),
  ModelConstants.IS_SUPPLEMENT_TO ->
    OAFRelations(ModelConstants.IS_SUPPLEMENT_TO, ModelConstants.IS_SUPPLEMENTED_BY, ModelConstants.SUPPLEMENT),
  ModelConstants.HAS_PART ->
    OAFRelations(ModelConstants.HAS_PART, ModelConstants.IS_PART_OF, ModelConstants.PART),
  ModelConstants.IS_PART_OF ->
    OAFRelations(ModelConstants.IS_PART_OF, ModelConstants.HAS_PART, ModelConstants.PART),
  ModelConstants.IS_VERSION_OF ->
    OAFRelations(ModelConstants.IS_VERSION_OF, ModelConstants.HAS_VERSION, ModelConstants.VERSION),
  ModelConstants.HAS_VERSION ->
    OAFRelations(ModelConstants.HAS_VERSION, ModelConstants.IS_VERSION_OF, ModelConstants.VERSION),
  ModelConstants.IS_IDENTICAL_TO ->
    OAFRelations(ModelConstants.IS_IDENTICAL_TO, ModelConstants.IS_IDENTICAL_TO, ModelConstants.RELATIONSHIP),
  ModelConstants.IS_CONTINUED_BY ->
    OAFRelations(ModelConstants.IS_CONTINUED_BY, ModelConstants.CONTINUES, ModelConstants.RELATIONSHIP),
  ModelConstants.CONTINUES ->
    OAFRelations(ModelConstants.CONTINUES, ModelConstants.IS_CONTINUED_BY, ModelConstants.RELATIONSHIP),
  ModelConstants.IS_NEW_VERSION_OF ->
    OAFRelations(ModelConstants.IS_NEW_VERSION_OF, ModelConstants.IS_PREVIOUS_VERSION_OF, ModelConstants.VERSION),
  ModelConstants.IS_PREVIOUS_VERSION_OF ->
    OAFRelations(ModelConstants.IS_PREVIOUS_VERSION_OF, ModelConstants.IS_NEW_VERSION_OF, ModelConstants.VERSION),
  ModelConstants.IS_DOCUMENTED_BY ->
    OAFRelations(ModelConstants.IS_DOCUMENTED_BY, ModelConstants.DOCUMENTS, ModelConstants.RELATIONSHIP),
  ModelConstants.DOCUMENTS ->
    OAFRelations(ModelConstants.DOCUMENTS, ModelConstants.IS_DOCUMENTED_BY, ModelConstants.RELATIONSHIP),
  ModelConstants.IS_SOURCE_OF ->
    OAFRelations(ModelConstants.IS_SOURCE_OF, ModelConstants.IS_DERIVED_FROM, ModelConstants.VERSION),
  ModelConstants.IS_DERIVED_FROM ->
    OAFRelations(ModelConstants.IS_DERIVED_FROM, ModelConstants.IS_SOURCE_OF, ModelConstants.VERSION),
  ModelConstants.CITES ->
    OAFRelations(ModelConstants.CITES, ModelConstants.IS_CITED_BY, ModelConstants.CITATION),
  ModelConstants.IS_CITED_BY ->
    OAFRelations(ModelConstants.IS_CITED_BY, ModelConstants.CITES, ModelConstants.CITATION),
  ModelConstants.IS_VARIANT_FORM_OF ->
    OAFRelations(ModelConstants.IS_VARIANT_FORM_OF, ModelConstants.IS_DERIVED_FROM, ModelConstants.VERSION),
  ModelConstants.IS_OBSOLETED_BY ->
    OAFRelations(ModelConstants.IS_OBSOLETED_BY, ModelConstants.IS_NEW_VERSION_OF, ModelConstants.VERSION),
  ModelConstants.REVIEWS ->
    OAFRelations(ModelConstants.REVIEWS, ModelConstants.IS_REVIEWED_BY, ModelConstants.REVIEW),
  ModelConstants.IS_REVIEWED_BY ->
    OAFRelations(ModelConstants.IS_REVIEWED_BY, ModelConstants.REVIEWS, ModelConstants.REVIEW),
  ModelConstants.COMPILES ->
    OAFRelations(ModelConstants.COMPILES, ModelConstants.IS_COMPILED_BY, ModelConstants.RELATIONSHIP),
  ModelConstants.IS_COMPILED_BY ->
    OAFRelations(ModelConstants.IS_COMPILED_BY, ModelConstants.COMPILES, ModelConstants.RELATIONSHIP)
)
|
||||||
|
|
||||||
|
def bioschemaDataInfo(trust: String): DataInfo = OafMapperUtils.dataInfo(
|
||||||
|
false,
|
||||||
|
null,
|
||||||
|
false,
|
||||||
|
false,
|
||||||
|
ModelConstants.PROVENANCE_ACTION_SET_QUALIFIER,
|
||||||
|
trust
|
||||||
|
)
|
||||||
|
|
||||||
|
val df_en: DateTimeFormatter = DateTimeFormatter.ofPattern(
|
||||||
|
"[MM-dd-yyyy][MM/dd/yyyy][dd-MM-yy][dd-MMM-yyyy][dd/MMM/yyyy][dd-MMM-yy][dd/MMM/yy][dd-MM-yy][dd/MM/yy][dd-MM-yyyy][dd/MM/yyyy][yyyy-MM-dd][yyyy/MM/dd]",
|
||||||
|
Locale.ENGLISH
|
||||||
|
)
|
||||||
|
|
||||||
|
val df_it: DateTimeFormatter =
|
||||||
|
DateTimeFormatter.ofPattern("[dd-MM-yyyy][dd/MM/yyyy]", Locale.ITALIAN)
|
||||||
|
|
||||||
|
val Date_regex: List[Pattern] = List(
|
||||||
|
//Y-M-D
|
||||||
|
Pattern.compile(
|
||||||
|
"(18|19|20)\\d\\d([- /.])(0[1-9]|1[012])\\2(0[1-9]|[12][0-9]|3[01])",
|
||||||
|
Pattern.MULTILINE
|
||||||
|
),
|
||||||
|
//M-D-Y
|
||||||
|
Pattern.compile(
|
||||||
|
"((0[1-9]|1[012])|([1-9]))([- /.])(0[1-9]|[12][0-9]|3[01])([- /.])(18|19|20)?\\d\\d",
|
||||||
|
Pattern.MULTILINE
|
||||||
|
),
|
||||||
|
//D-M-Y
|
||||||
|
Pattern.compile(
|
||||||
|
"(?:(?:31(/|-|\\.)(?:0?[13578]|1[02]|(?:Jan|Mar|May|Jul|Aug|Oct|Dec)))\\1|(?:(?:29|30)(/|-|\\.)(?:0?[1,3-9]|1[0-2]|(?:Jan|Mar|Apr|May|Jun|Jul|Aug|Sep|Oct|Nov|Dec))\\2))(?:(?:1[6-9]|[2-9]\\d)?\\d{2})|(?:29(/|-|\\.)(?:0?2|(?:Feb))\\3(?:(?:(?:1[6-9]|[2-9]\\d)?(?:0[48]|[2468][048]|[13579][26])|(?:(?:16|[2468][048]|[3579][26])00))))|(?:0?[1-9]|1\\d|2[0-8])(/|-|\\.)(?:(?:0?[1-9]|(?:Jan|Feb|Mar|Apr|May|Jun|Jul|Aug|Sep))|(?:1[0-2]|(?:Oct|Nov|Dec)))\\4(?:(?:1[6-9]|[2-9]\\d)?\\d{2})",
|
||||||
|
Pattern.MULTILINE
|
||||||
|
),
|
||||||
|
//Y
|
||||||
|
Pattern.compile("(19|20)\\d\\d", Pattern.MULTILINE)
|
||||||
|
)
|
||||||
|
|
||||||
|
private def qualifier(classid: String, classname: String, schemeid: String, schemename: String) = {
|
||||||
|
val q = new Qualifier
|
||||||
|
q.setClassid(classid)
|
||||||
|
q.setClassname(classname)
|
||||||
|
q.setSchemeid(schemeid)
|
||||||
|
q.setSchemename(schemename)
|
||||||
|
q
|
||||||
|
}
|
||||||
|
}
|
|
@ -0,0 +1,308 @@
|
||||||
|
package eu.dnetlib.dhp.bioschema
|
||||||
|
|
||||||
|
import com.fasterxml.jackson.databind.ObjectMapper
|
||||||
|
import eu.dnetlib.dhp.bioschema.BioschemaModelConstants._
|
||||||
|
import eu.dnetlib.dhp.schema.common.ModelConstants
|
||||||
|
import eu.dnetlib.dhp.schema.oaf.utils.{IdentifierFactory, OafMapperUtils}
|
||||||
|
import eu.dnetlib.dhp.schema.oaf.{Dataset => OafDataset, _}
|
||||||
|
import eu.dnetlib.dhp.utils.DHPUtils
|
||||||
|
import org.apache.commons.lang3.StringUtils
|
||||||
|
import org.json4s.DefaultFormats
|
||||||
|
import org.json4s.JsonAST.{JField, JObject, JString}
|
||||||
|
import org.json4s.jackson.JsonMethods.parse
|
||||||
|
|
||||||
|
import java.time.LocalDate
|
||||||
|
import scala.collection.JavaConverters._
|
||||||
|
|
||||||
|
object BioschemaToOAFTransformation {
|
||||||
|
|
||||||
|
val mapper = new ObjectMapper()
|
||||||
|
|
||||||
|
/** Extracts the first date-like token from a free-text value and renders it as an ISO local date.
  *
  * The patterns in `Date_regex` are tried in their declared order and the first one that
  * finds a match supplies the token. A four-character token (a bare year) is expanded to
  * `01-01-<year>` before parsing. The token is parsed with `df_en` first and `df_it` second.
  *
  * @param input the raw date text; `null` yields `None`
  * @return `Some` with the `LocalDate.toString` form of the parsed date, or `None` when no
  *         pattern matches or neither formatter can parse the matched token
  */
def extract_date(input: String): Option[String] = {
  if (input == null)
    return None

  // Iterate lazily so that patterns after the first hit are never evaluated.
  val matchedToken: Option[String] = Date_regex.iterator
    .map(pattern => pattern.matcher(input))
    .find(matcher => matcher.find())
    .map(matcher => matcher.group(0))

  matchedToken.flatMap { token =>
    val candidate = if (token.length == 4) s"01-01-$token" else token
    // Try only captures non-fatal failures; the previous `case _: Throwable` also
    // swallowed fatal JVM errors.
    scala.util
      .Try(LocalDate.parse(candidate, df_en))
      .orElse(scala.util.Try(LocalDate.parse(candidate, df_it)))
      .toOption
      .map(parsed => parsed.toString)
  }
}
|
||||||
|
|
||||||
|
/** Creates the empty OAF result skeleton for a resource profile.
  *
  * Only the "protein" profile (compared case-insensitively) is handled: it produces an
  * `OafDataset` holding a single `Instance`, both typed with `PROTEIN_RESOURCETYPE`.
  *
  * @param resourceClassName the resource profile name
  * @return the prepared dataset, or `null` when the profile is `null` or not supported
  *         (`generateOAF` checks for `null` and emits nothing in that case)
  */
def getResult(resourceClassName: String): Result = {
  if (resourceClassName == null)
    return null

  // Locale.ROOT keeps the comparison stable under locales with special casing rules
  // (e.g. Turkish, where "protein".toUpperCase() is not "PROTEIN").
  resourceClassName.toUpperCase(java.util.Locale.ROOT) match {
    case "PROTEIN" =>
      val instance = new Instance
      instance.setInstancetype(PROTEIN_RESOURCETYPE)

      val dataset = new OafDataset
      dataset.setInstance(List(instance).asJava)
      dataset.setResourcetype(PROTEIN_RESOURCETYPE)
      dataset
    // Without a default case every other profile raised scala.MatchError, so the
    // intended `null` result was never returned.
    case _ =>
      null
  }
}
|
||||||
|
|
||||||
|
/** Wraps a date value and its qualifier into a `StructuredProperty`.
  *
  * @param dt the date value
  * @param q  the qualifier describing the kind of date
  * @return the structured property built by `OafMapperUtils.structuredProperty`, with `null`
  *         passed as its third argument
  */
def generateOAFDate(dt: String, q: Qualifier): StructuredProperty =
  OafMapperUtils.structuredProperty(dt, q, null)
|
||||||
|
|
||||||
|
/** Maps one Bioschema record, serialised as Datacite-like JSON, onto OAF objects.
  *
  * @param input             the JSON record
  * @param exportLinks       when true, the `relatedIdentifiers` of the record are also turned
  *                          into relations
  * @param datasourceKey     key of the originating datasource; it is looked up in
  *                          `datasourceKeyPrefix` and `collectedFromMap`, so an unknown key
  *                          raises `NoSuchElementException`
  * @param resourceClassName resource profile, forwarded to `getResult`
  * @return the result followed by its relations (if any); an empty list when `getResult`
  *         returns `null` or when no identifier can be created for the result
  * @throws RuntimeException when the record has no `titles` or no `identifiers` entry
  */
def generateOAF(
  input: String,
  exportLinks: Boolean,
  datasourceKey: String,
  resourceClassName: String
): List[Oaf] = {

  implicit lazy val formats: DefaultFormats.type = org.json4s.DefaultFormats
  lazy val json = parse(input)

  val result = getResult(resourceClassName)
  if (result == null)
    return List()

  val pid = (json \ "id").extract[String]

  result.setPid(
    List(
      OafMapperUtils.structuredProperty(
        pid,
        datasourceKey,
        datasourceKey,
        ModelConstants.DNET_PID_TYPES,
        ModelConstants.DNET_PID_TYPES,
        DATA_INFO
      )
    ).asJava
  )
  // Provisional id; it is replaced further down by IdentifierFactory.createIdentifier.
  result.setId(OafMapperUtils.createOpenaireId(50, s"${datasourceKeyPrefix(datasourceKey)}::$pid", true))
  result.setOriginalId(List(pid).asJava)
  result.setDataInfo(dataInfo)

  // ---- titles -------------------------------------------------------------
  val titles: List[TitleType] = (json \\ "titles").extractOrElse[List[TitleType]](List())
  if (titles.isEmpty) {
    throw new RuntimeException("Title not found")
  }
  result.setTitle(
    titles
      .filter(t => t.title.nonEmpty)
      .map(t => OafMapperUtils.structuredProperty(t.title.get, ModelConstants.MAIN_TITLE_QUALIFIER, dataInfo))
      .asJava
  )

  // ---- dates --------------------------------------------------------------
  val dates = (json \\ "dates").extract[List[DateType]]
  val typedDates = dates.filter(d => d.date.isDefined && d.dateType.isDefined)

  // The first date typed "collected" (any case) becomes the date of collection,
  // provided it can be parsed.
  typedDates
    .find(d => d.dateType.get.equalsIgnoreCase("collected"))
    .flatMap(d => extract_date(d.date.get))
    .foreach(collected => result.setDateofcollection(collected))

  result.setRelevantdate(
    typedDates
      .map(d => (extract_date(d.date.get), d.dateType.get))
      .filter(d => d._1.isDefined)
      .map(d =>
        (
          d._1.get,
          OafMapperUtils.qualifier(
            d._2.toLowerCase(),
            d._2.toLowerCase(),
            ModelConstants.DNET_DATACITE_DATE,
            ModelConstants.DNET_DATACITE_DATE
          )
        )
      )
      .filter(d => d._2 != null)
      .map(d => generateOAFDate(d._1, d._2))
      .asJava
  )

  result.setCollectedfrom(List(collectedFromMap(datasourceKey)).asJava)

  // ---- descriptions and subjects -----------------------------------------
  val descriptions = (json \\ "descriptions").extract[List[DescriptionType]]
  result.setDescription(
    descriptions
      .filter(d => d.description.isDefined)
      .map(d => OafMapperUtils.field(d.description.get, null))
      .filter(s => s != null)
      .asJava
  )

  val subjects = (json \\ "subjects").extract[List[SubjectType]]
  result.setSubject(
    subjects
      .filter(s => s.value.nonEmpty && s.subjectScheme.nonEmpty && s.schemeURI.nonEmpty)
      .map(s =>
        OafMapperUtils.structuredProperty(
          s.value.get,
          s.subjectScheme.get,
          s.schemeURI.get,
          ModelConstants.DNET_SUBJECT_TYPOLOGIES,
          ModelConstants.DNET_SUBJECT_TYPOLOGIES,
          null
        )
      )
      .asJava
  )

  // ---- instance -----------------------------------------------------------
  val instance = result.getInstance().get(0)

  val ids: List[IdentifierType] = for {
    JObject(identifiers)                              <- json \\ "identifiers"
    JField("identifier", JString(identifier))         <- identifiers
    JField("identifierType", JString(identifierType)) <- identifiers
  } yield IdentifierType(identifier, identifierType)

  instance.setUrl(ids.map(id => id.identifier).asJava)
  if (instance.getUrl.isEmpty) {
    throw new RuntimeException("Url not found")
  }
  instance.setCollectedfrom(collectedFromMap(datasourceKey))
  instance.setHostedby(collectedFromMap(datasourceKey))
  instance.setPid(result.getPid)

  result.setId(IdentifierFactory.createIdentifier(result))
  if (result.getId == null)
    return List()

  // ---- alternate identifier ----------------------------------------------
  val alternativeIdentifierUrls: List[AlternateIdentifierType] = for {
    JObject(alternateIdentifiers)                               <- json \\ "alternateIdentifiers"
    JField("alternateIdentifier", JString(alternateIdentifier)) <- alternateIdentifiers
  } yield AlternateIdentifierType(alternateIdentifier)

  // Only the first alternate identifier is considered. headOption makes a record without
  // any alternate identifier valid; the former `.asJava.get(0)` raised
  // IndexOutOfBoundsException on the empty list.
  val alternativeIdentifier: Option[StructuredProperty] =
    alternativeIdentifierUrls.headOption.flatMap { alt =>
      resolvedURLPattern
        // URL prefixes that mention the datasource's own key are not treated as alternates.
        .filter(pattern => !pattern._1.contains(datasourceKey))
        .collectFirst {
          case (urlPrefix, pidType) if alt.alternateIdentifier.startsWith(urlPrefix) =>
            OafMapperUtils.structuredProperty(
              StringUtils.substringAfter(alt.alternateIdentifier, urlPrefix),
              pidType,
              pidType,
              ModelConstants.DNET_PID_TYPES,
              ModelConstants.DNET_PID_TYPES,
              dataInfo
            )
        }
    }
  alternativeIdentifier.foreach(altId => instance.setAlternateIdentifier(List(altId).asJava))

  // ---- access rights ------------------------------------------------------
  val access_rights_qualifier =
    OafMapperUtils.accessRight(
      ModelConstants.UNKNOWN,
      ModelConstants.NOT_AVAILABLE,
      ModelConstants.DNET_ACCESS_MODES,
      ModelConstants.DNET_ACCESS_MODES
    )
  instance.setAccessright(access_rights_qualifier)

  // ---- relations ----------------------------------------------------------
  val relations: List[Relation] =
    if (exportLinks) {
      val rels: List[RelatedIdentifierType] = for {
        JObject(relIdentifier)                                          <- json \\ "relatedIdentifiers"
        JField("relationType", JString(relationType))                   <- relIdentifier
        JField("relatedIdentifierType", JString(relatedIdentifierType)) <- relIdentifier
        JField("relatedIdentifier", JString(relatedIdentifier))         <- relIdentifier
      } yield RelatedIdentifierType(relationType, relatedIdentifier, relatedIdentifierType)

      generateRelations(rels, result.getId, null, pid, datasourceKey)
    } else
      List()

  List[Oaf](result) ::: relations
}
|
||||||
|
|
||||||
|
/** Builds one [[Relation]] for every related identifier of a record.
  *
  * Each relation gets the record `id` as source, the relation type found in
  * the input as relClass, and the sub-relation type looked up through
  * `subRelTypeMapping`. The target is derived from the related identifier
  * URL: when the URL starts with one of the prefixes in `resolvedURLPattern`,
  * the prefix is stripped and the remainder is turned into an unresolved
  * identifier of the pid type associated with that prefix.
  *
  * NOTE(review): when no prefix matches, the relation is still returned but
  * its target is never set — confirm that downstream steps tolerate this.
  *
  * @param rels          related identifiers extracted from the record
  * @param id            identifier of the record, used as relation source
  * @param date          value stored under `DATE_RELATION_KEY` in the relation properties
  * @param pid           not used by this method; kept for interface compatibility
  * @param datasourceKey key used to look up the collectedFrom value in `collectedFromMap`
  * @return one relation per element of `rels`, in the same order
  */
private def generateRelations(
  rels: List[RelatedIdentifierType],
  id: String,
  date: String,
  pid: String,
  datasourceKey: String
): List[Relation] = {
  rels.map { r =>
    val rel = new Relation
    rel.setCollectedfrom(List(collectedFromMap(datasourceKey)).asJava)
    rel.setDataInfo(dataInfo)

    val subRelType = subRelTypeMapping(r.relationType).relType
    rel.setRelType(REL_TYPE_VALUE)
    rel.setSubRelType(subRelType)
    rel.setRelClass(r.relationType)

    val dateProps: KeyValue = OafMapperUtils.keyValue(DATE_RELATION_KEY, date)
    rel.setProperties(List(dateProps).asJava)

    // Every known URL prefix is checked; if more than one matches, the last
    // one visited determines the target (same outcome as the previous
    // map-based traversal, without building a throw-away collection).
    resolvedURLPattern.foreach { case (urlPrefix, pidType) =>
      if (r.relatedIdentifier.startsWith(urlPrefix)) {
        val relatedId = StringUtils.substringAfter(r.relatedIdentifier, urlPrefix)
        rel.setTarget(DHPUtils.generateUnresolvedIdentifier(relatedId, pidType))
      }
    }

    rel.setSource(id)
    rel
  }
}
|
||||||
|
}
|
|
@ -0,0 +1,99 @@
|
||||||
|
package eu.dnetlib.dhp.bioschema
|
||||||
|
|
||||||
|
import com.fasterxml.jackson.databind.ObjectMapper
|
||||||
|
import eu.dnetlib.dhp.application.AbstractScalaApplication
|
||||||
|
import eu.dnetlib.dhp.collection.CollectionUtils
|
||||||
|
import eu.dnetlib.dhp.common.Constants.{MDSTORE_DATA_PATH, MDSTORE_SIZE_PATH}
|
||||||
|
import eu.dnetlib.dhp.schema.mdstore.MDStoreVersion
|
||||||
|
import eu.dnetlib.dhp.schema.oaf.Oaf
|
||||||
|
import eu.dnetlib.dhp.utils.DHPUtils.writeHdfsFile
|
||||||
|
import org.apache.spark.sql.{Encoder, Encoders, SparkSession}
|
||||||
|
import org.slf4j.{Logger, LoggerFactory}
|
||||||
|
|
||||||
|
class GenerateBioschemaDatasetSpark(propertyPath: String, args: Array[String], log: Logger)
    extends AbstractScalaApplication(propertyPath, args, log: Logger) {

  /** Entry point of the Spark node: reads the job parameters, logs them and
    * triggers the generation of the OAF dataset.
    */
  override def run(): Unit = {

    val sourcePath = parser.get("sourcePath")
    log.info(s"SourcePath is '$sourcePath'")

    val exportLinks = "true".equalsIgnoreCase(parser.get("exportLinks"))
    log.info(s"exportLinks is '$exportLinks'")

    val datasourceKey = parser.get("datasourceKey").toLowerCase
    log.info(s"datasourceKey is '$datasourceKey'")

    val profile = parser.get("profile").toLowerCase
    log.info(s"profile is '$profile'")

    // Resolution of the target path from the mdstore output version is
    // currently disabled; the target path is taken from the "targetPath"
    // parameter instead.
    //    val mdstoreOutputVersion = parser.get("mdstoreOutputVersion")
    //    log.info(s"mdstoreOutputVersion is '$mdstoreOutputVersion'")
    //    val mapper = new ObjectMapper()
    //    val cleanedMdStoreVersion = mapper.readValue(mdstoreOutputVersion, classOf[MDStoreVersion])
    //    val outputBasePath = cleanedMdStoreVersion.getHdfsPath
    //    log.info(s"outputBasePath is '$outputBasePath'")
    //    val targetPath = s"$outputBasePath$MDSTORE_DATA_PATH"
    //    log.info(s"targetPath is '$targetPath'")

    val targetPath = parser.get("targetPath")

    generateBioschemaDataset(sourcePath, exportLinks, targetPath, datasourceKey, profile, spark)

    //    reportTotalSize(targetPath, outputBasePath)
  }

  /** Counts the text lines stored under `targetPath` and writes that number
    * to the mdstore size file located under `outputBasePath`.
    *
    * @param targetPath     path of the dataset whose lines are counted
    * @param outputBasePath base path to which `MDSTORE_SIZE_PATH` is appended
    */
  def reportTotalSize(targetPath: String, outputBasePath: String): Unit = {
    val itemCount = spark.read.text(targetPath).count()
    val hadoopConf = spark.sparkContext.hadoopConfiguration
    val sizeFilePath = s"$outputBasePath$MDSTORE_SIZE_PATH"
    writeHdfsFile(hadoopConf, itemCount.toString, sizeFilePath)
  }

  /** Reads the native records as text lines, transforms each of them into
    * OAF entities and saves the resulting dataset.
    *
    * @param sourcePath    path of the native records, one record per line
    * @param exportLinks   forwarded to the transformation; when true the relations are produced too
    * @param targetPath    path where the resulting dataset is saved
    * @param datasourceKey key of the datasource, forwarded to the transformation
    * @param profile       profile name, forwarded to the transformation
    * @param spark         the Spark session to use, must not be null
    */
  def generateBioschemaDataset(
    sourcePath: String,
    exportLinks: Boolean,
    targetPath: String,
    datasourceKey: String,
    profile: String,
    spark: SparkSession
  ): Unit = {
    require(spark != null)

    implicit val resultEncoder: Encoder[Oaf] = Encoders.kryo[Oaf]

    val nativeRecords = spark.sparkContext.textFile(sourcePath)
    val oafEntities = nativeRecords.flatMap(record =>
      BioschemaToOAFTransformation.generateOAF(record, exportLinks, datasourceKey, profile)
    )

    CollectionUtils.saveDataset(spark.createDataset(oafEntities), targetPath)
  }
}
|
||||||
|
|
||||||
|
object GenerateBioschemaDatasetSpark {

  val log: Logger = LoggerFactory.getLogger(GenerateBioschemaDatasetSpark.getClass)

  /** Creates the application with the bundled parameter description,
    * initializes it and runs it.
    *
    * @param args the command line arguments of the job
    */
  def main(args: Array[String]): Unit = {
    val parametersResource = "/eu/dnetlib/dhp/bioschema/generate_dataset_params.json"
    val application = new GenerateBioschemaDatasetSpark(parametersResource, args, log)
    application.initialize().run()
  }
}
|
|
@ -0,0 +1,45 @@
|
||||||
|
{
|
||||||
|
"id": "DP01454",
|
||||||
|
"types": {
|
||||||
|
"resourceType": "Protein",
|
||||||
|
"resourceTypeGeneral": "Dataset"
|
||||||
|
},
|
||||||
|
"creators": [],
|
||||||
|
"identifiers": [
|
||||||
|
{
|
||||||
|
"identifier": "https://disprot.org/DP01454",
|
||||||
|
"identifierType": "URL"
|
||||||
|
}
|
||||||
|
],
|
||||||
|
"relatedIdentifiers": [
|
||||||
|
{
|
||||||
|
"relationType": "IsIdenticalTo",
|
||||||
|
"relatedIdentifier": "http://purl.uniprot.org/uniprot/P60006",
|
||||||
|
"relatedIdentifierType": "URL"
|
||||||
|
}
|
||||||
|
],
|
||||||
|
"alternateIdentifiers": [
|
||||||
|
{
|
||||||
|
"alternateIdentifier": "https://identifiers.org/disprot:DP01454"
|
||||||
|
}
|
||||||
|
],
|
||||||
|
"descriptions": [],
|
||||||
|
"titles": [
|
||||||
|
{
|
||||||
|
"title": "DP01454 - Anaphase-promoting complex subunit 15 "
|
||||||
|
}
|
||||||
|
],
|
||||||
|
"dates": [
|
||||||
|
{
|
||||||
|
"date": "2021-11-25T12:23:57",
|
||||||
|
"dateType": "Collected"
|
||||||
|
}
|
||||||
|
],
|
||||||
|
"subjects": [
|
||||||
|
{
|
||||||
|
"schemeURI": "https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00076",
|
||||||
|
"value": "disorder",
|
||||||
|
"subjectScheme": "IDPO:00076"
|
||||||
|
}
|
||||||
|
]
|
||||||
|
}
|
|
@ -0,0 +1,75 @@
|
||||||
|
{
|
||||||
|
"id": "Q9UPN6",
|
||||||
|
"types": {
|
||||||
|
"resourceType": "Protein",
|
||||||
|
"resourceTypeGeneral": "Dataset"
|
||||||
|
},
|
||||||
|
"creators": [],
|
||||||
|
"identifiers": [
|
||||||
|
{
|
||||||
|
"identifier": "https://mobidb.org/Q9UPN6",
|
||||||
|
"identifierType": "URL"
|
||||||
|
}
|
||||||
|
],
|
||||||
|
"relatedIdentifiers": [
|
||||||
|
{
|
||||||
|
"relationType": "IsIdenticalTo",
|
||||||
|
"relatedIdentifier": "http://purl.uniprot.org/uniprot/Q9UPN6",
|
||||||
|
"relatedIdentifierType": "URL"
|
||||||
|
}
|
||||||
|
],
|
||||||
|
"alternateIdentifiers": [
|
||||||
|
{
|
||||||
|
"alternateIdentifier": "https://identifiers.org/mobidb:Q9UPN6"
|
||||||
|
}
|
||||||
|
],
|
||||||
|
"descriptions": [],
|
||||||
|
"titles": [
|
||||||
|
{
|
||||||
|
"title": "Q9UPN6 - SR-related and CTD-associated factor 8 "
|
||||||
|
}
|
||||||
|
],
|
||||||
|
"dates": [
|
||||||
|
{
|
||||||
|
"date": "2021-12-06T14:49:15",
|
||||||
|
"dateType": "Collected"
|
||||||
|
}
|
||||||
|
],
|
||||||
|
"subjects": [
|
||||||
|
{
|
||||||
|
"schemeURI": "https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00076",
|
||||||
|
"value": "Disorder",
|
||||||
|
"subjectScheme": "IDPO:00076"
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"schemeURI": "https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00076",
|
||||||
|
"value": "Disorder",
|
||||||
|
"subjectScheme": "IDPO:00076"
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"schemeURI": "https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00076",
|
||||||
|
"value": "Disorder",
|
||||||
|
"subjectScheme": "IDPO:00076"
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"schemeURI": "https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00076",
|
||||||
|
"value": "Disorder",
|
||||||
|
"subjectScheme": "IDPO:00076"
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"schemeURI": "https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00076",
|
||||||
|
"value": "Disorder",
|
||||||
|
"subjectScheme": "IDPO:00076"
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"schemeURI": "https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00076",
|
||||||
|
"value": "Disorder",
|
||||||
|
"subjectScheme": "IDPO:00076"
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"schemeURI": "https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00076",
|
||||||
|
"value": "Disorder",
|
||||||
|
"subjectScheme": "IDPO:00076"
|
||||||
|
}
|
||||||
|
]
|
||||||
|
}
|
|
@ -0,0 +1,80 @@
|
||||||
|
{
|
||||||
|
"id": "PED00180#Q9KPH3_A_0",
|
||||||
|
"types": {
|
||||||
|
"resourceType": "Protein",
|
||||||
|
"resourceTypeGeneral": "Dataset"
|
||||||
|
},
|
||||||
|
"creators": [],
|
||||||
|
"identifiers": [
|
||||||
|
{
|
||||||
|
"identifier": "https://proteinensemble.org/PED00180#Q9KPH3_A_0",
|
||||||
|
"identifierType": "URL"
|
||||||
|
}
|
||||||
|
],
|
||||||
|
"relatedIdentifiers": [
|
||||||
|
{
|
||||||
|
"relationType": "IsCitedBy",
|
||||||
|
"relatedIdentifier": "https://doi.org/10.1016/j.jsb.2020.107573",
|
||||||
|
"relatedIdentifierType": "URL"
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"relationType": "IsIdenticalTo",
|
||||||
|
"relatedIdentifier": "http://purl.uniprot.org/uniprot/Q9KPH3",
|
||||||
|
"relatedIdentifierType": "URL"
|
||||||
|
}
|
||||||
|
],
|
||||||
|
"alternateIdentifiers": [
|
||||||
|
{
|
||||||
|
"alternateIdentifier": "https://identifiers.org/uniprot:Q9KPH3"
|
||||||
|
}
|
||||||
|
],
|
||||||
|
"descriptions": [],
|
||||||
|
"titles": [
|
||||||
|
{
|
||||||
|
"title": "PED00180#Q9KPH3_A_0 - Structural ensemble of protein DciA from Vibrio cholerae (1-157) "
|
||||||
|
}
|
||||||
|
],
|
||||||
|
"dates": [
|
||||||
|
{
|
||||||
|
"date": "2022-05-10T18:03:43",
|
||||||
|
"dateType": "Collected"
|
||||||
|
}
|
||||||
|
],
|
||||||
|
"subjects": [
|
||||||
|
{
|
||||||
|
"schemeURI": "https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00120",
|
||||||
|
"value": "NMR",
|
||||||
|
"subjectScheme": "IDPO:00120"
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"schemeURI": "https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00125",
|
||||||
|
"value": "SAXS",
|
||||||
|
"subjectScheme": "IDPO:00125"
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"schemeURI": "https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00224",
|
||||||
|
"value": "GROMACS",
|
||||||
|
"subjectScheme": "IDPO:00224"
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"schemeURI": "https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00228",
|
||||||
|
"value": "AMBER",
|
||||||
|
"subjectScheme": "IDPO:00228"
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"schemeURI": "https://disprot.org/assets/data/IDPO_v0.2.owl:00185",
|
||||||
|
"value": "FM",
|
||||||
|
"subjectScheme": "IDPO:00185"
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"schemeURI": "https://disprot.org/assets/data/IDPO_v0.2.owl:00213",
|
||||||
|
"value": "EOM",
|
||||||
|
"subjectScheme": "IDPO:00213"
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"schemeURI": "https://disprot.org/assets/data/IDPO_v0.2.owl:00214",
|
||||||
|
"value": "GAJOE",
|
||||||
|
"subjectScheme": "IDPO:00214"
|
||||||
|
}
|
||||||
|
]
|
||||||
|
}
|
|
@ -0,0 +1,5 @@
|
||||||
|
{"id":"PED00111#O75880_A_1","types":{"resourceType":"Protein","resourceTypeGeneral":"Dataset"},"creators":[],"identifiers":[{"identifier":"https://proteinensemble.org/PED00111#O75880_A_1","identifierType":"URL"}],"relatedIdentifiers":[{"relationType":"IsCitedBy","relatedIdentifier":"https://identifiers.org/pubmed:16735468","relatedIdentifierType":"URL"},{"relationType":"IsIdenticalTo","relatedIdentifier":"http://purl.uniprot.org/uniprot/O75880","relatedIdentifierType":"URL"}],"alternateIdentifiers":[{"alternateIdentifier":"https://identifiers.org/uniprot:O75880"}],"descriptions":[],"titles":[{"title":"PED00111#O75880_A_1 - Structural ensemble of the C-terminal region of Sco1 (132-301), apo structure."}],"dates":[{"date":"2021-12-10T11:17:16","dateType":"Collected"}],"subjects":[{"schemeURI":"https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00120","value":"NMR","subjectScheme":"IDPO:00120"},{"schemeURI":"https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00141","value":"TOCSY","subjectScheme":"IDPO:00141"},{"schemeURI":"https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00143","value":"NOESY","subjectScheme":"IDPO:00143"},{"schemeURI":"https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00147","value":"HSQC","subjectScheme":"IDPO:00147"},{"schemeURI":"https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00153","value":"HNHA","subjectScheme":"IDPO:00153"},{"schemeURI":"https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00154","value":"HNCO","subjectScheme":"IDPO:00154"},{"schemeURI":"https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00155","value":"HNCA","subjectScheme":"IDPO:00155"},{"schemeURI":"https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00156","value":"HNCACO","subjectScheme":"IDPO:00156"},{"schemeURI":"https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00157","value":"HNCOCA","subjectScheme":"IDPO:00157"},{"schemeURI":"https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00158","value":"HNCACB","subjectScheme":"IDPO:00158"},{"schemeURI":"https://disprot.org/
assets/data/IDPO_v0.2.owl#IDPO:00160","value":"CBCACONH","subjectScheme":"IDPO:00160"},{"schemeURI":"https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00164","value":"CBCANH","subjectScheme":"IDPO:00164"},{"schemeURI":"https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00175","value":"NOE","subjectScheme":"IDPO:00175"},{"schemeURI":"https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00228","value":"AMBER","subjectScheme":"IDPO:00228"},{"schemeURI":"https://disprot.org/assets/data/IDPO_v0.2.owl:00190","value":"DYANA","subjectScheme":"IDPO:00190"}]}
|
||||||
|
{"id":"PED00112#P19634_A_1","types":{"resourceType":"Protein","resourceTypeGeneral":"Dataset"},"creators":[],"identifiers":[{"identifier":"https://proteinensemble.org/PED00112#P19634_A_1","identifierType":"URL"}],"relatedIdentifiers":[{"relationType":"IsCitedBy","relatedIdentifier":"https://identifiers.org/pubmed:24840010","relatedIdentifierType":"URL"},{"relationType":"IsIdenticalTo","relatedIdentifier":"http://purl.uniprot.org/uniprot/P19634","relatedIdentifierType":"URL"}],"alternateIdentifiers":[{"alternateIdentifier":"https://identifiers.org/uniprot:P19634"}],"descriptions":[],"titles":[{"title":"PED00112#P19634_A_1 - Structural ensemble of the TM VI-VII of the nhe1 isoform of the sodium/hydrogen exchanger (226-274)"}],"dates":[{"date":"2021-12-10T11:17:20","dateType":"Collected"}],"subjects":[{"schemeURI":"https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00120","value":"NMR","subjectScheme":"IDPO:00120"},{"schemeURI":"https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00141","value":"TOCSY","subjectScheme":"IDPO:00141"},{"schemeURI":"https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00143","value":"NOESY","subjectScheme":"IDPO:00143"},{"schemeURI":"https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00147","value":"HSQC","subjectScheme":"IDPO:00147"},{"schemeURI":"https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00167","value":"chemical shift","subjectScheme":"IDPO:00167"},{"schemeURI":"https://disprot.org/assets/data/IDPO_v0.2.owl:00188","value":"Structure calculation","subjectScheme":"IDPO:00188"},{"schemeURI":"https://disprot.org/assets/data/IDPO_v0.2.owl:00202","value":"NMRpipe","subjectScheme":"IDPO:00202"}]}
|
||||||
|
{"id":"PED00113#P04156_A_0","types":{"resourceType":"Protein","resourceTypeGeneral":"Dataset"},"creators":[],"identifiers":[{"identifier":"https://proteinensemble.org/PED00113#P04156_A_0","identifierType":"URL"}],"relatedIdentifiers":[{"relationType":"IsIdenticalTo","relatedIdentifier":"http://purl.uniprot.org/uniprot/P04156","relatedIdentifierType":"URL"}],"alternateIdentifiers":[{"alternateIdentifier":"https://identifiers.org/uniprot:P04156"}],"descriptions":[],"titles":[{"title":"PED00113#P04156_A_0 - Structural ensemble of major prion protein (173-195)"}],"dates":[{"date":"2021-12-10T11:17:24","dateType":"Collected"}],"subjects":[{"schemeURI":"https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00120","value":"NMR","subjectScheme":"IDPO:00120"}]}
|
||||||
|
{"id":"PED00114#P27958_A_0","types":{"resourceType":"Protein","resourceTypeGeneral":"Dataset"},"creators":[],"identifiers":[{"identifier":"https://proteinensemble.org/PED00114#P27958_A_0","identifierType":"URL"}],"relatedIdentifiers":[{"relationType":"IsCitedBy","relatedIdentifier":"https://identifiers.org/pubmed:15247283","relatedIdentifierType":"URL"},{"relationType":"IsIdenticalTo","relatedIdentifier":"http://purl.uniprot.org/uniprot/P27958","relatedIdentifierType":"URL"}],"alternateIdentifiers":[{"alternateIdentifier":"https://identifiers.org/uniprot:P27958"}],"descriptions":[],"titles":[{"title":"PED00114#P27958_A_0 - Structural ensemble of the membrane anchor domain of the nonstructural protein 5A (NS5A) of hepatitis C virus (1973-2003), in 50% tfe"}],"dates":[{"date":"2021-12-10T11:17:27","dateType":"Collected"}],"subjects":[{"schemeURI":"https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00120","value":"NMR","subjectScheme":"IDPO:00120"},{"schemeURI":"https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00141","value":"TOCSY","subjectScheme":"IDPO:00141"},{"schemeURI":"https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00143","value":"NOESY","subjectScheme":"IDPO:00143"},{"schemeURI":"https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00147","value":"HSQC","subjectScheme":"IDPO:00147"},{"schemeURI":"https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00175","value":"NOE","subjectScheme":"IDPO:00175"},{"schemeURI":"https://disprot.org/assets/data/IDPO_v0.2.owl:00194","value":"X-PLOR","subjectScheme":"IDPO:00194"}]}
|
||||||
|
{"id":"PED00115#P04156_A_0","types":{"resourceType":"Protein","resourceTypeGeneral":"Dataset"},"creators":[],"identifiers":[{"identifier":"https://proteinensemble.org/PED00115#P04156_A_0","identifierType":"URL"}],"relatedIdentifiers":[{"relationType":"IsIdenticalTo","relatedIdentifier":"http://purl.uniprot.org/uniprot/P04156","relatedIdentifierType":"URL"}],"alternateIdentifiers":[{"alternateIdentifier":"https://identifiers.org/uniprot:P04156"}],"descriptions":[],"titles":[{"title":"PED00115#P04156_A_0 - Structural ensemble of major prion protein (173-195), mutant D178N"}],"dates":[{"date":"2021-12-10T11:17:30","dateType":"Collected"}],"subjects":[{"schemeURI":"https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00120","value":"NMR","subjectScheme":"IDPO:00120"}]}
|
|
@ -0,0 +1,120 @@
|
||||||
|
{
|
||||||
|
"id": "PED00111#O75880_A_1",
|
||||||
|
"types": {
|
||||||
|
"resourceType": "Protein",
|
||||||
|
"resourceTypeGeneral": "Dataset"
|
||||||
|
},
|
||||||
|
"creators": [],
|
||||||
|
"identifiers": [
|
||||||
|
{
|
||||||
|
"identifier": "https://proteinensemble.org/PED00111#O75880_A_1",
|
||||||
|
"identifierType": "URL"
|
||||||
|
}
|
||||||
|
],
|
||||||
|
"relatedIdentifiers": [
|
||||||
|
{
|
||||||
|
"relationType": "IsCitedBy",
|
||||||
|
"relatedIdentifier": "https://identifiers.org/pubmed:16735468",
|
||||||
|
"relatedIdentifierType": "URL"
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"relationType": "IsIdenticalTo",
|
||||||
|
"relatedIdentifier": "http://purl.uniprot.org/uniprot/O75880",
|
||||||
|
"relatedIdentifierType": "URL"
|
||||||
|
}
|
||||||
|
],
|
||||||
|
"alternateIdentifiers": [
|
||||||
|
{
|
||||||
|
"alternateIdentifier": "https://identifiers.org/uniprot:O75880"
|
||||||
|
}
|
||||||
|
],
|
||||||
|
"descriptions": [],
|
||||||
|
"titles": [
|
||||||
|
{
|
||||||
|
"title": "PED00111#O75880_A_1 - Structural ensemble of the C-terminal region of Sco1 (132-301), apo structure."
|
||||||
|
}
|
||||||
|
],
|
||||||
|
"dates": [
|
||||||
|
{
|
||||||
|
"date": "2021-12-10T11:17:16",
|
||||||
|
"dateType": "Collected"
|
||||||
|
}
|
||||||
|
],
|
||||||
|
"subjects": [
|
||||||
|
{
|
||||||
|
"schemeURI": "https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00120",
|
||||||
|
"value": "NMR",
|
||||||
|
"subjectScheme": "IDPO:00120"
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"schemeURI": "https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00141",
|
||||||
|
"value": "TOCSY",
|
||||||
|
"subjectScheme": "IDPO:00141"
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"schemeURI": "https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00143",
|
||||||
|
"value": "NOESY",
|
||||||
|
"subjectScheme": "IDPO:00143"
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"schemeURI": "https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00147",
|
||||||
|
"value": "HSQC",
|
||||||
|
"subjectScheme": "IDPO:00147"
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"schemeURI": "https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00153",
|
||||||
|
"value": "HNHA",
|
||||||
|
"subjectScheme": "IDPO:00153"
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"schemeURI": "https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00154",
|
||||||
|
"value": "HNCO",
|
||||||
|
"subjectScheme": "IDPO:00154"
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"schemeURI": "https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00155",
|
||||||
|
"value": "HNCA",
|
||||||
|
"subjectScheme": "IDPO:00155"
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"schemeURI": "https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00156",
|
||||||
|
"value": "HNCACO",
|
||||||
|
"subjectScheme": "IDPO:00156"
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"schemeURI": "https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00157",
|
||||||
|
"value": "HNCOCA",
|
||||||
|
"subjectScheme": "IDPO:00157"
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"schemeURI": "https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00158",
|
||||||
|
"value": "HNCACB",
|
||||||
|
"subjectScheme": "IDPO:00158"
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"schemeURI": "https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00160",
|
||||||
|
"value": "CBCACONH",
|
||||||
|
"subjectScheme": "IDPO:00160"
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"schemeURI": "https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00164",
|
||||||
|
"value": "CBCANH",
|
||||||
|
"subjectScheme": "IDPO:00164"
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"schemeURI": "https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00175",
|
||||||
|
"value": "NOE",
|
||||||
|
"subjectScheme": "IDPO:00175"
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"schemeURI": "https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00228",
|
||||||
|
"value": "AMBER",
|
||||||
|
"subjectScheme": "IDPO:00228"
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"schemeURI": "https://disprot.org/assets/data/IDPO_v0.2.owl:00190",
|
||||||
|
"value": "DYANA",
|
||||||
|
"subjectScheme": "IDPO:00190"
|
||||||
|
}
|
||||||
|
]
|
||||||
|
}
|
|
@ -0,0 +1,115 @@
|
||||||
|
package eu.dnetlib.dhp.bioschema
|
||||||
|
|
||||||
|
import com.fasterxml.jackson.databind.{ObjectMapper, SerializationFeature}
|
||||||
|
import eu.dnetlib.dhp.aggregation.AbstractVocabularyTest
|
||||||
|
import eu.dnetlib.dhp.schema.oaf.Oaf
|
||||||
|
import org.apache.commons.io.FileUtils
|
||||||
|
import org.apache.spark.SparkConf
|
||||||
|
import org.apache.spark.sql.{Encoder, Encoders, SparkSession}
|
||||||
|
import org.junit.jupiter.api.Assertions._
|
||||||
|
import org.junit.jupiter.api.extension.ExtendWith
|
||||||
|
import org.junit.jupiter.api.{AfterEach, BeforeEach, Test}
|
||||||
|
import org.mockito.junit.jupiter.MockitoExtension
|
||||||
|
import org.slf4j.{Logger, LoggerFactory}
|
||||||
|
|
||||||
|
import java.nio.file.{Files, Path}
|
||||||
|
import scala.io.Source
|
||||||
|
|
||||||
|
@ExtendWith(Array(classOf[MockitoExtension]))
class BioschemaDataciteToOAFTest {

  private var workingDir: Path = null
  val log: Logger = LoggerFactory.getLogger(getClass)

  /** Creates a fresh temporary working directory before each test. */
  @BeforeEach
  def setUp(): Unit = {
    workingDir = Files.createTempDirectory(getClass.getSimpleName)
  }

  /** Removes the temporary working directory after each test. */
  @AfterEach
  def tearDown(): Unit = {
    FileUtils.deleteDirectory(workingDir.toFile)
  }

  /** Runs the whole dataset generation on the PED dump, with and without
    * link export, and checks the number of lines written in each case.
    */
  @Test
  def testGeneratePED(): Unit = {
    val path = getClass.getResource("/eu/dnetlib/dhp/bioschema/ped_dump").getPath
    val conf = new SparkConf()
    val spark: SparkSession = SparkSession
      .builder()
      .config(conf)
      .appName(getClass.getSimpleName)
      .master("local[*]")
      .getOrCreate()

    // The session is stopped in `finally` so that a failing assertion does
    // not leave it running for the tests that follow.
    try {
      val instance = new GenerateBioschemaDatasetSpark(null, null, log)
      val targetPath = s"$workingDir/result"

      instance.generateBioschemaDataset(path, exportLinks = true, targetPath, "ped", "protein", spark)

      val total_items = spark.read.text(targetPath).count()
      println(s"total_items: $total_items")
      assertEquals(21L, total_items)

      instance.generateBioschemaDataset(path, exportLinks = false, targetPath, "ped", "protein", spark)

      val total_datasets = spark.read.text(targetPath).count()
      println(s"total_datasets: $total_datasets")
      assertEquals(5L, total_datasets)
    } finally {
      spark.stop()
    }
  }

  /** Transforms the PED sample record and prints the resulting entities. */
  @Test
  def testPEDMapping(): Unit = {
    printMapping("/eu/dnetlib/dhp/bioschema/ped_record.json", "ped")
  }

  /** Transforms the DisProt sample record and prints the resulting entities. */
  @Test
  def testDISPROTMapping(): Unit = {
    printMapping("/eu/dnetlib/dhp/bioschema/disprot_record.json", "disprot")
  }

  /** Transforms the MobiDB sample record and prints the resulting entities. */
  @Test
  def testMOBIDBMapping(): Unit = {
    printMapping("/eu/dnetlib/dhp/bioschema/mobidb_record.json", "mobidb")
  }

  /** Transforms the PED record citing a DOI and prints the resulting entities. */
  @Test
  def testPEDDoiCitationMapping(): Unit = {
    printMapping("/eu/dnetlib/dhp/bioschema/ped_doi_citation.json", "ped")
  }

  /** Loads a record from the classpath, transforms it with link export
    * enabled and the "protein" profile, and prints every produced entity
    * as indented JSON.
    *
    * @param resourcePath  classpath location of the JSON record
    * @param datasourceKey datasource key passed to the transformation
    */
  private def printMapping(resourcePath: String, datasourceKey: String): Unit = {
    val source = Source.fromInputStream(getClass.getResourceAsStream(resourcePath))
    // Close the underlying stream as soon as the content has been read.
    val record =
      try source.mkString
      finally source.close()

    val mapper = new ObjectMapper().enable(SerializationFeature.INDENT_OUTPUT)
    val res: List[Oaf] = BioschemaToOAFTransformation.generateOAF(record, true, datasourceKey, "protein")
    res.foreach(r => {
      println(mapper.writeValueAsString(r))
      println("----------------------------")
    })
  }
}
|
|
@ -0,0 +1,42 @@
|
||||||
|
<?xml version="1.0" encoding="UTF-8"?>
|
||||||
|
<project xmlns="http://maven.apache.org/POM/4.0.0" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xsi:schemaLocation="http://maven.apache.org/POM/4.0.0 http://maven.apache.org/xsd/maven-4.0.0.xsd">
|
||||||
|
<modelVersion>4.0.0</modelVersion>
|
||||||
|
<parent>
|
||||||
|
<groupId>eu.dnetlib.dhp</groupId>
|
||||||
|
<artifactId>dhp-workflows</artifactId>
|
||||||
|
<version>1.2.5-SNAPSHOT</version>
|
||||||
|
</parent>
|
||||||
|
<artifactId>dhp-rdfconverter</artifactId>
|
||||||
|
|
||||||
|
<dependencies>
|
||||||
|
<dependency>
|
||||||
|
<groupId>org.apache.spark</groupId>
|
||||||
|
<artifactId>spark-core_2.11</artifactId>
|
||||||
|
</dependency>
|
||||||
|
<dependency>
|
||||||
|
<groupId>org.apache.spark</groupId>
|
||||||
|
<artifactId>spark-sql_2.11</artifactId>
|
||||||
|
</dependency>
|
||||||
|
<dependency>
|
||||||
|
<groupId>eu.dnetlib.dhp</groupId>
|
||||||
|
<artifactId>dhp-common</artifactId>
|
||||||
|
<version>${project.version}</version>
|
||||||
|
</dependency>
|
||||||
|
<dependency>
|
||||||
|
<groupId>org.apache.any23</groupId>
|
||||||
|
<artifactId>apache-any23-core</artifactId>
|
||||||
|
<version>2.3</version>
|
||||||
|
</dependency>
|
||||||
|
<dependency>
|
||||||
|
<groupId>org.eclipse.rdf4j</groupId>
|
||||||
|
<artifactId>rdf4j-rio-rdfxml</artifactId>
|
||||||
|
<version>2.5.4</version>
|
||||||
|
</dependency>
|
||||||
|
<dependency>
|
||||||
|
<groupId>org.eclipse.rdf4j</groupId>
|
||||||
|
<artifactId>rdf4j-model</artifactId>
|
||||||
|
<version>2.5.4</version>
|
||||||
|
</dependency>
|
||||||
|
</dependencies>
|
||||||
|
|
||||||
|
</project>
|
|
@ -0,0 +1,82 @@
|
||||||
|
|
||||||
|
package eu.dnetlib.dhp.rdfconverter.bioschema;
|
||||||
|
|
||||||
|
import static eu.dnetlib.dhp.common.SparkSessionSupport.runWithSparkSession;
|
||||||
|
|
||||||
|
import java.util.ArrayList;
|
||||||
|
import java.util.Arrays;
|
||||||
|
import java.util.Objects;
|
||||||
|
import java.util.Optional;
|
||||||
|
|
||||||
|
import org.apache.commons.io.IOUtils;
|
||||||
|
import org.apache.hadoop.io.Text;
|
||||||
|
import org.apache.hadoop.io.compress.GzipCodec;
|
||||||
|
import org.apache.spark.SparkConf;
|
||||||
|
import org.apache.spark.api.java.JavaPairRDD;
|
||||||
|
import org.apache.spark.api.java.JavaRDD;
|
||||||
|
import org.apache.spark.api.java.JavaSparkContext;
|
||||||
|
import org.slf4j.Logger;
|
||||||
|
import org.slf4j.LoggerFactory;
|
||||||
|
|
||||||
|
import eu.dnetlib.dhp.application.ArgumentApplicationParser;
|
||||||
|
import eu.dnetlib.dhp.rdfconverter.utils.CompressorUtil;
|
||||||
|
import eu.dnetlib.dhp.rdfconverter.utils.RDFConverter;
|
||||||
|
import ucar.nc2.stream.NcStreamProto;
|
||||||
|
|
||||||
|
public class SparkRdfToDatacite {
|
||||||
|
|
||||||
|
static Logger logger = LoggerFactory.getLogger(SparkRdfToDatacite.class);
|
||||||
|
|
||||||
|
public static void main(String[] args) throws Exception {
|
||||||
|
|
||||||
|
final ArgumentApplicationParser parser = new ArgumentApplicationParser(
|
||||||
|
IOUtils
|
||||||
|
.toString(
|
||||||
|
SparkRdfToDatacite.class
|
||||||
|
.getResourceAsStream(
|
||||||
|
"/eu/dnetlib/dhp/rdfconverter/bioschema/generate_dataset.json")));
|
||||||
|
parser.parseArgument(args);
|
||||||
|
Boolean isSparkSessionManaged = Optional
|
||||||
|
.ofNullable(parser.get("isSparkSessionManaged"))
|
||||||
|
.map(Boolean::valueOf)
|
||||||
|
.orElse(Boolean.TRUE);
|
||||||
|
final String workingPath = parser.get("workingPath");
|
||||||
|
final String rdfNquadsRecords = parser.get("rdfInput");
|
||||||
|
final String output = parser.get("output");
|
||||||
|
final String profile = parser.get("profile");
|
||||||
|
|
||||||
|
SparkConf conf = new SparkConf();
|
||||||
|
runWithSparkSession(
|
||||||
|
conf,
|
||||||
|
isSparkSessionManaged,
|
||||||
|
spark -> {
|
||||||
|
JavaSparkContext sc = JavaSparkContext.fromSparkContext(spark.sparkContext());
|
||||||
|
String base64GzippedNquadsPath = workingPath.concat(rdfNquadsRecords);
|
||||||
|
JavaRDD<String> base64GzippedNquadsRDD = sc
|
||||||
|
.textFile(base64GzippedNquadsPath);
|
||||||
|
logger.info("Rdf nquads records retrieved: {}", base64GzippedNquadsRDD.count());
|
||||||
|
|
||||||
|
JavaRDD<String> proteins2 = base64GzippedNquadsRDD
|
||||||
|
.flatMap(nquads -> {
|
||||||
|
RDFConverter converter = new RDFConverter();
|
||||||
|
ArrayList<String> jsonlds = null;
|
||||||
|
try {
|
||||||
|
jsonlds = converter
|
||||||
|
.nQuadsFile2DataciteJson(CompressorUtil.decompressValue(nquads), profile);
|
||||||
|
} catch (Exception e) {
|
||||||
|
logger.error("converting: " + nquads, e);
|
||||||
|
return Arrays.asList(new String()).iterator();
|
||||||
|
}
|
||||||
|
return jsonlds.iterator();
|
||||||
|
});
|
||||||
|
logger.info("json datacite non filtered: {}", proteins2.count());
|
||||||
|
JavaRDD<Text> proteins = proteins2
|
||||||
|
.filter(Objects::nonNull)
|
||||||
|
.filter(jsonld -> !jsonld.isEmpty())
|
||||||
|
.distinct()
|
||||||
|
.map(jsonld -> new Text(jsonld));
|
||||||
|
logger.info("json datacite generated: {}", proteins.count());
|
||||||
|
proteins.saveAsTextFile(workingPath.concat(output), GzipCodec.class);
|
||||||
|
});
|
||||||
|
}
|
||||||
|
}
|
|
@ -0,0 +1,489 @@
|
||||||
|
|
||||||
|
package eu.dnetlib.dhp.rdfconverter.bioschema.model;
|
||||||
|
|
||||||
|
import java.util.List;
|
||||||
|
|
||||||
|
import com.fasterxml.jackson.annotation.JsonIgnoreProperties;
|
||||||
|
import com.fasterxml.jackson.annotation.JsonProperty;
|
||||||
|
import com.fasterxml.jackson.databind.annotation.JsonDeserialize;
|
||||||
|
|
||||||
|
import eu.dnetlib.dhp.rdfconverter.utils.CustomPropertyValueDeserializer;
|
||||||
|
|
||||||
|
@JsonIgnoreProperties(ignoreUnknown = true)
|
||||||
|
public class BioSchemaProtein {
|
||||||
|
@JsonProperty("@id")
|
||||||
|
private String id;
|
||||||
|
@JsonProperty("@graph")
|
||||||
|
private List<Entry> entryList;
|
||||||
|
@JsonProperty("http://purl.org/pav/retrievedOn")
|
||||||
|
private DateTimeType retrievedOn;
|
||||||
|
|
||||||
|
public static class Entry {
|
||||||
|
@JsonProperty("@id")
|
||||||
|
private String id;
|
||||||
|
@JsonProperty("@type")
|
||||||
|
// private List<String> type;
|
||||||
|
private String type;
|
||||||
|
@JsonProperty("https://schema.org/identifier")
|
||||||
|
private String identifier;
|
||||||
|
@JsonProperty("https://schema.org/name")
|
||||||
|
private String name;
|
||||||
|
@JsonProperty("associatedDisease")
|
||||||
|
private List<AssociatedDisease> associatedDisease;
|
||||||
|
@JsonProperty("description")
|
||||||
|
private String description;
|
||||||
|
@JsonProperty("isEncodedByBioChemEntity")
|
||||||
|
private String isEncodedByBioChemEntity;
|
||||||
|
@JsonProperty("url")
|
||||||
|
private String url;
|
||||||
|
@JsonProperty("alternateName")
|
||||||
|
private String alternateName;
|
||||||
|
@JsonProperty("bioChemInteraction")
|
||||||
|
private List<Link> bioChemInteraction;
|
||||||
|
@JsonProperty("bioChemSimilarity")
|
||||||
|
private List<Link> bioChemSimilarity;
|
||||||
|
@JsonProperty("hasMolecularFunction")
|
||||||
|
private String hasMolecularFunction;
|
||||||
|
@JsonProperty("image")
|
||||||
|
private String image;
|
||||||
|
@JsonProperty("isInvolvedInBiologicalProcess")
|
||||||
|
private String isInvolvedInBiologicalProcess;
|
||||||
|
@JsonProperty("isPartOfBioChemEntity")
|
||||||
|
private IsPartOfBioChemEntity isPartOfBioChemEntity;
|
||||||
|
@JsonProperty("mainEntityOfPage")
|
||||||
|
private Link mainEntityOfPage;
|
||||||
|
@JsonProperty("https://schema.org/citation")
|
||||||
|
private Citation citation;
|
||||||
|
@JsonProperty("https://schema.org/sameAs")
|
||||||
|
private List<Link> sameAs;
|
||||||
|
@JsonProperty("https://schema.org/hasSequenceAnnotation")
|
||||||
|
private List<Link> hasSequenceAnnotation;
|
||||||
|
@JsonProperty("https://schema.org/additionalProperty")
|
||||||
|
private List<Link> sequenceAnnotation;
|
||||||
|
@JsonProperty("https://schema.org/value")
|
||||||
|
@JsonDeserialize(using = CustomPropertyValueDeserializer.class)
|
||||||
|
private Link propertyValue;
|
||||||
|
@JsonProperty("https://schema.org/termCode")
|
||||||
|
private String termCode;
|
||||||
|
|
||||||
|
public String getId() {
|
||||||
|
return id;
|
||||||
|
}
|
||||||
|
|
||||||
|
public void setId(String id) {
|
||||||
|
this.id = id;
|
||||||
|
}
|
||||||
|
|
||||||
|
public String getType() {
|
||||||
|
return type;
|
||||||
|
}
|
||||||
|
|
||||||
|
public void setType(String type) {
|
||||||
|
this.type = type;
|
||||||
|
}
|
||||||
|
|
||||||
|
public String getName() {
|
||||||
|
return name;
|
||||||
|
}
|
||||||
|
|
||||||
|
public void setName(String name) {
|
||||||
|
this.name = name;
|
||||||
|
}
|
||||||
|
|
||||||
|
public List<Link> getSameAs() {
|
||||||
|
return sameAs;
|
||||||
|
}
|
||||||
|
|
||||||
|
public void setSameAs(List<Link> sameAs) {
|
||||||
|
this.sameAs = sameAs;
|
||||||
|
}
|
||||||
|
|
||||||
|
public String getIdentifier() {
|
||||||
|
return identifier;
|
||||||
|
}
|
||||||
|
|
||||||
|
public void setIdentifier(String identifier) {
|
||||||
|
this.identifier = identifier;
|
||||||
|
}
|
||||||
|
|
||||||
|
public String getDescription() {
|
||||||
|
return description;
|
||||||
|
}
|
||||||
|
|
||||||
|
public void setDescription(String description) {
|
||||||
|
this.description = description;
|
||||||
|
}
|
||||||
|
|
||||||
|
public String getIsEncodedByBioChemEntity() {
|
||||||
|
return isEncodedByBioChemEntity;
|
||||||
|
}
|
||||||
|
|
||||||
|
public void setIsEncodedByBioChemEntity(String isEncodedByBioChemEntity) {
|
||||||
|
this.isEncodedByBioChemEntity = isEncodedByBioChemEntity;
|
||||||
|
}
|
||||||
|
|
||||||
|
public String getUrl() {
|
||||||
|
return url;
|
||||||
|
}
|
||||||
|
|
||||||
|
public void setUrl(String url) {
|
||||||
|
this.url = url;
|
||||||
|
}
|
||||||
|
|
||||||
|
public String getAlternateName() {
|
||||||
|
return alternateName;
|
||||||
|
}
|
||||||
|
|
||||||
|
public void setAlternateName(String alternateName) {
|
||||||
|
this.alternateName = alternateName;
|
||||||
|
}
|
||||||
|
|
||||||
|
public List<Link> getBioChemInteraction() {
|
||||||
|
return bioChemInteraction;
|
||||||
|
}
|
||||||
|
|
||||||
|
public void setBioChemInteraction(List<Link> bioChemInteraction) {
|
||||||
|
this.bioChemInteraction = bioChemInteraction;
|
||||||
|
}
|
||||||
|
|
||||||
|
public List<Link> getBioChemSimilarity() {
|
||||||
|
return bioChemSimilarity;
|
||||||
|
}
|
||||||
|
|
||||||
|
public void setBioChemSimilarity(List<Link> bioChemSimilarity) {
|
||||||
|
this.bioChemSimilarity = bioChemSimilarity;
|
||||||
|
}
|
||||||
|
|
||||||
|
public String getHasMolecularFunction() {
|
||||||
|
return hasMolecularFunction;
|
||||||
|
}
|
||||||
|
|
||||||
|
public void setHasMolecularFunction(String hasMolecularFunction) {
|
||||||
|
this.hasMolecularFunction = hasMolecularFunction;
|
||||||
|
}
|
||||||
|
|
||||||
|
public String getImage() {
|
||||||
|
return image;
|
||||||
|
}
|
||||||
|
|
||||||
|
public void setImage(String image) {
|
||||||
|
this.image = image;
|
||||||
|
}
|
||||||
|
|
||||||
|
public String getIsInvolvedInBiologicalProcess() {
|
||||||
|
return isInvolvedInBiologicalProcess;
|
||||||
|
}
|
||||||
|
|
||||||
|
public void setIsInvolvedInBiologicalProcess(String isInvolvedInBiologicalProcess) {
|
||||||
|
this.isInvolvedInBiologicalProcess = isInvolvedInBiologicalProcess;
|
||||||
|
}
|
||||||
|
|
||||||
|
public List<AssociatedDisease> getAssociatedDisease() {
|
||||||
|
return associatedDisease;
|
||||||
|
}
|
||||||
|
|
||||||
|
public void setAssociatedDisease(List<AssociatedDisease> associatedDisease) {
|
||||||
|
this.associatedDisease = associatedDisease;
|
||||||
|
}
|
||||||
|
|
||||||
|
public IsPartOfBioChemEntity getIsPartOfBioChemEntity() {
|
||||||
|
return isPartOfBioChemEntity;
|
||||||
|
}
|
||||||
|
|
||||||
|
public void setIsPartOfBioChemEntity(IsPartOfBioChemEntity isPartOfBioChemEntity) {
|
||||||
|
this.isPartOfBioChemEntity = isPartOfBioChemEntity;
|
||||||
|
}
|
||||||
|
|
||||||
|
public Link getMainEntityOfPage() {
|
||||||
|
return mainEntityOfPage;
|
||||||
|
}
|
||||||
|
|
||||||
|
public void setMainEntityOfPage(Link mainEntityOfPage) {
|
||||||
|
this.mainEntityOfPage = mainEntityOfPage;
|
||||||
|
}
|
||||||
|
|
||||||
|
public List<Link> getHasSequenceAnnotation() {
|
||||||
|
return hasSequenceAnnotation;
|
||||||
|
}
|
||||||
|
|
||||||
|
public void setHasSequenceAnnotation(List<Link> hasSequenceAnnotation) {
|
||||||
|
this.hasSequenceAnnotation = hasSequenceAnnotation;
|
||||||
|
}
|
||||||
|
|
||||||
|
public List<Link> getSequenceAnnotation() {
|
||||||
|
return sequenceAnnotation;
|
||||||
|
}
|
||||||
|
|
||||||
|
public void setSequenceAnnotation(List<Link> sequenceAnnotation) {
|
||||||
|
this.sequenceAnnotation = sequenceAnnotation;
|
||||||
|
}
|
||||||
|
|
||||||
|
public Citation getCitation() {
|
||||||
|
return citation;
|
||||||
|
}
|
||||||
|
|
||||||
|
public void setCitation(Citation citation) {
|
||||||
|
this.citation = citation;
|
||||||
|
}
|
||||||
|
|
||||||
|
public Link getPropertyValue() {
|
||||||
|
return propertyValue;
|
||||||
|
}
|
||||||
|
|
||||||
|
public void setPropertyValue(Link propertyValue) {
|
||||||
|
this.propertyValue = propertyValue;
|
||||||
|
}
|
||||||
|
|
||||||
|
public String getTermCode() {
|
||||||
|
return termCode;
|
||||||
|
}
|
||||||
|
|
||||||
|
public void setTermCode(String termCode) {
|
||||||
|
this.termCode = termCode;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
public static class IsPartOfBioChemEntity {
|
||||||
|
@JsonProperty("@type")
|
||||||
|
private String type;
|
||||||
|
@JsonProperty("url")
|
||||||
|
private String url;
|
||||||
|
|
||||||
|
public String getType() {
|
||||||
|
return type;
|
||||||
|
}
|
||||||
|
|
||||||
|
public void setType(String type) {
|
||||||
|
this.type = type;
|
||||||
|
}
|
||||||
|
|
||||||
|
public String getUrl() {
|
||||||
|
return url;
|
||||||
|
}
|
||||||
|
|
||||||
|
public void setUrl(String url) {
|
||||||
|
this.url = url;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
public static class AssociatedDisease {
|
||||||
|
@JsonProperty("@type")
|
||||||
|
private String type;
|
||||||
|
@JsonProperty("name")
|
||||||
|
private String name;
|
||||||
|
@JsonProperty("code")
|
||||||
|
private DeseaseCode code;
|
||||||
|
@JsonProperty("id")
|
||||||
|
private String id;
|
||||||
|
|
||||||
|
public String getType() {
|
||||||
|
return type;
|
||||||
|
}
|
||||||
|
|
||||||
|
public void setType(String type) {
|
||||||
|
this.type = type;
|
||||||
|
}
|
||||||
|
|
||||||
|
public String getName() {
|
||||||
|
return name;
|
||||||
|
}
|
||||||
|
|
||||||
|
public void setName(String name) {
|
||||||
|
this.name = name;
|
||||||
|
}
|
||||||
|
|
||||||
|
public DeseaseCode getCode() {
|
||||||
|
return code;
|
||||||
|
}
|
||||||
|
|
||||||
|
public void setCode(DeseaseCode code) {
|
||||||
|
this.code = code;
|
||||||
|
}
|
||||||
|
|
||||||
|
public String getId() {
|
||||||
|
return id;
|
||||||
|
}
|
||||||
|
|
||||||
|
public void setId(String id) {
|
||||||
|
this.id = id;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
public static class DeseaseCode {
|
||||||
|
@JsonProperty("@type")
|
||||||
|
private String type;
|
||||||
|
@JsonProperty("codeValue")
|
||||||
|
private String codeValue;
|
||||||
|
@JsonProperty("codingSystem")
|
||||||
|
private String codingSystem;
|
||||||
|
|
||||||
|
public String getType() {
|
||||||
|
return type;
|
||||||
|
}
|
||||||
|
|
||||||
|
public void setType(String type) {
|
||||||
|
this.type = type;
|
||||||
|
}
|
||||||
|
|
||||||
|
public String getCodeValue() {
|
||||||
|
return codeValue;
|
||||||
|
}
|
||||||
|
|
||||||
|
public void setCodeValue(String codeValue) {
|
||||||
|
this.codeValue = codeValue;
|
||||||
|
}
|
||||||
|
|
||||||
|
public String getCodingSystem() {
|
||||||
|
return codingSystem;
|
||||||
|
}
|
||||||
|
|
||||||
|
public void setCodingSystem(String codingSystem) {
|
||||||
|
this.codingSystem = codingSystem;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
public static class Link {
|
||||||
|
@JsonProperty("@id")
|
||||||
|
private String id;
|
||||||
|
|
||||||
|
public String getId() {
|
||||||
|
return id;
|
||||||
|
}
|
||||||
|
|
||||||
|
public void setId(String id) {
|
||||||
|
this.id = id;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
public static class DateTimeType {
|
||||||
|
@JsonProperty("@type")
|
||||||
|
private String type;
|
||||||
|
@JsonProperty("@value")
|
||||||
|
private String value;
|
||||||
|
|
||||||
|
public String getType() {
|
||||||
|
return type;
|
||||||
|
}
|
||||||
|
|
||||||
|
public void setType(String type) {
|
||||||
|
this.type = type;
|
||||||
|
}
|
||||||
|
|
||||||
|
public String getValue() {
|
||||||
|
return value;
|
||||||
|
}
|
||||||
|
|
||||||
|
public void setValue(String value) {
|
||||||
|
this.value = value;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
public static class Citation {
|
||||||
|
@JsonProperty("@id")
|
||||||
|
private String id;
|
||||||
|
|
||||||
|
public String getId() {
|
||||||
|
return id;
|
||||||
|
}
|
||||||
|
|
||||||
|
public void setId(String id) {
|
||||||
|
this.id = id;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
public static class SequenceAnnotationId {
|
||||||
|
@JsonProperty("@id")
|
||||||
|
private String id;
|
||||||
|
|
||||||
|
public String getId() {
|
||||||
|
return id;
|
||||||
|
}
|
||||||
|
|
||||||
|
public void setId(String id) {
|
||||||
|
this.id = id;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
public static class SequenceAnnotation {
|
||||||
|
@JsonProperty("https://schema.org/additionalProperty")
|
||||||
|
private List<PropertyValue> additionalProperty;
|
||||||
|
|
||||||
|
public List<PropertyValue> getAdditionalProperty() {
|
||||||
|
return additionalProperty;
|
||||||
|
}
|
||||||
|
|
||||||
|
public void setAdditionalProperty(List<PropertyValue> additionalProperty) {
|
||||||
|
this.additionalProperty = additionalProperty;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
public static class PropertyValue {
|
||||||
|
@JsonProperty("https://schema.org/value")
|
||||||
|
private DefinedTerm definedTerm;
|
||||||
|
|
||||||
|
public DefinedTerm getDefinedTerm() {
|
||||||
|
return definedTerm;
|
||||||
|
}
|
||||||
|
|
||||||
|
public void setDefinedTerm(DefinedTerm definedTerm) {
|
||||||
|
this.definedTerm = definedTerm;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
public static class DefinedTerm {
|
||||||
|
@JsonProperty("@id")
|
||||||
|
private String id;
|
||||||
|
@JsonProperty("https://schema.org/termCode")
|
||||||
|
private String termCode;
|
||||||
|
@JsonProperty("https://schema.org/name")
|
||||||
|
private String name;
|
||||||
|
|
||||||
|
public String getId() {
|
||||||
|
return id;
|
||||||
|
}
|
||||||
|
|
||||||
|
public void setId(String id) {
|
||||||
|
this.id = id;
|
||||||
|
}
|
||||||
|
|
||||||
|
public String getTermCode() {
|
||||||
|
return termCode;
|
||||||
|
}
|
||||||
|
|
||||||
|
public void setTermCode(String termCode) {
|
||||||
|
this.termCode = termCode;
|
||||||
|
}
|
||||||
|
|
||||||
|
public String getName() {
|
||||||
|
return name;
|
||||||
|
}
|
||||||
|
|
||||||
|
public void setName(String name) {
|
||||||
|
this.name = name;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
public String getId() {
|
||||||
|
return id;
|
||||||
|
}
|
||||||
|
|
||||||
|
public void setId(String id) {
|
||||||
|
this.id = id;
|
||||||
|
}
|
||||||
|
|
||||||
|
public List<Entry> getEntryList() {
|
||||||
|
return entryList;
|
||||||
|
}
|
||||||
|
|
||||||
|
public void setEntryList(List<Entry> entryList) {
|
||||||
|
this.entryList = entryList;
|
||||||
|
}
|
||||||
|
|
||||||
|
public DateTimeType getRetrievedOn() {
|
||||||
|
return retrievedOn;
|
||||||
|
}
|
||||||
|
|
||||||
|
public void setRetrievedOn(DateTimeType retrievedOn) {
|
||||||
|
this.retrievedOn = retrievedOn;
|
||||||
|
}
|
||||||
|
}
|
|
@ -0,0 +1,331 @@
|
||||||
|
|
||||||
|
package eu.dnetlib.dhp.rdfconverter.bioschema.model;
|
||||||
|
|
||||||
|
import java.util.ArrayList;
|
||||||
|
import java.util.List;
|
||||||
|
|
||||||
|
import com.fasterxml.jackson.annotation.JsonInclude;
|
||||||
|
|
||||||
|
@JsonInclude(JsonInclude.Include.NON_NULL)
|
||||||
|
public class DataciteProtein {
|
||||||
|
private String id;
|
||||||
|
private String doi;
|
||||||
|
private Types types;
|
||||||
|
List<Creators> creators = new ArrayList<Creators>();
|
||||||
|
private String publisher;
|
||||||
|
private String publicationYear;
|
||||||
|
private static final String schemaVersion = "http://datacite.org/schema/kernel-4";
|
||||||
|
List<Identifier> identifiers = new ArrayList<Identifier>();
|
||||||
|
List<RelatedIdentifier> relatedIdentifiers = new ArrayList<RelatedIdentifier>();
|
||||||
|
List<AlternateIdentifier> alternateIdentifiers = new ArrayList<AlternateIdentifier>();
|
||||||
|
List<Description> descriptions = new ArrayList<Description>();
|
||||||
|
List<Title> titles = new ArrayList<Title>();
|
||||||
|
private List<DataciteDate> dates = new ArrayList<DataciteDate>();
|
||||||
|
private List<Subject> subjects = new ArrayList<Subject>();
|
||||||
|
|
||||||
|
@JsonInclude(JsonInclude.Include.NON_NULL)
|
||||||
|
public static class Types {
|
||||||
|
private String resourceType;
|
||||||
|
private String resourceTypeGeneral;
|
||||||
|
|
||||||
|
public String getResourceType() {
|
||||||
|
return resourceType;
|
||||||
|
}
|
||||||
|
|
||||||
|
public void setResourceType(String resourceType) {
|
||||||
|
this.resourceType = resourceType;
|
||||||
|
}
|
||||||
|
|
||||||
|
public String getResourceTypeGeneral() {
|
||||||
|
return resourceTypeGeneral;
|
||||||
|
}
|
||||||
|
|
||||||
|
public void setResourceTypeGeneral(String resourceTypeGeneral) {
|
||||||
|
this.resourceTypeGeneral = resourceTypeGeneral;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
@JsonInclude(JsonInclude.Include.NON_NULL)
|
||||||
|
public static class Creators {
|
||||||
|
}
|
||||||
|
|
||||||
|
@JsonInclude(JsonInclude.Include.NON_NULL)
|
||||||
|
public static class Identifier {
|
||||||
|
private String identifier;
|
||||||
|
private String identifierType;
|
||||||
|
|
||||||
|
public String getIdentifier() {
|
||||||
|
return identifier;
|
||||||
|
}
|
||||||
|
|
||||||
|
public void setIdentifier(String identifier) {
|
||||||
|
this.identifier = identifier;
|
||||||
|
}
|
||||||
|
|
||||||
|
public String getIdentifierType() {
|
||||||
|
return identifierType;
|
||||||
|
}
|
||||||
|
|
||||||
|
public void setIdentifierType(String identifierType) {
|
||||||
|
this.identifierType = identifierType;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
@JsonInclude(JsonInclude.Include.NON_NULL)
|
||||||
|
public static class RelatedIdentifier {
|
||||||
|
private String relationType;
|
||||||
|
private String relatedIdentifier;
|
||||||
|
private String relatedIdentifierType;
|
||||||
|
|
||||||
|
public String getRelationType() {
|
||||||
|
return relationType;
|
||||||
|
}
|
||||||
|
|
||||||
|
public void setRelationType(String relationType) {
|
||||||
|
this.relationType = relationType;
|
||||||
|
}
|
||||||
|
|
||||||
|
public String getRelatedIdentifier() {
|
||||||
|
return relatedIdentifier;
|
||||||
|
}
|
||||||
|
|
||||||
|
public void setRelatedIdentifier(String relatedIdentifier) {
|
||||||
|
this.relatedIdentifier = relatedIdentifier;
|
||||||
|
}
|
||||||
|
|
||||||
|
public String getRelatedIdentifierType() {
|
||||||
|
return relatedIdentifierType;
|
||||||
|
}
|
||||||
|
|
||||||
|
public void setRelatedIdentifierType(String relatedIdentifierType) {
|
||||||
|
this.relatedIdentifierType = relatedIdentifierType;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
@JsonInclude(JsonInclude.Include.NON_NULL)
|
||||||
|
public static class AlternateIdentifier {
|
||||||
|
private String alternateIdentifier;
|
||||||
|
private String alternateIdentifierType;
|
||||||
|
|
||||||
|
public String getAlternateIdentifier() {
|
||||||
|
return alternateIdentifier;
|
||||||
|
}
|
||||||
|
|
||||||
|
public void setAlternateIdentifier(String alternateIdentifier) {
|
||||||
|
this.alternateIdentifier = alternateIdentifier;
|
||||||
|
}
|
||||||
|
|
||||||
|
public String getAlternateIdentifierType() {
|
||||||
|
return alternateIdentifierType;
|
||||||
|
}
|
||||||
|
|
||||||
|
public void setAlternateIdentifierType(String alternateIdentifierType) {
|
||||||
|
this.alternateIdentifierType = alternateIdentifierType;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
@JsonInclude(JsonInclude.Include.NON_NULL)
|
||||||
|
public static class Description {
|
||||||
|
private String description;
|
||||||
|
private String descriptionType;
|
||||||
|
|
||||||
|
public String getDescription() {
|
||||||
|
return description;
|
||||||
|
}
|
||||||
|
|
||||||
|
public void setDescription(String description) {
|
||||||
|
this.description = description;
|
||||||
|
}
|
||||||
|
|
||||||
|
public String getDescriptionType() {
|
||||||
|
return descriptionType;
|
||||||
|
}
|
||||||
|
|
||||||
|
public void setDescriptionType(String descriptionType) {
|
||||||
|
this.descriptionType = descriptionType;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
@JsonInclude(JsonInclude.Include.NON_NULL)
|
||||||
|
public static class Title {
|
||||||
|
private String title;
|
||||||
|
private String titleType;
|
||||||
|
|
||||||
|
public String getTitle() {
|
||||||
|
return title;
|
||||||
|
}
|
||||||
|
|
||||||
|
public void setTitle(String title) {
|
||||||
|
this.title = title;
|
||||||
|
}
|
||||||
|
|
||||||
|
public String getTitleType() {
|
||||||
|
return titleType;
|
||||||
|
}
|
||||||
|
|
||||||
|
public void setTitleType(String titleType) {
|
||||||
|
this.titleType = titleType;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
@JsonInclude(JsonInclude.Include.NON_NULL)
|
||||||
|
public static class DataciteDate {
|
||||||
|
private String date;
|
||||||
|
private String dateType;
|
||||||
|
|
||||||
|
public String getDate() {
|
||||||
|
return date;
|
||||||
|
}
|
||||||
|
|
||||||
|
public void setDate(String date) {
|
||||||
|
this.date = date;
|
||||||
|
}
|
||||||
|
|
||||||
|
public String getDateType() {
|
||||||
|
return dateType;
|
||||||
|
}
|
||||||
|
|
||||||
|
public void setDateType(String dateType) {
|
||||||
|
this.dateType = dateType;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
@JsonInclude(JsonInclude.Include.NON_NULL)
|
||||||
|
public static class Subject {
|
||||||
|
private String schemeURI;
|
||||||
|
private String value;
|
||||||
|
private String subjectScheme;
|
||||||
|
|
||||||
|
public String getSchemeURI() {
|
||||||
|
return schemeURI;
|
||||||
|
}
|
||||||
|
|
||||||
|
public void setSchemeURI(String schemeURI) {
|
||||||
|
this.schemeURI = schemeURI;
|
||||||
|
}
|
||||||
|
|
||||||
|
public String getValue() {
|
||||||
|
return value;
|
||||||
|
}
|
||||||
|
|
||||||
|
public void setValue(String value) {
|
||||||
|
this.value = value;
|
||||||
|
}
|
||||||
|
|
||||||
|
public String getSubjectScheme() {
|
||||||
|
return subjectScheme;
|
||||||
|
}
|
||||||
|
|
||||||
|
public void setSubjectScheme(String subjectScheme) {
|
||||||
|
this.subjectScheme = subjectScheme;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
public String getId() {
|
||||||
|
return id;
|
||||||
|
}
|
||||||
|
|
||||||
|
public void setId(String id) {
|
||||||
|
this.id = id;
|
||||||
|
}
|
||||||
|
|
||||||
|
public String getDoi() {
|
||||||
|
return doi;
|
||||||
|
}
|
||||||
|
|
||||||
|
public void setDoi(String doi) {
|
||||||
|
this.doi = doi;
|
||||||
|
}
|
||||||
|
|
||||||
|
public Types getTypes() {
|
||||||
|
return types;
|
||||||
|
}
|
||||||
|
|
||||||
|
public void setTypes(Types types) {
|
||||||
|
this.types = types;
|
||||||
|
}
|
||||||
|
|
||||||
|
public List<Creators> getCreators() {
|
||||||
|
return creators;
|
||||||
|
}
|
||||||
|
|
||||||
|
public void setCreators(List<Creators> creators) {
|
||||||
|
this.creators = creators;
|
||||||
|
}
|
||||||
|
|
||||||
|
public String getPublisher() {
|
||||||
|
return publisher;
|
||||||
|
}
|
||||||
|
|
||||||
|
public void setPublisher(String publisher) {
|
||||||
|
this.publisher = publisher;
|
||||||
|
}
|
||||||
|
|
||||||
|
public String getPublicationYear() {
|
||||||
|
return publicationYear;
|
||||||
|
}
|
||||||
|
|
||||||
|
public void setPublicationYear(String publicationYear) {
|
||||||
|
this.publicationYear = publicationYear;
|
||||||
|
}
|
||||||
|
|
||||||
|
public static String getSchemaVersion() {
|
||||||
|
return schemaVersion;
|
||||||
|
}
|
||||||
|
|
||||||
|
public List<RelatedIdentifier> getRelatedIdentifiers() {
|
||||||
|
return relatedIdentifiers;
|
||||||
|
}
|
||||||
|
|
||||||
|
public void setRelatedIdentifiers(List<RelatedIdentifier> relatedIdentifiers) {
|
||||||
|
this.relatedIdentifiers = relatedIdentifiers;
|
||||||
|
}
|
||||||
|
|
||||||
|
public List<AlternateIdentifier> getAlternateIdentifiers() {
|
||||||
|
return alternateIdentifiers;
|
||||||
|
}
|
||||||
|
|
||||||
|
public void setAlternateIdentifiers(List<AlternateIdentifier> alternateIdentifiers) {
|
||||||
|
this.alternateIdentifiers = alternateIdentifiers;
|
||||||
|
}
|
||||||
|
|
||||||
|
public List<Description> getDescriptions() {
|
||||||
|
return descriptions;
|
||||||
|
}
|
||||||
|
|
||||||
|
public void setDescriptions(List<Description> descriptions) {
|
||||||
|
this.descriptions = descriptions;
|
||||||
|
}
|
||||||
|
|
||||||
|
public List<Title> getTitles() {
|
||||||
|
return titles;
|
||||||
|
}
|
||||||
|
|
||||||
|
public void setTitles(List<Title> titles) {
|
||||||
|
this.titles = titles;
|
||||||
|
}
|
||||||
|
|
||||||
|
public List<Identifier> getIdentifiers() {
|
||||||
|
return identifiers;
|
||||||
|
}
|
||||||
|
|
||||||
|
public void setIdentifiers(List<Identifier> identifiers) {
|
||||||
|
this.identifiers = identifiers;
|
||||||
|
}
|
||||||
|
|
||||||
|
public List<DataciteDate> getDates() {
|
||||||
|
return dates;
|
||||||
|
}
|
||||||
|
|
||||||
|
public void setDates(List<DataciteDate> dates) {
|
||||||
|
this.dates = dates;
|
||||||
|
}
|
||||||
|
|
||||||
|
public List<Subject> getSubjects() {
|
||||||
|
return subjects;
|
||||||
|
}
|
||||||
|
|
||||||
|
public void setSubjects(List<Subject> subjects) {
|
||||||
|
this.subjects = subjects;
|
||||||
|
}
|
||||||
|
}
|
|
@ -0,0 +1,35 @@
|
||||||
|
|
||||||
|
package eu.dnetlib.dhp.rdfconverter.utils;
|
||||||
|
|
||||||
|
import java.io.ByteArrayInputStream;
|
||||||
|
import java.io.ByteArrayOutputStream;
|
||||||
|
import java.io.IOException;
|
||||||
|
import java.io.StringWriter;
|
||||||
|
import java.util.zip.GZIPInputStream;
|
||||||
|
import java.util.zip.GZIPOutputStream;
|
||||||
|
|
||||||
|
import org.apache.commons.codec.binary.Base64;
|
||||||
|
import org.apache.commons.io.IOUtils;
|
||||||
|
|
||||||
|
public class CompressorUtil {
|
||||||
|
|
||||||
|
public static String decompressValue(final String abstractCompressed) {
|
||||||
|
try {
|
||||||
|
byte[] byteArray = Base64.decodeBase64(abstractCompressed.getBytes());
|
||||||
|
GZIPInputStream gis = new GZIPInputStream(new ByteArrayInputStream(byteArray));
|
||||||
|
final StringWriter stringWriter = new StringWriter();
|
||||||
|
IOUtils.copy(gis, stringWriter);
|
||||||
|
return stringWriter.toString();
|
||||||
|
} catch (IOException e) {
|
||||||
|
throw new IllegalArgumentException(e);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
public static String compressValue(final String value) throws IOException {
|
||||||
|
ByteArrayOutputStream out = new ByteArrayOutputStream();
|
||||||
|
GZIPOutputStream gzip = new GZIPOutputStream(out);
|
||||||
|
gzip.write(value.getBytes());
|
||||||
|
gzip.close();
|
||||||
|
return java.util.Base64.getEncoder().encodeToString(out.toByteArray());
|
||||||
|
}
|
||||||
|
}
|
|
@ -0,0 +1,43 @@
|
||||||
|
|
||||||
|
package eu.dnetlib.dhp.rdfconverter.utils;
|
||||||
|
|
||||||
|
import java.io.IOException;
|
||||||
|
|
||||||
|
import com.fasterxml.jackson.core.JsonParser;
|
||||||
|
import com.fasterxml.jackson.core.ObjectCodec;
|
||||||
|
import com.fasterxml.jackson.databind.DeserializationContext;
|
||||||
|
import com.fasterxml.jackson.databind.JsonNode;
|
||||||
|
import com.fasterxml.jackson.databind.deser.std.StdDeserializer;
|
||||||
|
|
||||||
|
import eu.dnetlib.dhp.rdfconverter.bioschema.model.BioSchemaProtein;
|
||||||
|
|
||||||
|
public class CustomPropertyValueDeserializer
|
||||||
|
extends StdDeserializer<BioSchemaProtein.Link> {
|
||||||
|
|
||||||
|
public CustomPropertyValueDeserializer() {
|
||||||
|
this(null);
|
||||||
|
}
|
||||||
|
|
||||||
|
public CustomPropertyValueDeserializer(Class<?> vc) {
|
||||||
|
super(vc);
|
||||||
|
}
|
||||||
|
|
||||||
|
@Override
|
||||||
|
public BioSchemaProtein.Link deserialize(
|
||||||
|
JsonParser jsonparser, DeserializationContext context)
|
||||||
|
throws IOException {
|
||||||
|
ObjectCodec oc = jsonparser.getCodec();
|
||||||
|
JsonNode node = oc.readTree(jsonparser);
|
||||||
|
JsonNode id = node.get("@id");
|
||||||
|
if (id != null) {
|
||||||
|
BioSchemaProtein.Link link = new BioSchemaProtein.Link();
|
||||||
|
link.setId(id.asText());
|
||||||
|
return link;
|
||||||
|
} else {
|
||||||
|
String txt = node.asText();
|
||||||
|
BioSchemaProtein.Link link = new BioSchemaProtein.Link();
|
||||||
|
link.setId(txt);
|
||||||
|
return link;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
|
@ -0,0 +1,309 @@
|
||||||
|
|
||||||
|
package eu.dnetlib.dhp.rdfconverter.utils;
|
||||||
|
|
||||||
|
import java.io.IOException;
|
||||||
|
import java.io.StringReader;
|
||||||
|
import java.io.StringWriter;
|
||||||
|
import java.util.*;
|
||||||
|
import java.util.stream.Collectors;
|
||||||
|
|
||||||
|
import org.eclipse.rdf4j.model.Model;
|
||||||
|
import org.eclipse.rdf4j.rio.RDFFormat;
|
||||||
|
import org.eclipse.rdf4j.rio.RDFWriter;
|
||||||
|
import org.eclipse.rdf4j.rio.Rio;
|
||||||
|
import org.slf4j.Logger;
|
||||||
|
import org.slf4j.LoggerFactory;
|
||||||
|
|
||||||
|
import com.fasterxml.jackson.databind.DeserializationFeature;
|
||||||
|
import com.fasterxml.jackson.databind.ObjectMapper;
|
||||||
|
import com.fasterxml.jackson.databind.module.SimpleModule;
|
||||||
|
import com.github.jsonldjava.core.JsonLdOptions;
|
||||||
|
import com.github.jsonldjava.core.JsonLdProcessor;
|
||||||
|
import com.github.jsonldjava.utils.JsonUtils;
|
||||||
|
|
||||||
|
import eu.dnetlib.dhp.rdfconverter.bioschema.model.BioSchemaProtein;
|
||||||
|
import eu.dnetlib.dhp.rdfconverter.bioschema.model.DataciteProtein;
|
||||||
|
|
||||||
|
public class RDFConverter {
|
||||||
|
|
||||||
|
private static final Logger log = LoggerFactory.getLogger(RDFConverter.class);
|
||||||
|
|
||||||
|
public ArrayList<String> nQuadsFile2DataciteJson(String nquads, String profile) throws Exception {
|
||||||
|
if (profile.equals("Protein")) {
|
||||||
|
return nQuadsFile2DataciteJson(nquads);
|
||||||
|
}
|
||||||
|
throw new RuntimeException("Profile not supported");
|
||||||
|
}
|
||||||
|
|
||||||
|
private ArrayList<String> nQuadsFile2DataciteJson(String nquads) throws Exception {
|
||||||
|
StringReader reader = new StringReader(nquads);
|
||||||
|
Model model = Rio.parse(reader, "", RDFFormat.NQUADS);
|
||||||
|
StringWriter jsonLDWriter = new StringWriter();
|
||||||
|
RDFWriter rdfRecordWriter = Rio.createWriter(RDFFormat.JSONLD, jsonLDWriter);
|
||||||
|
Rio.write(model, rdfRecordWriter);
|
||||||
|
String jsonLDBuffer = jsonLDWriter.toString();
|
||||||
|
Object jsonObject = JsonUtils.fromString(jsonLDBuffer);
|
||||||
|
Object compact = JsonLdProcessor.compact(jsonObject, new HashMap<>(), new JsonLdOptions());
|
||||||
|
String compactContent = JsonUtils.toString(compact);
|
||||||
|
log.debug("jsonld: " + compactContent);
|
||||||
|
|
||||||
|
ObjectMapper objectMapper = new ObjectMapper();
|
||||||
|
objectMapper.enable(DeserializationFeature.ACCEPT_SINGLE_VALUE_AS_ARRAY);
|
||||||
|
objectMapper.enable(DeserializationFeature.ACCEPT_EMPTY_STRING_AS_NULL_OBJECT);
|
||||||
|
objectMapper.configure(DeserializationFeature.FAIL_ON_UNKNOWN_PROPERTIES, false);
|
||||||
|
objectMapper.configure(DeserializationFeature.FAIL_ON_INVALID_SUBTYPE, false);
|
||||||
|
objectMapper.configure(DeserializationFeature.FAIL_ON_MISSING_CREATOR_PROPERTIES, false);
|
||||||
|
BioSchemaProtein bioSchemaProtein = objectMapper.readValue(compactContent, BioSchemaProtein.class);
|
||||||
|
BioSchemaProtein.DateTimeType retrievedOnType = bioSchemaProtein.getRetrievedOn();
|
||||||
|
|
||||||
|
List<String> citations = bioSchemaProtein.getEntryList().stream().map(entry -> {
|
||||||
|
if (entry.getCitation() != null) {
|
||||||
|
BioSchemaProtein.Citation citationInfo = entry.getCitation();
|
||||||
|
return citationInfo.getId();
|
||||||
|
}
|
||||||
|
return null;
|
||||||
|
}).filter(id -> id != null).collect(Collectors.toList());
|
||||||
|
|
||||||
|
ArrayList<String> results = new ArrayList<String>();
|
||||||
|
final List<DataciteProtein> dataciteProteins = new ArrayList<>();
|
||||||
|
final Map<String, List<BioSchemaProtein.Link>> sequenceAnnotations = new HashMap<>();
|
||||||
|
final Map<String, String> propertyValues = new HashMap<>();
|
||||||
|
final Map<String, BioSchemaProtein.DefinedTerm> definedTerms = new HashMap<>();
|
||||||
|
final Map<String, BioSchemaProtein.Entry> bioschemaProteins = new HashMap<>();
|
||||||
|
final List<String> mainTitles = new ArrayList<>();
|
||||||
|
|
||||||
|
bioSchemaProtein.getEntryList().stream().forEach(entry -> {
|
||||||
|
|
||||||
|
if (entry.getType() != null
|
||||||
|
&& entry
|
||||||
|
.getType()
|
||||||
|
.equals("https://schema.org/Protein")) {
|
||||||
|
|
||||||
|
DataciteProtein dataciteProtein = new DataciteProtein();
|
||||||
|
|
||||||
|
citations.forEach(citation -> {
|
||||||
|
addRelatedIdentifier(dataciteProtein, citation, "IsCitedBy");
|
||||||
|
});
|
||||||
|
|
||||||
|
DataciteProtein.Types types = new DataciteProtein.Types();
|
||||||
|
types.setResourceType("Protein");
|
||||||
|
types.setResourceTypeGeneral("Dataset");
|
||||||
|
dataciteProtein.setTypes(types);
|
||||||
|
|
||||||
|
DataciteProtein.DataciteDate dataciteDate = new DataciteProtein.DataciteDate();
|
||||||
|
dataciteDate.setDate(retrievedOnType.getValue());
|
||||||
|
dataciteDate.setDateType("Collected");
|
||||||
|
dataciteProtein.getDates().add(dataciteDate);
|
||||||
|
|
||||||
|
DataciteProtein.Identifier identifier = new DataciteProtein.Identifier();
|
||||||
|
identifier.setIdentifier(entry.getId());
|
||||||
|
identifier.setIdentifierType("URL");
|
||||||
|
dataciteProtein.getIdentifiers().add(identifier);
|
||||||
|
|
||||||
|
if (entry.getIdentifier() != null) {
|
||||||
|
addAlternateIdentifier(dataciteProtein, entry.getIdentifier());
|
||||||
|
}
|
||||||
|
|
||||||
|
if (entry.getDescription() != null) {
|
||||||
|
DataciteProtein.Description description = new DataciteProtein.Description();
|
||||||
|
description.setDescription(entry.getDescription());
|
||||||
|
dataciteProtein.getDescriptions().add(description);
|
||||||
|
}
|
||||||
|
|
||||||
|
if (entry.getIsEncodedByBioChemEntity() != null) {
|
||||||
|
addRelatedIdentifier(dataciteProtein, entry.getIsEncodedByBioChemEntity(), "");
|
||||||
|
}
|
||||||
|
|
||||||
|
if (entry.getUrl() != null) {
|
||||||
|
addAlternateIdentifier(dataciteProtein, entry.getUrl());
|
||||||
|
}
|
||||||
|
|
||||||
|
if (entry.getAlternateName() != null) {
|
||||||
|
DataciteProtein.Title title = new DataciteProtein.Title();
|
||||||
|
title.setTitle(entry.getAlternateName());
|
||||||
|
title.setTitleType("AlternativeTitle");
|
||||||
|
dataciteProtein.getTitles().add(title);
|
||||||
|
}
|
||||||
|
|
||||||
|
if (entry.getBioChemInteraction() != null) {
|
||||||
|
entry.getBioChemInteraction().stream().filter(Objects::nonNull).forEach(bc -> {
|
||||||
|
addRelatedIdentifier(dataciteProtein, bc.getId(), "");
|
||||||
|
});
|
||||||
|
}
|
||||||
|
|
||||||
|
if (entry.getBioChemSimilarity() != null) {
|
||||||
|
entry.getBioChemSimilarity().stream().filter(Objects::nonNull).forEach(bc -> {
|
||||||
|
addRelatedIdentifier(dataciteProtein, bc.getId(), "");
|
||||||
|
});
|
||||||
|
}
|
||||||
|
|
||||||
|
if (entry.getHasMolecularFunction() != null) {
|
||||||
|
addRelatedIdentifier(dataciteProtein, entry.getHasMolecularFunction(), "");
|
||||||
|
}
|
||||||
|
|
||||||
|
if (entry.getIsInvolvedInBiologicalProcess() != null) {
|
||||||
|
addRelatedIdentifier(dataciteProtein, entry.getIsInvolvedInBiologicalProcess(), "");
|
||||||
|
}
|
||||||
|
|
||||||
|
if (entry.getIsEncodedByBioChemEntity() != null) {
|
||||||
|
addRelatedIdentifier(dataciteProtein, entry.getIsEncodedByBioChemEntity(), "");
|
||||||
|
}
|
||||||
|
|
||||||
|
if (entry.getIsPartOfBioChemEntity() != null) {
|
||||||
|
addRelatedIdentifier(dataciteProtein, entry.getIsPartOfBioChemEntity().getUrl(), "");
|
||||||
|
}
|
||||||
|
|
||||||
|
if (entry.getSameAs() != null) {
|
||||||
|
entry.getSameAs().stream().filter(Objects::nonNull).forEach(sameAs -> {
|
||||||
|
addRelatedIdentifier(dataciteProtein, sameAs.getId(), "IsIdenticalTo");
|
||||||
|
});
|
||||||
|
}
|
||||||
|
|
||||||
|
if (entry.getAssociatedDisease() != null) {
|
||||||
|
entry.getAssociatedDisease().stream().filter(Objects::nonNull).forEach(ad -> {
|
||||||
|
addRelatedIdentifier(dataciteProtein, ad.getName(), "IsIdenticalTo");
|
||||||
|
});
|
||||||
|
}
|
||||||
|
|
||||||
|
String proteinId = "";
|
||||||
|
try {
|
||||||
|
String[] identifierParts = dataciteProtein.getIdentifiers().get(0).getIdentifier().split("/");
|
||||||
|
proteinId = identifierParts[identifierParts.length - 1];
|
||||||
|
} catch (Exception e) {
|
||||||
|
log.error("Identifier not found", e.getMessage());
|
||||||
|
}
|
||||||
|
|
||||||
|
mainTitles.add(" " + entry.getName() + " ");
|
||||||
|
|
||||||
|
dataciteProtein.setId(proteinId);
|
||||||
|
bioschemaProteins.put(entry.getId(), entry);
|
||||||
|
dataciteProteins.add(dataciteProtein);
|
||||||
|
}
|
||||||
|
if (entry.getType() != null
|
||||||
|
&& entry
|
||||||
|
.getType()
|
||||||
|
.equals("https://schema.org/SequenceAnnotation")) {
|
||||||
|
sequenceAnnotations.put(entry.getId(), entry.getSequenceAnnotation());
|
||||||
|
}
|
||||||
|
if (entry.getType() != null
|
||||||
|
&& entry
|
||||||
|
.getType()
|
||||||
|
.equals("https://schema.org/PropertyValue")) {
|
||||||
|
propertyValues.put(entry.getId(), entry.getPropertyValue().getId());
|
||||||
|
}
|
||||||
|
if (entry.getType() != null
|
||||||
|
&& entry
|
||||||
|
.getType()
|
||||||
|
.equals("https://schema.org/DefinedTerm")) {
|
||||||
|
BioSchemaProtein.DefinedTerm term = new BioSchemaProtein.DefinedTerm();
|
||||||
|
term.setId(entry.getId());
|
||||||
|
term.setTermCode(entry.getTermCode());
|
||||||
|
term.setName(entry.getName());
|
||||||
|
definedTerms.put(term.getId(), term);
|
||||||
|
}
|
||||||
|
if (entry.getType() != null
|
||||||
|
&& entry
|
||||||
|
.getType()
|
||||||
|
.equals("https://schema.org/CollectionPage")) {
|
||||||
|
mainTitles.add(entry.getName());
|
||||||
|
}
|
||||||
|
});
|
||||||
|
bioschemaProteins
|
||||||
|
.entrySet()
|
||||||
|
.stream()
|
||||||
|
.filter(bioProtein -> Objects.nonNull(bioProtein.getValue().getHasSequenceAnnotation()))
|
||||||
|
.forEach(bioProtein -> {
|
||||||
|
List<String> seqAnnIds = bioProtein
|
||||||
|
.getValue()
|
||||||
|
.getHasSequenceAnnotation()
|
||||||
|
.stream()
|
||||||
|
.map(s -> s.getId())
|
||||||
|
.collect(Collectors.toList());
|
||||||
|
List<BioSchemaProtein.Link> propertyIds = sequenceAnnotations
|
||||||
|
.entrySet()
|
||||||
|
.stream()
|
||||||
|
.filter(s -> seqAnnIds.contains(s.getKey()))
|
||||||
|
.flatMap(s -> {
|
||||||
|
return s.getValue().stream();
|
||||||
|
})
|
||||||
|
.collect(Collectors.toList());
|
||||||
|
|
||||||
|
propertyIds
|
||||||
|
.stream()
|
||||||
|
.map(propertyId -> propertyValues.get(propertyId.getId()))
|
||||||
|
.filter(term -> Objects.nonNull(term))
|
||||||
|
.map(term -> definedTerms.get(term))
|
||||||
|
.filter(term -> Objects.nonNull(term))
|
||||||
|
.forEach(term -> {
|
||||||
|
dataciteProteins
|
||||||
|
.stream()
|
||||||
|
.filter(
|
||||||
|
dcProtein -> dcProtein
|
||||||
|
.getIdentifiers()
|
||||||
|
.get(0)
|
||||||
|
.getIdentifier()
|
||||||
|
.equals(bioProtein.getKey()))
|
||||||
|
.filter(dcProtein -> Objects.nonNull(dcProtein))
|
||||||
|
.forEach(d -> {
|
||||||
|
DataciteProtein.Subject subject = new DataciteProtein.Subject();
|
||||||
|
subject.setSchemeURI(term.getId());
|
||||||
|
subject.setValue(term.getName());
|
||||||
|
subject.setSubjectScheme(term.getTermCode());
|
||||||
|
d.getSubjects().add(subject);
|
||||||
|
});
|
||||||
|
});
|
||||||
|
});
|
||||||
|
|
||||||
|
dataciteProteins
|
||||||
|
.stream()
|
||||||
|
.filter(d -> (d.getSubjects() != null && !d.getSubjects().isEmpty()))
|
||||||
|
.forEach(d -> {
|
||||||
|
Map<String, DataciteProtein.Subject> cleanedSubjects = new HashMap<>();
|
||||||
|
d.getSubjects().stream().forEach(s -> {
|
||||||
|
cleanedSubjects.putIfAbsent(s.getValue(), s);
|
||||||
|
});
|
||||||
|
d.getSubjects().clear();
|
||||||
|
d.setSubjects(cleanedSubjects.values().stream().collect(Collectors.toList()));
|
||||||
|
});
|
||||||
|
|
||||||
|
dataciteProteins.forEach(d -> {
|
||||||
|
DataciteProtein.Title title = new DataciteProtein.Title();
|
||||||
|
title.setTitle(d.getId() + " - ".concat(mainTitles.get(0)));
|
||||||
|
d.getTitles().add(title);
|
||||||
|
});
|
||||||
|
|
||||||
|
ObjectMapper mapper = new ObjectMapper();
|
||||||
|
dataciteProteins.forEach(d -> {
|
||||||
|
StringWriter writer = new StringWriter();
|
||||||
|
try {
|
||||||
|
mapper.writeValue(writer, d);
|
||||||
|
} catch (IOException e) {
|
||||||
|
throw new RuntimeException(e);
|
||||||
|
}
|
||||||
|
results.add(writer.toString());
|
||||||
|
});
|
||||||
|
if (dataciteProteins.isEmpty()) {
|
||||||
|
log.error("No Protein data found: " + nquads);
|
||||||
|
}
|
||||||
|
return results;
|
||||||
|
}
|
||||||
|
|
||||||
|
private void addRelatedIdentifier(DataciteProtein DataciteProtein, String relatedIdentifierValue,
|
||||||
|
String relationType) {
|
||||||
|
DataciteProtein.RelatedIdentifier relatedIdentifier = new DataciteProtein.RelatedIdentifier();
|
||||||
|
relatedIdentifier.setRelatedIdentifier(relatedIdentifierValue);
|
||||||
|
if (!relationType.isEmpty()) {
|
||||||
|
relatedIdentifier.setRelationType(relationType);
|
||||||
|
}
|
||||||
|
if (relatedIdentifierValue.contains("http://") || relatedIdentifierValue.contains("https://")) {
|
||||||
|
relatedIdentifier.setRelatedIdentifierType("URL");
|
||||||
|
}
|
||||||
|
DataciteProtein.getRelatedIdentifiers().add(relatedIdentifier);
|
||||||
|
}
|
||||||
|
|
||||||
|
private void addAlternateIdentifier(DataciteProtein DataciteProtein, String alternateIdentifierValue) {
|
||||||
|
DataciteProtein.AlternateIdentifier alternateIdentifier = new DataciteProtein.AlternateIdentifier();
|
||||||
|
alternateIdentifier.setAlternateIdentifier(alternateIdentifierValue);
|
||||||
|
DataciteProtein.getAlternateIdentifiers().add(alternateIdentifier);
|
||||||
|
}
|
||||||
|
}
|
|
@ -0,0 +1,32 @@
|
||||||
|
[
|
||||||
|
{
|
||||||
|
"paramName": "n",
|
||||||
|
"paramLongName": "nameNode",
|
||||||
|
"paramDescription": "the Name Node URI",
|
||||||
|
"paramRequired": true
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"paramName": "w",
|
||||||
|
"paramLongName": "workingPath",
|
||||||
|
"paramDescription": "the working path",
|
||||||
|
"paramRequired": true
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"paramName": "i",
|
||||||
|
"paramLongName": "rdfInput",
|
||||||
|
"paramDescription": "sequence file inside working path that contains rdf records",
|
||||||
|
"paramRequired": true
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"paramName": "o",
|
||||||
|
"paramLongName": "output",
|
||||||
|
"paramDescription": "relative path inside workingpath where bioschema dataset in datacite format will be stored",
|
||||||
|
"paramRequired": true
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"paramName": "p",
|
||||||
|
"paramLongName": "profile",
|
||||||
|
"paramDescription": "the input data profile that has to be used for conversion (https://bioschemas.org/profiles/)",
|
||||||
|
"paramRequired": true
|
||||||
|
}
|
||||||
|
]
|
|
@ -0,0 +1,65 @@
|
||||||
|
<configuration>
|
||||||
|
|
||||||
|
<!-- OCEAN -->
|
||||||
|
|
||||||
|
<!-- <property>-->
|
||||||
|
<!-- <name>jobTracker</name>-->
|
||||||
|
<!-- <value>yarnRM</value>-->
|
||||||
|
<!-- </property>-->
|
||||||
|
<!-- <property>-->
|
||||||
|
<!-- <name>nameNode</name>-->
|
||||||
|
<!-- <value>hdfs://nameservice1</value>-->
|
||||||
|
<!-- </property>-->
|
||||||
|
<!-- <property>-->
|
||||||
|
<!-- <name>hive_metastore_uris</name>-->
|
||||||
|
<!-- <value>thrift://iis-cdh5-test-m3.ocean.icm.edu.pl:9083</value>-->
|
||||||
|
<!-- </property>-->
|
||||||
|
<!-- <property>-->
|
||||||
|
<!-- <name>spark2YarnHistoryServerAddress</name>-->
|
||||||
|
<!-- <value>http://iis-cdh5-test-gw.ocean.icm.edu.pl:18089</value>-->
|
||||||
|
<!-- </property>-->
|
||||||
|
|
||||||
|
|
||||||
|
<!-- GARR -->
|
||||||
|
|
||||||
|
<property>
|
||||||
|
<name>jobTracker</name>
|
||||||
|
<value>hadoop-rm3.garr-pa1.d4science.org:8032</value>
|
||||||
|
</property>
|
||||||
|
<property>
|
||||||
|
<name>nameNode</name>
|
||||||
|
<value>hdfs://hadoop-rm1.garr-pa1.d4science.org:8020</value>
|
||||||
|
</property>
|
||||||
|
<property>
|
||||||
|
<name>hive_metastore_uris</name>
|
||||||
|
<value>thrift://hadoop-edge3.garr-pa1.d4science.org:9083</value>
|
||||||
|
</property>
|
||||||
|
<property>
|
||||||
|
<name>spark2YarnHistoryServerAddress</name>
|
||||||
|
<value>http://hadoop-rm2.garr-pa1.d4science.org:19888</value>
|
||||||
|
</property>
|
||||||
|
<property>
|
||||||
|
<name>oozie.launcher.mapreduce.user.classpath.first</name>
|
||||||
|
<value>true</value>
|
||||||
|
</property>
|
||||||
|
<property>
|
||||||
|
<name>oozie.use.system.libpath</name>
|
||||||
|
<value>true</value>
|
||||||
|
</property>
|
||||||
|
<property>
|
||||||
|
<name>oozie.action.sharelib.for.spark</name>
|
||||||
|
<value>spark2</value>
|
||||||
|
</property>
|
||||||
|
<property>
|
||||||
|
<name>spark2EventLogDir</name>
|
||||||
|
<value>/user/spark/spark2ApplicationHistory</value>
|
||||||
|
</property>
|
||||||
|
<property>
|
||||||
|
<name>spark2ExtraListeners</name>
|
||||||
|
<value>"com.cloudera.spark.lineage.NavigatorAppListener"</value>
|
||||||
|
</property>
|
||||||
|
<property>
|
||||||
|
<name>spark2SqlQueryExecutionListeners</name>
|
||||||
|
<value>"com.cloudera.spark.lineage.NavigatorQueryListener"</value>
|
||||||
|
</property>
|
||||||
|
</configuration>
|
|
@ -0,0 +1,3 @@
|
||||||
|
# Downloads the base64-encoded, gzipped N-Quads dump of a bioschemas datasource
# and copies it to HDFS.
# Usage: download_nquads.sh <datasourceKey>

# Stop at the first failing command so the calling workflow sees the failure
# instead of continuing with a missing or stale input file.
set -e

if [ -z "$1" ]; then
  echo "usage: $0 <datasourceKey>" >&2
  exit 1
fi

tmp_file=/tmp/base64_gzipped_nquads.txt

# Always remove the local temporary file, even when a step fails.
trap 'rm -f "$tmp_file"' EXIT

# The URL is quoted: it contains '?', which the shell would otherwise treat as a glob character.
wget -O "$tmp_file" "https://hadoop-bioschemas-ds.garr-pa1.d4science.org/bioschemas-api/api/getNQuads?datasourceKey=$1"

# -f overwrites the copy left on HDFS by a previous run.
hdfs dfs -copyFromLocal -f "$tmp_file" /data/bioschema/mobidb
|
|
@ -0,0 +1,118 @@
|
||||||
|
<workflow-app name="RdfConverter" xmlns="uri:oozie:workflow:0.5">
|
||||||
|
<parameters>
|
||||||
|
<property>
|
||||||
|
<name>bioschemas_datasource_key</name>
|
||||||
|
<value>mobidb</value>
|
||||||
|
<description>bioschemas datasource key (i.e. mobidb, ped, disprot)</description>
|
||||||
|
</property>
|
||||||
|
<property>
|
||||||
|
<name>workingPath</name>
|
||||||
|
<value>/data/bioschema/mobidb/</value>
|
||||||
|
<description>the working path</description>
|
||||||
|
</property>
|
||||||
|
<property>
|
||||||
|
<name>rdfInput</name>
|
||||||
|
<value>base64_gzipped_nquads.txt</value>
|
||||||
|
<description>rdf output of scraping workflow</description>
|
||||||
|
</property>
|
||||||
|
<property>
|
||||||
|
<name>output</name>
|
||||||
|
<value>json-datacite/</value>
|
||||||
|
</property>
|
||||||
|
<property>
|
||||||
|
<name>profile</name>
|
||||||
|
<value>Protein</value>
|
||||||
|
<description>the input data profile that has to be used for conversion (https://bioschemas.org/profiles/)</description>
|
||||||
|
</property>
|
||||||
|
<property>
|
||||||
|
<name>oozie.launcher.mapreduce.map.java.opts</name>
|
||||||
|
<value>-Xmx4g</value>
|
||||||
|
</property>
|
||||||
|
<property>
|
||||||
|
<name>spark2RdfConversionMaxExecutors</name>
|
||||||
|
<value>50</value>
|
||||||
|
</property>
|
||||||
|
<property>
|
||||||
|
<name>sparkDriverMemory</name>
|
||||||
|
<value>7G</value>
|
||||||
|
<description>memory for driver process</description>
|
||||||
|
</property>
|
||||||
|
<property>
|
||||||
|
<name>sparkExecutorMemory</name>
|
||||||
|
<value>2G</value>
|
||||||
|
<description>memory for individual executor</description>
|
||||||
|
</property>
|
||||||
|
<property>
|
||||||
|
<name>sparkExecutorCores</name>
|
||||||
|
<value>4</value>
|
||||||
|
<description>number of cores used by single executor</description>
|
||||||
|
</property>
|
||||||
|
<property>
|
||||||
|
<name>spark2ExtraListeners</name>
|
||||||
|
<value>com.cloudera.spark.lineage.NavigatorAppListener</value>
|
||||||
|
<description>spark 2.* extra listeners classname</description>
|
||||||
|
</property>
|
||||||
|
<property>
|
||||||
|
<name>spark2YarnHistoryServerAddress</name>
|
||||||
|
<description>spark 2.* yarn history server address</description>
|
||||||
|
</property>
|
||||||
|
<property>
|
||||||
|
<name>spark2EventLogDir</name>
|
||||||
|
<description>spark 2.* event log dir location</description>
|
||||||
|
</property>
|
||||||
|
</parameters>
|
||||||
|
|
||||||
|
<start to="DownloadNQuads"/>
|
||||||
|
<kill name="Kill">
|
||||||
|
<message>Action failed, error message[${wf:errorMessage(wf:lastErrorNode())}]</message>
|
||||||
|
</kill>
|
||||||
|
|
||||||
|
<action name="DownloadNQuads">
|
||||||
|
<shell xmlns="uri:oozie:shell-action:0.1">
|
||||||
|
<job-tracker>${jobTracker}</job-tracker>
|
||||||
|
<name-node>${nameNode}</name-node>
|
||||||
|
<exec>download_nquads.sh</exec>
|
||||||
|
<argument>${bioschemas_datasource_key}</argument>
|
||||||
|
<file>download_nquads.sh</file>
|
||||||
|
<capture-output/>
|
||||||
|
</shell>
|
||||||
|
<ok to="ResetWorkingPath"/>
|
||||||
|
<error to="Kill"/>
|
||||||
|
</action>
|
||||||
|
|
||||||
|
<action name="ResetWorkingPath">
|
||||||
|
<fs>
|
||||||
|
<delete path='${workingPath}${output}'/>
|
||||||
|
</fs>
|
||||||
|
<ok to="NquadsToDataciteJson"/>
|
||||||
|
<error to="Kill"/>
|
||||||
|
</action>
|
||||||
|
|
||||||
|
<action name="NquadsToDataciteJson">
|
||||||
|
<spark xmlns="uri:oozie:spark-action:0.2">
|
||||||
|
<master>yarn-cluster</master>
|
||||||
|
<mode>cluster</mode>
|
||||||
|
<name>NquadsToDataciteJson</name>
|
||||||
|
<class>eu.dnetlib.dhp.rdfconverter.bioschema.SparkRdfToDatacite</class>
|
||||||
|
<jar>dhp-rdfconverter-${projectVersion}.jar</jar>
|
||||||
|
<spark-opts>
|
||||||
|
--executor-cores=${sparkExecutorCores}
|
||||||
|
--driver-memory=${sparkDriverMemory}
|
||||||
|
--executor-memory=${sparkExecutorMemory}
|
||||||
|
--driver-memory=${sparkDriverMemory}
|
||||||
|
--conf spark.extraListeners=${spark2ExtraListeners}
|
||||||
|
--conf spark.yarn.historyServer.address=${spark2YarnHistoryServerAddress}
|
||||||
|
--conf spark.eventLog.dir=${nameNode}${spark2EventLogDir}
|
||||||
|
</spark-opts>
|
||||||
|
<arg>--nameNode</arg><arg>${nameNode}</arg>
|
||||||
|
<arg>--workingPath</arg><arg>${workingPath}</arg>
|
||||||
|
<arg>--rdfInput</arg><arg>${rdfInput}</arg>
|
||||||
|
<arg>--output</arg><arg>${output}</arg>
|
||||||
|
<arg>--profile</arg><arg>${profile}</arg>
|
||||||
|
</spark>
|
||||||
|
<ok to="End"/>
|
||||||
|
<error to="Kill"/>
|
||||||
|
</action>
|
||||||
|
|
||||||
|
<end name="End"/>
|
||||||
|
</workflow-app>
|
|
@ -0,0 +1,9 @@
|
||||||
|
# Set root logger level to INFO and its only appender to A1.
|
||||||
|
log4j.rootLogger=INFO, A1
|
||||||
|
|
||||||
|
# A1 is set to be a ConsoleAppender.
|
||||||
|
log4j.appender.A1=org.apache.log4j.ConsoleAppender
|
||||||
|
|
||||||
|
# A1 uses PatternLayout.
|
||||||
|
log4j.appender.A1.layout=org.apache.log4j.PatternLayout
|
||||||
|
log4j.appender.A1.layout.ConversionPattern=%-4r [%t] %-5p %c %x - %m%n
|
|
@ -0,0 +1,64 @@
|
||||||
|
|
||||||
|
package eu.dnetlib.dhp.rdfconverter.bioschema;
|
||||||
|
|
||||||
|
import java.io.InputStream;
|
||||||
|
import java.util.ArrayList;
|
||||||
|
|
||||||
|
import org.apache.commons.io.IOUtils;
|
||||||
|
import org.junit.jupiter.api.Test;
|
||||||
|
import org.slf4j.Logger;
|
||||||
|
import org.slf4j.LoggerFactory;
|
||||||
|
|
||||||
|
import eu.dnetlib.dhp.rdfconverter.utils.CompressorUtil;
|
||||||
|
import eu.dnetlib.dhp.rdfconverter.utils.RDFConverter;
|
||||||
|
|
||||||
|
public class ConverterTest {
|
||||||
|
|
||||||
|
static Logger logger = LoggerFactory.getLogger(ConverterTest.class);
|
||||||
|
|
||||||
|
@Test
|
||||||
|
public void disprotToDataciteTest() throws Exception {
|
||||||
|
InputStream is = ConverterTest.class.getResourceAsStream("/eu/dnetlib/dhp/rdfconverter/bioschema/disprot.nq");
|
||||||
|
String nq = IOUtils.toString(is);
|
||||||
|
RDFConverter converter = new RDFConverter();
|
||||||
|
ArrayList<String> results = converter.nQuadsFile2DataciteJson(nq, "Protein");
|
||||||
|
results.stream().forEach(r -> {
|
||||||
|
logger.info("JSON DATACITE >> " + r);
|
||||||
|
});
|
||||||
|
}
|
||||||
|
|
||||||
|
@Test
|
||||||
|
public void pedCitationTest() throws Exception {
|
||||||
|
InputStream is = ConverterTest.class.getResourceAsStream("/eu/dnetlib/dhp/rdfconverter/bioschema/ped.nq");
|
||||||
|
String nq = IOUtils.toString(is);
|
||||||
|
RDFConverter converter = new RDFConverter();
|
||||||
|
ArrayList<String> results = converter.nQuadsFile2DataciteJson(nq, "Protein");
|
||||||
|
results.stream().forEach(r -> {
|
||||||
|
logger.info("JSON DATACITE >> " + r);
|
||||||
|
});
|
||||||
|
}
|
||||||
|
|
||||||
|
@Test
|
||||||
|
public void mobidbToDataciteTest() throws Exception {
|
||||||
|
InputStream is = ConverterTest.class.getResourceAsStream("/eu/dnetlib/dhp/rdfconverter/bioschema/mobidb.nq");
|
||||||
|
String nq = IOUtils.toString(is);
|
||||||
|
RDFConverter converter = new RDFConverter();
|
||||||
|
ArrayList<String> results = converter.nQuadsFile2DataciteJson(nq, "Protein");
|
||||||
|
results.stream().forEach(r -> {
|
||||||
|
logger.info("JSON DATACITE >> " + r);
|
||||||
|
});
|
||||||
|
}
|
||||||
|
|
||||||
|
@Test
|
||||||
|
public void decompressTest() throws Exception {
|
||||||
|
InputStream is = ConverterTest.class
|
||||||
|
.getResourceAsStream("/eu/dnetlib/dhp/rdfconverter/bioschema/base64_gzipped_nquads.txt");
|
||||||
|
String base64_gzipped_nquads = IOUtils.toString(is);
|
||||||
|
String nq = CompressorUtil.decompressValue(base64_gzipped_nquads);
|
||||||
|
RDFConverter converter = new RDFConverter();
|
||||||
|
ArrayList<String> results = converter.nQuadsFile2DataciteJson(nq, "Protein");
|
||||||
|
results.stream().forEach(r -> {
|
||||||
|
logger.info("JSON DATACITE >> " + r);
|
||||||
|
});
|
||||||
|
}
|
||||||
|
}
|
|
@ -0,0 +1 @@
|
||||||
|
H4sIAAAAAAAAANVY23KjOBB9369wOc+2uNhJ7EqlipiLVQgGkBbGL7OFQbZVayMv4Hj89yOMk2GSSc3O+FLJG0Kt0+d0S92Cu0VZroshAFPGi2RBV3HR5fkcJHm8XYJHGaz4lKVT4Em9a1UGiqQoUk9WgXTfuquWipXrTb7cr1nHjyCnZc7oI03NnK8ONhV8DbM3q6HuW92/7s7l/FN232pX5h2p15FVIitDRR325faXL08Lt9ttd6vulyqSJIPPDsJ7CldpXFLCVvQcDJOcCvQ0YuWiEZy5GG6m3YSvwDjq4Igi8OD8jQ0haEnjghagjOdA6va7yg+kGkH1ZUW9bXhtyJMHgwGQFCCikaezTrHLyvhrJyuuyt2aNljU+uoU5bykLGtM/r7+/8fzOTppAkqarwqQ8GzGxQPhb7tf53zGliIuB6IiNrLcCQxkaNg4N+sXsVrExQPjHl/uVjTH9L8NzRIR1rbj6tD2EYpcy0BuiEIMdQ+byLEt7AUG1EIUwCAUj2SCQnfieAhGrg1tYYNN3UNEx4Y9MSPTGLs28aAXuRMvtEJk6iOkWTbWiEkINg3XD209RMQUgGMUOpaOkecRCD2oYWwTXzNsATP2I9sPRyZEriVea9DBCIeuoQVi1sIhJIFr+roJDYgFD4xx4AVjKGhBn+CAYIuYAcS+QMYOsULXI8jWoWHpEOmhbVjQtVw9dEI48i0B4kVjB6GJjibYRoGQZJloAgkKPWhblm4LbgZqXzZZLKVZyWaM5iJDT/PfX9aea6xhjXNpglmy3KQ0hZkel+Lolw2eDYgr4UXqSIMLs8viqiy2tU3J14t4vmut6/PX6l+YSCGIaMWLMrLJWMVnb3B4fg1yCXaivvKMr1gSxNmcHuH8ddsEfeXmWr3t9W5OpekPSuvR/WVUtUH2SCOe/3smHaeI7dE6dTpjGU2JaGzvWOarEtSgjasKdErn8uCmr6rXN/3bjxORX1abw4HfgX5/oAyUD6rsZ73wSdnwQyt7vmhO+ZJN8zjf7W3EELijB0gqkf98NIXVdXnE06oh19RP1YPPT13k4kVmhE+elXzJ54fUHAZ1frTPn9z3d7ZelbJT9ovjCu/Zpf78Ylglq7UvGe9oL/6K+/fNeHC45nkZv7klmbgbPW/KM1wsn36PvP2FXLJyuf/CFIv0hyMj/Q0PBaE5ARIAAA==
|
|
@ -0,0 +1,52 @@
|
||||||
|
<https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> <http://purl.org/pav/retrievedFrom> <https://disprot.org/DP01454> .
|
||||||
|
<https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> <http://purl.org/pav/retrievedOn> "2021-11-25T12:23:57"^^<http://www.w3.org/2001/XMLSchema#dateTime> .
|
||||||
|
<https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> <http://purl.org/pav/createdWith> <https://github.com/HW-SWeL/BMUSE/releases/tag/0.5.2> .
|
||||||
|
<https://disprot.org/DP01454> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/Protein> <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> .
|
||||||
|
<https://disprot.org/DP01454> <http://purl.org/dc/terms/conformsTo> <https://bioschemas.org/profiles/Protein/0.11-RELEASE> <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> .
|
||||||
|
<https://disprot.org/DP01454> <https://schema.org/hasBioPolymerSequence> "MSTLFPSLFPRVTETLWFNLDRPCVEETELQQQEQQHQAWLQSIAEKDNNLVPIGKPASEHYDDEEEEDDEDDEDSEEDSEDDEDMQDMDEMNDYNESPDDGEVNEVDMEGNEQDQDQWMI" <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> .
|
||||||
|
<https://disprot.org/DP01454> <https://schema.org/hasSequenceAnnotation> <https://disprot.org/DP01454#disorder-content> <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> .
|
||||||
|
<https://disprot.org/DP01454> <https://schema.org/hasSequenceAnnotation> <https://disprot.org/DP01454r001> <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> .
|
||||||
|
<https://disprot.org/DP01454> <https://schema.org/identifier> "https://identifiers.org/disprot:DP01454" <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> .
|
||||||
|
<https://disprot.org/DP01454> <https://schema.org/includedInDataset> "https://disprot.org/#2021-08" <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> .
|
||||||
|
<https://disprot.org/DP01454> <https://schema.org/name> "Anaphase-promoting complex subunit 15" <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> .
|
||||||
|
<https://disprot.org/DP01454> <https://schema.org/sameAs> <http://purl.uniprot.org/uniprot/P60006> <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> .
|
||||||
|
<https://disprot.org/DP01454> <https://schema.org/taxonomicRange> <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0/disprot.org/DP01454/200140588> <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> .
|
||||||
|
<https://bioschemas.org/profiles/Protein/0.11-RELEASE> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/CreativeWork> <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> .
|
||||||
|
<https://disprot.org/DP01454#disorder-content> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/SequenceAnnotation> <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> .
|
||||||
|
<https://disprot.org/DP01454#disorder-content> <https://schema.org/additionalProperty> <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0/disprot.org/DP01454/159543474> <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> .
|
||||||
|
<https://disprot.org/DP01454#disorder-content> <https://schema.org/sequenceLocation> <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0/disprot.org/DP01454/77094838> <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> .
|
||||||
|
<https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0/disprot.org/DP01454/159543474> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/PropertyValue> <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> .
|
||||||
|
<https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0/disprot.org/DP01454/159543474> <https://schema.org/name> "Protein disorder content" <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> .
|
||||||
|
<https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0/disprot.org/DP01454/159543474> <https://schema.org/propertyID> <https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00499> <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> .
|
||||||
|
<https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0/disprot.org/DP01454/159543474> <https://schema.org/value> "5.371900826446281E-1" <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> .
|
||||||
|
<https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0/disprot.org/DP01454/77094838> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/SequenceRange> <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> .
|
||||||
|
<https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0/disprot.org/DP01454/77094838> <https://schema.org/rangeEnd> "121" <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> .
|
||||||
|
<https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0/disprot.org/DP01454/77094838> <https://schema.org/rangeStart> "1" <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> .
|
||||||
|
<https://disprot.org/DP01454r001> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/SequenceAnnotation> <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> .
|
||||||
|
<https://disprot.org/DP01454r001> <https://schema.org/additionalProperty> <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0/disprot.org/DP01454/1595402293> <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> .
|
||||||
|
<https://disprot.org/DP01454r001> <https://schema.org/sequenceLocation> <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0/disprot.org/DP01454/1951282934> <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> .
|
||||||
|
<https://disprot.org/DP01454r001> <https://schema.org/subjectOf> <https://identifiers.org/pubmed:26083744> <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> .
|
||||||
|
<https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0/disprot.org/DP01454/1595402293> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/PropertyValue> <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> .
|
||||||
|
<https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0/disprot.org/DP01454/1595402293> <https://schema.org/name> "Term" <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> .
|
||||||
|
<https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0/disprot.org/DP01454/1595402293> <https://schema.org/value> <https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00076> <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> .
|
||||||
|
<https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00076> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/DefinedTerm> <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> .
|
||||||
|
<https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00076> <https://schema.org/inDefinedTermSet> <https://disprot.org/assets/data/IDPO_v0.2.owl> <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> .
|
||||||
|
<https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00076> <https://schema.org/name> "disorder" <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> .
|
||||||
|
<https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00076> <https://schema.org/termCode> "IDPO:00076" <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> .
|
||||||
|
<https://disprot.org/assets/data/IDPO_v0.2.owl> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/DefinedTermSet> <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> .
|
||||||
|
<https://disprot.org/assets/data/IDPO_v0.2.owl> <https://schema.org/name> "IDP ontology" <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> .
|
||||||
|
<https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0/disprot.org/DP01454/1951282934> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/SequenceRange> <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> .
|
||||||
|
<https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0/disprot.org/DP01454/1951282934> <https://schema.org/rangeEnd> "121" <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> .
|
||||||
|
<https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0/disprot.org/DP01454/1951282934> <https://schema.org/rangeStart> "57" <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> .
|
||||||
|
<https://identifiers.org/pubmed:26083744> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/ScholarlyArticle> <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> .
|
||||||
|
<https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0/disprot.org/DP01454/200140588> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/DefinedTerm> <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> .
|
||||||
|
<https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0/disprot.org/DP01454/200140588> <https://schema.org/inDefinedTermSet> <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0/disprot.org/DP01454/827138196> <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> .
|
||||||
|
<https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0/disprot.org/DP01454/200140588> <https://schema.org/sameAs> <http://purl.uniprot.org/taxonomy/9606> <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> .
|
||||||
|
<https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0/disprot.org/DP01454/200140588> <https://schema.org/sameAs> <https://identifiers.org/taxonomy:9606> <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> .
|
||||||
|
<https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0/disprot.org/DP01454/200140588> <https://schema.org/sameAs> <http://purl.obolibrary.org/obo/NCBITaxon_9606> <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> .
|
||||||
|
<https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0/disprot.org/DP01454/200140588> <https://schema.org/termCode> "9606" <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> .
|
||||||
|
<https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0/disprot.org/DP01454/200140588> <https://schema.org/url> <http://purl.bioontology.org/ontology/NCBITAXON/9606> <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> .
|
||||||
|
<https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0/disprot.org/DP01454/827138196> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/DefinedTermSet> <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> .
|
||||||
|
<https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0/disprot.org/DP01454/827138196> <https://schema.org/name> "NCBI taxon" <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> .
|
||||||
|
<https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0/disprot.org/DP01454/827138196> <https://schema.org/url> <https://bioportal.bioontology.org/ontologies/NCBITAXON> <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> .
|
||||||
|
<https://disprot.org/DP01454> <http://purl.org/dc/terms/title> "DisProt" <https://bioschemas.org/crawl/v1/disprot/DP01454/20211125/0> .
|
|
@ -0,0 +1,118 @@
|
||||||
|
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> <http://purl.org/pav/retrievedFrom> <https://mobidb.org/Q9UPN6> .
|
||||||
|
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> <http://purl.org/pav/retrievedOn> "2021-12-06T14:49:15"^^<http://www.w3.org/2001/XMLSchema#dateTime> .
|
||||||
|
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> <http://purl.org/pav/createdWith> <https://github.com/HW-SWeL/BMUSE/releases/tag/0.5.2> .
|
||||||
|
<https://mobidb.org/Q9UPN6> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/Protein> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://mobidb.org/Q9UPN6> <http://purl.org/dc/terms/conformsTo> <https://bioschemas.org/profiles/Protein/0.11-RELEASE> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://mobidb.org/Q9UPN6> <https://schema.org/hasBioPolymerSequence> "MEAVKTFNSELYSLNDYKPPISKAKMTQITKAAIKAIKFYKHVVQSVEKFIQKCKPEYKVPGLYVIDSIVRQSRHQFGQEKDVFAPRFSNNIISTFQNLYRCPGDDKSKIVRVLNLWQKNNVFKSEIIQPLLDMAAGIPPPVVTPVLASTTTAMSNTPGTPVTPVTPANVVQGLPDPWVSQITNTDTLAAVAQILQSPQGQQLQQLIQTLQIQQQKPQPSILQALDAGLVVQLQALTAQLTAAAAAANTLTPLEQGVSFNKKLMDRFDFGEDSEHSEEPKKEIPASQLSHVSESVNNSIFHQIAEQLQQQNLEHLRQQLLEQQQPQKATPQDSQEGTFGSEHSASPSQGSSQQHFLEPEVNLDDSIDIQQQDMDIDEGQDGVEEEVFEQEAKKVAVRSRSRTHSRSRSRSPRKRRSRSRSGSRKRKHRKRSRSRSRERKRKSSRSYSSERRAREREKERQKKGLPPIRSKTLSVCSTTLWVGQVDKKATQQDLTNLFEEFGQIESINMIPPRGCAYVCMVHRQDAFRALQKLSSGSYKIGSKVIKIAWALNKGVKTEYKQFWDVDLGVTYIPWEKVKVDDLEGFAEGGMIDQETVNTEWETVKSSEPVKETVQTTQSPTPVEKETVVTTQAEVFPPPVAMLQIPVAPAVPTVSLVPPAFPVSMPVPPPGFSPIPPPPFLRASFNPSQPPPGFMPPPVPPPVVPPPTIPPVVPTSLVQPSLSMTPETVKDVGFGSLVIPGGSVASNLATSALPAGNVFNAPTKQAEPEEKVPHLIDHQISSGENTRSVIPNDISSNAAILGGQPPNVTSNSGILGVQRPNVSSNSEILGVRPSNVSSSSGIIAAQPPNILNNSGILGIQPPSVSNSSGLLGVLPPNIPNNSGLVGVQPPNVPNTPGLLGTQPPAGPQNLPPLSIPNQRMPTMPMLDIRPGLIPQAPGPRFPLIQPGIPPQRGIPPPSVLDSALHPPPRGPFPPGDIFSQPERPFLAPGRQSVDNVTNPEKRIPLGNDNIQQEGDRDYRFPPIETRESISRPPPVDVRDVVGRPIDPREGPGRPPLDGRDHFGRPPVDIRENLVRPGIDHLGRRDHFGFNPEKPWGHRGDFDEREHRVLPVYGGPKGLHEERGRFRSGNYRFDPRSGPWNRGFGQEVHRDFDDRRRPWERQRDRDDRDFDFCREMNGNRLGRDRIQNTWVPPPHARVFDYFEGATSQRKGDNVPQVNGENTERHAQPPPIPVQNDPELYEKLTSSNEINKEKSDTVADIESEPVVESTETEGT" <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://mobidb.org/Q9UPN6> <https://schema.org/hasSequenceAnnotation> <https://mobidb.org/Q9UPN6#prediction-disorder-content-mobidb_lite> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://mobidb.org/Q9UPN6> <https://schema.org/hasSequenceAnnotation> <https://mobidb.org/Q9UPN6#prediction-disorder-mobidb_lite.270_289> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://mobidb.org/Q9UPN6> <https://schema.org/hasSequenceAnnotation> <https://mobidb.org/Q9UPN6#prediction-disorder-mobidb_lite.322_354> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://mobidb.org/Q9UPN6> <https://schema.org/hasSequenceAnnotation> <https://mobidb.org/Q9UPN6#prediction-disorder-mobidb_lite.384_468> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://mobidb.org/Q9UPN6> <https://schema.org/hasSequenceAnnotation> <https://mobidb.org/Q9UPN6#prediction-disorder-mobidb_lite.808_827> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://mobidb.org/Q9UPN6> <https://schema.org/hasSequenceAnnotation> <https://mobidb.org/Q9UPN6#prediction-disorder-mobidb_lite.899_918> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://mobidb.org/Q9UPN6> <https://schema.org/hasSequenceAnnotation> <https://mobidb.org/Q9UPN6#prediction-disorder-mobidb_lite.945_1064> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://mobidb.org/Q9UPN6> <https://schema.org/hasSequenceAnnotation> <https://mobidb.org/Q9UPN6#prediction-disorder-mobidb_lite.1198_1271> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://mobidb.org/Q9UPN6> <https://schema.org/identifier> "https://identifiers.org/mobidb:Q9UPN6" <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://mobidb.org/Q9UPN6> <https://schema.org/includedInDataset> "https://mobidb.org/#2020-09" <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://mobidb.org/Q9UPN6> <https://schema.org/name> "SR-related and CTD-associated factor 8" <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://mobidb.org/Q9UPN6> <https://schema.org/sameAs> <http://purl.uniprot.org/uniprot/Q9UPN6> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://mobidb.org/Q9UPN6> <https://schema.org/taxonomicRange> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/1444334161> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://bioschemas.org/profiles/Protein/0.11-RELEASE> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/CreativeWork> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://mobidb.org/Q9UPN6#prediction-disorder-content-mobidb_lite> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/SequenceAnnotation> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://mobidb.org/Q9UPN6#prediction-disorder-content-mobidb_lite> <https://schema.org/additionalProperty> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/1018653369> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://mobidb.org/Q9UPN6#prediction-disorder-content-mobidb_lite> <https://schema.org/description> "Protein disorder content predicted by MobiDB-lite" <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://mobidb.org/Q9UPN6#prediction-disorder-content-mobidb_lite> <https://schema.org/sequenceLocation> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/1799426988> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/1018653369> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/PropertyValue> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/1018653369> <https://schema.org/name> "Protein disorder content" <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/1018653369> <https://schema.org/propertyID> <https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00499> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/1018653369> <https://schema.org/value> "2.93E-1" <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/1799426988> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/SequenceRange> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/1799426988> <https://schema.org/rangeEnd> "1271" <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/1799426988> <https://schema.org/rangeStart> "1" <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://mobidb.org/Q9UPN6#prediction-disorder-mobidb_lite.270_289> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/SequenceAnnotation> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://mobidb.org/Q9UPN6#prediction-disorder-mobidb_lite.270_289> <https://schema.org/additionalProperty> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/1828683> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://mobidb.org/Q9UPN6#prediction-disorder-mobidb_lite.270_289> <https://schema.org/description> "Protein disordered region predicted by MobiDB-lite" <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://mobidb.org/Q9UPN6#prediction-disorder-mobidb_lite.270_289> <https://schema.org/sequenceLocation> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/432948463> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/1828683> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/PropertyValue> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/1828683> <https://schema.org/name> "Term" <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/1828683> <https://schema.org/value> <https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00076> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00076> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/DefinedTerm> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00076> <https://schema.org/inDefinedTermSet> <https://disprot.org/assets/data/IDPO_v0.2.owl> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00076> <https://schema.org/name> "Disorder" <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00076> <https://schema.org/termCode> "IDPO:00076" <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://disprot.org/assets/data/IDPO_v0.2.owl> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/DefinedTermSet> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://disprot.org/assets/data/IDPO_v0.2.owl> <https://schema.org/name> "IDP ontology" <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/432948463> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/SequenceRange> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/432948463> <https://schema.org/rangeEnd> "289" <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/432948463> <https://schema.org/rangeStart> "270" <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://mobidb.org/Q9UPN6#prediction-disorder-mobidb_lite.322_354> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/SequenceAnnotation> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://mobidb.org/Q9UPN6#prediction-disorder-mobidb_lite.322_354> <https://schema.org/additionalProperty> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/75870383> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://mobidb.org/Q9UPN6#prediction-disorder-mobidb_lite.322_354> <https://schema.org/description> "Protein disordered region predicted by MobiDB-lite" <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://mobidb.org/Q9UPN6#prediction-disorder-mobidb_lite.322_354> <https://schema.org/sequenceLocation> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/985831280> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/75870383> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/PropertyValue> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/75870383> <https://schema.org/name> "Term" <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/75870383> <https://schema.org/value> <https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00076> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/985831280> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/SequenceRange> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/985831280> <https://schema.org/rangeEnd> "354" <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/985831280> <https://schema.org/rangeStart> "322" <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://mobidb.org/Q9UPN6#prediction-disorder-mobidb_lite.384_468> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/SequenceAnnotation> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://mobidb.org/Q9UPN6#prediction-disorder-mobidb_lite.384_468> <https://schema.org/additionalProperty> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/2027294569> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://mobidb.org/Q9UPN6#prediction-disorder-mobidb_lite.384_468> <https://schema.org/description> "Protein disordered region predicted by MobiDB-lite" <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://mobidb.org/Q9UPN6#prediction-disorder-mobidb_lite.384_468> <https://schema.org/sequenceLocation> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/1332124339> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/2027294569> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/PropertyValue> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/2027294569> <https://schema.org/name> "Term" <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/2027294569> <https://schema.org/value> <https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00076> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/1332124339> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/SequenceRange> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/1332124339> <https://schema.org/rangeEnd> "468" <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/1332124339> <https://schema.org/rangeStart> "384" <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://mobidb.org/Q9UPN6#prediction-disorder-mobidb_lite.808_827> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/SequenceAnnotation> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://mobidb.org/Q9UPN6#prediction-disorder-mobidb_lite.808_827> <https://schema.org/additionalProperty> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/1437016135> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://mobidb.org/Q9UPN6#prediction-disorder-mobidb_lite.808_827> <https://schema.org/description> "Protein disordered region predicted by MobiDB-lite" <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://mobidb.org/Q9UPN6#prediction-disorder-mobidb_lite.808_827> <https://schema.org/sequenceLocation> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/839471977> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/1437016135> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/PropertyValue> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/1437016135> <https://schema.org/name> "Term" <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/1437016135> <https://schema.org/value> <https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00076> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/839471977> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/SequenceRange> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/839471977> <https://schema.org/rangeEnd> "827" <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/839471977> <https://schema.org/rangeStart> "808" <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://mobidb.org/Q9UPN6#prediction-disorder-mobidb_lite.899_918> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/SequenceAnnotation> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://mobidb.org/Q9UPN6#prediction-disorder-mobidb_lite.899_918> <https://schema.org/additionalProperty> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/144111614> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://mobidb.org/Q9UPN6#prediction-disorder-mobidb_lite.899_918> <https://schema.org/description> "Protein disordered region predicted by MobiDB-lite" <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://mobidb.org/Q9UPN6#prediction-disorder-mobidb_lite.899_918> <https://schema.org/sequenceLocation> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/781835543> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/144111614> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/PropertyValue> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/144111614> <https://schema.org/name> "Term" <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/144111614> <https://schema.org/value> <https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00076> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/781835543> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/SequenceRange> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/781835543> <https://schema.org/rangeEnd> "918" <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/781835543> <https://schema.org/rangeStart> "899" <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://mobidb.org/Q9UPN6#prediction-disorder-mobidb_lite.945_1064> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/SequenceAnnotation> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://mobidb.org/Q9UPN6#prediction-disorder-mobidb_lite.945_1064> <https://schema.org/additionalProperty> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/902536730> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://mobidb.org/Q9UPN6#prediction-disorder-mobidb_lite.945_1064> <https://schema.org/description> "Protein disordered region predicted by MobiDB-lite" <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://mobidb.org/Q9UPN6#prediction-disorder-mobidb_lite.945_1064> <https://schema.org/sequenceLocation> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/518954157> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/902536730> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/PropertyValue> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/902536730> <https://schema.org/name> "Term" <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/902536730> <https://schema.org/value> <https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00076> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/518954157> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/SequenceRange> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/518954157> <https://schema.org/rangeEnd> "1064" <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/518954157> <https://schema.org/rangeStart> "945" <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://mobidb.org/Q9UPN6#prediction-disorder-mobidb_lite.1198_1271> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/SequenceAnnotation> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://mobidb.org/Q9UPN6#prediction-disorder-mobidb_lite.1198_1271> <https://schema.org/additionalProperty> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/322445788> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://mobidb.org/Q9UPN6#prediction-disorder-mobidb_lite.1198_1271> <https://schema.org/description> "Protein disordered region predicted by MobiDB-lite" <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://mobidb.org/Q9UPN6#prediction-disorder-mobidb_lite.1198_1271> <https://schema.org/sequenceLocation> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/5118922> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/322445788> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/PropertyValue> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/322445788> <https://schema.org/name> "Term" <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/322445788> <https://schema.org/value> <https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00076> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/5118922> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/SequenceRange> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/5118922> <https://schema.org/rangeEnd> "1271" <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/5118922> <https://schema.org/rangeStart> "1198" <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/1444334161> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/DefinedTerm> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/1444334161> <https://schema.org/inDefinedTermSet> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/569363713> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/1444334161> <https://schema.org/sameAs> <http://purl.uniprot.org/taxonomy/9606> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/1444334161> <https://schema.org/sameAs> <https://identifiers.org/taxonomy:9606> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/1444334161> <https://schema.org/sameAs> <http://purl.obolibrary.org/obo/NCBITaxon_9606> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/1444334161> <https://schema.org/termCode> "9606" <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/1444334161> <https://schema.org/url> <http://purl.bioontology.org/ontology/NCBITAXON/9606> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/569363713> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/DefinedTermSet> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/569363713> <https://schema.org/name> "NCBI taxon" <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0/mobidb.org/Q9UPN6/569363713> <https://schema.org/url> <https://bioportal.bioontology.org/ontologies/NCBITAXON> <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
||||||
|
<https://mobidb.org/Q9UPN6> <http://purl.org/dc/terms/title> "MobiDB" <https://bioschemas.org/crawl/v1/mobidb/Q9UPN6/20211206/0> .
|
|
@ -0,0 +1,229 @@
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> <http://purl.org/pav/retrievedFrom> <https://proteinensemble.org/PED00014> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> <http://purl.org/pav/retrievedOn> "2021-12-06T11:52:22"^^<http://www.w3.org/2001/XMLSchema#dateTime> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> <http://purl.org/pav/createdWith> <https://github.com/HW-SWeL/BMUSE/releases/tag/0.5.2> .
|
||||||
|
<https://proteinensemble.org/PED00014> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/CollectionPage> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://proteinensemble.org/PED00014> <https://schema.org/citation> <https://identifiers.org/pubmed:20399186> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://proteinensemble.org/PED00014> <https://schema.org/identifier> "https://identifiers.org/ped:PED00014" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://proteinensemble.org/PED00014> <https://schema.org/includedInDataset> "https://proteinensemble.org/#2021-02-12" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://proteinensemble.org/PED00014> <https://schema.org/mainEntity> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/23786852> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://proteinensemble.org/PED00014> <https://schema.org/name> "Structural ensemble of pSic1 (1-90) phosphorylated at Thr5, Thr33, Thr45, Ser69, Ser76 and Ser80, in complex with SKP1 (4-186) and CDC4 (270-744)" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://identifiers.org/pubmed:20399186> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/ScholarlyArticle> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/23786852> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/ItemList> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/23786852> <https://schema.org/itemListElement> <https://proteinensemble.org/PED00014#P07834_D_0> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/23786852> <https://schema.org/itemListElement> <https://proteinensemble.org/PED00014#P52286_C_0> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/23786852> <https://schema.org/itemListElement> <https://proteinensemble.org/PED00014#P38634_A_1> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/23786852> <https://schema.org/numberOfItems> "3" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://proteinensemble.org/PED00014#P07834_D_0> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/Protein> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://proteinensemble.org/PED00014#P07834_D_0> <http://purl.org/dc/terms/conformsTo> <https://bioschemas.org/profiles/Protein/0.11-RELEASE> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://proteinensemble.org/PED00014#P07834_D_0> <https://schema.org/hasBioPolymerSequence> "LKRDLITSLPFEISLKIFNYLQFEDIINSLGVSQNWNKIIRKSTSLWKKLLISENFVSPKGFNSLNLKLSQKYPKLSQQDRLRLSFLENIFILKNWYNPKFVPQRTTLRGHMTSVITCLQFEDNYVITGADDKMIRVYDSINKKFLLQLSGHDGGVWALKYAHGGILVSGSTDRTVRVWDIKKGCCTHVFKGHNSTVRCLDIVEYKNIKYIVTGSRDNTLHVWKLPKESSVPDHGEEHDYPLVFHTPEENPYFVGVLRGHMASVRTVSGHGNIVVSGSYDNTLIVWDVAQMKCLYILSGHTDRIYSTIYDHERKRCISASMDTTIRIWDLENIWNNGECSYATNSASPCAKILGAMYTLQGHTALVGLLRLSDKFLVSAAADGSIRGWDANDYSRKFSYHHTNLSAITTFYVSDNILVSGSENQFNIYNLRSGKLVHANILKDADQIWSVNFKGKTLVAAVEKDGQSFLEILDFS" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://proteinensemble.org/PED00014#P07834_D_0> <https://schema.org/hasSequenceAnnotation> <https://proteinensemble.org/PED00014#P07834_D_0_270_744> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://proteinensemble.org/PED00014#P07834_D_0> <https://schema.org/identifier> "https://identifiers.org/uniprot:P07834" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://proteinensemble.org/PED00014#P07834_D_0> <https://schema.org/name> "Cell division control protein 4" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://proteinensemble.org/PED00014#P07834_D_0> <https://schema.org/sameAs> <http://purl.uniprot.org/uniprot/P07834> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/profiles/Protein/0.11-RELEASE> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/CreativeWork> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://proteinensemble.org/PED00014#P07834_D_0_270_744> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/SequenceAnnotation> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://proteinensemble.org/PED00014#P07834_D_0_270_744> <https://schema.org/additionalProperty> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/368314152> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://proteinensemble.org/PED00014#P07834_D_0_270_744> <https://schema.org/additionalProperty> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/2096895906> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://proteinensemble.org/PED00014#P07834_D_0_270_744> <https://schema.org/additionalProperty> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1073956941> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://proteinensemble.org/PED00014#P07834_D_0_270_744> <https://schema.org/additionalProperty> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/367565188> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://proteinensemble.org/PED00014#P07834_D_0_270_744> <https://schema.org/additionalProperty> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1109163979> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://proteinensemble.org/PED00014#P07834_D_0_270_744> <https://schema.org/additionalProperty> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/639913980> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://proteinensemble.org/PED00014#P07834_D_0_270_744> <https://schema.org/additionalProperty> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/107821945> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://proteinensemble.org/PED00014#P07834_D_0_270_744> <https://schema.org/additionalProperty> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/2059079389> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://proteinensemble.org/PED00014#P07834_D_0_270_744> <https://schema.org/additionalProperty> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1901071107> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://proteinensemble.org/PED00014#P07834_D_0_270_744> <https://schema.org/additionalProperty> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/274002240> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://proteinensemble.org/PED00014#P07834_D_0_270_744> <https://schema.org/additionalProperty> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/502163975> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://proteinensemble.org/PED00014#P07834_D_0_270_744> <https://schema.org/sequenceLocation> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1565361539> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/368314152> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/PropertyValue> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/368314152> <https://schema.org/name> "Term" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/368314152> <https://schema.org/value> <https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00120> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00120> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/DefinedTerm> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00120> <https://schema.org/inDefinedTermSet> <https://disprot.org/assets/data/IDPO_v0.2.owl> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00120> <https://schema.org/name> "NMR" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00120> <https://schema.org/termCode> "IDPO:00120" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://disprot.org/assets/data/IDPO_v0.2.owl> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/DefinedTermSet> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://disprot.org/assets/data/IDPO_v0.2.owl> <https://schema.org/name> "IDP ontology" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/2096895906> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/PropertyValue> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/2096895906> <https://schema.org/name> "Term" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/2096895906> <https://schema.org/value> <https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00166> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00166> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/DefinedTerm> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00166> <https://schema.org/inDefinedTermSet> <https://disprot.org/assets/data/IDPO_v0.2.owl> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00166> <https://schema.org/name> "RDC" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00166> <https://schema.org/termCode> "IDPO:00166" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1073956941> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/PropertyValue> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1073956941> <https://schema.org/name> "Term" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1073956941> <https://schema.org/value> <https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00167> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00167> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/DefinedTerm> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00167> <https://schema.org/inDefinedTermSet> <https://disprot.org/assets/data/IDPO_v0.2.owl> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00167> <https://schema.org/name> "chemical shift" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00167> <https://schema.org/termCode> "IDPO:00167" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/367565188> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/PropertyValue> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/367565188> <https://schema.org/name> "Term" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/367565188> <https://schema.org/value> <https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00168> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00168> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/DefinedTerm> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00168> <https://schema.org/inDefinedTermSet> <https://disprot.org/assets/data/IDPO_v0.2.owl> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00168> <https://schema.org/name> "relaxation" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00168> <https://schema.org/termCode> "IDPO:00168" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1109163979> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/PropertyValue> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1109163979> <https://schema.org/name> "Term" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1109163979> <https://schema.org/value> <https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00169> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00169> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/DefinedTerm> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00169> <https://schema.org/inDefinedTermSet> <https://disprot.org/assets/data/IDPO_v0.2.owl> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00169> <https://schema.org/name> "T2 relaxation" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00169> <https://schema.org/termCode> "IDPO:00169" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/639913980> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/PropertyValue> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/639913980> <https://schema.org/name> "Term" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/639913980> <https://schema.org/value> <https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00125> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00125> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/DefinedTerm> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00125> <https://schema.org/inDefinedTermSet> <https://disprot.org/assets/data/IDPO_v0.2.owl> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00125> <https://schema.org/name> "SAXS" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00125> <https://schema.org/termCode> "IDPO:00125" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/107821945> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/PropertyValue> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/107821945> <https://schema.org/name> "Term" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/107821945> <https://schema.org/value> <https://disprot.org/assets/data/IDPO_v0.2.owl:00186> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://disprot.org/assets/data/IDPO_v0.2.owl:00186> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/DefinedTerm> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://disprot.org/assets/data/IDPO_v0.2.owl:00186> <https://schema.org/inDefinedTermSet> <https://disprot.org/assets/data/IDPO_v0.2.owl> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://disprot.org/assets/data/IDPO_v0.2.owl:00186> <https://schema.org/name> "TraDES" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://disprot.org/assets/data/IDPO_v0.2.owl:00186> <https://schema.org/termCode> "IDPO:00186" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/2059079389> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/PropertyValue> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/2059079389> <https://schema.org/name> "Term" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/2059079389> <https://schema.org/value> <https://disprot.org/assets/data/IDPO_v0.2.owl:00192> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://disprot.org/assets/data/IDPO_v0.2.owl:00192> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/DefinedTerm> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://disprot.org/assets/data/IDPO_v0.2.owl:00192> <https://schema.org/inDefinedTermSet> <https://disprot.org/assets/data/IDPO_v0.2.owl> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://disprot.org/assets/data/IDPO_v0.2.owl:00192> <https://schema.org/name> "CNS" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://disprot.org/assets/data/IDPO_v0.2.owl:00192> <https://schema.org/termCode> "IDPO:00192" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1901071107> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/PropertyValue> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1901071107> <https://schema.org/name> "Term" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1901071107> <https://schema.org/value> <https://disprot.org/assets/data/IDPO_v0.2.owl:00208> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://disprot.org/assets/data/IDPO_v0.2.owl:00208> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/DefinedTerm> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://disprot.org/assets/data/IDPO_v0.2.owl:00208> <https://schema.org/inDefinedTermSet> <https://disprot.org/assets/data/IDPO_v0.2.owl> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://disprot.org/assets/data/IDPO_v0.2.owl:00208> <https://schema.org/name> "CRYSOL" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://disprot.org/assets/data/IDPO_v0.2.owl:00208> <https://schema.org/termCode> "IDPO:00208" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/274002240> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/PropertyValue> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/274002240> <https://schema.org/name> "Term" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/274002240> <https://schema.org/value> <https://disprot.org/assets/data/IDPO_v0.2.owl:00210> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://disprot.org/assets/data/IDPO_v0.2.owl:00210> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/DefinedTerm> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://disprot.org/assets/data/IDPO_v0.2.owl:00210> <https://schema.org/inDefinedTermSet> <https://disprot.org/assets/data/IDPO_v0.2.owl> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://disprot.org/assets/data/IDPO_v0.2.owl:00210> <https://schema.org/name> "ShiftX" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://disprot.org/assets/data/IDPO_v0.2.owl:00210> <https://schema.org/termCode> "IDPO:00210" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/502163975> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/PropertyValue> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/502163975> <https://schema.org/name> "Term" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/502163975> <https://schema.org/value> <https://disprot.org/assets/data/IDPO_v0.2.owl:00216> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://disprot.org/assets/data/IDPO_v0.2.owl:00216> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/DefinedTerm> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://disprot.org/assets/data/IDPO_v0.2.owl:00216> <https://schema.org/inDefinedTermSet> <https://disprot.org/assets/data/IDPO_v0.2.owl> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://disprot.org/assets/data/IDPO_v0.2.owl:00216> <https://schema.org/name> "ENSEMBLE" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://disprot.org/assets/data/IDPO_v0.2.owl:00216> <https://schema.org/termCode> "IDPO:00216" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1565361539> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/SequenceRange> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1565361539> <https://schema.org/rangeEnd> "744" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1565361539> <https://schema.org/rangeStart> "270" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://proteinensemble.org/PED00014#P52286_C_0> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/Protein> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://proteinensemble.org/PED00014#P52286_C_0> <http://purl.org/dc/terms/conformsTo> <https://bioschemas.org/profiles/Protein/0.11-RELEASE> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://proteinensemble.org/PED00014#P52286_C_0> <https://schema.org/hasBioPolymerSequence> "SNVVLVSGEGERFTVDKKIAERSLLLKNYLNDMHDSNLQNNSDSESDSDSETNHKSKDNNNGDDDDEDDDEIVMPVPNVRSSVLQKVIEWAEHHRDSNFPDEDDDDSRKSAPVDSWDREFLKVDQEMLYEIILAANYLNIKPLLDAGCKVVAEMIRGRSPEEIRRTFNIVNDFTPEEEAAIRR" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://proteinensemble.org/PED00014#P52286_C_0> <https://schema.org/hasSequenceAnnotation> <https://proteinensemble.org/PED00014#P52286_C_0_4_186> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://proteinensemble.org/PED00014#P52286_C_0> <https://schema.org/identifier> "https://identifiers.org/uniprot:P52286" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://proteinensemble.org/PED00014#P52286_C_0> <https://schema.org/sameAs> <http://purl.uniprot.org/uniprot/P52286> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://proteinensemble.org/PED00014#P52286_C_0_4_186> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/SequenceAnnotation> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://proteinensemble.org/PED00014#P52286_C_0_4_186> <https://schema.org/additionalProperty> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/400036188> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://proteinensemble.org/PED00014#P52286_C_0_4_186> <https://schema.org/additionalProperty> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1958752721> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://proteinensemble.org/PED00014#P52286_C_0_4_186> <https://schema.org/additionalProperty> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1896099201> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://proteinensemble.org/PED00014#P52286_C_0_4_186> <https://schema.org/additionalProperty> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1858414809> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://proteinensemble.org/PED00014#P52286_C_0_4_186> <https://schema.org/additionalProperty> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/569393342> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://proteinensemble.org/PED00014#P52286_C_0_4_186> <https://schema.org/additionalProperty> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/946591913> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://proteinensemble.org/PED00014#P52286_C_0_4_186> <https://schema.org/additionalProperty> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/892712429> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://proteinensemble.org/PED00014#P52286_C_0_4_186> <https://schema.org/additionalProperty> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/561273240> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://proteinensemble.org/PED00014#P52286_C_0_4_186> <https://schema.org/additionalProperty> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/649186691> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://proteinensemble.org/PED00014#P52286_C_0_4_186> <https://schema.org/additionalProperty> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1894898714> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://proteinensemble.org/PED00014#P52286_C_0_4_186> <https://schema.org/additionalProperty> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1015020144> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://proteinensemble.org/PED00014#P52286_C_0_4_186> <https://schema.org/sequenceLocation> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/240836288> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/400036188> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/PropertyValue> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/400036188> <https://schema.org/name> "Term" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/400036188> <https://schema.org/value> <https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00120> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1958752721> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/PropertyValue> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1958752721> <https://schema.org/name> "Term" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1958752721> <https://schema.org/value> <https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00166> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1896099201> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/PropertyValue> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1896099201> <https://schema.org/name> "Term" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1896099201> <https://schema.org/value> <https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00167> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1858414809> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/PropertyValue> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1858414809> <https://schema.org/name> "Term" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1858414809> <https://schema.org/value> <https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00168> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/569393342> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/PropertyValue> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/569393342> <https://schema.org/name> "Term" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/569393342> <https://schema.org/value> <https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00169> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/946591913> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/PropertyValue> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/946591913> <https://schema.org/name> "Term" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/946591913> <https://schema.org/value> <https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00125> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/892712429> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/PropertyValue> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/892712429> <https://schema.org/name> "Term" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/892712429> <https://schema.org/value> <https://disprot.org/assets/data/IDPO_v0.2.owl:00186> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/561273240> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/PropertyValue> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/561273240> <https://schema.org/name> "Term" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/561273240> <https://schema.org/value> <https://disprot.org/assets/data/IDPO_v0.2.owl:00192> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/649186691> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/PropertyValue> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/649186691> <https://schema.org/name> "Term" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/649186691> <https://schema.org/value> <https://disprot.org/assets/data/IDPO_v0.2.owl:00208> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1894898714> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/PropertyValue> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1894898714> <https://schema.org/name> "Term" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1894898714> <https://schema.org/value> <https://disprot.org/assets/data/IDPO_v0.2.owl:00210> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1015020144> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/PropertyValue> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1015020144> <https://schema.org/name> "Term" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1015020144> <https://schema.org/value> <https://disprot.org/assets/data/IDPO_v0.2.owl:00216> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/240836288> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/SequenceRange> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/240836288> <https://schema.org/rangeEnd> "186" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/240836288> <https://schema.org/rangeStart> "4" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://proteinensemble.org/PED00014#P38634_A_1> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/Protein> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://proteinensemble.org/PED00014#P38634_A_1> <http://purl.org/dc/terms/conformsTo> <https://bioschemas.org/profiles/Protein/0.11-RELEASE> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://proteinensemble.org/PED00014#P38634_A_1> <https://schema.org/hasBioPolymerSequence> "MTPSTPPRSRGTRYLAQPSGNTSSSALMQGQKTPQKPSQNLVPVTPSTTKSFKNAPLLAPPNSNMGMTSPFNGLTSPQRSPFPKSSVKRT" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://proteinensemble.org/PED00014#P38634_A_1> <https://schema.org/hasSequenceAnnotation> <https://proteinensemble.org/PED00014#P38634_A_1_1_90> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://proteinensemble.org/PED00014#P38634_A_1> <https://schema.org/identifier> "https://identifiers.org/uniprot:P38634" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://proteinensemble.org/PED00014#P38634_A_1> <https://schema.org/sameAs> <http://purl.uniprot.org/uniprot/P38634> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://proteinensemble.org/PED00014#P38634_A_1_1_90> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/SequenceAnnotation> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://proteinensemble.org/PED00014#P38634_A_1_1_90> <https://schema.org/additionalProperty> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/420904342> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://proteinensemble.org/PED00014#P38634_A_1_1_90> <https://schema.org/additionalProperty> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1005499560> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://proteinensemble.org/PED00014#P38634_A_1_1_90> <https://schema.org/additionalProperty> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/803096160> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://proteinensemble.org/PED00014#P38634_A_1_1_90> <https://schema.org/additionalProperty> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1785075011> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://proteinensemble.org/PED00014#P38634_A_1_1_90> <https://schema.org/additionalProperty> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/943606610> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://proteinensemble.org/PED00014#P38634_A_1_1_90> <https://schema.org/additionalProperty> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/696555349> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://proteinensemble.org/PED00014#P38634_A_1_1_90> <https://schema.org/additionalProperty> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1412437827> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://proteinensemble.org/PED00014#P38634_A_1_1_90> <https://schema.org/additionalProperty> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/837490728> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://proteinensemble.org/PED00014#P38634_A_1_1_90> <https://schema.org/additionalProperty> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1021447597> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://proteinensemble.org/PED00014#P38634_A_1_1_90> <https://schema.org/additionalProperty> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/725322807> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://proteinensemble.org/PED00014#P38634_A_1_1_90> <https://schema.org/additionalProperty> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/2067319117> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://proteinensemble.org/PED00014#P38634_A_1_1_90> <https://schema.org/sequenceLocation> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1503093711> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/420904342> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/PropertyValue> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/420904342> <https://schema.org/name> "Term" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/420904342> <https://schema.org/value> <https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00120> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1005499560> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/PropertyValue> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1005499560> <https://schema.org/name> "Term" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1005499560> <https://schema.org/value> <https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00166> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/803096160> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/PropertyValue> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/803096160> <https://schema.org/name> "Term" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/803096160> <https://schema.org/value> <https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00167> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1785075011> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/PropertyValue> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1785075011> <https://schema.org/name> "Term" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1785075011> <https://schema.org/value> <https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00168> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/943606610> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/PropertyValue> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/943606610> <https://schema.org/name> "Term" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/943606610> <https://schema.org/value> <https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00169> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/696555349> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/PropertyValue> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/696555349> <https://schema.org/name> "Term" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/696555349> <https://schema.org/value> <https://disprot.org/assets/data/IDPO_v0.2.owl#IDPO:00125> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1412437827> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/PropertyValue> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1412437827> <https://schema.org/name> "Term" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1412437827> <https://schema.org/value> <https://disprot.org/assets/data/IDPO_v0.2.owl:00186> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/837490728> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/PropertyValue> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/837490728> <https://schema.org/name> "Term" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/837490728> <https://schema.org/value> <https://disprot.org/assets/data/IDPO_v0.2.owl:00192> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1021447597> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/PropertyValue> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1021447597> <https://schema.org/name> "Term" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1021447597> <https://schema.org/value> <https://disprot.org/assets/data/IDPO_v0.2.owl:00208> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/725322807> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/PropertyValue> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/725322807> <https://schema.org/name> "Term" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/725322807> <https://schema.org/value> <https://disprot.org/assets/data/IDPO_v0.2.owl:00210> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/2067319117> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/PropertyValue> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/2067319117> <https://schema.org/name> "Term" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/2067319117> <https://schema.org/value> <https://disprot.org/assets/data/IDPO_v0.2.owl:00216> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1503093711> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <https://schema.org/SequenceRange> <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1503093711> <https://schema.org/rangeEnd> "90" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1/proteinensemble.org/PED00014/1503093711> <https://schema.org/rangeStart> "1" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
||||||
|
<https://proteinensemble.org/PED00014> <http://purl.org/dc/terms/title> "PED" <https://bioschemas.org/crawl/v1/proteinensemble/PED00014/20211206/1> .
|
|
@ -0,0 +1,11 @@
|
||||||
|
# Set root logger level to INFO and its only appender to A1.
|
||||||
|
log4j.rootLogger=INFO, A1
|
||||||
|
|
||||||
|
# A1 is set to be a ConsoleAppender.
|
||||||
|
log4j.appender.A1=org.apache.log4j.ConsoleAppender
|
||||||
|
|
||||||
|
# Per-package logger levels, followed by the PatternLayout used by A1.
|
||||||
|
log4j.logger.org = ERROR
|
||||||
|
log4j.logger.eu.dnetlib = DEBUG
|
||||||
|
log4j.appender.A1.layout=org.apache.log4j.PatternLayout
|
||||||
|
log4j.appender.A1.layout.ConversionPattern=%-4r [%t] %-5p %c %x - %m%n
|
|
@ -38,6 +38,7 @@
|
||||||
<module>dhp-usage-raw-data-update</module>
|
<module>dhp-usage-raw-data-update</module>
|
||||||
<module>dhp-broker-events</module>
|
<module>dhp-broker-events</module>
|
||||||
<module>dhp-doiboost</module>
|
<module>dhp-doiboost</module>
|
||||||
|
<module>dhp-rdfconverter</module>
|
||||||
</modules>
|
</modules>
|
||||||
|
|
||||||
<pluginRepositories>
|
<pluginRepositories>
|
||||||
|
|
12
pom.xml
12
pom.xml
|
@ -105,6 +105,18 @@
|
||||||
<enabled>false</enabled>
|
<enabled>false</enabled>
|
||||||
</snapshots>
|
</snapshots>
|
||||||
</repository>
|
</repository>
|
||||||
|
<repository>
|
||||||
|
<id>dnet-deps</id>
|
||||||
|
<name>D-Net Dependencies</name>
|
||||||
|
<url>https://maven.d4science.org/nexus/content/repositories/dnet-deps/</url>
|
||||||
|
<releases>
|
||||||
|
<enabled>true</enabled>
|
||||||
|
</releases>
|
||||||
|
<snapshots>
|
||||||
|
<enabled>false</enabled>
|
||||||
|
</snapshots>
|
||||||
|
<layout>default</layout>
|
||||||
|
</repository>
|
||||||
</repositories>
|
</repositories>
|
||||||
|
|
||||||
<dependencies>
|
<dependencies>
|
||||||
|
|
Loading…
Reference in New Issue