710 lines
29 KiB
Java
710 lines
29 KiB
Java
package eu.dnetlib.ariadneplus.catalogue;
|
|
|
|
import java.io.BufferedOutputStream;
|
|
import java.io.ByteArrayOutputStream;
|
|
import java.io.IOException;
|
|
import java.net.URISyntaxException;
|
|
import java.util.Iterator;
|
|
import java.util.List;
|
|
import java.util.Set;
|
|
|
|
import com.fasterxml.jackson.core.JsonEncoding;
|
|
import com.fasterxml.jackson.core.JsonFactory;
|
|
import com.fasterxml.jackson.core.JsonGenerator;
|
|
import com.google.common.base.Joiner;
|
|
import com.google.common.collect.Iterators;
|
|
import com.google.common.collect.Lists;
|
|
import com.google.common.collect.Sets;
|
|
import eu.dnetlib.ariadneplus.CRM;
|
|
import eu.dnetlib.ariadneplus.publisher.AriadnePlusPublisherException;
|
|
import eu.dnetlib.ariadneplus.rdf.ResourceReader;
|
|
import org.apache.commons.lang3.StringUtils;
|
|
import org.apache.commons.logging.Log;
|
|
import org.apache.commons.logging.LogFactory;
|
|
import org.apache.jena.rdf.model.RDFNode;
|
|
import org.apache.jena.rdf.model.Resource;
|
|
import org.apache.jena.rdf.model.StmtIterator;
|
|
import org.apache.jena.vocabulary.RDF;
|
|
import org.springframework.beans.factory.annotation.Autowired;
|
|
import org.springframework.stereotype.Component;
|
|
|
|
/**
|
|
* Created by Alessia Bardi on 21/11/2017.
|
|
*
|
|
* @author Alessia Bardi
|
|
*/
|
|
@Component
|
|
public class CatalogueRegistrator {
|
|
|
|
private static final Log log = LogFactory.getLog(CatalogueRegistrator.class);
|
|
private final String ARIADNEPLUS_BASE_URL = "http://ariadneplus.d4science.org";
|
|
|
|
@Autowired
|
|
private ResourceReader resourceReader;
|
|
|
|
@Autowired
|
|
private CatalogueAPIClient catalogueAPIClient;
|
|
|
|
public String register(final Resource resource, final Resource type, final String datasourceName)
|
|
throws IOException, AriadnePlusPublisherException, URISyntaxException, InterruptedException {
|
|
String resURI = resource.getURI();
|
|
log.debug(String.format("Catalogue --> Processing resource : %s with type: %s from source: %s", resURI, type.getLocalName(), datasourceName));
|
|
String resCatName = catalogueAPIClient.getNameForCatalogue(resURI.substring(resURI.lastIndexOf("handle/") + 7));
|
|
if(catalogueAPIClient.isRegistered(resCatName)){
|
|
log.debug(resCatName+ " is already registered");
|
|
String json = getJson(type, resource, resCatName, datasourceName);
|
|
catalogueAPIClient.doUpdate(json, resCatName);
|
|
}
|
|
else {
|
|
//resource not yet registered
|
|
String json = getJson(type, resource, resCatName, datasourceName);
|
|
if(!catalogueAPIClient.doRegister(json, resCatName)){
|
|
log.warn(String.format("%s could not be registered even the second time, giving up", resURI));
|
|
return null;
|
|
}
|
|
}
|
|
log.debug(String.format("%s registered on the catalogue with name: %s", resURI, resCatName));
|
|
return resCatName;
|
|
}
|
|
|
|
protected boolean purge(final String resCatName) throws URISyntaxException, AriadnePlusPublisherException {
|
|
return catalogueAPIClient.purgeItem(resCatName);
|
|
}
|
|
|
|
protected String getJson(final Resource type, final Resource resource, final String resNameForCatalogue, final String datasourceName)
|
|
throws IOException, AriadnePlusPublisherException {
|
|
switch (type.getLocalName()) {
|
|
case "E29_Design_or_Procedure":
|
|
return getJsonForDesignProcedure(resource, resNameForCatalogue, datasourceName);
|
|
case "D14_Software":
|
|
return getJsonForSoftware(resource, resNameForCatalogue, datasourceName);
|
|
case "PE35_Project":
|
|
return getJsonForProject(resource, resNameForCatalogue, datasourceName);
|
|
case "PE1_Service":
|
|
return getJsonForService(resource, resNameForCatalogue, datasourceName);
|
|
case "E39_Actor":
|
|
return getJsonForActor(resource, resNameForCatalogue, datasourceName);
|
|
case "PE18_Dataset":
|
|
return getJsonForDataset(resource, resNameForCatalogue, datasourceName);
|
|
case "E78_Collection":
|
|
return getJsonForCollection(resource, resNameForCatalogue, datasourceName);
|
|
default:
|
|
throw new IllegalArgumentException(String.format("Type " + type.getLocalName() + " not supported"));
|
|
}
|
|
}
|
|
|
|
protected String getJsonForProject(final Resource res, final String resNameForCatalogue, final String datasourceName)
|
|
throws IOException, AriadnePlusPublisherException {
|
|
JsonFactory jsonFactory = new JsonFactory();
|
|
final ByteArrayOutputStream out = new ByteArrayOutputStream();
|
|
BufferedOutputStream bos = new BufferedOutputStream(out);
|
|
JsonGenerator jg = jsonFactory.createGenerator(bos, JsonEncoding.UTF8);
|
|
jg.writeStartObject();
|
|
writeCommonFields(jg, res, resNameForCatalogue, datasourceName);
|
|
//Only RI_Project are linked to RIs that must be used as groups
|
|
List<String> maintainer_RIs = Lists.newArrayList(resourceReader.getMaintainersLabels(res));
|
|
if(maintainer_RIs.size() > 0) {
|
|
jg.writeArrayFieldStart("groups");
|
|
for(String ri : maintainer_RIs) {
|
|
String group = CKANUtils.getCkanGroup(ri);
|
|
if(StringUtils.isNotBlank(group)) {
|
|
jg.writeStartObject();
|
|
jg.writeStringField("name", group);
|
|
jg.writeEndObject();
|
|
}
|
|
}
|
|
jg.writeEndArray();
|
|
}
|
|
|
|
jg.writeStringField("maintainer", Joiner.on(", ").join(resourceReader.getMaintainersLabels(res)));
|
|
//TODO: it should be better to identify email contacts rather than generic contact labels of maintainer
|
|
//jg.writeStringField("maintainer_email", Joiner.on(", ").join(resourceReader.getMaintainerContacts(res)));
|
|
|
|
jg.writeArrayFieldStart("extras");
|
|
addExtra(jg, "system:type", CKANUtils.Project_type);
|
|
//specific class
|
|
addExtra(jg, "instance of", resourceReader.findSpecificType(res, CRM.E7_Activity).getLocalName());
|
|
if (res.getURI().startsWith(ARIADNEPLUS_BASE_URL))
|
|
addExtra(jg, "AriadnePlus URL", res.getURI());
|
|
else addExtra(jg, "URL", res.getURI());
|
|
addIdentifiers(res, jg);
|
|
|
|
addExtra(jg, "started on", resourceReader.getStartTime(res));
|
|
int idx = 1;
|
|
Iterator<String> maintainers = resourceReader.getMaintainerUrls(res);
|
|
while(maintainers.hasNext()){
|
|
addExtra(jg, String.format("maintaining team (%d)", idx), maintainers.next());
|
|
idx++;
|
|
}
|
|
//addExtra(jg, "maintaining team", Joiner.on(", ").join(resourceReader.getMaintainerUrls(res)));
|
|
idx = 1;
|
|
Iterator<String> services = resourceReader.getOfferedServiceUrls(res);
|
|
while(services.hasNext()){
|
|
addExtra(jg, String.format("offers (%d)", idx), services.next());
|
|
idx++;
|
|
}
|
|
//addExtra(jg, "offers", Joiner.on(", ").join(resourceReader.getOfferedServiceUrls(res)));
|
|
|
|
jg.writeEndArray(); //end extras
|
|
|
|
jg.writeEndObject();
|
|
jg.close();
|
|
return out.toString("UTF-8");
|
|
}
|
|
|
|
protected String getJsonForService(final Resource res, final String resNameForCatalogue, final String datasourceName)
|
|
throws IOException, AriadnePlusPublisherException {
|
|
JsonFactory jsonFactory = new JsonFactory();
|
|
final ByteArrayOutputStream out = new ByteArrayOutputStream();
|
|
BufferedOutputStream bos = new BufferedOutputStream(out);
|
|
JsonGenerator jg = jsonFactory.createGenerator(bos, JsonEncoding.UTF8);
|
|
jg.writeStartObject();
|
|
writeCommonFields(jg, res, resNameForCatalogue, datasourceName);
|
|
jg.writeStringField("maintainer", Joiner.on(", ").join(resourceReader.getMaintainersLabels(res)));
|
|
//TODO: it should be better to identify email contacts rather than generic contact labels of maintainer
|
|
//jg.writeStringField("maintainer_email", Joiner.on(", ").join(resourceReader.getMaintainerContacts(res)));
|
|
|
|
jg.writeArrayFieldStart("extras");
|
|
addExtra(jg, "system:type", CKANUtils.Service_type);
|
|
//specific class
|
|
addExtra(jg, "instance of", resourceReader.findSpecificType(res, CRM.E7_Activity).getLocalName());
|
|
if (res.getURI().startsWith(ARIADNEPLUS_BASE_URL))
|
|
addExtra(jg, "AriadnePlus URL", res.getURI());
|
|
else addExtra(jg, "URL", res.getURI());
|
|
addIdentifiers(res, jg);
|
|
addExtra(jg, "competence", Joiner.on(", ").join(resourceReader.getCompetences(res)));
|
|
addExtra(jg, "activity type", Joiner.on(", ").join(resourceReader.getActivityTypes(res)));
|
|
//condition of use (Rights)
|
|
addExtra(jg, "condition of use", resourceReader.getConditionOfUse(res));
|
|
int idx = 1;
|
|
Iterator<String> contacts = Iterators.concat(resourceReader.getResourceDirectContactPointsURI(res), resourceReader.getProviderContactPoints(res));
|
|
while(contacts.hasNext()){
|
|
addExtra(jg, String.format("contact points (%d)", idx), contacts.next());
|
|
idx++;
|
|
}
|
|
//addExtra(jg, "contact points", Joiner.on(", ").join(Iterators.concat(resourceReader.getResourceDirectContactPointsURI(res), resourceReader.getProviderContactPoints(res))));
|
|
idx = 1;
|
|
Iterator<String> providers = resourceReader.getProviderUris(res);
|
|
while(providers.hasNext()){
|
|
addExtra(jg, String.format("provided by (%d)", idx), providers.next());
|
|
idx++;
|
|
}
|
|
//addExtra(jg, "provided by", Joiner.on(", ").join(resourceReader.getProviderUris(res)));
|
|
idx = 1;
|
|
Iterator<String> points = resourceReader.getAccessPoints(res);
|
|
while(points.hasNext()){
|
|
addExtra(jg, String.format("online access point (%d)", idx), points.next());
|
|
idx++;
|
|
}
|
|
//addExtra(jg, "online access point", Joiner.on(", ").join(resourceReader.getAccessPoints(res)));
|
|
addExtra(jg, "protocol", Joiner.on(", ").join(resourceReader.getProtocols(res)));
|
|
idx = 1;
|
|
Iterator<String> delivers = resourceReader.getDeliversOnRequest(res);
|
|
while(delivers.hasNext()){
|
|
addExtra(jg, String.format("delivers on request (%d)", idx), delivers.next());
|
|
idx++;
|
|
}
|
|
//addExtra(jg, "delivers on request", Joiner.on(", ").join(resourceReader.getDeliversOnRequest(res)));
|
|
idx = 1;
|
|
Iterator<String> runs = resourceReader.getRunsOnRequest(res);
|
|
while(runs.hasNext()){
|
|
addExtra(jg, String.format("runs on request (%d)", idx), runs.next());
|
|
idx++;
|
|
}
|
|
//addExtra(jg, "runs on request", Joiner.on(", ").join(resourceReader.getRunsOnRequest(res)));
|
|
idx = 1;
|
|
Iterator<String> hosts = resourceReader.getHostedStuff(res);
|
|
while(hosts.hasNext()){
|
|
addExtra(jg, String.format("hosts (%d)", idx), hosts.next());
|
|
idx++;
|
|
}
|
|
//addExtra(jg, "hosts", Joiner.on(", ").join(resourceReader.getHostedStuff(res)));
|
|
idx = 1;
|
|
Iterator<String> curates = resourceReader.getCuratedObjects(res);
|
|
while(curates.hasNext()){
|
|
addExtra(jg, String.format("curates (%d)", idx), curates.next());
|
|
idx++;
|
|
}
|
|
//addExtra(jg, "curates", Joiner.on(", ").join(resourceReader.getCuratedObjects(res)));
|
|
addExtra(jg, "declared begin/end of operation", Joiner.on(", ").join(resourceReader.getDeclarativeTimes(res)));
|
|
addExtra(jg, "availability", resourceReader.getAvailability(res));
|
|
idx = 1;
|
|
Iterator<String> plans = resourceReader.getCurationPlans(res);
|
|
while(plans.hasNext()){
|
|
addExtra(jg, String.format("uses curation plan (%d)", idx), plans.next());
|
|
idx++;
|
|
}
|
|
//addExtra(jg, "uses curation plan", Joiner.on(", ").join(resourceReader.getCurationPlans(res)));
|
|
addExtra(jg, "time of service", Joiner.on(", ").join(resourceReader.getDeclarativeTimes(res)));
|
|
//TODO: where to get it?
|
|
//addExtra(jg, "last confirmation", "");
|
|
//TODO: where to get it?
|
|
//addExtra(jg, "date of registration", "");
|
|
|
|
jg.writeEndArray(); //end extras
|
|
|
|
jg.writeEndObject();
|
|
jg.close();
|
|
return out.toString("UTF-8");
|
|
}
|
|
|
|
protected String getJsonForActor(final Resource res, final String resNameForCatalogue, final String datasourceName)
|
|
throws IOException, AriadnePlusPublisherException {
|
|
JsonFactory jsonFactory = new JsonFactory();
|
|
final ByteArrayOutputStream out = new ByteArrayOutputStream();
|
|
BufferedOutputStream bos = new BufferedOutputStream(out);
|
|
JsonGenerator jg = jsonFactory.createGenerator(bos, JsonEncoding.UTF8);
|
|
jg.writeStartObject();
|
|
writeCommonFields(jg, res, resNameForCatalogue, datasourceName);
|
|
|
|
jg.writeArrayFieldStart("extras");
|
|
addExtra(jg, "system:type", CKANUtils.Actor_type);
|
|
//specific class
|
|
addExtra(jg, "instance of", resourceReader.findSpecificType(res, CRM.E39_Actor).getLocalName());
|
|
if (res.getURI().startsWith(ARIADNEPLUS_BASE_URL))
|
|
addExtra(jg, "AriadnePlus URL", res.getURI());
|
|
else addExtra(jg, "URL", res.getURI());
|
|
addIdentifiers(res, jg);
|
|
addExtra(jg, "has type", Joiner.on(", ").join(resourceReader.getHasTypeLabels(res)));
|
|
int idx = 1;
|
|
Iterator<String> hasMembers = resourceReader.getMemberUrls(res);
|
|
while(hasMembers.hasNext()){
|
|
addExtra(jg, String.format("has member (%d)", idx), hasMembers.next());
|
|
idx++;
|
|
}
|
|
//addExtra(jg, "has member", Joiner.on(", ").join(resourceReader.getMemberUrls(res)));
|
|
idx = 1;
|
|
Iterator<String> isMembers = resourceReader.isMemberOf(res);
|
|
while(isMembers.hasNext()){
|
|
addExtra(jg, String.format("is member of (%d)", idx), isMembers.next());
|
|
idx++;
|
|
}
|
|
//addExtra(jg, "is member of", Joiner.on(", ").join(resourceReader.isMemberOf(res)));
|
|
idx = 1;
|
|
Iterator<String> provides = resourceReader.getProvidedServiceUrls(res);
|
|
while(provides.hasNext()){
|
|
addExtra(jg, String.format("provides (%d)", idx), provides.next());
|
|
idx++;
|
|
}
|
|
//addExtra(jg, "provides", Joiner.on(", ").join(resourceReader.getProvidedServiceUrls(res)));
|
|
|
|
idx = 1;
|
|
String contactPoints = "";
|
|
StmtIterator it = res.listProperties(CRM.P76_has_contact_point);
|
|
while(it.hasNext()) {
|
|
Resource cp = it.next().getResource();
|
|
Resource cpType = cp.getPropertyResourceValue(CRM.P2_has_type);
|
|
String cpTypeLabel = resourceReader.getLabel(cpType);
|
|
String cpLabel = resourceReader.getLabel(cp);
|
|
if (StringUtils.isNotBlank(cpLabel)) {
|
|
if (StringUtils.isNotBlank(cpTypeLabel)) {
|
|
addExtra(jg,String.format("contact point (%d) - %s ", idx, cpTypeLabel), cpLabel );
|
|
idx++;
|
|
//contactPoints += cpTypeLabel + ": ";
|
|
}
|
|
else{
|
|
addExtra(jg,String.format("contact point (%d)", idx), cpLabel );
|
|
idx++;
|
|
//contactPoints += cpLabel + "; ";
|
|
}
|
|
|
|
}
|
|
else{
|
|
addExtra(jg,String.format("contact point (%d)", idx), cp.getURI());
|
|
idx++;
|
|
}
|
|
}
|
|
// addExtra(jg,"contact points", contactPoints );
|
|
idx = 1;
|
|
Iterator<String> maintains = resourceReader.getMaintainedUrls(res);
|
|
while(maintains.hasNext()){
|
|
addExtra(jg, String.format("maintains (%d)", idx), maintains.next());
|
|
idx++;
|
|
}
|
|
//addExtra(jg, "maintains", Joiner.on(", ").join(resourceReader.getMaintainedUrls(res)));
|
|
|
|
jg.writeEndArray();
|
|
|
|
jg.writeEndObject();
|
|
jg.close();
|
|
return out.toString("UTF-8");
|
|
}
|
|
|
|
protected String getJsonForDataset(final Resource res, final String resNameForCatalogue, final String datasourceName)
|
|
throws IOException, AriadnePlusPublisherException {
|
|
JsonFactory jsonFactory = new JsonFactory();
|
|
final ByteArrayOutputStream out = new ByteArrayOutputStream();
|
|
BufferedOutputStream bos = new BufferedOutputStream(out);
|
|
JsonGenerator jg = jsonFactory.createGenerator(bos, JsonEncoding.UTF8);
|
|
jg.writeStartObject();
|
|
writeCommonFields(jg, res, resNameForCatalogue, datasourceName);
|
|
|
|
jg.writeArrayFieldStart("extras");
|
|
addExtra(jg, "system:type", CKANUtils.Dataset_type);
|
|
//specific class
|
|
addExtra(jg, "instance of", resourceReader.findSpecificType(res, CRM.E70_Thing).getLocalName());
|
|
if (res.getURI().startsWith(ARIADNEPLUS_BASE_URL)) {
|
|
addExtra(jg, "AriadnePlus URL", res.getURI());
|
|
}
|
|
else addExtra(jg, "URL", res.getURI());
|
|
addIdentifiers(res, jg);
|
|
addExtra(jg, "has type", Joiner.on(", ").join(resourceReader.getHasTypeLabels(res)));
|
|
int idx = 1;
|
|
Iterator<String> isPartOf = resourceReader.getIsPartOfUrls(res);
|
|
while(isPartOf.hasNext()){
|
|
addExtra(jg, String.format("is part of (%d)", idx), isPartOf.next());
|
|
idx++;
|
|
}
|
|
//addExtra(jg, "is part of", Joiner.on(", ").join(resourceReader.getIsPartOfUrls(res)));
|
|
idx = 1;
|
|
Iterator<String> hasPart = resourceReader.getHasPartUrls(res);
|
|
while(hasPart.hasNext()){
|
|
addExtra(jg, String.format("has part (%d)", idx), hasPart.next());
|
|
idx++;
|
|
}
|
|
//addExtra(jg, "has part", Joiner.on(", ").join(resourceReader.getHasPartUrls(res)));
|
|
idx = 1;
|
|
Iterator<String> curators = resourceReader.getCuratorUrls(res);
|
|
while(curators.hasNext()){
|
|
addExtra(jg, String.format("curated by (%d)", idx), curators.next());
|
|
idx++;
|
|
}
|
|
//addExtra(jg, "curated by", Joiner.on(", ").join(resourceReader.getCuratorUrls(res)));
|
|
idx = 1;
|
|
Iterator<String> curationplans = resourceReader.getResourceCuratorCurationPlans(res);
|
|
while(curationplans.hasNext()){
|
|
addExtra(jg, String.format("curation plan (%d)", idx), curationplans.next());
|
|
idx++;
|
|
}
|
|
//addExtra(jg, "curation plan", Joiner.on(", ").join(resourceReader.getResourceCuratorCurationPlans(res)));
|
|
idx = 1;
|
|
Iterator<String> hostedbys = resourceReader.getHostedBys(res);
|
|
while(hostedbys.hasNext()){
|
|
addExtra(jg, String.format("hosted by (%d)", idx), hostedbys.next());
|
|
idx++;
|
|
}
|
|
//addExtra(jg, "hosted by", Joiner.on(", ").join(resourceReader.getHostedBys(res)));
|
|
addExtra(jg, "encoding type", Joiner.on(", ").join(resourceReader.getEncodings(res)));
|
|
idx = 1;
|
|
Iterator<String> creators = resourceReader.getCreatorsURIs(res);
|
|
while(creators.hasNext()){
|
|
addExtra(jg, String.format("creator (%d)", idx), creators.next());
|
|
idx++;
|
|
}
|
|
//addExtra(jg, "creator", Joiner.on(", ").join(resourceReader.getCreatorsURIs(res)));
|
|
idx = 1;
|
|
Iterator<String> sw = resourceReader.getUsedSoftware(res);
|
|
while(sw.hasNext()){
|
|
addExtra(jg, String.format("used software (%d)", idx), sw.next());
|
|
idx++;
|
|
}
|
|
|
|
addExtra(jg, "subject", Joiner.on(", ").join(resourceReader.getSubjects(res)));
|
|
addExtra(jg, "temporal coverage", Joiner.on(", ").join(resourceReader.getTemporalCoverages(res)));
|
|
addExtra(jg, "spatial coverage", Joiner.on(", ").join(resourceReader.getSpatialCoverages(res)));
|
|
idx = 1;
|
|
Iterator<String> usedbys = resourceReader.getUsedBy(res);
|
|
while(usedbys.hasNext()){
|
|
addExtra(jg, String.format("used by (%d)", idx), usedbys.next());
|
|
idx++;
|
|
}
|
|
//addExtra(jg, "used by", Joiner.on(", ").join(resourceReader.getUsedBy(res)));
|
|
addExtra(jg, "languages", Joiner.on(", ").join(resourceReader.getLanguages(res)));
|
|
idx = 1;
|
|
Iterator<String> metadata = resourceReader.getMetadata(res);
|
|
while(metadata.hasNext()){
|
|
addExtra(jg, String.format("has metadata (%d)", idx), metadata.next());
|
|
idx++;
|
|
}
|
|
//addExtra(jg, "has metadata", Joiner.on(", ").join(resourceReader.getMetadata(res)));
|
|
idx = 1;
|
|
Iterator<String> metadataFor = resourceReader.getDescribedDataset(res);
|
|
while(metadataFor.hasNext()){
|
|
addExtra(jg, String.format("is metadata for (%d)", idx), metadataFor.next());
|
|
idx++;
|
|
}
|
|
//addExtra(jg, "is metadata for", Joiner.on(", ").join(resourceReader.getDescribedDataset(res)));
|
|
idx = 1;
|
|
Iterator<String> snaphsots = resourceReader.getSnapshots(res);
|
|
while(snaphsots.hasNext()){
|
|
addExtra(jg, String.format("has snapshot (%d)", idx), snaphsots.next());
|
|
idx++;
|
|
}
|
|
//addExtra(jg, "has snapshot", Joiner.on(", ").join(resourceReader.getSnapshots(res)));
|
|
idx = 1;
|
|
Iterator<String> issnaphsots = resourceReader.getIsSnapshotOfs(res);
|
|
while(issnaphsots.hasNext()){
|
|
addExtra(jg, String.format("is snapshot of (%d)", idx), issnaphsots.next());
|
|
idx++;
|
|
}
|
|
//addExtra(jg, "is snapshot of", Joiner.on(", ").join(resourceReader.getIsSnapshotOfs(res)));
|
|
|
|
jg.writeEndArray();
|
|
|
|
jg.writeEndObject();
|
|
jg.close();
|
|
return out.toString("UTF-8");
|
|
}
|
|
|
|
protected String getJsonForSoftware(final Resource res, final String resNameForCatalogue, final String datasourceName)
|
|
throws IOException, AriadnePlusPublisherException {
|
|
JsonFactory jsonFactory = new JsonFactory();
|
|
final ByteArrayOutputStream out = new ByteArrayOutputStream();
|
|
BufferedOutputStream bos = new BufferedOutputStream(out);
|
|
JsonGenerator jg = jsonFactory.createGenerator(bos, JsonEncoding.UTF8);
|
|
jg.writeStartObject();
|
|
writeCommonFields(jg, res, resNameForCatalogue, datasourceName);
|
|
|
|
jg.writeArrayFieldStart("extras");
|
|
addExtra(jg, "system:type", CKANUtils.Software_type);
|
|
//specific class
|
|
addExtra(jg, "instance of", resourceReader.findSpecificType(res, CRM.E70_Thing).getLocalName());
|
|
if (res.getURI().startsWith(ARIADNEPLUS_BASE_URL)) {
|
|
addExtra(jg, "AriadnePlus URL", res.getURI());
|
|
}
|
|
else addExtra(jg, "URL", res.getURI());
|
|
addIdentifiers(res, jg);
|
|
addExtra(jg, "subject", Joiner.on(", ").join(resourceReader.getSubjects(res)));
|
|
addExtra(jg, "has type", Joiner.on(", ").join(resourceReader.getHasTypeLabels(res)));
|
|
int idx = 1;
|
|
Iterator<String> hosted = resourceReader.getHostedBys(res);
|
|
while(hosted.hasNext()){
|
|
addExtra(jg, String.format("hosted by (%d)", idx), hosted.next());
|
|
idx++;
|
|
}
|
|
//addExtra(jg, "hosted by", Joiner.on(", ").join(resourceReader.getHostedBys(res)));
|
|
idx = 1;
|
|
Iterator<String> curated = resourceReader.getCuratorUrls(res);
|
|
while(curated.hasNext()){
|
|
addExtra(jg, String.format("curated by (%d)", idx), curated.next());
|
|
idx++;
|
|
}
|
|
//addExtra(jg, "curated by", Joiner.on(", ").join(resourceReader.getCuratorUrls(res)));
|
|
idx = 1;
|
|
Iterator<String> hasSnapshot = resourceReader.getSnapshots(res);
|
|
while(hasSnapshot.hasNext()){
|
|
addExtra(jg, String.format("has snapshot (%d)", idx), hasSnapshot.next());
|
|
idx++;
|
|
}
|
|
//addExtra(jg, "has snapshot", Joiner.on(", ").join(resourceReader.getSnapshots(res)));
|
|
idx = 1;
|
|
Iterator<String> isSnapshot = resourceReader.getIsSnapshotOfs(res);
|
|
while(isSnapshot.hasNext()){
|
|
addExtra(jg, String.format("is snapshot (%d)", idx), isSnapshot.next());
|
|
idx++;
|
|
}
|
|
//addExtra(jg, "is snapshot of", Joiner.on(", ").join(resourceReader.getIsSnapshotOfs(res)));
|
|
idx = 1;
|
|
Iterator<String> isPart = resourceReader.getIsPartOfUrls(res);
|
|
while(isPart.hasNext()){
|
|
addExtra(jg, String.format("is part of (%d)", idx), isPart.next());
|
|
idx++;
|
|
}
|
|
//addExtra(jg, "is part of", Joiner.on(", ").join(resourceReader.getIsPartOfUrls(res)));
|
|
idx = 1;
|
|
Iterator<String> hasPart = resourceReader.getHasPartUrls(res);
|
|
while(hasPart.hasNext()){
|
|
addExtra(jg, String.format("has part (%d)", idx), hasPart.next());
|
|
idx++;
|
|
}
|
|
//addExtra(jg, "has part", Joiner.on(", ").join(resourceReader.getHasPartUrls(res)));
|
|
idx = 1;
|
|
Iterator<String> hasRelease = resourceReader.getHasReleases(res);
|
|
while(hasRelease.hasNext()){
|
|
addExtra(jg, String.format("has release (%d)", idx), hasRelease.next());
|
|
idx++;
|
|
}
|
|
//addExtra(jg, "has release", Joiner.on(", ").join(resourceReader.getHasReleases(res)));
|
|
idx = 1;
|
|
Iterator<String> isRelease = resourceReader.getIsReleaseOfs(res);
|
|
while(isRelease.hasNext()){
|
|
addExtra(jg, String.format("is release (%d)", idx), isRelease.next());
|
|
idx++;
|
|
}
|
|
//addExtra(jg, "is release of", Joiner.on(", ").join(resourceReader.getIsReleaseOfs(res)));
|
|
idx = 1;
|
|
Iterator<String> used = resourceReader.getUsedBy(res);
|
|
while(used.hasNext()){
|
|
addExtra(jg, String.format("used by (%d)", idx), used.next());
|
|
idx++;
|
|
}
|
|
//addExtra(jg, "used by", Joiner.on(", ").join(resourceReader.getUsedBy(res)));
|
|
addExtra(jg, "creation time", resourceReader.getFirstCreationTime(res));
|
|
|
|
jg.writeEndArray();
|
|
|
|
jg.writeEndObject();
|
|
jg.close();
|
|
return out.toString("UTF-8");
|
|
}
|
|
|
|
protected String getJsonForCollection(final Resource res, final String resNameForCatalogue, final String datasourceName)
|
|
throws IOException, AriadnePlusPublisherException {
|
|
JsonFactory jsonFactory = new JsonFactory();
|
|
final ByteArrayOutputStream out = new ByteArrayOutputStream();
|
|
BufferedOutputStream bos = new BufferedOutputStream(out);
|
|
JsonGenerator jg = jsonFactory.createGenerator(bos, JsonEncoding.UTF8);
|
|
jg.writeStartObject();
|
|
writeCommonFields(jg, res, resNameForCatalogue, datasourceName);
|
|
|
|
jg.writeArrayFieldStart("extras");
|
|
addExtra(jg, "system:type", CKANUtils.Collection_type);
|
|
//specific class
|
|
addExtra(jg, "instance of", resourceReader.findSpecificType(res, CRM.E70_Thing).getLocalName());
|
|
if (res.getURI().startsWith(ARIADNEPLUS_BASE_URL)) {
|
|
addExtra(jg, "AriadnePlus URL", res.getURI());
|
|
}
|
|
else addExtra(jg, "URL", res.getURI());
|
|
addIdentifiers(res, jg);
|
|
addExtra(jg, "has type", Joiner.on(", ").join(resourceReader.getHasTypeLabels(res)));
|
|
addExtra(jg, "subject", Joiner.on(", ").join(resourceReader.getSubjects(res)));
|
|
addExtra(jg, "temporal coverage", Joiner.on(", ").join(resourceReader.getTemporalCoverages(res)));
|
|
addExtra(jg, "spatial coverage", Joiner.on(", ").join(resourceReader.getSpatialCoverages(res)));
|
|
int idx = 1;
|
|
Iterator<String> hasPart = resourceReader.getHasPartUrls(res);
|
|
while(hasPart.hasNext()){
|
|
addExtra(jg, String.format("has part (%d)", idx), hasPart.next());
|
|
idx++;
|
|
}
|
|
//addExtra(jg, "has part", Joiner.on(", ").join(resourceReader.getHasPartUrls(res)));
|
|
idx = 1;
|
|
Iterator<String> hosted = resourceReader.getHostedBys(res);
|
|
while(hosted.hasNext()){
|
|
addExtra(jg, String.format("hosted by (%d)", idx), hosted.next());
|
|
idx++;
|
|
}
|
|
//addExtra(jg, "hosted by", Joiner.on(", ").join(resourceReader.getHostedBys(res)));
|
|
idx = 1;
|
|
Iterator<String> curated = resourceReader.getCuratorUrls(res);
|
|
while(curated.hasNext()){
|
|
addExtra(jg, String.format("curated by (%d)", idx), curated.next());
|
|
idx++;
|
|
}
|
|
//addExtra(jg, "curated by", Joiner.on(", ").join(resourceReader.getCuratorUrls(res)));
|
|
idx = 1;
|
|
Iterator<String> creators = resourceReader.getCreatorsURIs(res);
|
|
while(creators.hasNext()){
|
|
addExtra(jg, String.format("creator (%d)", idx), creators.next());
|
|
idx++;
|
|
}
|
|
//addExtra(jg, "creator", Joiner.on(", ").join(resourceReader.getCreatorsURIs(res)));
|
|
addExtra(jg, "languages", Joiner.on(", ").join(resourceReader.getLanguages(res)));
|
|
|
|
jg.writeEndArray();
|
|
|
|
jg.writeEndObject();
|
|
jg.close();
|
|
return out.toString("UTF-8");
|
|
}
|
|
|
|
|
|
protected String getJsonForDesignProcedure(final Resource res, final String resNameForCatalogue, final String datasourceName)
|
|
throws IOException, AriadnePlusPublisherException {
|
|
JsonFactory jsonFactory = new JsonFactory();
|
|
final ByteArrayOutputStream out = new ByteArrayOutputStream();
|
|
BufferedOutputStream bos = new BufferedOutputStream(out);
|
|
JsonGenerator jg = jsonFactory.createGenerator(bos, JsonEncoding.UTF8);
|
|
jg.writeStartObject();
|
|
writeCommonFields(jg, res, resNameForCatalogue, datasourceName);
|
|
|
|
jg.writeArrayFieldStart("extras");
|
|
addExtra(jg, "system:type", CKANUtils.DesignOrProcedure_type);
|
|
//specific class
|
|
addExtra(jg, "instance of", resourceReader.findSpecificType(res, CRM.E29_Design_or_Procedure).getLocalName());
|
|
if (res.getURI().startsWith(ARIADNEPLUS_BASE_URL)) {
|
|
addExtra(jg, "AriadnePlus URL", res.getURI());
|
|
}
|
|
else addExtra(jg, "URL", res.getURI());
|
|
addIdentifiers(res, jg);
|
|
int idx = 1;
|
|
Iterator<String> used = resourceReader.getUsedBy(res);
|
|
while(used.hasNext()){
|
|
addExtra(jg, String.format("used by (%d)", idx), used.next());
|
|
idx++;
|
|
}
|
|
//addExtra(jg, "used by", Joiner.on(", ").join(resourceReader.getUsedBy(res)));
|
|
//TODO: add additional metadata for E29_Design_or_Procedure, if any
|
|
jg.writeEndArray();
|
|
|
|
jg.writeEndObject();
|
|
jg.close();
|
|
return out.toString("UTF-8");
|
|
}
|
|
|
|
protected void addIdentifiers(final Resource res, final JsonGenerator jg ) throws IOException {
|
|
/*
|
|
<${subjectURL}> crm:P1_is_identified_by ?IDRes .
|
|
?IDRes a crm:E42_Identifier .
|
|
?IDRes rdfs:label ?ID_label .
|
|
*/
|
|
StmtIterator it = res.listProperties(CRM.P1_is_identified_by);
|
|
Set<String> ids = Sets.newHashSet();
|
|
while(it.hasNext()){
|
|
RDFNode obj = it.next().getObject();
|
|
if(obj.isLiteral()) ids.add(obj.asLiteral().getLexicalForm());
|
|
else {
|
|
Resource id = (Resource) obj;
|
|
if (id.hasProperty(RDF.type, CRM.E42_Identifier)) {
|
|
ids.add(resourceReader.getLabel(id));
|
|
}
|
|
}
|
|
}
|
|
addExtra(jg, "ID", String.join(",", ids));
|
|
}
|
|
|
|
protected void addExtra(final JsonGenerator jg, final String key, final String value) throws IOException {
|
|
if(StringUtils.isNotBlank(value)) {
|
|
jg.writeStartObject();
|
|
jg.writeStringField("key", key);
|
|
jg.writeStringField("value", value);
|
|
jg.writeEndObject();
|
|
}
|
|
}
|
|
|
|
|
|
|
|
protected void writeCommonFields(final JsonGenerator jg, final Resource res, final String resNameForCatalogue, final String datasourceName)
|
|
throws IOException, AriadnePlusPublisherException {
|
|
String ckanOrg = CKANUtils.getCKanOrg(datasourceName);
|
|
//id is available only for updates
|
|
if(StringUtils.isBlank(ckanOrg)) throw new AriadnePlusPublisherException(String.format("Cannot register %s : blank ckan org for data source with name %s", resNameForCatalogue, datasourceName));
|
|
//the owning organization, i.e. the data souce from which this resource has been collected from
|
|
jg.writeStringField("owner_org", ckanOrg);
|
|
jg.writeStringField("name", resNameForCatalogue);
|
|
//default license
|
|
jg.writeStringField("license_id", resourceReader.getCatalogueLicense(res).getId());
|
|
String title = resourceReader.getTitle(res);
|
|
if (StringUtils.isBlank(title))
|
|
title = resNameForCatalogue;
|
|
jg.writeStringField("title", title);
|
|
//description
|
|
jg.writeStringField("notes",Joiner.on(';').join(resourceReader.getDescriptions(res)));
|
|
//the names of all superclasses of the entity
|
|
jg.writeArrayFieldStart("tags");
|
|
Iterator<String> classNames = resourceReader.getRDFClassNames(res);
|
|
while (classNames.hasNext()) {
|
|
jg.writeStartObject();
|
|
jg.writeStringField("name", classNames.next());
|
|
jg.writeEndObject();
|
|
}
|
|
jg.writeEndArray();
|
|
}
|
|
|
|
|
|
public ResourceReader getResourceReader() {
|
|
return resourceReader;
|
|
}
|
|
|
|
public void setResourceReader(final ResourceReader resourceReader) {
|
|
this.resourceReader = resourceReader;
|
|
}
|
|
|
|
public CatalogueAPIClient getCatalogueAPIClient() {
|
|
return catalogueAPIClient;
|
|
}
|
|
|
|
public void setCatalogueAPIClient(final CatalogueAPIClient catalogueAPIClient) {
|
|
this.catalogueAPIClient = catalogueAPIClient;
|
|
}
|
|
}
|