package eu.dnetlib.ariadneplus.catalogue; import java.io.BufferedOutputStream; import java.io.ByteArrayOutputStream; import java.io.IOException; import java.net.URISyntaxException; import java.util.Iterator; import java.util.List; import java.util.Set; import com.fasterxml.jackson.core.JsonEncoding; import com.fasterxml.jackson.core.JsonFactory; import com.fasterxml.jackson.core.JsonGenerator; import com.google.common.base.Joiner; import com.google.common.collect.Iterators; import com.google.common.collect.Lists; import com.google.common.collect.Sets; import eu.dnetlib.ariadneplus.CRM; import eu.dnetlib.ariadneplus.publisher.AriadnePlusPublisherException; import eu.dnetlib.ariadneplus.rdf.ResourceReader; import org.apache.commons.lang3.StringUtils; import org.apache.commons.logging.Log; import org.apache.commons.logging.LogFactory; import org.apache.jena.rdf.model.RDFNode; import org.apache.jena.rdf.model.Resource; import org.apache.jena.rdf.model.StmtIterator; import org.apache.jena.vocabulary.RDF; import org.springframework.beans.factory.annotation.Autowired; import org.springframework.stereotype.Component; /** * Created by Alessia Bardi on 21/11/2017. * * @author Alessia Bardi */ @Component public class CatalogueRegistrator { private static final Log log = LogFactory.getLog(CatalogueRegistrator.class); private final String ARIADNEPLUS_BASE_URL = "http://ariadneplus.d4science.org"; @Autowired private ResourceReader resourceReader; @Autowired private CatalogueAPIClient catalogueAPIClient; public String register(final Resource resource, final Resource type, final String datasourceName) throws IOException, AriadnePlusPublisherException, URISyntaxException, InterruptedException { String resURI = resource.getURI(); log.debug(String.format("Catalogue --> Processing resource : %s with type: %s from source: %s", resURI, type.getLocalName(), datasourceName)); String resCatName = catalogueAPIClient.getNameForCatalogue(resURI.substring(resURI.lastIndexOf("handle/") + 7)); if(catalogueAPIClient.isRegistered(resCatName)){ log.debug(resCatName+ " is already registered"); String json = getJson(type, resource, resCatName, datasourceName); catalogueAPIClient.doUpdate(json, resCatName); } else { //resource not yet registered String json = getJson(type, resource, resCatName, datasourceName); if(!catalogueAPIClient.doRegister(json, resCatName)){ log.warn(String.format("%s could not be registered even the second time, giving up", resURI)); return null; } } log.debug(String.format("%s registered on the catalogue with name: %s", resURI, resCatName)); return resCatName; } protected boolean purge(final String resCatName) throws URISyntaxException, AriadnePlusPublisherException { return catalogueAPIClient.purgeItem(resCatName); } protected String getJson(final Resource type, final Resource resource, final String resNameForCatalogue, final String datasourceName) throws IOException, AriadnePlusPublisherException { switch (type.getLocalName()) { case "E29_Design_or_Procedure": return getJsonForDesignProcedure(resource, resNameForCatalogue, datasourceName); case "D14_Software": return getJsonForSoftware(resource, resNameForCatalogue, datasourceName); case "PE35_Project": return getJsonForProject(resource, resNameForCatalogue, datasourceName); case "PE1_Service": return getJsonForService(resource, resNameForCatalogue, datasourceName); case "E39_Actor": return getJsonForActor(resource, resNameForCatalogue, datasourceName); case "PE18_Dataset": return getJsonForDataset(resource, resNameForCatalogue, datasourceName); case "E78_Collection": return getJsonForCollection(resource, resNameForCatalogue, datasourceName); default: throw new IllegalArgumentException(String.format("Type " + type.getLocalName() + " not supported")); } } protected String getJsonForProject(final Resource res, final String resNameForCatalogue, final String datasourceName) throws IOException, AriadnePlusPublisherException { JsonFactory jsonFactory = new JsonFactory(); final ByteArrayOutputStream out = new ByteArrayOutputStream(); BufferedOutputStream bos = new BufferedOutputStream(out); JsonGenerator jg = jsonFactory.createGenerator(bos, JsonEncoding.UTF8); jg.writeStartObject(); writeCommonFields(jg, res, resNameForCatalogue, datasourceName); //Only RI_Project are linked to RIs that must be used as groups List maintainer_RIs = Lists.newArrayList(resourceReader.getMaintainersLabels(res)); if(maintainer_RIs.size() > 0) { jg.writeArrayFieldStart("groups"); for(String ri : maintainer_RIs) { String group = CKANUtils.getCkanGroup(ri); if(StringUtils.isNotBlank(group)) { jg.writeStartObject(); jg.writeStringField("name", group); jg.writeEndObject(); } } jg.writeEndArray(); } jg.writeStringField("maintainer", Joiner.on(", ").join(resourceReader.getMaintainersLabels(res))); //TODO: it should be better to identify email contacts rather than generic contact labels of maintainer //jg.writeStringField("maintainer_email", Joiner.on(", ").join(resourceReader.getMaintainerContacts(res))); jg.writeArrayFieldStart("extras"); addExtra(jg, "system:type", CKANUtils.Project_type); //specific class addExtra(jg, "instance of", resourceReader.findSpecificType(res, CRM.E7_Activity).getLocalName()); if (res.getURI().startsWith(ARIADNEPLUS_BASE_URL)) addExtra(jg, "AriadnePlus URL", res.getURI()); else addExtra(jg, "URL", res.getURI()); addIdentifiers(res, jg); addExtra(jg, "started on", resourceReader.getStartTime(res)); int idx = 1; Iterator maintainers = resourceReader.getMaintainerUrls(res); while(maintainers.hasNext()){ addExtra(jg, String.format("maintaining team (%d)", idx), maintainers.next()); idx++; } //addExtra(jg, "maintaining team", Joiner.on(", ").join(resourceReader.getMaintainerUrls(res))); idx = 1; Iterator services = resourceReader.getOfferedServiceUrls(res); while(services.hasNext()){ addExtra(jg, String.format("offers (%d)", idx), services.next()); idx++; } //addExtra(jg, "offers", Joiner.on(", ").join(resourceReader.getOfferedServiceUrls(res))); jg.writeEndArray(); //end extras jg.writeEndObject(); jg.close(); return out.toString("UTF-8"); } protected String getJsonForService(final Resource res, final String resNameForCatalogue, final String datasourceName) throws IOException, AriadnePlusPublisherException { JsonFactory jsonFactory = new JsonFactory(); final ByteArrayOutputStream out = new ByteArrayOutputStream(); BufferedOutputStream bos = new BufferedOutputStream(out); JsonGenerator jg = jsonFactory.createGenerator(bos, JsonEncoding.UTF8); jg.writeStartObject(); writeCommonFields(jg, res, resNameForCatalogue, datasourceName); jg.writeStringField("maintainer", Joiner.on(", ").join(resourceReader.getMaintainersLabels(res))); //TODO: it should be better to identify email contacts rather than generic contact labels of maintainer //jg.writeStringField("maintainer_email", Joiner.on(", ").join(resourceReader.getMaintainerContacts(res))); jg.writeArrayFieldStart("extras"); addExtra(jg, "system:type", CKANUtils.Service_type); //specific class addExtra(jg, "instance of", resourceReader.findSpecificType(res, CRM.E7_Activity).getLocalName()); if (res.getURI().startsWith(ARIADNEPLUS_BASE_URL)) addExtra(jg, "AriadnePlus URL", res.getURI()); else addExtra(jg, "URL", res.getURI()); addIdentifiers(res, jg); addExtra(jg, "competence", Joiner.on(", ").join(resourceReader.getCompetences(res))); addExtra(jg, "activity type", Joiner.on(", ").join(resourceReader.getActivityTypes(res))); //condition of use (Rights) addExtra(jg, "condition of use", resourceReader.getConditionOfUse(res)); int idx = 1; Iterator contacts = Iterators.concat(resourceReader.getResourceDirectContactPointsURI(res), resourceReader.getProviderContactPoints(res)); while(contacts.hasNext()){ addExtra(jg, String.format("contact points (%d)", idx), contacts.next()); idx++; } //addExtra(jg, "contact points", Joiner.on(", ").join(Iterators.concat(resourceReader.getResourceDirectContactPointsURI(res), resourceReader.getProviderContactPoints(res)))); idx = 1; Iterator providers = resourceReader.getProviderUris(res); while(providers.hasNext()){ addExtra(jg, String.format("provided by (%d)", idx), providers.next()); idx++; } //addExtra(jg, "provided by", Joiner.on(", ").join(resourceReader.getProviderUris(res))); idx = 1; Iterator points = resourceReader.getAccessPoints(res); while(points.hasNext()){ addExtra(jg, String.format("online access point (%d)", idx), points.next()); idx++; } //addExtra(jg, "online access point", Joiner.on(", ").join(resourceReader.getAccessPoints(res))); addExtra(jg, "protocol", Joiner.on(", ").join(resourceReader.getProtocols(res))); idx = 1; Iterator delivers = resourceReader.getDeliversOnRequest(res); while(delivers.hasNext()){ addExtra(jg, String.format("delivers on request (%d)", idx), delivers.next()); idx++; } //addExtra(jg, "delivers on request", Joiner.on(", ").join(resourceReader.getDeliversOnRequest(res))); idx = 1; Iterator runs = resourceReader.getRunsOnRequest(res); while(runs.hasNext()){ addExtra(jg, String.format("runs on request (%d)", idx), runs.next()); idx++; } //addExtra(jg, "runs on request", Joiner.on(", ").join(resourceReader.getRunsOnRequest(res))); idx = 1; Iterator hosts = resourceReader.getHostedStuff(res); while(hosts.hasNext()){ addExtra(jg, String.format("hosts (%d)", idx), hosts.next()); idx++; } //addExtra(jg, "hosts", Joiner.on(", ").join(resourceReader.getHostedStuff(res))); idx = 1; Iterator curates = resourceReader.getCuratedObjects(res); while(curates.hasNext()){ addExtra(jg, String.format("curates (%d)", idx), curates.next()); idx++; } //addExtra(jg, "curates", Joiner.on(", ").join(resourceReader.getCuratedObjects(res))); addExtra(jg, "declared begin/end of operation", Joiner.on(", ").join(resourceReader.getDeclarativeTimes(res))); addExtra(jg, "availability", resourceReader.getAvailability(res)); idx = 1; Iterator plans = resourceReader.getCurationPlans(res); while(plans.hasNext()){ addExtra(jg, String.format("uses curation plan (%d)", idx), plans.next()); idx++; } //addExtra(jg, "uses curation plan", Joiner.on(", ").join(resourceReader.getCurationPlans(res))); addExtra(jg, "time of service", Joiner.on(", ").join(resourceReader.getDeclarativeTimes(res))); //TODO: where to get it? //addExtra(jg, "last confirmation", ""); //TODO: where to get it? //addExtra(jg, "date of registration", ""); jg.writeEndArray(); //end extras jg.writeEndObject(); jg.close(); return out.toString("UTF-8"); } protected String getJsonForActor(final Resource res, final String resNameForCatalogue, final String datasourceName) throws IOException, AriadnePlusPublisherException { JsonFactory jsonFactory = new JsonFactory(); final ByteArrayOutputStream out = new ByteArrayOutputStream(); BufferedOutputStream bos = new BufferedOutputStream(out); JsonGenerator jg = jsonFactory.createGenerator(bos, JsonEncoding.UTF8); jg.writeStartObject(); writeCommonFields(jg, res, resNameForCatalogue, datasourceName); jg.writeArrayFieldStart("extras"); addExtra(jg, "system:type", CKANUtils.Actor_type); //specific class addExtra(jg, "instance of", resourceReader.findSpecificType(res, CRM.E39_Actor).getLocalName()); if (res.getURI().startsWith(ARIADNEPLUS_BASE_URL)) addExtra(jg, "AriadnePlus URL", res.getURI()); else addExtra(jg, "URL", res.getURI()); addIdentifiers(res, jg); addExtra(jg, "has type", Joiner.on(", ").join(resourceReader.getHasTypeLabels(res))); int idx = 1; Iterator hasMembers = resourceReader.getMemberUrls(res); while(hasMembers.hasNext()){ addExtra(jg, String.format("has member (%d)", idx), hasMembers.next()); idx++; } //addExtra(jg, "has member", Joiner.on(", ").join(resourceReader.getMemberUrls(res))); idx = 1; Iterator isMembers = resourceReader.isMemberOf(res); while(isMembers.hasNext()){ addExtra(jg, String.format("is member of (%d)", idx), isMembers.next()); idx++; } //addExtra(jg, "is member of", Joiner.on(", ").join(resourceReader.isMemberOf(res))); idx = 1; Iterator provides = resourceReader.getProvidedServiceUrls(res); while(provides.hasNext()){ addExtra(jg, String.format("provides (%d)", idx), provides.next()); idx++; } //addExtra(jg, "provides", Joiner.on(", ").join(resourceReader.getProvidedServiceUrls(res))); idx = 1; String contactPoints = ""; StmtIterator it = res.listProperties(CRM.P76_has_contact_point); while(it.hasNext()) { Resource cp = it.next().getResource(); Resource cpType = cp.getPropertyResourceValue(CRM.P2_has_type); String cpTypeLabel = resourceReader.getLabel(cpType); String cpLabel = resourceReader.getLabel(cp); if (StringUtils.isNotBlank(cpLabel)) { if (StringUtils.isNotBlank(cpTypeLabel)) { addExtra(jg,String.format("contact point (%d) - %s ", idx, cpTypeLabel), cpLabel ); idx++; //contactPoints += cpTypeLabel + ": "; } else{ addExtra(jg,String.format("contact point (%d)", idx), cpLabel ); idx++; //contactPoints += cpLabel + "; "; } } else{ addExtra(jg,String.format("contact point (%d)", idx), cp.getURI()); idx++; } } // addExtra(jg,"contact points", contactPoints ); idx = 1; Iterator maintains = resourceReader.getMaintainedUrls(res); while(maintains.hasNext()){ addExtra(jg, String.format("maintains (%d)", idx), maintains.next()); idx++; } //addExtra(jg, "maintains", Joiner.on(", ").join(resourceReader.getMaintainedUrls(res))); jg.writeEndArray(); jg.writeEndObject(); jg.close(); return out.toString("UTF-8"); } protected String getJsonForDataset(final Resource res, final String resNameForCatalogue, final String datasourceName) throws IOException, AriadnePlusPublisherException { JsonFactory jsonFactory = new JsonFactory(); final ByteArrayOutputStream out = new ByteArrayOutputStream(); BufferedOutputStream bos = new BufferedOutputStream(out); JsonGenerator jg = jsonFactory.createGenerator(bos, JsonEncoding.UTF8); jg.writeStartObject(); writeCommonFields(jg, res, resNameForCatalogue, datasourceName); jg.writeArrayFieldStart("extras"); addExtra(jg, "system:type", CKANUtils.Dataset_type); //specific class addExtra(jg, "instance of", resourceReader.findSpecificType(res, CRM.E70_Thing).getLocalName()); if (res.getURI().startsWith(ARIADNEPLUS_BASE_URL)) { addExtra(jg, "AriadnePlus URL", res.getURI()); } else addExtra(jg, "URL", res.getURI()); addIdentifiers(res, jg); addExtra(jg, "has type", Joiner.on(", ").join(resourceReader.getHasTypeLabels(res))); int idx = 1; Iterator isPartOf = resourceReader.getIsPartOfUrls(res); while(isPartOf.hasNext()){ addExtra(jg, String.format("is part of (%d)", idx), isPartOf.next()); idx++; } //addExtra(jg, "is part of", Joiner.on(", ").join(resourceReader.getIsPartOfUrls(res))); idx = 1; Iterator hasPart = resourceReader.getHasPartUrls(res); while(hasPart.hasNext()){ addExtra(jg, String.format("has part (%d)", idx), hasPart.next()); idx++; } //addExtra(jg, "has part", Joiner.on(", ").join(resourceReader.getHasPartUrls(res))); idx = 1; Iterator curators = resourceReader.getCuratorUrls(res); while(curators.hasNext()){ addExtra(jg, String.format("curated by (%d)", idx), curators.next()); idx++; } //addExtra(jg, "curated by", Joiner.on(", ").join(resourceReader.getCuratorUrls(res))); idx = 1; Iterator curationplans = resourceReader.getResourceCuratorCurationPlans(res); while(curationplans.hasNext()){ addExtra(jg, String.format("curation plan (%d)", idx), curationplans.next()); idx++; } //addExtra(jg, "curation plan", Joiner.on(", ").join(resourceReader.getResourceCuratorCurationPlans(res))); idx = 1; Iterator hostedbys = resourceReader.getHostedBys(res); while(hostedbys.hasNext()){ addExtra(jg, String.format("hosted by (%d)", idx), hostedbys.next()); idx++; } //addExtra(jg, "hosted by", Joiner.on(", ").join(resourceReader.getHostedBys(res))); addExtra(jg, "encoding type", Joiner.on(", ").join(resourceReader.getEncodings(res))); idx = 1; Iterator creators = resourceReader.getCreatorsURIs(res); while(creators.hasNext()){ addExtra(jg, String.format("creator (%d)", idx), creators.next()); idx++; } //addExtra(jg, "creator", Joiner.on(", ").join(resourceReader.getCreatorsURIs(res))); idx = 1; Iterator sw = resourceReader.getUsedSoftware(res); while(sw.hasNext()){ addExtra(jg, String.format("used software (%d)", idx), sw.next()); idx++; } addExtra(jg, "subject", Joiner.on(", ").join(resourceReader.getSubjects(res))); addExtra(jg, "temporal coverage", Joiner.on(", ").join(resourceReader.getTemporalCoverages(res))); addExtra(jg, "spatial coverage", Joiner.on(", ").join(resourceReader.getSpatialCoverages(res))); idx = 1; Iterator usedbys = resourceReader.getUsedBy(res); while(usedbys.hasNext()){ addExtra(jg, String.format("used by (%d)", idx), usedbys.next()); idx++; } //addExtra(jg, "used by", Joiner.on(", ").join(resourceReader.getUsedBy(res))); addExtra(jg, "languages", Joiner.on(", ").join(resourceReader.getLanguages(res))); idx = 1; Iterator metadata = resourceReader.getMetadata(res); while(metadata.hasNext()){ addExtra(jg, String.format("has metadata (%d)", idx), metadata.next()); idx++; } //addExtra(jg, "has metadata", Joiner.on(", ").join(resourceReader.getMetadata(res))); idx = 1; Iterator metadataFor = resourceReader.getDescribedDataset(res); while(metadataFor.hasNext()){ addExtra(jg, String.format("is metadata for (%d)", idx), metadataFor.next()); idx++; } //addExtra(jg, "is metadata for", Joiner.on(", ").join(resourceReader.getDescribedDataset(res))); idx = 1; Iterator snaphsots = resourceReader.getSnapshots(res); while(snaphsots.hasNext()){ addExtra(jg, String.format("has snapshot (%d)", idx), snaphsots.next()); idx++; } //addExtra(jg, "has snapshot", Joiner.on(", ").join(resourceReader.getSnapshots(res))); idx = 1; Iterator issnaphsots = resourceReader.getIsSnapshotOfs(res); while(issnaphsots.hasNext()){ addExtra(jg, String.format("is snapshot of (%d)", idx), issnaphsots.next()); idx++; } //addExtra(jg, "is snapshot of", Joiner.on(", ").join(resourceReader.getIsSnapshotOfs(res))); jg.writeEndArray(); jg.writeEndObject(); jg.close(); return out.toString("UTF-8"); } protected String getJsonForSoftware(final Resource res, final String resNameForCatalogue, final String datasourceName) throws IOException, AriadnePlusPublisherException { JsonFactory jsonFactory = new JsonFactory(); final ByteArrayOutputStream out = new ByteArrayOutputStream(); BufferedOutputStream bos = new BufferedOutputStream(out); JsonGenerator jg = jsonFactory.createGenerator(bos, JsonEncoding.UTF8); jg.writeStartObject(); writeCommonFields(jg, res, resNameForCatalogue, datasourceName); jg.writeArrayFieldStart("extras"); addExtra(jg, "system:type", CKANUtils.Software_type); //specific class addExtra(jg, "instance of", resourceReader.findSpecificType(res, CRM.E70_Thing).getLocalName()); if (res.getURI().startsWith(ARIADNEPLUS_BASE_URL)) { addExtra(jg, "AriadnePlus URL", res.getURI()); } else addExtra(jg, "URL", res.getURI()); addIdentifiers(res, jg); addExtra(jg, "subject", Joiner.on(", ").join(resourceReader.getSubjects(res))); addExtra(jg, "has type", Joiner.on(", ").join(resourceReader.getHasTypeLabels(res))); int idx = 1; Iterator hosted = resourceReader.getHostedBys(res); while(hosted.hasNext()){ addExtra(jg, String.format("hosted by (%d)", idx), hosted.next()); idx++; } //addExtra(jg, "hosted by", Joiner.on(", ").join(resourceReader.getHostedBys(res))); idx = 1; Iterator curated = resourceReader.getCuratorUrls(res); while(curated.hasNext()){ addExtra(jg, String.format("curated by (%d)", idx), curated.next()); idx++; } //addExtra(jg, "curated by", Joiner.on(", ").join(resourceReader.getCuratorUrls(res))); idx = 1; Iterator hasSnapshot = resourceReader.getSnapshots(res); while(hasSnapshot.hasNext()){ addExtra(jg, String.format("has snapshot (%d)", idx), hasSnapshot.next()); idx++; } //addExtra(jg, "has snapshot", Joiner.on(", ").join(resourceReader.getSnapshots(res))); idx = 1; Iterator isSnapshot = resourceReader.getIsSnapshotOfs(res); while(isSnapshot.hasNext()){ addExtra(jg, String.format("is snapshot (%d)", idx), isSnapshot.next()); idx++; } //addExtra(jg, "is snapshot of", Joiner.on(", ").join(resourceReader.getIsSnapshotOfs(res))); idx = 1; Iterator isPart = resourceReader.getIsPartOfUrls(res); while(isPart.hasNext()){ addExtra(jg, String.format("is part of (%d)", idx), isPart.next()); idx++; } //addExtra(jg, "is part of", Joiner.on(", ").join(resourceReader.getIsPartOfUrls(res))); idx = 1; Iterator hasPart = resourceReader.getHasPartUrls(res); while(hasPart.hasNext()){ addExtra(jg, String.format("has part (%d)", idx), hasPart.next()); idx++; } //addExtra(jg, "has part", Joiner.on(", ").join(resourceReader.getHasPartUrls(res))); idx = 1; Iterator hasRelease = resourceReader.getHasReleases(res); while(hasRelease.hasNext()){ addExtra(jg, String.format("has release (%d)", idx), hasRelease.next()); idx++; } //addExtra(jg, "has release", Joiner.on(", ").join(resourceReader.getHasReleases(res))); idx = 1; Iterator isRelease = resourceReader.getIsReleaseOfs(res); while(isRelease.hasNext()){ addExtra(jg, String.format("is release (%d)", idx), isRelease.next()); idx++; } //addExtra(jg, "is release of", Joiner.on(", ").join(resourceReader.getIsReleaseOfs(res))); idx = 1; Iterator used = resourceReader.getUsedBy(res); while(used.hasNext()){ addExtra(jg, String.format("used by (%d)", idx), used.next()); idx++; } //addExtra(jg, "used by", Joiner.on(", ").join(resourceReader.getUsedBy(res))); addExtra(jg, "creation time", resourceReader.getFirstCreationTime(res)); jg.writeEndArray(); jg.writeEndObject(); jg.close(); return out.toString("UTF-8"); } protected String getJsonForCollection(final Resource res, final String resNameForCatalogue, final String datasourceName) throws IOException, AriadnePlusPublisherException { JsonFactory jsonFactory = new JsonFactory(); final ByteArrayOutputStream out = new ByteArrayOutputStream(); BufferedOutputStream bos = new BufferedOutputStream(out); JsonGenerator jg = jsonFactory.createGenerator(bos, JsonEncoding.UTF8); jg.writeStartObject(); writeCommonFields(jg, res, resNameForCatalogue, datasourceName); jg.writeArrayFieldStart("extras"); addExtra(jg, "system:type", CKANUtils.Collection_type); //specific class addExtra(jg, "instance of", resourceReader.findSpecificType(res, CRM.E70_Thing).getLocalName()); if (res.getURI().startsWith(ARIADNEPLUS_BASE_URL)) { addExtra(jg, "AriadnePlus URL", res.getURI()); } else addExtra(jg, "URL", res.getURI()); addIdentifiers(res, jg); addExtra(jg, "has type", Joiner.on(", ").join(resourceReader.getHasTypeLabels(res))); addExtra(jg, "subject", Joiner.on(", ").join(resourceReader.getSubjects(res))); addExtra(jg, "temporal coverage", Joiner.on(", ").join(resourceReader.getTemporalCoverages(res))); addExtra(jg, "spatial coverage", Joiner.on(", ").join(resourceReader.getSpatialCoverages(res))); int idx = 1; Iterator hasPart = resourceReader.getHasPartUrls(res); while(hasPart.hasNext()){ addExtra(jg, String.format("has part (%d)", idx), hasPart.next()); idx++; } //addExtra(jg, "has part", Joiner.on(", ").join(resourceReader.getHasPartUrls(res))); idx = 1; Iterator hosted = resourceReader.getHostedBys(res); while(hosted.hasNext()){ addExtra(jg, String.format("hosted by (%d)", idx), hosted.next()); idx++; } //addExtra(jg, "hosted by", Joiner.on(", ").join(resourceReader.getHostedBys(res))); idx = 1; Iterator curated = resourceReader.getCuratorUrls(res); while(curated.hasNext()){ addExtra(jg, String.format("curated by (%d)", idx), curated.next()); idx++; } //addExtra(jg, "curated by", Joiner.on(", ").join(resourceReader.getCuratorUrls(res))); idx = 1; Iterator creators = resourceReader.getCreatorsURIs(res); while(creators.hasNext()){ addExtra(jg, String.format("creator (%d)", idx), creators.next()); idx++; } //addExtra(jg, "creator", Joiner.on(", ").join(resourceReader.getCreatorsURIs(res))); addExtra(jg, "languages", Joiner.on(", ").join(resourceReader.getLanguages(res))); jg.writeEndArray(); jg.writeEndObject(); jg.close(); return out.toString("UTF-8"); } protected String getJsonForDesignProcedure(final Resource res, final String resNameForCatalogue, final String datasourceName) throws IOException, AriadnePlusPublisherException { JsonFactory jsonFactory = new JsonFactory(); final ByteArrayOutputStream out = new ByteArrayOutputStream(); BufferedOutputStream bos = new BufferedOutputStream(out); JsonGenerator jg = jsonFactory.createGenerator(bos, JsonEncoding.UTF8); jg.writeStartObject(); writeCommonFields(jg, res, resNameForCatalogue, datasourceName); jg.writeArrayFieldStart("extras"); addExtra(jg, "system:type", CKANUtils.DesignOrProcedure_type); //specific class addExtra(jg, "instance of", resourceReader.findSpecificType(res, CRM.E29_Design_or_Procedure).getLocalName()); if (res.getURI().startsWith(ARIADNEPLUS_BASE_URL)) { addExtra(jg, "AriadnePlus URL", res.getURI()); } else addExtra(jg, "URL", res.getURI()); addIdentifiers(res, jg); int idx = 1; Iterator used = resourceReader.getUsedBy(res); while(used.hasNext()){ addExtra(jg, String.format("used by (%d)", idx), used.next()); idx++; } //addExtra(jg, "used by", Joiner.on(", ").join(resourceReader.getUsedBy(res))); //TODO: add additional metadata for E29_Design_or_Procedure, if any jg.writeEndArray(); jg.writeEndObject(); jg.close(); return out.toString("UTF-8"); } protected void addIdentifiers(final Resource res, final JsonGenerator jg ) throws IOException { /* <${subjectURL}> crm:P1_is_identified_by ?IDRes . ?IDRes a crm:E42_Identifier . ?IDRes rdfs:label ?ID_label . */ StmtIterator it = res.listProperties(CRM.P1_is_identified_by); Set ids = Sets.newHashSet(); while(it.hasNext()){ RDFNode obj = it.next().getObject(); if(obj.isLiteral()) ids.add(obj.asLiteral().getLexicalForm()); else { Resource id = (Resource) obj; if (id.hasProperty(RDF.type, CRM.E42_Identifier)) { ids.add(resourceReader.getLabel(id)); } } } addExtra(jg, "ID", String.join(",", ids)); } protected void addExtra(final JsonGenerator jg, final String key, final String value) throws IOException { if(StringUtils.isNotBlank(value)) { jg.writeStartObject(); jg.writeStringField("key", key); jg.writeStringField("value", value); jg.writeEndObject(); } } protected void writeCommonFields(final JsonGenerator jg, final Resource res, final String resNameForCatalogue, final String datasourceName) throws IOException, AriadnePlusPublisherException { String ckanOrg = CKANUtils.getCKanOrg(datasourceName); //id is available only for updates if(StringUtils.isBlank(ckanOrg)) throw new AriadnePlusPublisherException(String.format("Cannot register %s : blank ckan org for data source with name %s", resNameForCatalogue, datasourceName)); //the owning organization, i.e. the data souce from which this resource has been collected from jg.writeStringField("owner_org", ckanOrg); jg.writeStringField("name", resNameForCatalogue); //default license jg.writeStringField("license_id", resourceReader.getCatalogueLicense(res).getId()); String title = resourceReader.getTitle(res); if (StringUtils.isBlank(title)) title = resNameForCatalogue; jg.writeStringField("title", title); //description jg.writeStringField("notes",Joiner.on(';').join(resourceReader.getDescriptions(res))); //the names of all superclasses of the entity jg.writeArrayFieldStart("tags"); Iterator classNames = resourceReader.getRDFClassNames(res); while (classNames.hasNext()) { jg.writeStartObject(); jg.writeStringField("name", classNames.next()); jg.writeEndObject(); } jg.writeEndArray(); } public ResourceReader getResourceReader() { return resourceReader; } public void setResourceReader(final ResourceReader resourceReader) { this.resourceReader = resourceReader; } public CatalogueAPIClient getCatalogueAPIClient() { return catalogueAPIClient; } public void setCatalogueAPIClient(final CatalogueAPIClient catalogueAPIClient) { this.catalogueAPIClient = catalogueAPIClient; } }