package eu.dnetlib.organizations.utils;

import java.io.InputStream;
import java.nio.charset.StandardCharsets;
import java.time.OffsetDateTime;
import java.util.Arrays;
import java.util.HashMap;
import java.util.LinkedHashSet;
import java.util.List;
import java.util.Map;
import java.util.Objects;
import java.util.Optional;
import java.util.Set;
import java.util.UUID;
import java.util.function.Function;
import java.util.stream.Collectors;

import javax.transaction.Transactional;

import org.apache.commons.io.IOUtils;
import org.apache.commons.lang3.StringUtils;
import org.apache.commons.logging.Log;
import org.apache.commons.logging.LogFactory;
import org.springframework.beans.factory.annotation.Autowired;
import org.springframework.cache.annotation.Cacheable;
import org.springframework.jdbc.core.BeanPropertyRowMapper;
import org.springframework.jdbc.core.JdbcTemplate;
import org.springframework.stereotype.Component;
import org.springframework.web.bind.annotation.RequestBody;

import eu.dnetlib.organizations.controller.UserRole;
import eu.dnetlib.organizations.model.Acronym;
import eu.dnetlib.organizations.model.JournalEntry;
import eu.dnetlib.organizations.model.OpenaireConflictPK;
import eu.dnetlib.organizations.model.OpenaireDuplicate;
import eu.dnetlib.organizations.model.Organization;
import eu.dnetlib.organizations.model.OtherIdentifier;
import eu.dnetlib.organizations.model.OtherName;
import eu.dnetlib.organizations.model.Relationship;
import eu.dnetlib.organizations.model.Url;
import eu.dnetlib.organizations.model.User;
import eu.dnetlib.organizations.model.UserCountry;
import eu.dnetlib.organizations.model.utils.BrowseEntry;
import eu.dnetlib.organizations.model.utils.OrganizationConflict;
import eu.dnetlib.organizations.model.utils.TempBrowseEntry;
import eu.dnetlib.organizations.model.utils.VocabularyTerm;
import eu.dnetlib.organizations.model.view.OrganizationView;
import eu.dnetlib.organizations.model.view.UserView;
import eu.dnetlib.organizations.repository.AcronymRepository;
import eu.dnetlib.organizations.repository.JournalEntryRepository;
import eu.dnetlib.organizations.repository.OpenaireConflictRepository;
import eu.dnetlib.organizations.repository.OpenaireDuplicateRepository;
import eu.dnetlib.organizations.repository.OrganizationRepository;
import eu.dnetlib.organizations.repository.OtherIdentifierRepository;
import eu.dnetlib.organizations.repository.OtherNameRepository;
import eu.dnetlib.organizations.repository.RelationshipRepository;
import eu.dnetlib.organizations.repository.UrlRepository;
import eu.dnetlib.organizations.repository.UserCountryRepository;
import eu.dnetlib.organizations.repository.UserRepository;
import eu.dnetlib.organizations.repository.readonly.OrganizationViewRepository;

/**
 * Database helper component: groups the multi-repository operations on organizations,
 * duplicates, conflicts, users and journal entries, plus a few plain-SQL queries executed
 * through the {@link JdbcTemplate}.
 */
@Component
public class DatabaseUtils {

    @Autowired
    private AcronymRepository acronymRepository;
    @Autowired
    private OrganizationRepository organizationRepository;
    @Autowired
    private OtherIdentifierRepository otherIdentifierRepository;
    @Autowired
    private OtherNameRepository otherNameRepository;
    @Autowired
    private UrlRepository urlRepository;
    @Autowired
    private RelationshipRepository relationshipRepository;
    @Autowired
    private UserRepository userRepository;
    @Autowired
    private UserCountryRepository userCountryRepository;
    @Autowired
    private OpenaireConflictRepository openaireConflictRepository;
    @Autowired
    private OpenaireDuplicateRepository openaireDuplicateRepository;
    @Autowired
    private OrganizationViewRepository organizationViewRepository;
    @Autowired
    private JournalEntryRepository journalEntryRepository;
    @Autowired
    private JdbcTemplate jdbcTemplate;

    private static final Log log = LogFactory.getLog(DatabaseUtils.class);

    /**
     * Vocabulary tables that can be listed with {@link #listValuesOfVocabularyTable(VocabularyTable)}.
     * The constant name is concatenated into the SQL statement as the table name, so the
     * constants must keep their exact (lowercase) spelling.
     */
    public enum VocabularyTable {
        languages, countries, org_types, id_types, rel_types, simrel_types
    }

    /**
     * Saves the given organization and writes the corresponding journal entry.
     *
     * <p>The status of the saved organization is decided by the caller's role (see
     * {@code resolveNewStatus}). If the incoming id is blank or does not start with
     * {@code OpenOrgsConstants.OPENORGS_PREFIX}, a new record is created: simple users get a
     * random "pending" id, otherwise the id is cleared so that the DB generates it. When the
     * saved id differs from the incoming one, the duplicates registered for the old id are
     * copied to the new id as {@code suggested}, and the old record is deleted if it was a
     * pending one.
     *
     * @param orgView      the organization data to persist; its id may be overwritten by this method
     * @param user         the user performing the operation (stored in creation/modification/journal data)
     * @param isSimpleUser {@code true} for a non-admin user
     * @return the id of the saved organization
     * @throws RuntimeException with message "User not authorized" when a simple user edits an
     *                          existing organization that is not approved
     */
    @Transactional
    public String insertOrUpdateOrganization(final OrganizationView orgView, final String user, final boolean isSimpleUser) {

        final String oldId = StringUtils.isNotBlank(orgView.getId()) ? orgView.getId() : null;

        final String oldStatus = oldId != null
                ? organizationRepository.findById(oldId).map(Organization::getStatus).orElse(null)
                : null;

        final String newStatus = resolveNewStatus(oldStatus, isSimpleUser);

        if (oldId == null || !oldId.startsWith(OpenOrgsConstants.OPENORGS_PREFIX)) {
            if (isSimpleUser) {
                final String pendingId = OpenOrgsConstants.OPENORGS_PENDING_PREFIX + UUID.randomUUID();
                orgView.setId(pendingId);
                // to override the generation strategy of the ID
                organizationRepository.preparePendingOrg(pendingId);
            } else {
                orgView.setId(null); // The ID is generated by the DB
            }
        }

        final Organization org = new Organization(orgView.getId(),
                orgView.getName(),
                orgView.getType(),
                orgView.getLat(),
                orgView.getLng(),
                orgView.getCity(),
                orgView.getCountry(),
                newStatus,
                orgView.getEcLegalBody(),
                orgView.getEcLegalPerson(),
                orgView.getEcNonProfit(),
                orgView.getEcResearchOrganization(),
                orgView.getEcHigherEducation(),
                orgView.getEcInternationalOrganizationEurInterests(),
                orgView.getEcInternationalOrganization(),
                orgView.getEcEnterprise(),
                orgView.getEcSmeValidated(),
                orgView.getEcNutscode());

        final String newId = organizationRepository.save(org).getId();

        final OffsetDateTime now = OffsetDateTime.now();

        if (StringUtils.equals(newId, oldId)) {
            // Same record: the existing child rows are replaced
            makeRelations(newId, orgView, true);
        } else {
            organizationRepository.updateCreationDate(newId, user, now);
            makeRelations(newId, orgView, false);
            if (oldId != null) {
                // The duplicates of the old record are re-proposed (as "suggested") for the new one
                final List<OpenaireDuplicate> dups = openaireDuplicateRepository.findByLocalId(oldId)
                        .stream()
                        .map(d -> new OpenaireDuplicate(newId, d.getOaOriginalId(), SimilarityType.suggested.toString(), d.getOaCollectedFrom()))
                        .collect(Collectors.toList());

                openaireDuplicateRepository.saveAll(dups);
                stampDuplicates(dups, user, now);

                if (oldId.startsWith(OpenOrgsConstants.OPENORGS_PENDING_PREFIX)) {
                    organizationRepository.deleteById(oldId);
                }
            }
        }

        organizationRepository.updateModificationDate(newId, user, now);

        journalEntryRepository.save(newOrganizationJournalEntry(newId, oldId, oldStatus, newStatus, user));

        return newId;
    }

    /**
     * Decides the status to store for an organization that is being saved.
     *
     * @param oldStatus    the current status, or {@code null} if there is no existing record
     * @param isSimpleUser {@code true} for a non-admin user
     * @return {@code approved} for admins and for simple users editing an approved record,
     *         {@code suggested} for simple users creating a record
     * @throws RuntimeException if a simple user edits a record that is not approved
     */
    private String resolveNewStatus(final String oldStatus, final boolean isSimpleUser) {
        if (!isSimpleUser) {
            // IS ADMIN
            return OrganizationStatus.approved.toString();
        }
        if (oldStatus == null) {
            return OrganizationStatus.suggested.toString();
        }
        if (StringUtils.equals(oldStatus, OrganizationStatus.approved.toString())) {
            return OrganizationStatus.approved.toString();
        }
        throw new RuntimeException("User not authorized");
    }

    /**
     * Builds the journal entry that describes an insert/update performed by
     * {@link #insertOrUpdateOrganization(OrganizationView, String, boolean)}.
     * Falls back to {@code JournalOperations.UNKNOWN} with message "-" for any status
     * combination that is not explicitly handled.
     */
    private JournalEntry newOrganizationJournalEntry(final String newId,
            final String oldId,
            final String oldStatus,
            final String newStatus,
            final String user) {

        JournalOperations op = JournalOperations.UNKNOWN;
        String message = "-";

        if (newStatus.equals(OrganizationStatus.suggested.toString())) {
            if (oldStatus == null) {
                op = JournalOperations.NEW_SUGG_ORG;
                message = "Created a new suggested org";
            } else {
                op = JournalOperations.EDIT_SUGG_ORG;
                message = "Metadata updated";
            }
        } else if (newStatus.equals(OrganizationStatus.approved.toString())) {
            if (oldStatus == null) {
                op = JournalOperations.NEW_ORG;
                message = "Created a new organization";
            } else if (oldStatus.equals(OrganizationStatus.suggested.toString())) {
                op = JournalOperations.APPROVE_SUGG_ORG;
                message = "Approved the suggested org: " + oldId;
            } else {
                op = JournalOperations.EDIT_ORG;
                message = "Metadata updated";
            }
        }

        return new JournalEntry(newId, op, message, user);
    }

    /**
     * Saves the given duplicate relations and journals the operation once per local organization.
     *
     * <p>Relations whose original id starts with {@code OpenOrgsConstants.OPENORGS_PENDING_PREFIX}
     * are not saved: the organization with that id is deleted instead.
     *
     * @param simrels the duplicate relations to process
     * @param user    the user performing the operation
     */
    @Transactional
    public void saveDuplicates(final List<OpenaireDuplicate> simrels, final String user) {
        final OffsetDateTime now = OffsetDateTime.now();

        final List<OpenaireDuplicate> list = openaireDuplicateRepository.saveAll(simrels.stream()
                .filter(d -> !d.getOaOriginalId().startsWith(OpenOrgsConstants.OPENORGS_PENDING_PREFIX))
                .collect(Collectors.toList()));

        simrels.stream()
                .map(OpenaireDuplicate::getOaOriginalId)
                .filter(id -> id.startsWith(OpenOrgsConstants.OPENORGS_PENDING_PREFIX))
                .forEach(organizationRepository::deleteById);

        stampDuplicates(list, user, now);

        final String message = String.format("Duplicates updated (%s similars, %s differents, %s suggested)",
                countByRelType(list, SimilarityType.is_similar),
                countByRelType(list, SimilarityType.is_different),
                countByRelType(list, SimilarityType.suggested));

        list.stream()
                .map(OpenaireDuplicate::getLocalId)
                .distinct()
                .map(id -> new JournalEntry(id, JournalOperations.DUPLICATES, message, user))
                .forEach(journalEntryRepository::save);
    }

    /** Counts the duplicates having the given relation type (a missing rel type never matches). */
    private long countByRelType(final List<OpenaireDuplicate> duplicates, final SimilarityType type) {
        return duplicates.stream().filter(d -> StringUtils.equals(d.getRelType(), type.toString())).count();
    }

    /** Sets the creator (only if missing) and the modification data on each of the given duplicates. */
    private void stampDuplicates(final List<OpenaireDuplicate> duplicates, final String user, final OffsetDateTime now) {
        duplicates.forEach(d -> {
            openaireDuplicateRepository.updateCreatedByIfMissing(d.getLocalId(), d.getOaOriginalId(), user);
            openaireDuplicateRepository.updateModificationDate(d.getLocalId(), d.getOaOriginalId(), user, now);
        });
    }

    /**
     * Stores acronyms, other names, other identifiers, urls and relationships of an organization.
     *
     * @param orgId   the id of the organization owning the rows
     * @param orgView the source of the values
     * @param update  if {@code true} the existing rows of {@code orgId} are deleted first
     */
    private void makeRelations(final String orgId, final OrganizationView orgView, final boolean update) {
        if (update) {
            acronymRepository.deleteByOrgId(orgId);
            otherNameRepository.deleteByOrgId(orgId);
            otherIdentifierRepository.deleteByOrgId(orgId);
            urlRepository.deleteByOrgId(orgId);
            relationshipRepository.deleteById1(orgId);
            relationshipRepository.deleteById2(orgId);
        }
        orgView.getAcronyms().forEach(s -> acronymRepository.save(new Acronym(orgId, s)));
        orgView.getOtherNames().forEach(n -> otherNameRepository.save(new OtherName(orgId, n.getName(), n.getLang())));
        orgView.getOtherIdentifiers().forEach(id -> otherIdentifierRepository.save(new OtherIdentifier(orgId, id.getId(), id.getType())));
        orgView.getUrls().forEach(u -> urlRepository.save(new Url(orgId, u)));
        orgView.getRelations().forEach(r -> makeRelation(orgId, r.getRelatedOrgId(), RelationType.valueOf(r.getType())));
    }

    /**
     * Lists the terms of a vocabulary table, ordered by name. Results are cached in the "vocs" cache.
     *
     * @param table the vocabulary table to read
     * @return the terms of the table
     */
    @Cacheable("vocs")
    public List<VocabularyTerm> listValuesOfVocabularyTable(final VocabularyTable table) {
        // The table name comes from an enum constant, never from free text
        final String sql = "select val as value, name as name from " + table + " order by name";
        return jdbcTemplate.query(sql, new BeanPropertyRowMapper<>(VocabularyTerm.class));
    }

    /**
     * Lists the countries assigned to a user, ordered by country name.
     * Results are cached in the "countries_for_user" cache.
     *
     * @param name the value matched against {@code user_countries.email}
     * @return the countries of the user
     */
    @Cacheable("countries_for_user")
    public List<VocabularyTerm> listCountriesForUser(final String name) {
        final String sql =
                "select uc.country as value, c.name as name from user_countries uc left outer join countries c on (c.val = uc.country) where uc.email = ? order by c.name";
        return jdbcTemplate.query(sql, new BeanPropertyRowMapper<>(VocabularyTerm.class), name);
    }

    /**
     * Updates role and validity of an existing user and replaces its countries.
     *
     * @param userView the new user data; the email identifies the user
     * @throws RuntimeException with message "User not found" if no user has that email
     */
    // NOTE(review): @RequestBody is an MVC handler-argument annotation; this class declares no
    // request mappings, so it presumably has no effect here - confirm before removing it.
    @Transactional
    public void saveUser(@RequestBody final UserView userView) {

        final User user = userRepository.findById(userView.getEmail()).orElseThrow(() -> new RuntimeException("User not found"));
        user.setRole(userView.getRole());
        user.setValid(userView.isValid());
        userRepository.save(user);

        userCountryRepository.deleteByEmail(userView.getEmail());
        if (userView.getCountries() != null) {
            userCountryRepository.saveAll(Arrays.stream(userView.getCountries())
                    .map(c -> new UserCountry(userView.getEmail(), c))
                    .collect(Collectors.toList()));
        }
    }

    /**
     * Deletes a user together with its countries.
     *
     * @param email the email identifying the user
     */
    @Transactional
    public void deleteUser(final String email) {
        userCountryRepository.deleteByEmail(email);
        userRepository.deleteById(email);
    }

    /**
     * Creates a new, not valid user with role {@code UserRole.PENDING}.
     *
     * @param email     the email identifying the user
     * @param countries the countries to assign to the user, may be {@code null}
     */
    @Transactional
    public void newUser(final String email, final List<String> countries) {
        final User user = new User();
        user.setEmail(email);
        user.setRole(UserRole.PENDING.name());
        user.setValid(false);
        userRepository.save(user);
        if (countries != null) {
            userCountryRepository.saveAll(countries.stream().map(c -> new UserCountry(email, c)).collect(Collectors.toList()));
        }
    }

    /**
     * Saves a relationship between two organizations together with its inverse.
     *
     * @param id1  the id of the first organization
     * @param id2  the id of the second organization
     * @param type the type of the relationship from {@code id1} to {@code id2}
     * @return the two saved relationships: the direct one and the inverse one
     */
    @Transactional
    public List<Relationship> makeRelation(final String id1, final String id2, final RelationType type) {
        final Relationship r1 = new Relationship(id1, id2, type.toString());
        final Relationship r2 = new Relationship(id2, id1, type.getInverse().toString());
        relationshipRepository.save(r1);
        relationshipRepository.save(r2);
        return Arrays.asList(r1, r2);
    }

    /**
     * BROWSE BY COUNTRY
     *
     * @return one entry per country, with the number of organizations for each status
     */
    public List<BrowseEntry> browseCountries() {
        final String sql =
                "select o.country as code, c.name as name, o.status as group, count(o.status) as count from organizations o left outer join countries c on (o.country = c.val) group by o.country, c.name, o.status";
        return listBrowseEntries(sql);
    }

    /**
     * BROWSE BY COUNTRY FOR USER
     *
     * @param email the email of the user whose countries are considered
     * @return one entry per country of the user, with the number of organizations for each status
     */
    public List<BrowseEntry> browseCountriesForUser(final String email) {
        final String sql =
                "select o.country as code, c.name as name, o.status as group, count(o.status) as count from user_countries uc left outer join organizations o on (uc.country = o.country) left outer join countries c on (o.country = c.val) where uc.email=? group by o.country, c.name, o.status";
        return listBrowseEntries(sql, email);
    }

    /**
     * BROWSE BY ORG TYPE
     *
     * @return one entry per organization type, with the number of organizations for each status
     */
    public List<BrowseEntry> browseTypes() {
        final String sql =
                "select type as code, type as name, status as group, count(status) as count from organizations group by type, status";
        return listBrowseEntries(sql);
    }

    /**
     * BROWSE BY ORG TYPE FOR USER
     *
     * @param email the email of the user whose countries are considered
     * @return one entry per organization type, counting only organizations in the user's countries
     */
    public List<BrowseEntry> browseTypesForUser(final String email) {
        final String sql = "select o.type as code, o.type as name,"
                + "o.status as group, count(o.status) as count "
                + "from organizations o "
                + "left outer join user_countries uc on (uc.country = o.country) "
                + "where uc.email=? "
                + "group by o.type, o.status";
        return listBrowseEntries(sql, email);
    }

    /**
     * Runs a browse query returning (code, name, group, count) rows and folds the rows with the
     * same code into a single entry whose values map each group to its count.
     * Rows with a blank code are skipped; the result is sorted by name.
     */
    private List<BrowseEntry> listBrowseEntries(final String sql, final Object... params) {
        final Map<String, BrowseEntry> map = new HashMap<>();

        for (final TempBrowseEntry t : jdbcTemplate.query(sql, new BeanPropertyRowMapper<>(TempBrowseEntry.class), params)) {
            if (StringUtils.isNotBlank(t.getCode())) {
                final BrowseEntry entry = map.computeIfAbsent(t.getCode(), code -> {
                    final BrowseEntry e = new BrowseEntry();
                    e.setCode(code);
                    e.setName(t.getName());
                    return e;
                });
                entry.getValues().put(t.getGroup(), t.getCount());
            }
        }

        return map.values().stream().sorted((o1, o2) -> StringUtils.compare(o1.getName(), o2.getName())).collect(Collectors.toList());
    }

    /**
     * Lists the organizations that are in a {@code suggested} conflict with the given one.
     *
     * @param id the id matched against {@code oa_conflicts.id1}
     * @return the conflicting organizations
     */
    public List<OrganizationConflict> listConflictsForId(final String id) {
        final String sql =
                "select o.id, o.name, o.type, o.city, o.country from oa_conflicts c left outer join organizations o on (c.id2 = o.id) where o.id is not null and c.id1 = ? and c.reltype = 'suggested'";
        return jdbcTemplate.query(sql, new BeanPropertyRowMapper<>(OrganizationConflict.class), id);
    }

    /**
     * Executes the SQL script {@code /sql/importDedupEvents.sql} found on the classpath.
     * Any failure is logged and not propagated to the caller.
     */
    @Transactional
    public void importDedupEvents() {
        // try-with-resources: the classpath stream is always closed (a null resource is allowed)
        try (final InputStream sqlStream = getClass().getResourceAsStream("/sql/importDedupEvents.sql")) {
            if (sqlStream == null) {
                throw new IllegalStateException("Resource not found: /sql/importDedupEvents.sql");
            }
            log.info("Importing conflicts and duplicates...");
            jdbcTemplate.update(IOUtils.toString(sqlStream, StandardCharsets.UTF_8));
            log.info("...done");
            // verifyConflictGroups(true);
        } catch (final Exception e) {
            log.error("Error importing conflicts and duplicates", e);
        }
    }

    /**
     * Invokes the DB function {@code refresh_index_search()}.
     * Any failure is logged and not propagated to the caller.
     */
    @Transactional
    public void updateFulltextIndex() {
        try {
            log.info("Updating Fulltext Index...");
            jdbcTemplate.queryForList("SELECT refresh_index_search()");
            log.info("...done");
        } catch (final Exception e) {
            log.error("Error updating Fulltext Index", e);
        }
    }

    /**
     * Resolves a conflict by merging the given organizations into a newly created one.
     *
     * <p>The new organization takes the first non-blank/non-zero scalar values and the union of
     * the multi-valued fields of the given organizations. The given organizations are then
     * hidden and related to the new one with a {@code Merges} relationship, their duplicates are
     * copied to the new organization, and the conflicts among them are marked as {@code is_similar}.
     *
     * @param similarIds the ids of the organizations to merge
     * @param user       the user performing the operation
     * @return the id of the new organization
     */
    @Transactional
    public String fixConflictSimilars(final List<String> similarIds, final String user) {

        final OffsetDateTime now = OffsetDateTime.now();

        final List<OrganizationView> views = similarIds.stream()
                .map(organizationViewRepository::findById)
                .filter(Optional::isPresent)
                .map(Optional::get)
                .collect(Collectors.toList());

        // Create the new (master) organization
        final OrganizationView newOrg = new OrganizationView();
        newOrg.setId(null);
        newOrg.setStatus(null);
        newOrg.setName(findFirstString(views, OrganizationView::getName));
        newOrg.setType(findFirstString(views, OrganizationView::getType));
        newOrg.setLat(findFirstNumber(views, OrganizationView::getLat));
        newOrg.setLng(findFirstNumber(views, OrganizationView::getLng));
        newOrg.setCity(findFirstString(views, OrganizationView::getCity));
        newOrg.setCountry(findFirstString(views, OrganizationView::getCountry));
        newOrg.setOtherIdentifiers(findAll(views, OrganizationView::getOtherIdentifiers));
        newOrg.setOtherNames(findAll(views, OrganizationView::getOtherNames));
        newOrg.setAcronyms(findAll(views, OrganizationView::getAcronyms));
        newOrg.setUrls(findAll(views, OrganizationView::getUrls));
        newOrg.setRelations(findAll(views, OrganizationView::getRelations));

        // The names of the merged organizations that differ from the chosen one are kept as
        // alternative names (the previous filter kept only the names equal to the chosen one)
        newOrg.getOtherNames()
                .addAll(views.stream()
                        .map(OrganizationView::getName)
                        .filter(StringUtils::isNotBlank)
                        .filter(s -> !StringUtils.equalsIgnoreCase(s, newOrg.getName()))
                        .map(s -> new eu.dnetlib.organizations.model.view.OtherName(s, "UNKNOWN"))
                        .collect(Collectors.toList()));

        final String masterId = insertOrUpdateOrganization(newOrg, user, false);

        // Hide the merged organizations; the journal entry is attached to the hidden organization
        similarIds.forEach(id -> {
            hideConflictOrgs(masterId, id);
            journalEntryRepository
                    .save(new JournalEntry(id, JournalOperations.FIX_CONFLICT, "The org has been hidded and merged in " + masterId, user));
        });

        // Reassign the duplicates to the new organization
        final List<OpenaireDuplicate> newDuplicates = similarIds.stream()
                .map(openaireDuplicateRepository::findByLocalId)
                .flatMap(List::stream)
                .map(d -> new OpenaireDuplicate(masterId, d.getOaOriginalId(), d.getRelType(), d.getOaCollectedFrom()))
                .collect(Collectors.toList());

        openaireDuplicateRepository.saveAll(newDuplicates);
        stampDuplicates(newDuplicates, user, now);

        for (final String similarId : similarIds) {
            openaireConflictRepository.updateMultipleStatusAndResetGroup(similarId, SimilarityType.is_different.toString(), user, now);
        }

        // Every pair of merged organizations is marked as similar
        for (int i = 0; i < similarIds.size(); i++) {
            for (int j = i + 1; j < similarIds.size(); j++) {
                openaireConflictRepository
                        .updateStatusAndResetGroup(similarIds.get(i), similarIds.get(j), SimilarityType.is_similar.toString(), user, now);
            }
        }

        journalEntryRepository
                .save(new JournalEntry(masterId, JournalOperations.FIX_CONFLICT, "New org created merging: " + StringUtils.join(similarIds, ", "), user));

        return masterId;
    }

    /**
     * Resolves a conflict by marking every pair of the given organizations as {@code is_different}.
     * A journal entry is written for each of the given organizations.
     *
     * @param differentsIds the ids of the organizations to mark as different
     * @param user          the user performing the operation
     */
    @Transactional
    public void fixConflictDifferents(final List<String> differentsIds, final String user) {

        final OffsetDateTime now = OffsetDateTime.now();

        final String message = "Mark the following orgs as different: " + StringUtils.join(differentsIds, ", ");

        for (int i = 0; i < differentsIds.size(); i++) {
            for (int j = i + 1; j < differentsIds.size(); j++) {
                openaireConflictRepository
                        .updateStatusAndResetGroup(differentsIds.get(i), differentsIds.get(j), SimilarityType.is_different.toString(), user, now);
            }
            journalEntryRepository.save(new JournalEntry(differentsIds.get(i), JournalOperations.NO_CONFLICT, message, user));
        }
    }

    /**
     * Finds a user by email; when the user exists its last access time is set to now.
     *
     * @param email the email identifying the user
     * @return the user, or an empty {@link Optional} if it does not exist
     */
    @Transactional
    public Optional<User> findUser(final String email) {
        final Optional<User> user = userRepository.findById(email);
        user.ifPresent(u -> userRepository.updateLastAccess(email, OffsetDateTime.now()));
        return user;
    }

    /** Returns the first non-blank value extracted from the views, or {@code null} if none. */
    private String findFirstString(final List<OrganizationView> views, final Function<OrganizationView, String> mapper) {
        return views.stream().map(mapper).filter(StringUtils::isNotBlank).findFirst().orElse(null);
    }

    /** Returns the first non-null and non-zero value extracted from the views, or {@code 0.0} if none. */
    private Double findFirstNumber(final List<OrganizationView> views, final Function<OrganizationView, Double> mapper) {
        return views.stream().map(mapper).filter(Objects::nonNull).filter(n -> n != 0).findFirst().orElse(0.0);
    }

    /**
     * Returns the union (in encounter order) of the sets extracted from the views.
     * Views for which the mapper returns {@code null} are ignored.
     */
    private <T> Set<T> findAll(final List<OrganizationView> views, final Function<OrganizationView, Set<T>> mapper) {
        return views.stream()
                .map(mapper)
                .filter(Objects::nonNull)
                .flatMap(Set::stream)
                .collect(Collectors.toCollection(LinkedHashSet::new));
    }

    /**
     * Sets the status of {@code otherId} to {@code hidden}, deletes the conflicts between the two
     * organizations (in both directions) and relates them with a {@code Merges} relationship.
     *
     * @return the relationships created by {@link #makeRelation(String, String, RelationType)}
     */
    private List<Relationship> hideConflictOrgs(final String masterId, final String otherId) {
        organizationRepository.updateStatus(otherId, OrganizationStatus.hidden.toString());
        openaireConflictRepository.findById(new OpenaireConflictPK(masterId, otherId)).ifPresent(openaireConflictRepository::delete);
        openaireConflictRepository.findById(new OpenaireConflictPK(otherId, masterId)).ifPresent(openaireConflictRepository::delete);
        return makeRelation(masterId, otherId, RelationType.Merges);
    }

}