re-packing all the D4I applications
This commit is contained in:
parent
eaefc4d6d9
commit
2905051469
|
@ -0,0 +1,119 @@
|
||||||
|
<?xml version="1.0" encoding="UTF-8"?>
<!-- Maven build for the Data4Impact API application (Spring Boot web service). -->
<project xmlns="http://maven.apache.org/POM/4.0.0"
	xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
	xsi:schemaLocation="http://maven.apache.org/POM/4.0.0 http://maven.apache.org/xsd/maven-4.0.0.xsd">

	<modelVersion>4.0.0</modelVersion>

	<groupId>eu.dnetlib</groupId>
	<artifactId>data4impact-api-application</artifactId>
	<version>1.1.0-SNAPSHOT</version>

	<!-- <scm>
		<developerConnection>scm:svn:https://svn.driver.research-infrastructures.eu/driver/data4impact/data4impact-api-application/trunk</developerConnection>
	</scm>
	<ciManagement>
		<system>jenkins</system>
		<url>https://jenkins-dnet.d4science.org/view/data4impact/job/data4impact-api-application/</url>
	</ciManagement>
	<distributionManagement>
		<repository>
			<id>dnet45-releases</id>
			<name>D-Net 45 Releases</name>
			<url>http://maven.research-infrastructures.eu/nexus/content/repositories/dnet45-releases</url>
			<layout>default</layout>
		</repository>
	</distributionManagement>
	-->

	<!-- Inherit defaults from Spring Boot -->
	<parent>
		<groupId>org.springframework.boot</groupId>
		<artifactId>spring-boot-starter-parent</artifactId>
		<version>2.0.3.RELEASE</version>
		<relativePath></relativePath>
	</parent>

	<!--
	<repositories>
		<repository>
			<id>dnet-deps</id>
			<name>dnet-dependencies</name>
			<url>http://maven.research-infrastructures.eu/nexus/content/repositories/dnet-deps</url>
			<layout>default</layout>
		</repository>
		<repository>
			<id>dnet45-releases</id>
			<name>D-Net 45 Releases</name>
			<url>http://maven.research-infrastructures.eu/nexus/content/repositories/dnet45-releases</url>
			<layout>default</layout>
			<snapshots>
				<enabled>true</enabled>
			</snapshots>
		</repository>
		<repository>
			<id>dnet45-snapshots</id>
			<name>D-Net 45 Snapshots</name>
			<url>http://maven.research-infrastructures.eu/nexus/content/repositories/dnet45-snapshots</url>
			<layout>default</layout>
			<snapshots>
				<enabled>true</enabled>
			</snapshots>
		</repository>
	</repositories>
	-->

	<!-- Add typical dependencies for a web application -->
	<dependencies>
		<dependency>
			<groupId>org.springframework.boot</groupId>
			<artifactId>spring-boot-starter-web</artifactId>
		</dependency>
		<dependency>
			<groupId>eu.dnetlib</groupId>
			<artifactId>data4impact-model</artifactId>
			<version>1.1.0-SNAPSHOT</version>
		</dependency>

		<!-- Swagger: both artifacts share the springfox-version property below,
		     so the two can never drift apart again (they were 2.9.2 hard-coded
		     while the property said 2.8.0). -->
		<dependency>
			<groupId>io.springfox</groupId>
			<artifactId>springfox-swagger2</artifactId>
			<version>${springfox-version}</version>
		</dependency>

		<dependency>
			<groupId>io.springfox</groupId>
			<artifactId>springfox-swagger-ui</artifactId>
			<version>${springfox-version}</version>
		</dependency>

		<!-- JUnit (version managed by the Spring Boot parent) -->
		<dependency>
			<groupId>junit</groupId>
			<artifactId>junit</artifactId>
			<scope>test</scope>
		</dependency>
	</dependencies>

	<build>
		<plugins>
			<plugin>
				<groupId>org.springframework.boot</groupId>
				<artifactId>spring-boot-maven-plugin</artifactId>
				<configuration>
					<!-- produce a fully executable jar (embedded launch script) -->
					<executable>true</executable>
				</configuration>
			</plugin>
		</plugins>
	</build>

	<properties>
		<java.version>1.8</java.version>
		<apache.solr.version>7.1.0</apache.solr.version>
		<mongodb.driver.version>3.4.2</mongodb.driver.version>
		<!-- FIX: was 2.8.0 while the swagger dependencies hard-coded 2.9.2 -->
		<springfox-version>2.9.2</springfox-version>
		<prometheus.version>0.2.0</prometheus.version>
		<javamelody.version>1.71.0</javamelody.version>
		<maven.javadoc.failOnError>false</maven.javadoc.failOnError>
		<dockerfile-maven-version>1.3.6</dockerfile-maven-version>
	</properties>

</project>
|
|
@ -0,0 +1,47 @@
|
||||||
|
package eu.data4impact;
|
||||||
|
|
||||||
|
import org.slf4j.Logger;
|
||||||
|
import org.slf4j.LoggerFactory;
|
||||||
|
import org.springframework.boot.SpringApplication;
|
||||||
|
import org.springframework.boot.autoconfigure.SpringBootApplication;
|
||||||
|
import org.springframework.cache.annotation.EnableCaching;
|
||||||
|
import org.springframework.context.annotation.Bean;
|
||||||
|
|
||||||
|
import springfox.documentation.builders.ApiInfoBuilder;
|
||||||
|
import springfox.documentation.builders.RequestHandlerSelectors;
|
||||||
|
import springfox.documentation.service.ApiInfo;
|
||||||
|
import springfox.documentation.spi.DocumentationType;
|
||||||
|
import springfox.documentation.spring.web.plugins.Docket;
|
||||||
|
import springfox.documentation.swagger2.annotations.EnableSwagger2;
|
||||||
|
|
||||||
|
@SpringBootApplication
|
||||||
|
@EnableSwagger2
|
||||||
|
@EnableCaching
|
||||||
|
public class MainApplication {
|
||||||
|
|
||||||
|
private static final Logger log = LoggerFactory.getLogger(MainApplication.class);
|
||||||
|
|
||||||
|
public static void main(final String[] args) {
|
||||||
|
SpringApplication.run(MainApplication.class, args);
|
||||||
|
}
|
||||||
|
|
||||||
|
@Bean
|
||||||
|
public static Docket newSwaggerDocket() {
|
||||||
|
log.info("Initializing SWAGGER...");
|
||||||
|
|
||||||
|
return new Docket(DocumentationType.SWAGGER_2)
|
||||||
|
.select()
|
||||||
|
.apis(RequestHandlerSelectors.any())
|
||||||
|
.paths(p -> p.startsWith("/api/"))
|
||||||
|
.build().apiInfo((new ApiInfoBuilder())
|
||||||
|
.title("Data4impact Service APIs")
|
||||||
|
.description("APIs documentation")
|
||||||
|
.version("1.1")
|
||||||
|
.contact(ApiInfo.DEFAULT_CONTACT)
|
||||||
|
.license("Apache 2.0")
|
||||||
|
.licenseUrl("http://www.apache.org/licenses/LICENSE-2.0")
|
||||||
|
.build());
|
||||||
|
|
||||||
|
}
|
||||||
|
|
||||||
|
}
|
|
@ -0,0 +1,14 @@
|
||||||
|
package eu.data4impact;
|
||||||
|
|
||||||
|
import org.springframework.stereotype.Controller;
|
||||||
|
import org.springframework.web.bind.annotation.RequestMapping;
|
||||||
|
import org.springframework.web.bind.annotation.RequestMethod;
|
||||||
|
|
||||||
|
@Controller
|
||||||
|
public class SwaggerController {
|
||||||
|
|
||||||
|
@RequestMapping(value = { "/", "/apidoc", "/api-doc", "/doc", "/swagger" }, method = RequestMethod.GET)
|
||||||
|
public String apiDoc() {
|
||||||
|
return "redirect:swagger-ui.html";
|
||||||
|
}
|
||||||
|
}
|
|
@ -0,0 +1,38 @@
|
||||||
|
package eu.data4impact.controller;
|
||||||
|
|
||||||
|
import java.util.List;
|
||||||
|
import java.util.stream.Collectors;
|
||||||
|
|
||||||
|
import org.springframework.data.domain.PageRequest;
|
||||||
|
import org.springframework.data.jpa.repository.JpaRepository;
|
||||||
|
import org.springframework.web.bind.annotation.PathVariable;
|
||||||
|
import org.springframework.web.bind.annotation.RequestMapping;
|
||||||
|
import org.springframework.web.bind.annotation.RequestMethod;
|
||||||
|
import org.springframework.web.bind.annotation.RequestParam;
|
||||||
|
|
||||||
|
import eu.data4impact.utils.MainEntity;
|
||||||
|
|
||||||
|
public abstract class AbstractJpaController<T extends MainEntity> {
|
||||||
|
|
||||||
|
public abstract JpaRepository<T, String> getRepo();
|
||||||
|
|
||||||
|
@RequestMapping(value = "/list/{page}/{size}", method = RequestMethod.GET)
|
||||||
|
public final List<T> find(@PathVariable final int page, @PathVariable final int size) {
|
||||||
|
return getRepo().findAll(PageRequest.of(page, size)).getContent();
|
||||||
|
}
|
||||||
|
|
||||||
|
@RequestMapping(value = "/identifiers/{page}/{size}", method = RequestMethod.GET)
|
||||||
|
public final List<String> findIdentifiers(@PathVariable final int page, @PathVariable final int size) {
|
||||||
|
return find(page, size).stream().map(MainEntity::getId).collect(Collectors.toList());
|
||||||
|
}
|
||||||
|
|
||||||
|
@RequestMapping(value = "/get", method = RequestMethod.GET)
|
||||||
|
public final T get(@RequestParam final String id) {
|
||||||
|
return getRepo().findById(id).orElse(null);
|
||||||
|
}
|
||||||
|
|
||||||
|
@RequestMapping(value = "/count", method = RequestMethod.GET)
|
||||||
|
public final long count() {
|
||||||
|
return getRepo().count();
|
||||||
|
}
|
||||||
|
}
|
|
@ -0,0 +1,38 @@
|
||||||
|
package eu.data4impact.controller;
|
||||||
|
|
||||||
|
import java.util.List;
|
||||||
|
import java.util.stream.Collectors;
|
||||||
|
|
||||||
|
import org.springframework.data.domain.PageRequest;
|
||||||
|
import org.springframework.web.bind.annotation.PathVariable;
|
||||||
|
import org.springframework.web.bind.annotation.RequestMapping;
|
||||||
|
import org.springframework.web.bind.annotation.RequestMethod;
|
||||||
|
import org.springframework.web.bind.annotation.RequestParam;
|
||||||
|
|
||||||
|
import eu.data4impact.utils.MainEntity;
|
||||||
|
import eu.data4impact.utils.ReadOnlyRepository;
|
||||||
|
|
||||||
|
public abstract class AbstractReadOnlyController<T extends MainEntity> {
|
||||||
|
|
||||||
|
public abstract ReadOnlyRepository<T, String> getRepo();
|
||||||
|
|
||||||
|
@RequestMapping(value = "/list/{page}/{size}", method = RequestMethod.GET)
|
||||||
|
public final List<T> find(@PathVariable final int page, @PathVariable final int size) {
|
||||||
|
return getRepo().findAll(PageRequest.of(page, size)).getContent();
|
||||||
|
}
|
||||||
|
|
||||||
|
@RequestMapping(value = "/identifiers/{page}/{size}", method = RequestMethod.GET)
|
||||||
|
public final List<String> findIdentifiers(@PathVariable final int page, @PathVariable final int size) {
|
||||||
|
return find(page, size).stream().map(MainEntity::getId).collect(Collectors.toList());
|
||||||
|
}
|
||||||
|
|
||||||
|
@RequestMapping(value = "/get", method = RequestMethod.GET)
|
||||||
|
public final T get(@RequestParam final String id) {
|
||||||
|
return getRepo().findById(id).orElse(null);
|
||||||
|
}
|
||||||
|
|
||||||
|
@RequestMapping(value = "/count", method = RequestMethod.GET)
|
||||||
|
public final long count() {
|
||||||
|
return getRepo().count();
|
||||||
|
}
|
||||||
|
}
|
|
@ -0,0 +1,40 @@
|
||||||
|
package eu.data4impact.controller;
|
||||||
|
|
||||||
|
import java.util.Arrays;
|
||||||
|
import java.util.List;
|
||||||
|
|
||||||
|
import org.springframework.beans.factory.annotation.Autowired;
|
||||||
|
import org.springframework.cache.annotation.CacheEvict;
|
||||||
|
import org.springframework.cache.annotation.Cacheable;
|
||||||
|
import org.springframework.web.bind.annotation.RequestMapping;
|
||||||
|
import org.springframework.web.bind.annotation.RequestMethod;
|
||||||
|
import org.springframework.web.bind.annotation.RequestParam;
|
||||||
|
import org.springframework.web.bind.annotation.RestController;
|
||||||
|
|
||||||
|
import eu.data4impact.utils.Counter;
|
||||||
|
import eu.data4impact.utils.DatabaseUtils;
|
||||||
|
|
||||||
|
@RestController
|
||||||
|
@RequestMapping("/admin")
|
||||||
|
public class AdminController {
|
||||||
|
|
||||||
|
@Autowired
|
||||||
|
private DatabaseUtils databaseUtils;
|
||||||
|
|
||||||
|
@RequestMapping(value = "/materializedViews", method = RequestMethod.GET)
|
||||||
|
public List<String> materializedViews(@RequestParam(required = false, defaultValue = "false") final boolean refresh) {
|
||||||
|
return refresh ? databaseUtils.refreshMaterializedViews() : databaseUtils.materializedViews();
|
||||||
|
}
|
||||||
|
|
||||||
|
@Cacheable(value = "simpleCache", key = "'tables'")
|
||||||
|
@RequestMapping(value = "/tables", method = RequestMethod.GET)
|
||||||
|
public List<Counter> tables() {
|
||||||
|
return databaseUtils.tableSizes();
|
||||||
|
}
|
||||||
|
|
||||||
|
@CacheEvict(cacheNames = { "simpleCache" }, allEntries = true)
|
||||||
|
@RequestMapping(value = "/clearCaches", method = RequestMethod.GET)
|
||||||
|
public List<String> clearCaches() {
|
||||||
|
return Arrays.asList("Done.");
|
||||||
|
}
|
||||||
|
}
|
|
@ -0,0 +1,51 @@
|
||||||
|
package eu.data4impact.controller;
|
||||||
|
|
||||||
|
import java.util.List;
|
||||||
|
import java.util.Map;
|
||||||
|
import java.util.stream.Collectors;
|
||||||
|
|
||||||
|
import org.springframework.beans.factory.annotation.Autowired;
|
||||||
|
import org.springframework.data.domain.PageRequest;
|
||||||
|
import org.springframework.data.jpa.repository.JpaRepository;
|
||||||
|
import org.springframework.web.bind.annotation.PathVariable;
|
||||||
|
import org.springframework.web.bind.annotation.RequestMapping;
|
||||||
|
import org.springframework.web.bind.annotation.RequestMethod;
|
||||||
|
import org.springframework.web.bind.annotation.RequestParam;
|
||||||
|
import org.springframework.web.bind.annotation.RestController;
|
||||||
|
|
||||||
|
import eu.data4impact.model.documents.DocFulltext;
|
||||||
|
import eu.data4impact.model.documents.Document;
|
||||||
|
import eu.data4impact.repository.DocFulltextRepository;
|
||||||
|
import eu.data4impact.repository.DocumentRepository;
|
||||||
|
|
||||||
|
@RestController
|
||||||
|
@RequestMapping("/api/docs")
|
||||||
|
public class DocumentController extends AbstractJpaController<Document> {
|
||||||
|
|
||||||
|
@Autowired
|
||||||
|
private DocumentRepository documentRepository;
|
||||||
|
|
||||||
|
@Autowired
|
||||||
|
private DocFulltextRepository docFulltextRepository;
|
||||||
|
|
||||||
|
@Override
|
||||||
|
public JpaRepository<Document, String> getRepo() {
|
||||||
|
return documentRepository;
|
||||||
|
}
|
||||||
|
|
||||||
|
@RequestMapping(value = "/fulltext", method = RequestMethod.GET, produces = "text/plain")
|
||||||
|
public String fulltext(@RequestParam final String id) {
|
||||||
|
return docFulltextRepository.findById(id).map(DocFulltext::getFulltext).orElse("");
|
||||||
|
}
|
||||||
|
|
||||||
|
@RequestMapping(value = "/byType/{type}/{page}/{size}", method = RequestMethod.GET)
|
||||||
|
public List<Document> findByType(@PathVariable final String type, @PathVariable final int page, @PathVariable final int size) {
|
||||||
|
return documentRepository.findByType(type, PageRequest.of(page, size)).getContent();
|
||||||
|
}
|
||||||
|
|
||||||
|
@RequestMapping(value = "/types", method = RequestMethod.GET)
|
||||||
|
public Map<String, Long> types() {
|
||||||
|
return documentRepository.types().stream().collect(Collectors.toMap(s -> s, s -> documentRepository.countByType(s)));
|
||||||
|
}
|
||||||
|
|
||||||
|
}
|
|
@ -0,0 +1,23 @@
|
||||||
|
package eu.data4impact.controller;
|
||||||
|
|
||||||
|
import org.springframework.beans.factory.annotation.Autowired;
|
||||||
|
import org.springframework.data.jpa.repository.JpaRepository;
|
||||||
|
import org.springframework.web.bind.annotation.RequestMapping;
|
||||||
|
import org.springframework.web.bind.annotation.RestController;
|
||||||
|
|
||||||
|
import eu.data4impact.model.journals.Journal;
|
||||||
|
import eu.data4impact.repository.JournalRepository;
|
||||||
|
|
||||||
|
@RestController
|
||||||
|
@RequestMapping("/api/journals")
|
||||||
|
public class JournalController extends AbstractJpaController<Journal> {
|
||||||
|
|
||||||
|
@Autowired
|
||||||
|
private JournalRepository journalRepository;
|
||||||
|
|
||||||
|
@Override
|
||||||
|
public JpaRepository<Journal, String> getRepo() {
|
||||||
|
return journalRepository;
|
||||||
|
}
|
||||||
|
|
||||||
|
}
|
|
@ -0,0 +1,43 @@
|
||||||
|
package eu.data4impact.controller;
|
||||||
|
|
||||||
|
import java.util.LinkedHashMap;
|
||||||
|
import java.util.List;
|
||||||
|
import java.util.Map;
|
||||||
|
|
||||||
|
import org.springframework.beans.factory.annotation.Autowired;
|
||||||
|
import org.springframework.data.domain.PageRequest;
|
||||||
|
import org.springframework.web.bind.annotation.PathVariable;
|
||||||
|
import org.springframework.web.bind.annotation.RequestMapping;
|
||||||
|
import org.springframework.web.bind.annotation.RequestMethod;
|
||||||
|
import org.springframework.web.bind.annotation.RestController;
|
||||||
|
|
||||||
|
import eu.data4impact.repository.readonly.OrganizationViewRepository;
|
||||||
|
import eu.data4impact.utils.ReadOnlyRepository;
|
||||||
|
import eu.data4impact.views.OrganizationView;
|
||||||
|
|
||||||
|
@RestController
|
||||||
|
@RequestMapping("/api/organizations")
|
||||||
|
public class OrganizationController extends AbstractReadOnlyController<OrganizationView> {
|
||||||
|
|
||||||
|
@Autowired
|
||||||
|
private OrganizationViewRepository organizationViewRepository;
|
||||||
|
|
||||||
|
@Override
|
||||||
|
public ReadOnlyRepository<OrganizationView, String> getRepo() {
|
||||||
|
return organizationViewRepository;
|
||||||
|
}
|
||||||
|
|
||||||
|
@RequestMapping(value = "/companies/{page}/{size}", method = RequestMethod.GET)
|
||||||
|
public List<OrganizationView> findCompanies(@PathVariable final int page, @PathVariable final int size) {
|
||||||
|
return organizationViewRepository.findByCompany(true, PageRequest.of(page, size)).getContent();
|
||||||
|
}
|
||||||
|
|
||||||
|
@RequestMapping(value = "/summary", method = RequestMethod.GET)
|
||||||
|
public Map<String, Long> summary() {
|
||||||
|
final Map<String, Long> res = new LinkedHashMap<>();
|
||||||
|
res.put("all", organizationViewRepository.count());
|
||||||
|
res.put("companies", organizationViewRepository.countByCompany(true));
|
||||||
|
return res;
|
||||||
|
}
|
||||||
|
|
||||||
|
}
|
|
@ -0,0 +1,76 @@
|
||||||
|
package eu.data4impact.controller;

import java.io.ByteArrayInputStream;
import java.io.IOException;
import java.nio.charset.StandardCharsets;
import java.util.Base64;
import java.util.List;
import java.util.Map;
import java.util.stream.Collectors;
import java.util.zip.GZIPInputStream;

import javax.servlet.http.HttpServletResponse;

import org.apache.commons.io.IOUtils;
import org.springframework.beans.factory.annotation.Autowired;
import org.springframework.data.domain.PageRequest;
import org.springframework.web.bind.annotation.PathVariable;
import org.springframework.web.bind.annotation.RequestMapping;
import org.springframework.web.bind.annotation.RequestMethod;
import org.springframework.web.bind.annotation.RequestParam;
import org.springframework.web.bind.annotation.RestController;

import eu.data4impact.model.projects.ProjectPortfolio;
import eu.data4impact.repository.ProjectPortfolioRepository;
import eu.data4impact.repository.readonly.ProjectViewRepository;
import eu.data4impact.utils.ReadOnlyRepository;
import eu.data4impact.views.ProjectView;

/**
 * REST endpoints for projects, backed by a read-only database view, plus
 * access to the gzipped/base64-encoded project portfolio JSON.
 *
 * FIX: base64 decoding now uses the standard library ({@link java.util.Base64},
 * MIME decoder, which tolerates line breaks) instead of the PostgreSQL driver's
 * internal org.postgresql.util.Base64; the portfolio is read and written as
 * UTF-8 instead of the platform default charset, so the emitted JSON no longer
 * depends on the JVM's file.encoding.
 */
@RestController
@RequestMapping("/api/projects")
public class ProjectController extends AbstractReadOnlyController<ProjectView> {

	@Autowired
	private ProjectViewRepository projectRepository;

	@Autowired
	private ProjectPortfolioRepository projectPortfolioRepository;

	@Override
	public ReadOnlyRepository<ProjectView, String> getRepo() {
		return projectRepository;
	}

	/** Returns one page of projects of the given funder. */
	@RequestMapping(value = "/byFunder/{funder}/{page}/{size}", method = RequestMethod.GET)
	public List<ProjectView> findByFunder(@PathVariable final String funder, @PathVariable final int page, @PathVariable final int size) {
		return projectRepository.findByFunder(funder, PageRequest.of(page, size)).getContent();
	}

	/**
	 * Returns a map from funder to the number of its projects.
	 * NOTE(review): issues one count query per funder (N+1); a grouped count
	 * in the repository would be cheaper.
	 */
	@RequestMapping(value = "/funders", method = RequestMethod.GET)
	public Map<String, Long> funders() {
		return projectRepository.funders().stream().collect(Collectors.toMap(s -> s, s -> projectRepository.countByFunder(s)));
	}

	/**
	 * Streams the portfolio JSON of a project to the response. The portfolio
	 * is stored base64-encoded and gzipped; an empty JSON object is written
	 * when the project has no portfolio.
	 *
	 * @param id  the project id
	 * @param res the servlet response the JSON is written to
	 * @throws IOException if writing to the response fails
	 */
	@RequestMapping(value = "/portfolio", method = RequestMethod.GET)
	public final void getPortfolio(@RequestParam final String id, final HttpServletResponse res) throws IOException {
		res.setContentType("application/json");
		res.setCharacterEncoding(StandardCharsets.UTF_8.name());

		final String json = projectPortfolioRepository.findById(id)
				.map(ProjectPortfolio::getPortfolio)
				.map(s -> Base64.getMimeDecoder().decode(s))
				.map(this::gunzip)
				.orElse("{}");

		IOUtils.write(json, res.getOutputStream(), StandardCharsets.UTF_8);
	}

	/**
	 * Decompresses a gzipped byte array into a UTF-8 string.
	 *
	 * @throws RuntimeException wrapping the underlying IOException on failure
	 */
	private String gunzip(final byte[] bytes) {
		try (final ByteArrayInputStream bis = new ByteArrayInputStream(bytes);
				final GZIPInputStream gis = new GZIPInputStream(bis)) {
			return IOUtils.toString(gis, StandardCharsets.UTF_8);
		} catch (final IOException e) {
			throw new RuntimeException("Error decompressing portfolio", e);
		}
	}

}
|
|
@ -0,0 +1,22 @@
|
||||||
|
package eu.data4impact.controller;
|
||||||
|
|
||||||
|
import org.springframework.beans.factory.annotation.Autowired;
|
||||||
|
import org.springframework.data.jpa.repository.JpaRepository;
|
||||||
|
import org.springframework.web.bind.annotation.RequestMapping;
|
||||||
|
import org.springframework.web.bind.annotation.RestController;
|
||||||
|
|
||||||
|
import eu.data4impact.model.topics.Topic;
|
||||||
|
import eu.data4impact.repository.TopicRepository;
|
||||||
|
|
||||||
|
@RestController
|
||||||
|
@RequestMapping("/api/topics")
|
||||||
|
public class TopicController extends AbstractJpaController<Topic> {
|
||||||
|
|
||||||
|
@Autowired
|
||||||
|
private TopicRepository topicRepository;
|
||||||
|
|
||||||
|
@Override
|
||||||
|
public JpaRepository<Topic, String> getRepo() {
|
||||||
|
return topicRepository;
|
||||||
|
}
|
||||||
|
}
|
|
@ -0,0 +1,14 @@
|
||||||
|
spring.main.banner-mode = off
|
||||||
|
logging.level.root = INFO
|
||||||
|
|
||||||
|
spring.datasource.url=jdbc:postgresql://localhost:5432/data4impact
|
||||||
|
spring.datasource.username=
|
||||||
|
spring.datasource.password=
|
||||||
|
|
||||||
|
spring.jpa.properties.hibernate.dialect = org.hibernate.dialect.PostgreSQLDialect
|
||||||
|
|
||||||
|
# Hibernate ddl auto (create, create-drop, validate, update)
|
||||||
|
spring.jpa.hibernate.ddl-auto = validate
|
||||||
|
spring.jpa.properties.hibernate.hbm2ddl.extra_physical_table_types = MATERIALIZED VIEW
|
||||||
|
spring.jpa.properties.hibernate.jdbc.lob.non_contextual_creation=true
|
||||||
|
spring.jpa.open-in-view=true
|
|
@ -0,0 +1,14 @@
|
||||||
|
spring.main.banner-mode = off
|
||||||
|
logging.level.root = INFO
|
||||||
|
|
||||||
|
spring.datasource.url=jdbc:postgresql://localhost:5432/data4impact
|
||||||
|
spring.datasource.username=
|
||||||
|
spring.datasource.password=
|
||||||
|
|
||||||
|
spring.jpa.properties.hibernate.dialect = org.hibernate.dialect.PostgreSQLDialect
|
||||||
|
|
||||||
|
# Hibernate ddl auto (create, create-drop, validate, update)
|
||||||
|
spring.jpa.hibernate.ddl-auto = validate
|
||||||
|
spring.jpa.properties.hibernate.hbm2ddl.extra_physical_table_types = MATERIALIZED VIEW
|
||||||
|
spring.jpa.properties.hibernate.jdbc.lob.non_contextual_creation=true
|
||||||
|
spring.jpa.open-in-view=true
|
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
|
@ -0,0 +1,5 @@
|
||||||
|
eu/data4impact/controller/AbstractJpaController.class
|
||||||
|
eu/data4impact/controller/JournalController.class
|
||||||
|
eu/data4impact/controller/OrganizationController.class
|
||||||
|
eu/data4impact/controller/AbstractReadOnlyController.class
|
||||||
|
eu/data4impact/controller/AdminController.class
|
|
@ -0,0 +1,10 @@
|
||||||
|
/Users/claudio/workspace/git/data4impact/apps/data4impact-api-application/src/main/java/eu/data4impact/controller/OrganizationController.java
|
||||||
|
/Users/claudio/workspace/git/data4impact/apps/data4impact-api-application/src/main/java/eu/data4impact/controller/AbstractReadOnlyController.java
|
||||||
|
/Users/claudio/workspace/git/data4impact/apps/data4impact-api-application/src/main/java/eu/data4impact/controller/AdminController.java
|
||||||
|
/Users/claudio/workspace/git/data4impact/apps/data4impact-api-application/src/main/java/eu/data4impact/controller/JournalController.java
|
||||||
|
/Users/claudio/workspace/git/data4impact/apps/data4impact-api-application/src/main/java/eu/data4impact/MainApplication.java
|
||||||
|
/Users/claudio/workspace/git/data4impact/apps/data4impact-api-application/src/main/java/eu/data4impact/controller/TopicController.java
|
||||||
|
/Users/claudio/workspace/git/data4impact/apps/data4impact-api-application/src/main/java/eu/data4impact/controller/ProjectController.java
|
||||||
|
/Users/claudio/workspace/git/data4impact/apps/data4impact-api-application/src/main/java/eu/data4impact/controller/AbstractJpaController.java
|
||||||
|
/Users/claudio/workspace/git/data4impact/apps/data4impact-api-application/src/main/java/eu/data4impact/SwaggerController.java
|
||||||
|
/Users/claudio/workspace/git/data4impact/apps/data4impact-api-application/src/main/java/eu/data4impact/controller/DocumentController.java
|
|
@ -0,0 +1,3 @@
|
||||||
|
-- Populate Document.batchid with the first 4 characters of pubyear
-- (in PostgreSQL, SUBSTR(x, 0, 5) yields characters 1..4 because a
-- start position of 0 shortens the extracted length by one).
UPDATE public.Document
SET batchid = SUBSTR(pubyear,0,5) ;
|
||||||
|
|
|
@ -0,0 +1,58 @@
|
||||||
|
-- Population of the doc_project relation using the data from project -> project_doc_other_id -> doc_other_identifier -> document
-- Rows created here are marked inferred=true to distinguish them from directly asserted links.

insert into
	doc_project(projectid, docid, inferred)
select
	p.projectid,
	d.docid,
	true as inferred
from
	project_doc_other_id p
	left outer join doc_other_identifier d on (p.docid = d.id and p.docidtype = d.idtype)
where
	d.docid is not null
on conflict do nothing;


-- Population of the doc_doc relation using the data from document(eg: guidelines) -> doc_doc_other_id -> doc_other_identifier -> document(eg: publication)

insert into
	doc_doc(docid1, docid2, reltype, inferred)
select
	d.docid1 as docid1,
	i.docid as docid2,
	d.reltype as reltype,
	true as inferred
from
	doc_doc_other_id d
	left outer join doc_other_identifier i on (d.docid2 = i.id and d.docid2type = i.idtype)
where
	i.docid is not null
on conflict do nothing;

-- Remove redundant doc_project relations (references to MOCK PROJECTS would be counted twice, otherwise)
-- Strategy: for each (docid, funder) group that contains both a MOCK_PROJECT and at least
-- one real project, collect the MOCK_PROJECT links into a temp table and delete them.

create table temp_delete_doc_project as select t.docid||'@'||t.projectid as item from (
	select
		dp.docid,
		unnest(array_agg(dp.projectid)) as projectid
	from
		doc_project dp
		left outer join project p on (dp.projectid = p.id)
	group by
		dp.docid, p.funder
	having
		array_to_string(array_agg(dp.projectid), ',', '') like '%MOCK_PROJECT%'
		and array_length(array_agg(DISTINCT dp.projectid), 1) > 1
) as t
where t.projectid like '40|MOCK_PROJECT::%';

-- index the composite key so the delete below is not a sequential scan per row
create index temp_delete_doc_project_item_idx on temp_delete_doc_project(item);

delete from doc_project where docid||'@'||projectid in (
	select item
	from temp_delete_doc_project
);

-- the temp table is only needed for this cleanup pass
drop table temp_delete_doc_project;
|
|
@ -0,0 +1,29 @@
|
||||||
|
#!/bin/bash

# Runs the data4impact importer over every available JSON dataset, in
# dependency order (projects/organizations first, then document links).
# NOTE(review): the jar path is hard-coded to a developer's local
# ~/.m2 repository — consider parameterizing it.
java -jar /Users/michele/.m2/repository/eu/dnetlib/data4impact-importer/1.1.0-SNAPSHOT/data4impact-importer-1.1.0-SNAPSHOT.jar \
	./jsonfiles/swedishProjects/project.json \
	./jsonfiles/swedishProjects/projectOtherId.json \
	./jsonfiles/swedishProjects/organization.json \
	./jsonfiles/swedishProjects/projectOrganization.json \
	./jsonfiles/swedishProjects/docotherid.json \
	./jsonfiles/swedishProjects/projectdocotherid.json \
	./jsonfiles/ecProjectsOpenaire/project.json \
	./jsonfiles/ecProjectsOpenaire/projectOtherId.json \
	./jsonfiles/ecProjectsOpenaire/organization.json \
	./jsonfiles/ecProjectsOpenaire/organizationOtherId.json \
	./jsonfiles/ecProjectsOpenaire/projectOrganization.json \
	./jsonfiles/cordis/project.json \
	./jsonfiles/cordis/projectOtherId.json \
	./jsonfiles/cordis/organization.json \
	./jsonfiles/cordis/organizationOtherId.json \
	./jsonfiles/cordis/projectOrganization.json \
	./jsonfiles/companydata/orgCompanyMetrics.json \
	./jsonfiles/funderdata/project.json \
	./jsonfiles/funderdata/docotherid.json \
	./jsonfiles/funderdata/projectdocotherid.json \
	./jsonfiles/patents/document.json \
	./jsonfiles/patents/doc_fulltext.json \
	./jsonfiles/patents/doc_other_identifier.json \
	./jsonfiles/guidelines/document.json \
	./jsonfiles/guidelines/docotherid.json
|
@ -0,0 +1,18 @@
|
||||||
|
# MANUAL STEPS FOR clinical trials
|
||||||
|
|
||||||
|
1) cd /data/ftp/d4i/clinical_trials
|
||||||
|
|
||||||
|
2) Recreate the table in the DB using
|
||||||
|
|
||||||
|
DROP TABLE clinical_trials;
|
||||||
|
|
||||||
|
CREATE TABLE clinical_trials (
|
||||||
|
doi text,
|
||||||
|
trial_number text,
|
||||||
|
trial_registry text
|
||||||
|
);
|
||||||
|
|
||||||
|
3) Insert data:
|
||||||
|
|
||||||
|
COPY clinical_trials(doi,trial_number,trial_registry) FROM '/data/ftp/d4i/clinical_trials/clintrial.txt' DELIMITER E'\t';
|
||||||
|
DELETE FROM clinical_trials where doi = 'pub-with-clin-trial';
|
|
@ -0,0 +1,37 @@
|
||||||
|
#!/bin/bash

# Imports the D4I company summary data:
#   1. converts the JSON summary into CSV with jq
#   2. recreates the "companydata" postgres database from schema.sql
#   3. bulk-loads the CSV into the companymetrics table
#   4. exports the table as JSON for the generic importer
#
# FIX: all variable expansions are now quoted (paths with spaces no longer
# break the script) and the useless `cat | jq` was replaced by passing the
# file directly to jq.

detailsFile=../../orig/CompanyData/D4I_companies_summary.txt

workdir=/tmp/companydata
rm -rf "$workdir" && mkdir "$workdir"

echo
echo "CompanyData Import:"

#--------------------------------
echo " - Generating csv files"
csvDetails="$workdir/details.csv"
# flatten the {orgid: {metrics...}} object into one CSV row per organization
jq 'to_entries' "$detailsFile" | jq 'map([.key, .value."data gathered?", .value."tangible + pre_market", .value."tangible + market", .value."intangible + pre_market", .value."intangible + market", .value."innovation?"])' | jq .[] | jq -r @csv > "$csvDetails"

#--------------------------------
echo " - Recreating the companydata database"
dropdb companydata --if-exists;
createdb companydata;
psql companydata -f schema.sql

if [[ -f "$csvDetails" ]]; then
	echo " - Importing details: $csvDetails"
	psql companydata -c "COPY companymetrics(orgid, data_gathered, tangible_pre_market, tangible_market, intangible_pre_market, intangible_market, innovation) FROM '$csvDetails' CSV;"
else
	echo " - Invalid file: $csvDetails"
fi

#--------------------------------
echo " - Generating json files"
rm -f ../../jsonfiles/companydata/*.json
# the sed collapses double backslashes produced by psql's text output
psql companydata -f metrics2json.sql | sed 's/\\\\/\\/g' > ../../jsonfiles/companydata/orgCompanyMetrics.json

echo "Done."
echo
|
@ -0,0 +1,40 @@
|
||||||
|
#!/bin/bash
|
||||||
|
|
||||||
|
detailsFile=../../orig/CompanyData/D4I_company_innovation_texts.json
|
||||||
|
|
||||||
|
workdir=/tmp/companydata_texts
|
||||||
|
rm -rf "$workdir" && mkdir "$workdir"
|
||||||
|
|
||||||
|
echo
|
||||||
|
echo "CompanyData Innovation texts Import:"
|
||||||
|
|
||||||
|
#--------------------------------
|
||||||
|
echo " - Generating csv files"
|
||||||
|
csvDetails="$workdir/details.csv"
|
||||||
|
cat $detailsFile | jq --slurp -r '(map(keys) | add | unique) as $cols | map(. as $row | $cols | map($row[.])) as $rows | $cols, $rows[] | @csv' > $csvDetails
|
||||||
|
|
||||||
|
#--------------------------------
|
||||||
|
echo " - Recreating the companydata_texts database"
|
||||||
|
dropdb companydata_texts --if-exists;
|
||||||
|
createdb companydata_texts;
|
||||||
|
psql companydata_texts -f schema_texts.sql
|
||||||
|
|
||||||
|
if [[ -f "$csvDetails" ]]; then
|
||||||
|
echo " - Importing details: $csvDetails"
|
||||||
|
psql companydata_texts -c "COPY data(company_id,prediction_revised,site_url,source,text_clean_gentle,text_clean_strong,text_is_duplicated) FROM '$csvDetails' CSV HEADER;"
|
||||||
|
else
|
||||||
|
echo " - Invalid file: $csvDetails"
|
||||||
|
fi
|
||||||
|
|
||||||
|
#--------------------------------
|
||||||
|
echo " - Generating json files"
|
||||||
|
rm -f ../../jsonfiles/companydata_texts/*.json
|
||||||
|
psql companydata_texts -f innovationTexts2json.sql | sed 's/\\\\/\\/g' > ../../jsonfiles/companydata_texts/orgCompanyInnovationTexts.json
|
||||||
|
|
||||||
|
echo "Done."
|
||||||
|
echo
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
|
|
|
@ -0,0 +1,11 @@
|
||||||
|
COPY (SELECT row_to_json(t) FROM (
|
||||||
|
SELECT
|
||||||
|
'20|ec__________::'||MD5(company_id) AS "orgId",
|
||||||
|
prediction_revised AS "predictionRevised",
|
||||||
|
site_url AS "siteUrl",
|
||||||
|
source AS "source",
|
||||||
|
text_clean_gentle AS "textCleanGentle",
|
||||||
|
text_clean_strong AS "textCleanStrong",
|
||||||
|
text_is_duplicated AS "duplicated"
|
||||||
|
FROM data
|
||||||
|
) t) TO STDOUT;
|
|
@ -0,0 +1,15 @@
|
||||||
|
COPY (SELECT row_to_json(t) FROM (
|
||||||
|
SELECT
|
||||||
|
'20|ec__________::'||MD5(orgid) AS "orgId",
|
||||||
|
(LOWER(data_gathered)='yes') AS "dataGathered",
|
||||||
|
tangible_pre_market AS "tangiblePreMarket",
|
||||||
|
tangible_market AS "tangibleMarket",
|
||||||
|
intangible_pre_market AS "intangiblePreMarket",
|
||||||
|
intangible_market AS "intangibleMarket",
|
||||||
|
CASE
|
||||||
|
WHEN innovation='0' THEN false
|
||||||
|
WHEN innovation='1' THEN true
|
||||||
|
ELSE NULL
|
||||||
|
END AS "innovation"
|
||||||
|
FROM companymetrics
|
||||||
|
) t) TO STDOUT;
|
|
@ -0,0 +1,11 @@
|
||||||
|
CREATE TABLE companymetrics (
|
||||||
|
orgid text,
|
||||||
|
data_gathered varchar(5),
|
||||||
|
tangible_pre_market int,
|
||||||
|
tangible_market int,
|
||||||
|
intangible_pre_market int,
|
||||||
|
intangible_market int,
|
||||||
|
innovation varchar(5)
|
||||||
|
);
|
||||||
|
|
||||||
|
|
|
@ -0,0 +1,10 @@
|
||||||
|
CREATE TABLE data (
|
||||||
|
company_id text,
|
||||||
|
prediction_revised float,
|
||||||
|
site_url text,
|
||||||
|
source text,
|
||||||
|
text_clean_gentle text,
|
||||||
|
text_clean_strong text,
|
||||||
|
text_is_duplicated boolean
|
||||||
|
);
|
||||||
|
|
|
@ -0,0 +1,21 @@
|
||||||
|
Paolo, Vilius, all
|
||||||
|
|
||||||
|
Last week I was in London attending a "special" event for publishers and I
|
||||||
|
had the opportunity to meet a guy from the Strategic Initiatives dep. of
|
||||||
|
Crossref who pointed me to the Events API
|
||||||
|
(https://www.crossref.org/services/event-data/). Such API links
|
||||||
|
publications to several external sources including Patents, Twitter,
|
||||||
|
Wikipedia, Reddit, StackExchange, Wordpress etc.
|
||||||
|
Running some queries on their db we saw that for Twitter they do have data
|
||||||
|
for more than a year.
|
||||||
|
For patents they are based on Cambia's Lens (https://www.lens.org/) -and
|
||||||
|
they do have links from patents to pubs-. Unfortunately for some reason,
|
||||||
|
Cambia uploaded data only once and then stopped. They will talk to them to
|
||||||
|
see what has happened.
|
||||||
|
In every case, I think that such API is very useful both for D4I and OA,
|
||||||
|
and we should have a look and possibly integrate such data as soon as

possible.
|
||||||
|
|
||||||
|
All the best,
|
||||||
|
|
||||||
|
Omiros
|
|
@ -0,0 +1,32 @@
|
||||||
|
COPY (SELECT row_to_json(t) FROM (
|
||||||
|
SELECT
|
||||||
|
pmcid AS "id",
|
||||||
|
'pmcid' AS "type"
|
||||||
|
FROM data
|
||||||
|
WHERE pmcid IS NOT NULL AND pmcid != '' AND pmcid not ilike 'none'
|
||||||
|
|
||||||
|
UNION ALL
|
||||||
|
|
||||||
|
SELECT
|
||||||
|
pmid AS "id",
|
||||||
|
'pmid' AS "type"
|
||||||
|
FROM data
|
||||||
|
WHERE pmid IS NOT NULL AND pmid != '' AND pmid not ilike 'none'
|
||||||
|
|
||||||
|
UNION ALL
|
||||||
|
|
||||||
|
SELECT
|
||||||
|
doi AS "id",
|
||||||
|
'doi' AS "type"
|
||||||
|
FROM data
|
||||||
|
WHERE doi IS NOT NULL AND doi != '' AND doi not ilike 'none'
|
||||||
|
|
||||||
|
UNION ALL
|
||||||
|
|
||||||
|
SELECT
|
||||||
|
d_b_id AS "id",
|
||||||
|
'drug_bank_id' AS "type"
|
||||||
|
FROM data
|
||||||
|
WHERE d_b_id IS NOT NULL AND d_b_id != '' AND d_b_id not ilike 'none'
|
||||||
|
|
||||||
|
) t) TO STDOUT;
|
|
@ -0,0 +1,36 @@
|
||||||
|
COPY (SELECT row_to_json(t) FROM (
|
||||||
|
SELECT
|
||||||
|
'40|MOCK_PROJECT::'||MD5(funder) AS "projectId",
|
||||||
|
pmcid AS "docId",
|
||||||
|
'pmcid' AS "docIdType"
|
||||||
|
FROM data
|
||||||
|
WHERE pmcid IS NOT NULL AND pmcid != '' AND pmcid not ilike 'none'
|
||||||
|
|
||||||
|
UNION ALL
|
||||||
|
|
||||||
|
SELECT
|
||||||
|
'40|MOCK_PROJECT::'||MD5(funder) AS "projectId",
|
||||||
|
pmid AS "docId",
|
||||||
|
'pmid' AS "docIdType"
|
||||||
|
FROM data
|
||||||
|
WHERE pmid IS NOT NULL AND pmid != '' AND pmid not ilike 'none'
|
||||||
|
|
||||||
|
UNION ALL
|
||||||
|
|
||||||
|
SELECT
|
||||||
|
'40|MOCK_PROJECT::'||MD5(funder) AS "projectId",
|
||||||
|
doi AS "docId",
|
||||||
|
'doi' AS "docIdType"
|
||||||
|
FROM data
|
||||||
|
WHERE doi IS NOT NULL AND doi != '' AND doi not ilike 'none'
|
||||||
|
|
||||||
|
UNION ALL
|
||||||
|
|
||||||
|
SELECT
|
||||||
|
'40|MOCK_PROJECT::'||MD5(funder) AS "projectId",
|
||||||
|
d_b_id AS "docId",
|
||||||
|
'drug_bank_id' AS "docIdType"
|
||||||
|
FROM data
|
||||||
|
WHERE d_b_id IS NOT NULL AND d_b_id != '' AND d_b_id not ilike 'none'
|
||||||
|
|
||||||
|
) t) TO STDOUT;
|
|
@ -0,0 +1,6 @@
|
||||||
|
COPY (SELECT row_to_json(t) FROM (SELECT distinct
|
||||||
|
'40|MOCK_PROJECT::'||MD5(funder) AS "id",
|
||||||
|
'MOCK PROJECT' AS "title",
|
||||||
|
funder AS "funder"
|
||||||
|
FROM data
|
||||||
|
) t) TO STDOUT;
|
|
@ -0,0 +1,10 @@
|
||||||
|
CREATE TABLE data (
|
||||||
|
id text,
|
||||||
|
d_b_id text,
|
||||||
|
doi text,
|
||||||
|
pmcid text,
|
||||||
|
pmid text,
|
||||||
|
drug_substance text,
|
||||||
|
funder text,
|
||||||
|
section_of_drug_bank_entry_where_citation_occured text
|
||||||
|
)
|
|
@ -0,0 +1,52 @@
|
||||||
|
#!/bin/bash
|
||||||
|
|
||||||
|
excelFile="../../orig/drug_bank_database/Publication_citations_in_Drug_Bank_database.xlsx"
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
|
workdir=/tmp/drugbank
|
||||||
|
rm -rf "$workdir" && mkdir "$workdir"
|
||||||
|
|
||||||
|
|
||||||
|
echo
|
||||||
|
echo "Links from drugbank db Import:"
|
||||||
|
|
||||||
|
|
||||||
|
#--------------------------------
|
||||||
|
echo " - Generating csv file"
|
||||||
|
csv="$workdir/drugbank.csv"
|
||||||
|
xlsx2csv -c UTF-8 "$excelFile" > $csv
|
||||||
|
|
||||||
|
#--------------------------------
|
||||||
|
echo " - Recreating the drugbank database"
|
||||||
|
dbname=drugbank
|
||||||
|
|
||||||
|
dropdb $dbname --if-exists;
|
||||||
|
createdb $dbname;
|
||||||
|
psql $dbname -f schema.sql
|
||||||
|
|
||||||
|
if [[ -f "$csv" ]]; then
|
||||||
|
echo " - Importing data: $csv"
|
||||||
|
psql $dbname -c "COPY data(id,d_b_id,doi,pmcid,pmid,drug_substance,funder,section_of_drug_bank_entry_where_citation_occured) FROM '$csv' CSV HEADER;"
|
||||||
|
else
|
||||||
|
echo " - Invalid file: $csv"
|
||||||
|
fi
|
||||||
|
|
||||||
|
|
||||||
|
echo " - Fix funder names"
|
||||||
|
|
||||||
|
psql $dbname -c "UPDATE data SET funder='EC' WHERE funder = 'European Research Council'"
|
||||||
|
psql $dbname -c "UPDATE data SET funder='Austrian Science Fund FWF' WHERE funder = 'FWF'"
|
||||||
|
psql $dbname -c "UPDATE data SET funder='Swiss National Science Foundation SNSF' WHERE funder = 'Swiss National Science Foundation'"
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
|
#--------------------------------
|
||||||
|
echo " - Generating json files"
|
||||||
|
rm -f ../../jsonfiles/drug_bank_database/*.json
|
||||||
|
psql $dbname -f projects2json.sql | sed 's/\\\\/\\/g' > ../../jsonfiles/drug_bank_database/project.json
|
||||||
|
psql $dbname -f docOtherId2json.sql | sed 's/\\\\/\\/g' > ../../jsonfiles/drug_bank_database/docotherid.json
|
||||||
|
psql $dbname -f projDocOtherIds2json.sql | sed 's/\\\\/\\/g' > ../../jsonfiles/drug_bank_database/projectdocotherid.json
|
||||||
|
|
||||||
|
echo "Done."
|
||||||
|
echo
|
|
@ -0,0 +1,32 @@
|
||||||
|
COPY (SELECT row_to_json(t) FROM (
|
||||||
|
SELECT
|
||||||
|
pmcid AS "id",
|
||||||
|
'pmcid' AS "type"
|
||||||
|
FROM data
|
||||||
|
WHERE pmcid IS NOT NULL AND pmcid != '' AND pmcid not ilike 'none'
|
||||||
|
|
||||||
|
UNION ALL
|
||||||
|
|
||||||
|
SELECT
|
||||||
|
pmid AS "id",
|
||||||
|
'pmid' AS "type"
|
||||||
|
FROM data
|
||||||
|
WHERE pmid IS NOT NULL AND pmid != '' AND pmid not ilike 'none'
|
||||||
|
|
||||||
|
UNION ALL
|
||||||
|
|
||||||
|
SELECT
|
||||||
|
doi AS "id",
|
||||||
|
'doi' AS "type"
|
||||||
|
FROM data
|
||||||
|
WHERE doi IS NOT NULL AND doi != '' AND doi not ilike 'none'
|
||||||
|
|
||||||
|
UNION ALL
|
||||||
|
|
||||||
|
SELECT
|
||||||
|
d_b_id AS "id",
|
||||||
|
'drug_bank_id' AS "type"
|
||||||
|
FROM data
|
||||||
|
WHERE d_b_id IS NOT NULL AND d_b_id != '' AND d_b_id not ilike 'none'
|
||||||
|
|
||||||
|
) t) TO STDOUT;
|
|
@ -0,0 +1,36 @@
|
||||||
|
COPY (SELECT row_to_json(t) FROM (
|
||||||
|
SELECT
|
||||||
|
'40|corda_______::'||MD5(ec_project_code) AS "projectId",
|
||||||
|
pmcid AS "docId",
|
||||||
|
'pmcid' AS "docIdType"
|
||||||
|
FROM data
|
||||||
|
WHERE pmcid IS NOT NULL AND pmcid != '' AND pmcid not ilike 'none' AND ec_project_code not ilike 'unknown' AND funding_scheme ilike 'FP7%'
|
||||||
|
|
||||||
|
UNION ALL
|
||||||
|
|
||||||
|
SELECT
|
||||||
|
'40|corda_______::'||MD5(ec_project_code) AS "projectId",
|
||||||
|
pmid AS "docId",
|
||||||
|
'pmid' AS "docIdType"
|
||||||
|
FROM data
|
||||||
|
WHERE pmid IS NOT NULL AND pmid != '' AND pmid not ilike 'none' AND ec_project_code not ilike 'unknown' AND funding_scheme ilike 'FP7%'
|
||||||
|
|
||||||
|
UNION ALL
|
||||||
|
|
||||||
|
SELECT
|
||||||
|
'40|corda_______::'||MD5(ec_project_code) AS "projectId",
|
||||||
|
doi AS "docId",
|
||||||
|
'doi' AS "docIdType"
|
||||||
|
FROM data
|
||||||
|
WHERE doi IS NOT NULL AND doi != '' AND doi not ilike 'none' AND ec_project_code not ilike 'unknown' AND funding_scheme ilike 'FP7%'
|
||||||
|
|
||||||
|
UNION ALL
|
||||||
|
|
||||||
|
SELECT
|
||||||
|
'40|corda_______::'||MD5(ec_project_code) AS "projectId",
|
||||||
|
d_b_id AS "docId",
|
||||||
|
'drug_bank_id' AS "docIdType"
|
||||||
|
FROM data
|
||||||
|
WHERE d_b_id IS NOT NULL AND d_b_id != '' AND d_b_id not ilike 'none' AND ec_project_code not ilike 'unknown' AND funding_scheme ilike 'FP7%'
|
||||||
|
|
||||||
|
) t) TO STDOUT;
|
|
@ -0,0 +1,11 @@
|
||||||
|
CREATE TABLE data (
|
||||||
|
doi text,
|
||||||
|
d_b_id text,
|
||||||
|
pmcid text,
|
||||||
|
pmid text,
|
||||||
|
drug_substance text,
|
||||||
|
ec_project_acronym text,
|
||||||
|
ec_project_code text,
|
||||||
|
funding_scheme text,
|
||||||
|
match_type text
|
||||||
|
);
|
|
@ -0,0 +1,39 @@
|
||||||
|
#!/bin/bash
# Imports the DrugBank publication/project links (part 2) into a local
# postgres database (drugbank_p2) and exports them as json for the API.

excelFile="../../orig/drug_bank_database/DB_Publication_project_links.xlsx"

workdir=/tmp/drugbank_part2
rm -rf "$workdir" && mkdir "$workdir"

echo
echo "Links from drugbank db Import:"

#--------------------------------
echo " - Generating csv file"
csv="$workdir/drugbank.csv"
xlsx2csv -c UTF-8 "$excelFile" > "$csv"

#--------------------------------
echo " - Recreating the drugbank database"
dbname=drugbank_p2

dropdb $dbname --if-exists;
createdb $dbname;
psql $dbname -f schema.sql

if [[ -f "$csv" ]]; then
	echo " - Importing data: $csv"
	psql $dbname -c "COPY data(doi,d_b_id,pmcid,pmid,drug_substance,ec_project_acronym,ec_project_code,funding_scheme,match_type) FROM '$csv' CSV HEADER;"
else
	echo " - Invalid file: $csv"
fi

#--------------------------------
echo " - Generating json files"
# BUG FIX: this script writes into drug_bank_database_part2, so that is the
# directory to clean. The old path (drug_bank_database) deleted the json
# files generated by the part-1 script, including its project.json.
rm -f ../../jsonfiles/drug_bank_database_part2/*.json
# The sed collapses the double backslashes that psql's COPY TO STDOUT escaping adds.
psql $dbname -f docOtherId2json.sql | sed 's/\\\\/\\/g' > ../../jsonfiles/drug_bank_database_part2/docotherid.json
psql $dbname -f projDocOtherIds2json.sql | sed 's/\\\\/\\/g' > ../../jsonfiles/drug_bank_database_part2/projectdocotherid.json

echo "Done."
echo
|
|
@ -0,0 +1,56 @@
|
||||||
|
#!/bin/bash
|
||||||
|
|
||||||
|
urlOrgFp7=http://cordis.europa.eu/data/cordis-fp7organizations.xlsx
|
||||||
|
urlOrgH2020=http://cordis.europa.eu/data/cordis-h2020organizations.xlsx
|
||||||
|
|
||||||
|
workdir=/tmp/cordis
|
||||||
|
rm -rf "$workdir" && mkdir "$workdir"
|
||||||
|
|
||||||
|
echo
|
||||||
|
echo "cordis Import:"
|
||||||
|
|
||||||
|
#--------------------------------
|
||||||
|
echo " - Downloading files"
|
||||||
|
wget "$urlOrgFp7" -O "$workdir/fp7orgs.xlsx" -q --show-progress
|
||||||
|
wget "$urlOrgH2020" -O "$workdir/h2020orgs.xlsx" -q --show-progress
|
||||||
|
|
||||||
|
#--------------------------------
|
||||||
|
echo " - Generating csv files"
|
||||||
|
csvfp7="$workdir/fp7orgs.csv"
|
||||||
|
csvh2020="$workdir/h2020orgs.csv"
|
||||||
|
xlsx2csv -c UTF-8 "$workdir/fp7orgs.xlsx" > $csvfp7
|
||||||
|
xlsx2csv -c UTF-8 "$workdir/h2020orgs.xlsx" > $csvh2020
|
||||||
|
#--------------------------------
|
||||||
|
echo " - Recreating the cordis database"
|
||||||
|
dropdb cordis --if-exists;
|
||||||
|
createdb cordis;
|
||||||
|
psql cordis -f schema.sql
|
||||||
|
|
||||||
|
if [[ -f "$csvfp7" ]]; then
|
||||||
|
echo " - Importing FP7 participants: $csvfp7"
|
||||||
|
psql cordis -c "COPY participants(projectrcn,projectiD,projectacronym,role,orgid,orgname,orgshortname,activitytype,endofparticipation,eccontribution,country,street,city,postCode,organizationurl,vatnumber,contactform,contacttype,contacttitle,contactfirstnames,contactlastnames,contactfunction,contacttelephonenumber,contactfaxnumber) FROM '$csvfp7' CSV HEADER;"
|
||||||
|
psql cordis -c "UPDATE participants SET fundingprogram='FP7' WHERE fundingprogram IS NULL"
|
||||||
|
else
|
||||||
|
echo " - Invalid file fp7: $csvfp7"
|
||||||
|
fi
|
||||||
|
|
||||||
|
if [[ -f "$csvh2020" ]]; then
|
||||||
|
echo " - Importing H2020 participants: $csvh2020"
|
||||||
|
psql cordis -c "COPY participants(projectrcn,projectiD,projectacronym,role,orgid,orgname,orgshortname,activitytype,endofparticipation,eccontribution,country,street,city,postCode,organizationurl,vatnumber,contactform,contacttype,contacttitle,contactfirstnames,contactlastnames,contactfunction,contacttelephonenumber,contactfaxnumber) FROM '$csvh2020' CSV HEADER;"
|
||||||
|
psql cordis -c "UPDATE participants SET fundingprogram='H2020' WHERE fundingprogram IS NULL"
|
||||||
|
else
|
||||||
|
echo " - Invalid file h2020: $csvh2020"
|
||||||
|
fi
|
||||||
|
|
||||||
|
#--------------------------------
|
||||||
|
echo " - Generating json files"
|
||||||
|
rm -f ../../jsonfiles/cordis/*.json
|
||||||
|
psql cordis -f projects2json.sql | sed 's/\\\\/\\/g' > ../../jsonfiles/cordis/project.json
|
||||||
|
psql cordis -f orgs2json.sql | sed 's/\\\\/\\/g' > ../../jsonfiles/cordis/organization.json
|
||||||
|
psql cordis -f projOrg2json.sql | sed 's/\\\\/\\/g' > ../../jsonfiles/cordis/projectOrganization.json
|
||||||
|
psql cordis -f projOtherId2json.sql | sed 's/\\\\/\\/g' > ../../jsonfiles/cordis/projectOtherId.json
|
||||||
|
psql cordis -f orgOtherId2json.sql | sed 's/\\\\/\\/g' > ../../jsonfiles/cordis/organizationOtherId.json
|
||||||
|
|
||||||
|
echo "Done."
|
||||||
|
echo
|
||||||
|
|
|
@ -0,0 +1,9 @@
|
||||||
|
COPY (SELECT row_to_json(t) FROM (
|
||||||
|
SELECT
|
||||||
|
'20|ec__________::'||MD5(orgid) AS "orgId",
|
||||||
|
orgid AS "id",
|
||||||
|
'ec:PIC' AS "type"
|
||||||
|
FROM participants
|
||||||
|
WHERE orgid IS NOT NULL
|
||||||
|
GROUP BY orgid
|
||||||
|
) t) TO STDOUT;
|
|
@ -0,0 +1,13 @@
|
||||||
|
COPY (SELECT row_to_json(t) FROM (SELECT
|
||||||
|
'20|ec__________::'||MD5(orgid) AS "id",
|
||||||
|
MAX(orgname) AS "name",
|
||||||
|
MAX(orgshortname) AS "shortName",
|
||||||
|
MAX(country) AS "country",
|
||||||
|
MAX(street) AS "street",
|
||||||
|
MAX(city) AS "city",
|
||||||
|
MAX(postcode) AS "postCode",
|
||||||
|
MAX(organizationurl) AS "url"
|
||||||
|
FROM participants
|
||||||
|
WHERE orgid IS NOT NULL
|
||||||
|
GROUP BY orgid
|
||||||
|
) t) TO STDOUT;
|
|
@ -0,0 +1,26 @@
|
||||||
|
COPY (SELECT row_to_json(t) FROM (
|
||||||
|
SELECT
|
||||||
|
CASE
|
||||||
|
WHEN fundingprogram='FP7' THEN '40|corda_______::'||MD5(projectid)
|
||||||
|
WHEN fundingprogram='H2020' THEN '40|corda__h2020::'||MD5(projectid)
|
||||||
|
ELSE '40|unknown_____::'||MD5(projectid)
|
||||||
|
END AS "projectId",
|
||||||
|
'20|ec__________::'||MD5(orgid) AS "orgId",
|
||||||
|
MAX(role) AS "role",
|
||||||
|
MAX(activitytype) AS "activityType",
|
||||||
|
MAX(endofparticipation) AS "endOfParticipation",
|
||||||
|
MAX(eccontribution) AS "ecContribution",
|
||||||
|
MAX(contacttype) AS "contactType",
|
||||||
|
MAX(contacttitle) AS "contactTitle",
|
||||||
|
MAX(contactfirstnames) AS "contactFirstNames",
|
||||||
|
MAX(contactlastnames) AS "contactLastNames",
|
||||||
|
MAX(contactfunction) AS "contactFunction",
|
||||||
|
MAX(contacttelephonenumber) AS "contactTelephoneNumber",
|
||||||
|
MAX(contactfaxnumber) AS "contactFaxNumber",
|
||||||
|
MAX(contactform) AS "contactForm"
|
||||||
|
FROM participants
|
||||||
|
WHERE orgid IS NOT NULL AND projectid IS NOT NULL
|
||||||
|
GROUP BY orgid, projectid, fundingprogram
|
||||||
|
) t) TO STDOUT;
|
||||||
|
|
||||||
|
|
|
@ -0,0 +1,27 @@
|
||||||
|
COPY (SELECT row_to_json(t) FROM (
|
||||||
|
SELECT
|
||||||
|
CASE
|
||||||
|
WHEN fundingprogram='FP7' THEN '40|corda_______::'||MD5(projectid)
|
||||||
|
WHEN fundingprogram='H2020' THEN '40|corda__h2020::'||MD5(projectid)
|
||||||
|
ELSE '40|unknown_____::'||MD5(projectid)
|
||||||
|
END AS "projectId",
|
||||||
|
projectid AS "id",
|
||||||
|
'ec:grant_id' AS "type"
|
||||||
|
FROM participants
|
||||||
|
WHERE projectid IS NOT NULL
|
||||||
|
GROUP BY projectid, fundingprogram
|
||||||
|
|
||||||
|
UNION ALL
|
||||||
|
|
||||||
|
SELECT
|
||||||
|
CASE
|
||||||
|
WHEN fundingprogram='FP7' THEN '40|corda_______::'||MD5(projectid)
|
||||||
|
WHEN fundingprogram='H2020' THEN '40|corda__h2020::'||MD5(projectid)
|
||||||
|
ELSE '40|unknown_____::'||MD5(projectid)
|
||||||
|
END AS "projectId",
|
||||||
|
MAX(projectrcn) AS "id",
|
||||||
|
'ec:RCN' AS "type"
|
||||||
|
FROM participants
|
||||||
|
WHERE projectid IS NOT NULL AND projectrcn IS NOT NULL
|
||||||
|
GROUP BY projectid, fundingprogram
|
||||||
|
) t) TO STDOUT;
|
|
@ -0,0 +1,16 @@
|
||||||
|
COPY (SELECT row_to_json(t) FROM (
|
||||||
|
SELECT
|
||||||
|
CASE
|
||||||
|
WHEN fundingprogram='FP7' THEN '40|corda_______::'||MD5(projectid)
|
||||||
|
WHEN fundingprogram='H2020' THEN '40|corda__h2020::'||MD5(projectid)
|
||||||
|
ELSE '40|unknown_____::'||MD5(projectid)
|
||||||
|
END AS "id",
|
||||||
|
MAX(projectacronym) AS "acronym",
|
||||||
|
'EC' AS "funder",
|
||||||
|
fundingprogram AS "fundingLevel0"
|
||||||
|
FROM participants
|
||||||
|
WHERE projectid IS NOT NULL
|
||||||
|
GROUP BY
|
||||||
|
projectid,
|
||||||
|
fundingprogram
|
||||||
|
) t) TO STDOUT;
|
|
@ -0,0 +1,28 @@
|
||||||
|
CREATE TABLE participants (
|
||||||
|
projectrcn text,
|
||||||
|
projectid text,
|
||||||
|
projectacronym text,
|
||||||
|
role text,
|
||||||
|
orgid text,
|
||||||
|
orgname text,
|
||||||
|
orgshortname text,
|
||||||
|
activitytype text,
|
||||||
|
endofparticipation text,
|
||||||
|
eccontribution text,
|
||||||
|
country text,
|
||||||
|
street text,
|
||||||
|
city text,
|
||||||
|
postcode text,
|
||||||
|
organizationurl text,
|
||||||
|
vatnumber text,
|
||||||
|
contacttype text,
|
||||||
|
contacttitle text,
|
||||||
|
contactfirstnames text,
|
||||||
|
contactlastnames text,
|
||||||
|
contactfunction text,
|
||||||
|
contacttelephonenumber text,
|
||||||
|
contactfaxnumber text,
|
||||||
|
contactform text,
|
||||||
|
fundingprogram varchar(10)
|
||||||
|
);
|
||||||
|
|
|
@ -0,0 +1 @@
|
||||||
|
The script should be launched in OpenAIRE production server (services.openaire.eu)
|
|
@ -0,0 +1,16 @@
|
||||||
|
#!/bin/bash
|
||||||
|
|
||||||
|
BASEDIR=/tmp/ecProjectsOpenaire
|
||||||
|
|
||||||
|
echo "Saving files in $BASEDIR ..."
|
||||||
|
|
||||||
|
rm -rf $BASEDIR
|
||||||
|
mkdir $BASEDIR
|
||||||
|
|
||||||
|
psql -h postgresql.services.openaire.eu -U dnet dnet_openaireplus -f projects2json.sql | sed 's/\\\\/\\/g' > $BASEDIR/project.json
|
||||||
|
psql -h postgresql.services.openaire.eu -U dnet dnet_openaireplus -f orgs2json.sql | sed 's/\\\\/\\/g' > $BASEDIR/organization.json
|
||||||
|
psql -h postgresql.services.openaire.eu -U dnet dnet_openaireplus -f projOrg2json.sql | sed 's/\\\\/\\/g' > $BASEDIR/projectOrganization.json
|
||||||
|
psql -h postgresql.services.openaire.eu -U dnet dnet_openaireplus -f orgOtherId2json.sql | sed 's/\\\\/\\/g' > $BASEDIR/organizationOtherId.json
|
||||||
|
psql -h postgresql.services.openaire.eu -U dnet dnet_openaireplus -f projOtherId2json.sql | sed 's/\\\\/\\/g' > $BASEDIR/projectOtherId.json
|
||||||
|
|
||||||
|
echo Done.
|
|
@ -0,0 +1,8 @@
|
||||||
|
COPY (SELECT row_to_json(t) FROM (
|
||||||
|
SELECT
|
||||||
|
'20|ec__________::'||MD5(substring(id from 15)) AS "orgId",
|
||||||
|
substring(id from 15) AS "id",
|
||||||
|
'ec:PIC' AS "type"
|
||||||
|
FROM dsm_organizations
|
||||||
|
WHERE id LIKE 'corda%'
|
||||||
|
) t) TO STDOUT;
|
|
@ -0,0 +1,28 @@
|
||||||
|
COPY (SELECT row_to_json(t) FROM (SELECT
|
||||||
|
'20|ec__________::'||MD5(substring(o.id from 15)) AS "id",
|
||||||
|
o.legalname AS "name",
|
||||||
|
o.legalshortname AS "shortName",
|
||||||
|
o.country AS "country",
|
||||||
|
o.websiteurl AS "url",
|
||||||
|
o.ec_legalbody AS "ecLegalBody",
|
||||||
|
o.ec_legalperson AS "ecLegalPerson",
|
||||||
|
o.ec_nonprofit AS "ecNonProfit",
|
||||||
|
o.ec_researchorganization AS "ecResearchOrganization",
|
||||||
|
o.ec_highereducation AS "ecHigherEducation",
|
||||||
|
o.ec_internationalorganizationeurinterests AS "ecInternationalOrganizationEurInterests",
|
||||||
|
o.ec_internationalorganization AS "ecInternationalOrganization",
|
||||||
|
o.ec_enterprise AS "ecEnterprise",
|
||||||
|
o.ec_smevalidated AS "ecSmeValidated",
|
||||||
|
o.ec_nutscode AS "ecNutsCode"
|
||||||
|
FROM
|
||||||
|
dsm_organizations o
|
||||||
|
LEFT OUTER JOIN project_organization po ON (po.resporganization = o.id)
|
||||||
|
WHERE
|
||||||
|
o.id LIKE 'corda%'
|
||||||
|
) t) TO STDOUT;
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
|
|
|
@ -0,0 +1,13 @@
|
||||||
|
COPY (SELECT row_to_json(t) FROM (SELECT
|
||||||
|
'40|'||substring(project from 1 for 12)||'::'||MD5(substring(project from 15)) AS "projectId",
|
||||||
|
'20|ec__________::'||MD5(substring(resporganization from 15)) AS "orgId",
|
||||||
|
semanticclass AS "role"
|
||||||
|
FROM
|
||||||
|
project_organization
|
||||||
|
WHERE
|
||||||
|
project LIKE 'corda%'
|
||||||
|
) t) TO STDOUT;
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
|
|
|
@ -0,0 +1,8 @@
|
||||||
|
COPY (SELECT row_to_json(t) FROM (
|
||||||
|
SELECT
|
||||||
|
'40|'||substring(id from 1 for 12)||'::'||MD5(substring(id from 15)) AS "projectId",
|
||||||
|
code AS "id",
|
||||||
|
'ec:grant_id' AS "type"
|
||||||
|
FROM projects
|
||||||
|
WHERE id LIKE 'corda%'
|
||||||
|
) t) TO STDOUT;
|
|
@ -0,0 +1,23 @@
|
||||||
|
COPY (SELECT row_to_json(t) FROM (SELECT
|
||||||
|
'40|'||substring(p.id from 1 for 12)||'::'||MD5(substring(p.id from 15)) AS "id",
|
||||||
|
p.title AS "title",
|
||||||
|
p.acronym AS "acronym",
|
||||||
|
p.call_identifier AS "callId",
|
||||||
|
split_part(pf.funding, '::', 2) AS "funder",
|
||||||
|
split_part(pf.funding, '::', 3) AS "fundingLevel0",
|
||||||
|
split_part(pf.funding, '::', 4) AS "fundingLevel1",
|
||||||
|
split_part(pf.funding, '::', 5) AS "fundingLevel2",
|
||||||
|
p.startdate AS "startDate",
|
||||||
|
p.enddate AS "endDate",
|
||||||
|
p.websiteurl AS "websiteUrl",
|
||||||
|
p.keywords AS "keywords",
|
||||||
|
p.contracttypescheme||':'||p.contracttypeclass AS "contractType",
|
||||||
|
p.ec_sc39 AS "ecSc39",
|
||||||
|
p.oa_mandate_for_publications AS "oaMandateForPublications",
|
||||||
|
p.ec_article29_3 AS "ecArticle29_3"
|
||||||
|
FROM
|
||||||
|
projects p
|
||||||
|
LEFT OUTER JOIN project_fundingpath pf ON (pf.project = p.id)
|
||||||
|
WHERE
|
||||||
|
p.id LIKE 'corda%'
|
||||||
|
) t) TO STDOUT;
|
|
@ -0,0 +1,24 @@
|
||||||
|
COPY (SELECT row_to_json(t) FROM (
|
||||||
|
SELECT
|
||||||
|
pmcid AS "id",
|
||||||
|
'pmcid' AS "type"
|
||||||
|
FROM data
|
||||||
|
WHERE pmcid IS NOT NULL AND pmcid != ''
|
||||||
|
|
||||||
|
UNION ALL
|
||||||
|
|
||||||
|
SELECT
|
||||||
|
pmid AS "id",
|
||||||
|
'pmid' AS "type"
|
||||||
|
FROM data
|
||||||
|
WHERE pmid IS NOT NULL AND pmid != ''
|
||||||
|
|
||||||
|
UNION ALL
|
||||||
|
|
||||||
|
SELECT
|
||||||
|
doi AS "id",
|
||||||
|
'doi' AS "type"
|
||||||
|
FROM data
|
||||||
|
WHERE doi IS NOT NULL AND doi != ''
|
||||||
|
|
||||||
|
) t) TO STDOUT;
|
|
@ -0,0 +1,51 @@
|
||||||
|
#!/bin/bash
|
||||||
|
|
||||||
|
excelFile="../../orig/fundersData/Funders, DOIS 31122018.xlsx"
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
|
workdir=/tmp/funderData
|
||||||
|
rm -rf "$workdir" && mkdir "$workdir"
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
|
echo
|
||||||
|
echo "Funder Data Import:"
|
||||||
|
|
||||||
|
|
||||||
|
#--------------------------------
|
||||||
|
echo " - Generating csv file"
|
||||||
|
csv="$workdir/funderdata.csv"
|
||||||
|
xlsx2csv -c UTF-8 "$excelFile" > $csv
|
||||||
|
|
||||||
|
#--------------------------------
|
||||||
|
echo " - Recreating the funderdata database"
|
||||||
|
dropdb funderdata --if-exists;
|
||||||
|
createdb funderdata;
|
||||||
|
psql funderdata -f schema.sql
|
||||||
|
|
||||||
|
if [[ -f "$csv" ]]; then
|
||||||
|
echo " - Importing data: $csv"
|
||||||
|
psql funderdata -c "COPY data(funder,pmcid,pmid,source,doi) FROM '$csv' CSV HEADER;"
|
||||||
|
else
|
||||||
|
echo " - Invalid file: $csv"
|
||||||
|
fi
|
||||||
|
|
||||||
|
|
||||||
|
echo " - Fix funder names"
|
||||||
|
psql funderdata -c "UPDATE data SET funder='EC' WHERE funder = 'Marie Curie'"
|
||||||
|
psql funderdata -c "UPDATE data SET funder='EC' WHERE funder = 'European Research Council'"
|
||||||
|
psql funderdata -c "UPDATE data SET funder='Breast Cancer Now' WHERE funder = 'BreastCancerNow'"
|
||||||
|
psql funderdata -c "UPDATE data SET funder='Wellcome Trust' WHERE funder = 'Wellcome Trust/DBT India Alliance'"
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
|
#--------------------------------
|
||||||
|
echo " - Generating json files"
|
||||||
|
rm -f ../../jsonfiles/funderdata/*.json
|
||||||
|
psql funderdata -f projects2json.sql | sed 's/\\\\/\\/g' > ../../jsonfiles/funderdata/project.json
|
||||||
|
psql funderdata -f docOtherId2json.sql | sed 's/\\\\/\\/g' > ../../jsonfiles/funderdata/docotherid.json
|
||||||
|
psql funderdata -f projDocOtherIds2json.sql | sed 's/\\\\/\\/g' > ../../jsonfiles/funderdata/projectdocotherid.json
|
||||||
|
|
||||||
|
echo "Done."
|
||||||
|
echo
|
|
@ -0,0 +1,26 @@
|
||||||
|
COPY (SELECT row_to_json(t) FROM (
|
||||||
|
SELECT
|
||||||
|
'40|MOCK_PROJECT::'||MD5(funder) AS "projectId",
|
||||||
|
pmcid AS "docId",
|
||||||
|
'pmcid' AS "docIdType"
|
||||||
|
FROM data
|
||||||
|
WHERE pmcid IS NOT NULL AND pmcid != ''
|
||||||
|
|
||||||
|
UNION ALL
|
||||||
|
|
||||||
|
SELECT
|
||||||
|
'40|MOCK_PROJECT::'||MD5(funder) AS "projectId",
|
||||||
|
pmid AS "docId",
|
||||||
|
'pmid' AS "docIdType"
|
||||||
|
FROM data
|
||||||
|
WHERE pmid IS NOT NULL AND pmid != ''
|
||||||
|
|
||||||
|
UNION ALL
|
||||||
|
|
||||||
|
SELECT
|
||||||
|
'40|MOCK_PROJECT::'||MD5(funder) AS "projectId",
|
||||||
|
doi AS "docId",
|
||||||
|
'doi' AS "docIdType"
|
||||||
|
FROM data
|
||||||
|
WHERE doi IS NOT NULL AND doi != ''
|
||||||
|
) t) TO STDOUT;
|
|
@ -0,0 +1,6 @@
|
||||||
|
COPY (SELECT row_to_json(t) FROM (SELECT distinct
|
||||||
|
'40|MOCK_PROJECT::'||MD5(funder) AS "id",
|
||||||
|
'MOCK PROJECT' AS "title",
|
||||||
|
funder AS "funder"
|
||||||
|
FROM data
|
||||||
|
) t) TO STDOUT;
|
|
@ -0,0 +1,8 @@
|
||||||
|
CREATE TABLE data (
|
||||||
|
funder text,
|
||||||
|
pmcid text,
|
||||||
|
pmid text,
|
||||||
|
source text,
|
||||||
|
doi text
|
||||||
|
);
|
||||||
|
|
|
@ -0,0 +1,21 @@
|
||||||
|
Dear Claudio, Please find the json file containing the clinical guideline base data attached.
|
||||||
|
|
||||||
|
It is formatted as follows:
|
||||||
|
|
||||||
|
LocalID [Our local guideline ID]
|
||||||
|
Type "guideline"
|
||||||
|
Title [Title of guideline]
|
||||||
|
PubYear [Guideline publication year]
|
||||||
|
Originator [Organization that created the guideline (subset of ProviderCollection)]
|
||||||
|
ProviderCollection [Collection name]
|
||||||
|
Abstract [Guideline abstract (from PubMed, if available (only from WHO, NICE and Cochrane))]
|
||||||
|
PMID [PMID if available]
|
||||||
|
DOI [DOI if available]
|
||||||
|
PMCID [PMCID if available]
|
||||||
|
MatchedReferences: [references matched with Our set of publications as PMID (as well as PMCID and funder name)]
|
||||||
|
[All]References: [All references in each guideline]
|
||||||
|
|
||||||
|
We also have the full text for WHO, NICE and Cochrane, as well as the PDF:s for the German AWMF guidelines, but it is still uncertain how this material could be shared due to copyright issues.
|
||||||
|
|
||||||
|
|
||||||
|
FILE: /data/d4i/guidelines.json.zip
|
|
@ -0,0 +1,5 @@
|
||||||
|
Al momento non sono gestite le MatchedReferences.
|
||||||
|
|
||||||
|
Il modello attuale prevede la tabella Citation per mettere in relazione due documenti.
|
||||||
|
|
||||||
|
Forse deve essere rivisto.
|
|
@ -0,0 +1,39 @@
|
||||||
|
COPY (SELECT row_to_json(t) FROM (
|
||||||
|
SELECT
|
||||||
|
'50|guidelines__::'||MD5(gid) AS "docId1",
|
||||||
|
pmcid AS "docId2",
|
||||||
|
'pmcid' AS "docId2Type",
|
||||||
|
'guidelines_matched' AS "relType"
|
||||||
|
FROM relations
|
||||||
|
WHERE pmcid IS NOT NULL AND pmcid != ''
|
||||||
|
|
||||||
|
UNION
|
||||||
|
|
||||||
|
SELECT
|
||||||
|
'50|guidelines__::'||MD5(gid) AS "docId1",
|
||||||
|
pmid AS "docId2",
|
||||||
|
'pmid' AS "docId2Type",
|
||||||
|
'guidelines_matched' AS "relType"
|
||||||
|
FROM relations
|
||||||
|
WHERE pmid IS NOT NULL AND pmid != ''
|
||||||
|
|
||||||
|
UNION
|
||||||
|
|
||||||
|
SELECT
|
||||||
|
'50|guidelines__::'||MD5(gid) AS "docId1",
|
||||||
|
doi AS "docId2",
|
||||||
|
'doi' AS "docId2Type",
|
||||||
|
'guidelines_matched' AS "relType"
|
||||||
|
FROM relations
|
||||||
|
WHERE doi IS NOT NULL AND doi != ''
|
||||||
|
|
||||||
|
UNION
|
||||||
|
|
||||||
|
SELECT
|
||||||
|
'50|guidelines__::'||MD5(gid) AS "docId1",
|
||||||
|
rel AS "docId2",
|
||||||
|
'pmid' AS "docId2Type",
|
||||||
|
'guidelines_all' AS "relType"
|
||||||
|
FROM allrefs
|
||||||
|
WHERE rel IS NOT NULL AND rel != ''
|
||||||
|
) t) TO STDOUT;
|
|
@ -0,0 +1,72 @@
|
||||||
|
-- Export every known identifier as a JSON line.
-- Rows from "guidelines" carry the internal docId; rows from "relations" and
-- "allrefs" list identifiers of referenced publications (docId is NULL).
COPY (SELECT row_to_json(t) FROM (
	SELECT
		'50|guidelines__::'||MD5(id) AS "docId",
		id AS "id",
		'guidelineLocalID' AS "type"
	FROM guidelines

	UNION ALL

	SELECT
		'50|guidelines__::'||MD5(id) AS "docId",
		pmcid AS "id",
		'pmcid' AS "type"
	FROM guidelines
	WHERE pmcid IS NOT NULL AND pmcid != ''

	UNION ALL

	SELECT
		'50|guidelines__::'||MD5(id) AS "docId",
		pmid AS "id",
		'pmid' AS "type"
	FROM guidelines
	WHERE pmid IS NOT NULL AND pmid != ''

	UNION ALL

	SELECT
		'50|guidelines__::'||MD5(id) AS "docId",
		doi AS "id",
		'doi' AS "type"
	FROM guidelines
	WHERE doi IS NOT NULL AND doi != ''

	UNION

	SELECT
		NULL AS "docId",
		pmcid AS "id",
		'pmcid' AS "type"
	FROM relations
	WHERE pmcid IS NOT NULL AND pmcid != ''

	UNION

	SELECT
		NULL AS "docId",
		pmid AS "id",
		'pmid' AS "type"
	FROM relations
	WHERE pmid IS NOT NULL AND pmid != ''

	UNION

	SELECT
		NULL AS "docId",
		doi AS "id",
		'doi' AS "type"
	FROM relations
	-- FIX: the original filtered this branch on the wrong column
	-- (WHERE pmid IS NOT NULL AND doi != ''), so doi rows were only
	-- exported when a pmid also happened to be present.
	WHERE doi IS NOT NULL AND doi != ''

	UNION

	SELECT
		NULL AS "docId",
		rel AS "id",
		'pmid' AS "type"
	FROM allrefs
	WHERE rel IS NOT NULL AND rel != ''
) t) TO STDOUT;
|
|
@ -0,0 +1,12 @@
|
||||||
|
-- Export one JSON document record per guideline.
COPY (SELECT row_to_json(t) FROM (
	SELECT
		'50|guidelines__::'||MD5(g.id) AS "id",
		g.title AS "title",
		g.abstract AS "abstractText",
		g.gtype AS "type",
		g.year AS "pubYear",
		g.orig AS "repository",
		g.collection AS "collection"
	FROM guidelines g
) t) TO STDOUT;
|
|
@ -0,0 +1,67 @@
|
||||||
|
#!/bin/bash
# Import the D4I guidelines JSON dump into a local "guidelines" postgres DB
# and export the JSON files consumed by the downstream loader.

#detailsFile=../../orig/guidelines/guidelines.json
detailsFile=/tmp/guidelines.json

workdir=/tmp/guidelines
rm -rf "$workdir" && mkdir "$workdir"

echo
echo "Guidelines Import:"

#--------------------------------
echo " - Generating csv files"
csvGuidelines="$workdir/guidelines.csv"
csvRels="$workdir/rels.csv"
csvAllRels="$workdir/allRels.csv"

# jq reads the input file directly (no useless cat); all expansions are quoted
# so paths with spaces cannot break word-splitting.
jq 'map([.LocalID, .Type, .Title, .PubYear, .Originator, .ProviderCollection, .Abstract, .PMID, .DOI, .PMCID])' "$detailsFile" | jq '.[]' | jq -r '@csv' > "$csvGuidelines"
jq -r '.[] | .LocalID as $id | (.MatchedReferences | map([$id, (.PMID + ""), (.PMCID + ""), (.DOI + "") , ( .Funders | map(.+"#") | add | . + "" ) ]) )[] | @csv' "$detailsFile" > "$csvRels"
jq -r '.[] | .LocalID as $id | (.AllReferences | map([$id, .]) )[] | @csv' "$detailsFile" > "$csvAllRels"

#--------------------------------
echo " - Recreating the guidelines database"
dropdb guidelines --if-exists;
createdb guidelines;
psql guidelines -f schema.sql

if [[ -f "$csvGuidelines" ]]; then
	echo " - Importing guidelines: $csvGuidelines"
	psql guidelines -c "COPY guidelines(id, gtype, title, year, orig, collection, abstract, pmid, doi, pmcid) FROM '$csvGuidelines' CSV;"
else
	echo " - Invalid file: $csvGuidelines"
fi

if [[ -f "$csvRels" ]]; then
	echo " - Importing rels: $csvRels"
	psql guidelines -c "COPY relations(gid, pmid, pmcid, doi, funder) FROM '$csvRels' CSV;"
else
	echo " - Invalid file: $csvRels"
fi

if [[ -f "$csvAllRels" ]]; then
	echo " - Importing all rels: $csvAllRels"
	psql guidelines -c "COPY allrefs(gid, rel) FROM '$csvAllRels' CSV;"
else
	echo " - Invalid file: $csvAllRels"
fi

#--------------------------------
echo " - Generating json files"
rm -f ../../jsonfiles/guidelines/*.json
psql guidelines -f document2json.sql | sed 's/\\\\/\\/g' > ../../jsonfiles/guidelines/document.json
psql guidelines -f docOtherId2json.sql | sed 's/\\\\/\\/g' > ../../jsonfiles/guidelines/docotherid.json
psql guidelines -f projects2json.sql | sed 's/\\\\/\\/g' > ../../jsonfiles/guidelines/project.json
psql guidelines -f projDocOtherIds2json.sql | sed 's/\\\\/\\/g' > ../../jsonfiles/guidelines/projectdocotherid.json
psql guidelines -f docDocumentOtherId2json.sql | sed 's/\\\\/\\/g' > ../../jsonfiles/guidelines/docDocumentOtherId.json

#--------------------------------
echo " - Importing final files"
# FIX: abort instead of continuing in the wrong directory if cd fails.
cd ../../jsonfiles/guidelines || exit 1

echo "Done."
echo
|
@ -0,0 +1,20 @@
|
||||||
|
-- Mock-project -> document links, derived from the '#'-separated funder list
-- stored on each matched relation.
COPY (SELECT row_to_json(t) FROM (
	SELECT
		'40|MOCK_PROJECT::'||MD5(funder) AS "projectId",
		pmcid AS "docId",
		'pmcid' AS "docIdType"
	FROM (select * from (select pmid, pmcid, unnest(string_to_array(funder, '#')) as funder from relations) as t where length(t.funder) > 0) r
	WHERE pmcid IS NOT NULL AND pmcid != ''

	UNION ALL

	SELECT
		'40|MOCK_PROJECT::'||MD5(funder) AS "projectId",
		pmid AS "docId",
		'pmid' AS "docIdType"
	FROM (select * from (select pmid, pmcid, unnest(string_to_array(funder, '#')) as funder from relations) as t where length(t.funder) > 0) r
	WHERE pmid IS NOT NULL AND pmid != ''
) t) TO STDOUT;
|
||||||
|
|
||||||
|
|
|
@ -0,0 +1,7 @@
|
||||||
|
-- One mock project per distinct funder found in the relations table
-- (the funder column holds '#'-separated funder names).
COPY (SELECT row_to_json(t) FROM (SELECT distinct
	'40|MOCK_PROJECT::'||MD5(funder) AS "id",
	'MOCK PROJECT' AS "title",
	funder AS "funder"
FROM
	(SELECT DISTINCT unnest(string_to_array(funder, '#')) AS funder FROM relations ) r WHERE LENGTH(r.funder) > 0
) t) TO STDOUT;
|
|
@ -0,0 +1,25 @@
|
||||||
|
-- Guideline metadata: one row per guideline, loaded from the CSV export.
CREATE TABLE guidelines (
	id text,
	gtype text,
	title text,
	year text,
	orig text,
	collection text,
	abstract text,
	pmid text,
	doi text,
	pmcid text
);

-- Matched references: guideline -> publication identifiers plus a
-- '#'-separated funder list.
CREATE TABLE relations (
	gid text,
	pmid text,
	pmcid text,
	doi text,
	funder text
);

-- All references of a guideline (raw identifier strings).
CREATE TABLE allrefs (
	gid text,
	rel text
);
|
|
@ -0,0 +1,49 @@
|
||||||
|
#!/bin/bash
# Load the per-ICD network-analysis CSVs (one directory per ICD code, one
# file per period) into the network_analysis_metrics table.

DIR="$( cd "$( dirname "${BASH_SOURCE[0]}" )" >/dev/null 2>&1 && pwd )"

table=network_analysis_metrics

# FIX: typo in the original log message ("Recrreating").
echo "Recreating table $table"
psql -h localhost -U d4i data4impact -c "DROP TABLE IF EXISTS $table;"
psql -h localhost -U d4i data4impact -c "CREATE TABLE $table (betweenness_centrality double precision,closeness_centrality double precision,degree_centrality double precision,eccentricity_centrality double precision,eigenvector_centrality double precision,farness_centrality double precision,pic text,name text, icd int, period text, orgid text);"
echo

for icd in {1..19}
do
	if [ -d "$DIR/$icd" ]; then
		cd "$DIR/$icd"
		for csv in *.csv
		do
			# File names start with the first year of the period (e.g. 2010….csv);
			# use parameter expansion instead of echo|cut and $((…)) instead of expr.
			y1="${csv:0:4}"
			y2=$((y1 + 1))
			period="$y1-$y2"

			echo "Processing file $DIR/$icd/$csv..."

			# Some CSVs carry an extra eccentricity_centrality column.
			if grep --quiet eccentricity_centrality "$DIR/$icd/$csv"; then
				psql -h localhost -U d4i data4impact -c "COPY $table (betweenness_centrality,closeness_centrality,degree_centrality,eccentricity_centrality,eigenvector_centrality,farness_centrality,pic,name) FROM '$DIR/$icd/$csv' CSV HEADER;"
			else
				psql -h localhost -U d4i data4impact -c "COPY $table (betweenness_centrality,closeness_centrality,degree_centrality,eigenvector_centrality,farness_centrality,pic,name) FROM '$DIR/$icd/$csv' CSV HEADER;"
			fi

			# Tag the rows just imported (icd is NULL only for new rows).
			psql -h localhost -U d4i data4impact -c "UPDATE $table SET (icd,period) = ($icd,'$period') WHERE icd IS NULL;"
			echo;
		done
	fi
done

echo "Fixing values..."
# NOTE(review): replace() strips EVERY '.0' substring, not just a trailing
# one — confirm pic values can never contain '.0' internally.
psql -h localhost -U d4i data4impact -c "UPDATE $table SET pic = replace(pic, '.0', '') WHERE pic IS NOT NULL;"
psql -h localhost -U d4i data4impact -c "UPDATE $table SET orgid = '20|ec__________::'||MD5(pic) WHERE pic IS NOT NULL;"

echo
echo "Done."
echo
echo
|
|
@ -0,0 +1,211 @@
|
||||||
|
# MANUAL STEPS FOR news-blogs-forum
|
||||||
|
|
||||||
|
1) cd /data/ftp/d4i/social_data/news-blogs-forum
|
||||||
|
|
||||||
|
2) find *.zip -exec bash -c "unzip -p {} | jq --slurp -r 'map([.content,.actor,.topicId,.mediatype,.source,.headline,.url,.dt,.language,.country]) | .[] | @csv'" \; | sed 's/\x00//g' > data4impact_corpus_allmedia.csv
|
||||||
|
|
||||||
|
3) Recreate the table in the DB using
|
||||||
|
|
||||||
|
DROP TABLE socialdata;
|
||||||
|
DROP SEQUENCE socialdata_serial;
|
||||||
|
|
||||||
|
CREATE SEQUENCE socialdata_serial START 1;
|
||||||
|
|
||||||
|
CREATE TABLE socialdata (
|
||||||
|
id text PRIMARY KEY DEFAULT '51|social__data::'||MD5(nextval('socialdata_serial')::text),
|
||||||
|
content text,
|
||||||
|
actor text,
|
||||||
|
topicId text,
|
||||||
|
mediatype text,
|
||||||
|
source text,
|
||||||
|
headline text,
|
||||||
|
url text,
|
||||||
|
dt text,
|
||||||
|
language text,
|
||||||
|
country text
|
||||||
|
);
|
||||||
|
|
||||||
|
4) Insert data:
|
||||||
|
|
||||||
|
COPY socialdata(content,actor,topicId,mediatype,source,headline,url,dt,language,country) FROM '/data/ftp/d4i/social_data/news-blogs-forum/data4impact_corpus_allmedia.csv' CSV;
|
||||||
|
|
||||||
|
(OPTIONAL) if (error_during_copy) -> perl -pi -e 's/\x00//g' data4impact_corpus_allmedia.csv
|
||||||
|
|
||||||
|
#############################################################################################################################################################
|
||||||
|
|
||||||
|
# MANUAL STEPS FOR twitter (Buzz)
|
||||||
|
|
||||||
|
1) cd "/data/ftp/d4i/social_data/twitter/Buzz JSON Feb"
|
||||||
|
2) find *.json -exec jq -r 'def join(sep): sep as $sep | reduce .[1:][] as $item (.[0]|tostring; . + $sep + $item); map ([(.tags | join(",")),.language,.country,.content,.topicId,.sourceType,.source,.actor,.rtid,.rtDate,.date,.headline]) | .[] | @csv' {} \; | sed 's/\x00//g' > twitter_buzz.csv
|
||||||
|
3) recreate the table
|
||||||
|
|
||||||
|
DROP TABLE twitterbuzz;
|
||||||
|
DROP SEQUENCE twitterbuzz_serial;
|
||||||
|
|
||||||
|
CREATE SEQUENCE twitterbuzz_serial START 1;
|
||||||
|
|
||||||
|
CREATE TABLE twitterbuzz (
|
||||||
|
id text PRIMARY KEY DEFAULT '52|twitter_buzz::'||MD5(nextval('twitterbuzz_serial')::text),
|
||||||
|
tags text,
|
||||||
|
language text,
|
||||||
|
country text,
|
||||||
|
content text,
|
||||||
|
topicid text,
|
||||||
|
sourcetype text,
|
||||||
|
source text,
|
||||||
|
actor text,
|
||||||
|
rtid text,
|
||||||
|
rtdate text,
|
||||||
|
date text,
|
||||||
|
headline text
|
||||||
|
);
|
||||||
|
|
||||||
|
CREATE TABLE twitterbuzz_tags(
|
||||||
|
tb_id text REFERENCES twitterbuzz(id),
|
||||||
|
tag text,
|
||||||
|
PRIMARY KEY(tb_id, tag)
|
||||||
|
);
|
||||||
|
|
||||||
|
4) Insert data:
|
||||||
|
|
||||||
|
COPY twitterbuzz(tags,language,country,content,topicid,sourcetype,source,actor,rtid,rtdate,date,headline) FROM '/data/ftp/d4i/social_data/twitter/Buzz JSON Feb/twitter_buzz.csv' CSV;
|
||||||
|
|
||||||
|
5) patch data:
|
||||||
|
UPDATE twitterbuzz SET tags = '' WHERE tags = 'null';
|
||||||
|
UPDATE twitterbuzz SET tags = replace(tags, ',,', ',') WHERE tags LIKE '%,,%';
|
||||||
|
|
||||||
|
insert into twitterbuzz_tags(tb_id, tag) select distinct * from (select id, regexp_split_to_table(tags, ',') as tag from twitterbuzz) as t where tag != '';
|
||||||
|
alter table twitterbuzz drop column tags;
|
||||||
|
|
||||||
|
|
||||||
|
#############################################################################################################################################################
|
||||||
|
|
||||||
|
# MANUAL STEPS FOR twitter
|
||||||
|
|
||||||
|
1) cd "/data/ftp/d4i/social_data/twitter/Corrected JSON"
|
||||||
|
2) find *.json -exec jq -r 'def join(sep): sep as $sep | reduce .[1:][] as $item (.[0]|tostring; . + $sep + $item); map ([(.tags | join(",")),.language,.country,.content,.topicId,.sourceType,.source,.actor,.retweetedActor,(.urls | join("§")),.datetime,.headline]) | .[] | @csv' {} \; | sed 's/\x00//g' > twitter.csv
|
||||||
|
|
||||||
|
3) Recreate the tables:

DROP TABLE twitter;
|
||||||
|
DROP SEQUENCE twitter_serial;
|
||||||
|
|
||||||
|
CREATE SEQUENCE twitter_serial START 1;
|
||||||
|
|
||||||
|
|
||||||
|
CREATE TABLE twitter (
|
||||||
|
id text PRIMARY KEY DEFAULT '52|twitter_____::'||MD5(nextval('twitter_serial')::text),
|
||||||
|
tags text,
|
||||||
|
language text,
|
||||||
|
country text,
|
||||||
|
content text,
|
||||||
|
topicid text,
|
||||||
|
sourcetype text,
|
||||||
|
source text,
|
||||||
|
actor text,
|
||||||
|
retweetedactor text,
|
||||||
|
urls text,
|
||||||
|
datetime timestamp,
|
||||||
|
headline text
|
||||||
|
);
|
||||||
|
|
||||||
|
CREATE TABLE twitter_tags(
|
||||||
|
t_id text REFERENCES twitter(id),
|
||||||
|
tag text,
|
||||||
|
PRIMARY KEY(t_id, tag)
|
||||||
|
);
|
||||||
|
|
||||||
|
CREATE TABLE twitter_urls(
|
||||||
|
t_id text REFERENCES twitter(id),
|
||||||
|
url text,
|
||||||
|
PRIMARY KEY(t_id, url)
|
||||||
|
);
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
|
4) Insert data:
|
||||||
|
|
||||||
|
COPY twitter(tags,language,country,content,topicid,sourcetype,source,actor,retweetedactor,urls,datetime,headline) FROM '/data/ftp/d4i/social_data/twitter/Corrected JSON/twitter.csv' CSV;
|
||||||
|
|
||||||
|
5) patch data:
|
||||||
|
insert into twitter_tags(t_id, tag) select distinct * from (select id, regexp_split_to_table(tags, ',') as tag from twitter) as t where tag != '' and tag != 'null';
|
||||||
|
insert into twitter_urls(t_id, url) select distinct * from (select id, regexp_split_to_table(urls, '§') as url from twitter) as t where url != '' and url != 'null';
|
||||||
|
alter table twitter drop column tags;
|
||||||
|
alter table twitter drop column urls;
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
|
#############################################################################################################################################################
|
||||||
|
|
||||||
|
# MANUAL STEPS FOR twitter_threads
|
||||||
|
|
||||||
|
1) cd "/data/ftp/d4i/social_data/twitter/Threads"
|
||||||
|
2)
|
||||||
|
|
||||||
|
jq -r 'map([.threadId, .length, .velocity, .participants, .startId, .startTime, .endTime]) | .[] | @csv' twitter_threads_metadata.json > twitter_threads_metadata.csv
|
||||||
|
rm twitter_threads_tweets.csv
|
||||||
|
|
||||||
|
# jq-1.6 is required
|
||||||
|
jq -r 'map([.threadId, .tweetId, .fromUser, .toUser, .inReplyTo, .dateTime, .content, .quotedStatus, (.mentions|join("§")), (.urls|join("§"))]) | .[] | @csv' twitter_threads_doi.json >> twitter_threads_tweets.csv
|
||||||
|
jq -r 'map([.threadId, .tweetId, .fromUser, .toUser, .inReplyTo, .dateTime, .content, .quotedStatus, (.mentions|join("§")), (.urls|join("§"))]) | .[] | @csv' twitter_threads_q1.json >> twitter_threads_tweets.csv
|
||||||
|
jq -r 'map([.threadId, .tweetId, .fromUser, .toUser, .inReplyTo, .dateTime, .content, .quotedStatus, (.mentions|join("§")), (.urls|join("§"))]) | .[] | @csv' twitter_threads_q2.json >> twitter_threads_tweets.csv
|
||||||
|
jq -r 'map([.threadId, .tweetId, .fromUser, .toUser, .inReplyTo, .dateTime, .content, .quotedStatus, (.mentions|join("§")), (.urls|join("§"))]) | .[] | @csv' twitter_threads_q3.json >> twitter_threads_tweets.csv
|
||||||
|
jq -r 'map([.threadId, .tweetId, .fromUser, .toUser, .inReplyTo, .dateTime, .content, .quotedStatus, (.mentions|join("§")), (.urls|join("§"))]) | .[] | @csv' twitter_threads_q4.json >> twitter_threads_tweets.csv
|
||||||
|
jq -r 'map([.threadId, .tweetId, .fromUser, .toUser, .inReplyTo, .dateTime, .content, .quotedStatus, (.mentions|join("§")), (.urls|join("§"))]) | .[] | @csv' twitter_threads_q5.json >> twitter_threads_tweets.csv
|
||||||
|
|
||||||
|
3)
|
||||||
|
|
||||||
|
DROP TABLE IF EXISTS twitter_threads
|
||||||
|
CREATE TABLE twitter_threads (
|
||||||
|
id text PRIMARY KEY,
|
||||||
|
length int,
|
||||||
|
velocity double precision,
|
||||||
|
participants int,
|
||||||
|
startid int,
|
||||||
|
starttime timestamp,
|
||||||
|
endtime timestamp
|
||||||
|
);
|
||||||
|
|
||||||
|
CREATE TABLE twitter_threads_tweets(
|
||||||
|
threadid text REFERENCES twitter_threads(id),
|
||||||
|
tweetid int,
|
||||||
|
fromuser text,
|
||||||
|
touser text,
|
||||||
|
inreplyto int,
|
||||||
|
datetime timestamp,
|
||||||
|
content text,
|
||||||
|
quotedstatus text,
|
||||||
|
mentions text,
|
||||||
|
urls text,
|
||||||
|
PRIMARY KEY (threadid, tweetid)
|
||||||
|
);
|
||||||
|
|
||||||
|
CREATE TABLE twitter_threads_tweets_mentions(
|
||||||
|
threadid text,
|
||||||
|
tweetid int,
|
||||||
|
mention text,
|
||||||
|
PRIMARY KEY (threadid, tweetid, mention),
|
||||||
|
FOREIGN KEY (threadid, tweetid) REFERENCES twitter_threads_tweets(threadid, tweetid)
|
||||||
|
);
|
||||||
|
|
||||||
|
CREATE TABLE twitter_threads_tweets_urls(
|
||||||
|
threadid text,
|
||||||
|
tweetid int,
|
||||||
|
url text,
|
||||||
|
PRIMARY KEY (threadid, tweetid, url),
|
||||||
|
FOREIGN KEY (threadid, tweetid) REFERENCES twitter_threads_tweets(threadid, tweetid)
|
||||||
|
);
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
|
4) Insert data:
|
||||||
|
|
||||||
|
COPY twitter_threads(id, length, velocity, participants, startid, starttime, endtime) FROM '/data/ftp/d4i/social_data/twitter/Threads/twitter_threads_metadata.csv' CSV;
|
||||||
|
COPY twitter_threads_tweets(threadid, tweetid, fromuser, touser, inreplyto, datetime, content, quotedstatus, mentions, urls) FROM '/data/ftp/d4i/social_data/twitter/Threads/twitter_threads_tweets.csv' CSV;
|
||||||
|
|
||||||
|
|
||||||
|
5) patch data:
|
||||||
|
|
||||||
|
insert into twitter_threads_tweets_mentions(threadid, tweetid, mention) select distinct * from (select threadid, tweetid, regexp_split_to_table(mentions, '§') as mention from twitter_threads_tweets) as t where mention != '' and mention != 'null';
|
||||||
|
insert into twitter_threads_tweets_urls (threadid, tweetid, url) select distinct * from (select threadid, tweetid, regexp_split_to_table(urls, '§') as url from twitter_threads_tweets) as t where url != '' and url != 'null';
|
||||||
|
alter table twitter_threads_tweets drop column mentions;
|
||||||
|
alter table twitter_threads_tweets drop column urls;
|
||||||
|
|
|
@ -0,0 +1,43 @@
|
||||||
|
#!/bin/bash
# Import the FP7 patents Excel sheet into a local "patents_excel" postgres DB
# and refresh the derived materialized views.

excelFile="../../orig/patents/FP7_patents_full_list_Except_for_ICT.xlsx"

workdir=/tmp/patentsExcel
rm -rf "$workdir" && mkdir "$workdir"

echo
echo "Patents Import:"

#--------------------------------
echo " - Generating csv file"
csv="$workdir/patents.csv"
xlsx2csv -c UTF-8 "$excelFile" > "$csv"

#--------------------------------
echo " - Recreating the patents_excel database"
dropdb patents_excel --if-exists;
createdb patents_excel;
psql patents_excel -f schema.sql

if [[ -f "$csv" ]]; then
	echo " - Importing data: $csv"
	psql patents_excel -c "COPY data(pat_id,type_ip,appnum,appnt,title,pat_url,pat_ref,pat_auth,pat_num,pat_kind,note,appln_id,appln_title_patstat,priority_year,var15,projectid) FROM '$csv' CSV HEADER;"
else
	echo " - Invalid file: $csv"
fi

# FIX: the materialized views (document, doc_other_identifier, doc_project)
# are created by this script's schema.sql inside the patents_excel database;
# the original refreshed them on the unrelated "patents" database.
psql patents_excel -c "REFRESH MATERIALIZED VIEW document"
psql patents_excel -c "REFRESH MATERIALIZED VIEW doc_other_identifier"
psql patents_excel -c "REFRESH MATERIALIZED VIEW doc_project"

#--------------------------------
echo " - Generating json files"
rm -f ../../jsonfiles/patents_excel/*.json

#psql patents_excel -c "COPY (SELECT row_to_json(t) FROM (SELECT * FROM document ) t) TO STDOUT" | sed 's/\\\\/\\/g' > ../../jsonfiles/patents_excel/document.json
#psql patents_excel -c "COPY (SELECT row_to_json(t) FROM (SELECT * FROM doc_other_identifier) t) TO STDOUT" | sed 's/\\\\/\\/g' > ../../jsonfiles/patents_excel/doc_other_identifier.json
#psql patents_excel -c "COPY (SELECT row_to_json(t) FROM (SELECT * FROM doc_project ) t) TO STDOUT" | sed 's/\\\\/\\/g' > ../../jsonfiles/patents_excel/doc_project.json

echo "Done."
echo
|
|
@ -0,0 +1,42 @@
|
||||||
|
-- Raw rows imported from the FP7 patents Excel sheet (all columns text).
CREATE TABLE data(
	pat_id text,
	type_ip text,
	appnum text,
	appnt text,
	title text,
	pat_url text,
	pat_ref text,
	pat_auth text,
	pat_num text,
	pat_kind text,
	note text,
	appln_id text,
	appln_title_patstat text,
	priority_year text,
	var15 text,
	projectid text
);


-- Document record per patent (keyed on the normalized application id;
-- type_ip has its plural 's' stripped and is lowercased).
CREATE MATERIALIZED VIEW document AS SELECT
	'50|patents_____::'||MD5(lower(trim(appln_id))) AS "id",
	title AS "title",
	lower(regexp_replace(type_ip,'s$','')) AS "type",
	priority_year AS "pubYear",
	'patent repo'::text AS "repository"
FROM data
WHERE appln_id IS NOT NULL AND trim(appln_id) != '';

-- Original application id kept as an alternative identifier.
CREATE MATERIALIZED VIEW doc_other_identifier AS SELECT
	'50|patents_____::'||MD5(lower(trim(appln_id))) AS "docId",
	trim(appln_id) AS "id",
	'patent'::text AS "type"
FROM data
WHERE appln_id IS NOT NULL AND trim(appln_id) != '';

-- Patent -> CORDA project links, for rows that carry a projectid.
CREATE MATERIALIZED VIEW doc_project AS SELECT
	'50|patents_____::'||MD5(lower(trim(appln_id))) AS "docId",
	'40|corda_______::'||MD5(lower(trim(projectid))) AS "projectId"
FROM data
WHERE appln_id IS NOT NULL AND trim(appln_id) != '' AND projectid IS NOT NULL AND trim(projectid) != '';
|
|
@ -0,0 +1,3 @@
|
||||||
|
Patent data are available at ftp://prozac.madgik.di.uoa.gr
|
||||||
|
username: patentdata
|
||||||
|
passwd: d4ipatents
|
|
@ -0,0 +1,48 @@
|
||||||
|
#!/bin/bash
# Import the patents JSON dumps into the "patents" postgres DB and export
# the JSON files consumed by the downstream loader.

#jsonPatents=../../orig/patents/patents.json
#jsonFulltexts=../../orig/patents/patents_txt.json

jsonPatents=../../orig/patents/patents_update.json
jsonFulltexts=../../orig/patents/patents_update_txt.json

echo
echo "Patents Import:"

#--------------------------------
echo " - Recreating the patents database"
dropdb patents --if-exists
createdb patents
psql patents -f schema.sql

#--------------------------------
# Resolve to an absolute path: COPY FROM runs server-side and needs it.
inputJsonPatentsFile="$(cd "$(dirname "$jsonPatents")"; pwd -P)/$(basename "$jsonPatents")"
echo " - Importing json $inputJsonPatentsFile"
# quote/delimiter set to unused control chars so each raw JSON line loads as-is.
psql patents -c "copy patents_json from '$inputJsonPatentsFile' csv quote e'\x01' delimiter e'\x02'"

#--------------------------------
inputJsonFulltextsFile="$(cd "$(dirname "$jsonFulltexts")"; pwd -P)/$(basename "$jsonFulltexts")"
# FIX: log the resolved absolute path (the original echoed the relative one,
# inconsistently with the patents-metadata step above).
echo " - Importing json $inputJsonFulltextsFile"
psql patents -c "copy patents_text_json from '$inputJsonFulltextsFile' csv quote e'\x01' delimiter e'\x02'"

#--------------------------------
echo " - Refreshing views"
psql patents -c "REFRESH MATERIALIZED VIEW document"
psql patents -c "REFRESH MATERIALIZED VIEW doc_fulltext"
psql patents -c "REFRESH MATERIALIZED VIEW doc_other_identifier"
psql patents -c "REFRESH MATERIALIZED VIEW project"
psql patents -c "REFRESH MATERIALIZED VIEW doc_project"

#--------------------------------
echo " - Generating json files"
rm -f ../../jsonfiles/patents/*.json
psql patents -c "COPY (SELECT row_to_json(t) FROM (SELECT * FROM document ) t) TO STDOUT" | sed 's/\\\\/\\/g' > ../../jsonfiles/patents/document.json
psql patents -c "COPY (SELECT row_to_json(t) FROM (SELECT * FROM doc_fulltext ) t) TO STDOUT" | sed 's/\\\\/\\/g' > ../../jsonfiles/patents/doc_fulltext.json
psql patents -c "COPY (SELECT row_to_json(t) FROM (SELECT * FROM doc_other_identifier) t) TO STDOUT" | sed 's/\\\\/\\/g' > ../../jsonfiles/patents/doc_other_identifier.json

# COMMENT THE FOLLOWING LINES IF THE PATENTS ARE NOT RELATED TO FP7
psql patents -c "COPY (SELECT row_to_json(t) FROM (SELECT * FROM project ) t) TO STDOUT" | sed 's/\\\\/\\/g' > ../../jsonfiles/patents/project.json
psql patents -c "COPY (SELECT row_to_json(t) FROM (SELECT * FROM doc_project ) t) TO STDOUT" | sed 's/\\\\/\\/g' > ../../jsonfiles/patents/doc_project.json

echo "Done."
echo
|
|
@ -0,0 +1,41 @@
|
||||||
|
-- Staging tables: one raw JSON document per row.
CREATE TABLE patents_json (
	json text
);

CREATE TABLE patents_text_json (
	json text
);

-- Document record per patent.
-- FIX: the original used replace(json,'\\','\"') here, which turns EVERY
-- backslash into a quote and corrupts the JSON; the three sibling views all
-- use replace(json,'\\"','\"') (unescape embedded quotes only).
CREATE MATERIALIZED VIEW document AS SELECT
	'50|patents_____::'||MD5(lower(trim(p->>'LocalID'))) AS "id",
	p->>'Title' AS "title",
	p->>'Abstract' AS "abstractText",
	p->>'Type' AS "type",
	p->>'PubYear' AS "pubYear",
	'patent repo'::text AS "repository"
FROM (SELECT replace(json,'\\"','\"')::json AS p FROM patents_json) a;


-- Full text per patent, where present.
CREATE MATERIALIZED VIEW doc_fulltext AS SELECT
	'50|patents_____::'||MD5(lower(trim(p->>'LocalID'))) AS "docId",
	trim(p->>'text') AS "fulltext"
FROM (SELECT replace(json,'\\"','\"')::json AS p FROM patents_text_json) a
WHERE length(trim(p->>'text')) > 0;


-- Original LocalID kept as an alternative identifier.
CREATE MATERIALIZED VIEW doc_other_identifier AS SELECT
	'50|patents_____::'||MD5(lower(trim(p->>'LocalID'))) AS "docId",
	trim(p->>'LocalID') AS "id",
	'patent'::text AS "type"
FROM (SELECT replace(json,'\\"','\"')::json AS p FROM patents_json) a;

-- NOTE(review): the mock-project id uses the '50|' prefix here, while the
-- guidelines scripts use '40|MOCK_PROJECT::' for project ids — confirm which
-- prefix the importer expects (both views below do agree with each other).
CREATE MATERIALIZED VIEW project AS SELECT
	'50|MOCK_PROJECT::'||MD5('EC_FP7')::text AS "id",
	'MOCK PROJECT'::text AS "title",
	'EC'::text AS "funder",
	'FP7'::text AS "fundingLevel0";

-- Every patent is linked to the single EC/FP7 mock project.
CREATE MATERIALIZED VIEW doc_project AS SELECT
	'50|patents_____::'||MD5(lower(trim(p->>'LocalID'))) AS "docId",
	'50|MOCK_PROJECT::'||MD5('EC_FP7') AS "projectId"
FROM (SELECT replace(json,'\\"','\"')::json AS p FROM patents_json) a;
|
|
@ -0,0 +1 @@
|
||||||
|
usare i documenti nella relativa directory
|
|
@ -0,0 +1,381 @@
|
||||||
|
|
||||||
|
alter table project_portfolio add column json json;
|
||||||
|
alter table project_portfolio add column administrative_data json;
|
||||||
|
alter table project_portfolio add column governance_data json;
|
||||||
|
|
||||||
|
--sections
|
||||||
|
alter table project_portfolio add column executive_summary json;
|
||||||
|
alter table project_portfolio add column final_report_summary json;
|
||||||
|
alter table project_portfolio add column impact json;
|
||||||
|
alter table project_portfolio add column objective json;
|
||||||
|
alter table project_portfolio add column title json;
|
||||||
|
--/sections
|
||||||
|
|
||||||
|
update project_portfolio set json = convert_from(decode(portfolio, 'base64'), 'UTF8')::json ;
|
||||||
|
update project_portfolio set administrative_data = json->'administrative_data';
|
||||||
|
update project_portfolio set governance_data = json->'governance_data';
|
||||||
|
update project_portfolio set executive_summary = json->'sections'->'executive_summary';
|
||||||
|
update project_portfolio set final_report_summary = json->'sections'->'final_report_summary';
|
||||||
|
update project_portfolio set impact = json->'sections'->'impact';
|
||||||
|
update project_portfolio set objective = json->'sections'->'objective';
|
||||||
|
|
||||||
|
update project_portfolio set results_in_brief = json->'sections'->'results_in_brief';
|
||||||
|
update project_portfolio set results = json->'sections'->'results';
|
||||||
|
update project_portfolio set impact = json->'sections'->'impact';
|
||||||
|
|
||||||
|
update project_portfolio set title = json->'sections'->'title';
|
||||||
|
|
||||||
|
-- document
|
||||||
|
INSERT INTO DOCUMENT
|
||||||
|
(id,
|
||||||
|
title,
|
||||||
|
abstract,
|
||||||
|
doctype,
|
||||||
|
repository,
|
||||||
|
rights,
|
||||||
|
pubyear)
|
||||||
|
SELECT Replace(Replace(projectid, '40|corda__h2020', '50|h2020_object'),
|
||||||
|
'40|corda_______', '50|fp7___object') AS id,
|
||||||
|
'Objectives of project '
|
||||||
|
||( administrative_data ->> 'acronym' :: TEXT ) AS title,
|
||||||
|
objective ->> 'text' AS abstract,
|
||||||
|
'project_report' AS doctype,
|
||||||
|
'CORDIS' AS repository,
|
||||||
|
'OPEN' :: TEXT AS rights,
|
||||||
|
administrative_data ->> 'date_to' :: TEXT AS pubyear
|
||||||
|
FROM project_portfolio
|
||||||
|
WHERE objective ->> 'text' IS NOT NULL
|
||||||
|
UNION ALL
|
||||||
|
SELECT Replace(Replace(projectid, '40|corda__h2020', '50|h2020summary'),
|
||||||
|
'40|corda_______', '50|fp7__summary') AS id,
|
||||||
|
'Final report summary of project '
|
||||||
|
||( administrative_data ->> 'acronym' :: TEXT ) AS title,
|
||||||
|
final_report_summary ->> 'text' AS abstract,
|
||||||
|
'project_report' AS doctype,
|
||||||
|
'CORDIS' AS repository,
|
||||||
|
'OPEN' :: TEXT AS rights,
|
||||||
|
administrative_data ->> 'date_to' :: TEXT AS pubyear
|
||||||
|
FROM project_portfolio
|
||||||
|
WHERE final_report_summary ->> 'text' IS NOT NULL
|
||||||
|
UNION ALL
|
||||||
|
SELECT Replace(Replace(projectid, '40|corda__h2020', '50|h2020___exec'),
|
||||||
|
'40|corda_______', '50|fp7_____exec') AS id,
|
||||||
|
'Executive summary of project '
|
||||||
|
||( administrative_data ->> 'acronym' :: TEXT ) AS title,
|
||||||
|
executive_summary ->> 'text' AS abstract,
|
||||||
|
'project_report' AS doctype,
|
||||||
|
'CORDIS' AS repository,
|
||||||
|
'OPEN' :: TEXT AS rights,
|
||||||
|
administrative_data ->> 'date_to' :: TEXT AS pubyear
|
||||||
|
FROM project_portfolio
|
||||||
|
WHERE executive_summary ->> 'text' IS NOT NULL
|
||||||
|
|
||||||
|
UNION ALL
|
||||||
|
|
||||||
|
SELECT Replace(Replace(projectid, '40|corda__h2020', '50|h2020__brief'),
|
||||||
|
'40|corda_______', '50|fp7____brief') AS id,
|
||||||
|
'Results in brief of project '
|
||||||
|
||( administrative_data ->> 'acronym' :: TEXT ) AS title,
|
||||||
|
results_in_brief ->> 'text' AS abstract,
|
||||||
|
'project_report' AS doctype,
|
||||||
|
'CORDIS' AS repository,
|
||||||
|
'OPEN' :: TEXT AS rights,
|
||||||
|
administrative_data ->> 'date_to' :: TEXT AS pubyear
|
||||||
|
FROM project_portfolio
|
||||||
|
WHERE results_in_brief ->> 'text' IS NOT NULL
|
||||||
|
|
||||||
|
UNION ALL
|
||||||
|
|
||||||
|
SELECT Replace(Replace(projectid, '40|corda__h2020', '50|h2020results'),
|
||||||
|
'40|corda_______', '50|fp7__results') AS id,
|
||||||
|
'Results of project '
|
||||||
|
||( administrative_data ->> 'acronym' :: TEXT ) AS title,
|
||||||
|
results ->> 'text' AS abstract,
|
||||||
|
'project_report' AS doctype,
|
||||||
|
'CORDIS' AS repository,
|
||||||
|
'OPEN' :: TEXT AS rights,
|
||||||
|
administrative_data ->> 'date_to' :: TEXT AS pubyear
|
||||||
|
FROM project_portfolio
|
||||||
|
WHERE results ->> 'text' IS NOT NULL
|
||||||
|
|
||||||
|
UNION ALL
|
||||||
|
|
||||||
|
SELECT Replace(Replace(projectid, '40|corda__h2020', '50|h2020_impact'),
|
||||||
|
'40|corda_______', '50|fp7___impact') AS id,
|
||||||
|
'Impact of project '
|
||||||
|
||( administrative_data ->> 'acronym' :: TEXT ) AS title,
|
||||||
|
impact ->> 'text' AS abstract,
|
||||||
|
'project_report' AS doctype,
|
||||||
|
'CORDIS' AS repository,
|
||||||
|
'OPEN' :: TEXT AS rights,
|
||||||
|
administrative_data ->> 'date_to' :: TEXT AS pubyear
|
||||||
|
FROM project_portfolio
|
||||||
|
WHERE impact ->> 'text' IS NOT NULL
|
||||||
|
|
||||||
|
|
||||||
|
-- doc_project
|
||||||
|
INSERT INTO doc_project
|
||||||
|
(docid,
|
||||||
|
projectid,
|
||||||
|
inferred)
|
||||||
|
SELECT REPLACE(REPLACE(projectid, '40|corda__h2020', '50|h2020_object'),
|
||||||
|
'40|corda_______', '50|fp7___object') AS docid,
|
||||||
|
projectid,
|
||||||
|
TRUE AS inferred
|
||||||
|
FROM project_portfolio
|
||||||
|
WHERE objective ->> 'text' IS NOT NULL
|
||||||
|
UNION ALL
|
||||||
|
SELECT REPLACE(REPLACE(projectid, '40|corda__h2020', '50|h2020summary'),
|
||||||
|
'40|corda_______', '50|fp7__summary') AS docid,
|
||||||
|
projectid,
|
||||||
|
TRUE AS inferred
|
||||||
|
FROM project_portfolio
|
||||||
|
WHERE final_report_summary ->> 'text' IS NOT NULL
|
||||||
|
UNION ALL
|
||||||
|
SELECT REPLACE(REPLACE(projectid, '40|corda__h2020', '50|h2020___exec'),
|
||||||
|
'40|corda_______', '50|fp7_____exec') AS docid,
|
||||||
|
projectid,
|
||||||
|
TRUE AS inferred
|
||||||
|
FROM project_portfolio
|
||||||
|
WHERE executive_summary ->> 'text' IS NOT NULL
|
||||||
|
|
||||||
|
|
||||||
|
UNION ALL
|
||||||
|
SELECT REPLACE(REPLACE(projectid, '40|corda__h2020', '50|h2020__brief'),
|
||||||
|
'40|corda_______', '50|fp7____brief') AS docid,
|
||||||
|
projectid,
|
||||||
|
TRUE AS inferred
|
||||||
|
FROM project_portfolio
|
||||||
|
WHERE results_in_brief ->> 'text' IS NOT NULL
|
||||||
|
|
||||||
|
UNION ALL
|
||||||
|
SELECT REPLACE(REPLACE(projectid, '40|corda__h2020', '50|h2020results'),
|
||||||
|
'40|corda_______', '50|fp7__results') AS docid,
|
||||||
|
projectid,
|
||||||
|
TRUE AS inferred
|
||||||
|
FROM project_portfolio
|
||||||
|
WHERE results ->> 'text' IS NOT NULL
|
||||||
|
UNION ALL
|
||||||
|
SELECT REPLACE(REPLACE(projectid, '40|corda__h2020', '50|h2020_impact'),
|
||||||
|
'40|corda_______', '50|fp7___impact') AS docid,
|
||||||
|
projectid,
|
||||||
|
TRUE AS inferred
|
||||||
|
FROM project_portfolio
|
||||||
|
WHERE impact ->> 'text' IS NOT NULL
|
||||||
|
|
||||||
|
-- updates the project table with data from the project_portfolios
|
||||||
|
update project p set (total_cost,contribution,currency) = ((administrative_data->>'Total cost')::numeric, (administrative_data->>'contribution')::numeric, 'EURO'::text) from
|
||||||
|
project_portfolio pp where pp.projectid = p.id ;
|
||||||
|
|
||||||
|
update project_organization po set (contribution, currency) = (U.contribution, 'EURO'::text) from
|
||||||
|
(
|
||||||
|
select projectid, '20|ec__________::'||MD5(o->>'pic') as orgid, (o->>'contribution')::numeric as contribution from
|
||||||
|
(
|
||||||
|
select projectid, json_array_elements(administrative_data->'coordinators') as o from project_portfolio
|
||||||
|
union all
|
||||||
|
select projectid, json_array_elements(administrative_data->'participants') as o from project_portfolio
|
||||||
|
) as T
|
||||||
|
) as U where po.orgid = U.orgid and po.projectid = U.projectid
|
||||||
|
|
||||||
|
-- include start/end dates from project portfolios
|
||||||
|
update project p set startdate = pp.administrative_data->>'date_from' from project_portfolio pp where p.startdate is null and p.id = pp.projectid ;
|
||||||
|
update project p set enddate = pp.administrative_data->>'date_to' from project_portfolio pp where p.enddate is null and p.id = pp.projectid ;
|
||||||
|
|
||||||
|
|
||||||
|
-- work in progress, waiting for ARC to fix the data. For now we keep only the activity types that do not contain any new-line characters
|
||||||
|
update project_organization po set activitytype = o.activitytype from (select '20|ec__________::'||MD5(o->>'pic') as orgid, o->>'activity_type' as activitytype from
|
||||||
|
(
|
||||||
|
select json_array_elements(administrative_data->'coordinators') as o from project_portfolio
|
||||||
|
union all
|
||||||
|
select json_array_elements(administrative_data->'participants') as o from project_portfolio
|
||||||
|
) as T
|
||||||
|
where o->>'pic' is not null and o->>'activity_type' !~ E'.*\n.*') o where po.orgid = o.orgid;
|
||||||
|
|
||||||
|
|
||||||
|
-- extract PubMed publications from the project portfolios
|
||||||
|
find . -name '*.json' -exec jq -r '.publications.pubmed_abstracts | to_entries | map([.key, .value.ArticleTitle, .value.AbstractText, .value.ArticleDate]) | .[] | @csv' {} \; > ../document_pp.csv
|
||||||
|
find . -name '*.json' -exec bash -c "jq -r '.publications.pubmed_abstracts | to_entries | .[] | (.key as \$id | .value.Authors | to_entries | .[] | .key as \$i | { docid : \$id, fullname : (.value.LastName+\", \"+.value.ForeName), rank: (map(\$i+1) | unique | .[0]) } ) ' \"{}\" | jq -s -r 'map([.docid, .fullname, .rank]) | .[] | @csv' " \; > ../doc_author_pp.csv
|
||||||
|
find . -name '*.json' -exec jq -r '.publications.pubmed_abstracts | to_entries | .[] | (.key as $id | .value.OtherIDs | map([$id, .Source, .id ] )) | .[] | @csv ' {} \; > ../doc_other_id.csv
|
||||||
|
find . -name 'FP7*.json' -exec jq -r ".administrative_data.project_id as \$grant | .publications.pubmed_abstracts | to_entries | .[] | [ .key, \"40|corda_______::\", \$grant ] | @csv " {} \; > ../doc_project_pp.csv 15:50:53
|
||||||
|
find . -name 'H2020*.json' -exec jq -r ".administrative_data.project_id as \$grant | .publications.pubmed_abstracts | to_entries | .[] | [ .key, \"40|corda__h2020::\", \$grant ] | @csv " {} \; >> ../doc_project_pp.csv
|
||||||
|
find . -name '*.json' -exec jq -r '.publications.pubmed_abstracts | to_entries | .[] | (.key as $id | .value.MeshHeadings | map([$id, (group_by(.Label) | .[] )])) | map([.[0], .[1][0].text, ([(.[2][]?.text )] | join("@")) ]) | .[] | @csv ' {} \; > ../doc_subject_pp.csv
|
||||||
|
|
||||||
|
//DOCUMENTS
|
||||||
|
create table document_pp(id text, title text, abstract text, pubyear text, repository text, rights text default 'UNKNOWN', doctype text default 'publication');
|
||||||
|
copy document_pp (id, title, abstract, pubyear) from '/Users/claudio/workspace/data/d4i/document_pp.csv' CSV ;
|
||||||
|
create table document_pp_unique as (select distinct * from document_pp );
|
||||||
|
drop table document_pp;
|
||||||
|
alter table document_pp_unique rename to document_pp ;
|
||||||
|
update document_pp set repository = 'PubMed Central PP' ;
|
||||||
|
update document_pp set pubyear = to_date(pubyear, 'DD/MM/YYYY')::text ;
|
||||||
|
update document_pp set id= '50|pp_______267::'||MD5(id) ;
|
||||||
|
|
||||||
|
// DOC_AUTHOR
|
||||||
|
create table doc_author_pp (docid text, fullname text, rank integer);
|
||||||
|
copy doc_author_pp (docid, fullname, rank) from '/Users/claudio/workspace/data/d4i/doc_author_pp.csv' CSV ;
|
||||||
|
update doc_author_pp set fullname = SUBSTRING(fullname, 0, length(fullname) + 1 - 2) where fullname like '%, ';
|
||||||
|
create table doc_author_pp_u as (select distinct * from doc_author_pp) ;
|
||||||
|
drop table doc_author_pp;
|
||||||
|
alter table doc_author_pp_u rename to doc_author_pp ;
|
||||||
|
update doc_author_pp set docid = '50|pp_______267::'||MD5(docid) ;
|
||||||
|
|
||||||
|
// DOC_SUBJECT
|
||||||
|
create table doc_subject_pp(docid text, subject text, typology text);
|
||||||
|
create table subject_tmp(id text, descriptor text, qualifiers text);
|
||||||
|
copy subject_tmp (id, descriptor, qualifiers) from '/Users/claudio/workspace/data/d4i/doc_subject_pp.csv' CSV;
|
||||||
|
insert into doc_subject_pp select '50|pp_______267::'||MD5(id) as docid, s as subject, 'MeshHeadings' as typology from ( select id, d||'|'||q as s from ( select id, descriptor as d, unnest(regexp_split_to_array(qualifiers, '@')) as q from subject_tmp where qualifiers <> '') as t UNION ALL select distinct id, descriptor as s from subject_tmp) as t ;
|
||||||
|
create table doc_subject_pp_u as select distinct * from doc_subject_pp;
|
||||||
|
drop table doc_subject_pp;
|
||||||
|
alter table doc_subject_pp_u rename to doc_subject_pp;
|
||||||
|
|
||||||
|
// DOC_PROJECT
|
||||||
|
create table doc_project_pp(docid text, projectid text);
|
||||||
|
create table dp_tmp (docid text, profix text, grantid text) ;
|
||||||
|
copy dp_tmp(docid, profix, grantid) from '/Users/claudio/workspace/data/d4i/doc_project_pp.csv' CSV;
|
||||||
|
insert into doc_project_pp select '50|pp_______267::'||MD5(docid), profix||MD5(grantid) from dp_tmp ;
|
||||||
|
|
||||||
|
// DOC_OTHER_IDENTIFIER
|
||||||
|
create table doc_other_identifier_pp(docid text, idtype text, id text);
|
||||||
|
copy doc_other_identifier_pp (docid, idtype, id) from '/Users/claudio/workspace/data/d4i/doc_other_id.csv' CSV;
|
||||||
|
update doc_other_identifier_pp set idtype = 'pmid' where idtype = 'pubmed' ;
|
||||||
|
update doc_other_identifier_pp set idtype = 'pmcid' where idtype = 'pmc' ;
|
||||||
|
update doc_other_identifier_pp set docid= '50|pp_______267::'||MD5(docid);
|
||||||
|
|
||||||
|
|
||||||
|
// Caricamento dei csv sul db, cleaning degli idtype, generazione dei subject (mesh), distinct values, ...
|
||||||
|
|
||||||
|
|
||||||
|
create table doc_alias_pp(id text, idpp text);
|
||||||
|
insert into doc_alias_pp select distinct doi.docid as id, pp.docid as idpp from doc_other_identifier_pp pp join doc_other_identifier doi on (doi.id = pp.id and doi.idtype = pp.idtype) where doi.docid is not null and doi.docid <> '';
|
||||||
|
|
||||||
|
alter table document_pp add column existing_docid text;
|
||||||
|
alter table doc_other_identifier_pp add column existing_docid text;
|
||||||
|
alter table doc_author_pp add column existing_docid text;
|
||||||
|
alter table doc_project_pp add column existing_docid text;
|
||||||
|
alter table doc_subject_pp add column existing_docid text;
|
||||||
|
|
||||||
|
update document_pp set existing_docid = doc_alias_pp.id from doc_alias_pp where document_pp.id = doc_alias_pp.idpp;
|
||||||
|
update doc_other_identifier_pp set existing_docid = doc_alias_pp.id from doc_alias_pp where doc_other_identifier_pp.docid = doc_alias_pp.idpp;
|
||||||
|
update doc_author_pp set existing_docid = doc_alias_pp.id from doc_alias_pp where doc_author_pp.docid = doc_alias_pp.idpp;
|
||||||
|
update doc_project_pp set existing_docid = doc_alias_pp.id from doc_alias_pp where doc_project_pp.docid = doc_alias_pp.idpp;
|
||||||
|
update doc_subject_pp set existing_docid = doc_alias_pp.id from doc_alias_pp where doc_subject_pp.docid = doc_alias_pp.idpp;
|
||||||
|
|
||||||
|
update document_pp set id = existing_docid where existing_docid is not null;
|
||||||
|
update doc_other_identifier_pp set docid = existing_docid where existing_docid is not null;
|
||||||
|
update doc_author_pp set docid = existing_docid where existing_docid is not null;
|
||||||
|
update doc_project_pp set docid = existing_docid where existing_docid is not null;
|
||||||
|
update doc_subject_pp set docid = existing_docid where existing_docid is not null;
|
||||||
|
|
||||||
|
alter table document_pp drop column existing_docid ;
|
||||||
|
alter table doc_other_identifier_pp drop column existing_docid ;
|
||||||
|
alter table doc_author_pp drop column existing_docid ;
|
||||||
|
alter table doc_project_pp drop column existing_docid ;
|
||||||
|
alter table doc_subject_pp drop column existing_docid ;
|
||||||
|
|
||||||
|
-- ONLY FOR MISSING DOCUMENT
|
||||||
|
insert into document (id, title, abstract, doctype, repository, pubyear, rights) select id, title, abstract, doctype, repository, pubyear, rights from document_pp where id like '50|pp_______267::%';
|
||||||
|
insert into doc_author(docid, fullname, rank) select docid, fullname, rank from doc_author_pp where docid like '50|pp_______267::%' on conflict do nothing;
|
||||||
|
|
||||||
|
-- FOR ALL DOCUMENTS (I exclude the pii ids because it seems that the same id is associated to many documents)
|
||||||
|
insert into doc_other_identifier(docid, id, idtype) select distinct docid, id, idtype from doc_other_identifier_pp where idtype != 'pii' on conflict (id,idtype) do update set docid = EXCLUDED.docid;
|
||||||
|
insert into doc_project(docid, projectid) select docid, projectid from doc_project_pp on conflict do nothing;
|
||||||
|
insert into doc_subject(docid, subject, typology) select docid, subject, typology from doc_subject_pp on conflict do nothing;
|
||||||
|
|
||||||
|
|
||||||
|
----------------------------
|
||||||
|
|
||||||
|
-- extract RestPublications publications from the project portfolios
|
||||||
|
|
||||||
|
//--PART 1 - to be run in local
|
||||||
|
find . -name '*.json' -exec jq -r '.publications.rest_publications | to_entries | map([.key, .value.title, .value.resulttype, .value.description, .value.dateofacceptance]) | .[] | @csv' {} \; > ../document_pp.csv
|
||||||
|
find . -name '*.json' -exec jq -r '.publications.rest_publications | to_entries | .[] | (.key as $id | .value.creators | map([$id, .full, .rank])) | .[] | @csv' {} \; > ../doc_author_pp.csv
|
||||||
|
find . -name 'FP7*.json' -exec jq -r ".administrative_data.project_id as \$grant | .publications.rest_publications | to_entries | .[] | [ .key, \"40|corda_______::\", \$grant ] | @csv " {} \; > ../doc_project_pp.csv
|
||||||
|
find . -name 'H2020*.json' -exec jq -r ".administrative_data.project_id as \$grant | .publications.rest_publications | to_entries | .[] | [ .key, \"40|corda__h2020::\", \$grant ] | @csv " {} \; >> ../doc_project_pp.csv
|
||||||
|
find . -name '*.json' -exec jq -r '.publications.rest_publications | to_entries | .[] | (.key as $id | .value.subjects | map([$id, .value, .class])) | .[] | @csv' {} \; > ../doc_subject_pp.csv
|
||||||
|
find . -name '*.json' -exec jq -r '.publications.rest_publications | to_entries | .[] | (.key as $id | .value.pids | map([$id, .value, .class])) | .[] | @csv' {} \; > ../doc_other_id.csv
|
||||||
|
|
||||||
|
|
||||||
|
//DOCUMENTS
|
||||||
|
drop table if exists document_pp;
|
||||||
|
create table document_pp(id text, title text, doctype text, abstract text, pubyear text, repository text, rights text default 'UNKNOWN');
|
||||||
|
copy document_pp (id, title, doctype, abstract, pubyear) from '/Users/michele/Develop/data4impact/data4impact-import-scripts/orig/project_portfolios/document_pp.csv' CSV ;
|
||||||
|
create table document_pp_unique as (select distinct * from document_pp );
|
||||||
|
drop table document_pp;
|
||||||
|
alter table document_pp_unique rename to document_pp ;
|
||||||
|
update document_pp set repository = 'Rest Publications PP' ;
|
||||||
|
update document_pp set id= '50|pp__restpubs::'||MD5(id);
|
||||||
|
|
||||||
|
// DOC_AUTHOR
|
||||||
|
drop table if exists doc_author_pp;
|
||||||
|
create table doc_author_pp (docid text, fullname text, rank integer);
|
||||||
|
copy doc_author_pp (docid, fullname, rank) from '/Users/michele/Develop/data4impact/data4impact-import-scripts/orig/project_portfolios/doc_author_pp.csv' CSV ;
|
||||||
|
create table doc_author_pp_u as (select distinct * from doc_author_pp) ;
|
||||||
|
drop table doc_author_pp;
|
||||||
|
alter table doc_author_pp_u rename to doc_author_pp ;
|
||||||
|
update doc_author_pp set docid = '50|pp__restpubs::'||MD5(docid) ;
|
||||||
|
|
||||||
|
// DOC_PROJECT
|
||||||
|
drop table if exists doc_project_pp;
|
||||||
|
create table doc_project_pp(docid text, projectid text);
|
||||||
|
create table dp_tmp (docid text, prefix text, grantid text) ;
|
||||||
|
copy dp_tmp(docid, prefix, grantid) from '/Users/michele/Develop/data4impact/data4impact-import-scripts/orig/project_portfolios/doc_project_pp.csv' CSV;
|
||||||
|
insert into doc_project_pp select distinct '50|pp__restpubs::'||MD5(docid), prefix||MD5(grantid) from dp_tmp ;
|
||||||
|
|
||||||
|
// DOC_SUBJECT
|
||||||
|
drop table if exists doc_subject_pp;
|
||||||
|
create table doc_subject_pp(docid text, subject text, typology text);
|
||||||
|
copy doc_subject_pp (docid, subject, typology) from '/Users/michele/Develop/data4impact/data4impact-import-scripts/orig/project_portfolios/doc_subject_pp.csv' CSV;
|
||||||
|
delete from doc_subject_pp where subject is null OR subject = '';
|
||||||
|
create table doc_subject_pp_u as select distinct * from doc_subject_pp;
|
||||||
|
drop table doc_subject_pp;
|
||||||
|
alter table doc_subject_pp_u rename to doc_subject_pp;
|
||||||
|
update doc_subject_pp set docid = '50|pp__restpubs::'||MD5(docid) ;
|
||||||
|
|
||||||
|
// DOC_OTHER_IDENTIFIER
|
||||||
|
drop table if exists doc_other_identifier_pp;
|
||||||
|
create table doc_other_identifier_pp(docid text, id text, idtype text);
|
||||||
|
copy doc_other_identifier_pp (docid, id, idtype) from '/Users/michele/Develop/data4impact/data4impact-import-scripts/orig/project_portfolios/doc_other_id.csv' CSV;
|
||||||
|
delete from doc_other_identifier_pp where id is null OR id = '';
|
||||||
|
create table doc_other_identifier_pp_u as select distinct * from doc_other_identifier_pp;
|
||||||
|
drop table doc_other_identifier_pp;
|
||||||
|
alter table doc_other_identifier_pp_u rename to doc_other_identifier_pp;
|
||||||
|
update doc_other_identifier_pp set idtype = 'pmid' where idtype = 'pubmed' ;
|
||||||
|
update doc_other_identifier_pp set idtype = 'pmcid' where idtype = 'pmc' ;
|
||||||
|
update doc_other_identifier_pp set docid = '50|pp__restpubs::'||MD5(docid);
|
||||||
|
|
||||||
|
// -- PART 2 - to be run on the server
|
||||||
|
create table doc_alias_pp(id text, idpp text);
|
||||||
|
insert into doc_alias_pp select distinct doi.docid as id, pp.docid as idpp from doc_other_identifier_pp pp join doc_other_identifier doi on (doi.id = pp.id and doi.idtype = pp.idtype) where doi.docid is not null and doi.docid <> '';
|
||||||
|
|
||||||
|
alter table document_pp add column existing_docid text;
|
||||||
|
alter table doc_other_identifier_pp add column existing_docid text;
|
||||||
|
alter table doc_author_pp add column existing_docid text;
|
||||||
|
alter table doc_project_pp add column existing_docid text;
|
||||||
|
alter table doc_subject_pp add column existing_docid text;
|
||||||
|
|
||||||
|
update document_pp set existing_docid = doc_alias_pp.id from doc_alias_pp where document_pp.id = doc_alias_pp.idpp;
|
||||||
|
update doc_other_identifier_pp set existing_docid = doc_alias_pp.id from doc_alias_pp where doc_other_identifier_pp.docid = doc_alias_pp.idpp;
|
||||||
|
update doc_author_pp set existing_docid = doc_alias_pp.id from doc_alias_pp where doc_author_pp.docid = doc_alias_pp.idpp;
|
||||||
|
update doc_project_pp set existing_docid = doc_alias_pp.id from doc_alias_pp where doc_project_pp.docid = doc_alias_pp.idpp;
|
||||||
|
update doc_subject_pp set existing_docid = doc_alias_pp.id from doc_alias_pp where doc_subject_pp.docid = doc_alias_pp.idpp;
|
||||||
|
|
||||||
|
update document_pp set id = existing_docid where existing_docid is not null;
|
||||||
|
update doc_other_identifier_pp set docid = existing_docid where existing_docid is not null;
|
||||||
|
update doc_author_pp set docid = existing_docid where existing_docid is not null;
|
||||||
|
update doc_project_pp set docid = existing_docid where existing_docid is not null;
|
||||||
|
update doc_subject_pp set docid = existing_docid where existing_docid is not null;
|
||||||
|
|
||||||
|
alter table document_pp drop column existing_docid ;
|
||||||
|
alter table doc_other_identifier_pp drop column existing_docid ;
|
||||||
|
alter table doc_author_pp drop column existing_docid ;
|
||||||
|
alter table doc_project_pp drop column existing_docid ;
|
||||||
|
alter table doc_subject_pp drop column existing_docid ;
|
||||||
|
|
||||||
|
-- ONLY FOR MISSING DOCUMENT
|
||||||
|
insert into document (id, title, abstract, doctype, repository, pubyear, rights) select distinct id, title, abstract, doctype, repository, pubyear, rights from document_pp where id like '50|pp__restpubs::%';
|
||||||
|
insert into doc_author(docid, fullname, rank) select docid, fullname, rank from doc_author_pp where docid like '50|pp__restpubs::%' on conflict do nothing;
|
||||||
|
-- FOR ALL DOCUMENTS (I exclude the pii ids because it seems that the same id is associated to many documents)
|
||||||
|
insert into doc_other_identifier(docid, id, idtype) select distinct docid, id, idtype from doc_other_identifier_pp where idtype != 'pii' on conflict (id,idtype) do update set docid = EXCLUDED.docid;
|
||||||
|
insert into doc_project(docid, projectid) select docid, projectid from doc_project_pp on conflict do nothing;
|
||||||
|
insert into doc_subject(docid, subject, typology) select docid, subject, typology from doc_subject_pp on conflict do nothing;
|
||||||
|
|
|
@ -0,0 +1,31 @@
|
||||||
|
#!/bin/bash
|
||||||
|
|
||||||
|
SAVEIFS=$IFS
|
||||||
|
IFS=$(echo -en "\n\b")
|
||||||
|
|
||||||
|
tmp="/tmp/tempfile.sql"
|
||||||
|
rm -f "$tmp"
|
||||||
|
|
||||||
|
echo "DELETE FROM project_portfolio;" >> "$tmp"
|
||||||
|
|
||||||
|
for f in `ls /data/d4i/project_portfolios/november2018/D4I_Analytics_ARC_Release04_WP52_31Nov2018_fixed/FP7_*.json`
|
||||||
|
do
|
||||||
|
id=$(jq .administrative_data.project_id "$f" | tr -d '"')
|
||||||
|
echo -n "INSERT INTO project_portfolio(projectid, portfolio) VALUES ('40|corda_______::'||MD5('$id'), '" >> "$tmp"
|
||||||
|
cat "$f" | gzip -c | base64 | tr -d '\n' >> "$tmp"
|
||||||
|
echo "');" >> "$tmp"
|
||||||
|
done
|
||||||
|
|
||||||
|
for f in `ls /data/d4i/project_portfolios/november2018/D4I_Analytics_ARC_Release04_WP52_31Nov2018_fixed/H2020_*.json`
|
||||||
|
do
|
||||||
|
id=$(jq .administrative_data.project_id "$f" | tr -d '"')
|
||||||
|
echo -n "INSERT INTO project_portfolio(projectid, portfolio) VALUES ('40|corda__h2020::'||MD5('$id'), '" >> "$tmp"
|
||||||
|
cat "$f" | gzip -c | base64 | tr -d '\n' >> "$tmp"
|
||||||
|
echo "');" >> "$tmp"
|
||||||
|
done
|
||||||
|
|
||||||
|
echo "Inserting file: $tmp"
|
||||||
|
|
||||||
|
#psql data4impact -f "$tmp"
|
||||||
|
|
||||||
|
IFS=$SAVEIFS
|
|
@ -0,0 +1,199 @@
|
||||||
|
CREATE TABLE pp_metrics (
|
||||||
|
id text PRIMARY KEY,
|
||||||
|
eu_contribution numeric,
|
||||||
|
number_of_innovations integer,
|
||||||
|
number_of_companies_founded integer,
|
||||||
|
number_of_patents integer,
|
||||||
|
number_of_projects integer,
|
||||||
|
number_of_pubmed_publications integer,
|
||||||
|
number_of_rest_publications integer,
|
||||||
|
number_of_segments integer,
|
||||||
|
total_cost numeric
|
||||||
|
);
|
||||||
|
|
||||||
|
CREATE TABLE pp_countries_cooccurrences (
|
||||||
|
funding text REFERENCES pp_metrics(id),
|
||||||
|
country1 text,
|
||||||
|
country2 text,
|
||||||
|
number integer,
|
||||||
|
PRIMARY KEY (funding, country1, country2)
|
||||||
|
);
|
||||||
|
|
||||||
|
CREATE TABLE pp_eu_contribution_per_country (
|
||||||
|
funding text REFERENCES pp_metrics(id),
|
||||||
|
country text,
|
||||||
|
contribution numeric,
|
||||||
|
PRIMARY KEY (funding, country)
|
||||||
|
);
|
||||||
|
|
||||||
|
CREATE TABLE pp_eu_contribution_per_participant_sector (
|
||||||
|
funding text REFERENCES pp_metrics(id),
|
||||||
|
sector text,
|
||||||
|
contribution numeric,
|
||||||
|
PRIMARY KEY (funding, sector)
|
||||||
|
);
|
||||||
|
|
||||||
|
CREATE TABLE pp_eu_contribution_per_research_area (
|
||||||
|
funding text REFERENCES pp_metrics(id),
|
||||||
|
area text,
|
||||||
|
contribution numeric,
|
||||||
|
PRIMARY KEY (funding, area)
|
||||||
|
);
|
||||||
|
|
||||||
|
CREATE TABLE pp_eu_contribution_per_research_area_over_time (
|
||||||
|
funding text REFERENCES pp_metrics(id),
|
||||||
|
area text,
|
||||||
|
year integer,
|
||||||
|
contribution numeric,
|
||||||
|
PRIMARY KEY (funding, area, year)
|
||||||
|
|
||||||
|
);
|
||||||
|
|
||||||
|
CREATE TABLE pp_eu_contribution_per_year (
|
||||||
|
funding text REFERENCES pp_metrics(id),
|
||||||
|
year integer,
|
||||||
|
contribution numeric,
|
||||||
|
PRIMARY KEY (funding, year)
|
||||||
|
);
|
||||||
|
|
||||||
|
CREATE TABLE pp_number_of_innovations_per_type (
|
||||||
|
funding text REFERENCES pp_metrics(id),
|
||||||
|
type text,
|
||||||
|
number integer,
|
||||||
|
PRIMARY KEY (funding, type)
|
||||||
|
);
|
||||||
|
|
||||||
|
CREATE TABLE pp_number_of_innovations_per_type_per_country (
|
||||||
|
funding text REFERENCES pp_metrics(id),
|
||||||
|
type text,
|
||||||
|
country text,
|
||||||
|
number integer,
|
||||||
|
PRIMARY KEY (funding, type, country)
|
||||||
|
);
|
||||||
|
|
||||||
|
CREATE TABLE pp_number_of_innovations_per_type_per_research_area (
|
||||||
|
funding text REFERENCES pp_metrics(id),
|
||||||
|
type text,
|
||||||
|
area text,
|
||||||
|
number integer,
|
||||||
|
PRIMARY KEY (funding, type, area)
|
||||||
|
);
|
||||||
|
|
||||||
|
CREATE TABLE pp_number_of_patents_per_research_area (
|
||||||
|
funding text REFERENCES pp_metrics(id),
|
||||||
|
area text,
|
||||||
|
number integer,
|
||||||
|
PRIMARY KEY (funding, area)
|
||||||
|
);
|
||||||
|
|
||||||
|
CREATE TABLE pp_number_of_projects_per_research_area (
|
||||||
|
funding text REFERENCES pp_metrics(id),
|
||||||
|
area text,
|
||||||
|
number integer,
|
||||||
|
PRIMARY KEY (funding, area)
|
||||||
|
);
|
||||||
|
|
||||||
|
CREATE TABLE pp_number_of_pubmed_publications_per_country (
|
||||||
|
funding text REFERENCES pp_metrics(id),
|
||||||
|
country text,
|
||||||
|
number integer,
|
||||||
|
PRIMARY KEY (funding, country)
|
||||||
|
);
|
||||||
|
|
||||||
|
CREATE TABLE pp_number_of_pubmed_publications_per_journal (
|
||||||
|
funding text REFERENCES pp_metrics(id),
|
||||||
|
journal text,
|
||||||
|
number integer,
|
||||||
|
PRIMARY KEY (funding, journal)
|
||||||
|
);
|
||||||
|
|
||||||
|
CREATE TABLE pp_number_of_pubmed_publications_per_journal_per_research_area (
|
||||||
|
funding text REFERENCES pp_metrics(id),
|
||||||
|
journal text,
|
||||||
|
area text,
|
||||||
|
number integer,
|
||||||
|
PRIMARY KEY (funding, journal, area)
|
||||||
|
);
|
||||||
|
|
||||||
|
CREATE TABLE pp_number_of_pubmed_publications_per_journal_per_year (
|
||||||
|
funding text REFERENCES pp_metrics(id),
|
||||||
|
journal text,
|
||||||
|
year integer,
|
||||||
|
number integer,
|
||||||
|
PRIMARY KEY (funding, journal, year)
|
||||||
|
);
|
||||||
|
|
||||||
|
CREATE TABLE pp_number_of_pubmed_publications_per_research_area (
|
||||||
|
funding text REFERENCES pp_metrics(id),
|
||||||
|
area text,
|
||||||
|
number integer,
|
||||||
|
PRIMARY KEY (funding, area)
|
||||||
|
);
|
||||||
|
|
||||||
|
CREATE TABLE pp_number_of_pubmed_publications_per_year (
|
||||||
|
funding text REFERENCES pp_metrics(id),
|
||||||
|
year integer,
|
||||||
|
number integer,
|
||||||
|
PRIMARY KEY (funding, year)
|
||||||
|
);
|
||||||
|
|
||||||
|
-- IT IS EQUIVALENT TO pp_number_of_pubmed_publications_per_journal_per_year --
|
||||||
|
CREATE TABLE pp_number_of_pubmed_publications_per_year_per_journal (
|
||||||
|
funding text REFERENCES pp_metrics(id),
|
||||||
|
journal text,
|
||||||
|
year integer,
|
||||||
|
number integer,
|
||||||
|
PRIMARY KEY (funding, journal, year)
|
||||||
|
);
|
||||||
|
|
||||||
|
CREATE TABLE pp_number_of_rest_publications_per_research_area (
|
||||||
|
funding text REFERENCES pp_metrics(id),
|
||||||
|
area text,
|
||||||
|
number integer,
|
||||||
|
PRIMARY KEY (funding, area)
|
||||||
|
);
|
||||||
|
|
||||||
|
CREATE TABLE pp_number_of_rest_publications_per_year (
|
||||||
|
funding text REFERENCES pp_metrics(id),
|
||||||
|
year integer,
|
||||||
|
number integer,
|
||||||
|
PRIMARY KEY (funding, year)
|
||||||
|
);
|
||||||
|
|
||||||
|
CREATE TABLE pp_research_areas_cooccurrences (
|
||||||
|
funding text REFERENCES pp_metrics(id),
|
||||||
|
area1 text,
|
||||||
|
area2 text,
|
||||||
|
number integer,
|
||||||
|
PRIMARY KEY (funding, area1, area2)
|
||||||
|
);
|
||||||
|
|
||||||
|
CREATE TABLE pp_research_areas_to_icd10 (
|
||||||
|
funding text REFERENCES pp_metrics(id),
|
||||||
|
area text,
|
||||||
|
icd10 text,
|
||||||
|
PRIMARY KEY (funding, area)
|
||||||
|
);
|
||||||
|
|
||||||
|
CREATE TABLE pp_total_cost_per_research_area (
|
||||||
|
funding text REFERENCES pp_metrics(id),
|
||||||
|
area text,
|
||||||
|
cost numeric,
|
||||||
|
PRIMARY KEY (funding, area)
|
||||||
|
);
|
||||||
|
|
||||||
|
CREATE TABLE pp_total_cost_per_research_area_over_time (
|
||||||
|
funding text REFERENCES pp_metrics(id),
|
||||||
|
area text,
|
||||||
|
year integer,
|
||||||
|
cost numeric,
|
||||||
|
PRIMARY KEY (funding, area, year)
|
||||||
|
);
|
||||||
|
|
||||||
|
CREATE TABLE pp_total_cost_per_year (
|
||||||
|
funding text REFERENCES pp_metrics(id),
|
||||||
|
year integer,
|
||||||
|
cost numeric,
|
||||||
|
PRIMARY KEY (funding, year)
|
||||||
|
);
|
||||||
|
|
|
@ -0,0 +1,194 @@
|
||||||
|
#!/bin/bash
# Rebuilds the $db Postgres database from the D4I "statistics on release" JSON
# dump: recreates the schema, loads pp_metrics, then every per-dimension
# breakdown table. Requires jq and the Postgres client tools on PATH.

set -e

file=/Users/claudio/workspace/data/d4i/november2018/D4I_Metrics_ARC_Release04_WP52_31Nov2018/statistics_on_release.json
db=metrics_tmp

# Loads a table whose JSON source is a one-level map: funding -> { key -> value }.
#   $1 = JSON field name inside each funding object
#   $2 = COPY target in the form "table(col1,col2,col3)"
import_flat() {
	echo "Importing table ${2%%(*}"
	jq -r --arg f "$1" 'to_entries | (map([.key, (.value[$f] | to_entries | map([.key, .value] ))]) ) | .[] | to_entries | .[0].value as $id | .[1].value | map([$id,.[0],.[1]]) | .[] | @csv' "$file" \
		| sed -e 's/"null"/-1/g' \
		| psql "$db" -c "COPY $2 FROM STDIN CSV"
	echo
}

# Loads a table whose JSON source is a two-level map:
# funding -> { key1 -> { key2 -> value } }.
#   $1 = JSON field name inside each funding object
#   $2 = COPY target in the form "table(col1,col2,col3,col4)"
import_nested() {
	echo "Importing table ${2%%(*}"
	jq -r --arg f "$1" 'to_entries | (map([.key, (.value[$f] | to_entries | map([.key, (.value | to_entries | map([.key, .value ]))]))])) | .[] | to_entries | .[0].value as $id | .[1].value[] | to_entries | .[0].value as $x | .[1].value | map([$id,$x,.[0],.[1]]) | .[] | @csv' "$file" \
		| sed -e 's/"null"/-1/g' \
		| psql "$db" -c "COPY $2 FROM STDIN CSV"
	echo
}

echo "Recreating the database $db"
dropdb "$db" --if-exists
createdb "$db"
psql "$db" -f schema.sql
echo

# pp_metrics is special: one row per funding with a fixed set of scalar columns.
# The sed maps every "null" marker to -1 (the /g flag is required: a line can
# contain more than one).
echo "Importing table pp_metrics"
jq -r 'to_entries | map([.key, .value.eu_contribution, .value.number_of_innovations, .value.number_of_companies_founded, .value.number_of_patents, .value.number_of_projects, .value.number_of_pubmed_publications, .value.number_of_rest_publications, .value.number_of_segments, .value.total_cost]) | .[] | @csv' "$file" \
	| sed -e 's/"null"/-1/g' \
	| psql "$db" -c "COPY pp_metrics(id,eu_contribution,number_of_innovations,number_of_companies_founded,number_of_patents,number_of_projects,number_of_pubmed_publications,number_of_rest_publications,number_of_segments,total_cost) FROM STDIN CSV"
echo

import_nested countries_cooccurrences "pp_countries_cooccurrences(funding,country1,country2,number)"
import_flat   eu_contribution_per_country "pp_eu_contribution_per_country(funding,country,contribution)"
import_flat   eu_contribution_per_participant_sector "pp_eu_contribution_per_participant_sector(funding,sector,contribution)"
import_flat   eu_contribution_per_research_area "pp_eu_contribution_per_research_area(funding,area,contribution)"
import_nested eu_contribution_per_research_area_over_time "pp_eu_contribution_per_research_area_over_time(funding,year,area,contribution)"
import_flat   eu_contribution_per_year "pp_eu_contribution_per_year(funding,year,contribution)"
import_flat   number_of_innovations_per_type "pp_number_of_innovations_per_type(funding,type,number)"
import_nested number_of_innovations_per_type_per_country "pp_number_of_innovations_per_type_per_country(funding,country,type,number)"
import_nested number_of_innovations_per_type_per_research_area "pp_number_of_innovations_per_type_per_research_area(funding,area,type,number)"
import_flat   number_of_patents_per_research_area "pp_number_of_patents_per_research_area(funding,area,number)"
import_flat   number_of_projects_per_research_area "pp_number_of_projects_per_research_area(funding,area,number)"
import_flat   number_of_pubmed_publications_per_country "pp_number_of_pubmed_publications_per_country(funding,country,number)"
import_flat   number_of_pubmed_publications_per_journal "pp_number_of_pubmed_publications_per_journal(funding,journal,number)"
import_nested number_of_pubmed_publications_per_journal_per_research_area "pp_number_of_pubmed_publications_per_journal_per_research_area(funding,journal,area,number)"
import_nested number_of_pubmed_publications_per_journal_per_year "pp_number_of_pubmed_publications_per_journal_per_year(funding,journal,year,number)"
import_flat   number_of_pubmed_publications_per_research_area "pp_number_of_pubmed_publications_per_research_area(funding,area,number)"
import_flat   number_of_pubmed_publications_per_year "pp_number_of_pubmed_publications_per_year(funding,year,number)"
import_nested number_of_pubmed_publications_per_year_per_journal "pp_number_of_pubmed_publications_per_year_per_journal(funding,year,journal,number)"
import_flat   number_of_rest_publications_per_research_area "pp_number_of_rest_publications_per_research_area(funding,area,number)"
import_flat   number_of_rest_publications_per_year "pp_number_of_rest_publications_per_year(funding,year,number)"
import_nested research_areas_cooccurrences "pp_research_areas_cooccurrences(funding,area1,area2,number)"
import_flat   research_areas_to_icd10 "pp_research_areas_to_icd10(funding,area,icd10)"
import_flat   total_cost_per_research_area "pp_total_cost_per_research_area(funding,area,cost)"
import_nested total_cost_per_research_area_over_time "pp_total_cost_per_research_area_over_time(funding,year,area,cost)"
import_flat   total_cost_per_year "pp_total_cost_per_year(funding,year,cost)"
||||||
|
|
|
@ -0,0 +1,3 @@
|
||||||
|
-- Copies the staged fulltexts into doc_fulltext, matching documents to the
-- staging table by publication id. (An inner join plus the NOT NULL filter is
-- equivalent to the original LEFT OUTER JOIN + WHERE form.)
INSERT INTO doc_fulltext (docid, fulltext)
SELECT d.id       AS docid,
       t.fulltext AS fulltext
FROM document d
JOIN temp_fulltext t ON d.id = t.pubid
WHERE t.fulltext IS NOT NULL;
|
|
@ -0,0 +1,5 @@
|
||||||
|
# DONE using a java application
#
# Decodes the pubmed dump: each line of pubmed.json carries a Mongo
# extended-JSON record whose body["$binary"] field is a base64-encoded,
# gzipped payload. "$line" must be quoted, otherwise the shell word-splits
# and glob-expands the JSON before jq sees it; jq -r replaces the fragile
# sed 's/"//g' quote-stripping.
while read -r line; do
	echo "$line" | jq -r '.body["$binary"]' | base64 -d | gunzip -c
done < pubmed.json
||||||
|
|
|
@ -0,0 +1,7 @@
|
||||||
|
-- Emits one JSON document per DOI found in the comma-separated
-- projects.doi_list column, tagged with identifier type "doi".
COPY (
	SELECT row_to_json(t)
	FROM (
		SELECT token AS "id",
		       'doi' AS "type"
		FROM projects p,
		     unnest(string_to_array(p.doi_list, ',')) s(token)
		WHERE token IS NOT NULL
	) t
) TO STDOUT;
|
|
@ -0,0 +1,6 @@
|
||||||
|
-- Emits one JSON record per distinct coordinating organization.
-- Ids follow the D4I convention: '20|swedish_orgs::' + MD5 of the lowercased
-- name; the country is hard-coded to Sweden.
COPY (
	SELECT row_to_json(t)
	FROM (
		SELECT DISTINCT
			'20|swedish_orgs::' || MD5(lower(organizations_coordinating_en)) AS "id",
			organizations_coordinating_en                                    AS "name",
			'SE'                                                             AS "country"
		FROM projects
	) t
) TO STDOUT;
|
|
@ -0,0 +1,8 @@
|
||||||
|
-- Links each project to the documents listed in its comma-separated doi_list,
-- one JSON record per (project, DOI) pair. Project ids follow the D4I
-- convention: '40|' + funder prefix padded to 12 chars + '::' + MD5 of the
-- grant number (dnr).
COPY (
	SELECT row_to_json(t)
	FROM (
		SELECT
			'40|' || rpad(lower(organization_short), 12, '_') || '::' || MD5(dnr) AS "projectId",
			token AS "docId",
			'doi' AS "docIdType"
		FROM projects p,
		     unnest(string_to_array(p.doi_list, ',')) s(token)
		WHERE token IS NOT NULL
	) t
) TO STDOUT;
|
|
@ -0,0 +1,9 @@
|
||||||
|
-- Emits one project/organization relation per project: the coordinating
-- organization, with the project leader as contact person.
COPY (
	SELECT row_to_json(t)
	FROM (
		SELECT
			'40|' || rpad(lower(organization_short), 12, '_') || '::' || MD5(dnr) AS "projectId",
			'20|swedish_orgs::' || MD5(lower(organizations_coordinating_en))      AS "orgId",
			'coordinator'                                                         AS "role",
			people_project_leaders_0_firstname                                    AS "contactFirstNames",
			people_project_leaders_0_surname                                      AS "contactLastNames"
		FROM projects
	) t
) TO STDOUT;
|
||||||
|
|
|
@ -0,0 +1,6 @@
|
||||||
|
-- Exposes each project's original grant number (dnr) as an alternative
-- identifier of type '<funder>:grant_id'.
COPY (
	SELECT row_to_json(t)
	FROM (
		SELECT
			'40|' || rpad(lower(organization_short), 12, '_') || '::' || MD5(dnr) AS "projectId",
			dnr                                                                   AS "id",
			lower(organization_short) || ':grant_id'                              AS "type"
		FROM projects
	) t
) TO STDOUT;
|
|
@ -0,0 +1,19 @@
|
||||||
|
-- Emits one JSON project record per row, mapped to the D4I importer field
-- names; the currency is fixed to Swedish krona.
COPY (
	SELECT row_to_json(t)
	FROM (
		SELECT
			'40|' || rpad(lower(organization_short), 12, '_') || '::' || MD5(dnr) AS "id",
			title_en           AS "title",
			organization_short AS "funder",
			type_of_awards     AS "fundingLevel0",
			dates_start_date   AS "startDate",
			dates_end_date     AS "endDate",
			abstract_en        AS "abstractText",
			tags_0_en          AS "keywords",
			total_funding      AS "contribution",
			'SEK'::text        AS "currency"
		FROM projects
	) t
) TO STDOUT;

-- Columns deliberately not exported here:
-- intrascientific_report_en, popular_report_sv,
-- doi_list (handled by the dedicated DOI export scripts).
|
|
@ -0,0 +1,22 @@
|
||||||
|
-- Raw landing table for the Swedish projects CSV delivery: column order and
-- names mirror the CSV header (see the COPY statement in run.sh). Everything
-- is imported as text except total_funding.
CREATE TABLE projects (
	swecris_info                       text,
	doi                                text,
	final_reports                      text,
	Organization_short                 text,
	Organization_long                  text,
	dnr                                text,
	people_project_leaders_0_surname   text,
	people_project_leaders_0_firstname text,
	organizations_coordinating_en      text,
	type_of_awards                     text,
	dates_start_date                   text,
	dates_end_date                     text,
	title_en                           text,
	abstract_en                        text,
	intrascientific_report_en          text,
	popular_report_sv                  text,
	tags_0_en                          text,
	doi_list                           text,
	total_funding                      numeric
);
|
||||||
|
|
|
@ -0,0 +1,29 @@
|
||||||
|
#!/bin/bash
# Imports the Swedish projects CSV delivery into the "swedishprojects"
# Postgres database, then exports the entities as JSON-lines files for the
# D4I importer. Requires the Postgres client tools on PATH, the CSV at $csv,
# and the *.sql scripts in the current directory.
#
# set -e: without it a failed schema load or COPY would still go on to wipe
# and regenerate the JSON output files.
set -e

csv=/tmp/180626-swe_proj_data-delivery.csv

# Absolute path of the CSV (psql's COPY FROM resolves paths server-side).
inputCsvFile="$(cd "$(dirname "$csv")"; pwd -P)/$(basename "$csv")"

echo
echo "Swedish Projects Import:"

#--------------------------------
echo " - Recreating the swedishprojects database"
dropdb swedishprojects --if-exists
createdb swedishprojects
psql swedishprojects -f schema.sql
psql swedishprojects -c "COPY projects(swecris_info, doi, final_reports, Organization_short, Organization_long, dnr, people_project_leaders_0_surname, people_project_leaders_0_firstname, organizations_coordinating_en, type_of_awards, dates_start_date, dates_end_date, title_en, abstract_en, intrascientific_report_en, popular_report_sv, tags_0_en, doi_list, total_funding) FROM '$inputCsvFile' DELIMITER ',' CSV HEADER;"

#--------------------------------
echo " - Generating json files"
rm -f ../../jsonfiles/swedishProjects/*.json
# The sed collapses the double backslashes produced by row_to_json escaping.
psql swedishprojects -f projects2json.sql     | sed 's/\\\\/\\/g' > ../../jsonfiles/swedishProjects/project.json
psql swedishprojects -f orgs2json.sql         | sed 's/\\\\/\\/g' > ../../jsonfiles/swedishProjects/organization.json
psql swedishprojects -f projOrg2json.sql      | sed 's/\\\\/\\/g' > ../../jsonfiles/swedishProjects/projectOrganization.json
psql swedishprojects -f projOtherIds2json.sql | sed 's/\\\\/\\/g' > ../../jsonfiles/swedishProjects/projectOtherId.json
psql swedishprojects -f docOtherId2json.sql   | sed 's/\\\\/\\/g' > ../../jsonfiles/swedishProjects/docotherid.json
psql swedishprojects -f projDoi2json.sql      | sed 's/\\\\/\\/g' > ../../jsonfiles/swedishProjects/projectdocotherid.json

echo "Done."
echo
|
@ -0,0 +1,93 @@
|
||||||
|
<?xml version="1.0" encoding="UTF-8"?>
|
||||||
|
<project xmlns="http://maven.apache.org/POM/4.0.0"
|
||||||
|
xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
|
||||||
|
xsi:schemaLocation="http://maven.apache.org/POM/4.0.0 http://maven.apache.org/xsd/maven-4.0.0.xsd">
|
||||||
|
<modelVersion>4.0.0</modelVersion>
|
||||||
|
<groupId>eu.dnetlib</groupId>
|
||||||
|
<artifactId>data4impact-importer</artifactId>
|
||||||
|
<version>1.1.0-SNAPSHOT</version>
|
||||||
|
<!-- <scm> <developerConnection>scm:svn:https://svn.driver.research-infrastructures.eu/driver/data4impact/data4impact-importer/trunk</developerConnection>
|
||||||
|
</scm> <ciManagement> <system>jenkins</system> <url>https://jenkins-dnet.d4science.org/view/data4impact/job/data4impact-importer/</url>
|
||||||
|
</ciManagement> <distributionManagement> <repository> <id>dnet45-releases</id>
|
||||||
|
<name>D-Net 45 Releases</name> <url>http://maven.research-infrastructures.eu/nexus/content/repositories/dnet45-releases</url>
|
||||||
|
<layout>default</layout> </repository> </distributionManagement> -->
|
||||||
|
<!-- Inherit defaults from Spring Boot -->
|
||||||
|
<parent>
|
||||||
|
<groupId>org.springframework.boot</groupId>
|
||||||
|
<artifactId>spring-boot-starter-parent</artifactId>
|
||||||
|
<version>2.0.3.RELEASE</version>
|
||||||
|
<relativePath></relativePath>
|
||||||
|
</parent>
|
||||||
|
|
||||||
|
<!-- <repositories> <repository> <id>dnet-deps</id> <name>dnet-dependencies</name>
|
||||||
|
<url>http://maven.research-infrastructures.eu/nexus/content/repositories/dnet-deps</url>
|
||||||
|
<layout>default</layout> </repository> <repository> <id>dnet45-releases</id>
|
||||||
|
<name>D-Net 45 Releases</name> <url>http://maven.research-infrastructures.eu/nexus/content/repositories/dnet45-releases</url>
|
||||||
|
<layout>default</layout> <snapshots> <enabled>true</enabled> </snapshots>
|
||||||
|
</repository> <repository> <id>dnet45-snapshots</id> <name>D-Net 45 Snapshots</name>
|
||||||
|
<url>http://maven.research-infrastructures.eu/nexus/content/repositories/dnet45-snapshots</url>
|
||||||
|
<layout>default</layout> <snapshots> <enabled>true</enabled> </snapshots>
|
||||||
|
</repository> </repositories> -->
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
|
<!-- Add typical dependencies for a web application -->
|
||||||
|
<dependencies>
|
||||||
|
<dependency>
|
||||||
|
<groupId>org.springframework.boot</groupId>
|
||||||
|
<artifactId>spring-boot-starter</artifactId>
|
||||||
|
</dependency>
|
||||||
|
<dependency>
|
||||||
|
<groupId>eu.dnetlib</groupId>
|
||||||
|
<artifactId>data4impact-model</artifactId>
|
||||||
|
<version>1.1.0-SNAPSHOT</version>
|
||||||
|
</dependency>
|
||||||
|
<dependency>
|
||||||
|
<groupId>org.reflections</groupId>
|
||||||
|
<artifactId>reflections</artifactId>
|
||||||
|
<version>0.9.11</version>
|
||||||
|
</dependency>
|
||||||
|
<dependency>
|
||||||
|
<groupId>com.fasterxml.jackson.core</groupId>
|
||||||
|
<artifactId>jackson-core</artifactId>
|
||||||
|
</dependency>
|
||||||
|
<dependency>
|
||||||
|
<groupId>com.fasterxml.jackson.core</groupId>
|
||||||
|
<artifactId>jackson-annotations</artifactId>
|
||||||
|
</dependency>
|
||||||
|
<dependency>
|
||||||
|
<groupId>com.fasterxml.jackson.core</groupId>
|
||||||
|
<artifactId>jackson-databind</artifactId>
|
||||||
|
</dependency>
|
||||||
|
|
||||||
|
<!-- JUnit -->
|
||||||
|
<dependency>
|
||||||
|
<groupId>junit</groupId>
|
||||||
|
<artifactId>junit</artifactId>
|
||||||
|
<scope>test</scope>
|
||||||
|
</dependency>
|
||||||
|
</dependencies>
|
||||||
|
|
||||||
|
<build>
|
||||||
|
<plugins>
|
||||||
|
<plugin>
|
||||||
|
<groupId>org.springframework.boot</groupId>
|
||||||
|
<artifactId>spring-boot-maven-plugin</artifactId>
|
||||||
|
<configuration>
|
||||||
|
<executable>true</executable>
|
||||||
|
</configuration>
|
||||||
|
</plugin>
|
||||||
|
</plugins>
|
||||||
|
</build>
|
||||||
|
|
||||||
|
<properties>
|
||||||
|
<java.version>1.8</java.version>
|
||||||
|
<apache.solr.version>7.1.0</apache.solr.version>
|
||||||
|
<mongodb.driver.version>3.4.2</mongodb.driver.version>
|
||||||
|
<springfox-version>2.8.0</springfox-version>
|
||||||
|
<prometheus.version>0.2.0</prometheus.version>
|
||||||
|
<javamelody.version>1.71.0</javamelody.version>
|
||||||
|
<maven.javadoc.failOnError>false</maven.javadoc.failOnError>
|
||||||
|
<dockerfile-maven-version>1.3.6</dockerfile-maven-version>
|
||||||
|
</properties>
|
||||||
|
</project>
|
|
@ -0,0 +1,88 @@
|
||||||
|
package eu.data4impact;
|
||||||
|
|
||||||
|
import java.io.IOException;
import java.nio.charset.StandardCharsets;
import java.nio.file.Files;
import java.nio.file.Path;
import java.time.Duration;
import java.time.LocalDateTime;
import java.util.Optional;
import java.util.stream.Stream;

import javax.persistence.EntityManagerFactory;
import javax.transaction.Transactional;

import org.springframework.beans.factory.annotation.Autowired;
import org.springframework.context.ApplicationContext;
import org.springframework.data.jpa.repository.JpaRepository;
import org.springframework.stereotype.Component;

import com.fasterxml.jackson.databind.ObjectMapper;
|
||||||
|
|
||||||
|
@Component
|
||||||
|
public class Data4ImpactImporter {
|
||||||
|
|
||||||
|
@Autowired
|
||||||
|
private ApplicationContext applicationContext;
|
||||||
|
|
||||||
|
@Autowired
|
||||||
|
private EntityManagerFactory entityManagerFactory;
|
||||||
|
|
||||||
|
private final ObjectMapper jsonMapper = new ObjectMapper();
|
||||||
|
|
||||||
|
@Transactional
|
||||||
|
public <T> void importFileJson(final Path file, final Class<T> tableClass) {
|
||||||
|
try {
|
||||||
|
final LocalDateTime start = LocalDateTime.now();
|
||||||
|
final JpaRepository<T, ?> repo = findRepositorForTable(tableClass);
|
||||||
|
|
||||||
|
Files.lines(file, StandardCharsets.UTF_8).forEach(l -> processLine(l, tableClass, repo));
|
||||||
|
|
||||||
|
final LocalDateTime end = LocalDateTime.now();
|
||||||
|
final double time = Duration.between(start, end).toNanos() / 1000000000.0;
|
||||||
|
|
||||||
|
System.out.printf("\nDone in %.3f sec.\n\n", time);
|
||||||
|
} catch (final IOException e) {
|
||||||
|
throw new RuntimeException(e);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
@SuppressWarnings("unchecked")
|
||||||
|
private <T, K> void processLine(final String line, final Class<T> tableClass, final JpaRepository<T, K> repo) {
|
||||||
|
try {
|
||||||
|
final T obj = jsonMapper.readValue(line, tableClass);
|
||||||
|
final K id = (K) entityManagerFactory.getPersistenceUnitUtil().getIdentifier(obj);
|
||||||
|
processObject(obj, id, repo);
|
||||||
|
} catch (final IOException | IllegalAccessException | InstantiationException e) {
|
||||||
|
throw new RuntimeException(e);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
private <T, K> void processObject(final T obj, final K id, final JpaRepository<T, K> repo) throws IllegalAccessException, InstantiationException {
|
||||||
|
System.out.println(id);
|
||||||
|
final Optional<T> old = repo.findById(id);
|
||||||
|
if (old.isPresent()) {
|
||||||
|
repo.save(ObjectMerger.mergeObjects(old.get(), obj));
|
||||||
|
} else {
|
||||||
|
repo.save(obj);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
@Transactional
|
||||||
|
public <T> void importFileXML(final String file, final Class<?> tableClass) {
|
||||||
|
throw new RuntimeException("-- NOT IMPLEMENTED --");
|
||||||
|
}
|
||||||
|
|
||||||
|
@SuppressWarnings("unchecked")
|
||||||
|
private <T, K> JpaRepository<T, K> findRepositorForTable(final Class<T> clazz) {
|
||||||
|
final String repoName = clazz.getSimpleName() + "Repository";
|
||||||
|
|
||||||
|
return applicationContext.getBeansOfType(JpaRepository.class)
|
||||||
|
.entrySet()
|
||||||
|
.stream()
|
||||||
|
.filter(e -> e.getKey().equalsIgnoreCase(repoName))
|
||||||
|
.map(e -> e.getValue())
|
||||||
|
.findFirst()
|
||||||
|
.orElseThrow(() -> new RuntimeException("No repository found for class " + clazz.getName()));
|
||||||
|
}
|
||||||
|
|
||||||
|
}
|
|
@ -0,0 +1,99 @@
|
||||||
|
package eu.data4impact;
|
||||||
|
|
||||||
|
import java.nio.file.Path;
|
||||||
|
import java.nio.file.Paths;
|
||||||
|
import java.util.HashMap;
|
||||||
|
import java.util.Map;
|
||||||
|
import java.util.stream.Collectors;
|
||||||
|
|
||||||
|
import javax.persistence.Table;
|
||||||
|
|
||||||
|
import org.reflections.Reflections;
|
||||||
|
import org.springframework.beans.factory.annotation.Autowired;
|
||||||
|
import org.springframework.boot.CommandLineRunner;
|
||||||
|
import org.springframework.boot.SpringApplication;
|
||||||
|
import org.springframework.boot.autoconfigure.SpringBootApplication;
|
||||||
|
|
||||||
|
import eu.data4impact.utils.DatabaseUtils;
|
||||||
|
|
||||||
|
@SpringBootApplication
|
||||||
|
public class Data4ImpactImporterApplication implements CommandLineRunner {
|
||||||
|
|
||||||
|
// private static final Logger log = LoggerFactory.getLogger(Data4ImpactImporterApplication.class);
|
||||||
|
|
||||||
|
@Autowired
|
||||||
|
private Data4ImpactImporter importer;
|
||||||
|
|
||||||
|
@Autowired
|
||||||
|
private DatabaseUtils databaseUtils;
|
||||||
|
|
||||||
|
public static void main(final String... args) {
|
||||||
|
SpringApplication.run(Data4ImpactImporterApplication.class, args);
|
||||||
|
}
|
||||||
|
|
||||||
|
@Override
|
||||||
|
public void run(final String... args) {
|
||||||
|
|
||||||
|
final Map<String, Class<?>> validEntities = validEntities();
|
||||||
|
|
||||||
|
if (args.length == 0) {
|
||||||
|
printHelp();
|
||||||
|
printValidFiles(validEntities);
|
||||||
|
System.exit(1);
|
||||||
|
}
|
||||||
|
|
||||||
|
for (final String f : args) {
|
||||||
|
if (f.toLowerCase().endsWith(".json")) {
|
||||||
|
System.out.println("Processing file: " + f);
|
||||||
|
final Path path = Paths.get(f);
|
||||||
|
final String fileName = path.getFileName().toString();
|
||||||
|
final String entityName = fileName.substring(0, fileName.lastIndexOf('.')).toLowerCase();
|
||||||
|
if (validEntities.containsKey(entityName)) {
|
||||||
|
importer.importFileJson(path, validEntities.get(entityName));
|
||||||
|
} else {
|
||||||
|
System.err.println("\n[ERROR] Entity not found for file " + f);
|
||||||
|
printValidFiles(validEntities);
|
||||||
|
System.exit(-1);
|
||||||
|
}
|
||||||
|
} else {
|
||||||
|
System.err.println("\nNot a json file: " + f);
|
||||||
|
printValidFiles(validEntities);
|
||||||
|
System.exit(-1);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
System.out.println("Refreshing views...");
|
||||||
|
databaseUtils.refreshMaterializedViews(v -> System.out.println(" - " + v));
|
||||||
|
System.out.println("Done.\n");
|
||||||
|
}
|
||||||
|
|
||||||
|
private void printHelp() {
|
||||||
|
System.out.println();
|
||||||
|
System.out.println("Missing input files !");
|
||||||
|
System.out.println();
|
||||||
|
System.out.println("Example: java -jar file1.json file2.json ...");
|
||||||
|
System.out.println();
|
||||||
|
}
|
||||||
|
|
||||||
|
private void printValidFiles(final Map<String, Class<?>> validEntities) {
|
||||||
|
System.out.println("\nValid filenames are (ignore case):\n" +
|
||||||
|
validEntities.keySet()
|
||||||
|
.stream()
|
||||||
|
.collect(Collectors.groupingBy(validEntities::get))
|
||||||
|
.entrySet()
|
||||||
|
.stream()
|
||||||
|
.map(e -> String.format(" - For class %s: %s\n",
|
||||||
|
e.getKey().getSimpleName(),
|
||||||
|
e.getValue().stream().collect(Collectors.joining(".json, ")) + ".json"))
|
||||||
|
.collect(Collectors.joining()));
|
||||||
|
}
|
||||||
|
|
||||||
|
private Map<String, Class<?>> validEntities() {
|
||||||
|
final Map<String, Class<?>> res = new HashMap<>();
|
||||||
|
for (final Class<?> cl : new Reflections("eu.data4impact.model").getTypesAnnotatedWith(Table.class)) {
|
||||||
|
res.put(cl.getSimpleName().toLowerCase(), cl);
|
||||||
|
res.put(cl.getAnnotation(Table.class).name().toLowerCase(), cl);
|
||||||
|
}
|
||||||
|
return res;
|
||||||
|
}
|
||||||
|
|
||||||
|
}
|
|
@ -0,0 +1,23 @@
|
||||||
|
package eu.data4impact;
|
||||||
|
|
||||||
|
import java.lang.reflect.Constructor;
import java.lang.reflect.Field;
import java.lang.reflect.InvocationTargetException;
import java.lang.reflect.Modifier;
|
||||||
|
|
||||||
|
public class ObjectMerger {
|
||||||
|
|
||||||
|
@SuppressWarnings("unchecked")
|
||||||
|
public static <T> T mergeObjects(final T first, final T second) throws IllegalAccessException, InstantiationException {
|
||||||
|
final Class<?> clazz = first.getClass();
|
||||||
|
final Field[] fields = clazz.getDeclaredFields();
|
||||||
|
final T res = (T) clazz.newInstance();
|
||||||
|
for (final Field f : fields) {
|
||||||
|
if (!Modifier.isFinal(f.getModifiers())) {
|
||||||
|
f.setAccessible(true);
|
||||||
|
final Object v1 = f.get(first);
|
||||||
|
final Object v2 = f.get(second);
|
||||||
|
f.set(res, (v2 != null ? v2 : v1));
|
||||||
|
}
|
||||||
|
}
|
||||||
|
return res;
|
||||||
|
}
|
||||||
|
}
|
|
@ -0,0 +1,14 @@
|
||||||
|
spring.main.banner-mode = off
|
||||||
|
logging.level.root = WARN
|
||||||
|
|
||||||
|
spring.datasource.url=jdbc:postgresql://localhost:5432/data4impact
|
||||||
|
spring.datasource.username=
|
||||||
|
spring.datasource.password=
|
||||||
|
|
||||||
|
spring.jpa.properties.hibernate.dialect = org.hibernate.dialect.PostgreSQLDialect
|
||||||
|
|
||||||
|
# Hibernate ddl auto (create, create-drop, validate, update)
|
||||||
|
spring.jpa.hibernate.ddl-auto = validate
|
||||||
|
spring.jpa.properties.hibernate.hbm2ddl.extra_physical_table_types = MATERIALIZED VIEW
|
||||||
|
spring.jpa.properties.hibernate.jdbc.lob.non_contextual_creation=true
|
||||||
|
spring.jpa.open-in-view=true
|
|
@ -0,0 +1,26 @@
|
||||||
|
package eu.data4impact;
|
||||||
|
|
||||||
|
import static org.junit.Assert.assertTrue;
|
||||||
|
|
||||||
|
import org.junit.Test;
|
||||||
|
|
||||||
|
import eu.data4impact.model.projects.Project;
|
||||||
|
|
||||||
|
public class ObjectMergerTest {
|
||||||
|
|
||||||
|
@Test
|
||||||
|
public void test() throws IllegalAccessException, InstantiationException {
|
||||||
|
|
||||||
|
final Project p1 = new Project();
|
||||||
|
final Project p2 = new Project();
|
||||||
|
p2.setEcSc39(true);
|
||||||
|
|
||||||
|
final Project p3 = ObjectMerger.mergeObjects(p1, p2);
|
||||||
|
final Project p4 = ObjectMerger.mergeObjects(p2, p1);
|
||||||
|
|
||||||
|
assertTrue(p3.getEcSc39());
|
||||||
|
assertTrue(p4.getEcSc39());
|
||||||
|
|
||||||
|
}
|
||||||
|
|
||||||
|
}
|
|
@ -0,0 +1,14 @@
|
||||||
|
spring.main.banner-mode = off
|
||||||
|
logging.level.root = WARN
|
||||||
|
|
||||||
|
spring.datasource.url=jdbc:postgresql://localhost:5432/data4impact
|
||||||
|
spring.datasource.username=
|
||||||
|
spring.datasource.password=
|
||||||
|
|
||||||
|
spring.jpa.properties.hibernate.dialect = org.hibernate.dialect.PostgreSQLDialect
|
||||||
|
|
||||||
|
# Hibernate ddl auto (create, create-drop, validate, update)
|
||||||
|
spring.jpa.hibernate.ddl-auto = validate
|
||||||
|
spring.jpa.properties.hibernate.hbm2ddl.extra_physical_table_types = MATERIALIZED VIEW
|
||||||
|
spring.jpa.properties.hibernate.jdbc.lob.non_contextual_creation=true
|
||||||
|
spring.jpa.open-in-view=true
|
Binary file not shown.
Binary file not shown.
Binary file not shown.
Some files were not shown because too many files have changed in this diff Show More
Loading…
Reference in New Issue