forked from D-Net/dnet-hadoop
implementation of the spark action for the simrel creation
This commit is contained in:
parent
af835f2f98
commit
f32eae5ce9
|
@ -82,8 +82,10 @@
|
||||||
<groupId>com.fasterxml.jackson.core</groupId>
|
<groupId>com.fasterxml.jackson.core</groupId>
|
||||||
<artifactId>jackson-core</artifactId>
|
<artifactId>jackson-core</artifactId>
|
||||||
</dependency>
|
</dependency>
|
||||||
|
<dependency>
|
||||||
|
<groupId>eu.dnetlib</groupId>
|
||||||
|
<artifactId>dnet-actionmanager-common</artifactId>
|
||||||
|
</dependency>
|
||||||
|
|
||||||
</dependencies>
|
</dependencies>
|
||||||
|
|
||||||
|
|
|
@ -0,0 +1,142 @@
|
||||||
|
package eu.dnetlib.dedup;
|
||||||
|
|
||||||
|
import com.fasterxml.jackson.core.JsonProcessingException;
|
||||||
|
import com.fasterxml.jackson.databind.ObjectMapper;
|
||||||
|
import eu.dnetlib.dhp.application.ArgumentApplicationParser;
|
||||||
|
import eu.dnetlib.dhp.schema.oaf.Relation;
|
||||||
|
import eu.dnetlib.pace.config.DedupConfig;
|
||||||
|
import eu.dnetlib.pace.model.MapDocument;
|
||||||
|
import eu.dnetlib.pace.util.MapDocumentUtil;
|
||||||
|
import org.apache.commons.io.IOUtils;
|
||||||
|
import org.apache.commons.logging.Log;
|
||||||
|
import org.apache.commons.logging.LogFactory;
|
||||||
|
import org.apache.hadoop.io.Text;
|
||||||
|
import org.apache.hadoop.io.compress.GzipCodec;
|
||||||
|
import org.apache.hadoop.mapred.SequenceFileOutputFormat;
|
||||||
|
import org.apache.spark.SparkConf;
|
||||||
|
import org.apache.spark.api.java.JavaPairRDD;
|
||||||
|
import org.apache.spark.api.java.JavaRDD;
|
||||||
|
import org.apache.spark.api.java.JavaSparkContext;
|
||||||
|
import org.apache.spark.sql.Encoders;
|
||||||
|
import org.apache.spark.sql.SparkSession;
|
||||||
|
import scala.Tuple2;
|
||||||
|
import eu.dnetlib.actionmanager.actions.AtomicAction;
|
||||||
|
import eu.dnetlib.actionmanager.common.Agent;
|
||||||
|
|
||||||
|
import java.io.Serializable;
|
||||||
|
import java.util.Arrays;
|
||||||
|
import java.util.List;
|
||||||
|
import java.util.stream.Collectors;
|
||||||
|
|
||||||
|
public class SparkCreateSimRels2 implements Serializable {
|
||||||
|
|
||||||
|
final static String CONF_SEPARATOR = "@@@";
|
||||||
|
|
||||||
|
private static final Log log = LogFactory.getLog(SparkCreateSimRels2.class);
|
||||||
|
|
||||||
|
public static List<DedupConfig> decompressConfs(String compressedConfs){
|
||||||
|
|
||||||
|
return Arrays.stream(compressedConfs.split(CONF_SEPARATOR))
|
||||||
|
.map(ArgumentApplicationParser::decompressValue)
|
||||||
|
.map(DedupConfig::load)
|
||||||
|
.collect(Collectors.toList());
|
||||||
|
}
|
||||||
|
|
||||||
|
public static void main(String[] args) throws Exception {
|
||||||
|
final ArgumentApplicationParser parser = new ArgumentApplicationParser(IOUtils.toString(SparkCreateSimRels.class.getResourceAsStream("/eu/dnetlib/dhp/dedup/dedup_parameters.json")));
|
||||||
|
|
||||||
|
parser.parseArgument(args);
|
||||||
|
|
||||||
|
new SparkCreateSimRels2().run(parser, decompressConfs(parser.get("dedupConf")));
|
||||||
|
}
|
||||||
|
|
||||||
|
private void run(ArgumentApplicationParser parser, List<DedupConfig> dedupConfs) {
|
||||||
|
|
||||||
|
//read oozie parameters
|
||||||
|
final String sourcePath = parser.get("sourcePath");
|
||||||
|
final String targetPath = parser.get("targetPath");
|
||||||
|
final String rawSetName = parser.get("rawSet");
|
||||||
|
final String agentId = parser.get("agentId");
|
||||||
|
final String agentName = parser.get("agentName");
|
||||||
|
|
||||||
|
try (SparkSession spark = getSparkSession(parser)) {
|
||||||
|
final JavaSparkContext sc = new JavaSparkContext(spark.sparkContext());
|
||||||
|
|
||||||
|
//create empty sequenceFile for the accumulation
|
||||||
|
JavaRDD<Tuple2<Text,Text>> simRel = sc.emptyRDD();
|
||||||
|
|
||||||
|
//for each dedup configuration
|
||||||
|
for (DedupConfig dedupConf: dedupConfs) {
|
||||||
|
final String entity = dedupConf.getWf().getEntityType();
|
||||||
|
|
||||||
|
JavaPairRDD<String, MapDocument> mapDocument = sc.textFile(sourcePath + "/" + entity)
|
||||||
|
.mapToPair(s -> {
|
||||||
|
MapDocument d = MapDocumentUtil.asMapDocumentWithJPath(dedupConf, s);
|
||||||
|
return new Tuple2<>(d.getIdentifier(), d);
|
||||||
|
});
|
||||||
|
|
||||||
|
//create blocks for deduplication
|
||||||
|
JavaPairRDD<String, List<MapDocument>> blocks = Deduper.createsortedBlocks(sc, mapDocument, dedupConf);
|
||||||
|
|
||||||
|
//create relations by comparing only elements in the same group
|
||||||
|
final JavaPairRDD<String, String> dedupRels = Deduper.computeRelations2(sc, blocks, dedupConf);
|
||||||
|
|
||||||
|
JavaRDD<Relation> relationsRDD = dedupRels.map(r -> createSimRel(r._1(), r._2()));
|
||||||
|
|
||||||
|
//create atomic actions
|
||||||
|
JavaRDD<Tuple2<Text, Text>> newSimRels = relationsRDD
|
||||||
|
.mapToPair(rel ->
|
||||||
|
new Tuple2<>(
|
||||||
|
createActionId(rel.getSource(), rel.getTarget(), entity), //TODO update the type, maybe take it from the configuration?
|
||||||
|
new AtomicAction(rawSetName, new Agent(agentId, agentName, Agent.AGENT_TYPE.service), rel.getSource(), "isSimilarTo", rel.getTarget(), new ObjectMapper().writeValueAsString(rel).getBytes())))
|
||||||
|
.map(aa -> new Tuple2<>(aa._1(), transformAction(aa._2())));
|
||||||
|
|
||||||
|
simRel = simRel.union(newSimRels);
|
||||||
|
|
||||||
|
}
|
||||||
|
|
||||||
|
String targetDirectory = targetPath + "/" + rawSetName;
|
||||||
|
|
||||||
|
// simRel.map(s -> s._1().toString()).saveAsTextFile(targetDirectory);
|
||||||
|
|
||||||
|
simRel.mapToPair(r -> r)
|
||||||
|
.saveAsHadoopFile(targetDirectory, Text.class, Text.class, SequenceFileOutputFormat.class, GzipCodec.class);
|
||||||
|
|
||||||
|
}
|
||||||
|
|
||||||
|
}
|
||||||
|
|
||||||
|
public Text createActionId(String source, String target, String type) {
|
||||||
|
String id = source + "@" + type + "@" + target;
|
||||||
|
|
||||||
|
return new Text(id);
|
||||||
|
}
|
||||||
|
|
||||||
|
public Text transformAction(AtomicAction aa) throws JsonProcessingException {
|
||||||
|
|
||||||
|
ObjectMapper mapper = new ObjectMapper();
|
||||||
|
|
||||||
|
return new Text(mapper.writeValueAsString(aa));
|
||||||
|
}
|
||||||
|
|
||||||
|
public Relation createSimRel(String source, String target){
|
||||||
|
final Relation r = new Relation();
|
||||||
|
r.setSource(source);
|
||||||
|
r.setTarget(target);
|
||||||
|
r.setRelClass("isSimilarTo");
|
||||||
|
return r;
|
||||||
|
}
|
||||||
|
|
||||||
|
private static SparkSession getSparkSession(ArgumentApplicationParser parser) {
|
||||||
|
SparkConf conf = new SparkConf();
|
||||||
|
|
||||||
|
return SparkSession
|
||||||
|
.builder()
|
||||||
|
.appName(SparkCreateSimRels2.class.getSimpleName())
|
||||||
|
.master(parser.get("master"))
|
||||||
|
.config(conf)
|
||||||
|
// .enableHiveSupport()
|
||||||
|
.getOrCreate();
|
||||||
|
}
|
||||||
|
|
||||||
|
}
|
|
@ -8,26 +8,43 @@
|
||||||
{
|
{
|
||||||
"paramName": "s",
|
"paramName": "s",
|
||||||
"paramLongName": "sourcePath",
|
"paramLongName": "sourcePath",
|
||||||
"paramDescription": "the path of the sequential file to read",
|
"paramDescription": "the base path of the raw graph",
|
||||||
"paramRequired": true
|
"paramRequired": true
|
||||||
},
|
},
|
||||||
{
|
{
|
||||||
"paramName": "e",
|
"paramName": "e",
|
||||||
"paramLongName": "entity",
|
"paramLongName": "entity",
|
||||||
"paramDescription": "the type of entity to be deduped",
|
"paramDescription": "the type of entity to be deduped (directory in the sourcePath)",
|
||||||
"paramRequired": true
|
"paramRequired": true
|
||||||
},
|
},
|
||||||
{
|
{
|
||||||
"paramName": "c",
|
"paramName": "c",
|
||||||
"paramLongName": "dedupConf",
|
"paramLongName": "dedupConf",
|
||||||
"paramDescription": "dedup configuration to be used",
|
"paramDescription": "list of dedup configuration to be used",
|
||||||
"compressed": true,
|
|
||||||
"paramRequired": true
|
"paramRequired": true
|
||||||
},
|
},
|
||||||
{
|
{
|
||||||
"paramName": "t",
|
"paramName": "t",
|
||||||
"paramLongName": "targetPath",
|
"paramLongName": "targetPath",
|
||||||
"paramDescription": "target path to save dedup result",
|
"paramDescription": "target base path to save dedup result (actions)",
|
||||||
|
"paramRequired": true
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"paramName": "rs",
|
||||||
|
"paramLongName": "rawSet",
|
||||||
|
"paramDescription": "the raw set to be saved (directory in the targetPath)",
|
||||||
|
"paramRequired": true
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"paramName": "ai",
|
||||||
|
"paramLongName": "agentId",
|
||||||
|
"paramDescription": "the agent identifier",
|
||||||
|
"paramRequired": true
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"paramName": "an",
|
||||||
|
"paramLongName": "agentName",
|
||||||
|
"paramDescription": "the agent name",
|
||||||
"paramRequired": true
|
"paramRequired": true
|
||||||
}
|
}
|
||||||
]
|
]
|
|
@ -0,0 +1,88 @@
|
||||||
|
<workflow-app name="Create Similarity Relations" xmlns="uri:oozie:workflow:0.5">
|
||||||
|
<parameters>
|
||||||
|
<property>
|
||||||
|
<name>sourcePath</name>
|
||||||
|
<description>the raw graph base path</description>
|
||||||
|
</property>
|
||||||
|
<property>
|
||||||
|
<name>entity</name>
|
||||||
|
<description>the entity that should be processed</description>
|
||||||
|
</property>
|
||||||
|
<property>
|
||||||
|
<name>dedupConf</name>
|
||||||
|
<description>the (list of) dedup Configuration(s)</description>
|
||||||
|
</property>
|
||||||
|
<property>
|
||||||
|
<name>targetPath</name>
|
||||||
|
<description>the output base path</description>
|
||||||
|
</property>
|
||||||
|
<property>
|
||||||
|
<name>rawSet</name>
|
||||||
|
<description>the output directory in the targetPath</description>
|
||||||
|
</property>
|
||||||
|
<property>
|
||||||
|
<name>agentId</name>
|
||||||
|
<description>the agent identifier</description>
|
||||||
|
</property>
|
||||||
|
<property>
|
||||||
|
<name>agentName</name>
|
||||||
|
<description>the agent name</description>
|
||||||
|
</property>
|
||||||
|
<property>
|
||||||
|
<name>sparkDriverMemory</name>
|
||||||
|
<description>memory for driver process</description>
|
||||||
|
</property>
|
||||||
|
<property>
|
||||||
|
<name>sparkExecutorMemory</name>
|
||||||
|
<description>memory for individual executor</description>
|
||||||
|
</property>
|
||||||
|
<property>
|
||||||
|
<name>sparkExecutorCores</name>
|
||||||
|
<description>number of cores used by single executor</description>
|
||||||
|
</property>
|
||||||
|
</parameters>
|
||||||
|
|
||||||
|
<start to="DeleteTargetPath"/>
|
||||||
|
|
||||||
|
<kill name="Kill">
|
||||||
|
<message>Action failed, error message[${wf:errorMessage(wf:lastErrorNode())}]</message>
|
||||||
|
</kill>
|
||||||
|
|
||||||
|
<action name="DeleteTargetPath">
|
||||||
|
<fs>
|
||||||
|
<delete path='${targetPath}/${rawSet}'/>
|
||||||
|
</fs>
|
||||||
|
<ok to="DuplicateScan"/>
|
||||||
|
<error to="Kill"/>
|
||||||
|
</action>
|
||||||
|
|
||||||
|
<action name="DuplicateScan">
|
||||||
|
<spark xmlns="uri:oozie:spark-action:0.2">
|
||||||
|
<job-tracker>${jobTracker}</job-tracker>
|
||||||
|
<name-node>${nameNode}</name-node>
|
||||||
|
<master>yarn-cluster</master>
|
||||||
|
<mode>cluster</mode>
|
||||||
|
<name>Create Similarity Relations</name>
|
||||||
|
<class>eu.dnetlib.dedup.SparkCreateSimRels2</class>
|
||||||
|
<jar>dhp-dedup-${projectVersion}.jar</jar>
|
||||||
|
<spark-opts>--executor-memory ${sparkExecutorMemory} --executor-cores ${sparkExecutorCores}
|
||||||
|
--driver-memory=${sparkDriverMemory} --conf
|
||||||
|
spark.extraListeners="com.cloudera.spark.lineage.NavigatorAppListener" --conf
|
||||||
|
spark.sql.queryExecutionListeners="com.cloudera.spark.lineage.NavigatorQueryListener" --conf
|
||||||
|
spark.sql.warehouse.dir="/user/hive/warehouse"
|
||||||
|
</spark-opts>
|
||||||
|
<arg>-mt</arg><arg>yarn-cluster</arg>
|
||||||
|
<arg>--sourcePath</arg><arg>${sourcePath}</arg>
|
||||||
|
<arg>--targetPath</arg><arg>${targetPath}</arg>
|
||||||
|
<arg>--entity</arg><arg>${entity}</arg>
|
||||||
|
<arg>--dedupConf</arg><arg>${dedupConf}</arg>
|
||||||
|
<arg>--rawSet</arg><arg>${rawSet}</arg>
|
||||||
|
<arg>--agentId</arg><arg>${agentId}</arg>
|
||||||
|
<arg>--agentName</arg><arg>${agentName}</arg>
|
||||||
|
</spark>
|
||||||
|
<ok to="End"/>
|
||||||
|
<error to="Kill"/>
|
||||||
|
</action>
|
||||||
|
|
||||||
|
<end name="End"/>
|
||||||
|
</workflow-app>
|
|
@ -13,17 +13,20 @@ import org.junit.Test;
|
||||||
|
|
||||||
import java.io.File;
|
import java.io.File;
|
||||||
import java.io.IOException;
|
import java.io.IOException;
|
||||||
|
import java.util.HashSet;
|
||||||
import java.util.List;
|
import java.util.List;
|
||||||
|
import java.util.Set;
|
||||||
|
|
||||||
public class SparkCreateDedupTest {
|
public class SparkCreateDedupTest {
|
||||||
|
|
||||||
String configuration;
|
String configuration;
|
||||||
String entity = "organization";
|
String configuration2;
|
||||||
|
String entity = "publication";
|
||||||
|
|
||||||
@Before
|
@Before
|
||||||
public void setUp() throws IOException {
|
public void setUp() throws IOException {
|
||||||
configuration = IOUtils.toString(getClass().getResourceAsStream("/eu/dnetlib/dedup/conf/org.curr.conf.json"));
|
configuration = IOUtils.toString(getClass().getResourceAsStream("/eu/dnetlib/dedup/conf/org1.curr.conf.json"));
|
||||||
|
configuration2 = IOUtils.toString(getClass().getResourceAsStream("/eu/dnetlib/dedup/conf/org2.curr.conf.json"));
|
||||||
}
|
}
|
||||||
|
|
||||||
@Test
|
@Test
|
||||||
|
@ -38,6 +41,21 @@ public class SparkCreateDedupTest {
|
||||||
});
|
});
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@Test
|
||||||
|
@Ignore
|
||||||
|
public void createSimRelsTest2() throws Exception {
|
||||||
|
SparkCreateSimRels2.main(new String[] {
|
||||||
|
"-mt", "local[*]",
|
||||||
|
"-s", "/Users/miconis/dumps",
|
||||||
|
"-e", entity,
|
||||||
|
"-c", ArgumentApplicationParser.compressArgument(configuration) + "@@@" + ArgumentApplicationParser.compressArgument(configuration2),
|
||||||
|
"-t", "/tmp/dedup",
|
||||||
|
"-rs", "rawset_test",
|
||||||
|
"-ai", "agentId",
|
||||||
|
"-an", "agentName"
|
||||||
|
});
|
||||||
|
}
|
||||||
|
|
||||||
@Test
|
@Test
|
||||||
@Ignore
|
@Ignore
|
||||||
public void createCCTest() throws Exception {
|
public void createCCTest() throws Exception {
|
||||||
|
@ -79,8 +97,6 @@ public class SparkCreateDedupTest {
|
||||||
System.out.println(hashFunction.hashUnencodedChars(s1).asLong());
|
System.out.println(hashFunction.hashUnencodedChars(s1).asLong());
|
||||||
System.out.println( s2.hashCode());
|
System.out.println( s2.hashCode());
|
||||||
System.out.println(hashFunction.hashUnencodedChars(s2).asLong());
|
System.out.println(hashFunction.hashUnencodedChars(s2).asLong());
|
||||||
|
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
||||||
}
|
}
|
||||||
|
|
|
@ -87,8 +87,8 @@
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
],
|
],
|
||||||
"threshold": 0.7,
|
"threshold": 0.1,
|
||||||
"aggregation": "W_MEAN",
|
"aggregation": "AVG",
|
||||||
"positive": "layer4",
|
"positive": "layer4",
|
||||||
"negative": "NO_MATCH",
|
"negative": "NO_MATCH",
|
||||||
"undefined": "NO_MATCH",
|
"undefined": "NO_MATCH",
|
||||||
|
@ -106,7 +106,7 @@
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
],
|
],
|
||||||
"threshold": 0.9,
|
"threshold": 0.7,
|
||||||
"aggregation": "AVG",
|
"aggregation": "AVG",
|
||||||
"positive": "layer5",
|
"positive": "layer5",
|
||||||
"negative": "NO_MATCH",
|
"negative": "NO_MATCH",
|
||||||
|
@ -129,7 +129,9 @@
|
||||||
"comparator": "jaroWinklerNormalizedName",
|
"comparator": "jaroWinklerNormalizedName",
|
||||||
"weight": 0.1,
|
"weight": 0.1,
|
||||||
"countIfUndefined": "false",
|
"countIfUndefined": "false",
|
||||||
"params": {}
|
"params": {
|
||||||
|
"windowSize": 4
|
||||||
|
}
|
||||||
}
|
}
|
||||||
],
|
],
|
||||||
"threshold": 0.9,
|
"threshold": 0.9,
|
||||||
|
@ -145,14 +147,14 @@
|
||||||
{ "name" : "legalshortname", "type" : "String", "path" : "$.legalshortname.value"},
|
{ "name" : "legalshortname", "type" : "String", "path" : "$.legalshortname.value"},
|
||||||
{ "name" : "legalname", "type" : "String", "path" : "$.legalname.value" },
|
{ "name" : "legalname", "type" : "String", "path" : "$.legalname.value" },
|
||||||
{ "name" : "websiteurl", "type" : "URL", "path" : "$.websiteurl.value" },
|
{ "name" : "websiteurl", "type" : "URL", "path" : "$.websiteurl.value" },
|
||||||
{ "name" : "gridid", "type" : "String", "path" : "$.pid[?(@.qualifier.classid =='grid.ac')].value"},
|
{ "name" : "gridid", "type" : "String", "path" : "$.pid[?(@.qualifier.classid =='grid')].value"},
|
||||||
{ "name" : "originalId", "type" : "String", "path" : "$.id" }
|
{ "name" : "originalId", "type" : "String", "path" : "$.id" }
|
||||||
],
|
],
|
||||||
"blacklists" : {
|
"blacklists" : {
|
||||||
"legalname" : []
|
"legalname" : []
|
||||||
},
|
},
|
||||||
"synonyms": {
|
"synonyms": {
|
||||||
"key::1": ["university","università","università studi","universitario","universitaria","université", "universite", "universitaire","universitaires","universidad","universitade","Universität","universitaet","Uniwersytet","университет","universiteit","πανεπιστήμιο","universitesi","universiteti", "universiti"],
|
"key::1": ["university","università", "universitas", "università studi","universitario","universitaria","université", "universite", "universitaire","universitaires","universidad","universitade","Universität","universitaet","Uniwersytet","университет","universiteit","πανεπιστήμιο","universitesi","universiteti", "universiti"],
|
||||||
"key::2": ["studies","studi","études","estudios","estudos","Studien","studia","исследования","studies","σπουδές"],
|
"key::2": ["studies","studi","études","estudios","estudos","Studien","studia","исследования","studies","σπουδές"],
|
||||||
"key::3": ["advanced","superiore","supérieur","supérieure","supérieurs","supérieures","avancado","avancados","fortgeschrittene","fortgeschritten","zaawansowany","передовой","gevorderd","gevorderde","προχωρημένος","προχωρημένη","προχωρημένο","προχωρημένες","προχωρημένα","wyzsza"],
|
"key::3": ["advanced","superiore","supérieur","supérieure","supérieurs","supérieures","avancado","avancados","fortgeschrittene","fortgeschritten","zaawansowany","передовой","gevorderd","gevorderde","προχωρημένος","προχωρημένη","προχωρημένο","προχωρημένες","προχωρημένα","wyzsza"],
|
||||||
"key::4": ["institute","istituto","institut","instituto","instituto","Institut","instytut","институт","instituut","ινστιτούτο"],
|
"key::4": ["institute","istituto","institut","instituto","instituto","Institut","instytut","институт","instituut","ινστιτούτο"],
|
||||||
|
|
|
@ -1,42 +1,134 @@
|
||||||
{
|
{
|
||||||
"wf" : {
|
"wf": {
|
||||||
"threshold" : "0.99",
|
"threshold": "0.99",
|
||||||
"dedupRun" : "001",
|
"dedupRun": "001",
|
||||||
"entityType" : "result",
|
"entityType": "result",
|
||||||
"subEntityType" : "resulttype",
|
"subEntityType": "resulttype",
|
||||||
"subEntityValue" : "publication",
|
"subEntityValue": "publication",
|
||||||
"orderField" : "title",
|
"orderField": "title",
|
||||||
"queueMaxSize" : "2000",
|
"queueMaxSize": "2000",
|
||||||
"groupMaxSize" : "100",
|
"groupMaxSize": "100",
|
||||||
"maxChildren" : "100",
|
"maxChildren": "100",
|
||||||
"idPath": "$.id",
|
"slidingWindowSize": "200",
|
||||||
"slidingWindowSize" : "200",
|
"rootBuilder": [
|
||||||
"rootBuilder" : [ "result", "resultProject_outcome_isProducedBy", "resultResult_publicationDataset_isRelatedTo", "resultResult_similarity_isAmongTopNSimilarDocuments", "resultResult_similarity_hasAmongTopNSimilarDocuments", "resultOrganization_affiliation_isAffiliatedWith", "resultResult_part_hasPart", "resultResult_part_isPartOf", "resultResult_supplement_isSupplementTo", "resultResult_supplement_isSupplementedBy", "resultResult_version_isVersionOf" ],
|
"result",
|
||||||
"includeChildren" : "true"
|
"resultProject_outcome_isProducedBy",
|
||||||
|
"resultResult_publicationDataset_isRelatedTo",
|
||||||
|
"resultResult_similarity_isAmongTopNSimilarDocuments",
|
||||||
|
"resultResult_similarity_hasAmongTopNSimilarDocuments",
|
||||||
|
"resultOrganization_affiliation_isAffiliatedWith",
|
||||||
|
"resultResult_part_hasPart",
|
||||||
|
"resultResult_part_isPartOf",
|
||||||
|
"resultResult_supplement_isSupplementTo",
|
||||||
|
"resultResult_supplement_isSupplementedBy",
|
||||||
|
"resultResult_version_isVersionOf"
|
||||||
|
],
|
||||||
|
"includeChildren": "true",
|
||||||
|
"maxIterations": 20,
|
||||||
|
"idPath": "$.id"
|
||||||
},
|
},
|
||||||
"pace" : {
|
"pace": {
|
||||||
"clustering" : [
|
"clustering" : [
|
||||||
{ "name" : "ngrampairs", "fields" : [ "title" ], "params" : { "max" : "1", "ngramLen" : "3"} },
|
{ "name" : "ngrampairs", "fields" : [ "title" ], "params" : { "max" : "1", "ngramLen" : "3"} },
|
||||||
{ "name" : "suffixprefix", "fields" : [ "title" ], "params" : { "max" : "1", "len" : "3" } },
|
{ "name" : "suffixprefix", "fields" : [ "title" ], "params" : { "max" : "1", "len" : "3" } },
|
||||||
{ "name" : "lowercase", "fields" : [ "doi" ], "params" : { } }
|
{ "name" : "lowercase", "fields" : [ "doi" ], "params" : { } }
|
||||||
],
|
],
|
||||||
"strictConditions" : [
|
"decisionTree": {
|
||||||
{ "name" : "pidMatch", "fields" : [ "pid" ] }
|
"start": {
|
||||||
|
"fields": [
|
||||||
|
{
|
||||||
|
"field": "pid",
|
||||||
|
"comparator": "jsonListMatch",
|
||||||
|
"weight": 1.0,
|
||||||
|
"countIfUndefined": "false",
|
||||||
|
"params": {
|
||||||
|
"jpath_value": "$.value",
|
||||||
|
"jpath_classid": "$.qualifier.classid"
|
||||||
|
}
|
||||||
|
}
|
||||||
|
],
|
||||||
|
"threshold": 0.5,
|
||||||
|
"aggregation": "AVG",
|
||||||
|
"positive": "MATCH",
|
||||||
|
"negative": "layer2",
|
||||||
|
"undefined": "layer2",
|
||||||
|
"ignoreUndefined": "true"
|
||||||
|
},
|
||||||
|
"layer2": {
|
||||||
|
"fields": [
|
||||||
|
{
|
||||||
|
"field": "title",
|
||||||
|
"comparator": "titleVersionMatch",
|
||||||
|
"weight": 1.0,
|
||||||
|
"countIfUndefined": "false",
|
||||||
|
"params": {}
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"field": "authors",
|
||||||
|
"comparator": "sizeMatch",
|
||||||
|
"weight": 1.0,
|
||||||
|
"countIfUndefined": "false",
|
||||||
|
"params": {}
|
||||||
|
}
|
||||||
|
],
|
||||||
|
"threshold": 1.0,
|
||||||
|
"aggregation": "AND",
|
||||||
|
"positive": "layer3",
|
||||||
|
"negative": "NO_MATCH",
|
||||||
|
"undefined": "layer3",
|
||||||
|
"ignoreUndefined": "false"
|
||||||
|
},
|
||||||
|
"layer3": {
|
||||||
|
"fields": [
|
||||||
|
{
|
||||||
|
"field": "title",
|
||||||
|
"comparator": "levensteinTitle",
|
||||||
|
"weight": 1.0,
|
||||||
|
"countIfUndefined": "true",
|
||||||
|
"params": {}
|
||||||
|
}
|
||||||
|
],
|
||||||
|
"threshold": 0.99,
|
||||||
|
"aggregation": "AVG",
|
||||||
|
"positive": "MATCH",
|
||||||
|
"negative": "NO_MATCH",
|
||||||
|
"undefined": "NO_MATCH",
|
||||||
|
"ignoreUndefined": "true"
|
||||||
|
}
|
||||||
|
},
|
||||||
|
"model": [
|
||||||
|
{
|
||||||
|
"name": "doi",
|
||||||
|
"type": "String",
|
||||||
|
"path": "$.pid[?(@.qualifier.classid == 'doi')].value"
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"name": "pid",
|
||||||
|
"type": "JSON",
|
||||||
|
"path": "$.pid",
|
||||||
|
"overrideMatch": "true"
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"name": "title",
|
||||||
|
"type": "String",
|
||||||
|
"path": "$.title[?(@.qualifier.classid == 'main title')].value",
|
||||||
|
"length": 250,
|
||||||
|
"size": 5
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"name": "authors",
|
||||||
|
"type": "List",
|
||||||
|
"path": "$.author[*].fullname",
|
||||||
|
"size": 200
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"name": "resulttype",
|
||||||
|
"type": "String",
|
||||||
|
"path": "$.resulttype.classid"
|
||||||
|
}
|
||||||
],
|
],
|
||||||
"conditions" : [
|
"blacklists": {
|
||||||
{ "name" : "titleVersionMatch", "fields" : [ "title" ] },
|
"title": [
|
||||||
{ "name" : "sizeMatch", "fields" : [ "authors" ] }
|
|
||||||
],
|
|
||||||
"model" : [
|
|
||||||
{ "name" : "doi", "algo" : "Null", "type" : "String", "weight" : "0.0", "ignoreMissing" : "true", "path" : "$.pid[?(@.qualifier.classid ==\"doi\")].value" },
|
|
||||||
{ "name" : "pid", "algo" : "Null", "type" : "JSON", "weight" : "0.0", "ignoreMissing" : "true", "path" : "$.pid", "overrideMatch" : "true" },
|
|
||||||
{ "name" : "title", "algo" : "LevensteinTitle", "type" : "String", "weight" : "1.0", "ignoreMissing" : "false", "path" : "$.title[?(@.qualifier.classid ==\"main title\")].value", "length" : 250, "size" : 5 },
|
|
||||||
{ "name" : "authors", "algo" : "Null", "type" : "List", "weight" : "0.0", "ignoreMissing" : "true", "path" : "$.author[*].fullname", "size" : 200 },
|
|
||||||
{ "name" : "resulttype", "algo" : "Null", "type" : "String", "weight" : "0.0", "ignoreMissing" : "false", "path" : "$.resulttype.classid" }
|
|
||||||
],
|
|
||||||
"synonyms": {},
|
|
||||||
"blacklists" : {
|
|
||||||
"title" : [
|
|
||||||
"^Inside Front Cover$",
|
"^Inside Front Cover$",
|
||||||
"(?i)^Poster presentations$",
|
"(?i)^Poster presentations$",
|
||||||
"^THE ASSOCIATION AND THE GENERAL MEDICAL COUNCIL$",
|
"^THE ASSOCIATION AND THE GENERAL MEDICAL COUNCIL$",
|
||||||
|
@ -48,7 +140,6 @@
|
||||||
"^Cartas? ao editor Letters? to the Editor$",
|
"^Cartas? ao editor Letters? to the Editor$",
|
||||||
"^Note from the Editor$",
|
"^Note from the Editor$",
|
||||||
"^Anesthesia Abstract$",
|
"^Anesthesia Abstract$",
|
||||||
|
|
||||||
"^Annual report$",
|
"^Annual report$",
|
||||||
"(?i)^“?THE RADICAL PREVENTION OF VENEREAL DISEASE\\.?”?$",
|
"(?i)^“?THE RADICAL PREVENTION OF VENEREAL DISEASE\\.?”?$",
|
||||||
"(?i)^Graph and Table of Infectious Diseases?$",
|
"(?i)^Graph and Table of Infectious Diseases?$",
|
||||||
|
@ -68,14 +159,12 @@
|
||||||
"^Cálculo de concentraciones en disoluciones acuosas. Ejercicio interactivo\\..*\\.$",
|
"^Cálculo de concentraciones en disoluciones acuosas. Ejercicio interactivo\\..*\\.$",
|
||||||
"(?i)^Genetic and functional analyses of SHANK2 mutations suggest a multiple hit model of Autism spectrum disorders?\\.?$",
|
"(?i)^Genetic and functional analyses of SHANK2 mutations suggest a multiple hit model of Autism spectrum disorders?\\.?$",
|
||||||
"^Gushi hakubutsugaku$",
|
"^Gushi hakubutsugaku$",
|
||||||
|
|
||||||
"^Starobosanski nadpisi u Bosni i Hercegovini \\(.*\\)$",
|
"^Starobosanski nadpisi u Bosni i Hercegovini \\(.*\\)$",
|
||||||
"^Intestinal spirocha?etosis$",
|
"^Intestinal spirocha?etosis$",
|
||||||
"^Treatment of Rodent Ulcer$",
|
"^Treatment of Rodent Ulcer$",
|
||||||
"(?i)^\\W*Cloud Computing\\W*$",
|
"(?i)^\\W*Cloud Computing\\W*$",
|
||||||
"^Compendio mathematico : en que se contienen todas las materias mas principales de las Ciencias que tratan de la cantidad$",
|
"^Compendio mathematico : en que se contienen todas las materias mas principales de las Ciencias que tratan de la cantidad$",
|
||||||
"^Free Communications, Poster Presentations: Session [A-F]$",
|
"^Free Communications, Poster Presentations: Session [A-F]$",
|
||||||
|
|
||||||
"^“The Historical Aspects? of Quackery\\.?”$",
|
"^“The Historical Aspects? of Quackery\\.?”$",
|
||||||
"^A designated centre for people with disabilities operated by St John of God Community Services (Limited|Ltd), Louth$",
|
"^A designated centre for people with disabilities operated by St John of God Community Services (Limited|Ltd), Louth$",
|
||||||
"^P(er|re)-Mile Premiums for Auto Insurance\\.?$",
|
"^P(er|re)-Mile Premiums for Auto Insurance\\.?$",
|
||||||
|
@ -96,10 +185,8 @@
|
||||||
"(?i)^Measurement of the pseudorapidity and centrality dependence of the transverse energy density in Pb(-?)Pb collisions at.*tev(\\.?)$",
|
"(?i)^Measurement of the pseudorapidity and centrality dependence of the transverse energy density in Pb(-?)Pb collisions at.*tev(\\.?)$",
|
||||||
"(?i)^Search for resonances decaying into top-quark pairs using fully hadronic decays in pp collisions with ATLAS at.*TeV$",
|
"(?i)^Search for resonances decaying into top-quark pairs using fully hadronic decays in pp collisions with ATLAS at.*TeV$",
|
||||||
"(?i)^Search for neutral minimal supersymmetric standard model Higgs bosons decaying to tau pairs in pp collisions at.*tev$",
|
"(?i)^Search for neutral minimal supersymmetric standard model Higgs bosons decaying to tau pairs in pp collisions at.*tev$",
|
||||||
|
|
||||||
"(?i)^Relatório de Estágio (de|em) Angiologia e Cirurgia Vascular$",
|
"(?i)^Relatório de Estágio (de|em) Angiologia e Cirurgia Vascular$",
|
||||||
"^Aus der AGMB$",
|
"^Aus der AGMB$",
|
||||||
|
|
||||||
"^Znanstveno-stručni prilozi$",
|
"^Znanstveno-stručni prilozi$",
|
||||||
"(?i)^Zhodnocení finanční situace podniku a návrhy na zlepšení$",
|
"(?i)^Zhodnocení finanční situace podniku a návrhy na zlepšení$",
|
||||||
"(?i)^Evaluation of the Financial Situation in the Firm and Proposals to its Improvement$",
|
"(?i)^Evaluation of the Financial Situation in the Firm and Proposals to its Improvement$",
|
||||||
|
@ -136,7 +223,6 @@
|
||||||
"(?i)^RUBRIKA UREDNIKA$",
|
"(?i)^RUBRIKA UREDNIKA$",
|
||||||
"^A Matching Model of the Academic Publication Market$",
|
"^A Matching Model of the Academic Publication Market$",
|
||||||
"^Yōgaku kōyō$",
|
"^Yōgaku kōyō$",
|
||||||
|
|
||||||
"^Internetový marketing$",
|
"^Internetový marketing$",
|
||||||
"^Internet marketing$",
|
"^Internet marketing$",
|
||||||
"^Chūtō kokugo dokuhon$",
|
"^Chūtō kokugo dokuhon$",
|
||||||
|
@ -169,21 +255,17 @@
|
||||||
"^Information System Assessment and Proposal for ICT Modification$",
|
"^Information System Assessment and Proposal for ICT Modification$",
|
||||||
"^Stresové zatížení pracovníků ve vybrané profesi$",
|
"^Stresové zatížení pracovníků ve vybrané profesi$",
|
||||||
"^Stress load in a specific job$",
|
"^Stress load in a specific job$",
|
||||||
|
|
||||||
"^Sunday: Poster Sessions, Pt.*$",
|
"^Sunday: Poster Sessions, Pt.*$",
|
||||||
"^Monday: Poster Sessions, Pt.*$",
|
"^Monday: Poster Sessions, Pt.*$",
|
||||||
"^Wednesday: Poster Sessions, Pt.*",
|
"^Wednesday: Poster Sessions, Pt.*",
|
||||||
"^Tuesday: Poster Sessions, Pt.*$",
|
"^Tuesday: Poster Sessions, Pt.*$",
|
||||||
|
|
||||||
"^Analýza reklamy$",
|
"^Analýza reklamy$",
|
||||||
"^Analysis of advertising$",
|
"^Analysis of advertising$",
|
||||||
|
|
||||||
"^Shōgaku shūshinsho$",
|
"^Shōgaku shūshinsho$",
|
||||||
"^Shōgaku sansū$",
|
"^Shōgaku sansū$",
|
||||||
"^Shintei joshi kokubun$",
|
"^Shintei joshi kokubun$",
|
||||||
"^Taishō joshi kokubun dokuhon$",
|
"^Taishō joshi kokubun dokuhon$",
|
||||||
"^Joshi kokubun$",
|
"^Joshi kokubun$",
|
||||||
|
|
||||||
"^Účetní uzávěrka a účetní závěrka v ČR$",
|
"^Účetní uzávěrka a účetní závěrka v ČR$",
|
||||||
"(?i)^The \"?Causes\"? of Cancer$",
|
"(?i)^The \"?Causes\"? of Cancer$",
|
||||||
"^Normas para la publicación de artículos$",
|
"^Normas para la publicación de artículos$",
|
||||||
|
@ -202,7 +284,6 @@
|
||||||
"^Abdominal [Aa]ortic [Aa]neurysms.*$",
|
"^Abdominal [Aa]ortic [Aa]neurysms.*$",
|
||||||
"^Pseudomyxoma peritonei$",
|
"^Pseudomyxoma peritonei$",
|
||||||
"^Kazalo autora$",
|
"^Kazalo autora$",
|
||||||
|
|
||||||
"(?i)^uvodna riječ$",
|
"(?i)^uvodna riječ$",
|
||||||
"^Motivace jako způsob vedení lidí$",
|
"^Motivace jako způsob vedení lidí$",
|
||||||
"^Motivation as a leadership$",
|
"^Motivation as a leadership$",
|
||||||
|
@ -275,6 +356,7 @@
|
||||||
"(?i)^.*authors['’′]? reply\\.?$",
|
"(?i)^.*authors['’′]? reply\\.?$",
|
||||||
"(?i)^.*authors['’′]? response\\.?$"
|
"(?i)^.*authors['’′]? response\\.?$"
|
||||||
]
|
]
|
||||||
}
|
},
|
||||||
|
"synonyms": {}
|
||||||
}
|
}
|
||||||
}
|
}
|
|
@ -1,386 +0,0 @@
|
||||||
{
|
|
||||||
"wf": {
|
|
||||||
"threshold": "0.99",
|
|
||||||
"dedupRun": "001",
|
|
||||||
"entityType": "result",
|
|
||||||
"subEntityType": "resulttype",
|
|
||||||
"subEntityValue": "publication",
|
|
||||||
"orderField": "title",
|
|
||||||
"queueMaxSize": "2000",
|
|
||||||
"groupMaxSize": "100",
|
|
||||||
"maxChildren": "100",
|
|
||||||
"slidingWindowSize": "200",
|
|
||||||
"rootBuilder": [
|
|
||||||
"result",
|
|
||||||
"resultProject_outcome_isProducedBy",
|
|
||||||
"resultResult_publicationDataset_isRelatedTo",
|
|
||||||
"resultResult_similarity_isAmongTopNSimilarDocuments",
|
|
||||||
"resultResult_similarity_hasAmongTopNSimilarDocuments",
|
|
||||||
"resultOrganization_affiliation_isAffiliatedWith",
|
|
||||||
"resultResult_part_hasPart",
|
|
||||||
"resultResult_part_isPartOf",
|
|
||||||
"resultResult_supplement_isSupplementTo",
|
|
||||||
"resultResult_supplement_isSupplementedBy",
|
|
||||||
"resultResult_version_isVersionOf"
|
|
||||||
],
|
|
||||||
"includeChildren": "true",
|
|
||||||
"maxIterations": 20,
|
|
||||||
"idPath": "$.id"
|
|
||||||
},
|
|
||||||
"pace": {
|
|
||||||
"clustering": [
|
|
||||||
{
|
|
||||||
"name": "ngrampairs",
|
|
||||||
"fields": [
|
|
||||||
"title"
|
|
||||||
],
|
|
||||||
"params": {
|
|
||||||
"max": "1",
|
|
||||||
"ngramLen": "3"
|
|
||||||
}
|
|
||||||
},
|
|
||||||
{
|
|
||||||
"name": "suffixprefix",
|
|
||||||
"fields": [
|
|
||||||
"title"
|
|
||||||
],
|
|
||||||
"params": {
|
|
||||||
"max": "1",
|
|
||||||
"len": "3"
|
|
||||||
}
|
|
||||||
},
|
|
||||||
{
|
|
||||||
"name": "lowercase",
|
|
||||||
"fields": [
|
|
||||||
"doi"
|
|
||||||
],
|
|
||||||
"params": {}
|
|
||||||
}
|
|
||||||
],
|
|
||||||
"decisionTree": {
|
|
||||||
"start": {
|
|
||||||
"fields": [
|
|
||||||
{
|
|
||||||
"field": "pid",
|
|
||||||
"comparator": "jsonListMatch",
|
|
||||||
"weight": 1.0,
|
|
||||||
"countIfUndefined": "false",
|
|
||||||
"params": {
|
|
||||||
"jpath_value": "$.value",
|
|
||||||
"jpath_classid": "$.qualifier.classid"
|
|
||||||
}
|
|
||||||
}
|
|
||||||
],
|
|
||||||
"threshold": 0.5,
|
|
||||||
"aggregation": "AVG",
|
|
||||||
"positive": "MATCH",
|
|
||||||
"negative": "layer2",
|
|
||||||
"undefined": "layer2",
|
|
||||||
"ignoreUndefined": "true"
|
|
||||||
},
|
|
||||||
"layer2": {
|
|
||||||
"fields": [
|
|
||||||
{
|
|
||||||
"field": "title",
|
|
||||||
"comparator": "titleVersionMatch",
|
|
||||||
"weight": 1.0,
|
|
||||||
"countIfUndefined": "false",
|
|
||||||
"params": {}
|
|
||||||
},
|
|
||||||
{
|
|
||||||
"field": "authors",
|
|
||||||
"comparator": "sizeMatch",
|
|
||||||
"weight": 1.0,
|
|
||||||
"countIfUndefined": "false",
|
|
||||||
"params": {}
|
|
||||||
}
|
|
||||||
],
|
|
||||||
"threshold": 1.0,
|
|
||||||
"aggregation": "AND",
|
|
||||||
"positive": "layer3",
|
|
||||||
"negative": "NO_MATCH",
|
|
||||||
"undefined": "layer3",
|
|
||||||
"ignoreUndefined": "false"
|
|
||||||
},
|
|
||||||
"layer3": {
|
|
||||||
"fields": [
|
|
||||||
{
|
|
||||||
"field": "title",
|
|
||||||
"comparator": "levensteinTitle",
|
|
||||||
"weight": 1.0,
|
|
||||||
"countIfUndefined": "true",
|
|
||||||
"params": {}
|
|
||||||
}
|
|
||||||
],
|
|
||||||
"threshold": 0.99,
|
|
||||||
"aggregation": "AVG",
|
|
||||||
"positive": "MATCH",
|
|
||||||
"negative": "NO_MATCH",
|
|
||||||
"undefined": "NO_MATCH",
|
|
||||||
"ignoreUndefined": "true"
|
|
||||||
}
|
|
||||||
},
|
|
||||||
"model": [
|
|
||||||
{
|
|
||||||
"name": "doi",
|
|
||||||
"type": "String",
|
|
||||||
"path": "$.pid[?(@.qualifier.classid == 'doi')].value"
|
|
||||||
},
|
|
||||||
{
|
|
||||||
"name": "pid",
|
|
||||||
"type": "JSON",
|
|
||||||
"path": "$.pid",
|
|
||||||
"overrideMatch": "true"
|
|
||||||
},
|
|
||||||
{
|
|
||||||
"name": "title",
|
|
||||||
"type": "String",
|
|
||||||
"path": "$.title[?(@.qualifier.classid == 'main title')].value",
|
|
||||||
"length": 250,
|
|
||||||
"size": 5
|
|
||||||
},
|
|
||||||
{
|
|
||||||
"name": "authors",
|
|
||||||
"type": "List",
|
|
||||||
"path": "$.author[*].fullname",
|
|
||||||
"size": 200
|
|
||||||
},
|
|
||||||
{
|
|
||||||
"name": "resulttype",
|
|
||||||
"type": "String",
|
|
||||||
"path": "$.resulttype.classid"
|
|
||||||
}
|
|
||||||
],
|
|
||||||
"blacklists": {
|
|
||||||
"title": [
|
|
||||||
"^Inside Front Cover$",
|
|
||||||
"(?i)^Poster presentations$",
|
|
||||||
"^THE ASSOCIATION AND THE GENERAL MEDICAL COUNCIL$",
|
|
||||||
"^Problems with perinatal pathology\\.?$",
|
|
||||||
"(?i)^Cases? of Puerperal Convulsions$",
|
|
||||||
"(?i)^Operative Gyna?ecology$",
|
|
||||||
"(?i)^Mind the gap\\!?\\:?$",
|
|
||||||
"^Chronic fatigue syndrome\\.?$",
|
|
||||||
"^Cartas? ao editor Letters? to the Editor$",
|
|
||||||
"^Note from the Editor$",
|
|
||||||
"^Anesthesia Abstract$",
|
|
||||||
"^Annual report$",
|
|
||||||
"(?i)^“?THE RADICAL PREVENTION OF VENEREAL DISEASE\\.?”?$",
|
|
||||||
"(?i)^Graph and Table of Infectious Diseases?$",
|
|
||||||
"^Presentation$",
|
|
||||||
"(?i)^Reviews and Information on Publications$",
|
|
||||||
"(?i)^PUBLIC HEALTH SERVICES?$",
|
|
||||||
"(?i)^COMBINED TEXT-?BOOK OF OBSTETRICS AND GYN(Æ|ae)COLOGY$",
|
|
||||||
"(?i)^Adrese autora$",
|
|
||||||
"(?i)^Systematic Part .*\\. Catalogus Fossilium Austriae, Band 2: Echinoidea neogenica$",
|
|
||||||
"(?i)^Acknowledgement to Referees$",
|
|
||||||
"(?i)^Behçet's disease\\.?$",
|
|
||||||
"(?i)^Isolation and identification of restriction endonuclease.*$",
|
|
||||||
"(?i)^CEREBROVASCULAR DISEASES?.?$",
|
|
||||||
"(?i)^Screening for abdominal aortic aneurysms?\\.?$",
|
|
||||||
"^Event management$",
|
|
||||||
"(?i)^Breakfast and Crohn's disease.*\\.?$",
|
|
||||||
"^Cálculo de concentraciones en disoluciones acuosas. Ejercicio interactivo\\..*\\.$",
|
|
||||||
"(?i)^Genetic and functional analyses of SHANK2 mutations suggest a multiple hit model of Autism spectrum disorders?\\.?$",
|
|
||||||
"^Gushi hakubutsugaku$",
|
|
||||||
"^Starobosanski nadpisi u Bosni i Hercegovini \\(.*\\)$",
|
|
||||||
"^Intestinal spirocha?etosis$",
|
|
||||||
"^Treatment of Rodent Ulcer$",
|
|
||||||
"(?i)^\\W*Cloud Computing\\W*$",
|
|
||||||
"^Compendio mathematico : en que se contienen todas las materias mas principales de las Ciencias que tratan de la cantidad$",
|
|
||||||
"^Free Communications, Poster Presentations: Session [A-F]$",
|
|
||||||
"^“The Historical Aspects? of Quackery\\.?”$",
|
|
||||||
"^A designated centre for people with disabilities operated by St John of God Community Services (Limited|Ltd), Louth$",
|
|
||||||
"^P(er|re)-Mile Premiums for Auto Insurance\\.?$",
|
|
||||||
"(?i)^Case Report$",
|
|
||||||
"^Boletín Informativo$",
|
|
||||||
"(?i)^Glioblastoma Multiforme$",
|
|
||||||
"(?i)^Nuevos táxones animales descritos en la península Ibérica y Macaronesia desde 1994 \\(.*\\)$",
|
|
||||||
"^Zaměstnanecké výhody$",
|
|
||||||
"(?i)^The Economics of Terrorism and Counter-Terrorism: A Survey \\(Part .*\\)$",
|
|
||||||
"(?i)^Carotid body tumours?\\.?$",
|
|
||||||
"(?i)^\\[Españoles en Francia : La condición Emigrante.*\\]$",
|
|
||||||
"^Avant-propos$",
|
|
||||||
"(?i)^St\\. Patrick's Cathedral, Dublin, County Dublin - Head(s)? and Capital(s)?$",
|
|
||||||
"(?i)^St\\. Patrick's Cathedral, Dublin, County Dublin - Bases?$",
|
|
||||||
"(?i)^PUBLIC HEALTH VERSUS THE STATE$",
|
|
||||||
"^Viñetas de Cortázar$",
|
|
||||||
"(?i)^Search for heavy neutrinos and W(\\[|_|\\(|_\\{|-)?R(\\]|\\)|\\})? bosons with right-handed couplings in a left-right symmetric model in pp collisions at.*TeV(\\.)?$",
|
|
||||||
"(?i)^Measurement of the pseudorapidity and centrality dependence of the transverse energy density in Pb(-?)Pb collisions at.*tev(\\.?)$",
|
|
||||||
"(?i)^Search for resonances decaying into top-quark pairs using fully hadronic decays in pp collisions with ATLAS at.*TeV$",
|
|
||||||
"(?i)^Search for neutral minimal supersymmetric standard model Higgs bosons decaying to tau pairs in pp collisions at.*tev$",
|
|
||||||
"(?i)^Relatório de Estágio (de|em) Angiologia e Cirurgia Vascular$",
|
|
||||||
"^Aus der AGMB$",
|
|
||||||
"^Znanstveno-stručni prilozi$",
|
|
||||||
"(?i)^Zhodnocení finanční situace podniku a návrhy na zlepšení$",
|
|
||||||
"(?i)^Evaluation of the Financial Situation in the Firm and Proposals to its Improvement$",
|
|
||||||
"(?i)^Hodnocení finanční situace podniku a návrhy na její zlepšení$",
|
|
||||||
"^Finanční analýza podniku$",
|
|
||||||
"^Financial analysis( of business)?$",
|
|
||||||
"(?i)^Textbook of Gyn(a)?(Æ)?(e)?cology$",
|
|
||||||
"^Jikken nihon shūshinsho$",
|
|
||||||
"(?i)^CORONER('|s)(s|') INQUESTS$",
|
|
||||||
"(?i)^(Μελέτη παραγόντων )?risk management( για ανάπτυξη και εφαρμογή ενός πληροφοριακού συστήματος| και ανάπτυξη συστήματος)?$",
|
|
||||||
"(?i)^Consultants' contract(s)?$",
|
|
||||||
"(?i)^Upute autorima$",
|
|
||||||
"(?i)^Bijdrage tot de Kennis van den Godsdienst der Dajaks van Lan(d|f)ak en Tajan$",
|
|
||||||
"^Joshi shin kokubun$",
|
|
||||||
"^Kōtō shōgaku dokuhon nōson'yō$",
|
|
||||||
"^Jinjō shōgaku shōka$",
|
|
||||||
"^Shōgaku shūjichō$",
|
|
||||||
"^Nihon joshi dokuhon$",
|
|
||||||
"^Joshi shin dokuhon$",
|
|
||||||
"^Chūtō kanbun dokuhon$",
|
|
||||||
"^Wabun dokuhon$",
|
|
||||||
"(?i)^(Analysis of economy selected village or town|Rozbor hospodaření vybrané obce či města)$",
|
|
||||||
"(?i)^cardiac rehabilitation$",
|
|
||||||
"(?i)^Analytical summary$",
|
|
||||||
"^Thesaurus resolutionum Sacrae Congregationis Concilii$",
|
|
||||||
"(?i)^Sumario analítico(\\s{1})?(Analitic summary)?$",
|
|
||||||
"^Prikazi i osvrti$",
|
|
||||||
"^Rodinný dům s provozovnou$",
|
|
||||||
"^Family house with an establishment$",
|
|
||||||
"^Shinsei chūtō shin kokugun$",
|
|
||||||
"^Pulmonary alveolar proteinosis(\\.?)$",
|
|
||||||
"^Shinshū kanbun$",
|
|
||||||
"^Viñeta(s?) de Rodríguez$",
|
|
||||||
"(?i)^RUBRIKA UREDNIKA$",
|
|
||||||
"^A Matching Model of the Academic Publication Market$",
|
|
||||||
"^Yōgaku kōyō$",
|
|
||||||
"^Internetový marketing$",
|
|
||||||
"^Internet marketing$",
|
|
||||||
"^Chūtō kokugo dokuhon$",
|
|
||||||
"^Kokugo dokuhon$",
|
|
||||||
"^Antibiotic Cover for Dental Extraction(s?)$",
|
|
||||||
"^Strategie podniku$",
|
|
||||||
"^Strategy of an Enterprise$",
|
|
||||||
"(?i)^respiratory disease(s?)(\\.?)$",
|
|
||||||
"^Award(s?) for Gallantry in Civil Defence$",
|
|
||||||
"^Podniková kultura$",
|
|
||||||
"^Corporate Culture$",
|
|
||||||
"^Severe hyponatraemia in hospital inpatient(s?)(\\.?)$",
|
|
||||||
"^Pracovní motivace$",
|
|
||||||
"^Work Motivation$",
|
|
||||||
"^Kaitei kōtō jogaku dokuhon$",
|
|
||||||
"^Konsolidovaná účetní závěrka$",
|
|
||||||
"^Consolidated Financial Statements$",
|
|
||||||
"(?i)^intracranial tumour(s?)$",
|
|
||||||
"^Climate Change Mitigation Options and Directed Technical Change: A Decentralized Equilibrium Analysis$",
|
|
||||||
"^\\[CERVECERIAS MAHOU(\\.|\\:) INTERIOR\\] \\[Material gráfico\\]$",
|
|
||||||
"^Housing Market Dynamics(\\:|\\.) On the Contribution of Income Shocks and Credit Constraint(s?)$",
|
|
||||||
"^\\[Funciones auxiliares de la música en Radio París,.*\\]$",
|
|
||||||
"^Úroveň motivačního procesu jako způsobu vedení lidí$",
|
|
||||||
"^The level of motivation process as a leadership$",
|
|
||||||
"^Pay-beds in N(\\.?)H(\\.?)S(\\.?) Hospitals$",
|
|
||||||
"(?i)^news and events$",
|
|
||||||
"(?i)^NOVOSTI I DOGAĐAJI$",
|
|
||||||
"^Sansū no gakushū$",
|
|
||||||
"^Posouzení informačního systému firmy a návrh změn$",
|
|
||||||
"^Information System Assessment and Proposal for ICT Modification$",
|
|
||||||
"^Stresové zatížení pracovníků ve vybrané profesi$",
|
|
||||||
"^Stress load in a specific job$",
|
|
||||||
"^Sunday: Poster Sessions, Pt.*$",
|
|
||||||
"^Monday: Poster Sessions, Pt.*$",
|
|
||||||
"^Wednesday: Poster Sessions, Pt.*",
|
|
||||||
"^Tuesday: Poster Sessions, Pt.*$",
|
|
||||||
"^Analýza reklamy$",
|
|
||||||
"^Analysis of advertising$",
|
|
||||||
"^Shōgaku shūshinsho$",
|
|
||||||
"^Shōgaku sansū$",
|
|
||||||
"^Shintei joshi kokubun$",
|
|
||||||
"^Taishō joshi kokubun dokuhon$",
|
|
||||||
"^Joshi kokubun$",
|
|
||||||
"^Účetní uzávěrka a účetní závěrka v ČR$",
|
|
||||||
"(?i)^The \"?Causes\"? of Cancer$",
|
|
||||||
"^Normas para la publicación de artículos$",
|
|
||||||
"^Editor('|s)(s|') [Rr]eply$",
|
|
||||||
"^Editor(’|s)(s|’) letter$",
|
|
||||||
"^Redaktoriaus žodis$",
|
|
||||||
"^DISCUSSION ON THE PRECEDING PAPER$",
|
|
||||||
"^Kōtō shōgaku shūshinsho jidōyō$",
|
|
||||||
"^Shōgaku nihon rekishi$",
|
|
||||||
"^(Theory of the flow of action currents in isolated myelinated nerve fibers).*$",
|
|
||||||
"^Préface$",
|
|
||||||
"^Occupational [Hh]ealth [Ss]ervices.$",
|
|
||||||
"^In Memoriam Professor Toshiyuki TAKESHIMA$",
|
|
||||||
"^Účetní závěrka ve vybraném podniku.*$",
|
|
||||||
"^Financial statements in selected company$",
|
|
||||||
"^Abdominal [Aa]ortic [Aa]neurysms.*$",
|
|
||||||
"^Pseudomyxoma peritonei$",
|
|
||||||
"^Kazalo autora$",
|
|
||||||
"(?i)^uvodna riječ$",
|
|
||||||
"^Motivace jako způsob vedení lidí$",
|
|
||||||
"^Motivation as a leadership$",
|
|
||||||
"^Polyfunkční dům$",
|
|
||||||
"^Multi\\-funkcional building$",
|
|
||||||
"^Podnikatelský plán$",
|
|
||||||
"(?i)^Podnikatelský záměr$",
|
|
||||||
"(?i)^Business Plan$",
|
|
||||||
"^Oceňování nemovitostí$",
|
|
||||||
"^Marketingová komunikace$",
|
|
||||||
"^Marketing communication$",
|
|
||||||
"^Sumario Analítico$",
|
|
||||||
"^Riječ uredništva$",
|
|
||||||
"^Savjetovanja i priredbe$",
|
|
||||||
"^Índice$",
|
|
||||||
"^(Starobosanski nadpisi).*$",
|
|
||||||
"^Vzdělávání pracovníků v organizaci$",
|
|
||||||
"^Staff training in organization$",
|
|
||||||
"^(Life Histories of North American Geometridae).*$",
|
|
||||||
"^Strategická analýza podniku$",
|
|
||||||
"^Strategic Analysis of an Enterprise$",
|
|
||||||
"^Sadržaj$",
|
|
||||||
"^Upute suradnicima$",
|
|
||||||
"^Rodinný dům$",
|
|
||||||
"(?i)^Fami(l)?ly house$",
|
|
||||||
"^Upute autorima$",
|
|
||||||
"^Strategic Analysis$",
|
|
||||||
"^Finanční analýza vybraného podniku$",
|
|
||||||
"^Finanční analýza$",
|
|
||||||
"^Riječ urednika$",
|
|
||||||
"(?i)^Content(s?)$",
|
|
||||||
"(?i)^Inhalt$",
|
|
||||||
"^Jinjō shōgaku shūshinsho jidōyō$",
|
|
||||||
"(?i)^Index$",
|
|
||||||
"^Chūgaku kokubun kyōkasho$",
|
|
||||||
"^Retrato de una mujer$",
|
|
||||||
"^Retrato de un hombre$",
|
|
||||||
"^Kōtō shōgaku dokuhon$",
|
|
||||||
"^Shotōka kokugo$",
|
|
||||||
"^Shōgaku dokuhon$",
|
|
||||||
"^Jinjō shōgaku kokugo dokuhon$",
|
|
||||||
"^Shinsei kokugo dokuhon$",
|
|
||||||
"^Teikoku dokuhon$",
|
|
||||||
"^Instructions to Authors$",
|
|
||||||
"^KİTAP TAHLİLİ$",
|
|
||||||
"^PRZEGLĄD PIŚMIENNICTWA$",
|
|
||||||
"(?i)^Presentación$",
|
|
||||||
"^İçindekiler$",
|
|
||||||
"(?i)^Tabl?e of contents$",
|
|
||||||
"^(CODICE DEL BEATO DE LOS REYES FERNANDO I Y SANCHA).*$",
|
|
||||||
"^(\\[MADRID\\. BIBL\\. NAC\\. N.*KING FERDINAND I.*FROM SAN ISIDORO DE LEON\\. FACUNDUS SCRIPSIT DATED.*\\]).*",
|
|
||||||
"^Editorial( Board)?$",
|
|
||||||
"(?i)^Editorial \\(English\\)$",
|
|
||||||
"^Editörden$",
|
|
||||||
"^(Corpus Oral Dialectal \\(COD\\)\\.).*$",
|
|
||||||
"^(Kiri Karl Morgensternile).*$",
|
|
||||||
"^(\\[Eksliibris Aleksandr).*\\]$",
|
|
||||||
"^(\\[Eksliibris Aleksandr).*$",
|
|
||||||
"^(Eksliibris Aleksandr).*$",
|
|
||||||
"^(Kiri A\\. de Vignolles).*$",
|
|
||||||
"^(2 kirja Karl Morgensternile).*$",
|
|
||||||
"^(Pirita kloostri idaosa arheoloogilised).*$",
|
|
||||||
"^(Kiri tundmatule).*$",
|
|
||||||
"^(Kiri Jenaer Allgemeine Literaturzeitung toimetusele).*$",
|
|
||||||
"^(Eksliibris Nikolai Birukovile).*$",
|
|
||||||
"^(Eksliibris Nikolai Issakovile).*$",
|
|
||||||
"^(WHP Cruise Summary Information of section).*$",
|
|
||||||
"^(Measurement of the top quark\\-pair production cross section with ATLAS in pp collisions at).*$",
|
|
||||||
"^(Measurement of the spin\\-dependent structure function).*",
|
|
||||||
"(?i)^.*authors['’′]? reply\\.?$",
|
|
||||||
"(?i)^.*authors['’′]? response\\.?$"
|
|
||||||
]
|
|
||||||
},
|
|
||||||
"synonyms": {}
|
|
||||||
}
|
|
||||||
}
|
|
16
pom.xml
16
pom.xml
|
@ -345,6 +345,22 @@
|
||||||
</exclusion>
|
</exclusion>
|
||||||
</exclusions>
|
</exclusions>
|
||||||
</dependency>
|
</dependency>
|
||||||
|
|
||||||
|
<dependency>
|
||||||
|
<groupId>eu.dnetlib</groupId>
|
||||||
|
<artifactId>dnet-actionmanager-common</artifactId>
|
||||||
|
<version>[6.0.0,7.0.0)</version>
|
||||||
|
<exclusions>
|
||||||
|
<exclusion>
|
||||||
|
<groupId>commons-httpclient</groupId>
|
||||||
|
<artifactId>commons-httpclient</artifactId>
|
||||||
|
</exclusion>
|
||||||
|
<exclusion>
|
||||||
|
<groupId>eu.dnetlib</groupId>
|
||||||
|
<artifactId>dnet-openaireplus-mapping-utils</artifactId>
|
||||||
|
</exclusion>
|
||||||
|
</exclusions>
|
||||||
|
</dependency>
|
||||||
</dependencies>
|
</dependencies>
|
||||||
</dependencyManagement>
|
</dependencyManagement>
|
||||||
|
|
||||||
|
|
Loading…
Reference in New Issue