diff --git a/dnet-dedup-test/src/main/java/eu/dnetlib/Deduper.java b/dnet-dedup-test/src/main/java/eu/dnetlib/Deduper.java index 471250c..fdd00da 100644 --- a/dnet-dedup-test/src/main/java/eu/dnetlib/Deduper.java +++ b/dnet-dedup-test/src/main/java/eu/dnetlib/Deduper.java @@ -49,7 +49,7 @@ public class Deduper implements Serializable { System.out.println("Number of relations = " + relationRDD.distinct().count()); - final RDD<Edge<String>> edgeRdd = relationRDD.map(it -> new Edge<>(Utility.getHashcode(it._1()),Utility.getHashcode(it._2()), "equalTo")).rdd(); + final RDD<Edge<String>> edgeRdd = relationRDD.map(it -> new Edge<>(Utility.getHashcode(it._1()),Utility.getHashcode(it._2()), "isSimilarTo")).rdd(); accumulators.forEach((name, acc) -> log.info(name + " -> " + acc.value())); diff --git a/dnet-dedup-test/src/test/resources/eu/dnetlib/pace/config/organization.current.conf.json b/dnet-dedup-test/src/test/resources/eu/dnetlib/pace/config/organization.current.conf.json index d13aeab..39e5141 100644 --- a/dnet-dedup-test/src/test/resources/eu/dnetlib/pace/config/organization.current.conf.json +++ b/dnet-dedup-test/src/test/resources/eu/dnetlib/pace/config/organization.current.conf.json @@ -87,7 +87,7 @@ } } ], - "threshold": 0.7, + "threshold": 0.1, "aggregation": "W_MEAN", "positive": "layer4", "negative": "NO_MATCH", @@ -106,7 +106,7 @@ } } ], - "threshold": 0.9, + "threshold": 0.7, "aggregation": "AVG", "positive": "layer5", "negative": "NO_MATCH", @@ -129,7 +129,9 @@ "comparator": "jaroWinklerNormalizedName", "weight": 0.1, "countIfUndefined": "false", - "params": {} + "params": { + "windowSize": 4 + } } ], "threshold": 0.9, diff --git a/dnet-dedup-test/src/test/resources/eu/dnetlib/pace/config/publication.current.conf.json b/dnet-dedup-test/src/test/resources/eu/dnetlib/pace/config/publication.current.conf.json index 52352d7..fafe429 100644 --- a/dnet-dedup-test/src/test/resources/eu/dnetlib/pace/config/publication.current.conf.json +++ 
b/dnet-dedup-test/src/test/resources/eu/dnetlib/pace/config/publication.current.conf.json @@ -66,13 +66,12 @@ "weight": 1.0, "countIfUndefined": "false", "params": { - "threshold": "0.5", "jpath_value": "$.value", "jpath_classid": "$.qualifier.classid" } } ], - "threshold": 1.0, + "threshold": 0.5, "aggregation": "MAX", "positive": "MATCH", "negative": "layer2",