forked from D-Net/dnet-hadoop
using _the right_ scala 2.11 converters
This commit is contained in:
parent
e6ca382deb
commit
9b4415cb67
|
@@ -26,6 +26,7 @@ import eu.dnetlib.dhp.utils.ISLookupClientFactory;
|
||||||
import eu.dnetlib.enabling.is.lookup.rmi.ISLookUpException;
|
import eu.dnetlib.enabling.is.lookup.rmi.ISLookUpException;
|
||||||
import eu.dnetlib.enabling.is.lookup.rmi.ISLookUpService;
|
import eu.dnetlib.enabling.is.lookup.rmi.ISLookUpService;
|
||||||
import eu.dnetlib.pace.config.DedupConfig;
|
import eu.dnetlib.pace.config.DedupConfig;
|
||||||
|
import scala.collection.JavaConversions;
|
||||||
import scala.collection.JavaConverters;
|
import scala.collection.JavaConverters;
|
||||||
|
|
||||||
public class SparkCreateDedupRecord extends AbstractSparkAction {
|
public class SparkCreateDedupRecord extends AbstractSparkAction {
|
||||||
|
@@ -98,9 +99,7 @@ public class SparkCreateDedupRecord extends AbstractSparkAction {
|
||||||
.read()
|
.read()
|
||||||
.load(mergeRelPath)
|
.load(mergeRelPath)
|
||||||
.where("relClass == 'merges'")
|
.where("relClass == 'merges'")
|
||||||
.join(
|
.join(dedupIds, JavaConversions.asScalaBuffer(Arrays.asList("source", "target")), "left_semi")
|
||||||
dedupIds, JavaConverters.asScalaBufferConverter(Arrays.asList("source", "target")).asScala(),
|
|
||||||
"left_semi")
|
|
||||||
.write()
|
.write()
|
||||||
.mode(SaveMode.Overwrite)
|
.mode(SaveMode.Overwrite)
|
||||||
.option("compression", "gzip")
|
.option("compression", "gzip")
|
||||||
|
|
Loading…
Reference in New Issue