forked from D-Net/dnet-hadoop
WIP aggregator to make relationships unique
This commit is contained in:
parent
ecf119f37a
commit
770adc26e9
|
@ -96,7 +96,7 @@ public class SparkPropagateRelation extends AbstractSparkAction {
|
|||
FieldType.TARGET,
|
||||
getDeletedFn());
|
||||
|
||||
save(distinctRelations(newRels.union(updated).union(mergeRels)), outputRelationPath, SaveMode.Overwrite);
|
||||
save(newRels.union(updated).union(mergeRels).distinct(), outputRelationPath, SaveMode.Overwrite);
|
||||
}
|
||||
|
||||
private Dataset<Relation> distinctRelations(Dataset<Relation> rels) {
|
||||
|
@ -115,13 +115,11 @@ public class SparkPropagateRelation extends AbstractSparkAction {
|
|||
|
||||
@Override
|
||||
public Relation reduce(Relation b, Relation a) {
|
||||
b.mergeFrom(a);
|
||||
return b;
|
||||
}
|
||||
|
||||
@Override
|
||||
public Relation merge(Relation b, Relation a) {
|
||||
b.mergeFrom(a);
|
||||
return b;
|
||||
}
|
||||
|
||||
|
|
Loading…
Reference in New Issue