44 lines
1.3 KiB
Java
44 lines
1.3 KiB
Java
package eu.dnetlib.manager.wf.nodes.aggregation;
|
|
|
|
import java.util.stream.Stream;
|
|
|
|
import org.springframework.beans.BeanUtils;
|
|
import org.springframework.beans.factory.annotation.Autowired;
|
|
|
|
import eu.dnetlib.data.mapping.cleaner.Cleaner;
|
|
import eu.dnetlib.data.mapping.cleaner.CleanerFactory;
|
|
import eu.dnetlib.data.mdstore.model.records.MetadataRecord;
|
|
import eu.dnetlib.data.mdstore.model.records.MetadataRecordImpl;
|
|
import eu.dnetlib.manager.wf.annotations.WfInputParam;
|
|
import eu.dnetlib.manager.wf.annotations.WfNode;
|
|
import eu.dnetlib.manager.wf.nodes.stream.StreamMapperNode;
|
|
|
|
@WfNode("clean")
|
|
public class MetadataCleanerNode extends StreamMapperNode<MetadataRecord, MetadataRecord> {
|
|
|
|
@WfInputParam
|
|
private String ruleId;
|
|
|
|
@Autowired
|
|
private CleanerFactory cleanerFactory;
|
|
|
|
@Override
|
|
protected Stream<MetadataRecord> mapStream(final Stream<MetadataRecord> input) {
|
|
try {
|
|
final Cleaner cleaner = cleanerFactory.obtainCleaningRule(ruleId);
|
|
|
|
return input.map(in -> {
|
|
final MetadataRecord out = new MetadataRecordImpl();
|
|
BeanUtils.copyProperties(in, out);
|
|
out.setBody(cleaner.transform(in.getBody()));
|
|
out.setDateOfTransformation(System.currentTimeMillis());
|
|
return out;
|
|
|
|
});
|
|
} catch (final Exception e) {
|
|
throw new RuntimeException(e);
|
|
}
|
|
}
|
|
|
|
}
|