108 lines
3.3 KiB
Java
108 lines
3.3 KiB
Java
package eu.dnetlib.wfs.nodes;
|
|
|
|
import java.time.LocalDateTime;
|
|
import java.util.HashMap;
|
|
import java.util.Map;
|
|
import java.util.function.Predicate;
|
|
import java.util.stream.Stream;
|
|
|
|
import org.dom4j.Document;
|
|
import org.dom4j.DocumentException;
|
|
import org.dom4j.DocumentHelper;
|
|
import org.springframework.beans.BeanUtils;
|
|
import org.springframework.beans.factory.annotation.Autowired;
|
|
|
|
import eu.dnetlib.common.clients.DnetServiceClientFactory;
|
|
import eu.dnetlib.common.clients.DsmClient;
|
|
import eu.dnetlib.common.clients.MDStoreManagerClient;
|
|
import eu.dnetlib.common.mapping.RecordTransformer;
|
|
import eu.dnetlib.common.mapping.xslt.XsltTransformFactory;
|
|
import eu.dnetlib.common.mdstores.backends.sql.MDStoreSqlBackend;
|
|
import eu.dnetlib.domain.dsm.Api;
|
|
import eu.dnetlib.domain.dsm.Datasource;
|
|
import eu.dnetlib.domain.mdstore.MDStoreVersion;
|
|
import eu.dnetlib.domain.mdstore.records.MetadataRecord;
|
|
import eu.dnetlib.wfs.annotations.WfInputParam;
|
|
import eu.dnetlib.wfs.annotations.WfNode;
|
|
import eu.dnetlib.wfs.utils.XpathFilterFactory;
|
|
import jakarta.transaction.Transactional;
|
|
|
|
@WfNode("md_transform_xslt")
|
|
public class MdTransformJobNode extends ProcessNode {
|
|
|
|
@WfInputParam
|
|
private Datasource ds;
|
|
|
|
@WfInputParam
|
|
private Api api;
|
|
|
|
@WfInputParam
|
|
private String inputMdId;
|
|
|
|
@WfInputParam
|
|
private String outputMdId;
|
|
|
|
@WfInputParam(optional = true)
|
|
private String filterXpath;
|
|
|
|
@WfInputParam
|
|
private String ruleId;
|
|
|
|
@Autowired
|
|
private XsltTransformFactory xsltTransformFactory;
|
|
|
|
@Autowired
|
|
private DnetServiceClientFactory clientFactory;
|
|
|
|
@Autowired
|
|
private MDStoreSqlBackend mdStoreSqlBackend;
|
|
|
|
@Override
|
|
@Transactional
|
|
protected void execute() throws Exception {
|
|
|
|
final Predicate<Document> filter = XpathFilterFactory.createFilter(this.filterXpath);
|
|
|
|
final Map<String, Object> params = new HashMap<>();
|
|
// TODO (LOW PRIORITY): which params ?
|
|
final RecordTransformer<String, String> xslt = this.xsltTransformFactory.getTransformer(this.ruleId, params);
|
|
final MDStoreManagerClient mdstoreManager = this.clientFactory.getClient(MDStoreManagerClient.class);
|
|
|
|
final MDStoreVersion inputVersion = mdstoreManager.startReading(this.inputMdId);
|
|
final MDStoreVersion outputVersion = mdstoreManager.newVersion(this.outputMdId);
|
|
|
|
try {
|
|
final Stream<MetadataRecord> stream = this.mdStoreSqlBackend.streamEntries(inputVersion)
|
|
.map(input -> {
|
|
final MetadataRecord output = new MetadataRecord();
|
|
BeanUtils.copyProperties(input, output);
|
|
output.setBody(xslt.transform(input.getBody()));
|
|
output.setDateOfTransformation(LocalDateTime.now());
|
|
return output;
|
|
})
|
|
.filter(record -> {
|
|
try {
|
|
final Document doc = DocumentHelper.parseText(record.getBody());
|
|
return filter.test(doc);
|
|
} catch (final DocumentException e) {
|
|
throw new RuntimeException("Invalid record: " + record.getBody());
|
|
}
|
|
});
|
|
|
|
this.mdStoreSqlBackend.saveRecords(outputVersion, stream);
|
|
|
|
final long size = this.mdStoreSqlBackend.countRecords(outputVersion.getId());
|
|
|
|
mdstoreManager.commitVersion(outputVersion.getId(), size);
|
|
|
|
this.clientFactory.getClient(DsmClient.class).updateApiAggregationInfo(this.api.getId(), this.outputMdId, size);
|
|
} catch (final Throwable e) {
|
|
mdstoreManager.abortVersion(outputVersion);
|
|
throw e;
|
|
} finally {
|
|
mdstoreManager.endReading(inputVersion);
|
|
}
|
|
}
|
|
|
|
}
|