dnet-docker/dnet-app/apps/dnet-wf-aggregation-postgres/src/main/java/eu/dnetlib/wfs/nodes/MdTransformJobNode.java

108 lines
3.3 KiB
Java

package eu.dnetlib.wfs.nodes;
import java.time.LocalDateTime;
import java.util.HashMap;
import java.util.Map;
import java.util.function.Predicate;
import java.util.stream.Stream;
import org.dom4j.Document;
import org.dom4j.DocumentException;
import org.dom4j.DocumentHelper;
import org.springframework.beans.BeanUtils;
import org.springframework.beans.factory.annotation.Autowired;
import eu.dnetlib.common.clients.DnetServiceClientFactory;
import eu.dnetlib.common.clients.DsmClient;
import eu.dnetlib.common.clients.MDStoreManagerClient;
import eu.dnetlib.common.mapping.RecordTransformer;
import eu.dnetlib.common.mapping.xslt.XsltTransformFactory;
import eu.dnetlib.common.mdstores.backends.sql.MDStoreSqlBackend;
import eu.dnetlib.domain.dsm.Api;
import eu.dnetlib.domain.dsm.Datasource;
import eu.dnetlib.domain.mdstore.MDStoreVersion;
import eu.dnetlib.domain.mdstore.records.MetadataRecord;
import eu.dnetlib.wfs.annotations.WfInputParam;
import eu.dnetlib.wfs.annotations.WfNode;
import eu.dnetlib.wfs.utils.XpathFilterFactory;
import jakarta.transaction.Transactional;
/**
 * Workflow node, registered as {@code md_transform_xslt}, that copies the records of an input
 * mdstore into a new version of an output mdstore, rewriting each record body with the
 * transformer obtained for {@link #ruleId} and keeping only the transformed records accepted by
 * the xpath filter.
 *
 * <p>
 * On success the new output version is committed with the number of stored records and the
 * aggregation info of the API is updated; on any failure the output version is aborted. The read
 * handle on the input mdstore is released in both cases.
 */
@WfNode("md_transform_xslt")
public class MdTransformJobNode extends ProcessNode {

	/** Datasource input parameter. It is not read by the code of this class. */
	@WfInputParam
	private Datasource ds;

	/** API whose aggregation info is updated once the output version has been committed. */
	@WfInputParam
	private Api api;

	/** Identifier of the mdstore the records are read from. */
	@WfInputParam
	private String inputMdId;

	/** Identifier of the mdstore that receives a new version with the transformed records. */
	@WfInputParam
	private String outputMdId;

	/**
	 * Optional xpath expression handed to {@link XpathFilterFactory#createFilter}.
	 * NOTE(review): the behaviour for a missing value is decided by the factory - presumably
	 * "accept everything", to be confirmed there.
	 */
	@WfInputParam(optional = true)
	private String filterXpath;

	/** Identifier of the transformation rule used to obtain the record transformer. */
	@WfInputParam
	private String ruleId;

	@Autowired
	private XsltTransformFactory xsltTransformFactory;

	@Autowired
	private DnetServiceClientFactory clientFactory;

	@Autowired
	private MDStoreSqlBackend mdStoreSqlBackend;

	/**
	 * Transforms and filters the records of the input mdstore and stores them in a new version of
	 * the output mdstore.
	 *
	 * @throws Exception
	 *             whatever failure occurred while preparing, transforming, saving or committing;
	 *             a failure raised while aborting the output version is attached to it as a
	 *             suppressed exception instead of replacing it
	 */
	@Override
	@Transactional
	protected void execute() throws Exception {
		final Predicate<Document> filter = XpathFilterFactory.createFilter(this.filterXpath);

		final Map<String, Object> params = new HashMap<>();
		// TODO (LOW PRIORITY): which params ?

		final RecordTransformer<String, String> xslt = this.xsltTransformFactory.getTransformer(this.ruleId, params);

		final MDStoreManagerClient mdstoreManager = this.clientFactory.getClient(MDStoreManagerClient.class);

		final MDStoreVersion inputVersion = mdstoreManager.startReading(this.inputMdId);
		try {
			// Created inside the try so that a failure here still releases the input version.
			final MDStoreVersion outputVersion = mdstoreManager.newVersion(this.outputMdId);
			try {
				// The pipeline is lazy: records are transformed and filtered while being saved.
				// try-with-resources guarantees that the underlying stream is closed afterwards.
				try (Stream<MetadataRecord> stream = this.mdStoreSqlBackend.streamEntries(inputVersion)
						.map(input -> {
							final MetadataRecord output = new MetadataRecord();
							BeanUtils.copyProperties(input, output);
							output.setBody(xslt.transform(input.getBody()));
							output.setDateOfTransformation(LocalDateTime.now());
							return output;
						})
						.filter(transformed -> matchesFilter(filter, transformed))) {
					this.mdStoreSqlBackend.saveRecords(outputVersion, stream);
				}

				final long size = this.mdStoreSqlBackend.countRecords(outputVersion.getId());

				mdstoreManager.commitVersion(outputVersion.getId(), size);

				this.clientFactory.getClient(DsmClient.class).updateApiAggregationInfo(this.api.getId(), this.outputMdId, size);
			} catch (final Throwable e) {
				try {
					mdstoreManager.abortVersion(outputVersion);
				} catch (final Exception abortError) {
					// Keep the original failure as the primary one.
					e.addSuppressed(abortError);
				}
				throw e;
			}
		} finally {
			mdstoreManager.endReading(inputVersion);
		}
	}

	/**
	 * Parses the body of a transformed record and evaluates the filter on the resulting document.
	 *
	 * @param filter
	 *            predicate to evaluate
	 * @param record
	 *            transformed record whose body is parsed as XML
	 * @return the outcome of the filter for the parsed body
	 * @throws RuntimeException
	 *             if the body is not parsable XML; the parsing error is kept as the cause
	 */
	private static boolean matchesFilter(final Predicate<Document> filter, final MetadataRecord record) {
		try {
			return filter.test(DocumentHelper.parseText(record.getBody()));
		} catch (final DocumentException e) {
			throw new RuntimeException("Invalid record: " + record.getBody(), e);
		}
	}
}