forked from D-Net/dnet-hadoop
Merge pull request 'Align Solr JSON records to the explore portal requirements' (#448) from json_payload into beta_to_master_may2024
Reviewed-on: D-Net/dnet-hadoop#448
This commit is contained in:
commit
8220e27110
|
@ -5,6 +5,7 @@ import java.io.StringReader;
|
||||||
import java.util.*;
|
import java.util.*;
|
||||||
import java.util.stream.Collectors;
|
import java.util.stream.Collectors;
|
||||||
|
|
||||||
|
import eu.dnetlib.dhp.schema.solr.Measure;
|
||||||
import org.apache.commons.lang3.StringUtils;
|
import org.apache.commons.lang3.StringUtils;
|
||||||
import org.dom4j.Document;
|
import org.dom4j.Document;
|
||||||
import org.dom4j.DocumentException;
|
import org.dom4j.DocumentException;
|
||||||
|
@ -76,6 +77,7 @@ public class ProvisionModelSupport {
|
||||||
r.setCollectedfrom(asProvenance(e.getCollectedfrom()));
|
r.setCollectedfrom(asProvenance(e.getCollectedfrom()));
|
||||||
r.setContext(asContext(e.getContext(), contextMapper));
|
r.setContext(asContext(e.getContext(), contextMapper));
|
||||||
r.setPid(asPid(e.getPid()));
|
r.setPid(asPid(e.getPid()));
|
||||||
|
r.setMeasures(mapMeasures(e.getMeasures()));
|
||||||
|
|
||||||
if (e instanceof eu.dnetlib.dhp.schema.oaf.Result) {
|
if (e instanceof eu.dnetlib.dhp.schema.oaf.Result) {
|
||||||
r.setResult(mapResult((eu.dnetlib.dhp.schema.oaf.Result) e));
|
r.setResult(mapResult((eu.dnetlib.dhp.schema.oaf.Result) e));
|
||||||
|
@ -106,6 +108,13 @@ public class ProvisionModelSupport {
|
||||||
final RelatedEntity re = rew.getTarget();
|
final RelatedEntity re = rew.getTarget();
|
||||||
final RecordType relatedRecordType = RecordType.valueOf(re.getType());
|
final RecordType relatedRecordType = RecordType.valueOf(re.getType());
|
||||||
final Relation relation = rew.getRelation();
|
final Relation relation = rew.getRelation();
|
||||||
|
final String relationProvenance = Optional
|
||||||
|
.ofNullable(relation.getDataInfo())
|
||||||
|
.map(d -> Optional
|
||||||
|
.ofNullable(d.getProvenanceaction())
|
||||||
|
.map(Qualifier::getClassid)
|
||||||
|
.orElse(null))
|
||||||
|
.orElse(null);
|
||||||
rr
|
rr
|
||||||
.setHeader(
|
.setHeader(
|
||||||
RelatedRecordHeader
|
RelatedRecordHeader
|
||||||
|
@ -113,7 +122,9 @@ public class ProvisionModelSupport {
|
||||||
relation.getRelType(),
|
relation.getRelType(),
|
||||||
relation.getRelClass(),
|
relation.getRelClass(),
|
||||||
StringUtils.substringAfter(relation.getTarget(), IdentifierFactory.ID_PREFIX_SEPARATOR),
|
StringUtils.substringAfter(relation.getTarget(), IdentifierFactory.ID_PREFIX_SEPARATOR),
|
||||||
relatedRecordType));
|
relatedRecordType,
|
||||||
|
relationProvenance,
|
||||||
|
Optional.ofNullable(relation.getDataInfo()).map(DataInfo::getTrust).orElse(null)));
|
||||||
|
|
||||||
rr.setAcronym(re.getAcronym());
|
rr.setAcronym(re.getAcronym());
|
||||||
rr.setCode(re.getCode());
|
rr.setCode(re.getCode());
|
||||||
|
@ -131,11 +142,19 @@ public class ProvisionModelSupport {
|
||||||
rr.setOfficialname(re.getOfficialname());
|
rr.setOfficialname(re.getOfficialname());
|
||||||
rr.setOpenairecompatibility(mapCodeLabel(re.getOpenairecompatibility()));
|
rr.setOpenairecompatibility(mapCodeLabel(re.getOpenairecompatibility()));
|
||||||
rr.setPid(asPid(re.getPid()));
|
rr.setPid(asPid(re.getPid()));
|
||||||
rr.setProjectTitle(rr.getProjectTitle());
|
rr.setWebsiteurl(re.getWebsiteurl());
|
||||||
|
rr.setProjectTitle(re.getProjectTitle());
|
||||||
rr.setPublisher(re.getPublisher());
|
rr.setPublisher(re.getPublisher());
|
||||||
rr.setResulttype(mapQualifier(re.getResulttype()));
|
rr.setResulttype(mapQualifier(re.getResulttype()));
|
||||||
rr.setTitle(Optional.ofNullable(re.getTitle()).map(StructuredProperty::getValue).orElse(null));
|
rr.setTitle(Optional.ofNullable(re.getTitle()).map(StructuredProperty::getValue).orElse(null));
|
||||||
|
|
||||||
|
if (relation.getValidated() == null) {
|
||||||
|
relation.setValidated(false);
|
||||||
|
}
|
||||||
|
if (ModelConstants.OUTCOME.equals(relation.getSubRelType()) && StringUtils.isNotBlank(relation.getValidationDate())) {
|
||||||
|
rr.setValidationDate(relation.getValidationDate());
|
||||||
|
}
|
||||||
|
|
||||||
return rr;
|
return rr;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@ -266,6 +285,7 @@ public class ProvisionModelSupport {
|
||||||
ds.setOfficialname(mapField(d.getOfficialname()));
|
ds.setOfficialname(mapField(d.getOfficialname()));
|
||||||
ds.setDescription(mapField(d.getDescription()));
|
ds.setDescription(mapField(d.getDescription()));
|
||||||
ds.setJournal(mapJournal(d.getJournal()));
|
ds.setJournal(mapJournal(d.getJournal()));
|
||||||
|
ds.setWebsiteurl(mapField(d.getWebsiteurl()));
|
||||||
ds.setLogourl(mapField(d.getLogourl()));
|
ds.setLogourl(mapField(d.getLogourl()));
|
||||||
ds.setAccessinfopackage(mapFieldList(d.getAccessinfopackage()));
|
ds.setAccessinfopackage(mapFieldList(d.getAccessinfopackage()));
|
||||||
ds.setCertificates(mapField(d.getCertificates()));
|
ds.setCertificates(mapField(d.getCertificates()));
|
||||||
|
@ -311,6 +331,7 @@ public class ProvisionModelSupport {
|
||||||
ds.setSubjects(asSubjectSP(d.getSubjects()));
|
ds.setSubjects(asSubjectSP(d.getSubjects()));
|
||||||
ds.setSubmissionpolicyurl(d.getSubmissionpolicyurl());
|
ds.setSubmissionpolicyurl(d.getSubmissionpolicyurl());
|
||||||
ds.setThematic(d.getThematic());
|
ds.setThematic(d.getThematic());
|
||||||
|
ds.setContentpolicies(mapCodeLabel(d.getContentpolicies()));
|
||||||
ds.setVersioncontrol(d.getVersioncontrol());
|
ds.setVersioncontrol(d.getVersioncontrol());
|
||||||
ds.setVersioning(mapField(d.getVersioning()));
|
ds.setVersioning(mapField(d.getVersioning()));
|
||||||
|
|
||||||
|
@ -326,6 +347,7 @@ public class ProvisionModelSupport {
|
||||||
rs.setOtherTitles(getOtherTitles(r.getTitle()));
|
rs.setOtherTitles(getOtherTitles(r.getTitle()));
|
||||||
rs.setDescription(mapFieldList(r.getDescription()));
|
rs.setDescription(mapFieldList(r.getDescription()));
|
||||||
rs.setSubject(asSubject(r.getSubject()));
|
rs.setSubject(asSubject(r.getSubject()));
|
||||||
|
rs.setLanguage(asLanguage(r.getLanguage()));
|
||||||
rs.setPublicationdate(mapField(r.getDateofacceptance()));
|
rs.setPublicationdate(mapField(r.getDateofacceptance()));
|
||||||
rs.setPublisher(mapField(r.getPublisher()));
|
rs.setPublisher(mapField(r.getPublisher()));
|
||||||
rs.setEmbargoenddate(mapField(r.getEmbargoenddate()));
|
rs.setEmbargoenddate(mapField(r.getEmbargoenddate()));
|
||||||
|
@ -375,6 +397,12 @@ public class ProvisionModelSupport {
|
||||||
return rs;
|
return rs;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
private static Language asLanguage(Qualifier lang) {
|
||||||
|
return Optional.ofNullable(lang)
|
||||||
|
.map(q -> Language.newInstance(q.getClassid(), q.getClassname()))
|
||||||
|
.orElse(null);
|
||||||
|
}
|
||||||
|
|
||||||
@Nullable
|
@Nullable
|
||||||
private static List<String> getOtherTitles(List<StructuredProperty> titleList) {
|
private static List<String> getOtherTitles(List<StructuredProperty> titleList) {
|
||||||
return Optional
|
return Optional
|
||||||
|
@ -422,7 +450,7 @@ public class ProvisionModelSupport {
|
||||||
Instance i = new Instance();
|
Instance i = new Instance();
|
||||||
i.setCollectedfrom(asProvenance(instance.getCollectedfrom()));
|
i.setCollectedfrom(asProvenance(instance.getCollectedfrom()));
|
||||||
i.setHostedby(asProvenance(instance.getHostedby()));
|
i.setHostedby(asProvenance(instance.getHostedby()));
|
||||||
i.setFulltext(i.getFulltext());
|
i.setFulltext(instance.getFulltext());
|
||||||
i.setPid(asPid(instance.getPid()));
|
i.setPid(asPid(instance.getPid()));
|
||||||
i.setAlternateIdentifier(asPid(instance.getAlternateIdentifier()));
|
i.setAlternateIdentifier(asPid(instance.getAlternateIdentifier()));
|
||||||
i.setAccessright(mapAccessRight(instance.getAccessright()));
|
i.setAccessright(mapAccessRight(instance.getAccessright()));
|
||||||
|
@ -453,7 +481,8 @@ public class ProvisionModelSupport {
|
||||||
private static AccessRight mapAccessRight(eu.dnetlib.dhp.schema.oaf.AccessRight accessright) {
|
private static AccessRight mapAccessRight(eu.dnetlib.dhp.schema.oaf.AccessRight accessright) {
|
||||||
return AccessRight
|
return AccessRight
|
||||||
.newInstance(
|
.newInstance(
|
||||||
mapQualifier(accessright),
|
accessright.getClassid(),
|
||||||
|
accessright.getClassname(),
|
||||||
Optional
|
Optional
|
||||||
.ofNullable(accessright.getOpenAccessRoute())
|
.ofNullable(accessright.getOpenAccessRoute())
|
||||||
.map(route -> OpenAccessRoute.valueOf(route.toString()))
|
.map(route -> OpenAccessRoute.valueOf(route.toString()))
|
||||||
|
@ -508,7 +537,18 @@ public class ProvisionModelSupport {
|
||||||
}
|
}
|
||||||
|
|
||||||
private static Provenance asProvenance(KeyValue keyValue) {
|
private static Provenance asProvenance(KeyValue keyValue) {
|
||||||
return Optional.ofNullable(keyValue).map(cf -> Provenance.newInstance(cf.getKey(), cf.getValue())).orElse(null);
|
return Optional.ofNullable(keyValue).map(kv ->
|
||||||
|
Provenance.newInstance(
|
||||||
|
StringUtils.substringAfter(kv.getKey(), IdentifierFactory.ID_PREFIX_SEPARATOR),
|
||||||
|
kv.getValue())).orElse(null);
|
||||||
|
}
|
||||||
|
|
||||||
|
private static List<Measure> mapMeasures(List<eu.dnetlib.dhp.schema.oaf.Measure> measures) {
|
||||||
|
return Optional.ofNullable(measures)
|
||||||
|
.map(ml -> ml.stream()
|
||||||
|
.map(m -> Measure.newInstance(m.getId(), mapCodeLabelKV(m.getUnit())))
|
||||||
|
.collect(Collectors.toList()))
|
||||||
|
.orElse(null);
|
||||||
}
|
}
|
||||||
|
|
||||||
private static List<Context> asContext(List<eu.dnetlib.dhp.schema.oaf.Context> ctxList,
|
private static List<Context> asContext(List<eu.dnetlib.dhp.schema.oaf.Context> ctxList,
|
||||||
|
@ -581,7 +621,12 @@ public class ProvisionModelSupport {
|
||||||
.map(
|
.map(
|
||||||
pids -> pids
|
pids -> pids
|
||||||
.stream()
|
.stream()
|
||||||
.map(p -> Pid.newInstance(p.getQualifier().getClassname(), p.getValue()))
|
.filter(p -> Objects.nonNull(p.getQualifier()))
|
||||||
|
.filter(p -> Objects.nonNull(p.getQualifier().getClassid()))
|
||||||
|
.map(p -> Pid.newInstance(
|
||||||
|
p.getValue(),
|
||||||
|
p.getQualifier().getClassid(),
|
||||||
|
p.getQualifier().getClassname()))
|
||||||
.collect(Collectors.toList()))
|
.collect(Collectors.toList()))
|
||||||
.orElse(null);
|
.orElse(null);
|
||||||
}
|
}
|
||||||
|
@ -607,7 +652,7 @@ public class ProvisionModelSupport {
|
||||||
.stream()
|
.stream()
|
||||||
.filter(s -> Objects.nonNull(s.getQualifier()))
|
.filter(s -> Objects.nonNull(s.getQualifier()))
|
||||||
.filter(s -> Objects.nonNull(s.getQualifier().getClassname()))
|
.filter(s -> Objects.nonNull(s.getQualifier().getClassname()))
|
||||||
.map(s -> Subject.newInstance(s.getValue(), s.getQualifier().getClassname()))
|
.map(s -> Subject.newInstance(s.getValue(), s.getQualifier().getClassid(), s.getQualifier().getClassname()))
|
||||||
.collect(Collectors.toList()))
|
.collect(Collectors.toList()))
|
||||||
.orElse(null);
|
.orElse(null);
|
||||||
}
|
}
|
||||||
|
@ -620,7 +665,7 @@ public class ProvisionModelSupport {
|
||||||
.stream()
|
.stream()
|
||||||
.filter(s -> Objects.nonNull(s.getQualifier()))
|
.filter(s -> Objects.nonNull(s.getQualifier()))
|
||||||
.filter(s -> Objects.nonNull(s.getQualifier().getClassname()))
|
.filter(s -> Objects.nonNull(s.getQualifier().getClassname()))
|
||||||
.map(s -> Subject.newInstance(s.getValue(), s.getQualifier().getClassname()))
|
.map(s -> Subject.newInstance(s.getValue(), s.getQualifier().getClassid(), s.getQualifier().getClassname()))
|
||||||
.collect(Collectors.toList()))
|
.collect(Collectors.toList()))
|
||||||
.orElse(null);
|
.orElse(null);
|
||||||
}
|
}
|
||||||
|
@ -689,7 +734,7 @@ public class ProvisionModelSupport {
|
||||||
private static CodeLabel mapCodeLabel(KeyValue kv) {
|
private static CodeLabel mapCodeLabel(KeyValue kv) {
|
||||||
return Optional
|
return Optional
|
||||||
.ofNullable(kv)
|
.ofNullable(kv)
|
||||||
.map(q -> CodeLabel.newInstance(kv.getKey(), kv.getValue()))
|
.map(k -> CodeLabel.newInstance(k.getKey(), k.getValue()))
|
||||||
.orElse(null);
|
.orElse(null);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
|
@ -213,7 +213,7 @@ public class StreamingInputDocumentFactory implements Serializable {
|
||||||
}
|
}
|
||||||
writer.close();
|
writer.close();
|
||||||
indexDocument.addField(INDEX_RESULT, results.toString());
|
indexDocument.addField(INDEX_RESULT, results.toString());
|
||||||
// indexDocument.addField(INDEX_JSON_RESULT, json);
|
indexDocument.addField(INDEX_JSON_RESULT, json);
|
||||||
} finally {
|
} finally {
|
||||||
outputFactory.remove();
|
outputFactory.remove();
|
||||||
eventFactory.remove();
|
eventFactory.remove();
|
||||||
|
|
|
@ -115,12 +115,12 @@ public class XmlIndexingJobTest extends SolrTest {
|
||||||
|
|
||||||
rsp = miniCluster.getSolrClient().query(new SolrQuery().add(CommonParams.Q, "isgreen:true"));
|
rsp = miniCluster.getSolrClient().query(new SolrQuery().add(CommonParams.Q, "isgreen:true"));
|
||||||
assertEquals(
|
assertEquals(
|
||||||
0, rsp.getResults().getNumFound(),
|
4, rsp.getResults().getNumFound(),
|
||||||
"the number of indexed records having isgreen = true");
|
"the number of indexed records having isgreen = true");
|
||||||
|
|
||||||
rsp = miniCluster.getSolrClient().query(new SolrQuery().add(CommonParams.Q, "openaccesscolor:bronze"));
|
rsp = miniCluster.getSolrClient().query(new SolrQuery().add(CommonParams.Q, "openaccesscolor:bronze"));
|
||||||
assertEquals(
|
assertEquals(
|
||||||
0, rsp.getResults().getNumFound(),
|
2, rsp.getResults().getNumFound(),
|
||||||
"the number of indexed records having openaccesscolor = bronze");
|
"the number of indexed records having openaccesscolor = bronze");
|
||||||
|
|
||||||
rsp = miniCluster.getSolrClient().query(new SolrQuery().add(CommonParams.Q, "isindiamondjournal:true"));
|
rsp = miniCluster.getSolrClient().query(new SolrQuery().add(CommonParams.Q, "isindiamondjournal:true"));
|
||||||
|
@ -135,14 +135,14 @@ public class XmlIndexingJobTest extends SolrTest {
|
||||||
|
|
||||||
rsp = miniCluster.getSolrClient().query(new SolrQuery().add(CommonParams.Q, "peerreviewed:true"));
|
rsp = miniCluster.getSolrClient().query(new SolrQuery().add(CommonParams.Q, "peerreviewed:true"));
|
||||||
assertEquals(
|
assertEquals(
|
||||||
0, rsp.getResults().getNumFound(),
|
35, rsp.getResults().getNumFound(),
|
||||||
"the number of indexed records having peerreviewed = true");
|
"the number of indexed records having peerreviewed = true");
|
||||||
|
|
||||||
rsp = miniCluster
|
rsp = miniCluster
|
||||||
.getSolrClient()
|
.getSolrClient()
|
||||||
.query(
|
.query(
|
||||||
new SolrQuery()
|
new SolrQuery()
|
||||||
.add(CommonParams.Q, "objidentifier:\"iddesignpres::ae77e56e84ad058d9e7f19fa2f7325db\"")
|
.add(CommonParams.Q, "objidentifier:\"57a035e5b1ae::236d6d8c1e03368b5ae72acfeeb11bbc\"")
|
||||||
.add(CommonParams.FL, "__json"));
|
.add(CommonParams.FL, "__json"));
|
||||||
assertEquals(
|
assertEquals(
|
||||||
1, rsp.getResults().getNumFound(),
|
1, rsp.getResults().getNumFound(),
|
||||||
|
|
Binary file not shown.
Binary file not shown.
2
pom.xml
2
pom.xml
|
@ -888,7 +888,7 @@
|
||||||
<mockito-core.version>3.3.3</mockito-core.version>
|
<mockito-core.version>3.3.3</mockito-core.version>
|
||||||
<mongodb.driver.version>3.4.2</mongodb.driver.version>
|
<mongodb.driver.version>3.4.2</mongodb.driver.version>
|
||||||
<vtd.version>[2.12,3.0)</vtd.version>
|
<vtd.version>[2.12,3.0)</vtd.version>
|
||||||
<dhp-schemas.version>[6.1.2]</dhp-schemas.version>
|
<dhp-schemas.version>[6.1.3]</dhp-schemas.version>
|
||||||
<dnet-actionmanager-api.version>[4.0.3]</dnet-actionmanager-api.version>
|
<dnet-actionmanager-api.version>[4.0.3]</dnet-actionmanager-api.version>
|
||||||
<dnet-actionmanager-common.version>[6.0.5]</dnet-actionmanager-common.version>
|
<dnet-actionmanager-common.version>[6.0.5]</dnet-actionmanager-common.version>
|
||||||
<dnet-openaire-broker-common.version>[3.1.6]</dnet-openaire-broker-common.version>
|
<dnet-openaire-broker-common.version>[3.1.6]</dnet-openaire-broker-common.version>
|
||||||
|
|
Loading…
Reference in New Issue