dnet-hadoop/dhp-workflows/dhp-graph-mapper/src/main/java/eu/dnetlib/dhp/oa/graph/clean/CleaningRuleMap.java

41 lines
1.2 KiB
Java
Raw Normal View History

2020-06-09 17:20:40 +02:00
package eu.dnetlib.dhp.oa.graph.clean;
2020-06-13 13:06:04 +02:00
import java.io.Serializable;
import java.util.HashMap;
2020-06-12 12:03:25 +02:00
2020-06-13 13:06:04 +02:00
import eu.dnetlib.dhp.common.FunctionalInterfaceSupport.SerializableConsumer;
2020-06-09 17:20:40 +02:00
import eu.dnetlib.dhp.oa.graph.raw.common.VocabularyGroup;
import eu.dnetlib.dhp.schema.oaf.Qualifier;
2020-06-12 12:03:25 +02:00
import eu.dnetlib.dhp.schema.oaf.StructuredProperty;
2020-06-12 10:45:18 +02:00
2020-06-13 13:06:04 +02:00
public class CleaningRuleMap extends HashMap<Class, SerializableConsumer<Object>> implements Serializable {
2020-06-09 17:20:40 +02:00
2020-06-12 18:25:47 +02:00
/**
2020-06-13 13:06:04 +02:00
* Creates the mapping for the Oaf types subject to cleaning
*
2020-06-12 18:25:47 +02:00
* @param vocabularies
*/
2020-06-13 13:06:04 +02:00
public static CleaningRuleMap create(VocabularyGroup vocabularies) {
CleaningRuleMap mapping = new CleaningRuleMap();
2020-06-12 18:25:47 +02:00
mapping.put(Qualifier.class, o -> {
Qualifier q = (Qualifier) o;
if (vocabularies.vocabularyExists(q.getSchemeid())) {
Qualifier newValue = vocabularies.lookup(q.getSchemeid(), q.getClassid());
q.setClassid(newValue.getClassid());
q.setClassname(newValue.getClassname());
2020-06-12 10:45:18 +02:00
}
2020-06-12 18:25:47 +02:00
});
mapping.put(StructuredProperty.class, o -> {
StructuredProperty sp = (StructuredProperty) o;
// TODO implement a policy
/*
* if (StringUtils.isBlank(sp.getValue())) { sp.setValue(null); sp.setQualifier(null); sp.setDataInfo(null);
* }
*/
});
2020-06-13 13:06:04 +02:00
return mapping;
2020-06-09 19:52:53 +02:00
}
2020-06-12 18:25:47 +02:00
2020-06-09 17:20:40 +02:00
}