dnet-hadoop/dhp-pace-core/src/main/java/eu/dnetlib/pace/tree/TitleVersionMatch.java

40 lines
965 B
Java
Raw Normal View History

2023-06-26 13:58:11 +02:00
package eu.dnetlib.pace.tree;
2023-06-26 13:58:11 +02:00
import java.util.Map;
import eu.dnetlib.pace.config.Config;
import eu.dnetlib.pace.tree.support.AbstractStringComparator;
import eu.dnetlib.pace.tree.support.ComparatorClass;
/**
* Returns 1 if the titles in the given documents contain the same numbers and 0 otherwise;
* returns -1 when either title is empty.
*
* @author claudio
*
*/
@ComparatorClass("titleVersionMatch")
public class TitleVersionMatch extends AbstractStringComparator {
2023-06-26 13:58:11 +02:00
public TitleVersionMatch(final Map<String, String> params) {
super(params);
}
2023-06-26 13:58:11 +02:00
@Override
public double compare(final String valueA, final String valueB, final Config conf) {
if (valueA.isEmpty() || valueB.isEmpty())
return -1;
2023-06-26 13:58:11 +02:00
return notNull(valueA) && notNull(valueB) && !checkNumbers(valueA, valueB) ? 1 : 0;
}
2023-06-26 13:58:11 +02:00
@Override
public String toString() {
return getClass().getSimpleName() + ":" + super.toString();
}
2023-06-26 13:58:11 +02:00
protected String toString(final Object object) {
return toFirstString(object);
}
}