2023-06-09 16:47:25 +02:00
|
|
|
|
|
|
|
package eu.dnetlib.dhp.schema.oaf.utils;
|
|
|
|
|
2023-06-23 16:10:49 +02:00
|
|
|
import java.util.regex.Matcher;
|
|
|
|
import java.util.regex.Pattern;
|
|
|
|
|
2023-06-09 16:47:25 +02:00
|
|
|
// https://researchguides.stevens.edu/c.php?g=442331&p=6577176
|
|
|
|
/**
 * Cleaning rule for PMID (PubMed identifier) values: extracts the numeric part of a raw
 * identifier string and strips its leading zeros.
 */
public class PmidCleaningRule {

	/**
	 * Matches an optional run of leading zeros followed by 1 to 8 digits; capture group 1
	 * holds the digits that remain once the leading zeros are skipped.
	 */
	public static final Pattern PATTERN = Pattern.compile("0*(\\d{1,8})");

	/**
	 * Extracts a normalized PMID from the given raw value.
	 *
	 * <p>All whitespace is removed first, then the first digit sequence found in the remaining
	 * text is returned without its leading zeros. Two consequences of the pattern are worth
	 * knowing: a sequence made only of zeros yields {@code "0"}, and a sequence with more than
	 * eight significant digits is cut to its first eight.
	 *
	 * @param pmid the raw identifier, possibly prefixed, zero-padded or containing whitespace;
	 *             may be {@code null}
	 * @return the extracted digits, or the empty string when {@code pmid} is {@code null} or
	 *         contains no digit
	 */
	public static String clean(String pmid) {
		// A missing value is handled like any other input without digits instead of
		// failing with a NullPointerException.
		if (pmid == null) {
			return "";
		}

		// No case folding is needed here: only whitespace and ASCII digits influence the
		// match, and neither is affected by letter case.
		final String compact = pmid.replaceAll("\\s", "");

		final Matcher m = PATTERN.matcher(compact);
		if (m.find()) {
			return m.group(1);
		}
		return "";
	}

}
|