forked from D-Net/dnet-hadoop
Fix bug in the OAI iterator that skipped the cleaned record
This commit is contained in:
parent
d64a942a76
commit
370dddb2fa
|
@@ -161,7 +161,7 @@ public class OaiIterator implements Iterator<String> {
|
||||||
report.put(e.getClass().getName(), e.getMessage());
|
report.put(e.getClass().getName(), e.getMessage());
|
||||||
final String cleaned = XmlCleaner.cleanAllEntities(xml);
|
final String cleaned = XmlCleaner.cleanAllEntities(xml);
|
||||||
try {
|
try {
|
||||||
doc = DocumentHelper.parseText(xml);
|
doc = DocumentHelper.parseText(cleaned);
|
||||||
} catch (final DocumentException e1) {
|
} catch (final DocumentException e1) {
|
||||||
final String resumptionToken = extractResumptionToken(xml);
|
final String resumptionToken = extractResumptionToken(xml);
|
||||||
if (resumptionToken == null) {
|
if (resumptionToken == null) {
|
||||||
|
|
Loading…
Reference in New Issue