partial refactoring

This commit is contained in:
Michele Artini 2024-02-09 14:33:04 +01:00
parent c974c75f83
commit 5add433b74
1 changed file with 25 additions and 18 deletions

View File

@ -25,34 +25,49 @@ import eu.dnetlib.dhp.common.aggregation.AggregatorReport;
public class BaseCollectorIterator implements Iterator<Element> {
private final BlockingQueue<Element> queue = new LinkedBlockingQueue<>();
private Object nextElement;
private final BlockingQueue<Object> queue = new LinkedBlockingQueue<>();
private static final Logger log = LoggerFactory.getLogger(BaseCollectorIterator.class);
private boolean completed = false;
/**
 * Creates an iterator fed by a file read through a Hadoop {@code FileSystem}.
 * <p>
 * A new thread is started to run {@code importHadoopFile}; the constructor then blocks
 * until the first object can be taken from the internal queue, so that the look-ahead
 * field {@code nextElement} is populated before the iterator is used.
 *
 * @param fs       file system handed to {@code importHadoopFile}
 * @param filePath path handed to {@code importHadoopFile}
 * @param report   aggregator report handed to {@code importHadoopFile}
 * @throws RuntimeException if the calling thread is interrupted while waiting for the
 *                          first object; the interrupt status is restored before throwing
 */
public BaseCollectorIterator(final FileSystem fs, final Path filePath, final AggregatorReport report) {
    new Thread(() -> importHadoopFile(fs, filePath, report)).start();
    try {
        // Blocks until the producer thread has queued something.
        this.nextElement = this.queue.take();
    } catch (final InterruptedException e) {
        // Restore the flag so code further up the stack can still observe the interruption.
        Thread.currentThread().interrupt();
        throw new RuntimeException("Interrupted while waiting for the first BASE record", e);
    }
}
/**
 * Creates an iterator fed by a resource identified by {@code resourcePath}.
 * <p>
 * A new thread is started to run {@code importTestFile}; the constructor then blocks
 * until the first object can be taken from the internal queue, so that the look-ahead
 * field {@code nextElement} is populated before the iterator is used.
 *
 * @param resourcePath resource path handed to {@code importTestFile}
 * @param report       aggregator report handed to {@code importTestFile}
 * @throws RuntimeException if the calling thread is interrupted while waiting for the
 *                          first object; the interrupt status is restored before throwing
 */
protected BaseCollectorIterator(final String resourcePath, final AggregatorReport report) {
    new Thread(() -> importTestFile(resourcePath, report)).start();
    try {
        // Blocks until the producer thread has queued something.
        this.nextElement = this.queue.take();
    } catch (final InterruptedException e) {
        // Restore the flag so code further up the stack can still observe the interruption.
        Thread.currentThread().interrupt();
        throw new RuntimeException("Interrupted while waiting for the first BASE record", e);
    }
}
/**
 * Tells whether another record is available.
 * <p>
 * The decision is based only on the look-ahead field {@code nextElement}: the iterator
 * has more data exactly when that field holds an {@code Element}. Any other object
 * (the producers queue the string {@code "__END__"} when they finish) or {@code null}
 * means there is nothing left to return.
 *
 * @return {@code true} if {@code nextElement} is an {@code Element}, {@code false} otherwise
 */
@Override
public synchronized boolean hasNext() {
    // instanceof is already false for null, so no separate null check is needed.
    return this.nextElement instanceof Element;
}
/**
 * Returns the current look-ahead record and advances to the following queued object.
 * <p>
 * The queue is only read when the look-ahead is an {@code Element}. Once the look-ahead
 * is a non-{@code Element} object (the end marker) no further {@code take()} is issued,
 * because nothing is queued after the end marker and the call would block.
 *
 * @return the record that was held in {@code nextElement}
 * @throws java.util.NoSuchElementException if no record is available
 *                                          (i.e. {@link #hasNext()} is {@code false})
 * @throws RuntimeException                 if the calling thread is interrupted while
 *                                          waiting for the following object; the interrupt
 *                                          status is restored before throwing
 */
@Override
public synchronized Element next() {
    if (!(this.nextElement instanceof Element)) {
        throw new java.util.NoSuchElementException("No more BASE records");
    }
    final Element current = (Element) this.nextElement;
    try {
        // Pre-fetch the following object; after the last record this yields the end marker.
        this.nextElement = this.queue.take();
    } catch (final InterruptedException e) {
        // Restore the flag so code further up the stack can still observe the interruption.
        Thread.currentThread().interrupt();
        throw new RuntimeException("Interrupted while waiting for the next BASE record", e);
    }
    return current;
}
private void importHadoopFile(final FileSystem fs, final Path filePath, final AggregatorReport report) {
log.info("I start to read the TAR stream");
@ -64,7 +79,7 @@ public class BaseCollectorIterator implements Iterator<Element> {
report.put(e.getClass().getName(), e.getMessage());
throw new RuntimeException("Error processing BASE records", e);
} finally {
setCompleted(true);
this.queue.add("__END__"); // I ADD A NOT ELEMENT OBJECT TO INDICATE THE END OF THE QUEUE
}
}
@ -77,7 +92,7 @@ public class BaseCollectorIterator implements Iterator<Element> {
report.put(e.getClass().getName(), e.getMessage());
throw new RuntimeException("Error processing BASE records", e);
} finally {
setCompleted(true);
this.queue.add("__END__"); // I ADD A NOT ELEMENT OBJECT TO INDICATE THE END OF THE QUEUE
}
}
@ -104,7 +119,7 @@ public class BaseCollectorIterator implements Iterator<Element> {
for (final Object o : doc.selectNodes("//*[local-name()='ListRecords']/*[local-name()='record']")) {
if (o instanceof Element) {
this.queue.add((Element) o);
this.queue.add(o);
count++;
}
}
@ -114,12 +129,4 @@ public class BaseCollectorIterator implements Iterator<Element> {
log.info("Total records (written in queue): " + count);
}
/**
 * Reads the {@code completed} flag while holding this instance's monitor.
 *
 * @return the current value of {@code completed}
 */
private boolean isCompleted() {
    synchronized (this) {
        return this.completed;
    }
}
/**
 * Updates the {@code completed} flag while holding this instance's monitor.
 *
 * @param completed the new value of the flag
 */
private void setCompleted(final boolean completed) {
    synchronized (this) {
        this.completed = completed;
    }
}
}