HDFS-9829. Erasure Coding: Improve few exception handling logic of ErasureCodingWorker. Contributed by Rakesh R.
This commit is contained in:
parent
ba1c9d484a
commit
6546d9e7ff
|
@ -225,6 +225,9 @@ Trunk (Unreleased)
|
|||
|
||||
HDFS-9795. OIV Delimited should show which files are ACL-enabled (lei)
|
||||
|
||||
HDFS-9829. Erasure Coding: Improve few exception handling logic of
|
||||
ErasureCodingWorker. (Rakesh R via jing9)
|
||||
|
||||
OPTIMIZATIONS
|
||||
|
||||
BUG FIXES
|
||||
|
|
|
@ -124,7 +124,7 @@ public final class ErasureCodingWorker {
|
|||
}
|
||||
|
||||
private void initializeStripedReadThreadPool(int num) {
|
||||
LOG.debug("Using striped reads; pool threads=" + num);
|
||||
LOG.debug("Using striped reads; pool threads={}", num);
|
||||
|
||||
EC_RECONSTRUCTION_STRIPED_READ_THREAD_POOL = new ThreadPoolExecutor(1, num,
|
||||
60, TimeUnit.SECONDS, new SynchronousQueue<Runnable>(),
|
||||
|
@ -150,7 +150,7 @@ public final class ErasureCodingWorker {
|
|||
}
|
||||
|
||||
private void initializeStripedBlkReconstructionThreadPool(int num) {
|
||||
LOG.debug("Using striped block reconstruction; pool threads=" + num);
|
||||
// Pass num as a logging argument so it fills the {} placeholder; concatenating
// it would leave a literal "{}" in the message followed by the number.
LOG.debug("Using striped block reconstruction; pool threads={}", num);
|
||||
EC_RECONSTRUCTION_STRIPED_BLK_THREAD_POOL = new ThreadPoolExecutor(2, num,
|
||||
60, TimeUnit.SECONDS, new LinkedBlockingQueue<Runnable>(),
|
||||
new Daemon.DaemonFactory() {
|
||||
|
@ -180,8 +180,8 @@ public final class ErasureCodingWorker {
|
|||
EC_RECONSTRUCTION_STRIPED_BLK_THREAD_POOL
|
||||
.submit(new ReconstructAndTransferBlock(reconstructionInfo));
|
||||
} catch (Throwable e) {
|
||||
LOG.warn("Failed to reconstruct striped block "
|
||||
+ reconstructionInfo.getExtendedBlock().getLocalBlock(), e);
|
||||
LOG.warn("Failed to reconstruct striped block {}",
|
||||
reconstructionInfo.getExtendedBlock().getLocalBlock(), e);
|
||||
}
|
||||
}
|
||||
}
|
||||
|
@ -476,12 +476,12 @@ public final class ErasureCodingWorker {
|
|||
// Currently we don't check the acks for packets, this is similar as
|
||||
// block replication.
|
||||
} catch (Throwable e) {
|
||||
LOG.warn("Failed to reconstruct striped block: " + blockGroup, e);
|
||||
LOG.warn("Failed to reconstruct striped block: {}", blockGroup, e);
|
||||
} finally {
|
||||
datanode.decrementXmitsInProgress();
|
||||
// close block readers
|
||||
for (StripedReader stripedReader : stripedReaders) {
|
||||
closeBlockReader(stripedReader.blockReader);
|
||||
IOUtils.closeStream(stripedReader.blockReader);
|
||||
}
|
||||
for (int i = 0; i < targets.length; i++) {
|
||||
IOUtils.closeStream(targetOutputStreams[i]);
|
||||
|
@ -588,7 +588,7 @@ public final class ErasureCodingWorker {
|
|||
// If read failed for some source DN, we should not use it anymore
|
||||
// and schedule read from another source DN.
|
||||
StripedReader failedReader = stripedReaders.get(result.index);
|
||||
closeBlockReader(failedReader.blockReader);
|
||||
IOUtils.closeStream(failedReader.blockReader);
|
||||
failedReader.blockReader = null;
|
||||
resultIndex = scheduleNewRead(used, reconstructLength,
|
||||
corruptionMap);
|
||||
|
@ -609,6 +609,8 @@ public final class ErasureCodingWorker {
|
|||
}
|
||||
} catch (InterruptedException e) {
|
||||
LOG.info("Read data interrupted.", e);
|
||||
cancelReads(futures.keySet());
|
||||
futures.clear();
|
||||
break;
|
||||
}
|
||||
}
|
||||
|
@ -736,7 +738,7 @@ public final class ErasureCodingWorker {
|
|||
StripedReader r = stripedReaders.get(i);
|
||||
toRead = getReadLength(liveIndices[i], reconstructLen);
|
||||
if (toRead > 0) {
|
||||
closeBlockReader(r.blockReader);
|
||||
IOUtils.closeStream(r.blockReader);
|
||||
r.blockReader = newBlockReader(
|
||||
getBlock(blockGroup, liveIndices[i]), positionInBlock,
|
||||
sources[i]);
|
||||
|
@ -784,8 +786,8 @@ public final class ErasureCodingWorker {
|
|||
actualReadFromBlock(reader.blockReader, buf);
|
||||
return null;
|
||||
} catch (ChecksumException e) {
|
||||
LOG.warn("Found Checksum error for " + reader.block + " from "
|
||||
+ reader.source + " at " + e.getPos());
|
||||
LOG.warn("Found Checksum error for {} from {} at {}", reader.block,
|
||||
reader.source, e.getPos());
|
||||
addCorruptedBlock(reader.block, reader.source, corruptionMap);
|
||||
throw e;
|
||||
} catch (IOException e) {
|
||||
|
@ -837,17 +839,6 @@ public final class ErasureCodingWorker {
|
|||
}
|
||||
}
|
||||
|
||||
// close block reader
|
||||
private void closeBlockReader(BlockReader blockReader) {
|
||||
try {
|
||||
if (blockReader != null) {
|
||||
blockReader.close();
|
||||
}
|
||||
} catch (IOException e) {
|
||||
// ignore
|
||||
}
|
||||
}
|
||||
|
||||
private InetSocketAddress getSocketAddress4Transfer(DatanodeInfo dnInfo) {
|
||||
return NetUtils.createSocketAddr(dnInfo.getXferAddr(
|
||||
datanode.getDnConf().getConnectToDnViaHostname()));
|
||||
|
@ -867,8 +858,6 @@ public final class ErasureCodingWorker {
|
|||
* read directly from DN and need to check the replica is FINALIZED
|
||||
* state, notice we should not use short-circuit local read which
|
||||
* requires config for domain-socket in UNIX or legacy config in Windows.
|
||||
*
|
||||
* TODO: add proper tracer
|
||||
*/
|
||||
return RemoteBlockReader2.newBlockReader(
|
||||
"dummy", block, blockToken, offsetInBlock,
|
||||
|
@ -876,6 +865,8 @@ public final class ErasureCodingWorker {
|
|||
"", newConnectedPeer(block, dnAddr, blockToken, dnInfo), dnInfo,
|
||||
null, cachingStrategy, datanode.getTracer());
|
||||
} catch (IOException e) {
|
||||
LOG.debug("Exception while creating remote block reader, datanode {}",
|
||||
dnInfo, e);
|
||||
return null;
|
||||
}
|
||||
}
|
||||
|
|
Loading…
Reference in New Issue