From 51fc96f5cf5d5e1253e65298db32e90ba57402ad Mon Sep 17 00:00:00 2001
From: Kihwal Lee
Date: Thu, 14 Apr 2016 07:59:41 -0500
Subject: [PATCH] HDFS-10282. The VolumeScanner should warn about replica
 files which are misplaced. Contributed by Colin Patrick McCabe.

(cherry picked from commit 0d1c1152f1ce2706f92109bfbdff0d62e98e6797)
---
 .../server/datanode/DirectoryScanner.java     | 14 ++---
 .../hdfs/server/datanode/VolumeScanner.java   |  2 +-
 .../datanode/fsdataset/impl/FsVolumeImpl.java | 12 ++++
 .../server/datanode/FsDatasetTestUtils.java   |  7 +++
 .../server/datanode/TestBlockScanner.java     | 63 +++++++++++++++++++
 .../impl/FsDatasetImplTestUtils.java          | 21 +++++++
 6 files changed, 111 insertions(+), 8 deletions(-)

diff --git a/hadoop-hdfs-project/hadoop-hdfs/src/main/java/org/apache/hadoop/hdfs/server/datanode/DirectoryScanner.java b/hadoop-hdfs-project/hadoop-hdfs/src/main/java/org/apache/hadoop/hdfs/server/datanode/DirectoryScanner.java
index 0e51cecf2b6..1db445e4167 100644
--- a/hadoop-hdfs-project/hadoop-hdfs/src/main/java/org/apache/hadoop/hdfs/server/datanode/DirectoryScanner.java
+++ b/hadoop-hdfs-project/hadoop-hdfs/src/main/java/org/apache/hadoop/hdfs/server/datanode/DirectoryScanner.java
@@ -914,13 +914,13 @@ public class DirectoryScanner implements Runnable {
    */
   private void verifyFileLocation(File actualBlockFile,
       File bpFinalizedDir, long blockId) {
-    File blockDir = DatanodeUtil.idToBlockDir(bpFinalizedDir, blockId);
-    if (actualBlockFile.getParentFile().compareTo(blockDir) != 0) {
-      File expBlockFile = new File(blockDir, actualBlockFile.getName());
-      LOG.warn("Block: " + blockId
-          + " has to be upgraded to block ID-based layout. "
-          + "Actual block file path: " + actualBlockFile
-          + ", expected block file path: " + expBlockFile);
+    File expectedBlockDir =
+        DatanodeUtil.idToBlockDir(bpFinalizedDir, blockId);
+    File actualBlockDir = actualBlockFile.getParentFile();
+    if (actualBlockDir.compareTo(expectedBlockDir) != 0) {
+      LOG.warn("Block: " + blockId
+          + " found in invalid directory. Expected directory: "
+          + expectedBlockDir + ". Actual directory: " + actualBlockDir);
     }
   }
 
diff --git a/hadoop-hdfs-project/hadoop-hdfs/src/main/java/org/apache/hadoop/hdfs/server/datanode/VolumeScanner.java b/hadoop-hdfs-project/hadoop-hdfs/src/main/java/org/apache/hadoop/hdfs/server/datanode/VolumeScanner.java
index d1f2d051760..d0dc9edbc82 100644
--- a/hadoop-hdfs-project/hadoop-hdfs/src/main/java/org/apache/hadoop/hdfs/server/datanode/VolumeScanner.java
+++ b/hadoop-hdfs-project/hadoop-hdfs/src/main/java/org/apache/hadoop/hdfs/server/datanode/VolumeScanner.java
@@ -414,7 +414,7 @@ public class VolumeScanner extends Thread {
       Block b = volume.getDataset().getStoredBlock(
           cblock.getBlockPoolId(), cblock.getBlockId());
       if (b == null) {
-        LOG.info("FileNotFound while finding block {} on volume {}",
+        LOG.info("Replica {} was not found in the VolumeMap for volume {}",
             cblock, volume.getBasePath());
       } else {
         block = new ExtendedBlock(cblock.getBlockPoolId(), b);
diff --git a/hadoop-hdfs-project/hadoop-hdfs/src/main/java/org/apache/hadoop/hdfs/server/datanode/fsdataset/impl/FsVolumeImpl.java b/hadoop-hdfs-project/hadoop-hdfs/src/main/java/org/apache/hadoop/hdfs/server/datanode/fsdataset/impl/FsVolumeImpl.java
index 6971d8055e5..57c39e777a0 100644
--- a/hadoop-hdfs-project/hadoop-hdfs/src/main/java/org/apache/hadoop/hdfs/server/datanode/fsdataset/impl/FsVolumeImpl.java
+++ b/hadoop-hdfs-project/hadoop-hdfs/src/main/java/org/apache/hadoop/hdfs/server/datanode/fsdataset/impl/FsVolumeImpl.java
@@ -697,6 +697,18 @@ public class FsVolumeImpl implements FsVolumeSpi {
         } else {
           ExtendedBlock block = new ExtendedBlock(bpid,
               Block.filename2id(state.curEntry));
+          File expectedBlockDir = DatanodeUtil.idToBlockDir(
+              new File("."), block.getBlockId());
+          File actualBlockDir = Paths.get(".",
+              state.curFinalizedDir, state.curFinalizedSubDir).toFile();
+          if (!expectedBlockDir.equals(actualBlockDir)) {
+            LOG.error("nextBlock({}, {}): block id {} found in invalid " +
+                "directory. Expected directory: {}. " +
+                "Actual directory: {}", storageID, bpid,
+                block.getBlockId(), expectedBlockDir.getPath(),
+                actualBlockDir.getPath());
+            continue;
+          }
           LOG.trace("nextBlock({}, {}): advancing to {}",
               storageID, bpid, block);
           return block;
diff --git a/hadoop-hdfs-project/hadoop-hdfs/src/test/java/org/apache/hadoop/hdfs/server/datanode/FsDatasetTestUtils.java b/hadoop-hdfs-project/hadoop-hdfs/src/test/java/org/apache/hadoop/hdfs/server/datanode/FsDatasetTestUtils.java
index f5bf4e9f6a8..867d6c92155 100644
--- a/hadoop-hdfs-project/hadoop-hdfs/src/test/java/org/apache/hadoop/hdfs/server/datanode/FsDatasetTestUtils.java
+++ b/hadoop-hdfs-project/hadoop-hdfs/src/test/java/org/apache/hadoop/hdfs/server/datanode/FsDatasetTestUtils.java
@@ -135,6 +135,13 @@ public interface FsDatasetTestUtils {
      * @throws IOException I/O error.
      */
     void truncateMeta(long newSize) throws IOException;
+
+    /**
+     * Make the replica unreachable, perhaps by renaming it to an
+     * invalid file name.
+     * @throws IOException On I/O error.
+     */
+    void makeUnreachable() throws IOException;
   }
 
   /**
diff --git a/hadoop-hdfs-project/hadoop-hdfs/src/test/java/org/apache/hadoop/hdfs/server/datanode/TestBlockScanner.java b/hadoop-hdfs-project/hadoop-hdfs/src/test/java/org/apache/hadoop/hdfs/server/datanode/TestBlockScanner.java
index 4628a4651bc..021361b2d8a 100644
--- a/hadoop-hdfs-project/hadoop-hdfs/src/test/java/org/apache/hadoop/hdfs/server/datanode/TestBlockScanner.java
+++ b/hadoop-hdfs-project/hadoop-hdfs/src/test/java/org/apache/hadoop/hdfs/server/datanode/TestBlockScanner.java
@@ -24,6 +24,7 @@ import static org.apache.hadoop.hdfs.server.datanode.BlockScanner.Conf.INTERNAL_
 import static org.apache.hadoop.hdfs.server.datanode.BlockScanner.Conf.INTERNAL_DFS_BLOCK_SCANNER_CURSOR_SAVE_INTERVAL_MS;
 import static org.junit.Assert.assertEquals;
 import static org.junit.Assert.assertTrue;
+import static org.junit.Assert.assertFalse;
 
 import java.io.Closeable;
 import java.io.File;
@@ -38,6 +39,7 @@ import java.util.concurrent.Semaphore;
 import com.google.common.base.Supplier;
 import org.apache.hadoop.hdfs.MiniDFSNNTopology;
 import org.apache.hadoop.hdfs.protocol.ExtendedBlock;
+import org.apache.hadoop.hdfs.server.datanode.FsDatasetTestUtils.MaterializedReplica;
 import org.apache.hadoop.hdfs.server.datanode.fsdataset.FsDatasetSpi;
 import org.apache.hadoop.hdfs.server.datanode.VolumeScanner.ScanResultHandler;
 import org.apache.hadoop.conf.Configuration;
@@ -139,6 +141,11 @@ public class TestBlockScanner {
         throws Exception {
       return DFSTestUtil.getFirstBlock(dfs[nsIdx], getPath(fileIdx));
     }
+
+    public MaterializedReplica getMaterializedReplica(int nsIdx, int fileIdx)
+        throws Exception {
+      return cluster.getMaterializedReplica(0, getFileBlock(nsIdx, fileIdx));
+    }
   }
 
   /**
@@ -806,4 +813,60 @@ public class TestBlockScanner {
       info.blocksScanned = 0;
     }
   }
+
+  /**
+   * Test that blocks which are in the wrong location are ignored.
+   */
+  @Test(timeout=120000)
+  public void testIgnoreMisplacedBlock() throws Exception {
+    Configuration conf = new Configuration();
+    // Set a really long scan period.
+    conf.setLong(DFS_DATANODE_SCAN_PERIOD_HOURS_KEY, 100L);
+    conf.set(INTERNAL_VOLUME_SCANNER_SCAN_RESULT_HANDLER,
+        TestScanResultHandler.class.getName());
+    conf.setLong(INTERNAL_DFS_BLOCK_SCANNER_CURSOR_SAVE_INTERVAL_MS, 0L);
+    final TestContext ctx = new TestContext(conf, 1);
+    final int NUM_FILES = 4;
+    ctx.createFiles(0, NUM_FILES, 5);
+    MaterializedReplica unreachableReplica = ctx.getMaterializedReplica(0, 1);
+    ExtendedBlock unreachableBlock = ctx.getFileBlock(0, 1);
+    unreachableReplica.makeUnreachable();
+    final TestScanResultHandler.Info info =
+        TestScanResultHandler.getInfo(ctx.volumes.get(0));
+    String storageID = ctx.volumes.get(0).getStorageID();
+    synchronized (info) {
+      info.sem = new Semaphore(NUM_FILES);
+      info.shouldRun = true;
+      info.notify();
+    }
+    // Scan the three reachable blocks; the misplaced one is skipped.
+    LOG.info("Waiting for the blocks to be scanned.");
+    GenericTestUtils.waitFor(new Supplier<Boolean>() {
+      @Override
+      public Boolean get() {
+        synchronized (info) {
+          if (info.blocksScanned >= NUM_FILES - 1) {
+            LOG.info("info = {}. blockScanned has now reached " +
+                info.blocksScanned, info);
+            return true;
+          } else {
+            LOG.info("info = {}. Waiting for blockScanned to reach " +
+                (NUM_FILES - 1), info);
+            return false;
+          }
+        }
+      }
+    }, 50, 30000);
+    // We should have scanned the three reachable blocks.
+    synchronized (info) {
+      assertFalse(info.goodBlocks.contains(unreachableBlock));
+      assertFalse(info.badBlocks.contains(unreachableBlock));
+      assertEquals("Expected 3 good blocks.", 3, info.goodBlocks.size());
+      info.goodBlocks.clear();
+      assertEquals("Expected 3 blocksScanned", 3, info.blocksScanned);
+      assertEquals("Did not expect bad blocks.", 0, info.badBlocks.size());
+      info.blocksScanned = 0;
+    }
+    info.sem.release(1);
+  }
 }
diff --git a/hadoop-hdfs-project/hadoop-hdfs/src/test/java/org/apache/hadoop/hdfs/server/datanode/fsdataset/impl/FsDatasetImplTestUtils.java b/hadoop-hdfs-project/hadoop-hdfs/src/test/java/org/apache/hadoop/hdfs/server/datanode/fsdataset/impl/FsDatasetImplTestUtils.java
index f3c740a3200..f780a14f2a8 100644
--- a/hadoop-hdfs-project/hadoop-hdfs/src/test/java/org/apache/hadoop/hdfs/server/datanode/fsdataset/impl/FsDatasetImplTestUtils.java
+++ b/hadoop-hdfs-project/hadoop-hdfs/src/test/java/org/apache/hadoop/hdfs/server/datanode/fsdataset/impl/FsDatasetImplTestUtils.java
@@ -170,6 +170,27 @@ public class FsDatasetImplTestUtils implements FsDatasetTestUtils {
       truncate(metaFile, newSize);
     }
 
+    @Override
+    public void makeUnreachable() throws IOException {
+      long blockId = Block.getBlockId(blockFile.getAbsolutePath());
+      File origDir = blockFile.getParentFile();
+      File root = origDir.getParentFile().getParentFile();
+      File newDir = null;
+      // Keep incrementing the block ID until the block and metadata
+      // files land in a different directory. The low bits of the ID do
+      // not affect directory placement, so this may take several
+      // increments before idToBlockDir() yields a new directory.
+      do {
+        blockId++;
+        newDir = DatanodeUtil.idToBlockDir(root, blockId);
+      } while (origDir.equals(newDir));
+      Files.createDirectories(newDir.toPath());
+      Files.move(blockFile.toPath(),
+          new File(newDir, blockFile.getName()).toPath());
+      Files.move(metaFile.toPath(),
+          new File(newDir, metaFile.getName()).toPath());
+    }
+
     @Override
     public String toString() {
       return String.format("MaterializedReplica: file=%s", blockFile);
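
The checks added above in DirectoryScanner#verifyFileLocation() and FsVolumeImpl#nextBlock() work because a finalized replica's directory is a pure function of its block ID, as computed by DatanodeUtil.idToBlockDir(). The following self-contained Java sketch illustrates that mapping and the resulting placement test; it is a minimal approximation, not the upstream implementation. In particular, the "subdir" prefix and the shift/mask constants assume the 256x256 block-ID-based layout introduced by HDFS-6482 (later releases narrowed it to a 32x32 layout with different constants), and the path in main() is hypothetical.

import java.io.File;

/**
 * Minimal sketch of the misplaced-replica check. Assumes the 256x256
 * block-ID-based layout: two "subdir" levels taken from bits 16-23 and
 * 8-15 of the block ID. Treat the masks below as illustrative.
 */
public class MisplacedReplicaCheck {

  /** Expected directory for a block ID, mirroring DatanodeUtil.idToBlockDir. */
  static File idToBlockDir(File finalizedDir, long blockId) {
    int d1 = (int) ((blockId >> 16) & 0xFF);  // first subdir level
    int d2 = (int) ((blockId >> 8) & 0xFF);   // second subdir level
    return new File(finalizedDir,
        "subdir" + d1 + File.separator + "subdir" + d2);
  }

  /** A replica is misplaced when its parent differs from the ID-derived dir. */
  static boolean isMisplaced(File finalizedDir, File blockFile, long blockId) {
    return !idToBlockDir(finalizedDir, blockId)
        .equals(blockFile.getParentFile());
  }

  public static void main(String[] args) {
    File finalized = new File("/tmp/dn/finalized");  // hypothetical path
    long blockId = 1073741825L;
    // A replica sitting in its computed directory passes the check.
    File placed = new File(idToBlockDir(finalized, blockId), "blk_" + blockId);
    System.out.println(isMisplaced(finalized, placed, blockId));  // false
    // Shifting it into a neighboring bucket, as makeUnreachable() does by
    // incrementing the ID, makes the check fail and the scanner skips it.
    File moved = new File(idToBlockDir(finalized, blockId + 256),
        "blk_" + blockId);
    System.out.println(isMisplaced(finalized, moved, blockId));  // true
  }
}

Because both the expected and the actual directory are derived from data the block iterator already holds (the block ID plus state.curFinalizedDir and state.curFinalizedSubDir), the scanner detects a misplaced replica without extra disk I/O and simply logs an error and continues past it, which is what testIgnoreMisplacedBlock verifies.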