HDFS-9869. Erasure Coding: Rename replication-based names in BlockManager to more generic [part-2]. Contributed by Rakesh R.

This commit is contained in:
Zhe Zhang 2016-04-25 22:01:54 -07:00
parent 8eadd7145e
commit 5865fe2bf0
30 changed files with 253 additions and 241 deletions

View File

@ -45,7 +45,8 @@ The following table lists the configuration property names that are deprecated i
| dfs.replication.considerLoad | dfs.namenode.replication.considerLoad | | dfs.replication.considerLoad | dfs.namenode.replication.considerLoad |
| dfs.replication.interval | dfs.namenode.replication.interval | | dfs.replication.interval | dfs.namenode.replication.interval |
| dfs.replication.min | dfs.namenode.replication.min | | dfs.replication.min | dfs.namenode.replication.min |
| dfs.replication.pending.timeout.sec | dfs.namenode.replication.pending.timeout-sec | | dfs.replication.pending.timeout.sec | dfs.namenode.reconstruction.pending.timeout-sec |
| dfs.namenode.replication.pending.timeout-sec | dfs.namenode.reconstruction.pending.timeout-sec |
| dfs.safemode.extension | dfs.namenode.safemode.extension | | dfs.safemode.extension | dfs.namenode.safemode.extension |
| dfs.safemode.threshold.pct | dfs.namenode.safemode.threshold-pct | | dfs.safemode.threshold.pct | dfs.namenode.safemode.threshold-pct |
| dfs.secondary.http.address | dfs.namenode.secondary.http-address | | dfs.secondary.http.address | dfs.namenode.secondary.http-address |

View File

@ -120,7 +120,9 @@ public class HdfsConfiguration extends Configuration {
new DeprecationDelta("dfs.replication.min", new DeprecationDelta("dfs.replication.min",
DeprecatedKeys.DFS_NAMENODE_REPLICATION_MIN_KEY), DeprecatedKeys.DFS_NAMENODE_REPLICATION_MIN_KEY),
new DeprecationDelta("dfs.replication.pending.timeout.sec", new DeprecationDelta("dfs.replication.pending.timeout.sec",
DeprecatedKeys.DFS_NAMENODE_REPLICATION_PENDING_TIMEOUT_SEC_KEY), DeprecatedKeys.DFS_NAMENODE_RECONSTRUCTION_PENDING_TIMEOUT_SEC_KEY),
new DeprecationDelta("dfs.namenode.replication.pending.timeout-sec",
DeprecatedKeys.DFS_NAMENODE_RECONSTRUCTION_PENDING_TIMEOUT_SEC_KEY),
new DeprecationDelta("dfs.max-repl-streams", new DeprecationDelta("dfs.max-repl-streams",
DeprecatedKeys.DFS_NAMENODE_REPLICATION_MAX_STREAMS_KEY), DeprecatedKeys.DFS_NAMENODE_REPLICATION_MAX_STREAMS_KEY),
new DeprecationDelta("dfs.permissions", new DeprecationDelta("dfs.permissions",

View File

@ -216,8 +216,8 @@ public interface HdfsClientConfigKeys {
String DFS_NAMENODE_REPLICATION_INTERVAL_KEY = String DFS_NAMENODE_REPLICATION_INTERVAL_KEY =
"dfs.namenode.replication.interval"; "dfs.namenode.replication.interval";
String DFS_NAMENODE_REPLICATION_MIN_KEY = "dfs.namenode.replication.min"; String DFS_NAMENODE_REPLICATION_MIN_KEY = "dfs.namenode.replication.min";
String DFS_NAMENODE_REPLICATION_PENDING_TIMEOUT_SEC_KEY = String DFS_NAMENODE_RECONSTRUCTION_PENDING_TIMEOUT_SEC_KEY =
"dfs.namenode.replication.pending.timeout-sec"; "dfs.namenode.reconstruction.pending.timeout-sec";
String DFS_NAMENODE_REPLICATION_MAX_STREAMS_KEY = String DFS_NAMENODE_REPLICATION_MAX_STREAMS_KEY =
"dfs.namenode.replication.max-streams"; "dfs.namenode.replication.max-streams";
String DFS_PERMISSIONS_ENABLED_KEY = "dfs.permissions.enabled"; String DFS_PERMISSIONS_ENABLED_KEY = "dfs.permissions.enabled";

View File

@ -213,9 +213,11 @@ public class DFSConfigKeys extends CommonConfigurationKeys {
public static final int DFS_NAMENODE_STRIPE_MIN_DEFAULT = 1; public static final int DFS_NAMENODE_STRIPE_MIN_DEFAULT = 1;
public static final String DFS_NAMENODE_SAFEMODE_REPLICATION_MIN_KEY = public static final String DFS_NAMENODE_SAFEMODE_REPLICATION_MIN_KEY =
"dfs.namenode.safemode.replication.min"; "dfs.namenode.safemode.replication.min";
public static final String DFS_NAMENODE_REPLICATION_PENDING_TIMEOUT_SEC_KEY =
HdfsClientConfigKeys.DeprecatedKeys.DFS_NAMENODE_REPLICATION_PENDING_TIMEOUT_SEC_KEY; public static final String DFS_NAMENODE_RECONSTRUCTION_PENDING_TIMEOUT_SEC_KEY =
public static final int DFS_NAMENODE_REPLICATION_PENDING_TIMEOUT_SEC_DEFAULT = -1; "dfs.namenode.reconstruction.pending.timeout-sec";
public static final int DFS_NAMENODE_RECONSTRUCTION_PENDING_TIMEOUT_SEC_DEFAULT = -1;
public static final String DFS_NAMENODE_REPLICATION_MAX_STREAMS_KEY = public static final String DFS_NAMENODE_REPLICATION_MAX_STREAMS_KEY =
HdfsClientConfigKeys.DeprecatedKeys.DFS_NAMENODE_REPLICATION_MAX_STREAMS_KEY; HdfsClientConfigKeys.DeprecatedKeys.DFS_NAMENODE_REPLICATION_MAX_STREAMS_KEY;
public static final int DFS_NAMENODE_REPLICATION_MAX_STREAMS_DEFAULT = 2; public static final int DFS_NAMENODE_REPLICATION_MAX_STREAMS_DEFAULT = 2;

View File

@ -147,7 +147,7 @@ public class BlockManager implements BlockStatsMXBean {
private final PendingDataNodeMessages pendingDNMessages = private final PendingDataNodeMessages pendingDNMessages =
new PendingDataNodeMessages(); new PendingDataNodeMessages();
private volatile long pendingReplicationBlocksCount = 0L; private volatile long pendingReconstructionBlocksCount = 0L;
private volatile long corruptReplicaBlocksCount = 0L; private volatile long corruptReplicaBlocksCount = 0L;
private volatile long lowRedundancyBlocksCount = 0L; private volatile long lowRedundancyBlocksCount = 0L;
private volatile long scheduledReplicationBlocksCount = 0L; private volatile long scheduledReplicationBlocksCount = 0L;
@ -161,8 +161,8 @@ public class BlockManager implements BlockStatsMXBean {
private ObjectName mxBeanName; private ObjectName mxBeanName;
/** Used by metrics */ /** Used by metrics */
public long getPendingReplicationBlocksCount() { public long getPendingReconstructionBlocksCount() {
return pendingReplicationBlocksCount; return pendingReconstructionBlocksCount;
} }
/** Used by metrics */ /** Used by metrics */
public long getUnderReplicatedBlocksCount() { public long getUnderReplicatedBlocksCount() {
@ -186,7 +186,7 @@ public class BlockManager implements BlockStatsMXBean {
} }
/** Used by metrics */ /** Used by metrics */
public long getExcessBlocksCount() { public long getExcessBlocksCount() {
return excessReplicas.size(); return excessRedundancyMap.size();
} }
/** Used by metrics */ /** Used by metrics */
public long getPostponedMisreplicatedBlocksCount() { public long getPostponedMisreplicatedBlocksCount() {
@ -246,7 +246,8 @@ public class BlockManager implements BlockStatsMXBean {
* Maps a StorageID to the set of blocks that are "extra" for this * Maps a StorageID to the set of blocks that are "extra" for this
* DataNode. We'll eventually remove these extras. * DataNode. We'll eventually remove these extras.
*/ */
private final ExcessReplicaMap excessReplicas = new ExcessReplicaMap(); private final ExcessRedundancyMap excessRedundancyMap =
new ExcessRedundancyMap();
/** /**
* Store set of Blocks that need to be replicated 1 or more times. * Store set of Blocks that need to be replicated 1 or more times.
@ -256,7 +257,7 @@ public class BlockManager implements BlockStatsMXBean {
new LowRedundancyBlocks(); new LowRedundancyBlocks();
@VisibleForTesting @VisibleForTesting
final PendingReplicationBlocks pendingReplications; final PendingReconstructionBlocks pendingReconstruction;
/** The maximum number of replicas allowed for a block */ /** The maximum number of replicas allowed for a block */
public final short maxReplication; public final short maxReplication;
@ -352,9 +353,10 @@ public class BlockManager implements BlockStatsMXBean {
datanodeManager.getNetworkTopology(), datanodeManager.getNetworkTopology(),
datanodeManager.getHost2DatanodeMap()); datanodeManager.getHost2DatanodeMap());
storagePolicySuite = BlockStoragePolicySuite.createDefaultSuite(); storagePolicySuite = BlockStoragePolicySuite.createDefaultSuite();
pendingReplications = new PendingReplicationBlocks(conf.getInt( pendingReconstruction = new PendingReconstructionBlocks(conf.getInt(
DFSConfigKeys.DFS_NAMENODE_REPLICATION_PENDING_TIMEOUT_SEC_KEY, DFSConfigKeys.DFS_NAMENODE_RECONSTRUCTION_PENDING_TIMEOUT_SEC_KEY,
DFSConfigKeys.DFS_NAMENODE_REPLICATION_PENDING_TIMEOUT_SEC_DEFAULT) * 1000L); DFSConfigKeys.DFS_NAMENODE_RECONSTRUCTION_PENDING_TIMEOUT_SEC_DEFAULT)
* 1000L);
blockTokenSecretManager = createBlockTokenSecretManager(conf); blockTokenSecretManager = createBlockTokenSecretManager(conf);
@ -542,7 +544,7 @@ public class BlockManager implements BlockStatsMXBean {
} }
public void activate(Configuration conf, long blockTotal) { public void activate(Configuration conf, long blockTotal) {
pendingReplications.start(); pendingReconstruction.start();
datanodeManager.activate(conf); datanodeManager.activate(conf);
this.replicationThread.setName("ReplicationMonitor"); this.replicationThread.setName("ReplicationMonitor");
this.replicationThread.start(); this.replicationThread.start();
@ -565,7 +567,7 @@ public class BlockManager implements BlockStatsMXBean {
} catch (InterruptedException ie) { } catch (InterruptedException ie) {
} }
datanodeManager.close(); datanodeManager.close();
pendingReplications.stop(); pendingReconstruction.stop();
blocksMap.close(); blocksMap.close();
} }
@ -604,8 +606,8 @@ public class BlockManager implements BlockStatsMXBean {
dumpBlockMeta(block, out); dumpBlockMeta(block, out);
} }
// Dump blocks from pendingReplication // Dump blocks from pendingReconstruction
pendingReplications.metaSave(out); pendingReconstruction.metaSave(out);
// Dump blocks that are waiting to be deleted // Dump blocks that are waiting to be deleted
invalidateBlocks.dump(out); invalidateBlocks.dump(out);
@ -765,7 +767,7 @@ public class BlockManager implements BlockStatsMXBean {
/** /**
* If IBR is not sent from expected locations yet, add the datanodes to * If IBR is not sent from expected locations yet, add the datanodes to
* pendingReplications in order to keep ReplicationMonitor from scheduling * pendingReconstruction in order to keep ReplicationMonitor from scheduling
* the block. * the block.
*/ */
public void addExpectedReplicasToPending(BlockInfo blk) { public void addExpectedReplicasToPending(BlockInfo blk) {
@ -780,7 +782,7 @@ public class BlockManager implements BlockStatsMXBean {
pendingNodes.add(dnd); pendingNodes.add(dnd);
} }
} }
pendingReplications.increment(blk, pendingReconstruction.increment(blk,
pendingNodes.toArray(new DatanodeDescriptor[pendingNodes.size()])); pendingNodes.toArray(new DatanodeDescriptor[pendingNodes.size()]));
} }
} }
@ -866,7 +868,7 @@ public class BlockManager implements BlockStatsMXBean {
neededReconstruction.remove(lastBlock, replicas.liveReplicas(), neededReconstruction.remove(lastBlock, replicas.liveReplicas(),
replicas.readOnlyReplicas(), replicas.readOnlyReplicas(),
replicas.decommissionedAndDecommissioning(), getReplication(lastBlock)); replicas.decommissionedAndDecommissioning(), getReplication(lastBlock));
pendingReplications.remove(lastBlock); pendingReconstruction.remove(lastBlock);
// remove this block from the list of pending blocks to be deleted. // remove this block from the list of pending blocks to be deleted.
for (DatanodeStorageInfo storage : targets) { for (DatanodeStorageInfo storage : targets) {
@ -1435,7 +1437,7 @@ public class BlockManager implements BlockStatsMXBean {
void updateState() { void updateState() {
pendingReplicationBlocksCount = pendingReplications.size(); pendingReconstructionBlocksCount = pendingReconstruction.size();
lowRedundancyBlocksCount = neededReconstruction.size(); lowRedundancyBlocksCount = neededReconstruction.size();
corruptReplicaBlocksCount = corruptReplicas.size(); corruptReplicaBlocksCount = corruptReplicas.size();
} }
@ -1578,8 +1580,8 @@ public class BlockManager implements BlockStatsMXBean {
} }
blockLog.debug( blockLog.debug(
"BLOCK* neededReconstruction = {} pendingReplications = {}", "BLOCK* neededReconstruction = {} pendingReconstruction = {}",
neededReconstruction.size(), pendingReplications.size()); neededReconstruction.size(), pendingReconstruction.size());
} }
return scheduledWork; return scheduledWork;
@ -1622,7 +1624,7 @@ public class BlockManager implements BlockStatsMXBean {
// not included in the numReplicas.liveReplicas() count // not included in the numReplicas.liveReplicas() count
assert liveReplicaNodes.size() >= numReplicas.liveReplicas(); assert liveReplicaNodes.size() >= numReplicas.liveReplicas();
int pendingNum = pendingReplications.getNumReplicas(block); int pendingNum = pendingReconstruction.getNumReplicas(block);
if (hasEnoughEffectiveReplicas(block, numReplicas, pendingNum, if (hasEnoughEffectiveReplicas(block, numReplicas, pendingNum,
requiredReplication)) { requiredReplication)) {
neededReconstruction.remove(block, priority); neededReconstruction.remove(block, priority);
@ -1690,7 +1692,7 @@ public class BlockManager implements BlockStatsMXBean {
// do not schedule more if enough replicas is already pending // do not schedule more if enough replicas is already pending
final short requiredReplication = getExpectedReplicaNum(block); final short requiredReplication = getExpectedReplicaNum(block);
NumberReplicas numReplicas = countNodes(block); NumberReplicas numReplicas = countNodes(block);
final int pendingNum = pendingReplications.getNumReplicas(block); final int pendingNum = pendingReconstruction.getNumReplicas(block);
if (hasEnoughEffectiveReplicas(block, numReplicas, pendingNum, if (hasEnoughEffectiveReplicas(block, numReplicas, pendingNum,
requiredReplication)) { requiredReplication)) {
neededReconstruction.remove(block, priority); neededReconstruction.remove(block, priority);
@ -1718,8 +1720,8 @@ public class BlockManager implements BlockStatsMXBean {
// Move the block-replication into a "pending" state. // Move the block-replication into a "pending" state.
// The reason we use 'pending' is so we can retry // The reason we use 'pending' is so we can retry
// replications that fail after an appropriate amount of time. // reconstructions that fail after an appropriate amount of time.
pendingReplications.increment(block, pendingReconstruction.increment(block,
DatanodeStorageInfo.toDatanodeDescriptors(targets)); DatanodeStorageInfo.toDatanodeDescriptors(targets));
blockLog.debug("BLOCK* block {} is moved from neededReplications to " blockLog.debug("BLOCK* block {} is moved from neededReplications to "
+ "pendingReplications", block); + "pendingReplications", block);
@ -1907,11 +1909,11 @@ public class BlockManager implements BlockStatsMXBean {
} }
/** /**
* If there were any replication requests that timed out, reap them * If there were any reconstruction requests that timed out, reap them
* and put them back into the neededReplication queue * and put them back into the neededReconstruction queue
*/ */
private void processPendingReplications() { private void processPendingReconstructions() {
BlockInfo[] timedOutItems = pendingReplications.getTimedOutBlocks(); BlockInfo[] timedOutItems = pendingReconstruction.getTimedOutBlocks();
if (timedOutItems != null) { if (timedOutItems != null) {
namesystem.writeLock(); namesystem.writeLock();
try { try {
@ -2890,7 +2892,7 @@ public class BlockManager implements BlockStatsMXBean {
// Now check for completion of blocks and safe block count // Now check for completion of blocks and safe block count
NumberReplicas num = countNodes(storedBlock); NumberReplicas num = countNodes(storedBlock);
int numLiveReplicas = num.liveReplicas(); int numLiveReplicas = num.liveReplicas();
int pendingNum = pendingReplications.getNumReplicas(storedBlock); int pendingNum = pendingReconstruction.getNumReplicas(storedBlock);
int numCurrentReplica = numLiveReplicas + pendingNum; int numCurrentReplica = numLiveReplicas + pendingNum;
if(storedBlock.getBlockUCState() == BlockUCState.COMMITTED && if(storedBlock.getBlockUCState() == BlockUCState.COMMITTED &&
@ -3203,8 +3205,8 @@ public class BlockManager implements BlockStatsMXBean {
/** /**
* Find how many of the containing nodes are "extra", if any. * Find how many of the containing nodes are "extra", if any.
* If there are any extras, call chooseExcessReplicates() to * If there are any extras, call chooseExcessRedundancies() to
* mark them in the excessReplicateMap. * mark them in the excessRedundancyMap.
*/ */
private void processExtraRedundancyBlock(final BlockInfo block, private void processExtraRedundancyBlock(final BlockInfo block,
final short replication, final DatanodeDescriptor addedNode, final short replication, final DatanodeDescriptor addedNode,
@ -3237,11 +3239,11 @@ public class BlockManager implements BlockStatsMXBean {
} }
} }
} }
chooseExcessReplicates(nonExcess, block, replication, addedNode, chooseExcessRedundancies(nonExcess, block, replication, addedNode,
delNodeHint); delNodeHint);
} }
private void chooseExcessReplicates( private void chooseExcessRedundancies(
final Collection<DatanodeStorageInfo> nonExcess, final Collection<DatanodeStorageInfo> nonExcess,
BlockInfo storedBlock, short replication, BlockInfo storedBlock, short replication,
DatanodeDescriptor addedNode, DatanodeDescriptor addedNode,
@ -3250,19 +3252,19 @@ public class BlockManager implements BlockStatsMXBean {
// first form a rack to datanodes map and // first form a rack to datanodes map and
BlockCollection bc = getBlockCollection(storedBlock); BlockCollection bc = getBlockCollection(storedBlock);
if (storedBlock.isStriped()) { if (storedBlock.isStriped()) {
chooseExcessReplicasStriped(bc, nonExcess, storedBlock, delNodeHint); chooseExcessRedundancyStriped(bc, nonExcess, storedBlock, delNodeHint);
} else { } else {
final BlockStoragePolicy storagePolicy = storagePolicySuite.getPolicy( final BlockStoragePolicy storagePolicy = storagePolicySuite.getPolicy(
bc.getStoragePolicyID()); bc.getStoragePolicyID());
final List<StorageType> excessTypes = storagePolicy.chooseExcess( final List<StorageType> excessTypes = storagePolicy.chooseExcess(
replication, DatanodeStorageInfo.toStorageTypes(nonExcess)); replication, DatanodeStorageInfo.toStorageTypes(nonExcess));
chooseExcessReplicasContiguous(nonExcess, storedBlock, replication, chooseExcessRedundancyContiguous(nonExcess, storedBlock, replication,
addedNode, delNodeHint, excessTypes); addedNode, delNodeHint, excessTypes);
} }
} }
/** /**
* We want "replication" replicates for the block, but we now have too many. * We want sufficient redundancy for the block, but we now have too many.
* In this method, copy enough nodes from 'srcNodes' into 'dstNodes' such that: * In this method, copy enough nodes from 'srcNodes' into 'dstNodes' such that:
* *
* srcNodes.size() - dstNodes.size() == replication * srcNodes.size() - dstNodes.size() == replication
@ -3275,7 +3277,7 @@ public class BlockManager implements BlockStatsMXBean {
* If no such a node is available, * If no such a node is available,
* then pick a node with least free space * then pick a node with least free space
*/ */
private void chooseExcessReplicasContiguous( private void chooseExcessRedundancyContiguous(
final Collection<DatanodeStorageInfo> nonExcess, BlockInfo storedBlock, final Collection<DatanodeStorageInfo> nonExcess, BlockInfo storedBlock,
short replication, DatanodeDescriptor addedNode, short replication, DatanodeDescriptor addedNode,
DatanodeDescriptor delNodeHint, List<StorageType> excessTypes) { DatanodeDescriptor delNodeHint, List<StorageType> excessTypes) {
@ -3284,7 +3286,7 @@ public class BlockManager implements BlockStatsMXBean {
.chooseReplicasToDelete(nonExcess, nonExcess, replication, excessTypes, .chooseReplicasToDelete(nonExcess, nonExcess, replication, excessTypes,
addedNode, delNodeHint); addedNode, delNodeHint);
for (DatanodeStorageInfo choosenReplica : replicasToDelete) { for (DatanodeStorageInfo choosenReplica : replicasToDelete) {
processChosenExcessReplica(nonExcess, choosenReplica, storedBlock); processChosenExcessRedundancy(nonExcess, choosenReplica, storedBlock);
} }
} }
@ -3297,7 +3299,7 @@ public class BlockManager implements BlockStatsMXBean {
* The block placement policy will make sure that the left internal blocks are * The block placement policy will make sure that the left internal blocks are
* spread across racks and also try hard to pick one with least free space. * spread across racks and also try hard to pick one with least free space.
*/ */
private void chooseExcessReplicasStriped(BlockCollection bc, private void chooseExcessRedundancyStriped(BlockCollection bc,
final Collection<DatanodeStorageInfo> nonExcess, final Collection<DatanodeStorageInfo> nonExcess,
BlockInfo storedBlock, BlockInfo storedBlock,
DatanodeDescriptor delNodeHint) { DatanodeDescriptor delNodeHint) {
@ -3325,7 +3327,7 @@ public class BlockManager implements BlockStatsMXBean {
if (delStorageHint != null) { if (delStorageHint != null) {
Integer index = storage2index.get(delStorageHint); Integer index = storage2index.get(delStorageHint);
if (index != null && duplicated.get(index)) { if (index != null && duplicated.get(index)) {
processChosenExcessReplica(nonExcess, delStorageHint, storedBlock); processChosenExcessRedundancy(nonExcess, delStorageHint, storedBlock);
} }
} }
@ -3357,7 +3359,7 @@ public class BlockManager implements BlockStatsMXBean {
.chooseReplicasToDelete(nonExcess, candidates, (short) 1, .chooseReplicasToDelete(nonExcess, candidates, (short) 1,
excessTypes, null, null); excessTypes, null, null);
for (DatanodeStorageInfo chosen : replicasToDelete) { for (DatanodeStorageInfo chosen : replicasToDelete) {
processChosenExcessReplica(nonExcess, chosen, storedBlock); processChosenExcessRedundancy(nonExcess, chosen, storedBlock);
candidates.remove(chosen); candidates.remove(chosen);
} }
} }
@ -3365,11 +3367,11 @@ public class BlockManager implements BlockStatsMXBean {
} }
} }
private void processChosenExcessReplica( private void processChosenExcessRedundancy(
final Collection<DatanodeStorageInfo> nonExcess, final Collection<DatanodeStorageInfo> nonExcess,
final DatanodeStorageInfo chosen, BlockInfo storedBlock) { final DatanodeStorageInfo chosen, BlockInfo storedBlock) {
nonExcess.remove(chosen); nonExcess.remove(chosen);
excessReplicas.add(chosen.getDatanodeDescriptor(), storedBlock); excessRedundancyMap.add(chosen.getDatanodeDescriptor(), storedBlock);
// //
// The 'excessblocks' tracks blocks until we get confirmation // The 'excessblocks' tracks blocks until we get confirmation
// that the datanode has deleted them; the only way we remove them // that the datanode has deleted them; the only way we remove them
@ -3381,7 +3383,7 @@ public class BlockManager implements BlockStatsMXBean {
// //
final Block blockToInvalidate = getBlockOnStorage(storedBlock, chosen); final Block blockToInvalidate = getBlockOnStorage(storedBlock, chosen);
addToInvalidates(blockToInvalidate, chosen.getDatanodeDescriptor()); addToInvalidates(blockToInvalidate, chosen.getDatanodeDescriptor());
blockLog.debug("BLOCK* chooseExcessReplicates: " blockLog.debug("BLOCK* chooseExcessRedundancies: "
+ "({}, {}) is added to invalidated blocks set", chosen, storedBlock); + "({}, {}) is added to invalidated blocks set", chosen, storedBlock);
} }
@ -3433,7 +3435,7 @@ public class BlockManager implements BlockStatsMXBean {
updateNeededReconstructions(storedBlock, -1, 0); updateNeededReconstructions(storedBlock, -1, 0);
} }
excessReplicas.remove(node, storedBlock); excessRedundancyMap.remove(node, storedBlock);
corruptReplicas.removeFromCorruptReplicasMap(storedBlock, node); corruptReplicas.removeFromCorruptReplicasMap(storedBlock, node);
} }
} }
@ -3504,7 +3506,7 @@ public class BlockManager implements BlockStatsMXBean {
// //
BlockInfo storedBlock = getStoredBlock(block); BlockInfo storedBlock = getStoredBlock(block);
if (storedBlock != null) { if (storedBlock != null) {
pendingReplications.decrement(storedBlock, node); pendingReconstruction.decrement(storedBlock, node);
} }
processAndHandleReportedBlock(storageInfo, block, ReplicaState.FINALIZED, processAndHandleReportedBlock(storageInfo, block, ReplicaState.FINALIZED,
delHintNode); delHintNode);
@ -3749,11 +3751,11 @@ public class BlockManager implements BlockStatsMXBean {
@VisibleForTesting @VisibleForTesting
int getExcessSize4Testing(String dnUuid) { int getExcessSize4Testing(String dnUuid) {
return excessReplicas.getSize4Testing(dnUuid); return excessRedundancyMap.getSize4Testing(dnUuid);
} }
public boolean isExcess(DatanodeDescriptor dn, BlockInfo blk) { public boolean isExcess(DatanodeDescriptor dn, BlockInfo blk) {
return excessReplicas.contains(dn, blk); return excessRedundancyMap.contains(dn, blk);
} }
/** /**
@ -3813,7 +3815,7 @@ public class BlockManager implements BlockStatsMXBean {
} }
updateState(); updateState();
if (pendingReplicationBlocksCount == 0 && if (pendingReconstructionBlocksCount == 0 &&
lowRedundancyBlocksCount == 0) { lowRedundancyBlocksCount == 0) {
LOG.info("Node {} is dead and there are no low redundancy" + LOG.info("Node {} is dead and there are no low redundancy" +
" blocks or blocks pending reconstruction. Safe to decommission.", " blocks or blocks pending reconstruction. Safe to decommission.",
@ -3860,8 +3862,8 @@ public class BlockManager implements BlockStatsMXBean {
block.setNumBytes(BlockCommand.NO_ACK); block.setNumBytes(BlockCommand.NO_ACK);
addToInvalidates(block); addToInvalidates(block);
removeBlockFromMap(block); removeBlockFromMap(block);
// Remove the block from pendingReplications and neededReconstruction // Remove the block from pendingReconstruction and neededReconstruction
pendingReplications.remove(block); pendingReconstruction.remove(block);
neededReconstruction.remove(block, LowRedundancyBlocks.LEVEL); neededReconstruction.remove(block, LowRedundancyBlocks.LEVEL);
if (postponedMisreplicatedBlocks.remove(block)) { if (postponedMisreplicatedBlocks.remove(block)) {
postponedMisreplicatedBlocksCount.decrementAndGet(); postponedMisreplicatedBlocksCount.decrementAndGet();
@ -3919,7 +3921,7 @@ public class BlockManager implements BlockStatsMXBean {
for (BlockInfo block : bc.getBlocks()) { for (BlockInfo block : bc.getBlocks()) {
short expected = getExpectedReplicaNum(block); short expected = getExpectedReplicaNum(block);
final NumberReplicas n = countNodes(block); final NumberReplicas n = countNodes(block);
final int pending = pendingReplications.getNumReplicas(block); final int pending = pendingReconstruction.getNumReplicas(block);
if (!hasEnoughEffectiveReplicas(block, n, pending, expected)) { if (!hasEnoughEffectiveReplicas(block, n, pending, expected)) {
neededReconstruction.add(block, n.liveReplicas() + pending, neededReconstruction.add(block, n.liveReplicas() + pending,
n.readOnlyReplicas(), n.readOnlyReplicas(),
@ -4059,7 +4061,7 @@ public class BlockManager implements BlockStatsMXBean {
public void removeBlockFromMap(BlockInfo block) { public void removeBlockFromMap(BlockInfo block) {
for(DatanodeStorageInfo info : blocksMap.getStorages(block)) { for(DatanodeStorageInfo info : blocksMap.getStorages(block)) {
excessReplicas.remove(info.getDatanodeDescriptor(), block); excessRedundancyMap.remove(info.getDatanodeDescriptor(), block);
} }
blocksMap.removeBlock(block); blocksMap.removeBlock(block);
@ -4110,7 +4112,7 @@ public class BlockManager implements BlockStatsMXBean {
// Process replication work only when active NN is out of safe mode. // Process replication work only when active NN is out of safe mode.
if (isPopulatingReplQueues()) { if (isPopulatingReplQueues()) {
computeDatanodeWork(); computeDatanodeWork();
processPendingReplications(); processPendingReconstructions();
rescanPostponedMisreplicatedBlocks(); rescanPostponedMisreplicatedBlocks();
} }
Thread.sleep(replicationRecheckInterval); Thread.sleep(replicationRecheckInterval);
@ -4258,8 +4260,8 @@ public class BlockManager implements BlockStatsMXBean {
*/ */
public void clearQueues() { public void clearQueues() {
neededReconstruction.clear(); neededReconstruction.clear();
pendingReplications.clear(); pendingReconstruction.clear();
excessReplicas.clear(); excessRedundancyMap.clear();
invalidateBlocks.clear(); invalidateBlocks.clear();
datanodeManager.clearPendingQueues(); datanodeManager.clearPendingQueues();
postponedMisreplicatedBlocks.clear(); postponedMisreplicatedBlocks.clear();

View File

@ -541,7 +541,7 @@ public class DecommissionManager {
// pending // pending
if (blockManager.isNeededReconstruction(block, liveReplicas)) { if (blockManager.isNeededReconstruction(block, liveReplicas)) {
if (!blockManager.neededReconstruction.contains(block) && if (!blockManager.neededReconstruction.contains(block) &&
blockManager.pendingReplications.getNumReplicas(block) == 0 && blockManager.pendingReconstruction.getNumReplicas(block) == 0 &&
blockManager.isPopulatingReplQueues()) { blockManager.isPopulatingReplQueues()) {
// Process these blocks only when active NN is out of safe mode. // Process these blocks only when active NN is out of safe mode.
blockManager.neededReconstruction.add(block, blockManager.neededReconstruction.add(block,

View File

@ -28,22 +28,26 @@ import org.slf4j.Logger;
import com.google.common.annotations.VisibleForTesting; import com.google.common.annotations.VisibleForTesting;
/** /**
* Maps a datnode to the set of excess replicas. * Maps a datnode to the set of excess redundancy details.
* *
* This class is thread safe. * This class is thread safe.
*/ */
class ExcessReplicaMap { class ExcessRedundancyMap {
public static final Logger blockLog = NameNode.blockStateChangeLog; public static final Logger blockLog = NameNode.blockStateChangeLog;
private final Map<String, LightWeightHashSet<BlockInfo>> map =new HashMap<>(); private final Map<String, LightWeightHashSet<BlockInfo>> map =new HashMap<>();
private final AtomicLong size = new AtomicLong(0L); private final AtomicLong size = new AtomicLong(0L);
/** @return the number of replicas in this map. */ /**
* @return the number of redundancies in this map.
*/
long size() { long size() {
return size.get(); return size.get();
} }
/** @return the number of replicas corresponding to the given datanode. */ /**
* @return the number of redundancies corresponding to the given datanode.
*/
@VisibleForTesting @VisibleForTesting
synchronized int getSize4Testing(String dnUuid) { synchronized int getSize4Testing(String dnUuid) {
final LightWeightHashSet<BlockInfo> set = map.get(dnUuid); final LightWeightHashSet<BlockInfo> set = map.get(dnUuid);
@ -56,7 +60,7 @@ class ExcessReplicaMap {
} }
/** /**
* @return does this map contains a replica corresponding to the given * @return does this map contains a redundancy corresponding to the given
* datanode and the given block? * datanode and the given block?
*/ */
synchronized boolean contains(DatanodeDescriptor dn, BlockInfo blk) { synchronized boolean contains(DatanodeDescriptor dn, BlockInfo blk) {
@ -65,7 +69,9 @@ class ExcessReplicaMap {
} }
/** /**
* Add the replica of the given block stored in the given datanode to the map. * Add the redundancy of the given block stored in the given datanode to the
* map.
*
* @return true if the block is added. * @return true if the block is added.
*/ */
synchronized boolean add(DatanodeDescriptor dn, BlockInfo blk) { synchronized boolean add(DatanodeDescriptor dn, BlockInfo blk) {
@ -77,13 +83,15 @@ class ExcessReplicaMap {
final boolean added = set.add(blk); final boolean added = set.add(blk);
if (added) { if (added) {
size.incrementAndGet(); size.incrementAndGet();
blockLog.debug("BLOCK* ExcessReplicaMap.add({}, {})", dn, blk); blockLog.debug("BLOCK* ExcessRedundancyMap.add({}, {})", dn, blk);
} }
return added; return added;
} }
/** /**
* Remove the replica corresponding to the given datanode and the given block. * Remove the redundancy corresponding to the given datanode and the given
* block.
*
* @return true if the block is removed. * @return true if the block is removed.
*/ */
synchronized boolean remove(DatanodeDescriptor dn, BlockInfo blk) { synchronized boolean remove(DatanodeDescriptor dn, BlockInfo blk) {
@ -95,7 +103,7 @@ class ExcessReplicaMap {
final boolean removed = set.remove(blk); final boolean removed = set.remove(blk);
if (removed) { if (removed) {
size.decrementAndGet(); size.decrementAndGet();
blockLog.debug("BLOCK* ExcessReplicaMap.remove({}, {})", dn, blk); blockLog.debug("BLOCK* ExcessRedundancyMap.remove({}, {})", dn, blk);
if (set.isEmpty()) { if (set.isEmpty()) {
map.remove(dn.getDatanodeUuid()); map.remove(dn.getDatanodeUuid());

View File

@ -33,20 +33,20 @@ import org.apache.hadoop.util.Daemon;
import org.slf4j.Logger; import org.slf4j.Logger;
/*************************************************** /***************************************************
* PendingReplicationBlocks does the bookkeeping of all * PendingReconstructionBlocks does the bookkeeping of all
* blocks that are getting replicated. * blocks that gains stronger redundancy.
* *
* It does the following: * It does the following:
* 1) record blocks that are getting replicated at this instant. * 1) record blocks that gains stronger redundancy at this instant.
* 2) a coarse grain timer to track age of replication request * 2) a coarse grain timer to track age of reconstruction request
* 3) a thread that periodically identifies replication-requests * 3) a thread that periodically identifies reconstruction-requests
* that never made it. * that never made it.
* *
***************************************************/ ***************************************************/
class PendingReplicationBlocks { class PendingReconstructionBlocks {
private static final Logger LOG = BlockManager.LOG; private static final Logger LOG = BlockManager.LOG;
private final Map<BlockInfo, PendingBlockInfo> pendingReplications; private final Map<BlockInfo, PendingBlockInfo> pendingReconstructions;
private final ArrayList<BlockInfo> timedOutItems; private final ArrayList<BlockInfo> timedOutItems;
Daemon timerThread = null; Daemon timerThread = null;
private volatile boolean fsRunning = true; private volatile boolean fsRunning = true;
@ -58,29 +58,29 @@ class PendingReplicationBlocks {
private long timeout = 5 * 60 * 1000; private long timeout = 5 * 60 * 1000;
private final static long DEFAULT_RECHECK_INTERVAL = 5 * 60 * 1000; private final static long DEFAULT_RECHECK_INTERVAL = 5 * 60 * 1000;
PendingReplicationBlocks(long timeoutPeriod) { PendingReconstructionBlocks(long timeoutPeriod) {
if ( timeoutPeriod > 0 ) { if ( timeoutPeriod > 0 ) {
this.timeout = timeoutPeriod; this.timeout = timeoutPeriod;
} }
pendingReplications = new HashMap<>(); pendingReconstructions = new HashMap<>();
timedOutItems = new ArrayList<>(); timedOutItems = new ArrayList<>();
} }
void start() { void start() {
timerThread = new Daemon(new PendingReplicationMonitor()); timerThread = new Daemon(new PendingReconstructionMonitor());
timerThread.start(); timerThread.start();
} }
/** /**
* Add a block to the list of pending Replications * Add a block to the list of pending reconstructions
* @param block The corresponding block * @param block The corresponding block
* @param targets The DataNodes where replicas of the block should be placed * @param targets The DataNodes where replicas of the block should be placed
*/ */
void increment(BlockInfo block, DatanodeDescriptor... targets) { void increment(BlockInfo block, DatanodeDescriptor... targets) {
synchronized (pendingReplications) { synchronized (pendingReconstructions) {
PendingBlockInfo found = pendingReplications.get(block); PendingBlockInfo found = pendingReconstructions.get(block);
if (found == null) { if (found == null) {
pendingReplications.put(block, new PendingBlockInfo(targets)); pendingReconstructions.put(block, new PendingBlockInfo(targets));
} else { } else {
found.incrementReplicas(targets); found.incrementReplicas(targets);
found.setTimeStamp(); found.setTimeStamp();
@ -89,58 +89,58 @@ class PendingReplicationBlocks {
} }
/** /**
* One replication request for this block has finished. * One reconstruction request for this block has finished.
* Decrement the number of pending replication requests * Decrement the number of pending reconstruction requests
* for this block. * for this block.
* *
* @param dn The DataNode that finishes the replication * @param dn The DataNode that finishes the reconstruction
*/ */
void decrement(BlockInfo block, DatanodeDescriptor dn) { void decrement(BlockInfo block, DatanodeDescriptor dn) {
synchronized (pendingReplications) { synchronized (pendingReconstructions) {
PendingBlockInfo found = pendingReplications.get(block); PendingBlockInfo found = pendingReconstructions.get(block);
if (found != null) { if (found != null) {
if(LOG.isDebugEnabled()) { LOG.debug("Removing pending reconstruction for {}", block);
LOG.debug("Removing pending replication for " + block);
}
found.decrementReplicas(dn); found.decrementReplicas(dn);
if (found.getNumReplicas() <= 0) { if (found.getNumReplicas() <= 0) {
pendingReplications.remove(block); pendingReconstructions.remove(block);
} }
} }
} }
} }
/** /**
* Remove the record about the given block from pendingReplications. * Remove the record about the given block from pending reconstructions.
* @param block The given block whose pending replication requests need to be *
* @param block
* The given block whose pending reconstruction requests need to be
* removed * removed
*/ */
void remove(BlockInfo block) { void remove(BlockInfo block) {
synchronized (pendingReplications) { synchronized (pendingReconstructions) {
pendingReplications.remove(block); pendingReconstructions.remove(block);
} }
} }
public void clear() { public void clear() {
synchronized (pendingReplications) { synchronized (pendingReconstructions) {
pendingReplications.clear(); pendingReconstructions.clear();
timedOutItems.clear(); timedOutItems.clear();
} }
} }
/** /**
* The total number of blocks that are undergoing replication * The total number of blocks that are undergoing reconstruction.
*/ */
int size() { int size() {
return pendingReplications.size(); return pendingReconstructions.size();
} }
/** /**
* How many copies of this block is pending replication? * How many copies of this block is pending reconstruction?.
*/ */
int getNumReplicas(BlockInfo block) { int getNumReplicas(BlockInfo block) {
synchronized (pendingReplications) { synchronized (pendingReconstructions) {
PendingBlockInfo found = pendingReplications.get(block); PendingBlockInfo found = pendingReconstructions.get(block);
if (found != null) { if (found != null) {
return found.getNumReplicas(); return found.getNumReplicas();
} }
@ -150,7 +150,7 @@ class PendingReplicationBlocks {
/** /**
* Returns a list of blocks that have timed out their * Returns a list of blocks that have timed out their
* replication requests. Returns null if no blocks have * reconstruction requests. Returns null if no blocks have
* timed out. * timed out.
*/ */
BlockInfo[] getTimedOutBlocks() { BlockInfo[] getTimedOutBlocks() {
@ -167,10 +167,10 @@ class PendingReplicationBlocks {
/** /**
* An object that contains information about a block that * An object that contains information about a block that
* is being replicated. It records the timestamp when the * is being reconstructed. It records the timestamp when the
* system started replicating the most recent copy of this * system started reconstructing the most recent copy of this
* block. It also records the list of Datanodes where the * block. It also records the list of Datanodes where the
* replication requests are in progress. * reconstruction requests are in progress.
*/ */
static class PendingBlockInfo { static class PendingBlockInfo {
private long timeStamp; private long timeStamp;
@ -211,20 +211,18 @@ class PendingReplicationBlocks {
/* /*
* A periodic thread that scans for blocks that never finished * A periodic thread that scans for blocks that never finished
* their replication request. * their reconstruction request.
*/ */
class PendingReplicationMonitor implements Runnable { class PendingReconstructionMonitor implements Runnable {
@Override @Override
public void run() { public void run() {
while (fsRunning) { while (fsRunning) {
long period = Math.min(DEFAULT_RECHECK_INTERVAL, timeout); long period = Math.min(DEFAULT_RECHECK_INTERVAL, timeout);
try { try {
pendingReplicationCheck(); pendingReconstructionCheck();
Thread.sleep(period); Thread.sleep(period);
} catch (InterruptedException ie) { } catch (InterruptedException ie) {
if(LOG.isDebugEnabled()) { LOG.debug("PendingReconstructionMonitor thread is interrupted.", ie);
LOG.debug("PendingReplicationMonitor thread is interrupted.", ie);
}
} }
} }
} }
@ -232,14 +230,12 @@ class PendingReplicationBlocks {
/** /**
* Iterate through all items and detect timed-out items * Iterate through all items and detect timed-out items
*/ */
void pendingReplicationCheck() { void pendingReconstructionCheck() {
synchronized (pendingReplications) { synchronized (pendingReconstructions) {
Iterator<Map.Entry<BlockInfo, PendingBlockInfo>> iter = Iterator<Map.Entry<BlockInfo, PendingBlockInfo>> iter =
pendingReplications.entrySet().iterator(); pendingReconstructions.entrySet().iterator();
long now = monotonicNow(); long now = monotonicNow();
if(LOG.isDebugEnabled()) { LOG.debug("PendingReconstructionMonitor checking Q");
LOG.debug("PendingReplicationMonitor checking Q");
}
while (iter.hasNext()) { while (iter.hasNext()) {
Map.Entry<BlockInfo, PendingBlockInfo> entry = iter.next(); Map.Entry<BlockInfo, PendingBlockInfo> entry = iter.next();
PendingBlockInfo pendingBlock = entry.getValue(); PendingBlockInfo pendingBlock = entry.getValue();
@ -248,7 +244,7 @@ class PendingReplicationBlocks {
synchronized (timedOutItems) { synchronized (timedOutItems) {
timedOutItems.add(block); timedOutItems.add(block);
} }
LOG.warn("PendingReplicationMonitor timed out " + block); LOG.warn("PendingReconstructionMonitor timed out " + block);
iter.remove(); iter.remove();
} }
} }
@ -257,7 +253,7 @@ class PendingReplicationBlocks {
} }
/* /*
* Shuts down the pending replication monitor thread. * Shuts down the pending reconstruction monitor thread.
* Waits for the thread to exit. * Waits for the thread to exit.
*/ */
void stop() { void stop() {
@ -274,16 +270,16 @@ class PendingReplicationBlocks {
* Iterate through all items and print them. * Iterate through all items and print them.
*/ */
void metaSave(PrintWriter out) { void metaSave(PrintWriter out) {
synchronized (pendingReplications) { synchronized (pendingReconstructions) {
out.println("Metasave: Blocks being replicated: " + out.println("Metasave: Blocks being reconstructed: " +
pendingReplications.size()); pendingReconstructions.size());
for (Map.Entry<BlockInfo, PendingBlockInfo> entry : for (Map.Entry<BlockInfo, PendingBlockInfo> entry :
pendingReplications.entrySet()) { pendingReconstructions.entrySet()) {
PendingBlockInfo pendingBlock = entry.getValue(); PendingBlockInfo pendingBlock = entry.getValue();
Block block = entry.getKey(); Block block = entry.getKey();
out.println(block + out.println(block +
" StartTime: " + new Time(pendingBlock.timeStamp) + " StartTime: " + new Time(pendingBlock.timeStamp) +
" NumReplicaInProgress: " + " NumReconstructInProgress: " +
pendingBlock.getNumReplicas()); pendingBlock.getNumReplicas());
} }
} }

View File

@ -472,8 +472,8 @@ public class BackupNode extends NameNode {
* {@link BlockManager.ReplicationMonitor} protected by SafeMode. * {@link BlockManager.ReplicationMonitor} protected by SafeMode.
* {@link HeartbeatManager.Monitor} protected by SafeMode. * {@link HeartbeatManager.Monitor} protected by SafeMode.
* {@link DecommissionManager.Monitor} need to prohibit refreshNodes(). * {@link DecommissionManager.Monitor} need to prohibit refreshNodes().
* {@link PendingReplicationBlocks.PendingReplicationMonitor} harmless, * {@link PendingReconstructionBlocks.PendingReconstructionMonitor}
* because ReplicationMonitor is muted. * harmless, because ReplicationMonitor is muted.
*/ */
@Override @Override
public void startActiveServices() throws IOException { public void startActiveServices() throws IOException {

View File

@ -4469,7 +4469,7 @@ public class FSNamesystem implements Namesystem, FSNamesystemMBean,
@Override // FSNamesystemMBean @Override // FSNamesystemMBean
@Metric @Metric
public long getPendingReplicationBlocks() { public long getPendingReplicationBlocks() {
return blockManager.getPendingReplicationBlocksCount(); return blockManager.getPendingReconstructionBlocksCount();
} }
@Override // FSNamesystemMBean @Override // FSNamesystemMBean

View File

@ -3790,10 +3790,10 @@
</property> </property>
<property> <property>
<name>dfs.namenode.replication.pending.timeout-sec</name> <name>dfs.namenode.reconstruction.pending.timeout-sec</name>
<value>-1</value> <value>-1</value>
<description> <description>
Timeout in seconds for block replication. If this value is 0 or less, Timeout in seconds for block reconstruction. If this value is 0 or less,
then it will default to 5 minutes. then it will default to 5 minutes.
</description> </description>
</property> </property>

View File

@ -85,7 +85,7 @@ public class TestAppendSnapshotTruncate {
conf.setInt(DFSConfigKeys.DFS_BYTES_PER_CHECKSUM_KEY, BLOCK_SIZE); conf.setInt(DFSConfigKeys.DFS_BYTES_PER_CHECKSUM_KEY, BLOCK_SIZE);
conf.setInt(DFSConfigKeys.DFS_HEARTBEAT_INTERVAL_KEY, SHORT_HEARTBEAT); conf.setInt(DFSConfigKeys.DFS_HEARTBEAT_INTERVAL_KEY, SHORT_HEARTBEAT);
conf.setLong( conf.setLong(
DFSConfigKeys.DFS_NAMENODE_REPLICATION_PENDING_TIMEOUT_SEC_KEY, 1); DFSConfigKeys.DFS_NAMENODE_RECONSTRUCTION_PENDING_TIMEOUT_SEC_KEY, 1);
conf.setBoolean(ReplaceDatanodeOnFailure.BEST_EFFORT_KEY, true); conf.setBoolean(ReplaceDatanodeOnFailure.BEST_EFFORT_KEY, true);
cluster = new MiniDFSCluster.Builder(conf) cluster = new MiniDFSCluster.Builder(conf)
.format(true) .format(true)

View File

@ -286,7 +286,7 @@ public class TestDatanodeDeath {
Configuration conf = new HdfsConfiguration(); Configuration conf = new HdfsConfiguration();
conf.setInt(DFSConfigKeys.DFS_NAMENODE_HEARTBEAT_RECHECK_INTERVAL_KEY, 2000); conf.setInt(DFSConfigKeys.DFS_NAMENODE_HEARTBEAT_RECHECK_INTERVAL_KEY, 2000);
conf.setInt(DFSConfigKeys.DFS_HEARTBEAT_INTERVAL_KEY, 2); conf.setInt(DFSConfigKeys.DFS_HEARTBEAT_INTERVAL_KEY, 2);
conf.setInt(DFSConfigKeys.DFS_NAMENODE_REPLICATION_PENDING_TIMEOUT_SEC_KEY, 2); conf.setInt(DFSConfigKeys.DFS_NAMENODE_RECONSTRUCTION_PENDING_TIMEOUT_SEC_KEY, 2);
conf.setInt(HdfsClientConfigKeys.DFS_CLIENT_SOCKET_TIMEOUT_KEY, 5000); conf.setInt(HdfsClientConfigKeys.DFS_CLIENT_SOCKET_TIMEOUT_KEY, 5000);
MiniDFSCluster cluster = new MiniDFSCluster.Builder(conf) MiniDFSCluster cluster = new MiniDFSCluster.Builder(conf)
.numDataNodes(numDatanodes).build(); .numDataNodes(numDatanodes).build();
@ -342,7 +342,7 @@ public class TestDatanodeDeath {
Configuration conf = new HdfsConfiguration(); Configuration conf = new HdfsConfiguration();
conf.setInt(DFSConfigKeys.DFS_NAMENODE_HEARTBEAT_RECHECK_INTERVAL_KEY, 2000); conf.setInt(DFSConfigKeys.DFS_NAMENODE_HEARTBEAT_RECHECK_INTERVAL_KEY, 2000);
conf.setInt(DFSConfigKeys.DFS_HEARTBEAT_INTERVAL_KEY, 1); conf.setInt(DFSConfigKeys.DFS_HEARTBEAT_INTERVAL_KEY, 1);
conf.setInt(DFSConfigKeys.DFS_NAMENODE_REPLICATION_PENDING_TIMEOUT_SEC_KEY, 2); conf.setInt(DFSConfigKeys.DFS_NAMENODE_RECONSTRUCTION_PENDING_TIMEOUT_SEC_KEY, 2);
conf.setInt(HdfsClientConfigKeys.DFS_CLIENT_SOCKET_TIMEOUT_KEY, 5000); conf.setInt(HdfsClientConfigKeys.DFS_CLIENT_SOCKET_TIMEOUT_KEY, 5000);
int myMaxNodes = 5; int myMaxNodes = 5;
System.out.println("SimpleTest starting with DataNode to Kill " + System.out.println("SimpleTest starting with DataNode to Kill " +

View File

@ -114,7 +114,7 @@ public class TestDecommission {
conf.setInt(DFSConfigKeys.DFS_HEARTBEAT_INTERVAL_KEY, HEARTBEAT_INTERVAL); conf.setInt(DFSConfigKeys.DFS_HEARTBEAT_INTERVAL_KEY, HEARTBEAT_INTERVAL);
conf.setInt(DFSConfigKeys.DFS_NAMENODE_REPLICATION_INTERVAL_KEY, 1); conf.setInt(DFSConfigKeys.DFS_NAMENODE_REPLICATION_INTERVAL_KEY, 1);
conf.setInt(DFSConfigKeys.DFS_BLOCKREPORT_INTERVAL_MSEC_KEY, BLOCKREPORT_INTERVAL_MSEC); conf.setInt(DFSConfigKeys.DFS_BLOCKREPORT_INTERVAL_MSEC_KEY, BLOCKREPORT_INTERVAL_MSEC);
conf.setInt(DFSConfigKeys.DFS_NAMENODE_REPLICATION_PENDING_TIMEOUT_SEC_KEY, 4); conf.setInt(DFSConfigKeys.DFS_NAMENODE_RECONSTRUCTION_PENDING_TIMEOUT_SEC_KEY, 4);
conf.setInt(DFSConfigKeys.DFS_NAMENODE_REPLICATION_INTERVAL_KEY, NAMENODE_REPLICATION_INTERVAL); conf.setInt(DFSConfigKeys.DFS_NAMENODE_REPLICATION_INTERVAL_KEY, NAMENODE_REPLICATION_INTERVAL);
writeConfigFile(hostsFile, null); writeConfigFile(hostsFile, null);

View File

@ -124,7 +124,7 @@ public class TestDecommissionWithStriped {
conf.setInt(DFSConfigKeys.DFS_NAMENODE_REPLICATION_INTERVAL_KEY, 1); conf.setInt(DFSConfigKeys.DFS_NAMENODE_REPLICATION_INTERVAL_KEY, 1);
conf.setInt(DFSConfigKeys.DFS_BLOCKREPORT_INTERVAL_MSEC_KEY, conf.setInt(DFSConfigKeys.DFS_BLOCKREPORT_INTERVAL_MSEC_KEY,
BLOCKREPORT_INTERVAL_MSEC); BLOCKREPORT_INTERVAL_MSEC);
conf.setInt(DFSConfigKeys.DFS_NAMENODE_REPLICATION_PENDING_TIMEOUT_SEC_KEY, conf.setInt(DFSConfigKeys.DFS_NAMENODE_RECONSTRUCTION_PENDING_TIMEOUT_SEC_KEY,
4); 4);
conf.setInt(DFSConfigKeys.DFS_NAMENODE_REPLICATION_INTERVAL_KEY, conf.setInt(DFSConfigKeys.DFS_NAMENODE_REPLICATION_INTERVAL_KEY,
NAMENODE_REPLICATION_INTERVAL); NAMENODE_REPLICATION_INTERVAL);

View File

@ -481,7 +481,7 @@ public class TestFileAppend2 {
Configuration conf = new HdfsConfiguration(); Configuration conf = new HdfsConfiguration();
conf.setInt(DFSConfigKeys.DFS_NAMENODE_HEARTBEAT_RECHECK_INTERVAL_KEY, 2000); conf.setInt(DFSConfigKeys.DFS_NAMENODE_HEARTBEAT_RECHECK_INTERVAL_KEY, 2000);
conf.setInt(DFSConfigKeys.DFS_HEARTBEAT_INTERVAL_KEY, 2); conf.setInt(DFSConfigKeys.DFS_HEARTBEAT_INTERVAL_KEY, 2);
conf.setInt(DFSConfigKeys.DFS_NAMENODE_REPLICATION_PENDING_TIMEOUT_SEC_KEY, 2); conf.setInt(DFSConfigKeys.DFS_NAMENODE_RECONSTRUCTION_PENDING_TIMEOUT_SEC_KEY, 2);
conf.setInt(HdfsClientConfigKeys.DFS_CLIENT_SOCKET_TIMEOUT_KEY, 30000); conf.setInt(HdfsClientConfigKeys.DFS_CLIENT_SOCKET_TIMEOUT_KEY, 30000);
conf.setInt(HdfsClientConfigKeys.DFS_DATANODE_SOCKET_WRITE_TIMEOUT_KEY, 30000); conf.setInt(HdfsClientConfigKeys.DFS_DATANODE_SOCKET_WRITE_TIMEOUT_KEY, 30000);
conf.setInt(DFSConfigKeys.DFS_DATANODE_HANDLER_COUNT_KEY, 50); conf.setInt(DFSConfigKeys.DFS_DATANODE_HANDLER_COUNT_KEY, 50);

View File

@ -84,7 +84,7 @@ public class TestFileAppend4 {
conf.setInt(HdfsClientConfigKeys.DFS_CLIENT_SOCKET_TIMEOUT_KEY, 5000); conf.setInt(HdfsClientConfigKeys.DFS_CLIENT_SOCKET_TIMEOUT_KEY, 5000);
// handle under-replicated blocks quickly (for replication asserts) // handle under-replicated blocks quickly (for replication asserts)
conf.setInt( conf.setInt(
DFSConfigKeys.DFS_NAMENODE_REPLICATION_PENDING_TIMEOUT_SEC_KEY, 5); DFSConfigKeys.DFS_NAMENODE_RECONSTRUCTION_PENDING_TIMEOUT_SEC_KEY, 5);
conf.setInt(DFSConfigKeys.DFS_NAMENODE_REPLICATION_INTERVAL_KEY, 1); conf.setInt(DFSConfigKeys.DFS_NAMENODE_REPLICATION_INTERVAL_KEY, 1);
// handle failures in the DFSClient pipeline quickly // handle failures in the DFSClient pipeline quickly

View File

@ -410,7 +410,7 @@ public class TestReplication {
LOG.info("Restarting minicluster after deleting a replica and corrupting 2 crcs"); LOG.info("Restarting minicluster after deleting a replica and corrupting 2 crcs");
conf = new HdfsConfiguration(); conf = new HdfsConfiguration();
conf.set(DFSConfigKeys.DFS_REPLICATION_KEY, Integer.toString(numDataNodes)); conf.set(DFSConfigKeys.DFS_REPLICATION_KEY, Integer.toString(numDataNodes));
conf.set(DFSConfigKeys.DFS_NAMENODE_REPLICATION_PENDING_TIMEOUT_SEC_KEY, Integer.toString(2)); conf.set(DFSConfigKeys.DFS_NAMENODE_RECONSTRUCTION_PENDING_TIMEOUT_SEC_KEY, Integer.toString(2));
conf.set("dfs.datanode.block.write.timeout.sec", Integer.toString(5)); conf.set("dfs.datanode.block.write.timeout.sec", Integer.toString(5));
conf.set(DFSConfigKeys.DFS_NAMENODE_SAFEMODE_THRESHOLD_PCT_KEY, "0.75f"); // only 3 copies exist conf.set(DFSConfigKeys.DFS_NAMENODE_SAFEMODE_THRESHOLD_PCT_KEY, "0.75f"); // only 3 copies exist
@ -507,7 +507,7 @@ public class TestReplication {
try { try {
Configuration conf = new HdfsConfiguration(); Configuration conf = new HdfsConfiguration();
conf.setLong( conf.setLong(
DFSConfigKeys.DFS_NAMENODE_REPLICATION_PENDING_TIMEOUT_SEC_KEY, 1); DFSConfigKeys.DFS_NAMENODE_RECONSTRUCTION_PENDING_TIMEOUT_SEC_KEY, 1);
cluster = new MiniDFSCluster.Builder(conf).numDataNodes(3) cluster = new MiniDFSCluster.Builder(conf).numDataNodes(3)
.storagesPerDatanode(1).build(); .storagesPerDatanode(1).build();
FileSystem fs = cluster.getFileSystem(); FileSystem fs = cluster.getFileSystem();
@ -687,7 +687,7 @@ public class TestReplication {
private long pendingReplicationCount(BlockManager bm) { private long pendingReplicationCount(BlockManager bm) {
BlockManagerTestUtil.updateState(bm); BlockManagerTestUtil.updateState(bm);
return bm.getPendingReplicationBlocksCount(); return bm.getPendingReconstructionBlocksCount();
} }
private void assertNoReplicationWasPerformed(MiniDFSCluster cluster) { private void assertNoReplicationWasPerformed(MiniDFSCluster cluster) {

View File

@ -39,7 +39,7 @@ public class TestSetrepIncreasing {
} }
conf.set(DFSConfigKeys.DFS_REPLICATION_KEY, "" + fromREP); conf.set(DFSConfigKeys.DFS_REPLICATION_KEY, "" + fromREP);
conf.setLong(DFSConfigKeys.DFS_BLOCKREPORT_INTERVAL_MSEC_KEY, 1000L); conf.setLong(DFSConfigKeys.DFS_BLOCKREPORT_INTERVAL_MSEC_KEY, 1000L);
conf.set(DFSConfigKeys.DFS_NAMENODE_REPLICATION_PENDING_TIMEOUT_SEC_KEY, Integer.toString(2)); conf.set(DFSConfigKeys.DFS_NAMENODE_RECONSTRUCTION_PENDING_TIMEOUT_SEC_KEY, Integer.toString(2));
MiniDFSCluster cluster = new MiniDFSCluster.Builder(conf).numDataNodes(10).build(); MiniDFSCluster cluster = new MiniDFSCluster.Builder(conf).numDataNodes(10).build();
FileSystem fs = cluster.getFileSystem(); FileSystem fs = cluster.getFileSystem();
assertTrue("Not a HDFS: "+fs.getUri(), fs instanceof DistributedFileSystem); assertTrue("Not a HDFS: "+fs.getUri(), fs instanceof DistributedFileSystem);

View File

@ -537,15 +537,16 @@ public class TestBlockManager {
list_all.add(new ArrayList<BlockInfo>()); // for priority 0 list_all.add(new ArrayList<BlockInfo>()); // for priority 0
list_all.add(list_p1); // for priority 1 list_all.add(list_p1); // for priority 1
assertEquals("Block not initially pending replication", 0, assertEquals("Block not initially pending reconstruction", 0,
bm.pendingReplications.getNumReplicas(block)); bm.pendingReconstruction.getNumReplicas(block));
assertEquals( assertEquals(
"computeBlockReconstructionWork should indicate replication is needed", "computeBlockReconstructionWork should indicate reconstruction is needed",
1, bm.computeReconstructionWorkForBlocks(list_all)); 1, bm.computeReconstructionWorkForBlocks(list_all));
assertTrue("replication is pending after work is computed", assertTrue("reconstruction is pending after work is computed",
bm.pendingReplications.getNumReplicas(block) > 0); bm.pendingReconstruction.getNumReplicas(block) > 0);
LinkedListMultimap<DatanodeStorageInfo, BlockTargetPair> repls = getAllPendingReplications(); LinkedListMultimap<DatanodeStorageInfo, BlockTargetPair> repls =
getAllPendingReconstruction();
assertEquals(1, repls.size()); assertEquals(1, repls.size());
Entry<DatanodeStorageInfo, BlockTargetPair> repl = Entry<DatanodeStorageInfo, BlockTargetPair> repl =
repls.entries().iterator().next(); repls.entries().iterator().next();
@ -559,7 +560,7 @@ public class TestBlockManager {
return pipeline; return pipeline;
} }
private LinkedListMultimap<DatanodeStorageInfo, BlockTargetPair> getAllPendingReplications() { private LinkedListMultimap<DatanodeStorageInfo, BlockTargetPair> getAllPendingReconstruction() {
LinkedListMultimap<DatanodeStorageInfo, BlockTargetPair> repls = LinkedListMultimap<DatanodeStorageInfo, BlockTargetPair> repls =
LinkedListMultimap.create(); LinkedListMultimap.create();
for (DatanodeDescriptor dn : nodes) { for (DatanodeDescriptor dn : nodes) {
@ -574,8 +575,8 @@ public class TestBlockManager {
} }
/** /**
* Test that a source node for a highest-priority replication is chosen even if all available * Test that a source node for a highest-priority reconstruction is chosen
* source nodes have reached their replication limits. * even if all available source nodes have reached their replication limits.
*/ */
@Test @Test
public void testHighestPriReplSrcChosenDespiteMaxReplLimit() throws Exception { public void testHighestPriReplSrcChosenDespiteMaxReplLimit() throws Exception {

View File

@ -68,7 +68,7 @@ public class TestBlocksWithNotEnoughRacks {
// Have the NN check for pending replications every second so it // Have the NN check for pending replications every second so it
// quickly schedules additional replicas as they are identified. // quickly schedules additional replicas as they are identified.
conf.setInt(DFSConfigKeys.DFS_NAMENODE_REPLICATION_PENDING_TIMEOUT_SEC_KEY, 1); conf.setInt(DFSConfigKeys.DFS_NAMENODE_RECONSTRUCTION_PENDING_TIMEOUT_SEC_KEY, 1);
// The DNs report blocks every second. // The DNs report blocks every second.
conf.setLong(DFSConfigKeys.DFS_BLOCKREPORT_INTERVAL_MSEC_KEY, 1000L); conf.setLong(DFSConfigKeys.DFS_BLOCKREPORT_INTERVAL_MSEC_KEY, 1000L);

View File

@ -54,7 +54,7 @@ public class TestOverReplicatedBlocks {
conf.setLong(DFSConfigKeys.DFS_DATANODE_SCAN_PERIOD_HOURS_KEY, 100L); conf.setLong(DFSConfigKeys.DFS_DATANODE_SCAN_PERIOD_HOURS_KEY, 100L);
conf.setLong(DFSConfigKeys.DFS_BLOCKREPORT_INTERVAL_MSEC_KEY, 1000L); conf.setLong(DFSConfigKeys.DFS_BLOCKREPORT_INTERVAL_MSEC_KEY, 1000L);
conf.set( conf.set(
DFSConfigKeys.DFS_NAMENODE_REPLICATION_PENDING_TIMEOUT_SEC_KEY, DFSConfigKeys.DFS_NAMENODE_RECONSTRUCTION_PENDING_TIMEOUT_SEC_KEY,
Integer.toString(2)); Integer.toString(2));
MiniDFSCluster cluster = new MiniDFSCluster.Builder(conf).numDataNodes(3).build(); MiniDFSCluster cluster = new MiniDFSCluster.Builder(conf).numDataNodes(3).build();
FileSystem fs = cluster.getFileSystem(); FileSystem fs = cluster.getFileSystem();

View File

@ -45,10 +45,10 @@ import org.junit.Test;
import org.mockito.Mockito; import org.mockito.Mockito;
/** /**
* This class tests the internals of PendingReplicationBlocks.java, * This class tests the internals of PendingReconstructionBlocks.java, as well
* as well as how PendingReplicationBlocks acts in BlockManager * as how PendingReconstructionBlocks acts in BlockManager
*/ */
public class TestPendingReplication { public class TestPendingReconstruction {
final static int TIMEOUT = 3; // 3 seconds final static int TIMEOUT = 3; // 3 seconds
private static final int DFS_REPLICATION_INTERVAL = 1; private static final int DFS_REPLICATION_INTERVAL = 1;
// Number of datanodes in the cluster // Number of datanodes in the cluster
@ -60,49 +60,49 @@ public class TestPendingReplication {
} }
@Test @Test
public void testPendingReplication() { public void testPendingReconstruction() {
PendingReplicationBlocks pendingReplications; PendingReconstructionBlocks pendingReconstructions;
pendingReplications = new PendingReplicationBlocks(TIMEOUT * 1000); pendingReconstructions = new PendingReconstructionBlocks(TIMEOUT * 1000);
pendingReplications.start(); pendingReconstructions.start();
// //
// Add 10 blocks to pendingReplications. // Add 10 blocks to pendingReconstruction.
// //
DatanodeStorageInfo[] storages = DFSTestUtil.createDatanodeStorageInfos(10); DatanodeStorageInfo[] storages = DFSTestUtil.createDatanodeStorageInfos(10);
for (int i = 0; i < storages.length; i++) { for (int i = 0; i < storages.length; i++) {
BlockInfo block = genBlockInfo(i, i, 0); BlockInfo block = genBlockInfo(i, i, 0);
DatanodeStorageInfo[] targets = new DatanodeStorageInfo[i]; DatanodeStorageInfo[] targets = new DatanodeStorageInfo[i];
System.arraycopy(storages, 0, targets, 0, i); System.arraycopy(storages, 0, targets, 0, i);
pendingReplications.increment(block, pendingReconstructions.increment(block,
DatanodeStorageInfo.toDatanodeDescriptors(targets)); DatanodeStorageInfo.toDatanodeDescriptors(targets));
} }
assertEquals("Size of pendingReplications ", assertEquals("Size of pendingReconstruction ",
10, pendingReplications.size()); 10, pendingReconstructions.size());
// //
// remove one item // remove one item
// //
BlockInfo blk = genBlockInfo(8, 8, 0); BlockInfo blk = genBlockInfo(8, 8, 0);
pendingReplications.decrement(blk, storages[7].getDatanodeDescriptor()); // removes one replica pendingReconstructions.decrement(blk, storages[7].getDatanodeDescriptor()); // removes one replica
assertEquals("pendingReplications.getNumReplicas ", assertEquals("pendingReconstructions.getNumReplicas ",
7, pendingReplications.getNumReplicas(blk)); 7, pendingReconstructions.getNumReplicas(blk));
// //
// insert the same item twice should be counted as once // insert the same item twice should be counted as once
// //
pendingReplications.increment(blk, storages[0].getDatanodeDescriptor()); pendingReconstructions.increment(blk, storages[0].getDatanodeDescriptor());
assertEquals("pendingReplications.getNumReplicas ", assertEquals("pendingReconstructions.getNumReplicas ",
7, pendingReplications.getNumReplicas(blk)); 7, pendingReconstructions.getNumReplicas(blk));
for (int i = 0; i < 7; i++) { for (int i = 0; i < 7; i++) {
// removes all replicas // removes all replicas
pendingReplications.decrement(blk, storages[i].getDatanodeDescriptor()); pendingReconstructions.decrement(blk, storages[i].getDatanodeDescriptor());
} }
assertTrue(pendingReplications.size() == 9); assertTrue(pendingReconstructions.size() == 9);
pendingReplications.increment(blk, pendingReconstructions.increment(blk,
DatanodeStorageInfo.toDatanodeDescriptors( DatanodeStorageInfo.toDatanodeDescriptors(
DFSTestUtil.createDatanodeStorageInfos(8))); DFSTestUtil.createDatanodeStorageInfos(8)));
assertTrue(pendingReplications.size() == 10); assertTrue(pendingReconstructions.size() == 10);
// //
// verify that the number of replicas returned // verify that the number of replicas returned
@ -110,14 +110,14 @@ public class TestPendingReplication {
// //
for (int i = 0; i < 10; i++) { for (int i = 0; i < 10; i++) {
BlockInfo block = genBlockInfo(i, i, 0); BlockInfo block = genBlockInfo(i, i, 0);
int numReplicas = pendingReplications.getNumReplicas(block); int numReplicas = pendingReconstructions.getNumReplicas(block);
assertTrue(numReplicas == i); assertTrue(numReplicas == i);
} }
// //
// verify that nothing has timed out so far // verify that nothing has timed out so far
// //
assertTrue(pendingReplications.getTimedOutBlocks() == null); assertTrue(pendingReconstructions.getTimedOutBlocks() == null);
// //
// Wait for one second and then insert some more items. // Wait for one second and then insert some more items.
@ -129,17 +129,17 @@ public class TestPendingReplication {
for (int i = 10; i < 15; i++) { for (int i = 10; i < 15; i++) {
BlockInfo block = genBlockInfo(i, i, 0); BlockInfo block = genBlockInfo(i, i, 0);
pendingReplications.increment(block, pendingReconstructions.increment(block,
DatanodeStorageInfo.toDatanodeDescriptors( DatanodeStorageInfo.toDatanodeDescriptors(
DFSTestUtil.createDatanodeStorageInfos(i))); DFSTestUtil.createDatanodeStorageInfos(i)));
} }
assertTrue(pendingReplications.size() == 15); assertTrue(pendingReconstructions.size() == 15);
// //
// Wait for everything to timeout. // Wait for everything to timeout.
// //
int loop = 0; int loop = 0;
while (pendingReplications.size() > 0) { while (pendingReconstructions.size() > 0) {
try { try {
Thread.sleep(1000); Thread.sleep(1000);
} catch (Exception e) { } catch (Exception e) {
@ -152,24 +152,24 @@ public class TestPendingReplication {
// //
// Verify that everything has timed out. // Verify that everything has timed out.
// //
assertEquals("Size of pendingReplications ", 0, pendingReplications.size()); assertEquals("Size of pendingReconstructions ", 0, pendingReconstructions.size());
Block[] timedOut = pendingReplications.getTimedOutBlocks(); Block[] timedOut = pendingReconstructions.getTimedOutBlocks();
assertTrue(timedOut != null && timedOut.length == 15); assertTrue(timedOut != null && timedOut.length == 15);
for (int i = 0; i < timedOut.length; i++) { for (int i = 0; i < timedOut.length; i++) {
assertTrue(timedOut[i].getBlockId() < 15); assertTrue(timedOut[i].getBlockId() < 15);
} }
pendingReplications.stop(); pendingReconstructions.stop();
} }
/* Test that processPendingReplications will use the most recent /* Test that processpendingReconstructions will use the most recent
* blockinfo from the blocksmap by placing a larger genstamp into * blockinfo from the blocksmap by placing a larger genstamp into
* the blocksmap. * the blocksmap.
*/ */
@Test @Test
public void testProcessPendingReplications() throws Exception { public void testProcessPendingReconstructions() throws Exception {
final Configuration conf = new HdfsConfiguration(); final Configuration conf = new HdfsConfiguration();
conf.setLong( conf.setLong(
DFSConfigKeys.DFS_NAMENODE_REPLICATION_PENDING_TIMEOUT_SEC_KEY, TIMEOUT); DFSConfigKeys.DFS_NAMENODE_RECONSTRUCTION_PENDING_TIMEOUT_SEC_KEY, TIMEOUT);
MiniDFSCluster cluster = null; MiniDFSCluster cluster = null;
Block block; Block block;
BlockInfo blockInfo; BlockInfo blockInfo;
@ -181,19 +181,19 @@ public class TestPendingReplication {
FSNamesystem fsn = cluster.getNamesystem(); FSNamesystem fsn = cluster.getNamesystem();
BlockManager blkManager = fsn.getBlockManager(); BlockManager blkManager = fsn.getBlockManager();
PendingReplicationBlocks pendingReplications = PendingReconstructionBlocks pendingReconstruction =
blkManager.pendingReplications; blkManager.pendingReconstruction;
LowRedundancyBlocks neededReconstruction = blkManager.neededReconstruction; LowRedundancyBlocks neededReconstruction = blkManager.neededReconstruction;
BlocksMap blocksMap = blkManager.blocksMap; BlocksMap blocksMap = blkManager.blocksMap;
// //
// Add 1 block to pendingReplications with GenerationStamp = 0. // Add 1 block to pendingReconstructions with GenerationStamp = 0.
// //
block = new Block(1, 1, 0); block = new Block(1, 1, 0);
blockInfo = new BlockInfoContiguous(block, (short) 3); blockInfo = new BlockInfoContiguous(block, (short) 3);
pendingReplications.increment(blockInfo, pendingReconstruction.increment(blockInfo,
DatanodeStorageInfo.toDatanodeDescriptors( DatanodeStorageInfo.toDatanodeDescriptors(
DFSTestUtil.createDatanodeStorageInfos(1))); DFSTestUtil.createDatanodeStorageInfos(1)));
BlockCollection bc = Mockito.mock(BlockCollection.class); BlockCollection bc = Mockito.mock(BlockCollection.class);
@ -201,25 +201,25 @@ public class TestPendingReplication {
blockInfo.setGenerationStamp(1); blockInfo.setGenerationStamp(1);
blocksMap.addBlockCollection(blockInfo, bc); blocksMap.addBlockCollection(blockInfo, bc);
assertEquals("Size of pendingReplications ", 1, assertEquals("Size of pendingReconstructions ", 1,
pendingReplications.size()); pendingReconstruction.size());
// Add a second block to pendingReplications that has no // Add a second block to pendingReconstructions that has no
// corresponding entry in blocksmap // corresponding entry in blocksmap
block = new Block(2, 2, 0); block = new Block(2, 2, 0);
blockInfo = new BlockInfoContiguous(block, (short) 3); blockInfo = new BlockInfoContiguous(block, (short) 3);
pendingReplications.increment(blockInfo, pendingReconstruction.increment(blockInfo,
DatanodeStorageInfo.toDatanodeDescriptors( DatanodeStorageInfo.toDatanodeDescriptors(
DFSTestUtil.createDatanodeStorageInfos(1))); DFSTestUtil.createDatanodeStorageInfos(1)));
// verify 2 blocks in pendingReplications // verify 2 blocks in pendingReconstructions
assertEquals("Size of pendingReplications ", 2, assertEquals("Size of pendingReconstructions ", 2,
pendingReplications.size()); pendingReconstruction.size());
// //
// Wait for everything to timeout. // Wait for everything to timeout.
// //
while (pendingReplications.size() > 0) { while (pendingReconstruction.size() > 0) {
try { try {
Thread.sleep(100); Thread.sleep(100);
} catch (Exception e) { } catch (Exception e) {
@ -255,8 +255,8 @@ public class TestPendingReplication {
/** /**
* Test if DatanodeProtocol#blockReceivedAndDeleted can correctly update the * Test if DatanodeProtocol#blockReceivedAndDeleted can correctly update the
* pending replications. Also make sure the blockReceivedAndDeleted call is * pending reconstruction. Also make sure the blockReceivedAndDeleted call is
* idempotent to the pending replications. * idempotent to the pending reconstruction.
*/ */
@Test @Test
public void testBlockReceived() throws Exception { public void testBlockReceived() throws Exception {
@ -286,11 +286,11 @@ public class TestPendingReplication {
hdfs.setReplication(filePath, (short) DATANODE_COUNT); hdfs.setReplication(filePath, (short) DATANODE_COUNT);
BlockManagerTestUtil.computeAllPendingWork(blkManager); BlockManagerTestUtil.computeAllPendingWork(blkManager);
assertEquals(1, blkManager.pendingReplications.size()); assertEquals(1, blkManager.pendingReconstruction.size());
INodeFile fileNode = fsn.getFSDirectory().getINode4Write(file).asFile(); INodeFile fileNode = fsn.getFSDirectory().getINode4Write(file).asFile();
BlockInfo[] blocks = fileNode.getBlocks(); BlockInfo[] blocks = fileNode.getBlocks();
assertEquals(DATANODE_COUNT - 1, assertEquals(DATANODE_COUNT - 1,
blkManager.pendingReplications.getNumReplicas(blocks[0])); blkManager.pendingReconstruction.getNumReplicas(blocks[0]));
LocatedBlock locatedBlock = hdfs.getClient().getLocatedBlocks(file, 0) LocatedBlock locatedBlock = hdfs.getClient().getLocatedBlocks(file, 0)
.get(0); .get(0);
@ -314,7 +314,7 @@ public class TestPendingReplication {
// IBRs are async, make sure the NN processes all of them. // IBRs are async, make sure the NN processes all of them.
cluster.getNamesystem().getBlockManager().flushBlockOps(); cluster.getNamesystem().getBlockManager().flushBlockOps();
assertEquals(DATANODE_COUNT - 3, assertEquals(DATANODE_COUNT - 3,
blkManager.pendingReplications.getNumReplicas(blocks[0])); blkManager.pendingReconstruction.getNumReplicas(blocks[0]));
// let the same datanodes report again // let the same datanodes report again
for (int i = 0; i < DATANODE_COUNT && reportDnNum < 2; i++) { for (int i = 0; i < DATANODE_COUNT && reportDnNum < 2; i++) {
@ -332,7 +332,7 @@ public class TestPendingReplication {
cluster.getNamesystem().getBlockManager().flushBlockOps(); cluster.getNamesystem().getBlockManager().flushBlockOps();
assertEquals(DATANODE_COUNT - 3, assertEquals(DATANODE_COUNT - 3,
blkManager.pendingReplications.getNumReplicas(blocks[0])); blkManager.pendingReconstruction.getNumReplicas(blocks[0]));
// re-enable heartbeat for the datanode that has data // re-enable heartbeat for the datanode that has data
for (int i = 0; i < DATANODE_COUNT; i++) { for (int i = 0; i < DATANODE_COUNT; i++) {
@ -342,7 +342,7 @@ public class TestPendingReplication {
} }
Thread.sleep(5000); Thread.sleep(5000);
assertEquals(0, blkManager.pendingReplications.size()); assertEquals(0, blkManager.pendingReconstruction.size());
} finally { } finally {
if (cluster != null) { if (cluster != null) {
cluster.shutdown(); cluster.shutdown();
@ -395,20 +395,20 @@ public class TestPendingReplication {
} }
BlockManagerTestUtil.computeAllPendingWork(bm); BlockManagerTestUtil.computeAllPendingWork(bm);
BlockManagerTestUtil.updateState(bm); BlockManagerTestUtil.updateState(bm);
assertEquals(bm.getPendingReplicationBlocksCount(), 1L); assertEquals(bm.getPendingReconstructionBlocksCount(), 1L);
BlockInfo storedBlock = bm.getStoredBlock(block.getBlock().getLocalBlock()); BlockInfo storedBlock = bm.getStoredBlock(block.getBlock().getLocalBlock());
assertEquals(bm.pendingReplications.getNumReplicas(storedBlock), 2); assertEquals(bm.pendingReconstruction.getNumReplicas(storedBlock), 2);
// 4. delete the file // 4. delete the file
fs.delete(filePath, true); fs.delete(filePath, true);
// retry at most 10 times, each time sleep for 1s. Note that 10s is much // retry at most 10 times, each time sleep for 1s. Note that 10s is much
// less than the default pending record timeout (5~10min) // less than the default pending record timeout (5~10min)
int retries = 10; int retries = 10;
long pendingNum = bm.getPendingReplicationBlocksCount(); long pendingNum = bm.getPendingReconstructionBlocksCount();
while (pendingNum != 0 && retries-- > 0) { while (pendingNum != 0 && retries-- > 0) {
Thread.sleep(1000); // let NN do the deletion Thread.sleep(1000); // let NN do the deletion
BlockManagerTestUtil.updateState(bm); BlockManagerTestUtil.updateState(bm);
pendingNum = bm.getPendingReplicationBlocksCount(); pendingNum = bm.getPendingReconstructionBlocksCount();
} }
assertEquals(pendingNum, 0L); assertEquals(pendingNum, 0L);
} finally { } finally {

View File

@ -96,8 +96,8 @@ public class TestDecommissioningStatus {
conf.setInt(DFSConfigKeys.DFS_NAMENODE_HEARTBEAT_RECHECK_INTERVAL_KEY, conf.setInt(DFSConfigKeys.DFS_NAMENODE_HEARTBEAT_RECHECK_INTERVAL_KEY,
1000); 1000);
conf.setInt(DFSConfigKeys.DFS_HEARTBEAT_INTERVAL_KEY, 1); conf.setInt(DFSConfigKeys.DFS_HEARTBEAT_INTERVAL_KEY, 1);
conf.setInt(DFSConfigKeys.DFS_NAMENODE_REPLICATION_PENDING_TIMEOUT_SEC_KEY, conf.setInt(
4); DFSConfigKeys.DFS_NAMENODE_RECONSTRUCTION_PENDING_TIMEOUT_SEC_KEY, 4);
conf.setInt(DFSConfigKeys.DFS_NAMENODE_REPLICATION_INTERVAL_KEY, 1000); conf.setInt(DFSConfigKeys.DFS_NAMENODE_REPLICATION_INTERVAL_KEY, 1000);
conf.setInt(DFSConfigKeys.DFS_NAMENODE_DECOMMISSION_INTERVAL_KEY, 1); conf.setInt(DFSConfigKeys.DFS_NAMENODE_DECOMMISSION_INTERVAL_KEY, 1);
conf.setLong(DFSConfigKeys.DFS_DATANODE_BALANCE_BANDWIDTHPERSEC_KEY, 1); conf.setLong(DFSConfigKeys.DFS_DATANODE_BALANCE_BANDWIDTHPERSEC_KEY, 1);

View File

@ -98,7 +98,7 @@ public class TestFileTruncate {
conf.setInt(DFSConfigKeys.DFS_BYTES_PER_CHECKSUM_KEY, BLOCK_SIZE); conf.setInt(DFSConfigKeys.DFS_BYTES_PER_CHECKSUM_KEY, BLOCK_SIZE);
conf.setInt(DFSConfigKeys.DFS_HEARTBEAT_INTERVAL_KEY, SHORT_HEARTBEAT); conf.setInt(DFSConfigKeys.DFS_HEARTBEAT_INTERVAL_KEY, SHORT_HEARTBEAT);
conf.setLong( conf.setLong(
DFSConfigKeys.DFS_NAMENODE_REPLICATION_PENDING_TIMEOUT_SEC_KEY, 1); DFSConfigKeys.DFS_NAMENODE_RECONSTRUCTION_PENDING_TIMEOUT_SEC_KEY, 1);
cluster = new MiniDFSCluster.Builder(conf) cluster = new MiniDFSCluster.Builder(conf)
.format(true) .format(true)
.numDataNodes(DATANODE_NUM) .numDataNodes(DATANODE_NUM)

View File

@ -82,7 +82,7 @@ public class TestHostsFiles {
// Have the NN check for pending replications every second so it // Have the NN check for pending replications every second so it
// quickly schedules additional replicas as they are identified. // quickly schedules additional replicas as they are identified.
conf.setInt(DFSConfigKeys.DFS_NAMENODE_REPLICATION_PENDING_TIMEOUT_SEC_KEY, 1); conf.setInt(DFSConfigKeys.DFS_NAMENODE_RECONSTRUCTION_PENDING_TIMEOUT_SEC_KEY, 1);
// The DNs report blocks every second. // The DNs report blocks every second.
conf.setLong(DFSConfigKeys.DFS_BLOCKREPORT_INTERVAL_MSEC_KEY, 1000L); conf.setLong(DFSConfigKeys.DFS_BLOCKREPORT_INTERVAL_MSEC_KEY, 1000L);

View File

@ -156,7 +156,7 @@ public class TestMetaSave {
line = reader.readLine(); line = reader.readLine();
assertTrue(line.equals("Mis-replicated blocks that have been postponed:")); assertTrue(line.equals("Mis-replicated blocks that have been postponed:"));
line = reader.readLine(); line = reader.readLine();
assertTrue(line.equals("Metasave: Blocks being replicated: 0")); assertTrue(line.equals("Metasave: Blocks being reconstructed: 0"));
line = reader.readLine(); line = reader.readLine();
assertTrue(line.equals("Metasave: Blocks 2 waiting deletion from 1 datanodes.")); assertTrue(line.equals("Metasave: Blocks 2 waiting deletion from 1 datanodes."));
//skip 2 lines to reach HDFS-9033 scenario. //skip 2 lines to reach HDFS-9033 scenario.

View File

@ -58,7 +58,7 @@ public class TestProcessCorruptBlocks {
public void testWhenDecreasingReplication() throws Exception { public void testWhenDecreasingReplication() throws Exception {
Configuration conf = new HdfsConfiguration(); Configuration conf = new HdfsConfiguration();
conf.setLong(DFSConfigKeys.DFS_BLOCKREPORT_INTERVAL_MSEC_KEY, 1000L); conf.setLong(DFSConfigKeys.DFS_BLOCKREPORT_INTERVAL_MSEC_KEY, 1000L);
conf.set(DFSConfigKeys.DFS_NAMENODE_REPLICATION_PENDING_TIMEOUT_SEC_KEY, Integer.toString(2)); conf.set(DFSConfigKeys.DFS_NAMENODE_RECONSTRUCTION_PENDING_TIMEOUT_SEC_KEY, Integer.toString(2));
MiniDFSCluster cluster = new MiniDFSCluster.Builder(conf).numDataNodes(3).build(); MiniDFSCluster cluster = new MiniDFSCluster.Builder(conf).numDataNodes(3).build();
FileSystem fs = cluster.getFileSystem(); FileSystem fs = cluster.getFileSystem();
final FSNamesystem namesystem = cluster.getNamesystem(); final FSNamesystem namesystem = cluster.getNamesystem();
@ -113,7 +113,7 @@ public class TestProcessCorruptBlocks {
public void testByAddingAnExtraDataNode() throws Exception { public void testByAddingAnExtraDataNode() throws Exception {
Configuration conf = new HdfsConfiguration(); Configuration conf = new HdfsConfiguration();
conf.setLong(DFSConfigKeys.DFS_BLOCKREPORT_INTERVAL_MSEC_KEY, 1000L); conf.setLong(DFSConfigKeys.DFS_BLOCKREPORT_INTERVAL_MSEC_KEY, 1000L);
conf.set(DFSConfigKeys.DFS_NAMENODE_REPLICATION_PENDING_TIMEOUT_SEC_KEY, Integer.toString(2)); conf.set(DFSConfigKeys.DFS_NAMENODE_RECONSTRUCTION_PENDING_TIMEOUT_SEC_KEY, Integer.toString(2));
MiniDFSCluster cluster = new MiniDFSCluster.Builder(conf).numDataNodes(4).build(); MiniDFSCluster cluster = new MiniDFSCluster.Builder(conf).numDataNodes(4).build();
FileSystem fs = cluster.getFileSystem(); FileSystem fs = cluster.getFileSystem();
final FSNamesystem namesystem = cluster.getNamesystem(); final FSNamesystem namesystem = cluster.getNamesystem();
@ -164,7 +164,7 @@ public class TestProcessCorruptBlocks {
public void testWithReplicationFactorAsOne() throws Exception { public void testWithReplicationFactorAsOne() throws Exception {
Configuration conf = new HdfsConfiguration(); Configuration conf = new HdfsConfiguration();
conf.setLong(DFSConfigKeys.DFS_BLOCKREPORT_INTERVAL_MSEC_KEY, 1000L); conf.setLong(DFSConfigKeys.DFS_BLOCKREPORT_INTERVAL_MSEC_KEY, 1000L);
conf.set(DFSConfigKeys.DFS_NAMENODE_REPLICATION_PENDING_TIMEOUT_SEC_KEY, Integer.toString(2)); conf.set(DFSConfigKeys.DFS_NAMENODE_RECONSTRUCTION_PENDING_TIMEOUT_SEC_KEY, Integer.toString(2));
MiniDFSCluster cluster = new MiniDFSCluster.Builder(conf).numDataNodes(2).build(); MiniDFSCluster cluster = new MiniDFSCluster.Builder(conf).numDataNodes(2).build();
FileSystem fs = cluster.getFileSystem(); FileSystem fs = cluster.getFileSystem();
final FSNamesystem namesystem = cluster.getNamesystem(); final FSNamesystem namesystem = cluster.getNamesystem();
@ -218,7 +218,7 @@ public class TestProcessCorruptBlocks {
public void testWithAllCorruptReplicas() throws Exception { public void testWithAllCorruptReplicas() throws Exception {
Configuration conf = new HdfsConfiguration(); Configuration conf = new HdfsConfiguration();
conf.setLong(DFSConfigKeys.DFS_BLOCKREPORT_INTERVAL_MSEC_KEY, 1000L); conf.setLong(DFSConfigKeys.DFS_BLOCKREPORT_INTERVAL_MSEC_KEY, 1000L);
conf.set(DFSConfigKeys.DFS_NAMENODE_REPLICATION_PENDING_TIMEOUT_SEC_KEY, Integer.toString(2)); conf.set(DFSConfigKeys.DFS_NAMENODE_RECONSTRUCTION_PENDING_TIMEOUT_SEC_KEY, Integer.toString(2));
MiniDFSCluster cluster = new MiniDFSCluster.Builder(conf).numDataNodes(3).build(); MiniDFSCluster cluster = new MiniDFSCluster.Builder(conf).numDataNodes(3).build();
FileSystem fs = cluster.getFileSystem(); FileSystem fs = cluster.getFileSystem();
final FSNamesystem namesystem = cluster.getNamesystem(); final FSNamesystem namesystem = cluster.getNamesystem();

View File

@ -209,7 +209,7 @@ public class TestReconstructStripedBlocks {
cellSize, NUM_DATA_BLOCKS, NUM_PARITY_BLOCKS); cellSize, NUM_DATA_BLOCKS, NUM_PARITY_BLOCKS);
assertEquals(0, getNumberOfBlocksToBeErasureCoded(cluster)); assertEquals(0, getNumberOfBlocksToBeErasureCoded(cluster));
assertEquals(0, bm.getPendingReplicationBlocksCount()); assertEquals(0, bm.getPendingReconstructionBlocksCount());
// missing 1 block, so 1 task should be scheduled // missing 1 block, so 1 task should be scheduled
DatanodeInfo dn0 = lbs[0].getLocations()[0]; DatanodeInfo dn0 = lbs[0].getLocations()[0];
@ -217,7 +217,7 @@ public class TestReconstructStripedBlocks {
cluster.setDataNodeDead(dn0); cluster.setDataNodeDead(dn0);
BlockManagerTestUtil.getComputedDatanodeWork(bm); BlockManagerTestUtil.getComputedDatanodeWork(bm);
assertEquals(1, getNumberOfBlocksToBeErasureCoded(cluster)); assertEquals(1, getNumberOfBlocksToBeErasureCoded(cluster));
assertEquals(1, bm.getPendingReplicationBlocksCount()); assertEquals(1, bm.getPendingReconstructionBlocksCount());
// missing another block, but no new task should be scheduled because // missing another block, but no new task should be scheduled because
// previous task isn't finished. // previous task isn't finished.
@ -226,7 +226,7 @@ public class TestReconstructStripedBlocks {
cluster.setDataNodeDead(dn1); cluster.setDataNodeDead(dn1);
BlockManagerTestUtil.getComputedDatanodeWork(bm); BlockManagerTestUtil.getComputedDatanodeWork(bm);
assertEquals(1, getNumberOfBlocksToBeErasureCoded(cluster)); assertEquals(1, getNumberOfBlocksToBeErasureCoded(cluster));
assertEquals(1, bm.getPendingReplicationBlocksCount()); assertEquals(1, bm.getPendingReconstructionBlocksCount());
} finally { } finally {
cluster.shutdown(); cluster.shutdown();
} }

View File

@ -296,7 +296,7 @@ public class TestDNFencing {
LOG.info("Getting more replication work computed"); LOG.info("Getting more replication work computed");
} }
BlockManager bm1 = nn1.getNamesystem().getBlockManager(); BlockManager bm1 = nn1.getNamesystem().getBlockManager();
while (bm1.getPendingReplicationBlocksCount() > 0) { while (bm1.getPendingReconstructionBlocksCount() > 0) {
BlockManagerTestUtil.updateState(bm1); BlockManagerTestUtil.updateState(bm1);
cluster.triggerHeartbeats(); cluster.triggerHeartbeats();
Thread.sleep(1000); Thread.sleep(1000);