HBASE-9092 OpenRegion could be ignored by mistake

git-svn-id: https://svn.apache.org/repos/asf/hbase/trunk@1509384 13f79535-47bb-0310-9956-ffa450edef68
This commit is contained in:
jxiang 2013-08-01 18:55:43 +00:00
parent 734e937179
commit 0b0c291410
3 changed files with 29 additions and 24 deletions

View File

@ -71,9 +71,7 @@ import org.apache.hadoop.hbase.master.handler.EnableTableHandler;
import org.apache.hadoop.hbase.master.handler.MergedRegionHandler; import org.apache.hadoop.hbase.master.handler.MergedRegionHandler;
import org.apache.hadoop.hbase.master.handler.OpenedRegionHandler; import org.apache.hadoop.hbase.master.handler.OpenedRegionHandler;
import org.apache.hadoop.hbase.master.handler.SplitRegionHandler; import org.apache.hadoop.hbase.master.handler.SplitRegionHandler;
import org.apache.hadoop.hbase.regionserver.RegionAlreadyInTransitionException;
import org.apache.hadoop.hbase.regionserver.RegionOpeningState; import org.apache.hadoop.hbase.regionserver.RegionOpeningState;
import org.apache.hadoop.hbase.regionserver.RegionServerStoppedException;
import org.apache.hadoop.hbase.util.EnvironmentEdgeManager; import org.apache.hadoop.hbase.util.EnvironmentEdgeManager;
import org.apache.hadoop.hbase.util.KeyLocker; import org.apache.hadoop.hbase.util.KeyLocker;
import org.apache.hadoop.hbase.util.Pair; import org.apache.hadoop.hbase.util.Pair;
@ -923,26 +921,25 @@ public class AssignmentManager extends ZooKeeperListener {
+ " or not on the expected server"); + " or not on the expected server");
return; return;
} }
// Handle this the same as if it were opened and then closed. AtomicInteger failedOpenCount = failedOpenTracker.get(encodedName);
regionState = regionStates.updateRegionState(rt, RegionState.State.CLOSED); if (failedOpenCount == null) {
// When there are more than one region server a new RS is selected as the failedOpenCount = new AtomicInteger();
// destination and the same is updated in the regionplan. (HBASE-5546) // No need to use putIfAbsent, or extra synchronization since
if (regionState != null) { // this whole handleRegion block is locked on the encoded region
AtomicInteger failedOpenCount = failedOpenTracker.get(encodedName); // name, and failedOpenTracker is updated only in this block
if (failedOpenCount == null) { failedOpenTracker.put(encodedName, failedOpenCount);
failedOpenCount = new AtomicInteger(); }
// No need to use putIfAbsent, or extra synchronization since if (failedOpenCount.incrementAndGet() >= maximumAttempts) {
// this whole handleRegion block is locked on the encoded region regionStates.updateRegionState(rt, RegionState.State.FAILED_OPEN);
// name, and failedOpenTracker is updated only in this block // remove the tracking info to save memory, also reset
failedOpenTracker.put(encodedName, failedOpenCount); // the count for next open initiative
} failedOpenTracker.remove(encodedName);
if (failedOpenCount.incrementAndGet() >= maximumAttempts) { } else {
regionStates.updateRegionState( // Handle this the same as if it were opened and then closed.
regionState.getRegion(), RegionState.State.FAILED_OPEN); regionState = regionStates.updateRegionState(rt, RegionState.State.CLOSED);
// remove the tracking info to save memory, also reset if (regionState != null) {
// the count for next open initiative // When there are more than one region server a new RS is selected as the
failedOpenTracker.remove(encodedName); // destination and the same is updated in the regionplan. (HBASE-5546)
} else {
getRegionPlan(regionState.getRegion(), sn, true); getRegionPlan(regionState.getRegion(), sn, true);
this.executorService.submit(new ClosedRegionHandler(server, this.executorService.submit(new ClosedRegionHandler(server,
this, regionState.getRegion())); this, regionState.getRegion()));
@ -1757,10 +1754,10 @@ public class AssignmentManager extends ZooKeeperListener {
case CLOSING: case CLOSING:
case PENDING_CLOSE: case PENDING_CLOSE:
case FAILED_CLOSE: case FAILED_CLOSE:
case FAILED_OPEN:
unassign(region, state, -1, null, false, null); unassign(region, state, -1, null, false, null);
state = regionStates.getRegionState(region); state = regionStates.getRegionState(region);
if (state.isOffline()) break; if (state.isOffline()) break;
case FAILED_OPEN:
case CLOSED: case CLOSED:
LOG.debug("Forcing OFFLINE; was=" + state); LOG.debug("Forcing OFFLINE; was=" + state);
state = regionStates.updateRegionState( state = regionStates.updateRegionState(

View File

@ -248,7 +248,7 @@ public class RegionStates {
if (state == State.FAILED_CLOSE || state == State.FAILED_OPEN) { if (state == State.FAILED_CLOSE || state == State.FAILED_OPEN) {
LOG.warn("Failed to transition " + hri.getShortNameToLog() LOG.warn("Failed to transition " + hri.getShortNameToLog()
+ " on " + serverName + ": " + state); + " on " + serverName + ", set to " + state);
} }
String regionName = hri.getEncodedName(); String regionName = hri.getEncodedName();

View File

@ -19,6 +19,8 @@ package org.apache.hadoop.hbase.master;
import static org.junit.Assert.assertEquals; import static org.junit.Assert.assertEquals;
import static org.junit.Assert.assertFalse; import static org.junit.Assert.assertFalse;
import static org.junit.Assert.assertNotNull;
import static org.junit.Assert.assertNull;
import static org.junit.Assert.assertTrue; import static org.junit.Assert.assertTrue;
import static org.junit.Assert.fail; import static org.junit.Assert.fail;
@ -392,6 +394,8 @@ public class TestAssignmentManagerOnCluster {
RegionState state = am.getRegionStates().getRegionState(hri); RegionState state = am.getRegionStates().getRegionState(hri);
assertEquals(RegionState.State.FAILED_OPEN, state.getState()); assertEquals(RegionState.State.FAILED_OPEN, state.getState());
// Failed to open since no plan, so it's on no server
assertNull(state.getServerName());
MockLoadBalancer.controledRegion = null; MockLoadBalancer.controledRegion = null;
master.assignRegion(hri); master.assignRegion(hri);
@ -436,6 +440,10 @@ public class TestAssignmentManagerOnCluster {
RegionState state = am.getRegionStates().getRegionState(hri); RegionState state = am.getRegionStates().getRegionState(hri);
assertEquals(RegionState.State.FAILED_OPEN, state.getState()); assertEquals(RegionState.State.FAILED_OPEN, state.getState());
// Failed to open due to file system issue. Region state should
// carry the opening region server so that we can force close it
// later on before opening it again. See HBASE-9092.
assertNotNull(state.getServerName());
// remove the blocking file, so that region can be opened // remove the blocking file, so that region can be opened
fs.delete(regionDir, true); fs.delete(regionDir, true);