HBASE-18525 [AMv2] Fixed test TestAssignmentManager#testSocketTimeout on master branch

This commit is contained in:
Umesh Agashe 2017-08-08 17:01:00 -07:00 committed by Michael Stack
parent 7a00571795
commit f855b51650
3 changed files with 35 additions and 3 deletions

View File

@ -53,6 +53,34 @@ import org.apache.hadoop.hbase.shaded.protobuf.generated.RegionServerStatusProto
* to remote server is sent and the Procedure is suspended waiting on external * to remote server is sent and the Procedure is suspended waiting on external
* event to be woken again. Once the external event is triggered, Procedure * event to be woken again. Once the external event is triggered, Procedure
* moves to the REGION_TRANSITION_FINISH state. * moves to the REGION_TRANSITION_FINISH state.
*
* <p>NOTE: {@link AssignProcedure} and {@link UnassignProcedure} should not be thought of
* as being asymmetric, at least currently.
* <ul>
* <li>{@link AssignProcedure} moves through all the above described states and implements methods
* associated with each while {@link UnassignProcedure} starts at state
* REGION_TRANSITION_DISPATCH and state REGION_TRANSITION_QUEUE is not supported.</li>
*
* <li>When any step in {@link AssignProcedure} fails, failure handler
* AssignProcedure#handleFailure(MasterProcedureEnv, RegionStateNode) re-attempts the
* assignment by setting the procedure state to REGION_TRANSITION_QUEUE and forces
* assignment to a different target server by setting {@link AssignProcedure#forceNewPlan}. When
* the number of attempts reach hreshold configuration 'hbase.assignment.maximum.attempts',
* the procedure is aborted. For {@link UnassignProcedure}, similar re-attempts are
* intentionally not implemented. It is a 'one shot' procedure.
* </li>
* </ul>
*
* <p>TODO: Considering it is a priority doing all we can to get make a region available as soon as possible,
* re-attempting with any target makes sense if specified target fails in case of
* {@link AssignProcedure}. For {@link UnassignProcedure}, if communication with RS fails,
* similar re-attempt makes little sense (what should be different from previous attempt?). Also it
* could be complex with current implementation of
* {@link RegionTransitionProcedure#execute(MasterProcedureEnv)} and {@link UnassignProcedure}.
* We have made a choice of keeping {@link UnassignProcedure} simple, where the procedure either
* succeeds or fails depending on communication with RS. As parent will have broader context, parent
* can better handle the failed instance of {@link UnassignProcedure}. Similar simplicity for
* {@link AssignProcedure} is desired and should be explored/ discussed further.
*/ */
@InterfaceAudience.Private @InterfaceAudience.Private
public abstract class RegionTransitionProcedure public abstract class RegionTransitionProcedure
@ -378,4 +406,4 @@ public abstract class RegionTransitionProcedure
* @return ServerName the Assign or Unassign is going against. * @return ServerName the Assign or Unassign is going against.
*/ */
public abstract ServerName getServer(final MasterProcedureEnv env); public abstract ServerName getServer(final MasterProcedureEnv env);
} }

View File

@ -56,6 +56,7 @@ import org.apache.hadoop.hbase.master.procedure.MasterProcedureConstants;
import org.apache.hadoop.hbase.master.procedure.MasterProcedureScheduler; import org.apache.hadoop.hbase.master.procedure.MasterProcedureScheduler;
import org.apache.hadoop.hbase.master.procedure.ProcedureSyncWait; import org.apache.hadoop.hbase.master.procedure.ProcedureSyncWait;
import org.apache.hadoop.hbase.master.procedure.RSProcedureDispatcher; import org.apache.hadoop.hbase.master.procedure.RSProcedureDispatcher;
import org.apache.hadoop.hbase.master.procedure.ServerCrashException;
import org.apache.hadoop.hbase.procedure2.Procedure; import org.apache.hadoop.hbase.procedure2.Procedure;
import org.apache.hadoop.hbase.procedure2.ProcedureMetrics; import org.apache.hadoop.hbase.procedure2.ProcedureMetrics;
import org.apache.hadoop.hbase.procedure2.ProcedureTestingUtility; import org.apache.hadoop.hbase.procedure2.ProcedureTestingUtility;
@ -89,6 +90,7 @@ import org.junit.Ignore;
import org.junit.Rule; import org.junit.Rule;
import org.junit.Test; import org.junit.Test;
import org.junit.experimental.categories.Category; import org.junit.experimental.categories.Category;
import org.junit.rules.ExpectedException;
import org.junit.rules.TestName; import org.junit.rules.TestName;
import org.junit.rules.TestRule; import org.junit.rules.TestRule;
@ -102,6 +104,7 @@ public class TestAssignmentManager {
@Rule public final TestRule timeout = @Rule public final TestRule timeout =
CategoryBasedTimeout.builder().withTimeout(this.getClass()). CategoryBasedTimeout.builder().withTimeout(this.getClass()).
withLookingForStuckThread(true).build(); withLookingForStuckThread(true).build();
@Rule public final ExpectedException exception = ExpectedException.none();
private static final int PROC_NTHREADS = 64; private static final int PROC_NTHREADS = 64;
private static final int NREGIONS = 1 * 1000; private static final int NREGIONS = 1 * 1000;
@ -252,12 +255,14 @@ public class TestAssignmentManager {
waitOnFuture(submitProcedure(am.createAssignProcedure(hri, false))); waitOnFuture(submitProcedure(am.createAssignProcedure(hri, false)));
rsDispatcher.setMockRsExecutor(new SocketTimeoutRsExecutor(20, 3)); rsDispatcher.setMockRsExecutor(new SocketTimeoutRsExecutor(20, 3));
exception.expect(ServerCrashException.class);
waitOnFuture(submitProcedure(am.createUnassignProcedure(hri, null, false))); waitOnFuture(submitProcedure(am.createUnassignProcedure(hri, null, false)));
assertEquals(assignSubmittedCount + 1, assignProcMetrics.getSubmittedCounter().getCount()); assertEquals(assignSubmittedCount + 1, assignProcMetrics.getSubmittedCounter().getCount());
assertEquals(assignFailedCount, assignProcMetrics.getFailedCounter().getCount()); assertEquals(assignFailedCount, assignProcMetrics.getFailedCounter().getCount());
assertEquals(unassignSubmittedCount + 1, unassignProcMetrics.getSubmittedCounter().getCount()); assertEquals(unassignSubmittedCount + 1, unassignProcMetrics.getSubmittedCounter().getCount());
assertEquals(unassignFailedCount, unassignProcMetrics.getFailedCounter().getCount()); assertEquals(unassignFailedCount + 1, unassignProcMetrics.getFailedCounter().getCount());
} }
@Test @Test

View File

@ -1312,7 +1312,6 @@
</maven.build.timestamp.format> </maven.build.timestamp.format>
<buildDate>${maven.build.timestamp}</buildDate> <buildDate>${maven.build.timestamp}</buildDate>
<compileSource>1.8</compileSource> <compileSource>1.8</compileSource>
<hbase-thirdparty.version>1.0.0</hbase-thirdparty.version>
<!-- Build dependencies --> <!-- Build dependencies -->
<maven.min.version>3.0.4</maven.min.version> <maven.min.version>3.0.4</maven.min.version>
<java.min.version>${compileSource}</java.min.version> <java.min.version>${compileSource}</java.min.version>