MAPREDUCE-5833. TestRMContainerAllocator fails ocassionally. Contributed by Zhijie Shen.
git-svn-id: https://svn.apache.org/repos/asf/hadoop/common/branches/branch-2@1589259 13f79535-47bb-0310-9956-ffa450edef68
This commit is contained in:
parent
babe6545d4
commit
2d8f62f5c1
|
@ -79,6 +79,9 @@ Release 2.4.1 - UNRELEASED
|
||||||
MAPREDUCE-5827. TestSpeculativeExecutionWithMRApp fails.
|
MAPREDUCE-5827. TestSpeculativeExecutionWithMRApp fails.
|
||||||
(Zhijie Shen via cnauroth)
|
(Zhijie Shen via cnauroth)
|
||||||
|
|
||||||
|
MAPREDUCE-5833. TestRMContainerAllocator fails ocassionally.
|
||||||
|
(Zhijie Shen via cnauroth)
|
||||||
|
|
||||||
Release 2.4.0 - 2014-04-07
|
Release 2.4.0 - 2014-04-07
|
||||||
|
|
||||||
INCOMPATIBLE CHANGES
|
INCOMPATIBLE CHANGES
|
||||||
|
|
|
@ -151,7 +151,8 @@ public class RMContainerAllocator extends RMContainerRequestor
|
||||||
private long retryInterval;
|
private long retryInterval;
|
||||||
private long retrystartTime;
|
private long retrystartTime;
|
||||||
|
|
||||||
BlockingQueue<ContainerAllocatorEvent> eventQueue
|
@VisibleForTesting
|
||||||
|
protected BlockingQueue<ContainerAllocatorEvent> eventQueue
|
||||||
= new LinkedBlockingQueue<ContainerAllocatorEvent>();
|
= new LinkedBlockingQueue<ContainerAllocatorEvent>();
|
||||||
|
|
||||||
private ScheduleStats scheduleStats = new ScheduleStats();
|
private ScheduleStats scheduleStats = new ScheduleStats();
|
||||||
|
|
|
@ -54,6 +54,7 @@ import org.apache.hadoop.mapreduce.v2.api.records.TaskState;
|
||||||
import org.apache.hadoop.mapreduce.v2.api.records.TaskType;
|
import org.apache.hadoop.mapreduce.v2.api.records.TaskType;
|
||||||
import org.apache.hadoop.mapreduce.v2.app.client.ClientService;
|
import org.apache.hadoop.mapreduce.v2.app.client.ClientService;
|
||||||
import org.apache.hadoop.mapreduce.v2.app.job.Job;
|
import org.apache.hadoop.mapreduce.v2.app.job.Job;
|
||||||
|
import org.apache.hadoop.mapreduce.v2.app.job.JobStateInternal;
|
||||||
import org.apache.hadoop.mapreduce.v2.app.job.Task;
|
import org.apache.hadoop.mapreduce.v2.app.job.Task;
|
||||||
import org.apache.hadoop.mapreduce.v2.app.job.TaskAttempt;
|
import org.apache.hadoop.mapreduce.v2.app.job.TaskAttempt;
|
||||||
import org.apache.hadoop.mapreduce.v2.app.job.TaskAttemptStateInternal;
|
import org.apache.hadoop.mapreduce.v2.app.job.TaskAttemptStateInternal;
|
||||||
|
@ -62,6 +63,7 @@ import org.apache.hadoop.mapreduce.v2.app.job.event.TaskAttemptContainerAssigned
|
||||||
import org.apache.hadoop.mapreduce.v2.app.job.event.TaskAttemptEvent;
|
import org.apache.hadoop.mapreduce.v2.app.job.event.TaskAttemptEvent;
|
||||||
import org.apache.hadoop.mapreduce.v2.app.job.event.TaskAttemptEventType;
|
import org.apache.hadoop.mapreduce.v2.app.job.event.TaskAttemptEventType;
|
||||||
import org.apache.hadoop.mapreduce.v2.app.job.event.TaskAttemptKillEvent;
|
import org.apache.hadoop.mapreduce.v2.app.job.event.TaskAttemptKillEvent;
|
||||||
|
import org.apache.hadoop.mapreduce.v2.app.job.impl.JobImpl;
|
||||||
import org.apache.hadoop.mapreduce.v2.app.job.impl.TaskAttemptImpl;
|
import org.apache.hadoop.mapreduce.v2.app.job.impl.TaskAttemptImpl;
|
||||||
import org.apache.hadoop.mapreduce.v2.app.rm.ContainerAllocator;
|
import org.apache.hadoop.mapreduce.v2.app.rm.ContainerAllocator;
|
||||||
import org.apache.hadoop.mapreduce.v2.app.rm.ContainerFailedEvent;
|
import org.apache.hadoop.mapreduce.v2.app.rm.ContainerFailedEvent;
|
||||||
|
@ -73,6 +75,7 @@ import org.apache.hadoop.net.NetUtils;
|
||||||
import org.apache.hadoop.net.NetworkTopology;
|
import org.apache.hadoop.net.NetworkTopology;
|
||||||
import org.apache.hadoop.security.UserGroupInformation;
|
import org.apache.hadoop.security.UserGroupInformation;
|
||||||
import org.apache.hadoop.security.token.Token;
|
import org.apache.hadoop.security.token.Token;
|
||||||
|
import org.apache.hadoop.test.GenericTestUtils;
|
||||||
import org.apache.hadoop.yarn.api.ApplicationMasterProtocol;
|
import org.apache.hadoop.yarn.api.ApplicationMasterProtocol;
|
||||||
import org.apache.hadoop.yarn.api.records.ApplicationAttemptId;
|
import org.apache.hadoop.yarn.api.records.ApplicationAttemptId;
|
||||||
import org.apache.hadoop.yarn.api.records.ApplicationId;
|
import org.apache.hadoop.yarn.api.records.ApplicationId;
|
||||||
|
@ -104,6 +107,8 @@ import org.junit.After;
|
||||||
import org.junit.Before;
|
import org.junit.Before;
|
||||||
import org.junit.Test;
|
import org.junit.Test;
|
||||||
|
|
||||||
|
import com.google.common.base.Supplier;
|
||||||
|
|
||||||
@SuppressWarnings("unchecked")
|
@SuppressWarnings("unchecked")
|
||||||
public class TestRMContainerAllocator {
|
public class TestRMContainerAllocator {
|
||||||
|
|
||||||
|
@ -579,7 +584,7 @@ public class TestRMContainerAllocator {
|
||||||
MyContainerAllocator allocator = (MyContainerAllocator) mrApp
|
MyContainerAllocator allocator = (MyContainerAllocator) mrApp
|
||||||
.getContainerAllocator();
|
.getContainerAllocator();
|
||||||
|
|
||||||
mrApp.waitForState(job, JobState.RUNNING);
|
mrApp.waitForInternalState((JobImpl) job, JobStateInternal.RUNNING);
|
||||||
|
|
||||||
amDispatcher.await();
|
amDispatcher.await();
|
||||||
// Wait till all map-attempts request for containers
|
// Wait till all map-attempts request for containers
|
||||||
|
@ -731,7 +736,7 @@ public class TestRMContainerAllocator {
|
||||||
MyContainerAllocator allocator = (MyContainerAllocator) mrApp
|
MyContainerAllocator allocator = (MyContainerAllocator) mrApp
|
||||||
.getContainerAllocator();
|
.getContainerAllocator();
|
||||||
|
|
||||||
mrApp.waitForState(job, JobState.RUNNING);
|
mrApp.waitForInternalState((JobImpl)job, JobStateInternal.RUNNING);
|
||||||
|
|
||||||
amDispatcher.await();
|
amDispatcher.await();
|
||||||
// Wait till all map-attempts request for containers
|
// Wait till all map-attempts request for containers
|
||||||
|
@ -1550,7 +1555,15 @@ public class TestRMContainerAllocator {
|
||||||
}
|
}
|
||||||
|
|
||||||
// API to be used by tests
|
// API to be used by tests
|
||||||
public List<TaskAttemptContainerAssignedEvent> schedule() {
|
public List<TaskAttemptContainerAssignedEvent> schedule()
|
||||||
|
throws Exception {
|
||||||
|
// before doing heartbeat with RM, drain all the outstanding events to
|
||||||
|
// ensure all the requests before this heartbeat is to be handled
|
||||||
|
GenericTestUtils.waitFor(new Supplier<Boolean>() {
|
||||||
|
public Boolean get() {
|
||||||
|
return eventQueue.isEmpty();
|
||||||
|
}
|
||||||
|
}, 100, 10000);
|
||||||
// run the scheduler
|
// run the scheduler
|
||||||
try {
|
try {
|
||||||
super.heartbeat();
|
super.heartbeat();
|
||||||
|
@ -1586,7 +1599,6 @@ public class TestRMContainerAllocator {
|
||||||
public boolean isUnregistered() {
|
public boolean isUnregistered() {
|
||||||
return isUnregistered;
|
return isUnregistered;
|
||||||
}
|
}
|
||||||
|
|
||||||
}
|
}
|
||||||
|
|
||||||
@Test
|
@Test
|
||||||
|
|
Loading…
Reference in New Issue