YARN-4677. RMNodeResourceUpdateEvent update from scheduler can lead to race condition (wilfreds and gphillips via rkanter)
(cherry picked from commit 0cd145a443
)
This commit is contained in:
parent
10e35ed322
commit
93d6ed859e
|
@ -1106,12 +1106,16 @@ public abstract class AbstractYarnScheduler
|
||||||
}
|
}
|
||||||
|
|
||||||
// Process new container information
|
// Process new container information
|
||||||
|
// NOTICE: it is possible to not find the NodeID as a node can be
|
||||||
|
// decommissioned at the same time. Skip updates if node is null.
|
||||||
SchedulerNode schedulerNode = getNode(nm.getNodeID());
|
SchedulerNode schedulerNode = getNode(nm.getNodeID());
|
||||||
List<ContainerStatus> completedContainers = updateNewContainerInfo(nm,
|
List<ContainerStatus> completedContainers = updateNewContainerInfo(nm,
|
||||||
schedulerNode);
|
schedulerNode);
|
||||||
|
|
||||||
// Notify Scheduler Node updated.
|
// Notify Scheduler Node updated.
|
||||||
schedulerNode.notifyNodeUpdate();
|
if (schedulerNode != null) {
|
||||||
|
schedulerNode.notifyNodeUpdate();
|
||||||
|
}
|
||||||
|
|
||||||
// Process completed containers
|
// Process completed containers
|
||||||
Resource releasedResources = Resource.newInstance(0, 0);
|
Resource releasedResources = Resource.newInstance(0, 0);
|
||||||
|
@ -1121,9 +1125,7 @@ public abstract class AbstractYarnScheduler
|
||||||
// If the node is decommissioning, send an update to have the total
|
// If the node is decommissioning, send an update to have the total
|
||||||
// resource equal to the used resource, so no available resource to
|
// resource equal to the used resource, so no available resource to
|
||||||
// schedule.
|
// schedule.
|
||||||
// TODO YARN-5128: Fix possible race-condition when request comes in before
|
if (nm.getState() == NodeState.DECOMMISSIONING && schedulerNode != null) {
|
||||||
// update is propagated
|
|
||||||
if (nm.getState() == NodeState.DECOMMISSIONING) {
|
|
||||||
this.rmContext
|
this.rmContext
|
||||||
.getDispatcher()
|
.getDispatcher()
|
||||||
.getEventHandler()
|
.getEventHandler()
|
||||||
|
@ -1133,13 +1135,16 @@ public abstract class AbstractYarnScheduler
|
||||||
}
|
}
|
||||||
|
|
||||||
updateSchedulerHealthInformation(releasedResources, releasedContainers);
|
updateSchedulerHealthInformation(releasedResources, releasedContainers);
|
||||||
updateNodeResourceUtilization(nm, schedulerNode);
|
if (schedulerNode != null) {
|
||||||
|
updateNodeResourceUtilization(nm, schedulerNode);
|
||||||
|
}
|
||||||
|
|
||||||
// Now node data structures are up-to-date and ready for scheduling.
|
// Now node data structures are up-to-date and ready for scheduling.
|
||||||
if(LOG.isDebugEnabled()) {
|
if(LOG.isDebugEnabled()) {
|
||||||
LOG.debug(
|
LOG.debug(
|
||||||
"Node being looked for scheduling " + nm + " availableResource: "
|
"Node being looked for scheduling " + nm + " availableResource: " +
|
||||||
+ schedulerNode.getUnallocatedResource());
|
(schedulerNode == null ? "unknown (decommissioned)" :
|
||||||
|
schedulerNode.getUnallocatedResource()));
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
|
@ -1030,7 +1030,7 @@ public class FairScheduler extends
|
||||||
return;
|
return;
|
||||||
}
|
}
|
||||||
|
|
||||||
final NodeId nodeID = node.getNodeID();
|
final NodeId nodeID = (node != null ? node.getNodeID() : null);
|
||||||
if (!nodeTracker.exists(nodeID)) {
|
if (!nodeTracker.exists(nodeID)) {
|
||||||
// The node might have just been removed while this thread was waiting
|
// The node might have just been removed while this thread was waiting
|
||||||
// on the synchronized lock before it entered this synchronized method
|
// on the synchronized lock before it entered this synchronized method
|
||||||
|
|
|
@ -966,8 +966,10 @@ public class FifoScheduler extends
|
||||||
return;
|
return;
|
||||||
}
|
}
|
||||||
|
|
||||||
if (Resources.greaterThanOrEqual(resourceCalculator, getClusterResource(),
|
// A decommissioned node might be removed before we get here
|
||||||
node.getUnallocatedResource(), minimumAllocation)) {
|
if (node != null &&
|
||||||
|
Resources.greaterThanOrEqual(resourceCalculator, getClusterResource(),
|
||||||
|
node.getUnallocatedResource(), minimumAllocation)) {
|
||||||
LOG.debug("Node heartbeat " + nm.getNodeID() +
|
LOG.debug("Node heartbeat " + nm.getNodeID() +
|
||||||
" available resource = " + node.getUnallocatedResource());
|
" available resource = " + node.getUnallocatedResource());
|
||||||
|
|
||||||
|
|
|
@ -258,14 +258,12 @@ public class TestCapacityScheduler extends CapacitySchedulerTestBase {
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
private NodeManager
|
private NodeManager registerNode(String hostName, int containerManagerPort,
|
||||||
registerNode(String hostName, int containerManagerPort, int httpPort,
|
int httpPort, String rackName,
|
||||||
String rackName, Resource capability)
|
Resource capability)
|
||||||
throws IOException, YarnException {
|
throws IOException, YarnException {
|
||||||
NodeManager nm =
|
NodeManager nm = new NodeManager(hostName, containerManagerPort, httpPort,
|
||||||
new NodeManager(
|
rackName, capability, resourceManager);
|
||||||
hostName, containerManagerPort, httpPort, rackName, capability,
|
|
||||||
resourceManager);
|
|
||||||
NodeAddedSchedulerEvent nodeAddEvent1 =
|
NodeAddedSchedulerEvent nodeAddEvent1 =
|
||||||
new NodeAddedSchedulerEvent(resourceManager.getRMContext()
|
new NodeAddedSchedulerEvent(resourceManager.getRMContext()
|
||||||
.getRMNodes().get(nm.getNodeId()));
|
.getRMNodes().get(nm.getNodeId()));
|
||||||
|
@ -280,13 +278,13 @@ public class TestCapacityScheduler extends CapacitySchedulerTestBase {
|
||||||
|
|
||||||
// Register node1
|
// Register node1
|
||||||
String host_0 = "host_0";
|
String host_0 = "host_0";
|
||||||
org.apache.hadoop.yarn.server.resourcemanager.NodeManager nm_0 =
|
NodeManager nm_0 =
|
||||||
registerNode(host_0, 1234, 2345, NetworkTopology.DEFAULT_RACK,
|
registerNode(host_0, 1234, 2345, NetworkTopology.DEFAULT_RACK,
|
||||||
Resources.createResource(4 * GB, 1));
|
Resources.createResource(4 * GB, 1));
|
||||||
|
|
||||||
// Register node2
|
// Register node2
|
||||||
String host_1 = "host_1";
|
String host_1 = "host_1";
|
||||||
org.apache.hadoop.yarn.server.resourcemanager.NodeManager nm_1 =
|
NodeManager nm_1 =
|
||||||
registerNode(host_1, 1234, 2345, NetworkTopology.DEFAULT_RACK,
|
registerNode(host_1, 1234, 2345, NetworkTopology.DEFAULT_RACK,
|
||||||
Resources.createResource(2 * GB, 1));
|
Resources.createResource(2 * GB, 1));
|
||||||
|
|
||||||
|
@ -4038,6 +4036,29 @@ public class TestCapacityScheduler extends CapacitySchedulerTestBase {
|
||||||
Assert.fail("Cannot find RMContainer");
|
Assert.fail("Cannot find RMContainer");
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
@Test
|
||||||
|
public void testRemovedNodeDecomissioningNode() throws Exception {
|
||||||
|
// Register nodemanager
|
||||||
|
NodeManager nm = registerNode("host_decom", 1234, 2345,
|
||||||
|
NetworkTopology.DEFAULT_RACK, Resources.createResource(8 * GB, 4));
|
||||||
|
|
||||||
|
RMNode node =
|
||||||
|
resourceManager.getRMContext().getRMNodes().get(nm.getNodeId());
|
||||||
|
// Send a heartbeat to kick the tires on the Scheduler
|
||||||
|
NodeUpdateSchedulerEvent nodeUpdate = new NodeUpdateSchedulerEvent(node);
|
||||||
|
resourceManager.getResourceScheduler().handle(nodeUpdate);
|
||||||
|
|
||||||
|
// force remove the node to simulate race condition
|
||||||
|
((CapacityScheduler) resourceManager.getResourceScheduler()).getNodeTracker().
|
||||||
|
removeNode(nm.getNodeId());
|
||||||
|
// Kick off another heartbeat with the node state mocked to decommissioning
|
||||||
|
RMNode spyNode =
|
||||||
|
Mockito.spy(resourceManager.getRMContext().getRMNodes()
|
||||||
|
.get(nm.getNodeId()));
|
||||||
|
when(spyNode.getState()).thenReturn(NodeState.DECOMMISSIONING);
|
||||||
|
resourceManager.getResourceScheduler().handle(
|
||||||
|
new NodeUpdateSchedulerEvent(spyNode));
|
||||||
|
}
|
||||||
|
|
||||||
@Test
|
@Test
|
||||||
public void testResourceUpdateDecommissioningNode() throws Exception {
|
public void testResourceUpdateDecommissioningNode() throws Exception {
|
||||||
|
@ -4064,9 +4085,8 @@ public class TestCapacityScheduler extends CapacitySchedulerTestBase {
|
||||||
((AsyncDispatcher) mockDispatcher).start();
|
((AsyncDispatcher) mockDispatcher).start();
|
||||||
// Register node
|
// Register node
|
||||||
String host_0 = "host_0";
|
String host_0 = "host_0";
|
||||||
org.apache.hadoop.yarn.server.resourcemanager.NodeManager nm_0 =
|
NodeManager nm_0 = registerNode(host_0, 1234, 2345,
|
||||||
registerNode(host_0, 1234, 2345, NetworkTopology.DEFAULT_RACK,
|
NetworkTopology.DEFAULT_RACK, Resources.createResource(8 * GB, 4));
|
||||||
Resources.createResource(8 * GB, 4));
|
|
||||||
// ResourceRequest priorities
|
// ResourceRequest priorities
|
||||||
Priority priority_0 = Priority.newInstance(0);
|
Priority priority_0 = Priority.newInstance(0);
|
||||||
|
|
||||||
|
|
|
@ -77,6 +77,7 @@ import org.apache.hadoop.yarn.server.resourcemanager.MockAM;
|
||||||
import org.apache.hadoop.yarn.server.resourcemanager.MockNM;
|
import org.apache.hadoop.yarn.server.resourcemanager.MockNM;
|
||||||
import org.apache.hadoop.yarn.server.resourcemanager.MockNodes;
|
import org.apache.hadoop.yarn.server.resourcemanager.MockNodes;
|
||||||
import org.apache.hadoop.yarn.server.resourcemanager.MockRM;
|
import org.apache.hadoop.yarn.server.resourcemanager.MockRM;
|
||||||
|
import org.apache.hadoop.yarn.server.resourcemanager.NodeManager;
|
||||||
import org.apache.hadoop.yarn.server.resourcemanager.RMContext;
|
import org.apache.hadoop.yarn.server.resourcemanager.RMContext;
|
||||||
import org.apache.hadoop.yarn.server.resourcemanager.RMContextImpl;
|
import org.apache.hadoop.yarn.server.resourcemanager.RMContextImpl;
|
||||||
import org.apache.hadoop.yarn.server.resourcemanager.recovery.MemoryRMStateStore;
|
import org.apache.hadoop.yarn.server.resourcemanager.recovery.MemoryRMStateStore;
|
||||||
|
@ -4968,6 +4969,30 @@ public class TestFairScheduler extends FairSchedulerTestBase {
|
||||||
.get(attId3.getApplicationId()).getQueue());
|
.get(attId3.getApplicationId()).getQueue());
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@Test
|
||||||
|
public void testRemovedNodeDecomissioningNode() throws Exception {
|
||||||
|
// Register nodemanager
|
||||||
|
NodeManager nm = registerNode("host_decom", 1234, 2345,
|
||||||
|
NetworkTopology.DEFAULT_RACK, Resources.createResource(8 * GB, 4));
|
||||||
|
|
||||||
|
RMNode node =
|
||||||
|
resourceManager.getRMContext().getRMNodes().get(nm.getNodeId());
|
||||||
|
// Send a heartbeat to kick the tires on the Scheduler
|
||||||
|
NodeUpdateSchedulerEvent nodeUpdate = new NodeUpdateSchedulerEvent(node);
|
||||||
|
resourceManager.getResourceScheduler().handle(nodeUpdate);
|
||||||
|
|
||||||
|
// Force remove the node to simulate race condition
|
||||||
|
((FairScheduler) resourceManager.getResourceScheduler())
|
||||||
|
.getNodeTracker().removeNode(nm.getNodeId());
|
||||||
|
// Kick off another heartbeat with the node state mocked to decommissioning
|
||||||
|
RMNode spyNode =
|
||||||
|
Mockito.spy(resourceManager.getRMContext().getRMNodes()
|
||||||
|
.get(nm.getNodeId()));
|
||||||
|
when(spyNode.getState()).thenReturn(NodeState.DECOMMISSIONING);
|
||||||
|
resourceManager.getResourceScheduler().handle(
|
||||||
|
new NodeUpdateSchedulerEvent(spyNode));
|
||||||
|
}
|
||||||
|
|
||||||
@Test
|
@Test
|
||||||
public void testResourceUpdateDecommissioningNode() throws Exception {
|
public void testResourceUpdateDecommissioningNode() throws Exception {
|
||||||
// Mock the RMNodeResourceUpdate event handler to update SchedulerNode
|
// Mock the RMNodeResourceUpdate event handler to update SchedulerNode
|
||||||
|
@ -4993,9 +5018,8 @@ public class TestFairScheduler extends FairSchedulerTestBase {
|
||||||
((AsyncDispatcher) mockDispatcher).start();
|
((AsyncDispatcher) mockDispatcher).start();
|
||||||
// Register node
|
// Register node
|
||||||
String host_0 = "host_0";
|
String host_0 = "host_0";
|
||||||
org.apache.hadoop.yarn.server.resourcemanager.NodeManager nm_0 =
|
NodeManager nm_0 = registerNode(host_0, 1234, 2345,
|
||||||
registerNode(host_0, 1234, 2345, NetworkTopology.DEFAULT_RACK,
|
NetworkTopology.DEFAULT_RACK, Resources.createResource(8 * GB, 4));
|
||||||
Resources.createResource(8 * GB, 4));
|
|
||||||
|
|
||||||
RMNode node =
|
RMNode node =
|
||||||
resourceManager.getRMContext().getRMNodes().get(nm_0.getNodeId());
|
resourceManager.getRMContext().getRMNodes().get(nm_0.getNodeId());
|
||||||
|
@ -5033,13 +5057,12 @@ public class TestFairScheduler extends FairSchedulerTestBase {
|
||||||
Assert.assertEquals(availableResource.getVirtualCores(), 0);
|
Assert.assertEquals(availableResource.getVirtualCores(), 0);
|
||||||
}
|
}
|
||||||
|
|
||||||
private org.apache.hadoop.yarn.server.resourcemanager.NodeManager registerNode(
|
private NodeManager registerNode(String hostName, int containerManagerPort,
|
||||||
String hostName, int containerManagerPort, int httpPort, String rackName,
|
int httpPort, String rackName,
|
||||||
Resource capability) throws IOException, YarnException {
|
Resource capability)
|
||||||
org.apache.hadoop.yarn.server.resourcemanager.NodeManager nm =
|
throws IOException, YarnException {
|
||||||
new org.apache.hadoop.yarn.server.resourcemanager.NodeManager(hostName,
|
NodeManager nm = new NodeManager(hostName, containerManagerPort, httpPort,
|
||||||
containerManagerPort, httpPort, rackName, capability,
|
rackName, capability, resourceManager);
|
||||||
resourceManager);
|
|
||||||
|
|
||||||
// after YARN-5375, scheduler event is processed in rm main dispatcher,
|
// after YARN-5375, scheduler event is processed in rm main dispatcher,
|
||||||
// wait it processed, or may lead dead lock
|
// wait it processed, or may lead dead lock
|
||||||
|
|
|
@ -66,6 +66,7 @@ import org.apache.hadoop.yarn.server.resourcemanager.MockAM;
|
||||||
import org.apache.hadoop.yarn.server.resourcemanager.MockNM;
|
import org.apache.hadoop.yarn.server.resourcemanager.MockNM;
|
||||||
import org.apache.hadoop.yarn.server.resourcemanager.MockNodes;
|
import org.apache.hadoop.yarn.server.resourcemanager.MockNodes;
|
||||||
import org.apache.hadoop.yarn.server.resourcemanager.MockRM;
|
import org.apache.hadoop.yarn.server.resourcemanager.MockRM;
|
||||||
|
import org.apache.hadoop.yarn.server.resourcemanager.NodeManager;
|
||||||
import org.apache.hadoop.yarn.server.resourcemanager.RMContext;
|
import org.apache.hadoop.yarn.server.resourcemanager.RMContext;
|
||||||
import org.apache.hadoop.yarn.server.resourcemanager.RMContextImpl;
|
import org.apache.hadoop.yarn.server.resourcemanager.RMContextImpl;
|
||||||
import org.apache.hadoop.yarn.server.resourcemanager.ResourceManager;
|
import org.apache.hadoop.yarn.server.resourcemanager.ResourceManager;
|
||||||
|
@ -138,14 +139,12 @@ public class TestFifoScheduler {
|
||||||
resourceManager.stop();
|
resourceManager.stop();
|
||||||
}
|
}
|
||||||
|
|
||||||
private org.apache.hadoop.yarn.server.resourcemanager.NodeManager
|
private NodeManager registerNode(String hostName, int containerManagerPort,
|
||||||
registerNode(String hostName, int containerManagerPort, int nmHttpPort,
|
int nmHttpPort, String rackName,
|
||||||
String rackName, Resource capability) throws IOException,
|
Resource capability)
|
||||||
YarnException {
|
throws IOException, YarnException {
|
||||||
org.apache.hadoop.yarn.server.resourcemanager.NodeManager nm =
|
NodeManager nm = new NodeManager(hostName, containerManagerPort,
|
||||||
new org.apache.hadoop.yarn.server.resourcemanager.NodeManager(hostName,
|
nmHttpPort, rackName, capability, resourceManager);
|
||||||
containerManagerPort, nmHttpPort, rackName, capability,
|
|
||||||
resourceManager);
|
|
||||||
NodeAddedSchedulerEvent nodeAddEvent1 =
|
NodeAddedSchedulerEvent nodeAddEvent1 =
|
||||||
new NodeAddedSchedulerEvent(resourceManager.getRMContext().getRMNodes()
|
new NodeAddedSchedulerEvent(resourceManager.getRMContext().getRMNodes()
|
||||||
.get(nm.getNodeId()));
|
.get(nm.getNodeId()));
|
||||||
|
@ -1195,6 +1194,30 @@ public class TestFifoScheduler {
|
||||||
rm.stop();
|
rm.stop();
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@Test
|
||||||
|
public void testRemovedNodeDecomissioningNode() throws Exception {
|
||||||
|
// Register nodemanager
|
||||||
|
NodeManager nm = registerNode("host_decom", 1234, 2345,
|
||||||
|
NetworkTopology.DEFAULT_RACK, Resources.createResource(8 * GB, 4));
|
||||||
|
|
||||||
|
RMNode node =
|
||||||
|
resourceManager.getRMContext().getRMNodes().get(nm.getNodeId());
|
||||||
|
// Send a heartbeat to kick the tires on the Scheduler
|
||||||
|
NodeUpdateSchedulerEvent nodeUpdate = new NodeUpdateSchedulerEvent(node);
|
||||||
|
resourceManager.getResourceScheduler().handle(nodeUpdate);
|
||||||
|
|
||||||
|
// Force remove the node to simulate race condition
|
||||||
|
((FifoScheduler) resourceManager.getResourceScheduler())
|
||||||
|
.getNodeTracker().removeNode(nm.getNodeId());
|
||||||
|
// Kick off another heartbeat with the node state mocked to decommissioning
|
||||||
|
RMNode spyNode =
|
||||||
|
Mockito.spy(resourceManager.getRMContext().getRMNodes()
|
||||||
|
.get(nm.getNodeId()));
|
||||||
|
when(spyNode.getState()).thenReturn(NodeState.DECOMMISSIONING);
|
||||||
|
resourceManager.getResourceScheduler().handle(
|
||||||
|
new NodeUpdateSchedulerEvent(spyNode));
|
||||||
|
}
|
||||||
|
|
||||||
@Test
|
@Test
|
||||||
public void testResourceUpdateDecommissioningNode() throws Exception {
|
public void testResourceUpdateDecommissioningNode() throws Exception {
|
||||||
// Mock the RMNodeResourceUpdate event handler to update SchedulerNode
|
// Mock the RMNodeResourceUpdate event handler to update SchedulerNode
|
||||||
|
@ -1220,9 +1243,8 @@ public class TestFifoScheduler {
|
||||||
((AsyncDispatcher) mockDispatcher).start();
|
((AsyncDispatcher) mockDispatcher).start();
|
||||||
// Register node
|
// Register node
|
||||||
String host_0 = "host_0";
|
String host_0 = "host_0";
|
||||||
org.apache.hadoop.yarn.server.resourcemanager.NodeManager nm_0 =
|
NodeManager nm_0 = registerNode(host_0, 1234, 2345,
|
||||||
registerNode(host_0, 1234, 2345, NetworkTopology.DEFAULT_RACK,
|
NetworkTopology.DEFAULT_RACK, Resources.createResource(8 * GB, 4));
|
||||||
Resources.createResource(8 * GB, 4));
|
|
||||||
// ResourceRequest priorities
|
// ResourceRequest priorities
|
||||||
Priority priority_0 = Priority.newInstance(0);
|
Priority priority_0 = Priority.newInstance(0);
|
||||||
|
|
||||||
|
|
Loading…
Reference in New Issue