From 9c55bca8fbe3c2a37693b2d3c2db7bb326a890de Mon Sep 17 00:00:00 2001 From: Yannick Welsch Date: Fri, 28 Apr 2017 19:52:27 +0200 Subject: [PATCH] Fix node failure detection race when updating cluster state Failure detection should only be updated in ZenDiscovery after the current state has been updated to prevent a race condition with handleLeaveRequest and handleNodeFailure as those check the current state to determine whether the failure is to be handled by this node. --- .../discovery/zen/ZenDiscovery.java | 23 +++++++++++-------- 1 file changed, 13 insertions(+), 10 deletions(-) diff --git a/core/src/main/java/org/elasticsearch/discovery/zen/ZenDiscovery.java b/core/src/main/java/org/elasticsearch/discovery/zen/ZenDiscovery.java index f4bef4b2d91..af32afb99c9 100644 --- a/core/src/main/java/org/elasticsearch/discovery/zen/ZenDiscovery.java +++ b/core/src/main/java/org/elasticsearch/discovery/zen/ZenDiscovery.java @@ -775,16 +775,6 @@ public class ZenDiscovery extends AbstractLifecycleComponent implements Discover return false; } - if (newClusterState.nodes().isLocalNodeElectedMaster()) { - // update the set of nodes to ping - nodesFD.updateNodesAndPing(newClusterState); - } else { - // check to see that we monitor the correct master of the cluster - if (masterFD.masterNode() == null || !masterFD.masterNode().equals(newClusterState.nodes().getMasterNode())) { - masterFD.restart(newClusterState.nodes().getMasterNode(), "new cluster state received and we are monitoring the wrong master [" + masterFD.masterNode() + "]"); - } - } - if (currentState.blocks().hasGlobalBlock(discoverySettings.getNoMasterBlock())) { // its a fresh update from the master as we transition from a start of not having a master to having one logger.debug("got first state from fresh master [{}]", newClusterState.nodes().getMasterNodeId()); @@ -827,6 +817,19 @@ public class ZenDiscovery extends AbstractLifecycleComponent implements Discover state.set(adaptedNewClusterState); + // update failure detection only after the state has been updated to prevent race condition with handleLeaveRequest + // and handleNodeFailure as those check the current state to determine whether the failure is to be handled by this node + if (adaptedNewClusterState.nodes().isLocalNodeElectedMaster()) { + // update the set of nodes to ping + nodesFD.updateNodesAndPing(adaptedNewClusterState); + } else { + // check to see that we monitor the correct master of the cluster + if (masterFD.masterNode() == null || !masterFD.masterNode().equals(adaptedNewClusterState.nodes().getMasterNode())) { + masterFD.restart(adaptedNewClusterState.nodes().getMasterNode(), + "new cluster state received and we are monitoring the wrong master [" + masterFD.masterNode() + "]"); + } + } + clusterApplier.onNewClusterState("apply cluster state (from master [" + reason + "])", this::clusterState, new ClusterStateTaskListener() {