mirror of https://github.com/apache/lucene.git
SOLR-11285: Initial refactoring.
This commit is contained in:
parent
1a1286b54b
commit
aee54ff7d1
|
@ -18,6 +18,7 @@
|
||||||
package org.apache.solr.cloud;
|
package org.apache.solr.cloud;
|
||||||
|
|
||||||
|
|
||||||
|
import java.io.IOException;
|
||||||
import java.lang.invoke.MethodHandles;
|
import java.lang.invoke.MethodHandles;
|
||||||
import java.util.Collection;
|
import java.util.Collection;
|
||||||
import java.util.Collections;
|
import java.util.Collections;
|
||||||
|
@ -71,7 +72,7 @@ public class AddReplicaCmd implements OverseerCollectionMessageHandler.Cmd {
|
||||||
}
|
}
|
||||||
|
|
||||||
ZkNodeProps addReplica(ClusterState clusterState, ZkNodeProps message, NamedList results, Runnable onComplete)
|
ZkNodeProps addReplica(ClusterState clusterState, ZkNodeProps message, NamedList results, Runnable onComplete)
|
||||||
throws KeeperException, InterruptedException {
|
throws IOException, InterruptedException {
|
||||||
log.debug("addReplica() : {}", Utils.toJSONString(message));
|
log.debug("addReplica() : {}", Utils.toJSONString(message));
|
||||||
String collection = message.getStr(COLLECTION_PROP);
|
String collection = message.getStr(COLLECTION_PROP);
|
||||||
String node = message.getStr(CoreAdminParams.NODE);
|
String node = message.getStr(CoreAdminParams.NODE);
|
||||||
|
@ -120,7 +121,7 @@ public class AddReplicaCmd implements OverseerCollectionMessageHandler.Cmd {
|
||||||
}
|
}
|
||||||
} else {
|
} else {
|
||||||
node = getNodesForNewReplicas(clusterState, collection, shard, 1, node,
|
node = getNodesForNewReplicas(clusterState, collection, shard, 1, node,
|
||||||
ocmh.overseer.getZkController().getCoreContainer()).get(0).nodeName;// TODO: use replica type in this logic too
|
ocmh.overseer.getClusterDataProvider(), ocmh.overseer.getCoreContainer()).get(0).nodeName;// TODO: use replica type in this logic too
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
log.info("Node Identified {} for creating new replica", node);
|
log.info("Node Identified {} for creating new replica", node);
|
||||||
|
@ -159,7 +160,11 @@ public class AddReplicaCmd implements OverseerCollectionMessageHandler.Cmd {
|
||||||
if (coreNodeName != null) {
|
if (coreNodeName != null) {
|
||||||
props = props.plus(ZkStateReader.CORE_NODE_NAME_PROP, coreNodeName);
|
props = props.plus(ZkStateReader.CORE_NODE_NAME_PROP, coreNodeName);
|
||||||
}
|
}
|
||||||
Overseer.getStateUpdateQueue(zkStateReader.getZkClient()).offer(Utils.toJSON(props));
|
try {
|
||||||
|
Overseer.getStateUpdateQueue(zkStateReader.getZkClient()).offer(Utils.toJSON(props));
|
||||||
|
} catch (Exception e) {
|
||||||
|
throw new SolrException(SolrException.ErrorCode.SERVER_ERROR, "Exception updating Overseer state queue", e);
|
||||||
|
}
|
||||||
}
|
}
|
||||||
params.set(CoreAdminParams.CORE_NODE_NAME,
|
params.set(CoreAdminParams.CORE_NODE_NAME,
|
||||||
ocmh.waitToSeeReplicasInState(collection, Collections.singletonList(coreName)).get(coreName).getName());
|
ocmh.waitToSeeReplicasInState(collection, Collections.singletonList(coreName)).get(coreName).getName());
|
||||||
|
|
|
@ -31,6 +31,7 @@ import java.util.Set;
|
||||||
import java.util.stream.Collectors;
|
import java.util.stream.Collectors;
|
||||||
|
|
||||||
import com.google.common.collect.ImmutableMap;
|
import com.google.common.collect.ImmutableMap;
|
||||||
|
import org.apache.solr.client.solrj.cloud.autoscaling.ClusterDataProvider;
|
||||||
import org.apache.solr.client.solrj.cloud.autoscaling.PolicyHelper;
|
import org.apache.solr.client.solrj.cloud.autoscaling.PolicyHelper;
|
||||||
import org.apache.solr.client.solrj.impl.CloudSolrClient;
|
import org.apache.solr.client.solrj.impl.CloudSolrClient;
|
||||||
import org.apache.solr.client.solrj.impl.SolrClientDataProvider;
|
import org.apache.solr.client.solrj.impl.SolrClientDataProvider;
|
||||||
|
@ -243,10 +244,10 @@ public class Assign {
|
||||||
List<String> shardNames,
|
List<String> shardNames,
|
||||||
int numNrtReplicas,
|
int numNrtReplicas,
|
||||||
int numTlogReplicas,
|
int numTlogReplicas,
|
||||||
int numPullReplicas) throws KeeperException, InterruptedException {
|
int numPullReplicas) throws IOException, InterruptedException {
|
||||||
List<Map> rulesMap = (List) message.get("rule");
|
List<Map> rulesMap = (List) message.get("rule");
|
||||||
String policyName = message.getStr(POLICY);
|
String policyName = message.getStr(POLICY);
|
||||||
AutoScalingConfig autoScalingConfig = ocmh.zkStateReader.getAutoScalingConfig();
|
AutoScalingConfig autoScalingConfig = ocmh.overseer.getClusterDataProvider().getAutoScalingConfig();
|
||||||
|
|
||||||
if (rulesMap == null && policyName == null && autoScalingConfig.getPolicy().getClusterPolicy().isEmpty()) {
|
if (rulesMap == null && policyName == null && autoScalingConfig.getPolicy().getClusterPolicy().isEmpty()) {
|
||||||
log.debug("Identify nodes using default");
|
log.debug("Identify nodes using default");
|
||||||
|
@ -295,7 +296,7 @@ public class Assign {
|
||||||
PolicyHelper.SESSION_REF.set(ocmh.policySessionRef);
|
PolicyHelper.SESSION_REF.set(ocmh.policySessionRef);
|
||||||
try {
|
try {
|
||||||
return getPositionsUsingPolicy(collectionName,
|
return getPositionsUsingPolicy(collectionName,
|
||||||
shardNames, numNrtReplicas, numTlogReplicas, numPullReplicas, policyName, ocmh.zkStateReader, nodeList);
|
shardNames, numNrtReplicas, numTlogReplicas, numPullReplicas, policyName, ocmh.overseer.getClusterDataProvider(), nodeList);
|
||||||
} finally {
|
} finally {
|
||||||
PolicyHelper.SESSION_REF.remove();
|
PolicyHelper.SESSION_REF.remove();
|
||||||
}
|
}
|
||||||
|
@ -324,7 +325,7 @@ public class Assign {
|
||||||
// could be created on live nodes given maxShardsPerNode, Replication factor (if from createShard) etc.
|
// could be created on live nodes given maxShardsPerNode, Replication factor (if from createShard) etc.
|
||||||
public static List<ReplicaCount> getNodesForNewReplicas(ClusterState clusterState, String collectionName,
|
public static List<ReplicaCount> getNodesForNewReplicas(ClusterState clusterState, String collectionName,
|
||||||
String shard, int nrtReplicas,
|
String shard, int nrtReplicas,
|
||||||
Object createNodeSet, CoreContainer cc) throws KeeperException, InterruptedException {
|
Object createNodeSet, ClusterDataProvider cdp, CoreContainer cc) throws IOException, InterruptedException {
|
||||||
log.debug("getNodesForNewReplicas() shard: {} , replicas : {} , createNodeSet {}", shard, nrtReplicas, createNodeSet );
|
log.debug("getNodesForNewReplicas() shard: {} , replicas : {} , createNodeSet {}", shard, nrtReplicas, createNodeSet );
|
||||||
DocCollection coll = clusterState.getCollection(collectionName);
|
DocCollection coll = clusterState.getCollection(collectionName);
|
||||||
Integer maxShardsPerNode = coll.getMaxShardsPerNode();
|
Integer maxShardsPerNode = coll.getMaxShardsPerNode();
|
||||||
|
@ -356,13 +357,14 @@ public class Assign {
|
||||||
List l = (List) coll.get(DocCollection.RULE);
|
List l = (List) coll.get(DocCollection.RULE);
|
||||||
List<ReplicaPosition> replicaPositions = null;
|
List<ReplicaPosition> replicaPositions = null;
|
||||||
if (l != null) {
|
if (l != null) {
|
||||||
|
// TODO nocommit: make it so that this method doesn't require access to CC
|
||||||
replicaPositions = getNodesViaRules(clusterState, shard, nrtReplicas, cc, coll, createNodeList, l);
|
replicaPositions = getNodesViaRules(clusterState, shard, nrtReplicas, cc, coll, createNodeList, l);
|
||||||
}
|
}
|
||||||
String policyName = coll.getStr(POLICY);
|
String policyName = coll.getStr(POLICY);
|
||||||
AutoScalingConfig autoScalingConfig = cc.getZkController().zkStateReader.getAutoScalingConfig();
|
AutoScalingConfig autoScalingConfig = cdp.getAutoScalingConfig();
|
||||||
if (policyName != null || !autoScalingConfig.getPolicy().getClusterPolicy().isEmpty()) {
|
if (policyName != null || !autoScalingConfig.getPolicy().getClusterPolicy().isEmpty()) {
|
||||||
replicaPositions = Assign.getPositionsUsingPolicy(collectionName, Collections.singletonList(shard), nrtReplicas, 0, 0,
|
replicaPositions = Assign.getPositionsUsingPolicy(collectionName, Collections.singletonList(shard), nrtReplicas, 0, 0,
|
||||||
policyName, cc.getZkController().zkStateReader, createNodeList);
|
policyName, cdp, createNodeList);
|
||||||
}
|
}
|
||||||
|
|
||||||
if(replicaPositions != null){
|
if(replicaPositions != null){
|
||||||
|
@ -383,21 +385,18 @@ public class Assign {
|
||||||
int nrtReplicas,
|
int nrtReplicas,
|
||||||
int tlogReplicas,
|
int tlogReplicas,
|
||||||
int pullReplicas,
|
int pullReplicas,
|
||||||
String policyName, ZkStateReader zkStateReader,
|
String policyName, ClusterDataProvider cdp,
|
||||||
List<String> nodesList) throws KeeperException, InterruptedException {
|
List<String> nodesList) throws IOException, InterruptedException {
|
||||||
log.debug("shardnames {} NRT {} TLOG {} PULL {} , policy {}, nodeList {}", shardNames, nrtReplicas, tlogReplicas, pullReplicas, policyName, nodesList);
|
log.debug("shardnames {} NRT {} TLOG {} PULL {} , policy {}, nodeList {}", shardNames, nrtReplicas, tlogReplicas, pullReplicas, policyName, nodesList);
|
||||||
SolrClientDataProvider clientDataProvider = null;
|
SolrClientDataProvider clientDataProvider = null;
|
||||||
List<ReplicaPosition> replicaPositions = null;
|
List<ReplicaPosition> replicaPositions = null;
|
||||||
AutoScalingConfig autoScalingConfig = zkStateReader.getAutoScalingConfig();
|
AutoScalingConfig autoScalingConfig = cdp.getAutoScalingConfig();
|
||||||
try (CloudSolrClient csc = new CloudSolrClient.Builder()
|
try {
|
||||||
.withClusterStateProvider(new ZkClientClusterStateProvider(zkStateReader))
|
|
||||||
.build()) {
|
|
||||||
clientDataProvider = new SolrClientDataProvider(csc);
|
|
||||||
Map<String, String> kvMap = Collections.singletonMap(collName, policyName);
|
Map<String, String> kvMap = Collections.singletonMap(collName, policyName);
|
||||||
replicaPositions = PolicyHelper.getReplicaLocations(
|
replicaPositions = PolicyHelper.getReplicaLocations(
|
||||||
collName,
|
collName,
|
||||||
autoScalingConfig,
|
autoScalingConfig,
|
||||||
clientDataProvider,
|
cdp,
|
||||||
kvMap,
|
kvMap,
|
||||||
shardNames,
|
shardNames,
|
||||||
nrtReplicas,
|
nrtReplicas,
|
||||||
|
@ -405,7 +404,7 @@ public class Assign {
|
||||||
pullReplicas,
|
pullReplicas,
|
||||||
nodesList);
|
nodesList);
|
||||||
return replicaPositions;
|
return replicaPositions;
|
||||||
} catch (IOException e) {
|
} catch (Exception e) {
|
||||||
throw new SolrException(SolrException.ErrorCode.SERVER_ERROR, "Error closing CloudSolrClient",e);
|
throw new SolrException(SolrException.ErrorCode.SERVER_ERROR, "Error closing CloudSolrClient",e);
|
||||||
} finally {
|
} finally {
|
||||||
if (log.isTraceEnabled()) {
|
if (log.isTraceEnabled()) {
|
||||||
|
|
|
@ -17,6 +17,7 @@
|
||||||
package org.apache.solr.cloud;
|
package org.apache.solr.cloud;
|
||||||
|
|
||||||
|
|
||||||
|
import java.io.IOException;
|
||||||
import java.lang.invoke.MethodHandles;
|
import java.lang.invoke.MethodHandles;
|
||||||
import java.util.ArrayList;
|
import java.util.ArrayList;
|
||||||
import java.util.Collections;
|
import java.util.Collections;
|
||||||
|
@ -27,6 +28,7 @@ import java.util.concurrent.CountDownLatch;
|
||||||
import java.util.concurrent.TimeUnit;
|
import java.util.concurrent.TimeUnit;
|
||||||
|
|
||||||
import com.google.common.collect.ImmutableMap;
|
import com.google.common.collect.ImmutableMap;
|
||||||
|
import org.apache.solr.client.solrj.cloud.autoscaling.AutoScalingConfig;
|
||||||
import org.apache.solr.client.solrj.cloud.autoscaling.Policy;
|
import org.apache.solr.client.solrj.cloud.autoscaling.Policy;
|
||||||
import org.apache.solr.client.solrj.cloud.autoscaling.PolicyHelper;
|
import org.apache.solr.client.solrj.cloud.autoscaling.PolicyHelper;
|
||||||
import org.apache.solr.cloud.OverseerCollectionMessageHandler.Cmd;
|
import org.apache.solr.cloud.OverseerCollectionMessageHandler.Cmd;
|
||||||
|
@ -103,7 +105,7 @@ public class CreateShardCmd implements Cmd {
|
||||||
numPullReplicas);
|
numPullReplicas);
|
||||||
} else {
|
} else {
|
||||||
List<Assign.ReplicaCount> sortedNodeList = getNodesForNewReplicas(clusterState, collectionName, sliceName, totalReplicas,
|
List<Assign.ReplicaCount> sortedNodeList = getNodesForNewReplicas(clusterState, collectionName, sliceName, totalReplicas,
|
||||||
createNodeSetStr, ocmh.overseer.getZkController().getCoreContainer());
|
createNodeSetStr, ocmh.overseer.getClusterDataProvider(), ocmh.overseer.getCoreContainer());
|
||||||
int i = 0;
|
int i = 0;
|
||||||
positions = new ArrayList<>();
|
positions = new ArrayList<>();
|
||||||
for (Map.Entry<Replica.Type, Integer> e : ImmutableMap.of(Replica.Type.NRT, numNrtReplicas,
|
for (Map.Entry<Replica.Type, Integer> e : ImmutableMap.of(Replica.Type.NRT, numNrtReplicas,
|
||||||
|
@ -173,8 +175,8 @@ public class CreateShardCmd implements Cmd {
|
||||||
}
|
}
|
||||||
|
|
||||||
static boolean usePolicyFramework(DocCollection collection, OverseerCollectionMessageHandler ocmh)
|
static boolean usePolicyFramework(DocCollection collection, OverseerCollectionMessageHandler ocmh)
|
||||||
throws KeeperException, InterruptedException {
|
throws IOException, InterruptedException {
|
||||||
Map autoScalingJson = Utils.getJson(ocmh.zkStateReader.getZkClient(), SOLR_AUTOSCALING_CONF_PATH, true);
|
AutoScalingConfig autoScalingConfig = ocmh.overseer.getClusterDataProvider().getAutoScalingConfig();
|
||||||
return autoScalingJson.get(Policy.CLUSTER_POLICY) != null || collection.getPolicyName() != null;
|
return !autoScalingConfig.isEmpty() || collection.getPolicyName() != null;
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
|
@ -26,6 +26,7 @@ import java.util.Map;
|
||||||
import java.util.concurrent.CountDownLatch;
|
import java.util.concurrent.CountDownLatch;
|
||||||
import java.util.concurrent.TimeUnit;
|
import java.util.concurrent.TimeUnit;
|
||||||
|
|
||||||
|
import org.apache.solr.client.solrj.cloud.DistributedQueue;
|
||||||
import org.apache.solr.cloud.OverseerCollectionMessageHandler.Cmd;
|
import org.apache.solr.cloud.OverseerCollectionMessageHandler.Cmd;
|
||||||
import org.apache.solr.cloud.overseer.OverseerAction;
|
import org.apache.solr.cloud.overseer.OverseerAction;
|
||||||
import org.apache.solr.common.SolrException;
|
import org.apache.solr.common.SolrException;
|
||||||
|
|
|
@ -223,7 +223,11 @@ class ShardLeaderElectionContextBase extends ElectionContext {
|
||||||
ZkStateReader.CORE_NAME_PROP,
|
ZkStateReader.CORE_NAME_PROP,
|
||||||
leaderProps.getProperties().get(ZkStateReader.CORE_NAME_PROP),
|
leaderProps.getProperties().get(ZkStateReader.CORE_NAME_PROP),
|
||||||
ZkStateReader.STATE_PROP, Replica.State.ACTIVE.toString());
|
ZkStateReader.STATE_PROP, Replica.State.ACTIVE.toString());
|
||||||
Overseer.getStateUpdateQueue(zkClient).offer(Utils.toJSON(m));
|
try {
|
||||||
|
Overseer.getStateUpdateQueue(zkClient).offer(Utils.toJSON(m));
|
||||||
|
} catch (Exception e) {
|
||||||
|
throw new IOException("Overseer state update queue error", e);
|
||||||
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
public LeaderElector getLeaderElector() {
|
public LeaderElector getLeaderElector() {
|
||||||
|
@ -312,7 +316,11 @@ final class ShardLeaderElectionContext extends ShardLeaderElectionContextBase {
|
||||||
// clear the leader in clusterstate
|
// clear the leader in clusterstate
|
||||||
ZkNodeProps m = new ZkNodeProps(Overseer.QUEUE_OPERATION, OverseerAction.LEADER.toLower(),
|
ZkNodeProps m = new ZkNodeProps(Overseer.QUEUE_OPERATION, OverseerAction.LEADER.toLower(),
|
||||||
ZkStateReader.SHARD_ID_PROP, shardId, ZkStateReader.COLLECTION_PROP, collection);
|
ZkStateReader.SHARD_ID_PROP, shardId, ZkStateReader.COLLECTION_PROP, collection);
|
||||||
Overseer.getStateUpdateQueue(zkClient).offer(Utils.toJSON(m));
|
try {
|
||||||
|
Overseer.getStateUpdateQueue(zkClient).offer(Utils.toJSON(m));
|
||||||
|
} catch (Exception e) {
|
||||||
|
throw new IOException("Overseer state update queue error", e);
|
||||||
|
}
|
||||||
|
|
||||||
boolean allReplicasInLine = false;
|
boolean allReplicasInLine = false;
|
||||||
if (!weAreReplacement) {
|
if (!weAreReplacement) {
|
||||||
|
@ -494,7 +502,7 @@ final class ShardLeaderElectionContext extends ShardLeaderElectionContextBase {
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
public void publishActiveIfRegisteredAndNotActive(SolrCore core) throws KeeperException, InterruptedException {
|
public void publishActiveIfRegisteredAndNotActive(SolrCore core) throws Exception {
|
||||||
if (core.getCoreDescriptor().getCloudDescriptor().hasRegistered()) {
|
if (core.getCoreDescriptor().getCloudDescriptor().hasRegistered()) {
|
||||||
ZkStateReader zkStateReader = zkController.getZkStateReader();
|
ZkStateReader zkStateReader = zkController.getZkStateReader();
|
||||||
zkStateReader.forceUpdateCollection(collection);
|
zkStateReader.forceUpdateCollection(collection);
|
||||||
|
|
|
@ -30,9 +30,15 @@ import java.util.concurrent.atomic.AtomicInteger;
|
||||||
|
|
||||||
import com.codahale.metrics.Timer;
|
import com.codahale.metrics.Timer;
|
||||||
import org.apache.solr.client.solrj.SolrResponse;
|
import org.apache.solr.client.solrj.SolrResponse;
|
||||||
|
import org.apache.solr.client.solrj.cloud.DistributedQueue;
|
||||||
|
import org.apache.solr.client.solrj.cloud.autoscaling.ClusterDataProvider;
|
||||||
|
import org.apache.solr.client.solrj.impl.CloudSolrClient;
|
||||||
|
import org.apache.solr.client.solrj.impl.SolrClientDataProvider;
|
||||||
|
import org.apache.solr.client.solrj.impl.ZkClientClusterStateProvider;
|
||||||
import org.apache.solr.cloud.autoscaling.AutoScaling;
|
import org.apache.solr.cloud.autoscaling.AutoScaling;
|
||||||
import org.apache.solr.cloud.autoscaling.AutoScalingHandler;
|
import org.apache.solr.cloud.autoscaling.AutoScalingHandler;
|
||||||
import org.apache.solr.cloud.autoscaling.OverseerTriggerThread;
|
import org.apache.solr.cloud.autoscaling.OverseerTriggerThread;
|
||||||
|
import org.apache.solr.cloud.autoscaling.ZkDistributedQueueFactory;
|
||||||
import org.apache.solr.cloud.overseer.ClusterStateMutator;
|
import org.apache.solr.cloud.overseer.ClusterStateMutator;
|
||||||
import org.apache.solr.cloud.overseer.CollectionMutator;
|
import org.apache.solr.cloud.overseer.CollectionMutator;
|
||||||
import org.apache.solr.cloud.overseer.NodeMutator;
|
import org.apache.solr.cloud.overseer.NodeMutator;
|
||||||
|
@ -53,6 +59,7 @@ import org.apache.solr.common.util.IOUtils;
|
||||||
import org.apache.solr.common.util.ObjectReleaseTracker;
|
import org.apache.solr.common.util.ObjectReleaseTracker;
|
||||||
import org.apache.solr.common.util.Utils;
|
import org.apache.solr.common.util.Utils;
|
||||||
import org.apache.solr.core.CloudConfig;
|
import org.apache.solr.core.CloudConfig;
|
||||||
|
import org.apache.solr.core.CoreContainer;
|
||||||
import org.apache.solr.handler.admin.CollectionsHandler;
|
import org.apache.solr.handler.admin.CollectionsHandler;
|
||||||
import org.apache.solr.handler.component.ShardHandler;
|
import org.apache.solr.handler.component.ShardHandler;
|
||||||
import org.apache.solr.request.LocalSolrQueryRequest;
|
import org.apache.solr.request.LocalSolrQueryRequest;
|
||||||
|
@ -88,10 +95,10 @@ public class Overseer implements Closeable {
|
||||||
private final SolrZkClient zkClient;
|
private final SolrZkClient zkClient;
|
||||||
private final String myId;
|
private final String myId;
|
||||||
//queue where everybody can throw tasks
|
//queue where everybody can throw tasks
|
||||||
private final DistributedQueue stateUpdateQueue;
|
private final ZkDistributedQueue stateUpdateQueue;
|
||||||
//Internal queue where overseer stores events that have not yet been published into cloudstate
|
//Internal queue where overseer stores events that have not yet been published into cloudstate
|
||||||
//If Overseer dies while extracting the main queue a new overseer will start from this queue
|
//If Overseer dies while extracting the main queue a new overseer will start from this queue
|
||||||
private final DistributedQueue workQueue;
|
private final ZkDistributedQueue workQueue;
|
||||||
// Internal map which holds the information about running tasks.
|
// Internal map which holds the information about running tasks.
|
||||||
private final DistributedMap runningMap;
|
private final DistributedMap runningMap;
|
||||||
// Internal map which holds the information about successfully completed tasks.
|
// Internal map which holds the information about successfully completed tasks.
|
||||||
|
@ -538,7 +545,8 @@ public class Overseer implements Closeable {
|
||||||
autoscalingTriggerCreator.start();
|
autoscalingTriggerCreator.start();
|
||||||
|
|
||||||
ThreadGroup triggerThreadGroup = new ThreadGroup("Overseer autoscaling triggers");
|
ThreadGroup triggerThreadGroup = new ThreadGroup("Overseer autoscaling triggers");
|
||||||
OverseerTriggerThread trigger = new OverseerTriggerThread(zkController);
|
OverseerTriggerThread trigger = new OverseerTriggerThread(zkController.getCoreContainer().getResourceLoader(),
|
||||||
|
zkController.getClusterDataProvider());
|
||||||
triggerThread = new OverseerThread(triggerThreadGroup, trigger, "OverseerAutoScalingTriggerThread-" + id);
|
triggerThread = new OverseerThread(triggerThreadGroup, trigger, "OverseerAutoScalingTriggerThread-" + id);
|
||||||
|
|
||||||
updaterThread.start();
|
updaterThread.start();
|
||||||
|
@ -554,7 +562,15 @@ public class Overseer implements Closeable {
|
||||||
ZkController getZkController(){
|
ZkController getZkController(){
|
||||||
return zkController;
|
return zkController;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
public CoreContainer getCoreContainer() {
|
||||||
|
return zkController.getCoreContainer();
|
||||||
|
}
|
||||||
|
|
||||||
|
public ClusterDataProvider getClusterDataProvider() {
|
||||||
|
return zkController.getClusterDataProvider();
|
||||||
|
}
|
||||||
|
|
||||||
/**
|
/**
|
||||||
* For tests.
|
* For tests.
|
||||||
*
|
*
|
||||||
|
@ -679,7 +695,7 @@ public class Overseer implements Closeable {
|
||||||
* This method will create the /overseer znode in ZooKeeper if it does not exist already.
|
* This method will create the /overseer znode in ZooKeeper if it does not exist already.
|
||||||
*
|
*
|
||||||
* @param zkClient the {@link SolrZkClient} to be used for reading/writing to the queue
|
* @param zkClient the {@link SolrZkClient} to be used for reading/writing to the queue
|
||||||
* @return a {@link DistributedQueue} object
|
* @return a {@link ZkDistributedQueue} object
|
||||||
*/
|
*/
|
||||||
public static DistributedQueue getStateUpdateQueue(final SolrZkClient zkClient) {
|
public static DistributedQueue getStateUpdateQueue(final SolrZkClient zkClient) {
|
||||||
return getStateUpdateQueue(zkClient, new Stats());
|
return getStateUpdateQueue(zkClient, new Stats());
|
||||||
|
@ -692,11 +708,11 @@ public class Overseer implements Closeable {
|
||||||
*
|
*
|
||||||
* @param zkClient the {@link SolrZkClient} to be used for reading/writing to the queue
|
* @param zkClient the {@link SolrZkClient} to be used for reading/writing to the queue
|
||||||
* @param zkStats a {@link Overseer.Stats} object which tracks statistics for all zookeeper operations performed by this queue
|
* @param zkStats a {@link Overseer.Stats} object which tracks statistics for all zookeeper operations performed by this queue
|
||||||
* @return a {@link DistributedQueue} object
|
* @return a {@link ZkDistributedQueue} object
|
||||||
*/
|
*/
|
||||||
static DistributedQueue getStateUpdateQueue(final SolrZkClient zkClient, Stats zkStats) {
|
static ZkDistributedQueue getStateUpdateQueue(final SolrZkClient zkClient, Stats zkStats) {
|
||||||
createOverseerNode(zkClient);
|
createOverseerNode(zkClient);
|
||||||
return new DistributedQueue(zkClient, "/overseer/queue", zkStats);
|
return new ZkDistributedQueue(zkClient, "/overseer/queue", zkStats);
|
||||||
}
|
}
|
||||||
|
|
||||||
/**
|
/**
|
||||||
|
@ -712,11 +728,11 @@ public class Overseer implements Closeable {
|
||||||
*
|
*
|
||||||
* @param zkClient the {@link SolrZkClient} to be used for reading/writing to the queue
|
* @param zkClient the {@link SolrZkClient} to be used for reading/writing to the queue
|
||||||
* @param zkStats a {@link Overseer.Stats} object which tracks statistics for all zookeeper operations performed by this queue
|
* @param zkStats a {@link Overseer.Stats} object which tracks statistics for all zookeeper operations performed by this queue
|
||||||
* @return a {@link DistributedQueue} object
|
* @return a {@link ZkDistributedQueue} object
|
||||||
*/
|
*/
|
||||||
static DistributedQueue getInternalWorkQueue(final SolrZkClient zkClient, Stats zkStats) {
|
static ZkDistributedQueue getInternalWorkQueue(final SolrZkClient zkClient, Stats zkStats) {
|
||||||
createOverseerNode(zkClient);
|
createOverseerNode(zkClient);
|
||||||
return new DistributedQueue(zkClient, "/overseer/queue-work", zkStats);
|
return new ZkDistributedQueue(zkClient, "/overseer/queue-work", zkStats);
|
||||||
}
|
}
|
||||||
|
|
||||||
/* Internal map for failed tasks, not to be used outside of the Overseer */
|
/* Internal map for failed tasks, not to be used outside of the Overseer */
|
||||||
|
@ -750,7 +766,7 @@ public class Overseer implements Closeable {
|
||||||
* see {@link org.apache.solr.common.params.CollectionParams.CollectionAction#OVERSEERSTATUS}.
|
* see {@link org.apache.solr.common.params.CollectionParams.CollectionAction#OVERSEERSTATUS}.
|
||||||
*
|
*
|
||||||
* @param zkClient the {@link SolrZkClient} to be used for reading/writing to the queue
|
* @param zkClient the {@link SolrZkClient} to be used for reading/writing to the queue
|
||||||
* @return a {@link DistributedQueue} object
|
* @return a {@link ZkDistributedQueue} object
|
||||||
*/
|
*/
|
||||||
static OverseerTaskQueue getCollectionQueue(final SolrZkClient zkClient) {
|
static OverseerTaskQueue getCollectionQueue(final SolrZkClient zkClient) {
|
||||||
return getCollectionQueue(zkClient, new Stats());
|
return getCollectionQueue(zkClient, new Stats());
|
||||||
|
@ -768,7 +784,7 @@ public class Overseer implements Closeable {
|
||||||
* see {@link org.apache.solr.common.params.CollectionParams.CollectionAction#OVERSEERSTATUS}.
|
* see {@link org.apache.solr.common.params.CollectionParams.CollectionAction#OVERSEERSTATUS}.
|
||||||
*
|
*
|
||||||
* @param zkClient the {@link SolrZkClient} to be used for reading/writing to the queue
|
* @param zkClient the {@link SolrZkClient} to be used for reading/writing to the queue
|
||||||
* @return a {@link DistributedQueue} object
|
* @return a {@link ZkDistributedQueue} object
|
||||||
*/
|
*/
|
||||||
static OverseerTaskQueue getCollectionQueue(final SolrZkClient zkClient, Stats zkStats) {
|
static OverseerTaskQueue getCollectionQueue(final SolrZkClient zkClient, Stats zkStats) {
|
||||||
createOverseerNode(zkClient);
|
createOverseerNode(zkClient);
|
||||||
|
@ -788,7 +804,7 @@ public class Overseer implements Closeable {
|
||||||
* see {@link org.apache.solr.common.params.CollectionParams.CollectionAction#OVERSEERSTATUS}.
|
* see {@link org.apache.solr.common.params.CollectionParams.CollectionAction#OVERSEERSTATUS}.
|
||||||
*
|
*
|
||||||
* @param zkClient the {@link SolrZkClient} to be used for reading/writing to the queue
|
* @param zkClient the {@link SolrZkClient} to be used for reading/writing to the queue
|
||||||
* @return a {@link DistributedQueue} object
|
* @return a {@link ZkDistributedQueue} object
|
||||||
*/
|
*/
|
||||||
static OverseerTaskQueue getConfigSetQueue(final SolrZkClient zkClient) {
|
static OverseerTaskQueue getConfigSetQueue(final SolrZkClient zkClient) {
|
||||||
return getConfigSetQueue(zkClient, new Stats());
|
return getConfigSetQueue(zkClient, new Stats());
|
||||||
|
@ -811,7 +827,7 @@ public class Overseer implements Closeable {
|
||||||
* {@link OverseerConfigSetMessageHandler}.
|
* {@link OverseerConfigSetMessageHandler}.
|
||||||
*
|
*
|
||||||
* @param zkClient the {@link SolrZkClient} to be used for reading/writing to the queue
|
* @param zkClient the {@link SolrZkClient} to be used for reading/writing to the queue
|
||||||
* @return a {@link DistributedQueue} object
|
* @return a {@link ZkDistributedQueue} object
|
||||||
*/
|
*/
|
||||||
static OverseerTaskQueue getConfigSetQueue(final SolrZkClient zkClient, Stats zkStats) {
|
static OverseerTaskQueue getConfigSetQueue(final SolrZkClient zkClient, Stats zkStats) {
|
||||||
// For now, we use the same queue as the collection queue, but ensure
|
// For now, we use the same queue as the collection queue, but ensure
|
||||||
|
|
|
@ -36,6 +36,7 @@ import com.google.common.collect.ImmutableMap;
|
||||||
import org.apache.commons.lang.StringUtils;
|
import org.apache.commons.lang.StringUtils;
|
||||||
import org.apache.solr.client.solrj.SolrResponse;
|
import org.apache.solr.client.solrj.SolrResponse;
|
||||||
import org.apache.solr.client.solrj.SolrServerException;
|
import org.apache.solr.client.solrj.SolrServerException;
|
||||||
|
import org.apache.solr.client.solrj.cloud.DistributedQueue;
|
||||||
import org.apache.solr.client.solrj.cloud.autoscaling.PolicyHelper;
|
import org.apache.solr.client.solrj.cloud.autoscaling.PolicyHelper;
|
||||||
import org.apache.solr.client.solrj.impl.HttpSolrClient;
|
import org.apache.solr.client.solrj.impl.HttpSolrClient;
|
||||||
import org.apache.solr.client.solrj.impl.HttpSolrClient.RemoteSolrException;
|
import org.apache.solr.client.solrj.impl.HttpSolrClient.RemoteSolrException;
|
||||||
|
@ -321,7 +322,7 @@ public class OverseerCollectionMessageHandler implements OverseerMessageHandler
|
||||||
}
|
}
|
||||||
|
|
||||||
private void processReplicaDeletePropertyCommand(ClusterState clusterState, ZkNodeProps message, NamedList results)
|
private void processReplicaDeletePropertyCommand(ClusterState clusterState, ZkNodeProps message, NamedList results)
|
||||||
throws KeeperException, InterruptedException {
|
throws Exception {
|
||||||
checkRequired(message, COLLECTION_PROP, SHARD_ID_PROP, REPLICA_PROP, PROPERTY_PROP);
|
checkRequired(message, COLLECTION_PROP, SHARD_ID_PROP, REPLICA_PROP, PROPERTY_PROP);
|
||||||
SolrZkClient zkClient = zkStateReader.getZkClient();
|
SolrZkClient zkClient = zkStateReader.getZkClient();
|
||||||
DistributedQueue inQueue = Overseer.getStateUpdateQueue(zkClient);
|
DistributedQueue inQueue = Overseer.getStateUpdateQueue(zkClient);
|
||||||
|
@ -332,7 +333,7 @@ public class OverseerCollectionMessageHandler implements OverseerMessageHandler
|
||||||
inQueue.offer(Utils.toJSON(m));
|
inQueue.offer(Utils.toJSON(m));
|
||||||
}
|
}
|
||||||
|
|
||||||
private void balanceProperty(ClusterState clusterState, ZkNodeProps message, NamedList results) throws KeeperException, InterruptedException {
|
private void balanceProperty(ClusterState clusterState, ZkNodeProps message, NamedList results) throws Exception {
|
||||||
if (StringUtils.isBlank(message.getStr(COLLECTION_PROP)) || StringUtils.isBlank(message.getStr(PROPERTY_PROP))) {
|
if (StringUtils.isBlank(message.getStr(COLLECTION_PROP)) || StringUtils.isBlank(message.getStr(PROPERTY_PROP))) {
|
||||||
throw new SolrException(ErrorCode.BAD_REQUEST,
|
throw new SolrException(ErrorCode.BAD_REQUEST,
|
||||||
"The '" + COLLECTION_PROP + "' and '" + PROPERTY_PROP +
|
"The '" + COLLECTION_PROP + "' and '" + PROPERTY_PROP +
|
||||||
|
@ -441,7 +442,7 @@ public class OverseerCollectionMessageHandler implements OverseerMessageHandler
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
void deleteCoreNode(String collectionName, String replicaName, Replica replica, String core) throws KeeperException, InterruptedException {
|
void deleteCoreNode(String collectionName, String replicaName, Replica replica, String core) throws Exception {
|
||||||
ZkNodeProps m = new ZkNodeProps(
|
ZkNodeProps m = new ZkNodeProps(
|
||||||
Overseer.QUEUE_OPERATION, OverseerAction.DELETECORE.toLower(),
|
Overseer.QUEUE_OPERATION, OverseerAction.DELETECORE.toLower(),
|
||||||
ZkStateReader.CORE_NAME_PROP, core,
|
ZkStateReader.CORE_NAME_PROP, core,
|
||||||
|
@ -462,8 +463,7 @@ public class OverseerCollectionMessageHandler implements OverseerMessageHandler
|
||||||
}
|
}
|
||||||
|
|
||||||
//TODO should we not remove in the next release ?
|
//TODO should we not remove in the next release ?
|
||||||
private void migrateStateFormat(ClusterState state, ZkNodeProps message, NamedList results)
|
private void migrateStateFormat(ClusterState state, ZkNodeProps message, NamedList results) throws Exception {
|
||||||
throws KeeperException, InterruptedException {
|
|
||||||
final String collectionName = message.getStr(COLLECTION_PROP);
|
final String collectionName = message.getStr(COLLECTION_PROP);
|
||||||
|
|
||||||
boolean firstLoop = true;
|
boolean firstLoop = true;
|
||||||
|
@ -634,7 +634,7 @@ public class OverseerCollectionMessageHandler implements OverseerMessageHandler
|
||||||
|
|
||||||
|
|
||||||
private void modifyCollection(ClusterState clusterState, ZkNodeProps message, NamedList results)
|
private void modifyCollection(ClusterState clusterState, ZkNodeProps message, NamedList results)
|
||||||
throws KeeperException, InterruptedException {
|
throws Exception {
|
||||||
|
|
||||||
final String collectionName = message.getStr(ZkStateReader.COLLECTION_PROP);
|
final String collectionName = message.getStr(ZkStateReader.COLLECTION_PROP);
|
||||||
//the rest of the processing is based on writing cluster state properties
|
//the rest of the processing is based on writing cluster state properties
|
||||||
|
@ -712,7 +712,7 @@ public class OverseerCollectionMessageHandler implements OverseerMessageHandler
|
||||||
}
|
}
|
||||||
|
|
||||||
ZkNodeProps addReplica(ClusterState clusterState, ZkNodeProps message, NamedList results, Runnable onComplete)
|
ZkNodeProps addReplica(ClusterState clusterState, ZkNodeProps message, NamedList results, Runnable onComplete)
|
||||||
throws KeeperException, InterruptedException {
|
throws Exception {
|
||||||
|
|
||||||
return ((AddReplicaCmd) commandMap.get(ADDREPLICA)).addReplica(clusterState, message, results, onComplete);
|
return ((AddReplicaCmd) commandMap.get(ADDREPLICA)).addReplica(clusterState, message, results, onComplete);
|
||||||
}
|
}
|
||||||
|
|
|
@ -56,7 +56,7 @@ public class OverseerNodePrioritizer {
|
||||||
this.shardHandlerFactory = shardHandlerFactory;
|
this.shardHandlerFactory = shardHandlerFactory;
|
||||||
}
|
}
|
||||||
|
|
||||||
public synchronized void prioritizeOverseerNodes(String overseerId) throws KeeperException, InterruptedException {
|
public synchronized void prioritizeOverseerNodes(String overseerId) throws Exception {
|
||||||
SolrZkClient zk = zkStateReader.getZkClient();
|
SolrZkClient zk = zkStateReader.getZkClient();
|
||||||
if(!zk.exists(ZkStateReader.ROLES,true))return;
|
if(!zk.exists(ZkStateReader.ROLES,true))return;
|
||||||
Map m = (Map) Utils.fromJSON(zk.getData(ZkStateReader.ROLES, null, new Stat(), true));
|
Map m = (Map) Utils.fromJSON(zk.getData(ZkStateReader.ROLES, null, new Stat(), true));
|
||||||
|
|
|
@ -35,11 +35,11 @@ import org.slf4j.Logger;
|
||||||
import org.slf4j.LoggerFactory;
|
import org.slf4j.LoggerFactory;
|
||||||
|
|
||||||
/**
|
/**
|
||||||
* A {@link DistributedQueue} augmented with helper methods specific to the overseer task queues.
|
* A {@link ZkDistributedQueue} augmented with helper methods specific to the overseer task queues.
|
||||||
* Methods specific to this subclass ignore superclass internal state and hit ZK directly.
|
* Methods specific to this subclass ignore superclass internal state and hit ZK directly.
|
||||||
* This is inefficient! But the API on this class is kind of muddy..
|
* This is inefficient! But the API on this class is kind of muddy..
|
||||||
*/
|
*/
|
||||||
public class OverseerTaskQueue extends DistributedQueue {
|
public class OverseerTaskQueue extends ZkDistributedQueue {
|
||||||
private static final Logger LOG = LoggerFactory.getLogger(MethodHandles.lookup().lookupClass());
|
private static final Logger LOG = LoggerFactory.getLogger(MethodHandles.lookup().lookupClass());
|
||||||
|
|
||||||
private static final String RESPONSE_PREFIX = "qnr-" ;
|
private static final String RESPONSE_PREFIX = "qnr-" ;
|
||||||
|
|
|
@ -174,7 +174,7 @@ public class RecoveryStrategy implements Runnable, Closeable {
|
||||||
|
|
||||||
final private void recoveryFailed(final SolrCore core,
|
final private void recoveryFailed(final SolrCore core,
|
||||||
final ZkController zkController, final String baseUrl,
|
final ZkController zkController, final String baseUrl,
|
||||||
final String shardZkNodeName, final CoreDescriptor cd) throws KeeperException, InterruptedException {
|
final String shardZkNodeName, final CoreDescriptor cd) throws Exception {
|
||||||
SolrException.log(LOG, "Recovery failed - I give up.");
|
SolrException.log(LOG, "Recovery failed - I give up.");
|
||||||
try {
|
try {
|
||||||
zkController.publish(cd, Replica.State.RECOVERY_FAILED);
|
zkController.publish(cd, Replica.State.RECOVERY_FAILED);
|
||||||
|
@ -297,7 +297,7 @@ public class RecoveryStrategy implements Runnable, Closeable {
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
final public void doRecovery(SolrCore core) throws KeeperException, InterruptedException {
|
final public void doRecovery(SolrCore core) throws Exception {
|
||||||
if (core.getCoreDescriptor().getCloudDescriptor().requiresTransactionLog()) {
|
if (core.getCoreDescriptor().getCloudDescriptor().requiresTransactionLog()) {
|
||||||
doSyncOrReplicateRecovery(core);
|
doSyncOrReplicateRecovery(core);
|
||||||
} else {
|
} else {
|
||||||
|
@ -440,7 +440,7 @@ public class RecoveryStrategy implements Runnable, Closeable {
|
||||||
}
|
}
|
||||||
|
|
||||||
// TODO: perhaps make this grab a new core each time through the loop to handle core reloads?
|
// TODO: perhaps make this grab a new core each time through the loop to handle core reloads?
|
||||||
final public void doSyncOrReplicateRecovery(SolrCore core) throws KeeperException, InterruptedException {
|
final public void doSyncOrReplicateRecovery(SolrCore core) throws Exception {
|
||||||
boolean replayed = false;
|
boolean replayed = false;
|
||||||
boolean successfulRecovery = false;
|
boolean successfulRecovery = false;
|
||||||
|
|
||||||
|
|
|
@ -32,8 +32,8 @@ import java.util.Objects;
|
||||||
import java.util.Optional;
|
import java.util.Optional;
|
||||||
import java.util.Properties;
|
import java.util.Properties;
|
||||||
import java.util.Set;
|
import java.util.Set;
|
||||||
import java.util.concurrent.atomic.AtomicReference;
|
|
||||||
|
|
||||||
|
import org.apache.solr.client.solrj.cloud.DistributedQueue;
|
||||||
import org.apache.solr.client.solrj.cloud.autoscaling.PolicyHelper;
|
import org.apache.solr.client.solrj.cloud.autoscaling.PolicyHelper;
|
||||||
import org.apache.solr.cloud.overseer.OverseerAction;
|
import org.apache.solr.cloud.overseer.OverseerAction;
|
||||||
import org.apache.solr.common.cloud.ReplicaPosition;
|
import org.apache.solr.common.cloud.ReplicaPosition;
|
||||||
|
|
|
@ -27,6 +27,7 @@ import java.util.List;
|
||||||
import java.util.Map;
|
import java.util.Map;
|
||||||
import java.util.Set;
|
import java.util.Set;
|
||||||
|
|
||||||
|
import org.apache.solr.client.solrj.cloud.DistributedQueue;
|
||||||
import org.apache.solr.client.solrj.cloud.autoscaling.PolicyHelper;
|
import org.apache.solr.client.solrj.cloud.autoscaling.PolicyHelper;
|
||||||
import org.apache.solr.client.solrj.request.CoreAdminRequest;
|
import org.apache.solr.client.solrj.request.CoreAdminRequest;
|
||||||
import org.apache.solr.cloud.OverseerCollectionMessageHandler.Cmd;
|
import org.apache.solr.cloud.OverseerCollectionMessageHandler.Cmd;
|
||||||
|
|
|
@ -51,10 +51,16 @@ import java.util.concurrent.atomic.AtomicReference;
|
||||||
|
|
||||||
import com.google.common.base.Strings;
|
import com.google.common.base.Strings;
|
||||||
import org.apache.commons.lang.StringUtils;
|
import org.apache.commons.lang.StringUtils;
|
||||||
|
import org.apache.solr.client.solrj.cloud.DistributedQueue;
|
||||||
|
import org.apache.solr.client.solrj.cloud.autoscaling.ClusterDataProvider;
|
||||||
|
import org.apache.solr.client.solrj.impl.CloudSolrClient;
|
||||||
import org.apache.solr.client.solrj.impl.HttpSolrClient;
|
import org.apache.solr.client.solrj.impl.HttpSolrClient;
|
||||||
import org.apache.solr.client.solrj.impl.HttpSolrClient.Builder;
|
import org.apache.solr.client.solrj.impl.HttpSolrClient.Builder;
|
||||||
|
import org.apache.solr.client.solrj.impl.SolrClientDataProvider;
|
||||||
|
import org.apache.solr.client.solrj.impl.ZkClientClusterStateProvider;
|
||||||
import org.apache.solr.client.solrj.request.CoreAdminRequest.WaitForState;
|
import org.apache.solr.client.solrj.request.CoreAdminRequest.WaitForState;
|
||||||
import org.apache.solr.client.solrj.cloud.autoscaling.TriggerEventType;
|
import org.apache.solr.client.solrj.cloud.autoscaling.TriggerEventType;
|
||||||
|
import org.apache.solr.cloud.autoscaling.ZkDistributedQueueFactory;
|
||||||
import org.apache.solr.cloud.overseer.OverseerAction;
|
import org.apache.solr.cloud.overseer.OverseerAction;
|
||||||
import org.apache.solr.cloud.overseer.SliceMutator;
|
import org.apache.solr.cloud.overseer.SliceMutator;
|
||||||
import org.apache.solr.common.SolrException;
|
import org.apache.solr.common.SolrException;
|
||||||
|
@ -191,6 +197,8 @@ public class ZkController {
|
||||||
private final SolrZkClient zkClient;
|
private final SolrZkClient zkClient;
|
||||||
private final ZkCmdExecutor cmdExecutor;
|
private final ZkCmdExecutor cmdExecutor;
|
||||||
public final ZkStateReader zkStateReader;
|
public final ZkStateReader zkStateReader;
|
||||||
|
private ClusterDataProvider clusterDataProvider;
|
||||||
|
private CloudSolrClient cloudSolrClient;
|
||||||
|
|
||||||
private final String zkServerAddress; // example: 127.0.0.1:54062/solr
|
private final String zkServerAddress; // example: 127.0.0.1:54062/solr
|
||||||
|
|
||||||
|
@ -435,7 +443,7 @@ public class ZkController {
|
||||||
});
|
});
|
||||||
|
|
||||||
init(registerOnReconnect);
|
init(registerOnReconnect);
|
||||||
|
|
||||||
assert ObjectReleaseTracker.track(this);
|
assert ObjectReleaseTracker.track(this);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@ -554,6 +562,12 @@ public class ZkController {
|
||||||
IOUtils.closeQuietly(overseerElector.getContext());
|
IOUtils.closeQuietly(overseerElector.getContext());
|
||||||
IOUtils.closeQuietly(overseer);
|
IOUtils.closeQuietly(overseer);
|
||||||
} finally {
|
} finally {
|
||||||
|
if (cloudSolrClient != null) {
|
||||||
|
IOUtils.closeQuietly(cloudSolrClient);
|
||||||
|
}
|
||||||
|
if (clusterDataProvider != null) {
|
||||||
|
IOUtils.closeQuietly(clusterDataProvider);
|
||||||
|
}
|
||||||
try {
|
try {
|
||||||
try {
|
try {
|
||||||
zkStateReader.close();
|
zkStateReader.close();
|
||||||
|
@ -588,6 +602,22 @@ public class ZkController {
|
||||||
return zkStateReader.getClusterState();
|
return zkStateReader.getClusterState();
|
||||||
}
|
}
|
||||||
|
|
||||||
|
public ClusterDataProvider getClusterDataProvider() {
|
||||||
|
if (clusterDataProvider != null) {
|
||||||
|
return clusterDataProvider;
|
||||||
|
}
|
||||||
|
synchronized(this) {
|
||||||
|
if (clusterDataProvider != null) {
|
||||||
|
return clusterDataProvider;
|
||||||
|
}
|
||||||
|
cloudSolrClient = new CloudSolrClient.Builder()
|
||||||
|
.withClusterStateProvider(new ZkClientClusterStateProvider(zkStateReader))
|
||||||
|
.build();
|
||||||
|
clusterDataProvider = new SolrClientDataProvider(new ZkDistributedQueueFactory(zkClient), cloudSolrClient);
|
||||||
|
}
|
||||||
|
return clusterDataProvider;
|
||||||
|
}
|
||||||
|
|
||||||
/**
|
/**
|
||||||
* Returns config file data (in bytes)
|
* Returns config file data (in bytes)
|
||||||
*/
|
*/
|
||||||
|
@ -1290,18 +1320,18 @@ public class ZkController {
|
||||||
return baseURL;
|
return baseURL;
|
||||||
}
|
}
|
||||||
|
|
||||||
public void publish(final CoreDescriptor cd, final Replica.State state) throws KeeperException, InterruptedException {
|
public void publish(final CoreDescriptor cd, final Replica.State state) throws Exception {
|
||||||
publish(cd, state, true);
|
publish(cd, state, true);
|
||||||
}
|
}
|
||||||
|
|
||||||
public void publish(final CoreDescriptor cd, final Replica.State state, boolean updateLastState) throws KeeperException, InterruptedException {
|
public void publish(final CoreDescriptor cd, final Replica.State state, boolean updateLastState) throws Exception {
|
||||||
publish(cd, state, updateLastState, false);
|
publish(cd, state, updateLastState, false);
|
||||||
}
|
}
|
||||||
|
|
||||||
/**
|
/**
|
||||||
* Publish core state to overseer.
|
* Publish core state to overseer.
|
||||||
*/
|
*/
|
||||||
public void publish(final CoreDescriptor cd, final Replica.State state, boolean updateLastState, boolean forcePublish) throws KeeperException, InterruptedException {
|
public void publish(final CoreDescriptor cd, final Replica.State state, boolean updateLastState, boolean forcePublish) throws Exception {
|
||||||
if (!forcePublish) {
|
if (!forcePublish) {
|
||||||
try (SolrCore core = cc.getCore(cd.getName())) {
|
try (SolrCore core = cc.getCore(cd.getName())) {
|
||||||
if (core == null || core.isClosed()) {
|
if (core == null || core.isClosed()) {
|
||||||
|
@ -1410,7 +1440,7 @@ public class ZkController {
|
||||||
return true;
|
return true;
|
||||||
}
|
}
|
||||||
|
|
||||||
public void unregister(String coreName, CoreDescriptor cd) throws InterruptedException, KeeperException {
|
public void unregister(String coreName, CoreDescriptor cd) throws Exception {
|
||||||
final String coreNodeName = cd.getCloudDescriptor().getCoreNodeName();
|
final String coreNodeName = cd.getCloudDescriptor().getCoreNodeName();
|
||||||
final String collection = cd.getCloudDescriptor().getCollectionName();
|
final String collection = cd.getCloudDescriptor().getCollectionName();
|
||||||
|
|
||||||
|
@ -1441,8 +1471,7 @@ public class ZkController {
|
||||||
overseerJobQueue.offer(Utils.toJSON(m));
|
overseerJobQueue.offer(Utils.toJSON(m));
|
||||||
}
|
}
|
||||||
|
|
||||||
public void createCollection(String collection) throws KeeperException,
|
public void createCollection(String collection) throws Exception {
|
||||||
InterruptedException {
|
|
||||||
ZkNodeProps m = new ZkNodeProps(Overseer.QUEUE_OPERATION,
|
ZkNodeProps m = new ZkNodeProps(Overseer.QUEUE_OPERATION,
|
||||||
CollectionParams.CollectionAction.CREATE.toLower(), ZkStateReader.NODE_NAME_PROP, getNodeName(),
|
CollectionParams.CollectionAction.CREATE.toLower(), ZkStateReader.NODE_NAME_PROP, getNodeName(),
|
||||||
ZkStateReader.COLLECTION_PROP, collection);
|
ZkStateReader.COLLECTION_PROP, collection);
|
||||||
|
@ -1567,6 +1596,9 @@ public class ZkController {
|
||||||
Thread.currentThread().interrupt();
|
Thread.currentThread().interrupt();
|
||||||
log.error("", e);
|
log.error("", e);
|
||||||
throw new ZooKeeperException(SolrException.ErrorCode.SERVER_ERROR, "", e);
|
throw new ZooKeeperException(SolrException.ErrorCode.SERVER_ERROR, "", e);
|
||||||
|
} catch (Exception e) {
|
||||||
|
log.error("", e);
|
||||||
|
throw new SolrException(SolrException.ErrorCode.SERVER_ERROR, "", e);
|
||||||
}
|
}
|
||||||
|
|
||||||
if (cd.getCloudDescriptor().getShardId() == null && needsToBeAssignedShardId(cd, zkStateReader.getClusterState(), coreNodeName)) {
|
if (cd.getCloudDescriptor().getShardId() == null && needsToBeAssignedShardId(cd, zkStateReader.getClusterState(), coreNodeName)) {
|
||||||
|
|
|
@ -30,6 +30,7 @@ import java.util.function.Predicate;
|
||||||
import com.codahale.metrics.Timer;
|
import com.codahale.metrics.Timer;
|
||||||
import com.google.common.annotations.VisibleForTesting;
|
import com.google.common.annotations.VisibleForTesting;
|
||||||
import com.google.common.base.Preconditions;
|
import com.google.common.base.Preconditions;
|
||||||
|
import org.apache.solr.client.solrj.cloud.DistributedQueue;
|
||||||
import org.apache.solr.common.SolrException;
|
import org.apache.solr.common.SolrException;
|
||||||
import org.apache.solr.common.SolrException.ErrorCode;
|
import org.apache.solr.common.SolrException.ErrorCode;
|
||||||
import org.apache.solr.common.cloud.SolrZkClient;
|
import org.apache.solr.common.cloud.SolrZkClient;
|
||||||
|
@ -43,11 +44,11 @@ import org.slf4j.Logger;
|
||||||
import org.slf4j.LoggerFactory;
|
import org.slf4j.LoggerFactory;
|
||||||
|
|
||||||
/**
|
/**
|
||||||
* A distributed queue. Optimized for single-consumer,
|
* A ZK-based distributed queue. Optimized for single-consumer,
|
||||||
* multiple-producer: if there are multiple consumers on the same ZK queue,
|
* multiple-producer: if there are multiple consumers on the same ZK queue,
|
||||||
* the results should be correct but inefficient
|
* the results should be correct but inefficient
|
||||||
*/
|
*/
|
||||||
public class DistributedQueue {
|
public class ZkDistributedQueue implements DistributedQueue {
|
||||||
private static final Logger LOG = LoggerFactory.getLogger(MethodHandles.lookup().lookupClass());
|
private static final Logger LOG = LoggerFactory.getLogger(MethodHandles.lookup().lookupClass());
|
||||||
|
|
||||||
static final String PREFIX = "qn-";
|
static final String PREFIX = "qn-";
|
||||||
|
@ -92,11 +93,11 @@ public class DistributedQueue {
|
||||||
|
|
||||||
private int watcherCount = 0;
|
private int watcherCount = 0;
|
||||||
|
|
||||||
public DistributedQueue(SolrZkClient zookeeper, String dir) {
|
public ZkDistributedQueue(SolrZkClient zookeeper, String dir) {
|
||||||
this(zookeeper, dir, new Overseer.Stats());
|
this(zookeeper, dir, new Overseer.Stats());
|
||||||
}
|
}
|
||||||
|
|
||||||
public DistributedQueue(SolrZkClient zookeeper, String dir, Overseer.Stats stats) {
|
public ZkDistributedQueue(SolrZkClient zookeeper, String dir, Overseer.Stats stats) {
|
||||||
this.dir = dir;
|
this.dir = dir;
|
||||||
|
|
||||||
ZkCmdExecutor cmdExecutor = new ZkCmdExecutor(zookeeper.getZkClientTimeout());
|
ZkCmdExecutor cmdExecutor = new ZkCmdExecutor(zookeeper.getZkClientTimeout());
|
||||||
|
@ -119,6 +120,7 @@ public class DistributedQueue {
|
||||||
*
|
*
|
||||||
* @return data at the first element of the queue, or null.
|
* @return data at the first element of the queue, or null.
|
||||||
*/
|
*/
|
||||||
|
@Override
|
||||||
public byte[] peek() throws KeeperException, InterruptedException {
|
public byte[] peek() throws KeeperException, InterruptedException {
|
||||||
Timer.Context time = stats.time(dir + "_peek");
|
Timer.Context time = stats.time(dir + "_peek");
|
||||||
try {
|
try {
|
||||||
|
@ -135,6 +137,7 @@ public class DistributedQueue {
|
||||||
* @param block if true, blocks until an element enters the queue
|
* @param block if true, blocks until an element enters the queue
|
||||||
* @return data at the first element of the queue, or null.
|
* @return data at the first element of the queue, or null.
|
||||||
*/
|
*/
|
||||||
|
@Override
|
||||||
public byte[] peek(boolean block) throws KeeperException, InterruptedException {
|
public byte[] peek(boolean block) throws KeeperException, InterruptedException {
|
||||||
return block ? peek(Long.MAX_VALUE) : peek();
|
return block ? peek(Long.MAX_VALUE) : peek();
|
||||||
}
|
}
|
||||||
|
@ -146,6 +149,7 @@ public class DistributedQueue {
|
||||||
* @param wait max wait time in ms.
|
* @param wait max wait time in ms.
|
||||||
* @return data at the first element of the queue, or null.
|
* @return data at the first element of the queue, or null.
|
||||||
*/
|
*/
|
||||||
|
@Override
|
||||||
public byte[] peek(long wait) throws KeeperException, InterruptedException {
|
public byte[] peek(long wait) throws KeeperException, InterruptedException {
|
||||||
Preconditions.checkArgument(wait > 0);
|
Preconditions.checkArgument(wait > 0);
|
||||||
Timer.Context time;
|
Timer.Context time;
|
||||||
|
@ -177,6 +181,7 @@ public class DistributedQueue {
|
||||||
*
|
*
|
||||||
* @return Head of the queue or null.
|
* @return Head of the queue or null.
|
||||||
*/
|
*/
|
||||||
|
@Override
|
||||||
public byte[] poll() throws KeeperException, InterruptedException {
|
public byte[] poll() throws KeeperException, InterruptedException {
|
||||||
Timer.Context time = stats.time(dir + "_poll");
|
Timer.Context time = stats.time(dir + "_poll");
|
||||||
try {
|
try {
|
||||||
|
@ -191,6 +196,7 @@ public class DistributedQueue {
|
||||||
*
|
*
|
||||||
* @return The former head of the queue
|
* @return The former head of the queue
|
||||||
*/
|
*/
|
||||||
|
@Override
|
||||||
public byte[] remove() throws NoSuchElementException, KeeperException, InterruptedException {
|
public byte[] remove() throws NoSuchElementException, KeeperException, InterruptedException {
|
||||||
Timer.Context time = stats.time(dir + "_remove");
|
Timer.Context time = stats.time(dir + "_remove");
|
||||||
try {
|
try {
|
||||||
|
@ -209,6 +215,7 @@ public class DistributedQueue {
|
||||||
*
|
*
|
||||||
* @return The former head of the queue
|
* @return The former head of the queue
|
||||||
*/
|
*/
|
||||||
|
@Override
|
||||||
public byte[] take() throws KeeperException, InterruptedException {
|
public byte[] take() throws KeeperException, InterruptedException {
|
||||||
// Same as for element. Should refactor this.
|
// Same as for element. Should refactor this.
|
||||||
Timer.Context timer = stats.time(dir + "_take");
|
Timer.Context timer = stats.time(dir + "_take");
|
||||||
|
@ -231,6 +238,7 @@ public class DistributedQueue {
|
||||||
* Inserts data into queue. If there are no other queue consumers, the offered element
|
* Inserts data into queue. If there are no other queue consumers, the offered element
|
||||||
* will be immediately visible when this method returns.
|
* will be immediately visible when this method returns.
|
||||||
*/
|
*/
|
||||||
|
@Override
|
||||||
public void offer(byte[] data) throws KeeperException, InterruptedException {
|
public void offer(byte[] data) throws KeeperException, InterruptedException {
|
||||||
Timer.Context time = stats.time(dir + "_offer");
|
Timer.Context time = stats.time(dir + "_offer");
|
||||||
try {
|
try {
|
||||||
|
@ -326,7 +334,8 @@ public class DistributedQueue {
|
||||||
* <p/>
|
* <p/>
|
||||||
* Package-private to support {@link OverseerTaskQueue} specifically.
|
* Package-private to support {@link OverseerTaskQueue} specifically.
|
||||||
*/
|
*/
|
||||||
Collection<Pair<String, byte[]>> peekElements(int max, long waitMillis, Predicate<String> acceptFilter) throws KeeperException, InterruptedException {
|
@Override
|
||||||
|
public Collection<Pair<String, byte[]>> peekElements(int max, long waitMillis, Predicate<String> acceptFilter) throws KeeperException, InterruptedException {
|
||||||
List<String> foundChildren = new ArrayList<>();
|
List<String> foundChildren = new ArrayList<>();
|
||||||
long waitNanos = TimeUnit.MILLISECONDS.toNanos(waitMillis);
|
long waitNanos = TimeUnit.MILLISECONDS.toNanos(waitMillis);
|
||||||
boolean first = true;
|
boolean first = true;
|
|
@ -20,6 +20,7 @@ package org.apache.solr.cloud.autoscaling;
|
||||||
import java.io.IOException;
|
import java.io.IOException;
|
||||||
import java.util.Map;
|
import java.util.Map;
|
||||||
|
|
||||||
|
import org.apache.solr.client.solrj.cloud.autoscaling.ClusterDataProvider;
|
||||||
import org.apache.solr.common.MapWriter;
|
import org.apache.solr.common.MapWriter;
|
||||||
import org.apache.solr.core.CoreContainer;
|
import org.apache.solr.core.CoreContainer;
|
||||||
|
|
||||||
|
@ -30,18 +31,18 @@ import org.apache.solr.core.CoreContainer;
|
||||||
*/
|
*/
|
||||||
public class ActionContext implements MapWriter {
|
public class ActionContext implements MapWriter {
|
||||||
|
|
||||||
private final CoreContainer coreContainer;
|
private final ClusterDataProvider clusterDataProvider;
|
||||||
private final AutoScaling.Trigger source;
|
private final AutoScaling.Trigger source;
|
||||||
private final Map<String, Object> properties;
|
private final Map<String, Object> properties;
|
||||||
|
|
||||||
public ActionContext(CoreContainer coreContainer, AutoScaling.Trigger source, Map<String, Object> properties) {
|
public ActionContext(ClusterDataProvider clusterDataProvider, AutoScaling.Trigger source, Map<String, Object> properties) {
|
||||||
this.coreContainer = coreContainer;
|
this.clusterDataProvider = clusterDataProvider;
|
||||||
this.source = source;
|
this.source = source;
|
||||||
this.properties = properties;
|
this.properties = properties;
|
||||||
}
|
}
|
||||||
|
|
||||||
public CoreContainer getCoreContainer() {
|
public ClusterDataProvider getClusterDataProvider() {
|
||||||
return coreContainer;
|
return clusterDataProvider;
|
||||||
}
|
}
|
||||||
|
|
||||||
public AutoScaling.Trigger getSource() {
|
public AutoScaling.Trigger getSource() {
|
||||||
|
|
|
@ -18,8 +18,12 @@
|
||||||
package org.apache.solr.cloud.autoscaling;
|
package org.apache.solr.cloud.autoscaling;
|
||||||
|
|
||||||
|
|
||||||
|
import java.io.IOException;
|
||||||
|
|
||||||
|
import org.apache.solr.client.solrj.cloud.autoscaling.ClusterDataProvider;
|
||||||
import org.apache.solr.client.solrj.cloud.autoscaling.NoneSuggester;
|
import org.apache.solr.client.solrj.cloud.autoscaling.NoneSuggester;
|
||||||
import org.apache.solr.client.solrj.cloud.autoscaling.Policy;
|
import org.apache.solr.client.solrj.cloud.autoscaling.Policy;
|
||||||
|
import org.apache.solr.common.SolrException;
|
||||||
import org.apache.solr.common.cloud.ClusterState;
|
import org.apache.solr.common.cloud.ClusterState;
|
||||||
import org.apache.solr.common.cloud.DocCollection;
|
import org.apache.solr.common.cloud.DocCollection;
|
||||||
import org.apache.solr.common.cloud.ZkStateReader;
|
import org.apache.solr.common.cloud.ZkStateReader;
|
||||||
|
@ -27,15 +31,20 @@ import org.apache.solr.common.cloud.ZkStateReader;
|
||||||
public class AutoAddReplicasPlanAction extends ComputePlanAction {
|
public class AutoAddReplicasPlanAction extends ComputePlanAction {
|
||||||
|
|
||||||
@Override
|
@Override
|
||||||
protected Policy.Suggester getSuggester(Policy.Session session, TriggerEvent event, ZkStateReader zkStateReader) {
|
protected Policy.Suggester getSuggester(Policy.Session session, TriggerEvent event, ClusterDataProvider cdp) {
|
||||||
// for backward compatibility
|
// for backward compatibility
|
||||||
String autoAddReplicas = zkStateReader.getClusterProperty(ZkStateReader.AUTO_ADD_REPLICAS, (String) null);
|
String autoAddReplicas = cdp.getClusterProperty(ZkStateReader.AUTO_ADD_REPLICAS, (String) null);
|
||||||
if (autoAddReplicas != null && autoAddReplicas.equals("false")) {
|
if (autoAddReplicas != null && autoAddReplicas.equals("false")) {
|
||||||
return new NoneSuggester();
|
return new NoneSuggester();
|
||||||
}
|
}
|
||||||
|
|
||||||
Policy.Suggester suggester = super.getSuggester(session, event, zkStateReader);
|
Policy.Suggester suggester = super.getSuggester(session, event, cdp);
|
||||||
ClusterState clusterState = zkStateReader.getClusterState();
|
ClusterState clusterState;
|
||||||
|
try {
|
||||||
|
clusterState = cdp.getClusterState();
|
||||||
|
} catch (IOException e) {
|
||||||
|
throw new SolrException(SolrException.ErrorCode.SERVER_ERROR, "Exception getting cluster state", e);
|
||||||
|
}
|
||||||
|
|
||||||
boolean anyCollections = false;
|
boolean anyCollections = false;
|
||||||
for (DocCollection collection: clusterState.getCollectionsMap().values()) {
|
for (DocCollection collection: clusterState.getCollectionsMap().values()) {
|
||||||
|
|
|
@ -24,8 +24,10 @@ import java.util.Map;
|
||||||
|
|
||||||
import com.google.common.base.Preconditions;
|
import com.google.common.base.Preconditions;
|
||||||
import org.apache.lucene.store.AlreadyClosedException;
|
import org.apache.lucene.store.AlreadyClosedException;
|
||||||
|
import org.apache.solr.client.solrj.cloud.autoscaling.ClusterDataProvider;
|
||||||
import org.apache.solr.client.solrj.cloud.autoscaling.TriggerEventType;
|
import org.apache.solr.client.solrj.cloud.autoscaling.TriggerEventType;
|
||||||
import org.apache.solr.core.CoreContainer;
|
import org.apache.solr.core.CoreContainer;
|
||||||
|
import org.apache.solr.core.SolrResourceLoader;
|
||||||
|
|
||||||
public class AutoScaling {
|
public class AutoScaling {
|
||||||
|
|
||||||
|
@ -110,30 +112,13 @@ public class AutoScaling {
|
||||||
void init();
|
void init();
|
||||||
}
|
}
|
||||||
|
|
||||||
public static class TriggerFactory implements Closeable {
|
/**
|
||||||
|
* Factory to produce instances of {@link Trigger}.
|
||||||
|
*/
|
||||||
|
public static abstract class TriggerFactory implements Closeable {
|
||||||
|
protected boolean isClosed = false;
|
||||||
|
|
||||||
private final CoreContainer coreContainer;
|
public abstract Trigger create(TriggerEventType type, String name, Map<String, Object> props);
|
||||||
|
|
||||||
private boolean isClosed = false;
|
|
||||||
|
|
||||||
public TriggerFactory(CoreContainer coreContainer) {
|
|
||||||
Preconditions.checkNotNull(coreContainer);
|
|
||||||
this.coreContainer = coreContainer;
|
|
||||||
}
|
|
||||||
|
|
||||||
public synchronized Trigger create(TriggerEventType type, String name, Map<String, Object> props) {
|
|
||||||
if (isClosed) {
|
|
||||||
throw new AlreadyClosedException("TriggerFactory has already been closed, cannot create new triggers");
|
|
||||||
}
|
|
||||||
switch (type) {
|
|
||||||
case NODEADDED:
|
|
||||||
return new NodeAddedTrigger(name, props, coreContainer);
|
|
||||||
case NODELOST:
|
|
||||||
return new NodeLostTrigger(name, props, coreContainer);
|
|
||||||
default:
|
|
||||||
throw new IllegalArgumentException("Unknown event type: " + type + " in trigger: " + name);
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
@Override
|
@Override
|
||||||
public void close() throws IOException {
|
public void close() throws IOException {
|
||||||
|
@ -143,6 +128,38 @@ public class AutoScaling {
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
/**
|
||||||
|
* Default implementation of {@link TriggerFactory}.
|
||||||
|
*/
|
||||||
|
public static class TriggerFactoryImpl extends TriggerFactory {
|
||||||
|
|
||||||
|
private final ClusterDataProvider clusterDataProvider;
|
||||||
|
private final SolrResourceLoader loader;
|
||||||
|
|
||||||
|
public TriggerFactoryImpl(SolrResourceLoader loader, ClusterDataProvider clusterDataProvider) {
|
||||||
|
Preconditions.checkNotNull(clusterDataProvider);
|
||||||
|
Preconditions.checkNotNull(loader);
|
||||||
|
this.clusterDataProvider = clusterDataProvider;
|
||||||
|
this.loader = loader;
|
||||||
|
}
|
||||||
|
|
||||||
|
@Override
|
||||||
|
public synchronized Trigger create(TriggerEventType type, String name, Map<String, Object> props) {
|
||||||
|
if (isClosed) {
|
||||||
|
throw new AlreadyClosedException("TriggerFactory has already been closed, cannot create new triggers");
|
||||||
|
}
|
||||||
|
switch (type) {
|
||||||
|
case NODEADDED:
|
||||||
|
return new NodeAddedTrigger(name, props, loader, clusterDataProvider);
|
||||||
|
case NODELOST:
|
||||||
|
return new NodeLostTrigger(name, props, loader, clusterDataProvider);
|
||||||
|
default:
|
||||||
|
throw new IllegalArgumentException("Unknown event type: " + type + " in trigger: " + name);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
}
|
||||||
|
|
||||||
public static final String AUTO_ADD_REPLICAS_TRIGGER_DSL =
|
public static final String AUTO_ADD_REPLICAS_TRIGGER_DSL =
|
||||||
"{" +
|
"{" +
|
||||||
" 'set-trigger' : {" +
|
" 'set-trigger' : {" +
|
||||||
|
|
|
@ -214,7 +214,7 @@ public class AutoScalingHandler extends RequestHandlerBase implements Permission
|
||||||
try (CloudSolrClient build = new CloudSolrClient.Builder()
|
try (CloudSolrClient build = new CloudSolrClient.Builder()
|
||||||
.withHttpClient(container.getUpdateShardHandler().getHttpClient())
|
.withHttpClient(container.getUpdateShardHandler().getHttpClient())
|
||||||
.withZkHost(container.getZkController().getZkServerAddress()).build()) {
|
.withZkHost(container.getZkController().getZkServerAddress()).build()) {
|
||||||
Policy.Session session = policy.createSession(new SolrClientDataProvider(build));
|
Policy.Session session = policy.createSession(new SolrClientDataProvider(new ZkDistributedQueueFactory(container.getZkController().getZkClient()), build));
|
||||||
List<Row> sorted = session.getSorted();
|
List<Row> sorted = session.getSorted();
|
||||||
List<Clause.Violation> violations = session.getViolations();
|
List<Clause.Violation> violations = session.getViolations();
|
||||||
|
|
||||||
|
@ -638,7 +638,8 @@ public class AutoScalingHandler extends RequestHandlerBase implements Permission
|
||||||
try (CloudSolrClient build = new CloudSolrClient.Builder()
|
try (CloudSolrClient build = new CloudSolrClient.Builder()
|
||||||
.withHttpClient(container.getUpdateShardHandler().getHttpClient())
|
.withHttpClient(container.getUpdateShardHandler().getHttpClient())
|
||||||
.withZkHost(container.getZkController().getZkServerAddress()).build()) {
|
.withZkHost(container.getZkController().getZkServerAddress()).build()) {
|
||||||
Policy.Session session = autoScalingConf.getPolicy().createSession(new SolrClientDataProvider(build));
|
Policy.Session session = autoScalingConf.getPolicy()
|
||||||
|
.createSession(new SolrClientDataProvider(new ZkDistributedQueueFactory(container.getZkController().getZkClient()), build));
|
||||||
log.debug("Verified autoscaling configuration");
|
log.debug("Verified autoscaling configuration");
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
|
@ -25,6 +25,7 @@ import java.util.Map;
|
||||||
|
|
||||||
import org.apache.solr.client.solrj.SolrRequest;
|
import org.apache.solr.client.solrj.SolrRequest;
|
||||||
import org.apache.solr.client.solrj.cloud.autoscaling.AutoScalingConfig;
|
import org.apache.solr.client.solrj.cloud.autoscaling.AutoScalingConfig;
|
||||||
|
import org.apache.solr.client.solrj.cloud.autoscaling.ClusterDataProvider;
|
||||||
import org.apache.solr.client.solrj.cloud.autoscaling.Policy;
|
import org.apache.solr.client.solrj.cloud.autoscaling.Policy;
|
||||||
import org.apache.solr.client.solrj.impl.CloudSolrClient;
|
import org.apache.solr.client.solrj.impl.CloudSolrClient;
|
||||||
import org.apache.solr.client.solrj.impl.SolrClientDataProvider;
|
import org.apache.solr.client.solrj.impl.SolrClientDataProvider;
|
||||||
|
@ -48,40 +49,30 @@ public class ComputePlanAction extends TriggerActionBase {
|
||||||
@Override
|
@Override
|
||||||
public void process(TriggerEvent event, ActionContext context) {
|
public void process(TriggerEvent event, ActionContext context) {
|
||||||
log.debug("-- processing event: {} with context properties: {}", event, context.getProperties());
|
log.debug("-- processing event: {} with context properties: {}", event, context.getProperties());
|
||||||
CoreContainer container = context.getCoreContainer();
|
ClusterDataProvider cdp = context.getClusterDataProvider();
|
||||||
try {
|
try {
|
||||||
try (CloudSolrClient cloudSolrClient = new CloudSolrClient.Builder()
|
AutoScalingConfig autoScalingConf = cdp.getAutoScalingConfig();
|
||||||
.withZkHost(container.getZkController().getZkServerAddress())
|
if (autoScalingConf.isEmpty()) {
|
||||||
.withHttpClient(container.getUpdateShardHandler().getHttpClient())
|
log.error("Action: " + getName() + " executed but no policy is configured");
|
||||||
.build()) {
|
return;
|
||||||
ZkStateReader zkStateReader = cloudSolrClient.getZkStateReader();
|
}
|
||||||
AutoScalingConfig autoScalingConf = zkStateReader.getAutoScalingConfig();
|
Policy policy = autoScalingConf.getPolicy();
|
||||||
if (autoScalingConf.isEmpty()) {
|
Policy.Session session = policy.createSession(cdp);
|
||||||
log.error("Action: " + getName() + " executed but no policy is configured");
|
Policy.Suggester suggester = getSuggester(session, event, cdp);
|
||||||
return;
|
while (true) {
|
||||||
}
|
SolrRequest operation = suggester.getOperation();
|
||||||
Policy policy = autoScalingConf.getPolicy();
|
if (operation == null) break;
|
||||||
Policy.Session session = policy.createSession(new SolrClientDataProvider(cloudSolrClient));
|
log.info("Computed Plan: {}", operation.getParams());
|
||||||
Policy.Suggester suggester = getSuggester(session, event, zkStateReader);
|
Map<String, Object> props = context.getProperties();
|
||||||
while (true) {
|
props.compute("operations", (k, v) -> {
|
||||||
SolrRequest operation = suggester.getOperation();
|
List<SolrRequest> operations = (List<SolrRequest>) v;
|
||||||
if (operation == null) break;
|
if (operations == null) operations = new ArrayList<>();
|
||||||
log.info("Computed Plan: {}", operation.getParams());
|
operations.add(operation);
|
||||||
Map<String, Object> props = context.getProperties();
|
return operations;
|
||||||
props.compute("operations", (k, v) -> {
|
});
|
||||||
List<SolrRequest> operations = (List<SolrRequest>) v;
|
session = suggester.getSession();
|
||||||
if (operations == null) operations = new ArrayList<>();
|
suggester = getSuggester(session, event, cdp);
|
||||||
operations.add(operation);
|
|
||||||
return operations;
|
|
||||||
});
|
|
||||||
session = suggester.getSession();
|
|
||||||
suggester = getSuggester(session, event, zkStateReader);
|
|
||||||
}
|
|
||||||
}
|
}
|
||||||
} catch (KeeperException e) {
|
|
||||||
log.error("ZooKeeperException while processing event: " + event, e);
|
|
||||||
} catch (InterruptedException e) {
|
|
||||||
log.error("Interrupted while processing event: " + event, e);
|
|
||||||
} catch (IOException e) {
|
} catch (IOException e) {
|
||||||
log.error("IOException while processing event: " + event, e);
|
log.error("IOException while processing event: " + event, e);
|
||||||
} catch (Exception e) {
|
} catch (Exception e) {
|
||||||
|
@ -89,7 +80,7 @@ public class ComputePlanAction extends TriggerActionBase {
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
protected Policy.Suggester getSuggester(Policy.Session session, TriggerEvent event, ZkStateReader zkStateReader) {
|
protected Policy.Suggester getSuggester(Policy.Session session, TriggerEvent event, ClusterDataProvider cdp) {
|
||||||
Policy.Suggester suggester;
|
Policy.Suggester suggester;
|
||||||
switch (event.getEventType()) {
|
switch (event.getEventType()) {
|
||||||
case NODEADDED:
|
case NODEADDED:
|
||||||
|
|
|
@ -25,6 +25,7 @@ import java.util.List;
|
||||||
import org.apache.solr.client.solrj.SolrRequest;
|
import org.apache.solr.client.solrj.SolrRequest;
|
||||||
import org.apache.solr.client.solrj.SolrResponse;
|
import org.apache.solr.client.solrj.SolrResponse;
|
||||||
import org.apache.solr.client.solrj.SolrServerException;
|
import org.apache.solr.client.solrj.SolrServerException;
|
||||||
|
import org.apache.solr.client.solrj.cloud.autoscaling.ClusterDataProvider;
|
||||||
import org.apache.solr.client.solrj.impl.CloudSolrClient;
|
import org.apache.solr.client.solrj.impl.CloudSolrClient;
|
||||||
import org.apache.solr.client.solrj.impl.HttpSolrClient;
|
import org.apache.solr.client.solrj.impl.HttpSolrClient;
|
||||||
import org.apache.solr.common.SolrException;
|
import org.apache.solr.common.SolrException;
|
||||||
|
@ -43,32 +44,29 @@ public class ExecutePlanAction extends TriggerActionBase {
|
||||||
@Override
|
@Override
|
||||||
public void process(TriggerEvent event, ActionContext context) {
|
public void process(TriggerEvent event, ActionContext context) {
|
||||||
log.debug("-- processing event: {} with context properties: {}", event, context.getProperties());
|
log.debug("-- processing event: {} with context properties: {}", event, context.getProperties());
|
||||||
CoreContainer container = context.getCoreContainer();
|
ClusterDataProvider clusterDataProvider = context.getClusterDataProvider();
|
||||||
List<SolrRequest> operations = (List<SolrRequest>) context.getProperty("operations");
|
List<SolrRequest> operations = (List<SolrRequest>) context.getProperty("operations");
|
||||||
if (operations == null || operations.isEmpty()) {
|
if (operations == null || operations.isEmpty()) {
|
||||||
log.info("No operations to execute for event: {}", event);
|
log.info("No operations to execute for event: {}", event);
|
||||||
return;
|
return;
|
||||||
}
|
}
|
||||||
try (CloudSolrClient cloudSolrClient = new CloudSolrClient.Builder()
|
try {
|
||||||
.withZkHost(container.getZkController().getZkServerAddress())
|
|
||||||
.withHttpClient(container.getUpdateShardHandler().getHttpClient())
|
|
||||||
.build()) {
|
|
||||||
for (SolrRequest operation : operations) {
|
for (SolrRequest operation : operations) {
|
||||||
log.info("Executing operation: {}", operation.getParams());
|
log.info("Executing operation: {}", operation.getParams());
|
||||||
try {
|
try {
|
||||||
SolrResponse response = operation.process(cloudSolrClient);
|
SolrResponse response = clusterDataProvider.request(operation);
|
||||||
context.getProperties().compute("responses", (s, o) -> {
|
context.getProperties().compute("responses", (s, o) -> {
|
||||||
List<NamedList<Object>> responses = (List<NamedList<Object>>) o;
|
List<NamedList<Object>> responses = (List<NamedList<Object>>) o;
|
||||||
if (responses == null) responses = new ArrayList<>(operations.size());
|
if (responses == null) responses = new ArrayList<>(operations.size());
|
||||||
responses.add(response.getResponse());
|
responses.add(response.getResponse());
|
||||||
return responses;
|
return responses;
|
||||||
});
|
});
|
||||||
} catch (SolrServerException | HttpSolrClient.RemoteSolrException e) {
|
} catch (Exception e) {
|
||||||
throw new SolrException(SolrException.ErrorCode.SERVER_ERROR,
|
throw new SolrException(SolrException.ErrorCode.SERVER_ERROR,
|
||||||
"Unexpected exception executing operation: " + operation.getParams(), e);
|
"Unexpected exception executing operation: " + operation.getParams(), e);
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
} catch (IOException e) {
|
} catch (Exception e) {
|
||||||
throw new SolrException(SolrException.ErrorCode.SERVER_ERROR,
|
throw new SolrException(SolrException.ErrorCode.SERVER_ERROR,
|
||||||
"Unexpected IOException while processing event: " + event, e);
|
"Unexpected IOException while processing event: " + event, e);
|
||||||
}
|
}
|
||||||
|
|
|
@ -30,6 +30,7 @@ import org.apache.http.client.methods.HttpPost;
|
||||||
import org.apache.http.client.protocol.HttpClientContext;
|
import org.apache.http.client.protocol.HttpClientContext;
|
||||||
import org.apache.http.entity.StringEntity;
|
import org.apache.http.entity.StringEntity;
|
||||||
import org.apache.solr.client.solrj.cloud.autoscaling.AutoScalingConfig;
|
import org.apache.solr.client.solrj.cloud.autoscaling.AutoScalingConfig;
|
||||||
|
import org.apache.solr.client.solrj.cloud.autoscaling.ClusterDataProvider;
|
||||||
import org.apache.solr.client.solrj.cloud.autoscaling.TriggerEventProcessorStage;
|
import org.apache.solr.client.solrj.cloud.autoscaling.TriggerEventProcessorStage;
|
||||||
import org.apache.solr.client.solrj.impl.HttpClientUtil;
|
import org.apache.solr.client.solrj.impl.HttpClientUtil;
|
||||||
import org.apache.solr.common.util.Utils;
|
import org.apache.solr.common.util.Utils;
|
||||||
|
@ -72,9 +73,9 @@ public class HttpTriggerListener extends TriggerListenerBase {
|
||||||
private boolean followRedirects;
|
private boolean followRedirects;
|
||||||
|
|
||||||
@Override
|
@Override
|
||||||
public void init(CoreContainer coreContainer, AutoScalingConfig.TriggerListenerConfig config) {
|
public void init(ClusterDataProvider clusterDataProvider, AutoScalingConfig.TriggerListenerConfig config) {
|
||||||
super.init(coreContainer, config);
|
super.init(clusterDataProvider, config);
|
||||||
httpClient = coreContainer.getUpdateShardHandler().getHttpClient();
|
httpClient = clusterDataProvider.getHttpClient();
|
||||||
urlTemplate = (String)config.properties.get("url");
|
urlTemplate = (String)config.properties.get("url");
|
||||||
payloadTemplate = (String)config.properties.get("payload");
|
payloadTemplate = (String)config.properties.get("payload");
|
||||||
contentType = (String)config.properties.get("contentType");
|
contentType = (String)config.properties.get("contentType");
|
||||||
|
|
|
@ -17,29 +17,24 @@
|
||||||
|
|
||||||
package org.apache.solr.cloud.autoscaling;
|
package org.apache.solr.cloud.autoscaling;
|
||||||
|
|
||||||
import java.io.IOException;
|
|
||||||
import java.lang.invoke.MethodHandles;
|
import java.lang.invoke.MethodHandles;
|
||||||
import java.util.ArrayList;
|
import java.util.ArrayList;
|
||||||
import java.util.Collection;
|
import java.util.Collection;
|
||||||
import java.util.Collections;
|
|
||||||
import java.util.HashMap;
|
import java.util.HashMap;
|
||||||
import java.util.HashSet;
|
import java.util.HashSet;
|
||||||
import java.util.Iterator;
|
import java.util.Iterator;
|
||||||
import java.util.List;
|
import java.util.List;
|
||||||
import java.util.Locale;
|
|
||||||
import java.util.Map;
|
import java.util.Map;
|
||||||
import java.util.Objects;
|
import java.util.NoSuchElementException;
|
||||||
import java.util.Set;
|
import java.util.Set;
|
||||||
import java.util.concurrent.TimeUnit;
|
import java.util.concurrent.TimeUnit;
|
||||||
import java.util.concurrent.atomic.AtomicReference;
|
|
||||||
|
|
||||||
import org.apache.lucene.util.IOUtils;
|
import org.apache.solr.client.solrj.cloud.autoscaling.ClusterDataProvider;
|
||||||
import org.apache.solr.client.solrj.cloud.autoscaling.TriggerEventType;
|
import org.apache.solr.client.solrj.cloud.autoscaling.TriggerEventType;
|
||||||
import org.apache.solr.common.SolrException;
|
import org.apache.solr.common.SolrException;
|
||||||
import org.apache.solr.common.cloud.ZkStateReader;
|
import org.apache.solr.common.cloud.ZkStateReader;
|
||||||
import org.apache.solr.core.CoreContainer;
|
import org.apache.solr.core.SolrResourceLoader;
|
||||||
import org.apache.solr.util.TimeSource;
|
import org.apache.solr.util.TimeSource;
|
||||||
import org.apache.zookeeper.KeeperException;
|
|
||||||
import org.slf4j.Logger;
|
import org.slf4j.Logger;
|
||||||
import org.slf4j.LoggerFactory;
|
import org.slf4j.LoggerFactory;
|
||||||
|
|
||||||
|
@ -49,60 +44,28 @@ import org.slf4j.LoggerFactory;
|
||||||
public class NodeAddedTrigger extends TriggerBase {
|
public class NodeAddedTrigger extends TriggerBase {
|
||||||
private static final Logger log = LoggerFactory.getLogger(MethodHandles.lookup().lookupClass());
|
private static final Logger log = LoggerFactory.getLogger(MethodHandles.lookup().lookupClass());
|
||||||
|
|
||||||
private final String name;
|
|
||||||
private final Map<String, Object> properties;
|
|
||||||
private final CoreContainer container;
|
|
||||||
private final List<TriggerAction> actions;
|
|
||||||
private final AtomicReference<AutoScaling.TriggerEventProcessor> processorRef;
|
|
||||||
private final boolean enabled;
|
|
||||||
private final int waitForSecond;
|
|
||||||
private final TriggerEventType eventType;
|
|
||||||
private final TimeSource timeSource;
|
private final TimeSource timeSource;
|
||||||
|
|
||||||
private boolean isClosed = false;
|
|
||||||
|
|
||||||
private Set<String> lastLiveNodes;
|
private Set<String> lastLiveNodes;
|
||||||
|
|
||||||
private Map<String, Long> nodeNameVsTimeAdded = new HashMap<>();
|
private Map<String, Long> nodeNameVsTimeAdded = new HashMap<>();
|
||||||
|
|
||||||
public NodeAddedTrigger(String name, Map<String, Object> properties,
|
public NodeAddedTrigger(String name, Map<String, Object> properties,
|
||||||
CoreContainer container) {
|
SolrResourceLoader loader,
|
||||||
super(container.getZkController().getZkClient());
|
ClusterDataProvider clusterDataProvider) {
|
||||||
this.name = name;
|
super(name, properties, loader, clusterDataProvider);
|
||||||
this.properties = properties;
|
|
||||||
this.container = container;
|
|
||||||
this.timeSource = TimeSource.CURRENT_TIME;
|
this.timeSource = TimeSource.CURRENT_TIME;
|
||||||
this.processorRef = new AtomicReference<>();
|
lastLiveNodes = new HashSet<>(clusterDataProvider.getLiveNodes());
|
||||||
List<Map<String, String>> o = (List<Map<String, String>>) properties.get("actions");
|
|
||||||
if (o != null && !o.isEmpty()) {
|
|
||||||
actions = new ArrayList<>(3);
|
|
||||||
for (Map<String, String> map : o) {
|
|
||||||
TriggerAction action = container.getResourceLoader().newInstance(map.get("class"), TriggerAction.class);
|
|
||||||
actions.add(action);
|
|
||||||
}
|
|
||||||
} else {
|
|
||||||
actions = Collections.emptyList();
|
|
||||||
}
|
|
||||||
lastLiveNodes = new HashSet<>(container.getZkController().getZkStateReader().getClusterState().getLiveNodes());
|
|
||||||
log.debug("Initial livenodes: {}", lastLiveNodes);
|
log.debug("Initial livenodes: {}", lastLiveNodes);
|
||||||
this.enabled = Boolean.parseBoolean(String.valueOf(properties.getOrDefault("enabled", "true")));
|
|
||||||
this.waitForSecond = ((Long) properties.getOrDefault("waitFor", -1L)).intValue();
|
|
||||||
this.eventType = TriggerEventType.valueOf(properties.get("event").toString().toUpperCase(Locale.ROOT));
|
|
||||||
log.debug("NodeAddedTrigger {} instantiated with properties: {}", name, properties);
|
log.debug("NodeAddedTrigger {} instantiated with properties: {}", name, properties);
|
||||||
}
|
}
|
||||||
|
|
||||||
@Override
|
@Override
|
||||||
public void init() {
|
public void init() {
|
||||||
List<Map<String, String>> o = (List<Map<String, String>>) properties.get("actions");
|
super.init();
|
||||||
if (o != null && !o.isEmpty()) {
|
|
||||||
for (int i = 0; i < o.size(); i++) {
|
|
||||||
Map<String, String> map = o.get(i);
|
|
||||||
actions.get(i).init(map);
|
|
||||||
}
|
|
||||||
}
|
|
||||||
// pick up added nodes for which marker paths were created
|
// pick up added nodes for which marker paths were created
|
||||||
try {
|
try {
|
||||||
List<String> added = container.getZkController().getZkClient().getChildren(ZkStateReader.SOLR_AUTOSCALING_NODE_ADDED_PATH, null, true);
|
List<String> added = clusterDataProvider.listData(ZkStateReader.SOLR_AUTOSCALING_NODE_ADDED_PATH);
|
||||||
added.forEach(n -> {
|
added.forEach(n -> {
|
||||||
// don't add nodes that have since gone away
|
// don't add nodes that have since gone away
|
||||||
if (lastLiveNodes.contains(n)) {
|
if (lastLiveNodes.contains(n)) {
|
||||||
|
@ -111,77 +74,14 @@ public class NodeAddedTrigger extends TriggerBase {
|
||||||
}
|
}
|
||||||
removeMarker(n);
|
removeMarker(n);
|
||||||
});
|
});
|
||||||
} catch (KeeperException.NoNodeException e) {
|
} catch (NoSuchElementException e) {
|
||||||
// ignore
|
// ignore
|
||||||
} catch (KeeperException | InterruptedException e) {
|
} catch (Exception e) {
|
||||||
log.warn("Exception retrieving nodeLost markers", e);
|
log.warn("Exception retrieving nodeLost markers", e);
|
||||||
}
|
}
|
||||||
|
|
||||||
}
|
}
|
||||||
|
|
||||||
@Override
|
|
||||||
public void setProcessor(AutoScaling.TriggerEventProcessor processor) {
|
|
||||||
processorRef.set(processor);
|
|
||||||
}
|
|
||||||
|
|
||||||
@Override
|
|
||||||
public AutoScaling.TriggerEventProcessor getProcessor() {
|
|
||||||
return processorRef.get();
|
|
||||||
}
|
|
||||||
|
|
||||||
@Override
|
|
||||||
public String getName() {
|
|
||||||
return name;
|
|
||||||
}
|
|
||||||
|
|
||||||
@Override
|
|
||||||
public TriggerEventType getEventType() {
|
|
||||||
return eventType;
|
|
||||||
}
|
|
||||||
|
|
||||||
@Override
|
|
||||||
public boolean isEnabled() {
|
|
||||||
return enabled;
|
|
||||||
}
|
|
||||||
|
|
||||||
@Override
|
|
||||||
public int getWaitForSecond() {
|
|
||||||
return waitForSecond;
|
|
||||||
}
|
|
||||||
|
|
||||||
@Override
|
|
||||||
public Map<String, Object> getProperties() {
|
|
||||||
return properties;
|
|
||||||
}
|
|
||||||
|
|
||||||
@Override
|
|
||||||
public List<TriggerAction> getActions() {
|
|
||||||
return actions;
|
|
||||||
}
|
|
||||||
|
|
||||||
@Override
|
|
||||||
public boolean equals(Object obj) {
|
|
||||||
if (obj instanceof NodeAddedTrigger) {
|
|
||||||
NodeAddedTrigger that = (NodeAddedTrigger) obj;
|
|
||||||
return this.name.equals(that.name)
|
|
||||||
&& this.properties.equals(that.properties);
|
|
||||||
}
|
|
||||||
return false;
|
|
||||||
}
|
|
||||||
|
|
||||||
@Override
|
|
||||||
public int hashCode() {
|
|
||||||
return Objects.hash(name, properties);
|
|
||||||
}
|
|
||||||
|
|
||||||
@Override
|
|
||||||
public void close() throws IOException {
|
|
||||||
synchronized (this) {
|
|
||||||
isClosed = true;
|
|
||||||
IOUtils.closeWhileHandlingException(actions);
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
@Override
|
@Override
|
||||||
public void restoreState(AutoScaling.Trigger old) {
|
public void restoreState(AutoScaling.Trigger old) {
|
||||||
assert old.isClosed();
|
assert old.isClosed();
|
||||||
|
@ -229,8 +129,7 @@ public class NodeAddedTrigger extends TriggerBase {
|
||||||
}
|
}
|
||||||
log.debug("Running NodeAddedTrigger {}", name);
|
log.debug("Running NodeAddedTrigger {}", name);
|
||||||
|
|
||||||
ZkStateReader reader = container.getZkController().getZkStateReader();
|
Set<String> newLiveNodes = new HashSet<>(clusterDataProvider.getLiveNodes());
|
||||||
Set<String> newLiveNodes = reader.getClusterState().getLiveNodes();
|
|
||||||
log.debug("Found livenodes: {}", newLiveNodes);
|
log.debug("Found livenodes: {}", newLiveNodes);
|
||||||
|
|
||||||
// have any nodes that we were tracking been removed from the cluster?
|
// have any nodes that we were tracking been removed from the cluster?
|
||||||
|
@ -287,24 +186,17 @@ public class NodeAddedTrigger extends TriggerBase {
|
||||||
private void removeMarker(String nodeName) {
|
private void removeMarker(String nodeName) {
|
||||||
String path = ZkStateReader.SOLR_AUTOSCALING_NODE_ADDED_PATH + "/" + nodeName;
|
String path = ZkStateReader.SOLR_AUTOSCALING_NODE_ADDED_PATH + "/" + nodeName;
|
||||||
try {
|
try {
|
||||||
if (container.getZkController().getZkClient().exists(path, true)) {
|
if (clusterDataProvider.hasData(path)) {
|
||||||
container.getZkController().getZkClient().delete(path, -1, true);
|
clusterDataProvider.removeData(path, -1);
|
||||||
}
|
}
|
||||||
} catch (KeeperException.NoNodeException e) {
|
} catch (NoSuchElementException e) {
|
||||||
// ignore
|
// ignore
|
||||||
} catch (KeeperException | InterruptedException e) {
|
} catch (Exception e) {
|
||||||
log.debug("Exception removing nodeAdded marker " + nodeName, e);
|
log.debug("Exception removing nodeAdded marker " + nodeName, e);
|
||||||
}
|
}
|
||||||
|
|
||||||
}
|
}
|
||||||
|
|
||||||
@Override
|
|
||||||
public boolean isClosed() {
|
|
||||||
synchronized (this) {
|
|
||||||
return isClosed;
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
public static class NodeAddedEvent extends TriggerEvent {
|
public static class NodeAddedEvent extends TriggerEvent {
|
||||||
|
|
||||||
public NodeAddedEvent(TriggerEventType eventType, String source, List<Long> times, List<String> nodeNames) {
|
public NodeAddedEvent(TriggerEventType eventType, String source, List<Long> times, List<String> nodeNames) {
|
||||||
|
|
|
@ -17,29 +17,24 @@
|
||||||
|
|
||||||
package org.apache.solr.cloud.autoscaling;
|
package org.apache.solr.cloud.autoscaling;
|
||||||
|
|
||||||
import java.io.IOException;
|
|
||||||
import java.lang.invoke.MethodHandles;
|
import java.lang.invoke.MethodHandles;
|
||||||
import java.util.ArrayList;
|
import java.util.ArrayList;
|
||||||
import java.util.Collection;
|
import java.util.Collection;
|
||||||
import java.util.Collections;
|
|
||||||
import java.util.HashMap;
|
import java.util.HashMap;
|
||||||
import java.util.HashSet;
|
import java.util.HashSet;
|
||||||
import java.util.Iterator;
|
import java.util.Iterator;
|
||||||
import java.util.List;
|
import java.util.List;
|
||||||
import java.util.Locale;
|
|
||||||
import java.util.Map;
|
import java.util.Map;
|
||||||
import java.util.Objects;
|
import java.util.NoSuchElementException;
|
||||||
import java.util.Set;
|
import java.util.Set;
|
||||||
import java.util.concurrent.TimeUnit;
|
import java.util.concurrent.TimeUnit;
|
||||||
import java.util.concurrent.atomic.AtomicReference;
|
|
||||||
|
|
||||||
import org.apache.lucene.util.IOUtils;
|
import org.apache.solr.client.solrj.cloud.autoscaling.ClusterDataProvider;
|
||||||
import org.apache.solr.client.solrj.cloud.autoscaling.TriggerEventType;
|
import org.apache.solr.client.solrj.cloud.autoscaling.TriggerEventType;
|
||||||
import org.apache.solr.common.SolrException;
|
import org.apache.solr.common.SolrException;
|
||||||
import org.apache.solr.common.cloud.ZkStateReader;
|
import org.apache.solr.common.cloud.ZkStateReader;
|
||||||
import org.apache.solr.core.CoreContainer;
|
import org.apache.solr.core.SolrResourceLoader;
|
||||||
import org.apache.solr.util.TimeSource;
|
import org.apache.solr.util.TimeSource;
|
||||||
import org.apache.zookeeper.KeeperException;
|
|
||||||
import org.slf4j.Logger;
|
import org.slf4j.Logger;
|
||||||
import org.slf4j.LoggerFactory;
|
import org.slf4j.LoggerFactory;
|
||||||
|
|
||||||
|
@ -49,59 +44,27 @@ import org.slf4j.LoggerFactory;
|
||||||
public class NodeLostTrigger extends TriggerBase {
|
public class NodeLostTrigger extends TriggerBase {
|
||||||
private static final Logger log = LoggerFactory.getLogger(MethodHandles.lookup().lookupClass());
|
private static final Logger log = LoggerFactory.getLogger(MethodHandles.lookup().lookupClass());
|
||||||
|
|
||||||
private final String name;
|
|
||||||
private final Map<String, Object> properties;
|
|
||||||
private final CoreContainer container;
|
|
||||||
private final List<TriggerAction> actions;
|
|
||||||
private final AtomicReference<AutoScaling.TriggerEventProcessor> processorRef;
|
|
||||||
private final boolean enabled;
|
|
||||||
private final int waitForSecond;
|
|
||||||
private final TriggerEventType eventType;
|
|
||||||
private final TimeSource timeSource;
|
private final TimeSource timeSource;
|
||||||
|
|
||||||
private boolean isClosed = false;
|
|
||||||
|
|
||||||
private Set<String> lastLiveNodes;
|
private Set<String> lastLiveNodes;
|
||||||
|
|
||||||
private Map<String, Long> nodeNameVsTimeRemoved = new HashMap<>();
|
private Map<String, Long> nodeNameVsTimeRemoved = new HashMap<>();
|
||||||
|
|
||||||
public NodeLostTrigger(String name, Map<String, Object> properties,
|
public NodeLostTrigger(String name, Map<String, Object> properties,
|
||||||
CoreContainer container) {
|
SolrResourceLoader loader,
|
||||||
super(container.getZkController().getZkClient());
|
ClusterDataProvider clusterDataProvider) {
|
||||||
this.name = name;
|
super(name, properties, loader, clusterDataProvider);
|
||||||
this.properties = properties;
|
|
||||||
this.container = container;
|
|
||||||
this.timeSource = TimeSource.CURRENT_TIME;
|
this.timeSource = TimeSource.CURRENT_TIME;
|
||||||
this.processorRef = new AtomicReference<>();
|
lastLiveNodes = new HashSet<>(clusterDataProvider.getLiveNodes());
|
||||||
List<Map<String, String>> o = (List<Map<String, String>>) properties.get("actions");
|
|
||||||
if (o != null && !o.isEmpty()) {
|
|
||||||
actions = new ArrayList<>(3);
|
|
||||||
for (Map<String, String> map : o) {
|
|
||||||
TriggerAction action = container.getResourceLoader().newInstance(map.get("class"), TriggerAction.class);
|
|
||||||
actions.add(action);
|
|
||||||
}
|
|
||||||
} else {
|
|
||||||
actions = Collections.emptyList();
|
|
||||||
}
|
|
||||||
lastLiveNodes = new HashSet<>(container.getZkController().getZkStateReader().getClusterState().getLiveNodes());
|
|
||||||
log.debug("Initial livenodes: {}", lastLiveNodes);
|
log.debug("Initial livenodes: {}", lastLiveNodes);
|
||||||
this.enabled = Boolean.parseBoolean(String.valueOf(properties.getOrDefault("enabled", "true")));
|
|
||||||
this.waitForSecond = ((Long) properties.getOrDefault("waitFor", -1L)).intValue();
|
|
||||||
this.eventType = TriggerEventType.valueOf(properties.get("event").toString().toUpperCase(Locale.ROOT));
|
|
||||||
}
|
}
|
||||||
|
|
||||||
@Override
|
@Override
|
||||||
public void init() {
|
public void init() {
|
||||||
List<Map<String, String>> o = (List<Map<String, String>>) properties.get("actions");
|
super.init();
|
||||||
if (o != null && !o.isEmpty()) {
|
|
||||||
for (int i = 0; i < o.size(); i++) {
|
|
||||||
Map<String, String> map = o.get(i);
|
|
||||||
actions.get(i).init(map);
|
|
||||||
}
|
|
||||||
}
|
|
||||||
// pick up lost nodes for which marker paths were created
|
// pick up lost nodes for which marker paths were created
|
||||||
try {
|
try {
|
||||||
List<String> lost = container.getZkController().getZkClient().getChildren(ZkStateReader.SOLR_AUTOSCALING_NODE_LOST_PATH, null, true);
|
List<String> lost = clusterDataProvider.listData(ZkStateReader.SOLR_AUTOSCALING_NODE_LOST_PATH);
|
||||||
lost.forEach(n -> {
|
lost.forEach(n -> {
|
||||||
// don't add nodes that have since came back
|
// don't add nodes that have since came back
|
||||||
if (!lastLiveNodes.contains(n)) {
|
if (!lastLiveNodes.contains(n)) {
|
||||||
|
@ -110,76 +73,18 @@ public class NodeLostTrigger extends TriggerBase {
|
||||||
}
|
}
|
||||||
removeMarker(n);
|
removeMarker(n);
|
||||||
});
|
});
|
||||||
} catch (KeeperException.NoNodeException e) {
|
} catch (NoSuchElementException e) {
|
||||||
// ignore
|
// ignore
|
||||||
} catch (KeeperException | InterruptedException e) {
|
} catch (Exception e) {
|
||||||
log.warn("Exception retrieving nodeLost markers", e);
|
log.warn("Exception retrieving nodeLost markers", e);
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
@Override
|
|
||||||
public void setProcessor(AutoScaling.TriggerEventProcessor processor) {
|
|
||||||
processorRef.set(processor);
|
|
||||||
}
|
|
||||||
|
|
||||||
@Override
|
|
||||||
public AutoScaling.TriggerEventProcessor getProcessor() {
|
|
||||||
return processorRef.get();
|
|
||||||
}
|
|
||||||
|
|
||||||
@Override
|
|
||||||
public String getName() {
|
|
||||||
return name;
|
|
||||||
}
|
|
||||||
|
|
||||||
@Override
|
|
||||||
public TriggerEventType getEventType() {
|
|
||||||
return eventType;
|
|
||||||
}
|
|
||||||
|
|
||||||
@Override
|
|
||||||
public boolean isEnabled() {
|
|
||||||
return enabled;
|
|
||||||
}
|
|
||||||
|
|
||||||
@Override
|
|
||||||
public int getWaitForSecond() {
|
|
||||||
return waitForSecond;
|
|
||||||
}
|
|
||||||
|
|
||||||
@Override
|
|
||||||
public Map<String, Object> getProperties() {
|
|
||||||
return properties;
|
|
||||||
}
|
|
||||||
|
|
||||||
@Override
|
@Override
|
||||||
public List<TriggerAction> getActions() {
|
public List<TriggerAction> getActions() {
|
||||||
return actions;
|
return actions;
|
||||||
}
|
}
|
||||||
|
|
||||||
@Override
|
|
||||||
public boolean equals(Object obj) {
|
|
||||||
if (obj instanceof NodeLostTrigger) {
|
|
||||||
NodeLostTrigger that = (NodeLostTrigger) obj;
|
|
||||||
return this.name.equals(that.name)
|
|
||||||
&& this.properties.equals(that.properties);
|
|
||||||
}
|
|
||||||
return false;
|
|
||||||
}
|
|
||||||
|
|
||||||
@Override
|
|
||||||
public int hashCode() {
|
|
||||||
return Objects.hash(name, properties);
|
|
||||||
}
|
|
||||||
|
|
||||||
@Override
|
|
||||||
public void close() throws IOException {
|
|
||||||
synchronized (this) {
|
|
||||||
isClosed = true;
|
|
||||||
IOUtils.closeWhileHandlingException(actions);
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
@Override
|
@Override
|
||||||
public void restoreState(AutoScaling.Trigger old) {
|
public void restoreState(AutoScaling.Trigger old) {
|
||||||
assert old.isClosed();
|
assert old.isClosed();
|
||||||
|
@ -226,8 +131,7 @@ public class NodeLostTrigger extends TriggerBase {
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
ZkStateReader reader = container.getZkController().getZkStateReader();
|
Set<String> newLiveNodes = new HashSet<>(clusterDataProvider.getLiveNodes());
|
||||||
Set<String> newLiveNodes = reader.getClusterState().getLiveNodes();
|
|
||||||
log.debug("Running NodeLostTrigger: {} with currently live nodes: {}", name, newLiveNodes);
|
log.debug("Running NodeLostTrigger: {} with currently live nodes: {}", name, newLiveNodes);
|
||||||
|
|
||||||
// have any nodes that we were tracking been added to the cluster?
|
// have any nodes that we were tracking been added to the cluster?
|
||||||
|
@ -286,23 +190,16 @@ public class NodeLostTrigger extends TriggerBase {
|
||||||
private void removeMarker(String nodeName) {
|
private void removeMarker(String nodeName) {
|
||||||
String path = ZkStateReader.SOLR_AUTOSCALING_NODE_LOST_PATH + "/" + nodeName;
|
String path = ZkStateReader.SOLR_AUTOSCALING_NODE_LOST_PATH + "/" + nodeName;
|
||||||
try {
|
try {
|
||||||
if (container.getZkController().getZkClient().exists(path, true)) {
|
if (clusterDataProvider.hasData(path)) {
|
||||||
container.getZkController().getZkClient().delete(path, -1, true);
|
clusterDataProvider.removeData(path, -1);
|
||||||
}
|
}
|
||||||
} catch (KeeperException.NoNodeException e) {
|
} catch (NoSuchElementException e) {
|
||||||
// ignore
|
// ignore
|
||||||
} catch (KeeperException | InterruptedException e) {
|
} catch (Exception e) {
|
||||||
log.warn("Exception removing nodeLost marker " + nodeName, e);
|
log.warn("Exception removing nodeLost marker " + nodeName, e);
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
@Override
|
|
||||||
public boolean isClosed() {
|
|
||||||
synchronized (this) {
|
|
||||||
return isClosed;
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
public static class NodeLostEvent extends TriggerEvent {
|
public static class NodeLostEvent extends TriggerEvent {
|
||||||
|
|
||||||
public NodeLostEvent(TriggerEventType eventType, String source, List<Long> times, List<String> nodeNames) {
|
public NodeLostEvent(TriggerEventType eventType, String source, List<Long> times, List<String> nodeNames) {
|
||||||
|
|
|
@ -20,16 +20,19 @@ package org.apache.solr.cloud.autoscaling;
|
||||||
import java.io.Closeable;
|
import java.io.Closeable;
|
||||||
import java.io.IOException;
|
import java.io.IOException;
|
||||||
import java.lang.invoke.MethodHandles;
|
import java.lang.invoke.MethodHandles;
|
||||||
|
import java.net.ConnectException;
|
||||||
import java.util.Collections;
|
import java.util.Collections;
|
||||||
import java.util.HashMap;
|
import java.util.HashMap;
|
||||||
import java.util.List;
|
import java.util.List;
|
||||||
import java.util.Map;
|
import java.util.Map;
|
||||||
|
import java.util.NoSuchElementException;
|
||||||
import java.util.Set;
|
import java.util.Set;
|
||||||
import java.util.concurrent.locks.Condition;
|
import java.util.concurrent.locks.Condition;
|
||||||
import java.util.concurrent.locks.ReentrantLock;
|
import java.util.concurrent.locks.ReentrantLock;
|
||||||
|
|
||||||
import org.apache.lucene.store.AlreadyClosedException;
|
import org.apache.lucene.store.AlreadyClosedException;
|
||||||
import org.apache.solr.client.solrj.cloud.autoscaling.AutoScalingConfig;
|
import org.apache.solr.client.solrj.cloud.autoscaling.AutoScalingConfig;
|
||||||
|
import org.apache.solr.client.solrj.cloud.autoscaling.ClusterDataProvider;
|
||||||
import org.apache.solr.client.solrj.cloud.autoscaling.TriggerEventType;
|
import org.apache.solr.client.solrj.cloud.autoscaling.TriggerEventType;
|
||||||
import org.apache.solr.cloud.ZkController;
|
import org.apache.solr.cloud.ZkController;
|
||||||
import org.apache.solr.common.SolrException;
|
import org.apache.solr.common.SolrException;
|
||||||
|
@ -37,6 +40,7 @@ import org.apache.solr.common.cloud.SolrZkClient;
|
||||||
import org.apache.solr.common.cloud.ZkStateReader;
|
import org.apache.solr.common.cloud.ZkStateReader;
|
||||||
import org.apache.solr.common.cloud.ZooKeeperException;
|
import org.apache.solr.common.cloud.ZooKeeperException;
|
||||||
import org.apache.solr.common.util.IOUtils;
|
import org.apache.solr.common.util.IOUtils;
|
||||||
|
import org.apache.solr.core.SolrResourceLoader;
|
||||||
import org.apache.zookeeper.KeeperException;
|
import org.apache.zookeeper.KeeperException;
|
||||||
import org.apache.zookeeper.WatchedEvent;
|
import org.apache.zookeeper.WatchedEvent;
|
||||||
import org.apache.zookeeper.Watcher;
|
import org.apache.zookeeper.Watcher;
|
||||||
|
@ -52,11 +56,7 @@ public class OverseerTriggerThread implements Runnable, Closeable {
|
||||||
|
|
||||||
private static final Logger log = LoggerFactory.getLogger(MethodHandles.lookup().lookupClass());
|
private static final Logger log = LoggerFactory.getLogger(MethodHandles.lookup().lookupClass());
|
||||||
|
|
||||||
private final ZkController zkController;
|
private final ClusterDataProvider clusterDataProvider;
|
||||||
|
|
||||||
private final ZkStateReader zkStateReader;
|
|
||||||
|
|
||||||
private final SolrZkClient zkClient;
|
|
||||||
|
|
||||||
private final ScheduledTriggers scheduledTriggers;
|
private final ScheduledTriggers scheduledTriggers;
|
||||||
|
|
||||||
|
@ -77,12 +77,10 @@ public class OverseerTriggerThread implements Runnable, Closeable {
|
||||||
|
|
||||||
private AutoScalingConfig autoScalingConfig;
|
private AutoScalingConfig autoScalingConfig;
|
||||||
|
|
||||||
public OverseerTriggerThread(ZkController zkController) {
|
public OverseerTriggerThread(SolrResourceLoader loader, ClusterDataProvider clusterDataProvider) {
|
||||||
this.zkController = zkController;
|
this.clusterDataProvider = clusterDataProvider;
|
||||||
zkStateReader = zkController.getZkStateReader();
|
scheduledTriggers = new ScheduledTriggers(loader, clusterDataProvider);
|
||||||
zkClient = zkController.getZkClient();
|
triggerFactory = new AutoScaling.TriggerFactoryImpl(loader, clusterDataProvider);
|
||||||
scheduledTriggers = new ScheduledTriggers(zkController);
|
|
||||||
triggerFactory = new AutoScaling.TriggerFactory(zkController.getCoreContainer());
|
|
||||||
}
|
}
|
||||||
|
|
||||||
@Override
|
@Override
|
||||||
|
@ -106,11 +104,8 @@ public class OverseerTriggerThread implements Runnable, Closeable {
|
||||||
|
|
||||||
try {
|
try {
|
||||||
refreshAutoScalingConf(new AutoScalingWatcher());
|
refreshAutoScalingConf(new AutoScalingWatcher());
|
||||||
} catch (KeeperException.ConnectionLossException | KeeperException.SessionExpiredException e) {
|
} catch (ConnectException e) {
|
||||||
log.warn("ZooKeeper watch triggered for autoscaling conf, but Solr cannot talk to ZK: [{}]", e.getMessage());
|
log.warn("ZooKeeper watch triggered for autoscaling conf, but Solr cannot talk to ZK: [{}]", e.getMessage());
|
||||||
} catch (KeeperException e) {
|
|
||||||
log.error("A ZK error has occurred", e);
|
|
||||||
throw new ZooKeeperException(SolrException.ErrorCode.SERVER_ERROR, "A ZK error has occurred", e);
|
|
||||||
} catch (InterruptedException e) {
|
} catch (InterruptedException e) {
|
||||||
// Restore the interrupted status
|
// Restore the interrupted status
|
||||||
Thread.currentThread().interrupt();
|
Thread.currentThread().interrupt();
|
||||||
|
@ -201,26 +196,26 @@ public class OverseerTriggerThread implements Runnable, Closeable {
|
||||||
if (cleanOldNodeLostMarkers) {
|
if (cleanOldNodeLostMarkers) {
|
||||||
log.debug("-- clean old nodeLost markers");
|
log.debug("-- clean old nodeLost markers");
|
||||||
try {
|
try {
|
||||||
List<String> markers = zkClient.getChildren(ZkStateReader.SOLR_AUTOSCALING_NODE_LOST_PATH, null, true);
|
List<String> markers = clusterDataProvider.listData(ZkStateReader.SOLR_AUTOSCALING_NODE_LOST_PATH);
|
||||||
markers.forEach(n -> {
|
markers.forEach(n -> {
|
||||||
removeNodeMarker(ZkStateReader.SOLR_AUTOSCALING_NODE_LOST_PATH, n);
|
removeNodeMarker(ZkStateReader.SOLR_AUTOSCALING_NODE_LOST_PATH, n);
|
||||||
});
|
});
|
||||||
} catch (KeeperException.NoNodeException e) {
|
} catch (NoSuchElementException e) {
|
||||||
// ignore
|
// ignore
|
||||||
} catch (KeeperException | InterruptedException e) {
|
} catch (Exception e) {
|
||||||
log.warn("Error removing old nodeLost markers", e);
|
log.warn("Error removing old nodeLost markers", e);
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
if (cleanOldNodeAddedMarkers) {
|
if (cleanOldNodeAddedMarkers) {
|
||||||
log.debug("-- clean old nodeAdded markers");
|
log.debug("-- clean old nodeAdded markers");
|
||||||
try {
|
try {
|
||||||
List<String> markers = zkClient.getChildren(ZkStateReader.SOLR_AUTOSCALING_NODE_ADDED_PATH, null, true);
|
List<String> markers = clusterDataProvider.listData(ZkStateReader.SOLR_AUTOSCALING_NODE_ADDED_PATH);
|
||||||
markers.forEach(n -> {
|
markers.forEach(n -> {
|
||||||
removeNodeMarker(ZkStateReader.SOLR_AUTOSCALING_NODE_ADDED_PATH, n);
|
removeNodeMarker(ZkStateReader.SOLR_AUTOSCALING_NODE_ADDED_PATH, n);
|
||||||
});
|
});
|
||||||
} catch (KeeperException.NoNodeException e) {
|
} catch (NoSuchElementException e) {
|
||||||
// ignore
|
// ignore
|
||||||
} catch (KeeperException | InterruptedException e) {
|
} catch (Exception e) {
|
||||||
log.warn("Error removing old nodeAdded markers", e);
|
log.warn("Error removing old nodeAdded markers", e);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@ -231,11 +226,11 @@ public class OverseerTriggerThread implements Runnable, Closeable {
|
||||||
private void removeNodeMarker(String path, String nodeName) {
|
private void removeNodeMarker(String path, String nodeName) {
|
||||||
path = path + "/" + nodeName;
|
path = path + "/" + nodeName;
|
||||||
try {
|
try {
|
||||||
zkClient.delete(path, -1, true);
|
clusterDataProvider.removeData(path, -1);
|
||||||
log.debug(" -- deleted " + path);
|
log.debug(" -- deleted " + path);
|
||||||
} catch (KeeperException.NoNodeException e) {
|
} catch (NoSuchElementException e) {
|
||||||
// ignore
|
// ignore
|
||||||
} catch (KeeperException | InterruptedException e) {
|
} catch (Exception e) {
|
||||||
log.warn("Error removing old marker " + path, e);
|
log.warn("Error removing old marker " + path, e);
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
@ -250,11 +245,8 @@ public class OverseerTriggerThread implements Runnable, Closeable {
|
||||||
|
|
||||||
try {
|
try {
|
||||||
refreshAutoScalingConf(this);
|
refreshAutoScalingConf(this);
|
||||||
} catch (KeeperException.ConnectionLossException | KeeperException.SessionExpiredException e) {
|
} catch (ConnectException e) {
|
||||||
log.warn("ZooKeeper watch triggered for autoscaling conf, but Solr cannot talk to ZK: [{}]", e.getMessage());
|
log.warn("ZooKeeper watch triggered for autoscaling conf, but we cannot talk to ZK: [{}]", e.getMessage());
|
||||||
} catch (KeeperException e) {
|
|
||||||
log.error("A ZK error has occurred", e);
|
|
||||||
throw new ZooKeeperException(SolrException.ErrorCode.SERVER_ERROR, "A ZK error has occurred", e);
|
|
||||||
} catch (InterruptedException e) {
|
} catch (InterruptedException e) {
|
||||||
// Restore the interrupted status
|
// Restore the interrupted status
|
||||||
Thread.currentThread().interrupt();
|
Thread.currentThread().interrupt();
|
||||||
|
@ -266,13 +258,13 @@ public class OverseerTriggerThread implements Runnable, Closeable {
|
||||||
|
|
||||||
}
|
}
|
||||||
|
|
||||||
private void refreshAutoScalingConf(Watcher watcher) throws KeeperException, InterruptedException {
|
private void refreshAutoScalingConf(Watcher watcher) throws ConnectException, InterruptedException, IOException {
|
||||||
updateLock.lock();
|
updateLock.lock();
|
||||||
try {
|
try {
|
||||||
if (isClosed) {
|
if (isClosed) {
|
||||||
return;
|
return;
|
||||||
}
|
}
|
||||||
AutoScalingConfig currentConfig = zkStateReader.getAutoScalingConfig(watcher);
|
AutoScalingConfig currentConfig = clusterDataProvider.getAutoScalingConfig(watcher);
|
||||||
log.debug("Refreshing {} with znode version {}", ZkStateReader.SOLR_AUTOSCALING_CONF_PATH, currentConfig.getZkVersion());
|
log.debug("Refreshing {} with znode version {}", ZkStateReader.SOLR_AUTOSCALING_CONF_PATH, currentConfig.getZkVersion());
|
||||||
if (znodeVersion >= currentConfig.getZkVersion()) {
|
if (znodeVersion >= currentConfig.getZkVersion()) {
|
||||||
// protect against reordered watcher fires by ensuring that we only move forward
|
// protect against reordered watcher fires by ensuring that we only move forward
|
||||||
|
|
|
@ -41,15 +41,18 @@ import java.util.stream.Collectors;
|
||||||
|
|
||||||
import org.apache.lucene.store.AlreadyClosedException;
|
import org.apache.lucene.store.AlreadyClosedException;
|
||||||
import org.apache.solr.client.solrj.cloud.autoscaling.AutoScalingConfig;
|
import org.apache.solr.client.solrj.cloud.autoscaling.AutoScalingConfig;
|
||||||
|
import org.apache.solr.client.solrj.cloud.autoscaling.ClusterDataProvider;
|
||||||
import org.apache.solr.client.solrj.cloud.autoscaling.TriggerEventProcessorStage;
|
import org.apache.solr.client.solrj.cloud.autoscaling.TriggerEventProcessorStage;
|
||||||
import org.apache.solr.cloud.ActionThrottle;
|
import org.apache.solr.cloud.ActionThrottle;
|
||||||
import org.apache.solr.cloud.Overseer;
|
import org.apache.solr.cloud.Overseer;
|
||||||
import org.apache.solr.cloud.ZkController;
|
import org.apache.solr.cloud.ZkController;
|
||||||
|
import org.apache.solr.common.SolrException;
|
||||||
import org.apache.solr.common.cloud.SolrZkClient;
|
import org.apache.solr.common.cloud.SolrZkClient;
|
||||||
import org.apache.solr.common.cloud.ZkStateReader;
|
import org.apache.solr.common.cloud.ZkStateReader;
|
||||||
import org.apache.solr.common.util.ExecutorUtil;
|
import org.apache.solr.common.util.ExecutorUtil;
|
||||||
import org.apache.solr.common.util.IOUtils;
|
import org.apache.solr.common.util.IOUtils;
|
||||||
import org.apache.solr.core.CoreContainer;
|
import org.apache.solr.core.CoreContainer;
|
||||||
|
import org.apache.solr.core.SolrResourceLoader;
|
||||||
import org.apache.solr.util.DefaultSolrThreadFactory;
|
import org.apache.solr.util.DefaultSolrThreadFactory;
|
||||||
import org.apache.zookeeper.KeeperException;
|
import org.apache.zookeeper.KeeperException;
|
||||||
import org.apache.zookeeper.Op;
|
import org.apache.zookeeper.Op;
|
||||||
|
@ -85,17 +88,17 @@ public class ScheduledTriggers implements Closeable {
|
||||||
|
|
||||||
private final ActionThrottle actionThrottle;
|
private final ActionThrottle actionThrottle;
|
||||||
|
|
||||||
private final SolrZkClient zkClient;
|
private final ClusterDataProvider clusterDataProvider;
|
||||||
|
|
||||||
|
private final SolrResourceLoader loader;
|
||||||
|
|
||||||
private final Overseer.Stats queueStats;
|
private final Overseer.Stats queueStats;
|
||||||
|
|
||||||
private final CoreContainer coreContainer;
|
|
||||||
|
|
||||||
private final TriggerListeners listeners;
|
private final TriggerListeners listeners;
|
||||||
|
|
||||||
private AutoScalingConfig autoScalingConfig;
|
private AutoScalingConfig autoScalingConfig;
|
||||||
|
|
||||||
public ScheduledTriggers(ZkController zkController) {
|
public ScheduledTriggers(SolrResourceLoader loader, ClusterDataProvider clusterDataProvider) {
|
||||||
// todo make the core pool size configurable
|
// todo make the core pool size configurable
|
||||||
// it is important to use more than one because a time taking trigger can starve other scheduled triggers
|
// it is important to use more than one because a time taking trigger can starve other scheduled triggers
|
||||||
// ideally we should have as many core threads as the number of triggers but firstly, we don't know beforehand
|
// ideally we should have as many core threads as the number of triggers but firstly, we don't know beforehand
|
||||||
|
@ -108,8 +111,8 @@ public class ScheduledTriggers implements Closeable {
|
||||||
actionExecutor = ExecutorUtil.newMDCAwareSingleThreadExecutor(new DefaultSolrThreadFactory("AutoscalingActionExecutor"));
|
actionExecutor = ExecutorUtil.newMDCAwareSingleThreadExecutor(new DefaultSolrThreadFactory("AutoscalingActionExecutor"));
|
||||||
// todo make the wait time configurable
|
// todo make the wait time configurable
|
||||||
actionThrottle = new ActionThrottle("action", DEFAULT_MIN_MS_BETWEEN_ACTIONS);
|
actionThrottle = new ActionThrottle("action", DEFAULT_MIN_MS_BETWEEN_ACTIONS);
|
||||||
coreContainer = zkController.getCoreContainer();
|
this.clusterDataProvider = clusterDataProvider;
|
||||||
zkClient = zkController.getZkClient();
|
this.loader = loader;
|
||||||
queueStats = new Overseer.Stats();
|
queueStats = new Overseer.Stats();
|
||||||
listeners = new TriggerListeners();
|
listeners = new TriggerListeners();
|
||||||
}
|
}
|
||||||
|
@ -136,7 +139,12 @@ public class ScheduledTriggers implements Closeable {
|
||||||
if (isClosed) {
|
if (isClosed) {
|
||||||
throw new AlreadyClosedException("ScheduledTriggers has been closed and cannot be used anymore");
|
throw new AlreadyClosedException("ScheduledTriggers has been closed and cannot be used anymore");
|
||||||
}
|
}
|
||||||
ScheduledTrigger scheduledTrigger = new ScheduledTrigger(newTrigger, zkClient, queueStats);
|
ScheduledTrigger scheduledTrigger;
|
||||||
|
try {
|
||||||
|
scheduledTrigger = new ScheduledTrigger(newTrigger, clusterDataProvider, queueStats);
|
||||||
|
} catch (IOException e) {
|
||||||
|
throw new SolrException(SolrException.ErrorCode.SERVER_ERROR, "exception creating scheduled trigger", e);
|
||||||
|
}
|
||||||
ScheduledTrigger old = scheduledTriggers.putIfAbsent(newTrigger.getName(), scheduledTrigger);
|
ScheduledTrigger old = scheduledTriggers.putIfAbsent(newTrigger.getName(), scheduledTrigger);
|
||||||
if (old != null) {
|
if (old != null) {
|
||||||
if (old.trigger.equals(newTrigger)) {
|
if (old.trigger.equals(newTrigger)) {
|
||||||
|
@ -182,7 +190,7 @@ public class ScheduledTriggers implements Closeable {
|
||||||
// let the action executor thread wait instead of the trigger thread so we use the throttle here
|
// let the action executor thread wait instead of the trigger thread so we use the throttle here
|
||||||
actionThrottle.minimumWaitBetweenActions();
|
actionThrottle.minimumWaitBetweenActions();
|
||||||
actionThrottle.markAttemptingAction();
|
actionThrottle.markAttemptingAction();
|
||||||
ActionContext actionContext = new ActionContext(coreContainer, newTrigger, new HashMap<>());
|
ActionContext actionContext = new ActionContext(clusterDataProvider, newTrigger, new HashMap<>());
|
||||||
for (TriggerAction action : actions) {
|
for (TriggerAction action : actions) {
|
||||||
List<String> beforeActions = (List<String>)actionContext.getProperties().computeIfAbsent(TriggerEventProcessorStage.BEFORE_ACTION.toString(), k -> new ArrayList<String>());
|
List<String> beforeActions = (List<String>)actionContext.getProperties().computeIfAbsent(TriggerEventProcessorStage.BEFORE_ACTION.toString(), k -> new ArrayList<String>());
|
||||||
beforeActions.add(action.getName());
|
beforeActions.add(action.getName());
|
||||||
|
@ -244,23 +252,23 @@ public class ScheduledTriggers implements Closeable {
|
||||||
String statePath = ZkStateReader.SOLR_AUTOSCALING_TRIGGER_STATE_PATH + "/" + triggerName;
|
String statePath = ZkStateReader.SOLR_AUTOSCALING_TRIGGER_STATE_PATH + "/" + triggerName;
|
||||||
String eventsPath = ZkStateReader.SOLR_AUTOSCALING_EVENTS_PATH + "/" + triggerName;
|
String eventsPath = ZkStateReader.SOLR_AUTOSCALING_EVENTS_PATH + "/" + triggerName;
|
||||||
try {
|
try {
|
||||||
if (zkClient.exists(statePath, true)) {
|
if (clusterDataProvider.hasData(statePath)) {
|
||||||
zkClient.delete(statePath, -1, true);
|
clusterDataProvider.removeData(statePath, -1);
|
||||||
}
|
}
|
||||||
} catch (KeeperException | InterruptedException e) {
|
} catch (Exception e) {
|
||||||
log.warn("Failed to remove state for removed trigger " + statePath, e);
|
log.warn("Failed to remove state for removed trigger " + statePath, e);
|
||||||
}
|
}
|
||||||
try {
|
try {
|
||||||
if (zkClient.exists(eventsPath, true)) {
|
if (clusterDataProvider.hasData(eventsPath)) {
|
||||||
List<String> events = zkClient.getChildren(eventsPath, null, true);
|
List<String> events = clusterDataProvider.listData(eventsPath);
|
||||||
List<Op> ops = new ArrayList<>(events.size() + 1);
|
List<Op> ops = new ArrayList<>(events.size() + 1);
|
||||||
events.forEach(ev -> {
|
events.forEach(ev -> {
|
||||||
ops.add(Op.delete(eventsPath + "/" + ev, -1));
|
ops.add(Op.delete(eventsPath + "/" + ev, -1));
|
||||||
});
|
});
|
||||||
ops.add(Op.delete(eventsPath, -1));
|
ops.add(Op.delete(eventsPath, -1));
|
||||||
zkClient.multi(ops, true);
|
clusterDataProvider.multi(ops);
|
||||||
}
|
}
|
||||||
} catch (KeeperException | InterruptedException e) {
|
} catch (Exception e) {
|
||||||
log.warn("Failed to remove events for removed trigger " + eventsPath, e);
|
log.warn("Failed to remove events for removed trigger " + eventsPath, e);
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
@ -297,9 +305,9 @@ public class ScheduledTriggers implements Closeable {
|
||||||
boolean replay;
|
boolean replay;
|
||||||
volatile boolean isClosed;
|
volatile boolean isClosed;
|
||||||
|
|
||||||
ScheduledTrigger(AutoScaling.Trigger trigger, SolrZkClient zkClient, Overseer.Stats stats) {
|
ScheduledTrigger(AutoScaling.Trigger trigger, ClusterDataProvider clusterDataProvider, Overseer.Stats stats) throws IOException {
|
||||||
this.trigger = trigger;
|
this.trigger = trigger;
|
||||||
this.queue = new TriggerEventQueue(zkClient, trigger.getName(), stats);
|
this.queue = new TriggerEventQueue(clusterDataProvider, trigger.getName(), stats);
|
||||||
this.replay = true;
|
this.replay = true;
|
||||||
this.isClosed = false;
|
this.isClosed = false;
|
||||||
}
|
}
|
||||||
|
@ -426,13 +434,13 @@ public class ScheduledTriggers implements Closeable {
|
||||||
if (listener == null) { // create new instance
|
if (listener == null) { // create new instance
|
||||||
String clazz = config.listenerClass;
|
String clazz = config.listenerClass;
|
||||||
try {
|
try {
|
||||||
listener = coreContainer.getResourceLoader().newInstance(clazz, TriggerListener.class);
|
listener = loader.newInstance(clazz, TriggerListener.class);
|
||||||
} catch (Exception e) {
|
} catch (Exception e) {
|
||||||
log.warn("Invalid TriggerListener class name '" + clazz + "', skipping...", e);
|
log.warn("Invalid TriggerListener class name '" + clazz + "', skipping...", e);
|
||||||
}
|
}
|
||||||
if (listener != null) {
|
if (listener != null) {
|
||||||
try {
|
try {
|
||||||
listener.init(coreContainer, config);
|
listener.init(clusterDataProvider, config);
|
||||||
listenersPerName.put(config.name, listener);
|
listenersPerName.put(config.name, listener);
|
||||||
} catch (Exception e) {
|
} catch (Exception e) {
|
||||||
log.warn("Error initializing TriggerListener " + config, e);
|
log.warn("Error initializing TriggerListener " + config, e);
|
||||||
|
|
|
@ -31,6 +31,7 @@ import java.util.StringJoiner;
|
||||||
|
|
||||||
import org.apache.solr.client.solrj.SolrRequest;
|
import org.apache.solr.client.solrj.SolrRequest;
|
||||||
import org.apache.solr.client.solrj.cloud.autoscaling.AutoScalingConfig;
|
import org.apache.solr.client.solrj.cloud.autoscaling.AutoScalingConfig;
|
||||||
|
import org.apache.solr.client.solrj.cloud.autoscaling.ClusterDataProvider;
|
||||||
import org.apache.solr.client.solrj.cloud.autoscaling.TriggerEventProcessorStage;
|
import org.apache.solr.client.solrj.cloud.autoscaling.TriggerEventProcessorStage;
|
||||||
import org.apache.solr.client.solrj.impl.CloudSolrClient;
|
import org.apache.solr.client.solrj.impl.CloudSolrClient;
|
||||||
import org.apache.solr.client.solrj.request.UpdateRequest;
|
import org.apache.solr.client.solrj.request.UpdateRequest;
|
||||||
|
@ -73,8 +74,8 @@ public class SystemLogListener extends TriggerListenerBase {
|
||||||
private boolean enabled = true;
|
private boolean enabled = true;
|
||||||
|
|
||||||
@Override
|
@Override
|
||||||
public void init(CoreContainer coreContainer, AutoScalingConfig.TriggerListenerConfig config) {
|
public void init(ClusterDataProvider clusterDataProvider, AutoScalingConfig.TriggerListenerConfig config) {
|
||||||
super.init(coreContainer, config);
|
super.init(clusterDataProvider, config);
|
||||||
collection = (String)config.properties.getOrDefault(CollectionAdminParams.COLLECTION, CollectionAdminParams.SYSTEM_COLL);
|
collection = (String)config.properties.getOrDefault(CollectionAdminParams.COLLECTION, CollectionAdminParams.SYSTEM_COLL);
|
||||||
enabled = Boolean.parseBoolean(String.valueOf(config.properties.getOrDefault("enabled", true)));
|
enabled = Boolean.parseBoolean(String.valueOf(config.properties.getOrDefault("enabled", true)));
|
||||||
}
|
}
|
||||||
|
@ -85,10 +86,7 @@ public class SystemLogListener extends TriggerListenerBase {
|
||||||
if (!enabled) {
|
if (!enabled) {
|
||||||
return;
|
return;
|
||||||
}
|
}
|
||||||
try (CloudSolrClient cloudSolrClient = new CloudSolrClient.Builder()
|
try {
|
||||||
.withZkHost(coreContainer.getZkController().getZkServerAddress())
|
|
||||||
.withHttpClient(coreContainer.getUpdateShardHandler().getHttpClient())
|
|
||||||
.build()) {
|
|
||||||
SolrInputDocument doc = new SolrInputDocument();
|
SolrInputDocument doc = new SolrInputDocument();
|
||||||
doc.addField(CommonParams.TYPE, DOC_TYPE);
|
doc.addField(CommonParams.TYPE, DOC_TYPE);
|
||||||
doc.addField(SOURCE_FIELD, SOURCE);
|
doc.addField(SOURCE_FIELD, SOURCE);
|
||||||
|
@ -122,7 +120,8 @@ public class SystemLogListener extends TriggerListenerBase {
|
||||||
}
|
}
|
||||||
UpdateRequest req = new UpdateRequest();
|
UpdateRequest req = new UpdateRequest();
|
||||||
req.add(doc);
|
req.add(doc);
|
||||||
cloudSolrClient.request(req, collection);
|
req.setParam(CollectionAdminParams.COLLECTION, collection);
|
||||||
|
clusterDataProvider.request(req);
|
||||||
} catch (Exception e) {
|
} catch (Exception e) {
|
||||||
if ((e instanceof SolrException) && e.getMessage().contains("Collection not found")) {
|
if ((e instanceof SolrException) && e.getMessage().contains("Collection not found")) {
|
||||||
// relatively benign
|
// relatively benign
|
||||||
|
|
|
@ -16,14 +16,26 @@
|
||||||
*/
|
*/
|
||||||
package org.apache.solr.cloud.autoscaling;
|
package org.apache.solr.cloud.autoscaling;
|
||||||
|
|
||||||
|
import java.io.IOException;
|
||||||
import java.lang.invoke.MethodHandles;
|
import java.lang.invoke.MethodHandles;
|
||||||
|
import java.util.ArrayList;
|
||||||
import java.util.Arrays;
|
import java.util.Arrays;
|
||||||
|
import java.util.Collections;
|
||||||
|
import java.util.HashMap;
|
||||||
|
import java.util.List;
|
||||||
|
import java.util.Locale;
|
||||||
import java.util.Map;
|
import java.util.Map;
|
||||||
|
import java.util.Objects;
|
||||||
import java.util.TreeMap;
|
import java.util.TreeMap;
|
||||||
|
import java.util.concurrent.atomic.AtomicReference;
|
||||||
|
|
||||||
|
import org.apache.lucene.util.IOUtils;
|
||||||
|
import org.apache.solr.client.solrj.cloud.autoscaling.ClusterDataProvider;
|
||||||
|
import org.apache.solr.client.solrj.cloud.autoscaling.TriggerEventType;
|
||||||
import org.apache.solr.common.cloud.SolrZkClient;
|
import org.apache.solr.common.cloud.SolrZkClient;
|
||||||
import org.apache.solr.common.cloud.ZkStateReader;
|
import org.apache.solr.common.cloud.ZkStateReader;
|
||||||
import org.apache.solr.common.util.Utils;
|
import org.apache.solr.common.util.Utils;
|
||||||
|
import org.apache.solr.core.SolrResourceLoader;
|
||||||
import org.apache.zookeeper.CreateMode;
|
import org.apache.zookeeper.CreateMode;
|
||||||
import org.apache.zookeeper.KeeperException;
|
import org.apache.zookeeper.KeeperException;
|
||||||
import org.apache.zookeeper.data.Stat;
|
import org.apache.zookeeper.data.Stat;
|
||||||
|
@ -37,19 +49,130 @@ import org.slf4j.LoggerFactory;
|
||||||
public abstract class TriggerBase implements AutoScaling.Trigger {
|
public abstract class TriggerBase implements AutoScaling.Trigger {
|
||||||
private static final Logger LOG = LoggerFactory.getLogger(MethodHandles.lookup().lookupClass());
|
private static final Logger LOG = LoggerFactory.getLogger(MethodHandles.lookup().lookupClass());
|
||||||
|
|
||||||
protected SolrZkClient zkClient;
|
protected final String name;
|
||||||
|
protected final ClusterDataProvider clusterDataProvider;
|
||||||
|
protected final Map<String, Object> properties = new HashMap<>();
|
||||||
|
protected final TriggerEventType eventType;
|
||||||
|
protected final int waitForSecond;
|
||||||
protected Map<String,Object> lastState;
|
protected Map<String,Object> lastState;
|
||||||
|
protected final AtomicReference<AutoScaling.TriggerEventProcessor> processorRef = new AtomicReference<>();
|
||||||
|
protected final List<TriggerAction> actions;
|
||||||
|
protected final boolean enabled;
|
||||||
|
protected boolean isClosed;
|
||||||
|
|
||||||
|
|
||||||
protected TriggerBase(SolrZkClient zkClient) {
|
protected TriggerBase(String name, Map<String, Object> properties, SolrResourceLoader loader, ClusterDataProvider clusterDataProvider) {
|
||||||
this.zkClient = zkClient;
|
this.name = name;
|
||||||
|
if (properties != null) {
|
||||||
|
this.properties.putAll(properties);
|
||||||
|
}
|
||||||
|
this.clusterDataProvider = clusterDataProvider;
|
||||||
|
this.enabled = Boolean.parseBoolean(String.valueOf(this.properties.getOrDefault("enabled", "true")));
|
||||||
|
this.eventType = TriggerEventType.valueOf(this.properties.getOrDefault("event", TriggerEventType.INVALID.toString()).toString().toUpperCase(Locale.ROOT));
|
||||||
|
this.waitForSecond = ((Long) this.properties.getOrDefault("waitFor", -1L)).intValue();
|
||||||
|
List<Map<String, String>> o = (List<Map<String, String>>) properties.get("actions");
|
||||||
|
if (o != null && !o.isEmpty()) {
|
||||||
|
actions = new ArrayList<>(3);
|
||||||
|
for (Map<String, String> map : o) {
|
||||||
|
TriggerAction action = loader.newInstance(map.get("class"), TriggerAction.class);
|
||||||
|
actions.add(action);
|
||||||
|
}
|
||||||
|
} else {
|
||||||
|
actions = Collections.emptyList();
|
||||||
|
}
|
||||||
|
|
||||||
try {
|
try {
|
||||||
zkClient.makePath(ZkStateReader.SOLR_AUTOSCALING_TRIGGER_STATE_PATH, false, true);
|
if (!clusterDataProvider.hasData(ZkStateReader.SOLR_AUTOSCALING_TRIGGER_STATE_PATH)) {
|
||||||
} catch (KeeperException | InterruptedException e) {
|
clusterDataProvider.makePath(ZkStateReader.SOLR_AUTOSCALING_TRIGGER_STATE_PATH);
|
||||||
|
}
|
||||||
|
} catch (IOException e) {
|
||||||
LOG.warn("Exception checking ZK path " + ZkStateReader.SOLR_AUTOSCALING_TRIGGER_STATE_PATH, e);
|
LOG.warn("Exception checking ZK path " + ZkStateReader.SOLR_AUTOSCALING_TRIGGER_STATE_PATH, e);
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@Override
|
||||||
|
public void init() {
|
||||||
|
List<Map<String, String>> o = (List<Map<String, String>>) properties.get("actions");
|
||||||
|
if (o != null && !o.isEmpty()) {
|
||||||
|
for (int i = 0; i < o.size(); i++) {
|
||||||
|
Map<String, String> map = o.get(i);
|
||||||
|
actions.get(i).init(map);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
@Override
|
||||||
|
public void setProcessor(AutoScaling.TriggerEventProcessor processor) {
|
||||||
|
processorRef.set(processor);
|
||||||
|
}
|
||||||
|
|
||||||
|
@Override
|
||||||
|
public AutoScaling.TriggerEventProcessor getProcessor() {
|
||||||
|
return processorRef.get();
|
||||||
|
}
|
||||||
|
|
||||||
|
@Override
|
||||||
|
public String getName() {
|
||||||
|
return name;
|
||||||
|
}
|
||||||
|
|
||||||
|
@Override
|
||||||
|
public TriggerEventType getEventType() {
|
||||||
|
return eventType;
|
||||||
|
}
|
||||||
|
|
||||||
|
@Override
|
||||||
|
public boolean isEnabled() {
|
||||||
|
return enabled;
|
||||||
|
}
|
||||||
|
|
||||||
|
@Override
|
||||||
|
public int getWaitForSecond() {
|
||||||
|
return waitForSecond;
|
||||||
|
}
|
||||||
|
|
||||||
|
@Override
|
||||||
|
public Map<String, Object> getProperties() {
|
||||||
|
return properties;
|
||||||
|
}
|
||||||
|
|
||||||
|
@Override
|
||||||
|
public List<TriggerAction> getActions() {
|
||||||
|
return actions;
|
||||||
|
}
|
||||||
|
|
||||||
|
@Override
|
||||||
|
public boolean isClosed() {
|
||||||
|
synchronized (this) {
|
||||||
|
return isClosed;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
@Override
|
||||||
|
public void close() throws IOException {
|
||||||
|
synchronized (this) {
|
||||||
|
isClosed = true;
|
||||||
|
IOUtils.closeWhileHandlingException(actions);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
@Override
|
||||||
|
public int hashCode() {
|
||||||
|
return Objects.hash(name, properties);
|
||||||
|
}
|
||||||
|
|
||||||
|
@Override
|
||||||
|
public boolean equals(Object obj) {
|
||||||
|
if (obj == null) {
|
||||||
|
return false;
|
||||||
|
}
|
||||||
|
if (obj.getClass().equals(this.getClass())) {
|
||||||
|
TriggerBase that = (TriggerBase) obj;
|
||||||
|
return this.name.equals(that.name)
|
||||||
|
&& this.properties.equals(that.properties);
|
||||||
|
}
|
||||||
|
return false;
|
||||||
|
}
|
||||||
|
|
||||||
/**
|
/**
|
||||||
* Prepare and return internal state of this trigger in a format suitable for persisting in ZK.
|
* Prepare and return internal state of this trigger in a format suitable for persisting in ZK.
|
||||||
* @return map of internal state properties. Note: values must be supported by {@link Utils#toJSON(Object)}.
|
* @return map of internal state properties. Note: values must be supported by {@link Utils#toJSON(Object)}.
|
||||||
|
@ -72,15 +195,15 @@ public abstract class TriggerBase implements AutoScaling.Trigger {
|
||||||
byte[] data = Utils.toJSON(state);
|
byte[] data = Utils.toJSON(state);
|
||||||
String path = ZkStateReader.SOLR_AUTOSCALING_TRIGGER_STATE_PATH + "/" + getName();
|
String path = ZkStateReader.SOLR_AUTOSCALING_TRIGGER_STATE_PATH + "/" + getName();
|
||||||
try {
|
try {
|
||||||
if (zkClient.exists(path, true)) {
|
if (clusterDataProvider.hasData(path)) {
|
||||||
// update
|
// update
|
||||||
zkClient.setData(path, data, -1, true);
|
clusterDataProvider.setData(path, data, -1);
|
||||||
} else {
|
} else {
|
||||||
// create
|
// create
|
||||||
zkClient.create(path, data, CreateMode.PERSISTENT, true);
|
clusterDataProvider.createData(path, data, CreateMode.PERSISTENT);
|
||||||
}
|
}
|
||||||
lastState = state;
|
lastState = state;
|
||||||
} catch (KeeperException | InterruptedException e) {
|
} catch (IOException e) {
|
||||||
LOG.warn("Exception updating trigger state '" + path + "'", e);
|
LOG.warn("Exception updating trigger state '" + path + "'", e);
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
@ -90,10 +213,10 @@ public abstract class TriggerBase implements AutoScaling.Trigger {
|
||||||
byte[] data = null;
|
byte[] data = null;
|
||||||
String path = ZkStateReader.SOLR_AUTOSCALING_TRIGGER_STATE_PATH + "/" + getName();
|
String path = ZkStateReader.SOLR_AUTOSCALING_TRIGGER_STATE_PATH + "/" + getName();
|
||||||
try {
|
try {
|
||||||
if (zkClient.exists(path, true)) {
|
if (clusterDataProvider.hasData(path)) {
|
||||||
data = zkClient.getData(path, null, new Stat(), true);
|
ClusterDataProvider.VersionedData versionedDat = clusterDataProvider.getData(path);
|
||||||
}
|
}
|
||||||
} catch (KeeperException | InterruptedException e) {
|
} catch (Exception e) {
|
||||||
LOG.warn("Exception getting trigger state '" + path + "'", e);
|
LOG.warn("Exception getting trigger state '" + path + "'", e);
|
||||||
}
|
}
|
||||||
if (data != null) {
|
if (data != null) {
|
||||||
|
|
|
@ -1,23 +1,24 @@
|
||||||
package org.apache.solr.cloud.autoscaling;
|
package org.apache.solr.cloud.autoscaling;
|
||||||
|
|
||||||
|
import java.io.IOException;
|
||||||
import java.lang.invoke.MethodHandles;
|
import java.lang.invoke.MethodHandles;
|
||||||
import java.util.Map;
|
import java.util.Map;
|
||||||
|
import java.util.Queue;
|
||||||
|
|
||||||
|
import org.apache.solr.client.solrj.cloud.DistributedQueue;
|
||||||
|
import org.apache.solr.client.solrj.cloud.autoscaling.ClusterDataProvider;
|
||||||
import org.apache.solr.client.solrj.cloud.autoscaling.TriggerEventType;
|
import org.apache.solr.client.solrj.cloud.autoscaling.TriggerEventType;
|
||||||
import org.apache.solr.cloud.DistributedQueue;
|
|
||||||
import org.apache.solr.cloud.Overseer;
|
import org.apache.solr.cloud.Overseer;
|
||||||
import org.apache.solr.common.cloud.SolrZkClient;
|
|
||||||
import org.apache.solr.common.cloud.ZkStateReader;
|
import org.apache.solr.common.cloud.ZkStateReader;
|
||||||
import org.apache.solr.common.util.Utils;
|
import org.apache.solr.common.util.Utils;
|
||||||
import org.apache.solr.util.TimeSource;
|
import org.apache.solr.util.TimeSource;
|
||||||
import org.apache.zookeeper.KeeperException;
|
|
||||||
import org.slf4j.Logger;
|
import org.slf4j.Logger;
|
||||||
import org.slf4j.LoggerFactory;
|
import org.slf4j.LoggerFactory;
|
||||||
|
|
||||||
/**
|
/**
|
||||||
*
|
*
|
||||||
*/
|
*/
|
||||||
public class TriggerEventQueue extends DistributedQueue {
|
public class TriggerEventQueue {
|
||||||
private static final Logger LOG = LoggerFactory.getLogger(MethodHandles.lookup().lookupClass());
|
private static final Logger LOG = LoggerFactory.getLogger(MethodHandles.lookup().lookupClass());
|
||||||
|
|
||||||
public static final String ENQUEUE_TIME = "_enqueue_time_";
|
public static final String ENQUEUE_TIME = "_enqueue_time_";
|
||||||
|
@ -25,9 +26,11 @@ public class TriggerEventQueue extends DistributedQueue {
|
||||||
|
|
||||||
private final String triggerName;
|
private final String triggerName;
|
||||||
private final TimeSource timeSource;
|
private final TimeSource timeSource;
|
||||||
|
private final DistributedQueue delegate;
|
||||||
|
|
||||||
public TriggerEventQueue(SolrZkClient zookeeper, String triggerName, Overseer.Stats stats) {
|
public TriggerEventQueue(ClusterDataProvider clusterDataProvider, String triggerName, Overseer.Stats stats) throws IOException {
|
||||||
super(zookeeper, ZkStateReader.SOLR_AUTOSCALING_EVENTS_PATH + "/" + triggerName, stats);
|
// TODO: collect stats
|
||||||
|
this.delegate = clusterDataProvider.getDistributedQueueFactory().makeQueue(ZkStateReader.SOLR_AUTOSCALING_EVENTS_PATH + "/" + triggerName);
|
||||||
this.triggerName = triggerName;
|
this.triggerName = triggerName;
|
||||||
this.timeSource = TimeSource.CURRENT_TIME;
|
this.timeSource = TimeSource.CURRENT_TIME;
|
||||||
}
|
}
|
||||||
|
@ -36,9 +39,9 @@ public class TriggerEventQueue extends DistributedQueue {
|
||||||
event.getProperties().put(ENQUEUE_TIME, timeSource.getTime());
|
event.getProperties().put(ENQUEUE_TIME, timeSource.getTime());
|
||||||
try {
|
try {
|
||||||
byte[] data = Utils.toJSON(event);
|
byte[] data = Utils.toJSON(event);
|
||||||
offer(data);
|
delegate.offer(data);
|
||||||
return true;
|
return true;
|
||||||
} catch (KeeperException | InterruptedException e) {
|
} catch (Exception e) {
|
||||||
LOG.warn("Exception adding event " + event + " to queue " + triggerName, e);
|
LOG.warn("Exception adding event " + event + " to queue " + triggerName, e);
|
||||||
return false;
|
return false;
|
||||||
}
|
}
|
||||||
|
@ -47,7 +50,7 @@ public class TriggerEventQueue extends DistributedQueue {
|
||||||
public TriggerEvent peekEvent() {
|
public TriggerEvent peekEvent() {
|
||||||
byte[] data;
|
byte[] data;
|
||||||
try {
|
try {
|
||||||
while ((data = peek()) != null) {
|
while ((data = delegate.peek()) != null) {
|
||||||
if (data.length == 0) {
|
if (data.length == 0) {
|
||||||
LOG.warn("ignoring empty data...");
|
LOG.warn("ignoring empty data...");
|
||||||
continue;
|
continue;
|
||||||
|
@ -60,7 +63,7 @@ public class TriggerEventQueue extends DistributedQueue {
|
||||||
continue;
|
continue;
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
} catch (KeeperException | InterruptedException e) {
|
} catch (Exception e) {
|
||||||
LOG.warn("Exception peeking queue of trigger " + triggerName, e);
|
LOG.warn("Exception peeking queue of trigger " + triggerName, e);
|
||||||
}
|
}
|
||||||
return null;
|
return null;
|
||||||
|
@ -69,7 +72,7 @@ public class TriggerEventQueue extends DistributedQueue {
|
||||||
public TriggerEvent pollEvent() {
|
public TriggerEvent pollEvent() {
|
||||||
byte[] data;
|
byte[] data;
|
||||||
try {
|
try {
|
||||||
while ((data = poll()) != null) {
|
while ((data = delegate.poll()) != null) {
|
||||||
if (data.length == 0) {
|
if (data.length == 0) {
|
||||||
LOG.warn("ignoring empty data...");
|
LOG.warn("ignoring empty data...");
|
||||||
continue;
|
continue;
|
||||||
|
@ -82,7 +85,7 @@ public class TriggerEventQueue extends DistributedQueue {
|
||||||
continue;
|
continue;
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
} catch (KeeperException | InterruptedException e) {
|
} catch (Exception e) {
|
||||||
LOG.warn("Exception polling queue of trigger " + triggerName, e);
|
LOG.warn("Exception polling queue of trigger " + triggerName, e);
|
||||||
}
|
}
|
||||||
return null;
|
return null;
|
||||||
|
|
|
@ -19,6 +19,7 @@ package org.apache.solr.cloud.autoscaling;
|
||||||
import java.io.Closeable;
|
import java.io.Closeable;
|
||||||
|
|
||||||
import org.apache.solr.client.solrj.cloud.autoscaling.AutoScalingConfig;
|
import org.apache.solr.client.solrj.cloud.autoscaling.AutoScalingConfig;
|
||||||
|
import org.apache.solr.client.solrj.cloud.autoscaling.ClusterDataProvider;
|
||||||
import org.apache.solr.client.solrj.cloud.autoscaling.TriggerEventProcessorStage;
|
import org.apache.solr.client.solrj.cloud.autoscaling.TriggerEventProcessorStage;
|
||||||
import org.apache.solr.core.CoreContainer;
|
import org.apache.solr.core.CoreContainer;
|
||||||
|
|
||||||
|
@ -28,7 +29,7 @@ import org.apache.solr.core.CoreContainer;
|
||||||
*/
|
*/
|
||||||
public interface TriggerListener extends Closeable {
|
public interface TriggerListener extends Closeable {
|
||||||
|
|
||||||
void init(CoreContainer coreContainer, AutoScalingConfig.TriggerListenerConfig config) throws Exception;
|
void init(ClusterDataProvider clusterDataProvider, AutoScalingConfig.TriggerListenerConfig config) throws Exception;
|
||||||
|
|
||||||
AutoScalingConfig.TriggerListenerConfig getConfig();
|
AutoScalingConfig.TriggerListenerConfig getConfig();
|
||||||
|
|
||||||
|
|
|
@ -19,7 +19,7 @@ package org.apache.solr.cloud.autoscaling;
|
||||||
import java.io.IOException;
|
import java.io.IOException;
|
||||||
|
|
||||||
import org.apache.solr.client.solrj.cloud.autoscaling.AutoScalingConfig;
|
import org.apache.solr.client.solrj.cloud.autoscaling.AutoScalingConfig;
|
||||||
import org.apache.solr.core.CoreContainer;
|
import org.apache.solr.client.solrj.cloud.autoscaling.ClusterDataProvider;
|
||||||
|
|
||||||
/**
|
/**
|
||||||
* Base class for implementations of {@link TriggerListener}.
|
* Base class for implementations of {@link TriggerListener}.
|
||||||
|
@ -27,11 +27,11 @@ import org.apache.solr.core.CoreContainer;
|
||||||
public abstract class TriggerListenerBase implements TriggerListener {
|
public abstract class TriggerListenerBase implements TriggerListener {
|
||||||
|
|
||||||
protected AutoScalingConfig.TriggerListenerConfig config;
|
protected AutoScalingConfig.TriggerListenerConfig config;
|
||||||
protected CoreContainer coreContainer;
|
protected ClusterDataProvider clusterDataProvider;
|
||||||
|
|
||||||
@Override
|
@Override
|
||||||
public void init(CoreContainer coreContainer, AutoScalingConfig.TriggerListenerConfig config) {
|
public void init(ClusterDataProvider clusterDataProvider, AutoScalingConfig.TriggerListenerConfig config) {
|
||||||
this.coreContainer = coreContainer;
|
this.clusterDataProvider = clusterDataProvider;
|
||||||
this.config = config;
|
this.config = config;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
|
@ -0,0 +1,28 @@
|
||||||
|
package org.apache.solr.cloud.autoscaling;
|
||||||
|
|
||||||
|
import java.io.IOException;
|
||||||
|
|
||||||
|
import org.apache.solr.client.solrj.cloud.DistributedQueue;
|
||||||
|
import org.apache.solr.client.solrj.cloud.autoscaling.ClusterDataProvider;
|
||||||
|
import org.apache.solr.cloud.ZkDistributedQueue;
|
||||||
|
import org.apache.solr.common.cloud.SolrZkClient;
|
||||||
|
|
||||||
|
/**
|
||||||
|
*
|
||||||
|
*/
|
||||||
|
public class ZkDistributedQueueFactory implements ClusterDataProvider.DistributedQueueFactory {
|
||||||
|
private final SolrZkClient zkClient;
|
||||||
|
|
||||||
|
public ZkDistributedQueueFactory(SolrZkClient zkClient) {
|
||||||
|
this.zkClient = zkClient;
|
||||||
|
}
|
||||||
|
@Override
|
||||||
|
public DistributedQueue makeQueue(String path) throws IOException {
|
||||||
|
return new ZkDistributedQueue(zkClient, path);
|
||||||
|
}
|
||||||
|
|
||||||
|
@Override
|
||||||
|
public void removeQueue(String path) throws IOException {
|
||||||
|
|
||||||
|
}
|
||||||
|
}
|
|
@ -956,6 +956,8 @@ public class CoreContainer {
|
||||||
SolrException.log(log, null, e);
|
SolrException.log(log, null, e);
|
||||||
} catch (KeeperException e) {
|
} catch (KeeperException e) {
|
||||||
SolrException.log(log, null, e);
|
SolrException.log(log, null, e);
|
||||||
|
} catch (Exception e) {
|
||||||
|
SolrException.log(log, null, e);
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@ -1377,6 +1379,8 @@ public class CoreContainer {
|
||||||
throw new SolrException(ErrorCode.SERVER_ERROR, "Interrupted while unregistering core [" + name + "] from cloud state");
|
throw new SolrException(ErrorCode.SERVER_ERROR, "Interrupted while unregistering core [" + name + "] from cloud state");
|
||||||
} catch (KeeperException e) {
|
} catch (KeeperException e) {
|
||||||
throw new SolrException(ErrorCode.SERVER_ERROR, "Error unregistering core [" + name + "] from cloud state", e);
|
throw new SolrException(ErrorCode.SERVER_ERROR, "Error unregistering core [" + name + "] from cloud state", e);
|
||||||
|
} catch (Exception e) {
|
||||||
|
throw new SolrException(ErrorCode.SERVER_ERROR, "Error unregistering core [" + name + "] from cloud state", e);
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
|
@ -227,6 +227,8 @@ public class ZkContainer {
|
||||||
} catch (InterruptedException e) {
|
} catch (InterruptedException e) {
|
||||||
Thread.interrupted();
|
Thread.interrupted();
|
||||||
ZkContainer.log.error("", e);
|
ZkContainer.log.error("", e);
|
||||||
|
} catch (Exception e) {
|
||||||
|
ZkContainer.log.error("", e);
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
|
@ -46,7 +46,7 @@ import org.apache.solr.client.solrj.request.GenericSolrRequest;
|
||||||
import org.apache.solr.client.solrj.request.UpdateRequest;
|
import org.apache.solr.client.solrj.request.UpdateRequest;
|
||||||
import org.apache.solr.client.solrj.response.SimpleSolrResponse;
|
import org.apache.solr.client.solrj.response.SimpleSolrResponse;
|
||||||
import org.apache.solr.cloud.CloudDescriptor;
|
import org.apache.solr.cloud.CloudDescriptor;
|
||||||
import org.apache.solr.cloud.DistributedQueue;
|
import org.apache.solr.client.solrj.cloud.DistributedQueue;
|
||||||
import org.apache.solr.cloud.Overseer;
|
import org.apache.solr.cloud.Overseer;
|
||||||
import org.apache.solr.cloud.ZkController;
|
import org.apache.solr.cloud.ZkController;
|
||||||
import org.apache.solr.cloud.overseer.OverseerAction;
|
import org.apache.solr.cloud.overseer.OverseerAction;
|
||||||
|
|
|
@ -21,6 +21,7 @@ import java.util.HashMap;
|
||||||
import java.util.Map;
|
import java.util.Map;
|
||||||
|
|
||||||
import org.apache.solr.client.solrj.SolrServerException;
|
import org.apache.solr.client.solrj.SolrServerException;
|
||||||
|
import org.apache.solr.client.solrj.cloud.DistributedQueue;
|
||||||
import org.apache.solr.client.solrj.impl.CloudSolrClient;
|
import org.apache.solr.client.solrj.impl.CloudSolrClient;
|
||||||
import org.apache.solr.client.solrj.request.CollectionAdminRequest;
|
import org.apache.solr.client.solrj.request.CollectionAdminRequest;
|
||||||
import org.apache.solr.client.solrj.request.CoreStatus;
|
import org.apache.solr.client.solrj.request.CoreStatus;
|
||||||
|
@ -82,8 +83,7 @@ public class DeleteShardTest extends SolrCloudTestCase {
|
||||||
|
|
||||||
}
|
}
|
||||||
|
|
||||||
protected void setSliceState(String collection, String slice, State state) throws SolrServerException, IOException,
|
protected void setSliceState(String collection, String slice, State state) throws Exception {
|
||||||
KeeperException, InterruptedException {
|
|
||||||
|
|
||||||
CloudSolrClient client = cluster.getSolrClient();
|
CloudSolrClient client = cluster.getSolrClient();
|
||||||
|
|
||||||
|
|
|
@ -25,6 +25,7 @@ import java.util.concurrent.TimeoutException;
|
||||||
import java.util.function.Predicate;
|
import java.util.function.Predicate;
|
||||||
|
|
||||||
import org.apache.solr.SolrTestCaseJ4;
|
import org.apache.solr.SolrTestCaseJ4;
|
||||||
|
import org.apache.solr.client.solrj.cloud.DistributedQueue;
|
||||||
import org.apache.solr.common.cloud.SolrZkClient;
|
import org.apache.solr.common.cloud.SolrZkClient;
|
||||||
import org.apache.solr.common.util.ExecutorUtil;
|
import org.apache.solr.common.util.ExecutorUtil;
|
||||||
import org.apache.solr.common.util.SolrjNamedThreadFactory;
|
import org.apache.solr.common.util.SolrjNamedThreadFactory;
|
||||||
|
@ -95,7 +96,7 @@ public class DistributedQueueTest extends SolrTestCaseJ4 {
|
||||||
String dqZNode = "/distqueue/test";
|
String dqZNode = "/distqueue/test";
|
||||||
byte[] data = "hello world".getBytes(UTF8);
|
byte[] data = "hello world".getBytes(UTF8);
|
||||||
|
|
||||||
DistributedQueue consumer = makeDistributedQueue(dqZNode);
|
ZkDistributedQueue consumer = makeDistributedQueue(dqZNode);
|
||||||
DistributedQueue producer = makeDistributedQueue(dqZNode);
|
DistributedQueue producer = makeDistributedQueue(dqZNode);
|
||||||
DistributedQueue producer2 = makeDistributedQueue(dqZNode);
|
DistributedQueue producer2 = makeDistributedQueue(dqZNode);
|
||||||
|
|
||||||
|
@ -124,7 +125,7 @@ public class DistributedQueueTest extends SolrTestCaseJ4 {
|
||||||
String dqZNode = "/distqueue/test";
|
String dqZNode = "/distqueue/test";
|
||||||
String testData = "hello world";
|
String testData = "hello world";
|
||||||
|
|
||||||
DistributedQueue dq = makeDistributedQueue(dqZNode);
|
ZkDistributedQueue dq = makeDistributedQueue(dqZNode);
|
||||||
|
|
||||||
assertNull(dq.peek());
|
assertNull(dq.peek());
|
||||||
Future<String> future = executor.submit(() -> new String(dq.peek(true), UTF8));
|
Future<String> future = executor.submit(() -> new String(dq.peek(true), UTF8));
|
||||||
|
@ -171,7 +172,7 @@ public class DistributedQueueTest extends SolrTestCaseJ4 {
|
||||||
@Test
|
@Test
|
||||||
public void testLeakChildWatcher() throws Exception {
|
public void testLeakChildWatcher() throws Exception {
|
||||||
String dqZNode = "/distqueue/test";
|
String dqZNode = "/distqueue/test";
|
||||||
DistributedQueue dq = makeDistributedQueue(dqZNode);
|
ZkDistributedQueue dq = makeDistributedQueue(dqZNode);
|
||||||
assertTrue(dq.peekElements(1, 1, s1 -> true).isEmpty());
|
assertTrue(dq.peekElements(1, 1, s1 -> true).isEmpty());
|
||||||
assertEquals(1, dq.watcherCount());
|
assertEquals(1, dq.watcherCount());
|
||||||
assertFalse(dq.isDirty());
|
assertFalse(dq.isDirty());
|
||||||
|
@ -280,8 +281,8 @@ public class DistributedQueueTest extends SolrTestCaseJ4 {
|
||||||
assertFalse(sessionId == zkClient.getSolrZooKeeper().getSessionId());
|
assertFalse(sessionId == zkClient.getSolrZooKeeper().getSessionId());
|
||||||
}
|
}
|
||||||
|
|
||||||
protected DistributedQueue makeDistributedQueue(String dqZNode) throws Exception {
|
protected ZkDistributedQueue makeDistributedQueue(String dqZNode) throws Exception {
|
||||||
return new DistributedQueue(zkClient, setupNewDistributedQueueZNode(dqZNode));
|
return new ZkDistributedQueue(zkClient, setupNewDistributedQueueZNode(dqZNode));
|
||||||
}
|
}
|
||||||
|
|
||||||
private static class QueueChangerThread extends Thread {
|
private static class QueueChangerThread extends Thread {
|
||||||
|
|
|
@ -26,6 +26,7 @@ import org.apache.solr.client.solrj.SolrClient;
|
||||||
import org.apache.solr.client.solrj.SolrRequest;
|
import org.apache.solr.client.solrj.SolrRequest;
|
||||||
import org.apache.solr.client.solrj.SolrRequest.METHOD;
|
import org.apache.solr.client.solrj.SolrRequest.METHOD;
|
||||||
import org.apache.solr.client.solrj.SolrServerException;
|
import org.apache.solr.client.solrj.SolrServerException;
|
||||||
|
import org.apache.solr.client.solrj.cloud.DistributedQueue;
|
||||||
import org.apache.solr.client.solrj.embedded.JettySolrRunner;
|
import org.apache.solr.client.solrj.embedded.JettySolrRunner;
|
||||||
import org.apache.solr.client.solrj.impl.HttpSolrClient;
|
import org.apache.solr.client.solrj.impl.HttpSolrClient;
|
||||||
import org.apache.solr.client.solrj.request.CollectionAdminRequest;
|
import org.apache.solr.client.solrj.request.CollectionAdminRequest;
|
||||||
|
@ -230,8 +231,7 @@ public class ForceLeaderTest extends HttpPartitionTest {
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
protected void setReplicaState(String collection, String slice, Replica replica, Replica.State state) throws SolrServerException, IOException,
|
protected void setReplicaState(String collection, String slice, Replica replica, Replica.State state) throws Exception {
|
||||||
KeeperException, InterruptedException {
|
|
||||||
DistributedQueue inQueue = Overseer.getStateUpdateQueue(cloudClient.getZkStateReader().getZkClient());
|
DistributedQueue inQueue = Overseer.getStateUpdateQueue(cloudClient.getZkStateReader().getZkClient());
|
||||||
ZkStateReader zkStateReader = cloudClient.getZkStateReader();
|
ZkStateReader zkStateReader = cloudClient.getZkStateReader();
|
||||||
|
|
||||||
|
|
|
@ -23,6 +23,7 @@ import java.util.Random;
|
||||||
import org.apache.solr.client.solrj.SolrClient;
|
import org.apache.solr.client.solrj.SolrClient;
|
||||||
import org.apache.solr.client.solrj.SolrRequest;
|
import org.apache.solr.client.solrj.SolrRequest;
|
||||||
import org.apache.solr.client.solrj.SolrServerException;
|
import org.apache.solr.client.solrj.SolrServerException;
|
||||||
|
import org.apache.solr.client.solrj.cloud.DistributedQueue;
|
||||||
import org.apache.solr.client.solrj.impl.HttpSolrClient;
|
import org.apache.solr.client.solrj.impl.HttpSolrClient;
|
||||||
import org.apache.solr.client.solrj.request.CollectionAdminRequest;
|
import org.apache.solr.client.solrj.request.CollectionAdminRequest;
|
||||||
import org.apache.solr.client.solrj.request.CollectionAdminRequest.Create;
|
import org.apache.solr.client.solrj.request.CollectionAdminRequest.Create;
|
||||||
|
@ -68,7 +69,7 @@ public class MultiThreadedOCPTest extends AbstractFullDistribZkTestBase {
|
||||||
|
|
||||||
private void testFillWorkQueue() throws Exception {
|
private void testFillWorkQueue() throws Exception {
|
||||||
try (SolrClient client = createNewSolrClient("", getBaseUrl((HttpSolrClient) clients.get(0)))) {
|
try (SolrClient client = createNewSolrClient("", getBaseUrl((HttpSolrClient) clients.get(0)))) {
|
||||||
DistributedQueue distributedQueue = new DistributedQueue(cloudClient.getZkStateReader().getZkClient(),
|
DistributedQueue distributedQueue = new ZkDistributedQueue(cloudClient.getZkStateReader().getZkClient(),
|
||||||
"/overseer/collection-queue-work", new Overseer.Stats());
|
"/overseer/collection-queue-work", new Overseer.Stats());
|
||||||
//fill the work queue with blocked tasks by adding more than the no:of parallel tasks
|
//fill the work queue with blocked tasks by adding more than the no:of parallel tasks
|
||||||
for (int i = 0; i < MAX_PARALLEL_TASKS+5; i++) {
|
for (int i = 0; i < MAX_PARALLEL_TASKS+5; i++) {
|
||||||
|
@ -149,7 +150,7 @@ public class MultiThreadedOCPTest extends AbstractFullDistribZkTestBase {
|
||||||
|
|
||||||
private void testTaskExclusivity() throws Exception, SolrServerException {
|
private void testTaskExclusivity() throws Exception, SolrServerException {
|
||||||
|
|
||||||
DistributedQueue distributedQueue = new DistributedQueue(cloudClient.getZkStateReader().getZkClient(),
|
DistributedQueue distributedQueue = new ZkDistributedQueue(cloudClient.getZkStateReader().getZkClient(),
|
||||||
"/overseer/collection-queue-work", new Overseer.Stats());
|
"/overseer/collection-queue-work", new Overseer.Stats());
|
||||||
try (SolrClient client = createNewSolrClient("", getBaseUrl((HttpSolrClient) clients.get(0)))) {
|
try (SolrClient client = createNewSolrClient("", getBaseUrl((HttpSolrClient) clients.get(0)))) {
|
||||||
|
|
||||||
|
|
|
@ -37,6 +37,7 @@ import com.codahale.metrics.Snapshot;
|
||||||
import com.codahale.metrics.Timer;
|
import com.codahale.metrics.Timer;
|
||||||
import org.apache.lucene.util.LuceneTestCase.Slow;
|
import org.apache.lucene.util.LuceneTestCase.Slow;
|
||||||
import org.apache.solr.SolrTestCaseJ4;
|
import org.apache.solr.SolrTestCaseJ4;
|
||||||
|
import org.apache.solr.client.solrj.cloud.DistributedQueue;
|
||||||
import org.apache.solr.cloud.overseer.OverseerAction;
|
import org.apache.solr.cloud.overseer.OverseerAction;
|
||||||
import org.apache.solr.common.cloud.ClusterState;
|
import org.apache.solr.common.cloud.ClusterState;
|
||||||
import org.apache.solr.common.cloud.DocCollection;
|
import org.apache.solr.common.cloud.DocCollection;
|
||||||
|
@ -133,7 +134,7 @@ public class OverseerTest extends SolrTestCaseJ4 {
|
||||||
zkClient.close();
|
zkClient.close();
|
||||||
}
|
}
|
||||||
|
|
||||||
public void createCollection(String collection, int numShards) throws KeeperException, InterruptedException {
|
public void createCollection(String collection, int numShards) throws Exception {
|
||||||
|
|
||||||
ZkNodeProps m = new ZkNodeProps(Overseer.QUEUE_OPERATION, CollectionParams.CollectionAction.CREATE.toLower(),
|
ZkNodeProps m = new ZkNodeProps(Overseer.QUEUE_OPERATION, CollectionParams.CollectionAction.CREATE.toLower(),
|
||||||
"name", collection,
|
"name", collection,
|
||||||
|
@ -146,7 +147,7 @@ public class OverseerTest extends SolrTestCaseJ4 {
|
||||||
}
|
}
|
||||||
|
|
||||||
public String publishState(String collection, String coreName, String coreNodeName, String shard, Replica.State stateName, int numShards)
|
public String publishState(String collection, String coreName, String coreNodeName, String shard, Replica.State stateName, int numShards)
|
||||||
throws KeeperException, InterruptedException, IOException {
|
throws Exception {
|
||||||
if (stateName == null) {
|
if (stateName == null) {
|
||||||
ElectionContext ec = electionContext.remove(coreName);
|
ElectionContext ec = electionContext.remove(coreName);
|
||||||
if (ec != null) {
|
if (ec != null) {
|
||||||
|
|
|
@ -31,6 +31,7 @@ import org.apache.lucene.util.TestUtil;
|
||||||
import org.apache.solr.BaseDistributedSearchTestCase;
|
import org.apache.solr.BaseDistributedSearchTestCase;
|
||||||
import org.apache.solr.SolrTestCaseJ4;
|
import org.apache.solr.SolrTestCaseJ4;
|
||||||
import org.apache.solr.client.solrj.SolrQuery;
|
import org.apache.solr.client.solrj.SolrQuery;
|
||||||
|
import org.apache.solr.client.solrj.cloud.DistributedQueue;
|
||||||
import org.apache.solr.client.solrj.embedded.JettySolrRunner;
|
import org.apache.solr.client.solrj.embedded.JettySolrRunner;
|
||||||
import org.apache.solr.client.solrj.impl.HttpSolrClient;
|
import org.apache.solr.client.solrj.impl.HttpSolrClient;
|
||||||
import org.apache.solr.client.solrj.request.CollectionAdminRequest;
|
import org.apache.solr.client.solrj.request.CollectionAdminRequest;
|
||||||
|
|
|
@ -150,7 +150,7 @@ public class AutoAddReplicasPlanActionTest extends SolrCloudTestCase{
|
||||||
private List<SolrRequest> getOperations(JettySolrRunner actionJetty, String lostNodeName) {
|
private List<SolrRequest> getOperations(JettySolrRunner actionJetty, String lostNodeName) {
|
||||||
AutoAddReplicasPlanAction action = new AutoAddReplicasPlanAction();
|
AutoAddReplicasPlanAction action = new AutoAddReplicasPlanAction();
|
||||||
TriggerEvent lostNode = new NodeLostTrigger.NodeLostEvent(TriggerEventType.NODELOST, ".auto_add_replicas", Collections.singletonList(System.currentTimeMillis()), Collections.singletonList(lostNodeName));
|
TriggerEvent lostNode = new NodeLostTrigger.NodeLostEvent(TriggerEventType.NODELOST, ".auto_add_replicas", Collections.singletonList(System.currentTimeMillis()), Collections.singletonList(lostNodeName));
|
||||||
ActionContext context = new ActionContext(actionJetty.getCoreContainer(), null, new HashMap<>());
|
ActionContext context = new ActionContext(actionJetty.getCoreContainer().getZkController().getClusterDataProvider(), null, new HashMap<>());
|
||||||
action.process(lostNode, context);
|
action.process(lostNode, context);
|
||||||
List<SolrRequest> operations = (List) context.getProperty("operations");
|
List<SolrRequest> operations = (List) context.getProperty("operations");
|
||||||
return operations;
|
return operations;
|
||||||
|
|
|
@ -110,7 +110,7 @@ public class ExecutePlanActionTest extends SolrCloudTestCase {
|
||||||
NodeLostTrigger.NodeLostEvent nodeLostEvent = new NodeLostTrigger.NodeLostEvent(TriggerEventType.NODELOST,
|
NodeLostTrigger.NodeLostEvent nodeLostEvent = new NodeLostTrigger.NodeLostEvent(TriggerEventType.NODELOST,
|
||||||
"mock_trigger_name", Collections.singletonList(TimeSource.CURRENT_TIME.getTime()),
|
"mock_trigger_name", Collections.singletonList(TimeSource.CURRENT_TIME.getTime()),
|
||||||
Collections.singletonList(sourceNodeName));
|
Collections.singletonList(sourceNodeName));
|
||||||
ActionContext actionContext = new ActionContext(survivor.getCoreContainer(), null,
|
ActionContext actionContext = new ActionContext(survivor.getCoreContainer().getZkController().getClusterDataProvider(), null,
|
||||||
new HashMap<>(Collections.singletonMap("operations", operations)));
|
new HashMap<>(Collections.singletonMap("operations", operations)));
|
||||||
action.process(nodeLostEvent, actionContext);
|
action.process(nodeLostEvent, actionContext);
|
||||||
|
|
||||||
|
|
|
@ -30,6 +30,7 @@ import java.util.concurrent.atomic.AtomicReference;
|
||||||
import org.apache.solr.client.solrj.embedded.JettySolrRunner;
|
import org.apache.solr.client.solrj.embedded.JettySolrRunner;
|
||||||
import org.apache.solr.cloud.SolrCloudTestCase;
|
import org.apache.solr.cloud.SolrCloudTestCase;
|
||||||
import org.apache.solr.core.CoreContainer;
|
import org.apache.solr.core.CoreContainer;
|
||||||
|
import org.apache.solr.core.SolrResourceLoader;
|
||||||
import org.apache.solr.util.TimeSource;
|
import org.apache.solr.util.TimeSource;
|
||||||
import org.junit.Before;
|
import org.junit.Before;
|
||||||
import org.junit.BeforeClass;
|
import org.junit.BeforeClass;
|
||||||
|
@ -72,7 +73,8 @@ public class NodeAddedTriggerTest extends SolrCloudTestCase {
|
||||||
long waitForSeconds = 1 + random().nextInt(5);
|
long waitForSeconds = 1 + random().nextInt(5);
|
||||||
Map<String, Object> props = createTriggerProps(waitForSeconds);
|
Map<String, Object> props = createTriggerProps(waitForSeconds);
|
||||||
|
|
||||||
try (NodeAddedTrigger trigger = new NodeAddedTrigger("node_added_trigger", props, container)) {
|
try (NodeAddedTrigger trigger = new NodeAddedTrigger("node_added_trigger", props, container.getResourceLoader(),
|
||||||
|
container.getZkController().getClusterDataProvider())) {
|
||||||
trigger.setProcessor(noFirstRunProcessor);
|
trigger.setProcessor(noFirstRunProcessor);
|
||||||
trigger.run();
|
trigger.run();
|
||||||
|
|
||||||
|
@ -112,7 +114,8 @@ public class NodeAddedTriggerTest extends SolrCloudTestCase {
|
||||||
|
|
||||||
// add a new node but remove it before the waitFor period expires
|
// add a new node but remove it before the waitFor period expires
|
||||||
// and assert that the trigger doesn't fire at all
|
// and assert that the trigger doesn't fire at all
|
||||||
try (NodeAddedTrigger trigger = new NodeAddedTrigger("node_added_trigger", props, container)) {
|
try (NodeAddedTrigger trigger = new NodeAddedTrigger("node_added_trigger", props, container.getResourceLoader(),
|
||||||
|
container.getZkController().getClusterDataProvider())) {
|
||||||
final long waitTime = 2;
|
final long waitTime = 2;
|
||||||
props.put("waitFor", waitTime);
|
props.put("waitFor", waitTime);
|
||||||
trigger.setProcessor(noFirstRunProcessor);
|
trigger.setProcessor(noFirstRunProcessor);
|
||||||
|
@ -157,7 +160,8 @@ public class NodeAddedTriggerTest extends SolrCloudTestCase {
|
||||||
action.put("name", "testActionInit");
|
action.put("name", "testActionInit");
|
||||||
action.put("class", NodeAddedTriggerTest.AssertInitTriggerAction.class.getName());
|
action.put("class", NodeAddedTriggerTest.AssertInitTriggerAction.class.getName());
|
||||||
actions.add(action);
|
actions.add(action);
|
||||||
try (NodeAddedTrigger trigger = new NodeAddedTrigger("node_added_trigger", props, container)) {
|
try (NodeAddedTrigger trigger = new NodeAddedTrigger("node_added_trigger", props, container.getResourceLoader(),
|
||||||
|
container.getZkController().getClusterDataProvider())) {
|
||||||
assertEquals(true, actionConstructorCalled.get());
|
assertEquals(true, actionConstructorCalled.get());
|
||||||
assertEquals(false, actionInitCalled.get());
|
assertEquals(false, actionInitCalled.get());
|
||||||
assertEquals(false, actionCloseCalled.get());
|
assertEquals(false, actionCloseCalled.get());
|
||||||
|
@ -198,7 +202,8 @@ public class NodeAddedTriggerTest extends SolrCloudTestCase {
|
||||||
public void testListenerAcceptance() throws Exception {
|
public void testListenerAcceptance() throws Exception {
|
||||||
CoreContainer container = cluster.getJettySolrRunners().get(0).getCoreContainer();
|
CoreContainer container = cluster.getJettySolrRunners().get(0).getCoreContainer();
|
||||||
Map<String, Object> props = createTriggerProps(0);
|
Map<String, Object> props = createTriggerProps(0);
|
||||||
try (NodeAddedTrigger trigger = new NodeAddedTrigger("node_added_trigger", props, container)) {
|
try (NodeAddedTrigger trigger = new NodeAddedTrigger("node_added_trigger", props, container.getResourceLoader(),
|
||||||
|
container.getZkController().getClusterDataProvider())) {
|
||||||
trigger.setProcessor(noFirstRunProcessor);
|
trigger.setProcessor(noFirstRunProcessor);
|
||||||
trigger.run(); // starts tracking live nodes
|
trigger.run(); // starts tracking live nodes
|
||||||
|
|
||||||
|
@ -234,7 +239,8 @@ public class NodeAddedTriggerTest extends SolrCloudTestCase {
|
||||||
|
|
||||||
// add a new node but update the trigger before the waitFor period expires
|
// add a new node but update the trigger before the waitFor period expires
|
||||||
// and assert that the new trigger still fires
|
// and assert that the new trigger still fires
|
||||||
NodeAddedTrigger trigger = new NodeAddedTrigger("node_added_trigger", props, container);
|
NodeAddedTrigger trigger = new NodeAddedTrigger("node_added_trigger", props, container.getResourceLoader(),
|
||||||
|
container.getZkController().getClusterDataProvider());
|
||||||
trigger.setProcessor(noFirstRunProcessor);
|
trigger.setProcessor(noFirstRunProcessor);
|
||||||
trigger.run();
|
trigger.run();
|
||||||
|
|
||||||
|
@ -242,7 +248,8 @@ public class NodeAddedTriggerTest extends SolrCloudTestCase {
|
||||||
trigger.run(); // this run should detect the new node
|
trigger.run(); // this run should detect the new node
|
||||||
trigger.close(); // close the old trigger
|
trigger.close(); // close the old trigger
|
||||||
|
|
||||||
try (NodeAddedTrigger newTrigger = new NodeAddedTrigger("some_different_name", props, container)) {
|
try (NodeAddedTrigger newTrigger = new NodeAddedTrigger("some_different_name", props, container.getResourceLoader(),
|
||||||
|
container.getZkController().getClusterDataProvider())) {
|
||||||
try {
|
try {
|
||||||
newTrigger.restoreState(trigger);
|
newTrigger.restoreState(trigger);
|
||||||
fail("Trigger should only be able to restore state from an old trigger of the same name");
|
fail("Trigger should only be able to restore state from an old trigger of the same name");
|
||||||
|
@ -251,7 +258,8 @@ public class NodeAddedTriggerTest extends SolrCloudTestCase {
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
try (NodeAddedTrigger newTrigger = new NodeAddedTrigger("node_added_trigger", props, container)) {
|
try (NodeAddedTrigger newTrigger = new NodeAddedTrigger("node_added_trigger", props, container.getResourceLoader(),
|
||||||
|
container.getZkController().getClusterDataProvider())) {
|
||||||
AtomicBoolean fired = new AtomicBoolean(false);
|
AtomicBoolean fired = new AtomicBoolean(false);
|
||||||
AtomicReference<TriggerEvent> eventRef = new AtomicReference<>();
|
AtomicReference<TriggerEvent> eventRef = new AtomicReference<>();
|
||||||
newTrigger.setProcessor(event -> {
|
newTrigger.setProcessor(event -> {
|
||||||
|
|
|
@ -73,7 +73,8 @@ public class NodeLostTriggerTest extends SolrCloudTestCase {
|
||||||
long waitForSeconds = 1 + random().nextInt(5);
|
long waitForSeconds = 1 + random().nextInt(5);
|
||||||
Map<String, Object> props = createTriggerProps(waitForSeconds);
|
Map<String, Object> props = createTriggerProps(waitForSeconds);
|
||||||
|
|
||||||
try (NodeLostTrigger trigger = new NodeLostTrigger("node_lost_trigger", props, container)) {
|
try (NodeLostTrigger trigger = new NodeLostTrigger("node_lost_trigger", props, container.getResourceLoader(),
|
||||||
|
container.getZkController().getClusterDataProvider())) {
|
||||||
trigger.setProcessor(noFirstRunProcessor);
|
trigger.setProcessor(noFirstRunProcessor);
|
||||||
trigger.run();
|
trigger.run();
|
||||||
String lostNodeName1 = cluster.getJettySolrRunner(1).getNodeName();
|
String lostNodeName1 = cluster.getJettySolrRunner(1).getNodeName();
|
||||||
|
@ -117,7 +118,8 @@ public class NodeLostTriggerTest extends SolrCloudTestCase {
|
||||||
|
|
||||||
// remove a node but add it back before the waitFor period expires
|
// remove a node but add it back before the waitFor period expires
|
||||||
// and assert that the trigger doesn't fire at all
|
// and assert that the trigger doesn't fire at all
|
||||||
try (NodeLostTrigger trigger = new NodeLostTrigger("node_lost_trigger", props, container)) {
|
try (NodeLostTrigger trigger = new NodeLostTrigger("node_lost_trigger", props, container.getResourceLoader(),
|
||||||
|
container.getZkController().getClusterDataProvider())) {
|
||||||
final long waitTime = 2;
|
final long waitTime = 2;
|
||||||
props.put("waitFor", waitTime);
|
props.put("waitFor", waitTime);
|
||||||
trigger.setProcessor(noFirstRunProcessor);
|
trigger.setProcessor(noFirstRunProcessor);
|
||||||
|
@ -173,7 +175,8 @@ public class NodeLostTriggerTest extends SolrCloudTestCase {
|
||||||
action.put("name", "testActionInit");
|
action.put("name", "testActionInit");
|
||||||
action.put("class", AssertInitTriggerAction.class.getName());
|
action.put("class", AssertInitTriggerAction.class.getName());
|
||||||
actions.add(action);
|
actions.add(action);
|
||||||
try (NodeLostTrigger trigger = new NodeLostTrigger("node_added_trigger", props, container)) {
|
try (NodeLostTrigger trigger = new NodeLostTrigger("node_added_trigger", props, container.getResourceLoader(),
|
||||||
|
container.getZkController().getClusterDataProvider())) {
|
||||||
assertEquals(true, actionConstructorCalled.get());
|
assertEquals(true, actionConstructorCalled.get());
|
||||||
assertEquals(false, actionInitCalled.get());
|
assertEquals(false, actionInitCalled.get());
|
||||||
assertEquals(false, actionCloseCalled.get());
|
assertEquals(false, actionCloseCalled.get());
|
||||||
|
@ -214,7 +217,8 @@ public class NodeLostTriggerTest extends SolrCloudTestCase {
|
||||||
public void testListenerAcceptance() throws Exception {
|
public void testListenerAcceptance() throws Exception {
|
||||||
CoreContainer container = cluster.getJettySolrRunners().get(0).getCoreContainer();
|
CoreContainer container = cluster.getJettySolrRunners().get(0).getCoreContainer();
|
||||||
Map<String, Object> props = createTriggerProps(0);
|
Map<String, Object> props = createTriggerProps(0);
|
||||||
try (NodeLostTrigger trigger = new NodeLostTrigger("node_added_trigger", props, container)) {
|
try (NodeLostTrigger trigger = new NodeLostTrigger("node_added_trigger", props, container.getResourceLoader(),
|
||||||
|
container.getZkController().getClusterDataProvider())) {
|
||||||
trigger.setProcessor(noFirstRunProcessor);
|
trigger.setProcessor(noFirstRunProcessor);
|
||||||
|
|
||||||
JettySolrRunner newNode = cluster.startJettySolrRunner();
|
JettySolrRunner newNode = cluster.startJettySolrRunner();
|
||||||
|
@ -267,7 +271,8 @@ public class NodeLostTriggerTest extends SolrCloudTestCase {
|
||||||
// remove a node but update the trigger before the waitFor period expires
|
// remove a node but update the trigger before the waitFor period expires
|
||||||
// and assert that the new trigger still fires
|
// and assert that the new trigger still fires
|
||||||
|
|
||||||
NodeLostTrigger trigger = new NodeLostTrigger("node_lost_trigger", props, container);
|
NodeLostTrigger trigger = new NodeLostTrigger("node_lost_trigger", props, container.getResourceLoader(),
|
||||||
|
container.getZkController().getClusterDataProvider());
|
||||||
trigger.setProcessor(noFirstRunProcessor);
|
trigger.setProcessor(noFirstRunProcessor);
|
||||||
trigger.run();
|
trigger.run();
|
||||||
|
|
||||||
|
@ -284,7 +289,8 @@ public class NodeLostTriggerTest extends SolrCloudTestCase {
|
||||||
trigger.run(); // this run should detect the lost node
|
trigger.run(); // this run should detect the lost node
|
||||||
trigger.close(); // close the old trigger
|
trigger.close(); // close the old trigger
|
||||||
|
|
||||||
try (NodeLostTrigger newTrigger = new NodeLostTrigger("some_different_name", props, container)) {
|
try (NodeLostTrigger newTrigger = new NodeLostTrigger("some_different_name", props, container.getResourceLoader(),
|
||||||
|
container.getZkController().getClusterDataProvider())) {
|
||||||
try {
|
try {
|
||||||
newTrigger.restoreState(trigger);
|
newTrigger.restoreState(trigger);
|
||||||
fail("Trigger should only be able to restore state from an old trigger of the same name");
|
fail("Trigger should only be able to restore state from an old trigger of the same name");
|
||||||
|
@ -293,7 +299,8 @@ public class NodeLostTriggerTest extends SolrCloudTestCase {
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
try (NodeLostTrigger newTrigger = new NodeLostTrigger("node_lost_trigger", props, container)) {
|
try (NodeLostTrigger newTrigger = new NodeLostTrigger("node_lost_trigger", props, container.getResourceLoader(),
|
||||||
|
container.getZkController().getClusterDataProvider())) {
|
||||||
AtomicBoolean fired = new AtomicBoolean(false);
|
AtomicBoolean fired = new AtomicBoolean(false);
|
||||||
AtomicReference<TriggerEvent> eventRef = new AtomicReference<>();
|
AtomicReference<TriggerEvent> eventRef = new AtomicReference<>();
|
||||||
newTrigger.setProcessor(event -> {
|
newTrigger.setProcessor(event -> {
|
||||||
|
|
|
@ -168,7 +168,7 @@ public class TestPolicyCloud extends SolrCloudTestCase {
|
||||||
CollectionAdminRequest.createCollection("metricsTest", "conf", 1, 1)
|
CollectionAdminRequest.createCollection("metricsTest", "conf", 1, 1)
|
||||||
.process(cluster.getSolrClient());
|
.process(cluster.getSolrClient());
|
||||||
DocCollection collection = getCollectionState("metricsTest");
|
DocCollection collection = getCollectionState("metricsTest");
|
||||||
SolrClientDataProvider provider = new SolrClientDataProvider(solrClient);
|
SolrClientDataProvider provider = new SolrClientDataProvider(new ZkDistributedQueueFactory(cluster.getZkClient()), solrClient);
|
||||||
List<String> tags = Arrays.asList("metrics:solr.node:ADMIN./admin/authorization.clientErrors:count",
|
List<String> tags = Arrays.asList("metrics:solr.node:ADMIN./admin/authorization.clientErrors:count",
|
||||||
"metrics:solr.jvm:buffers.direct.Count");
|
"metrics:solr.jvm:buffers.direct.Count");
|
||||||
Map<String, Object> val = provider.getNodeValues(collection .getReplicas().get(0).getNodeName(), tags);
|
Map<String, Object> val = provider.getNodeValues(collection .getReplicas().get(0).getNodeName(), tags);
|
||||||
|
@ -268,7 +268,7 @@ public class TestPolicyCloud extends SolrCloudTestCase {
|
||||||
CollectionAdminRequest.createCollectionWithImplicitRouter("policiesTest", "conf", "shard1", 2)
|
CollectionAdminRequest.createCollectionWithImplicitRouter("policiesTest", "conf", "shard1", 2)
|
||||||
.process(cluster.getSolrClient());
|
.process(cluster.getSolrClient());
|
||||||
DocCollection rulesCollection = getCollectionState("policiesTest");
|
DocCollection rulesCollection = getCollectionState("policiesTest");
|
||||||
SolrClientDataProvider provider = new SolrClientDataProvider(cluster.getSolrClient());
|
SolrClientDataProvider provider = new SolrClientDataProvider(new ZkDistributedQueueFactory(cluster.getZkClient()), cluster.getSolrClient());
|
||||||
Map<String, Object> val = provider.getNodeValues(rulesCollection.getReplicas().get(0).getNodeName(), Arrays.asList(
|
Map<String, Object> val = provider.getNodeValues(rulesCollection.getReplicas().get(0).getNodeName(), Arrays.asList(
|
||||||
"freedisk",
|
"freedisk",
|
||||||
"cores",
|
"cores",
|
||||||
|
|
|
@ -34,6 +34,7 @@ import java.util.concurrent.locks.ReentrantLock;
|
||||||
|
|
||||||
import org.apache.solr.client.solrj.SolrRequest;
|
import org.apache.solr.client.solrj.SolrRequest;
|
||||||
import org.apache.solr.client.solrj.cloud.autoscaling.AutoScalingConfig;
|
import org.apache.solr.client.solrj.cloud.autoscaling.AutoScalingConfig;
|
||||||
|
import org.apache.solr.client.solrj.cloud.autoscaling.ClusterDataProvider;
|
||||||
import org.apache.solr.client.solrj.cloud.autoscaling.TriggerEventProcessorStage;
|
import org.apache.solr.client.solrj.cloud.autoscaling.TriggerEventProcessorStage;
|
||||||
import org.apache.solr.client.solrj.cloud.autoscaling.TriggerEventType;
|
import org.apache.solr.client.solrj.cloud.autoscaling.TriggerEventType;
|
||||||
import org.apache.solr.client.solrj.embedded.JettySolrRunner;
|
import org.apache.solr.client.solrj.embedded.JettySolrRunner;
|
||||||
|
@ -965,8 +966,8 @@ public class TriggerIntegrationTest extends SolrCloudTestCase {
|
||||||
|
|
||||||
public static class TestTriggerListener extends TriggerListenerBase {
|
public static class TestTriggerListener extends TriggerListenerBase {
|
||||||
@Override
|
@Override
|
||||||
public void init(CoreContainer coreContainer, AutoScalingConfig.TriggerListenerConfig config) {
|
public void init(ClusterDataProvider clusterDataProvider, AutoScalingConfig.TriggerListenerConfig config) {
|
||||||
super.init(coreContainer, config);
|
super.init(clusterDataProvider, config);
|
||||||
listenerCreated.countDown();
|
listenerCreated.countDown();
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
|
@ -0,0 +1,44 @@
|
||||||
|
/*
|
||||||
|
* Licensed to the Apache Software Foundation (ASF) under one or more
|
||||||
|
* contributor license agreements. See the NOTICE file distributed with
|
||||||
|
* this work for additional information regarding copyright ownership.
|
||||||
|
* The ASF licenses this file to You under the Apache License, Version 2.0
|
||||||
|
* (the "License"); you may not use this file except in compliance with
|
||||||
|
* the License. You may obtain a copy of the License at
|
||||||
|
*
|
||||||
|
* http://www.apache.org/licenses/LICENSE-2.0
|
||||||
|
*
|
||||||
|
* Unless required by applicable law or agreed to in writing, software
|
||||||
|
* distributed under the License is distributed on an "AS IS" BASIS,
|
||||||
|
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||||
|
* See the License for the specific language governing permissions and
|
||||||
|
* limitations under the License.
|
||||||
|
*/
|
||||||
|
package org.apache.solr.client.solrj.cloud;
|
||||||
|
|
||||||
|
import java.util.Collection;
|
||||||
|
import java.util.function.Predicate;
|
||||||
|
|
||||||
|
import org.apache.solr.common.util.Pair;
|
||||||
|
|
||||||
|
/**
|
||||||
|
*
|
||||||
|
*/
|
||||||
|
public interface DistributedQueue {
|
||||||
|
byte[] peek() throws Exception;
|
||||||
|
|
||||||
|
byte[] peek(boolean block) throws Exception;
|
||||||
|
|
||||||
|
byte[] peek(long wait) throws Exception;
|
||||||
|
|
||||||
|
byte[] poll() throws Exception;
|
||||||
|
|
||||||
|
byte[] remove() throws Exception;
|
||||||
|
|
||||||
|
byte[] take() throws Exception;
|
||||||
|
|
||||||
|
void offer(byte[] data) throws Exception;
|
||||||
|
|
||||||
|
Collection<Pair<String, byte[]>> peekElements(int max, long waitMillis, Predicate<String> acceptFilter) throws Exception;
|
||||||
|
|
||||||
|
}
|
|
@ -19,12 +19,28 @@ package org.apache.solr.client.solrj.cloud.autoscaling;
|
||||||
|
|
||||||
import java.io.Closeable;
|
import java.io.Closeable;
|
||||||
import java.io.IOException;
|
import java.io.IOException;
|
||||||
|
import java.net.ConnectException;
|
||||||
import java.util.Collection;
|
import java.util.Collection;
|
||||||
import java.util.List;
|
import java.util.List;
|
||||||
import java.util.Map;
|
import java.util.Map;
|
||||||
|
import java.util.NoSuchElementException;
|
||||||
|
|
||||||
|
import org.apache.http.client.HttpClient;
|
||||||
|
import org.apache.solr.client.solrj.SolrRequest;
|
||||||
|
import org.apache.solr.client.solrj.SolrResponse;
|
||||||
|
import org.apache.solr.client.solrj.cloud.DistributedQueue;
|
||||||
|
import org.apache.solr.common.cloud.ClusterState;
|
||||||
|
import org.apache.zookeeper.CreateMode;
|
||||||
|
import org.apache.zookeeper.Op;
|
||||||
|
import org.apache.zookeeper.OpResult;
|
||||||
|
import org.apache.zookeeper.Watcher;
|
||||||
|
|
||||||
|
/**
|
||||||
|
* This interface abstracts the details of dealing with Zookeeper and Solr from the autoscaling framework.
|
||||||
|
*/
|
||||||
public interface ClusterDataProvider extends Closeable {
|
public interface ClusterDataProvider extends Closeable {
|
||||||
/**Get the value of each tag for a given node
|
/**
|
||||||
|
* Get the value of each tag for a given node
|
||||||
*
|
*
|
||||||
* @param node node name
|
* @param node node name
|
||||||
* @param tags tag names
|
* @param tags tag names
|
||||||
|
@ -34,19 +50,87 @@ public interface ClusterDataProvider extends Closeable {
|
||||||
|
|
||||||
/**
|
/**
|
||||||
* Get the details of each replica in a node. It attempts to fetch as much details about
|
* Get the details of each replica in a node. It attempts to fetch as much details about
|
||||||
* the replica as mentioned in the keys list. It is not necessary to give al details
|
* the replica as mentioned in the keys list. It is not necessary to give all details
|
||||||
* <p>
|
* <p>
|
||||||
* the format is {collection:shard :[{replicadetails}]}
|
* the format is {collection:shard :[{replicadetails}]}
|
||||||
*/
|
*/
|
||||||
Map<String, Map<String, List<ReplicaInfo>>> getReplicaInfo(String node, Collection<String> keys);
|
Map<String, Map<String, List<ReplicaInfo>>> getReplicaInfo(String node, Collection<String> keys);
|
||||||
|
|
||||||
Collection<String> getNodes();
|
/**
|
||||||
|
* Get the current set of live nodes.
|
||||||
|
*/
|
||||||
|
Collection<String> getLiveNodes();
|
||||||
|
|
||||||
/**Get the collection-specific policy
|
ClusterState getClusterState() throws IOException;
|
||||||
|
|
||||||
|
Map<String, Object> getClusterProperties();
|
||||||
|
|
||||||
|
default <T> T getClusterProperty(String key, T defaultValue) {
|
||||||
|
T value = (T) getClusterProperties().get(key);
|
||||||
|
if (value == null)
|
||||||
|
return defaultValue;
|
||||||
|
return value;
|
||||||
|
}
|
||||||
|
|
||||||
|
AutoScalingConfig getAutoScalingConfig(Watcher watcher) throws ConnectException, InterruptedException, IOException;
|
||||||
|
|
||||||
|
default AutoScalingConfig getAutoScalingConfig() throws ConnectException, InterruptedException, IOException {
|
||||||
|
return getAutoScalingConfig(null);
|
||||||
|
}
|
||||||
|
|
||||||
|
/**
|
||||||
|
* Get the collection-specific policy
|
||||||
*/
|
*/
|
||||||
String getPolicyNameByCollection(String coll);
|
String getPolicyNameByCollection(String coll);
|
||||||
|
|
||||||
@Override
|
@Override
|
||||||
default void close() throws IOException {
|
default void close() throws IOException {
|
||||||
}
|
}
|
||||||
|
|
||||||
|
// ZK-like methods
|
||||||
|
|
||||||
|
boolean hasData(String path) throws IOException;
|
||||||
|
|
||||||
|
List<String> listData(String path) throws NoSuchElementException, IOException;
|
||||||
|
|
||||||
|
class VersionedData {
|
||||||
|
public final int version;
|
||||||
|
public final byte[] data;
|
||||||
|
|
||||||
|
public VersionedData(int version, byte[] data) {
|
||||||
|
this.version = version;
|
||||||
|
this.data = data;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
VersionedData getData(String path, Watcher watcher) throws NoSuchElementException, IOException;
|
||||||
|
|
||||||
|
default VersionedData getData(String path) throws NoSuchElementException, IOException {
|
||||||
|
return getData(path, null);
|
||||||
|
}
|
||||||
|
|
||||||
|
// mutators
|
||||||
|
|
||||||
|
void makePath(String path) throws IOException;
|
||||||
|
|
||||||
|
void createData(String path, byte[] data, CreateMode mode) throws IOException;
|
||||||
|
|
||||||
|
void removeData(String path, int version) throws NoSuchElementException, IOException;
|
||||||
|
|
||||||
|
void setData(String path, byte[] data, int version) throws NoSuchElementException, IOException;
|
||||||
|
|
||||||
|
List<OpResult> multi(final Iterable<Op> ops) throws IOException;
|
||||||
|
|
||||||
|
// Solr-like methods
|
||||||
|
|
||||||
|
SolrResponse request(SolrRequest req) throws IOException;
|
||||||
|
|
||||||
|
HttpClient getHttpClient();
|
||||||
|
|
||||||
|
interface DistributedQueueFactory {
|
||||||
|
DistributedQueue makeQueue(String path) throws IOException;
|
||||||
|
void removeQueue(String path) throws IOException;
|
||||||
|
}
|
||||||
|
|
||||||
|
DistributedQueueFactory getDistributedQueueFactory();
|
||||||
}
|
}
|
||||||
|
|
|
@ -0,0 +1,118 @@
|
||||||
|
package org.apache.solr.client.solrj.cloud.autoscaling;
|
||||||
|
|
||||||
|
import java.io.IOException;
|
||||||
|
import java.net.ConnectException;
|
||||||
|
import java.util.Collection;
|
||||||
|
import java.util.List;
|
||||||
|
import java.util.Map;
|
||||||
|
import java.util.NoSuchElementException;
|
||||||
|
|
||||||
|
import org.apache.http.client.HttpClient;
|
||||||
|
import org.apache.solr.client.solrj.SolrRequest;
|
||||||
|
import org.apache.solr.client.solrj.SolrResponse;
|
||||||
|
import org.apache.solr.common.cloud.ClusterState;
|
||||||
|
import org.apache.zookeeper.CreateMode;
|
||||||
|
import org.apache.zookeeper.Op;
|
||||||
|
import org.apache.zookeeper.OpResult;
|
||||||
|
import org.apache.zookeeper.Watcher;
|
||||||
|
|
||||||
|
/**
|
||||||
|
*
|
||||||
|
*/
|
||||||
|
public class DelegatingClusterDataProvider implements ClusterDataProvider {
|
||||||
|
protected ClusterDataProvider delegate;
|
||||||
|
|
||||||
|
public DelegatingClusterDataProvider(ClusterDataProvider delegate) {
|
||||||
|
this.delegate = delegate;
|
||||||
|
}
|
||||||
|
|
||||||
|
@Override
|
||||||
|
public Map<String, Object> getNodeValues(String node, Collection<String> tags) {
|
||||||
|
return delegate.getNodeValues(node, tags);
|
||||||
|
}
|
||||||
|
|
||||||
|
@Override
|
||||||
|
public Map<String, Map<String, List<ReplicaInfo>>> getReplicaInfo(String node, Collection<String> keys) {
|
||||||
|
return delegate.getReplicaInfo(node, keys);
|
||||||
|
}
|
||||||
|
|
||||||
|
@Override
|
||||||
|
public Collection<String> getLiveNodes() {
|
||||||
|
return delegate.getLiveNodes();
|
||||||
|
}
|
||||||
|
|
||||||
|
@Override
|
||||||
|
public Map<String, Object> getClusterProperties() {
|
||||||
|
return delegate.getClusterProperties();
|
||||||
|
}
|
||||||
|
|
||||||
|
@Override
|
||||||
|
public ClusterState getClusterState() throws IOException {
|
||||||
|
return delegate.getClusterState();
|
||||||
|
}
|
||||||
|
|
||||||
|
@Override
|
||||||
|
public AutoScalingConfig getAutoScalingConfig(Watcher watcher) throws ConnectException, InterruptedException, IOException {
|
||||||
|
return delegate.getAutoScalingConfig(watcher);
|
||||||
|
}
|
||||||
|
|
||||||
|
@Override
|
||||||
|
public String getPolicyNameByCollection(String coll) {
|
||||||
|
return delegate.getPolicyNameByCollection(coll);
|
||||||
|
}
|
||||||
|
|
||||||
|
@Override
|
||||||
|
public boolean hasData(String path) throws IOException {
|
||||||
|
return delegate.hasData(path);
|
||||||
|
}
|
||||||
|
|
||||||
|
@Override
|
||||||
|
public List<String> listData(String path) throws NoSuchElementException, IOException {
|
||||||
|
return delegate.listData(path);
|
||||||
|
}
|
||||||
|
|
||||||
|
@Override
|
||||||
|
public VersionedData getData(String path, Watcher watcher) throws NoSuchElementException, IOException {
|
||||||
|
return delegate.getData(path, watcher);
|
||||||
|
}
|
||||||
|
|
||||||
|
@Override
|
||||||
|
public void makePath(String path) throws IOException {
|
||||||
|
delegate.makePath(path);
|
||||||
|
}
|
||||||
|
|
||||||
|
@Override
|
||||||
|
public void createData(String path, byte[] data, CreateMode mode) throws IOException {
|
||||||
|
delegate.createData(path, data, mode);
|
||||||
|
}
|
||||||
|
|
||||||
|
@Override
|
||||||
|
public void removeData(String path, int version) throws NoSuchElementException, IOException {
|
||||||
|
delegate.removeData(path, version);
|
||||||
|
}
|
||||||
|
|
||||||
|
@Override
|
||||||
|
public void setData(String path, byte[] data, int version) throws NoSuchElementException, IOException {
|
||||||
|
delegate.setData(path, data, version);
|
||||||
|
}
|
||||||
|
|
||||||
|
@Override
|
||||||
|
public List<OpResult> multi(Iterable<Op> ops) throws IOException {
|
||||||
|
return delegate.multi(ops);
|
||||||
|
}
|
||||||
|
|
||||||
|
@Override
|
||||||
|
public SolrResponse request(SolrRequest req) throws IOException {
|
||||||
|
return delegate.request(req);
|
||||||
|
}
|
||||||
|
|
||||||
|
@Override
|
||||||
|
public HttpClient getHttpClient() {
|
||||||
|
return delegate.getHttpClient();
|
||||||
|
}
|
||||||
|
|
||||||
|
@Override
|
||||||
|
public DistributedQueueFactory getDistributedQueueFactory() {
|
||||||
|
return delegate.getDistributedQueueFactory();
|
||||||
|
}
|
||||||
|
}
|
|
@ -201,7 +201,7 @@ public class Policy implements MapWriter {
|
||||||
}
|
}
|
||||||
|
|
||||||
Session(ClusterDataProvider dataProvider) {
|
Session(ClusterDataProvider dataProvider) {
|
||||||
this.nodes = new ArrayList<>(dataProvider.getNodes());
|
this.nodes = new ArrayList<>(dataProvider.getLiveNodes());
|
||||||
this.dataProvider = dataProvider;
|
this.dataProvider = dataProvider;
|
||||||
for (String node : nodes) {
|
for (String node : nodes) {
|
||||||
collections.addAll(dataProvider.getReplicaInfo(node, Collections.emptyList()).keySet());
|
collections.addAll(dataProvider.getReplicaInfo(node, Collections.emptyList()).keySet());
|
||||||
|
|
|
@ -49,22 +49,7 @@ public class PolicyHelper {
|
||||||
List<String> nodesList) {
|
List<String> nodesList) {
|
||||||
List<ReplicaPosition> positions = new ArrayList<>();
|
List<ReplicaPosition> positions = new ArrayList<>();
|
||||||
final ClusterDataProvider delegate = cdp;
|
final ClusterDataProvider delegate = cdp;
|
||||||
cdp = new ClusterDataProvider() {
|
cdp = new DelegatingClusterDataProvider(delegate) {
|
||||||
@Override
|
|
||||||
public Map<String, Object> getNodeValues(String node, Collection<String> tags) {
|
|
||||||
return delegate.getNodeValues(node, tags);
|
|
||||||
}
|
|
||||||
|
|
||||||
@Override
|
|
||||||
public Map<String, Map<String, List<ReplicaInfo>>> getReplicaInfo(String node, Collection<String> keys) {
|
|
||||||
return delegate.getReplicaInfo(node, keys);
|
|
||||||
}
|
|
||||||
|
|
||||||
@Override
|
|
||||||
public Collection<String> getNodes() {
|
|
||||||
return delegate.getNodes();
|
|
||||||
}
|
|
||||||
|
|
||||||
@Override
|
@Override
|
||||||
public String getPolicyNameByCollection(String coll) {
|
public String getPolicyNameByCollection(String coll) {
|
||||||
return policyMapping.get() != null && policyMapping.get().containsKey(coll) ?
|
return policyMapping.get() != null && policyMapping.get().containsKey(coll) ?
|
||||||
|
|
|
@ -46,7 +46,7 @@ public class Row implements MapWriter {
|
||||||
if (collectionVsShardVsReplicas == null) collectionVsShardVsReplicas = new HashMap<>();
|
if (collectionVsShardVsReplicas == null) collectionVsShardVsReplicas = new HashMap<>();
|
||||||
this.node = node;
|
this.node = node;
|
||||||
cells = new Cell[params.size()];
|
cells = new Cell[params.size()];
|
||||||
isLive = dataProvider.getNodes().contains(node);
|
isLive = dataProvider.getLiveNodes().contains(node);
|
||||||
Map<String, Object> vals = isLive ? dataProvider.getNodeValues(node, params) : Collections.emptyMap();
|
Map<String, Object> vals = isLive ? dataProvider.getNodeValues(node, params) : Collections.emptyMap();
|
||||||
for (int i = 0; i < params.size(); i++) {
|
for (int i = 0; i < params.size(); i++) {
|
||||||
String s = params.get(i);
|
String s = params.get(i);
|
||||||
|
|
|
@ -28,10 +28,15 @@ import java.util.HashMap;
|
||||||
import java.util.HashSet;
|
import java.util.HashSet;
|
||||||
import java.util.List;
|
import java.util.List;
|
||||||
import java.util.Map;
|
import java.util.Map;
|
||||||
|
import java.util.NoSuchElementException;
|
||||||
|
import java.util.Queue;
|
||||||
import java.util.Set;
|
import java.util.Set;
|
||||||
|
|
||||||
|
import org.apache.http.client.HttpClient;
|
||||||
import org.apache.solr.client.solrj.SolrRequest;
|
import org.apache.solr.client.solrj.SolrRequest;
|
||||||
|
import org.apache.solr.client.solrj.SolrResponse;
|
||||||
import org.apache.solr.client.solrj.SolrServerException;
|
import org.apache.solr.client.solrj.SolrServerException;
|
||||||
|
import org.apache.solr.client.solrj.cloud.autoscaling.AutoScalingConfig;
|
||||||
import org.apache.solr.client.solrj.cloud.autoscaling.ClusterDataProvider;
|
import org.apache.solr.client.solrj.cloud.autoscaling.ClusterDataProvider;
|
||||||
import org.apache.solr.client.solrj.cloud.autoscaling.ReplicaInfo;
|
import org.apache.solr.client.solrj.cloud.autoscaling.ReplicaInfo;
|
||||||
import org.apache.solr.client.solrj.request.GenericSolrRequest;
|
import org.apache.solr.client.solrj.request.GenericSolrRequest;
|
||||||
|
@ -40,6 +45,7 @@ import org.apache.solr.common.MapWriter;
|
||||||
import org.apache.solr.common.SolrException;
|
import org.apache.solr.common.SolrException;
|
||||||
import org.apache.solr.common.cloud.ClusterState;
|
import org.apache.solr.common.cloud.ClusterState;
|
||||||
import org.apache.solr.common.cloud.DocCollection;
|
import org.apache.solr.common.cloud.DocCollection;
|
||||||
|
import org.apache.solr.common.cloud.SolrZkClient;
|
||||||
import org.apache.solr.common.cloud.ZkStateReader;
|
import org.apache.solr.common.cloud.ZkStateReader;
|
||||||
import org.apache.solr.common.cloud.rule.ImplicitSnitch;
|
import org.apache.solr.common.cloud.rule.ImplicitSnitch;
|
||||||
import org.apache.solr.common.cloud.rule.RemoteCallback;
|
import org.apache.solr.common.cloud.rule.RemoteCallback;
|
||||||
|
@ -50,7 +56,12 @@ import org.apache.solr.common.params.SolrParams;
|
||||||
import org.apache.solr.common.util.NamedList;
|
import org.apache.solr.common.util.NamedList;
|
||||||
import org.apache.solr.common.util.StrUtils;
|
import org.apache.solr.common.util.StrUtils;
|
||||||
import org.apache.solr.common.util.Utils;
|
import org.apache.solr.common.util.Utils;
|
||||||
|
import org.apache.zookeeper.CreateMode;
|
||||||
import org.apache.zookeeper.KeeperException;
|
import org.apache.zookeeper.KeeperException;
|
||||||
|
import org.apache.zookeeper.Op;
|
||||||
|
import org.apache.zookeeper.OpResult;
|
||||||
|
import org.apache.zookeeper.Watcher;
|
||||||
|
import org.apache.zookeeper.data.Stat;
|
||||||
import org.slf4j.Logger;
|
import org.slf4j.Logger;
|
||||||
import org.slf4j.LoggerFactory;
|
import org.slf4j.LoggerFactory;
|
||||||
|
|
||||||
|
@ -63,16 +74,19 @@ public class SolrClientDataProvider implements ClusterDataProvider, MapWriter {
|
||||||
private static final Logger log = LoggerFactory.getLogger(MethodHandles.lookup().lookupClass());
|
private static final Logger log = LoggerFactory.getLogger(MethodHandles.lookup().lookupClass());
|
||||||
|
|
||||||
private final CloudSolrClient solrClient;
|
private final CloudSolrClient solrClient;
|
||||||
|
private final DistributedQueueFactory queueFactory;
|
||||||
|
private final ZkStateReader zkStateReader;
|
||||||
|
private final SolrZkClient zkClient;
|
||||||
private final Map<String, Map<String, Map<String, List<ReplicaInfo>>>> data = new HashMap<>();
|
private final Map<String, Map<String, Map<String, List<ReplicaInfo>>>> data = new HashMap<>();
|
||||||
private Set<String> liveNodes;
|
|
||||||
private Map<String, Object> snitchSession = new HashMap<>();
|
private Map<String, Object> snitchSession = new HashMap<>();
|
||||||
private Map<String, Map> nodeVsTags = new HashMap<>();
|
private Map<String, Map> nodeVsTags = new HashMap<>();
|
||||||
|
|
||||||
public SolrClientDataProvider(CloudSolrClient solrClient) {
|
public SolrClientDataProvider(DistributedQueueFactory queueFactory, CloudSolrClient solrClient) {
|
||||||
|
this.queueFactory = queueFactory;
|
||||||
this.solrClient = solrClient;
|
this.solrClient = solrClient;
|
||||||
ZkStateReader zkStateReader = solrClient.getZkStateReader();
|
this.zkStateReader = solrClient.getZkStateReader();
|
||||||
|
this.zkClient = zkStateReader.getZkClient();
|
||||||
ClusterState clusterState = zkStateReader.getClusterState();
|
ClusterState clusterState = zkStateReader.getClusterState();
|
||||||
this.liveNodes = clusterState.getLiveNodes();
|
|
||||||
Map<String, ClusterState.CollectionRef> all = clusterState.getCollectionStates();
|
Map<String, ClusterState.CollectionRef> all = clusterState.getCollectionStates();
|
||||||
all.forEach((collName, ref) -> {
|
all.forEach((collName, ref) -> {
|
||||||
DocCollection coll = ref.get();
|
DocCollection coll = ref.get();
|
||||||
|
@ -107,16 +121,135 @@ public class SolrClientDataProvider implements ClusterDataProvider, MapWriter {
|
||||||
}
|
}
|
||||||
|
|
||||||
@Override
|
@Override
|
||||||
public Collection<String> getNodes() {
|
public Collection<String> getLiveNodes() {
|
||||||
return liveNodes;
|
return solrClient.getZkStateReader().getClusterState().getLiveNodes();
|
||||||
}
|
}
|
||||||
|
|
||||||
@Override
|
@Override
|
||||||
public void writeMap(EntryWriter ew) throws IOException {
|
public void writeMap(EntryWriter ew) throws IOException {
|
||||||
ew.put("liveNodes", liveNodes);
|
ew.put("liveNodes", zkStateReader.getClusterState().getLiveNodes());
|
||||||
ew.put("replicaInfo", Utils.getDeepCopy(data, 5));
|
ew.put("replicaInfo", Utils.getDeepCopy(data, 5));
|
||||||
ew.put("nodeValues", nodeVsTags);
|
ew.put("nodeValues", nodeVsTags);
|
||||||
|
}
|
||||||
|
|
||||||
|
@Override
|
||||||
|
public Map<String, Object> getClusterProperties() {
|
||||||
|
return zkStateReader.getClusterProperties();
|
||||||
|
}
|
||||||
|
|
||||||
|
@Override
|
||||||
|
public ClusterState getClusterState() {
|
||||||
|
return zkStateReader.getClusterState();
|
||||||
|
}
|
||||||
|
|
||||||
|
@Override
|
||||||
|
public AutoScalingConfig getAutoScalingConfig(Watcher watcher) throws IOException {
|
||||||
|
try {
|
||||||
|
return zkStateReader.getAutoScalingConfig(watcher);
|
||||||
|
} catch (KeeperException | InterruptedException e) {
|
||||||
|
throw new IOException(e);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
@Override
|
||||||
|
public boolean hasData(String path) throws IOException {
|
||||||
|
try {
|
||||||
|
return zkClient.exists(path, true);
|
||||||
|
} catch (KeeperException | InterruptedException e) {
|
||||||
|
throw new IOException(e);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
@Override
|
||||||
|
public List<String> listData(String path) throws NoSuchElementException, IOException {
|
||||||
|
try {
|
||||||
|
return zkClient.getChildren(path, null, true);
|
||||||
|
} catch (KeeperException.NoNodeException e) {
|
||||||
|
throw new NoSuchElementException(path);
|
||||||
|
} catch (KeeperException | InterruptedException e) {
|
||||||
|
throw new IOException(e);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
@Override
|
||||||
|
public VersionedData getData(String path, Watcher watcher) throws NoSuchElementException, IOException {
|
||||||
|
Stat stat = new Stat();
|
||||||
|
try {
|
||||||
|
byte[] bytes = zkClient.getData(path, watcher, stat, true);
|
||||||
|
return new VersionedData(stat.getVersion(), bytes);
|
||||||
|
} catch (KeeperException.NoNodeException e) {
|
||||||
|
throw new NoSuchElementException(path);
|
||||||
|
} catch (KeeperException | InterruptedException e) {
|
||||||
|
throw new IOException(e);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
@Override
|
||||||
|
public void makePath(String path) throws IOException {
|
||||||
|
try {
|
||||||
|
zkClient.makePath(path, true);
|
||||||
|
} catch (KeeperException | InterruptedException e) {
|
||||||
|
throw new IOException(e);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
@Override
|
||||||
|
public void createData(String path, byte[] data, CreateMode mode) throws IOException {
|
||||||
|
try {
|
||||||
|
zkClient.create(path, data, mode, true);
|
||||||
|
} catch (KeeperException | InterruptedException e) {
|
||||||
|
throw new IOException(e);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
@Override
|
||||||
|
public void removeData(String path, int version) throws NoSuchElementException, IOException {
|
||||||
|
try {
|
||||||
|
zkClient.delete(path, version, true);
|
||||||
|
} catch (KeeperException.NoNodeException e) {
|
||||||
|
throw new NoSuchElementException(path);
|
||||||
|
} catch (KeeperException | InterruptedException e) {
|
||||||
|
throw new IOException(e);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
@Override
|
||||||
|
public void setData(String path, byte[] data, int version) throws NoSuchElementException, IOException {
|
||||||
|
try {
|
||||||
|
zkClient.setData(path, data, version, true);
|
||||||
|
} catch (KeeperException.NoNodeException e) {
|
||||||
|
throw new NoSuchElementException(path);
|
||||||
|
} catch (KeeperException | InterruptedException e) {
|
||||||
|
throw new IOException(e);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
@Override
|
||||||
|
public SolrResponse request(SolrRequest req) throws IOException {
|
||||||
|
try {
|
||||||
|
return req.process(solrClient);
|
||||||
|
} catch (SolrServerException e) {
|
||||||
|
throw new IOException(e);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
@Override
|
||||||
|
public List<OpResult> multi(Iterable<Op> ops) throws IOException {
|
||||||
|
try {
|
||||||
|
return zkClient.multi(ops, true);
|
||||||
|
} catch (Exception e) {
|
||||||
|
throw new IOException(e);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
@Override
|
||||||
|
public HttpClient getHttpClient() {
|
||||||
|
return solrClient.getHttpClient();
|
||||||
|
}
|
||||||
|
|
||||||
|
@Override
|
||||||
|
public DistributedQueueFactory getDistributedQueueFactory() {
|
||||||
|
return queueFactory;
|
||||||
}
|
}
|
||||||
|
|
||||||
static class ClientSnitchCtx
|
static class ClientSnitchCtx
|
||||||
|
|
|
@ -27,7 +27,6 @@ import java.util.HashMap;
|
||||||
import java.util.LinkedHashMap;
|
import java.util.LinkedHashMap;
|
||||||
import java.util.List;
|
import java.util.List;
|
||||||
import java.util.Map;
|
import java.util.Map;
|
||||||
import java.util.Objects;
|
|
||||||
|
|
||||||
import com.google.common.collect.ImmutableList;
|
import com.google.common.collect.ImmutableList;
|
||||||
import org.apache.solr.SolrTestCaseJ4;
|
import org.apache.solr.SolrTestCaseJ4;
|
||||||
|
@ -422,7 +421,7 @@ public class TestPolicy extends SolrTestCaseJ4 {
|
||||||
});
|
});
|
||||||
|
|
||||||
});
|
});
|
||||||
return new ClusterDataProvider(){
|
return new DelegatingClusterDataProvider(null) {
|
||||||
@Override
|
@Override
|
||||||
public Map<String, Object> getNodeValues(String node, Collection<String> tags) {
|
public Map<String, Object> getNodeValues(String node, Collection<String> tags) {
|
||||||
return (Map<String, Object>) Utils.getObjectByPath(m,false, Arrays.asList("nodeValues", node));
|
return (Map<String, Object>) Utils.getObjectByPath(m,false, Arrays.asList("nodeValues", node));
|
||||||
|
@ -434,7 +433,7 @@ public class TestPolicy extends SolrTestCaseJ4 {
|
||||||
}
|
}
|
||||||
|
|
||||||
@Override
|
@Override
|
||||||
public Collection<String> getNodes() {
|
public Collection<String> getLiveNodes() {
|
||||||
return (Collection<String>) m.get("liveNodes");
|
return (Collection<String>) m.get("liveNodes");
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@ -963,7 +962,7 @@ public class TestPolicy extends SolrTestCaseJ4 {
|
||||||
|
|
||||||
Policy policy = new Policy((Map<String, Object>) Utils.fromJSONString(autoscaleJson));
|
Policy policy = new Policy((Map<String, Object>) Utils.fromJSONString(autoscaleJson));
|
||||||
ClusterDataProvider clusterDataProvider = getClusterDataProvider(nodeValues, clusterState);
|
ClusterDataProvider clusterDataProvider = getClusterDataProvider(nodeValues, clusterState);
|
||||||
ClusterDataProvider cdp = new ClusterDataProvider() {
|
ClusterDataProvider cdp = new DelegatingClusterDataProvider(null) {
|
||||||
@Override
|
@Override
|
||||||
public Map<String, Object> getNodeValues(String node, Collection<String> tags) {
|
public Map<String, Object> getNodeValues(String node, Collection<String> tags) {
|
||||||
return clusterDataProvider.getNodeValues(node, tags);
|
return clusterDataProvider.getNodeValues(node, tags);
|
||||||
|
@ -975,8 +974,8 @@ public class TestPolicy extends SolrTestCaseJ4 {
|
||||||
}
|
}
|
||||||
|
|
||||||
@Override
|
@Override
|
||||||
public Collection<String> getNodes() {
|
public Collection<String> getLiveNodes() {
|
||||||
return clusterDataProvider.getNodes();
|
return clusterDataProvider.getLiveNodes();
|
||||||
}
|
}
|
||||||
|
|
||||||
@Override
|
@Override
|
||||||
|
@ -1041,7 +1040,7 @@ public class TestPolicy extends SolrTestCaseJ4 {
|
||||||
" 'freedisk':918005641216}}}");
|
" 'freedisk':918005641216}}}");
|
||||||
|
|
||||||
Policy policy = new Policy((Map<String, Object>) Utils.fromJSONString(autoscaleJson));
|
Policy policy = new Policy((Map<String, Object>) Utils.fromJSONString(autoscaleJson));
|
||||||
Policy.Session session = policy.createSession(new ClusterDataProvider() {
|
Policy.Session session = policy.createSession(new DelegatingClusterDataProvider(null) {
|
||||||
@Override
|
@Override
|
||||||
public Map<String, Object> getNodeValues(String node, Collection<String> tags) {
|
public Map<String, Object> getNodeValues(String node, Collection<String> tags) {
|
||||||
return tagsMap.get(node);
|
return tagsMap.get(node);
|
||||||
|
@ -1053,7 +1052,7 @@ public class TestPolicy extends SolrTestCaseJ4 {
|
||||||
}
|
}
|
||||||
|
|
||||||
@Override
|
@Override
|
||||||
public Collection<String> getNodes() {
|
public Collection<String> getLiveNodes() {
|
||||||
return replicaInfoMap.keySet();
|
return replicaInfoMap.keySet();
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@ -1099,7 +1098,7 @@ public class TestPolicy extends SolrTestCaseJ4 {
|
||||||
"}");
|
"}");
|
||||||
Policy policy = new Policy((Map<String, Object>) Utils.fromJSONString(rules));
|
Policy policy = new Policy((Map<String, Object>) Utils.fromJSONString(rules));
|
||||||
ClusterDataProvider clusterDataProvider = getClusterDataProvider(nodeValues, clusterState);
|
ClusterDataProvider clusterDataProvider = getClusterDataProvider(nodeValues, clusterState);
|
||||||
ClusterDataProvider cdp = new ClusterDataProvider() {
|
ClusterDataProvider cdp = new DelegatingClusterDataProvider(null) {
|
||||||
@Override
|
@Override
|
||||||
public Map<String, Object> getNodeValues(String node, Collection<String> tags) {
|
public Map<String, Object> getNodeValues(String node, Collection<String> tags) {
|
||||||
return clusterDataProvider.getNodeValues(node, tags);
|
return clusterDataProvider.getNodeValues(node, tags);
|
||||||
|
@ -1111,8 +1110,8 @@ public class TestPolicy extends SolrTestCaseJ4 {
|
||||||
}
|
}
|
||||||
|
|
||||||
@Override
|
@Override
|
||||||
public Collection<String> getNodes() {
|
public Collection<String> getLiveNodes() {
|
||||||
return clusterDataProvider.getNodes();
|
return clusterDataProvider.getLiveNodes();
|
||||||
}
|
}
|
||||||
|
|
||||||
@Override
|
@Override
|
||||||
|
@ -1131,7 +1130,7 @@ public class TestPolicy extends SolrTestCaseJ4 {
|
||||||
}
|
}
|
||||||
|
|
||||||
private ClusterDataProvider getClusterDataProvider(final Map<String, Map> nodeValues, String clusterState) {
|
private ClusterDataProvider getClusterDataProvider(final Map<String, Map> nodeValues, String clusterState) {
|
||||||
return new ClusterDataProvider() {
|
return new DelegatingClusterDataProvider(null) {
|
||||||
@Override
|
@Override
|
||||||
public Map<String, Object> getNodeValues(String node, Collection<String> tags) {
|
public Map<String, Object> getNodeValues(String node, Collection<String> tags) {
|
||||||
Map<String, Object> result = new LinkedHashMap<>();
|
Map<String, Object> result = new LinkedHashMap<>();
|
||||||
|
@ -1140,7 +1139,7 @@ public class TestPolicy extends SolrTestCaseJ4 {
|
||||||
}
|
}
|
||||||
|
|
||||||
@Override
|
@Override
|
||||||
public Collection<String> getNodes() {
|
public Collection<String> getLiveNodes() {
|
||||||
return nodeValues.keySet();
|
return nodeValues.keySet();
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@ -1168,7 +1167,7 @@ public class TestPolicy extends SolrTestCaseJ4 {
|
||||||
" '127.0.0.1:50096_solr':{" +
|
" '127.0.0.1:50096_solr':{" +
|
||||||
" 'cores':0," +
|
" 'cores':0," +
|
||||||
" 'port':'50096'}}");
|
" 'port':'50096'}}");
|
||||||
ClusterDataProvider dataProvider = new ClusterDataProvider() {
|
ClusterDataProvider dataProvider = new DelegatingClusterDataProvider(null) {
|
||||||
@Override
|
@Override
|
||||||
public Map<String, Object> getNodeValues(String node, Collection<String> keys) {
|
public Map<String, Object> getNodeValues(String node, Collection<String> keys) {
|
||||||
Map<String, Object> result = new LinkedHashMap<>();
|
Map<String, Object> result = new LinkedHashMap<>();
|
||||||
|
@ -1187,7 +1186,7 @@ public class TestPolicy extends SolrTestCaseJ4 {
|
||||||
}
|
}
|
||||||
|
|
||||||
@Override
|
@Override
|
||||||
public Collection<String> getNodes() {
|
public Collection<String> getLiveNodes() {
|
||||||
return Arrays.asList( "127.0.0.1:50097_solr", "127.0.0.1:50096_solr");
|
return Arrays.asList( "127.0.0.1:50097_solr", "127.0.0.1:50096_solr");
|
||||||
}
|
}
|
||||||
};
|
};
|
||||||
|
@ -1225,7 +1224,7 @@ public class TestPolicy extends SolrTestCaseJ4 {
|
||||||
"node4:{cores:0, freedisk: 900, heap:16900, nodeRole:overseer, sysprop.rack:rack2}" +
|
"node4:{cores:0, freedisk: 900, heap:16900, nodeRole:overseer, sysprop.rack:rack2}" +
|
||||||
"}");
|
"}");
|
||||||
|
|
||||||
ClusterDataProvider dataProvider = new ClusterDataProvider() {
|
ClusterDataProvider dataProvider = new DelegatingClusterDataProvider(null) {
|
||||||
@Override
|
@Override
|
||||||
public Map<String, Object> getNodeValues(String node, Collection<String> keys) {
|
public Map<String, Object> getNodeValues(String node, Collection<String> keys) {
|
||||||
Map<String, Object> result = new LinkedHashMap<>();
|
Map<String, Object> result = new LinkedHashMap<>();
|
||||||
|
@ -1244,7 +1243,7 @@ public class TestPolicy extends SolrTestCaseJ4 {
|
||||||
}
|
}
|
||||||
|
|
||||||
@Override
|
@Override
|
||||||
public Collection<String> getNodes() {
|
public Collection<String> getLiveNodes() {
|
||||||
return Arrays.asList("node1", "node2", "node3", "node4");
|
return Arrays.asList("node1", "node2", "node3", "node4");
|
||||||
}
|
}
|
||||||
};
|
};
|
||||||
|
|
Loading…
Reference in New Issue