mirror of https://github.com/apache/lucene.git
SOLR-14588: Implement Circuit Breakers (#1626)
* SOLR-14588: Implement Circuit Breakers This commit consists of two parts: add circuit breakers infrastructure and a "real" JVM heap memory based circuit breaker which monitors incoming search requests and rejects them with SERVICE_TOO_BUSY error if the defined threshold is breached, thus giving headroom to existing indexing and search requests to complete.
This commit is contained in:
parent
ccdfee2cf0
commit
3f9cc227f1
|
@ -12,6 +12,8 @@ New Features
|
||||||
---------------------
|
---------------------
|
||||||
* SOLR-14440: Introduce new Certificate Authentication Plugin to load Principal from certificate subject. (Mike Drob)
|
* SOLR-14440: Introduce new Certificate Authentication Plugin to load Principal from certificate subject. (Mike Drob)
|
||||||
|
|
||||||
|
* SOLR-14588: Introduce Circuit Breaker Infrastructure and a JVM heap usage memory tracking circuit breaker implementation (Atri Sharma)
|
||||||
|
|
||||||
Improvements
|
Improvements
|
||||||
----------------------
|
----------------------
|
||||||
* LUCENE-8984: MoreLikeThis MLT is biased for uncommon fields (Andy Hind via Anshum Gupta)
|
* LUCENE-8984: MoreLikeThis MLT is biased for uncommon fields (Andy Hind via Anshum Gupta)
|
||||||
|
|
|
@ -225,6 +225,11 @@ public class SolrConfig extends XmlConfigFile implements MapSerializable {
|
||||||
queryResultMaxDocsCached = getInt("query/queryResultMaxDocsCached", Integer.MAX_VALUE);
|
queryResultMaxDocsCached = getInt("query/queryResultMaxDocsCached", Integer.MAX_VALUE);
|
||||||
enableLazyFieldLoading = getBool("query/enableLazyFieldLoading", false);
|
enableLazyFieldLoading = getBool("query/enableLazyFieldLoading", false);
|
||||||
|
|
||||||
|
useCircuitBreakers = getBool("circuitBreaker/useCircuitBreakers", false);
|
||||||
|
memoryCircuitBreakerThresholdPct = getInt("circuitBreaker/memoryCircuitBreakerThresholdPct", 95);
|
||||||
|
|
||||||
|
validateMemoryBreakerThreshold();
|
||||||
|
|
||||||
useRangeVersionsForPeerSync = getBool("peerSync/useRangeVersions", true);
|
useRangeVersionsForPeerSync = getBool("peerSync/useRangeVersions", true);
|
||||||
|
|
||||||
filterCacheConfig = CacheConfig.getConfig(this, "query/filterCache");
|
filterCacheConfig = CacheConfig.getConfig(this, "query/filterCache");
|
||||||
|
@ -523,6 +528,10 @@ public class SolrConfig extends XmlConfigFile implements MapSerializable {
|
||||||
public final int queryResultMaxDocsCached;
|
public final int queryResultMaxDocsCached;
|
||||||
public final boolean enableLazyFieldLoading;
|
public final boolean enableLazyFieldLoading;
|
||||||
|
|
||||||
|
// Circuit Breaker Configuration
|
||||||
|
public final boolean useCircuitBreakers;
|
||||||
|
public final int memoryCircuitBreakerThresholdPct;
|
||||||
|
|
||||||
public final boolean useRangeVersionsForPeerSync;
|
public final boolean useRangeVersionsForPeerSync;
|
||||||
|
|
||||||
// IndexConfig settings
|
// IndexConfig settings
|
||||||
|
@ -804,6 +813,14 @@ public class SolrConfig extends XmlConfigFile implements MapSerializable {
|
||||||
loader.reloadLuceneSPI();
|
loader.reloadLuceneSPI();
|
||||||
}
|
}
|
||||||
|
|
||||||
|
private void validateMemoryBreakerThreshold() {
|
||||||
|
if (useCircuitBreakers) {
|
||||||
|
if (memoryCircuitBreakerThresholdPct > 95 || memoryCircuitBreakerThresholdPct < 50) {
|
||||||
|
throw new IllegalArgumentException("Valid value range of memoryCircuitBreakerThresholdPct is 50 - 95");
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
public int getMultipartUploadLimitKB() {
|
public int getMultipartUploadLimitKB() {
|
||||||
return multipartUploadLimitKB;
|
return multipartUploadLimitKB;
|
||||||
}
|
}
|
||||||
|
@ -873,6 +890,8 @@ public class SolrConfig extends XmlConfigFile implements MapSerializable {
|
||||||
m.put("queryResultMaxDocsCached", queryResultMaxDocsCached);
|
m.put("queryResultMaxDocsCached", queryResultMaxDocsCached);
|
||||||
m.put("enableLazyFieldLoading", enableLazyFieldLoading);
|
m.put("enableLazyFieldLoading", enableLazyFieldLoading);
|
||||||
m.put("maxBooleanClauses", booleanQueryMaxClauseCount);
|
m.put("maxBooleanClauses", booleanQueryMaxClauseCount);
|
||||||
|
m.put("useCircuitBreakers", useCircuitBreakers);
|
||||||
|
m.put("memoryCircuitBreakerThresholdPct", memoryCircuitBreakerThresholdPct);
|
||||||
for (SolrPluginInfo plugin : plugins) {
|
for (SolrPluginInfo plugin : plugins) {
|
||||||
List<PluginInfo> infos = getPluginInfos(plugin.clazz.getName());
|
List<PluginInfo> infos = getPluginInfos(plugin.clazz.getName());
|
||||||
if (infos == null || infos.isEmpty()) continue;
|
if (infos == null || infos.isEmpty()) continue;
|
||||||
|
|
|
@ -94,6 +94,7 @@ import org.apache.solr.common.util.IOUtils;
|
||||||
import org.apache.solr.common.util.NamedList;
|
import org.apache.solr.common.util.NamedList;
|
||||||
import org.apache.solr.common.util.ObjectReleaseTracker;
|
import org.apache.solr.common.util.ObjectReleaseTracker;
|
||||||
import org.apache.solr.common.util.SimpleOrderedMap;
|
import org.apache.solr.common.util.SimpleOrderedMap;
|
||||||
|
import org.apache.solr.common.util.SolrNamedThreadFactory;
|
||||||
import org.apache.solr.common.util.Utils;
|
import org.apache.solr.common.util.Utils;
|
||||||
import org.apache.solr.core.DirectoryFactory.DirContext;
|
import org.apache.solr.core.DirectoryFactory.DirContext;
|
||||||
import org.apache.solr.core.snapshots.SolrSnapshotManager;
|
import org.apache.solr.core.snapshots.SolrSnapshotManager;
|
||||||
|
@ -157,13 +158,13 @@ import org.apache.solr.update.processor.RunUpdateProcessorFactory;
|
||||||
import org.apache.solr.update.processor.UpdateRequestProcessorChain;
|
import org.apache.solr.update.processor.UpdateRequestProcessorChain;
|
||||||
import org.apache.solr.update.processor.UpdateRequestProcessorChain.ProcessorInfo;
|
import org.apache.solr.update.processor.UpdateRequestProcessorChain.ProcessorInfo;
|
||||||
import org.apache.solr.update.processor.UpdateRequestProcessorFactory;
|
import org.apache.solr.update.processor.UpdateRequestProcessorFactory;
|
||||||
import org.apache.solr.common.util.SolrNamedThreadFactory;
|
|
||||||
import org.apache.solr.util.IOFunction;
|
import org.apache.solr.util.IOFunction;
|
||||||
import org.apache.solr.util.NumberUtils;
|
import org.apache.solr.util.NumberUtils;
|
||||||
import org.apache.solr.util.PropertiesInputStream;
|
import org.apache.solr.util.PropertiesInputStream;
|
||||||
import org.apache.solr.util.PropertiesOutputStream;
|
import org.apache.solr.util.PropertiesOutputStream;
|
||||||
import org.apache.solr.util.RefCounted;
|
import org.apache.solr.util.RefCounted;
|
||||||
import org.apache.solr.util.TestInjection;
|
import org.apache.solr.util.TestInjection;
|
||||||
|
import org.apache.solr.util.circuitbreaker.CircuitBreakerManager;
|
||||||
import org.apache.solr.util.plugin.NamedListInitializedPlugin;
|
import org.apache.solr.util.plugin.NamedListInitializedPlugin;
|
||||||
import org.apache.solr.util.plugin.PluginInfoInitialized;
|
import org.apache.solr.util.plugin.PluginInfoInitialized;
|
||||||
import org.apache.solr.util.plugin.SolrCoreAware;
|
import org.apache.solr.util.plugin.SolrCoreAware;
|
||||||
|
@ -219,6 +220,8 @@ public final class SolrCore implements SolrInfoBean, Closeable {
|
||||||
private final Codec codec;
|
private final Codec codec;
|
||||||
private final MemClassLoader memClassLoader;
|
private final MemClassLoader memClassLoader;
|
||||||
|
|
||||||
|
private final CircuitBreakerManager circuitBreakerManager;
|
||||||
|
|
||||||
private final List<Runnable> confListeners = new CopyOnWriteArrayList<>();
|
private final List<Runnable> confListeners = new CopyOnWriteArrayList<>();
|
||||||
|
|
||||||
private final ReentrantLock ruleExpiryLock;
|
private final ReentrantLock ruleExpiryLock;
|
||||||
|
@ -938,6 +941,7 @@ public final class SolrCore implements SolrInfoBean, Closeable {
|
||||||
this.configSetProperties = configSet.getProperties();
|
this.configSetProperties = configSet.getProperties();
|
||||||
// Initialize the metrics manager
|
// Initialize the metrics manager
|
||||||
this.coreMetricManager = initCoreMetricManager(solrConfig);
|
this.coreMetricManager = initCoreMetricManager(solrConfig);
|
||||||
|
this.circuitBreakerManager = initCircuitBreakerManager();
|
||||||
solrMetricsContext = coreMetricManager.getSolrMetricsContext();
|
solrMetricsContext = coreMetricManager.getSolrMetricsContext();
|
||||||
this.coreMetricManager.loadReporters();
|
this.coreMetricManager.loadReporters();
|
||||||
|
|
||||||
|
@ -1164,6 +1168,12 @@ public final class SolrCore implements SolrInfoBean, Closeable {
|
||||||
return coreMetricManager;
|
return coreMetricManager;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
private CircuitBreakerManager initCircuitBreakerManager() {
|
||||||
|
CircuitBreakerManager circuitBreakerManager = CircuitBreakerManager.build(solrConfig);
|
||||||
|
|
||||||
|
return circuitBreakerManager;
|
||||||
|
}
|
||||||
|
|
||||||
@Override
|
@Override
|
||||||
public void initializeMetrics(SolrMetricsContext parentContext, String scope) {
|
public void initializeMetrics(SolrMetricsContext parentContext, String scope) {
|
||||||
newSearcherCounter = parentContext.counter("new", Category.SEARCHER.toString());
|
newSearcherCounter = parentContext.counter("new", Category.SEARCHER.toString());
|
||||||
|
@ -1499,6 +1509,10 @@ public final class SolrCore implements SolrInfoBean, Closeable {
|
||||||
return updateProcessors;
|
return updateProcessors;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
public CircuitBreakerManager getCircuitBreakerManager() {
|
||||||
|
return circuitBreakerManager;
|
||||||
|
}
|
||||||
|
|
||||||
// this core current usage count
|
// this core current usage count
|
||||||
private final AtomicInteger refCount = new AtomicInteger(1);
|
private final AtomicInteger refCount = new AtomicInteger(1);
|
||||||
|
|
||||||
|
|
|
@ -51,13 +51,17 @@ import org.apache.solr.security.AuthorizationContext;
|
||||||
import org.apache.solr.security.PermissionNameProvider;
|
import org.apache.solr.security.PermissionNameProvider;
|
||||||
import org.apache.solr.util.RTimerTree;
|
import org.apache.solr.util.RTimerTree;
|
||||||
import org.apache.solr.util.SolrPluginUtils;
|
import org.apache.solr.util.SolrPluginUtils;
|
||||||
|
import org.apache.solr.util.circuitbreaker.CircuitBreaker;
|
||||||
|
import org.apache.solr.util.circuitbreaker.CircuitBreakerManager;
|
||||||
import org.apache.solr.util.plugin.PluginInfoInitialized;
|
import org.apache.solr.util.plugin.PluginInfoInitialized;
|
||||||
import org.apache.solr.util.plugin.SolrCoreAware;
|
import org.apache.solr.util.plugin.SolrCoreAware;
|
||||||
import org.slf4j.Logger;
|
import org.slf4j.Logger;
|
||||||
import org.slf4j.LoggerFactory;
|
import org.slf4j.LoggerFactory;
|
||||||
|
|
||||||
import static org.apache.solr.common.params.CommonParams.DISTRIB;
|
import static org.apache.solr.common.params.CommonParams.DISTRIB;
|
||||||
|
import static org.apache.solr.common.params.CommonParams.FAILURE;
|
||||||
import static org.apache.solr.common.params.CommonParams.PATH;
|
import static org.apache.solr.common.params.CommonParams.PATH;
|
||||||
|
import static org.apache.solr.common.params.CommonParams.STATUS;
|
||||||
|
|
||||||
|
|
||||||
/**
|
/**
|
||||||
|
@ -297,6 +301,30 @@ public class SearchHandler extends RequestHandlerBase implements SolrCoreAware,
|
||||||
|
|
||||||
final RTimerTree timer = rb.isDebug() ? req.getRequestTimer() : null;
|
final RTimerTree timer = rb.isDebug() ? req.getRequestTimer() : null;
|
||||||
|
|
||||||
|
if (req.getCore().getSolrConfig().useCircuitBreakers) {
|
||||||
|
List<CircuitBreaker> trippedCircuitBreakers;
|
||||||
|
|
||||||
|
if (timer != null) {
|
||||||
|
RTimerTree subt = timer.sub("circuitbreaker");
|
||||||
|
rb.setTimer(subt);
|
||||||
|
|
||||||
|
CircuitBreakerManager circuitBreakerManager = req.getCore().getCircuitBreakerManager();
|
||||||
|
trippedCircuitBreakers = circuitBreakerManager.checkTripped();
|
||||||
|
|
||||||
|
rb.getTimer().stop();
|
||||||
|
} else {
|
||||||
|
CircuitBreakerManager circuitBreakerManager = req.getCore().getCircuitBreakerManager();
|
||||||
|
trippedCircuitBreakers = circuitBreakerManager.checkTripped();
|
||||||
|
}
|
||||||
|
|
||||||
|
if (trippedCircuitBreakers != null) {
|
||||||
|
String errorMessage = CircuitBreakerManager.toErrorMessage(trippedCircuitBreakers);
|
||||||
|
rsp.add(STATUS, FAILURE);
|
||||||
|
rsp.setException(new SolrException(SolrException.ErrorCode.SERVICE_UNAVAILABLE, "Circuit Breakers tripped " + errorMessage));
|
||||||
|
return;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
final ShardHandler shardHandler1 = getAndPrepShardHandler(req, rb); // creates a ShardHandler object only if it's needed
|
final ShardHandler shardHandler1 = getAndPrepShardHandler(req, rb); // creates a ShardHandler object only if it's needed
|
||||||
|
|
||||||
if (timer == null) {
|
if (timer == null) {
|
||||||
|
|
|
@ -0,0 +1,56 @@
|
||||||
|
/*
|
||||||
|
* Licensed to the Apache Software Foundation (ASF) under one or more
|
||||||
|
* contributor license agreements. See the NOTICE file distributed with
|
||||||
|
* this work for additional information regarding copyright ownership.
|
||||||
|
* The ASF licenses this file to You under the Apache License, Version 2.0
|
||||||
|
* (the "License"); you may not use this file except in compliance with
|
||||||
|
* the License. You may obtain a copy of the License at
|
||||||
|
*
|
||||||
|
* http://www.apache.org/licenses/LICENSE-2.0
|
||||||
|
*
|
||||||
|
* Unless required by applicable law or agreed to in writing, software
|
||||||
|
* distributed under the License is distributed on an "AS IS" BASIS,
|
||||||
|
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||||
|
* See the License for the specific language governing permissions and
|
||||||
|
* limitations under the License.
|
||||||
|
*/
|
||||||
|
|
||||||
|
package org.apache.solr.util.circuitbreaker;
|
||||||
|
|
||||||
|
import org.apache.solr.core.SolrConfig;
|
||||||
|
|
||||||
|
/**
|
||||||
|
* Default class to define circuit breakers for Solr.
|
||||||
|
* <p>
|
||||||
|
* There are two (typical) ways to use circuit breakers:
|
||||||
|
* 1. Have them checked at admission control by default (use CircuitBreakerManager for the same).
|
||||||
|
* 2. Use the circuit breaker in a specific code path(s).
|
||||||
|
*
|
||||||
|
* TODO: This class should be grown as the scope of circuit breakers grow.
|
||||||
|
* </p>
|
||||||
|
*/
|
||||||
|
public abstract class CircuitBreaker {
|
||||||
|
public static final String NAME = "circuitbreaker";
|
||||||
|
|
||||||
|
protected final SolrConfig solrConfig;
|
||||||
|
|
||||||
|
public CircuitBreaker(SolrConfig solrConfig) {
|
||||||
|
this.solrConfig = solrConfig;
|
||||||
|
}
|
||||||
|
|
||||||
|
// Global config for all circuit breakers. For specific circuit breaker configs, define
|
||||||
|
// your own config.
|
||||||
|
protected boolean isEnabled() {
|
||||||
|
return solrConfig.useCircuitBreakers;
|
||||||
|
}
|
||||||
|
|
||||||
|
/**
|
||||||
|
* Check if circuit breaker is tripped.
|
||||||
|
*/
|
||||||
|
public abstract boolean isTripped();
|
||||||
|
|
||||||
|
/**
|
||||||
|
* Get debug useful info.
|
||||||
|
*/
|
||||||
|
public abstract String getDebugInfo();
|
||||||
|
}
|
|
@ -0,0 +1,134 @@
|
||||||
|
/*
|
||||||
|
* Licensed to the Apache Software Foundation (ASF) under one or more
|
||||||
|
* contributor license agreements. See the NOTICE file distributed with
|
||||||
|
* this work for additional information regarding copyright ownership.
|
||||||
|
* The ASF licenses this file to You under the Apache License, Version 2.0
|
||||||
|
* (the "License"); you may not use this file except in compliance with
|
||||||
|
* the License. You may obtain a copy of the License at
|
||||||
|
*
|
||||||
|
* http://www.apache.org/licenses/LICENSE-2.0
|
||||||
|
*
|
||||||
|
* Unless required by applicable law or agreed to in writing, software
|
||||||
|
* distributed under the License is distributed on an "AS IS" BASIS,
|
||||||
|
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||||
|
* See the License for the specific language governing permissions and
|
||||||
|
* limitations under the License.
|
||||||
|
*/
|
||||||
|
|
||||||
|
package org.apache.solr.util.circuitbreaker;
|
||||||
|
|
||||||
|
import java.util.ArrayList;
|
||||||
|
import java.util.List;
|
||||||
|
|
||||||
|
import org.apache.solr.core.SolrConfig;
|
||||||
|
|
||||||
|
/**
|
||||||
|
* Manages all registered circuit breaker instances. Responsible for a holistic view
|
||||||
|
* of whether a circuit breaker has tripped or not.
|
||||||
|
*
|
||||||
|
* There are two typical ways of using this class's instance:
|
||||||
|
* 1. Check if any circuit breaker has triggered -- and know which circuit breaker has triggered.
|
||||||
|
* 2. Get an instance of a specific circuit breaker and perform checks.
|
||||||
|
*
|
||||||
|
* It is a good practice to register new circuit breakers here if you want them checked for every
|
||||||
|
* request.
|
||||||
|
*
|
||||||
|
* NOTE: The current way of registering new default circuit breakers is minimal and not a long term
|
||||||
|
* solution. There will be a follow up with a SIP for a schema API design.
|
||||||
|
*/
|
||||||
|
public class CircuitBreakerManager {
|
||||||
|
// Class private to potentially allow "family" of circuit breakers to be enabled or disabled
|
||||||
|
private final boolean enableCircuitBreakerManager;
|
||||||
|
|
||||||
|
private final List<CircuitBreaker> circuitBreakerList = new ArrayList<>();
|
||||||
|
|
||||||
|
public CircuitBreakerManager(final boolean enableCircuitBreakerManager) {
|
||||||
|
this.enableCircuitBreakerManager = enableCircuitBreakerManager;
|
||||||
|
}
|
||||||
|
|
||||||
|
public void register(CircuitBreaker circuitBreaker) {
|
||||||
|
circuitBreakerList.add(circuitBreaker);
|
||||||
|
}
|
||||||
|
|
||||||
|
public void deregisterAll() {
|
||||||
|
circuitBreakerList.clear();
|
||||||
|
}
|
||||||
|
/**
|
||||||
|
* Check and return circuit breakers that have triggered
|
||||||
|
* @return CircuitBreakers which have triggered, null otherwise.
|
||||||
|
*/
|
||||||
|
public List<CircuitBreaker> checkTripped() {
|
||||||
|
List<CircuitBreaker> triggeredCircuitBreakers = null;
|
||||||
|
|
||||||
|
if (enableCircuitBreakerManager) {
|
||||||
|
for (CircuitBreaker circuitBreaker : circuitBreakerList) {
|
||||||
|
if (circuitBreaker.isEnabled() &&
|
||||||
|
circuitBreaker.isTripped()) {
|
||||||
|
if (triggeredCircuitBreakers == null) {
|
||||||
|
triggeredCircuitBreakers = new ArrayList<>();
|
||||||
|
}
|
||||||
|
|
||||||
|
triggeredCircuitBreakers.add(circuitBreaker);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
return triggeredCircuitBreakers;
|
||||||
|
}
|
||||||
|
|
||||||
|
/**
|
||||||
|
* Returns true if *any* circuit breaker has triggered, false if none have triggered.
|
||||||
|
*
|
||||||
|
* <p>
|
||||||
|
* NOTE: This method short circuits the checking of circuit breakers -- the method will
|
||||||
|
* return as soon as it finds a circuit breaker that is enabled and has triggered.
|
||||||
|
* </p>
|
||||||
|
*/
|
||||||
|
public boolean checkAnyTripped() {
|
||||||
|
if (enableCircuitBreakerManager) {
|
||||||
|
for (CircuitBreaker circuitBreaker : circuitBreakerList) {
|
||||||
|
if (circuitBreaker.isEnabled() &&
|
||||||
|
circuitBreaker.isTripped()) {
|
||||||
|
return true;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
return false;
|
||||||
|
}
|
||||||
|
|
||||||
|
/**
|
||||||
|
* Construct the final error message to be printed when circuit breakers trip.
|
||||||
|
*
|
||||||
|
* @param circuitBreakerList Input list for circuit breakers.
|
||||||
|
* @return Constructed error message.
|
||||||
|
*/
|
||||||
|
public static String toErrorMessage(List<CircuitBreaker> circuitBreakerList) {
|
||||||
|
StringBuilder sb = new StringBuilder();
|
||||||
|
|
||||||
|
for (CircuitBreaker circuitBreaker : circuitBreakerList) {
|
||||||
|
sb.append(circuitBreaker.getClass().getName());
|
||||||
|
sb.append(" ");
|
||||||
|
sb.append(circuitBreaker.getDebugInfo());
|
||||||
|
sb.append("\n");
|
||||||
|
}
|
||||||
|
|
||||||
|
return sb.toString();
|
||||||
|
}
|
||||||
|
|
||||||
|
/**
|
||||||
|
* Register default circuit breakers and return a constructed CircuitBreakerManager
|
||||||
|
* instance which serves the given circuit breakers.
|
||||||
|
*
|
||||||
|
* Any default circuit breakers should be registered here.
|
||||||
|
*/
|
||||||
|
public static CircuitBreakerManager build(SolrConfig solrConfig) {
|
||||||
|
CircuitBreakerManager circuitBreakerManager = new CircuitBreakerManager(solrConfig.useCircuitBreakers);
|
||||||
|
|
||||||
|
// Install the default circuit breakers
|
||||||
|
CircuitBreaker memoryCircuitBreaker = new MemoryCircuitBreaker(solrConfig);
|
||||||
|
circuitBreakerManager.register(memoryCircuitBreaker);
|
||||||
|
|
||||||
|
return circuitBreakerManager;
|
||||||
|
}
|
||||||
|
}
|
|
@ -0,0 +1,114 @@
|
||||||
|
/*
|
||||||
|
* Licensed to the Apache Software Foundation (ASF) under one or more
|
||||||
|
* contributor license agreements. See the NOTICE file distributed with
|
||||||
|
* this work for additional information regarding copyright ownership.
|
||||||
|
* The ASF licenses this file to You under the Apache License, Version 2.0
|
||||||
|
* (the "License"); you may not use this file except in compliance with
|
||||||
|
* the License. You may obtain a copy of the License at
|
||||||
|
*
|
||||||
|
* http://www.apache.org/licenses/LICENSE-2.0
|
||||||
|
*
|
||||||
|
* Unless required by applicable law or agreed to in writing, software
|
||||||
|
* distributed under the License is distributed on an "AS IS" BASIS,
|
||||||
|
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||||
|
* See the License for the specific language governing permissions and
|
||||||
|
* limitations under the License.
|
||||||
|
*/
|
||||||
|
|
||||||
|
package org.apache.solr.util.circuitbreaker;
|
||||||
|
|
||||||
|
import java.lang.invoke.MethodHandles;
|
||||||
|
import java.lang.management.ManagementFactory;
|
||||||
|
import java.lang.management.MemoryMXBean;
|
||||||
|
|
||||||
|
import org.apache.solr.core.SolrConfig;
|
||||||
|
import org.slf4j.Logger;
|
||||||
|
import org.slf4j.LoggerFactory;
|
||||||
|
|
||||||
|
/**
|
||||||
|
* <p>
|
||||||
|
* Tracks the current JVM heap usage and triggers if it exceeds the defined percentage of the maximum
|
||||||
|
* heap size allocated to the JVM. This circuit breaker is a part of the default CircuitBreakerManager
|
||||||
|
* so is checked for every request -- hence it is realtime. Once the memory usage goes below the threshold,
|
||||||
|
* it will start allowing queries again.
|
||||||
|
* </p>
|
||||||
|
*
|
||||||
|
* <p>
|
||||||
|
* The memory threshold is defined as a percentage of the maximum memory allocated -- see memoryCircuitBreakerThresholdPct
|
||||||
|
* in solrconfig.xml.
|
||||||
|
* </p>
|
||||||
|
*/
|
||||||
|
|
||||||
|
public class MemoryCircuitBreaker extends CircuitBreaker {
|
||||||
|
private static final Logger log = LoggerFactory.getLogger(MethodHandles.lookup().lookupClass());
|
||||||
|
private static final MemoryMXBean MEMORY_MX_BEAN = ManagementFactory.getMemoryMXBean();
|
||||||
|
|
||||||
|
private final long heapMemoryThreshold;
|
||||||
|
|
||||||
|
// Assumption -- the value of these parameters will be set correctly before invoking getDebugInfo()
|
||||||
|
private final ThreadLocal<Long> seenMemory = new ThreadLocal<>();
|
||||||
|
private final ThreadLocal<Long> allowedMemory = new ThreadLocal<>();
|
||||||
|
|
||||||
|
public MemoryCircuitBreaker(SolrConfig solrConfig) {
|
||||||
|
super(solrConfig);
|
||||||
|
|
||||||
|
long currentMaxHeap = MEMORY_MX_BEAN.getHeapMemoryUsage().getMax();
|
||||||
|
|
||||||
|
if (currentMaxHeap <= 0) {
|
||||||
|
throw new IllegalArgumentException("Invalid JVM state for the max heap usage");
|
||||||
|
}
|
||||||
|
|
||||||
|
int thresholdValueInPercentage = solrConfig.memoryCircuitBreakerThresholdPct;
|
||||||
|
double thresholdInFraction = thresholdValueInPercentage / (double) 100;
|
||||||
|
heapMemoryThreshold = (long) (currentMaxHeap * thresholdInFraction);
|
||||||
|
|
||||||
|
if (heapMemoryThreshold <= 0) {
|
||||||
|
throw new IllegalStateException("Memory limit cannot be less than or equal to zero");
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
// TODO: An optimization can be to trip the circuit breaker for a duration of time
|
||||||
|
// after the circuit breaker condition is matched. This will optimize for per call
|
||||||
|
// overhead of calculating the condition parameters but can result in false positives.
|
||||||
|
@Override
|
||||||
|
public boolean isTripped() {
|
||||||
|
if (!isEnabled()) {
|
||||||
|
return false;
|
||||||
|
}
|
||||||
|
|
||||||
|
long localAllowedMemory = getCurrentMemoryThreshold();
|
||||||
|
long localSeenMemory = calculateLiveMemoryUsage();
|
||||||
|
|
||||||
|
allowedMemory.set(localAllowedMemory);
|
||||||
|
|
||||||
|
seenMemory.set(localSeenMemory);
|
||||||
|
|
||||||
|
return (localSeenMemory >= localAllowedMemory);
|
||||||
|
}
|
||||||
|
|
||||||
|
@Override
|
||||||
|
public String getDebugInfo() {
|
||||||
|
if (seenMemory.get() == 0L || allowedMemory.get() == 0L) {
|
||||||
|
log.warn("MemoryCircuitBreaker's monitored values (seenMemory, allowedMemory) not set");
|
||||||
|
}
|
||||||
|
|
||||||
|
return "seenMemory=" + seenMemory.get() + " allowedMemory=" + allowedMemory.get();
|
||||||
|
}
|
||||||
|
|
||||||
|
private long getCurrentMemoryThreshold() {
|
||||||
|
return heapMemoryThreshold;
|
||||||
|
}
|
||||||
|
|
||||||
|
/**
|
||||||
|
* Calculate the live memory usage for the system. This method has package visibility
|
||||||
|
* to allow using for testing.
|
||||||
|
* @return Memory usage in bytes.
|
||||||
|
*/
|
||||||
|
protected long calculateLiveMemoryUsage() {
|
||||||
|
// NOTE: MemoryUsageGaugeSet provides memory usage statistics but we do not use them
|
||||||
|
// here since it will require extra allocations and incur cost, hence it is cheaper to use
|
||||||
|
// MemoryMXBean directly. Ideally, this call should not add noticeable
|
||||||
|
// latency to a query -- but if it does, please signify on SOLR-14588
|
||||||
|
return MEMORY_MX_BEAN.getHeapMemoryUsage().getUsed();
|
||||||
|
}
|
||||||
|
}
|
|
@ -55,6 +55,8 @@
|
||||||
"queryResultMaxDocsCached":1,
|
"queryResultMaxDocsCached":1,
|
||||||
"enableLazyFieldLoading":1,
|
"enableLazyFieldLoading":1,
|
||||||
"boolTofilterOptimizer":1,
|
"boolTofilterOptimizer":1,
|
||||||
|
"useCircuitBreakers":10,
|
||||||
|
"memoryCircuitBreakerThresholdPct":20,
|
||||||
"maxBooleanClauses":1},
|
"maxBooleanClauses":1},
|
||||||
"jmx":{
|
"jmx":{
|
||||||
"agentId":0,
|
"agentId":0,
|
||||||
|
|
|
@ -0,0 +1,95 @@
|
||||||
|
<?xml version="1.0" ?>
|
||||||
|
|
||||||
|
<!--
|
||||||
|
Licensed to the Apache Software Foundation (ASF) under one or more
|
||||||
|
contributor license agreements. See the NOTICE file distributed with
|
||||||
|
this work for additional information regarding copyright ownership.
|
||||||
|
The ASF licenses this file to You under the Apache License, Version 2.0
|
||||||
|
(the "License"); you may not use this file except in compliance with
|
||||||
|
the License. You may obtain a copy of the License at
|
||||||
|
|
||||||
|
http://www.apache.org/licenses/LICENSE-2.0
|
||||||
|
|
||||||
|
Unless required by applicable law or agreed to in writing, software
|
||||||
|
distributed under the License is distributed on an "AS IS" BASIS,
|
||||||
|
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||||
|
See the License for the specific language governing permissions and
|
||||||
|
limitations under the License.
|
||||||
|
-->
|
||||||
|
|
||||||
|
<config>
|
||||||
|
<luceneMatchVersion>${tests.luceneMatchVersion:LATEST}</luceneMatchVersion>
|
||||||
|
<dataDir>${solr.data.dir:}</dataDir>
|
||||||
|
<xi:include href="solrconfig.snippet.randomindexconfig.xml" xmlns:xi="http://www.w3.org/2001/XInclude"/>
|
||||||
|
<directoryFactory name="DirectoryFactory" class="${solr.directoryFactory:solr.RAMDirectoryFactory}"/>
|
||||||
|
<schemaFactory class="ClassicIndexSchemaFactory"/>
|
||||||
|
<requestHandler name="/select" class="solr.SearchHandler" />
|
||||||
|
|
||||||
|
<query>
|
||||||
|
<!-- Maximum number of clauses in a boolean query... can affect
|
||||||
|
range or wildcard queries that expand to big boolean
|
||||||
|
queries. An exception is thrown if exceeded.
|
||||||
|
-->
|
||||||
|
<maxBooleanClauses>${solr.max.booleanClauses:1024}</maxBooleanClauses>
|
||||||
|
|
||||||
|
<!-- Cache specification for Filters or DocSets - unordered set of *all* documents
|
||||||
|
that match a particular query.
|
||||||
|
-->
|
||||||
|
<filterCache
|
||||||
|
enabled="${filterCache.enabled}"
|
||||||
|
size="512"
|
||||||
|
initialSize="512"
|
||||||
|
autowarmCount="2"/>
|
||||||
|
|
||||||
|
<queryResultCache
|
||||||
|
enabled="${queryResultCache.enabled}"
|
||||||
|
size="512"
|
||||||
|
initialSize="512"
|
||||||
|
autowarmCount="2"/>
|
||||||
|
|
||||||
|
<documentCache
|
||||||
|
enabled="${documentCache.enabled}"
|
||||||
|
size="512"
|
||||||
|
initialSize="512"
|
||||||
|
autowarmCount="0"/>
|
||||||
|
|
||||||
|
<cache
|
||||||
|
name="user_definied_cache_XXX"
|
||||||
|
enabled="${user_definied_cache_XXX.enabled:false}"
|
||||||
|
/>
|
||||||
|
<cache
|
||||||
|
name="user_definied_cache_ZZZ"
|
||||||
|
enabled="${user_definied_cache_ZZZ.enabled:false}"
|
||||||
|
/>
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
|
<!-- If true, stored fields that are not requested will be loaded lazily.
|
||||||
|
-->
|
||||||
|
<enableLazyFieldLoading>true</enableLazyFieldLoading>
|
||||||
|
|
||||||
|
<queryResultWindowSize>10</queryResultWindowSize>
|
||||||
|
|
||||||
|
<!-- boolToFilterOptimizer converts boolean clauses with zero boost
|
||||||
|
into cached filters if the number of docs selected by the clause exceeds
|
||||||
|
the threshold (represented as a fraction of the total index)
|
||||||
|
-->
|
||||||
|
<boolTofilterOptimizer enabled="false" cacheSize="32" threshold=".05"/>
|
||||||
|
|
||||||
|
</query>
|
||||||
|
|
||||||
|
<circuitBreaker>
|
||||||
|
|
||||||
|
<useCircuitBreakers>true</useCircuitBreakers>
|
||||||
|
|
||||||
|
<memoryCircuitBreakerThresholdPct>75</memoryCircuitBreakerThresholdPct>
|
||||||
|
|
||||||
|
</circuitBreaker>
|
||||||
|
|
||||||
|
<initParams path="/select">
|
||||||
|
<lst name="defaults">
|
||||||
|
<str name="df">text</str>
|
||||||
|
</lst>
|
||||||
|
</initParams>
|
||||||
|
|
||||||
|
</config>
|
|
@ -266,6 +266,8 @@ public class SolrCoreTest extends SolrTestCaseJ4 {
|
||||||
assertEquals("wrong config for maxBooleanClauses", 1024, solrConfig.booleanQueryMaxClauseCount);
|
assertEquals("wrong config for maxBooleanClauses", 1024, solrConfig.booleanQueryMaxClauseCount);
|
||||||
assertEquals("wrong config for enableLazyFieldLoading", true, solrConfig.enableLazyFieldLoading);
|
assertEquals("wrong config for enableLazyFieldLoading", true, solrConfig.enableLazyFieldLoading);
|
||||||
assertEquals("wrong config for queryResultWindowSize", 10, solrConfig.queryResultWindowSize);
|
assertEquals("wrong config for queryResultWindowSize", 10, solrConfig.queryResultWindowSize);
|
||||||
|
assertEquals("wrong config for useCircuitBreakers", false, solrConfig.useCircuitBreakers);
|
||||||
|
assertEquals("wrong config for memoryCircuitBreakerThresholdPct", 95, solrConfig.memoryCircuitBreakerThresholdPct);
|
||||||
}
|
}
|
||||||
|
|
||||||
/**
|
/**
|
||||||
|
|
|
@ -46,6 +46,8 @@ public class TestConfigOverlay extends SolrTestCase {
|
||||||
assertTrue(isEditableProp("query.queryResultMaxDocsCached", false, null));
|
assertTrue(isEditableProp("query.queryResultMaxDocsCached", false, null));
|
||||||
assertTrue(isEditableProp("query.enableLazyFieldLoading", false, null));
|
assertTrue(isEditableProp("query.enableLazyFieldLoading", false, null));
|
||||||
assertTrue(isEditableProp("query.boolTofilterOptimizer", false, null));
|
assertTrue(isEditableProp("query.boolTofilterOptimizer", false, null));
|
||||||
|
assertTrue(isEditableProp("query.useCircuitBreakers", false, null));
|
||||||
|
assertTrue(isEditableProp("query.memoryCircuitBreakerThresholdPct", false, null));
|
||||||
assertTrue(isEditableProp("jmx.agentId", false, null));
|
assertTrue(isEditableProp("jmx.agentId", false, null));
|
||||||
assertTrue(isEditableProp("jmx.serviceUrl", false, null));
|
assertTrue(isEditableProp("jmx.serviceUrl", false, null));
|
||||||
assertTrue(isEditableProp("jmx.rootName", false, null));
|
assertTrue(isEditableProp("jmx.rootName", false, null));
|
||||||
|
|
|
@ -0,0 +1,218 @@
|
||||||
|
/*
|
||||||
|
* Licensed to the Apache Software Foundation (ASF) under one or more
|
||||||
|
* contributor license agreements. See the NOTICE file distributed with
|
||||||
|
* this work for additional information regarding copyright ownership.
|
||||||
|
* The ASF licenses this file to You under the Apache License, Version 2.0
|
||||||
|
* (the "License"); you may not use this file except in compliance with
|
||||||
|
* the License. You may obtain a copy of the License at
|
||||||
|
*
|
||||||
|
* http://www.apache.org/licenses/LICENSE-2.0
|
||||||
|
*
|
||||||
|
* Unless required by applicable law or agreed to in writing, software
|
||||||
|
* distributed under the License is distributed on an "AS IS" BASIS,
|
||||||
|
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||||
|
* See the License for the specific language governing permissions and
|
||||||
|
* limitations under the License.
|
||||||
|
*/
|
||||||
|
|
||||||
|
package org.apache.solr.util;
|
||||||
|
|
||||||
|
import java.util.HashMap;
|
||||||
|
import java.util.concurrent.ExecutorService;
|
||||||
|
import java.util.concurrent.TimeUnit;
|
||||||
|
import java.util.concurrent.atomic.AtomicInteger;
|
||||||
|
|
||||||
|
import com.carrotsearch.randomizedtesting.rules.SystemPropertiesRestoreRule;
|
||||||
|
import org.apache.solr.SolrTestCaseJ4;
|
||||||
|
import org.apache.solr.common.SolrException;
|
||||||
|
import org.apache.solr.common.params.CommonParams;
|
||||||
|
import org.apache.solr.common.util.ExecutorUtil;
|
||||||
|
import org.apache.solr.common.util.SolrNamedThreadFactory;
|
||||||
|
import org.apache.solr.core.SolrConfig;
|
||||||
|
import org.apache.solr.search.QueryParsing;
|
||||||
|
import org.apache.solr.util.circuitbreaker.CircuitBreaker;
|
||||||
|
import org.apache.solr.util.circuitbreaker.MemoryCircuitBreaker;
|
||||||
|
import org.junit.After;
|
||||||
|
import org.junit.BeforeClass;
|
||||||
|
import org.junit.Rule;
|
||||||
|
import org.junit.rules.RuleChain;
|
||||||
|
import org.junit.rules.TestRule;
|
||||||
|
|
||||||
|
public class TestCircuitBreaker extends SolrTestCaseJ4 {
|
||||||
|
private final static int NUM_DOCS = 20;
|
||||||
|
|
||||||
|
@Rule
|
||||||
|
public TestRule solrTestRules = RuleChain.outerRule(new SystemPropertiesRestoreRule());
|
||||||
|
|
||||||
|
@BeforeClass
|
||||||
|
public static void setUpClass() throws Exception {
|
||||||
|
System.setProperty("filterCache.enabled", "false");
|
||||||
|
System.setProperty("queryResultCache.enabled", "false");
|
||||||
|
System.setProperty("documentCache.enabled", "true");
|
||||||
|
|
||||||
|
initCore("solrconfig-memory-circuitbreaker.xml", "schema.xml");
|
||||||
|
for (int i = 0 ; i < NUM_DOCS ; i ++) {
|
||||||
|
assertU(adoc("name", "john smith", "id", "1"));
|
||||||
|
assertU(adoc("name", "johathon smith", "id", "2"));
|
||||||
|
assertU(adoc("name", "john percival smith", "id", "3"));
|
||||||
|
assertU(adoc("id", "1", "title", "this is a title.", "inStock_b1", "true"));
|
||||||
|
assertU(adoc("id", "2", "title", "this is another title.", "inStock_b1", "true"));
|
||||||
|
assertU(adoc("id", "3", "title", "Mary had a little lamb.", "inStock_b1", "false"));
|
||||||
|
|
||||||
|
//commit inside the loop to get multiple segments to make search as realistic as possible
|
||||||
|
assertU(commit());
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
@Override
|
||||||
|
public void tearDown() throws Exception {
|
||||||
|
super.tearDown();
|
||||||
|
}
|
||||||
|
|
||||||
|
@After
|
||||||
|
public void after() {
|
||||||
|
h.getCore().getCircuitBreakerManager().deregisterAll();
|
||||||
|
}
|
||||||
|
|
||||||
|
public void testCBAlwaysTrips() {
|
||||||
|
HashMap<String, String> args = new HashMap<String, String>();
|
||||||
|
|
||||||
|
args.put(QueryParsing.DEFTYPE, CircuitBreaker.NAME);
|
||||||
|
args.put(CommonParams.FL, "id");
|
||||||
|
|
||||||
|
CircuitBreaker circuitBreaker = new MockCircuitBreaker(h.getCore().getSolrConfig());
|
||||||
|
|
||||||
|
h.getCore().getCircuitBreakerManager().register(circuitBreaker);
|
||||||
|
|
||||||
|
expectThrows(SolrException.class, () -> {
|
||||||
|
h.query(req("name:\"john smith\""));
|
||||||
|
});
|
||||||
|
}
|
||||||
|
|
||||||
|
public void testCBFakeMemoryPressure() {
|
||||||
|
HashMap<String, String> args = new HashMap<String, String>();
|
||||||
|
|
||||||
|
args.put(QueryParsing.DEFTYPE, CircuitBreaker.NAME);
|
||||||
|
args.put(CommonParams.FL, "id");
|
||||||
|
|
||||||
|
CircuitBreaker circuitBreaker = new FakeMemoryPressureCircuitBreaker(h.getCore().getSolrConfig());
|
||||||
|
|
||||||
|
h.getCore().getCircuitBreakerManager().register(circuitBreaker);
|
||||||
|
|
||||||
|
expectThrows(SolrException.class, () -> {
|
||||||
|
h.query(req("name:\"john smith\""));
|
||||||
|
});
|
||||||
|
}
|
||||||
|
|
||||||
|
public void testBuildingMemoryPressure() {
|
||||||
|
ExecutorService executor = ExecutorUtil.newMDCAwareCachedThreadPool(
|
||||||
|
new SolrNamedThreadFactory("TestCircuitBreaker"));
|
||||||
|
HashMap<String, String> args = new HashMap<String, String>();
|
||||||
|
|
||||||
|
args.put(QueryParsing.DEFTYPE, CircuitBreaker.NAME);
|
||||||
|
args.put(CommonParams.FL, "id");
|
||||||
|
|
||||||
|
AtomicInteger failureCount = new AtomicInteger();
|
||||||
|
|
||||||
|
try {
|
||||||
|
CircuitBreaker circuitBreaker = new BuildingUpMemoryPressureCircuitBreaker(h.getCore().getSolrConfig());
|
||||||
|
|
||||||
|
h.getCore().getCircuitBreakerManager().register(circuitBreaker);
|
||||||
|
|
||||||
|
for (int i = 0; i < 5; i++) {
|
||||||
|
executor.submit(() -> {
|
||||||
|
try {
|
||||||
|
h.query(req("name:\"john smith\""));
|
||||||
|
} catch (SolrException e) {
|
||||||
|
failureCount.incrementAndGet();
|
||||||
|
} catch (Exception e) {
|
||||||
|
throw new RuntimeException(e.getMessage());
|
||||||
|
}
|
||||||
|
});
|
||||||
|
}
|
||||||
|
|
||||||
|
executor.shutdown();
|
||||||
|
try {
|
||||||
|
executor.awaitTermination(Long.MAX_VALUE, TimeUnit.NANOSECONDS);
|
||||||
|
} catch (InterruptedException e) {
|
||||||
|
throw new RuntimeException(e.getMessage());
|
||||||
|
}
|
||||||
|
|
||||||
|
assertEquals("Number of failed queries is not correct", 1, failureCount.get());
|
||||||
|
} finally {
|
||||||
|
if (!executor.isShutdown()) {
|
||||||
|
executor.shutdown();
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
public void testResponseWithCBTiming() {
|
||||||
|
assertQ(req("q", "*:*", CommonParams.DEBUG_QUERY, "true"),
|
||||||
|
"//str[@name='rawquerystring']='*:*'",
|
||||||
|
"//str[@name='querystring']='*:*'",
|
||||||
|
"//str[@name='parsedquery']='MatchAllDocsQuery(*:*)'",
|
||||||
|
"//str[@name='parsedquery_toString']='*:*'",
|
||||||
|
"count(//lst[@name='explain']/*)=3",
|
||||||
|
"//lst[@name='explain']/str[@name='1']",
|
||||||
|
"//lst[@name='explain']/str[@name='2']",
|
||||||
|
"//lst[@name='explain']/str[@name='3']",
|
||||||
|
"//str[@name='QParser']",
|
||||||
|
"count(//lst[@name='timing']/*)=4",
|
||||||
|
"//lst[@name='timing']/double[@name='time']",
|
||||||
|
"count(//lst[@name='circuitbreaker']/*)>0",
|
||||||
|
"//lst[@name='circuitbreaker']/double[@name='time']",
|
||||||
|
"count(//lst[@name='prepare']/*)>0",
|
||||||
|
"//lst[@name='prepare']/double[@name='time']",
|
||||||
|
"count(//lst[@name='process']/*)>0",
|
||||||
|
"//lst[@name='process']/double[@name='time']"
|
||||||
|
);
|
||||||
|
}
|
||||||
|
|
||||||
|
private class MockCircuitBreaker extends CircuitBreaker {
|
||||||
|
|
||||||
|
public MockCircuitBreaker(SolrConfig solrConfig) {
|
||||||
|
super(solrConfig);
|
||||||
|
}
|
||||||
|
|
||||||
|
@Override
|
||||||
|
public boolean isTripped() {
|
||||||
|
// Always return true
|
||||||
|
return true;
|
||||||
|
}
|
||||||
|
|
||||||
|
@Override
|
||||||
|
public String getDebugInfo() {
|
||||||
|
return "MockCircuitBreaker";
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
private class FakeMemoryPressureCircuitBreaker extends MemoryCircuitBreaker {
|
||||||
|
|
||||||
|
public FakeMemoryPressureCircuitBreaker(SolrConfig solrConfig) {
|
||||||
|
super(solrConfig);
|
||||||
|
}
|
||||||
|
|
||||||
|
@Override
|
||||||
|
protected long calculateLiveMemoryUsage() {
|
||||||
|
// Return a number large enough to trigger a pushback from the circuit breaker
|
||||||
|
return Long.MAX_VALUE;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
private class BuildingUpMemoryPressureCircuitBreaker extends MemoryCircuitBreaker {
|
||||||
|
private AtomicInteger count = new AtomicInteger();
|
||||||
|
|
||||||
|
public BuildingUpMemoryPressureCircuitBreaker(SolrConfig solrConfig) {
|
||||||
|
super(solrConfig);
|
||||||
|
}
|
||||||
|
|
||||||
|
@Override
|
||||||
|
protected long calculateLiveMemoryUsage() {
|
||||||
|
if (count.getAndIncrement() >= 4) {
|
||||||
|
return Long.MAX_VALUE;
|
||||||
|
}
|
||||||
|
|
||||||
|
return 5; // Random number guaranteed to not trip the circuit breaker
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
|
@ -546,6 +546,44 @@
|
||||||
|
|
||||||
</query>
|
</query>
|
||||||
|
|
||||||
|
<!-- ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
|
||||||
|
Circuit Breaker Section - This section consists of configurations for
|
||||||
|
circuit breakers
|
||||||
|
~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ -->
|
||||||
|
<circuitBreaker>
|
||||||
|
<!-- Enable Circuit Breakers
|
||||||
|
|
||||||
|
Circuit breakers are designed to allow stability and predictable query
|
||||||
|
execution. They prevent operations that can take down the node and cause
|
||||||
|
noisy neighbour issues.
|
||||||
|
|
||||||
|
This flag is the uber control switch which controls the activation/deactivation of all circuit
|
||||||
|
breakers. At the moment, the only circuit breaker (max JVM circuit breaker) does not have its
|
||||||
|
own specific configuration. However, if a circuit breaker wishes to be independently configurable,
|
||||||
|
they are free to add their specific configuration but need to ensure that this flag is always
|
||||||
|
respected - this should have veto over all independent configuration flags.
|
||||||
|
-->
|
||||||
|
<useCircuitBreakers>false</useCircuitBreakers>
|
||||||
|
|
||||||
|
<!-- Memory Circuit Breaker Threshold In Percentage
|
||||||
|
|
||||||
|
Specific configuration for max JVM heap usage circuit breaker. This configuration defines the
|
||||||
|
threshold percentage of maximum heap allocated beyond which queries will be rejected until the
|
||||||
|
current JVM usage goes below the threshold. The valid value range for this parameter is 50 - 95.
|
||||||
|
|
||||||
|
Consider a scenario where the max heap allocated is 4 GB and memoryCircuitBreakerThresholdPct is
|
||||||
|
defined as 75. Threshold JVM usage will be 4 * 0.75 = 3 GB. Its generally a good idea to keep this value between 75 - 80% of maximum heap
|
||||||
|
allocated.
|
||||||
|
|
||||||
|
If, at any point, the current JVM heap usage goes above 3 GB, queries will be rejected until the heap usage goes below 3 GB again.
|
||||||
|
If you see queries getting rejected with 503 error code, check for "Circuit Breakers tripped"
|
||||||
|
in logs and the corresponding error message should tell you what transpired (if the failure
|
||||||
|
was caused by tripped circuit breakers).
|
||||||
|
-->
|
||||||
|
<memoryCircuitBreakerThresholdPct>100</memoryCircuitBreakerThresholdPct>
|
||||||
|
|
||||||
|
</circuitBreaker>
|
||||||
|
|
||||||
|
|
||||||
<!-- Request Dispatcher
|
<!-- Request Dispatcher
|
||||||
|
|
||||||
|
|
|
@ -513,6 +513,23 @@
|
||||||
-->
|
-->
|
||||||
<queryResultMaxDocsCached>200</queryResultMaxDocsCached>
|
<queryResultMaxDocsCached>200</queryResultMaxDocsCached>
|
||||||
|
|
||||||
|
<!-- Use Filter For Sorted Query
|
||||||
|
|
||||||
|
A possible optimization that attempts to use a filter to
|
||||||
|
satisfy a search. If the requested sort does not include
|
||||||
|
score, then the filterCache will be checked for a filter
|
||||||
|
matching the query. If found, the filter will be used as the
|
||||||
|
source of document ids, and then the sort will be applied to
|
||||||
|
that.
|
||||||
|
|
||||||
|
For most situations, this will not be useful unless you
|
||||||
|
frequently get the same search repeatedly with different sort
|
||||||
|
options, and none of them ever use "score"
|
||||||
|
-->
|
||||||
|
<!--
|
||||||
|
<useFilterForSortedQuery>true</useFilterForSortedQuery>
|
||||||
|
-->
|
||||||
|
|
||||||
<!-- Query Related Event Listeners
|
<!-- Query Related Event Listeners
|
||||||
|
|
||||||
Various IndexSearcher related events can trigger Listeners to
|
Various IndexSearcher related events can trigger Listeners to
|
||||||
|
@ -561,6 +578,48 @@
|
||||||
|
|
||||||
</query>
|
</query>
|
||||||
|
|
||||||
|
<!-- ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
|
||||||
|
Circuit Breaker Section - This section consists of configurations for
|
||||||
|
circuit breakers
|
||||||
|
~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ -->
|
||||||
|
<circuitBreaker>
|
||||||
|
<!-- Enable Circuit Breakers
|
||||||
|
|
||||||
|
Circuit breakers are designed to allow stability and predictable query
|
||||||
|
execution. They prevent operations that can take down the node and cause
|
||||||
|
noisy neighbour issues.
|
||||||
|
|
||||||
|
This flag is the uber control switch which controls the activation/deactivation of all circuit
|
||||||
|
breakers. At the moment, the only circuit breaker (max JVM circuit breaker) does not have its
|
||||||
|
own specific configuration. However, if a circuit breaker wishes to be independently configurable,
|
||||||
|
they are free to add their specific configuration but need to ensure that this flag is always
|
||||||
|
respected - this should have veto over all independent configuration flags.
|
||||||
|
-->
|
||||||
|
<!--
|
||||||
|
<useCircuitBreakers>true</useCircuitBreakers>
|
||||||
|
-->
|
||||||
|
|
||||||
|
<!-- Memory Circuit Breaker Threshold In Percentage
|
||||||
|
|
||||||
|
Specific configuration for max JVM heap usage circuit breaker. This configuration defines the
|
||||||
|
threshold percentage of maximum heap allocated beyond which queries will be rejected until the
|
||||||
|
current JVM usage goes below the threshold. The valid value range for this value is 50-95.
|
||||||
|
|
||||||
|
Consider a scenario where the max heap allocated is 4 GB and memoryCircuitBreakerThreshold is
|
||||||
|
defined as 75. Threshold JVM usage will be 4 * 0.75 = 3 GB. Its generally a good idea to keep this value between 75 - 80% of maximum heap
|
||||||
|
allocated.
|
||||||
|
|
||||||
|
If, at any point, the current JVM heap usage goes above 3 GB, queries will be rejected until the heap usage goes below 3 GB again.
|
||||||
|
If you see queries getting rejected with 503 error code, check for "Circuit Breakers tripped"
|
||||||
|
in logs and the corresponding error message should tell you what transpired (if the failure
|
||||||
|
was caused by tripped circuit breakers).
|
||||||
|
-->
|
||||||
|
<!--
|
||||||
|
<memoryCircuitBreakerThresholdPct>100</memoryCircuitBreakerThresholdPct>
|
||||||
|
-->
|
||||||
|
|
||||||
|
</circuitBreaker>
|
||||||
|
|
||||||
|
|
||||||
<!-- Request Dispatcher
|
<!-- Request Dispatcher
|
||||||
|
|
||||||
|
|
|
@ -600,6 +600,48 @@
|
||||||
|
|
||||||
</query>
|
</query>
|
||||||
|
|
||||||
|
<!-- ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
|
||||||
|
Circuit Breaker Section - This section consists of configurations for
|
||||||
|
circuit breakers
|
||||||
|
~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ -->
|
||||||
|
<circuitBreaker>
|
||||||
|
<!-- Enable Circuit Breakers
|
||||||
|
|
||||||
|
Circuit breakers are designed to allow stability and predictable query
|
||||||
|
execution. They prevent operations that can take down the node and cause
|
||||||
|
noisy neighbour issues.
|
||||||
|
|
||||||
|
This flag is the uber control switch which controls the activation/deactivation of all circuit
|
||||||
|
breakers. At the moment, the only circuit breaker (max JVM circuit breaker) does not have its
|
||||||
|
own specific configuration. However, if a circuit breaker wishes to be independently configurable,
|
||||||
|
they are free to add their specific configuration but need to ensure that this flag is always
|
||||||
|
respected - this should have veto over all independent configuration flags.
|
||||||
|
-->
|
||||||
|
<!--
|
||||||
|
<useCircuitBreakers>true</useCircuitBreakers>
|
||||||
|
-->
|
||||||
|
|
||||||
|
<!-- Memory Circuit Breaker Threshold In Percentage
|
||||||
|
|
||||||
|
Specific configuration for max JVM heap usage circuit breaker. This configuration defines the
|
||||||
|
threshold percentage of maximum heap allocated beyond which queries will be rejected until the
|
||||||
|
current JVM usage goes below the threshold. The valid value for this range is 50-95.
|
||||||
|
|
||||||
|
Consider a scenario where the max heap allocated is 4 GB and memoryCircuitBreakerThresholdPct is
|
||||||
|
defined as 75. Threshold JVM usage will be 4 * 0.75 = 3 GB. Its generally a good idea to keep this value between 75 - 80% of maximum heap
|
||||||
|
allocated.
|
||||||
|
|
||||||
|
If, at any point, the current JVM heap usage goes above 3 GB, queries will be rejected until the heap usage goes below 3 GB again.
|
||||||
|
If you see queries getting rejected with 503 error code, check for "Circuit Breakers tripped"
|
||||||
|
in logs and the corresponding error message should tell you what transpired (if the failure
|
||||||
|
was caused by tripped circuit breakers).
|
||||||
|
-->
|
||||||
|
<!--
|
||||||
|
<memoryCircuitBreakerThresholdPct>100</memoryCircuitBreakerThresholdPct>
|
||||||
|
-->
|
||||||
|
|
||||||
|
</circuitBreaker>
|
||||||
|
|
||||||
|
|
||||||
<!-- Request Dispatcher
|
<!-- Request Dispatcher
|
||||||
|
|
||||||
|
|
|
@ -0,0 +1,68 @@
|
||||||
|
= Circuit Breakers
|
||||||
|
// Licensed to the Apache Software Foundation (ASF) under one
|
||||||
|
// or more contributor license agreements. See the NOTICE file
|
||||||
|
// distributed with this work for additional information
|
||||||
|
// regarding copyright ownership. The ASF licenses this file
|
||||||
|
// to you under the Apache License, Version 2.0 (the
|
||||||
|
// "License"); you may not use this file except in compliance
|
||||||
|
// with the License. You may obtain a copy of the License at
|
||||||
|
//
|
||||||
|
// http://www.apache.org/licenses/LICENSE-2.0
|
||||||
|
//
|
||||||
|
// Unless required by applicable law or agreed to in writing,
|
||||||
|
// software distributed under the License is distributed on an
|
||||||
|
// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
|
||||||
|
// KIND, either express or implied. See the License for the
|
||||||
|
// specific language governing permissions and limitations
|
||||||
|
// under the License.
|
||||||
|
|
||||||
|
Solr's circuit breaker infrastructure allows prevention of actions that can cause a node to go beyond its capacity or to go down. The
|
||||||
|
premise of circuit breakers is to ensure a higher quality of service and only accept request loads that are serviceable in the current
|
||||||
|
resource configuration.
|
||||||
|
|
||||||
|
== When To Use Circuit Breakers
|
||||||
|
Circuit breakers should be used when the user wishes to trade request throughput for a higher Solr stability. If circuit breakers
|
||||||
|
are enabled, requests may be rejected under the condition of high node duress with an appropriate HTTP error code (typically 503).
|
||||||
|
|
||||||
|
It is up to the client to handle this error and potentially build a retrial logic as this should ideally be a transient situation.
|
||||||
|
|
||||||
|
== Circuit Breaker Configurations
|
||||||
|
The following flag controls the global activation/deactivation of circuit breakers. If this flag is disabled, all circuit breakers
|
||||||
|
will be disabled globally. Per circuit breaker configurations are specified in their respective sections later.
|
||||||
|
|
||||||
|
[source,xml]
|
||||||
|
----
|
||||||
|
<useCircuitBreakers>false</useCircuitBreakers>
|
||||||
|
----
|
||||||
|
|
||||||
|
== Currently Supported Circuit Breakers
|
||||||
|
|
||||||
|
=== JVM Heap Usage Based Circuit Breaker
|
||||||
|
This circuit breaker tracks JVM heap memory usage and rejects incoming search requests with a 503 error code if the heap usage
|
||||||
|
exceeds a configured percentage of maximum heap allocated to the JVM (-Xmx). The main configuration for this circuit breaker is
|
||||||
|
controlling the threshold percentage at which the breaker will trip.
|
||||||
|
|
||||||
|
It does not logically make sense to have a threshold below 50% and above 95% of the max heap allocated to the JVM. Hence, the range
|
||||||
|
of valid values for this parameter is [50, 95], both inclusive.
|
||||||
|
|
||||||
|
[source,xml]
|
||||||
|
----
|
||||||
|
<memoryCircuitBreakerThresholdPct>75</memoryCircuitBreakerThresholdPct>
|
||||||
|
----
|
||||||
|
|
||||||
|
Consider the following example:
|
||||||
|
|
||||||
|
JVM has been allocated a maximum heap of 5GB (-Xmx) and memoryCircuitBreakerThresholdPct is set to 75. In this scenario, the heap usage
|
||||||
|
at which the circuit breaker will trip is 3.75GB.
|
||||||
|
|
||||||
|
Note that this circuit breaker is checked for each incoming search request and considers the current heap usage of the node, i.e every search
|
||||||
|
request will get the live heap usage and compare it against the set memory threshold. The check does not impact performance,
|
||||||
|
but any performance regressions that are suspected to be caused by this feature should be reported to the dev list.
|
||||||
|
|
||||||
|
|
||||||
|
== Performance Considerations
|
||||||
|
It is worth noting that while JVM circuit breaker does not add any noticeable overhead per query, having too many
|
||||||
|
circuit breakers checked for a single request can cause a performance overhead.
|
||||||
|
|
||||||
|
In addition, it is a good practice to exponentially back off while retrying requests on a busy node.
|
||||||
|
|
|
@ -202,6 +202,13 @@ _Query Sizing and Warming_
|
||||||
* `query.queryResultWindowSize`
|
* `query.queryResultWindowSize`
|
||||||
* `query.queryResultMaxDocCached`
|
* `query.queryResultMaxDocCached`
|
||||||
|
|
||||||
|
_Query Circuit Breakers_
|
||||||
|
|
||||||
|
See <<circuit-breakers.adoc#circuit-breakers,Circuit Breakers in Solr>> for more details
|
||||||
|
|
||||||
|
* `query.useCircuitBreakers`
|
||||||
|
* `query.memoryCircuitBreakerThresholdPct`
|
||||||
|
|
||||||
*RequestDispatcher Settings*
|
*RequestDispatcher Settings*
|
||||||
|
|
||||||
See <<requestdispatcher-in-solrconfig.adoc#requestdispatcher-in-solrconfig,RequestDispatcher in SolrConfig>> for defaults and acceptable values for these settings.
|
See <<requestdispatcher-in-solrconfig.adoc#requestdispatcher-in-solrconfig,RequestDispatcher in SolrConfig>> for defaults and acceptable values for these settings.
|
||||||
|
|
|
@ -10,6 +10,7 @@
|
||||||
streaming-expressions, \
|
streaming-expressions, \
|
||||||
solrcloud, \
|
solrcloud, \
|
||||||
legacy-scaling-and-distribution, \
|
legacy-scaling-and-distribution, \
|
||||||
|
circuit-breakers, \
|
||||||
solr-plugins, \
|
solr-plugins, \
|
||||||
the-well-configured-solr-instance, \
|
the-well-configured-solr-instance, \
|
||||||
monitoring-solr, \
|
monitoring-solr, \
|
||||||
|
@ -121,6 +122,8 @@ The *<<getting-started.adoc#getting-started,Getting Started>>* section guides yo
|
||||||
*<<solrcloud.adoc#solrcloud,SolrCloud>>*: This section describes SolrCloud, which provides comprehensive distributed capabilities.
|
*<<solrcloud.adoc#solrcloud,SolrCloud>>*: This section describes SolrCloud, which provides comprehensive distributed capabilities.
|
||||||
|
|
||||||
*<<legacy-scaling-and-distribution.adoc#legacy-scaling-and-distribution,Legacy Scaling and Distribution>>*: This section tells you how to grow a Solr distribution by dividing a large index into sections called shards, which are then distributed across multiple servers, or by replicating a single index across multiple services.
|
*<<legacy-scaling-and-distribution.adoc#legacy-scaling-and-distribution,Legacy Scaling and Distribution>>*: This section tells you how to grow a Solr distribution by dividing a large index into sections called shards, which are then distributed across multiple servers, or by replicating a single index across multiple services.
|
||||||
|
|
||||||
|
*<<circuit-breakers.adoc#circuit-breakers,Circuit Breakers>>*: This section talks about circuit breakers, a way of allowing a higher stability of Solr nodes and increased service level guarantees of requests that are accepted by Solr.
|
||||||
****
|
****
|
||||||
|
|
||||||
.Advanced Configuration
|
.Advanced Configuration
|
||||||
|
|
|
@ -172,6 +172,26 @@ This parameter sets the maximum number of documents to cache for any entry in th
|
||||||
<queryResultMaxDocsCached>200</queryResultMaxDocsCached>
|
<queryResultMaxDocsCached>200</queryResultMaxDocsCached>
|
||||||
----
|
----
|
||||||
|
|
||||||
|
=== useCircuitBreakers
|
||||||
|
|
||||||
|
Global control flag for enabling circuit breakers.
|
||||||
|
|
||||||
|
[source,xml]
|
||||||
|
----
|
||||||
|
<useCircuitBreakers>true</useCircuitBreakers>
|
||||||
|
----
|
||||||
|
|
||||||
|
=== memoryCircuitBreakerThresholdPct
|
||||||
|
|
||||||
|
Memory threshold in percentage for JVM heap usage defined in percentage of maximum heap allocated
|
||||||
|
to the JVM (-Xmx). Ideally, this value should be in the range of 75-80% of maximum heap allocated
|
||||||
|
to the JVM.
|
||||||
|
|
||||||
|
[source,xml]
|
||||||
|
----
|
||||||
|
<memoryCircuitBreakerThresholdPct>75</memoryCircuitBreakerThresholdPct>
|
||||||
|
----
|
||||||
|
|
||||||
=== useColdSearcher
|
=== useColdSearcher
|
||||||
|
|
||||||
This setting controls whether search requests for which there is not a currently registered searcher should wait for a new searcher to warm up (false) or proceed immediately (true). When set to "false", requests will block until the searcher has warmed its caches.
|
This setting controls whether search requests for which there is not a currently registered searcher should wait for a new searcher to warm up (false) or proceed immediately (true). When set to "false", requests will block until the searcher has warmed its caches.
|
||||||
|
|
Loading…
Reference in New Issue