HBASE-15429 Add split policy for busy regions
Signed-off-by: Gary Helmling <garyh@apache.org>
This commit is contained in:
parent
0bc9ad0628
commit
20cb390529
|
@ -322,8 +322,8 @@ possible configurations would overwhelm and obscure the important.
|
||||||
<value>org.apache.hadoop.hbase.regionserver.IncreasingToUpperBoundRegionSplitPolicy</value>
|
<value>org.apache.hadoop.hbase.regionserver.IncreasingToUpperBoundRegionSplitPolicy</value>
|
||||||
<description>
|
<description>
|
||||||
A split policy determines when a region should be split. The various other split policies that
|
A split policy determines when a region should be split. The various other split policies that
|
||||||
are available currently are ConstantSizeRegionSplitPolicy, DisabledRegionSplitPolicy,
|
are available currently are BusyRegionSplitPolicy, ConstantSizeRegionSplitPolicy,
|
||||||
DelimitedKeyPrefixRegionSplitPolicy, KeyPrefixRegionSplitPolicy etc.
|
DisabledRegionSplitPolicy, DelimitedKeyPrefixRegionSplitPolicy, KeyPrefixRegionSplitPolicy etc.
|
||||||
</description>
|
</description>
|
||||||
</property>
|
</property>
|
||||||
<property>
|
<property>
|
||||||
|
|
|
@ -0,0 +1,157 @@
|
||||||
|
/**
|
||||||
|
* Licensed to the Apache Software Foundation (ASF) under one
|
||||||
|
* or more contributor license agreements. See the NOTICE file
|
||||||
|
* distributed with this work for additional information
|
||||||
|
* regarding copyright ownership. The ASF licenses this file
|
||||||
|
* to you under the Apache License, Version 2.0 (the
|
||||||
|
* "License"); you may not use this file except in compliance
|
||||||
|
* with the License. You may obtain a copy of the License at
|
||||||
|
*
|
||||||
|
* http://www.apache.org/licenses/LICENSE-2.0
|
||||||
|
*
|
||||||
|
* Unless required by applicable law or agreed to in writing, software
|
||||||
|
* distributed under the License is distributed on an "AS IS" BASIS,
|
||||||
|
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||||
|
* See the License for the specific language governing permissions and
|
||||||
|
* limitations under the License.
|
||||||
|
*/
|
||||||
|
|
||||||
|
package org.apache.hadoop.hbase.regionserver;
|
||||||
|
|
||||||
|
import org.apache.commons.logging.Log;
|
||||||
|
import org.apache.commons.logging.LogFactory;
|
||||||
|
import org.apache.hadoop.conf.Configuration;
|
||||||
|
import org.apache.hadoop.hbase.HBaseInterfaceAudience;
|
||||||
|
import org.apache.hadoop.hbase.classification.InterfaceAudience;
|
||||||
|
import org.apache.hadoop.hbase.util.EnvironmentEdgeManager;
|
||||||
|
|
||||||
|
/**
|
||||||
|
* This class represents a split policy which makes the split decision based
|
||||||
|
* on how busy a region is. The metric that is used here is the fraction of
|
||||||
|
* total write requests that are blocked due to high memstore utilization.
|
||||||
|
* This fractional rate is calculated over a running window of
|
||||||
|
* "hbase.busy.policy.aggWindow" milliseconds. The rate is a time-weighted
|
||||||
|
* aggregated average of the rate in the current window and the
|
||||||
|
* true average rate in the previous window.
|
||||||
|
*
|
||||||
|
*/
|
||||||
|
|
||||||
|
@InterfaceAudience.LimitedPrivate(HBaseInterfaceAudience.CONFIG)
|
||||||
|
public class BusyRegionSplitPolicy extends IncreasingToUpperBoundRegionSplitPolicy {
|
||||||
|
|
||||||
|
private static final Log LOG = LogFactory.getLog(BusyRegionSplitPolicy.class);
|
||||||
|
|
||||||
|
// Maximum fraction blocked write requests before region is considered for split
|
||||||
|
private float maxBlockedRequests;
|
||||||
|
public static final float DEFAULT_MAX_BLOCKED_REQUESTS = 0.2f;
|
||||||
|
|
||||||
|
// Minimum age of the region in milliseconds before it is considered for split
|
||||||
|
private long minAge = -1;
|
||||||
|
public static final long DEFAULT_MIN_AGE_MS = 600000; // 10 minutes
|
||||||
|
|
||||||
|
// The window time in milliseconds over which the blocked requests rate is calculated
|
||||||
|
private long aggregationWindow;
|
||||||
|
public static final long DEFAULT_AGGREGATION_WINDOW = 300000; // 5 minutes
|
||||||
|
|
||||||
|
private HRegion region;
|
||||||
|
private long prevTime;
|
||||||
|
private long startTime;
|
||||||
|
private long writeRequestCount;
|
||||||
|
private long blockedRequestCount;
|
||||||
|
private float blockedRate;
|
||||||
|
|
||||||
|
@Override
|
||||||
|
protected void configureForRegion(final HRegion region) {
|
||||||
|
super.configureForRegion(region);
|
||||||
|
this.region = region;
|
||||||
|
Configuration conf = getConf();
|
||||||
|
|
||||||
|
maxBlockedRequests = conf.getFloat("hbase.busy.policy.blockedRequests",
|
||||||
|
DEFAULT_MAX_BLOCKED_REQUESTS);
|
||||||
|
minAge = conf.getLong("hbase.busy.policy.minAge", DEFAULT_MIN_AGE_MS);
|
||||||
|
aggregationWindow = conf.getLong("hbase.busy.policy.aggWindow",
|
||||||
|
DEFAULT_AGGREGATION_WINDOW);
|
||||||
|
|
||||||
|
if (maxBlockedRequests < 0.00001f || maxBlockedRequests > 0.99999f) {
|
||||||
|
LOG.warn("Threshold for maximum blocked requests is set too low or too high, "
|
||||||
|
+ " resetting to default of " + DEFAULT_MAX_BLOCKED_REQUESTS);
|
||||||
|
maxBlockedRequests = DEFAULT_MAX_BLOCKED_REQUESTS;
|
||||||
|
}
|
||||||
|
|
||||||
|
if (aggregationWindow <= 0) {
|
||||||
|
LOG.warn("Aggregation window size is too low: " + aggregationWindow
|
||||||
|
+ ". Resetting it to default of " + DEFAULT_AGGREGATION_WINDOW);
|
||||||
|
aggregationWindow = DEFAULT_AGGREGATION_WINDOW;
|
||||||
|
}
|
||||||
|
|
||||||
|
init();
|
||||||
|
}
|
||||||
|
|
||||||
|
private synchronized void init() {
|
||||||
|
startTime = EnvironmentEdgeManager.currentTime();
|
||||||
|
prevTime = startTime;
|
||||||
|
blockedRequestCount = region.getBlockedRequestsCount();
|
||||||
|
writeRequestCount = region.getWriteRequestsCount();
|
||||||
|
}
|
||||||
|
|
||||||
|
@Override
|
||||||
|
protected boolean shouldSplit() {
|
||||||
|
float blockedReqRate = updateRate();
|
||||||
|
if (super.shouldSplit()) {
|
||||||
|
return true;
|
||||||
|
}
|
||||||
|
|
||||||
|
if (EnvironmentEdgeManager.currentTime() < startTime + minAge) {
|
||||||
|
return false;
|
||||||
|
}
|
||||||
|
|
||||||
|
for (Store store: region.getStores()) {
|
||||||
|
if (!store.canSplit()) {
|
||||||
|
return false;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
if (blockedReqRate >= maxBlockedRequests) {
|
||||||
|
if (LOG.isDebugEnabled()) {
|
||||||
|
LOG.debug("Going to split region " + region.getRegionInfo().getRegionNameAsString()
|
||||||
|
+ " because it's too busy. Blocked Request rate: " + blockedReqRate);
|
||||||
|
}
|
||||||
|
return true;
|
||||||
|
}
|
||||||
|
|
||||||
|
return false;
|
||||||
|
}
|
||||||
|
|
||||||
|
/**
|
||||||
|
* Update the blocked request rate based on number of blocked and total write requests in the
|
||||||
|
* last aggregation window, or since last call to this method, whichever is farthest in time.
|
||||||
|
* Uses weighted rate calculation based on the previous rate and new data.
|
||||||
|
*
|
||||||
|
* @return Updated blocked request rate.
|
||||||
|
*/
|
||||||
|
private synchronized float updateRate() {
|
||||||
|
float aggBlockedRate;
|
||||||
|
long curTime = EnvironmentEdgeManager.currentTime();
|
||||||
|
|
||||||
|
long newBlockedReqs = region.getBlockedRequestsCount();
|
||||||
|
long newWriteReqs = region.getWriteRequestsCount();
|
||||||
|
|
||||||
|
aggBlockedRate =
|
||||||
|
(newBlockedReqs - blockedRequestCount) / (newWriteReqs - writeRequestCount + 0.00001f);
|
||||||
|
|
||||||
|
if (curTime - prevTime >= aggregationWindow) {
|
||||||
|
blockedRate = aggBlockedRate;
|
||||||
|
prevTime = curTime;
|
||||||
|
blockedRequestCount = newBlockedReqs;
|
||||||
|
writeRequestCount = newWriteReqs;
|
||||||
|
} else if (curTime - startTime >= aggregationWindow) {
|
||||||
|
// Calculate the aggregate blocked rate as the weighted sum of
|
||||||
|
// previous window's average blocked rate and blocked rate in this window so far.
|
||||||
|
float timeSlice = (curTime - prevTime) / (aggregationWindow + 0.0f);
|
||||||
|
aggBlockedRate = (1 - timeSlice) * blockedRate + timeSlice * aggBlockedRate;
|
||||||
|
} else {
|
||||||
|
aggBlockedRate = 0.0f;
|
||||||
|
}
|
||||||
|
return aggBlockedRate;
|
||||||
|
}
|
||||||
|
}
|
|
@ -34,6 +34,7 @@ import org.apache.hadoop.hbase.HRegionInfo;
|
||||||
import org.apache.hadoop.hbase.HTableDescriptor;
|
import org.apache.hadoop.hbase.HTableDescriptor;
|
||||||
import org.apache.hadoop.hbase.testclassification.SmallTests;
|
import org.apache.hadoop.hbase.testclassification.SmallTests;
|
||||||
import org.apache.hadoop.hbase.util.Bytes;
|
import org.apache.hadoop.hbase.util.Bytes;
|
||||||
|
import org.apache.hadoop.hbase.util.EnvironmentEdgeManager;
|
||||||
import org.junit.Before;
|
import org.junit.Before;
|
||||||
import org.junit.Test;
|
import org.junit.Test;
|
||||||
import org.junit.experimental.categories.Category;
|
import org.junit.experimental.categories.Category;
|
||||||
|
@ -147,6 +148,56 @@ public class TestRegionSplitPolicy {
|
||||||
assertWithinJitter(maxSplitSize, policy.getSizeToCheck(0));
|
assertWithinJitter(maxSplitSize, policy.getSizeToCheck(0));
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@Test
|
||||||
|
public void testBusyRegionSplitPolicy() throws Exception {
|
||||||
|
conf.set(HConstants.HBASE_REGION_SPLIT_POLICY_KEY,
|
||||||
|
BusyRegionSplitPolicy.class.getName());
|
||||||
|
conf.setLong("hbase.busy.policy.minAge", 1000000L);
|
||||||
|
conf.setFloat("hbase.busy.policy.blockedRequests", 0.1f);
|
||||||
|
|
||||||
|
RegionServerServices rss = Mockito.mock(RegionServerServices.class);
|
||||||
|
final List<Region> regions = new ArrayList<Region>();
|
||||||
|
Mockito.when(rss.getOnlineRegions(TABLENAME)).thenReturn(regions);
|
||||||
|
Mockito.when(mockRegion.getRegionServerServices()).thenReturn(rss);
|
||||||
|
Mockito.when(mockRegion.getBlockedRequestsCount()).thenReturn(0L);
|
||||||
|
Mockito.when(mockRegion.getWriteRequestsCount()).thenReturn(0L);
|
||||||
|
|
||||||
|
|
||||||
|
BusyRegionSplitPolicy policy =
|
||||||
|
(BusyRegionSplitPolicy)RegionSplitPolicy.create(mockRegion, conf);
|
||||||
|
|
||||||
|
Mockito.when(mockRegion.getBlockedRequestsCount()).thenReturn(10L);
|
||||||
|
Mockito.when(mockRegion.getWriteRequestsCount()).thenReturn(10L);
|
||||||
|
// Not enough time since region came online
|
||||||
|
assertFalse(policy.shouldSplit());
|
||||||
|
|
||||||
|
|
||||||
|
// Reset min age for split to zero
|
||||||
|
conf.setLong("hbase.busy.policy.minAge", 0L);
|
||||||
|
// Aggregate over 500 ms periods
|
||||||
|
conf.setLong("hbase.busy.policy.aggWindow", 500L);
|
||||||
|
policy =
|
||||||
|
(BusyRegionSplitPolicy)RegionSplitPolicy.create(mockRegion, conf);
|
||||||
|
long start = EnvironmentEdgeManager.currentTime();
|
||||||
|
Mockito.when(mockRegion.getBlockedRequestsCount()).thenReturn(10L);
|
||||||
|
Mockito.when(mockRegion.getWriteRequestsCount()).thenReturn(20L);
|
||||||
|
Thread.sleep(300);
|
||||||
|
assertFalse(policy.shouldSplit());
|
||||||
|
Mockito.when(mockRegion.getBlockedRequestsCount()).thenReturn(12L);
|
||||||
|
Mockito.when(mockRegion.getWriteRequestsCount()).thenReturn(30L);
|
||||||
|
Thread.sleep(2);
|
||||||
|
// Enough blocked requests since last time, but aggregate blocked request
|
||||||
|
// rate over last 500 ms is still low, because major portion of the window is constituted
|
||||||
|
// by the previous zero blocked request period which lasted at least 300 ms off last 500 ms.
|
||||||
|
if (EnvironmentEdgeManager.currentTime() - start < 500) {
|
||||||
|
assertFalse(policy.shouldSplit());
|
||||||
|
}
|
||||||
|
Mockito.when(mockRegion.getBlockedRequestsCount()).thenReturn(14L);
|
||||||
|
Mockito.when(mockRegion.getWriteRequestsCount()).thenReturn(40L);
|
||||||
|
Thread.sleep(200);
|
||||||
|
assertTrue(policy.shouldSplit());
|
||||||
|
}
|
||||||
|
|
||||||
private void assertWithinJitter(long maxSplitSize, long sizeToCheck) {
|
private void assertWithinJitter(long maxSplitSize, long sizeToCheck) {
|
||||||
assertTrue("Size greater than lower bound of jitter",
|
assertTrue("Size greater than lower bound of jitter",
|
||||||
(long)(maxSplitSize * 0.75) <= sizeToCheck);
|
(long)(maxSplitSize * 0.75) <= sizeToCheck);
|
||||||
|
|
Loading…
Reference in New Issue