HBASE-20182 Can not locate region after split and merge
commit adc0e85e85 (parent a422310dad)
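
The problem: after a split followed by a merge, hbase:meta can still hold the row of the old split parent, and a reversed meta lookup that takes only the first row it finds will land on that parent and fail. Both locators are changed to scan hbase:meta in reverse and skip split-parent rows until a live region is found: the async path (AsyncNonMetaRegionLocator) moves from a one-row scanAll to a streaming scan driven by an AdvancedScanResultConsumer, and the blocking path (ConnectionImplementation.locateRegionInMeta) wraps its single next() call in a loop. A new TestSplitMerge covers the split-then-merge-then-locate sequence against both connection types.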

AsyncNonMetaRegionLocator.java

@@ -17,7 +17,6 @@
  */
 package org.apache.hadoop.hbase.client;
 
-import static org.apache.hadoop.hbase.HConstants.CATALOG_FAMILY;
 import static org.apache.hadoop.hbase.HConstants.NINES;
 import static org.apache.hadoop.hbase.HConstants.ZEROES;
 import static org.apache.hadoop.hbase.TableName.META_TABLE_NAME;
@@ -32,7 +31,6 @@ import java.util.Arrays;
 import java.util.HashSet;
 import java.util.Iterator;
 import java.util.LinkedHashMap;
-import java.util.List;
 import java.util.Map;
 import java.util.Optional;
 import java.util.Set;
@@ -41,13 +39,14 @@ import java.util.concurrent.ConcurrentHashMap;
 import java.util.concurrent.ConcurrentMap;
 import java.util.concurrent.ConcurrentNavigableMap;
 import java.util.concurrent.ConcurrentSkipListMap;
-
 import org.apache.hadoop.hbase.DoNotRetryIOException;
+import org.apache.hadoop.hbase.HConstants;
 import org.apache.hadoop.hbase.HRegionLocation;
 import org.apache.hadoop.hbase.MetaTableAccessor;
 import org.apache.hadoop.hbase.RegionLocations;
 import org.apache.hadoop.hbase.TableName;
 import org.apache.hadoop.hbase.TableNotFoundException;
+import org.apache.hadoop.hbase.client.Scan.ReadType;
 import org.apache.hadoop.hbase.util.Bytes;
 import org.apache.yetus.audience.InterfaceAudience;
 import org.slf4j.Logger;
@@ -269,26 +268,22 @@ class AsyncNonMetaRegionLocator {
     toSend.ifPresent(r -> locateInMeta(tableName, r));
   }
 
-  private void onScanComplete(TableName tableName, LocateRequest req, List<Result> results,
+  // return whether we should stop the scan
+  private boolean onScanNext(TableName tableName, LocateRequest req, Result result,
       Throwable error) {
     if (error != null) {
       complete(tableName, req, null, error);
-      return;
-    }
-    if (results.isEmpty()) {
-      complete(tableName, req, null, new TableNotFoundException(tableName));
-      return;
-    }
-    RegionLocations locs = MetaTableAccessor.getRegionLocations(results.get(0));
-    if (LOG.isDebugEnabled()) {
-      LOG.debug("The fetched location of '" + tableName + "', row='" +
-        Bytes.toStringBinary(req.row) + "', locateType=" + req.locateType + " is " + locs);
+      return true;
     }
+    RegionLocations locs = MetaTableAccessor.getRegionLocations(result);
+    LOG.debug("The fetched location of '{}', row='{}', locateType={} is {}", tableName,
+      Bytes.toStringBinary(req.row), req.locateType, locs);
+
     if (locs == null || locs.getDefaultRegionLocation() == null) {
       complete(tableName, req, null,
         new IOException(String.format("No location found for '%s', row='%s', locateType=%s",
           tableName, Bytes.toStringBinary(req.row), req.locateType)));
-      return;
+      return true;
     }
     HRegionLocation loc = locs.getDefaultRegionLocation();
     RegionInfo info = loc.getRegion();
@@ -296,33 +291,20 @@ class AsyncNonMetaRegionLocator {
       complete(tableName, req, null,
         new IOException(String.format("HRegionInfo is null for '%s', row='%s', locateType=%s",
           tableName, Bytes.toStringBinary(req.row), req.locateType)));
-      return;
+      return true;
     }
-    if (!info.getTable().equals(tableName)) {
-      complete(tableName, req, null, new TableNotFoundException(
-        "Table '" + tableName + "' was not found, got: '" + info.getTable() + "'"));
-      return;
-    }
-    if (info.isSplit()) {
-      complete(tableName, req, null,
-        new RegionOfflineException(
-          "the only available region for the required row is a split parent," +
-            " the daughters should be online soon: '" + info.getRegionNameAsString() + "'"));
-      return;
-    }
-    if (info.isOffline()) {
-      complete(tableName, req, null, new RegionOfflineException("the region is offline, could" +
-        " be caused by a disable table call: '" + info.getRegionNameAsString() + "'"));
-      return;
+    if (info.isSplitParent()) {
+      return false;
     }
     if (loc.getServerName() == null) {
       complete(tableName, req, null,
         new NoServerForRegionException(
           String.format("No server address listed for region '%s', row='%s', locateType=%s",
             info.getRegionNameAsString(), Bytes.toStringBinary(req.row), req.locateType)));
-      return;
+      return true;
     }
     complete(tableName, req, loc, null);
+    return true;
   }
 
   private HRegionLocation locateRowInCache(TableCache tableCache, TableName tableName, byte[] row) {
@@ -368,21 +350,49 @@ class AsyncNonMetaRegionLocator {
       LOG.trace("Try locate '" + tableName + "', row='" + Bytes.toStringBinary(req.row) +
         "', locateType=" + req.locateType + " in meta");
     }
-    byte[] metaKey;
+    byte[] metaStartKey;
     if (req.locateType.equals(RegionLocateType.BEFORE)) {
       if (isEmptyStopRow(req.row)) {
         byte[] binaryTableName = tableName.getName();
-        metaKey = Arrays.copyOf(binaryTableName, binaryTableName.length + 1);
+        metaStartKey = Arrays.copyOf(binaryTableName, binaryTableName.length + 1);
       } else {
-        metaKey = createRegionName(tableName, req.row, ZEROES, false);
+        metaStartKey = createRegionName(tableName, req.row, ZEROES, false);
       }
     } else {
-      metaKey = createRegionName(tableName, req.row, NINES, false);
+      metaStartKey = createRegionName(tableName, req.row, NINES, false);
     }
+    byte[] metaStopKey =
+      RegionInfo.createRegionName(tableName, HConstants.EMPTY_START_ROW, "", false);
     conn.getTable(META_TABLE_NAME)
-      .scanAll(new Scan().withStartRow(metaKey).setReversed(true).addFamily(CATALOG_FAMILY)
-        .setOneRowLimit())
-      .whenComplete((results, error) -> onScanComplete(tableName, req, results, error));
+      .scan(new Scan().withStartRow(metaStartKey).withStopRow(metaStopKey, true)
+        .addFamily(HConstants.CATALOG_FAMILY).setReversed(true).setCaching(5)
+        .setReadType(ReadType.PREAD), new AdvancedScanResultConsumer() {
+
+          private boolean completeNormally = false;
+
+          @Override
+          public void onError(Throwable error) {
+            onScanNext(tableName, req, null, error);
+          }
+
+          @Override
+          public void onComplete() {
+            if (!completeNormally) {
+              onScanNext(tableName, req, null, new TableNotFoundException(tableName));
+            }
+          }
+
+          @Override
+          public void onNext(Result[] results, ScanController controller) {
+            for (Result result : results) {
+              if (onScanNext(tableName, req, result, null)) {
+                completeNormally = true;
+                controller.terminate();
+                return;
+              }
+            }
+          }
+        });
   }
 
   private HRegionLocation locateInCache(TableCache tableCache, TableName tableName, byte[] row,
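
Condensed out of the hunks above, the async lookup now works like this: issue a small reversed PREAD scan over hbase:meta and stop at the first row whose region is not a split parent. The sketch below is not the patch itself — the CompletableFuture plumbing and the simplified error handling are my own, and the start/stop keys are taken as arguments — but the scan setup and the skip-the-parent check mirror the new code:

import static org.apache.hadoop.hbase.TableName.META_TABLE_NAME;

import java.io.IOException;
import java.util.concurrent.CompletableFuture;
import org.apache.hadoop.hbase.HConstants;
import org.apache.hadoop.hbase.HRegionLocation;
import org.apache.hadoop.hbase.MetaTableAccessor;
import org.apache.hadoop.hbase.RegionLocations;
import org.apache.hadoop.hbase.TableName;
import org.apache.hadoop.hbase.TableNotFoundException;
import org.apache.hadoop.hbase.client.AdvancedScanResultConsumer;
import org.apache.hadoop.hbase.client.AsyncConnection;
import org.apache.hadoop.hbase.client.RegionInfo;
import org.apache.hadoop.hbase.client.Result;
import org.apache.hadoop.hbase.client.Scan;
import org.apache.hadoop.hbase.client.Scan.ReadType;

class ReverseMetaLookupSketch {

  // Reverse-scan hbase:meta from metaStartKey down to metaStopKey and yield the
  // first location whose region is not a split parent (see HBASE-20182).
  static CompletableFuture<HRegionLocation> locate(AsyncConnection conn, TableName tableName,
      byte[] metaStartKey, byte[] metaStopKey) {
    CompletableFuture<HRegionLocation> future = new CompletableFuture<>();
    conn.getTable(META_TABLE_NAME).scan(
      new Scan().withStartRow(metaStartKey).withStopRow(metaStopKey, true)
        .addFamily(HConstants.CATALOG_FAMILY).setReversed(true).setCaching(5)
        .setReadType(ReadType.PREAD),
      new AdvancedScanResultConsumer() {

        @Override
        public void onNext(Result[] results, ScanController controller) {
          for (Result result : results) {
            RegionLocations locs = MetaTableAccessor.getRegionLocations(result);
            HRegionLocation loc = locs == null ? null : locs.getDefaultRegionLocation();
            if (loc == null || loc.getRegion() == null) {
              future.completeExceptionally(
                new IOException("No location found for '" + tableName + "'"));
              controller.terminate();
              return;
            }
            if (loc.getRegion().isSplitParent()) {
              // The parent row is still in meta; keep scanning backwards to an
              // earlier row, which holds the region that now covers this range.
              continue;
            }
            future.complete(loc);
            controller.terminate();
            return;
          }
        }

        @Override
        public void onError(Throwable error) {
          future.completeExceptionally(error);
        }

        @Override
        public void onComplete() {
          // The scan ran out of meta rows without producing a location.
          if (!future.isDone()) {
            future.completeExceptionally(new TableNotFoundException(tableName));
          }
        }
      });
    return future;
  }
}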

ConnectionImplementation.java

@@ -58,6 +58,7 @@ import org.apache.hadoop.hbase.TableName;
 import org.apache.hadoop.hbase.TableNotEnabledException;
 import org.apache.hadoop.hbase.TableNotFoundException;
 import org.apache.hadoop.hbase.ZooKeeperConnectionException;
+import org.apache.hadoop.hbase.client.Scan.ReadType;
 import org.apache.hadoop.hbase.client.backoff.ClientBackoffPolicy;
 import org.apache.hadoop.hbase.client.backoff.ClientBackoffPolicyFactory;
 import org.apache.hadoop.hbase.exceptions.ClientExceptionsUtil;
@@ -771,41 +772,34 @@ class ConnectionImplementation implements ClusterConnection, Closeable {
     return locations;
   }
 
-  /*
-   * Search the hbase:meta table for the HRegionLocation
-   * info that contains the table and row we're seeking.
+  /**
+   * Search the hbase:meta table for the HRegionLocation info that contains the table and row we're
+   * seeking.
    */
-  private RegionLocations locateRegionInMeta(TableName tableName, byte[] row,
-      boolean useCache, boolean retry, int replicaId) throws IOException {
-    // If we are supposed to be using the cache, look in the cache to see if
-    // we already have the region.
+  private RegionLocations locateRegionInMeta(TableName tableName, byte[] row, boolean useCache,
+      boolean retry, int replicaId) throws IOException {
+    // If we are supposed to be using the cache, look in the cache to see if we already have the
+    // region.
     if (useCache) {
       RegionLocations locations = getCachedLocation(tableName, row);
       if (locations != null && locations.getRegionLocation(replicaId) != null) {
         return locations;
       }
     }
 
     // build the key of the meta region we should be looking for.
     // the extra 9's on the end are necessary to allow "exact" matches
     // without knowing the precise region names.
     byte[] metaStartKey = RegionInfo.createRegionName(tableName, row, HConstants.NINES, false);
     byte[] metaStopKey =
       RegionInfo.createRegionName(tableName, HConstants.EMPTY_START_ROW, "", false);
-    Scan s = new Scan();
-    s.setReversed(true);
-    s.withStartRow(metaStartKey);
-    s.withStopRow(metaStopKey, true);
-    s.addFamily(HConstants.CATALOG_FAMILY);
+    Scan s = new Scan().withStartRow(metaStartKey).withStopRow(metaStopKey, true)
+      .addFamily(HConstants.CATALOG_FAMILY).setReversed(true).setCaching(5)
+      .setReadType(ReadType.PREAD);
 
     if (this.useMetaReplicas) {
       s.setConsistency(Consistency.TIMELINE);
     }
 
     int maxAttempts = (retry ? numTries : 1);
-    for (int tries = 0; true; tries++) {
+    for (int tries = 0; ; tries++) {
       if (tries >= maxAttempts) {
         throw new NoServerForRegionException("Unable to find region for "
           + Bytes.toStringBinary(row) + " in " + tableName + " after " + tries + " tries.");
@@ -821,7 +815,6 @@ class ConnectionImplementation implements ClusterConnection, Closeable {
         // We are only supposed to clean the cache for the specific replicaId
         metaCache.clearCache(tableName, row, replicaId);
       }
-
       // Query the meta region
       long pauseBase = this.pause;
       userRegionLock.lock();
@@ -832,60 +825,64 @@ class ConnectionImplementation implements ClusterConnection, Closeable {
           return locations;
         }
       }
-      Result regionInfoRow = null;
      s.resetMvccReadPoint();
-      s.setOneRowLimit();
      try (ReversedClientScanner rcs =
          new ReversedClientScanner(conf, s, TableName.META_TABLE_NAME, this, rpcCallerFactory,
            rpcControllerFactory, getMetaLookupPool(), metaReplicaCallTimeoutScanInMicroSecond)) {
-        regionInfoRow = rcs.next();
+        boolean tableNotFound = true;
+        for (;;) {
+          Result regionInfoRow = rcs.next();
+          if (regionInfoRow == null) {
+            if (tableNotFound) {
+              throw new TableNotFoundException(tableName);
+            } else {
+              throw new NoServerForRegionException(
+                "Unable to find region for " + Bytes.toStringBinary(row) + " in " + tableName);
+            }
+          }
+          tableNotFound = false;
+          // convert the row result into the HRegionLocation we need!
+          RegionLocations locations = MetaTableAccessor.getRegionLocations(regionInfoRow);
+          if (locations == null || locations.getRegionLocation(replicaId) == null) {
+            throw new IOException("RegionInfo null in " + tableName + ", row=" + regionInfoRow);
+          }
+          RegionInfo regionInfo = locations.getRegionLocation(replicaId).getRegion();
+          if (regionInfo == null) {
+            throw new IOException("RegionInfo null or empty in " + TableName.META_TABLE_NAME +
+              ", row=" + regionInfoRow);
+          }
+          // See HBASE-20182. It is possible that we locate to a split parent even after the
+          // children are online, so here we need to skip this region and go to the next one.
+          if (regionInfo.isSplitParent()) {
+            continue;
+          }
+          if (regionInfo.isOffline()) {
+            throw new RegionOfflineException("Region offline; disable table call? " +
+              regionInfo.getRegionNameAsString());
+          }
+          // It is possible that the split children have not been online yet and we have skipped
+          // the parent in the above condition, so we may have already reached a region which does
+          // not contains us.
+          if (!regionInfo.containsRow(row)) {
+            throw new NoServerForRegionException(
+              "Unable to find region for " + Bytes.toStringBinary(row) + " in " + tableName);
+          }
+          ServerName serverName = locations.getRegionLocation(replicaId).getServerName();
+          if (serverName == null) {
+            throw new NoServerForRegionException("No server address listed in " +
+              TableName.META_TABLE_NAME + " for region " + regionInfo.getRegionNameAsString() +
+              " containing row " + Bytes.toStringBinary(row));
+          }
+          if (isDeadServer(serverName)) {
+            throw new RegionServerStoppedException(
+              "hbase:meta says the region " + regionInfo.getRegionNameAsString() +
                " is managed by the server " + serverName + ", but it is dead.");
+          }
+          // Instantiate the location
+          cacheLocation(tableName, locations);
+          return locations;
+        }
      }
-
-      if (regionInfoRow == null) {
-        throw new TableNotFoundException(tableName);
-      }
-      // convert the row result into the HRegionLocation we need!
-      RegionLocations locations = MetaTableAccessor.getRegionLocations(regionInfoRow);
-      if (locations == null || locations.getRegionLocation(replicaId) == null) {
-        throw new IOException("RegionInfo null in " + tableName + ", row=" + regionInfoRow);
-      }
-      RegionInfo regionInfo = locations.getRegionLocation(replicaId).getRegion();
-      if (regionInfo == null) {
-        throw new IOException("RegionInfo null or empty in " +
-          TableName.META_TABLE_NAME + ", row=" + regionInfoRow);
-      }
-
-      // possible we got a region of a different table...
-      if (!regionInfo.getTable().equals(tableName)) {
-        throw new TableNotFoundException(
-          "Region of '" + regionInfo.getRegionNameAsString() + "' is expected in the table of '" + tableName + "', " +
-          "but hbase:meta says it is in the table of '" + regionInfo.getTable() + "'. " +
-          "hbase:meta might be damaged.");
-      }
-      if (regionInfo.isSplit()) {
-        throw new RegionOfflineException ("Region for row is a split parent, daughters not online: " +
-          regionInfo.getRegionNameAsString());
-      }
-      if (regionInfo.isOffline()) {
-        throw new RegionOfflineException("Region offline; disable table call? " +
-          regionInfo.getRegionNameAsString());
-      }
-
-      ServerName serverName = locations.getRegionLocation(replicaId).getServerName();
-      if (serverName == null) {
-        throw new NoServerForRegionException("No server address listed in "
-          + TableName.META_TABLE_NAME + " for region " + regionInfo.getRegionNameAsString()
-          + " containing row " + Bytes.toStringBinary(row));
-      }
-
-      if (isDeadServer(serverName)){
-        throw new RegionServerStoppedException("hbase:meta says the region "+
-          regionInfo.getRegionNameAsString()+" is managed by the server " + serverName +
-          ", but it is dead.");
-      }
-      // Instantiate the location
-      cacheLocation(tableName, locations);
-      return locations;
     } catch (TableNotFoundException e) {
       // if we got this error, probably means the table just plain doesn't
       // exist. rethrow the error immediately. this should always be coming
@@ -901,12 +898,8 @@ class ConnectionImplementation implements ClusterConnection, Closeable {
           pauseBase = this.pauseForCQTBE;
         }
         if (tries < maxAttempts - 1) {
-          if (LOG.isDebugEnabled()) {
-            LOG.debug("locateRegionInMeta parentTable=" + TableName.META_TABLE_NAME
-              + ", metaLocation=" + ", attempt=" + tries + " of " + maxAttempts
-              + " failed; retrying after sleep of "
-              + ConnectionUtils.getPauseTime(pauseBase, tries) + " because: " + e.getMessage());
-          }
+          LOG.debug("locateRegionInMeta parentTable='{}', attempt={} of {} failed; retrying " +
+            "after sleep of {}", TableName.META_TABLE_NAME, tries, maxAttempts, maxAttempts, e);
         } else {
           throw e;
         }
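
The probe keys both locators build rely on hbase:meta's row-key layout, `<table>,<region start key>,<region id>`: using HConstants.NINES ("99999999999999") as the id makes the probe sort after the meta row of every region of that table whose start key is at or before the sought row, and the new stop key pins the reversed scan inside the table. A small illustration (the table and row values here are made up; createRegionName is the same helper the patch calls):

import org.apache.hadoop.hbase.HConstants;
import org.apache.hadoop.hbase.TableName;
import org.apache.hadoop.hbase.client.RegionInfo;
import org.apache.hadoop.hbase.util.Bytes;

public class MetaProbeKeys {
  public static void main(String[] args) {
    TableName tn = TableName.valueOf("SplitMerge");
    // Start key of the reversed scan: sorts just after any meta row of
    // 'SplitMerge' whose region starts at or before "row-1".
    byte[] start = RegionInfo.createRegionName(tn, Bytes.toBytes("row-1"),
      HConstants.NINES, false);
    // Stop key: the lowest possible region name for the table, so the reversed
    // scan cannot walk past this table's rows into a neighboring table.
    byte[] stop =
      RegionInfo.createRegionName(tn, HConstants.EMPTY_START_ROW, "", false);
    System.out.println(Bytes.toStringBinary(start)); // SplitMerge,row-1,99999999999999
    System.out.println(Bytes.toStringBinary(stop));  // SplitMerge,,
  }
}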

TestSplitMerge.java (new file)

@@ -0,0 +1,106 @@
+/**
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements. See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership. The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+package org.apache.hadoop.hbase;
+
+import static org.junit.Assert.assertEquals;
+import static org.junit.Assert.assertNotNull;
+
+import java.util.concurrent.TimeUnit;
+import org.apache.hadoop.hbase.Waiter.ExplainingPredicate;
+import org.apache.hadoop.hbase.client.AsyncConnection;
+import org.apache.hadoop.hbase.client.ColumnFamilyDescriptorBuilder;
+import org.apache.hadoop.hbase.client.ConnectionFactory;
+import org.apache.hadoop.hbase.client.RegionInfo;
+import org.apache.hadoop.hbase.client.TableDescriptor;
+import org.apache.hadoop.hbase.client.TableDescriptorBuilder;
+import org.apache.hadoop.hbase.testclassification.MediumTests;
+import org.apache.hadoop.hbase.testclassification.MiscTests;
+import org.apache.hadoop.hbase.util.Bytes;
+import org.junit.AfterClass;
+import org.junit.BeforeClass;
+import org.junit.ClassRule;
+import org.junit.Test;
+import org.junit.experimental.categories.Category;
+
+@Category({ MiscTests.class, MediumTests.class })
+public class TestSplitMerge {
+
+  @ClassRule
+  public static final HBaseClassTestRule CLASS_RULE =
+    HBaseClassTestRule.forClass(TestSplitMerge.class);
+
+  private static final HBaseTestingUtility UTIL = new HBaseTestingUtility();
+
+  @BeforeClass
+  public static void setUp() throws Exception {
+    UTIL.getConfiguration().setInt(HConstants.HBASE_CLIENT_META_OPERATION_TIMEOUT, 1000);
+    UTIL.getConfiguration().setInt(HConstants.HBASE_CLIENT_RETRIES_NUMBER, 2);
+    UTIL.startMiniCluster(1);
+  }
+
+  @AfterClass
+  public static void tearDown() throws Exception {
+    UTIL.shutdownMiniCluster();
+  }
+
+  @Test
+  public void test() throws Exception {
+    TableName tableName = TableName.valueOf("SplitMerge");
+    byte[] family = Bytes.toBytes("CF");
+    TableDescriptor td = TableDescriptorBuilder.newBuilder(tableName)
+      .setColumnFamily(ColumnFamilyDescriptorBuilder.of(family)).build();
+    UTIL.getAdmin().createTable(td, new byte[][] { Bytes.toBytes(1) });
+    UTIL.waitTableAvailable(tableName);
+    UTIL.getAdmin().split(tableName, Bytes.toBytes(2));
+    UTIL.waitFor(30000, new ExplainingPredicate<Exception>() {
+
+      @Override
+      public boolean evaluate() throws Exception {
+        return UTIL.getMiniHBaseCluster().getRegions(tableName).size() == 3;
+      }
+
+      @Override
+      public String explainFailure() throws Exception {
+        return "Split has not finished yet";
+      }
+    });
+    RegionInfo regionA = null;
+    RegionInfo regionB = null;
+    for (RegionInfo region : UTIL.getAdmin().getRegions(tableName)) {
+      if (region.getStartKey().length == 0) {
+        regionA = region;
+      } else if (Bytes.equals(region.getStartKey(), Bytes.toBytes(1))) {
+        regionB = region;
+      }
+    }
+    assertNotNull(regionA);
+    assertNotNull(regionB);
+    UTIL.getAdmin().mergeRegionsAsync(regionA.getRegionName(), regionB.getRegionName(), false)
+      .get(30, TimeUnit.SECONDS);
+    assertEquals(2, UTIL.getAdmin().getRegions(tableName).size());
+
+    ServerName expected = UTIL.getMiniHBaseCluster().getRegionServer(0).getServerName();
+    assertEquals(expected, UTIL.getConnection().getRegionLocator(tableName)
+      .getRegionLocation(Bytes.toBytes(1), true).getServerName());
+    try (AsyncConnection asyncConn =
+      ConnectionFactory.createAsyncConnection(UTIL.getConfiguration()).get()) {
+      assertEquals(expected, asyncConn.getRegionLocator(tableName)
+        .getRegionLocation(Bytes.toBytes(1), true).get().getServerName());
+    }
+  }
+}
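
The test walks exactly the sequence from the bug report: create a table pre-split at key 1, split the upper region again at 2, wait until three regions are online, merge the first two regions back together, and then require that row 1 is located through the merged region — once through the blocking RegionLocator and once through an AsyncConnection, since the fix touches both paths. Before the fix, the reversed meta lookup could stop on the leftover split-parent row and fail.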

TestAsyncNonMetaRegionLocatorConcurrenyLimit.java

@@ -87,9 +87,9 @@ public class TestAsyncNonMetaRegionLocatorConcurrenyLimit {
     }
 
     @Override
-    public void preScannerOpen(ObserverContext<RegionCoprocessorEnvironment> e, Scan scan)
-        throws IOException {
-      if (e.getEnvironment().getRegionInfo().isMetaRegion()) {
+    public boolean preScannerNext(ObserverContext<RegionCoprocessorEnvironment> c,
+        InternalScanner s, List<Result> result, int limit, boolean hasNext) throws IOException {
+      if (c.getEnvironment().getRegionInfo().isMetaRegion()) {
         int concurrency = CONCURRENCY.incrementAndGet();
         for (;;) {
           int max = MAX_CONCURRENCY.get();
@@ -102,14 +102,16 @@ public class TestAsyncNonMetaRegionLocatorConcurrenyLimit {
         }
         Threads.sleepWithoutInterrupt(10);
       }
+      return hasNext;
     }
 
     @Override
-    public void postScannerClose(ObserverContext<RegionCoprocessorEnvironment> e, InternalScanner s)
-        throws IOException {
-      if (e.getEnvironment().getRegionInfo().isMetaRegion()) {
+    public boolean postScannerNext(ObserverContext<RegionCoprocessorEnvironment> c,
+        InternalScanner s, List<Result> result, int limit, boolean hasNext) throws IOException {
+      if (c.getEnvironment().getRegionInfo().isMetaRegion()) {
         CONCURRENCY.decrementAndGet();
       }
+      return hasNext;
     }
   }
 
@@ -119,7 +121,7 @@ public class TestAsyncNonMetaRegionLocatorConcurrenyLimit {
     conf.set(REGION_COPROCESSOR_CONF_KEY, CountingRegionObserver.class.getName());
     conf.setInt(MAX_CONCURRENT_LOCATE_REQUEST_PER_TABLE, MAX_ALLOWED);
     TEST_UTIL.startMiniCluster(3);
-    TEST_UTIL.getAdmin().setBalancerRunning(false, true);
+    TEST_UTIL.getAdmin().balancerSwitch(false, true);
     AsyncRegistry registry = AsyncRegistryFactory.getRegistry(TEST_UTIL.getConfiguration());
     CONN = new AsyncConnectionImpl(TEST_UTIL.getConfiguration(), registry,
       registry.getClusterId().get(), User.getCurrent());
@@ -142,14 +144,14 @@ public class TestAsyncNonMetaRegionLocatorConcurrenyLimit {
     for (int i = 0; i < futures.size(); i++) {
       HRegionLocation loc = futures.get(i).get();
       if (i == 0) {
-        assertTrue(isEmptyStartRow(loc.getRegionInfo().getStartKey()));
+        assertTrue(isEmptyStartRow(loc.getRegion().getStartKey()));
       } else {
-        assertEquals(String.format("%02x", i), Bytes.toString(loc.getRegionInfo().getStartKey()));
+        assertEquals(String.format("%02x", i), Bytes.toString(loc.getRegion().getStartKey()));
       }
       if (i == futures.size() - 1) {
-        assertTrue(isEmptyStopRow(loc.getRegionInfo().getEndKey()));
+        assertTrue(isEmptyStopRow(loc.getRegion().getEndKey()));
       } else {
-        assertEquals(String.format("%02x", i + 1), Bytes.toString(loc.getRegionInfo().getEndKey()));
+        assertEquals(String.format("%02x", i + 1), Bytes.toString(loc.getRegion().getEndKey()));
       }
     }
   }
@@ -161,6 +163,7 @@ public class TestAsyncNonMetaRegionLocatorConcurrenyLimit {
       .map(r -> LOCATOR.getRegionLocation(TABLE_NAME, r, RegionLocateType.CURRENT, false))
       .collect(toList());
     assertLocs(futures);
-    assertTrue(MAX_CONCURRENCY.get() <= MAX_ALLOWED);
+    assertTrue("max allowed is " + MAX_ALLOWED + " but actual is " + MAX_CONCURRENCY.get(),
+      MAX_CONCURRENCY.get() <= MAX_ALLOWED);
   }
 }
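
The churn in this test is mostly mechanical fallout from the patch: the concurrency counter moves from the scanner open/close hooks to the per-call preScannerNext/postScannerNext hooks — presumably because the locator now drives a real multi-row scan instead of a one-shot scanAll, though the commit does not spell that out — and the calls follow the renamed client APIs, getRegion() for getRegionInfo() and balancerSwitch() for setBalancerRunning(). The new assertion message just makes an overshoot of MAX_ALLOWED easier to diagnose.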