HBASE-22404 Open/Close region request may be executed twice when master restart
This commit is contained in:
parent
7878389669
commit
bdd2fc6149
|
@ -22,6 +22,7 @@ import java.io.IOException;
|
||||||
import java.lang.Thread.UncaughtExceptionHandler;
|
import java.lang.Thread.UncaughtExceptionHandler;
|
||||||
import java.util.HashSet;
|
import java.util.HashSet;
|
||||||
import java.util.List;
|
import java.util.List;
|
||||||
|
import java.util.Optional;
|
||||||
import java.util.Set;
|
import java.util.Set;
|
||||||
import java.util.concurrent.ConcurrentHashMap;
|
import java.util.concurrent.ConcurrentHashMap;
|
||||||
import java.util.concurrent.DelayQueue;
|
import java.util.concurrent.DelayQueue;
|
||||||
|
@ -232,8 +233,12 @@ public abstract class RemoteProcedureDispatcher<TEnv, TRemote extends Comparable
|
||||||
public interface RemoteProcedure<TEnv, TRemote> {
|
public interface RemoteProcedure<TEnv, TRemote> {
|
||||||
/**
|
/**
|
||||||
* For building the remote operation.
|
* For building the remote operation.
|
||||||
|
* May be empty if no need to send remote call. Usually, this means the RemoteProcedure has been
|
||||||
|
* finished already. This is possible, as we may have already sent the procedure to RS but then
|
||||||
|
* the rpc connection is broken so the executeProcedures call fails, but the RS does receive the
|
||||||
|
* procedure and execute it and then report back, before we retry again.
|
||||||
*/
|
*/
|
||||||
RemoteOperation remoteCallBuild(TEnv env, TRemote remote);
|
Optional<RemoteOperation> remoteCallBuild(TEnv env, TRemote remote);
|
||||||
|
|
||||||
/**
|
/**
|
||||||
* Called when the executeProcedure call is failed.
|
* Called when the executeProcedure call is failed.
|
||||||
|
@ -277,8 +282,8 @@ public abstract class RemoteProcedureDispatcher<TEnv, TRemote extends Comparable
|
||||||
final TRemote remote, final Set<RemoteProcedure> remoteProcedures) {
|
final TRemote remote, final Set<RemoteProcedure> remoteProcedures) {
|
||||||
final ArrayListMultimap<Class<?>, RemoteOperation> requestByType = ArrayListMultimap.create();
|
final ArrayListMultimap<Class<?>, RemoteOperation> requestByType = ArrayListMultimap.create();
|
||||||
for (RemoteProcedure proc : remoteProcedures) {
|
for (RemoteProcedure proc : remoteProcedures) {
|
||||||
RemoteOperation operation = proc.remoteCallBuild(env, remote);
|
Optional<RemoteOperation> operation = proc.remoteCallBuild(env, remote);
|
||||||
requestByType.put(operation.getClass(), operation);
|
operation.ifPresent(op -> requestByType.put(op.getClass(), op));
|
||||||
}
|
}
|
||||||
return requestByType;
|
return requestByType;
|
||||||
}
|
}
|
||||||
|
|
|
@ -18,6 +18,8 @@
|
||||||
package org.apache.hadoop.hbase.master.assignment;
|
package org.apache.hadoop.hbase.master.assignment;
|
||||||
|
|
||||||
import java.io.IOException;
|
import java.io.IOException;
|
||||||
|
import java.util.Optional;
|
||||||
|
|
||||||
import org.apache.hadoop.hbase.ServerName;
|
import org.apache.hadoop.hbase.ServerName;
|
||||||
import org.apache.hadoop.hbase.exceptions.UnexpectedStateException;
|
import org.apache.hadoop.hbase.exceptions.UnexpectedStateException;
|
||||||
import org.apache.hadoop.hbase.master.procedure.MasterProcedureEnv;
|
import org.apache.hadoop.hbase.master.procedure.MasterProcedureEnv;
|
||||||
|
@ -117,9 +119,9 @@ public class AssignProcedure extends RegionTransitionProcedure {
|
||||||
}
|
}
|
||||||
|
|
||||||
@Override
|
@Override
|
||||||
public RemoteOperation remoteCallBuild(final MasterProcedureEnv env,
|
public Optional<RemoteOperation> remoteCallBuild(final MasterProcedureEnv env,
|
||||||
final ServerName serverName) {
|
final ServerName serverName) {
|
||||||
return null;
|
return Optional.empty();
|
||||||
}
|
}
|
||||||
|
|
||||||
@Override
|
@Override
|
||||||
|
|
|
@ -61,7 +61,7 @@ public class CloseRegionProcedure extends RegionRemoteProcedureBase {
|
||||||
}
|
}
|
||||||
|
|
||||||
@Override
|
@Override
|
||||||
public RemoteOperation remoteCallBuild(MasterProcedureEnv env, ServerName remote) {
|
public RemoteOperation newRemoteOperation() {
|
||||||
return new RegionCloseOperation(this, region, getProcId(), assignCandidate);
|
return new RegionCloseOperation(this, region, getProcId(), assignCandidate);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
|
@ -57,7 +57,7 @@ public class OpenRegionProcedure extends RegionRemoteProcedureBase {
|
||||||
}
|
}
|
||||||
|
|
||||||
@Override
|
@Override
|
||||||
public RemoteOperation remoteCallBuild(MasterProcedureEnv env, ServerName remote) {
|
public RemoteOperation newRemoteOperation() {
|
||||||
return new RegionOpenOperation(this, region, getProcId());
|
return new RegionOpenOperation(this, region, getProcId());
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
|
@ -18,6 +18,8 @@
|
||||||
package org.apache.hadoop.hbase.master.assignment;
|
package org.apache.hadoop.hbase.master.assignment;
|
||||||
|
|
||||||
import java.io.IOException;
|
import java.io.IOException;
|
||||||
|
import java.util.Optional;
|
||||||
|
|
||||||
import org.apache.hadoop.hbase.HConstants;
|
import org.apache.hadoop.hbase.HConstants;
|
||||||
import org.apache.hadoop.hbase.ServerName;
|
import org.apache.hadoop.hbase.ServerName;
|
||||||
import org.apache.hadoop.hbase.TableName;
|
import org.apache.hadoop.hbase.TableName;
|
||||||
|
@ -32,6 +34,7 @@ import org.apache.hadoop.hbase.procedure2.ProcedureStateSerializer;
|
||||||
import org.apache.hadoop.hbase.procedure2.ProcedureSuspendedException;
|
import org.apache.hadoop.hbase.procedure2.ProcedureSuspendedException;
|
||||||
import org.apache.hadoop.hbase.procedure2.ProcedureUtil;
|
import org.apache.hadoop.hbase.procedure2.ProcedureUtil;
|
||||||
import org.apache.hadoop.hbase.procedure2.ProcedureYieldException;
|
import org.apache.hadoop.hbase.procedure2.ProcedureYieldException;
|
||||||
|
import org.apache.hadoop.hbase.procedure2.RemoteProcedureDispatcher;
|
||||||
import org.apache.hadoop.hbase.procedure2.RemoteProcedureDispatcher.RemoteProcedure;
|
import org.apache.hadoop.hbase.procedure2.RemoteProcedureDispatcher.RemoteProcedure;
|
||||||
import org.apache.hadoop.hbase.procedure2.RemoteProcedureException;
|
import org.apache.hadoop.hbase.procedure2.RemoteProcedureException;
|
||||||
import org.apache.hadoop.hbase.util.RetryCounter;
|
import org.apache.hadoop.hbase.util.RetryCounter;
|
||||||
|
@ -81,6 +84,19 @@ public abstract class RegionRemoteProcedureBase extends Procedure<MasterProcedur
|
||||||
parent.attachRemoteProc(this);
|
parent.attachRemoteProc(this);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@Override
|
||||||
|
public Optional<RemoteProcedureDispatcher.RemoteOperation> remoteCallBuild(MasterProcedureEnv env,
|
||||||
|
ServerName remote) {
|
||||||
|
// REPORT_SUCCEED means that this remote open/close request already executed in RegionServer.
|
||||||
|
// So return empty operation and RSProcedureDispatcher no need to send it again.
|
||||||
|
if (state == RegionRemoteProcedureBaseState.REGION_REMOTE_PROCEDURE_REPORT_SUCCEED) {
|
||||||
|
return Optional.empty();
|
||||||
|
}
|
||||||
|
return Optional.of(newRemoteOperation());
|
||||||
|
}
|
||||||
|
|
||||||
|
protected abstract RemoteProcedureDispatcher.RemoteOperation newRemoteOperation();
|
||||||
|
|
||||||
@Override
|
@Override
|
||||||
public void remoteOperationCompleted(MasterProcedureEnv env) {
|
public void remoteOperationCompleted(MasterProcedureEnv env) {
|
||||||
// should not be called since we use reportRegionStateTransition to report the result
|
// should not be called since we use reportRegionStateTransition to report the result
|
||||||
|
|
|
@ -18,6 +18,7 @@
|
||||||
package org.apache.hadoop.hbase.master.assignment;
|
package org.apache.hadoop.hbase.master.assignment;
|
||||||
|
|
||||||
import java.io.IOException;
|
import java.io.IOException;
|
||||||
|
import java.util.Optional;
|
||||||
import java.util.concurrent.atomic.AtomicBoolean;
|
import java.util.concurrent.atomic.AtomicBoolean;
|
||||||
import org.apache.hadoop.hbase.ServerName;
|
import org.apache.hadoop.hbase.ServerName;
|
||||||
import org.apache.hadoop.hbase.TableName;
|
import org.apache.hadoop.hbase.TableName;
|
||||||
|
@ -124,7 +125,8 @@ public abstract class RegionTransitionProcedure extends Procedure<MasterProcedur
|
||||||
TransitionCode code, long seqId) throws UnexpectedStateException;
|
TransitionCode code, long seqId) throws UnexpectedStateException;
|
||||||
|
|
||||||
@Override
|
@Override
|
||||||
public abstract RemoteOperation remoteCallBuild(MasterProcedureEnv env, ServerName serverName);
|
public abstract Optional<RemoteOperation> remoteCallBuild(MasterProcedureEnv env,
|
||||||
|
ServerName serverName);
|
||||||
|
|
||||||
protected abstract boolean remoteCallFailed(MasterProcedureEnv env, RegionStateNode regionNode,
|
protected abstract boolean remoteCallFailed(MasterProcedureEnv env, RegionStateNode regionNode,
|
||||||
IOException exception);
|
IOException exception);
|
||||||
|
|
|
@ -20,6 +20,8 @@
|
||||||
package org.apache.hadoop.hbase.master.assignment;
|
package org.apache.hadoop.hbase.master.assignment;
|
||||||
|
|
||||||
import java.io.IOException;
|
import java.io.IOException;
|
||||||
|
import java.util.Optional;
|
||||||
|
|
||||||
import org.apache.hadoop.hbase.ServerName;
|
import org.apache.hadoop.hbase.ServerName;
|
||||||
import org.apache.hadoop.hbase.exceptions.UnexpectedStateException;
|
import org.apache.hadoop.hbase.exceptions.UnexpectedStateException;
|
||||||
import org.apache.hadoop.hbase.master.procedure.MasterProcedureEnv;
|
import org.apache.hadoop.hbase.master.procedure.MasterProcedureEnv;
|
||||||
|
@ -126,9 +128,9 @@ public class UnassignProcedure extends RegionTransitionProcedure {
|
||||||
}
|
}
|
||||||
|
|
||||||
@Override
|
@Override
|
||||||
public RemoteOperation remoteCallBuild(final MasterProcedureEnv env,
|
public Optional<RemoteOperation> remoteCallBuild(final MasterProcedureEnv env,
|
||||||
final ServerName serverName) {
|
final ServerName serverName) {
|
||||||
return null;
|
return Optional.empty();
|
||||||
}
|
}
|
||||||
|
|
||||||
@Override
|
@Override
|
||||||
|
|
|
@ -19,6 +19,7 @@
|
||||||
package org.apache.hadoop.hbase.master.procedure;
|
package org.apache.hadoop.hbase.master.procedure;
|
||||||
|
|
||||||
import java.io.IOException;
|
import java.io.IOException;
|
||||||
|
import java.util.Optional;
|
||||||
|
|
||||||
import org.apache.hadoop.fs.Path;
|
import org.apache.hadoop.fs.Path;
|
||||||
import org.apache.hadoop.hbase.DoNotRetryIOException;
|
import org.apache.hadoop.hbase.DoNotRetryIOException;
|
||||||
|
@ -84,11 +85,12 @@ public class SplitWALRemoteProcedure extends ServerRemoteProcedure
|
||||||
}
|
}
|
||||||
|
|
||||||
@Override
|
@Override
|
||||||
public RemoteProcedureDispatcher.RemoteOperation remoteCallBuild(MasterProcedureEnv env,
|
public Optional<RemoteProcedureDispatcher.RemoteOperation> remoteCallBuild(MasterProcedureEnv env,
|
||||||
ServerName serverName) {
|
ServerName serverName) {
|
||||||
return new RSProcedureDispatcher.ServerOperation(this, getProcId(), SplitWALCallable.class,
|
return Optional
|
||||||
MasterProcedureProtos.SplitWALParameter.newBuilder().setWalPath(walPath).build()
|
.of(new RSProcedureDispatcher.ServerOperation(this, getProcId(), SplitWALCallable.class,
|
||||||
.toByteArray());
|
MasterProcedureProtos.SplitWALParameter.newBuilder().setWalPath(walPath).build()
|
||||||
|
.toByteArray()));
|
||||||
}
|
}
|
||||||
|
|
||||||
@Override
|
@Override
|
||||||
|
|
|
@ -18,6 +18,7 @@
|
||||||
package org.apache.hadoop.hbase.master.procedure;
|
package org.apache.hadoop.hbase.master.procedure;
|
||||||
|
|
||||||
import java.io.IOException;
|
import java.io.IOException;
|
||||||
|
import java.util.Optional;
|
||||||
|
|
||||||
import org.apache.hadoop.hbase.ServerName;
|
import org.apache.hadoop.hbase.ServerName;
|
||||||
import org.apache.hadoop.hbase.procedure2.ProcedureStateSerializer;
|
import org.apache.hadoop.hbase.procedure2.ProcedureStateSerializer;
|
||||||
|
@ -74,15 +75,13 @@ public class SwitchRpcThrottleRemoteProcedure extends ServerRemoteProcedure
|
||||||
}
|
}
|
||||||
|
|
||||||
@Override
|
@Override
|
||||||
public RemoteProcedureDispatcher.RemoteOperation
|
public Optional<RemoteProcedureDispatcher.RemoteOperation> remoteCallBuild(
|
||||||
remoteCallBuild(MasterProcedureEnv masterProcedureEnv, ServerName remote) {
|
MasterProcedureEnv masterProcedureEnv, ServerName remote) {
|
||||||
assert targetServer.equals(remote);
|
assert targetServer.equals(remote);
|
||||||
return new RSProcedureDispatcher.ServerOperation(this, getProcId(),
|
return Optional.of(new RSProcedureDispatcher.ServerOperation(this, getProcId(),
|
||||||
SwitchRpcThrottleRemoteCallable.class,
|
SwitchRpcThrottleRemoteCallable.class, SwitchRpcThrottleRemoteStateData.newBuilder()
|
||||||
SwitchRpcThrottleRemoteStateData.newBuilder()
|
.setTargetServer(ProtobufUtil.toServerName(remote))
|
||||||
.setTargetServer(ProtobufUtil.toServerName(remote))
|
.setRpcThrottleEnabled(rpcThrottleEnabled).build().toByteArray()));
|
||||||
.setRpcThrottleEnabled(rpcThrottleEnabled).build()
|
|
||||||
.toByteArray());
|
|
||||||
}
|
}
|
||||||
|
|
||||||
@Override
|
@Override
|
||||||
|
|
|
@ -18,6 +18,8 @@
|
||||||
package org.apache.hadoop.hbase.master.replication;
|
package org.apache.hadoop.hbase.master.replication;
|
||||||
|
|
||||||
import java.io.IOException;
|
import java.io.IOException;
|
||||||
|
import java.util.Optional;
|
||||||
|
|
||||||
import org.apache.hadoop.hbase.ServerName;
|
import org.apache.hadoop.hbase.ServerName;
|
||||||
import org.apache.hadoop.hbase.master.procedure.MasterProcedureEnv;
|
import org.apache.hadoop.hbase.master.procedure.MasterProcedureEnv;
|
||||||
import org.apache.hadoop.hbase.master.procedure.PeerProcedureInterface;
|
import org.apache.hadoop.hbase.master.procedure.PeerProcedureInterface;
|
||||||
|
@ -112,12 +114,12 @@ public class RefreshPeerProcedure extends ServerRemoteProcedure
|
||||||
}
|
}
|
||||||
|
|
||||||
@Override
|
@Override
|
||||||
public RemoteOperation remoteCallBuild(MasterProcedureEnv env, ServerName remote) {
|
public Optional<RemoteOperation> remoteCallBuild(MasterProcedureEnv env, ServerName remote) {
|
||||||
assert targetServer.equals(remote);
|
assert targetServer.equals(remote);
|
||||||
return new ServerOperation(this, getProcId(), RefreshPeerCallable.class,
|
return Optional.of(new ServerOperation(this, getProcId(), RefreshPeerCallable.class,
|
||||||
RefreshPeerParameter.newBuilder().setPeerId(peerId).setType(toPeerModificationType(type))
|
RefreshPeerParameter.newBuilder().setPeerId(peerId).setType(toPeerModificationType(type))
|
||||||
.setTargetServer(ProtobufUtil.toServerName(remote)).setStage(stage).build()
|
.setTargetServer(ProtobufUtil.toServerName(remote)).setStage(stage).build()
|
||||||
.toByteArray());
|
.toByteArray()));
|
||||||
}
|
}
|
||||||
|
|
||||||
@Override
|
@Override
|
||||||
|
|
|
@ -20,6 +20,7 @@ package org.apache.hadoop.hbase.master.replication;
|
||||||
import java.io.IOException;
|
import java.io.IOException;
|
||||||
import java.util.ArrayList;
|
import java.util.ArrayList;
|
||||||
import java.util.List;
|
import java.util.List;
|
||||||
|
import java.util.Optional;
|
||||||
|
|
||||||
import org.apache.hadoop.hbase.ServerName;
|
import org.apache.hadoop.hbase.ServerName;
|
||||||
import org.apache.hadoop.hbase.master.procedure.MasterProcedureEnv;
|
import org.apache.hadoop.hbase.master.procedure.MasterProcedureEnv;
|
||||||
|
@ -62,13 +63,14 @@ public class SyncReplicationReplayWALRemoteProcedure extends ServerRemoteProcedu
|
||||||
}
|
}
|
||||||
|
|
||||||
@Override
|
@Override
|
||||||
public RemoteOperation remoteCallBuild(MasterProcedureEnv env, ServerName remote) {
|
public Optional<RemoteOperation> remoteCallBuild(MasterProcedureEnv env, ServerName remote) {
|
||||||
ReplaySyncReplicationWALParameter.Builder builder =
|
ReplaySyncReplicationWALParameter.Builder builder =
|
||||||
ReplaySyncReplicationWALParameter.newBuilder();
|
ReplaySyncReplicationWALParameter.newBuilder();
|
||||||
builder.setPeerId(peerId);
|
builder.setPeerId(peerId);
|
||||||
wals.stream().forEach(builder::addWal);
|
wals.stream().forEach(builder::addWal);
|
||||||
return new ServerOperation(this, getProcId(), ReplaySyncReplicationWALCallable.class,
|
return Optional
|
||||||
builder.build().toByteArray());
|
.of(new ServerOperation(this, getProcId(), ReplaySyncReplicationWALCallable.class,
|
||||||
|
builder.build().toByteArray()));
|
||||||
}
|
}
|
||||||
|
|
||||||
protected void complete(MasterProcedureEnv env, Throwable error) {
|
protected void complete(MasterProcedureEnv env, Throwable error) {
|
||||||
|
|
|
@ -51,6 +51,7 @@ import java.util.TreeSet;
|
||||||
import java.util.concurrent.ConcurrentHashMap;
|
import java.util.concurrent.ConcurrentHashMap;
|
||||||
import java.util.concurrent.ConcurrentMap;
|
import java.util.concurrent.ConcurrentMap;
|
||||||
import java.util.concurrent.ConcurrentSkipListMap;
|
import java.util.concurrent.ConcurrentSkipListMap;
|
||||||
|
import java.util.concurrent.TimeUnit;
|
||||||
import java.util.concurrent.atomic.AtomicBoolean;
|
import java.util.concurrent.atomic.AtomicBoolean;
|
||||||
import java.util.concurrent.locks.ReentrantReadWriteLock;
|
import java.util.concurrent.locks.ReentrantReadWriteLock;
|
||||||
import java.util.function.Function;
|
import java.util.function.Function;
|
||||||
|
@ -191,6 +192,8 @@ import sun.misc.SignalHandler;
|
||||||
import org.apache.hbase.thirdparty.com.google.common.annotations.VisibleForTesting;
|
import org.apache.hbase.thirdparty.com.google.common.annotations.VisibleForTesting;
|
||||||
import org.apache.hbase.thirdparty.com.google.common.base.Preconditions;
|
import org.apache.hbase.thirdparty.com.google.common.base.Preconditions;
|
||||||
import org.apache.hbase.thirdparty.com.google.common.base.Throwables;
|
import org.apache.hbase.thirdparty.com.google.common.base.Throwables;
|
||||||
|
import org.apache.hbase.thirdparty.com.google.common.cache.Cache;
|
||||||
|
import org.apache.hbase.thirdparty.com.google.common.cache.CacheBuilder;
|
||||||
import org.apache.hbase.thirdparty.com.google.common.collect.Maps;
|
import org.apache.hbase.thirdparty.com.google.common.collect.Maps;
|
||||||
import org.apache.hbase.thirdparty.com.google.protobuf.BlockingRpcChannel;
|
import org.apache.hbase.thirdparty.com.google.protobuf.BlockingRpcChannel;
|
||||||
import org.apache.hbase.thirdparty.com.google.protobuf.RpcController;
|
import org.apache.hbase.thirdparty.com.google.protobuf.RpcController;
|
||||||
|
@ -255,6 +258,18 @@ public class HRegionServer extends HasThread implements
|
||||||
protected final ConcurrentMap<byte[], Boolean> regionsInTransitionInRS =
|
protected final ConcurrentMap<byte[], Boolean> regionsInTransitionInRS =
|
||||||
new ConcurrentSkipListMap<>(Bytes.BYTES_COMPARATOR);
|
new ConcurrentSkipListMap<>(Bytes.BYTES_COMPARATOR);
|
||||||
|
|
||||||
|
/**
|
||||||
|
* Used to cache the open/close region procedures which already submitted.
|
||||||
|
* See {@link #submitRegionProcedure(long)}.
|
||||||
|
*/
|
||||||
|
private final ConcurrentMap<Long, Long> submittedRegionProcedures = new ConcurrentHashMap<>();
|
||||||
|
/**
|
||||||
|
* Used to cache the open/close region procedures which already executed.
|
||||||
|
* See {@link #submitRegionProcedure(long)}.
|
||||||
|
*/
|
||||||
|
private final Cache<Long, Long> executedRegionProcedures =
|
||||||
|
CacheBuilder.newBuilder().expireAfterAccess(600, TimeUnit.SECONDS).build();
|
||||||
|
|
||||||
// Cache flushing
|
// Cache flushing
|
||||||
protected MemStoreFlusher cacheFlusher;
|
protected MemStoreFlusher cacheFlusher;
|
||||||
|
|
||||||
|
@ -3882,6 +3897,51 @@ public class HRegionServer extends HasThread implements
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
/**
|
||||||
|
* Will ignore the open/close region procedures which already submitted or executed.
|
||||||
|
*
|
||||||
|
* When master had unfinished open/close region procedure and restarted, new active master may
|
||||||
|
* send duplicate open/close region request to regionserver. The open/close request is submitted
|
||||||
|
* to a thread pool and execute. So first need a cache for submitted open/close region procedures.
|
||||||
|
*
|
||||||
|
* After the open/close region request executed and report region transition succeed, cache it in
|
||||||
|
* executed region procedures cache. See {@link #finishRegionProcedure(long)}. After report region
|
||||||
|
* transition succeed, master will not send the open/close region request to regionserver again.
|
||||||
|
* And we thought that the ongoing duplicate open/close region request should not be delayed more
|
||||||
|
* than 600 seconds. So the executed region procedures cache will expire after 600 seconds.
|
||||||
|
*
|
||||||
|
* See HBASE-22404 for more details.
|
||||||
|
*
|
||||||
|
* @param procId the id of the open/close region procedure
|
||||||
|
* @return true if the procedure can be submitted.
|
||||||
|
*/
|
||||||
|
boolean submitRegionProcedure(long procId) {
|
||||||
|
if (procId == -1) {
|
||||||
|
return true;
|
||||||
|
}
|
||||||
|
// Ignore the region procedures which already submitted.
|
||||||
|
Long previous = submittedRegionProcedures.putIfAbsent(procId, procId);
|
||||||
|
if (previous != null) {
|
||||||
|
LOG.warn("Received procedure pid={}, which already submitted, just ignore it", procId);
|
||||||
|
return false;
|
||||||
|
}
|
||||||
|
// Ignore the region procedures which already executed.
|
||||||
|
if (executedRegionProcedures.getIfPresent(procId) != null) {
|
||||||
|
LOG.warn("Received procedure pid={}, which already executed, just ignore it", procId);
|
||||||
|
return false;
|
||||||
|
}
|
||||||
|
return true;
|
||||||
|
}
|
||||||
|
|
||||||
|
/**
|
||||||
|
* See {@link #submitRegionProcedure(long)}.
|
||||||
|
* @param procId the id of the open/close region procedure
|
||||||
|
*/
|
||||||
|
public void finishRegionProcedure(long procId) {
|
||||||
|
executedRegionProcedures.put(procId, procId);
|
||||||
|
submittedRegionProcedures.remove(procId);
|
||||||
|
}
|
||||||
|
|
||||||
public boolean isShutDown() {
|
public boolean isShutDown() {
|
||||||
return shutDown;
|
return shutDown;
|
||||||
}
|
}
|
||||||
|
|
|
@ -3721,8 +3721,12 @@ public class RSRpcServices implements HBaseRPCErrorHandler,
|
||||||
regionServer.updateRegionFavoredNodesMapping(regionInfo.getEncodedName(),
|
regionServer.updateRegionFavoredNodesMapping(regionInfo.getEncodedName(),
|
||||||
regionOpenInfo.getFavoredNodesList());
|
regionOpenInfo.getFavoredNodesList());
|
||||||
}
|
}
|
||||||
regionServer.executorService.submit(AssignRegionHandler.create(regionServer, regionInfo,
|
long procId = regionOpenInfo.getOpenProcId();
|
||||||
regionOpenInfo.getOpenProcId(), tableDesc, masterSystemTime));
|
if (regionServer.submitRegionProcedure(procId)) {
|
||||||
|
regionServer.executorService.submit(AssignRegionHandler
|
||||||
|
.create(regionServer, regionInfo, procId, tableDesc,
|
||||||
|
masterSystemTime));
|
||||||
|
}
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@ -3733,11 +3737,14 @@ public class RSRpcServices implements HBaseRPCErrorHandler,
|
||||||
} catch (DoNotRetryIOException e) {
|
} catch (DoNotRetryIOException e) {
|
||||||
throw new UncheckedIOException("Should not happen", e);
|
throw new UncheckedIOException("Should not happen", e);
|
||||||
}
|
}
|
||||||
ServerName destination =
|
ServerName destination = request.hasDestinationServer() ?
|
||||||
request.hasDestinationServer() ? ProtobufUtil.toServerName(request.getDestinationServer())
|
ProtobufUtil.toServerName(request.getDestinationServer()) :
|
||||||
: null;
|
null;
|
||||||
regionServer.executorService.submit(UnassignRegionHandler.create(regionServer, encodedName,
|
long procId = request.getCloseProcId();
|
||||||
request.getCloseProcId(), false, destination));
|
if (regionServer.submitRegionProcedure(procId)) {
|
||||||
|
regionServer.executorService.submit(UnassignRegionHandler
|
||||||
|
.create(regionServer, encodedName, procId, false, destination));
|
||||||
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
private void executeProcedures(RemoteProcedureRequest request) {
|
private void executeProcedures(RemoteProcedureRequest request) {
|
||||||
|
|
|
@ -26,8 +26,8 @@ import org.apache.hadoop.hbase.client.TableDescriptor;
|
||||||
import org.apache.hadoop.hbase.executor.EventHandler;
|
import org.apache.hadoop.hbase.executor.EventHandler;
|
||||||
import org.apache.hadoop.hbase.executor.EventType;
|
import org.apache.hadoop.hbase.executor.EventType;
|
||||||
import org.apache.hadoop.hbase.regionserver.HRegion;
|
import org.apache.hadoop.hbase.regionserver.HRegion;
|
||||||
|
import org.apache.hadoop.hbase.regionserver.HRegionServer;
|
||||||
import org.apache.hadoop.hbase.regionserver.Region;
|
import org.apache.hadoop.hbase.regionserver.Region;
|
||||||
import org.apache.hadoop.hbase.regionserver.RegionServerServices;
|
|
||||||
import org.apache.hadoop.hbase.regionserver.RegionServerServices.PostOpenDeployContext;
|
import org.apache.hadoop.hbase.regionserver.RegionServerServices.PostOpenDeployContext;
|
||||||
import org.apache.hadoop.hbase.regionserver.RegionServerServices.RegionStateTransitionContext;
|
import org.apache.hadoop.hbase.regionserver.RegionServerServices.RegionStateTransitionContext;
|
||||||
import org.apache.hadoop.hbase.util.RetryCounter;
|
import org.apache.hadoop.hbase.util.RetryCounter;
|
||||||
|
@ -59,7 +59,7 @@ public class AssignRegionHandler extends EventHandler {
|
||||||
|
|
||||||
private final RetryCounter retryCounter;
|
private final RetryCounter retryCounter;
|
||||||
|
|
||||||
public AssignRegionHandler(RegionServerServices server, RegionInfo regionInfo, long openProcId,
|
public AssignRegionHandler(HRegionServer server, RegionInfo regionInfo, long openProcId,
|
||||||
@Nullable TableDescriptor tableDesc, long masterSystemTime, EventType eventType) {
|
@Nullable TableDescriptor tableDesc, long masterSystemTime, EventType eventType) {
|
||||||
super(server, eventType);
|
super(server, eventType);
|
||||||
this.regionInfo = regionInfo;
|
this.regionInfo = regionInfo;
|
||||||
|
@ -69,14 +69,14 @@ public class AssignRegionHandler extends EventHandler {
|
||||||
this.retryCounter = HandlerUtil.getRetryCounter();
|
this.retryCounter = HandlerUtil.getRetryCounter();
|
||||||
}
|
}
|
||||||
|
|
||||||
private RegionServerServices getServer() {
|
private HRegionServer getServer() {
|
||||||
return (RegionServerServices) server;
|
return (HRegionServer) server;
|
||||||
}
|
}
|
||||||
|
|
||||||
private void cleanUpAndReportFailure(IOException error) throws IOException {
|
private void cleanUpAndReportFailure(IOException error) throws IOException {
|
||||||
LOG.warn("Failed to open region {}, will report to master", regionInfo.getRegionNameAsString(),
|
LOG.warn("Failed to open region {}, will report to master", regionInfo.getRegionNameAsString(),
|
||||||
error);
|
error);
|
||||||
RegionServerServices rs = getServer();
|
HRegionServer rs = getServer();
|
||||||
rs.getRegionsInTransitionInRS().remove(regionInfo.getEncodedNameAsBytes(), Boolean.TRUE);
|
rs.getRegionsInTransitionInRS().remove(regionInfo.getEncodedNameAsBytes(), Boolean.TRUE);
|
||||||
if (!rs.reportRegionStateTransition(new RegionStateTransitionContext(TransitionCode.FAILED_OPEN,
|
if (!rs.reportRegionStateTransition(new RegionStateTransitionContext(TransitionCode.FAILED_OPEN,
|
||||||
HConstants.NO_SEQNUM, openProcId, masterSystemTime, regionInfo))) {
|
HConstants.NO_SEQNUM, openProcId, masterSystemTime, regionInfo))) {
|
||||||
|
@ -87,7 +87,7 @@ public class AssignRegionHandler extends EventHandler {
|
||||||
|
|
||||||
@Override
|
@Override
|
||||||
public void process() throws IOException {
|
public void process() throws IOException {
|
||||||
RegionServerServices rs = getServer();
|
HRegionServer rs = getServer();
|
||||||
String encodedName = regionInfo.getEncodedName();
|
String encodedName = regionInfo.getEncodedName();
|
||||||
byte[] encodedNameBytes = regionInfo.getEncodedNameAsBytes();
|
byte[] encodedNameBytes = regionInfo.getEncodedNameAsBytes();
|
||||||
String regionName = regionInfo.getRegionNameAsString();
|
String regionName = regionInfo.getRegionNameAsString();
|
||||||
|
@ -101,7 +101,6 @@ public class AssignRegionHandler extends EventHandler {
|
||||||
// reportRegionStateTransition any more.
|
// reportRegionStateTransition any more.
|
||||||
return;
|
return;
|
||||||
}
|
}
|
||||||
LOG.info("Open {}", regionName);
|
|
||||||
Boolean previous = rs.getRegionsInTransitionInRS().putIfAbsent(encodedNameBytes, Boolean.TRUE);
|
Boolean previous = rs.getRegionsInTransitionInRS().putIfAbsent(encodedNameBytes, Boolean.TRUE);
|
||||||
if (previous != null) {
|
if (previous != null) {
|
||||||
if (previous) {
|
if (previous) {
|
||||||
|
@ -121,6 +120,7 @@ public class AssignRegionHandler extends EventHandler {
|
||||||
}
|
}
|
||||||
return;
|
return;
|
||||||
}
|
}
|
||||||
|
LOG.info("Open {}", regionName);
|
||||||
HRegion region;
|
HRegion region;
|
||||||
try {
|
try {
|
||||||
TableDescriptor htd =
|
TableDescriptor htd =
|
||||||
|
@ -139,6 +139,8 @@ public class AssignRegionHandler extends EventHandler {
|
||||||
rs.postOpenDeployTasks(new PostOpenDeployContext(region, openProcId, masterSystemTime));
|
rs.postOpenDeployTasks(new PostOpenDeployContext(region, openProcId, masterSystemTime));
|
||||||
rs.addRegion(region);
|
rs.addRegion(region);
|
||||||
LOG.info("Opened {}", regionName);
|
LOG.info("Opened {}", regionName);
|
||||||
|
// Cache the open region procedure id after report region transition succeed.
|
||||||
|
rs.finishRegionProcedure(openProcId);
|
||||||
Boolean current = rs.getRegionsInTransitionInRS().remove(regionInfo.getEncodedNameAsBytes());
|
Boolean current = rs.getRegionsInTransitionInRS().remove(regionInfo.getEncodedNameAsBytes());
|
||||||
if (current == null) {
|
if (current == null) {
|
||||||
// Should NEVER happen, but let's be paranoid.
|
// Should NEVER happen, but let's be paranoid.
|
||||||
|
@ -158,7 +160,7 @@ public class AssignRegionHandler extends EventHandler {
|
||||||
"Failed to open region " + regionInfo.getRegionNameAsString() + " and can not recover", t);
|
"Failed to open region " + regionInfo.getRegionNameAsString() + " and can not recover", t);
|
||||||
}
|
}
|
||||||
|
|
||||||
public static AssignRegionHandler create(RegionServerServices server, RegionInfo regionInfo,
|
public static AssignRegionHandler create(HRegionServer server, RegionInfo regionInfo,
|
||||||
long openProcId, TableDescriptor tableDesc, long masterSystemTime) {
|
long openProcId, TableDescriptor tableDesc, long masterSystemTime) {
|
||||||
EventType eventType;
|
EventType eventType;
|
||||||
if (regionInfo.isMetaRegion()) {
|
if (regionInfo.isMetaRegion()) {
|
||||||
|
|
|
@ -25,8 +25,8 @@ import org.apache.hadoop.hbase.ServerName;
|
||||||
import org.apache.hadoop.hbase.executor.EventHandler;
|
import org.apache.hadoop.hbase.executor.EventHandler;
|
||||||
import org.apache.hadoop.hbase.executor.EventType;
|
import org.apache.hadoop.hbase.executor.EventType;
|
||||||
import org.apache.hadoop.hbase.regionserver.HRegion;
|
import org.apache.hadoop.hbase.regionserver.HRegion;
|
||||||
|
import org.apache.hadoop.hbase.regionserver.HRegionServer;
|
||||||
import org.apache.hadoop.hbase.regionserver.Region;
|
import org.apache.hadoop.hbase.regionserver.Region;
|
||||||
import org.apache.hadoop.hbase.regionserver.RegionServerServices;
|
|
||||||
import org.apache.hadoop.hbase.regionserver.RegionServerServices.RegionStateTransitionContext;
|
import org.apache.hadoop.hbase.regionserver.RegionServerServices.RegionStateTransitionContext;
|
||||||
import org.apache.hadoop.hbase.util.Bytes;
|
import org.apache.hadoop.hbase.util.Bytes;
|
||||||
import org.apache.hadoop.hbase.util.RetryCounter;
|
import org.apache.hadoop.hbase.util.RetryCounter;
|
||||||
|
@ -60,7 +60,7 @@ public class UnassignRegionHandler extends EventHandler {
|
||||||
|
|
||||||
private final RetryCounter retryCounter;
|
private final RetryCounter retryCounter;
|
||||||
|
|
||||||
public UnassignRegionHandler(RegionServerServices server, String encodedName, long closeProcId,
|
public UnassignRegionHandler(HRegionServer server, String encodedName, long closeProcId,
|
||||||
boolean abort, @Nullable ServerName destination, EventType eventType) {
|
boolean abort, @Nullable ServerName destination, EventType eventType) {
|
||||||
super(server, eventType);
|
super(server, eventType);
|
||||||
this.encodedName = encodedName;
|
this.encodedName = encodedName;
|
||||||
|
@ -70,13 +70,13 @@ public class UnassignRegionHandler extends EventHandler {
|
||||||
this.retryCounter = HandlerUtil.getRetryCounter();
|
this.retryCounter = HandlerUtil.getRetryCounter();
|
||||||
}
|
}
|
||||||
|
|
||||||
private RegionServerServices getServer() {
|
private HRegionServer getServer() {
|
||||||
return (RegionServerServices) server;
|
return (HRegionServer) server;
|
||||||
}
|
}
|
||||||
|
|
||||||
@Override
|
@Override
|
||||||
public void process() throws IOException {
|
public void process() throws IOException {
|
||||||
RegionServerServices rs = getServer();
|
HRegionServer rs = getServer();
|
||||||
byte[] encodedNameBytes = Bytes.toBytes(encodedName);
|
byte[] encodedNameBytes = Bytes.toBytes(encodedName);
|
||||||
Boolean previous = rs.getRegionsInTransitionInRS().putIfAbsent(encodedNameBytes, Boolean.FALSE);
|
Boolean previous = rs.getRegionsInTransitionInRS().putIfAbsent(encodedNameBytes, Boolean.FALSE);
|
||||||
if (previous != null) {
|
if (previous != null) {
|
||||||
|
@ -94,7 +94,7 @@ public class UnassignRegionHandler extends EventHandler {
|
||||||
}
|
}
|
||||||
return;
|
return;
|
||||||
}
|
}
|
||||||
HRegion region = (HRegion) rs.getRegion(encodedName);
|
HRegion region = rs.getRegion(encodedName);
|
||||||
if (region == null) {
|
if (region == null) {
|
||||||
LOG.debug(
|
LOG.debug(
|
||||||
"Received CLOSE for a region {} which is not online, and we're not opening/closing.",
|
"Received CLOSE for a region {} which is not online, and we're not opening/closing.",
|
||||||
|
@ -124,6 +124,8 @@ public class UnassignRegionHandler extends EventHandler {
|
||||||
HConstants.NO_SEQNUM, closeProcId, -1, region.getRegionInfo()))) {
|
HConstants.NO_SEQNUM, closeProcId, -1, region.getRegionInfo()))) {
|
||||||
throw new IOException("Failed to report close to master: " + regionName);
|
throw new IOException("Failed to report close to master: " + regionName);
|
||||||
}
|
}
|
||||||
|
// Cache the close region procedure id after report region transition succeed.
|
||||||
|
rs.finishRegionProcedure(closeProcId);
|
||||||
rs.getRegionsInTransitionInRS().remove(encodedNameBytes, Boolean.FALSE);
|
rs.getRegionsInTransitionInRS().remove(encodedNameBytes, Boolean.FALSE);
|
||||||
LOG.info("Closed {}", regionName);
|
LOG.info("Closed {}", regionName);
|
||||||
}
|
}
|
||||||
|
@ -134,7 +136,7 @@ public class UnassignRegionHandler extends EventHandler {
|
||||||
getServer().abort("Failed to close region " + encodedName + " and can not recover", t);
|
getServer().abort("Failed to close region " + encodedName + " and can not recover", t);
|
||||||
}
|
}
|
||||||
|
|
||||||
public static UnassignRegionHandler create(RegionServerServices server, String encodedName,
|
public static UnassignRegionHandler create(HRegionServer server, String encodedName,
|
||||||
long closeProcId, boolean abort, @Nullable ServerName destination) {
|
long closeProcId, boolean abort, @Nullable ServerName destination) {
|
||||||
// Just try our best to determine whether it is for closing meta. It is not the end of the world
|
// Just try our best to determine whether it is for closing meta. It is not the end of the world
|
||||||
// if we put the handler into a wrong executor.
|
// if we put the handler into a wrong executor.
|
||||||
|
|
|
@ -23,6 +23,7 @@ import static org.junit.Assert.fail;
|
||||||
|
|
||||||
import java.io.IOException;
|
import java.io.IOException;
|
||||||
import java.util.NavigableMap;
|
import java.util.NavigableMap;
|
||||||
|
import java.util.Optional;
|
||||||
import java.util.Set;
|
import java.util.Set;
|
||||||
import java.util.SortedSet;
|
import java.util.SortedSet;
|
||||||
import java.util.concurrent.ConcurrentSkipListMap;
|
import java.util.concurrent.ConcurrentSkipListMap;
|
||||||
|
@ -189,9 +190,10 @@ public class TestServerRemoteProcedure {
|
||||||
}
|
}
|
||||||
|
|
||||||
@Override
|
@Override
|
||||||
public RemoteProcedureDispatcher.RemoteOperation remoteCallBuild(MasterProcedureEnv env,
|
public Optional<RemoteProcedureDispatcher.RemoteOperation> remoteCallBuild(
|
||||||
ServerName serverName) {
|
MasterProcedureEnv env, ServerName serverName) {
|
||||||
return new RSProcedureDispatcher.ServerOperation(null, 0L, this.getClass(), new byte[0]);
|
return Optional
|
||||||
|
.of(new RSProcedureDispatcher.ServerOperation(null, 0L, this.getClass(), new byte[0]));
|
||||||
}
|
}
|
||||||
|
|
||||||
@Override
|
@Override
|
||||||
|
|
Loading…
Reference in New Issue