HBASE-8097 MetaServerShutdownHandler may potentially keep bumping up DeadServer.numProcessing (Jeffrey Zhong)

git-svn-id: https://svn.apache.org/repos/asf/hbase/trunk@1457932 13f79535-47bb-0310-9956-ffa450edef68
This commit is contained in:
Zhihong Yu 2013-03-18 19:37:11 +00:00
parent a832f774c4
commit 84d0115d44
3 changed files with 36 additions and 32 deletions

View File

@ -98,9 +98,15 @@ public class DeadServer {
return clone; return clone;
} }
public synchronized boolean add(ServerName e) { /**
* Adds the server to the dead server list if it's not there already.
* @param sn the server name
*/
public synchronized void add(ServerName sn) {
this.numProcessing++; this.numProcessing++;
return deadServers.put(e, EnvironmentEdgeManager.currentTimeMillis()) != null; if (!deadServers.containsKey(sn)){
deadServers.put(sn, EnvironmentEdgeManager.currentTimeMillis());
}
} }
@SuppressWarnings("UnusedParameters") @SuppressWarnings("UnusedParameters")

View File

@ -487,7 +487,7 @@ public class ServerManager {
boolean carryingMeta = services.getAssignmentManager().isCarryingMeta(serverName); boolean carryingMeta = services.getAssignmentManager().isCarryingMeta(serverName);
if (carryingMeta) { if (carryingMeta) {
this.services.getExecutorService().submit(new MetaServerShutdownHandler(this.master, this.services.getExecutorService().submit(new MetaServerShutdownHandler(this.master,
this.services, this.deadservers, serverName, carryingMeta)); this.services, this.deadservers, serverName));
} else { } else {
this.services.getExecutorService().submit(new ServerShutdownHandler(this.master, this.services.getExecutorService().submit(new ServerShutdownHandler(this.master,
this.services, this.deadservers, serverName, true)); this.services, this.deadservers, serverName, true));

View File

@ -32,24 +32,22 @@ import org.apache.hadoop.hbase.master.MasterServices;
import org.apache.zookeeper.KeeperException; import org.apache.zookeeper.KeeperException;
/** /**
* Shutdown handler for the server hosting <code>-ROOT-</code>, * Shutdown handler for the server hosting <code>.META.</code>
* <code>.META.</code>, or both.
*/ */
@InterfaceAudience.Private @InterfaceAudience.Private
public class MetaServerShutdownHandler extends ServerShutdownHandler { public class MetaServerShutdownHandler extends ServerShutdownHandler {
private final boolean carryingMeta;
private static final Log LOG = LogFactory.getLog(MetaServerShutdownHandler.class); private static final Log LOG = LogFactory.getLog(MetaServerShutdownHandler.class);
public MetaServerShutdownHandler(final Server server, public MetaServerShutdownHandler(final Server server,
final MasterServices services, final MasterServices services,
final DeadServer deadServers, final ServerName serverName, final DeadServer deadServers, final ServerName serverName) {
final boolean carryingMeta) {
super(server, services, deadServers, serverName, super(server, services, deadServers, serverName,
EventType.M_META_SERVER_SHUTDOWN, true); EventType.M_META_SERVER_SHUTDOWN, true);
this.carryingMeta = carryingMeta;
} }
@Override @Override
public void process() throws IOException { public void process() throws IOException {
boolean gotException = true;
try{
try { try {
LOG.info("Splitting META logs for " + serverName); LOG.info("Splitting META logs for " + serverName);
if (this.shouldSplitHlog) { if (this.shouldSplitHlog) {
@ -62,19 +60,23 @@ public class MetaServerShutdownHandler extends ServerShutdownHandler {
serverName + ", will retry", ioe); serverName + ", will retry", ioe);
} }
// Assign root and meta if we were carrying them. // Assign meta if we were carrying it.
if (isCarryingMeta()) { // .META.
// Check again: region may be assigned to other where because of RIT // Check again: region may be assigned to other where because of RIT
// timeout // timeout
if (this.services.getAssignmentManager().isCarryingMeta(serverName)) { if (this.services.getAssignmentManager().isCarryingMeta(serverName)) {
LOG.info("Server " + serverName LOG.info("Server " + serverName + " was carrying META. Trying to assign.");
+ " was carrying META. Trying to assign."); this.services.getAssignmentManager().regionOffline(HRegionInfo.FIRST_META_REGIONINFO);
this.services.getAssignmentManager().regionOffline(
HRegionInfo.FIRST_META_REGIONINFO);
verifyAndAssignMetaWithRetries(); verifyAndAssignMetaWithRetries();
} else { } else {
LOG.info("META has been assigned to otherwhere, skip assigning."); LOG.info("META has been assigned to otherwhere, skip assigning.");
} }
gotException = false;
} finally {
if (gotException){
// If we had an exception, this.deadServers.finish will be skipped in super.process()
this.deadServers.finish(serverName);
}
} }
super.process(); super.process();
} }
@ -97,10 +99,10 @@ public class MetaServerShutdownHandler extends ServerShutdownHandler {
if (!this.server.getCatalogTracker().verifyMetaRegionLocation(timeout)) { if (!this.server.getCatalogTracker().verifyMetaRegionLocation(timeout)) {
this.services.getAssignmentManager().assignMeta(); this.services.getAssignmentManager().assignMeta();
} else if (serverName.equals(server.getCatalogTracker().getMetaLocation())) { } else if (serverName.equals(server.getCatalogTracker().getMetaLocation())) {
throw new IOException("-ROOT- is onlined on the dead server " throw new IOException(".META. is onlined on the dead server "
+ serverName); + serverName);
} else { } else {
LOG.info("Skip assigning -ROOT-, because it is online on the " LOG.info("Skip assigning .META., because it is online on the "
+ server.getCatalogTracker().getMetaLocation()); + server.getCatalogTracker().getMetaLocation());
} }
} }
@ -142,10 +144,6 @@ public class MetaServerShutdownHandler extends ServerShutdownHandler {
} }
} }
boolean isCarryingMeta() {
return this.carryingMeta;
}
@Override @Override
public String toString() { public String toString() {
String name = "UnknownServerName"; String name = "UnknownServerName";