Merge r:1344874 HDFS-3441. Race condition between rolling logs at active NN and purging at standby. Contributed by Rakesh R.

git-svn-id: https://svn.apache.org/repos/asf/hadoop/common/branches/branch-2@1344876 13f79535-47bb-0310-9956-ffa450edef68
This commit is contained in:
Uma Maheswara Rao G 2012-05-31 19:38:29 +00:00
parent 136e586272
commit 0719f5635d
3 changed files with 90 additions and 19 deletions

View File

@ -132,6 +132,9 @@ Release 2.0.1-alpha - UNRELEASED
HDFS-3423. BKJM: NN startup is failing, when tries to recoverUnfinalizedSegments() HDFS-3423. BKJM: NN startup is failing, when tries to recoverUnfinalizedSegments()
a bad inProgress_ ZNodes. (Ivan Kelly and Uma via umamahesh) a bad inProgress_ ZNodes. (Ivan Kelly and Uma via umamahesh)
HDFS-3441. Race condition between rolling logs at active NN and purging at standby.
(Rakesh R via umamahesh)
Release 2.0.0-alpha - UNRELEASED Release 2.0.0-alpha - UNRELEASED
INCOMPATIBLE CHANGES INCOMPATIBLE CHANGES

View File

@ -49,7 +49,7 @@ import java.net.URI;
import org.apache.commons.logging.Log; import org.apache.commons.logging.Log;
import org.apache.commons.logging.LogFactory; import org.apache.commons.logging.LogFactory;
import com.google.common.annotations.VisibleForTesting;
/** /**
* BookKeeper Journal Manager * BookKeeper Journal Manager
* *
@ -122,7 +122,9 @@ public class BookKeeperJournalManager implements JournalManager {
= "dfs.namenode.bookkeeperjournal.zk.session.timeout"; = "dfs.namenode.bookkeeperjournal.zk.session.timeout";
public static final int BKJM_ZK_SESSION_TIMEOUT_DEFAULT = 3000; public static final int BKJM_ZK_SESSION_TIMEOUT_DEFAULT = 3000;
private final ZooKeeper zkc; private static final String BKJM_EDIT_INPROGRESS = "inprogress_";
private ZooKeeper zkc;
private final Configuration conf; private final Configuration conf;
private final BookKeeper bkc; private final BookKeeper bkc;
private final CurrentInprogress ci; private final CurrentInprogress ci;
@ -351,13 +353,9 @@ public class BookKeeperJournalManager implements JournalManager {
EditLogInputStream getInputStream(long fromTxId, boolean inProgressOk) EditLogInputStream getInputStream(long fromTxId, boolean inProgressOk)
throws IOException { throws IOException {
for (EditLogLedgerMetadata l : getLedgerList()) { for (EditLogLedgerMetadata l : getLedgerList(inProgressOk)) {
long lastTxId = l.getLastTxId(); long lastTxId = l.getLastTxId();
if (l.isInProgress()) { if (l.isInProgress()) {
if (!inProgressOk) {
continue;
}
lastTxId = recoverLastTxId(l, false); lastTxId = recoverLastTxId(l, false);
} }
@ -413,13 +411,9 @@ public class BookKeeperJournalManager implements JournalManager {
throws IOException { throws IOException {
long count = 0; long count = 0;
long expectedStart = 0; long expectedStart = 0;
for (EditLogLedgerMetadata l : getLedgerList()) { for (EditLogLedgerMetadata l : getLedgerList(inProgressOk)) {
long lastTxId = l.getLastTxId(); long lastTxId = l.getLastTxId();
if (l.isInProgress()) { if (l.isInProgress()) {
if (!inProgressOk) {
continue;
}
lastTxId = recoverLastTxId(l, false); lastTxId = recoverLastTxId(l, false);
if (lastTxId == HdfsConstants.INVALID_TXID) { if (lastTxId == HdfsConstants.INVALID_TXID) {
break; break;
@ -457,7 +451,7 @@ public class BookKeeperJournalManager implements JournalManager {
try { try {
List<String> children = zkc.getChildren(ledgerPath, false); List<String> children = zkc.getChildren(ledgerPath, false);
for (String child : children) { for (String child : children) {
if (!child.startsWith("inprogress_")) { if (!child.startsWith(BKJM_EDIT_INPROGRESS)) {
continue; continue;
} }
String znode = ledgerPath + "/" + child; String znode = ledgerPath + "/" + child;
@ -504,9 +498,8 @@ public class BookKeeperJournalManager implements JournalManager {
@Override @Override
public void purgeLogsOlderThan(long minTxIdToKeep) public void purgeLogsOlderThan(long minTxIdToKeep)
throws IOException { throws IOException {
for (EditLogLedgerMetadata l : getLedgerList()) { for (EditLogLedgerMetadata l : getLedgerList(false)) {
if (!l.isInProgress() if (l.getLastTxId() < minTxIdToKeep) {
&& l.getLastTxId() < minTxIdToKeep) {
try { try {
Stat stat = zkc.exists(l.getZkPath(), false); Stat stat = zkc.exists(l.getZkPath(), false);
zkc.delete(l.getZkPath(), stat.getVersion()); zkc.delete(l.getZkPath(), stat.getVersion());
@ -597,13 +590,26 @@ public class BookKeeperJournalManager implements JournalManager {
/** /**
* Get a list of all segments in the journal. * Get a list of all segments in the journal.
*/ */
private List<EditLogLedgerMetadata> getLedgerList() throws IOException { List<EditLogLedgerMetadata> getLedgerList(boolean inProgressOk)
throws IOException {
List<EditLogLedgerMetadata> ledgers List<EditLogLedgerMetadata> ledgers
= new ArrayList<EditLogLedgerMetadata>(); = new ArrayList<EditLogLedgerMetadata>();
try { try {
List<String> ledgerNames = zkc.getChildren(ledgerPath, false); List<String> ledgerNames = zkc.getChildren(ledgerPath, false);
for (String n : ledgerNames) { for (String ledgerName : ledgerNames) {
ledgers.add(EditLogLedgerMetadata.read(zkc, ledgerPath + "/" + n)); if (!inProgressOk && ledgerName.contains(BKJM_EDIT_INPROGRESS)) {
continue;
}
String legderMetadataPath = ledgerPath + "/" + ledgerName;
try {
EditLogLedgerMetadata editLogLedgerMetadata = EditLogLedgerMetadata
.read(zkc, legderMetadataPath);
ledgers.add(editLogLedgerMetadata);
} catch (KeeperException.NoNodeException e) {
LOG.warn("ZNode: " + legderMetadataPath
+ " might have finalized and deleted."
+ " So ignoring NoNodeException.");
}
} }
} catch (KeeperException e) { } catch (KeeperException e) {
throw new IOException("Exception reading ledger list from zk", e); throw new IOException("Exception reading ledger list from zk", e);
@ -630,6 +636,11 @@ public class BookKeeperJournalManager implements JournalManager {
return ledgerPath + "/inprogress_" + Long.toString(startTxid, 16); return ledgerPath + "/inprogress_" + Long.toString(startTxid, 16);
} }
@VisibleForTesting
void setZooKeeper(ZooKeeper zk) {
this.zkc = zk;
}
/** /**
* Simple watcher to notify when zookeeper has connected * Simple watcher to notify when zookeeper has connected
*/ */

View File

@ -18,14 +18,17 @@
package org.apache.hadoop.contrib.bkjournal; package org.apache.hadoop.contrib.bkjournal;
import static org.junit.Assert.*; import static org.junit.Assert.*;
import static org.mockito.Mockito.spy;
import org.junit.Test; import org.junit.Test;
import org.junit.Before; import org.junit.Before;
import org.junit.After; import org.junit.After;
import org.junit.BeforeClass; import org.junit.BeforeClass;
import org.junit.AfterClass; import org.junit.AfterClass;
import org.mockito.Mockito;
import java.io.IOException; import java.io.IOException;
import java.net.URI; import java.net.URI;
import java.util.List;
import org.apache.hadoop.conf.Configuration; import org.apache.hadoop.conf.Configuration;
@ -37,6 +40,7 @@ import org.apache.hadoop.hdfs.server.namenode.JournalManager;
import org.apache.bookkeeper.proto.BookieServer; import org.apache.bookkeeper.proto.BookieServer;
import org.apache.zookeeper.CreateMode; import org.apache.zookeeper.CreateMode;
import org.apache.zookeeper.KeeperException;
import org.apache.zookeeper.ZooKeeper; import org.apache.zookeeper.ZooKeeper;
import org.apache.zookeeper.ZooDefs.Ids; import org.apache.zookeeper.ZooDefs.Ids;
@ -614,4 +618,57 @@ public class TestBookKeeperJournalManager {
bkjm.close(); bkjm.close();
} }
/**
* Tests that the edit log file meta data reading from ZooKeeper should be
* able to handle the NoNodeException. bkjm.getInputStream(fromTxId,
* inProgressOk) should suppress the NoNodeException and continue. HDFS-3441.
*/
@Test
public void testEditLogFileNotExistsWhenReadingMetadata() throws Exception {
URI uri = BKJMUtil.createJournalURI("/hdfsjournal-editlogfile");
BookKeeperJournalManager bkjm = new BookKeeperJournalManager(conf, uri);
try {
// start new inprogress log segment with txid=1
// and write transactions till txid=50
String zkpath1 = startAndFinalizeLogSegment(bkjm, 1, 50);
// start new inprogress log segment with txid=51
// and write transactions till txid=100
String zkpath2 = startAndFinalizeLogSegment(bkjm, 51, 100);
// read the metadata from ZK. Here simulating the situation
// when reading,the edit log metadata can be removed by purger thread.
ZooKeeper zkspy = spy(BKJMUtil.connectZooKeeper());
bkjm.setZooKeeper(zkspy);
Mockito.doThrow(
new KeeperException.NoNodeException(zkpath2 + " doesn't exists"))
.when(zkspy).getData(zkpath2, false, null);
List<EditLogLedgerMetadata> ledgerList = bkjm.getLedgerList(false);
assertEquals("List contains the metadata of non exists path.", 1,
ledgerList.size());
assertEquals("LogLedgerMetadata contains wrong zk paths.", zkpath1,
ledgerList.get(0).getZkPath());
} finally {
bkjm.close();
}
}
private String startAndFinalizeLogSegment(BookKeeperJournalManager bkjm,
int startTxid, int endTxid) throws IOException, KeeperException,
InterruptedException {
EditLogOutputStream out = bkjm.startLogSegment(startTxid);
for (long i = startTxid; i <= endTxid; i++) {
FSEditLogOp op = FSEditLogTestUtil.getNoOpInstance();
op.setTransactionId(i);
out.write(op);
}
out.close();
// finalize the inprogress_1 log segment.
bkjm.finalizeLogSegment(startTxid, endTxid);
String zkpath1 = bkjm.finalizedLedgerZNode(startTxid, endTxid);
assertNotNull(zkc.exists(zkpath1, false));
assertNull(zkc.exists(bkjm.inprogressZNode(startTxid), false));
return zkpath1;
}
} }