diff --git a/hadoop-hdfs-project/hadoop-hdfs/src/main/java/org/apache/hadoop/hdfs/server/namenode/EditLogFileInputStream.java b/hadoop-hdfs-project/hadoop-hdfs/src/main/java/org/apache/hadoop/hdfs/server/namenode/EditLogFileInputStream.java index 4e9b174e3f7..0ee15e5c755 100644 --- a/hadoop-hdfs-project/hadoop-hdfs/src/main/java/org/apache/hadoop/hdfs/server/namenode/EditLogFileInputStream.java +++ b/hadoop-hdfs-project/hadoop-hdfs/src/main/java/org/apache/hadoop/hdfs/server/namenode/EditLogFileInputStream.java @@ -163,6 +163,16 @@ public class EditLogFileInputStream extends EditLogInputStream { } catch (EOFException eofe) { throw new LogHeaderCorruptException("No header found in log"); } + if (logVersion == -1) { + // The edits in progress file is pre-allocated with 1MB of "-1" bytes + // when it is created, then the header is written. If the header is + // -1, it indicates the an exception occurred pre-allocating the file + // and the header was never written. Therefore this is effectively a + // corrupt and empty log. + throw new LogHeaderCorruptException("No header present in log (value " + + "is -1), probably due to disk space issues when it was created. " + + "The log has no transactions and will be sidelined."); + } // We assume future layout will also support ADD_LAYOUT_FLAGS if (NameNodeLayoutVersion.supports( LayoutVersion.Feature.ADD_LAYOUT_FLAGS, logVersion) || diff --git a/hadoop-hdfs-project/hadoop-hdfs/src/main/java/org/apache/hadoop/hdfs/server/namenode/FSEditLogLoader.java b/hadoop-hdfs-project/hadoop-hdfs/src/main/java/org/apache/hadoop/hdfs/server/namenode/FSEditLogLoader.java index 920a7275f8d..d9d8a6b13b5 100644 --- a/hadoop-hdfs-project/hadoop-hdfs/src/main/java/org/apache/hadoop/hdfs/server/namenode/FSEditLogLoader.java +++ b/hadoop-hdfs-project/hadoop-hdfs/src/main/java/org/apache/hadoop/hdfs/server/namenode/FSEditLogLoader.java @@ -1284,6 +1284,12 @@ public class FSEditLogLoader { + lastPos, t); in.resync(); FSImage.LOG.warn("After resync, position is " + in.getPosition()); + if (in.getPosition() <= lastPos) { + FSImage.LOG.warn("After resync, the position, " + + in.getPosition() + " is not greater than the previous " + + "position " + lastPos + ". Skipping remainder of this log."); + break; + } continue; } if (lastTxId == HdfsServerConstants.INVALID_TXID || txid > lastTxId) { diff --git a/hadoop-hdfs-project/hadoop-hdfs/src/test/java/org/apache/hadoop/hdfs/qjournal/server/TestJournal.java b/hadoop-hdfs-project/hadoop-hdfs/src/test/java/org/apache/hadoop/hdfs/qjournal/server/TestJournal.java index ac75db96103..52baab98aa5 100644 --- a/hadoop-hdfs-project/hadoop-hdfs/src/test/java/org/apache/hadoop/hdfs/qjournal/server/TestJournal.java +++ b/hadoop-hdfs-project/hadoop-hdfs/src/test/java/org/apache/hadoop/hdfs/qjournal/server/TestJournal.java @@ -28,6 +28,7 @@ import java.io.ByteArrayOutputStream; import java.io.DataOutputStream; import java.io.File; import java.io.IOException; +import java.io.RandomAccessFile; import org.apache.hadoop.conf.Configuration; import org.apache.hadoop.fs.FileUtil; @@ -125,6 +126,48 @@ public class TestJournal { Assert.assertEquals(1, segmentState.getStartTxId()); } + /** + * Test for HDFS-14557 to ensure that a edit file that failed to fully + * allocate and has a header byte of -1 is moved aside to allow startup + * to progress. + */ + @Test + public void testEmptyEditsInProgressMovedAside() throws Exception { + // First, write 5 transactions to the journal + journal.startLogSegment(makeRI(1), 1, + NameNodeLayoutVersion.CURRENT_LAYOUT_VERSION - 1); + final int numTxns = 5; + byte[] ops = QJMTestUtil.createTxnData(1, 5); + journal.journal(makeRI(2), 1, 1, numTxns, ops); + // Now close the segment + journal.finalizeLogSegment(makeRI(3), 1, numTxns); + + // Create a new segment creating a new edits_inprogress file + journal.startLogSegment(makeRI(4), 6, + NameNodeLayoutVersion.CURRENT_LAYOUT_VERSION - 1); + ops = QJMTestUtil.createTxnData(6, 5); + journal.journal(makeRI(5), 6, 6, numTxns, ops); + File eip = journal.getStorage().getInProgressEditLog(6); + + // Now stop the journal without finalizing the segment + journal.close(); + + // Now "zero out" the EIP file with -1 bytes, similar to how it would + // appear if the pre-allocation failed + RandomAccessFile rwf = new RandomAccessFile(eip, "rw"); + for (int i=0; i