HDFS-16847: RBF: Prevents StateStoreFileSystemImpl from committing tmp file after encountering an IOException. (#5145)
This commit is contained in:
parent
f93167e678
commit
ec2856d79c
|
@ -85,7 +85,8 @@ public abstract class StateStoreFileBaseImpl
|
|||
* @param path Path of the record to write.
|
||||
* @return Writer for the record.
|
||||
*/
|
||||
protected abstract <T extends BaseRecord> BufferedWriter getWriter(
|
||||
@VisibleForTesting
|
||||
public abstract <T extends BaseRecord> BufferedWriter getWriter(
|
||||
String path);
|
||||
|
||||
/**
|
||||
|
@ -348,25 +349,18 @@ public abstract class StateStoreFileBaseImpl
|
|||
for (Entry<String, T> entry : toWrite.entrySet()) {
|
||||
String recordPath = entry.getKey();
|
||||
String recordPathTemp = recordPath + "." + now() + TMP_MARK;
|
||||
BufferedWriter writer = getWriter(recordPathTemp);
|
||||
try {
|
||||
boolean recordWrittenSuccessfully = true;
|
||||
try (BufferedWriter writer = getWriter(recordPathTemp)) {
|
||||
T record = entry.getValue();
|
||||
String line = serializeString(record);
|
||||
writer.write(line);
|
||||
} catch (IOException e) {
|
||||
LOG.error("Cannot write {}", recordPathTemp, e);
|
||||
recordWrittenSuccessfully = false;
|
||||
success = false;
|
||||
} finally {
|
||||
if (writer != null) {
|
||||
try {
|
||||
writer.close();
|
||||
} catch (IOException e) {
|
||||
LOG.error("Cannot close the writer for {}", recordPathTemp, e);
|
||||
}
|
||||
}
|
||||
}
|
||||
// Commit
|
||||
if (!rename(recordPathTemp, recordPath)) {
|
||||
if (recordWrittenSuccessfully && !rename(recordPathTemp, recordPath)) {
|
||||
LOG.error("Failed committing record into {}", recordPath);
|
||||
success = false;
|
||||
}
|
||||
|
|
|
@ -31,6 +31,7 @@ import java.util.Collections;
|
|||
import java.util.List;
|
||||
|
||||
import org.apache.commons.lang3.ArrayUtils;
|
||||
import org.apache.hadoop.classification.VisibleForTesting;
|
||||
import org.apache.hadoop.hdfs.server.federation.router.RBFConfigKeys;
|
||||
import org.apache.hadoop.hdfs.server.federation.store.records.BaseRecord;
|
||||
import org.slf4j.Logger;
|
||||
|
@ -125,7 +126,8 @@ public class StateStoreFileImpl extends StateStoreFileBaseImpl {
|
|||
}
|
||||
|
||||
@Override
|
||||
protected <T extends BaseRecord> BufferedWriter getWriter(String filename) {
|
||||
@VisibleForTesting
|
||||
public <T extends BaseRecord> BufferedWriter getWriter(String filename) {
|
||||
BufferedWriter writer = null;
|
||||
try {
|
||||
LOG.debug("Writing file: {}", filename);
|
||||
|
|
|
@ -28,13 +28,14 @@ import java.util.ArrayList;
|
|||
import java.util.Collections;
|
||||
import java.util.List;
|
||||
|
||||
import org.apache.hadoop.classification.VisibleForTesting;
|
||||
import org.apache.hadoop.fs.FSDataInputStream;
|
||||
import org.apache.hadoop.fs.FSDataOutputStream;
|
||||
import org.apache.hadoop.fs.FileStatus;
|
||||
import org.apache.hadoop.fs.FileSystem;
|
||||
import org.apache.hadoop.fs.FileUtil;
|
||||
import org.apache.hadoop.fs.Options;
|
||||
import org.apache.hadoop.fs.Path;
|
||||
import org.apache.hadoop.hdfs.DistributedFileSystem;
|
||||
import org.apache.hadoop.hdfs.server.federation.router.RBFConfigKeys;
|
||||
import org.apache.hadoop.hdfs.server.federation.store.driver.StateStoreDriver;
|
||||
import org.apache.hadoop.hdfs.server.federation.store.records.BaseRecord;
|
||||
|
@ -82,17 +83,8 @@ public class StateStoreFileSystemImpl extends StateStoreFileBaseImpl {
|
|||
@Override
|
||||
protected boolean rename(String src, String dst) {
|
||||
try {
|
||||
if (fs instanceof DistributedFileSystem) {
|
||||
DistributedFileSystem dfs = (DistributedFileSystem)fs;
|
||||
dfs.rename(new Path(src), new Path(dst), Options.Rename.OVERWRITE);
|
||||
FileUtil.rename(fs, new Path(src), new Path(dst), Options.Rename.OVERWRITE);
|
||||
return true;
|
||||
} else {
|
||||
// Replace should be atomic but not available
|
||||
if (fs.exists(new Path(dst))) {
|
||||
fs.delete(new Path(dst), true);
|
||||
}
|
||||
return fs.rename(new Path(src), new Path(dst));
|
||||
}
|
||||
} catch (Exception e) {
|
||||
LOG.error("Cannot rename {} to {}", src, dst, e);
|
||||
return false;
|
||||
|
@ -148,7 +140,8 @@ public class StateStoreFileSystemImpl extends StateStoreFileBaseImpl {
|
|||
}
|
||||
|
||||
@Override
|
||||
protected <T extends BaseRecord> BufferedWriter getWriter(String pathName) {
|
||||
@VisibleForTesting
|
||||
public <T extends BaseRecord> BufferedWriter getWriter(String pathName) {
|
||||
BufferedWriter writer = null;
|
||||
Path path = new Path(pathName);
|
||||
try {
|
||||
|
|
|
@ -234,6 +234,25 @@ public class TestStateStoreDriverBase {
|
|||
assertEquals(11, records2.size());
|
||||
}
|
||||
|
||||
public <T extends BaseRecord> void testInsertWithErrorDuringWrite(
|
||||
StateStoreDriver driver, Class<T> recordClass)
|
||||
throws IllegalArgumentException, IllegalAccessException, IOException {
|
||||
|
||||
assertTrue(driver.removeAll(recordClass));
|
||||
QueryResult<T> queryResult0 = driver.get(recordClass);
|
||||
List<T> records0 = queryResult0.getRecords();
|
||||
assertTrue(records0.isEmpty());
|
||||
|
||||
// Insert single
|
||||
BaseRecord record = generateFakeRecord(recordClass);
|
||||
driver.put(record, true, false);
|
||||
|
||||
// Verify that no record was inserted.
|
||||
QueryResult<T> queryResult1 = driver.get(recordClass);
|
||||
List<T> records1 = queryResult1.getRecords();
|
||||
assertEquals(0, records1.size());
|
||||
}
|
||||
|
||||
public <T extends BaseRecord> void testFetchErrors(StateStoreDriver driver,
|
||||
Class<T> clazz) throws IllegalAccessException, IOException {
|
||||
|
||||
|
|
|
@ -17,16 +17,26 @@
|
|||
*/
|
||||
package org.apache.hadoop.hdfs.server.federation.store.driver;
|
||||
|
||||
import java.io.BufferedWriter;
|
||||
import java.io.IOException;
|
||||
|
||||
import org.apache.hadoop.conf.Configuration;
|
||||
import org.apache.hadoop.hdfs.MiniDFSCluster;
|
||||
import org.apache.hadoop.hdfs.server.federation.store.FederationStateStoreTestUtils;
|
||||
import org.apache.hadoop.hdfs.server.federation.store.driver.impl.StateStoreFileBaseImpl;
|
||||
import org.apache.hadoop.hdfs.server.federation.store.driver.impl.StateStoreFileSystemImpl;
|
||||
import org.apache.hadoop.hdfs.server.federation.store.records.MembershipState;
|
||||
import org.junit.AfterClass;
|
||||
import org.junit.Before;
|
||||
import org.junit.BeforeClass;
|
||||
import org.junit.Test;
|
||||
import org.mockito.stubbing.Answer;
|
||||
|
||||
import static org.mockito.Mockito.any;
|
||||
import static org.mockito.Mockito.doAnswer;
|
||||
import static org.mockito.Mockito.doThrow;
|
||||
import static org.mockito.Mockito.spy;
|
||||
|
||||
|
||||
/**
|
||||
* Test the FileSystem (e.g., HDFS) implementation of the State Store driver.
|
||||
|
@ -91,4 +101,18 @@ public class TestStateStoreFileSystem extends TestStateStoreDriverBase {
|
|||
throws IllegalArgumentException, IllegalAccessException, IOException {
|
||||
testMetrics(getStateStoreDriver());
|
||||
}
|
||||
|
||||
@Test
|
||||
public void testInsertWithErrorDuringWrite()
|
||||
throws IllegalArgumentException, IllegalAccessException, IOException {
|
||||
StateStoreFileBaseImpl driver = spy((StateStoreFileBaseImpl)getStateStoreDriver());
|
||||
doAnswer((Answer<BufferedWriter>) a -> {
|
||||
BufferedWriter writer = (BufferedWriter) a.callRealMethod();
|
||||
BufferedWriter spyWriter = spy(writer);
|
||||
doThrow(IOException.class).when(spyWriter).write(any(String.class));
|
||||
return spyWriter;
|
||||
}).when(driver).getWriter(any());
|
||||
|
||||
testInsertWithErrorDuringWrite(driver, MembershipState.class);
|
||||
}
|
||||
}
|
Loading…
Reference in New Issue