mirror of https://github.com/apache/druid.git
Retry S3 task log fetch in case of transient S3 exceptions (#14714)
This commit is contained in:
parent
b27d281b11
commit
20c48b6a3d
|
@ -19,7 +19,6 @@
|
||||||
|
|
||||||
package org.apache.druid.storage.s3;
|
package org.apache.druid.storage.s3;
|
||||||
|
|
||||||
import com.amazonaws.AmazonServiceException;
|
|
||||||
import com.amazonaws.services.s3.model.AmazonS3Exception;
|
import com.amazonaws.services.s3.model.AmazonS3Exception;
|
||||||
import com.amazonaws.services.s3.model.GetObjectRequest;
|
import com.amazonaws.services.s3.model.GetObjectRequest;
|
||||||
import com.amazonaws.services.s3.model.ObjectMetadata;
|
import com.amazonaws.services.s3.model.ObjectMetadata;
|
||||||
|
@ -67,38 +66,51 @@ public class S3TaskLogs implements TaskLogs
|
||||||
public Optional<InputStream> streamTaskLog(final String taskid, final long offset) throws IOException
|
public Optional<InputStream> streamTaskLog(final String taskid, final long offset) throws IOException
|
||||||
{
|
{
|
||||||
final String taskKey = getTaskLogKey(taskid, "log");
|
final String taskKey = getTaskLogKey(taskid, "log");
|
||||||
return streamTaskFile(offset, taskKey);
|
return streamTaskFileWithRetry(offset, taskKey);
|
||||||
}
|
}
|
||||||
|
|
||||||
@Override
|
@Override
|
||||||
public Optional<InputStream> streamTaskReports(String taskid) throws IOException
|
public Optional<InputStream> streamTaskReports(String taskid) throws IOException
|
||||||
{
|
{
|
||||||
final String taskKey = getTaskLogKey(taskid, "report.json");
|
final String taskKey = getTaskLogKey(taskid, "report.json");
|
||||||
return streamTaskFile(0, taskKey);
|
return streamTaskFileWithRetry(0, taskKey);
|
||||||
}
|
}
|
||||||
|
|
||||||
@Override
|
@Override
|
||||||
public Optional<InputStream> streamTaskStatus(String taskid) throws IOException
|
public Optional<InputStream> streamTaskStatus(String taskid) throws IOException
|
||||||
{
|
{
|
||||||
final String taskKey = getTaskLogKey(taskid, "status.json");
|
final String taskKey = getTaskLogKey(taskid, "status.json");
|
||||||
return streamTaskFile(0, taskKey);
|
return streamTaskFileWithRetry(0, taskKey);
|
||||||
}
|
}
|
||||||
|
|
||||||
private Optional<InputStream> streamTaskFile(final long offset, String taskKey) throws IOException
|
/**
|
||||||
|
* Using the retry conditions defined in {@link S3Utils#S3RETRY}.
|
||||||
|
*/
|
||||||
|
private Optional<InputStream> streamTaskFileWithRetry(final long offset, String taskKey) throws IOException
|
||||||
|
{
|
||||||
|
try {
|
||||||
|
return S3Utils.retryS3Operation(() -> streamTaskFile(offset, taskKey));
|
||||||
|
}
|
||||||
|
catch (Exception e) {
|
||||||
|
throw new IOE(e, "Failed to stream logs for task[%s] starting at offset[%d]", taskKey, offset);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
private Optional<InputStream> streamTaskFile(final long offset, String taskKey)
|
||||||
{
|
{
|
||||||
try {
|
try {
|
||||||
final ObjectMetadata objectMetadata = service.getObjectMetadata(config.getS3Bucket(), taskKey);
|
final ObjectMetadata objectMetadata = service.getObjectMetadata(config.getS3Bucket(), taskKey);
|
||||||
|
|
||||||
try {
|
|
||||||
final long start;
|
final long start;
|
||||||
final long end = objectMetadata.getContentLength() - 1;
|
final long end = objectMetadata.getContentLength() - 1;
|
||||||
|
|
||||||
if (offset > 0 && offset < objectMetadata.getContentLength()) {
|
long contentLength = objectMetadata.getContentLength();
|
||||||
start = offset;
|
if (offset >= contentLength || offset <= -contentLength) {
|
||||||
} else if (offset < 0 && (-1 * offset) < objectMetadata.getContentLength()) {
|
|
||||||
start = objectMetadata.getContentLength() + offset;
|
|
||||||
} else {
|
|
||||||
start = 0;
|
start = 0;
|
||||||
|
} else if (offset >= 0) {
|
||||||
|
start = offset;
|
||||||
|
} else {
|
||||||
|
start = contentLength + offset;
|
||||||
}
|
}
|
||||||
|
|
||||||
final GetObjectRequest request = new GetObjectRequest(config.getS3Bucket(), taskKey)
|
final GetObjectRequest request = new GetObjectRequest(config.getS3Bucket(), taskKey)
|
||||||
|
@ -107,17 +119,13 @@ public class S3TaskLogs implements TaskLogs
|
||||||
|
|
||||||
return Optional.of(service.getObject(request).getObjectContent());
|
return Optional.of(service.getObject(request).getObjectContent());
|
||||||
}
|
}
|
||||||
catch (AmazonServiceException e) {
|
|
||||||
throw new IOException(e);
|
|
||||||
}
|
|
||||||
}
|
|
||||||
catch (AmazonS3Exception e) {
|
catch (AmazonS3Exception e) {
|
||||||
if (404 == e.getStatusCode()
|
if (404 == e.getStatusCode()
|
||||||
|| "NoSuchKey".equals(e.getErrorCode())
|
|| "NoSuchKey".equals(e.getErrorCode())
|
||||||
|| "NoSuchBucket".equals(e.getErrorCode())) {
|
|| "NoSuchBucket".equals(e.getErrorCode())) {
|
||||||
return Optional.absent();
|
return Optional.absent();
|
||||||
} else {
|
} else {
|
||||||
throw new IOE(e, "Failed to stream logs from: %s", taskKey);
|
throw e;
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
|
@ -21,6 +21,7 @@ package org.apache.druid.storage.s3;
|
||||||
|
|
||||||
import com.amazonaws.SdkClientException;
|
import com.amazonaws.SdkClientException;
|
||||||
import com.amazonaws.services.s3.model.AccessControlList;
|
import com.amazonaws.services.s3.model.AccessControlList;
|
||||||
|
import com.amazonaws.services.s3.model.AmazonS3Exception;
|
||||||
import com.amazonaws.services.s3.model.DeleteObjectsRequest;
|
import com.amazonaws.services.s3.model.DeleteObjectsRequest;
|
||||||
import com.amazonaws.services.s3.model.GetObjectRequest;
|
import com.amazonaws.services.s3.model.GetObjectRequest;
|
||||||
import com.amazonaws.services.s3.model.Grant;
|
import com.amazonaws.services.s3.model.Grant;
|
||||||
|
@ -487,6 +488,45 @@ public class S3TaskLogsTest extends EasyMockSupport
|
||||||
Assert.assertEquals(STATUS_CONTENTS, report);
|
Assert.assertEquals(STATUS_CONTENTS, report);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@Test
|
||||||
|
public void test_retryStatusFetch_whenExceptionThrown() throws IOException
|
||||||
|
{
|
||||||
|
EasyMock.reset(s3Client);
|
||||||
|
// throw exception on first call
|
||||||
|
AmazonS3Exception awsError = new AmazonS3Exception("AWS Error");
|
||||||
|
awsError.setErrorCode("503");
|
||||||
|
awsError.setStatusCode(503);
|
||||||
|
EasyMock.expect(s3Client.getObjectMetadata(EasyMock.anyString(), EasyMock.anyString())).andThrow(awsError);
|
||||||
|
EasyMock.expectLastCall().once();
|
||||||
|
|
||||||
|
String logPath = TEST_PREFIX + "/" + KEY_1 + "/status.json";
|
||||||
|
ObjectMetadata objectMetadata = new ObjectMetadata();
|
||||||
|
objectMetadata.setContentLength(STATUS_CONTENTS.length());
|
||||||
|
EasyMock.expect(s3Client.getObjectMetadata(TEST_BUCKET, logPath)).andReturn(objectMetadata);
|
||||||
|
S3Object s3Object = new S3Object();
|
||||||
|
s3Object.setObjectContent(new ByteArrayInputStream(STATUS_CONTENTS.getBytes(StandardCharsets.UTF_8)));
|
||||||
|
GetObjectRequest getObjectRequest = new GetObjectRequest(TEST_BUCKET, logPath);
|
||||||
|
getObjectRequest.setRange(0, STATUS_CONTENTS.length() - 1);
|
||||||
|
getObjectRequest.withMatchingETagConstraint(objectMetadata.getETag());
|
||||||
|
EasyMock.expect(s3Client.getObject(getObjectRequest)).andReturn(s3Object);
|
||||||
|
EasyMock.expectLastCall().once();
|
||||||
|
|
||||||
|
replayAll();
|
||||||
|
|
||||||
|
S3TaskLogs s3TaskLogs = getS3TaskLogs();
|
||||||
|
|
||||||
|
Optional<InputStream> inputStreamOptional = s3TaskLogs.streamTaskStatus(KEY_1);
|
||||||
|
String report;
|
||||||
|
try (BufferedReader reader = new BufferedReader(new InputStreamReader(
|
||||||
|
inputStreamOptional.get(),
|
||||||
|
StandardCharsets.UTF_8
|
||||||
|
))) {
|
||||||
|
report = reader.lines().collect(Collectors.joining("\n"));
|
||||||
|
}
|
||||||
|
|
||||||
|
Assert.assertEquals(STATUS_CONTENTS, report);
|
||||||
|
}
|
||||||
|
|
||||||
@Nonnull
|
@Nonnull
|
||||||
private S3TaskLogs getS3TaskLogs()
|
private S3TaskLogs getS3TaskLogs()
|
||||||
{
|
{
|
||||||
|
|
Loading…
Reference in New Issue