YARN-3925. ContainerLogsUtils#getContainerLogFile fails to read container log files from full disks. Contributed by zhihai xu
This commit is contained in:
parent
83fe34ac08
commit
ff9c13e0a7
|
@ -716,6 +716,8 @@ Release 2.7.2 - UNRELEASED
|
||||||
YARN-3969. Allow jobs to be submitted to reservation that is active
|
YARN-3969. Allow jobs to be submitted to reservation that is active
|
||||||
but does not have any allocations. (subru via curino)
|
but does not have any allocations. (subru via curino)
|
||||||
|
|
||||||
|
YARN-3925. ContainerLogsUtils#getContainerLogFile fails to read container
|
||||||
|
log files from full disks. (zhihai xu via jlowe)
|
||||||
|
|
||||||
Release 2.7.1 - 2015-07-06
|
Release 2.7.1 - 2015-07-06
|
||||||
|
|
||||||
|
|
|
@ -18,6 +18,7 @@
|
||||||
|
|
||||||
package org.apache.hadoop.yarn.server.nodemanager;
|
package org.apache.hadoop.yarn.server.nodemanager;
|
||||||
|
|
||||||
|
import java.io.File;
|
||||||
import java.io.IOException;
|
import java.io.IOException;
|
||||||
import java.net.URI;
|
import java.net.URI;
|
||||||
import java.util.ArrayList;
|
import java.util.ArrayList;
|
||||||
|
@ -31,6 +32,7 @@ import org.apache.commons.logging.Log;
|
||||||
import org.apache.commons.logging.LogFactory;
|
import org.apache.commons.logging.LogFactory;
|
||||||
import org.apache.hadoop.conf.Configuration;
|
import org.apache.hadoop.conf.Configuration;
|
||||||
import org.apache.hadoop.fs.FileContext;
|
import org.apache.hadoop.fs.FileContext;
|
||||||
|
import org.apache.hadoop.fs.FileSystem;
|
||||||
import org.apache.hadoop.fs.LocalDirAllocator;
|
import org.apache.hadoop.fs.LocalDirAllocator;
|
||||||
import org.apache.hadoop.fs.Path;
|
import org.apache.hadoop.fs.Path;
|
||||||
import org.apache.hadoop.fs.permission.FsPermission;
|
import org.apache.hadoop.fs.permission.FsPermission;
|
||||||
|
@ -467,6 +469,35 @@ public class LocalDirsHandlerService extends AbstractService {
|
||||||
return disksTurnedGood;
|
return disksTurnedGood;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
private Path getPathToRead(String pathStr, List<String> dirs)
|
||||||
|
throws IOException {
|
||||||
|
// remove the leading slash from the path (to make sure that the uri
|
||||||
|
// resolution results in a valid path on the dir being checked)
|
||||||
|
if (pathStr.startsWith("/")) {
|
||||||
|
pathStr = pathStr.substring(1);
|
||||||
|
}
|
||||||
|
|
||||||
|
FileSystem localFS = FileSystem.getLocal(getConfig());
|
||||||
|
for (String dir : dirs) {
|
||||||
|
try {
|
||||||
|
Path tmpDir = new Path(dir);
|
||||||
|
File tmpFile = tmpDir.isAbsolute()
|
||||||
|
? new File(localFS.makeQualified(tmpDir).toUri())
|
||||||
|
: new File(dir);
|
||||||
|
Path file = new Path(tmpFile.getPath(), pathStr);
|
||||||
|
if (localFS.exists(file)) {
|
||||||
|
return file;
|
||||||
|
}
|
||||||
|
} catch (IOException ie) {
|
||||||
|
// ignore
|
||||||
|
LOG.warn("Failed to find " + pathStr + " at " + dir, ie);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
throw new IOException("Could not find " + pathStr + " in any of" +
|
||||||
|
" the directories");
|
||||||
|
}
|
||||||
|
|
||||||
public Path getLocalPathForWrite(String pathStr) throws IOException {
|
public Path getLocalPathForWrite(String pathStr) throws IOException {
|
||||||
return localDirsAllocator.getLocalPathForWrite(pathStr, getConfig());
|
return localDirsAllocator.getLocalPathForWrite(pathStr, getConfig());
|
||||||
}
|
}
|
||||||
|
@ -484,7 +515,7 @@ public class LocalDirsHandlerService extends AbstractService {
|
||||||
}
|
}
|
||||||
|
|
||||||
public Path getLogPathToRead(String pathStr) throws IOException {
|
public Path getLogPathToRead(String pathStr) throws IOException {
|
||||||
return logDirsAllocator.getLocalPathToRead(pathStr, getConfig());
|
return getPathToRead(pathStr, getLogDirsForRead());
|
||||||
}
|
}
|
||||||
|
|
||||||
public static String[] validatePaths(String[] paths) {
|
public static String[] validatePaths(String[] paths) {
|
||||||
|
|
|
@ -39,6 +39,7 @@ import java.util.concurrent.ConcurrentMap;
|
||||||
|
|
||||||
import org.apache.hadoop.conf.Configuration;
|
import org.apache.hadoop.conf.Configuration;
|
||||||
import org.apache.hadoop.fs.CommonConfigurationKeysPublic;
|
import org.apache.hadoop.fs.CommonConfigurationKeysPublic;
|
||||||
|
import org.apache.hadoop.fs.FileUtil;
|
||||||
import org.apache.hadoop.fs.Path;
|
import org.apache.hadoop.fs.Path;
|
||||||
import org.apache.hadoop.io.nativeio.NativeIO;
|
import org.apache.hadoop.io.nativeio.NativeIO;
|
||||||
import org.apache.hadoop.security.UserGroupInformation;
|
import org.apache.hadoop.security.UserGroupInformation;
|
||||||
|
@ -63,6 +64,7 @@ import org.apache.hadoop.yarn.server.nodemanager.NodeManager.NMContext;
|
||||||
import org.apache.hadoop.yarn.server.nodemanager.containermanager.application.Application;
|
import org.apache.hadoop.yarn.server.nodemanager.containermanager.application.Application;
|
||||||
import org.apache.hadoop.yarn.server.nodemanager.containermanager.container.Container;
|
import org.apache.hadoop.yarn.server.nodemanager.containermanager.container.Container;
|
||||||
import org.apache.hadoop.yarn.server.nodemanager.containermanager.container.ContainerState;
|
import org.apache.hadoop.yarn.server.nodemanager.containermanager.container.ContainerState;
|
||||||
|
import org.apache.hadoop.yarn.server.nodemanager.containermanager.launcher.ContainerLaunch;
|
||||||
import org.apache.hadoop.yarn.server.nodemanager.recovery.NMNullStateStoreService;
|
import org.apache.hadoop.yarn.server.nodemanager.recovery.NMNullStateStoreService;
|
||||||
import org.apache.hadoop.yarn.server.nodemanager.webapp.ContainerLogsPage.ContainersLogsBlock;
|
import org.apache.hadoop.yarn.server.nodemanager.webapp.ContainerLogsPage.ContainersLogsBlock;
|
||||||
import org.apache.hadoop.yarn.server.security.ApplicationACLsManager;
|
import org.apache.hadoop.yarn.server.security.ApplicationACLsManager;
|
||||||
|
@ -144,6 +146,52 @@ public class TestContainerLogsPage {
|
||||||
Assert.assertTrue(dirs.contains(containerLogDir));
|
Assert.assertTrue(dirs.contains(containerLogDir));
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@Test(timeout=30000)
|
||||||
|
public void testContainerLogFile() throws IOException, YarnException {
|
||||||
|
File absLogDir = new File("target",
|
||||||
|
TestNMWebServer.class.getSimpleName() + "LogDir").getAbsoluteFile();
|
||||||
|
String logdirwithFile = absLogDir.toURI().toString();
|
||||||
|
Configuration conf = new Configuration();
|
||||||
|
conf.set(YarnConfiguration.NM_LOG_DIRS, logdirwithFile);
|
||||||
|
conf.setFloat(YarnConfiguration.NM_MAX_PER_DISK_UTILIZATION_PERCENTAGE,
|
||||||
|
0.0f);
|
||||||
|
LocalDirsHandlerService dirsHandler = new LocalDirsHandlerService();
|
||||||
|
dirsHandler.init(conf);
|
||||||
|
NMContext nmContext = new NodeManager.NMContext(null, null, dirsHandler,
|
||||||
|
new ApplicationACLsManager(conf), new NMNullStateStoreService());
|
||||||
|
// Add an application and the corresponding containers
|
||||||
|
String user = "nobody";
|
||||||
|
long clusterTimeStamp = 1234;
|
||||||
|
ApplicationId appId = BuilderUtils.newApplicationId(
|
||||||
|
clusterTimeStamp, 1);
|
||||||
|
Application app = mock(Application.class);
|
||||||
|
when(app.getUser()).thenReturn(user);
|
||||||
|
when(app.getAppId()).thenReturn(appId);
|
||||||
|
ApplicationAttemptId appAttemptId = BuilderUtils.newApplicationAttemptId(
|
||||||
|
appId, 1);
|
||||||
|
ContainerId containerId = BuilderUtils.newContainerId(
|
||||||
|
appAttemptId, 1);
|
||||||
|
nmContext.getApplications().put(appId, app);
|
||||||
|
|
||||||
|
MockContainer container =
|
||||||
|
new MockContainer(appAttemptId, new AsyncDispatcher(), conf, user,
|
||||||
|
appId, 1);
|
||||||
|
container.setState(ContainerState.RUNNING);
|
||||||
|
nmContext.getContainers().put(containerId, container);
|
||||||
|
File containerLogDir = new File(absLogDir,
|
||||||
|
ContainerLaunch.getRelativeContainerLogDir(appId.toString(),
|
||||||
|
containerId.toString()));
|
||||||
|
containerLogDir.mkdirs();
|
||||||
|
String fileName = "fileName";
|
||||||
|
File containerLogFile = new File(containerLogDir, fileName);
|
||||||
|
containerLogFile.createNewFile();
|
||||||
|
File file = ContainerLogsUtils.getContainerLogFile(containerId,
|
||||||
|
fileName, user, nmContext);
|
||||||
|
Assert.assertEquals(containerLogFile.toURI().toString(),
|
||||||
|
file.toURI().toString());
|
||||||
|
FileUtil.fullyDelete(absLogDir);
|
||||||
|
}
|
||||||
|
|
||||||
@Test(timeout = 10000)
|
@Test(timeout = 10000)
|
||||||
public void testContainerLogPageAccess() throws IOException {
|
public void testContainerLogPageAccess() throws IOException {
|
||||||
// SecureIOUtils require Native IO to be enabled. This test will run
|
// SecureIOUtils require Native IO to be enabled. This test will run
|
||||||
|
|
Loading…
Reference in New Issue