YARN-8672. TestContainerManager#testLocalingResourceWhileContainerRunning occasionally times out. Contributed by Chandni Singh and Jim Brennan.
This commit is contained in:
parent
5cca5ca81b
commit
ab29b54b19
|
@ -72,6 +72,7 @@ public abstract class ContainerExecutor implements Configurable {
|
|||
private static final Logger LOG =
|
||||
LoggerFactory.getLogger(ContainerExecutor.class);
|
||||
protected static final String WILDCARD = "*";
|
||||
public static final String TOKEN_FILE_NAME_FMT = "%s.tokens";
|
||||
|
||||
/**
|
||||
* The permissions to use when creating the launch script.
|
||||
|
|
|
@ -159,8 +159,7 @@ public class DefaultContainerExecutor extends ContainerExecutor {
|
|||
// randomly choose the local directory
|
||||
Path appStorageDir = getWorkingDir(localDirs, user, appId);
|
||||
|
||||
String tokenFn =
|
||||
String.format(ContainerLocalizer.TOKEN_FILE_NAME_FMT, locId);
|
||||
String tokenFn = String.format(TOKEN_FILE_NAME_FMT, locId);
|
||||
Path tokenDst = new Path(appStorageDir, tokenFn);
|
||||
copyFile(nmPrivateContainerTokensPath, tokenDst, user);
|
||||
LOG.info("Copying from " + nmPrivateContainerTokensPath
|
||||
|
@ -175,7 +174,8 @@ public class DefaultContainerExecutor extends ContainerExecutor {
|
|||
+ localizerFc.getWorkingDirectory());
|
||||
|
||||
ContainerLocalizer localizer =
|
||||
createContainerLocalizer(user, appId, locId, localDirs, localizerFc);
|
||||
createContainerLocalizer(user, appId, locId, tokenFn, localDirs,
|
||||
localizerFc);
|
||||
// TODO: DO it over RPC for maintaining similarity?
|
||||
localizer.runLocalization(nmAddr);
|
||||
}
|
||||
|
@ -199,10 +199,10 @@ public class DefaultContainerExecutor extends ContainerExecutor {
|
|||
@Private
|
||||
@VisibleForTesting
|
||||
protected ContainerLocalizer createContainerLocalizer(String user,
|
||||
String appId, String locId, List<String> localDirs,
|
||||
String appId, String locId, String tokenFileName, List<String> localDirs,
|
||||
FileContext localizerFc) throws IOException {
|
||||
ContainerLocalizer localizer =
|
||||
new ContainerLocalizer(localizerFc, user, appId, locId,
|
||||
new ContainerLocalizer(localizerFc, user, appId, locId, tokenFileName,
|
||||
getPaths(localDirs),
|
||||
RecordFactoryProvider.getRecordFactory(getConf()));
|
||||
return localizer;
|
||||
|
|
|
@ -146,8 +146,9 @@ public class DockerContainerExecutor extends ContainerExecutor {
|
|||
List<String> logDirs = dirsHandler.getLogDirs();
|
||||
|
||||
ContainerLocalizer localizer =
|
||||
new ContainerLocalizer(lfs, user, appId, locId, getPaths(localDirs),
|
||||
RecordFactoryProvider.getRecordFactory(getConf()));
|
||||
new ContainerLocalizer(lfs, user, appId, locId,
|
||||
nmPrivateContainerTokensPath.getName(), getPaths(localDirs),
|
||||
RecordFactoryProvider.getRecordFactory(getConf()));
|
||||
|
||||
createUserLocalDirs(localDirs, user);
|
||||
createUserCacheDirs(localDirs, user);
|
||||
|
@ -158,7 +159,7 @@ public class DockerContainerExecutor extends ContainerExecutor {
|
|||
Path appStorageDir = getWorkingDir(localDirs, user, appId);
|
||||
|
||||
String tokenFn =
|
||||
String.format(ContainerLocalizer.TOKEN_FILE_NAME_FMT, locId);
|
||||
String.format(ContainerExecutor.TOKEN_FILE_NAME_FMT, locId);
|
||||
Path tokenDst = new Path(appStorageDir, tokenFn);
|
||||
copyFile(nmPrivateContainerTokensPath, tokenDst, user);
|
||||
LOG.info("Copying from " + nmPrivateContainerTokensPath + " to " + tokenDst);
|
||||
|
|
|
@ -383,8 +383,8 @@ public class LinuxContainerExecutor extends ContainerExecutor {
|
|||
|
||||
List<String> localizerArgs = new ArrayList<>();
|
||||
|
||||
buildMainArgs(localizerArgs, user, appId, locId, nmAddr, localDirs);
|
||||
|
||||
buildMainArgs(localizerArgs, user, appId, locId, nmAddr,
|
||||
nmPrivateContainerTokensPath.getName(), localDirs);
|
||||
Path containerLogDir = getContainerLogDir(dirsHandler, appId, locId);
|
||||
localizerArgs = replaceWithContainerLogDir(localizerArgs, containerLogDir);
|
||||
|
||||
|
@ -442,9 +442,10 @@ public class LinuxContainerExecutor extends ContainerExecutor {
|
|||
*/
|
||||
@VisibleForTesting
|
||||
public void buildMainArgs(List<String> command, String user, String appId,
|
||||
String locId, InetSocketAddress nmAddr, List<String> localDirs) {
|
||||
String locId, InetSocketAddress nmAddr, String tokenFileName,
|
||||
List<String> localDirs) {
|
||||
ContainerLocalizer.buildMainArgs(command, user, appId, locId, nmAddr,
|
||||
localDirs, super.getConf());
|
||||
tokenFileName, localDirs, super.getConf());
|
||||
}
|
||||
|
||||
@Override
|
||||
|
|
|
@ -663,8 +663,8 @@ public class WindowsSecureContainerExecutor extends DefaultContainerExecutor {
|
|||
|
||||
Path appStorageDir = getWorkingDir(localDirs, user, appId);
|
||||
|
||||
String tokenFn = String.format(
|
||||
ContainerLocalizer.TOKEN_FILE_NAME_FMT, locId);
|
||||
String tokenFn = String.format(ContainerExecutor.TOKEN_FILE_NAME_FMT,
|
||||
locId);
|
||||
Path tokenDst = new Path(appStorageDir, tokenFn);
|
||||
copyFile(nmPrivateContainerTokensPath, tokenDst, user);
|
||||
|
||||
|
@ -702,7 +702,7 @@ public class WindowsSecureContainerExecutor extends DefaultContainerExecutor {
|
|||
command.addAll(ContainerLocalizer.getJavaOpts(getConf()));
|
||||
|
||||
ContainerLocalizer.buildMainArgs(command, user, appId, locId, nmAddr,
|
||||
localDirs, super.getConf());
|
||||
tokenFn, localDirs, super.getConf());
|
||||
|
||||
String cmdLine = StringUtils.join(command, " ");
|
||||
|
||||
|
|
|
@ -20,6 +20,7 @@ package org.apache.hadoop.yarn.server.nodemanager.containermanager.launcher;
|
|||
|
||||
import static org.apache.hadoop.fs.CreateFlag.CREATE;
|
||||
import static org.apache.hadoop.fs.CreateFlag.OVERWRITE;
|
||||
import static org.apache.hadoop.yarn.server.nodemanager.ContainerExecutor.TOKEN_FILE_NAME_FMT;
|
||||
import org.slf4j.Logger;
|
||||
import org.slf4j.LoggerFactory;
|
||||
|
||||
|
@ -220,8 +221,7 @@ public class ContainerLaunch implements Callable<Integer> {
|
|||
+ CONTAINER_SCRIPT);
|
||||
Path nmPrivateTokensPath = dirsHandler.getLocalPathForWrite(
|
||||
getContainerPrivateDir(appIdStr, containerIdStr) + Path.SEPARATOR
|
||||
+ String.format(ContainerLocalizer.TOKEN_FILE_NAME_FMT,
|
||||
containerIdStr));
|
||||
+ String.format(TOKEN_FILE_NAME_FMT, containerIdStr));
|
||||
Path nmPrivateClasspathJarDir = dirsHandler.getLocalPathForWrite(
|
||||
getContainerPrivateDir(appIdStr, containerIdStr));
|
||||
|
||||
|
|
|
@ -32,7 +32,6 @@ import org.apache.hadoop.yarn.server.nodemanager.containermanager.application.Ap
|
|||
import org.apache.hadoop.yarn.server.nodemanager.containermanager.container.Container;
|
||||
import org.apache.hadoop.yarn.server.nodemanager.containermanager.container.ContainerEventType;
|
||||
import org.apache.hadoop.yarn.server.nodemanager.containermanager.container.ContainerExitEvent;
|
||||
import org.apache.hadoop.yarn.server.nodemanager.containermanager.localizer.ContainerLocalizer;
|
||||
import org.apache.hadoop.yarn.server.nodemanager.executor.ContainerStartContext;
|
||||
import org.apache.hadoop.yarn.server.nodemanager.executor.DeletionAsUserContext;
|
||||
import org.slf4j.Logger;
|
||||
|
@ -176,7 +175,7 @@ public class ContainerRelaunch extends ContainerLaunch {
|
|||
String containerIdStr) throws IOException {
|
||||
return dirsHandler.getLocalPathForRead(
|
||||
getContainerPrivateDir(appIdStr, containerIdStr) + Path.SEPARATOR
|
||||
+ String.format(ContainerLocalizer.TOKEN_FILE_NAME_FMT,
|
||||
+ String.format(ContainerExecutor.TOKEN_FILE_NAME_FMT,
|
||||
containerIdStr));
|
||||
}
|
||||
|
||||
|
|
|
@ -17,6 +17,7 @@
|
|||
*/
|
||||
package org.apache.hadoop.yarn.server.nodemanager.containermanager.localizer;
|
||||
|
||||
import com.google.common.base.Preconditions;
|
||||
import java.io.DataInputStream;
|
||||
import java.io.File;
|
||||
import java.io.IOException;
|
||||
|
@ -92,9 +93,6 @@ public class ContainerLocalizer {
|
|||
public static final String FILECACHE = "filecache";
|
||||
public static final String APPCACHE = "appcache";
|
||||
public static final String USERCACHE = "usercache";
|
||||
public static final String OUTPUTDIR = "output";
|
||||
public static final String TOKEN_FILE_NAME_FMT = "%s.tokens";
|
||||
public static final String WORKDIR = "work";
|
||||
private static final String APPCACHE_CTXT_FMT = "%s.app.cache.dirs";
|
||||
private static final String USERCACHE_CTXT_FMT = "%s.user.cache.dirs";
|
||||
private static final FsPermission FILECACHE_PERMS =
|
||||
|
@ -115,9 +113,10 @@ public class ContainerLocalizer {
|
|||
|
||||
private Set<Thread> localizingThreads =
|
||||
Collections.synchronizedSet(new HashSet<Thread>());
|
||||
private final String tokenFileName;
|
||||
|
||||
public ContainerLocalizer(FileContext lfs, String user, String appId,
|
||||
String localizerId, List<Path> localDirs,
|
||||
String localizerId, String tokenFileName, List<Path> localDirs,
|
||||
RecordFactory recordFactory) throws IOException {
|
||||
if (null == user) {
|
||||
throw new IOException("Cannot initialize for null user");
|
||||
|
@ -139,6 +138,8 @@ public class ContainerLocalizer {
|
|||
" is loaded.");
|
||||
this.appCacheDirContextName = String.format(APPCACHE_CTXT_FMT, appId);
|
||||
this.pendingResources = new HashMap<LocalResource,Future<Path>>();
|
||||
this.tokenFileName = Preconditions.checkNotNull(tokenFileName,
|
||||
"token file name cannot be null");
|
||||
}
|
||||
|
||||
@Private
|
||||
|
@ -159,8 +160,7 @@ public class ContainerLocalizer {
|
|||
try {
|
||||
// assume credentials in cwd
|
||||
// TODO: Fix
|
||||
Path tokenPath =
|
||||
new Path(String.format(TOKEN_FILE_NAME_FMT, localizerId));
|
||||
Path tokenPath = new Path(tokenFileName);
|
||||
credFile = lfs.open(tokenPath);
|
||||
creds.readTokenStorageStream(credFile);
|
||||
// Explicitly deleting token file.
|
||||
|
@ -408,7 +408,9 @@ public class ContainerLocalizer {
|
|||
*/
|
||||
public static void buildMainArgs(List<String> command,
|
||||
String user, String appId, String locId,
|
||||
InetSocketAddress nmAddr, List<String> localDirs, Configuration conf) {
|
||||
InetSocketAddress nmAddr,
|
||||
String tokenFileName,
|
||||
List<String> localDirs, Configuration conf) {
|
||||
|
||||
String logLevel = conf.get(YarnConfiguration.
|
||||
NM_CONTAINER_LOCALIZER_LOG_LEVEL,
|
||||
|
@ -420,6 +422,7 @@ public class ContainerLocalizer {
|
|||
command.add(locId);
|
||||
command.add(nmAddr.getHostName());
|
||||
command.add(Integer.toString(nmAddr.getPort()));
|
||||
command.add(tokenFileName);
|
||||
for(String dir : localDirs) {
|
||||
command.add(dir);
|
||||
}
|
||||
|
@ -450,8 +453,9 @@ public class ContainerLocalizer {
|
|||
String locId = argv[2];
|
||||
InetSocketAddress nmAddr =
|
||||
new InetSocketAddress(argv[3], Integer.parseInt(argv[4]));
|
||||
String[] sLocaldirs = Arrays.copyOfRange(argv, 5, argv.length);
|
||||
ArrayList<Path> localDirs = new ArrayList<Path>(sLocaldirs.length);
|
||||
String tokenFileName = argv[5];
|
||||
String[] sLocaldirs = Arrays.copyOfRange(argv, 6, argv.length);
|
||||
ArrayList<Path> localDirs = new ArrayList<>(sLocaldirs.length);
|
||||
for (String sLocaldir : sLocaldirs) {
|
||||
localDirs.add(new Path(sLocaldir));
|
||||
}
|
||||
|
@ -463,12 +467,11 @@ public class ContainerLocalizer {
|
|||
LOG.warn("Localization running as " + uid + " not " + user);
|
||||
}
|
||||
|
||||
ContainerLocalizer localizer =
|
||||
new ContainerLocalizer(FileContext.getLocalFSFileContext(), user,
|
||||
appId, locId, localDirs,
|
||||
ContainerLocalizer localizer = new ContainerLocalizer(
|
||||
FileContext.getLocalFSFileContext(), user,
|
||||
appId, locId, tokenFileName, localDirs,
|
||||
RecordFactoryProvider.getRecordFactory(null));
|
||||
localizer.runLocalization(nmAddr);
|
||||
return;
|
||||
} catch (Throwable e) {
|
||||
// Print traces to stdout so that they can be logged by the NM address
|
||||
// space in both DefaultCE and LCE cases
|
||||
|
|
|
@ -996,6 +996,8 @@ public class ResourceLocalizationService extends CompositeService
|
|||
private final RecordFactory recordFactory =
|
||||
RecordFactoryProvider.getRecordFactory(getConfig());
|
||||
|
||||
private final String tokenFileName;
|
||||
|
||||
LocalizerRunner(LocalizerContext context, String localizerId) {
|
||||
super("LocalizerRunner for " + localizerId);
|
||||
this.context = context;
|
||||
|
@ -1003,8 +1005,9 @@ public class ResourceLocalizationService extends CompositeService
|
|||
this.pending =
|
||||
Collections
|
||||
.synchronizedList(new ArrayList<LocalizerResourceRequestEvent>());
|
||||
this.scheduled =
|
||||
new HashMap<LocalResourceRequest, LocalizerResourceRequestEvent>();
|
||||
this.scheduled = new HashMap<>();
|
||||
tokenFileName = String.format(ContainerExecutor.TOKEN_FILE_NAME_FMT,
|
||||
localizerId + Long.toHexString(System.currentTimeMillis()));
|
||||
}
|
||||
|
||||
public void addResource(LocalizerResourceRequestEvent request) {
|
||||
|
@ -1199,11 +1202,8 @@ public class ResourceLocalizationService extends CompositeService
|
|||
Throwable exception = null;
|
||||
try {
|
||||
// Get nmPrivateDir
|
||||
nmPrivateCTokensPath =
|
||||
dirsHandler.getLocalPathForWrite(
|
||||
NM_PRIVATE_DIR + Path.SEPARATOR
|
||||
+ String.format(ContainerLocalizer.TOKEN_FILE_NAME_FMT,
|
||||
localizerId));
|
||||
nmPrivateCTokensPath = dirsHandler.getLocalPathForWrite(
|
||||
NM_PRIVATE_DIR + Path.SEPARATOR + tokenFileName);
|
||||
|
||||
// 0) init queue, etc.
|
||||
// 1) write credentials to private dir
|
||||
|
|
|
@ -412,14 +412,15 @@ public class TestDefaultContainerExecutor {
|
|||
spy(new DefaultContainerExecutor(mockLfs) {
|
||||
@Override
|
||||
public ContainerLocalizer createContainerLocalizer(String user,
|
||||
String appId, String locId, List<String> localDirs,
|
||||
FileContext localizerFc) throws IOException {
|
||||
String appId, String locId, String tokenFileName,
|
||||
List<String> localDirs, FileContext localizerFc)
|
||||
throws IOException {
|
||||
|
||||
// Spy on the localizer and make it return valid heart-beat
|
||||
// responses even though there is no real NodeManager.
|
||||
ContainerLocalizer localizer =
|
||||
super.createContainerLocalizer(user, appId, locId, localDirs,
|
||||
localizerFc);
|
||||
super.createContainerLocalizer(user, appId, locId,
|
||||
tokenFileName, localDirs, localizerFc);
|
||||
ContainerLocalizer spyLocalizer = spy(localizer);
|
||||
LocalizationProtocol nmProxy = mock(LocalizationProtocol.class);
|
||||
try {
|
||||
|
|
|
@ -353,7 +353,7 @@ public class TestLinuxContainerExecutor {
|
|||
dirsHandler
|
||||
.getLocalPathForWrite(ResourceLocalizationService.NM_PRIVATE_DIR
|
||||
+ Path.SEPARATOR
|
||||
+ String.format(ContainerLocalizer.TOKEN_FILE_NAME_FMT, locId));
|
||||
+ String.format(ContainerExecutor.TOKEN_FILE_NAME_FMT, locId));
|
||||
files.create(nmPrivateContainerTokensPath, EnumSet.of(CREATE, OVERWRITE));
|
||||
Configuration config = new YarnConfiguration(conf);
|
||||
InetSocketAddress nmAddr =
|
||||
|
@ -366,7 +366,7 @@ public class TestLinuxContainerExecutor {
|
|||
@Override
|
||||
public void buildMainArgs(List<String> command, String user,
|
||||
String appId, String locId, InetSocketAddress nmAddr,
|
||||
List<String> localDirs) {
|
||||
String tokenFileName, List<String> localDirs) {
|
||||
MockContainerLocalizer.buildMainArgs(command, user, appId, locId,
|
||||
nmAddr, localDirs);
|
||||
}
|
||||
|
@ -387,7 +387,7 @@ public class TestLinuxContainerExecutor {
|
|||
dirsHandler
|
||||
.getLocalPathForWrite(ResourceLocalizationService.NM_PRIVATE_DIR
|
||||
+ Path.SEPARATOR
|
||||
+ String.format(ContainerLocalizer.TOKEN_FILE_NAME_FMT, locId2));
|
||||
+ String.format(ContainerExecutor.TOKEN_FILE_NAME_FMT, locId2));
|
||||
files.create(nmPrivateContainerTokensPath2, EnumSet.of(CREATE, OVERWRITE));
|
||||
exec.startLocalizer(new LocalizerStartContext.Builder()
|
||||
.setNmPrivateContainerTokens(nmPrivateContainerTokensPath2)
|
||||
|
|
|
@ -268,7 +268,7 @@ public class TestLinuxContainerExecutorWithMocks {
|
|||
.build());
|
||||
|
||||
List<String> result=readMockParams();
|
||||
Assert.assertEquals(result.size(), 25);
|
||||
Assert.assertEquals(result.size(), 26);
|
||||
Assert.assertEquals(result.get(0), YarnConfiguration.DEFAULT_NM_NONSECURE_MODE_LOCAL_USER);
|
||||
Assert.assertEquals(result.get(1), "test");
|
||||
Assert.assertEquals(result.get(2), "0" );
|
||||
|
@ -294,6 +294,7 @@ public class TestLinuxContainerExecutorWithMocks {
|
|||
Assert.assertEquals(result.get(21), "12345");
|
||||
Assert.assertEquals(result.get(22), "localhost");
|
||||
Assert.assertEquals(result.get(23), "8040");
|
||||
Assert.assertEquals(result.get(24), "nmPrivateCTokensPath");
|
||||
|
||||
} catch (InterruptedException e) {
|
||||
LOG.error("Error:"+e.getMessage(),e);
|
||||
|
|
|
@ -1201,7 +1201,7 @@ public class TestContainerManager extends BaseContainerManagerTest {
|
|||
// While the container is running, localize new resources.
|
||||
// Verify the symlink is created properly
|
||||
@Test
|
||||
public void testLocalingResourceWhileContainerRunning() throws Exception {
|
||||
public void testLocalizingResourceWhileContainerRunning() throws Exception {
|
||||
// Real del service
|
||||
delSrvc = new DeletionService(exec);
|
||||
delSrvc.init(conf);
|
||||
|
|
|
@ -37,6 +37,8 @@ import static org.mockito.Mockito.spy;
|
|||
import static org.mockito.Mockito.times;
|
||||
import static org.mockito.Mockito.verify;
|
||||
import static org.mockito.Mockito.when;
|
||||
|
||||
import org.apache.hadoop.yarn.server.nodemanager.ContainerExecutor;
|
||||
import org.slf4j.Logger;
|
||||
import org.slf4j.LoggerFactory;
|
||||
|
||||
|
@ -453,7 +455,9 @@ public class TestContainerLocalizer {
|
|||
FakeContainerLocalizer(FileContext lfs, String user, String appId,
|
||||
String localizerId, List<Path> localDirs,
|
||||
RecordFactory recordFactory) throws IOException {
|
||||
super(lfs, user, appId, localizerId, localDirs, recordFactory);
|
||||
super(lfs, user, appId, localizerId,
|
||||
String.format(ContainerExecutor.TOKEN_FILE_NAME_FMT, containerId),
|
||||
localDirs, recordFactory);
|
||||
}
|
||||
|
||||
FakeLongDownload getDownloader() {
|
||||
|
@ -529,7 +533,7 @@ public class TestContainerLocalizer {
|
|||
DataInputBuffer appTokens = createFakeCredentials(random, 10);
|
||||
tokenPath =
|
||||
lfs.makeQualified(new Path(
|
||||
String.format(ContainerLocalizer.TOKEN_FILE_NAME_FMT,
|
||||
String.format(ContainerExecutor.TOKEN_FILE_NAME_FMT,
|
||||
containerId)));
|
||||
doReturn(new FSDataInputStream(new FakeFSDataInputStream(appTokens))
|
||||
).when(spylfs).open(tokenPath);
|
||||
|
@ -661,7 +665,8 @@ static DataInputBuffer createFakeCredentials(Random r, int nTok)
|
|||
RecordFactory recordFactory = mock(RecordFactory.class);
|
||||
ContainerLocalizer localizer = new ContainerLocalizer(lfs,
|
||||
UserGroupInformation.getCurrentUser().getUserName(), "application_01",
|
||||
"container_01", new ArrayList<Path>(), recordFactory);
|
||||
"container_01", String.format(ContainerExecutor.TOKEN_FILE_NAME_FMT,
|
||||
"container_01"), new ArrayList<Path>(), recordFactory);
|
||||
LocalResource rsrc = mock(LocalResource.class);
|
||||
when(rsrc.getVisibility()).thenReturn(LocalResourceVisibility.PRIVATE);
|
||||
Path destDirPath = new Path(fileCacheDir, "0/0/85");
|
||||
|
|
Loading…
Reference in New Issue