YARN-3637. Handle localization sym-linking correctly at the YARN level. Contributed by Chris Trezzo.

(cherry picked from commit 425a7e5028)
This commit is contained in:
Sangjin Lee 2017-01-25 15:51:36 -08:00
parent c4d3b28c2d
commit b799ea7641
3 changed files with 81 additions and 10 deletions

View File

@ -63,14 +63,29 @@ public abstract class SharedCacheClient extends AbstractService {
* exist, null is returned instead. * exist, null is returned instead.
* </p> * </p>
* *
* <p>
* Once a path has been returned for a resource, that path is safe to use for
* the lifetime of the application that corresponds to the provided
* ApplicationId.
* </p>
*
* <p>
* Additionally, a name for the resource should be specified. A fragment will
* be added to the path with the desired name if the desired name is different
* than the name of the provided path from the shared cache. This ensures that
* if the returned path is used to create a LocalResource, then the symlink
* created during YARN localization will match the name specified.
* </p>
*
* @param applicationId ApplicationId of the application using the resource * @param applicationId ApplicationId of the application using the resource
* @param resourceKey the key (i.e. checksum) that identifies the resource * @param resourceKey the key (i.e. checksum) that identifies the resource
* @param resourceName the desired name of the resource
* @return Path to the resource, or null if it does not exist * @return Path to the resource, or null if it does not exist
*/ */
@Public @Public
@Unstable @Unstable
public abstract Path use(ApplicationId applicationId, String resourceKey) public abstract Path use(ApplicationId applicationId, String resourceKey,
throws YarnException; String resourceName) throws YarnException;
/** /**
* <p> * <p>

View File

@ -21,6 +21,8 @@ package org.apache.hadoop.yarn.client.api.impl;
import java.io.IOException; import java.io.IOException;
import java.net.InetSocketAddress; import java.net.InetSocketAddress;
import java.net.URI;
import java.net.URISyntaxException;
import org.apache.commons.logging.Log; import org.apache.commons.logging.Log;
import org.apache.commons.logging.LogFactory; import org.apache.commons.logging.LogFactory;
@ -111,8 +113,8 @@ public class SharedCacheClientImpl extends SharedCacheClient {
} }
@Override @Override
public Path use(ApplicationId applicationId, String resourceKey) public Path use(ApplicationId applicationId, String resourceKey,
throws YarnException { String resourceName) throws YarnException {
Path resourcePath = null; Path resourcePath = null;
UseSharedCacheResourceRequest request = Records.newRecord( UseSharedCacheResourceRequest request = Records.newRecord(
UseSharedCacheResourceRequest.class); UseSharedCacheResourceRequest.class);
@ -129,6 +131,31 @@ public class SharedCacheClientImpl extends SharedCacheClient {
// We don't handle different exceptions separately at this point. // We don't handle different exceptions separately at this point.
throw new YarnException(e); throw new YarnException(e);
} }
if (resourcePath != null) {
if (resourcePath.getName().equals(resourceName)) {
// The preferred name is the same as the name of the item in the cache,
// so we skip generating the fragment to save space in the MRconfig.
return resourcePath;
} else {
// We are using the shared cache, and a preferred name has been
// specified that is different than the name of the resource in the
// shared cache. We need to set the fragment portion of the URI to
// preserve the desired name.
URI pathURI = resourcePath.toUri();
try {
// We assume that there is no existing fragment in the URI since the
// shared cache manager does not use fragments.
pathURI =
new URI(pathURI.getScheme(), pathURI.getSchemeSpecificPart(),
resourceName);
resourcePath = new Path(pathURI);
} catch (URISyntaxException e) {
throw new YarnException(
"Could not create a new URI due to syntax errors: "
+ pathURI.toString(), e);
}
}
}
return resourcePath; return resourcePath;
} }

View File

@ -19,6 +19,7 @@
package org.apache.hadoop.yarn.client.api.impl; package org.apache.hadoop.yarn.client.api.impl;
import static org.junit.Assert.assertEquals; import static org.junit.Assert.assertEquals;
import static org.junit.Assert.assertNull;
import static org.mockito.Matchers.isA; import static org.mockito.Matchers.isA;
import static org.mockito.Mockito.mock; import static org.mockito.Mockito.mock;
import static org.mockito.Mockito.when; import static org.mockito.Mockito.when;
@ -26,6 +27,7 @@ import static org.mockito.Mockito.when;
import java.io.DataOutputStream; import java.io.DataOutputStream;
import java.io.FileNotFoundException; import java.io.FileNotFoundException;
import java.io.IOException; import java.io.IOException;
import java.net.URI;
import org.apache.commons.logging.Log; import org.apache.commons.logging.Log;
import org.apache.commons.logging.LogFactory; import org.apache.commons.logging.LogFactory;
@ -106,15 +108,42 @@ public class TestSharedCacheClientImpl {
} }
@Test @Test
public void testUse() throws Exception { public void testUseCacheMiss() throws Exception {
UseSharedCacheResourceResponse response =
new UseSharedCacheResourceResponsePBImpl();
response.setPath(null);
when(cProtocol.use(isA(UseSharedCacheResourceRequest.class))).thenReturn(
response);
Path newPath = client.use(mock(ApplicationId.class), "key", null);
assertNull("The path is not null!", newPath);
}
@Test
public void testUseWithResourceName() throws Exception {
Path file = new Path("viewfs://test/path"); Path file = new Path("viewfs://test/path");
URI useUri = new URI("viewfs://test/path#linkName");
Path usePath = new Path(useUri);
UseSharedCacheResourceResponse response = UseSharedCacheResourceResponse response =
new UseSharedCacheResourceResponsePBImpl(); new UseSharedCacheResourceResponsePBImpl();
response.setPath(file.toString()); response.setPath(file.toString());
when(cProtocol.use(isA(UseSharedCacheResourceRequest.class))).thenReturn( when(cProtocol.use(isA(UseSharedCacheResourceRequest.class))).thenReturn(
response); response);
Path newPath = client.use(mock(ApplicationId.class), "key"); Path newPath = client.use(mock(ApplicationId.class), "key", "linkName");
assertEquals(file, newPath); assertEquals("The paths are not equal!", usePath, newPath);
}
@Test
public void testUseWithSameResourceName() throws Exception {
Path file = new Path("viewfs://test/path");
URI useUri = new URI("viewfs://test/path");
Path usePath = new Path(useUri);
UseSharedCacheResourceResponse response =
new UseSharedCacheResourceResponsePBImpl();
response.setPath(file.toString());
when(cProtocol.use(isA(UseSharedCacheResourceRequest.class))).thenReturn(
response);
Path newPath = client.use(mock(ApplicationId.class), "key", "path");
assertEquals("The paths are not equal!", usePath, newPath);
} }
@Test(expected = YarnException.class) @Test(expected = YarnException.class)
@ -122,7 +151,7 @@ public class TestSharedCacheClientImpl {
String message = "Mock IOExcepiton!"; String message = "Mock IOExcepiton!";
when(cProtocol.use(isA(UseSharedCacheResourceRequest.class))).thenThrow( when(cProtocol.use(isA(UseSharedCacheResourceRequest.class))).thenThrow(
new IOException(message)); new IOException(message));
client.use(mock(ApplicationId.class), "key"); client.use(mock(ApplicationId.class), "key", null);
} }
@Test @Test