MAPREDUCE-7069. Add ability to specify user environment variables individually. Contributed by Jim Brennan

(cherry picked from commit 4571351ccc)
This commit is contained in:
Kihwal Lee 2020-08-13 19:02:03 -05:00
parent f9c251badc
commit 0c35e44184
11 changed files with 405 additions and 79 deletions

View File

@ -19,7 +19,6 @@
package org.apache.hadoop.mapred;
import java.net.InetSocketAddress;
import java.util.HashMap;
import java.util.List;
import java.util.Map;
import java.util.Vector;
@ -28,7 +27,6 @@ import org.apache.hadoop.fs.Path;
import org.apache.hadoop.mapred.TaskLog.LogName;
import org.apache.hadoop.mapreduce.MRJobConfig;
import org.apache.hadoop.mapreduce.TaskType;
import org.apache.hadoop.mapreduce.TypeConverter;
import org.apache.hadoop.mapreduce.v2.util.MRApps;
import org.apache.hadoop.yarn.api.ApplicationConstants;
import org.apache.hadoop.yarn.api.ApplicationConstants.Environment;
@ -42,50 +40,53 @@ public class MapReduceChildJVM {
filter.toString();
}
private static String getChildEnv(JobConf jobConf, boolean isMap) {
private static String getChildEnvProp(JobConf jobConf, boolean isMap) {
if (isMap) {
return jobConf.get(JobConf.MAPRED_MAP_TASK_ENV,
jobConf.get(JobConf.MAPRED_TASK_ENV));
return JobConf.MAPRED_MAP_TASK_ENV;
}
return jobConf.get(JobConf.MAPRED_REDUCE_TASK_ENV,
jobConf.get(JobConf.MAPRED_TASK_ENV));
return JobConf.MAPRED_REDUCE_TASK_ENV;
}
private static String getChildEnvDefaultValue(JobConf jobConf) {
// There is no default value for these - use the fallback value instead.
return jobConf.get(JobConf.MAPRED_TASK_ENV);
}
public static void setVMEnv(Map<String, String> environment,
Task task) {
JobConf conf = task.conf;
// Add the env variables passed by the user
String mapredChildEnv = getChildEnv(conf, task.isMapTask());
MRApps.setEnvFromInputString(environment, mapredChildEnv, conf);
boolean isMap = task.isMapTask();
// Set logging level in the environment.
// This is so that, if the child forks another "bin/hadoop" (common in
// streaming) it will have the correct loglevel.
environment.put(
"HADOOP_ROOT_LOGGER",
MRApps.getChildLogLevel(conf, task.isMapTask()) + ",console");
// Remove these before adding the user variables to prevent
// MRApps.setEnvFromInputProperty() from appending to them.
String hadoopRootLoggerKey = "HADOOP_ROOT_LOGGER";
String hadoopClientOptsKey = "HADOOP_CLIENT_OPTS";
environment.remove(hadoopRootLoggerKey);
environment.remove(hadoopClientOptsKey);
// TODO: The following is useful for instance in streaming tasks. Should be
// set in ApplicationMaster's env by the RM.
String hadoopClientOpts = System.getenv("HADOOP_CLIENT_OPTS");
if (hadoopClientOpts == null) {
hadoopClientOpts = "";
} else {
hadoopClientOpts = hadoopClientOpts + " ";
// Add the environment variables passed by the user
MRApps.setEnvFromInputProperty(environment, getChildEnvProp(conf, isMap),
getChildEnvDefaultValue(conf), conf);
// Set HADOOP_ROOT_LOGGER and HADOOP_CLIENTS if the user did not set them.
if (!environment.containsKey(hadoopRootLoggerKey)) {
// Set the value for logging level in the environment.
// This is so that, if the child forks another "bin/hadoop" (common in
// streaming) it will have the correct loglevel.
environment.put(hadoopRootLoggerKey,
MRApps.getChildLogLevel(conf, task.isMapTask()) + ",console");
}
environment.put("HADOOP_CLIENT_OPTS", hadoopClientOpts);
// setEnvFromInputString above will add env variable values from
// mapredChildEnv to existing variables. We want to overwrite
// HADOOP_ROOT_LOGGER and HADOOP_CLIENT_OPTS if the user set it explicitly.
Map<String, String> tmpEnv = new HashMap<String, String>();
MRApps.setEnvFromInputString(tmpEnv, mapredChildEnv, conf);
String[] keys = { "HADOOP_ROOT_LOGGER", "HADOOP_CLIENT_OPTS" };
for (String key : keys) {
if (tmpEnv.containsKey(key)) {
environment.put(key, tmpEnv.get(key));
if (!environment.containsKey(hadoopClientOptsKey)) {
// TODO: The following is useful for instance in streaming tasks.
// Should be set in ApplicationMaster's env by the RM.
String hadoopClientOptsValue = System.getenv(hadoopClientOptsKey);
if (hadoopClientOptsValue == null) {
hadoopClientOptsValue = "";
} else {
hadoopClientOptsValue = hadoopClientOptsValue + " ";
}
environment.put(hadoopClientOptsKey, hadoopClientOptsValue);
}
// Add stdout/stderr env

View File

@ -961,10 +961,10 @@ public abstract class TaskAttemptImpl implements
MRApps.crossPlatformifyMREnv(conf, Environment.PWD), conf);
// Add the env variables passed by the admin
MRApps.setEnvFromInputString(environment,
conf.get(MRJobConfig.MAPRED_ADMIN_USER_ENV,
MRJobConfig.DEFAULT_MAPRED_ADMIN_USER_ENV),
conf);
MRApps.setEnvFromInputProperty(environment,
MRJobConfig.MAPRED_ADMIN_USER_ENV,
MRJobConfig.DEFAULT_MAPRED_ADMIN_USER_ENV, conf);
return environment;
}

View File

@ -289,11 +289,11 @@ public class TestMapReduceChildJVM {
app.verifyCompleted();
Assert.assertTrue("HADOOP_ROOT_LOGGER not set for job",
app.cmdEnvironment.containsKey("HADOOP_ROOT_LOGGER"));
app.cmdEnvironment.containsKey("HADOOP_ROOT_LOGGER"));
Assert.assertEquals("WARN,console",
app.cmdEnvironment.get("HADOOP_ROOT_LOGGER"));
app.cmdEnvironment.get("HADOOP_ROOT_LOGGER"));
Assert.assertTrue("HADOOP_CLIENT_OPTS not set for job",
app.cmdEnvironment.containsKey("HADOOP_CLIENT_OPTS"));
app.cmdEnvironment.containsKey("HADOOP_CLIENT_OPTS"));
Assert.assertEquals("test", app.cmdEnvironment.get("HADOOP_CLIENT_OPTS"));
// Try one more.
@ -305,8 +305,22 @@ public class TestMapReduceChildJVM {
app.verifyCompleted();
Assert.assertTrue("HADOOP_ROOT_LOGGER not set for job",
app.cmdEnvironment.containsKey("HADOOP_ROOT_LOGGER"));
app.cmdEnvironment.containsKey("HADOOP_ROOT_LOGGER"));
Assert.assertEquals("trace",
app.cmdEnvironment.get("HADOOP_ROOT_LOGGER"));
app.cmdEnvironment.get("HADOOP_ROOT_LOGGER"));
// Try one using the mapreduce.task.env.var=value syntax
app = new MyMRApp(1, 0, true, this.getClass().getName(), true);
conf = new Configuration();
conf.set(JobConf.MAPRED_MAP_TASK_ENV + ".HADOOP_ROOT_LOGGER",
"DEBUG,console");
job = app.submit(conf);
app.waitForState(job, JobState.SUCCEEDED);
app.verifyCompleted();
Assert.assertTrue("HADOOP_ROOT_LOGGER not set for job",
app.cmdEnvironment.containsKey("HADOOP_ROOT_LOGGER"));
Assert.assertEquals("DEBUG,console",
app.cmdEnvironment.get("HADOOP_ROOT_LOGGER"));
}
}

View File

@ -708,6 +708,16 @@ public class MRApps extends Apps {
Apps.setEnvFromInputString(env, envString, classPathSeparator);
}
public static void setEnvFromInputProperty(Map<String, String> env,
String propName, String defaultPropValue, Configuration conf) {
String classPathSeparator =
conf.getBoolean(MRConfig.MAPREDUCE_APP_SUBMISSION_CROSS_PLATFORM,
MRConfig.DEFAULT_MAPREDUCE_APP_SUBMISSION_CROSS_PLATFORM)
? ApplicationConstants.CLASS_PATH_SEPARATOR : File.pathSeparator;
Apps.setEnvFromInputProperty(env, propName, defaultPropValue, conf,
classPathSeparator);
}
@Public
@Unstable
public static void addToEnvironment(Map<String, String> environment,

View File

@ -312,6 +312,15 @@ public class JobConf extends Configuration {
* <ul>
* <li> A=foo - This will set the env variable A to foo. </li>
* </ul>
*
* You can also add environment variables individually by appending
* <code>.VARNAME</code> to this configuration key, where VARNAME is
* the name of the environment variable.
*
* Example:
* <ul>
* <li>mapreduce.map.env.VARNAME=value</li>
* </ul>
*/
public static final String MAPRED_MAP_TASK_ENV = JobContext.MAP_ENV;
@ -326,6 +335,15 @@ public class JobConf extends Configuration {
* <ul>
* <li> A=foo - This will set the env variable A to foo. </li>
* </ul>
*
* You can also add environment variables individually by appending
* <code>.VARNAME</code> to this configuration key, where VARNAME is
* the name of the environment variable.
*
* Example:
* <ul>
* <li>mapreduce.reduce.env.VARNAME=value</li>
* </ul>
*/
public static final String MAPRED_REDUCE_TASK_ENV = JobContext.REDUCE_ENV;

View File

@ -350,11 +350,22 @@
<property>
<name>mapred.child.env</name>
<value></value>
<description>User added environment variables for the task processes.
<description>User added environment variables for the task processes,
specified as a comma separated list.
Example :
1) A=foo This will set the env variable A to foo
2) B=$B:c This is inherit nodemanager's B env variable on Unix.
3) B=%B%;c This is inherit nodemanager's B env variable on Windows.
To specify a comma separated list of environment variables specifically for
map or reduce tasks, use the mapreduce.map.env or mapreduce.reduce.env
properties.
To define environment variables individually for map or reduce tasks,
you can specify multiple properties of the form mapreduce.map.env.VARNAME
or mapreduce.reduce.env.VARNAME, where VARNAME is the name of the
environment variable. This is the only way to add a variable when its value
contains commas.
</description>
</property>
@ -362,7 +373,15 @@
<property>
<name>mapreduce.map.env</name>
<value></value>
<description>User added environment variables for the map task processes.
<description>User added environment variables for the map task processes,
specified as a comma separated list.
Example:
VAR1=value1,VAR2=value2
To define environment variables individually, you can specify
multiple properties of the form mapreduce.map.env.VARNAME,
where VARNAME is the name of the environment variable. This is the only
way to add a variable when its value contains commas.
</description>
</property>
-->
@ -371,7 +390,16 @@
<property>
<name>mapreduce.reduce.env</name>
<value></value>
<description>User added environment variables for the reduce task processes.
<description>User added environment variables for the reduce task processes,
specified as a comma separated list.
Example:
VAR1=value1,VAR2=value2
To define environment variables individually, you can specify
multiple properties of the form mapreduce.reduce.env.VARNAME,
where VARNAME is the name of the environment variable. This is the only
way to add a variable when its value contains commas.
contains commas.
</description>
</property>
-->
@ -385,9 +413,14 @@
You must preserve the original value if you want your map and
reduce tasks to have access to native libraries (compression, etc).
When this value is empty, the command to set execution
envrionment will be OS dependent:
environment will be OS dependent:
For linux, use LD_LIBRARY_PATH=$HADOOP_COMMON_HOME/lib/native.
For windows, use PATH = %PATH%;%HADOOP_COMMON_HOME%\\bin.
To define environment variables individually, you can specify
multiple properties of the form mapreduce.admin.user.env.VARNAME,
where VARNAME is the name of the environment variable. This is the only
way to add a variable when its value contains commas.
</description>
</property>
@ -1365,20 +1398,32 @@
<name>yarn.app.mapreduce.am.env</name>
<value></value>
<description>User added environment variables for the MR App Master
processes. Example :
processes, specified as a comma separated list.
Example :
1) A=foo This will set the env variable A to foo
2) B=$B:c This is inherit tasktracker's B env variable.
To define environment variables individually, you can specify
multiple properties of the form yarn.app.mapreduce.am.env.VARNAME,
where VARNAME is the name of the environment variable. This is the only
way to add a variable when its value contains commas.
</description>
</property>
<property>
<name>yarn.app.mapreduce.am.admin.user.env</name>
<value></value>
<description> Environment variables for the MR App Master
processes for admin purposes. These values are set first and can be
overridden by the user env (yarn.app.mapreduce.am.env) Example :
<description>Environment variables for the MR App Master
processes for admin purposes, specified as a comma separated list
These values are set first and can be overridden by the user env
(yarn.app.mapreduce.am.env). Example :
1) A=foo This will set the env variable A to foo
2) B=$B:c This is inherit app master's B env variable.
To define environment variables individually, you can specify
multiple properties of the form yarn.app.mapreduce.am.admin.user.env.VARNAME,
where VARNAME is the name of the environment variable. This is the only
way to add a variable when its value contains commas.
</description>
</property>

View File

@ -206,6 +206,12 @@ For example,
Here, the files dir1/dict.txt and dir2/dict.txt can be accessed by tasks using the symbolic names dict1 and dict2 respectively. The archive mytar.tgz will be placed and unarchived into a directory by the name "tgzdir".
Applications can specify environment variables for mapper, reducer, and application master tasks by specifying them on the command line using the options -Dmapreduce.map.env, -Dmapreduce.reduce.env, and -Dyarn.app.mapreduce.am.env, respectively.
For example the following sets environment variables FOO_VAR=bar and LIST_VAR=a,b,c for the mappers and reducers,
bin/hadoop jar hadoop-mapreduce-examples-<ver>.jar wordcount -Dmapreduce.map.env.FOO_VAR=bar -Dmapreduce.map.env.LIST_VAR=a,b,c -Dmapreduce.reduce.env.FOO_VAR=bar -Dmapreduce.reduce.env.LIST_VAR=a,b,c input output
### Walk-through
The `WordCount` application is quite straight-forward.

View File

@ -533,12 +533,13 @@ public class YARNRunner implements ClientProtocol {
MRApps.crossPlatformifyMREnv(conf, Environment.PWD), conf);
// Setup the environment variables for Admin first
MRApps.setEnvFromInputString(environment,
conf.get(MRJobConfig.MR_AM_ADMIN_USER_ENV,
MRJobConfig.DEFAULT_MR_AM_ADMIN_USER_ENV), conf);
MRApps.setEnvFromInputProperty(environment,
MRJobConfig.MR_AM_ADMIN_USER_ENV,
MRJobConfig.DEFAULT_MR_AM_ADMIN_USER_ENV,
conf);
// Setup the environment variables (LD_LIBRARY_PATH, etc)
MRApps.setEnvFromInputString(environment,
conf.get(MRJobConfig.MR_AM_ENV), conf);
MRApps.setEnvFromInputProperty(environment, MRJobConfig.MR_AM_ENV, null,
conf);
// Parse distributed cache
MRApps.setupDistributedCache(jobConf, localResources);

View File

@ -812,15 +812,22 @@ public class TestYARNRunner {
@Test
public void testAMStandardEnvWithDefaultLibPath() throws Exception {
testAMStandardEnv(false);
testAMStandardEnv(false, false);
}
@Test
public void testAMStandardEnvWithCustomLibPath() throws Exception {
testAMStandardEnv(true);
testAMStandardEnv(true, false);
}
private void testAMStandardEnv(boolean customLibPath) throws Exception {
@Test
public void testAMStandardEnvWithCustomLibPathWithSeparateEnvProps()
throws Exception {
testAMStandardEnv(true, true);
}
private void testAMStandardEnv(boolean customLibPath,
boolean useSeparateEnvProps) throws Exception {
// the Windows behavior is different and this test currently doesn't really
// apply
// MAPREDUCE-6588 should revisit this test
@ -833,9 +840,16 @@ public class TestYARNRunner {
String pathKey = Environment.LD_LIBRARY_PATH.name();
if (customLibPath) {
jobConf.set(MRJobConfig.MR_AM_ADMIN_USER_ENV, pathKey + "=" +
ADMIN_LIB_PATH);
jobConf.set(MRJobConfig.MR_AM_ENV, pathKey + "=" + USER_LIB_PATH);
if (useSeparateEnvProps) {
// Specify these as individual variables instead of k=v lists
jobConf.set(MRJobConfig.MR_AM_ADMIN_USER_ENV + "." + pathKey,
ADMIN_LIB_PATH);
jobConf.set(MRJobConfig.MR_AM_ENV + "." + pathKey, USER_LIB_PATH);
} else {
jobConf.set(MRJobConfig.MR_AM_ADMIN_USER_ENV, pathKey + "=" +
ADMIN_LIB_PATH);
jobConf.set(MRJobConfig.MR_AM_ENV, pathKey + "=" + USER_LIB_PATH);
}
}
jobConf.set(MRJobConfig.MAPRED_ADMIN_USER_SHELL, USER_SHELL);

View File

@ -24,6 +24,7 @@ import static org.apache.hadoop.yarn.util.StringHelper.sjoin;
import java.io.File;
import java.util.ArrayList;
import java.util.HashMap;
import java.util.Iterator;
import java.util.Map;
import java.util.regex.Matcher;
@ -32,6 +33,7 @@ import java.util.regex.Pattern;
import org.apache.hadoop.classification.InterfaceAudience.Private;
import org.apache.hadoop.classification.InterfaceAudience.Public;
import org.apache.hadoop.classification.InterfaceStability.Unstable;
import org.apache.hadoop.conf.Configuration;
import org.apache.hadoop.util.Shell;
import org.apache.hadoop.util.StringInterner;
import org.apache.hadoop.yarn.api.ApplicationConstants;
@ -80,33 +82,112 @@ public class Apps {
throw new YarnRuntimeException(join("Error parsing ", name, ": ", s));
}
private static void setEnvFromString(Map<String, String> env,
String envVar, String varString, String classPathSeparator) {
Matcher m = VAR_SUBBER.matcher(varString);
StringBuffer sb = new StringBuffer();
while (m.find()) {
String var = m.group(1);
// do variable substitution of $var from passed in environment or from
// system environment and default to empty string if undefined in both.
String replace = env.get(var);
if (replace == null) {
replace = System.getenv(var);
}
if (replace == null) {
replace = "";
}
m.appendReplacement(sb, Matcher.quoteReplacement(replace));
}
m.appendTail(sb);
addToEnvironment(env, envVar, sb.toString(), classPathSeparator);
}
public static void setEnvFromInputString(Map<String, String> env,
String envString, String classPathSeparator) {
if (envString != null && envString.length() > 0) {
Matcher varValMatcher = VARVAL_SPLITTER.matcher(envString);
while (varValMatcher.find()) {
String envVar = varValMatcher.group(1);
Matcher m = VAR_SUBBER.matcher(varValMatcher.group(2));
StringBuffer sb = new StringBuffer();
while (m.find()) {
String var = m.group(1);
// replace $env with the child's env constructed by tt's
String replace = env.get(var);
// if this key is not configured by the tt for the child .. get it
// from the tt's env
if (replace == null)
replace = System.getenv(var);
// the env key is note present anywhere .. simply set it
if (replace == null)
replace = "";
m.appendReplacement(sb, Matcher.quoteReplacement(replace));
}
m.appendTail(sb);
addToEnvironment(env, envVar, sb.toString(), classPathSeparator);
String varString = varValMatcher.group(2);
setEnvFromString(env, envVar, varString, classPathSeparator);
}
}
}
/**
* Set environment from string without doing any variable substitution.
* Used internally to avoid double expansion.
* @param env environment to set
* @param envString comma-separated k=v pairs.
* @param classPathSeparator Separator to use when appending to an existing
* environment variable.
*/
private static void setEnvFromInputStringNoExpand(Map<String, String> env,
String envString, String classPathSeparator) {
if (envString != null && envString.length() > 0) {
Matcher varValMatcher = VARVAL_SPLITTER.matcher(envString);
while (varValMatcher.find()) {
String envVar = varValMatcher.group(1);
String varString = varValMatcher.group(2);
addToEnvironment(env, envVar, varString, classPathSeparator);
}
}
}
/**
* Set environment variables from map of input properties.
* @param env environment to update
* @param inputMap environment variable property keys and values
* @param classPathSeparator separator to use when appending to an existing
* environment variable
*/
private static void setEnvFromInputStringMap(Map<String, String> env,
Map<String, String> inputMap, String classPathSeparator) {
for(Map.Entry<String, String> inputVar: inputMap.entrySet()) {
String envVar = inputVar.getKey();
String varString = inputVar.getValue();
setEnvFromString(env, envVar, varString, classPathSeparator);
}
}
/**
* Set environment variables from the given environment input property.
* For example, given the property mapreduce.map.env, this method
* will extract environment variables from:
* the comma-separated string value of mapreduce.map.env, and
* the values of any properties of the form mapreduce.map.env.VAR_NAME
* Variables specified via the latter syntax take precedence over those
* specified using the former syntax.
* @param env the environment to update
* @param propName the name of the property
* @param defaultPropValue the default value for propName
* @param conf configuration containing properties
* @param classPathSeparator Separator used when appending to an existing var
*/
public static void setEnvFromInputProperty(Map<String, String> env,
String propName, String defaultPropValue, Configuration conf,
String classPathSeparator) {
String envString = conf.get(propName, defaultPropValue);
// Get k,v pairs from string into a tmp env. Note that we don't want
// to expand the env var values, because we will do that below -
// don't want to do it twice.
Map<String, String> tmpEnv = new HashMap<String, String>();
Apps.setEnvFromInputStringNoExpand(tmpEnv, envString, classPathSeparator);
// Get map of props with prefix propName.
// (e.g., map.reduce.env.ENV_VAR_NAME=value)
Map<String, String> inputMap = conf.getPropsWithPrefix(propName + ".");
// Entries from map should override entries from input string.
tmpEnv.putAll(inputMap);
// Add them to the environment
setEnvFromInputStringMap(env, tmpEnv, classPathSeparator);
}
/**
*
* @param envString String containing env variable definitions

View File

@ -17,6 +17,7 @@
*/
package org.apache.hadoop.yarn.util;
import org.apache.hadoop.conf.Configuration;
import org.apache.hadoop.util.Shell;
import org.junit.Test;
@ -25,6 +26,8 @@ import java.util.HashMap;
import java.util.Map;
import static org.junit.Assert.assertEquals;
import static org.junit.Assert.assertNull;
import static org.junit.Assert.assertTrue;
public class TestApps {
@Test
@ -58,4 +61,137 @@ public class TestApps {
assertEquals("=", environment.get("e1"));
assertEquals("a1=a2", environment.get("e2"));
}
@Test
public void testSetEnvFromInputProperty() {
Configuration conf = new Configuration(false);
Map<String, String> env = new HashMap<>();
String propName = "mapreduce.map.env";
String defaultPropName = "mapreduce.child.env";
// Setup environment input properties
conf.set(propName, "env1=env1_val,env2=env2_val,env3=env3_val");
conf.set(propName + ".env4", "env4_val");
conf.set(propName + ".env2", "new_env2_val");
// Setup some default values - we shouldn't see these values
conf.set(defaultPropName, "env1=def1_val,env2=def2_val,env3=def3_val");
String defaultPropValue = conf.get(defaultPropName);
// These should never be referenced.
conf.set(defaultPropName + ".env4", "def4_val");
conf.set(defaultPropName + ".env2", "new_def2_val");
Apps.setEnvFromInputProperty(env, propName, defaultPropValue, conf,
File.pathSeparator);
// Check values from string
assertEquals("env1_val", env.get("env1"));
assertEquals("env3_val", env.get("env3"));
// Check individual value
assertEquals("env4_val", env.get("env4"));
// Check individual value that eclipses one in string
assertEquals("new_env2_val", env.get("env2"));
}
@Test
public void testSetEnvFromInputPropertyDefault() {
Configuration conf = new Configuration(false);
Map<String, String> env = new HashMap<>();
String propName = "mapreduce.map.env";
String defaultPropName = "mapreduce.child.env";
// Setup environment input properties
conf.set(propName, "env1=env1_val,env2=env2_val,env3=env3_val");
conf.set(propName + ".env4", "env4_val");
conf.set(propName + ".env2", "new_env2_val");
// Setup some default values
conf.set(defaultPropName, "env1=def1_val,env2=def2_val,env3=def3_val");
String defaultPropValue = conf.get(defaultPropName);
// These should never be referenced.
conf.set(defaultPropName + ".env4", "def4_val");
conf.set(defaultPropName + ".env2", "new_def2_val");
// Test using default value for the string.
// Individually specified env properties do not have defaults,
// so this should just get things from the defaultPropName string.
String bogusProp = propName + "bogus";
Apps.setEnvFromInputProperty(env, bogusProp, defaultPropValue, conf,
File.pathSeparator);
// Check values from string
assertEquals("def1_val", env.get("env1"));
assertEquals("def2_val", env.get("env2"));
assertEquals("def3_val", env.get("env3"));
// Check individual value is not set.
assertNull(env.get("env4"));
}
@Test
public void testSetEnvFromInputPropertyOverrideDefault() {
Configuration conf = new Configuration(false);
Map<String, String> env = new HashMap<>();
// Try using default value, but specify some individual values using
// the main propName, but no main value, so it should get values from
// the default string, and then the individual values.
String propName = "mapreduce.reduce.env";
conf.set(propName + ".env2", "new2_val");
conf.set(propName + ".env4", "new4_val");
// Setup some default values - we shouldn't see these values
String defaultPropName = "mapreduce.child.env";
conf.set(defaultPropName, "env1=def1_val,env2=def2_val,env3=def3_val");
String defaultPropValue = conf.get(defaultPropName);
// These should never be referenced.
conf.set(defaultPropName + ".env4", "def4_val");
conf.set(defaultPropName + ".env2", "new_def2_val");
Apps.setEnvFromInputProperty(env, propName, defaultPropValue, conf,
File.pathSeparator);
// Check values from string
assertEquals("def1_val", env.get("env1"));
assertEquals("def3_val", env.get("env3"));
// Check individual value
assertEquals("new4_val", env.get("env4"));
// Check individual value that eclipses one in string
assertEquals("new2_val", env.get("env2"));
}
@Test
public void testSetEnvFromInputPropertyCommas() {
Configuration conf = new Configuration(false);
Map<String, String> env = new HashMap<>();
String propName = "mapreduce.reduce.env";
conf.set(propName, "env1=env1_val,env2=env2_val,env3=env3_val");
conf.set(propName + ".env2", "new2_val1,new2_val2,new2_val3");
conf.set(propName + ".env4", "new4_valwith=equals");
// Setup some default values - we shouldn't see these values
String defaultPropName = "mapreduce.child.env";
conf.set(defaultPropName, "env1=def1_val,env2=def2_val,env3=def3_val");
String defaultPropValue = conf.get(defaultPropName);
Apps.setEnvFromInputProperty(env, propName, defaultPropValue, conf,
File.pathSeparator);
// Check values from string
assertEquals("env1_val", env.get("env1"));
assertEquals("env3_val", env.get("env3"));
// Check individual value
assertEquals("new4_valwith=equals", env.get("env4"));
// Check individual value that eclipses one in string
assertEquals("new2_val1,new2_val2,new2_val3", env.get("env2"));
}
@Test
public void testSetEnvFromInputPropertyNull() {
Configuration conf = new Configuration(false);
Map<String, String> env = new HashMap<>();
String propName = "mapreduce.map.env";
String defaultPropName = "mapreduce.child.env";
// Setup environment input properties
conf.set(propName, "env1=env1_val,env2=env2_val,env3=env3_val");
conf.set(propName + ".env4", "env4_val");
conf.set(propName + ".env2", "new_env2_val");
// Setup some default values - we shouldn't see these values
conf.set(defaultPropName, "env1=def1_val,env2=def2_val,env3=def3_val");
String defaultPropValue = conf.get(defaultPropName);
// These should never be referenced.
conf.set(defaultPropName + ".env4", "def4_val");
conf.set(defaultPropName + ".env2", "new_def2_val");
// Try with null inputs
Apps.setEnvFromInputProperty(env, "bogus1", null, conf, File.pathSeparator);
assertTrue(env.isEmpty());
}
}