MAPREDUCE-6686. Add a way to download the job config from the mapred CLI (rkanter)

(cherry picked from commit 992a49353f)
This commit is contained in:
Robert Kanter 2016-05-18 12:16:21 -07:00
parent 1470af8c95
commit 27aabcab45
3 changed files with 63 additions and 3 deletions

View File

@ -39,6 +39,8 @@ import org.apache.hadoop.classification.InterfaceStability;
import org.apache.hadoop.classification.InterfaceAudience.Private; import org.apache.hadoop.classification.InterfaceAudience.Private;
import org.apache.hadoop.conf.Configuration; import org.apache.hadoop.conf.Configuration;
import org.apache.hadoop.conf.Configured; import org.apache.hadoop.conf.Configured;
import org.apache.hadoop.fs.FileSystem;
import org.apache.hadoop.fs.Path;
import org.apache.hadoop.ipc.RemoteException; import org.apache.hadoop.ipc.RemoteException;
import org.apache.hadoop.mapred.JobConf; import org.apache.hadoop.mapred.JobConf;
import org.apache.hadoop.mapred.TIPStatus; import org.apache.hadoop.mapred.TIPStatus;
@ -106,6 +108,7 @@ public class CLI extends Configured implements Tool {
int fromEvent = 0; int fromEvent = 0;
int nEvents = 0; int nEvents = 0;
int jpvalue = 0; int jpvalue = 0;
String configOutFile = null;
boolean getStatus = false; boolean getStatus = false;
boolean getCounter = false; boolean getCounter = false;
boolean killJob = false; boolean killJob = false;
@ -121,6 +124,7 @@ public class CLI extends Configured implements Tool {
boolean failTask = false; boolean failTask = false;
boolean setJobPriority = false; boolean setJobPriority = false;
boolean logs = false; boolean logs = false;
boolean downloadConfig = false;
if ("-submit".equals(cmd)) { if ("-submit".equals(cmd)) {
if (argv.length != 2) { if (argv.length != 2) {
@ -295,6 +299,14 @@ public class CLI extends Configured implements Tool {
displayUsage(cmd); displayUsage(cmd);
return exitCode; return exitCode;
} }
} else if ("-config".equals(cmd)) {
downloadConfig = true;
if (argv.length != 3) {
displayUsage(cmd);
return exitCode;
}
jobid = argv[1];
configOutFile = argv[2];
} else { } else {
displayUsage(cmd); displayUsage(cmd);
return exitCode; return exitCode;
@ -473,6 +485,22 @@ public class CLI extends Configured implements Tool {
System.out.println(e.getMessage()); System.out.println(e.getMessage());
} }
} }
} else if (downloadConfig) {
Job job = getJob(JobID.forName(jobid));
if (job == null) {
System.out.println("Could not find job " + jobid);
} else {
String jobFile = job.getJobFile();
if (jobFile == null || jobFile.isEmpty()) {
System.out.println("Config file for job " + jobFile +
" could not be found.");
} else {
Path configPath = new Path(jobFile);
FileSystem fs = FileSystem.get(getConf());
fs.copyToLocalFile(configPath, new Path(configOutFile));
exitCode = 0;
}
}
} }
} catch (RemoteException re) { } catch (RemoteException re) {
IOException unwrappedException = re.unwrapRemoteException(); IOException unwrappedException = re.unwrapRemoteException();
@ -550,6 +578,8 @@ public class CLI extends Configured implements Tool {
System.err.println(prefix + "[" + cmd + System.err.println(prefix + "[" + cmd +
" <job-id> <task-attempt-id>]. " + " <job-id> <task-attempt-id>]. " +
" <task-attempt-id> is optional to get task attempt logs."); " <task-attempt-id> is optional to get task attempt logs.");
} else if ("-config".equals(cmd)) {
System.err.println(prefix + "[" + cmd + " <job-id> <file>]");
} else { } else {
System.err.printf(prefix + "<command> <args>%n"); System.err.printf(prefix + "<command> <args>%n");
System.err.printf("\t[-submit <job-file>]%n"); System.err.printf("\t[-submit <job-file>]%n");
@ -571,7 +601,8 @@ public class CLI extends Configured implements Tool {
"Valid values for <task-state> are " + taskStates); "Valid values for <task-state> are " + taskStates);
System.err.printf("\t[-kill-task <task-attempt-id>]%n"); System.err.printf("\t[-kill-task <task-attempt-id>]%n");
System.err.printf("\t[-fail-task <task-attempt-id>]%n"); System.err.printf("\t[-fail-task <task-attempt-id>]%n");
System.err.printf("\t[-logs <job-id> <task-attempt-id>]%n%n"); System.err.printf("\t[-logs <job-id> <task-attempt-id>]%n");
System.err.printf("\t[-config <job-id> <file>%n%n");
ToolRunner.printGenericCommandUsage(System.out); ToolRunner.printGenericCommandUsage(System.out);
} }
} }

View File

@ -81,7 +81,7 @@ Copy file or directories recursively. More information can be found at
Command to interact with Map Reduce Jobs. Command to interact with Map Reduce Jobs.
Usage: `mapred job | [GENERIC_OPTIONS] | [-submit <job-file>] | [-status <job-id>] | [-counter <job-id> <group-name> <counter-name>] | [-kill <job-id>] | [-events <job-id> <from-event-#> <#-of-events>] | [-history [all] <jobHistoryFile|jobId> [-outfile <file>] [-format <human|json>]] | [-list [all]] | [-kill-task <task-id>] | [-fail-task <task-id>] | [-set-priority <job-id> <priority>] | [-list-active-trackers] | [-list-blacklisted-trackers] | [-list-attempt-ids <job-id> <task-type> <task-state>] [-logs <job-id> <task-attempt-id>]` Usage: `mapred job | [GENERIC_OPTIONS] | [-submit <job-file>] | [-status <job-id>] | [-counter <job-id> <group-name> <counter-name>] | [-kill <job-id>] | [-events <job-id> <from-event-#> <#-of-events>] | [-history [all] <jobHistoryFile|jobId> [-outfile <file>] [-format <human|json>]] | [-list [all]] | [-kill-task <task-id>] | [-fail-task <task-id>] | [-set-priority <job-id> <priority>] | [-list-active-trackers] | [-list-blacklisted-trackers] | [-list-attempt-ids <job-id> <task-type> <task-state>] [-logs <job-id> <task-attempt-id>] [-config <job-id> <file>]`
| COMMAND\_OPTION | Description | | COMMAND\_OPTION | Description |
|:---- |:---- | |:---- |:---- |
@ -99,6 +99,7 @@ Usage: `mapred job | [GENERIC_OPTIONS] | [-submit <job-file>] | [-status <job-id
| -list-blacklisted-trackers | List the black listed task trackers in the cluster. This command is not supported in MRv2 based cluster. | | -list-blacklisted-trackers | List the black listed task trackers in the cluster. This command is not supported in MRv2 based cluster. |
| -list-attempt-ids *job-id* *task-type* *task-state* | List the attempt-ids based on the task type and the status given. Valid values for task-type are REDUCE, MAP. Valid values for task-state are running, pending, completed, failed, killed. | | -list-attempt-ids *job-id* *task-type* *task-state* | List the attempt-ids based on the task type and the status given. Valid values for task-type are REDUCE, MAP. Valid values for task-state are running, pending, completed, failed, killed. |
| -logs *job-id* *task-attempt-id* | Dump the container log for a job if taskAttemptId is not specified, otherwise dump the log for the task with the specified taskAttemptId. The logs will be dumped in system out. | | -logs *job-id* *task-attempt-id* | Dump the container log for a job if taskAttemptId is not specified, otherwise dump the log for the task with the specified taskAttemptId. The logs will be dumped in system out. |
| -config *job-id* *file* | Download the job configuration file. |
### `pipes` ### `pipes`

View File

@ -168,6 +168,8 @@ public class TestMRJobClient extends ClusterMapReduceTestCase {
testfailTask(conf); testfailTask(conf);
// kill job // kill job
testKillJob(conf); testKillJob(conf);
// download job config
testConfig(jobId, conf);
} }
/** /**
@ -534,6 +536,32 @@ public class TestMRJobClient extends ClusterMapReduceTestCase {
assertEquals(0, out.size()); assertEquals(0, out.size());
} }
/**
* download job config
*/
private void testConfig(String jobId, Configuration conf) throws Exception {
CLI jc = createJobClient();
ByteArrayOutputStream out = new ByteArrayOutputStream();
// bad arguments
int exitCode = runTool(conf, jc, new String[] { "-config" }, out);
assertEquals("Exit code", -1, exitCode);
exitCode = runTool(conf, jc, new String[] { "-config job_invalid foo.xml" },
out);
assertEquals("Exit code", -1, exitCode);
// good arguments
File outFile = File.createTempFile("config", ".xml");
exitCode = runTool(conf, jc, new String[] { "-config", jobId,
outFile.toString()}, out);
assertEquals("Exit code", 0, exitCode);
BufferedReader br = new BufferedReader(new FileReader(outFile));
String line = br.readLine();
br.close();
assertEquals("<?xml version=\"1.0\" encoding=\"UTF-8\" " +
"standalone=\"no\"?><configuration>", line);
}
/** /**
* print job events list * print job events list
*/ */