MAPREDUCE-2243. Close streams properly in a finally-block to avoid leakage in CompletedJobStatusStore, TaskLog, EventWriter and TotalOrderPartitioner. Contributed by Devaraj K

git-svn-id: https://svn.apache.org/repos/asf/hadoop/common/trunk@1152787 13f79535-47bb-0310-9956-ffa450edef68
Tsz-wo Sze 2011-08-01 14:11:19 +00:00
parent d68e38b78d
commit 7e18c90d39
5 changed files with 89 additions and 48 deletions
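
Each of the four classes applies the same idiom: declare the stream before the try block, null the reference after a successful close(), and let a finally block hand anything still open to org.apache.hadoop.io.IOUtils.cleanup(), which closes it and logs (rather than throws) any secondary IOException. A minimal, self-contained sketch of that idiom follows; the class, method, and path names are illustrative placeholders, not code from this patch.

// Sketch only: the close-in-finally pattern this commit introduces.
import java.io.IOException;

import org.apache.commons.logging.Log;
import org.apache.commons.logging.LogFactory;
import org.apache.hadoop.fs.FSDataOutputStream;
import org.apache.hadoop.fs.FileSystem;
import org.apache.hadoop.fs.Path;
import org.apache.hadoop.io.IOUtils;

class StreamCleanupSketch {                      // hypothetical class name
  private static final Log LOG = LogFactory.getLog(StreamCleanupSketch.class);

  void writeMarker(FileSystem fs, Path file) {   // hypothetical method and path
    FSDataOutputStream out = null;
    try {
      out = fs.create(file);
      out.writeBytes("done\n");
      out.close();
      out = null;                 // close succeeded; nothing left for finally to do
    } catch (IOException e) {
      LOG.warn("Could not write " + file, e);
    } finally {
      IOUtils.cleanup(LOG, out);  // null-safe: closes out only if still open, logging any IOException
    }
  }
}

Nulling the reference after a successful close() keeps IOUtils.cleanup() from double-closing the stream on the normal path while still guaranteeing the close on the error path, which is how CompletedJobStatusStore, TaskLog, EventWriter and TotalOrderPartitioner are changed below.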

CHANGES.txt

@@ -362,6 +362,10 @@ Trunk (unreleased changes)
     MAPREDUCE-2463. Job history files are not moved to done folder when job
     history location is hdfs. (Devaraj K via szetszwo)
 
+    MAPREDUCE-2243. Close streams properly in a finally-block to avoid leakage
+    in CompletedJobStatusStore, TaskLog, EventWriter and TotalOrderPartitioner.
+    (Devaraj K via szetszwo)
+
 Release 0.22.0 - Unreleased
 
   INCOMPATIBLE CHANGES

CompletedJobStatusStore.java

@@ -32,6 +32,7 @@ import org.apache.hadoop.security.UserGroupInformation;
 import org.apache.hadoop.security.AccessControlException;
 import org.apache.hadoop.fs.permission.FsAction;
 import org.apache.hadoop.fs.permission.FsPermission;
+import org.apache.hadoop.io.IOUtils;
 import org.apache.hadoop.util.DiskChecker.DiskErrorException;
 
 /**
@@ -172,8 +173,9 @@ class CompletedJobStatusStore implements Runnable {
     if (active && retainTime > 0) {
       JobID jobId = job.getStatus().getJobID();
       Path jobStatusFile = getInfoFilePath(jobId);
+      FSDataOutputStream dataOut = null;
       try {
-        FSDataOutputStream dataOut = fs.create(jobStatusFile);
+        dataOut = fs.create(jobStatusFile);
 
         job.getStatus().write(dataOut);
@@ -189,6 +191,7 @@ class CompletedJobStatusStore implements Runnable {
         }
 
         dataOut.close();
+        dataOut = null; // set dataOut to null explicitly so that close in finally will not be executed again.
       } catch (IOException ex) {
         LOG.warn("Could not store [" + jobId + "] job info : " +
                  ex.getMessage(), ex);
@@ -198,6 +201,8 @@ class CompletedJobStatusStore implements Runnable {
           catch (IOException ex1) {
             //ignore
           }
+      } finally {
+        IOUtils.cleanup(LOG, dataOut);
       }
     }
   }

TaskLog.java

@@ -41,6 +41,7 @@ import org.apache.hadoop.fs.LocalFileSystem;
 import org.apache.hadoop.fs.FileStatus;
 import org.apache.hadoop.fs.FileUtil;
 import org.apache.hadoop.fs.Path;
+import org.apache.hadoop.io.IOUtils;
 import org.apache.hadoop.io.SecureIOUtils;
 import org.apache.hadoop.mapreduce.JobID;
 import org.apache.hadoop.mapreduce.util.ProcessTree;
@@ -111,34 +112,42 @@ public class TaskLog {
     //stderr:<start-offset in the stderr file> <length>
     //syslog:<start-offset in the syslog file> <length>
     LogFileDetail l = new LogFileDetail();
-    String str = fis.readLine();
-    if (str == null) { //the file doesn't have anything
-      throw new IOException ("Index file for the log of " + taskid+" doesn't exist.");
-    }
-    l.location = str.substring(str.indexOf(LogFileDetail.LOCATION)+
-        LogFileDetail.LOCATION.length());
-    //special cases are the debugout and profile.out files. They are guaranteed
-    //to be associated with each task attempt since jvm reuse is disabled
-    //when profiling/debugging is enabled
-    if (filter.equals(LogName.DEBUGOUT) || filter.equals(LogName.PROFILE)) {
-      l.length = new File(l.location, filter.toString()).length();
-      l.start = 0;
-      fis.close();
-      return l;
-    }
-    str = fis.readLine();
-    while (str != null) {
-      //look for the exact line containing the logname
-      if (str.contains(filter.toString())) {
-        str = str.substring(filter.toString().length()+1);
-        String[] startAndLen = str.split(" ");
-        l.start = Long.parseLong(startAndLen[0]);
-        l.length = Long.parseLong(startAndLen[1]);
-        break;
-      }
-      str = fis.readLine();
-    }
-    fis.close();
+    String str = null;
+    try {
+      str = fis.readLine();
+      if (str == null) { // the file doesn't have anything
+        throw new IOException("Index file for the log of " + taskid
+            + " doesn't exist.");
+      }
+      l.location = str.substring(str.indexOf(LogFileDetail.LOCATION)
+          + LogFileDetail.LOCATION.length());
+      // special cases are the debugout and profile.out files. They are
+      // guaranteed
+      // to be associated with each task attempt since jvm reuse is disabled
+      // when profiling/debugging is enabled
+      if (filter.equals(LogName.DEBUGOUT) || filter.equals(LogName.PROFILE)) {
+        l.length = new File(l.location, filter.toString()).length();
+        l.start = 0;
+        fis.close();
+        return l;
+      }
+      str = fis.readLine();
+      while (str != null) {
+        // look for the exact line containing the logname
+        if (str.contains(filter.toString())) {
+          str = str.substring(filter.toString().length() + 1);
+          String[] startAndLen = str.split(" ");
+          l.start = Long.parseLong(startAndLen[0]);
+          l.length = Long.parseLong(startAndLen[1]);
+          break;
+        }
+        str = fis.readLine();
+      }
+      fis.close();
+      fis = null;
+    } finally {
+      IOUtils.cleanup(LOG, fis);
+    }
     return l;
   }
@@ -189,22 +198,27 @@ public class TaskLog {
     //LOG_DIR: <the dir where the task logs are really stored>
     //STDOUT: <start-offset in the stdout file> <length>
     //STDERR: <start-offset in the stderr file> <length>
     //SYSLOG: <start-offset in the syslog file> <length>
-    dos.writeBytes(LogFileDetail.LOCATION + logLocation + "\n"
-        + LogName.STDOUT.toString() + ":");
-    dos.writeBytes(Long.toString(prevOutLength) + " ");
-    dos.writeBytes(Long.toString(new File(logLocation, LogName.STDOUT
-        .toString()).length() - prevOutLength)
-        + "\n" + LogName.STDERR + ":");
-    dos.writeBytes(Long.toString(prevErrLength) + " ");
-    dos.writeBytes(Long.toString(new File(logLocation, LogName.STDERR
-        .toString()).length() - prevErrLength)
-        + "\n" + LogName.SYSLOG.toString() + ":");
-    dos.writeBytes(Long.toString(prevLogLength) + " ");
-    dos.writeBytes(Long.toString(new File(logLocation, LogName.SYSLOG
-        .toString()).length() - prevLogLength)
-        + "\n");
-    dos.close();
+    try{
+      dos.writeBytes(LogFileDetail.LOCATION + logLocation + "\n"
+          + LogName.STDOUT.toString() + ":");
+      dos.writeBytes(Long.toString(prevOutLength) + " ");
+      dos.writeBytes(Long.toString(new File(logLocation, LogName.STDOUT
+          .toString()).length() - prevOutLength)
+          + "\n" + LogName.STDERR + ":");
+      dos.writeBytes(Long.toString(prevErrLength) + " ");
+      dos.writeBytes(Long.toString(new File(logLocation, LogName.STDERR
+          .toString()).length() - prevErrLength)
+          + "\n" + LogName.SYSLOG.toString() + ":");
+      dos.writeBytes(Long.toString(prevLogLength) + " ");
+      dos.writeBytes(Long.toString(new File(logLocation, LogName.SYSLOG
+          .toString()).length() - prevLogLength)
+          + "\n");
+      dos.close();
+      dos = null;
+    } finally {
+      IOUtils.cleanup(LOG, dos);
+    }
 
     File indexFile = getIndexFile(currentTaskid, isCleanup);
     Path indexFilePath = new Path(indexFile.getAbsolutePath());

EventWriter.java

@@ -22,6 +22,7 @@ import java.io.IOException;
 import java.util.Iterator;
 
 import org.apache.hadoop.fs.FSDataOutputStream;
+import org.apache.hadoop.io.IOUtils;
 import org.apache.hadoop.mapreduce.Counter;
 import org.apache.hadoop.mapreduce.CounterGroup;
 import org.apache.hadoop.mapreduce.Counters;
@@ -33,6 +34,8 @@ import org.apache.avro.io.DatumWriter;
 import org.apache.avro.specific.SpecificDatumWriter;
 import org.apache.avro.generic.GenericData;
 import org.apache.avro.util.Utf8;
+import org.apache.commons.logging.Log;
+import org.apache.commons.logging.LogFactory;
 
 /**
  * Event Writer is an utility class used to write events to the underlying
@@ -47,6 +50,7 @@ class EventWriter {
   private DatumWriter<Event> writer =
     new SpecificDatumWriter<Event>(Event.class);
   private Encoder encoder;
+  private static final Log LOG = LogFactory.getLog(EventWriter.class);
 
   EventWriter(FSDataOutputStream out) throws IOException {
     this.out = out;
@@ -72,8 +76,13 @@ class EventWriter {
   }
 
   void close() throws IOException {
-    encoder.flush();
-    out.close();
+    try {
+      encoder.flush();
+      out.close();
+      out = null;
+    } finally {
+      IOUtils.cleanup(LOG, out);
+    }
   }
 
   private static final Schema GROUPS =

TotalOrderPartitioner.java

@@ -23,6 +23,8 @@ import java.lang.reflect.Array;
 import java.util.ArrayList;
 import java.util.Arrays;
 
+import org.apache.commons.logging.Log;
+import org.apache.commons.logging.LogFactory;
 import org.apache.hadoop.classification.InterfaceAudience;
 import org.apache.hadoop.classification.InterfaceStability;
 import org.apache.hadoop.conf.Configurable;
@@ -30,6 +32,7 @@ import org.apache.hadoop.conf.Configuration;
 import org.apache.hadoop.fs.FileSystem;
 import org.apache.hadoop.fs.Path;
 import org.apache.hadoop.io.BinaryComparable;
+import org.apache.hadoop.io.IOUtils;
 import org.apache.hadoop.io.NullWritable;
 import org.apache.hadoop.io.SequenceFile;
 import org.apache.hadoop.io.RawComparator;
@@ -56,6 +59,7 @@ public class TotalOrderPartitioner<K extends WritableComparable<?>,V>
   public static final String NATURAL_ORDER =
     "mapreduce.totalorderpartitioner.naturalorder";
   Configuration conf;
+  private static final Log LOG = LogFactory.getLog(TotalOrderPartitioner.class);
 
   public TotalOrderPartitioner() { }
@@ -298,11 +302,16 @@ public class TotalOrderPartitioner<K extends WritableComparable<?>,V>
     ArrayList<K> parts = new ArrayList<K>();
     K key = ReflectionUtils.newInstance(keyClass, conf);
     NullWritable value = NullWritable.get();
-    while (reader.next(key, value)) {
-      parts.add(key);
-      key = ReflectionUtils.newInstance(keyClass, conf);
-    }
-    reader.close();
+    try {
+      while (reader.next(key, value)) {
+        parts.add(key);
+        key = ReflectionUtils.newInstance(keyClass, conf);
+      }
+      reader.close();
+      reader = null;
+    } finally {
+      IOUtils.cleanup(LOG, reader);
+    }
     return parts.toArray((K[])Array.newInstance(keyClass, parts.size()));
   }