MAPREDUCE-6751. Add debug log message when splitting is not possible due to unsplittable compression. (Peter Vary via rchiang)

This commit is contained in:
Ray Chiang 2016-08-16 12:13:22 -07:00
parent b047bc7270
commit 6c154abd33
3 changed files with 18 additions and 0 deletions

View File

@@ -369,6 +369,13 @@ public abstract class FileInputFormat<K, V> implements InputFormat<K, V> {
splitHosts[0], splitHosts[1])); splitHosts[0], splitHosts[1]));
} }
} else { } else {
if (LOG.isDebugEnabled()) {
// Log only if the file is big enough to have been split
if (length > Math.min(file.getBlockSize(), minSize)) {
LOG.debug("File is not splittable so no parallelization "
+ "is possible: " + file.getPath());
}
}
String[][] splitHosts = getSplitHostsAndCachedHosts(blkLocations,0,length,clusterMap); String[][] splitHosts = getSplitHostsAndCachedHosts(blkLocations,0,length,clusterMap);
splits.add(makeSplit(path, 0, length, splitHosts[0], splitHosts[1])); splits.add(makeSplit(path, 0, length, splitHosts[0], splitHosts[1]));
} }

View File

@@ -600,6 +600,10 @@ public abstract class CombineFileInputFormat<K, V>
if (!isSplitable) { if (!isSplitable) {
// if the file is not splitable, just create the one block with // if the file is not splitable, just create the one block with
// full file length // full file length
if (LOG.isDebugEnabled()) {
LOG.debug("File is not splittable so no parallelization "
+ "is possible: " + stat.getPath());
}
blocks = new OneBlockInfo[1]; blocks = new OneBlockInfo[1];
fileSize = stat.getLen(); fileSize = stat.getLen();
blocks[0] = new OneBlockInfo(stat.getPath(), 0, fileSize, blocks[0] = new OneBlockInfo(stat.getPath(), 0, fileSize,

View File

@@ -422,6 +422,13 @@ public abstract class FileInputFormat<K, V> extends InputFormat<K, V> {
blkLocations[blkIndex].getCachedHosts())); blkLocations[blkIndex].getCachedHosts()));
} }
} else { // not splitable } else { // not splitable
if (LOG.isDebugEnabled()) {
// Log only if the file is big enough to have been split
if (length > Math.min(file.getBlockSize(), minSize)) {
LOG.debug("File is not splittable so no parallelization "
+ "is possible: " + file.getPath());
}
}
splits.add(makeSplit(path, 0, length, blkLocations[0].getHosts(), splits.add(makeSplit(path, 0, length, blkLocations[0].getHosts(),
blkLocations[0].getCachedHosts())); blkLocations[0].getCachedHosts()));
} }