HBASE-17057 Minor compactions should also drop page cache (Ashu Pachauri)

Signed-off-by: Gary Helmling <garyh@apache.org>
This commit is contained in:
Ashu Pachauri 2016-11-30 15:47:59 -08:00 committed by Gary Helmling
parent b0780bdc63
commit 4b8195f22c
2 changed files with 39 additions and 5 deletions

View File

@ -752,6 +752,24 @@ possible configurations would overwhelm and obscure the important.
which occurs after the marker's timestamp plus the value of this setting, in milliseconds. which occurs after the marker's timestamp plus the value of this setting, in milliseconds.
</description> </description>
</property> </property>
<property>
<name>hbase.regionserver.majorcompaction.pagecache.drop</name>
<value>true</value>
<description>Specifies whether to drop pages read/written into the system page cache by
major compactions. Setting it to true helps prevent major compactions from
polluting the page cache, which is almost always required, especially for clusters
with low/moderate memory to storage ratio.</description>
</property>
<property>
<name>hbase.regionserver.minorcompaction.pagecache.drop</name>
<value>true</value>
<description>Specifies whether to drop pages read/written into the system page cache by
minor compactions. Setting it to true helps prevent minor compactions from
polluting the page cache, which is most beneficial on clusters with low
memory to storage ratio or very write heavy clusters. You may want to set it to
false under moderate to low write workload when bulk of the reads are
on the most recently written data.</description>
</property>
<property> <property>
<name>hbase.storescanner.parallel.seek.enable</name> <name>hbase.storescanner.parallel.seek.enable</name>
<value>false</value> <value>false</value>

View File

@ -77,6 +77,15 @@ public abstract class Compactor<T extends CellSink> {
/** specify how many days to keep MVCC values during major compaction **/ /** specify how many days to keep MVCC values during major compaction **/
protected int keepSeqIdPeriod; protected int keepSeqIdPeriod;
// Configs that drive whether we drop page cache behind compactions
protected static final String MAJOR_COMPACTION_DROP_CACHE =
"hbase.regionserver.majorcompaction.pagecache.drop";
protected static final String MINOR_COMPACTION_DROP_CACHE =
"hbase.regionserver.minorcompaction.pagecache.drop";
private boolean dropCacheMajor;
private boolean dropCacheMinor;
//TODO: depending on Store is not good but, realistically, all compactors currently do. //TODO: depending on Store is not good but, realistically, all compactors currently do.
Compactor(final Configuration conf, final Store store) { Compactor(final Configuration conf, final Store store) {
this.conf = conf; this.conf = conf;
@ -87,6 +96,8 @@ public abstract class Compactor<T extends CellSink> {
Compression.Algorithm.NONE : this.store.getFamily().getCompactionCompression(); Compression.Algorithm.NONE : this.store.getFamily().getCompactionCompression();
this.keepSeqIdPeriod = Math.max(this.conf.getInt(HConstants.KEEP_SEQID_PERIOD, this.keepSeqIdPeriod = Math.max(this.conf.getInt(HConstants.KEEP_SEQID_PERIOD,
HConstants.MIN_KEEP_SEQID_PERIOD), HConstants.MIN_KEEP_SEQID_PERIOD); HConstants.MIN_KEEP_SEQID_PERIOD), HConstants.MIN_KEEP_SEQID_PERIOD);
this.dropCacheMajor = conf.getBoolean(MAJOR_COMPACTION_DROP_CACHE, true);
this.dropCacheMinor = conf.getBoolean(MINOR_COMPACTION_DROP_CACHE, true);
} }
public interface CellSink { public interface CellSink {
@ -267,6 +278,13 @@ public abstract class Compactor<T extends CellSink> {
List<StoreFileScanner> scanners; List<StoreFileScanner> scanners;
Collection<StoreFile> readersToClose; Collection<StoreFile> readersToClose;
T writer = null; T writer = null;
boolean dropCache;
if (request.isMajor() || request.isAllFiles()) {
dropCache = this.dropCacheMajor;
} else {
dropCache = this.dropCacheMinor;
}
if (this.conf.getBoolean("hbase.regionserver.compaction.private.readers", true)) { if (this.conf.getBoolean("hbase.regionserver.compaction.private.readers", true)) {
// clone all StoreFiles, so we'll do the compaction on a independent copy of StoreFiles, // clone all StoreFiles, so we'll do the compaction on a independent copy of StoreFiles,
// HFiles, and their readers // HFiles, and their readers
@ -274,12 +292,10 @@ public abstract class Compactor<T extends CellSink> {
for (StoreFile f : request.getFiles()) { for (StoreFile f : request.getFiles()) {
readersToClose.add(f.cloneForReader()); readersToClose.add(f.cloneForReader());
} }
scanners = createFileScanners(readersToClose, smallestReadPoint, scanners = createFileScanners(readersToClose, smallestReadPoint, dropCache);
store.throttleCompaction(request.getSize()));
} else { } else {
readersToClose = Collections.emptyList(); readersToClose = Collections.emptyList();
scanners = createFileScanners(request.getFiles(), smallestReadPoint, scanners = createFileScanners(request.getFiles(), smallestReadPoint, dropCache);
store.throttleCompaction(request.getSize()));
} }
InternalScanner scanner = null; InternalScanner scanner = null;
boolean finished = false; boolean finished = false;
@ -301,7 +317,7 @@ public abstract class Compactor<T extends CellSink> {
smallestReadPoint = Math.min(fd.minSeqIdToKeep, smallestReadPoint); smallestReadPoint = Math.min(fd.minSeqIdToKeep, smallestReadPoint);
cleanSeqId = true; cleanSeqId = true;
} }
writer = sinkFactory.createWriter(scanner, fd, store.throttleCompaction(request.getSize())); writer = sinkFactory.createWriter(scanner, fd, dropCache);
finished = finished =
performCompaction(scanner, writer, smallestReadPoint, cleanSeqId, throughputController); performCompaction(scanner, writer, smallestReadPoint, cleanSeqId, throughputController);
if (!finished) { if (!finished) {