HDFS-10713. Throttle FsNameSystem lock warnings. Contributed by Hanisha Koneru.

(cherry-picked from a349c54603)
This commit is contained in:
Arpit Agarwal 2016-09-27 09:00:39 -07:00 committed by Zhe Zhang
parent 7a2d602ae0
commit c08346ea2d
4 changed files with 165 additions and 36 deletions

View File

@ -386,6 +386,12 @@ public class DFSConfigKeys extends CommonConfigurationKeys {
"dfs.namenode.read-lock-reporting-threshold-ms"; "dfs.namenode.read-lock-reporting-threshold-ms";
public static final long DFS_NAMENODE_READ_LOCK_REPORTING_THRESHOLD_MS_DEFAULT = 5000L; public static final long DFS_NAMENODE_READ_LOCK_REPORTING_THRESHOLD_MS_DEFAULT = 5000L;
// Threshold for how long the lock warnings must be suppressed
public static final String DFS_LOCK_SUPPRESS_WARNING_INTERVAL_KEY =
"dfs.lock.suppress.warning.interval";
public static final long DFS_LOCK_SUPPRESS_WARNING_INTERVAL_DEFAULT =
10000; //ms
//Following keys have no defaults //Following keys have no defaults
public static final String DFS_DATANODE_DATA_DIR_KEY = "dfs.datanode.data.dir"; public static final String DFS_DATANODE_DATA_DIR_KEY = "dfs.datanode.data.dir";
public static final String DFS_NAMENODE_HTTPS_PORT_KEY = "dfs.https.port"; public static final String DFS_NAMENODE_HTTPS_PORT_KEY = "dfs.https.port";

View File

@ -75,6 +75,8 @@ import static org.apache.hadoop.hdfs.DFSConfigKeys.DFS_NAMENODE_WRITE_LOCK_REPOR
import static org.apache.hadoop.hdfs.DFSConfigKeys.DFS_NAMENODE_WRITE_LOCK_REPORTING_THRESHOLD_MS_DEFAULT; import static org.apache.hadoop.hdfs.DFSConfigKeys.DFS_NAMENODE_WRITE_LOCK_REPORTING_THRESHOLD_MS_DEFAULT;
import static org.apache.hadoop.hdfs.DFSConfigKeys.DFS_NAMENODE_READ_LOCK_REPORTING_THRESHOLD_MS_KEY; import static org.apache.hadoop.hdfs.DFSConfigKeys.DFS_NAMENODE_READ_LOCK_REPORTING_THRESHOLD_MS_KEY;
import static org.apache.hadoop.hdfs.DFSConfigKeys.DFS_NAMENODE_READ_LOCK_REPORTING_THRESHOLD_MS_DEFAULT; import static org.apache.hadoop.hdfs.DFSConfigKeys.DFS_NAMENODE_READ_LOCK_REPORTING_THRESHOLD_MS_DEFAULT;
import static org.apache.hadoop.hdfs.DFSConfigKeys.DFS_LOCK_SUPPRESS_WARNING_INTERVAL_KEY;
import static org.apache.hadoop.hdfs.DFSConfigKeys.DFS_LOCK_SUPPRESS_WARNING_INTERVAL_DEFAULT;
import static org.apache.hadoop.hdfs.DFSConfigKeys.DFS_NAMENODE_RETRY_CACHE_EXPIRYTIME_MILLIS_DEFAULT; import static org.apache.hadoop.hdfs.DFSConfigKeys.DFS_NAMENODE_RETRY_CACHE_EXPIRYTIME_MILLIS_DEFAULT;
import static org.apache.hadoop.hdfs.DFSConfigKeys.DFS_NAMENODE_RETRY_CACHE_EXPIRYTIME_MILLIS_KEY; import static org.apache.hadoop.hdfs.DFSConfigKeys.DFS_NAMENODE_RETRY_CACHE_EXPIRYTIME_MILLIS_KEY;
import static org.apache.hadoop.hdfs.DFSConfigKeys.DFS_NAMENODE_RETRY_CACHE_HEAP_PERCENT_DEFAULT; import static org.apache.hadoop.hdfs.DFSConfigKeys.DFS_NAMENODE_RETRY_CACHE_HEAP_PERCENT_DEFAULT;
@ -128,6 +130,8 @@ import java.util.Map;
import java.util.Set; import java.util.Set;
import java.util.TreeMap; import java.util.TreeMap;
import java.util.concurrent.TimeUnit; import java.util.concurrent.TimeUnit;
import java.util.concurrent.atomic.AtomicInteger;
import java.util.concurrent.atomic.AtomicLong;
import java.util.concurrent.locks.Condition; import java.util.concurrent.locks.Condition;
import java.util.concurrent.locks.ReentrantLock; import java.util.concurrent.locks.ReentrantLock;
import java.util.concurrent.locks.ReentrantReadWriteLock; import java.util.concurrent.locks.ReentrantReadWriteLock;
@ -288,6 +292,7 @@ import org.apache.hadoop.util.Daemon;
import org.apache.hadoop.util.DataChecksum; import org.apache.hadoop.util.DataChecksum;
import org.apache.hadoop.util.ReflectionUtils; import org.apache.hadoop.util.ReflectionUtils;
import org.apache.hadoop.util.StringUtils; import org.apache.hadoop.util.StringUtils;
import org.apache.hadoop.util.Timer;
import org.apache.hadoop.util.VersionInfo; import org.apache.hadoop.util.VersionInfo;
import org.apache.log4j.Appender; import org.apache.log4j.Appender;
import org.apache.log4j.AsyncAppender; import org.apache.log4j.AsyncAppender;
@ -731,6 +736,7 @@ public class FSNamesystem implements Namesystem, FSNamesystemMBean,
fsLock = new FSNamesystemLock(fair); fsLock = new FSNamesystemLock(fair);
cond = fsLock.writeLock().newCondition(); cond = fsLock.writeLock().newCondition();
cpLock = new ReentrantLock(); cpLock = new ReentrantLock();
setTimer(new Timer());
this.fsImage = fsImage; this.fsImage = fsImage;
try { try {
@ -831,6 +837,10 @@ public class FSNamesystem implements Namesystem, FSNamesystemMBean,
DFS_NAMENODE_READ_LOCK_REPORTING_THRESHOLD_MS_KEY, DFS_NAMENODE_READ_LOCK_REPORTING_THRESHOLD_MS_KEY,
DFS_NAMENODE_READ_LOCK_REPORTING_THRESHOLD_MS_DEFAULT); DFS_NAMENODE_READ_LOCK_REPORTING_THRESHOLD_MS_DEFAULT);
this.lockSuppressWarningInterval = conf.getTimeDuration(
DFS_LOCK_SUPPRESS_WARNING_INTERVAL_KEY,
DFS_LOCK_SUPPRESS_WARNING_INTERVAL_DEFAULT, TimeUnit.MILLISECONDS);
// For testing purposes, allow the DT secret manager to be started regardless // For testing purposes, allow the DT secret manager to be started regardless
// of whether security is enabled. // of whether security is enabled.
alwaysUseDelegationTokensForTests = conf.getBoolean( alwaysUseDelegationTokensForTests = conf.getBoolean(
@ -1483,12 +1493,20 @@ public class FSNamesystem implements Namesystem, FSNamesystemMBean,
return Util.stringCollectionAsURIs(dirNames); return Util.stringCollectionAsURIs(dirNames);
} }
private final long lockSuppressWarningInterval;
/** Threshold (ms) for long holding write lock report. */ /** Threshold (ms) for long holding write lock report. */
private long writeLockReportingThreshold; private final long writeLockReportingThreshold;
private int numWriteLockWarningsSuppressed = 0;
private long timeStampOfLastWriteLockReport = 0;
private long longestWriteLockHeldInterval = 0;
/** Last time stamp for write lock. Keep the longest one for multi-entrance.*/ /** Last time stamp for write lock. Keep the longest one for multi-entrance.*/
private long writeLockHeldTimeStamp; private long writeLockHeldTimeStamp;
/** Threshold (ms) for long holding read lock report. */ /** Threshold (ms) for long holding read lock report. */
private long readLockReportingThreshold; private long readLockReportingThreshold;
private AtomicInteger numReadLockWarningsSuppressed = new AtomicInteger(0);
private AtomicLong timeStampOfLastReadLockReport = new AtomicLong(0);
private AtomicLong longestReadLockHeldInterval = new AtomicLong(0);
private Timer timer;
/** /**
* Last time stamp for read lock. Keep the longest one for * Last time stamp for read lock. Keep the longest one for
* multi-entrance. This is ThreadLocal since there could be * multi-entrance. This is ThreadLocal since there could be
@ -1506,48 +1524,99 @@ public class FSNamesystem implements Namesystem, FSNamesystemMBean,
public void readLock() { public void readLock() {
this.fsLock.readLock().lock(); this.fsLock.readLock().lock();
if (this.fsLock.getReadHoldCount() == 1) { if (this.fsLock.getReadHoldCount() == 1) {
readLockHeldTimeStamp.set(monotonicNow()); readLockHeldTimeStamp.set(timer.monotonicNow());
} }
} }
@Override @Override
public void readUnlock() { public void readUnlock() {
final boolean needReport = this.fsLock.getReadHoldCount() == 1; final boolean needReport = this.fsLock.getReadHoldCount() == 1;
final long readLockInterval = monotonicNow() - readLockHeldTimeStamp.get(); final long readLockInterval = timer.monotonicNow() -
this.fsLock.readLock().unlock(); readLockHeldTimeStamp.get();
if (needReport) { if (needReport) {
readLockHeldTimeStamp.remove(); readLockHeldTimeStamp.remove();
if (readLockInterval > this.readLockReportingThreshold) {
LOG.info("FSNamesystem read lock held for " + readLockInterval +
" ms via\n" + StringUtils.getStackTrace(Thread.currentThread()));
} }
this.fsLock.readLock().unlock();
if (needReport && readLockInterval >= this.readLockReportingThreshold) {
long localLongestReadLock;
do {
localLongestReadLock = longestReadLockHeldInterval.get();
} while (localLongestReadLock - readLockInterval < 0
&& !longestReadLockHeldInterval.compareAndSet(localLongestReadLock,
readLockInterval));
long localTimeStampOfLastReadLockReport;
long now;
do {
now = timer.monotonicNow();
localTimeStampOfLastReadLockReport = timeStampOfLastReadLockReport
.get();
if (now - localTimeStampOfLastReadLockReport <
lockSuppressWarningInterval) {
numReadLockWarningsSuppressed.incrementAndGet();
return;
}
} while (!timeStampOfLastReadLockReport.compareAndSet(
localTimeStampOfLastReadLockReport, now));
int numSuppressedWarnings = numReadLockWarningsSuppressed.getAndSet(0);
long longestLockHeldInterval = longestReadLockHeldInterval.getAndSet(0);
LOG.info("FSNamesystem read lock held for " + readLockInterval +
" ms via\n" + StringUtils.getStackTrace(Thread.currentThread()) +
"\tNumber of suppressed read-lock reports: " +
numSuppressedWarnings + "\n\tLongest read-lock held interval: " +
longestLockHeldInterval);
} }
} }
@Override @Override
public void writeLock() { public void writeLock() {
this.fsLock.writeLock().lock(); this.fsLock.writeLock().lock();
if (fsLock.getWriteHoldCount() == 1) { if (fsLock.getWriteHoldCount() == 1) {
writeLockHeldTimeStamp = monotonicNow(); writeLockHeldTimeStamp = timer.monotonicNow();
} }
} }
@Override @Override
public void writeLockInterruptibly() throws InterruptedException { public void writeLockInterruptibly() throws InterruptedException {
this.fsLock.writeLock().lockInterruptibly(); this.fsLock.writeLock().lockInterruptibly();
if (fsLock.getWriteHoldCount() == 1) { if (fsLock.getWriteHoldCount() == 1) {
writeLockHeldTimeStamp = monotonicNow(); writeLockHeldTimeStamp = timer.monotonicNow();
} }
} }
@Override @Override
public void writeUnlock() { public void writeUnlock() {
final boolean needReport = fsLock.getWriteHoldCount() == 1 && final boolean needReport = fsLock.getWriteHoldCount() == 1 &&
fsLock.isWriteLockedByCurrentThread(); fsLock.isWriteLockedByCurrentThread();
final long writeLockInterval = monotonicNow() - writeLockHeldTimeStamp; final long currentTime = timer.monotonicNow();
final long writeLockInterval = currentTime - writeLockHeldTimeStamp;
boolean logReport = false;
int numSuppressedWarnings = 0;
long longestLockHeldInterval = 0;
if (needReport && writeLockInterval >= this.writeLockReportingThreshold) {
if (writeLockInterval > longestWriteLockHeldInterval) {
longestWriteLockHeldInterval = writeLockInterval;
}
if (currentTime - timeStampOfLastWriteLockReport > this
.lockSuppressWarningInterval) {
logReport = true;
numSuppressedWarnings = numWriteLockWarningsSuppressed;
numWriteLockWarningsSuppressed = 0;
longestLockHeldInterval = longestWriteLockHeldInterval;
longestWriteLockHeldInterval = 0;
timeStampOfLastWriteLockReport = currentTime;
} else {
numWriteLockWarningsSuppressed++;
}
}
this.fsLock.writeLock().unlock(); this.fsLock.writeLock().unlock();
if (needReport && writeLockInterval >= this.writeLockReportingThreshold) { if (logReport) {
LOG.info("FSNamesystem write lock held for " + writeLockInterval + LOG.info("FSNamesystem write lock held for " + writeLockInterval +
" ms via\n" + StringUtils.getStackTrace(Thread.currentThread())); " ms via\n" + StringUtils.getStackTrace(Thread.currentThread()) +
"\tNumber of suppressed write-lock reports: " +
numSuppressedWarnings + "\n\tLongest write-lock held interval: " +
longestLockHeldInterval);
} }
} }
@Override @Override
@ -8329,5 +8398,9 @@ public class FSNamesystem implements Namesystem, FSNamesystemMBean,
} }
} }
@VisibleForTesting
void setTimer(Timer newTimer) {
this.timer = newTimer;
}
} }

View File

@ -2530,4 +2530,11 @@
Keytab based login can be enabled with dfs.balancer.keytab.enabled. Keytab based login can be enabled with dfs.balancer.keytab.enabled.
</description> </description>
</property> </property>
<property>
<name>dfs.lock.suppress.warning.interval</name>
<value>10s</value>
<description>Instrumentation reporting long critical sections will suppress
consecutive warnings within this interval.</description>
</property>
</configuration> </configuration>

View File

@ -20,12 +20,14 @@ package org.apache.hadoop.hdfs.server.namenode;
import static org.apache.hadoop.hdfs.DFSConfigKeys.DFS_NAMENODE_EDITS_DIR_KEY; import static org.apache.hadoop.hdfs.DFSConfigKeys.DFS_NAMENODE_EDITS_DIR_KEY;
import static org.apache.hadoop.hdfs.DFSConfigKeys.DFS_NAMENODE_NAME_DIR_KEY; import static org.apache.hadoop.hdfs.DFSConfigKeys.DFS_NAMENODE_NAME_DIR_KEY;
import org.apache.hadoop.util.FakeTimer;
import static org.hamcrest.CoreMatchers.either;
import static org.hamcrest.CoreMatchers.instanceOf;
import static org.junit.Assert.*; import static org.junit.Assert.*;
import java.io.File; import java.io.File;
import java.io.IOException; import java.io.IOException;
import java.net.URI; import java.net.URI;
import java.util.ArrayList;
import java.util.Collection; import java.util.Collection;
import com.google.common.base.Supplier; import com.google.common.base.Supplier;
@ -52,8 +54,8 @@ import org.mockito.internal.util.reflection.Whitebox;
import java.util.concurrent.CountDownLatch; import java.util.concurrent.CountDownLatch;
import java.util.concurrent.ExecutorService; import java.util.concurrent.ExecutorService;
import java.util.concurrent.Executors; import java.util.concurrent.Executors;
import java.util.concurrent.TimeUnit;
import java.util.concurrent.TimeoutException; import java.util.concurrent.TimeoutException;
import java.util.regex.Matcher;
import java.util.regex.Pattern; import java.util.regex.Pattern;
public class TestFSNamesystem { public class TestFSNamesystem {
@ -267,45 +269,54 @@ public class TestFSNamesystem {
@Test(timeout=45000) @Test(timeout=45000)
public void testFSWriteLockLongHoldingReport() throws Exception { public void testFSWriteLockLongHoldingReport() throws Exception {
final long writeLockReportingThreshold = 100L; final long writeLockReportingThreshold = 100L;
final long writeLockSuppressWarningInterval = 10000L;
Configuration conf = new Configuration(); Configuration conf = new Configuration();
conf.setLong(DFSConfigKeys.DFS_NAMENODE_WRITE_LOCK_REPORTING_THRESHOLD_MS_KEY, conf.setLong(DFSConfigKeys.DFS_NAMENODE_WRITE_LOCK_REPORTING_THRESHOLD_MS_KEY,
writeLockReportingThreshold); writeLockReportingThreshold);
conf.setTimeDuration(DFSConfigKeys.DFS_LOCK_SUPPRESS_WARNING_INTERVAL_KEY,
writeLockSuppressWarningInterval, TimeUnit.MILLISECONDS);
FSImage fsImage = Mockito.mock(FSImage.class); FSImage fsImage = Mockito.mock(FSImage.class);
FSEditLog fsEditLog = Mockito.mock(FSEditLog.class); FSEditLog fsEditLog = Mockito.mock(FSEditLog.class);
Mockito.when(fsImage.getEditLog()).thenReturn(fsEditLog); Mockito.when(fsImage.getEditLog()).thenReturn(fsEditLog);
final FSNamesystem fsn = new FSNamesystem(conf, fsImage); final FSNamesystem fsn = new FSNamesystem(conf, fsImage);
FakeTimer timer = new FakeTimer();
fsn.setTimer(timer);
timer.advance(writeLockSuppressWarningInterval);
LogCapturer logs = LogCapturer.captureLogs(FSNamesystem.LOG); LogCapturer logs = LogCapturer.captureLogs(FSNamesystem.LOG);
GenericTestUtils.setLogLevel(FSNamesystem.LOG, Level.INFO); GenericTestUtils.setLogLevel(FSNamesystem.LOG, Level.INFO);
// Don't report if the write lock is held for a short time // Don't report if the write lock is held for a short time
fsn.writeLock(); fsn.writeLock();
Thread.sleep(writeLockReportingThreshold / 2);
fsn.writeUnlock(); fsn.writeUnlock();
assertFalse(logs.getOutput().contains(GenericTestUtils.getMethodName())); assertFalse(logs.getOutput().contains(GenericTestUtils.getMethodName()));
// Report the first write lock warning if it is held for a long time
// Report if the write lock is held for a long time
fsn.writeLock(); fsn.writeLock();
Thread.sleep(writeLockReportingThreshold + 10); timer.advance(writeLockReportingThreshold + 10);
logs.clearOutput(); logs.clearOutput();
fsn.writeUnlock(); fsn.writeUnlock();
assertTrue(logs.getOutput().contains(GenericTestUtils.getMethodName())); assertTrue(logs.getOutput().contains(GenericTestUtils.getMethodName()));
// Report if the write lock is held (interruptibly) for a long time // Track but do not Report if the write lock is held (interruptibly) for
// a long time but time since last report does not exceed the suppress
// warning interval
fsn.writeLockInterruptibly(); fsn.writeLockInterruptibly();
Thread.sleep(writeLockReportingThreshold + 10); timer.advance(writeLockReportingThreshold + 10);
logs.clearOutput(); logs.clearOutput();
fsn.writeUnlock(); fsn.writeUnlock();
assertTrue(logs.getOutput().contains(GenericTestUtils.getMethodName())); assertFalse(logs.getOutput().contains(GenericTestUtils.getMethodName()));
// Report if it's held for a long time when re-entering write lock // Track but do not Report if it's held for a long time when re-entering
// write lock but time since last report does not exceed the suppress
// warning interval
fsn.writeLock(); fsn.writeLock();
Thread.sleep(writeLockReportingThreshold/ 2 + 1); timer.advance(writeLockReportingThreshold/ 2 + 1);
fsn.writeLockInterruptibly(); fsn.writeLockInterruptibly();
Thread.sleep(writeLockReportingThreshold / 2 + 1); timer.advance(writeLockReportingThreshold/ 2 + 1);
fsn.writeLock(); fsn.writeLock();
Thread.sleep(writeLockReportingThreshold / 2); timer.advance(writeLockReportingThreshold/ 2);
logs.clearOutput(); logs.clearOutput();
fsn.writeUnlock(); fsn.writeUnlock();
assertFalse(logs.getOutput().contains(GenericTestUtils.getMethodName())); assertFalse(logs.getOutput().contains(GenericTestUtils.getMethodName()));
@ -314,7 +325,18 @@ public class TestFSNamesystem {
assertFalse(logs.getOutput().contains(GenericTestUtils.getMethodName())); assertFalse(logs.getOutput().contains(GenericTestUtils.getMethodName()));
logs.clearOutput(); logs.clearOutput();
fsn.writeUnlock(); fsn.writeUnlock();
assertFalse(logs.getOutput().contains(GenericTestUtils.getMethodName()));
// Report if it's held for a long time and time since last report exceeds
// the supress warning interval
timer.advance(writeLockSuppressWarningInterval);
fsn.writeLock();
timer.advance(writeLockReportingThreshold + 100);
logs.clearOutput();
fsn.writeUnlock();
assertTrue(logs.getOutput().contains(GenericTestUtils.getMethodName())); assertTrue(logs.getOutput().contains(GenericTestUtils.getMethodName()));
assertTrue(logs.getOutput().contains("Number of suppressed write-lock " +
"reports: 2"));
} }
/** /**
@ -324,52 +346,71 @@ public class TestFSNamesystem {
@Test(timeout=45000) @Test(timeout=45000)
public void testFSReadLockLongHoldingReport() throws Exception { public void testFSReadLockLongHoldingReport() throws Exception {
final long readLockReportingThreshold = 100L; final long readLockReportingThreshold = 100L;
final long readLockSuppressWarningInterval = 10000L;
final String readLockLogStmt = "FSNamesystem read lock held for "; final String readLockLogStmt = "FSNamesystem read lock held for ";
Configuration conf = new Configuration(); Configuration conf = new Configuration();
conf.setLong( conf.setLong(
DFSConfigKeys.DFS_NAMENODE_READ_LOCK_REPORTING_THRESHOLD_MS_KEY, DFSConfigKeys.DFS_NAMENODE_READ_LOCK_REPORTING_THRESHOLD_MS_KEY,
readLockReportingThreshold); readLockReportingThreshold);
conf.setTimeDuration(DFSConfigKeys.DFS_LOCK_SUPPRESS_WARNING_INTERVAL_KEY,
readLockSuppressWarningInterval, TimeUnit.MILLISECONDS);
FSImage fsImage = Mockito.mock(FSImage.class); FSImage fsImage = Mockito.mock(FSImage.class);
FSEditLog fsEditLog = Mockito.mock(FSEditLog.class); FSEditLog fsEditLog = Mockito.mock(FSEditLog.class);
Mockito.when(fsImage.getEditLog()).thenReturn(fsEditLog); Mockito.when(fsImage.getEditLog()).thenReturn(fsEditLog);
final FSNamesystem fsn = new FSNamesystem(conf, fsImage); final FSNamesystem fsn = new FSNamesystem(conf, fsImage);
final FakeTimer timer = new FakeTimer();
fsn.setTimer(timer);
timer.advance(readLockSuppressWarningInterval);
LogCapturer logs = LogCapturer.captureLogs(FSNamesystem.LOG); LogCapturer logs = LogCapturer.captureLogs(FSNamesystem.LOG);
GenericTestUtils.setLogLevel(FSNamesystem.LOG, Level.INFO); GenericTestUtils.setLogLevel(FSNamesystem.LOG, Level.INFO);
// Don't report if the read lock is held for a short time // Don't report if the read lock is held for a short time
fsn.readLock(); fsn.readLock();
Thread.sleep(readLockReportingThreshold / 2);
fsn.readUnlock(); fsn.readUnlock();
assertFalse(logs.getOutput().contains(GenericTestUtils.getMethodName()) && assertFalse(logs.getOutput().contains(GenericTestUtils.getMethodName()) &&
logs.getOutput().contains(readLockLogStmt)); logs.getOutput().contains(readLockLogStmt));
// Report if the read lock is held for a long time // Report the first read lock warning if it is held for a long time
fsn.readLock(); fsn.readLock();
Thread.sleep(readLockReportingThreshold + 10); timer.advance(readLockReportingThreshold + 10);
logs.clearOutput(); logs.clearOutput();
fsn.readUnlock(); fsn.readUnlock();
assertTrue(logs.getOutput().contains(GenericTestUtils.getMethodName()) assertTrue(logs.getOutput().contains(GenericTestUtils.getMethodName())
&& logs.getOutput().contains(readLockLogStmt)); && logs.getOutput().contains(readLockLogStmt));
// Report if it's held for a long time when re-entering read lock // Track but do not Report if the write lock is held for a long time but
// time since last report does not exceed the suppress warning interval
fsn.readLock(); fsn.readLock();
Thread.sleep(readLockReportingThreshold / 2 + 1); timer.advance(readLockReportingThreshold + 10);
logs.clearOutput();
fsn.readUnlock();
assertFalse(logs.getOutput().contains(GenericTestUtils.getMethodName())
&& logs.getOutput().contains(readLockLogStmt));
// Track but do not Report if it's held for a long time when re-entering
// read lock but time since last report does not exceed the suppress
// warning interval
fsn.readLock(); fsn.readLock();
Thread.sleep(readLockReportingThreshold / 2 + 1); timer.advance(readLockReportingThreshold / 2 + 1);
fsn.readLock();
timer.advance(readLockReportingThreshold / 2 + 1);
logs.clearOutput(); logs.clearOutput();
fsn.readUnlock(); fsn.readUnlock();
assertFalse(logs.getOutput().contains(GenericTestUtils.getMethodName()) || assertFalse(logs.getOutput().contains(GenericTestUtils.getMethodName()) ||
logs.getOutput().contains(readLockLogStmt)); logs.getOutput().contains(readLockLogStmt));
logs.clearOutput(); logs.clearOutput();
fsn.readUnlock(); fsn.readUnlock();
assertTrue(logs.getOutput().contains(GenericTestUtils.getMethodName()) && assertFalse(logs.getOutput().contains(GenericTestUtils.getMethodName()) &&
logs.getOutput().contains(readLockLogStmt)); logs.getOutput().contains(readLockLogStmt));
// Report if it's held for a long time while another thread also has the // Report if it's held for a long time (and time since last report
// exceeds the suppress warning interval) while another thread also has the
// read lock. Let one thread hold the lock long enough to activate an // read lock. Let one thread hold the lock long enough to activate an
// alert, then have another thread grab the read lock to ensure that this // alert, then have another thread grab the read lock to ensure that this
// doesn't reset the timing. // doesn't reset the timing.
timer.advance(readLockSuppressWarningInterval);
logs.clearOutput(); logs.clearOutput();
final CountDownLatch barrier = new CountDownLatch(1); final CountDownLatch barrier = new CountDownLatch(1);
final CountDownLatch barrier2 = new CountDownLatch(1); final CountDownLatch barrier2 = new CountDownLatch(1);
@ -378,7 +419,7 @@ public class TestFSNamesystem {
public void run() { public void run() {
try { try {
fsn.readLock(); fsn.readLock();
Thread.sleep(readLockReportingThreshold + 1); timer.advance(readLockReportingThreshold + 1);
barrier.countDown(); // Allow for t2 to acquire the read lock barrier.countDown(); // Allow for t2 to acquire the read lock
barrier2.await(); // Wait until t2 has the read lock barrier2.await(); // Wait until t2 has the read lock
fsn.readUnlock(); fsn.readUnlock();
@ -413,5 +454,7 @@ public class TestFSNamesystem {
Pattern t2Pattern = Pattern.compile( Pattern t2Pattern = Pattern.compile(
String.format(stackTracePatternString, t2.getClass().getName())); String.format(stackTracePatternString, t2.getClass().getName()));
assertFalse(t2Pattern.matcher(logs.getOutput()).find()); assertFalse(t2Pattern.matcher(logs.getOutput()).find());
assertTrue(logs.getOutput().contains("Number of suppressed read-lock " +
"reports: 2"));
} }
} }