LUCENE-7237: LRUQueryCache now prefers returning an uncached Scorer than waiting on a lock.

This commit is contained in:
Adrien Grand 2016-04-22 14:09:44 +02:00
parent 927a44881c
commit bf232d7635
2 changed files with 154 additions and 83 deletions

View File

@ -76,6 +76,9 @@ Optimizations
* LUCENE-7238: Explicitly disable the query cache in MemoryIndex#createSearcher. * LUCENE-7238: Explicitly disable the query cache in MemoryIndex#createSearcher.
(Adrien Grand) (Adrien Grand)
* LUCENE-7237: LRUQueryCache now prefers returning an uncached Scorer than
waiting on a lock. (Adrien Grand)
Bug Fixes Bug Fixes
* LUCENE-7127: Fix corner case bugs in GeoPointDistanceQuery. (Robert Muir) * LUCENE-7127: Fix corner case bugs in GeoPointDistanceQuery. (Robert Muir)

View File

@ -29,6 +29,7 @@ import java.util.List;
import java.util.Map; import java.util.Map;
import java.util.Set; import java.util.Set;
import java.util.concurrent.atomic.AtomicBoolean; import java.util.concurrent.atomic.AtomicBoolean;
import java.util.concurrent.locks.ReentrantLock;
import java.util.function.Predicate; import java.util.function.Predicate;
import org.apache.lucene.index.LeafReader.CoreClosedListener; import org.apache.lucene.index.LeafReader.CoreClosedListener;
@ -112,6 +113,7 @@ public class LRUQueryCache implements QueryCache, Accountable {
// mostRecentlyUsedQueries. This is why write operations are performed under a lock // mostRecentlyUsedQueries. This is why write operations are performed under a lock
private final Set<Query> mostRecentlyUsedQueries; private final Set<Query> mostRecentlyUsedQueries;
private final Map<Object, LeafCache> cache; private final Map<Object, LeafCache> cache;
private final ReentrantLock lock;
// these variables are volatile so that we do not need to sync reads // these variables are volatile so that we do not need to sync reads
// but increments need to be performed under the lock // but increments need to be performed under the lock
@ -134,6 +136,7 @@ public class LRUQueryCache implements QueryCache, Accountable {
uniqueQueries = new LinkedHashMap<>(16, 0.75f, true); uniqueQueries = new LinkedHashMap<>(16, 0.75f, true);
mostRecentlyUsedQueries = uniqueQueries.keySet(); mostRecentlyUsedQueries = uniqueQueries.keySet();
cache = new IdentityHashMap<>(); cache = new IdentityHashMap<>();
lock = new ReentrantLock();
ramBytesUsed = 0; ramBytesUsed = 0;
} }
@ -182,6 +185,7 @@ public class LRUQueryCache implements QueryCache, Accountable {
* @lucene.experimental * @lucene.experimental
*/ */
protected void onHit(Object readerCoreKey, Query query) { protected void onHit(Object readerCoreKey, Query query) {
assert lock.isHeldByCurrentThread();
hitCount += 1; hitCount += 1;
} }
@ -191,6 +195,7 @@ public class LRUQueryCache implements QueryCache, Accountable {
* @lucene.experimental * @lucene.experimental
*/ */
protected void onMiss(Object readerCoreKey, Query query) { protected void onMiss(Object readerCoreKey, Query query) {
assert lock.isHeldByCurrentThread();
assert query != null; assert query != null;
missCount += 1; missCount += 1;
} }
@ -203,6 +208,7 @@ public class LRUQueryCache implements QueryCache, Accountable {
* @lucene.experimental * @lucene.experimental
*/ */
protected void onQueryCache(Query query, long ramBytesUsed) { protected void onQueryCache(Query query, long ramBytesUsed) {
assert lock.isHeldByCurrentThread();
this.ramBytesUsed += ramBytesUsed; this.ramBytesUsed += ramBytesUsed;
} }
@ -212,6 +218,7 @@ public class LRUQueryCache implements QueryCache, Accountable {
* @lucene.experimental * @lucene.experimental
*/ */
protected void onQueryEviction(Query query, long ramBytesUsed) { protected void onQueryEviction(Query query, long ramBytesUsed) {
assert lock.isHeldByCurrentThread();
this.ramBytesUsed -= ramBytesUsed; this.ramBytesUsed -= ramBytesUsed;
} }
@ -223,6 +230,7 @@ public class LRUQueryCache implements QueryCache, Accountable {
* @lucene.experimental * @lucene.experimental
*/ */
protected void onDocIdSetCache(Object readerCoreKey, long ramBytesUsed) { protected void onDocIdSetCache(Object readerCoreKey, long ramBytesUsed) {
assert lock.isHeldByCurrentThread();
cacheSize += 1; cacheSize += 1;
cacheCount += 1; cacheCount += 1;
this.ramBytesUsed += ramBytesUsed; this.ramBytesUsed += ramBytesUsed;
@ -235,6 +243,7 @@ public class LRUQueryCache implements QueryCache, Accountable {
* @lucene.experimental * @lucene.experimental
*/ */
protected void onDocIdSetEviction(Object readerCoreKey, int numEntries, long sumRamBytesUsed) { protected void onDocIdSetEviction(Object readerCoreKey, int numEntries, long sumRamBytesUsed) {
assert lock.isHeldByCurrentThread();
this.ramBytesUsed -= sumRamBytesUsed; this.ramBytesUsed -= sumRamBytesUsed;
cacheSize -= numEntries; cacheSize -= numEntries;
} }
@ -244,12 +253,14 @@ public class LRUQueryCache implements QueryCache, Accountable {
* @lucene.experimental * @lucene.experimental
*/ */
protected void onClear() { protected void onClear() {
assert lock.isHeldByCurrentThread();
ramBytesUsed = 0; ramBytesUsed = 0;
cacheSize = 0; cacheSize = 0;
} }
/** Whether evictions are required. */ /** Whether evictions are required. */
boolean requiresEviction() { boolean requiresEviction() {
assert lock.isHeldByCurrentThread();
final int size = mostRecentlyUsedQueries.size(); final int size = mostRecentlyUsedQueries.size();
if (size == 0) { if (size == 0) {
return false; return false;
@ -258,7 +269,8 @@ public class LRUQueryCache implements QueryCache, Accountable {
} }
} }
synchronized DocIdSet get(Query key, LeafReaderContext context) { DocIdSet get(Query key, LeafReaderContext context) {
assert lock.isHeldByCurrentThread();
assert key instanceof BoostQuery == false; assert key instanceof BoostQuery == false;
assert key instanceof ConstantScoreQuery == false; assert key instanceof ConstantScoreQuery == false;
final Object readerKey = context.reader().getCoreCacheKey(); final Object readerKey = context.reader().getCoreCacheKey();
@ -282,40 +294,45 @@ public class LRUQueryCache implements QueryCache, Accountable {
return cached; return cached;
} }
synchronized void putIfAbsent(Query query, LeafReaderContext context, DocIdSet set) { void putIfAbsent(Query query, LeafReaderContext context, DocIdSet set) {
// under a lock to make sure that mostRecentlyUsedQueries and cache remain sync'ed
// we don't want to have user-provided queries as keys in our cache since queries are mutable
assert query instanceof BoostQuery == false; assert query instanceof BoostQuery == false;
assert query instanceof ConstantScoreQuery == false; assert query instanceof ConstantScoreQuery == false;
Query singleton = uniqueQueries.putIfAbsent(query, query); // under a lock to make sure that mostRecentlyUsedQueries and cache remain sync'ed
if (singleton == null) { lock.lock();
onQueryCache(singleton, LINKED_HASHTABLE_RAM_BYTES_PER_ENTRY + ramBytesUsed(query)); try {
} else { Query singleton = uniqueQueries.putIfAbsent(query, query);
query = singleton; if (singleton == null) {
onQueryCache(singleton, LINKED_HASHTABLE_RAM_BYTES_PER_ENTRY + ramBytesUsed(query));
} else {
query = singleton;
}
final Object key = context.reader().getCoreCacheKey();
LeafCache leafCache = cache.get(key);
if (leafCache == null) {
leafCache = new LeafCache(key);
final LeafCache previous = cache.put(context.reader().getCoreCacheKey(), leafCache);
ramBytesUsed += HASHTABLE_RAM_BYTES_PER_ENTRY;
assert previous == null;
// we just created a new leaf cache, need to register a close listener
context.reader().addCoreClosedListener(new CoreClosedListener() {
@Override
public void onClose(Object ownerCoreCacheKey) {
clearCoreCacheKey(ownerCoreCacheKey);
}
});
}
leafCache.putIfAbsent(query, set);
evictIfNecessary();
} finally {
lock.unlock();
} }
final Object key = context.reader().getCoreCacheKey();
LeafCache leafCache = cache.get(key);
if (leafCache == null) {
leafCache = new LeafCache(key);
final LeafCache previous = cache.put(context.reader().getCoreCacheKey(), leafCache);
ramBytesUsed += HASHTABLE_RAM_BYTES_PER_ENTRY;
assert previous == null;
// we just created a new leaf cache, need to register a close listener
context.reader().addCoreClosedListener(new CoreClosedListener() {
@Override
public void onClose(Object ownerCoreCacheKey) {
clearCoreCacheKey(ownerCoreCacheKey);
}
});
}
leafCache.putIfAbsent(query, set);
evictIfNecessary();
} }
synchronized void evictIfNecessary() { void evictIfNecessary() {
assert lock.isHeldByCurrentThread();
// under a lock to make sure that mostRecentlyUsedQueries and cache keep sync'ed // under a lock to make sure that mostRecentlyUsedQueries and cache keep sync'ed
if (requiresEviction()) { if (requiresEviction()) {
Iterator<Query> iterator = mostRecentlyUsedQueries.iterator(); Iterator<Query> iterator = mostRecentlyUsedQueries.iterator();
do { do {
final Query query = iterator.next(); final Query query = iterator.next();
@ -337,31 +354,42 @@ public class LRUQueryCache implements QueryCache, Accountable {
/** /**
* Remove all cache entries for the given core cache key. * Remove all cache entries for the given core cache key.
*/ */
public synchronized void clearCoreCacheKey(Object coreKey) { public void clearCoreCacheKey(Object coreKey) {
final LeafCache leafCache = cache.remove(coreKey); lock.lock();
if (leafCache != null) { try {
ramBytesUsed -= HASHTABLE_RAM_BYTES_PER_ENTRY; final LeafCache leafCache = cache.remove(coreKey);
final int numEntries = leafCache.cache.size(); if (leafCache != null) {
if (numEntries > 0) { ramBytesUsed -= HASHTABLE_RAM_BYTES_PER_ENTRY;
onDocIdSetEviction(coreKey, numEntries, leafCache.ramBytesUsed); final int numEntries = leafCache.cache.size();
} else { if (numEntries > 0) {
assert numEntries == 0; onDocIdSetEviction(coreKey, numEntries, leafCache.ramBytesUsed);
assert leafCache.ramBytesUsed == 0; } else {
assert numEntries == 0;
assert leafCache.ramBytesUsed == 0;
}
} }
} finally {
lock.unlock();
} }
} }
/** /**
* Remove all cache entries for the given query. * Remove all cache entries for the given query.
*/ */
public synchronized void clearQuery(Query query) { public void clearQuery(Query query) {
final Query singleton = uniqueQueries.remove(query); lock.lock();
if (singleton != null) { try {
onEviction(singleton); final Query singleton = uniqueQueries.remove(query);
if (singleton != null) {
onEviction(singleton);
}
} finally {
lock.unlock();
} }
} }
private void onEviction(Query singleton) { private void onEviction(Query singleton) {
assert lock.isHeldByCurrentThread();
onQueryEviction(singleton, LINKED_HASHTABLE_RAM_BYTES_PER_ENTRY + ramBytesUsed(singleton)); onQueryEviction(singleton, LINKED_HASHTABLE_RAM_BYTES_PER_ENTRY + ramBytesUsed(singleton));
for (LeafCache leafCache : cache.values()) { for (LeafCache leafCache : cache.values()) {
leafCache.remove(singleton); leafCache.remove(singleton);
@ -371,55 +399,70 @@ public class LRUQueryCache implements QueryCache, Accountable {
/** /**
* Clear the content of this cache. * Clear the content of this cache.
*/ */
public synchronized void clear() { public void clear() {
cache.clear(); lock.lock();
mostRecentlyUsedQueries.clear(); try {
onClear(); cache.clear();
mostRecentlyUsedQueries.clear();
onClear();
} finally {
lock.unlock();
}
} }
// pkg-private for testing // pkg-private for testing
synchronized void assertConsistent() { void assertConsistent() {
if (requiresEviction()) { lock.lock();
throw new AssertionError("requires evictions: size=" + mostRecentlyUsedQueries.size() try {
+ ", maxSize=" + maxSize + ", ramBytesUsed=" + ramBytesUsed() + ", maxRamBytesUsed=" + maxRamBytesUsed); if (requiresEviction()) {
} throw new AssertionError("requires evictions: size=" + mostRecentlyUsedQueries.size()
for (LeafCache leafCache : cache.values()) { + ", maxSize=" + maxSize + ", ramBytesUsed=" + ramBytesUsed() + ", maxRamBytesUsed=" + maxRamBytesUsed);
Set<Query> keys = Collections.newSetFromMap(new IdentityHashMap<>());
keys.addAll(leafCache.cache.keySet());
keys.removeAll(mostRecentlyUsedQueries);
if (!keys.isEmpty()) {
throw new AssertionError("One leaf cache contains more keys than the top-level cache: " + keys);
} }
} for (LeafCache leafCache : cache.values()) {
long recomputedRamBytesUsed = Set<Query> keys = Collections.newSetFromMap(new IdentityHashMap<>());
HASHTABLE_RAM_BYTES_PER_ENTRY * cache.size() keys.addAll(leafCache.cache.keySet());
+ LINKED_HASHTABLE_RAM_BYTES_PER_ENTRY * uniqueQueries.size(); keys.removeAll(mostRecentlyUsedQueries);
for (Query query : mostRecentlyUsedQueries) { if (!keys.isEmpty()) {
recomputedRamBytesUsed += ramBytesUsed(query); throw new AssertionError("One leaf cache contains more keys than the top-level cache: " + keys);
} }
for (LeafCache leafCache : cache.values()) { }
recomputedRamBytesUsed += HASHTABLE_RAM_BYTES_PER_ENTRY * leafCache.cache.size(); long recomputedRamBytesUsed =
for (DocIdSet set : leafCache.cache.values()) { HASHTABLE_RAM_BYTES_PER_ENTRY * cache.size()
recomputedRamBytesUsed += set.ramBytesUsed(); + LINKED_HASHTABLE_RAM_BYTES_PER_ENTRY * uniqueQueries.size();
for (Query query : mostRecentlyUsedQueries) {
recomputedRamBytesUsed += ramBytesUsed(query);
}
for (LeafCache leafCache : cache.values()) {
recomputedRamBytesUsed += HASHTABLE_RAM_BYTES_PER_ENTRY * leafCache.cache.size();
for (DocIdSet set : leafCache.cache.values()) {
recomputedRamBytesUsed += set.ramBytesUsed();
}
}
if (recomputedRamBytesUsed != ramBytesUsed) {
throw new AssertionError("ramBytesUsed mismatch : " + ramBytesUsed + " != " + recomputedRamBytesUsed);
} }
}
if (recomputedRamBytesUsed != ramBytesUsed) {
throw new AssertionError("ramBytesUsed mismatch : " + ramBytesUsed + " != " + recomputedRamBytesUsed);
}
long recomputedCacheSize = 0; long recomputedCacheSize = 0;
for (LeafCache leafCache : cache.values()) { for (LeafCache leafCache : cache.values()) {
recomputedCacheSize += leafCache.cache.size(); recomputedCacheSize += leafCache.cache.size();
} }
if (recomputedCacheSize != getCacheSize()) { if (recomputedCacheSize != getCacheSize()) {
throw new AssertionError("cacheSize mismatch : " + getCacheSize() + " != " + recomputedCacheSize); throw new AssertionError("cacheSize mismatch : " + getCacheSize() + " != " + recomputedCacheSize);
}
} finally {
lock.unlock();
} }
} }
// pkg-private for testing // pkg-private for testing
// return the list of cached queries in LRU order // return the list of cached queries in LRU order
synchronized List<Query> cachedQueries() { List<Query> cachedQueries() {
return new ArrayList<>(mostRecentlyUsedQueries); lock.lock();
try {
return new ArrayList<>(mostRecentlyUsedQueries);
} finally {
lock.unlock();
}
} }
@Override @Override
@ -438,8 +481,11 @@ public class LRUQueryCache implements QueryCache, Accountable {
@Override @Override
public Collection<Accountable> getChildResources() { public Collection<Accountable> getChildResources() {
synchronized (this) { lock.lock();
try {
return Accountables.namedAccountables("segment", cache); return Accountables.namedAccountables("segment", cache);
} finally {
lock.unlock();
} }
} }
@ -659,7 +705,18 @@ public class LRUQueryCache implements QueryCache, Accountable {
return in.scorer(context); return in.scorer(context);
} }
DocIdSet docIdSet = get(in.getQuery(), context); // If the lock is already busy, prefer using the uncached version than waiting
if (lock.tryLock() == false) {
return in.scorer(context);
}
DocIdSet docIdSet;
try {
docIdSet = get(in.getQuery(), context);
} finally {
lock.unlock();
}
if (docIdSet == null) { if (docIdSet == null) {
if (policy.shouldCache(in.getQuery())) { if (policy.shouldCache(in.getQuery())) {
docIdSet = cache(context); docIdSet = cache(context);
@ -692,7 +749,18 @@ public class LRUQueryCache implements QueryCache, Accountable {
return in.bulkScorer(context); return in.bulkScorer(context);
} }
DocIdSet docIdSet = get(in.getQuery(), context); // If the lock is already busy, prefer using the uncached version than waiting
if (lock.tryLock() == false) {
return in.bulkScorer(context);
}
DocIdSet docIdSet;
try {
docIdSet = get(in.getQuery(), context);
} finally {
lock.unlock();
}
if (docIdSet == null) { if (docIdSet == null) {
if (policy.shouldCache(in.getQuery())) { if (policy.shouldCache(in.getQuery())) {
docIdSet = cache(context); docIdSet = cache(context);