LUCENE-7657: Fixed potential memory leak when a (Span)TermQuery that wraps a TermContext is cached.

This commit is contained in:
Adrien Grand 2017-01-25 16:10:47 +01:00
parent 9899cbd031
commit f530142845
7 changed files with 39 additions and 20 deletions

View File

@ -118,6 +118,13 @@ Build
* LUCENE-7653: Update randomizedtesting to version 2.5.0. (Dawid Weiss) * LUCENE-7653: Update randomizedtesting to version 2.5.0. (Dawid Weiss)
======================= Lucene 6.4.1 =======================
Bug Fixes
* LUCENE-7657: Fixed potential memory leak in the case that a (Span)TermQuery
with a TermContext is cached. (Adrien Grand)
======================= Lucene 6.4.0 ======================= ======================= Lucene 6.4.0 =======================
API Changes API Changes

View File

@ -32,7 +32,12 @@ public abstract class IndexReaderContext {
public final int docBaseInParent; public final int docBaseInParent;
/** the ord for this reader in the parent, <tt>0</tt> if parent is null */ /** the ord for this reader in the parent, <tt>0</tt> if parent is null */
public final int ordInParent; public final int ordInParent;
// An object that uniquely identifies this context without referencing
// segments. The goal is to make it fine to have references to this
// identity object, even after the index reader has been closed
final Object identity = new Object();
IndexReaderContext(CompositeReaderContext parent, int ordInParent, int docBaseInParent) { IndexReaderContext(CompositeReaderContext parent, int ordInParent, int docBaseInParent) {
if (!(this instanceof CompositeReaderContext || this instanceof LeafReaderContext)) if (!(this instanceof CompositeReaderContext || this instanceof LeafReaderContext))
throw new Error("This class should never be extended by custom code!"); throw new Error("This class should never be extended by custom code!");

View File

@ -33,12 +33,8 @@ import java.util.Arrays;
*/ */
public final class TermContext { public final class TermContext {
/** Holds the {@link IndexReaderContext} of the top-level // Important: do NOT keep hard references to index readers
* {@link IndexReader}, used internally only for private final Object topReaderContextIdentity;
* asserting.
*
* @lucene.internal */
public final IndexReaderContext topReaderContext;
private final TermState[] states; private final TermState[] states;
private int docFreq; private int docFreq;
private long totalTermFreq; private long totalTermFreq;
@ -50,7 +46,7 @@ public final class TermContext {
*/ */
public TermContext(IndexReaderContext context) { public TermContext(IndexReaderContext context) {
assert context != null && context.isTopLevel; assert context != null && context.isTopLevel;
topReaderContext = context; topReaderContextIdentity = context.identity;
docFreq = 0; docFreq = 0;
totalTermFreq = 0; totalTermFreq = 0;
final int len; final int len;
@ -61,7 +57,16 @@ public final class TermContext {
} }
states = new TermState[len]; states = new TermState[len];
} }
/**
* Expert: Return whether this {@link TermContext} was built for the given
* {@link IndexReaderContext}. This is typically used for assertions.
* @lucene.internal
*/
public boolean wasBuiltFor(IndexReaderContext context) {
return topReaderContextIdentity == context.identity;
}
/** /**
* Creates a {@link TermContext} with an initial {@link TermState}, * Creates a {@link TermContext} with an initial {@link TermState},
* {@link IndexReader} pair. * {@link IndexReader} pair.

View File

@ -22,6 +22,7 @@ import java.util.Arrays;
import java.util.List; import java.util.List;
import org.apache.lucene.index.IndexReader; import org.apache.lucene.index.IndexReader;
import org.apache.lucene.index.IndexReaderContext;
import org.apache.lucene.index.LeafReaderContext; import org.apache.lucene.index.LeafReaderContext;
import org.apache.lucene.index.Term; import org.apache.lucene.index.Term;
import org.apache.lucene.index.TermContext; import org.apache.lucene.index.TermContext;
@ -264,7 +265,7 @@ public final class BlendedTermQuery extends Query {
public final Query rewrite(IndexReader reader) throws IOException { public final Query rewrite(IndexReader reader) throws IOException {
final TermContext[] contexts = Arrays.copyOf(this.contexts, this.contexts.length); final TermContext[] contexts = Arrays.copyOf(this.contexts, this.contexts.length);
for (int i = 0; i < contexts.length; ++i) { for (int i = 0; i < contexts.length; ++i) {
if (contexts[i] == null || contexts[i].topReaderContext != reader.getContext()) { if (contexts[i] == null || contexts[i].wasBuiltFor(reader.getContext()) == false) {
contexts[i] = TermContext.build(reader.getContext(), terms[i]); contexts[i] = TermContext.build(reader.getContext(), terms[i]);
} }
} }
@ -284,7 +285,7 @@ public final class BlendedTermQuery extends Query {
} }
for (int i = 0; i < contexts.length; ++i) { for (int i = 0; i < contexts.length; ++i) {
contexts[i] = adjustFrequencies(contexts[i], df, ttf); contexts[i] = adjustFrequencies(reader.getContext(), contexts[i], df, ttf);
} }
Query[] termQueries = new Query[terms.length]; Query[] termQueries = new Query[terms.length];
@ -297,15 +298,16 @@ public final class BlendedTermQuery extends Query {
return rewriteMethod.rewrite(termQueries); return rewriteMethod.rewrite(termQueries);
} }
private static TermContext adjustFrequencies(TermContext ctx, int artificialDf, long artificialTtf) { private static TermContext adjustFrequencies(IndexReaderContext readerContext,
List<LeafReaderContext> leaves = ctx.topReaderContext.leaves(); TermContext ctx, int artificialDf, long artificialTtf) {
List<LeafReaderContext> leaves = readerContext.leaves();
final int len; final int len;
if (leaves == null) { if (leaves == null) {
len = 1; len = 1;
} else { } else {
len = leaves.size(); len = leaves.size();
} }
TermContext newCtx = new TermContext(ctx.topReaderContext); TermContext newCtx = new TermContext(readerContext);
for (int i = 0; i < len; ++i) { for (int i = 0; i < len; ++i) {
TermState termState = ctx.get(i); TermState termState = ctx.get(i);
if (termState == null) { if (termState == null) {

View File

@ -86,7 +86,7 @@ public class TermQuery extends Query {
@Override @Override
public Scorer scorer(LeafReaderContext context) throws IOException { public Scorer scorer(LeafReaderContext context) throws IOException {
assert termStates == null || termStates.topReaderContext == ReaderUtil.getTopLevelContext(context) : "The top-reader used to create Weight (" + termStates.topReaderContext + ") is not the same as the current reader's top-reader (" + ReaderUtil.getTopLevelContext(context);; assert termStates == null || termStates.wasBuiltFor(ReaderUtil.getTopLevelContext(context)) : "The top-reader used to create Weight is not the same as the current reader's top-reader (" + ReaderUtil.getTopLevelContext(context);;
final TermsEnum termsEnum = getTermsEnum(context); final TermsEnum termsEnum = getTermsEnum(context);
if (termsEnum == null) { if (termsEnum == null) {
return null; return null;
@ -103,7 +103,7 @@ public class TermQuery extends Query {
private TermsEnum getTermsEnum(LeafReaderContext context) throws IOException { private TermsEnum getTermsEnum(LeafReaderContext context) throws IOException {
if (termStates != null) { if (termStates != null) {
// TermQuery either used as a Query or the term states have been provided at construction time // TermQuery either used as a Query or the term states have been provided at construction time
assert termStates.topReaderContext == ReaderUtil.getTopLevelContext(context) : "The top-reader used to create Weight (" + termStates.topReaderContext + ") is not the same as the current reader's top-reader (" + ReaderUtil.getTopLevelContext(context); assert termStates.wasBuiltFor(ReaderUtil.getTopLevelContext(context)) : "The top-reader used to create Weight is not the same as the current reader's top-reader (" + ReaderUtil.getTopLevelContext(context);
final TermState state = termStates.get(context.ord); final TermState state = termStates.get(context.ord);
if (state == null) { // term is not present in that reader if (state == null) { // term is not present in that reader
assert termNotInReader(context.reader(), term) : "no termstate found but term exists in reader term=" + term; assert termNotInReader(context.reader(), term) : "no termstate found but term exists in reader term=" + term;
@ -181,7 +181,7 @@ public class TermQuery extends Query {
final IndexReaderContext context = searcher.getTopReaderContext(); final IndexReaderContext context = searcher.getTopReaderContext();
final TermContext termState; final TermContext termState;
if (perReaderTermState == null if (perReaderTermState == null
|| perReaderTermState.topReaderContext != context) { || perReaderTermState.wasBuiltFor(context) == false) {
if (needsScores) { if (needsScores) {
// make TermQuery single-pass if we don't have a PRTS or if the context // make TermQuery single-pass if we don't have a PRTS or if the context
// differs! // differs!

View File

@ -67,7 +67,7 @@ public class SpanTermQuery extends SpanQuery {
public SpanWeight createWeight(IndexSearcher searcher, boolean needsScores, float boost) throws IOException { public SpanWeight createWeight(IndexSearcher searcher, boolean needsScores, float boost) throws IOException {
final TermContext context; final TermContext context;
final IndexReaderContext topContext = searcher.getTopReaderContext(); final IndexReaderContext topContext = searcher.getTopReaderContext();
if (termContext == null || termContext.topReaderContext != topContext) { if (termContext == null || termContext.wasBuiltFor(topContext) == false) {
context = TermContext.build(topContext, term); context = TermContext.build(topContext, term);
} }
else { else {
@ -99,7 +99,7 @@ public class SpanTermQuery extends SpanQuery {
@Override @Override
public Spans getSpans(final LeafReaderContext context, Postings requiredPostings) throws IOException { public Spans getSpans(final LeafReaderContext context, Postings requiredPostings) throws IOException {
assert termContext.topReaderContext == ReaderUtil.getTopLevelContext(context) : "The top-reader used to create Weight (" + termContext.topReaderContext + ") is not the same as the current reader's top-reader (" + ReaderUtil.getTopLevelContext(context); assert termContext.wasBuiltFor(ReaderUtil.getTopLevelContext(context)) : "The top-reader used to create Weight is not the same as the current reader's top-reader (" + ReaderUtil.getTopLevelContext(context);
final TermState state = termContext.get(context.ord); final TermState state = termContext.get(context.ord);
if (state == null) { // term is not present in that reader if (state == null) { // term is not present in that reader

View File

@ -378,7 +378,7 @@ public class TermAutomatonQuery extends Query {
boolean any = false; boolean any = false;
for(Map.Entry<Integer,TermContext> ent : termStates.entrySet()) { for(Map.Entry<Integer,TermContext> ent : termStates.entrySet()) {
TermContext termContext = ent.getValue(); TermContext termContext = ent.getValue();
assert termContext.topReaderContext == ReaderUtil.getTopLevelContext(context) : "The top-reader used to create Weight (" + termContext.topReaderContext + ") is not the same as the current reader's top-reader (" + ReaderUtil.getTopLevelContext(context); assert termContext.wasBuiltFor(ReaderUtil.getTopLevelContext(context)) : "The top-reader used to create Weight is not the same as the current reader's top-reader (" + ReaderUtil.getTopLevelContext(context);
BytesRef term = idToTerm.get(ent.getKey()); BytesRef term = idToTerm.get(ent.getKey());
TermState state = termContext.get(context.ord); TermState state = termContext.get(context.ord);
if (state != null) { if (state != null) {