mirror of https://github.com/apache/lucene.git
LUCENE-1383: work around the 'leak' in Java's ThreadLocal to prevent Lucene from causing OutOfMemoryError in certain situations, e.g. J2EE applications
git-svn-id: https://svn.apache.org/repos/asf/lucene/java/trunk@695184 13f79535-47bb-0310-9956-ffa450edef68
This commit is contained in:
parent
f82e52e3bf
commit
ac6ee32b60
|
@ -207,6 +207,11 @@ Bug fixes
|
||||||
|
|
||||||
15. LUCENE-1351: ISOLatin1AccentFilter now cleans additional ligatures (Cedrik Lime via Grant Ingersoll)
|
15. LUCENE-1351: ISOLatin1AccentFilter now cleans additional ligatures (Cedrik Lime via Grant Ingersoll)
|
||||||
|
|
||||||
|
16. LUCENE-1383: Work around a nasty "leak" in Java's builtin
|
||||||
|
ThreadLocal, to prevent Lucene from causing unexpected
|
||||||
|
OutOfMemoryError in certain situations (notably J2EE
|
||||||
|
applications). (Chris Lu via Mike McCandless)
|
||||||
|
|
||||||
New features
|
New features
|
||||||
|
|
||||||
1. LUCENE-1137: Added Token.set/getFlags() accessors for passing more information about a Token through the analysis
|
1. LUCENE-1137: Added Token.set/getFlags() accessors for passing more information about a Token through the analysis
|
||||||
|
|
|
@ -23,6 +23,7 @@ import org.apache.lucene.store.Directory;
|
||||||
import org.apache.lucene.store.IndexInput;
|
import org.apache.lucene.store.IndexInput;
|
||||||
import org.apache.lucene.store.AlreadyClosedException;
|
import org.apache.lucene.store.AlreadyClosedException;
|
||||||
import org.apache.lucene.store.BufferedIndexInput;
|
import org.apache.lucene.store.BufferedIndexInput;
|
||||||
|
import org.apache.lucene.util.CloseableThreadLocal;
|
||||||
|
|
||||||
import java.io.ByteArrayOutputStream;
|
import java.io.ByteArrayOutputStream;
|
||||||
import java.io.IOException;
|
import java.io.IOException;
|
||||||
|
@ -58,7 +59,7 @@ final class FieldsReader {
|
||||||
// file. This will be 0 if we have our own private file.
|
// file. This will be 0 if we have our own private file.
|
||||||
private int docStoreOffset;
|
private int docStoreOffset;
|
||||||
|
|
||||||
private ThreadLocal fieldsStreamTL = new ThreadLocal();
|
private CloseableThreadLocal fieldsStreamTL = new CloseableThreadLocal();
|
||||||
|
|
||||||
FieldsReader(Directory d, String segment, FieldInfos fn) throws IOException {
|
FieldsReader(Directory d, String segment, FieldInfos fn) throws IOException {
|
||||||
this(d, segment, fn, BufferedIndexInput.BUFFER_SIZE, -1, 0);
|
this(d, segment, fn, BufferedIndexInput.BUFFER_SIZE, -1, 0);
|
||||||
|
@ -155,11 +156,7 @@ final class FieldsReader {
|
||||||
if (indexStream != null) {
|
if (indexStream != null) {
|
||||||
indexStream.close();
|
indexStream.close();
|
||||||
}
|
}
|
||||||
IndexInput localFieldsStream = (IndexInput) fieldsStreamTL.get();
|
fieldsStreamTL.close();
|
||||||
if (localFieldsStream != null) {
|
|
||||||
localFieldsStream.close();
|
|
||||||
fieldsStreamTL.set(null);
|
|
||||||
}
|
|
||||||
closed = true;
|
closed = true;
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
|
@ -36,6 +36,7 @@ import org.apache.lucene.store.Directory;
|
||||||
import org.apache.lucene.store.IndexInput;
|
import org.apache.lucene.store.IndexInput;
|
||||||
import org.apache.lucene.store.IndexOutput;
|
import org.apache.lucene.store.IndexOutput;
|
||||||
import org.apache.lucene.util.BitVector;
|
import org.apache.lucene.util.BitVector;
|
||||||
|
import org.apache.lucene.util.CloseableThreadLocal;
|
||||||
|
|
||||||
/**
|
/**
|
||||||
* @version $Id$
|
* @version $Id$
|
||||||
|
@ -50,7 +51,7 @@ class SegmentReader extends DirectoryIndexReader {
|
||||||
|
|
||||||
TermInfosReader tis;
|
TermInfosReader tis;
|
||||||
TermVectorsReader termVectorsReaderOrig = null;
|
TermVectorsReader termVectorsReaderOrig = null;
|
||||||
ThreadLocal termVectorsLocal = new ThreadLocal();
|
CloseableThreadLocal termVectorsLocal = new CloseableThreadLocal();
|
||||||
|
|
||||||
BitVector deletedDocs = null;
|
BitVector deletedDocs = null;
|
||||||
private boolean deletedDocsDirty = false;
|
private boolean deletedDocsDirty = false;
|
||||||
|
@ -616,7 +617,9 @@ class SegmentReader extends DirectoryIndexReader {
|
||||||
|
|
||||||
protected void doClose() throws IOException {
|
protected void doClose() throws IOException {
|
||||||
boolean hasReferencedReader = (referencedSegmentReader != null);
|
boolean hasReferencedReader = (referencedSegmentReader != null);
|
||||||
|
|
||||||
|
termVectorsLocal.close();
|
||||||
|
|
||||||
if (hasReferencedReader) {
|
if (hasReferencedReader) {
|
||||||
referencedSegmentReader.decRefReaderNotNorms();
|
referencedSegmentReader.decRefReaderNotNorms();
|
||||||
referencedSegmentReader = null;
|
referencedSegmentReader = null;
|
||||||
|
|
|
@ -23,6 +23,7 @@ import org.apache.lucene.store.Directory;
|
||||||
import org.apache.lucene.store.BufferedIndexInput;
|
import org.apache.lucene.store.BufferedIndexInput;
|
||||||
import org.apache.lucene.util.cache.Cache;
|
import org.apache.lucene.util.cache.Cache;
|
||||||
import org.apache.lucene.util.cache.SimpleLRUCache;
|
import org.apache.lucene.util.cache.SimpleLRUCache;
|
||||||
|
import org.apache.lucene.util.CloseableThreadLocal;
|
||||||
|
|
||||||
/** This stores a monotonically increasing set of <Term, TermInfo> pairs in a
|
/** This stores a monotonically increasing set of <Term, TermInfo> pairs in a
|
||||||
* Directory. Pairs are accessed either by Term or by ordinal position the
|
* Directory. Pairs are accessed either by Term or by ordinal position the
|
||||||
|
@ -33,7 +34,7 @@ final class TermInfosReader {
|
||||||
private String segment;
|
private String segment;
|
||||||
private FieldInfos fieldInfos;
|
private FieldInfos fieldInfos;
|
||||||
|
|
||||||
private ThreadLocal threadResources = new ThreadLocal();
|
private CloseableThreadLocal threadResources = new CloseableThreadLocal();
|
||||||
private SegmentTermEnum origEnum;
|
private SegmentTermEnum origEnum;
|
||||||
private long size;
|
private long size;
|
||||||
|
|
||||||
|
@ -143,7 +144,7 @@ final class TermInfosReader {
|
||||||
origEnum.close();
|
origEnum.close();
|
||||||
if (indexEnum != null)
|
if (indexEnum != null)
|
||||||
indexEnum.close();
|
indexEnum.close();
|
||||||
threadResources.set(null);
|
threadResources.close();
|
||||||
}
|
}
|
||||||
|
|
||||||
/** Returns the number of term/value pairs in the set. */
|
/** Returns the number of term/value pairs in the set. */
|
||||||
|
|
|
@ -0,0 +1,88 @@
|
||||||
|
package org.apache.lucene.util;
|
||||||
|
|
||||||
|
/**
|
||||||
|
* Licensed to the Apache Software Foundation (ASF) under one or more
|
||||||
|
* contributor license agreements. See the NOTICE file distributed with
|
||||||
|
* this work for additional information regarding copyright ownership.
|
||||||
|
* The ASF licenses this file to You under the Apache License, Version 2.0
|
||||||
|
* (the "License"); you may not use this file except in compliance with
|
||||||
|
* the License. You may obtain a copy of the License at
|
||||||
|
*
|
||||||
|
* http://www.apache.org/licenses/LICENSE-2.0
|
||||||
|
*
|
||||||
|
* Unless required by applicable law or agreed to in writing, software
|
||||||
|
* distributed under the License is distributed on an "AS IS" BASIS,
|
||||||
|
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||||
|
* See the License for the specific language governing permissions and
|
||||||
|
* limitations under the License.
|
||||||
|
*/
|
||||||
|
|
||||||
|
import java.util.Map;
|
||||||
|
import java.util.HashMap;
|
||||||
|
import java.util.Iterator;
|
||||||
|
import java.lang.ref.WeakReference;
|
||||||
|
|
||||||
|
/** Java's builtin ThreadLocal has a serious flaw:
 *  it can take an arbitrarily long amount of time to
 *  dereference the things you had stored in it, even once the
 *  ThreadLocal instance itself is no longer referenced.
 *  This is because there is a single, master map stored for
 *  each thread, which all ThreadLocals share, and that
 *  master map only periodically purges "stale" entries.
 *
 *  While not technically a memory leak, because eventually
 *  the memory will be reclaimed, it can take a long time
 *  and you can easily hit OutOfMemoryError because from the
 *  GC's standpoint the stale entries are not reclaimable.
 *
 *  This class works around that, by only enrolling
 *  WeakReference values into the ThreadLocal, and
 *  separately holding a hard reference to each stored
 *  value.  When you call {@link #close}, these hard
 *  references are cleared and then GC is freely able to
 *  reclaim space by objects stored in it.
 *
 *  Once closed, an instance stays closed: {@link #get}
 *  returns null and {@link #set} throws
 *  IllegalStateException. */

public final class CloseableThreadLocal {

  /** Per-thread WeakReference to the value stored by that thread. */
  private final ThreadLocal weakRefs = new ThreadLocal();

  /** Thread -> value; the hard references that keep the weakly
   *  referenced values alive until close().  Every access is made
   *  while synchronized on this map. */
  private final Map hardRefs = new HashMap();

  /** Written only while holding the hardRefs lock; volatile so
   *  that get() can check it without taking the lock. */
  private volatile boolean closed;

  /** Returns the value most recently stored by the calling thread.
   *
   *  @return the calling thread's value, or null if this thread
   *  has stored nothing, last stored null, or this instance has
   *  been closed */
  public Object get() {
    if (closed)
      return null;

    WeakReference weakRef = (WeakReference) weakRefs.get();
    if (weakRef == null)
      return null;

    // While open, the hard reference in hardRefs keeps the value
    // reachable.  If close() raced with us the referent may
    // already be gone, in which case null is the right answer
    // anyway, so no assertion here.
    return weakRef.get();
  }

  /** Stores a value for the calling thread.  Passing null clears
   *  the calling thread's value.
   *
   *  @param object the value to store, or null to clear
   *  @throws IllegalStateException if {@link #close} has already
   *  been called */
  public void set(Object object) {
    synchronized(hardRefs) {
      if (closed)
        throw new IllegalStateException("this CloseableThreadLocal is closed");

      final Thread current = Thread.currentThread();
      if (object == null) {
        // Nothing to keep alive: drop both references rather than
        // enrolling a WeakReference whose referent is null.
        weakRefs.set(null);
        hardRefs.remove(current);
      } else {
        weakRefs.set(new WeakReference(object));
        hardRefs.put(current, object);
      }

      // Purge dead threads, so their values do not stay
      // hard-referenced for the lifetime of this instance:
      for (Iterator it = hardRefs.keySet().iterator(); it.hasNext();) {
        Thread thread = (Thread) it.next();
        if (!thread.isAlive())
          it.remove();
      }
    }
  }

  /** Clears the hard refs; then, the only remaining refs to all
   *  values we were storing are weak (unless somewhere else is
   *  still using them) and so GC may reclaim them.  Calling this
   *  more than once is harmless. */
  public void close() {
    synchronized(hardRefs) {
      closed = true;
      hardRefs.clear();
    }
    // Also drop the calling thread's own weak reference.  Other
    // threads' entries cannot be reached from here; they now hold
    // only weak references.
    weakRefs.set(null);
  }
}
|
Loading…
Reference in New Issue