From 75e34cdba9b516c8e47ef0d806f6a138f0461ad6 Mon Sep 17 00:00:00 2001 From: Michael McCandless Date: Wed, 11 Aug 2010 18:19:13 +0000 Subject: [PATCH] LUCENE-2576: simplify IndexWriter's private startCommit method now that it's single thread'd (may fix this intermittent test failure); also add one missing checkpoint() in addIndexes git-svn-id: https://svn.apache.org/repos/asf/lucene/dev/trunk@984510 13f79535-47bb-0310-9956-ffa450edef68 --- .../org/apache/lucene/index/IndexWriter.java | 117 ++++++++---------- 1 file changed, 50 insertions(+), 67 deletions(-) diff --git a/lucene/src/java/org/apache/lucene/index/IndexWriter.java b/lucene/src/java/org/apache/lucene/index/IndexWriter.java index 8c2c99ae455..1ae943abaa6 100644 --- a/lucene/src/java/org/apache/lucene/index/IndexWriter.java +++ b/lucene/src/java/org/apache/lucene/index/IndexWriter.java @@ -3006,6 +3006,7 @@ public class IndexWriter implements Closeable { info.setUseCompoundFile(true); } } finally { + checkpoint(); deleter.decRef(files); } } @@ -3181,6 +3182,7 @@ public class IndexWriter implements Closeable { setRollbackSegmentInfos(pendingCommit); deleter.checkpoint(pendingCommit, true); } finally { + // Matches the incRef done in startCommit: deleter.decRef(pendingCommit); pendingCommit = null; notifyAll(); @@ -4267,6 +4269,21 @@ public class IndexWriter implements Closeable { } } + // called only from assert + private boolean filesExist(SegmentInfos toSync) throws IOException { + Collection files = toSync.files(directory, false); + for(final String fileName: files) { + assert directory.fileExists(fileName): "file " + fileName + " does not exist"; + // If this trips it means we are missing a call to + // .checkpoint somewhere, because by the time we + // are called, deleter should know about every + // file referenced by the current head + // segmentInfos: + assert deleter.exists(fileName) : "IndexFileDeleter doesn't know about file " + fileName; + } + return true; + } + /** Walk through all files referenced by the current * segmentInfos and ask the Directory to sync each file, * if it wasn't already. If that succeeds, then we @@ -4275,9 +4292,7 @@ public class IndexWriter implements Closeable { private void startCommit(long sizeInBytes, Map commitUserData) throws IOException { assert testPoint("startStartCommit"); - - // TODO: as of LUCENE-2095, we can simplify this method, - // since only 1 thread can be in here at once + assert pendingCommit == null; if (hitOOM) { throw new IllegalStateException("this writer hit an OutOfMemoryError; cannot commit"); @@ -4288,7 +4303,7 @@ public class IndexWriter implements Closeable { if (infoStream != null) message("startCommit(): start sizeInBytes=" + sizeInBytes); - SegmentInfos toSync = null; + final SegmentInfos toSync; final long myChangeCount; synchronized(this) { @@ -4303,94 +4318,50 @@ public class IndexWriter implements Closeable { // First, we clone & incref the segmentInfos we intend // to sync, then, without locking, we sync() each file - // referenced by toSync, in the background. Multiple - // threads can be doing this at once, if say a large - // merge and a small merge finish at the same time: + // referenced by toSync, in the background. if (infoStream != null) message("startCommit index=" + segString(segmentInfos) + " changeCount=" + changeCount); - + readerPool.commit(); toSync = (SegmentInfos) segmentInfos.clone(); + assert filesExist(toSync); if (commitUserData != null) toSync.setUserData(commitUserData); + // This protects the segmentInfos we are now going + // to commit. This is important in case, eg, while + // we are trying to sync all referenced files, a + // merge completes which would otherwise have + // removed the files we are now syncing. deleter.incRef(toSync, false); myChangeCount = changeCount; - - Collection files = toSync.files(directory, false); - for(final String fileName: files) { - assert directory.fileExists(fileName): "file " + fileName + " does not exist"; - - // If this trips it means we are missing a call to - // .checkpoint somewhere, because by the time we - // are called, deleter should know about every - // file referenced by the current head - // segmentInfos: - assert deleter.exists(fileName); - } } assert testPoint("midStartCommit"); - boolean setPending = false; - try { + // This call can take a long time -- 10s of seconds + // or more. We do it without sync: directory.sync(toSync.files(directory, false)); assert testPoint("midStartCommit2"); synchronized(this) { - // If someone saved a newer version of segments file - // since I first started syncing my version, I can - // safely skip saving myself since I've been - // superseded: - while(true) { - if (myChangeCount <= lastCommitChangeCount) { - if (infoStream != null) { - message("sync superseded by newer infos"); - } - break; - } else if (pendingCommit == null) { - // My turn to commit + assert pendingCommit == null; - if (segmentInfos.getGeneration() > toSync.getGeneration()) - toSync.updateGeneration(segmentInfos); + assert segmentInfos.getGeneration() == toSync.getGeneration(); - boolean success = false; - try { + // Exception here means nothing is prepared + // (this method unwinds everything it did on + // an exception) + toSync.prepareCommit(directory); - // Exception here means nothing is prepared - // (this method unwinds everything it did on - // an exception) - try { - toSync.prepareCommit(directory); - } finally { - // Have our master segmentInfos record the - // generations we just prepared. We do this - // on error or success so we don't - // double-write a segments_N file. - segmentInfos.updateGeneration(toSync); - } - - assert pendingCommit == null; - setPending = true; - pendingCommit = toSync; - pendingCommitChangeCount = myChangeCount; - success = true; - } finally { - if (!success && infoStream != null) - message("hit exception committing segments file"); - } - break; - } else { - // Must wait for other commit to complete - doWait(); - } - } + pendingCommit = toSync; + pendingCommitChangeCount = myChangeCount; } if (infoStream != null) @@ -4400,8 +4371,20 @@ public class IndexWriter implements Closeable { } finally { synchronized(this) { - if (!setPending) + + // Have our master segmentInfos record the + // generations we just prepared. We do this + // on error or success so we don't + // double-write a segments_N file. + segmentInfos.updateGeneration(toSync); + + if (pendingCommit == null) { + if (infoStream != null) { + message("hit exception committing segments file"); + } + deleter.decRef(toSync); + } } } } catch (OutOfMemoryError oom) {