LUCENE-8296: PendingDeletes may no longer write to live docs after they are shared.

This commit is contained in:
Adrien Grand 2018-05-09 15:12:23 +02:00
parent 8dc69428e3
commit 7873cf845e
5 changed files with 29 additions and 53 deletions

View File

@ -33,15 +33,11 @@ import org.apache.lucene.util.IOUtils;
*/ */
class PendingDeletes { class PendingDeletes {
protected final SegmentCommitInfo info; protected final SegmentCommitInfo info;
// True if the current liveDocs is referenced by an // Read-only live docs, null until live docs are initialized or if all docs are alive
// external NRT reader:
protected boolean liveDocsShared;
// Holds the current shared (readable and writable)
// liveDocs. This is null when there are no deleted
// docs, and it's copy-on-write (cloned whenever we need
// to change it but it's been shared to an external NRT
// reader).
private Bits liveDocs; private Bits liveDocs;
// Writeable live docs, null if this instance is not ready to accept writes, in which
// case getMutableBits needs to be called
private FixedBitSet writeableLiveDocs;
protected int pendingDeleteCount; protected int pendingDeleteCount;
private boolean liveDocsInitialized; private boolean liveDocsInitialized;
@ -59,7 +55,6 @@ class PendingDeletes {
private PendingDeletes(SegmentCommitInfo info, Bits liveDocs, boolean liveDocsInitialized) { private PendingDeletes(SegmentCommitInfo info, Bits liveDocs, boolean liveDocsInitialized) {
this.info = info; this.info = info;
liveDocsShared = true;
this.liveDocs = liveDocs; this.liveDocs = liveDocs;
pendingDeleteCount = 0; pendingDeleteCount = 0;
this.liveDocsInitialized = liveDocsInitialized; this.liveDocsInitialized = liveDocsInitialized;
@ -70,24 +65,23 @@ class PendingDeletes {
// if we pull mutable bits but we haven't been initialized something is completely off. // if we pull mutable bits but we haven't been initialized something is completely off.
// this means we receive deletes without having the bitset that is on-disk ready to be cloned // this means we receive deletes without having the bitset that is on-disk ready to be cloned
assert liveDocsInitialized : "can't delete if liveDocs are not initialized"; assert liveDocsInitialized : "can't delete if liveDocs are not initialized";
if (liveDocsShared) { if (writeableLiveDocs == null) {
// Copy on write: this means we've cloned a // Copy on write: this means we've cloned a
// SegmentReader sharing the current liveDocs // SegmentReader sharing the current liveDocs
// instance; must now make a private clone so we can // instance; must now make a private clone so we can
// change it: // change it:
FixedBitSet mutableBits = new FixedBitSet(info.info.maxDoc()); writeableLiveDocs = new FixedBitSet(info.info.maxDoc());
mutableBits.set(0, info.info.maxDoc()); writeableLiveDocs.set(0, info.info.maxDoc());
if (liveDocs != null) { if (liveDocs != null) {
for (int i = 0; i < liveDocs.length(); ++i) { for (int i = 0; i < liveDocs.length(); ++i) {
if (liveDocs.get(i) == false) { if (liveDocs.get(i) == false) {
mutableBits.clear(i); writeableLiveDocs.clear(i);
} }
} }
} }
liveDocs = mutableBits; liveDocs = writeableLiveDocs;
liveDocsShared = false;
} }
return (FixedBitSet) liveDocs; return writeableLiveDocs;
} }
@ -100,7 +94,6 @@ class PendingDeletes {
FixedBitSet mutableBits = getMutableBits(); FixedBitSet mutableBits = getMutableBits();
assert mutableBits != null; assert mutableBits != null;
assert docID >= 0 && docID < mutableBits.length() : "out of bounds: docid=" + docID + " liveDocsLength=" + mutableBits.length() + " seg=" + info.info.name + " maxDoc=" + info.info.maxDoc(); assert docID >= 0 && docID < mutableBits.length() : "out of bounds: docid=" + docID + " liveDocsLength=" + mutableBits.length() + " seg=" + info.info.name + " maxDoc=" + info.info.maxDoc();
assert !liveDocsShared;
final boolean didDelete = mutableBits.get(docID); final boolean didDelete = mutableBits.get(docID);
if (didDelete) { if (didDelete) {
mutableBits.clear(docID); mutableBits.clear(docID);
@ -110,20 +103,19 @@ class PendingDeletes {
} }
/** /**
* Should be called if the live docs returned from {@link #getLiveDocs()} are shared outside of the * Returns a snapshot of the current live docs.
* {@link ReadersAndUpdates}
*/ */
void liveDocsShared() { Bits getLiveDocs() {
liveDocsShared = true; // Prevent modifications to the returned live docs
writeableLiveDocs = null;
return liveDocs;
} }
/** /**
* Returns the current live docs or null if all docs are live. The returned instance might be mutable or is mutated behind the scenes. * Returns a snapshot of the hard live docs.
* If the returned live docs are shared outside of the ReadersAndUpdates {@link #liveDocsShared()} should be called
* first.
*/ */
Bits getLiveDocs() { Bits getHardLiveDocs() {
return liveDocs; return getLiveDocs();
} }
/** /**
@ -138,6 +130,7 @@ class PendingDeletes {
*/ */
void onNewReader(CodecReader reader, SegmentCommitInfo info) throws IOException { void onNewReader(CodecReader reader, SegmentCommitInfo info) throws IOException {
if (liveDocsInitialized == false) { if (liveDocsInitialized == false) {
assert writeableLiveDocs == null;
if (reader.hasDeletions()) { if (reader.hasDeletions()) {
// we only initialize this once either in the ctor or here // we only initialize this once either in the ctor or here
// if we use the live docs from a reader it has to be in a situation where we don't // if we use the live docs from a reader it has to be in a situation where we don't
@ -145,7 +138,6 @@ class PendingDeletes {
assert pendingDeleteCount == 0 : "pendingDeleteCount: " + pendingDeleteCount; assert pendingDeleteCount == 0 : "pendingDeleteCount: " + pendingDeleteCount;
liveDocs = reader.getLiveDocs(); liveDocs = reader.getLiveDocs();
assert liveDocs == null || assertCheckLiveDocs(liveDocs, info.info.maxDoc(), info.getDelCount()); assert liveDocs == null || assertCheckLiveDocs(liveDocs, info.info.maxDoc(), info.getDelCount());
liveDocsShared = true;
} }
liveDocsInitialized = true; liveDocsInitialized = true;
} }
@ -175,7 +167,7 @@ class PendingDeletes {
StringBuilder sb = new StringBuilder(); StringBuilder sb = new StringBuilder();
sb.append("PendingDeletes(seg=").append(info); sb.append("PendingDeletes(seg=").append(info);
sb.append(" numPendingDeletes=").append(pendingDeleteCount); sb.append(" numPendingDeletes=").append(pendingDeleteCount);
sb.append(" liveDocsShared=").append(liveDocsShared); sb.append(" writeable=").append(writeableLiveDocs != null);
return sb.toString(); return sb.toString();
} }
@ -246,7 +238,4 @@ class PendingDeletes {
return policy.numDeletesToMerge(info, numPendingDeletes(), readerIOSupplier); return policy.numDeletesToMerge(info, numPendingDeletes(), readerIOSupplier);
} }
Bits getHardLiveDocs() {
return liveDocs;
}
} }

View File

@ -195,13 +195,9 @@ final class PendingSoftDeletes extends PendingDeletes {
} }
} }
@Override
Bits getHardLiveDocs() { Bits getHardLiveDocs() {
return hardDeletes.getHardLiveDocs(); return hardDeletes.getLiveDocs();
} }
@Override
void liveDocsShared() {
super.liveDocsShared();
hardDeletes.liveDocsShared();
}
} }

View File

@ -234,7 +234,6 @@ final class ReadersAndUpdates {
} }
// force new liveDocs // force new liveDocs
Bits liveDocs = pendingDeletes.getLiveDocs(); Bits liveDocs = pendingDeletes.getLiveDocs();
markAsShared();
if (liveDocs != null) { if (liveDocs != null) {
return new SegmentReader(reader.getSegmentInfo(), reader, liveDocs, return new SegmentReader(reader.getSegmentInfo(), reader, liveDocs,
info.info.maxDoc() - info.getDelCount() - pendingDeletes.numPendingDeletes()); info.info.maxDoc() - info.getDelCount() - pendingDeletes.numPendingDeletes());
@ -263,6 +262,9 @@ final class ReadersAndUpdates {
return reader; return reader;
} }
/**
* Returns a snapshot of the live docs.
*/
public synchronized Bits getLiveDocs() { public synchronized Bits getLiveDocs() {
return pendingDeletes.getLiveDocs(); return pendingDeletes.getLiveDocs();
} }
@ -720,8 +722,6 @@ final class ReadersAndUpdates {
assert pendingDeletes.getLiveDocs() != null; assert pendingDeletes.getLiveDocs() != null;
reader = createNewReaderWithLatestLiveDocs(reader); reader = createNewReaderWithLatestLiveDocs(reader);
} }
markAsShared();
assert verifyDocCounts(); assert verifyDocCounts();
return new MergeReader(reader, pendingDeletes.getHardLiveDocs()); return new MergeReader(reader, pendingDeletes.getHardLiveDocs());
@ -754,11 +754,6 @@ final class ReadersAndUpdates {
return pendingDeletes.isFullyDeleted(this::getLatestReader); return pendingDeletes.isFullyDeleted(this::getLatestReader);
} }
private final void markAsShared() {
assert Thread.holdsLock(this);
pendingDeletes.liveDocsShared(); // this is not costly we can just call it even if it's already marked as shared
}
boolean keepFullyDeletedSegment(MergePolicy mergePolicy) throws IOException { boolean keepFullyDeletedSegment(MergePolicy mergePolicy) throws IOException {
return mergePolicy.keepFullyDeletedSegment(this::getLatestReader); return mergePolicy.keepFullyDeletedSegment(this::getLatestReader);
} }

View File

@ -52,18 +52,16 @@ public class TestPendingDeletes extends LuceneTestCase {
assertFalse(liveDocs.get(docToDelete)); assertFalse(liveDocs.get(docToDelete));
assertFalse(deletes.delete(docToDelete)); // delete again assertFalse(deletes.delete(docToDelete)); // delete again
// make sure we are live ie. mutable
assertTrue(liveDocs.get(8)); assertTrue(liveDocs.get(8));
assertTrue(deletes.delete(8)); assertTrue(deletes.delete(8));
assertFalse(liveDocs.get(8)); assertTrue(liveDocs.get(8)); // we have a snapshot
assertEquals(2, deletes.numPendingDeletes()); assertEquals(2, deletes.numPendingDeletes());
deletes.liveDocsShared();
// make sure we are live ie. mutable
assertTrue(liveDocs.get(9)); assertTrue(liveDocs.get(9));
assertTrue(deletes.delete(9)); assertTrue(deletes.delete(9));
assertTrue(liveDocs.get(9)); assertTrue(liveDocs.get(9));
// now make sure new live docs see the deletions
liveDocs = deletes.getLiveDocs(); liveDocs = deletes.getLiveDocs();
assertFalse(liveDocs.get(9)); assertFalse(liveDocs.get(9));
assertFalse(liveDocs.get(8)); assertFalse(liveDocs.get(8));
@ -83,7 +81,7 @@ public class TestPendingDeletes extends LuceneTestCase {
boolean secondDocDeletes = random().nextBoolean(); boolean secondDocDeletes = random().nextBoolean();
deletes.delete(5); deletes.delete(5);
if (secondDocDeletes) { if (secondDocDeletes) {
deletes.liveDocsShared(); deletes.getLiveDocs();
deletes.delete(2); deletes.delete(2);
} }
assertEquals(-1, commitInfo.getDelGen()); assertEquals(-1, commitInfo.getDelGen());

View File

@ -73,7 +73,6 @@ public class TestPendingSoftDeletes extends TestPendingDeletes {
assertNull(pendingSoftDeletes.getHardLiveDocs()); assertNull(pendingSoftDeletes.getHardLiveDocs());
// pass reader again // pass reader again
Bits liveDocs = pendingSoftDeletes.getLiveDocs(); Bits liveDocs = pendingSoftDeletes.getLiveDocs();
pendingSoftDeletes.liveDocsShared();
pendingSoftDeletes.onNewReader(segmentReader, segmentInfo); pendingSoftDeletes.onNewReader(segmentReader, segmentInfo);
assertEquals(1, pendingSoftDeletes.numPendingDeletes()); assertEquals(1, pendingSoftDeletes.numPendingDeletes());
assertSame(liveDocs, pendingSoftDeletes.getLiveDocs()); assertSame(liveDocs, pendingSoftDeletes.getLiveDocs());
@ -189,7 +188,6 @@ public class TestPendingSoftDeletes extends TestPendingDeletes {
assertTrue(deletes.getLiveDocs().get(0)); assertTrue(deletes.getLiveDocs().get(0));
assertFalse(deletes.getLiveDocs().get(1)); assertFalse(deletes.getLiveDocs().get(1));
assertTrue(deletes.getLiveDocs().get(2)); assertTrue(deletes.getLiveDocs().get(2));
deletes.liveDocsShared();
Bits liveDocs = deletes.getLiveDocs(); Bits liveDocs = deletes.getLiveDocs();
deletes.onNewReader(segmentReader, segmentInfo); deletes.onNewReader(segmentReader, segmentInfo);
// no changes we don't apply updates twice // no changes we don't apply updates twice