LUCENE-2811: SegmentInfo now tracks whether a segment wrote term vectors

git-svn-id: https://svn.apache.org/repos/asf/lucene/dev/trunk@1045322 13f79535-47bb-0310-9956-ffa450edef68
This commit is contained in:
Michael McCandless 2010-12-13 19:20:32 +00:00
parent fbab97a0f1
commit 1ca059706e
17 changed files with 187 additions and 66 deletions

View File

@ -450,7 +450,7 @@ final class DocumentsWriter {
assert docStoreSegment != null; assert docStoreSegment != null;
if (infoStream != null) { if (infoStream != null) {
message("closeDocStore: files=" + openFiles + "; segment=" + docStoreSegment + "; docStoreOffset=" + docStoreOffset + "; numDocsInStore=" + numDocsInStore + "; isSeparate=" + isSeparate); message("closeDocStore: openFiles=" + openFiles + "; segment=" + docStoreSegment + "; docStoreOffset=" + docStoreOffset + "; numDocsInStore=" + numDocsInStore + "; isSeparate=" + isSeparate);
} }
closedFiles.clear(); closedFiles.clear();
@ -720,17 +720,21 @@ final class DocumentsWriter {
docStoreSegment, numDocsInRAM, numDocsInStore, writer.getConfig().getTermIndexInterval(), docStoreSegment, numDocsInRAM, numDocsInStore, writer.getConfig().getTermIndexInterval(),
SegmentCodecs.build(fieldInfos, writer.codecs)); SegmentCodecs.build(fieldInfos, writer.codecs));
newSegment = new SegmentInfo(segment, numDocsInRAM, directory, false, -1, null, false, hasProx(), flushState.segmentCodecs); newSegment = new SegmentInfo(segment, numDocsInRAM, directory, false, -1, null, false, hasProx(), flushState.segmentCodecs, false);
if (!closeDocStore || docStoreOffset != 0) { if (!closeDocStore || docStoreOffset != 0) {
newSegment.setDocStoreSegment(docStoreSegment); newSegment.setDocStoreSegment(docStoreSegment);
newSegment.setDocStoreOffset(docStoreOffset); newSegment.setDocStoreOffset(docStoreOffset);
} }
boolean hasVectors = false;
if (closeDocStore) { if (closeDocStore) {
closeDocStore(flushState, writer, deleter, newSegment, mergePolicy, segmentInfos); closeDocStore(flushState, writer, deleter, newSegment, mergePolicy, segmentInfos);
} }
hasVectors |= flushState.hasVectors;
if (numDocsInRAM > 0) { if (numDocsInRAM > 0) {
assert nextDocID == numDocsInRAM; assert nextDocID == numDocsInRAM;
@ -749,6 +753,19 @@ final class DocumentsWriter {
final long startNumBytesUsed = bytesUsed(); final long startNumBytesUsed = bytesUsed();
consumer.flush(threads, flushState); consumer.flush(threads, flushState);
hasVectors |= flushState.hasVectors;
if (hasVectors) {
if (infoStream != null) {
message("new segment has vectors");
}
newSegment.setHasVectors(true);
} else {
if (infoStream != null) {
message("new segment has no vectors");
}
}
if (infoStream != null) { if (infoStream != null) {
message("flushedFiles=" + flushState.flushedFiles); message("flushedFiles=" + flushState.flushedFiles);
message("flushed codecs=" + newSegment.getSegmentCodecs()); message("flushed codecs=" + newSegment.getSegmentCodecs());

View File

@ -1047,8 +1047,10 @@ public class IndexWriter implements Closeable {
mergePolicy.close(); mergePolicy.close();
synchronized(this) {
finishMerges(waitForMerges); finishMerges(waitForMerges);
stopMerges = true; stopMerges = true;
}
mergeScheduler.close(); mergeScheduler.close();
@ -1251,14 +1253,16 @@ public class IndexWriter implements Closeable {
synchronized (this) { synchronized (this) {
// If docWriter has some aborted files that were // If docWriter has some aborted files that were
// never incref'd, then we clean them up here // never incref'd, then we clean them up here
deleter.checkpoint(segmentInfos, false);
if (docWriter != null) { if (docWriter != null) {
final Collection<String> files = docWriter.abortedFiles(); final Collection<String> files = docWriter.abortedFiles();
if (files != null) if (files != null) {
deleter.deleteNewFiles(files); deleter.deleteNewFiles(files);
} }
} }
} }
} }
}
if (doFlush) if (doFlush)
flush(true, false, false); flush(true, false, false);
} catch (OutOfMemoryError oom) { } catch (OutOfMemoryError oom) {
@ -1879,7 +1883,14 @@ public class IndexWriter implements Closeable {
} }
try { try {
synchronized(this) {
finishMerges(false); finishMerges(false);
stopMerges = true;
}
if (infoStream != null ) {
message("rollback: done finish merges");
}
// Must pre-close these two, in case they increment // Must pre-close these two, in case they increment
// changeCount so that we can then set it to false // changeCount so that we can then set it to false
@ -2230,7 +2241,8 @@ public class IndexWriter implements Closeable {
int docCount = merger.merge(); // merge 'em int docCount = merger.merge(); // merge 'em
SegmentInfo info = new SegmentInfo(mergedName, docCount, directory, SegmentInfo info = new SegmentInfo(mergedName, docCount, directory,
false, -1, null, false, merger.hasProx(), merger.getSegmentCodecs()); false, -1, null, false, merger.hasProx(), merger.getSegmentCodecs(),
merger.hasVectors());
setDiagnostics(info, "addIndexes(IndexReader...)"); setDiagnostics(info, "addIndexes(IndexReader...)");
boolean useCompoundFile; boolean useCompoundFile;
@ -2541,9 +2553,17 @@ public class IndexWriter implements Closeable {
return false; return false;
} finally { } finally {
flushControl.clearFlushPending(); flushControl.clearFlushPending();
if (!success && infoStream != null) { if (!success) {
if (infoStream != null) {
message("hit exception during flush"); message("hit exception during flush");
} }
if (docWriter != null) {
final Collection<String> files = docWriter.abortedFiles();
if (files != null) {
deleter.deleteNewFiles(files);
}
}
}
} }
} }
@ -2928,6 +2948,7 @@ public class IndexWriter implements Closeable {
boolean mergeDocStores = false; boolean mergeDocStores = false;
boolean doFlushDocStore = false; boolean doFlushDocStore = false;
boolean hasVectors = false;
final String currentDocStoreSegment = docWriter.getDocStoreSegment(); final String currentDocStoreSegment = docWriter.getDocStoreSegment();
// Test each segment to be merged: check if we need to // Test each segment to be merged: check if we need to
@ -2939,6 +2960,10 @@ public class IndexWriter implements Closeable {
if (si.hasDeletions()) if (si.hasDeletions())
mergeDocStores = true; mergeDocStores = true;
if (si.getHasVectors()) {
hasVectors = true;
}
// If it has its own (private) doc stores we must // If it has its own (private) doc stores we must
// merge the doc stores // merge the doc stores
if (-1 == si.getDocStoreOffset()) if (-1 == si.getDocStoreOffset())
@ -3014,6 +3039,7 @@ public class IndexWriter implements Closeable {
updatePendingMerges(1, false); updatePendingMerges(1, false);
} }
merge.hasVectors = hasVectors;
merge.mergeDocStores = mergeDocStores; merge.mergeDocStores = mergeDocStores;
// Bind a new segment name here so even with // Bind a new segment name here so even with
@ -3024,8 +3050,8 @@ public class IndexWriter implements Closeable {
docStoreSegment, docStoreSegment,
docStoreIsCompoundFile, docStoreIsCompoundFile,
false, false,
null); null,
false);
Map<String,String> details = new HashMap<String,String>(); Map<String,String> details = new HashMap<String,String>();
details.put("optimize", Boolean.toString(merge.optimize)); details.put("optimize", Boolean.toString(merge.optimize));
@ -3033,6 +3059,10 @@ public class IndexWriter implements Closeable {
details.put("mergeDocStores", Boolean.toString(mergeDocStores)); details.put("mergeDocStores", Boolean.toString(mergeDocStores));
setDiagnostics(merge.info, "merge", details); setDiagnostics(merge.info, "merge", details);
if (infoStream != null) {
message("merge seg=" + merge.info.name + " mergeDocStores=" + mergeDocStores);
}
// Also enroll the merged segment into mergingSegments; // Also enroll the merged segment into mergingSegments;
// this prevents it from getting selected for a merge // this prevents it from getting selected for a merge
// after our merge is done but while we are building the // after our merge is done but while we are building the
@ -3252,6 +3282,7 @@ public class IndexWriter implements Closeable {
// Record which codec was used to write the segment // Record which codec was used to write the segment
merge.info.setSegmentCodecs(merger.getSegmentCodecs()); merge.info.setSegmentCodecs(merger.getSegmentCodecs());
merge.info.setHasVectors(merger.hasVectors() || merge.hasVectors);
if (infoStream != null) { if (infoStream != null) {
message("merge segmentCodecs=" + merger.getSegmentCodecs()); message("merge segmentCodecs=" + merger.getSegmentCodecs());
@ -3446,7 +3477,7 @@ public class IndexWriter implements Closeable {
// are called, deleter should know about every // are called, deleter should know about every
// file referenced by the current head // file referenced by the current head
// segmentInfos: // segmentInfos:
assert deleter.exists(fileName) : "IndexFileDeleter doesn't know about file " + fileName; assert deleter.exists(fileName): "IndexFileDeleter doesn't know about file " + fileName;
} }
return true; return true;
} }

View File

@ -68,6 +68,7 @@ public abstract class MergePolicy implements java.io.Closeable {
SegmentInfo info; // used by IndexWriter SegmentInfo info; // used by IndexWriter
boolean mergeDocStores; // used by IndexWriter boolean mergeDocStores; // used by IndexWriter
boolean hasVectors; // used by IndexWriter
boolean optimize; // used by IndexWriter boolean optimize; // used by IndexWriter
boolean registerDone; // used by IndexWriter boolean registerDone; // used by IndexWriter
long mergeGen; // used by IndexWriter long mergeGen; // used by IndexWriter
@ -156,6 +157,9 @@ public abstract class MergePolicy implements java.io.Closeable {
if (mergeDocStores) { if (mergeDocStores) {
b.append(" [mergeDocStores]"); b.append(" [mergeDocStores]");
} }
if (aborted) {
b.append(" [ABORTED]");
}
return b.toString(); return b.toString();
} }

View File

@ -80,12 +80,15 @@ public final class SegmentInfo {
private boolean hasProx; // True if this segment has any fields with omitTermFreqAndPositions==false private boolean hasProx; // True if this segment has any fields with omitTermFreqAndPositions==false
private byte hasVectors; // 0 if no; 1 if yes; 2 if must-check-filesystem (old index)
private SegmentCodecs segmentCodecs; private SegmentCodecs segmentCodecs;
private Map<String,String> diagnostics; private Map<String,String> diagnostics;
public SegmentInfo(String name, int docCount, Directory dir, boolean isCompoundFile, int docStoreOffset, public SegmentInfo(String name, int docCount, Directory dir, boolean isCompoundFile, int docStoreOffset,
String docStoreSegment, boolean docStoreIsCompoundFile, boolean hasProx, SegmentCodecs segmentCodecs) { String docStoreSegment, boolean docStoreIsCompoundFile, boolean hasProx, SegmentCodecs segmentCodecs,
boolean hasVectors) {
this.name = name; this.name = name;
this.docCount = docCount; this.docCount = docCount;
this.dir = dir; this.dir = dir;
@ -96,6 +99,7 @@ public final class SegmentInfo {
this.docStoreIsCompoundFile = docStoreIsCompoundFile; this.docStoreIsCompoundFile = docStoreIsCompoundFile;
this.hasProx = hasProx; this.hasProx = hasProx;
this.segmentCodecs = segmentCodecs; this.segmentCodecs = segmentCodecs;
this.hasVectors = (byte) (hasVectors ? 1 : 0);
delCount = 0; delCount = 0;
assert docStoreOffset == -1 || docStoreSegment != null: "dso=" + docStoreOffset + " dss=" + docStoreSegment + " docCount=" + docCount; assert docStoreOffset == -1 || docStoreSegment != null: "dso=" + docStoreOffset + " dss=" + docStoreSegment + " docCount=" + docCount;
} }
@ -111,6 +115,7 @@ public final class SegmentInfo {
delGen = src.delGen; delGen = src.delGen;
docStoreOffset = src.docStoreOffset; docStoreOffset = src.docStoreOffset;
docStoreIsCompoundFile = src.docStoreIsCompoundFile; docStoreIsCompoundFile = src.docStoreIsCompoundFile;
hasVectors = src.hasVectors;
if (src.normGen == null) { if (src.normGen == null) {
normGen = null; normGen = null;
} else { } else {
@ -184,6 +189,12 @@ public final class SegmentInfo {
segmentCodecs.codecs = new Codec[] { codecs.lookup("PreFlex")}; segmentCodecs.codecs = new Codec[] { codecs.lookup("PreFlex")};
} }
diagnostics = input.readStringStringMap(); diagnostics = input.readStringStringMap();
if (format <= DefaultSegmentInfosWriter.FORMAT_HAS_VECTORS) {
hasVectors = input.readByte();
} else {
hasVectors = 2;
}
} }
/** Returns total size in bytes of all of files used by /** Returns total size in bytes of all of files used by
@ -204,6 +215,27 @@ public final class SegmentInfo {
return sizeInBytes; return sizeInBytes;
} }
public boolean getHasVectors() throws IOException {
if (hasVectors == 1) {
return true;
} else if (hasVectors == 0) {
return false;
} else {
final String storesSegment;
if (getDocStoreOffset() != -1) {
storesSegment = getDocStoreSegment();
} else {
storesSegment = name;
}
return dir.fileExists(IndexFileNames.segmentFileName(storesSegment, "", IndexFileNames.VECTORS_INDEX_EXTENSION));
}
}
public void setHasVectors(boolean v) {
hasVectors = (byte) (v ? 1 : 0);
clearFiles();
}
public boolean hasDeletions() { public boolean hasDeletions() {
// Cases: // Cases:
// //
@ -229,18 +261,14 @@ public final class SegmentInfo {
@Override @Override
public Object clone() { public Object clone() {
SegmentInfo si = new SegmentInfo(name, docCount, dir, isCompoundFile, docStoreOffset, docStoreSegment, docStoreIsCompoundFile, hasProx, segmentCodecs); SegmentInfo si = new SegmentInfo(name, docCount, dir, isCompoundFile, docStoreOffset, docStoreSegment, docStoreIsCompoundFile, hasProx, segmentCodecs, false);
si.isCompoundFile = isCompoundFile;
si.delGen = delGen; si.delGen = delGen;
si.delCount = delCount; si.delCount = delCount;
si.hasProx = hasProx;
si.diagnostics = new HashMap<String, String>(diagnostics); si.diagnostics = new HashMap<String, String>(diagnostics);
if (normGen != null) { if (normGen != null) {
si.normGen = normGen.clone(); si.normGen = normGen.clone();
} }
si.docStoreOffset = docStoreOffset; si.hasVectors = hasVectors;
si.docStoreSegment = docStoreSegment;
si.docStoreIsCompoundFile = docStoreIsCompoundFile;
return si; return si;
} }
@ -404,6 +432,7 @@ public final class SegmentInfo {
output.writeByte((byte) (hasProx ? 1:0)); output.writeByte((byte) (hasProx ? 1:0));
segmentCodecs.write(output); segmentCodecs.write(output);
output.writeStringStringMap(diagnostics); output.writeStringStringMap(diagnostics);
output.writeByte(hasVectors);
} }
void setHasProx(boolean hasProx) { void setHasProx(boolean hasProx) {
@ -466,12 +495,30 @@ public final class SegmentInfo {
if (docStoreIsCompoundFile) { if (docStoreIsCompoundFile) {
fileSet.add(IndexFileNames.segmentFileName(docStoreSegment, "", IndexFileNames.COMPOUND_FILE_STORE_EXTENSION)); fileSet.add(IndexFileNames.segmentFileName(docStoreSegment, "", IndexFileNames.COMPOUND_FILE_STORE_EXTENSION));
} else { } else {
for (String ext : IndexFileNames.STORE_INDEX_EXTENSIONS) fileSet.add(IndexFileNames.segmentFileName(docStoreSegment, "", IndexFileNames.FIELDS_INDEX_EXTENSION));
addIfExists(fileSet, IndexFileNames.segmentFileName(docStoreSegment, "", ext)); fileSet.add(IndexFileNames.segmentFileName(docStoreSegment, "", IndexFileNames.FIELDS_EXTENSION));
if (hasVectors == 1) {
fileSet.add(IndexFileNames.segmentFileName(docStoreSegment, "", IndexFileNames.VECTORS_INDEX_EXTENSION));
fileSet.add(IndexFileNames.segmentFileName(docStoreSegment, "", IndexFileNames.VECTORS_DOCUMENTS_EXTENSION));
fileSet.add(IndexFileNames.segmentFileName(docStoreSegment, "", IndexFileNames.VECTORS_FIELDS_EXTENSION));
} else if (hasVectors == 2) {
addIfExists(fileSet, IndexFileNames.segmentFileName(docStoreSegment, "", IndexFileNames.VECTORS_INDEX_EXTENSION));
addIfExists(fileSet, IndexFileNames.segmentFileName(docStoreSegment, "", IndexFileNames.VECTORS_DOCUMENTS_EXTENSION));
addIfExists(fileSet, IndexFileNames.segmentFileName(docStoreSegment, "", IndexFileNames.VECTORS_FIELDS_EXTENSION));
}
} }
} else if (!useCompoundFile) { } else if (!useCompoundFile) {
for (String ext : IndexFileNames.STORE_INDEX_EXTENSIONS) fileSet.add(IndexFileNames.segmentFileName(name, "", IndexFileNames.FIELDS_INDEX_EXTENSION));
addIfExists(fileSet, IndexFileNames.segmentFileName(name, "", ext)); fileSet.add(IndexFileNames.segmentFileName(name, "", IndexFileNames.FIELDS_EXTENSION));
if (hasVectors == 1) {
fileSet.add(IndexFileNames.segmentFileName(name, "", IndexFileNames.VECTORS_INDEX_EXTENSION));
fileSet.add(IndexFileNames.segmentFileName(name, "", IndexFileNames.VECTORS_DOCUMENTS_EXTENSION));
fileSet.add(IndexFileNames.segmentFileName(name, "", IndexFileNames.VECTORS_FIELDS_EXTENSION));
} else if (hasVectors == 2) {
addIfExists(fileSet, IndexFileNames.segmentFileName(name, "", IndexFileNames.VECTORS_INDEX_EXTENSION));
addIfExists(fileSet, IndexFileNames.segmentFileName(name, "", IndexFileNames.VECTORS_DOCUMENTS_EXTENSION));
addIfExists(fileSet, IndexFileNames.segmentFileName(name, "", IndexFileNames.VECTORS_FIELDS_EXTENSION));
}
} }
String delFileName = IndexFileNames.fileNameFromGeneration(name, IndexFileNames.DELETES_EXTENSION, delGen); String delFileName = IndexFileNames.fileNameFromGeneration(name, IndexFileNames.DELETES_EXTENSION, delGen);

View File

@ -75,6 +75,7 @@ final class SegmentMerger {
private final CodecProvider codecs; private final CodecProvider codecs;
private Codec codec; private Codec codec;
private SegmentWriteState segmentWriteState; private SegmentWriteState segmentWriteState;
private boolean hasVectors;
private PayloadProcessorProvider payloadProcessorProvider; private PayloadProcessorProvider payloadProcessorProvider;
@ -100,6 +101,10 @@ final class SegmentMerger {
return fieldInfos.hasProx(); return fieldInfos.hasProx();
} }
boolean hasVectors() {
return hasVectors;
}
/** /**
* Add an IndexReader to the collection of readers that are to be merged * Add an IndexReader to the collection of readers that are to be merged
* @param reader * @param reader
@ -427,7 +432,7 @@ final class SegmentMerger {
private final void mergeVectors() throws IOException { private final void mergeVectors() throws IOException {
TermVectorsWriter termVectorsWriter = TermVectorsWriter termVectorsWriter =
new TermVectorsWriter(directory, segment, fieldInfos); new TermVectorsWriter(directory, segment, fieldInfos);
hasVectors = true;
try { try {
int idx = 0; int idx = 0;
for (final IndexReader reader : readers) { for (final IndexReader reader : readers) {

View File

@ -243,7 +243,7 @@ public class SegmentReader extends IndexReader implements Cloneable {
throw new CorruptIndexException("doc counts differ for segment " + segment + ": fieldsReader shows " + fieldsReaderOrig.size() + " but segmentInfo shows " + si.docCount); throw new CorruptIndexException("doc counts differ for segment " + segment + ": fieldsReader shows " + fieldsReaderOrig.size() + " but segmentInfo shows " + si.docCount);
} }
if (fieldInfos.hasVectors()) { // open term vector files only as needed if (si.getHasVectors()) { // open term vector files only as needed
termVectorsReaderOrig = new TermVectorsReader(storeDir, storesSegment, fieldInfos, readBufferSize, si.getDocStoreOffset(), si.docCount); termVectorsReaderOrig = new TermVectorsReader(storeDir, storesSegment, fieldInfos, readBufferSize, si.getDocStoreOffset(), si.docCount);
} }
} }

View File

@ -34,6 +34,7 @@ public class SegmentWriteState {
public final String docStoreSegmentName; public final String docStoreSegmentName;
public final int numDocs; public final int numDocs;
public int numDocsInStore; public int numDocsInStore;
public boolean hasVectors;
public final Collection<String> flushedFiles; public final Collection<String> flushedFiles;
final SegmentCodecs segmentCodecs; final SegmentCodecs segmentCodecs;

View File

@ -77,7 +77,6 @@ class TermVectorsReader implements Cloneable {
try { try {
String idxName = IndexFileNames.segmentFileName(segment, "", IndexFileNames.VECTORS_INDEX_EXTENSION); String idxName = IndexFileNames.segmentFileName(segment, "", IndexFileNames.VECTORS_INDEX_EXTENSION);
if (d.fileExists(idxName)) {
tvx = d.openInput(idxName, readBufferSize); tvx = d.openInput(idxName, readBufferSize);
format = checkValidFormat(tvx, idxName); format = checkValidFormat(tvx, idxName);
String fn = IndexFileNames.segmentFileName(segment, "", IndexFileNames.VECTORS_DOCUMENTS_EXTENSION); String fn = IndexFileNames.segmentFileName(segment, "", IndexFileNames.VECTORS_DOCUMENTS_EXTENSION);
@ -103,13 +102,6 @@ class TermVectorsReader implements Cloneable {
// docs // docs
assert numTotalDocs >= size + docStoreOffset: "numTotalDocs=" + numTotalDocs + " size=" + size + " docStoreOffset=" + docStoreOffset; assert numTotalDocs >= size + docStoreOffset: "numTotalDocs=" + numTotalDocs + " size=" + size + " docStoreOffset=" + docStoreOffset;
} }
} else {
// If all documents flushed in a segment had hit
// non-aborting exceptions, it's possible that
// FieldInfos.hasVectors returns true yet the term
// vector files don't exist.
format = 0;
}
this.fieldInfos = fieldInfos; this.fieldInfos = fieldInfos;
success = true; success = true;

View File

@ -37,6 +37,7 @@ final class TermVectorsTermsWriter extends TermsHashConsumer {
IndexOutput tvd; IndexOutput tvd;
IndexOutput tvf; IndexOutput tvf;
int lastDocID; int lastDocID;
boolean hasVectors;
public TermVectorsTermsWriter(DocumentsWriter docWriter) { public TermVectorsTermsWriter(DocumentsWriter docWriter) {
this.docWriter = docWriter; this.docWriter = docWriter;
@ -57,6 +58,7 @@ final class TermVectorsTermsWriter extends TermsHashConsumer {
// because, although FieldInfos.hasVectors() will return // because, although FieldInfos.hasVectors() will return
// true, the TermVectorsReader gracefully handles // true, the TermVectorsReader gracefully handles
// non-existence of the term vectors files. // non-existence of the term vectors files.
state.hasVectors = hasVectors;
if (tvx != null) { if (tvx != null) {
@ -108,6 +110,8 @@ final class TermVectorsTermsWriter extends TermsHashConsumer {
docWriter.removeOpenFile(docName); docWriter.removeOpenFile(docName);
lastDocID = 0; lastDocID = 0;
state.hasVectors = hasVectors;
hasVectors = false;
} }
} }
@ -159,6 +163,7 @@ final class TermVectorsTermsWriter extends TermsHashConsumer {
String idxName = IndexFileNames.segmentFileName(docStoreSegment, "", IndexFileNames.VECTORS_INDEX_EXTENSION); String idxName = IndexFileNames.segmentFileName(docStoreSegment, "", IndexFileNames.VECTORS_INDEX_EXTENSION);
String docName = IndexFileNames.segmentFileName(docStoreSegment, "", IndexFileNames.VECTORS_DOCUMENTS_EXTENSION); String docName = IndexFileNames.segmentFileName(docStoreSegment, "", IndexFileNames.VECTORS_DOCUMENTS_EXTENSION);
String fldName = IndexFileNames.segmentFileName(docStoreSegment, "", IndexFileNames.VECTORS_FIELDS_EXTENSION); String fldName = IndexFileNames.segmentFileName(docStoreSegment, "", IndexFileNames.VECTORS_FIELDS_EXTENSION);
hasVectors = true;
tvx = docWriter.directory.createOutput(idxName); tvx = docWriter.directory.createOutput(idxName);
tvd = docWriter.directory.createOutput(docName); tvd = docWriter.directory.createOutput(docName);
tvf = docWriter.directory.createOutput(fldName); tvf = docWriter.directory.createOutput(fldName);
@ -218,6 +223,7 @@ final class TermVectorsTermsWriter extends TermsHashConsumer {
@Override @Override
public void abort() { public void abort() {
hasVectors = false;
if (tvx != null) { if (tvx != null) {
try { try {
tvx.close(); tvx.close();

View File

@ -39,9 +39,12 @@ public class DefaultSegmentInfosWriter extends SegmentInfosWriter {
* in the new flex format */ * in the new flex format */
public static final int FORMAT_4_0 = -10; public static final int FORMAT_4_0 = -10;
/** Each segment records whether it has term vectors */
public static final int FORMAT_HAS_VECTORS = -11;
/** This must always point to the most recent file format. /** This must always point to the most recent file format.
* whenever you add a new format, make it 1 smaller (negative version logic)! */ * whenever you add a new format, make it 1 smaller (negative version logic)! */
public static final int FORMAT_CURRENT = FORMAT_4_0; public static final int FORMAT_CURRENT = FORMAT_HAS_VECTORS;
/** This must always point to the first supported file format. */ /** This must always point to the first supported file format. */
public static final int FORMAT_MINIMUM = FORMAT_DIAGNOSTICS; public static final int FORMAT_MINIMUM = FORMAT_DIAGNOSTICS;

View File

@ -39,7 +39,6 @@ import org.apache.lucene.store.Directory;
import org.apache.lucene.store.MockDirectoryWrapper; import org.apache.lucene.store.MockDirectoryWrapper;
import org.apache.lucene.store.RAMDirectory; import org.apache.lucene.store.RAMDirectory;
import org.apache.lucene.util.LuceneTestCase; import org.apache.lucene.util.LuceneTestCase;
import org.apache.lucene.util.Version;
import org.apache.lucene.util._TestUtil; import org.apache.lucene.util._TestUtil;
public class TestAddIndexes extends LuceneTestCase { public class TestAddIndexes extends LuceneTestCase {
@ -642,10 +641,12 @@ public class TestAddIndexes extends LuceneTestCase {
addDoc(writer); addDoc(writer);
writer.close(); writer.close();
dir2 = new MockDirectoryWrapper(random, new RAMDirectory()); dir2 = newDirectory();
writer2 = new IndexWriter(dir2, new IndexWriterConfig(TEST_VERSION_CURRENT, new MockAnalyzer())); writer2 = new IndexWriter(dir2, new IndexWriterConfig(TEST_VERSION_CURRENT, new MockAnalyzer()));
writer2.setInfoStream(VERBOSE ? System.out : null);
writer2.commit(); writer2.commit();
readers = new IndexReader[NUM_COPY]; readers = new IndexReader[NUM_COPY];
for(int i=0;i<NUM_COPY;i++) for(int i=0;i<NUM_COPY;i++)
readers[i] = IndexReader.open(dir, true); readers[i] = IndexReader.open(dir, true);
@ -919,9 +920,12 @@ public class TestAddIndexes extends LuceneTestCase {
CommitAndAddIndexes3 c = new CommitAndAddIndexes3(NUM_COPY); CommitAndAddIndexes3 c = new CommitAndAddIndexes3(NUM_COPY);
c.launchThreads(-1); c.launchThreads(-1);
Thread.sleep(500); Thread.sleep(_TestUtil.nextInt(random, 100, 500));
// Close w/o first stopping/joining the threads // Close w/o first stopping/joining the threads
if (VERBOSE) {
System.out.println("TEST: now force rollback");
}
c.didClose = true; c.didClose = true;
c.writer2.rollback(); c.writer2.rollback();

View File

@ -270,7 +270,7 @@ public class TestCodecs extends LuceneTestCase {
final Directory dir = newDirectory(); final Directory dir = newDirectory();
this.write(fieldInfos, dir, fields); this.write(fieldInfos, dir, fields);
final SegmentInfo si = new SegmentInfo(SEGMENT, 10000, dir, false, -1, SEGMENT, false, true, SegmentCodecs.build(fieldInfos, CodecProvider.getDefault())); final SegmentInfo si = new SegmentInfo(SEGMENT, 10000, dir, false, -1, SEGMENT, false, true, SegmentCodecs.build(fieldInfos, CodecProvider.getDefault()), fieldInfos.hasVectors());
si.setHasProx(false); si.setHasProx(false);
final FieldsProducer reader = si.getSegmentCodecs().codec().fieldsProducer(new SegmentReadState(dir, si, fieldInfos, 64, IndexReader.DEFAULT_TERMS_INDEX_DIVISOR)); final FieldsProducer reader = si.getSegmentCodecs().codec().fieldsProducer(new SegmentReadState(dir, si, fieldInfos, 64, IndexReader.DEFAULT_TERMS_INDEX_DIVISOR));
@ -318,7 +318,7 @@ public class TestCodecs extends LuceneTestCase {
final Directory dir = newDirectory(); final Directory dir = newDirectory();
this.write(fieldInfos, dir, fields); this.write(fieldInfos, dir, fields);
final SegmentInfo si = new SegmentInfo(SEGMENT, 10000, dir, false, -1, SEGMENT, false, true, SegmentCodecs.build(fieldInfos, CodecProvider.getDefault())); final SegmentInfo si = new SegmentInfo(SEGMENT, 10000, dir, false, -1, SEGMENT, false, true, SegmentCodecs.build(fieldInfos, CodecProvider.getDefault()), fieldInfos.hasVectors());
final FieldsProducer terms = si.getSegmentCodecs().codec().fieldsProducer(new SegmentReadState(dir, si, fieldInfos, 1024, IndexReader.DEFAULT_TERMS_INDEX_DIVISOR)); final FieldsProducer terms = si.getSegmentCodecs().codec().fieldsProducer(new SegmentReadState(dir, si, fieldInfos, 1024, IndexReader.DEFAULT_TERMS_INDEX_DIVISOR));

View File

@ -201,7 +201,8 @@ public class TestDoc extends LuceneTestCase {
r2.close(); r2.close();
final SegmentInfo info = new SegmentInfo(merged, si1.docCount + si2.docCount, si1.dir, final SegmentInfo info = new SegmentInfo(merged, si1.docCount + si2.docCount, si1.dir,
useCompoundFile, -1, null, false, merger.hasProx(), merger.getSegmentCodecs()); useCompoundFile, -1, null, false, merger.hasProx(), merger.getSegmentCodecs(),
merger.hasVectors());
if (useCompoundFile) { if (useCompoundFile) {
Collection<String> filesToDelete = merger.createCompoundFile(merged + ".cfs", info); Collection<String> filesToDelete = merger.createCompoundFile(merged + ".cfs", info);

View File

@ -881,10 +881,14 @@ public class TestIndexWriter extends LuceneTestCase {
public void testEmptyDocAfterFlushingRealDoc() throws IOException { public void testEmptyDocAfterFlushingRealDoc() throws IOException {
Directory dir = newDirectory(); Directory dir = newDirectory();
IndexWriter writer = new IndexWriter(dir, newIndexWriterConfig( TEST_VERSION_CURRENT, new MockAnalyzer())); IndexWriter writer = new IndexWriter(dir, newIndexWriterConfig( TEST_VERSION_CURRENT, new MockAnalyzer()));
writer.setInfoStream(VERBOSE ? System.out : null);
Document doc = new Document(); Document doc = new Document();
doc.add(newField("field", "aaa", Field.Store.YES, Field.Index.ANALYZED, Field.TermVector.WITH_POSITIONS_OFFSETS)); doc.add(newField("field", "aaa", Field.Store.YES, Field.Index.ANALYZED, Field.TermVector.WITH_POSITIONS_OFFSETS));
writer.addDocument(doc); writer.addDocument(doc);
writer.commit(); writer.commit();
if (VERBOSE) {
System.out.println("\nTEST: now add empty doc");
}
writer.addDocument(new Document()); writer.addDocument(new Document());
writer.close(); writer.close();
_TestUtil.checkIndex(dir); _TestUtil.checkIndex(dir);
@ -1027,7 +1031,11 @@ public class TestIndexWriter extends LuceneTestCase {
Directory dir = newDirectory(); Directory dir = newDirectory();
int delID = 0; int delID = 0;
for(int i=0;i<20;i++) { for(int i=0;i<20;i++) {
if (VERBOSE) {
System.out.println("TEST: iter=" + i);
}
IndexWriter writer = new IndexWriter(dir, newIndexWriterConfig( TEST_VERSION_CURRENT, new MockAnalyzer()).setMaxBufferedDocs(2)); IndexWriter writer = new IndexWriter(dir, newIndexWriterConfig( TEST_VERSION_CURRENT, new MockAnalyzer()).setMaxBufferedDocs(2));
writer.setInfoStream(VERBOSE ? System.out : null);
LogMergePolicy lmp = (LogMergePolicy) writer.getConfig().getMergePolicy(); LogMergePolicy lmp = (LogMergePolicy) writer.getConfig().getMergePolicy();
lmp.setMergeFactor(2); lmp.setMergeFactor(2);
lmp.setUseCompoundFile(false); lmp.setUseCompoundFile(false);

View File

@ -51,7 +51,7 @@ public class TestIndexWriterOnDiskFull extends LuceneTestCase {
System.out.println("TEST: pass=" + pass); System.out.println("TEST: pass=" + pass);
} }
boolean doAbort = pass == 1; boolean doAbort = pass == 1;
long diskFree = 200; long diskFree = _TestUtil.nextInt(random, 100, 300);
while(true) { while(true) {
if (VERBOSE) { if (VERBOSE) {
System.out.println("TEST: cycle: diskFree=" + diskFree); System.out.println("TEST: cycle: diskFree=" + diskFree);
@ -120,7 +120,7 @@ public class TestIndexWriterOnDiskFull extends LuceneTestCase {
dir.close(); dir.close();
// Now try again w/ more space: // Now try again w/ more space:
diskFree += 500; diskFree += _TestUtil.nextInt(random, 400, 600);
} else { } else {
//_TestUtil.syncConcurrentMerges(writer); //_TestUtil.syncConcurrentMerges(writer);
dir.setMaxSizeInBytes(0); dir.setMaxSizeInBytes(0);

View File

@ -80,7 +80,8 @@ public class TestSegmentMerger extends LuceneTestCase {
assertTrue(docsMerged == 2); assertTrue(docsMerged == 2);
//Should be able to open a new SegmentReader against the new directory //Should be able to open a new SegmentReader against the new directory
SegmentReader mergedReader = SegmentReader.get(false, mergedDir, new SegmentInfo(mergedSegment, docsMerged, mergedDir, false, -1, SegmentReader mergedReader = SegmentReader.get(false, mergedDir, new SegmentInfo(mergedSegment, docsMerged, mergedDir, false, -1,
null, false, merger.hasProx(), merger.getSegmentCodecs()), BufferedIndexInput.BUFFER_SIZE, true, IndexReader.DEFAULT_TERMS_INDEX_DIVISOR); null, false, merger.hasProx(), merger.getSegmentCodecs(), merger.hasVectors()),
BufferedIndexInput.BUFFER_SIZE, true, IndexReader.DEFAULT_TERMS_INDEX_DIVISOR);
assertTrue(mergedReader != null); assertTrue(mergedReader != null);
assertTrue(mergedReader.numDocs() == 2); assertTrue(mergedReader.numDocs() == 2);

View File

@ -106,6 +106,7 @@ public class MockIndexOutputWrapper extends IndexOutput {
message += ")"; message += ")";
if (LuceneTestCase.VERBOSE) { if (LuceneTestCase.VERBOSE) {
System.out.println(Thread.currentThread().getName() + ": MDW: now throw fake disk full"); System.out.println(Thread.currentThread().getName() + ": MDW: now throw fake disk full");
new Throwable().printStackTrace(System.out);
} }
throw new IOException(message); throw new IOException(message);
} else { } else {