added some javadoc

git-svn-id: https://svn.apache.org/repos/asf/lucene/dev/branches/docvalues@1104045 13f79535-47bb-0310-9956-ffa450edef68
This commit is contained in:
Simon Willnauer 2011-05-17 08:09:17 +00:00
parent f50134fe1b
commit 8603fac79a
10 changed files with 71 additions and 29 deletions

View File

@ -144,7 +144,7 @@ final class DocFieldProcessor extends DocConsumer {
try { try {
consumer.close(); consumer.close();
} catch (IOException e) { } catch (IOException e) {
// nocommit handle exce // ignore and continue closing remaining consumers
} }
} }
perDocConsumers.clear(); perDocConsumers.clear();

View File

@ -1069,7 +1069,19 @@ public abstract class IndexReader implements Cloneable,Closeable {
* through them yourself. */ * through them yourself. */
public abstract Fields fields() throws IOException; public abstract Fields fields() throws IOException;
// nocommit javadoc /**
* Flex API: returns {@link PerDocValues} for this reader.
* This method may return null if the reader has no per-document
* values stored.
*
* <p><b>NOTE</b>: if this is a multi reader ({@link
* #getSequentialSubReaders} is not null) then this
* method will throw UnsupportedOperationException. If
* you really need {@link PerDocValues} for such a reader,
* use {@link MultiPerDocValues#getPerDocs(IndexReader)}. However, for
* performance reasons, it's best to get all sub-readers
* using {@link ReaderUtil#gatherSubReaders} and iterate
* through them yourself. */
public abstract PerDocValues perDocValues() throws IOException; public abstract PerDocValues perDocValues() throws IOException;
public int docFreq(Term term) throws IOException { public int docFreq(Term term) throws IOException {

View File

@ -29,11 +29,20 @@ import org.apache.lucene.index.values.MultiDocValues;
import org.apache.lucene.index.values.Type; import org.apache.lucene.index.values.Type;
import org.apache.lucene.index.values.MultiDocValues.DocValuesIndex; import org.apache.lucene.index.values.MultiDocValues.DocValuesIndex;
import org.apache.lucene.util.ReaderUtil; import org.apache.lucene.util.ReaderUtil;
import org.apache.lucene.util.ReaderUtil.Gather;
/** /**
* Exposes per-document flex API, merged from per-document flex API of
* sub-segments. This is useful when you're interacting with an
* {@link IndexReader} implementation that consists of sequential sub-readers
* (eg DirectoryReader or {@link MultiReader}).
* *
* nocommit - javadoc * <p>
* @experimental * <b>NOTE</b>: for multi readers, you'll get better performance by gathering
* the sub readers using {@link ReaderUtil#gatherSubReaders} and then operate
* per-reader, instead of using this class.
*
* @lucene.experimental
*/ */
public class MultiPerDocValues extends PerDocValues { public class MultiPerDocValues extends PerDocValues {
private final PerDocValues[] subs; private final PerDocValues[] subs;
@ -50,6 +59,14 @@ public class MultiPerDocValues extends PerDocValues {
} }
} }
/**
* Returns a single {@link PerDocValues} instance for this reader, merging
* their values on the fly. This method will not return <code>null</code>.
*
* <p>
* <b>NOTE</b>: this is a slow way to access postings. It's better to get the
* sub-readers (using {@link Gather}) and iterate through them yourself.
*/
public static PerDocValues getPerDocs(IndexReader r) throws IOException { public static PerDocValues getPerDocs(IndexReader r) throws IOException {
final IndexReader[] subs = r.getSequentialSubReaders(); final IndexReader[] subs = r.getSequentialSubReaders();
if (subs == null) { if (subs == null) {

View File

@ -18,10 +18,13 @@ package org.apache.lucene.index;
import java.io.PrintStream; import java.io.PrintStream;
import java.util.concurrent.atomic.AtomicLong; import java.util.concurrent.atomic.AtomicLong;
import org.apache.lucene.index.codecs.PerDocConsumer;
import org.apache.lucene.store.Directory; import org.apache.lucene.store.Directory;
/** /**
* nocommit - javadoc * Encapsulates all necessary state to initiate a {@link PerDocConsumer} and
* create all necessary files in order to consume and merge per-document values.
*
* @lucene.experimental * @lucene.experimental
*/ */
public class PerDocWriteState { public class PerDocWriteState {
@ -33,14 +36,9 @@ public class PerDocWriteState {
public final SegmentCodecs segmentCodecs; public final SegmentCodecs segmentCodecs;
public final int codecId; public final int codecId;
/** Expert: The fraction of terms in the "dictionary" which should be stored PerDocWriteState(PrintStream infoStream, Directory directory,
* in RAM. Smaller values use more memory, but make searching slightly String segmentName, FieldInfos fieldInfos, AtomicLong bytesUsed,
* faster, while larger values use less memory and make searching slightly int codecId) {
* slower. Searching is typically not dominated by dictionary lookup, so
* tweaking this is rarely useful.*/
public int termIndexInterval; // TODO: this should be private to the codec, not settable here or in IWC
public PerDocWriteState(PrintStream infoStream, Directory directory, String segmentName, FieldInfos fieldInfos, AtomicLong bytesUsed, int codecId) {
this.infoStream = infoStream; this.infoStream = infoStream;
this.directory = directory; this.directory = directory;
this.segmentName = segmentName; this.segmentName = segmentName;
@ -50,7 +48,7 @@ public class PerDocWriteState {
this.bytesUsed = bytesUsed; this.bytesUsed = bytesUsed;
} }
public PerDocWriteState(SegmentWriteState state) { PerDocWriteState(SegmentWriteState state) {
infoStream = state.infoStream; infoStream = state.infoStream;
directory = state.directory; directory = state.directory;
segmentCodecs = state.segmentCodecs; segmentCodecs = state.segmentCodecs;
@ -60,7 +58,7 @@ public class PerDocWriteState {
bytesUsed = new AtomicLong(0); bytesUsed = new AtomicLong(0);
} }
public PerDocWriteState(PerDocWriteState state, int codecId) { PerDocWriteState(PerDocWriteState state, int codecId) {
this.infoStream = state.infoStream; this.infoStream = state.infoStream;
this.directory = state.directory; this.directory = state.directory;
this.segmentName = state.segmentName; this.segmentName = state.segmentName;
@ -70,7 +68,6 @@ public class PerDocWriteState {
this.bytesUsed = state.bytesUsed; this.bytesUsed = state.bytesUsed;
} }
public String codecIdAsString() { public String codecIdAsString() {
return "" + codecId; return "" + codecId;
} }

View File

@ -18,7 +18,6 @@ package org.apache.lucene.index;
*/ */
import java.io.PrintStream; import java.io.PrintStream;
import java.util.concurrent.atomic.AtomicLong;
import org.apache.lucene.store.Directory; import org.apache.lucene.store.Directory;
import org.apache.lucene.util.BitVector; import org.apache.lucene.util.BitVector;

View File

@ -23,7 +23,6 @@ import java.io.IOException;
import org.apache.lucene.index.Fields; import org.apache.lucene.index.Fields;
import org.apache.lucene.index.FieldsEnum; import org.apache.lucene.index.FieldsEnum;
import org.apache.lucene.index.Terms; import org.apache.lucene.index.Terms;
import org.apache.lucene.index.values.DocValues;
/** Abstract API that consumes terms, doc, freq, prox and /** Abstract API that consumes terms, doc, freq, prox and
* payloads postings. Concrete implementations of this * payloads postings. Concrete implementations of this

View File

@ -22,15 +22,24 @@ import org.apache.lucene.index.FieldInfo;
import org.apache.lucene.index.values.DocValues; import org.apache.lucene.index.values.DocValues;
/** /**
* nocommit - javadoc * Abstract API that consumes per document values. Concrete implementations of
* @experimental * this convert field values into a Codec specific format during indexing.
* <p>
* The {@link PerDocConsumer} API is accessible through flexible indexing / the
* {@link Codec} - API providing per field consumers and producers for inverted
* data (terms, postings) as well as per-document data.
* *
* @lucene.experimental
*/ */
public abstract class PerDocConsumer implements Closeable{ public abstract class PerDocConsumer implements Closeable{
/** Adds a new DocValuesField */ /** Adds a new DocValuesField */
public abstract DocValuesConsumer addValuesField(FieldInfo field) public abstract DocValuesConsumer addValuesField(FieldInfo field)
throws IOException; throws IOException;
/**
* Consumes and merges the given {@link PerDocValues} producer
* into this consumers format.
*/
public void merge(MergeState mergeState, PerDocValues producer) public void merge(MergeState mergeState, PerDocValues producer)
throws IOException { throws IOException {
Iterable<String> fields = producer.fields(); Iterable<String> fields = producer.fields();

View File

@ -22,9 +22,16 @@ import java.util.Collection;
import org.apache.lucene.index.values.DocValues; import org.apache.lucene.index.values.DocValues;
/** /**
* Abstract API that provides access to one or more per-document storage
* features. The concrete implementations provide access to the underlying
* storage on a per-document basis corresponding to their actual
* {@link PerDocConsumer} counterpart.
* <p>
* The {@link PerDocValues} API is accessible through flexible indexing / the
* {@link Codec} - API providing per field consumers and producers for inverted
* data (terms, postings) as well as per-document data.
* *
* nocommit javadoc * @lucene.experimental
* @experimental
*/ */
public abstract class PerDocValues implements Closeable { public abstract class PerDocValues implements Closeable {
/** /**
@ -40,5 +47,9 @@ public abstract class PerDocValues implements Closeable {
public static final PerDocValues[] EMPTY_ARRAY = new PerDocValues[0]; public static final PerDocValues[] EMPTY_ARRAY = new PerDocValues[0];
/**
* Returns all fields this {@link PerDocValues} contains values for.
*/
public abstract Collection<String> fields(); public abstract Collection<String> fields();
} }

View File

@ -27,7 +27,7 @@ import org.apache.lucene.util.AttributeSource;
import org.apache.lucene.util.BytesRef; import org.apache.lucene.util.BytesRef;
/** /**
* TODO * nocommit - javadoc
* *
* @see FieldsEnum#docValues() * @see FieldsEnum#docValues()
* @see Fields#docValues(String) * @see Fields#docValues(String)

View File

@ -69,10 +69,8 @@ public class TestDocValuesIndexing extends LuceneTestCase {
* *
* - Add documentation for: * - Add documentation for:
* - DocValues * - DocValues
* - Add @lucene.experimental to all necessary classes
* - add test for unoptimized case with deletes * - add test for unoptimized case with deletes
* - add multithreaded tests / integrate into stress indexing? * - add multithreaded tests / integrate into stress indexing?
* - run RAT
*/ */
@Before @Before