Search: Cut over to IndexSearcher.count.

There is a new IndexSearcher.count method that makes it easier to count how
many documents match a particular query.
This commit is contained in:
Adrien Grand 2015-04-20 14:49:35 +02:00
parent 45fa5dcad9
commit 03c07377e3
3 changed files with 37 additions and 27 deletions

View File

@ -20,16 +20,26 @@
package org.elasticsearch.common.lucene; package org.elasticsearch.common.lucene;
import com.google.common.collect.Iterables; import com.google.common.collect.Iterables;
import com.google.common.collect.Lists;
import org.apache.lucene.analysis.core.KeywordAnalyzer; import org.apache.lucene.analysis.core.KeywordAnalyzer;
import org.apache.lucene.analysis.standard.StandardAnalyzer; import org.apache.lucene.analysis.standard.StandardAnalyzer;
import org.apache.lucene.codecs.CodecUtil; import org.apache.lucene.codecs.CodecUtil;
import org.apache.lucene.codecs.DocValuesFormat; import org.apache.lucene.codecs.DocValuesFormat;
import org.apache.lucene.codecs.PostingsFormat; import org.apache.lucene.codecs.PostingsFormat;
import org.apache.lucene.index.*; import org.apache.lucene.index.CorruptIndexException;
import org.apache.lucene.index.DirectoryReader;
import org.apache.lucene.index.IndexCommit;
import org.apache.lucene.index.IndexFileNames;
import org.apache.lucene.index.IndexFormatTooNewException;
import org.apache.lucene.index.IndexFormatTooOldException;
import org.apache.lucene.index.IndexWriter;
import org.apache.lucene.index.IndexWriterConfig;
import org.apache.lucene.index.LeafReaderContext;
import org.apache.lucene.index.NoMergePolicy;
import org.apache.lucene.index.SegmentCommitInfo;
import org.apache.lucene.index.SegmentInfos;
import org.apache.lucene.search.Collector; import org.apache.lucene.search.Collector;
import org.apache.lucene.search.ComplexExplanation; import org.apache.lucene.search.ComplexExplanation;
import org.apache.lucene.search.ConstantScoreQuery;
import org.apache.lucene.search.Explanation; import org.apache.lucene.search.Explanation;
import org.apache.lucene.search.FieldDoc; import org.apache.lucene.search.FieldDoc;
import org.apache.lucene.search.Filter; import org.apache.lucene.search.Filter;
@ -43,8 +53,11 @@ import org.apache.lucene.search.SortField;
import org.apache.lucene.search.TimeLimitingCollector; import org.apache.lucene.search.TimeLimitingCollector;
import org.apache.lucene.search.TopDocs; import org.apache.lucene.search.TopDocs;
import org.apache.lucene.search.TopFieldDocs; import org.apache.lucene.search.TopFieldDocs;
import org.apache.lucene.search.TotalHitCountCollector; import org.apache.lucene.store.Directory;
import org.apache.lucene.store.*; import org.apache.lucene.store.IOContext;
import org.apache.lucene.store.IndexInput;
import org.apache.lucene.store.Lock;
import org.apache.lucene.store.LockObtainFailedException;
import org.apache.lucene.util.BytesRef; import org.apache.lucene.util.BytesRef;
import org.apache.lucene.util.Counter; import org.apache.lucene.util.Counter;
import org.apache.lucene.util.Version; import org.apache.lucene.util.Version;
@ -64,7 +77,11 @@ import org.elasticsearch.index.fielddata.IndexFieldData;
import java.io.IOException; import java.io.IOException;
import java.text.ParseException; import java.text.ParseException;
import java.util.*; import java.util.ArrayList;
import java.util.Collection;
import java.util.Collections;
import java.util.List;
import java.util.Map;
import static org.elasticsearch.common.lucene.search.NoopCollector.NOOP_COLLECTOR; import static org.elasticsearch.common.lucene.search.NoopCollector.NOOP_COLLECTOR;
@ -236,10 +253,7 @@ public class Lucene {
} }
public static long count(IndexSearcher searcher, Query query) throws IOException { public static long count(IndexSearcher searcher, Query query) throws IOException {
TotalHitCountCollector countCollector = new TotalHitCountCollector(); return searcher.count(query);
query = wrapCountQuery(query);
searcher.search(query, countCollector);
return countCollector.getTotalHits();
} }
/** /**
@ -313,7 +327,6 @@ public class Lucene {
*/ */
public static boolean countWithEarlyTermination(IndexSearcher searcher, Filter filter, Query query, public static boolean countWithEarlyTermination(IndexSearcher searcher, Filter filter, Query query,
EarlyTerminatingCollector collector) throws IOException { EarlyTerminatingCollector collector) throws IOException {
query = wrapCountQuery(query);
try { try {
if (filter == null) { if (filter == null) {
searcher.search(query, collector); searcher.search(query, collector);
@ -335,14 +348,6 @@ public class Lucene {
return createCountBasedEarlyTerminatingCollector(1); return createCountBasedEarlyTerminatingCollector(1);
} }
private final static Query wrapCountQuery(Query query) {
// we don't need scores, so wrap it in a constant score query
if (!(query instanceof ConstantScoreQuery)) {
query = new ConstantScoreQuery(query);
}
return query;
}
/** /**
* Closes the index writer, returning <tt>false</tt> if it failed to close. * Closes the index writer, returning <tt>false</tt> if it failed to close.
*/ */

View File

@ -25,7 +25,16 @@ import org.apache.lucene.index.LeafReader;
import org.apache.lucene.index.LeafReaderContext; import org.apache.lucene.index.LeafReaderContext;
import org.apache.lucene.index.Term; import org.apache.lucene.index.Term;
import org.apache.lucene.queries.TermFilter; import org.apache.lucene.queries.TermFilter;
import org.apache.lucene.search.*; import org.apache.lucene.search.DocIdSet;
import org.apache.lucene.search.DocIdSetIterator;
import org.apache.lucene.search.Filter;
import org.apache.lucene.search.FilteredQuery;
import org.apache.lucene.search.Query;
import org.apache.lucene.search.TopDocs;
import org.apache.lucene.search.TopDocsCollector;
import org.apache.lucene.search.TopFieldCollector;
import org.apache.lucene.search.TopScoreDocCollector;
import org.apache.lucene.search.TotalHitCountCollector;
import org.apache.lucene.search.join.BitDocIdSetFilter; import org.apache.lucene.search.join.BitDocIdSetFilter;
import org.apache.lucene.util.BitSet; import org.apache.lucene.util.BitSet;
import org.apache.lucene.util.Bits; import org.apache.lucene.util.Bits;
@ -125,9 +134,7 @@ public final class InnerHitsContext {
Query q = new FilteredQuery(query, new NestedChildrenFilter(parentFilter, childFilter, hitContext)); Query q = new FilteredQuery(query, new NestedChildrenFilter(parentFilter, childFilter, hitContext));
if (size() == 0) { if (size() == 0) {
TotalHitCountCollector collector = new TotalHitCountCollector(); return new TopDocs(context.searcher().count(q), Lucene.EMPTY_SCORE_DOCS, 0);
context.searcher().search(q, collector);
return new TopDocs(collector.getTotalHits(), Lucene.EMPTY_SCORE_DOCS, 0);
} else { } else {
int topN = from() + size(); int topN = from() + size();
TopDocsCollector topDocsCollector; TopDocsCollector topDocsCollector;

View File

@ -20,10 +20,10 @@
package org.elasticsearch.search.query; package org.elasticsearch.search.query;
import com.google.common.collect.ImmutableMap; import com.google.common.collect.ImmutableMap;
import org.apache.lucene.search.Query; import org.apache.lucene.search.Query;
import org.apache.lucene.search.ScoreDoc; import org.apache.lucene.search.ScoreDoc;
import org.apache.lucene.search.TopDocs; import org.apache.lucene.search.TopDocs;
import org.apache.lucene.search.TotalHitCountCollector;
import org.elasticsearch.action.search.SearchType; import org.elasticsearch.action.search.SearchType;
import org.elasticsearch.common.inject.Inject; import org.elasticsearch.common.inject.Inject;
import org.elasticsearch.common.lucene.Lucene; import org.elasticsearch.common.lucene.Lucene;
@ -109,9 +109,7 @@ public class QueryPhase implements SearchPhase {
int numDocs = searchContext.from() + searchContext.size(); int numDocs = searchContext.from() + searchContext.size();
if (searchContext.size() == 0) { // no matter what the value of from is if (searchContext.size() == 0) { // no matter what the value of from is
TotalHitCountCollector collector = new TotalHitCountCollector(); topDocs = new TopDocs(searchContext.searcher().count(query), Lucene.EMPTY_SCORE_DOCS, 0);
searchContext.searcher().search(query, collector);
topDocs = new TopDocs(collector.getTotalHits(), Lucene.EMPTY_SCORE_DOCS, 0);
} else if (searchContext.searchType() == SearchType.SCAN) { } else if (searchContext.searchType() == SearchType.SCAN) {
topDocs = searchContext.scanContext().execute(searchContext); topDocs = searchContext.scanContext().execute(searchContext);
} else { } else {