mirror of https://github.com/apache/lucene.git
LUCENE-9565 Fix competitive iteration (#1952)
PR #1351 introduced a sort optimization where documents can be skipped. But iteration over competitive iterators was not properly organized, as they were not storing the current docID, and when competitive iterator was updated the current doc ID was lost. This patch fixed it. Relates to #1351
This commit is contained in:
parent
6ac94a6f9f
commit
874c446ab9
|
@ -204,9 +204,17 @@ public abstract class Weight implements SegmentCacheable {
|
||||||
collector.setScorer(scorer);
|
collector.setScorer(scorer);
|
||||||
DocIdSetIterator scorerIterator = twoPhase == null ? iterator : twoPhase.approximation();
|
DocIdSetIterator scorerIterator = twoPhase == null ? iterator : twoPhase.approximation();
|
||||||
DocIdSetIterator collectorIterator = collector.competitiveIterator();
|
DocIdSetIterator collectorIterator = collector.competitiveIterator();
|
||||||
// if possible filter scorerIterator to keep only competitive docs as defined by collector
|
DocIdSetIterator filteredIterator;
|
||||||
DocIdSetIterator filteredIterator = collectorIterator == null ? scorerIterator :
|
if (collectorIterator == null) {
|
||||||
ConjunctionDISI.intersectIterators(Arrays.asList(scorerIterator, collectorIterator));
|
filteredIterator = scorerIterator;
|
||||||
|
} else {
|
||||||
|
if (scorerIterator.docID() != -1) {
|
||||||
|
// Wrap ScorerIterator to start from -1 for conjunction
|
||||||
|
scorerIterator = new RangeDISIWrapper(scorerIterator, max);
|
||||||
|
}
|
||||||
|
// filter scorerIterator to keep only competitive docs as defined by collector
|
||||||
|
filteredIterator = ConjunctionDISI.intersectIterators(Arrays.asList(scorerIterator, collectorIterator));
|
||||||
|
}
|
||||||
if (filteredIterator.docID() == -1 && min == 0 && max == DocIdSetIterator.NO_MORE_DOCS) {
|
if (filteredIterator.docID() == -1 && min == 0 && max == DocIdSetIterator.NO_MORE_DOCS) {
|
||||||
scoreAll(collector, filteredIterator, twoPhase, acceptDocs);
|
scoreAll(collector, filteredIterator, twoPhase, acceptDocs);
|
||||||
return DocIdSetIterator.NO_MORE_DOCS;
|
return DocIdSetIterator.NO_MORE_DOCS;
|
||||||
|
@ -266,4 +274,45 @@ public abstract class Weight implements SegmentCacheable {
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
/**
|
||||||
|
* Wraps an internal docIdSetIterator for it to start with docID = -1
|
||||||
|
*/
|
||||||
|
protected static class RangeDISIWrapper extends DocIdSetIterator {
|
||||||
|
private final DocIdSetIterator in;
|
||||||
|
private final int min;
|
||||||
|
private final int max;
|
||||||
|
private int docID = -1;
|
||||||
|
|
||||||
|
public RangeDISIWrapper(DocIdSetIterator in, int max) {
|
||||||
|
this.in = in;
|
||||||
|
this.min = in.docID();
|
||||||
|
this.max = max;
|
||||||
|
}
|
||||||
|
|
||||||
|
@Override
|
||||||
|
public int docID() {
|
||||||
|
return docID;
|
||||||
|
}
|
||||||
|
|
||||||
|
@Override
|
||||||
|
public int nextDoc() throws IOException {
|
||||||
|
return advance(docID + 1);
|
||||||
|
}
|
||||||
|
|
||||||
|
@Override
|
||||||
|
public int advance(int target) throws IOException {
|
||||||
|
target = Math.max(min, target);
|
||||||
|
if (target >= max) {
|
||||||
|
return docID = NO_MORE_DOCS;
|
||||||
|
}
|
||||||
|
return docID = in.advance(target);
|
||||||
|
}
|
||||||
|
|
||||||
|
@Override
|
||||||
|
public long cost() {
|
||||||
|
return Math.min(max - min, in.cost());
|
||||||
|
}
|
||||||
|
|
||||||
|
}
|
||||||
|
|
||||||
}
|
}
|
||||||
|
|
|
@ -133,14 +133,16 @@ public class DocComparator extends FieldComparator<Integer> {
|
||||||
return null;
|
return null;
|
||||||
} else {
|
} else {
|
||||||
return new DocIdSetIterator() {
|
return new DocIdSetIterator() {
|
||||||
|
private int docID = -1;
|
||||||
|
|
||||||
@Override
|
@Override
|
||||||
public int nextDoc() throws IOException {
|
public int nextDoc() throws IOException {
|
||||||
return competitiveIterator.nextDoc();
|
return advance(docID + 1);
|
||||||
}
|
}
|
||||||
|
|
||||||
@Override
|
@Override
|
||||||
public int docID() {
|
public int docID() {
|
||||||
return competitiveIterator.docID();
|
return docID;
|
||||||
}
|
}
|
||||||
|
|
||||||
@Override
|
@Override
|
||||||
|
@ -150,7 +152,7 @@ public class DocComparator extends FieldComparator<Integer> {
|
||||||
|
|
||||||
@Override
|
@Override
|
||||||
public int advance(int target) throws IOException {
|
public int advance(int target) throws IOException {
|
||||||
return competitiveIterator.advance(target);
|
return docID = competitiveIterator.advance(target);
|
||||||
}
|
}
|
||||||
};
|
};
|
||||||
}
|
}
|
||||||
|
|
|
@ -220,14 +220,16 @@ public abstract class NumericComparator<T extends Number> extends FieldComparato
|
||||||
public DocIdSetIterator competitiveIterator() {
|
public DocIdSetIterator competitiveIterator() {
|
||||||
if (enableSkipping == false) return null;
|
if (enableSkipping == false) return null;
|
||||||
return new DocIdSetIterator() {
|
return new DocIdSetIterator() {
|
||||||
|
private int docID = -1;
|
||||||
|
|
||||||
@Override
|
@Override
|
||||||
public int nextDoc() throws IOException {
|
public int nextDoc() throws IOException {
|
||||||
return competitiveIterator.nextDoc();
|
return advance(docID + 1);
|
||||||
}
|
}
|
||||||
|
|
||||||
@Override
|
@Override
|
||||||
public int docID() {
|
public int docID() {
|
||||||
return competitiveIterator.docID();
|
return docID;
|
||||||
}
|
}
|
||||||
|
|
||||||
@Override
|
@Override
|
||||||
|
@ -237,7 +239,7 @@ public abstract class NumericComparator<T extends Number> extends FieldComparato
|
||||||
|
|
||||||
@Override
|
@Override
|
||||||
public int advance(int target) throws IOException {
|
public int advance(int target) throws IOException {
|
||||||
return competitiveIterator.advance(target);
|
return docID = competitiveIterator.advance(target);
|
||||||
}
|
}
|
||||||
};
|
};
|
||||||
}
|
}
|
||||||
|
|
Loading…
Reference in New Issue