From 8e65aca0e1e08c8f3e3d53e2561b8cd09a5e1a22 Mon Sep 17 00:00:00 2001 From: Adrien Grand Date: Tue, 28 Feb 2017 13:38:55 +0100 Subject: [PATCH] LUCENE-7716: Reduce specialization in TopFieldCollector. --- .../search/MultiLeafFieldComparator.java | 92 +++++++ .../lucene/search/TopFieldCollector.java | 224 +++++------------- 2 files changed, 147 insertions(+), 169 deletions(-) create mode 100644 lucene/core/src/java/org/apache/lucene/search/MultiLeafFieldComparator.java diff --git a/lucene/core/src/java/org/apache/lucene/search/MultiLeafFieldComparator.java b/lucene/core/src/java/org/apache/lucene/search/MultiLeafFieldComparator.java new file mode 100644 index 00000000000..5fdb87d3e20 --- /dev/null +++ b/lucene/core/src/java/org/apache/lucene/search/MultiLeafFieldComparator.java @@ -0,0 +1,92 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one or more + * contributor license agreements. See the NOTICE file distributed with + * this work for additional information regarding copyright ownership. + * The ASF licenses this file to You under the Apache License, Version 2.0 + * (the "License"); you may not use this file except in compliance with + * the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ +package org.apache.lucene.search; + +import java.io.IOException; + +final class MultiLeafFieldComparator implements LeafFieldComparator { + + private final LeafFieldComparator[] comparators; + private final int[] reverseMul; + // we extract the first comparator to avoid array access in the common case + // that the first comparator compares worse than the bottom entry in the queue + private final LeafFieldComparator firstComparator; + private final int firstReverseMul; + + MultiLeafFieldComparator(LeafFieldComparator[] comparators, int[] reverseMul) { + if (comparators.length != reverseMul.length) { + throw new IllegalArgumentException("Must have the same number of comparators and reverseMul, got " + + comparators.length + " and " + reverseMul.length); + } + this.comparators = comparators; + this.reverseMul = reverseMul; + this.firstComparator = comparators[0]; + this.firstReverseMul = reverseMul[0]; + } + + @Override + public void setBottom(int slot) throws IOException { + for (LeafFieldComparator comparator : comparators) { + comparator.setBottom(slot); + } + } + + @Override + public int compareBottom(int doc) throws IOException { + int cmp = firstReverseMul * firstComparator.compareBottom(doc); + if (cmp != 0) { + return cmp; + } + for (int i = 1; i < comparators.length; ++i) { + cmp = reverseMul[i] * comparators[i].compareBottom(doc); + if (cmp != 0) { + return cmp; + } + } + return 0; + } + + @Override + public int compareTop(int doc) throws IOException { + int cmp = firstReverseMul * firstComparator.compareTop(doc); + if (cmp != 0) { + return cmp; + } + for (int i = 1; i < comparators.length; ++i) { + cmp = reverseMul[i] * comparators[i].compareTop(doc); + if (cmp != 0) { + return cmp; + } + } + return 0; + } + + @Override + public void copy(int slot, int doc) throws IOException { + for (LeafFieldComparator comparator : comparators) { + comparator.copy(slot, doc); + } + } + + @Override + public void setScorer(Scorer scorer) throws IOException { + for (LeafFieldComparator comparator : comparators) { + comparator.setScorer(scorer); + } + } + +} diff --git a/lucene/core/src/java/org/apache/lucene/search/TopFieldCollector.java b/lucene/core/src/java/org/apache/lucene/search/TopFieldCollector.java index 3433906df77..1ec322fe5d9 100644 --- a/lucene/core/src/java/org/apache/lucene/search/TopFieldCollector.java +++ b/lucene/core/src/java/org/apache/lucene/search/TopFieldCollector.java @@ -39,95 +39,31 @@ public abstract class TopFieldCollector extends TopDocsCollector { // always compare lower than a real hit; this would // save having to check queueFull on each insert - private static abstract class OneComparatorLeafCollector implements LeafCollector { + private static abstract class MultiComparatorLeafCollector implements LeafCollector { final LeafFieldComparator comparator; final int reverseMul; final boolean mayNeedScoresTwice; Scorer scorer; - OneComparatorLeafCollector(LeafFieldComparator comparator, int reverseMul, boolean mayNeedScoresTwice) { - this.comparator = comparator; - this.reverseMul = reverseMul; - this.mayNeedScoresTwice = mayNeedScoresTwice; - } - - @Override - public void setScorer(Scorer scorer) throws IOException { - if (mayNeedScoresTwice && scorer instanceof ScoreCachingWrappingScorer == false) { - scorer = new ScoreCachingWrappingScorer(scorer); - } - this.scorer = scorer; - comparator.setScorer(scorer); - } - } - - private static abstract class MultiComparatorLeafCollector implements LeafCollector { - - final LeafFieldComparator[] comparators; - final int[] reverseMul; - final LeafFieldComparator firstComparator; - final int firstReverseMul; - final boolean mayNeedScoresTwice; - Scorer scorer; - MultiComparatorLeafCollector(LeafFieldComparator[] comparators, int[] reverseMul, boolean mayNeedScoresTwice) { - this.comparators = comparators; - this.reverseMul = reverseMul; - firstComparator = comparators[0]; - firstReverseMul = reverseMul[0]; + if (comparators.length == 1) { + this.reverseMul = reverseMul[0]; + this.comparator = comparators[0]; + } else { + this.reverseMul = 1; + this.comparator = new MultiLeafFieldComparator(comparators, reverseMul); + } this.mayNeedScoresTwice = mayNeedScoresTwice; } - protected final int compareBottom(int doc) throws IOException { - int cmp = firstReverseMul * firstComparator.compareBottom(doc); - if (cmp != 0) { - return cmp; - } - for (int i = 1; i < comparators.length; ++i) { - cmp = reverseMul[i] * comparators[i].compareBottom(doc); - if (cmp != 0) { - return cmp; - } - } - return 0; - } - - protected final void copy(int slot, int doc) throws IOException { - for (LeafFieldComparator comparator : comparators) { - comparator.copy(slot, doc); - } - } - - protected final void setBottom(int slot) throws IOException { - for (LeafFieldComparator comparator : comparators) { - comparator.setBottom(slot); - } - } - - protected final int compareTop(int doc) throws IOException { - int cmp = firstReverseMul * firstComparator.compareTop(doc); - if (cmp != 0) { - return cmp; - } - for (int i = 1; i < comparators.length; ++i) { - cmp = reverseMul[i] * comparators[i].compareTop(doc); - if (cmp != 0) { - return cmp; - } - } - return 0; - } - @Override public void setScorer(Scorer scorer) throws IOException { - this.scorer = scorer; if (mayNeedScoresTwice && scorer instanceof ScoreCachingWrappingScorer == false) { scorer = new ScoreCachingWrappingScorer(scorer); } - for (LeafFieldComparator comparator : comparators) { - comparator.setScorer(scorer); - } + comparator.setScorer(scorer); + this.scorer = scorer; } } @@ -164,103 +100,53 @@ public abstract class TopFieldCollector extends TopDocsCollector { final LeafFieldComparator[] comparators = queue.getComparators(context); final int[] reverseMul = queue.getReverseMul(); - if (comparators.length == 1) { - return new OneComparatorLeafCollector(comparators[0], reverseMul[0], mayNeedScoresTwice) { + return new MultiComparatorLeafCollector(comparators, reverseMul, mayNeedScoresTwice) { - @Override - public void collect(int doc) throws IOException { - float score = Float.NaN; - if (trackMaxScore) { - score = scorer.score(); - if (score > maxScore) { - maxScore = score; - } + @Override + public void collect(int doc) throws IOException { + float score = Float.NaN; + if (trackMaxScore) { + score = scorer.score(); + if (score > maxScore) { + maxScore = score; + } + } + + ++totalHits; + if (queueFull) { + if (reverseMul * comparator.compareBottom(doc) <= 0) { + // since docs are visited in doc Id order, if compare is 0, it means + // this document is largest than anything else in the queue, and + // therefore not competitive. + return; } - ++totalHits; + if (trackDocScores && !trackMaxScore) { + score = scorer.score(); + } + + // This hit is competitive - replace bottom element in queue & adjustTop + comparator.copy(bottom.slot, doc); + updateBottom(doc, score); + comparator.setBottom(bottom.slot); + } else { + // Startup transient: queue hasn't gathered numHits yet + final int slot = totalHits - 1; + + if (trackDocScores && !trackMaxScore) { + score = scorer.score(); + } + + // Copy hit into queue + comparator.copy(slot, doc); + add(slot, doc, score); if (queueFull) { - if (reverseMul * comparator.compareBottom(doc) <= 0) { - // since docs are visited in doc Id order, if compare is 0, it means - // this document is largest than anything else in the queue, and - // therefore not competitive. - return; - } - - if (trackDocScores && !trackMaxScore) { - score = scorer.score(); - } - - // This hit is competitive - replace bottom element in queue & adjustTop - comparator.copy(bottom.slot, doc); - updateBottom(doc, score); comparator.setBottom(bottom.slot); - } else { - // Startup transient: queue hasn't gathered numHits yet - final int slot = totalHits - 1; - - if (trackDocScores && !trackMaxScore) { - score = scorer.score(); - } - - // Copy hit into queue - comparator.copy(slot, doc); - add(slot, doc, score); - if (queueFull) { - comparator.setBottom(bottom.slot); - } } } + } - }; - } else { - return new MultiComparatorLeafCollector(comparators, reverseMul, mayNeedScoresTwice) { - - @Override - public void collect(int doc) throws IOException { - float score = Float.NaN; - if (trackMaxScore) { - score = scorer.score(); - if (score > maxScore) { - maxScore = score; - } - } - - ++totalHits; - if (queueFull) { - if (compareBottom(doc) <= 0) { - // since docs are visited in doc Id order, if compare is 0, it means - // this document is largest than anything else in the queue, and - // therefore not competitive. - return; - } - - if (trackDocScores && !trackMaxScore) { - score = scorer.score(); - } - - // This hit is competitive - replace bottom element in queue & adjustTop - copy(bottom.slot, doc); - updateBottom(doc, score); - setBottom(bottom.slot); - } else { - // Startup transient: queue hasn't gathered numHits yet - final int slot = totalHits - 1; - - if (trackDocScores && !trackMaxScore) { - score = scorer.score(); - } - - // Copy hit into queue - copy(slot, doc); - add(slot, doc, score); - if (queueFull) { - setBottom(bottom.slot); - } - } - } - - }; - } + }; } } @@ -321,14 +207,14 @@ public abstract class TopFieldCollector extends TopDocsCollector { if (queueFull) { // Fastmatch: return if this hit is no better than // the worst hit currently in the queue: - final int cmp = compareBottom(doc); + final int cmp = reverseMul * comparator.compareBottom(doc); if (cmp <= 0) { // not competitive since documents are visited in doc id order return; } } - final int topCmp = compareTop(doc); + final int topCmp = reverseMul * comparator.compareTop(doc); if (topCmp > 0 || (topCmp == 0 && doc <= afterDoc)) { // Already collected on a previous page return; @@ -336,7 +222,7 @@ public abstract class TopFieldCollector extends TopDocsCollector { if (queueFull) { // This hit is competitive - replace bottom element in queue & adjustTop - copy(bottom.slot, doc); + comparator.copy(bottom.slot, doc); // Compute score only if it is competitive. if (trackDocScores && !trackMaxScore) { @@ -344,7 +230,7 @@ public abstract class TopFieldCollector extends TopDocsCollector { } updateBottom(doc, score); - setBottom(bottom.slot); + comparator.setBottom(bottom.slot); } else { collectedHits++; @@ -352,7 +238,7 @@ public abstract class TopFieldCollector extends TopDocsCollector { final int slot = collectedHits - 1; //System.out.println(" slot=" + slot); // Copy hit into queue - copy(slot, doc); + comparator.copy(slot, doc); // Compute score only if it is competitive. if (trackDocScores && !trackMaxScore) { @@ -361,7 +247,7 @@ public abstract class TopFieldCollector extends TopDocsCollector { bottom = pq.add(new Entry(slot, docBase + doc, score)); queueFull = collectedHits == numHits; if (queueFull) { - setBottom(bottom.slot); + comparator.setBottom(bottom.slot); } } }