LUCENE-1773: fix highlighter test case; add contrib/memory as dependency to contrib/benchmark

git-svn-id: https://svn.apache.org/repos/asf/lucene/java/trunk@801160 13f79535-47bb-0310-9956-ffa450edef68
2009-08-05 12:09:48 +00:00 · 2009-08-05 12:09:48 +00:00 · c471e8e83c
parent fe43cd7243
commit c471e8e83c
6 changed files with 55 additions and 42 deletions
--- a/contrib/benchmark/CHANGES.txt
+++ b/contrib/benchmark/CHANGES.txt
@ -8,8 +8,15 @@ $Id:$
  LUCENE-1770: Add EnwikiQueryMaker (Mark Miller)

 8/04/2009
-  LUCENE-1773: Add FastVectorHighlighter tasks.  (Koji Sekiguchi via
-  Mike McCandless)
+  LUCENE-1773: Add FastVectorHighlighter tasks.  This change is a
+  non-backwards compatible change in how subclasses of ReadTask define
+  a highlighter.  The methods doHighlight, isMergeContiguousFragments,
+  maxNumFragments and getHighlighter are no longer used and have been
+  mark deprecated and package protected private so there's a compile
+  time error.  Instead, the new getBenchmarkHighlighter method should
+  return an appropriate highlighter for the task. The configuration of
+  the highlighter tasks (maxFrags, mergeContiguous, etc.) is now
+  accepted as params to the task.  (Koji Sekiguchi via Mike McCandless)

 8/03/2009
  LUCENE-1778: Add support for log.step setting per task type. Perviously, if
--- a/contrib/benchmark/build.xml
+++ b/contrib/benchmark/build.xml
@ -105,6 +105,7 @@
        <pathelement path="${common.dir}/build/classes/java"/>
        <pathelement path="${common.dir}/build/classes/demo"/>
        <pathelement path="${common.dir}/build/contrib/highlighter/classes/java"/>
+        <pathelement path="${common.dir}/build/contrib/memory/classes/java"/>
        <pathelement path="${common.dir}/build/contrib/fast-vector-highlighter/classes/java"/>
    	<fileset dir="lib">
    		<include name="**/*.jar"/>
@ -149,13 +150,18 @@
         <fileset dir="${common.dir}/contrib/highlighter" includes="build.xml"/>
      </subant>
    </target>
+    <target name="compile-memory">
+      <subant target="compile">
+         <fileset dir="${common.dir}/contrib/memory" includes="build.xml"/>
+      </subant>
+    </target>
    <target name="compile-vector-highlighter">
      <subant target="compile">
         <fileset dir="${common.dir}/contrib/fast-vector-highlighter" includes="build.xml"/>
      </subant>
    </target>

-    <target name="init" depends="common.init,compile-demo,compile-highlighter,compile-vector-highlighter,check-files"/>
+    <target name="init" depends="common.init,compile-demo,compile-memory,compile-highlighter,compile-vector-highlighter,check-files"/>

    <!-- make sure online collections (reuters) are first downloaded -->
    <target name="test" depends="init,get-files">
--- a/contrib/benchmark/src/java/org/apache/lucene/benchmark/byTask/tasks/ReadTask.java
+++ b/contrib/benchmark/src/java/org/apache/lucene/benchmark/byTask/tasks/ReadTask.java
@ -38,10 +38,6 @@ import org.apache.lucene.search.IndexSearcher;
 import org.apache.lucene.search.Query;
 import org.apache.lucene.search.Sort;
 import org.apache.lucene.search.highlight.Highlighter;
-import org.apache.lucene.search.highlight.QueryTermScorer;
-import org.apache.lucene.search.highlight.SimpleHTMLFormatter;
-import org.apache.lucene.search.highlight.TextFragment;
-import org.apache.lucene.search.highlight.TokenSources;
 import org.apache.lucene.search.highlight.InvalidTokenOffsetsException;
 import org.apache.lucene.store.Directory;

@ -122,10 +118,8 @@ public abstract class ReadTask extends PerfTask {
            int numHighlight = Math.min(numToHighlight(), scoreDocs.length);
            Analyzer analyzer = getRunData().getAnalyzer();
            BenchmarkHighlighter highlighter = null;
-            int maxFrags = 1;
            if (numHighlight > 0) {
              highlighter = getBenchmarkHighlighter(q);
-              maxFrags = maxNumFragments();
            }
            for (int m = 0; m < traversalSize; m++) {
              int id = scoreDocs[m].doc;
@ -242,37 +236,50 @@ public abstract class ReadTask extends PerfTask {
  /**
   * @deprecated Use {@link #getBenchmarkHighlighter(Query)}
   */
-  protected Highlighter getHighlighter(Query q){
-    return new Highlighter(new SimpleHTMLFormatter(), new QueryTermScorer(q));
+  final Highlighter getHighlighter(Query q) {
+    // not called
+    return null;
  }
  
+  /**
+   * Return an appropriate highlighter to be used with
+   * highlighting tasks
+   */
  protected BenchmarkHighlighter getBenchmarkHighlighter(Query q){
    return null;
  }

  /**
-   *
   * @return the maxiumum number of highlighter fragments
+   * @deprecated Please define getBenchmarkHighlighter instead
   */
-  public int maxNumFragments(){
+  final int maxNumFragments(){
+    // not called -- we switched this method to final to
+    // force any external subclasses to cutover to
+    // getBenchmarkHighlighter instead
    return 10;
  }

  /**
   *
   * @return true if the highlighter should merge contiguous fragments
-   * @deprecated
+   * @deprecated Please define getBenchmarkHighlighter instead
   */
-  public boolean isMergeContiguousFragments(){
+  final boolean isMergeContiguousFragments(){
+    // not called -- we switched this method to final to
+    // force any external subclasses to cutover to
+    // getBenchmarkHighlighter instead
    return false;
  }

  /**
-   * @deprecated
+   * @deprecated Please define getBenchmarkHighlighter instead
   */
-  protected int doHighlight(TokenStream ts, String text,  Highlighter highlighter, boolean mergeContiguous, int maxFragments) throws IOException, InvalidTokenOffsetsException {
-    TextFragment[] frag = highlighter.getBestTextFragments(ts, text, mergeContiguous, maxFragments);
-    return frag != null ? frag.length : 0;
+  final int doHighlight(TokenStream ts, String text,  Highlighter highlighter, boolean mergeContiguous, int maxFragments) throws IOException, InvalidTokenOffsetsException {
+    // not called -- we switched this method to final to
+    // force any external subclasses to cutover to
+    // getBenchmarkHighlighter instead
+    return 0;
  }
  
  protected Sort getSort() {
--- a/contrib/benchmark/src/java/org/apache/lucene/benchmark/byTask/tasks/SearchTravRetHighlightTask.java
+++ b/contrib/benchmark/src/java/org/apache/lucene/benchmark/byTask/tasks/SearchTravRetHighlightTask.java
@ -24,13 +24,11 @@ import org.apache.lucene.document.Document;
 import org.apache.lucene.index.IndexReader;
 import org.apache.lucene.search.Query;
 import org.apache.lucene.search.highlight.Highlighter;
-import org.apache.lucene.search.highlight.InvalidTokenOffsetsException;
 import org.apache.lucene.search.highlight.QueryScorer;
 import org.apache.lucene.search.highlight.SimpleHTMLFormatter;
 import org.apache.lucene.search.highlight.TextFragment;
 import org.apache.lucene.search.highlight.TokenSources;

-import java.io.IOException;
 import java.util.Set;
 import java.util.Collection;
 import java.util.HashSet;
@ -103,17 +101,6 @@ public class SearchTravRetHighlightTask extends SearchTravTask {
    };
  }

-  /**
-   * @deprecated
-   */
-  public boolean isMergeContiguousFragments() {
-    return mergeContiguous;
-  }
-
-  public int maxNumFragments() {
-    return maxFrags;
-  }
-
  protected Collection/*<String>*/ getFieldsToHighlight(Document document) {
    Collection result = super.getFieldsToHighlight(document);
    //if stored is false, then result will be empty, in which case just get all the param fields
--- a/contrib/benchmark/src/java/org/apache/lucene/benchmark/byTask/tasks/SearchTravRetVectorHighlightTask.java
+++ b/contrib/benchmark/src/java/org/apache/lucene/benchmark/byTask/tasks/SearchTravRetVectorHighlightTask.java
@ -101,10 +101,6 @@ public class SearchTravRetVectorHighlightTask extends SearchTravTask {
    };
  }

-  public int maxNumFragments() {
-    return maxFrags;
-  }
-
  protected Collection/*<String>*/ getFieldsToHighlight(Document document) {
    Collection result = super.getFieldsToHighlight(document);
    //if stored is false, then result will be empty, in which case just get all the param fields
--- a/contrib/benchmark/src/test/org/apache/lucene/benchmark/byTask/tasks/CountingHighlighterTestTask.java
+++ b/contrib/benchmark/src/test/org/apache/lucene/benchmark/byTask/tasks/CountingHighlighterTestTask.java
@ -19,9 +19,13 @@ package org.apache.lucene.benchmark.byTask.tasks;

 import org.apache.lucene.benchmark.byTask.PerfRunData;
 import org.apache.lucene.analysis.TokenStream;
+import org.apache.lucene.analysis.Analyzer;
+import org.apache.lucene.search.highlight.SimpleHTMLFormatter;
 import org.apache.lucene.search.highlight.Highlighter;
 import org.apache.lucene.search.highlight.TextFragment;
-import org.apache.lucene.search.highlight.InvalidTokenOffsetsException;
+import org.apache.lucene.search.highlight.QueryScorer;
+import org.apache.lucene.search.highlight.TokenSources;
+import org.apache.lucene.search.Query;
 import org.apache.lucene.document.Document;
 import org.apache.lucene.index.IndexReader;

@ -47,9 +51,15 @@ public class CountingHighlighterTestTask extends SearchTravRetHighlightTask {
    return document;
  }

-  protected int doHighlight(TokenStream ts, String text,  Highlighter highlighter, boolean mergeContiguous, int maxFragments) throws IOException, InvalidTokenOffsetsException {
-    TextFragment[] frag = highlighter.getBestTextFragments(ts, text, mergeContiguous, maxFragments);
-    numHighlightedResults += frag != null ? frag.length : 0;
-    return frag != null ? frag.length : 0;
+  public BenchmarkHighlighter getBenchmarkHighlighter(Query q) {
+    highlighter = new Highlighter(new SimpleHTMLFormatter(), new QueryScorer(q));
+    return new BenchmarkHighlighter() {
+      public int doHighlight(IndexReader reader, int doc, String field, Document document, Analyzer analyzer, String text) throws Exception {
+        TokenStream ts = TokenSources.getAnyTokenStream(reader, doc, field, document, analyzer);
+        TextFragment[] frag = highlighter.getBestTextFragments(ts, text, mergeContiguous, maxFrags);
+        numHighlightedResults += frag != null ? frag.length : 0;
+        return frag != null ? frag.length : 0;
+      }
+    };
  }
-}
+}