From 3aed0fd54bcbf31e71268cf606c10fa9334debdf Mon Sep 17 00:00:00 2001
From: Michael McCandless <mikemccand@apache.org>
Date: Mon, 10 Aug 2009 18:46:39 +0000
Subject: [PATCH] LUCENE-1797: don't over-increment positions when creating
 MultiPhraseQuery

git-svn-id: https://svn.apache.org/repos/asf/lucene/java/trunk@802893 13f79535-47bb-0310-9956-ffa450edef68
---
 .../AnalyzerQueryNodeProcessor.java           | 10 ++--
 .../queryParser/standard/TestQPHelper.java    | 53 ++++++++++++++++++-
 2 files changed, 59 insertions(+), 4 deletions(-)
diff --git a/contrib/queryparser/src/java/org/apache/lucene/queryParser/standard/processors/AnalyzerQueryNodeProcessor.java b/contrib/queryparser/src/java/org/apache/lucene/queryParser/standard/processors/AnalyzerQueryNodeProcessor.java
index c44428daa89..9bd6e4a7ce9 100644
--- a/contrib/queryparser/src/java/org/apache/lucene/queryParser/standard/processors/AnalyzerQueryNodeProcessor.java
+++ b/contrib/queryparser/src/java/org/apache/lucene/queryParser/standard/processors/AnalyzerQueryNodeProcessor.java
@@ -218,6 +218,7 @@ public class AnalyzerQueryNodeProcessor extends QueryNodeProcessorImpl {
           List<FieldQueryNode> multiTerms = new ArrayList<FieldQueryNode>();
           int position = -1;
           int i = 0;
+          int termGroupCount = 0;
           for (; i < numTokens; i++) {
             String term = null;
             int positionIncrement = 1;
@@ -239,15 +240,18 @@ public class AnalyzerQueryNodeProcessor extends QueryNodeProcessorImpl {
 
                 if (this.positionIncrementsEnabled) {
                   termNode.setPositionIncrement(position);
-
                 } else {
-                  termNode.setPositionIncrement(i);
+                  termNode.setPositionIncrement(termGroupCount);
                 }
 
                 mpq.add(termNode);
 
               }
 
+              // Only increment once for each "group" of
+              // terms that were in the same position:
+              termGroupCount++;
+
               multiTerms.clear();
 
             }
@@ -263,7 +267,7 @@ public class AnalyzerQueryNodeProcessor extends QueryNodeProcessorImpl {
               termNode.setPositionIncrement(position);
 
             } else {
-              termNode.setPositionIncrement(i);
+              termNode.setPositionIncrement(termGroupCount);
             }
 
             mpq.add(termNode);
diff --git a/contrib/queryparser/src/test/org/apache/lucene/queryParser/standard/TestQPHelper.java b/contrib/queryparser/src/test/org/apache/lucene/queryParser/standard/TestQPHelper.java
index f75029ff98c..6679ded5d8e 100644
--- a/contrib/queryparser/src/test/org/apache/lucene/queryParser/standard/TestQPHelper.java
+++ b/contrib/queryparser/src/test/org/apache/lucene/queryParser/standard/TestQPHelper.java
@@ -41,11 +41,13 @@ import org.apache.lucene.analysis.WhitespaceAnalyzer;
 import org.apache.lucene.analysis.standard.StandardAnalyzer;
 import org.apache.lucene.analysis.tokenattributes.OffsetAttribute;
 import org.apache.lucene.analysis.tokenattributes.TermAttribute;
+import org.apache.lucene.analysis.tokenattributes.PositionIncrementAttribute;
 import org.apache.lucene.document.DateField;
 import org.apache.lucene.document.DateTools;
 import org.apache.lucene.document.Document;
 import org.apache.lucene.document.Field;
 import org.apache.lucene.index.IndexWriter;
+import org.apache.lucene.index.IndexReader;
 import org.apache.lucene.index.Term;
 import org.apache.lucene.messages.MessageImpl;
 import org.apache.lucene.queryParser.core.QueryNodeException;
@@ -55,12 +57,12 @@ import org.apache.lucene.queryParser.core.nodes.QueryNode;
 import org.apache.lucene.queryParser.core.nodes.WildcardQueryNode;
 import org.apache.lucene.queryParser.core.processors.QueryNodeProcessorImpl;
 import org.apache.lucene.queryParser.core.processors.QueryNodeProcessorPipeline;
-import org.apache.lucene.queryParser.standard.config.StandardQueryConfigHandler;
 import org.apache.lucene.queryParser.standard.config.DefaultOperatorAttribute.Operator;
 import org.apache.lucene.search.BooleanQuery;
 import org.apache.lucene.search.FuzzyQuery;
 import org.apache.lucene.search.IndexSearcher;
 import org.apache.lucene.search.MatchAllDocsQuery;
+import org.apache.lucene.search.MultiPhraseQuery;
 import org.apache.lucene.search.MultiTermQuery;
 import org.apache.lucene.search.PhraseQuery;
 import org.apache.lucene.search.PrefixQuery;
@@ -70,6 +72,7 @@ import org.apache.lucene.search.TermQuery;
 import org.apache.lucene.search.TermRangeQuery;
 import org.apache.lucene.search.WildcardQuery;
 import org.apache.lucene.store.RAMDirectory;
+import org.apache.lucene.store.MockRAMDirectory;
 import org.apache.lucene.util.LuceneTestCase;
 
 /**
@@ -1144,4 +1147,52 @@ public class TestQPHelper extends LuceneTestCase {
     BooleanQuery.setMaxClauseCount(originalMaxClauses);
   }
 
+  private class CannedTokenStream extends TokenStream {
+    private int upto = 0;
+    public boolean incrementToken() {
+      if (upto == 4) {
+        return false;
+      }
+      PositionIncrementAttribute posIncr = (PositionIncrementAttribute) addAttribute(PositionIncrementAttribute.class);
+      TermAttribute term = (TermAttribute) addAttribute(TermAttribute.class);
+      if (upto == 0) {
+        posIncr.setPositionIncrement(1);
+        term.setTermBuffer("a");
+      } else if (upto == 1) {
+        posIncr.setPositionIncrement(1);
+        term.setTermBuffer("b");
+      } else if (upto == 2) {
+        posIncr.setPositionIncrement(0);
+        term.setTermBuffer("c");
+      } else {
+        posIncr.setPositionIncrement(0);
+        term.setTermBuffer("d");
+      }
+      upto++;
+      return true;
+    }
+  }
+
+  private class CannedAnalyzer extends Analyzer {
+    public TokenStream tokenStream(String ignored, Reader alsoIgnored) {
+      return new CannedTokenStream();
+    }
+  }
+
+  public void testMultiPhraseQuery() throws Exception {
+    MockRAMDirectory dir = new MockRAMDirectory();
+    IndexWriter w = new IndexWriter(dir, new CannedAnalyzer(), IndexWriter.MaxFieldLength.UNLIMITED);
+    Document doc = new Document();
+    doc.add(new Field("field", "", Field.Store.NO, Field.Index.ANALYZED));
+    w.addDocument(doc);
+    IndexReader r = w.getReader();
+    IndexSearcher s = new IndexSearcher(r);
+    
+    Query q = new StandardQueryParser(new CannedAnalyzer()).parse("\"a\"", "field");
+    assertTrue(q instanceof MultiPhraseQuery);
+    assertEquals(1, s.search(q, 10).totalHits);
+    r.close();
+    w.close();
+  }
+
 }