From d8e0288109f05ffc828e7f41a0f00b2c6f707151 Mon Sep 17 00:00:00 2001 From: Shai Erera Date: Wed, 16 May 2012 08:01:40 +0000 Subject: [PATCH 01/47] LUCENE-4060: port to trunk git-svn-id: https://svn.apache.org/repos/asf/lucene/dev/trunk@1339047 13f79535-47bb-0310-9956-ffa450edef68 --- lucene/CHANGES.txt | 5 + .../example/merge/TaxonomyMergeUtils.java | 2 +- .../facet/taxonomy/directory/Consts.java | 3 +- .../directory/DirectoryTaxonomyWriter.java | 208 ++++---------- .../taxonomy/directory/TestAddTaxonomies.java | 254 ------------------ .../taxonomy/directory/TestAddTaxonomy.java | 228 ++++++++++++++++ 6 files changed, 280 insertions(+), 420 deletions(-) delete mode 100644 lucene/facet/src/test/org/apache/lucene/facet/taxonomy/directory/TestAddTaxonomies.java create mode 100644 lucene/facet/src/test/org/apache/lucene/facet/taxonomy/directory/TestAddTaxonomy.java diff --git a/lucene/CHANGES.txt b/lucene/CHANGES.txt index 17ea33945f8..5d86c224963 100644 --- a/lucene/CHANGES.txt +++ b/lucene/CHANGES.txt @@ -953,6 +953,11 @@ Bug fixes offset calculation in PathHierarchyTokenizer. (Mike McCandless, Uwe Schindler, Robert Muir) +* LUCENE-4060: Fix a synchronization bug in + DirectoryTaxonomyWriter.addTaxonomies(). Also, the method has been renamed to + addTaxonomy and now takes only one Directory and one OrdinalMap. + (Shai Erera, Gilad Barkai) + Documentation * LUCENE-3958: Javadocs corrections for IndexWriter. diff --git a/lucene/facet/src/examples/org/apache/lucene/facet/example/merge/TaxonomyMergeUtils.java b/lucene/facet/src/examples/org/apache/lucene/facet/example/merge/TaxonomyMergeUtils.java index 40dfac53dfd..835c8e846f5 100644 --- a/lucene/facet/src/examples/org/apache/lucene/facet/example/merge/TaxonomyMergeUtils.java +++ b/lucene/facet/src/examples/org/apache/lucene/facet/example/merge/TaxonomyMergeUtils.java @@ -81,7 +81,7 @@ public class TaxonomyMergeUtils { OrdinalMap map, IndexWriter destIndexWriter, DirectoryTaxonomyWriter destTaxWriter) throws IOException { // merge the taxonomies - destTaxWriter.addTaxonomies(new Directory[] { srcTaxDir }, new OrdinalMap[] { map }); + destTaxWriter.addTaxonomy(srcTaxDir, map); PayloadProcessorProvider payloadProcessor = new FacetsPayloadProcessorProvider( srcIndexDir, map.getMap(), new DefaultFacetIndexingParams()); diff --git a/lucene/facet/src/java/org/apache/lucene/facet/taxonomy/directory/Consts.java b/lucene/facet/src/java/org/apache/lucene/facet/taxonomy/directory/Consts.java index ec6e842c067..2d7988ad152 100644 --- a/lucene/facet/src/java/org/apache/lucene/facet/taxonomy/directory/Consts.java +++ b/lucene/facet/src/java/org/apache/lucene/facet/taxonomy/directory/Consts.java @@ -4,8 +4,6 @@ import java.io.IOException; import org.apache.lucene.index.FieldInfo; import org.apache.lucene.index.StoredFieldVisitor; -import org.apache.lucene.index.StoredFieldVisitor.Status; -import org.apache.lucene.store.IndexInput; /** * Licensed to the Apache Software Foundation (ASF) under one or more @@ -42,6 +40,7 @@ abstract class Consts { public static final class LoadFullPathOnly extends StoredFieldVisitor { private String fullPath; + @Override public void stringField(FieldInfo fieldInfo, String value) throws IOException { fullPath = value; } diff --git a/lucene/facet/src/java/org/apache/lucene/facet/taxonomy/directory/DirectoryTaxonomyWriter.java b/lucene/facet/src/java/org/apache/lucene/facet/taxonomy/directory/DirectoryTaxonomyWriter.java index e1dfbea534d..b77e0f1bcfe 100644 --- 
a/lucene/facet/src/java/org/apache/lucene/facet/taxonomy/directory/DirectoryTaxonomyWriter.java +++ b/lucene/facet/src/java/org/apache/lucene/facet/taxonomy/directory/DirectoryTaxonomyWriter.java @@ -12,15 +12,21 @@ import java.io.IOException; import java.util.HashMap; import java.util.Map; -import org.apache.lucene.analysis.core.KeywordAnalyzer; import org.apache.lucene.analysis.TokenStream; -import org.apache.lucene.analysis.tokenattributes.PositionIncrementAttribute; +import org.apache.lucene.analysis.core.KeywordAnalyzer; import org.apache.lucene.analysis.tokenattributes.CharTermAttribute; +import org.apache.lucene.analysis.tokenattributes.PositionIncrementAttribute; import org.apache.lucene.document.Document; import org.apache.lucene.document.Field; import org.apache.lucene.document.FieldType; import org.apache.lucene.document.StringField; import org.apache.lucene.document.TextField; +import org.apache.lucene.facet.taxonomy.CategoryPath; +import org.apache.lucene.facet.taxonomy.TaxonomyReader; +import org.apache.lucene.facet.taxonomy.TaxonomyWriter; +import org.apache.lucene.facet.taxonomy.writercache.TaxonomyWriterCache; +import org.apache.lucene.facet.taxonomy.writercache.cl2o.Cl2oTaxonomyWriterCache; +import org.apache.lucene.facet.taxonomy.writercache.lru.LruTaxonomyWriterCache; import org.apache.lucene.index.CorruptIndexException; import org.apache.lucene.index.DirectoryReader; import org.apache.lucene.index.DocsEnum; @@ -30,9 +36,9 @@ import org.apache.lucene.index.IndexWriterConfig; import org.apache.lucene.index.IndexWriterConfig.OpenMode; import org.apache.lucene.index.LogByteSizeMergePolicy; import org.apache.lucene.index.MultiFields; +import org.apache.lucene.index.SegmentInfos; import org.apache.lucene.index.Terms; import org.apache.lucene.index.TermsEnum; -import org.apache.lucene.index.SegmentInfos; import org.apache.lucene.index.TieredMergePolicy; import org.apache.lucene.search.DocIdSetIterator; import org.apache.lucene.store.AlreadyClosedException; @@ -44,13 +50,6 @@ import org.apache.lucene.util.Bits; import org.apache.lucene.util.BytesRef; import org.apache.lucene.util.Version; -import org.apache.lucene.facet.taxonomy.CategoryPath; -import org.apache.lucene.facet.taxonomy.TaxonomyReader; -import org.apache.lucene.facet.taxonomy.TaxonomyWriter; -import org.apache.lucene.facet.taxonomy.writercache.TaxonomyWriterCache; -import org.apache.lucene.facet.taxonomy.writercache.cl2o.Cl2oTaxonomyWriterCache; -import org.apache.lucene.facet.taxonomy.writercache.lru.LruTaxonomyWriterCache; - /** * Licensed to the Apache Software Foundation (ASF) under one or more * contributor license agreements. See the NOTICE file distributed with @@ -812,6 +811,7 @@ public class DirectoryTaxonomyWriter implements TaxonomyWriter { } return parentArray; } + @Override public int getParent(int ordinal) throws IOException { ensureOpen(); @@ -823,158 +823,47 @@ public class DirectoryTaxonomyWriter implements TaxonomyWriter { } return getParentArray().getArray()[ordinal]; } - + /** - * Take all the categories of one or more given taxonomies, and add them to - * the main taxonomy (this), if they are not already there. - *

- * Additionally, fill a mapping for each of the added taxonomies, - * mapping its ordinals to the ordinals in the enlarged main taxonomy. - * These mapping are saved into an array of OrdinalMap objects given by the - * user, one for each of the given taxonomies (not including "this", the main - * taxonomy). Often the first of these will be a MemoryOrdinalMap and the - * others will be a DiskOrdinalMap - see discussion in {OrdinalMap}. - *

- * Note that the taxonomies to be added are given as Directory objects, - * not opened TaxonomyReader/TaxonomyWriter objects, so if any of them are - * currently managed by an open TaxonomyWriter, make sure to commit() (or - * close()) it first. The main taxonomy (this) is an open TaxonomyWriter, - * and does not need to be commit()ed before this call. + * Takes the categories from the given taxonomy directory, and adds the + * missing ones to this taxonomy. Additionally, it fills the given + * {@link OrdinalMap} with a mapping from the original ordinal to the new + * ordinal. */ - public void addTaxonomies(Directory[] taxonomies, OrdinalMap[] ordinalMaps) throws IOException { + public void addTaxonomy(Directory taxoDir, OrdinalMap map) throws IOException { ensureOpen(); - // To prevent us stepping on the rest of this class's decisions on when - // to open a reader, and when not, we'll be opening a new reader instead - // of using the existing "reader" object: - IndexReader mainreader = openReader(); - // TODO (Facet): can this then go segment-by-segment and avoid MultiDocsEnum etc? - Terms terms = MultiFields.getTerms(mainreader, Consts.FULL); - assert terms != null; // TODO (Facet): explicit check / throw exception? - TermsEnum mainte = terms.iterator(null); - DocsEnum mainde = null; - - IndexReader[] otherreaders = new IndexReader[taxonomies.length]; - TermsEnum[] othertes = new TermsEnum[taxonomies.length]; - DocsEnum[] otherdocsEnum = new DocsEnum[taxonomies.length]; // just for reuse - for (int i=0; i0) { - // TODO: use a pq here - String first=null; - for (int i=0; i0) { - first = currentOthers[i]; - } - } - int comp = 0; - if (currentMain==null || (comp = currentMain.compareTo(first))>0) { - // If 'first' is before currentMain, or currentMain is null, - // then 'first' is a new category and we need to add it to the - // main taxonomy. Then for all taxonomies with this 'first' - // category, we need to add the new category number to their - // map, and move to the next category in all of them. + IndexReader r = DirectoryReader.open(taxoDir); + try { + final int size = r.numDocs(); + final OrdinalMap ordinalMap = map; + ordinalMap.setSize(size); + CategoryPath cp = new CategoryPath(); + Terms terms = MultiFields.getTerms(r, Consts.FULL); + TermsEnum te = terms.iterator(null); + Bits liveDocs = MultiFields.getLiveDocs(r); + DocsEnum docs = null; + // we call next() first, to skip the root category which always exists. + while (te.next() != null) { + String value = te.term().utf8ToString(); cp.clear(); - cp.add(first, delimiter); - // We can call internalAddCategory() instead of addCategory() - // because we know the category hasn't been seen yet. - int newordinal = internalAddCategory(cp, cp.length()); - // TODO (Facet): we already had this term in our hands before, in nextTE... - // // TODO (Facet): no need to make this term? 
- for (int i=0; i 0 */ { - // The currentMain doesn't appear in any of the other taxonomies - - // we don't need to do anything, just continue to the next one - currentMain = nextTE(mainte); + docs = te.docs(liveDocs, docs, false); + ordinalMap.addMapping(docs.nextDoc(), ordinal); } - } - - // Close all the readers we've opened, and also tell the ordinal maps - // we're done adding to them - mainreader.close(); - for (int i=0; i1) { - for (int i=0; i= copytr.getSize()); - } else { - assertEquals(copytr.getSize(), tr.getSize()); - } - for (int j=0; j copytr.getSize()) { - String prev = tr.getPath(copytr.getSize()).toString(); - for (int j=copytr.getSize()+1; j 0); + assertEquals(destOrdinal, map[j]); + } + } finally { + srcTR.close(); + } + } finally { + destTR.close(); + } + } + + public void testAddEmpty() throws Exception { + Directory dest = newDirectory(); + DirectoryTaxonomyWriter destTW = new DirectoryTaxonomyWriter(dest); + destTW.addCategory(new CategoryPath("Author", "Rob Pike")); + destTW.addCategory(new CategoryPath("Aardvarks", "Bob")); + destTW.commit(); + + Directory src = newDirectory(); + new DirectoryTaxonomyWriter(src).close(); // create an empty taxonomy + + OrdinalMap map = randomOrdinalMap(); + destTW.addTaxonomy(src, map); + destTW.close(); + + validate(dest, src, map); + + IOUtils.close(dest, src); + } + + public void testAddToEmpty() throws Exception { + Directory dest = newDirectory(); + + Directory src = newDirectory(); + DirectoryTaxonomyWriter srcTW = new DirectoryTaxonomyWriter(src); + srcTW.addCategory(new CategoryPath("Author", "Rob Pike")); + srcTW.addCategory(new CategoryPath("Aardvarks", "Bob")); + srcTW.close(); + + DirectoryTaxonomyWriter destTW = new DirectoryTaxonomyWriter(dest); + OrdinalMap map = randomOrdinalMap(); + destTW.addTaxonomy(src, map); + destTW.close(); + + validate(dest, src, map); + + IOUtils.close(dest, src); + } + + // A more comprehensive and big random test. 
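/*
 * A minimal sketch, with assumed glue code, of the addTaxonomy + OrdinalMap
 * cycle these tests drive: MemoryOrdinalMap is the in-memory OrdinalMap
 * implementation used in testConcurrency below, and getMap() is the
 * source-ordinal to destination-ordinal array consumed in TaxonomyMergeUtils
 * earlier in this patch. Illustrative only:
 *
 *   Directory src = newDirectory();
 *   DirectoryTaxonomyWriter srcTW = new DirectoryTaxonomyWriter(src);
 *   srcTW.addCategory(new CategoryPath("Author", "Mark Twain"));
 *   srcTW.close();
 *
 *   Directory dest = newDirectory();
 *   DirectoryTaxonomyWriter destTW = new DirectoryTaxonomyWriter(dest);
 *   OrdinalMap map = new MemoryOrdinalMap();
 *   destTW.addTaxonomy(src, map);   // adds only the categories missing from dest
 *   destTW.close();
 *
 *   int[] ordinals = map.getMap();  // ordinals[srcOrdinal] == destOrdinal
 */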
+ @Nightly + public void testBig() throws Exception { + dotest(200, 10000); + dotest(1000, 20000); + // really big + dotest(400000, 1000000); + } + + // a reasonable random test + public void testMedium() throws Exception { + Random random = random(); + int numTests = atLeast(3); + for (int i = 0; i < numTests; i++) { + dotest(_TestUtil.nextInt(random, 2, 100), + _TestUtil.nextInt(random, 100, 1000)); + } + } + + public void testSimple() throws Exception { + Directory dest = newDirectory(); + DirectoryTaxonomyWriter tw1 = new DirectoryTaxonomyWriter(dest); + tw1.addCategory(new CategoryPath("Author", "Mark Twain")); + tw1.addCategory(new CategoryPath("Animals", "Dog")); + tw1.addCategory(new CategoryPath("Author", "Rob Pike")); + + Directory src = newDirectory(); + DirectoryTaxonomyWriter tw2 = new DirectoryTaxonomyWriter(src); + tw2.addCategory(new CategoryPath("Author", "Rob Pike")); + tw2.addCategory(new CategoryPath("Aardvarks", "Bob")); + tw2.close(); + + OrdinalMap map = randomOrdinalMap(); + + tw1.addTaxonomy(src, map); + tw1.close(); + + validate(dest, src, map); + + IOUtils.close(dest, src); + } + + public void testConcurrency() throws Exception { + // tests that addTaxonomy and addCategory work in parallel + final int numCategories = atLeast(5000); + + // build an input taxonomy index + Directory src = newDirectory(); + DirectoryTaxonomyWriter tw = new DirectoryTaxonomyWriter(src); + for (int i = 0; i < numCategories; i++) { + tw.addCategory(new CategoryPath("a", Integer.toString(i))); + } + tw.close(); + + // now add the taxonomy to an empty taxonomy, while adding the categories + // again, in parallel -- in the end, no duplicate categories should exist. + Directory dest = newDirectory(); + final DirectoryTaxonomyWriter destTW = new DirectoryTaxonomyWriter(dest); + Thread t = new Thread() { + @Override + public void run() { + for (int i = 0; i < numCategories; i++) { + try { + destTW.addCategory(new CategoryPath("a", Integer.toString(i))); + } catch (IOException e) { + // shouldn't happen - if it does, let the test fail on uncaught exception. + throw new RuntimeException(e); + } + } + } + }; + t.start(); + + OrdinalMap map = new MemoryOrdinalMap(); + destTW.addTaxonomy(src, map); + t.join(); + destTW.close(); + + // now validate + + DirectoryTaxonomyReader dtr = new DirectoryTaxonomyReader(dest); + // +2 to account for the root category + "a" + assertEquals(numCategories + 2, dtr.getSize()); + HashSet categories = new HashSet(); + for (int i = 1; i < dtr.getSize(); i++) { + CategoryPath cat = dtr.getPath(i); + assertTrue("category " + cat + " already existed", categories.add(cat)); + } + dtr.close(); + + IOUtils.close(src, dest); + } + +} From 10de0207955c8c8edaac127c65213abdc70a7535 Mon Sep 17 00:00:00 2001 From: Uwe Schindler Date: Wed, 16 May 2012 09:55:44 +0000 Subject: [PATCH 02/47] LUCENE-4059: Improve ANT task prepare-webpages (used by documentation tasks) to correctly encode build file names as URIs for later processing by XSL git-svn-id: https://svn.apache.org/repos/asf/lucene/dev/trunk@1339097 13f79535-47bb-0310-9956-ffa450edef68 --- lucene/CHANGES.txt | 4 ++++ lucene/build.xml | 7 ++++++- 2 files changed, 10 insertions(+), 1 deletion(-) diff --git a/lucene/CHANGES.txt b/lucene/CHANGES.txt index 5d86c224963..c3127c169aa 100644 --- a/lucene/CHANGES.txt +++ b/lucene/CHANGES.txt @@ -995,6 +995,10 @@ Build * LUCENE-3286: Moved remainder of contrib/xml-query-parser to lucene/queryparser. 
Classes now found at org.apache.lucene.queryparser.xml.* +* LUCENE-4059: Improve ANT task prepare-webpages (used by documentation + tasks) to correctly encode build file names as URIs for later processing by + XSL. (Greg Bowyer, Uwe Schindler) + ======================= Lucene 3.6.0 ======================= Changes in backwards compatibility policy diff --git a/lucene/build.xml b/lucene/build.xml index 7e16b01354d..91d3d3ce84c 100644 --- a/lucene/build.xml +++ b/lucene/build.xml @@ -225,8 +225,13 @@ - + + + + self.addMappedName((new java.io.File(source)).toURI()); + + - - - - + + + + + diff --git a/solr/example/multicore/core0/conf/solrconfig.xml b/solr/example/multicore/core0/conf/solrconfig.xml index 81c52bbe88e..18d842b718a 100644 --- a/solr/example/multicore/core0/conf/solrconfig.xml +++ b/solr/example/multicore/core0/conf/solrconfig.xml @@ -29,7 +29,22 @@ ${solr.core0.data.dir:} - + + + ${solr.core0.data.dir:} + + + + + + + true + + + + diff --git a/solr/example/multicore/core1/conf/schema.xml b/solr/example/multicore/core1/conf/schema.xml index d02865df407..5a27d39df2d 100644 --- a/solr/example/multicore/core1/conf/schema.xml +++ b/solr/example/multicore/core1/conf/schema.xml @@ -19,14 +19,16 @@ + - - - - + + + + + diff --git a/solr/example/multicore/core1/conf/solrconfig.xml b/solr/example/multicore/core1/conf/solrconfig.xml index 73e816f00e6..7bc5a3ac6dd 100644 --- a/solr/example/multicore/core1/conf/solrconfig.xml +++ b/solr/example/multicore/core1/conf/solrconfig.xml @@ -29,7 +29,22 @@ ${solr.core1.data.dir:} - + + + ${solr.core1.data.dir:} + + + + + + + true + + + + From 8db469ef018fd7131a3dea6f94eb3c0ae57454d8 Mon Sep 17 00:00:00 2001 From: Erik Hatcher Date: Thu, 17 May 2012 17:59:42 +0000 Subject: [PATCH 22/47] Fix typo in defaultValue parameter name git-svn-id: https://svn.apache.org/repos/asf/lucene/dev/trunk@1339750 13f79535-47bb-0310-9956-ffa450edef68 --- .../apache/solr/response/transform/ValueAugmenterFactory.java | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/solr/core/src/java/org/apache/solr/response/transform/ValueAugmenterFactory.java b/solr/core/src/java/org/apache/solr/response/transform/ValueAugmenterFactory.java index a62e709f2d1..f0eeafbc4f7 100644 --- a/solr/core/src/java/org/apache/solr/response/transform/ValueAugmenterFactory.java +++ b/solr/core/src/java/org/apache/solr/response/transform/ValueAugmenterFactory.java @@ -37,7 +37,7 @@ public class ValueAugmenterFactory extends TransformerFactory public void init(NamedList args) { value = args.get( "value" ); if( value == null ) { - defaultValue = args.get( "deaultValue" ); + defaultValue = args.get( "defaultValue" ); } } From fc84112ece8e7306083283c7d3b099e97bdbcbfb Mon Sep 17 00:00:00 2001 From: Robert Muir Date: Thu, 17 May 2012 18:03:13 +0000 Subject: [PATCH 23/47] add hepburn test and fix some corner cases git-svn-id: https://svn.apache.org/repos/asf/lucene/dev/trunk@1339753 13f79535-47bb-0310-9956-ffa450edef68 --- .../lucene/analysis/ja/util/ToStringUtil.java | 69 ++++++++++++++-- .../analysis/ja/util/TestToStringUtil.java | 78 +++++++++++++++++++ 2 files changed, 142 insertions(+), 5 deletions(-) diff --git a/lucene/analysis/kuromoji/src/java/org/apache/lucene/analysis/ja/util/ToStringUtil.java b/lucene/analysis/kuromoji/src/java/org/apache/lucene/analysis/ja/util/ToStringUtil.java index c83de194d7a..977ab49f0e8 100644 --- a/lucene/analysis/kuromoji/src/java/org/apache/lucene/analysis/ja/util/ToStringUtil.java +++ 
b/lucene/analysis/kuromoji/src/java/org/apache/lucene/analysis/ja/util/ToStringUtil.java @@ -252,6 +252,8 @@ public class ToStringUtil { /** * Romanize katakana with modified hepburn */ + // TODO: now that this is used by readingsfilter and not just for + // debugging, fix this to really be a scheme that works best with IMEs public static void getRomanization(Appendable builder, CharSequence s) throws IOException { final int len = s.length(); for (int i = 0; i < len; i++) { @@ -522,6 +524,9 @@ public class ToStringUtil { if (ch2 == 'ウ') { builder.append("tō"); i++; + } else if (ch2 == 'ゥ') { + builder.append("tu"); + i++; } else { builder.append("to"); } @@ -665,7 +670,7 @@ public class ToStringUtil { builder.append("mu"); break; case 'メ': - builder.append("mi"); + builder.append("me"); break; case 'モ': if (ch2 == 'ウ') { @@ -690,7 +695,12 @@ public class ToStringUtil { } break; case 'ラ': - builder.append("ra"); + if (ch2 == '゜') { + builder.append("la"); + i++; + } else { + builder.append("ra"); + } break; case 'リ': if (ch2 == 'ョ' && ch3 == 'ウ') { @@ -711,20 +721,36 @@ public class ToStringUtil { } else if (ch2 == 'ェ') { builder.append("rye"); i++; + } else if (ch2 == '゜') { + builder.append("li"); + i++; } else { builder.append("ri"); } break; case 'ル': - builder.append("ru"); + if (ch2 == '゜') { + builder.append("lu"); + i++; + } else { + builder.append("ru"); + } break; case 'レ': - builder.append("re"); + if (ch2 == '゜') { + builder.append("le"); + i++; + } else { + builder.append("re"); + } break; case 'ロ': if (ch2 == 'ウ') { builder.append("rō"); i++; + } else if (ch2 == '゜') { + builder.append("lo"); + i++; } else { builder.append("ro"); } @@ -887,7 +913,28 @@ public class ToStringUtil { builder.append("da"); break; case 'ヂ': - builder.append("ji"); + // TODO: investigate all this + if (ch2 == 'ョ' && ch3 == 'ウ') { + builder.append("jō"); + i += 2; + } else if (ch2 == 'ュ' && ch3 == 'ウ') { + builder.append("jū"); + i += 2; + } else if (ch2 == 'ャ') { + builder.append("ja"); + i++; + } else if (ch2 == 'ョ') { + builder.append("jo"); + i++; + } else if (ch2 == 'ュ') { + builder.append("ju"); + i++; + } else if (ch2 == 'ェ') { + builder.append("je"); + i++; + } else { + builder.append("ji"); + } break; case 'ヅ': builder.append("zu"); @@ -994,6 +1041,18 @@ public class ToStringUtil { builder.append("po"); } break; + case 'ヷ': + builder.append("va"); + break; + case 'ヸ': + builder.append("vi"); + break; + case 'ヹ': + builder.append("ve"); + break; + case 'ヺ': + builder.append("vo"); + break; case 'ヴ': if (ch2 == 'ィ' && ch3 == 'ェ') { builder.append("vye"); diff --git a/lucene/analysis/kuromoji/src/test/org/apache/lucene/analysis/ja/util/TestToStringUtil.java b/lucene/analysis/kuromoji/src/test/org/apache/lucene/analysis/ja/util/TestToStringUtil.java index f95a527dcb9..a2388d7c03c 100644 --- a/lucene/analysis/kuromoji/src/test/org/apache/lucene/analysis/ja/util/TestToStringUtil.java +++ b/lucene/analysis/kuromoji/src/test/org/apache/lucene/analysis/ja/util/TestToStringUtil.java @@ -17,6 +17,9 @@ package org.apache.lucene.analysis.ja.util; * limitations under the License. 
*/ +import java.util.HashMap; +import java.util.Map; + import org.apache.lucene.util.LuceneTestCase; public class TestToStringUtil extends LuceneTestCase { @@ -31,4 +34,79 @@ public class TestToStringUtil extends LuceneTestCase { assertEquals("chashu", ToStringUtil.getRomanization("チャーシュー")); assertEquals("shumai", ToStringUtil.getRomanization("シューマイ")); } + + // see http://en.wikipedia.org/wiki/Hepburn_romanization, + // but this isnt even thorough or really probably what we want! + public void testHepburnTable() { + Map table = new HashMap() {{ + put("ア", "a"); put("イ", "i"); put("ウ", "u"); put("エ", "e"); put("オ", "o"); + put("カ", "ka"); put("キ", "ki"); put("ク", "ku"); put("ケ", "ke"); put("コ", "ko"); + put("サ", "sa"); put("シ", "shi"); put("ス", "su"); put("セ", "se"); put("ソ", "so"); + put("タ", "ta"); put("チ", "chi"); put("ツ", "tsu"); put("テ", "te"); put("ト", "to"); + put("ナ", "na"); put("ニ", "ni"); put("ヌ", "nu"); put("ネ", "ne"); put("ノ", "no"); + put("ハ", "ha"); put("ヒ", "hi"); put("フ", "fu"); put("ヘ", "he"); put("ホ", "ho"); + put("マ", "ma"); put("ミ", "mi"); put("ム", "mu"); put("メ", "me"); put("モ", "mo"); + put("ヤ", "ya"); put("ユ", "yu"); put("ヨ", "yo"); + put("ラ", "ra"); put("リ", "ri"); put("ル", "ru"); put("レ", "re"); put("ロ", "ro"); + put("ワ", "wa"); put("ヰ", "i"); put("ヱ", "e"); put("ヲ", "o"); + put("ン", "n"); + put("ガ", "ga"); put("ギ", "gi"); put("グ", "gu"); put("ゲ", "ge"); put("ゴ", "go"); + put("ザ", "za"); put("ジ", "ji"); put("ズ", "zu"); put("ゼ", "ze"); put("ゾ", "zo"); + put("ダ", "da"); put("ヂ", "ji"); put("ヅ", "zu"); put("デ", "de"); put("ド", "do"); + put("バ", "ba"); put("ビ", "bi"); put("ブ", "bu"); put("ベ", "be"); put("ボ", "bo"); + put("パ", "pa"); put("ピ", "pi"); put("プ", "pu"); put("ペ", "pe"); put("ポ", "po"); + + put("キャ", "kya"); put("キュ", "kyu"); put("キョ", "kyo"); + put("シャ", "sha"); put("シュ", "shu"); put("ショ", "sho"); + put("チャ", "cha"); put("チュ", "chu"); put("チョ", "cho"); + put("ニャ", "nya"); put("ニュ", "nyu"); put("ニョ", "nyo"); + put("ヒャ", "hya"); put("ヒュ", "hyu"); put("ヒョ", "hyo"); + put("ミャ", "mya"); put("ミュ", "myu"); put("ミョ", "myo"); + put("リャ", "rya"); put("リュ", "ryu"); put("リョ", "ryo"); + put("ギャ", "gya"); put("ギュ", "gyu"); put("ギョ", "gyo"); + put("ジャ", "ja"); put("ジュ", "ju"); put("ジョ", "jo"); + put("ヂャ", "ja"); put("ヂュ", "ju"); put("ヂョ", "jo"); + put("ビャ", "bya"); put("ビュ", "byu"); put("ビョ", "byo"); + put("ピャ", "pya"); put("ピュ", "pyu"); put("ピョ", "pyo"); + + put("イィ", "yi"); put("イェ", "ye"); + put("ウァ", "wa"); put("ウィ", "wi"); put("ウゥ", "wu"); put("ウェ", "we"); put("ウォ", "wo"); + put("ウュ", "wyu"); + // TODO: really should be vu + put("ヴァ", "va"); put("ヴィ", "vi"); put("ヴ", "v"); put("ヴェ", "ve"); put("ヴォ", "vo"); + put("ヴャ", "vya"); put("ヴュ", "vyu"); put("ヴィェ", "vye"); put("ヴョ", "vyo"); + put("キェ", "kye"); + put("ギェ", "gye"); + put("クァ", "kwa"); put("クィ", "kwi"); put("クェ", "kwe"); put("クォ", "kwo"); + put("クヮ", "kwa"); + put("グァ", "gwa"); put("グィ", "gwi"); put("グェ", "gwe"); put("グォ", "gwo"); + put("グヮ", "gwa"); + put("シェ", "she"); + put("ジェ", "je"); + put("スィ", "si"); + put("ズィ", "zi"); + put("チェ", "che"); + put("ツァ", "tsa"); put("ツィ", "tsi"); put("ツェ", "tse"); put("ツォ", "tso"); + put("ツュ", "tsyu"); + put("ティ", "ti"); put("トゥ", "tu"); + put("テュ", "tyu"); + put("ディ", "di"); put("ドゥ", "du"); + put("デュ", "dyu"); + put("ニェ", "nye"); + put("ヒェ", "hye"); + put("ビェ", "bye"); + put("ピェ", "pye"); + put("ファ", "fa"); put("フィ", "fi"); put("フェ", "fe"); put("フォ", "fo"); + put("フャ", "fya"); put("フュ", "fyu"); put("フィェ", "fye"); put("フョ", "fyo"); + put("ホゥ", "hu"); + put("ミェ", "mye"); + 
put("リェ", "rye"); + put("ラ゜", "la"); put("リ゜", "li"); put("ル゜", "lu"); put("レ゜", "le"); put("ロ゜", "lo"); + put("ヷ", "va"); put("ヸ", "vi"); put("ヹ", "ve"); put("ヺ", "vo"); + }}; + + for (String s : table.keySet()) { + assertEquals(s, table.get(s), ToStringUtil.getRomanization(s)); + } + } } From 28b1e9e4edcdb5600f8368847d7a228445d6a94f Mon Sep 17 00:00:00 2001 From: Simon Willnauer Date: Thu, 17 May 2012 18:33:15 +0000 Subject: [PATCH 24/47] LUCENE-4066: compare actual # terms in the queue instead of unique terms git-svn-id: https://svn.apache.org/repos/asf/lucene/dev/trunk@1339779 13f79535-47bb-0310-9956-ffa450edef68 --- .../org/apache/lucene/index/TestDocumentsWriterDeleteQueue.java | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/lucene/core/src/test/org/apache/lucene/index/TestDocumentsWriterDeleteQueue.java b/lucene/core/src/test/org/apache/lucene/index/TestDocumentsWriterDeleteQueue.java index ba43d4d842e..a2903cf2265 100644 --- a/lucene/core/src/test/org/apache/lucene/index/TestDocumentsWriterDeleteQueue.java +++ b/lucene/core/src/test/org/apache/lucene/index/TestDocumentsWriterDeleteQueue.java @@ -68,7 +68,7 @@ public class TestDocumentsWriterDeleteQueue extends LuceneTestCase { assertAllBetween(last2, j, bd2, ids); last2 = j + 1; } - assertEquals(uniqueValues.size(), queue.numGlobalTermDeletes()); + assertEquals(j+1, queue.numGlobalTermDeletes()); } assertEquals(uniqueValues, bd1.terms.keySet()); assertEquals(uniqueValues, bd2.terms.keySet()); From a137d089c8fee227d2a350037c8a3b0296fb6f70 Mon Sep 17 00:00:00 2001 From: Erik Hatcher Date: Thu, 17 May 2012 18:34:04 +0000 Subject: [PATCH 25/47] Update clustering /browse UI to reflect long past change with Carrot dependencies that used to require a system property switch to enable git-svn-id: https://svn.apache.org/repos/asf/lucene/dev/trunk@1339781 13f79535-47bb-0310-9956-ffa450edef68 --- solr/example/solr/conf/solrconfig.xml | 8 +------- solr/example/solr/conf/velocity/cluster.vm | 2 +- 2 files changed, 2 insertions(+), 8 deletions(-) diff --git a/solr/example/solr/conf/solrconfig.xml b/solr/example/solr/conf/solrconfig.xml index 787b078c119..5f66ae8bc60 100755 --- a/solr/example/solr/conf/solrconfig.xml +++ b/solr/example/solr/conf/solrconfig.xml @@ -1261,13 +1261,8 @@ http://wiki.apache.org/solr/ClusteringComponent - You'll need to set the solr.cluster.enabled system property - when running solr to run with clustering enabled: - - java -Dsolr.clustering.enabled=true -jar start.jar --> - @@ -1333,7 +1328,6 @@ --> true diff --git a/solr/example/solr/conf/velocity/cluster.vm b/solr/example/solr/conf/velocity/cluster.vm index ab2f0e458eb..c798e6a8d12 100644 --- a/solr/example/solr/conf/velocity/cluster.vm +++ b/solr/example/solr/conf/velocity/cluster.vm @@ -1,6 +1,6 @@

Clusters

- Run Solr with java -Dsolr.clustering.enabled=true -jar start.jar to see results + Loading clusters...
+ diff --git a/solr/example/solr/conf/velocity/header.vm b/solr/example/solr/conf/velocity/header.vm index 2eb80782fb0..46f0bab7d43 100644 --- a/solr/example/solr/conf/velocity/header.vm +++ b/solr/example/solr/conf/velocity/header.vm @@ -1,3 +1,3 @@ \ No newline at end of file From 6248459183c97eb4c49b0082a7ea6bf1875fc176 Mon Sep 17 00:00:00 2001 From: Dawid Weiss Date: Fri, 18 May 2012 07:53:33 +0000 Subject: [PATCH 29/47] LUCENE-4054: nested suite classes (required for tests) should not run in stand-alone mode. git-svn-id: https://svn.apache.org/repos/asf/lucene/dev/trunk@1340021 13f79535-47bb-0310-9956-ffa450edef68 --- .../junitcompat/TestReproduceMessage.java | 12 +--- .../util/junitcompat/WithNestedTests.java | 36 ++++------ .../apache/lucene/util/LuceneTestCase.java | 3 +- .../lucene/util/TestRuleIgnoreTestSuites.java | 67 +++++++++++++++++++ 4 files changed, 85 insertions(+), 33 deletions(-) create mode 100644 lucene/test-framework/src/java/org/apache/lucene/util/TestRuleIgnoreTestSuites.java diff --git a/lucene/core/src/test/org/apache/lucene/util/junitcompat/TestReproduceMessage.java b/lucene/core/src/test/org/apache/lucene/util/junitcompat/TestReproduceMessage.java index a7e79ae2684..7df711f9670 100644 --- a/lucene/core/src/test/org/apache/lucene/util/junitcompat/TestReproduceMessage.java +++ b/lucene/core/src/test/org/apache/lucene/util/junitcompat/TestReproduceMessage.java @@ -53,9 +53,7 @@ public class TestReproduceMessage extends WithNestedTests { public Statement apply(final Statement base, Description description) { return new Statement() { public void evaluate() throws Throwable { - if (isRunningNested()) { - triggerOn(SorePoint.RULE); - } + triggerOn(SorePoint.RULE); base.evaluate(); } }; @@ -69,9 +67,7 @@ public class TestReproduceMessage extends WithNestedTests { @Before public void before() { - if (isRunningNested()) { - triggerOn(SorePoint.BEFORE); - } + triggerOn(SorePoint.BEFORE); } @Test @@ -81,9 +77,7 @@ public class TestReproduceMessage extends WithNestedTests { @After public void after() { - if (isRunningNested()) { - triggerOn(SorePoint.AFTER); - } + triggerOn(SorePoint.AFTER); } @AfterClass diff --git a/lucene/core/src/test/org/apache/lucene/util/junitcompat/WithNestedTests.java b/lucene/core/src/test/org/apache/lucene/util/junitcompat/WithNestedTests.java index af844ee9f82..adf0f94f735 100644 --- a/lucene/core/src/test/org/apache/lucene/util/junitcompat/WithNestedTests.java +++ b/lucene/core/src/test/org/apache/lucene/util/junitcompat/WithNestedTests.java @@ -22,15 +22,18 @@ import java.io.PrintStream; import java.io.UnsupportedEncodingException; import org.apache.lucene.util.LuceneTestCase; +import org.apache.lucene.util.TestRuleIgnoreTestSuites; import org.junit.After; import org.junit.Assert; import org.junit.Before; import org.junit.ClassRule; +import org.junit.Rule; import org.junit.rules.TestRule; import org.junit.runner.Description; import org.junit.runners.model.Statement; import com.carrotsearch.randomizedtesting.RandomizedRunner; +import com.carrotsearch.randomizedtesting.rules.SystemPropertiesRestoreRule; /** * An abstract test class that prepares nested test classes to run. @@ -45,28 +48,11 @@ import com.carrotsearch.randomizedtesting.RandomizedRunner; * cause havoc (static fields). */ public abstract class WithNestedTests { - /** - * This can no longer be thread local because {@link RandomizedRunner} runs - * suites in an isolated threadgroup/thread. 
- */ - public static volatile boolean runsAsNested; - - public static abstract class AbstractNestedTest extends LuceneTestCase { - @ClassRule - public static TestRule ignoreIfRunAsStandalone = new TestRule() { - public Statement apply(final Statement s, Description arg1) { - return new Statement() { - public void evaluate() throws Throwable { - if (isRunningNested()) { - s.evaluate(); - } - } - }; - } - }; + public static abstract class AbstractNestedTest extends LuceneTestCase + implements TestRuleIgnoreTestSuites.NestedTestSuite { protected static boolean isRunningNested() { - return runsAsNested; + return TestRuleIgnoreTestSuites.isRunningNested(); } } @@ -81,6 +67,12 @@ public abstract class WithNestedTests { private ByteArrayOutputStream sysout; private ByteArrayOutputStream syserr; + /** + * Restore properties after test. + */ + @Rule + public SystemPropertiesRestoreRule restoreProperties = new SystemPropertiesRestoreRule(); + @Before public final void before() { if (suppressOutputStreams) { @@ -97,13 +89,11 @@ public abstract class WithNestedTests { } } - runsAsNested = true; + System.setProperty(TestRuleIgnoreTestSuites.PROPERTY_RUN_NESTED, "true"); } @After public final void after() { - runsAsNested = false; - if (suppressOutputStreams) { System.out.flush(); System.err.flush(); diff --git a/lucene/test-framework/src/java/org/apache/lucene/util/LuceneTestCase.java b/lucene/test-framework/src/java/org/apache/lucene/util/LuceneTestCase.java index 943bd6820c8..7dbb7386d44 100644 --- a/lucene/test-framework/src/java/org/apache/lucene/util/LuceneTestCase.java +++ b/lucene/test-framework/src/java/org/apache/lucene/util/LuceneTestCase.java @@ -291,7 +291,8 @@ public abstract class LuceneTestCase extends Assert { */ @ClassRule public static TestRule classRules = RuleChain - .outerRule(suiteFailureMarker = new TestRuleMarkFailure()) + .outerRule(new TestRuleIgnoreTestSuites()) + .around(suiteFailureMarker = new TestRuleMarkFailure()) .around(new TestRuleAssertionsRequired()) .around(new TestRuleNoStaticHooksShadowing()) .around(new TestRuleNoInstanceHooksOverrides()) diff --git a/lucene/test-framework/src/java/org/apache/lucene/util/TestRuleIgnoreTestSuites.java b/lucene/test-framework/src/java/org/apache/lucene/util/TestRuleIgnoreTestSuites.java new file mode 100644 index 00000000000..58fa30cad1f --- /dev/null +++ b/lucene/test-framework/src/java/org/apache/lucene/util/TestRuleIgnoreTestSuites.java @@ -0,0 +1,67 @@ +package org.apache.lucene.util; + +import org.junit.Assume; +import org.junit.rules.TestRule; +import org.junit.runner.Description; +import org.junit.runners.model.Statement; + +/** + * Licensed to the Apache Software Foundation (ASF) under one or more + * contributor license agreements. See the NOTICE file distributed with + * this work for additional information regarding copyright ownership. + * The ASF licenses this file to You under the Apache License, Version 2.0 + * (the "License"); you may not use this file except in compliance with + * the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. 
+ */ + +/** + * This rule will cause the suite to be assumption-ignored if + * the test class implements a given marker interface and a special + * property is not set. + * + *

This is a workaround for problems with certain JUnit containers (IntelliJ) + * which automatically discover test suites and attempt to run nested classes + * that we use for testing the test framework itself. + */ +public final class TestRuleIgnoreTestSuites implements TestRule { + /** + * Marker interface for nested suites that should be ignored + * if executed in stand-alone mode. + */ + public static interface NestedTestSuite {} + + /** + * A boolean system property indicating nested suites should be executed + * normally. + */ + public final static String PROPERTY_RUN_NESTED = "tests.runnested"; + + @Override + public Statement apply(final Statement s, final Description d) { + return new Statement() { + @Override + public void evaluate() throws Throwable { + if (NestedTestSuite.class.isAssignableFrom(d.getTestClass())) { + LuceneTestCase.assumeTrue("Nested suite class ignored (started as stand-alone).", + isRunningNested()); + } + s.evaluate(); + } + }; + } + + /** + * Check if a suite class is running as a nested test. + */ + public static boolean isRunningNested() { + return Boolean.getBoolean(PROPERTY_RUN_NESTED); + } +} From 0b1d814c94f05c0bfdbec074946dcf2465a3ff28 Mon Sep 17 00:00:00 2001 From: Martijn van Groningen Date: Fri, 18 May 2012 12:28:21 +0000 Subject: [PATCH 30/47] SOLR-3454: Exception when using result grouping with main=true and using wt=javabin git-svn-id: https://svn.apache.org/repos/asf/lucene/dev/trunk@1340080 13f79535-47bb-0310-9956-ffa450edef68 --- solr/CHANGES.txt | 3 + .../java/org/apache/solr/search/Grouping.java | 2 +- .../org/apache/solr/TestGroupingSearch.java | 139 +++++++++++------- 3 files changed, 93 insertions(+), 51 deletions(-) diff --git a/solr/CHANGES.txt b/solr/CHANGES.txt index c796893b578..f9ce07b8939 100644 --- a/solr/CHANGES.txt +++ b/solr/CHANGES.txt @@ -425,6 +425,9 @@ Bug Fixes * SOLR-3436: Group count incorrect when not all shards are queried in the second pass. (Francois Perron, Martijn van Groningen) +* SOLR-3454: Exception when using result grouping with main=true and using + wt=javabin. (Ludovic Boutros, Martijn van Groningen) + Other Changes ---------------------- diff --git a/solr/core/src/java/org/apache/solr/search/Grouping.java b/solr/core/src/java/org/apache/solr/search/Grouping.java index a9e64e4bb94..54ec934b6b4 100755 --- a/solr/core/src/java/org/apache/solr/search/Grouping.java +++ b/solr/core/src/java/org/apache/solr/search/Grouping.java @@ -651,7 +651,7 @@ public class Grouping { } } - int len = docsGathered - offset; + int len = docsGathered > offset ? 
docsGathered - offset : 0; int[] docs = ArrayUtils.toPrimitive(ids.toArray(new Integer[ids.size()])); float[] docScores = ArrayUtils.toPrimitive(scores.toArray(new Float[scores.size()])); DocSlice docSlice = new DocSlice(offset, len, docs, docScores, getMatches(), maxScore); diff --git a/solr/core/src/test/org/apache/solr/TestGroupingSearch.java b/solr/core/src/test/org/apache/solr/TestGroupingSearch.java index 402aa0c0124..72a1de30f8d 100644 --- a/solr/core/src/test/org/apache/solr/TestGroupingSearch.java +++ b/solr/core/src/test/org/apache/solr/TestGroupingSearch.java @@ -20,13 +20,21 @@ package org.apache.solr; import org.apache.lucene.search.FieldCache; import org.apache.noggit.JSONUtil; import org.apache.noggit.ObjectBuilder; +import org.apache.solr.client.solrj.impl.BinaryResponseParser; +import org.apache.solr.common.params.CommonParams; import org.apache.solr.common.params.GroupParams; import org.apache.solr.request.SolrQueryRequest; +import org.apache.solr.request.SolrRequestInfo; +import org.apache.solr.response.BinaryResponseWriter; +import org.apache.solr.response.ResultContext; +import org.apache.solr.response.SolrQueryResponse; import org.apache.solr.schema.IndexSchema; import org.junit.Before; import org.junit.BeforeClass; import org.junit.Test; +import java.io.ByteArrayInputStream; +import java.io.ByteArrayOutputStream; import java.util.*; public class TestGroupingSearch extends SolrTestCaseJ4 { @@ -37,7 +45,7 @@ public class TestGroupingSearch extends SolrTestCaseJ4 { @BeforeClass public static void beforeTests() throws Exception { - initCore("solrconfig.xml","schema12.xml"); + initCore("solrconfig.xml", "schema12.xml"); } @Before @@ -75,18 +83,18 @@ public class TestGroupingSearch extends SolrTestCaseJ4 { ,"//arr[@name='groups']/lst[3]/result/doc/*[@name='id'][.='5']" ); - assertQ(req("q","title:title", "group", "true", "group.field","group_si") - ,"//lst[@name='grouped']/lst[@name='group_si']" - ,"*[count(//arr[@name='groups']/lst) = 2]" + assertQ(req("q", "title:title", "group", "true", "group.field", "group_si") + , "//lst[@name='grouped']/lst[@name='group_si']" + , "*[count(//arr[@name='groups']/lst) = 2]" - ,"//arr[@name='groups']/lst[1]/int[@name='groupValue'][.='2']" - ,"//arr[@name='groups']/lst[1]/result[@numFound='2']" - ,"//arr[@name='groups']/lst[1]/result/doc/*[@name='id'][.='4']" + , "//arr[@name='groups']/lst[1]/int[@name='groupValue'][.='2']" + , "//arr[@name='groups']/lst[1]/result[@numFound='2']" + , "//arr[@name='groups']/lst[1]/result/doc/*[@name='id'][.='4']" - ,"//arr[@name='groups']/lst[2]/int[@name='groupValue'][.='1']" - ,"//arr[@name='groups']/lst[2]/result[@numFound='3']" - ,"//arr[@name='groups']/lst[2]/result/doc/*[@name='id'][.='5']" - ); + , "//arr[@name='groups']/lst[2]/int[@name='groupValue'][.='1']" + , "//arr[@name='groups']/lst[2]/result[@numFound='3']" + , "//arr[@name='groups']/lst[2]/result/doc/*[@name='id'][.='5']" + ); } @Test @@ -117,19 +125,19 @@ public class TestGroupingSearch extends SolrTestCaseJ4 { ,"//arr[@name='groups']/lst[3]/result/doc/*[@name='id'][.='5']" ); - assertQ(req("q","title:title", "group", "true", "group.field","group_si", "group.ngroups", "true") - ,"//lst[@name='grouped']/lst[@name='group_si']/int[@name='matches'][.='5']" - ,"//lst[@name='grouped']/lst[@name='group_si']/int[@name='ngroups'][.='2']" - ,"*[count(//arr[@name='groups']/lst) = 2]" + assertQ(req("q", "title:title", "group", "true", "group.field", "group_si", "group.ngroups", "true") + , 
"//lst[@name='grouped']/lst[@name='group_si']/int[@name='matches'][.='5']" + , "//lst[@name='grouped']/lst[@name='group_si']/int[@name='ngroups'][.='2']" + , "*[count(//arr[@name='groups']/lst) = 2]" - ,"//arr[@name='groups']/lst[1]/int[@name='groupValue'][.='2']" - ,"//arr[@name='groups']/lst[1]/result[@numFound='2']" - ,"//arr[@name='groups']/lst[1]/result/doc/*[@name='id'][.='4']" + , "//arr[@name='groups']/lst[1]/int[@name='groupValue'][.='2']" + , "//arr[@name='groups']/lst[1]/result[@numFound='2']" + , "//arr[@name='groups']/lst[1]/result/doc/*[@name='id'][.='4']" - ,"//arr[@name='groups']/lst[2]/int[@name='groupValue'][.='1']" - ,"//arr[@name='groups']/lst[2]/result[@numFound='3']" - ,"//arr[@name='groups']/lst[2]/result/doc/*[@name='id'][.='5']" - ); + , "//arr[@name='groups']/lst[2]/int[@name='groupValue'][.='1']" + , "//arr[@name='groups']/lst[2]/result[@numFound='3']" + , "//arr[@name='groups']/lst[2]/result/doc/*[@name='id'][.='5']" + ); } @Test @@ -141,22 +149,22 @@ public class TestGroupingSearch extends SolrTestCaseJ4 { assertU(add(doc("id", "5","name", "author3", "title", "the title of a title"))); assertU(commit()); - assertQ(req("q","title:title", "group", "true", "group.field","name", "sort", "score desc", "group.sort", "score desc") - ,"//arr[@name='groups']/lst[1]/str[@name='groupValue'][.='author2']" - // ,"//arr[@name='groups']/lst[1]/int[@name='matches'][.='2']" - ,"//arr[@name='groups']/lst[1]/result[@numFound='2']" - ,"//arr[@name='groups']/lst[1]/result/doc/*[@name='id'][.='4']" + assertQ(req("q", "title:title", "group", "true", "group.field", "name", "sort", "score desc", "group.sort", "score desc") + , "//arr[@name='groups']/lst[1]/str[@name='groupValue'][.='author2']" + // ,"//arr[@name='groups']/lst[1]/int[@name='matches'][.='2']" + , "//arr[@name='groups']/lst[1]/result[@numFound='2']" + , "//arr[@name='groups']/lst[1]/result/doc/*[@name='id'][.='4']" - ,"//arr[@name='groups']/lst[2]/str[@name='groupValue'][.='author1']" - // ,"//arr[@name='groups']/lst[2]/int[@name='matches'][.='2']" - ,"//arr[@name='groups']/lst[2]/result[@numFound='2']" - ,"//arr[@name='groups']/lst[2]/result/doc/*[@name='id'][.='2']" + , "//arr[@name='groups']/lst[2]/str[@name='groupValue'][.='author1']" + // ,"//arr[@name='groups']/lst[2]/int[@name='matches'][.='2']" + , "//arr[@name='groups']/lst[2]/result[@numFound='2']" + , "//arr[@name='groups']/lst[2]/result/doc/*[@name='id'][.='2']" - ,"//arr[@name='groups']/lst[3]/str[@name='groupValue'][.='author3']" - // ,"//arr[@name='groups']/lst[3]/int[@name='matches'][.='1']" - ,"//arr[@name='groups']/lst[3]/result[@numFound='1']" - ,"//arr[@name='groups']/lst[3]/result/doc/*[@name='id'][.='5']" - ); + , "//arr[@name='groups']/lst[3]/str[@name='groupValue'][.='author3']" + // ,"//arr[@name='groups']/lst[3]/int[@name='matches'][.='1']" + , "//arr[@name='groups']/lst[3]/result[@numFound='1']" + , "//arr[@name='groups']/lst[3]/result/doc/*[@name='id'][.='5']" + ); } @@ -168,18 +176,18 @@ public class TestGroupingSearch extends SolrTestCaseJ4 { assertU(add(doc("id", "4","name", "author2", "weight", "0.11"))); assertU(commit()); - assertQ(req("q","*:*", "group", "true", "group.field","name", "sort", "id asc", "group.sort", "weight desc") - ,"*[count(//arr[@name='groups']/lst) = 2]" - ,"//arr[@name='groups']/lst[1]/str[@name='groupValue'][.='author1']" - // ,"//arr[@name='groups']/lst[1]/int[@name='matches'][.='2']" - ,"//arr[@name='groups']/lst[1]/result[@numFound='2']" - ,"//arr[@name='groups']/lst[1]/result/doc/*[@name='id'][.='1']" + 
assertQ(req("q", "*:*", "group", "true", "group.field", "name", "sort", "id asc", "group.sort", "weight desc") + , "*[count(//arr[@name='groups']/lst) = 2]" + , "//arr[@name='groups']/lst[1]/str[@name='groupValue'][.='author1']" + // ,"//arr[@name='groups']/lst[1]/int[@name='matches'][.='2']" + , "//arr[@name='groups']/lst[1]/result[@numFound='2']" + , "//arr[@name='groups']/lst[1]/result/doc/*[@name='id'][.='1']" - ,"//arr[@name='groups']/lst[2]/str[@name='groupValue'][.='author2']" - // ,"//arr[@name='groups']/lst[2]/int[@name='matches'][.='2']" - ,"//arr[@name='groups']/lst[2]/result[@numFound='2']" - ,"//arr[@name='groups']/lst[2]/result/doc/*[@name='id'][.='4']" - ); + , "//arr[@name='groups']/lst[2]/str[@name='groupValue'][.='author2']" + // ,"//arr[@name='groups']/lst[2]/int[@name='matches'][.='2']" + , "//arr[@name='groups']/lst[2]/result[@numFound='2']" + , "//arr[@name='groups']/lst[2]/result/doc/*[@name='id'][.='4']" + ); } @Test @@ -214,6 +222,37 @@ public class TestGroupingSearch extends SolrTestCaseJ4 { ); } + @Test + public void testGroupingSimpleFormatArrayIndexOutOfBoundsExceptionWithJavaBin() throws Exception { + assertU(add(doc("id", "1", "nullfirst", "1"))); + assertU(add(doc("id", "2", "nullfirst", "1"))); + assertU(add(doc("id", "3", "nullfirst", "2"))); + assertU(add(doc("id", "4", "nullfirst", "2"))); + assertU(add(doc("id", "5", "nullfirst", "2"))); + assertU(add(doc("id", "6", "nullfirst", "3"))); + assertU(commit()); + + SolrQueryRequest request = + req("q", "*:*","group", "true", "group.field", "nullfirst", "group.main", "true", "wt", "javabin", "start", "4", "rows", "10"); + + SolrQueryResponse response = new SolrQueryResponse(); + ByteArrayOutputStream out = new ByteArrayOutputStream(); + try { + SolrRequestInfo.setRequestInfo(new SolrRequestInfo(request, response)); + String handlerName = request.getParams().get(CommonParams.QT); + h.getCore().execute(h.getCore().getRequestHandler(handlerName), request, response); + BinaryResponseWriter responseWriter = new BinaryResponseWriter(); + responseWriter.write(out, request, response); + } finally { + request.close(); + SolrRequestInfo.clearRequestInfo(); + } + + assertEquals(6, ((ResultContext) response.getValues().get("response")).docs.matches()); + new BinaryResponseParser().processResponse(new ByteArrayInputStream(out.toByteArray()), ""); + out.close(); + } + @Test public void testGroupingWithTimeAllowed() throws Exception { assertU(add(doc("id", "1"))); @@ -530,9 +569,9 @@ public class TestGroupingSearch extends SolrTestCaseJ4 { ); ///////////////////////// group.format == simple - assertJQ(req("fq",filt, "q","{!func}"+f2, "group","true", "group.field",f, "fl","id", "rows","3", "start","1", "group.limit","2", "group.format","simple") - , "/grouped/foo_i=={'matches':10,'doclist':" - +"{'numFound':10,'start':1,'docs':[{'id':'10'},{'id':'3'},{'id':'6'}]}}" + assertJQ(req("fq", filt, "q", "{!func}" + f2, "group", "true", "group.field", f, "fl", "id", "rows", "3", "start", "1", "group.limit", "2", "group.format", "simple") + , "/grouped/foo_i=={'matches':10,'doclist':" + + "{'numFound':10,'start':1,'docs':[{'id':'10'},{'id':'3'},{'id':'6'}]}}" ); } From 5efed3447ef7ffc65b7c33db6992e236311fb340 Mon Sep 17 00:00:00 2001 From: Steven Rowe Date: Fri, 18 May 2012 16:58:38 +0000 Subject: [PATCH 31/47] LUCENE-3983: HTMLStripCharFilter: Stop upcasing HTML character entity names at class initialization time; instead, provide hard-coded upcased versions for a small set of them. 
git-svn-id: https://svn.apache.org/repos/asf/lucene/dev/trunk@1340169 13f79535-47bb-0310-9956-ffa450edef68 --- .../charfilter/HTMLCharacterEntities.jflex | 17 +++++++++--- .../charfilter/HTMLStripCharFilter.java | 26 +++++++++++++------ .../charfilter/HTMLStripCharFilter.jflex | 3 ++- .../lucene/analysis/charfilter/htmlentity.py | 17 +++++++++--- 4 files changed, 46 insertions(+), 17 deletions(-) diff --git a/lucene/analysis/common/src/java/org/apache/lucene/analysis/charfilter/HTMLCharacterEntities.jflex b/lucene/analysis/common/src/java/org/apache/lucene/analysis/charfilter/HTMLCharacterEntities.jflex index b4f73a61411..a32e1480828 100644 --- a/lucene/analysis/common/src/java/org/apache/lucene/analysis/charfilter/HTMLCharacterEntities.jflex +++ b/lucene/analysis/common/src/java/org/apache/lucene/analysis/charfilter/HTMLCharacterEntities.jflex @@ -62,8 +62,16 @@ CharacterEntities = ( "AElig" | "Aacute" | "Acirc" | "Agrave" | "Alpha" | "weierp" | "xi" | "yacute" | "yen" | "yuml" | "zeta" | "zwj" | "zwnj" ) %{ - private static final Set upperCaseVariantsAccepted - = new HashSet(Arrays.asList("quot","copy","gt","lt","reg","amp")); + private static final Map upperCaseVariantsAccepted + = new HashMap(); + static { + upperCaseVariantsAccepted.put("quot", "QUOT"); + upperCaseVariantsAccepted.put("copy", "COPY"); + upperCaseVariantsAccepted.put("gt", "GT"); + upperCaseVariantsAccepted.put("lt", "LT"); + upperCaseVariantsAccepted.put("reg", "REG"); + upperCaseVariantsAccepted.put("amp", "AMP"); + } private static final CharArrayMap entityValues = new CharArrayMap(Version.LUCENE_40, 253, false); static { @@ -145,8 +153,9 @@ CharacterEntities = ( "AElig" | "Aacute" | "Acirc" | "Agrave" | "Alpha" for (int i = 0 ; i < entities.length ; i += 2) { Character value = entities[i + 1].charAt(0); entityValues.put(entities[i], value); - if (upperCaseVariantsAccepted.contains(entities[i])) { - entityValues.put(entities[i].toUpperCase(), value); + String upperCaseVariant = upperCaseVariantsAccepted.get(entities[i]); + if (upperCaseVariant != null) { + entityValues.put(upperCaseVariant, value); } } } diff --git a/lucene/analysis/common/src/java/org/apache/lucene/analysis/charfilter/HTMLStripCharFilter.java b/lucene/analysis/common/src/java/org/apache/lucene/analysis/charfilter/HTMLStripCharFilter.java index 949110284e9..2b83aa017e4 100644 --- a/lucene/analysis/common/src/java/org/apache/lucene/analysis/charfilter/HTMLStripCharFilter.java +++ b/lucene/analysis/common/src/java/org/apache/lucene/analysis/charfilter/HTMLStripCharFilter.java @@ -1,4 +1,4 @@ -/* The following code was generated by JFlex 1.5.0-SNAPSHOT on 3/24/12 4:50 PM */ +/* The following code was generated by JFlex 1.5.0-SNAPSHOT on 5/18/12 12:24 PM */ package org.apache.lucene.analysis.charfilter; @@ -21,7 +21,8 @@ package org.apache.lucene.analysis.charfilter; import java.io.IOException; import java.util.Arrays; -import java.util.HashSet; +import java.util.HashMap; +import java.util.Map; import java.util.Set; import org.apache.lucene.util.Version; @@ -39,8 +40,8 @@ import org.apache.lucene.analysis.util.OpenStringBuilder; /** * This class is a scanner generated by * JFlex 1.5.0-SNAPSHOT - * on 3/24/12 4:50 PM from the specification file - * C:/cygwin/home/s/svn/lucene/dev/trunk/modules/analysis/common/src/java/org/apache/lucene/analysis/charfilter/HTMLStripCharFilter.jflex + * on 5/18/12 12:24 PM from the specification file + * C:/svn/lucene/dev/trunk/lucene/analysis/common/src/java/org/apache/lucene/analysis/charfilter/HTMLStripCharFilter.jflex 
*/ public final class HTMLStripCharFilter extends BaseCharFilter { @@ -30522,8 +30523,16 @@ public final class HTMLStripCharFilter extends BaseCharFilter { private boolean zzEOFDone; /* user code: */ - private static final Set upperCaseVariantsAccepted - = new HashSet(Arrays.asList("quot","copy","gt","lt","reg","amp")); + private static final Map upperCaseVariantsAccepted + = new HashMap(); + static { + upperCaseVariantsAccepted.put("quot", "QUOT"); + upperCaseVariantsAccepted.put("copy", "COPY"); + upperCaseVariantsAccepted.put("gt", "GT"); + upperCaseVariantsAccepted.put("lt", "LT"); + upperCaseVariantsAccepted.put("reg", "REG"); + upperCaseVariantsAccepted.put("amp", "AMP"); + } private static final CharArrayMap entityValues = new CharArrayMap(Version.LUCENE_40, 253, false); static { @@ -30605,8 +30614,9 @@ public final class HTMLStripCharFilter extends BaseCharFilter { for (int i = 0 ; i < entities.length ; i += 2) { Character value = entities[i + 1].charAt(0); entityValues.put(entities[i], value); - if (upperCaseVariantsAccepted.contains(entities[i])) { - entityValues.put(entities[i].toUpperCase(), value); + String upperCaseVariant = upperCaseVariantsAccepted.get(entities[i]); + if (upperCaseVariant != null) { + entityValues.put(upperCaseVariant, value); } } } diff --git a/lucene/analysis/common/src/java/org/apache/lucene/analysis/charfilter/HTMLStripCharFilter.jflex b/lucene/analysis/common/src/java/org/apache/lucene/analysis/charfilter/HTMLStripCharFilter.jflex index 54d62cc9372..3c9116b8440 100755 --- a/lucene/analysis/common/src/java/org/apache/lucene/analysis/charfilter/HTMLStripCharFilter.jflex +++ b/lucene/analysis/common/src/java/org/apache/lucene/analysis/charfilter/HTMLStripCharFilter.jflex @@ -19,7 +19,8 @@ package org.apache.lucene.analysis.charfilter; import java.io.IOException; import java.util.Arrays; -import java.util.HashSet; +import java.util.HashMap; +import java.util.Map; import java.util.Set; import org.apache.lucene.util.Version; diff --git a/lucene/analysis/common/src/java/org/apache/lucene/analysis/charfilter/htmlentity.py b/lucene/analysis/common/src/java/org/apache/lucene/analysis/charfilter/htmlentity.py index b3300687556..ff9ee6bf3a1 100644 --- a/lucene/analysis/common/src/java/org/apache/lucene/analysis/charfilter/htmlentity.py +++ b/lucene/analysis/common/src/java/org/apache/lucene/analysis/charfilter/htmlentity.py @@ -50,8 +50,16 @@ def main(): print output_line, ')' print '%{' - print ' private static final Set upperCaseVariantsAccepted' - print ' = new HashSet(Arrays.asList("quot","copy","gt","lt","reg","amp"));' + print ' private static final Map upperCaseVariantsAccepted' + print ' = new HashMap();' + print ' static {' + print ' upperCaseVariantsAccepted.put("quot", "QUOT");' + print ' upperCaseVariantsAccepted.put("copy", "COPY");' + print ' upperCaseVariantsAccepted.put("gt", "GT");' + print ' upperCaseVariantsAccepted.put("lt", "LT");' + print ' upperCaseVariantsAccepted.put("reg", "REG");' + print ' upperCaseVariantsAccepted.put("amp", "AMP");' + print ' }' print ' private static final CharArrayMap entityValues' print ' = new CharArrayMap(Version.LUCENE_40, %i, false);' % len(keys) print ' static {' @@ -68,8 +76,9 @@ def main(): print ' for (int i = 0 ; i < entities.length ; i += 2) {' print ' Character value = entities[i + 1].charAt(0);' print ' entityValues.put(entities[i], value);' - print ' if (upperCaseVariantsAccepted.contains(entities[i])) {' - print ' entityValues.put(entities[i].toUpperCase(), value);' + print ' String upperCaseVariant = 
upperCaseVariantsAccepted.get(entities[i]);' + print ' if (upperCaseVariant != null) {' + print ' entityValues.put(upperCaseVariant, value);' print ' }' print ' }' print " }" From a0493e557085fb21e41bf2d1a88fd476e7a4104e Mon Sep 17 00:00:00 2001 From: Simon Willnauer Date: Sat, 19 May 2012 16:29:58 +0000 Subject: [PATCH 32/47] LUCENE-4070: assign output to member to prevent double opening on error git-svn-id: https://svn.apache.org/repos/asf/lucene/dev/trunk@1340514 13f79535-47bb-0310-9956-ffa450edef68 --- .../java/org/apache/lucene/store/CompoundFileWriter.java | 8 +++----- 1 file changed, 3 insertions(+), 5 deletions(-) diff --git a/lucene/core/src/java/org/apache/lucene/store/CompoundFileWriter.java b/lucene/core/src/java/org/apache/lucene/store/CompoundFileWriter.java index 8134b8cba47..a5e3d1cfb04 100644 --- a/lucene/core/src/java/org/apache/lucene/store/CompoundFileWriter.java +++ b/lucene/core/src/java/org/apache/lucene/store/CompoundFileWriter.java @@ -118,16 +118,14 @@ final class CompoundFileWriter implements Closeable{ private synchronized IndexOutput getOutput() throws IOException { if (dataOut == null) { - IndexOutput dataOutput = null; boolean success = false; try { - dataOutput = directory.createOutput(dataFileName, IOContext.DEFAULT); - dataOutput.writeVInt(FORMAT_CURRENT); - dataOut = dataOutput; + dataOut = directory.createOutput(dataFileName, IOContext.DEFAULT); + dataOut.writeVInt(FORMAT_CURRENT); success = true; } finally { if (!success) { - IOUtils.closeWhileHandlingException(dataOutput); + IOUtils.closeWhileHandlingException(dataOut); } } } From 419a026c0629a7ea08e050d289f6ac1ad45759d1 Mon Sep 17 00:00:00 2001 From: Michael McCandless Date: Sat, 19 May 2012 17:24:36 +0000 Subject: [PATCH 33/47] fix over-copying of CFX files during addIndexes(Directory[]) git-svn-id: https://svn.apache.org/repos/asf/lucene/dev/trunk@1340521 13f79535-47bb-0310-9956-ffa450edef68 --- .../java/org/apache/lucene/index/IndexWriter.java | 15 ++++++++++----- 1 file changed, 10 insertions(+), 5 deletions(-) diff --git a/lucene/core/src/java/org/apache/lucene/index/IndexWriter.java b/lucene/core/src/java/org/apache/lucene/index/IndexWriter.java index 06b5e771fad..28d16a8ef4f 100644 --- a/lucene/core/src/java/org/apache/lucene/index/IndexWriter.java +++ b/lucene/core/src/java/org/apache/lucene/index/IndexWriter.java @@ -2159,6 +2159,8 @@ public class IndexWriter implements Closeable, TwoPhaseCommit { sis.read(dir); final Set dsFilesCopied = new HashSet(); final Map dsNames = new HashMap(); + final Set copiedFiles = new HashSet(); + for (SegmentInfo info : sis) { assert !infos.contains(info): "dup info dir=" + info.dir + " name=" + info.name; @@ -2171,7 +2173,7 @@ public class IndexWriter implements Closeable, TwoPhaseCommit { IOContext context = new IOContext(new MergeInfo(info.docCount, info.sizeInBytes(), true, -1)); - copySegmentAsIs(info, newSegName, dsNames, dsFilesCopied, context); + copySegmentAsIs(info, newSegName, dsNames, dsFilesCopied, context, copiedFiles); infos.add(info); } @@ -2282,7 +2284,8 @@ public class IndexWriter implements Closeable, TwoPhaseCommit { /** Copies the segment files as-is into the IndexWriter's directory. */ private void copySegmentAsIs(SegmentInfo info, String segName, - Map dsNames, Set dsFilesCopied, IOContext context) + Map dsNames, Set dsFilesCopied, IOContext context, + Set copiedFiles) throws IOException { // Determine if the doc store of this segment needs to be copied. 
It's // only relevant for segments that share doc store with others, @@ -2301,10 +2304,10 @@ public class IndexWriter implements Closeable, TwoPhaseCommit { Set codecDocStoreFiles = new HashSet(); if (info.getDocStoreOffset() != -1) { // only violate the codec this way if its preflex - codec.storedFieldsFormat().files(info, codecDocStoreFiles); - codec.termVectorsFormat().files(info, codecDocStoreFiles); + info.getCodec().storedFieldsFormat().files(info, codecDocStoreFiles); + info.getCodec().termVectorsFormat().files(info, codecDocStoreFiles); } - + // Copy the segment files for (String file: info.files()) { final String newFileName; @@ -2319,6 +2322,8 @@ public class IndexWriter implements Closeable, TwoPhaseCommit { } assert !directory.fileExists(newFileName): "file \"" + newFileName + "\" already exists"; + assert !copiedFiles.contains(file): "file \"" + file + "\" is being copied more than once"; + copiedFiles.add(file); info.dir.copy(directory, file, newFileName, context); } From 80ed49893cd992efdb4e76e45f8ac1555be57fe7 Mon Sep 17 00:00:00 2001 From: Robert Muir Date: Sat, 19 May 2012 17:47:38 +0000 Subject: [PATCH 34/47] test untested query, fix broken equals() impl git-svn-id: https://svn.apache.org/repos/asf/lucene/dev/trunk@1340526 13f79535-47bb-0310-9956-ffa450edef68 --- .../lucene/queries/function/BoostedQuery.java | 7 +- .../queries/function/TestBoostedQuery.java | 99 +++++++++++++++++++ 2 files changed, 103 insertions(+), 3 deletions(-) create mode 100644 lucene/queries/src/test/org/apache/lucene/queries/function/TestBoostedQuery.java diff --git a/lucene/queries/src/java/org/apache/lucene/queries/function/BoostedQuery.java b/lucene/queries/src/java/org/apache/lucene/queries/function/BoostedQuery.java index c0c2942ba33..91d98321d3e 100755 --- a/lucene/queries/src/java/org/apache/lucene/queries/function/BoostedQuery.java +++ b/lucene/queries/src/java/org/apache/lucene/queries/function/BoostedQuery.java @@ -31,6 +31,8 @@ import java.util.Map; /** * Query that is boosted by a ValueSource */ +// TODO: BoostedQuery and BoostingQuery in the same module? 
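The equals() hunk below (patch 34) relies on the Lucene 4.x convention that Query.equals() already performs the identity, null, runtime-class and boost comparisons; the version being replaced called getClass() on its argument directly, so equals(null) threw a NullPointerException instead of returning false. A self-contained sketch of that layering with hypothetical class names (it deliberately models, rather than extends, the real Query):

```java
// Base class owns the generic part of the contract: class identity and boost.
class BaseQuery {
  private final float boost;

  BaseQuery(float boost) {
    this.boost = boost;
  }

  @Override
  public boolean equals(Object o) {
    if (this == o) return true;
    if (o == null || getClass() != o.getClass()) return false;
    return Float.floatToIntBits(boost) == Float.floatToIntBits(((BaseQuery) o).boost);
  }

  @Override
  public int hashCode() {
    return Float.floatToIntBits(boost);
  }
}

// Subclass delegates to super.equals() and compares only its own fields.
final class WrappedQuery extends BaseQuery {
  private final String wrapped;

  WrappedQuery(String wrapped, float boost) {
    super(boost);
    this.wrapped = wrapped;
  }

  @Override
  public boolean equals(Object o) {
    if (!super.equals(o)) return false; // null, class and boost already handled
    return wrapped.equals(((WrappedQuery) o).wrapped);
  }

  @Override
  public int hashCode() {
    return 31 * super.hashCode() + wrapped.hashCode();
  }
}
```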
+// something has to give public class BoostedQuery extends Query { private Query q; private ValueSource boostVal; // optional, can be null @@ -187,10 +189,9 @@ public class BoostedQuery extends Query { @Override public boolean equals(Object o) { - if (getClass() != o.getClass()) return false; + if (!super.equals(o)) return false; BoostedQuery other = (BoostedQuery)o; - return this.getBoost() == other.getBoost() - && this.q.equals(other.q) + return this.q.equals(other.q) && this.boostVal.equals(other.boostVal); } diff --git a/lucene/queries/src/test/org/apache/lucene/queries/function/TestBoostedQuery.java b/lucene/queries/src/test/org/apache/lucene/queries/function/TestBoostedQuery.java new file mode 100644 index 00000000000..5a9a0c2dd83 --- /dev/null +++ b/lucene/queries/src/test/org/apache/lucene/queries/function/TestBoostedQuery.java @@ -0,0 +1,99 @@ +package org.apache.lucene.queries.function; + +import java.io.IOException; + +import org.apache.lucene.analysis.MockAnalyzer; +import org.apache.lucene.document.Document; +import org.apache.lucene.document.Field; +import org.apache.lucene.document.StringField; +import org.apache.lucene.index.IndexReader; +import org.apache.lucene.index.IndexWriterConfig; +import org.apache.lucene.index.RandomIndexWriter; +import org.apache.lucene.queries.function.valuesource.ConstValueSource; +import org.apache.lucene.search.CheckHits; +import org.apache.lucene.search.IndexSearcher; +import org.apache.lucene.search.MatchAllDocsQuery; +import org.apache.lucene.search.Query; +import org.apache.lucene.search.ScoreDoc; +import org.apache.lucene.search.Sort; +import org.apache.lucene.search.SortField; +import org.apache.lucene.search.TopDocs; +import org.apache.lucene.store.Directory; +import org.apache.lucene.util.LuceneTestCase; +import org.junit.AfterClass; +import org.junit.BeforeClass; + +/** + * Licensed to the Apache Software Foundation (ASF) under one or more + * contributor license agreements. See the NOTICE file distributed with + * this work for additional information regarding copyright ownership. + * The ASF licenses this file to You under the Apache License, Version 2.0 + * (the "License"); you may not use this file except in compliance with + * the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. 
+ */ + +/** + * Basic tests for {@link BoostedQuery} + */ +// TODO: more tests +public class TestBoostedQuery extends LuceneTestCase { + static Directory dir; + static IndexReader ir; + static IndexSearcher is; + + @BeforeClass + public static void beforeClass() throws Exception { + dir = newDirectory(); + IndexWriterConfig iwConfig = newIndexWriterConfig(TEST_VERSION_CURRENT, new MockAnalyzer(random())); + iwConfig.setMergePolicy(newLogMergePolicy()); + RandomIndexWriter iw = new RandomIndexWriter(random(), dir, iwConfig); + Document document = new Document(); + Field idField = new StringField("id", ""); + document.add(idField); + iw.addDocument(document); + ir = iw.getReader(); + is = newSearcher(ir); + iw.close(); + } + + @AfterClass + public static void afterClass() throws Exception { + is = null; + ir.close(); + ir = null; + dir.close(); + dir = null; + } + + public void testBasic() throws Exception { + Query q = new MatchAllDocsQuery(); + TopDocs docs = is.search(q, 10); + assertEquals(1, docs.totalHits); + float score = docs.scoreDocs[0].score; + + Query boostedQ = new BoostedQuery(q, new ConstValueSource(2.0f)); + assertHits(boostedQ, new float[] { score*2 }); + } + + void assertHits(Query q, float scores[]) throws Exception { + ScoreDoc expected[] = new ScoreDoc[scores.length]; + int expectedDocs[] = new int[scores.length]; + for (int i = 0; i < expected.length; i++) { + expectedDocs[i] = i; + expected[i] = new ScoreDoc(i, scores[i]); + } + TopDocs docs = is.search(q, 10, + new Sort(new SortField("id", SortField.Type.STRING))); + CheckHits.checkHits(random(), q, "", is, expectedDocs); + CheckHits.checkHitsQuery(q, expected, docs.scoreDocs, expectedDocs); + CheckHits.checkExplanations(q, "", is); + } +} From fa75b33949d18473ee5122cfd59b6a20d7a3c2a9 Mon Sep 17 00:00:00 2001 From: Simon Willnauer Date: Sun, 20 May 2012 10:03:35 +0000 Subject: [PATCH 35/47] LUCENE-4046: Add IOException to DocsEnum#freq() git-svn-id: https://svn.apache.org/repos/asf/lucene/dev/trunk@1340653 13f79535-47bb-0310-9956-ffa450edef68 --- .../lucene/codecs/MappingMultiDocsAndPositionsEnum.java | 2 +- .../org/apache/lucene/codecs/MappingMultiDocsEnum.java | 2 +- .../org/apache/lucene/codecs/lucene3x/Lucene3xFields.java | 4 ++-- .../lucene/codecs/lucene3x/Lucene3xTermVectorsReader.java | 4 ++-- .../lucene/codecs/lucene40/Lucene40PostingsReader.java | 6 +++--- .../lucene/codecs/lucene40/Lucene40TermVectorsReader.java | 4 ++-- .../apache/lucene/codecs/memory/MemoryPostingsFormat.java | 4 ++-- .../lucene/codecs/pulsing/PulsingPostingsReader.java | 4 ++-- .../org/apache/lucene/codecs/sep/SepPostingsReader.java | 4 ++-- .../lucene/codecs/simpletext/SimpleTextFieldsReader.java | 4 ++-- .../codecs/simpletext/SimpleTextTermVectorsReader.java | 4 ++-- lucene/core/src/java/org/apache/lucene/index/DocsEnum.java | 7 +++++-- .../java/org/apache/lucene/index/FilterAtomicReader.java | 4 ++-- .../org/apache/lucene/index/MultiDocsAndPositionsEnum.java | 2 +- .../src/java/org/apache/lucene/index/MultiDocsEnum.java | 2 +- .../java/org/apache/lucene/search/MultiPhraseQuery.java | 2 +- .../core/src/java/org/apache/lucene/search/TermScorer.java | 4 ++-- .../java/org/apache/lucene/index/memory/MemoryIndex.java | 4 ++-- .../lucene/codecs/ramonly/RAMOnlyPostingsFormat.java | 4 ++-- 19 files changed, 37 insertions(+), 34 deletions(-) diff --git a/lucene/core/src/java/org/apache/lucene/codecs/MappingMultiDocsAndPositionsEnum.java b/lucene/core/src/java/org/apache/lucene/codecs/MappingMultiDocsAndPositionsEnum.java index 
e4e89bf84ce..683b2c30e54 100644 --- a/lucene/core/src/java/org/apache/lucene/codecs/MappingMultiDocsAndPositionsEnum.java +++ b/lucene/core/src/java/org/apache/lucene/codecs/MappingMultiDocsAndPositionsEnum.java @@ -53,7 +53,7 @@ public final class MappingMultiDocsAndPositionsEnum extends DocsAndPositionsEnum } @Override - public int freq() { + public int freq() throws IOException { return current.freq(); } diff --git a/lucene/core/src/java/org/apache/lucene/codecs/MappingMultiDocsEnum.java b/lucene/core/src/java/org/apache/lucene/codecs/MappingMultiDocsEnum.java index 0319e1da1ce..8a9bb79525b 100644 --- a/lucene/core/src/java/org/apache/lucene/codecs/MappingMultiDocsEnum.java +++ b/lucene/core/src/java/org/apache/lucene/codecs/MappingMultiDocsEnum.java @@ -52,7 +52,7 @@ public final class MappingMultiDocsEnum extends DocsEnum { } @Override - public int freq() { + public int freq() throws IOException { return current.freq(); } diff --git a/lucene/core/src/java/org/apache/lucene/codecs/lucene3x/Lucene3xFields.java b/lucene/core/src/java/org/apache/lucene/codecs/lucene3x/Lucene3xFields.java index 621fe44f481..3d153d60a11 100644 --- a/lucene/core/src/java/org/apache/lucene/codecs/lucene3x/Lucene3xFields.java +++ b/lucene/core/src/java/org/apache/lucene/codecs/lucene3x/Lucene3xFields.java @@ -1024,7 +1024,7 @@ class Lucene3xFields extends FieldsProducer { } @Override - public int freq() { + public int freq() throws IOException { return docs.freq(); } @@ -1071,7 +1071,7 @@ class Lucene3xFields extends FieldsProducer { } @Override - public int freq() { + public int freq() throws IOException { return pos.freq(); } diff --git a/lucene/core/src/java/org/apache/lucene/codecs/lucene3x/Lucene3xTermVectorsReader.java b/lucene/core/src/java/org/apache/lucene/codecs/lucene3x/Lucene3xTermVectorsReader.java index c66e0584dee..1df5ca960bc 100644 --- a/lucene/core/src/java/org/apache/lucene/codecs/lucene3x/Lucene3xTermVectorsReader.java +++ b/lucene/core/src/java/org/apache/lucene/codecs/lucene3x/Lucene3xTermVectorsReader.java @@ -528,7 +528,7 @@ class Lucene3xTermVectorsReader extends TermVectorsReader { private Bits liveDocs; @Override - public int freq() { + public int freq() throws IOException { return freq; } @@ -574,7 +574,7 @@ class Lucene3xTermVectorsReader extends TermVectorsReader { private int[] endOffsets; @Override - public int freq() { + public int freq() throws IOException { if (positions != null) { return positions.length; } else { diff --git a/lucene/core/src/java/org/apache/lucene/codecs/lucene40/Lucene40PostingsReader.java b/lucene/core/src/java/org/apache/lucene/codecs/lucene40/Lucene40PostingsReader.java index 0eb36aeff96..7bf74d7a9a2 100644 --- a/lucene/core/src/java/org/apache/lucene/codecs/lucene40/Lucene40PostingsReader.java +++ b/lucene/core/src/java/org/apache/lucene/codecs/lucene40/Lucene40PostingsReader.java @@ -351,7 +351,7 @@ public class Lucene40PostingsReader extends PostingsReaderBase { } @Override - public final int freq() { + public final int freq() throws IOException { assert !indexOmitsTF; return freq; } @@ -770,7 +770,7 @@ public class Lucene40PostingsReader extends PostingsReaderBase { } @Override - public int freq() { + public int freq() throws IOException { return freq; } @@ -989,7 +989,7 @@ public class Lucene40PostingsReader extends PostingsReaderBase { } @Override - public int freq() { + public int freq() throws IOException { return freq; } diff --git a/lucene/core/src/java/org/apache/lucene/codecs/lucene40/Lucene40TermVectorsReader.java 
b/lucene/core/src/java/org/apache/lucene/codecs/lucene40/Lucene40TermVectorsReader.java index c0420d1ba95..e44713b65ab 100644 --- a/lucene/core/src/java/org/apache/lucene/codecs/lucene40/Lucene40TermVectorsReader.java +++ b/lucene/core/src/java/org/apache/lucene/codecs/lucene40/Lucene40TermVectorsReader.java @@ -549,7 +549,7 @@ public class Lucene40TermVectorsReader extends TermVectorsReader { private Bits liveDocs; @Override - public int freq() { + public int freq() throws IOException { return freq; } @@ -595,7 +595,7 @@ public class Lucene40TermVectorsReader extends TermVectorsReader { private int[] endOffsets; @Override - public int freq() { + public int freq() throws IOException { if (positions != null) { return positions.length; } else { diff --git a/lucene/core/src/java/org/apache/lucene/codecs/memory/MemoryPostingsFormat.java b/lucene/core/src/java/org/apache/lucene/codecs/memory/MemoryPostingsFormat.java index 8badc9ba7e3..1453252514e 100644 --- a/lucene/core/src/java/org/apache/lucene/codecs/memory/MemoryPostingsFormat.java +++ b/lucene/core/src/java/org/apache/lucene/codecs/memory/MemoryPostingsFormat.java @@ -424,7 +424,7 @@ public class MemoryPostingsFormat extends PostingsFormat { } @Override - public int freq() { + public int freq() throws IOException { assert indexOptions != IndexOptions.DOCS_ONLY; return freq; } @@ -624,7 +624,7 @@ public class MemoryPostingsFormat extends PostingsFormat { } @Override - public int freq() { + public int freq() throws IOException { return freq; } } diff --git a/lucene/core/src/java/org/apache/lucene/codecs/pulsing/PulsingPostingsReader.java b/lucene/core/src/java/org/apache/lucene/codecs/pulsing/PulsingPostingsReader.java index 18bd58867f0..644e48511b2 100644 --- a/lucene/core/src/java/org/apache/lucene/codecs/pulsing/PulsingPostingsReader.java +++ b/lucene/core/src/java/org/apache/lucene/codecs/pulsing/PulsingPostingsReader.java @@ -356,7 +356,7 @@ public class PulsingPostingsReader extends PostingsReaderBase { } @Override - public int freq() { + public int freq() throws IOException { assert indexOptions != IndexOptions.DOCS_ONLY; return freq; } @@ -462,7 +462,7 @@ public class PulsingPostingsReader extends PostingsReaderBase { } @Override - public int freq() { + public int freq() throws IOException { return freq; } diff --git a/lucene/core/src/java/org/apache/lucene/codecs/sep/SepPostingsReader.java b/lucene/core/src/java/org/apache/lucene/codecs/sep/SepPostingsReader.java index 533fd2f3b22..6424fe3b9d5 100644 --- a/lucene/core/src/java/org/apache/lucene/codecs/sep/SepPostingsReader.java +++ b/lucene/core/src/java/org/apache/lucene/codecs/sep/SepPostingsReader.java @@ -423,7 +423,7 @@ public class SepPostingsReader extends PostingsReaderBase { } @Override - public int freq() { + public int freq() throws IOException { assert !omitTF; return freq; } @@ -601,7 +601,7 @@ public class SepPostingsReader extends PostingsReaderBase { } @Override - public int freq() { + public int freq() throws IOException { return freq; } diff --git a/lucene/core/src/java/org/apache/lucene/codecs/simpletext/SimpleTextFieldsReader.java b/lucene/core/src/java/org/apache/lucene/codecs/simpletext/SimpleTextFieldsReader.java index c3b252df204..ec04e9a64c4 100644 --- a/lucene/core/src/java/org/apache/lucene/codecs/simpletext/SimpleTextFieldsReader.java +++ b/lucene/core/src/java/org/apache/lucene/codecs/simpletext/SimpleTextFieldsReader.java @@ -269,7 +269,7 @@ class SimpleTextFieldsReader extends FieldsProducer { } @Override - public int freq() { + public int freq() 
throws IOException { assert !omitTF; return tf; } @@ -370,7 +370,7 @@ class SimpleTextFieldsReader extends FieldsProducer { } @Override - public int freq() { + public int freq() throws IOException { return tf; } diff --git a/lucene/core/src/java/org/apache/lucene/codecs/simpletext/SimpleTextTermVectorsReader.java b/lucene/core/src/java/org/apache/lucene/codecs/simpletext/SimpleTextTermVectorsReader.java index 03d6825f1a7..c7c8dc7563d 100644 --- a/lucene/core/src/java/org/apache/lucene/codecs/simpletext/SimpleTextTermVectorsReader.java +++ b/lucene/core/src/java/org/apache/lucene/codecs/simpletext/SimpleTextTermVectorsReader.java @@ -400,7 +400,7 @@ public class SimpleTextTermVectorsReader extends TermVectorsReader { private Bits liveDocs; @Override - public int freq() { + public int freq() throws IOException { assert freq != -1; return freq; } @@ -447,7 +447,7 @@ public class SimpleTextTermVectorsReader extends TermVectorsReader { private int[] endOffsets; @Override - public int freq() { + public int freq() throws IOException { if (positions != null) { return positions.length; } else { diff --git a/lucene/core/src/java/org/apache/lucene/index/DocsEnum.java b/lucene/core/src/java/org/apache/lucene/index/DocsEnum.java index e8d97ad5fc5..7b48dd0645c 100644 --- a/lucene/core/src/java/org/apache/lucene/index/DocsEnum.java +++ b/lucene/core/src/java/org/apache/lucene/index/DocsEnum.java @@ -17,6 +17,8 @@ package org.apache.lucene.index; * limitations under the License. */ +import java.io.IOException; + import org.apache.lucene.search.DocIdSetIterator; import org.apache.lucene.util.AttributeSource; @@ -29,8 +31,9 @@ public abstract class DocsEnum extends DocIdSetIterator { /** Returns term frequency in the current document. Do * not call this before {@link #nextDoc} is first called, - * nor after {@link #nextDoc} returns NO_MORE_DOCS. */ - public abstract int freq(); + * nor after {@link #nextDoc} returns NO_MORE_DOCS. + **/ + public abstract int freq() throws IOException; /** Returns the related attributes. 
*/ public AttributeSource attributes() { diff --git a/lucene/core/src/java/org/apache/lucene/index/FilterAtomicReader.java b/lucene/core/src/java/org/apache/lucene/index/FilterAtomicReader.java index cc67c40e5f1..e0c4b58b87f 100644 --- a/lucene/core/src/java/org/apache/lucene/index/FilterAtomicReader.java +++ b/lucene/core/src/java/org/apache/lucene/index/FilterAtomicReader.java @@ -225,7 +225,7 @@ public class FilterAtomicReader extends AtomicReader { } @Override - public int freq() { + public int freq() throws IOException { return in.freq(); } @@ -259,7 +259,7 @@ public class FilterAtomicReader extends AtomicReader { } @Override - public int freq() { + public int freq() throws IOException { return in.freq(); } diff --git a/lucene/core/src/java/org/apache/lucene/index/MultiDocsAndPositionsEnum.java b/lucene/core/src/java/org/apache/lucene/index/MultiDocsAndPositionsEnum.java index dd6f2634615..e515a2d3e85 100644 --- a/lucene/core/src/java/org/apache/lucene/index/MultiDocsAndPositionsEnum.java +++ b/lucene/core/src/java/org/apache/lucene/index/MultiDocsAndPositionsEnum.java @@ -69,7 +69,7 @@ public final class MultiDocsAndPositionsEnum extends DocsAndPositionsEnum { } @Override - public int freq() { + public int freq() throws IOException { return current.freq(); } diff --git a/lucene/core/src/java/org/apache/lucene/index/MultiDocsEnum.java b/lucene/core/src/java/org/apache/lucene/index/MultiDocsEnum.java index c90ab1d7a40..2597c7ced81 100644 --- a/lucene/core/src/java/org/apache/lucene/index/MultiDocsEnum.java +++ b/lucene/core/src/java/org/apache/lucene/index/MultiDocsEnum.java @@ -69,7 +69,7 @@ public final class MultiDocsEnum extends DocsEnum { } @Override - public int freq() { + public int freq() throws IOException { return current.freq(); } diff --git a/lucene/core/src/java/org/apache/lucene/search/MultiPhraseQuery.java b/lucene/core/src/java/org/apache/lucene/search/MultiPhraseQuery.java index 2dbc77e27cb..e008c197918 100644 --- a/lucene/core/src/java/org/apache/lucene/search/MultiPhraseQuery.java +++ b/lucene/core/src/java/org/apache/lucene/search/MultiPhraseQuery.java @@ -568,7 +568,7 @@ class UnionDocsAndPositionsEnum extends DocsAndPositionsEnum { } @Override - public final int freq() { + public final int freq() throws IOException { return _freq; } diff --git a/lucene/core/src/java/org/apache/lucene/search/TermScorer.java b/lucene/core/src/java/org/apache/lucene/search/TermScorer.java index e5f93d13daa..ba638a5bbc5 100644 --- a/lucene/core/src/java/org/apache/lucene/search/TermScorer.java +++ b/lucene/core/src/java/org/apache/lucene/search/TermScorer.java @@ -51,7 +51,7 @@ final class TermScorer extends Scorer { } @Override - public float freq() { + public float freq() throws IOException { return docsEnum.freq(); } @@ -66,7 +66,7 @@ final class TermScorer extends Scorer { } @Override - public float score() { + public float score() throws IOException { assert docID() != NO_MORE_DOCS; return docScorer.score(docsEnum.docID(), docsEnum.freq()); } diff --git a/lucene/memory/src/java/org/apache/lucene/index/memory/MemoryIndex.java b/lucene/memory/src/java/org/apache/lucene/index/memory/MemoryIndex.java index d6615bcb31d..977a87d287f 100644 --- a/lucene/memory/src/java/org/apache/lucene/index/memory/MemoryIndex.java +++ b/lucene/memory/src/java/org/apache/lucene/index/memory/MemoryIndex.java @@ -945,7 +945,7 @@ public class MemoryIndex { } @Override - public int freq() { + public int freq() throws IOException { return positions.size(); } } @@ -987,7 +987,7 @@ public class MemoryIndex { 
} @Override - public int freq() { + public int freq() throws IOException { return positions.size() / stride; } diff --git a/lucene/test-framework/src/java/org/apache/lucene/codecs/ramonly/RAMOnlyPostingsFormat.java b/lucene/test-framework/src/java/org/apache/lucene/codecs/ramonly/RAMOnlyPostingsFormat.java index f23d0fc35e1..896f72a2bd5 100644 --- a/lucene/test-framework/src/java/org/apache/lucene/codecs/ramonly/RAMOnlyPostingsFormat.java +++ b/lucene/test-framework/src/java/org/apache/lucene/codecs/ramonly/RAMOnlyPostingsFormat.java @@ -439,7 +439,7 @@ public class RAMOnlyPostingsFormat extends PostingsFormat { } @Override - public int freq() { + public int freq() throws IOException { return current.positions.length; } @@ -487,7 +487,7 @@ public class RAMOnlyPostingsFormat extends PostingsFormat { } @Override - public int freq() { + public int freq() throws IOException { return current.positions.length; } From d722b19748a2c1dabc3b7ff5fb16b4c6e3d65d75 Mon Sep 17 00:00:00 2001 From: Stefan Matheis Date: Sun, 20 May 2012 10:32:38 +0000 Subject: [PATCH 36/47] SOLR-3238: Add License for d3 git-svn-id: https://svn.apache.org/repos/asf/lucene/dev/trunk@1340665 13f79535-47bb-0310-9956-ffa450edef68 --- solr/webapp/web/js/lib/d3.js | 31 +++++++++++++++++++++++++++++++ 1 file changed, 31 insertions(+) diff --git a/solr/webapp/web/js/lib/d3.js b/solr/webapp/web/js/lib/d3.js index c1b6caf261e..c29ff9c9680 100755 --- a/solr/webapp/web/js/lib/d3.js +++ b/solr/webapp/web/js/lib/d3.js @@ -1,3 +1,34 @@ +/* + +Copyright (c) 2012, Michael Bostock +All rights reserved. + +Redistribution and use in source and binary forms, with or without +modification, are permitted provided that the following conditions are met: + +* Redistributions of source code must retain the above copyright notice, this + list of conditions and the following disclaimer. + +* Redistributions in binary form must reproduce the above copyright notice, + this list of conditions and the following disclaimer in the documentation + and/or other materials provided with the distribution. + +* The name Michael Bostock may not be used to endorse or promote products + derived from this software without specific prior written permission. + +THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" +AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE +IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE +DISCLAIMED. IN NO EVENT SHALL MICHAEL BOSTOCK BE LIABLE FOR ANY DIRECT, +INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, +BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, +DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY +OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING +NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, +EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. 
+ +*/ + (function(){if (!Date.now) Date.now = function() { return +new Date; }; From d65f086bafa9fc1d32dcd7ba412ec43f41d8608e Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Stanis=C5=82aw=20Osi=C5=84ski?= Date: Sun, 20 May 2012 11:53:51 +0000 Subject: [PATCH 37/47] SOLR-3470: Custom Carrot2 tokenizer and stemmer factories overwritten by defaults: fixed git-svn-id: https://svn.apache.org/repos/asf/lucene/dev/trunk@1340686 13f79535-47bb-0310-9956-ffa450edef68 --- .../carrot2/CarrotClusteringEngine.java | 13 +++- .../clustering/solr/conf/solrconfig.xml | 10 +++ .../carrot2/CarrotClusteringEngineTest.java | 28 +++++++ .../carrot2/DuplicatingStemmerFactory.java | 34 +++++++++ .../carrot2/DuplicatingTokenizerFactory.java | 52 +++++++++++++ .../carrot2/EchoStemsClusteringAlgorithm.java | 75 +++++++++++++++++++ .../EchoTokensClusteringAlgorithm.java | 69 +++++++++++++++++ 7 files changed, 277 insertions(+), 4 deletions(-) create mode 100644 solr/contrib/clustering/src/test/org/apache/solr/handler/clustering/carrot2/DuplicatingStemmerFactory.java create mode 100644 solr/contrib/clustering/src/test/org/apache/solr/handler/clustering/carrot2/DuplicatingTokenizerFactory.java create mode 100644 solr/contrib/clustering/src/test/org/apache/solr/handler/clustering/carrot2/EchoStemsClusteringAlgorithm.java create mode 100644 solr/contrib/clustering/src/test/org/apache/solr/handler/clustering/carrot2/EchoTokensClusteringAlgorithm.java diff --git a/solr/contrib/clustering/src/java/org/apache/solr/handler/clustering/carrot2/CarrotClusteringEngine.java b/solr/contrib/clustering/src/java/org/apache/solr/handler/clustering/carrot2/CarrotClusteringEngine.java index df62be8f59c..edaffe18db5 100644 --- a/solr/contrib/clustering/src/java/org/apache/solr/handler/clustering/carrot2/CarrotClusteringEngine.java +++ b/solr/contrib/clustering/src/java/org/apache/solr/handler/clustering/carrot2/CarrotClusteringEngine.java @@ -62,6 +62,7 @@ import org.carrot2.core.LanguageCode; import org.carrot2.core.attribute.AttributeNames; import org.carrot2.text.linguistic.DefaultLexicalDataFactoryDescriptor; import org.carrot2.text.preprocessing.pipeline.BasicPreprocessingPipelineDescriptor; +import org.carrot2.text.preprocessing.pipeline.BasicPreprocessingPipelineDescriptor.AttributeBuilder; import org.carrot2.util.resource.ClassLoaderLocator; import org.carrot2.util.resource.IResource; import org.carrot2.util.resource.IResourceLocator; @@ -255,10 +256,14 @@ public class CarrotClusteringEngine extends SearchClusteringEngine { // Additionally, we set a custom lexical resource factory for Carrot2 that // will use both Carrot2 default stop words as well as stop words from // the StopFilter defined on the field. 
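The lines that follow implement the SOLR-3470 fix: install the built-in tokenizer and stemmer factories only when the caller has not already configured those keys, where the old code overwrote them unconditionally. The guard generalizes to any defaults-plus-overrides map; a small sketch with placeholder keys and values (not the Carrot2 attribute names):

```java
import java.util.HashMap;
import java.util.Map;

final class AttributeDefaults {
  // Add a default only where the user left the key unset.
  static void applyDefaults(Map<String, Object> initAttributes) {
    if (!initAttributes.containsKey("tokenizer.factory")) {
      initAttributes.put("tokenizer.factory", "DefaultTokenizerFactory");
    }
    if (!initAttributes.containsKey("stemmer.factory")) {
      initAttributes.put("stemmer.factory", "DefaultStemmerFactory");
    }
  }

  public static void main(String[] args) {
    Map<String, Object> attrs = new HashMap<String, Object>();
    attrs.put("stemmer.factory", "MyCustomStemmerFactory"); // user-supplied
    applyDefaults(attrs);
    // Prints the custom stemmer plus the default tokenizer: the user's
    // choice survives, and only the missing key receives a default.
    System.out.println(attrs);
  }
}
```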
- BasicPreprocessingPipelineDescriptor.attributeBuilder(initAttributes) - .stemmerFactory(LuceneCarrot2StemmerFactory.class) - .tokenizerFactory(LuceneCarrot2TokenizerFactory.class) - .lexicalDataFactory(SolrStopwordsCarrot2LexicalDataFactory.class); + final AttributeBuilder attributeBuilder = BasicPreprocessingPipelineDescriptor.attributeBuilder(initAttributes); + attributeBuilder.lexicalDataFactory(SolrStopwordsCarrot2LexicalDataFactory.class); + if (!initAttributes.containsKey(BasicPreprocessingPipelineDescriptor.Keys.TOKENIZER_FACTORY)) { + attributeBuilder.tokenizerFactory(LuceneCarrot2TokenizerFactory.class); + } + if (!initAttributes.containsKey(BasicPreprocessingPipelineDescriptor.Keys.STEMMER_FACTORY)) { + attributeBuilder.stemmerFactory(LuceneCarrot2StemmerFactory.class); + } // Pass the schema to SolrStopwordsCarrot2LexicalDataFactory. initAttributes.put("solrIndexSchema", core.getSchema()); diff --git a/solr/contrib/clustering/src/test-files/clustering/solr/conf/solrconfig.xml b/solr/contrib/clustering/src/test-files/clustering/solr/conf/solrconfig.xml index 41787f82644..430c0616564 100644 --- a/solr/contrib/clustering/src/test-files/clustering/solr/conf/solrconfig.xml +++ b/solr/contrib/clustering/src/test-files/clustering/solr/conf/solrconfig.xml @@ -339,6 +339,16 @@ org.apache.solr.handler.clustering.carrot2.LexicalResourcesCheckClusteringAlgorithm clustering/custom + + custom-duplicating-tokenizer + org.apache.solr.handler.clustering.carrot2.EchoTokensClusteringAlgorithm + org.apache.solr.handler.clustering.carrot2.DuplicatingTokenizerFactory + + + custom-duplicating-stemmer + org.apache.solr.handler.clustering.carrot2.EchoStemsClusteringAlgorithm + org.apache.solr.handler.clustering.carrot2.DuplicatingStemmerFactory + diff --git a/solr/contrib/clustering/src/test/org/apache/solr/handler/clustering/carrot2/CarrotClusteringEngineTest.java b/solr/contrib/clustering/src/test/org/apache/solr/handler/clustering/carrot2/CarrotClusteringEngineTest.java index e4ef997f3d5..911f03d787d 100644 --- a/solr/contrib/clustering/src/test/org/apache/solr/handler/clustering/carrot2/CarrotClusteringEngineTest.java +++ b/solr/contrib/clustering/src/test/org/apache/solr/handler/clustering/carrot2/CarrotClusteringEngineTest.java @@ -352,6 +352,34 @@ public class CarrotClusteringEngineTest extends AbstractClusteringTestCase { assertEquals("List field", "[first, second]", labels.get(4)); } + @Test + public void customTokenizer() throws Exception { + final ModifiableSolrParams params = new ModifiableSolrParams(); + params.add(CarrotParams.TITLE_FIELD_NAME, "title"); + params.add(CarrotParams.SNIPPET_FIELD_NAME, "snippet"); + + final List labels = getLabels(checkEngine( + getClusteringEngine("custom-duplicating-tokenizer"), 1, 16, new TermQuery(new Term("title", + "field")), params).get(0)); + + // The custom test tokenizer duplicates each token's text + assertTrue("First token", labels.get(0).contains("TitleTitle")); + } + + @Test + public void customStemmer() throws Exception { + final ModifiableSolrParams params = new ModifiableSolrParams(); + params.add(CarrotParams.TITLE_FIELD_NAME, "title"); + params.add(CarrotParams.SNIPPET_FIELD_NAME, "snippet"); + + final List labels = getLabels(checkEngine( + getClusteringEngine("custom-duplicating-stemmer"), 1, 12, new TermQuery(new Term("title", + "field")), params).get(0)); + + // The custom test stemmer duplicates and lowercases each token's text + assertTrue("First token", labels.get(0).contains("titletitle")); + } + private CarrotClusteringEngine 
getClusteringEngine(String engineName) { ClusteringComponent comp = (ClusteringComponent) h.getCore() .getSearchComponent("clustering"); diff --git a/solr/contrib/clustering/src/test/org/apache/solr/handler/clustering/carrot2/DuplicatingStemmerFactory.java b/solr/contrib/clustering/src/test/org/apache/solr/handler/clustering/carrot2/DuplicatingStemmerFactory.java new file mode 100644 index 00000000000..c090a1567e1 --- /dev/null +++ b/solr/contrib/clustering/src/test/org/apache/solr/handler/clustering/carrot2/DuplicatingStemmerFactory.java @@ -0,0 +1,34 @@ +package org.apache.solr.handler.clustering.carrot2; + +/** + * Licensed to the Apache Software Foundation (ASF) under one or more + * contributor license agreements. See the NOTICE file distributed with + * this work for additional information regarding copyright ownership. + * The ASF licenses this file to You under the Apache License, Version 2.0 + * (the "License"); you may not use this file except in compliance with + * the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +import org.carrot2.core.LanguageCode; +import org.carrot2.text.linguistic.IStemmer; +import org.carrot2.text.linguistic.IStemmerFactory; + +public class DuplicatingStemmerFactory implements IStemmerFactory { + @Override + public IStemmer getStemmer(LanguageCode language) { + return new IStemmer() { + @Override + public CharSequence stem(CharSequence word) { + return word.toString() + word.toString(); + } + }; + } +} diff --git a/solr/contrib/clustering/src/test/org/apache/solr/handler/clustering/carrot2/DuplicatingTokenizerFactory.java b/solr/contrib/clustering/src/test/org/apache/solr/handler/clustering/carrot2/DuplicatingTokenizerFactory.java new file mode 100644 index 00000000000..99e6b605c91 --- /dev/null +++ b/solr/contrib/clustering/src/test/org/apache/solr/handler/clustering/carrot2/DuplicatingTokenizerFactory.java @@ -0,0 +1,52 @@ +package org.apache.solr.handler.clustering.carrot2; + +/** + * Licensed to the Apache Software Foundation (ASF) under one or more + * contributor license agreements. See the NOTICE file distributed with + * this work for additional information regarding copyright ownership. + * The ASF licenses this file to You under the Apache License, Version 2.0 + * (the "License"); you may not use this file except in compliance with + * the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. 
+ */ + +import java.io.IOException; +import java.io.Reader; + +import org.carrot2.core.LanguageCode; +import org.carrot2.text.analysis.ExtendedWhitespaceTokenizer; +import org.carrot2.text.analysis.ITokenizer; +import org.carrot2.text.linguistic.ITokenizerFactory; +import org.carrot2.text.util.MutableCharArray; + +public class DuplicatingTokenizerFactory implements ITokenizerFactory { + @Override + public ITokenizer getTokenizer(LanguageCode language) { + return new ITokenizer() { + private final ExtendedWhitespaceTokenizer delegate = new ExtendedWhitespaceTokenizer(); + + @Override + public void setTermBuffer(MutableCharArray buffer) { + delegate.setTermBuffer(buffer); + buffer.reset(buffer.toString() + buffer.toString()); + } + + @Override + public void reset(Reader input) throws IOException { + delegate.reset(input); + } + + @Override + public short nextToken() throws IOException { + return delegate.nextToken(); + } + }; + } +} diff --git a/solr/contrib/clustering/src/test/org/apache/solr/handler/clustering/carrot2/EchoStemsClusteringAlgorithm.java b/solr/contrib/clustering/src/test/org/apache/solr/handler/clustering/carrot2/EchoStemsClusteringAlgorithm.java new file mode 100644 index 00000000000..52d8e054230 --- /dev/null +++ b/solr/contrib/clustering/src/test/org/apache/solr/handler/clustering/carrot2/EchoStemsClusteringAlgorithm.java @@ -0,0 +1,75 @@ +package org.apache.solr.handler.clustering.carrot2; + +/** + * Licensed to the Apache Software Foundation (ASF) under one or more + * contributor license agreements. See the NOTICE file distributed with + * this work for additional information regarding copyright ownership. + * The ASF licenses this file to You under the Apache License, Version 2.0 + * (the "License"); you may not use this file except in compliance with + * the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ +import java.util.List; + +import org.carrot2.core.Cluster; +import org.carrot2.core.Document; +import org.carrot2.core.IClusteringAlgorithm; +import org.carrot2.core.LanguageCode; +import org.carrot2.core.ProcessingComponentBase; +import org.carrot2.core.ProcessingException; +import org.carrot2.core.attribute.AttributeNames; +import org.carrot2.core.attribute.Processing; +import org.carrot2.text.preprocessing.PreprocessingContext; +import org.carrot2.text.preprocessing.PreprocessingContext.AllStems; +import org.carrot2.text.preprocessing.PreprocessingContext.AllTokens; +import org.carrot2.text.preprocessing.PreprocessingContext.AllWords; +import org.carrot2.text.preprocessing.pipeline.BasicPreprocessingPipeline; +import org.carrot2.util.attribute.Attribute; +import org.carrot2.util.attribute.Bindable; +import org.carrot2.util.attribute.Input; +import org.carrot2.util.attribute.Output; + +import com.google.common.collect.Lists; + +/** + * A mock Carrot2 clustering algorithm that outputs stem of each token of each + * document as a separate cluster. Useful only in tests. 
+ */ +@Bindable(prefix = "EchoStemsClusteringAlgorithm") +public class EchoStemsClusteringAlgorithm extends ProcessingComponentBase + implements IClusteringAlgorithm { + @Input + @Processing + @Attribute(key = AttributeNames.DOCUMENTS) + private List documents; + + @Output + @Processing + @Attribute(key = AttributeNames.CLUSTERS) + private List clusters; + + BasicPreprocessingPipeline preprocessing = new BasicPreprocessingPipeline(); + + @Override + public void process() throws ProcessingException { + final PreprocessingContext preprocessingContext = preprocessing.preprocess( + documents, "", LanguageCode.ENGLISH); + final AllTokens allTokens = preprocessingContext.allTokens; + final AllWords allWords = preprocessingContext.allWords; + final AllStems allStems = preprocessingContext.allStems; + clusters = Lists.newArrayListWithCapacity(allTokens.image.length); + for (int i = 0; i < allTokens.image.length; i++) { + if (allTokens.wordIndex[i] >= 0) { + clusters.add(new Cluster(new String( + allStems.image[allWords.stemIndex[allTokens.wordIndex[i]]]))); + } + } + } +} diff --git a/solr/contrib/clustering/src/test/org/apache/solr/handler/clustering/carrot2/EchoTokensClusteringAlgorithm.java b/solr/contrib/clustering/src/test/org/apache/solr/handler/clustering/carrot2/EchoTokensClusteringAlgorithm.java new file mode 100644 index 00000000000..2ed2d95dbf5 --- /dev/null +++ b/solr/contrib/clustering/src/test/org/apache/solr/handler/clustering/carrot2/EchoTokensClusteringAlgorithm.java @@ -0,0 +1,69 @@ +package org.apache.solr.handler.clustering.carrot2; + +/** + * Licensed to the Apache Software Foundation (ASF) under one or more + * contributor license agreements. See the NOTICE file distributed with + * this work for additional information regarding copyright ownership. + * The ASF licenses this file to You under the Apache License, Version 2.0 + * (the "License"); you may not use this file except in compliance with + * the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ +import java.util.List; + +import org.carrot2.core.Cluster; +import org.carrot2.core.Document; +import org.carrot2.core.IClusteringAlgorithm; +import org.carrot2.core.LanguageCode; +import org.carrot2.core.ProcessingComponentBase; +import org.carrot2.core.ProcessingException; +import org.carrot2.core.attribute.AttributeNames; +import org.carrot2.core.attribute.Processing; +import org.carrot2.text.preprocessing.PreprocessingContext; +import org.carrot2.text.preprocessing.pipeline.BasicPreprocessingPipeline; +import org.carrot2.util.attribute.Attribute; +import org.carrot2.util.attribute.Bindable; +import org.carrot2.util.attribute.Input; +import org.carrot2.util.attribute.Output; + +import com.google.common.collect.Lists; + +/** + * A mock Carrot2 clustering algorithm that outputs each token of each document + * as a separate cluster. Useful only in tests. 
+ */ +@Bindable(prefix = "EchoTokensClusteringAlgorithm") +public class EchoTokensClusteringAlgorithm extends ProcessingComponentBase + implements IClusteringAlgorithm { + @Input + @Processing + @Attribute(key = AttributeNames.DOCUMENTS) + private List documents; + + @Output + @Processing + @Attribute(key = AttributeNames.CLUSTERS) + private List clusters; + + BasicPreprocessingPipeline preprocessing = new BasicPreprocessingPipeline(); + + @Override + public void process() throws ProcessingException { + final PreprocessingContext preprocessingContext = preprocessing.preprocess( + documents, "", LanguageCode.ENGLISH); + clusters = Lists + .newArrayListWithCapacity(preprocessingContext.allTokens.image.length); + for (char[] token : preprocessingContext.allTokens.image) { + if (token != null) { + clusters.add(new Cluster(new String(token))); + } + } + } +} From 664ab89dee64ee40d17ecb462ec6d0a996913cbb Mon Sep 17 00:00:00 2001 From: Uwe Schindler Date: Sun, 20 May 2012 12:06:22 +0000 Subject: [PATCH 38/47] SOLR-3471: Disable tests that don't work correctly on Windows git-svn-id: https://svn.apache.org/repos/asf/lucene/dev/trunk@1340687 13f79535-47bb-0310-9956-ffa450edef68 --- .../test/org/apache/solr/core/TestSolrDeletionPolicy1.java | 4 ++++ .../src/test/org/apache/solr/update/SoftAutoCommitTest.java | 4 ++++ 2 files changed, 8 insertions(+) diff --git a/solr/core/src/test/org/apache/solr/core/TestSolrDeletionPolicy1.java b/solr/core/src/test/org/apache/solr/core/TestSolrDeletionPolicy1.java index 1242c3fb568..53cec4828c7 100644 --- a/solr/core/src/test/org/apache/solr/core/TestSolrDeletionPolicy1.java +++ b/solr/core/src/test/org/apache/solr/core/TestSolrDeletionPolicy1.java @@ -17,6 +17,7 @@ package org.apache.solr.core; import org.apache.lucene.index.IndexCommit; +import org.apache.lucene.util.Constants; import org.apache.solr.SolrTestCaseJ4; import org.junit.Before; import org.junit.BeforeClass; @@ -109,6 +110,9 @@ public class TestSolrDeletionPolicy1 extends SolrTestCaseJ4 { @Test public void testCommitAge() throws InterruptedException { + assumeFalse("This test is not working on Windows (or maybe machines with only 2 CPUs)", + Constants.WINDOWS); + IndexDeletionPolicyWrapper delPolicy = h.getCore().getDeletionPolicy(); addDocs(); Map commits = delPolicy.getCommits(); diff --git a/solr/core/src/test/org/apache/solr/update/SoftAutoCommitTest.java b/solr/core/src/test/org/apache/solr/update/SoftAutoCommitTest.java index 8c2b3591a76..221f95a692b 100644 --- a/solr/core/src/test/org/apache/solr/update/SoftAutoCommitTest.java +++ b/solr/core/src/test/org/apache/solr/update/SoftAutoCommitTest.java @@ -24,6 +24,7 @@ import static org.junit.Assert.assertEquals; import java.util.concurrent.BlockingQueue; import java.util.concurrent.LinkedBlockingQueue; +import org.apache.lucene.util.Constants; import org.apache.solr.common.util.NamedList; import org.apache.solr.core.SolrCore; import org.apache.solr.core.SolrEventListener; @@ -62,6 +63,9 @@ public class SoftAutoCommitTest extends AbstractSolrTestCase { @Before public void createMonitor() throws Exception { + assumeFalse("This test is not working on Windows (or maybe machines with only 2 CPUs)", + Constants.WINDOWS); + SolrCore core = h.getCore(); updater = (DirectUpdateHandler2) core.getUpdateHandler(); From 8945e4b2ce2a66b01c1016628d91c527478e642c Mon Sep 17 00:00:00 2001 From: Michael McCandless Date: Sun, 20 May 2012 13:41:33 +0000 Subject: [PATCH 39/47] don't excessively call RateLimiter in tests git-svn-id: 
https://svn.apache.org/repos/asf/lucene/dev/trunk@1340713 13f79535-47bb-0310-9956-ffa450edef68 --- .../java/org/apache/lucene/store/MockIndexOutputWrapper.java | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/lucene/test-framework/src/java/org/apache/lucene/store/MockIndexOutputWrapper.java b/lucene/test-framework/src/java/org/apache/lucene/store/MockIndexOutputWrapper.java index 9658110e006..1b9b1adee68 100644 --- a/lucene/test-framework/src/java/org/apache/lucene/store/MockIndexOutputWrapper.java +++ b/lucene/test-framework/src/java/org/apache/lucene/store/MockIndexOutputWrapper.java @@ -78,7 +78,7 @@ public class MockIndexOutputWrapper extends IndexOutput { long freeSpace = dir.maxSize == 0 ? 0 : dir.maxSize - dir.sizeInBytes(); long realUsage = 0; - if (dir.rateLimiter != null) { + if (dir.rateLimiter != null && len >= 10) { dir.rateLimiter.pause(len); } From 5c714e8147b2476c46bf3991de6913a4309c6846 Mon Sep 17 00:00:00 2001 From: Simon Willnauer Date: Sun, 20 May 2012 18:39:51 +0000 Subject: [PATCH 40/47] fix testcase to not check unreliable thread state in join helper git-svn-id: https://svn.apache.org/repos/asf/lucene/dev/trunk@1340794 13f79535-47bb-0310-9956-ffa450edef68 --- .../apache/lucene/index/TestDocumentsWriterStallControl.java | 5 +---- 1 file changed, 1 insertion(+), 4 deletions(-) diff --git a/lucene/core/src/test/org/apache/lucene/index/TestDocumentsWriterStallControl.java b/lucene/core/src/test/org/apache/lucene/index/TestDocumentsWriterStallControl.java index 0252c9f1aa6..46052131015 100644 --- a/lucene/core/src/test/org/apache/lucene/index/TestDocumentsWriterStallControl.java +++ b/lucene/core/src/test/org/apache/lucene/index/TestDocumentsWriterStallControl.java @@ -27,7 +27,6 @@ import java.util.concurrent.atomic.AtomicBoolean; import org.apache.lucene.index.DocumentsWriterStallControl.MemoryController; import org.apache.lucene.util.LuceneTestCase; -import com.carrotsearch.randomizedtesting.annotations.Repeat; import com.carrotsearch.randomizedtesting.annotations.ThreadLeaks; /** @@ -59,7 +58,7 @@ public class TestDocumentsWriterStallControl extends LuceneTestCase { memCtrl.netBytes = 50; ctrl.updateStalled(memCtrl); assertFalse(ctrl.anyStalledThreads()); - join(waitThreads, 100); + join(waitThreads, 500); } public void testRandom() throws InterruptedException { @@ -297,8 +296,6 @@ public class TestDocumentsWriterStallControl extends LuceneTestCase { throws InterruptedException { for (Thread thread : toJoin) { thread.join(timeout); - assertEquals(thread.getState().toString(), Thread.State.TERMINATED, - thread.getState()); } } From abaec93967a7b10993de34870c4851c464c69c2a Mon Sep 17 00:00:00 2001 From: Mark Robert Miller Date: Sun, 20 May 2012 20:54:17 +0000 Subject: [PATCH 41/47] add a couple cloud props to multicore example solr.xml git-svn-id: https://svn.apache.org/repos/asf/lucene/dev/trunk@1340837 13f79535-47bb-0310-9956-ffa450edef68 --- solr/example/multicore/solr.xml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/solr/example/multicore/solr.xml b/solr/example/multicore/solr.xml index c6ed7e57983..ff97c67722b 100644 --- a/solr/example/multicore/solr.xml +++ b/solr/example/multicore/solr.xml @@ -28,7 +28,7 @@ adminPath: RequestHandler path to manage cores. 
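The assertion deleted from TestDocumentsWriterStallControl above was unreliable for a simple reason: Thread.join(millis) returns either because the thread terminated or because the timeout elapsed, so the state observed immediately after a timed join is not guaranteed to be TERMINATED. A standalone demonstration of the race (sleep durations are illustrative only):

```java
public final class TimedJoinDemo {
  public static void main(String[] args) throws InterruptedException {
    Thread worker = new Thread(new Runnable() {
      public void run() {
        try {
          Thread.sleep(200); // simulated work
        } catch (InterruptedException ignored) {
        }
      }
    });
    worker.start();

    worker.join(50); // may return before the worker finishes
    // Racy: can print TIMED_WAITING, RUNNABLE or TERMINATED.
    System.out.println("after timed join: " + worker.getState());

    worker.join(); // an untimed join is the reliable way to wait
    System.out.println("after untimed join: " + worker.getState()); // TERMINATED
  }
}
```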
If 'null' (or absent), cores will not be manageable via request handler --> - + From ff037852fc54d3bda26353c664799ac94df5af66 Mon Sep 17 00:00:00 2001 From: Mark Robert Miller Date: Sun, 20 May 2012 22:49:35 +0000 Subject: [PATCH 42/47] add ping and analysis request handlers for good UI defaults git-svn-id: https://svn.apache.org/repos/asf/lucene/dev/trunk@1340863 13f79535-47bb-0310-9956-ffa450edef68 --- solr/example/multicore/core0/conf/solrconfig.xml | 12 +++++++++++- solr/example/multicore/core1/conf/solrconfig.xml | 12 +++++++++++- 2 files changed, 22 insertions(+), 2 deletions(-) diff --git a/solr/example/multicore/core0/conf/solrconfig.xml b/solr/example/multicore/core0/conf/solrconfig.xml index 18d842b718a..d29101c22cf 100644 --- a/solr/example/multicore/core0/conf/solrconfig.xml +++ b/solr/example/multicore/core0/conf/solrconfig.xml @@ -51,9 +51,19 @@ + - + + + + solrpingquery + + + all + + + solr diff --git a/solr/example/multicore/core1/conf/solrconfig.xml b/solr/example/multicore/core1/conf/solrconfig.xml index 7bc5a3ac6dd..13c59fbf400 100644 --- a/solr/example/multicore/core1/conf/solrconfig.xml +++ b/solr/example/multicore/core1/conf/solrconfig.xml @@ -51,9 +51,19 @@ + - + + + + solrpingquery + + + all + + + solr From a29a6c6f29e23ce36eadc39cc4535966d23fc4e3 Mon Sep 17 00:00:00 2001 From: Mark Robert Miller Date: Sun, 20 May 2012 23:10:02 +0000 Subject: [PATCH 43/47] SOLR-3472: ping request handler should force distrib=false default git-svn-id: https://svn.apache.org/repos/asf/lucene/dev/trunk@1340869 13f79535-47bb-0310-9956-ffa450edef68 --- .../org/apache/solr/handler/PingRequestHandler.java | 11 ++++++++++- 1 file changed, 10 insertions(+), 1 deletion(-) diff --git a/solr/core/src/java/org/apache/solr/handler/PingRequestHandler.java b/solr/core/src/java/org/apache/solr/handler/PingRequestHandler.java index 7a991c76407..4206f634e86 100644 --- a/solr/core/src/java/org/apache/solr/handler/PingRequestHandler.java +++ b/solr/core/src/java/org/apache/solr/handler/PingRequestHandler.java @@ -25,6 +25,7 @@ import java.util.Locale; import org.apache.solr.common.SolrException; import org.apache.solr.common.params.CommonParams; +import org.apache.solr.common.params.ModifiableSolrParams; import org.apache.solr.common.params.SolrParams; import org.apache.solr.common.util.NamedList; import org.apache.solr.core.SolrCore; @@ -173,7 +174,15 @@ public class PingRequestHandler extends RequestHandlerBase implements SolrCoreAw { SolrParams params = req.getParams(); - SolrCore core = req.getCore(); + + // in this case, we want to default distrib to false so + // we only ping the single node + Boolean distrib = params.getBool("distrib"); + if (distrib == null) { + ModifiableSolrParams mparams = new ModifiableSolrParams(params); + mparams.set("distrib", false); + req.setParams(mparams); + } String actionParam = params.get("action"); ACTIONS action = null; From aee60cb3ab36e05bb560413f7c5c66d849791f11 Mon Sep 17 00:00:00 2001 From: Stefan Matheis Date: Mon, 21 May 2012 08:37:34 +0000 Subject: [PATCH 44/47] SOLR-3459: Fix Cloud's Graph-Views for multiple collections git-svn-id: https://svn.apache.org/repos/asf/lucene/dev/trunk@1340933 13f79535-47bb-0310-9956-ffa450edef68 --- solr/webapp/web/css/styles/cloud.css | 18 ++++++++++++++---- solr/webapp/web/js/scripts/cloud.js | 20 +++++++++++--------- 2 files changed, 25 insertions(+), 13 deletions(-) diff --git a/solr/webapp/web/css/styles/cloud.css b/solr/webapp/web/css/styles/cloud.css index 74163240d60..ef0c963045a 100644 --- 
a/solr/webapp/web/css/styles/cloud.css +++ b/solr/webapp/web/css/styles/cloud.css @@ -236,17 +236,17 @@ stroke-width: 1.5px; } -#content #graph-content .node.lvl-2 text +#content #graph-content .node.lvl-3 text { cursor: pointer; } -#content #graph-content .node.lvl-2:hover circle +#content #graph-content .node.lvl-3:hover circle { stroke: #000 !important; } -#content #graph-content .node.lvl-2:hover text +#content #graph-content .node.lvl-3:hover text { fill: #000 !important; } @@ -314,8 +314,18 @@ fill: #000; } -#content #graph-content .link.lvl-1, +#content #graph-content .link.lvl-2, #content #graph-content .link.leader { stroke: #c0c0c0; +} + +#content #graph-content .node.lvl-0 circle +{ + stroke: #fff; +} + +#content #graph-content .link.lvl-1 +{ + stroke: #fff; } \ No newline at end of file diff --git a/solr/webapp/web/js/scripts/cloud.js b/solr/webapp/web/js/scripts/cloud.js index 21b8783afb7..5aa9f2e1fc7 100644 --- a/solr/webapp/web/js/scripts/cloud.js +++ b/solr/webapp/web/js/scripts/cloud.js @@ -156,12 +156,12 @@ var helper_path_class = function( p ) var classes = [ 'link' ]; classes.push( 'lvl-' + p.target.depth ); - if( p.target.data.leader ) + if( p.target.data && p.target.data.leader ) { classes.push( 'leader' ); } - if( p.target.data.state ) + if( p.target.data && p.target.data.state ) { classes.push( p.target.data.state ); } @@ -174,12 +174,12 @@ var helper_node_class = function( d ) var classes = [ 'node' ]; classes.push( 'lvl-' + d.depth ); - if( d.data.leader ) + if( d.data && d.data.leader ) { classes.push( 'leader' ); } - if( d.data.state ) + if( d.data && d.data.state ) { classes.push( d.data.state ); } @@ -197,7 +197,7 @@ var helper_data = { var helper_node_text = function( d ) { - if( !d.data.uri ) + if( !d.data || !d.data.uri ) { return d.name; } @@ -361,7 +361,11 @@ var prepare_graph = function( graph_element, callback ) eval( 'state = ' + response.znode.data + ';' ); var leaf_count = 0; - var collections = []; + var graph_data = { + name: null, + children : [] + }; + for( var c in state ) { var shards = []; @@ -424,10 +428,8 @@ var prepare_graph = function( graph_element, callback ) }, children: shards }; - collections.push( collection ); + graph_data.children.push( collection ); } - - var graph_data = collections.shift(); helper_data.protocol = $.unique( helper_data.protocol ); helper_data.host = $.unique( helper_data.host ); From a79a14347d4ba81bc106598db904ec2b97321355 Mon Sep 17 00:00:00 2001 From: Stefan Matheis Date: Mon, 21 May 2012 08:47:39 +0000 Subject: [PATCH 45/47] SOLR-3234: Remove contrib/dataimport's webapp git-svn-id: https://svn.apache.org/repos/asf/lucene/dev/trunk@1340934 13f79535-47bb-0310-9956-ffa450edef68 --- .../src/webapp/admin/dataimport.jsp | 53 --------- .../src/webapp/admin/debug.jsp | 103 ------------------ 2 files changed, 156 deletions(-) delete mode 100644 solr/contrib/dataimporthandler/src/webapp/admin/dataimport.jsp delete mode 100644 solr/contrib/dataimporthandler/src/webapp/admin/debug.jsp diff --git a/solr/contrib/dataimporthandler/src/webapp/admin/dataimport.jsp b/solr/contrib/dataimporthandler/src/webapp/admin/dataimport.jsp deleted file mode 100644 index 667f8947d54..00000000000 --- a/solr/contrib/dataimporthandler/src/webapp/admin/dataimport.jsp +++ /dev/null @@ -1,53 +0,0 @@ -<%@ page import="org.apache.solr.request.SolrRequestHandler" %> -<%@ page import="java.util.Map" %> -<%@ page contentType="text/html; charset=utf-8" pageEncoding="UTF-8"%> -<%-- - Licensed to the Apache Software Foundation (ASF) under one or more - 
contributor license agreements. See the NOTICE file distributed with - this work for additional information regarding copyright ownership. - The ASF licenses this file to You under the Apache License, Version 2.0 - (the "License"); you may not use this file except in compliance with - the License. You may obtain a copy of the License at - - http://www.apache.org/licenses/LICENSE-2.0 - - Unless required by applicable law or agreed to in writing, software - distributed under the License is distributed on an "AS IS" BASIS, - WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. - See the License for the specific language governing permissions and - limitations under the License. ---%> -<%-- do a verbatim include so we can use the local vars --%> -<%@include file="_info.jsp"%> - -<% - String handler = request.getParameter("handler"); - - if (handler == null) { - Map handlers = core.getRequestHandlers(); -%> - [page titled "DataImportHandler Interactive Development" with a "Select handler:" list; surrounding markup lost in extraction] -<% } else { %> - [handler frame; markup lost in extraction] -<% } %> diff --git a/solr/contrib/dataimporthandler/src/webapp/admin/debug.jsp b/solr/contrib/dataimporthandler/src/webapp/admin/debug.jsp deleted file mode 100644 index 2c76ce728c8..00000000000 --- a/solr/contrib/dataimporthandler/src/webapp/admin/debug.jsp +++ /dev/null @@ -1,103 +0,0 @@ -<%@ page contentType="text/html; charset=utf-8" pageEncoding="UTF-8"%> -<%-- Apache License 2.0 header, identical to dataimport.jsp above --%> -<%-- do a verbatim include so we can use the local vars --%> -<%@include file="_info.jsp"%> - [page titled "DataImportHandler Interactive Development", heading "DataImportHandler Development Console"; markup lost in extraction] -<% - String handler = request.getParameter("handler"); // must be specified -%> - [console form: "Handler: <%=handler%>" with a "change handler" link; Verbose, Commit, Clean, Start Row and No. of Rows controls; a "data config xml" textarea; debug output frames; table markup lost in extraction]
- -Return to Admin Page - - From 98d15d4e6787779b2c97a0b908358b2e69c4d981 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Stanis=C5=82aw=20Osi=C5=84ski?= Date: Mon, 21 May 2012 08:57:31 +0000 Subject: [PATCH 46/47] SOLR-3470: Custom Carrot2 tokenizer and stemmer factories overwritten by defaults: fixing class loader issues, minor cleanups (Dawid Weiss) git-svn-id: https://svn.apache.org/repos/asf/lucene/dev/trunk@1340939 13f79535-47bb-0310-9956-ffa450edef68 --- solr/contrib/clustering/CHANGES.txt | 3 +- .../carrot2/CarrotClusteringEngine.java | 37 ++++++++++-- .../clustering/carrot2/CarrotParams.java | 57 ++++++++++++------- .../carrot2/CarrotClusteringEngineTest.java | 22 +++---- 4 files changed, 83 insertions(+), 36 deletions(-) diff --git a/solr/contrib/clustering/CHANGES.txt b/solr/contrib/clustering/CHANGES.txt index 1baee1dc05d..ebda2079ba3 100644 --- a/solr/contrib/clustering/CHANGES.txt +++ b/solr/contrib/clustering/CHANGES.txt @@ -9,7 +9,8 @@ CHANGES $Id$ ================== Release 4.0.0-dev ============== -(No Changes) +* SOLR-3470: Bug fix: custom Carrot2 tokenizer and stemmer factories are + respected now (Stanislaw Osinski, Dawid Weiss) ================== Release 3.6.0 ================== diff --git a/solr/contrib/clustering/src/java/org/apache/solr/handler/clustering/carrot2/CarrotClusteringEngine.java b/solr/contrib/clustering/src/java/org/apache/solr/handler/clustering/carrot2/CarrotClusteringEngine.java index edaffe18db5..b086318e99f 100644 --- a/solr/contrib/clustering/src/java/org/apache/solr/handler/clustering/carrot2/CarrotClusteringEngine.java +++ b/solr/contrib/clustering/src/java/org/apache/solr/handler/clustering/carrot2/CarrotClusteringEngine.java @@ -109,6 +109,9 @@ public class CarrotClusteringEngine extends SearchClusteringEngine { private Controller controller = ControllerFactory.createPooling(); private Class clusteringAlgorithmClass; + /** Solr core we're bound to. */ + private SolrCore core; + private static class SolrResourceLocator implements IResourceLocator { private final SolrResourceLoader resourceLoader; private final String carrot2ResourcesDir; @@ -147,7 +150,7 @@ public class CarrotClusteringEngine extends SearchClusteringEngine { public InputStream open() throws IOException { return new ByteArrayInputStream(asBytes); } - + @Override public int hashCode() { // In case multiple resources are found they will be deduped, but we don't use it in Solr, @@ -232,8 +235,19 @@ public class CarrotClusteringEngine extends SearchClusteringEngine { extractCarrotAttributes(sreq.getParams(), attributes); // Perform clustering and convert to named list - return clustersToNamedList(controller.process(attributes, - clusteringAlgorithmClass).getClusters(), sreq.getParams()); + // Carrot2 uses current thread's context class loader to get + // certain classes (e.g. custom tokenizer/stemmer) at runtime. + // To make sure classes from contrib JARs are available, + // we swap the context class loader for the time of clustering. 
+      Thread ct = Thread.currentThread();
+      ClassLoader prev = ct.getContextClassLoader();
+      try {
+        ct.setContextClassLoader(core.getResourceLoader().getClassLoader());
+        return clustersToNamedList(controller.process(attributes,
+            clusteringAlgorithmClass).getClusters(), sreq.getParams());
+      } finally {
+        ct.setContextClassLoader(prev);
+      }
     } catch (Exception e) {
       log.error("Carrot2 clustering failed", e);
       throw new SolrException(ErrorCode.SERVER_ERROR, "Carrot2 clustering failed", e);
@@ -243,6 +257,8 @@
   @Override
   @SuppressWarnings({ "unchecked", "rawtypes" })
   public String init(NamedList config, final SolrCore core) {
+    this.core = core;
+
     String result = super.init(config, core);
 
     final SolrParams initParams = SolrParams.toSolrParams(config);
@@ -277,8 +293,19 @@
           // Using the class loader directly because this time we want to omit the prefix
           new ClassLoaderLocator(core.getResourceLoader().getClassLoader())));
 
-    this.controller.init(initAttributes);
-
+    // Carrot2 uses current thread's context class loader to get
+    // certain classes (e.g. custom tokenizer/stemmer) at initialization time.
+    // To make sure classes from contrib JARs are available,
+    // we swap the context class loader for the time of initialization.
+    Thread ct = Thread.currentThread();
+    ClassLoader prev = ct.getContextClassLoader();
+    try {
+      ct.setContextClassLoader(core.getResourceLoader().getClassLoader());
+      this.controller.init(initAttributes);
+    } finally {
+      ct.setContextClassLoader(prev);
+    }
+
     SchemaField uniqueField = core.getSchema().getUniqueKeyField();
     if (uniqueField == null) {
       throw new SolrException(SolrException.ErrorCode.SERVER_ERROR,
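Both hunks above apply the same discipline: save the thread's context class loader, point it at the SolrResourceLoader's class loader for the duration of the call into Carrot2, and restore it in a finally block. As a standalone illustration, here is a minimal sketch of that pattern; the helper class and the withContextClassLoader name are illustrative only and are not part of this patch, which inlines the pattern instead:

import java.util.concurrent.Callable;

// Illustrative save/set/restore of the thread context class loader.
final class ContextClassLoaderSwap {
  static <T> T withContextClassLoader(ClassLoader cl, Callable<T> body) throws Exception {
    Thread current = Thread.currentThread();
    ClassLoader previous = current.getContextClassLoader();
    current.setContextClassLoader(cl); // make contrib/plugin classes visible to the callee
    try {
      return body.call();
    } finally {
      current.setContextClassLoader(previous); // always restore, even if body throws
    }
  }
}

The finally-based restore matters because servlet containers pool request threads; a leaked class loader would silently affect unrelated requests later handled by the same thread.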
diff --git a/solr/contrib/clustering/src/java/org/apache/solr/handler/clustering/carrot2/CarrotParams.java b/solr/contrib/clustering/src/java/org/apache/solr/handler/clustering/carrot2/CarrotParams.java
index 00050476a56..f9d7b757cb1 100644
--- a/solr/contrib/clustering/src/java/org/apache/solr/handler/clustering/carrot2/CarrotParams.java
+++ b/solr/contrib/clustering/src/java/org/apache/solr/handler/clustering/carrot2/CarrotParams.java
@@ -22,29 +22,48 @@ import com.google.common.collect.ImmutableSet;
  */
-public interface CarrotParams {
+/**
+ * Carrot2 parameter mapping (recognized and mapped if passed via Solr configuration).
+ */
+public final class CarrotParams {
 
-  String CARROT_PREFIX = "carrot.";
+  private static String CARROT_PREFIX = "carrot.";
 
-  String ALGORITHM = CARROT_PREFIX + "algorithm";
+  public static String ALGORITHM = CARROT_PREFIX + "algorithm";
 
-  String TITLE_FIELD_NAME = CARROT_PREFIX + "title";
-  String URL_FIELD_NAME = CARROT_PREFIX + "url";
-  String SNIPPET_FIELD_NAME = CARROT_PREFIX + "snippet";
-  String LANGUAGE_FIELD_NAME = CARROT_PREFIX + "lang";
-  String CUSTOM_FIELD_NAME = CARROT_PREFIX + "custom";
+  public static String TITLE_FIELD_NAME = CARROT_PREFIX + "title";
+  public static String URL_FIELD_NAME = CARROT_PREFIX + "url";
+  public static String SNIPPET_FIELD_NAME = CARROT_PREFIX + "snippet";
+  public static String LANGUAGE_FIELD_NAME = CARROT_PREFIX + "lang";
+  public static String CUSTOM_FIELD_NAME = CARROT_PREFIX + "custom";
 
-  String PRODUCE_SUMMARY = CARROT_PREFIX + "produceSummary";
-  String SUMMARY_FRAGSIZE = CARROT_PREFIX + "fragSize";
-  String SUMMARY_SNIPPETS = CARROT_PREFIX + "summarySnippets";
+  public static String PRODUCE_SUMMARY = CARROT_PREFIX + "produceSummary";
+  public static String SUMMARY_FRAGSIZE = CARROT_PREFIX + "fragSize";
+  public static String SUMMARY_SNIPPETS = CARROT_PREFIX + "summarySnippets";
 
-  String NUM_DESCRIPTIONS = CARROT_PREFIX + "numDescriptions";
-  String OUTPUT_SUB_CLUSTERS = CARROT_PREFIX + "outputSubClusters";
-  String LEXICAL_RESOURCES_DIR = CARROT_PREFIX + "lexicalResourcesDir";
-  String LANGUAGE_CODE_MAP = CARROT_PREFIX + "lcmap";
+  public static String NUM_DESCRIPTIONS = CARROT_PREFIX + "numDescriptions";
+  public static String OUTPUT_SUB_CLUSTERS = CARROT_PREFIX + "outputSubClusters";
+  public static String LEXICAL_RESOURCES_DIR = CARROT_PREFIX + "lexicalResourcesDir";
+  public static String LANGUAGE_CODE_MAP = CARROT_PREFIX + "lcmap";
 
-  public static final Set CARROT_PARAM_NAMES = ImmutableSet.of(
-      ALGORITHM, TITLE_FIELD_NAME, URL_FIELD_NAME, SNIPPET_FIELD_NAME, LANGUAGE_FIELD_NAME,
-      PRODUCE_SUMMARY, SUMMARY_FRAGSIZE, SUMMARY_SNIPPETS, NUM_DESCRIPTIONS, OUTPUT_SUB_CLUSTERS,
-      LEXICAL_RESOURCES_DIR);
+  static final Set CARROT_PARAM_NAMES = ImmutableSet.of(
+      ALGORITHM,
+
+      TITLE_FIELD_NAME,
+      URL_FIELD_NAME,
+      SNIPPET_FIELD_NAME,
+      LANGUAGE_FIELD_NAME,
+      CUSTOM_FIELD_NAME,
+
+      PRODUCE_SUMMARY,
+      SUMMARY_FRAGSIZE,
+      SUMMARY_SNIPPETS,
+
+      NUM_DESCRIPTIONS,
+      OUTPUT_SUB_CLUSTERS,
+      LEXICAL_RESOURCES_DIR,
+      LANGUAGE_CODE_MAP);
 
+  /** No instances. */
+  private CarrotParams() {}
 }
diff --git a/solr/contrib/clustering/src/test/org/apache/solr/handler/clustering/carrot2/CarrotClusteringEngineTest.java b/solr/contrib/clustering/src/test/org/apache/solr/handler/clustering/carrot2/CarrotClusteringEngineTest.java
index 911f03d787d..94502350bcd 100644
--- a/solr/contrib/clustering/src/test/org/apache/solr/handler/clustering/carrot2/CarrotClusteringEngineTest.java
+++ b/solr/contrib/clustering/src/test/org/apache/solr/handler/clustering/carrot2/CarrotClusteringEngineTest.java
@@ -205,7 +205,7 @@ public class CarrotClusteringEngineTest extends AbstractClusteringTestCase {
   }
 
   @Test
-  public void solrStopWordsUsedInCarrot2Clustering() throws Exception {
+  public void testSolrStopWordsUsedInCarrot2Clustering() throws Exception {
     ModifiableSolrParams params = new ModifiableSolrParams();
     params.set("merge-resources", false);
     params.set(AttributeUtils.getKey(
@@ -220,7 +220,7 @@
   }
 
   @Test
-  public void solrStopWordsNotDefinedOnAFieldForClustering() throws Exception {
+  public void testSolrStopWordsNotDefinedOnAFieldForClustering() throws Exception {
     ModifiableSolrParams params = new ModifiableSolrParams();
     // Force string fields to be used for clustering. Does not make sense
     // in the real world, but does the job in the test.
@@ -239,7 +239,7 @@
   }
 
   @Test
-  public void highlightingOfMultiValueField() throws Exception {
+  public void testHighlightingOfMultiValueField() throws Exception {
     final String snippetWithoutSummary = getLabels(clusterWithHighlighting(
         false, 30, 3, "multi", 1).get(0)).get(1);
     assertTrue("Snippet contains first value", snippetWithoutSummary.contains("First"));
@@ -256,7 +256,7 @@
   }
 
   @Test
-  public void concatenatingMultipleFields() throws Exception {
+  public void testConcatenatingMultipleFields() throws Exception {
     final ModifiableSolrParams params = new ModifiableSolrParams();
     params.add(CarrotParams.TITLE_FIELD_NAME, "title,heading");
     params.add(CarrotParams.SNIPPET_FIELD_NAME, "snippet,body");
@@ -271,7 +271,7 @@
   }
 
   @Test
-  public void highlightingMultipleFields() throws Exception {
+  public void testHighlightingMultipleFields() throws Exception {
     final TermQuery query = new TermQuery(new Term("snippet", "content"));
 
     final ModifiableSolrParams params = new ModifiableSolrParams();
@@ -297,7 +297,7 @@
   }
 
   @Test
-  public void oneCarrot2SupportedLanguage() throws Exception {
+  public void testOneCarrot2SupportedLanguage() throws Exception {
     final ModifiableSolrParams params = new ModifiableSolrParams();
     params.add(CarrotParams.LANGUAGE_FIELD_NAME, "lang");
 
@@ -309,7 +309,7 @@
   }
 
   @Test
-  public void oneCarrot2SupportedLanguageOfMany() throws Exception {
+  public void testOneCarrot2SupportedLanguageOfMany() throws Exception {
     final ModifiableSolrParams params = new ModifiableSolrParams();
     params.add(CarrotParams.LANGUAGE_FIELD_NAME, "lang");
 
@@ -321,7 +321,7 @@
   }
 
   @Test
-  public void languageCodeMapping() throws Exception {
+  public void testLanguageCodeMapping() throws Exception {
     final ModifiableSolrParams params = new ModifiableSolrParams();
     params.add(CarrotParams.LANGUAGE_FIELD_NAME, "lang");
     params.add(CarrotParams.LANGUAGE_CODE_MAP, "POLISH:pl");
@@ -334,7 +334,7 @@
   }
 
   @Test
-  public void passingOfCustomFields() throws Exception {
+  public void testPassingOfCustomFields() throws Exception {
     final ModifiableSolrParams params = new ModifiableSolrParams();
     params.add(CarrotParams.CUSTOM_FIELD_NAME, "intfield_i:intfield");
     params.add(CarrotParams.CUSTOM_FIELD_NAME, "floatfield_f:floatfield");
@@ -353,7 +353,7 @@
   }
 
   @Test
-  public void customTokenizer() throws Exception {
+  public void testCustomTokenizer() throws Exception {
     final ModifiableSolrParams params = new ModifiableSolrParams();
     params.add(CarrotParams.TITLE_FIELD_NAME, "title");
     params.add(CarrotParams.SNIPPET_FIELD_NAME, "snippet");
@@ -367,7 +367,7 @@
   }
 
   @Test
-  public void customStemmer() throws Exception {
+  public void testCustomStemmer() throws Exception {
     final ModifiableSolrParams params = new ModifiableSolrParams();
     params.add(CarrotParams.TITLE_FIELD_NAME, "title");
     params.add(CarrotParams.SNIPPET_FIELD_NAME, "snippet");
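To close out this commit: the CarrotParams constants above are what request-side code passes to drive clustering. A minimal, hypothetical sketch of assembling such a request, built only from parameters that appear in the tests above (field names and values are illustrative, not prescribed by the patch):

import org.apache.solr.common.params.ModifiableSolrParams;
import org.apache.solr.handler.clustering.carrot2.CarrotParams;

// Hypothetical clustering-request parameters, mirroring the tests above.
public final class ClusteringRequestExample {
  public static ModifiableSolrParams clusteringParams() {
    ModifiableSolrParams params = new ModifiableSolrParams();
    params.add(CarrotParams.TITLE_FIELD_NAME, "title");      // field holding document titles
    params.add(CarrotParams.SNIPPET_FIELD_NAME, "snippet");  // text that gets clustered
    params.add(CarrotParams.LANGUAGE_FIELD_NAME, "lang");    // per-document language field
    params.add(CarrotParams.LANGUAGE_CODE_MAP, "POLISH:pl"); // map custom codes to ISO codes
    return params;
  }
}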
From 20f10be75b469a4ca5817815b99098eb44c60cb6 Mon Sep 17 00:00:00 2001
From: Martijn van Groningen
Date: Mon, 21 May 2012 11:07:01 +0000
Subject: [PATCH 47/47] LUCENE-4068: Improve IW#addDocuments(...) javadoc

git-svn-id: https://svn.apache.org/repos/asf/lucene/dev/trunk@1340966 13f79535-47bb-0310-9956-ffa450edef68
---
 .../org/apache/lucene/index/IndexWriter.java | 19 +++++++++++++------
 1 file changed, 13 insertions(+), 6 deletions(-)

diff --git a/lucene/core/src/java/org/apache/lucene/index/IndexWriter.java b/lucene/core/src/java/org/apache/lucene/index/IndexWriter.java
index 28d16a8ef4f..d229c71d39a 100644
--- a/lucene/core/src/java/org/apache/lucene/index/IndexWriter.java
+++ b/lucene/core/src/java/org/apache/lucene/index/IndexWriter.java
@@ -1041,12 +1041,19 @@
    *
    * <p><b>WARNING</b>: the index does not currently record
    * which documents were added as a block. Today this is
-   * fine, because merging will preserve the block (as long
-   * as none of them were deleted). But it's possible in the
-   * future that Lucene may more aggressively re-order
-   * documents (for example, perhaps to obtain better index
-   * compression), in which case you may need to fully
-   * re-index your documents at that time.
+   * fine, because merging will preserve a block. The order of
+   * documents within a segment will be preserved, even when child
+   * documents within a block are deleted. Most search features
+   * (like result grouping and block joining) require you to
+   * mark documents; when these documents are deleted these
+   * search features will not work as expected. Obviously adding
+   * documents to an existing block will require you to reindex
+   * the entire block.
+   *
+   * <p>However it's possible that in the future Lucene may
+   * more aggressively re-order documents (for example, perhaps
+   * to obtain better index compression), in which case you may
+   * need to fully re-index your documents at that time.
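The contract spelled out in the added paragraphs is easier to see in code. Below is a minimal, hypothetical sketch of indexing one parent/child block with addDocuments() against the Lucene 4.x field API; the docType marker field and all names are illustrative application conventions, not Lucene features, and the sketch is not part of this patch:

import java.io.IOException;
import java.util.ArrayList;
import java.util.List;

import org.apache.lucene.document.Document;
import org.apache.lucene.document.Field.Store;
import org.apache.lucene.document.StringField;
import org.apache.lucene.document.TextField;
import org.apache.lucene.index.IndexWriter;

final class BlockIndexingExample {
  // Index a resume (parent) and its skills (children) as one block.
  static void addResumeBlock(IndexWriter writer) throws IOException {
    List<Document> block = new ArrayList<Document>();

    Document skill = new Document();
    skill.add(new TextField("skill", "java", Store.YES));
    block.add(skill); // child documents first

    Document resume = new Document();
    resume.add(new StringField("docType", "resume", Store.NO)); // parent marker
    resume.add(new TextField("name", "Jane Doe", Store.YES));
    block.add(resume); // by convention the parent comes last in the block

    // The block is added atomically and contiguously, but the index does not
    // record the grouping: updating any document later means re-adding the
    // whole block, as the warning above explains.
    writer.addDocuments(block);
  }
}

Block-join style search then relies on a marker like docType to tell parents from children, which is exactly why deleting individual documents inside a block makes those features misbehave.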
    *
    * <p>See {@link #addDocument(Iterable)} for details on
    * index and IndexWriter state after an Exception, and