SOLR-2452: Merged with trunk up to r1137526

git-svn-id: https://svn.apache.org/repos/asf/lucene/dev/branches/solr2452@1137527 13f79535-47bb-0310-9956-ffa450edef68
2011-06-20 07:12:59 +00:00 · 2011-06-20 07:12:59 +00:00 · 2e4fbd2baf
parent a9b8ed0002 4d68c56a04
commit 2e4fbd2baf
9 changed files with 67 additions and 62 deletions
--- a/lucene/CHANGES.txt
+++ b/lucene/CHANGES.txt
@ -451,12 +451,6 @@ Optimizations
  seek the term dictionary in TermQuery / TermWeight.
  (Simon Willnauer, Mike McCandless, Robert Muir)
 * LUCENE-2897: Apply deleted terms while flushing a segment.  We still
  buffer deleted terms to later apply to past segments.  (Mike McCandless)
 * LUCENE-1736: DateTools.java general improvements. 
  (David Smiley via Steve Rowe)
 Bug fixes
 * LUCENE-2633: PackedInts Packed32 and Packed64 did not support internal
@ -478,6 +472,10 @@ Changes in backwards compatibility policy
  of IndexInput) as its first argument.  (Robert Muir, Dawid Weiss,
  Mike McCandless)
 * LUCENE-3191: FieldComparator.value now returns an Object not
  Comparable; FieldDoc.fields also changed from Comparable[] to
  Object[] (Uwe Schindler, Mike McCandless)
 * LUCENE-3208: Made deprecated methods Query.weight(Searcher) and
  Searcher.createWeight() final to prevent override. If you have
  overridden one of these methods, cut over to the non-deprecated
@ -545,6 +543,11 @@ API Changes
  argument, so the merge policy knows which segments were originally
  present vs produced by an optimizing merge (Mike McCandless)
 Optimizations
 * LUCENE-1736: DateTools.java general improvements. 
  (David Smiley via Steve Rowe)
 New Features
 * LUCENE-3140: Added experimental FST implementation to Lucene.
--- a/lucene/contrib/misc/src/java/org/apache/lucene/index/PKIndexSplitter.java
+++ b/lucene/contrib/misc/src/java/org/apache/lucene/index/PKIndexSplitter.java
@ -34,6 +34,7 @@ import org.apache.lucene.util.Version;
 /**
 * Split an index based on a {@link Filter}.
 */
 public class PKIndexSplitter {
  private final Filter docsInFirstIndex;
  private final Directory input;
--- a/lucene/src/java/org/apache/lucene/index/IndexWriter.java
+++ b/lucene/src/java/org/apache/lucene/index/IndexWriter.java
@ -1674,11 +1674,13 @@ public class IndexWriter implements Closeable, TwoPhaseCommit {
      for(final MergePolicy.OneMerge merge  : pendingMerges) {
        merge.optimize = true;
        merge.maxNumSegmentsOptimize = maxNumSegments;
        segmentsToOptimize.put(merge.info, Boolean.TRUE);
      }
      for ( final MergePolicy.OneMerge merge: runningMerges ) {
        merge.optimize = true;
        merge.maxNumSegmentsOptimize = maxNumSegments;
        segmentsToOptimize.put(merge.info, Boolean.TRUE);
      }
    }
@ -1891,7 +1893,6 @@ public class IndexWriter implements Closeable, TwoPhaseCommit {
    final MergePolicy.MergeSpecification spec;
    if (optimize) {
      spec = mergePolicy.findMergesForOptimize(segmentInfos, maxNumSegmentsOptimize, Collections.unmodifiableMap(segmentsToOptimize));
      if (spec != null) {
        final int numMerges = spec.merges.size();
        for(int i=0;i<numMerges;i++) {
@ -3044,7 +3045,9 @@ public class IndexWriter implements Closeable, TwoPhaseCommit {
    if (merge.optimize) {
      // cascade the optimize:
-      segmentsToOptimize.put(merge.info, Boolean.FALSE);
+      if (!segmentsToOptimize.containsKey(merge.info)) {
        segmentsToOptimize.put(merge.info, Boolean.FALSE);
      }
    }
    return true;
--- a/lucene/src/java/org/apache/lucene/index/LogMergePolicy.java
+++ b/lucene/src/java/org/apache/lucene/index/LogMergePolicy.java
@ -353,7 +353,7 @@ public abstract class LogMergePolicy extends MergePolicy {
    assert maxNumSegments > 0;
    if (verbose()) {
-      message("findMergesForOptimize: maxNumSegs=" + maxNumSegments + " segsToOptimize= "+ segmentsToOptimize);
+      message("findMergesForOptimize: maxNumSegs=" + maxNumSegments + " segsToOptimize="+ segmentsToOptimize);
    }
    // If the segments are already optimized (e.g. there's only 1 segment), or
--- a/lucene/src/java/org/apache/lucene/index/UpgradeIndexMergePolicy.java
+++ b/lucene/src/java/org/apache/lucene/index/UpgradeIndexMergePolicy.java
@ -101,9 +101,7 @@ public class UpgradeIndexMergePolicy extends MergePolicy {
      // the resulting set contains all segments that are left over
      // and will be merged to one additional segment:
      for (final OneMerge om : spec.merges) {
-        for(SegmentInfo info : om.segments) {
+        oldSegments.keySet().removeAll(om.segments);
          oldSegments.remove(info);
        }
      }
    }
--- a/lucene/src/test/org/apache/lucene/index/TestPerFieldCodecSupport.java
+++ b/lucene/src/test/org/apache/lucene/index/TestPerFieldCodecSupport.java
@ -285,7 +285,7 @@ public class TestPerFieldCodecSupport extends LuceneTestCase {
      for (Codec codec : codecs) {
        provider.register(codec);
      }
-      int num = atLeast(30);
+      int num = _TestUtil.nextInt(random, 30, 60);
      for (int j = 0; j < num; j++) {
        provider.setFieldCodec("" + j, codecs[random.nextInt(codecs.length)].name);
      }
@ -296,7 +296,6 @@ public class TestPerFieldCodecSupport extends LuceneTestCase {
      IndexWriter writer = newWriter(dir, config);
      for (int j = 0; j < docsPerRound; j++) {
        final Document doc = new Document();
        num = atLeast(30);
        for (int k = 0; k < num; k++) {
          Field field = newField("" + k, _TestUtil
              .randomRealisticUnicodeString(random, 128), indexValue[random
--- a/lucene/src/test/org/apache/lucene/search/TestPhraseQuery.java
+++ b/lucene/src/test/org/apache/lucene/search/TestPhraseQuery.java
@ -617,7 +617,7 @@ public class TestPhraseQuery extends LuceneTestCase {
    int NUM_DOCS = atLeast(10);
    for (int i = 0; i < NUM_DOCS; i++) {
      // must be > 4096 so it spans multiple chunks
-      int termCount = atLeast(5000);
+      int termCount = _TestUtil.nextInt(random, 4097, 8200);
      List<String> doc = new ArrayList<String>();
--- a/lucene/src/test/org/apache/lucene/util/fst/TestFSTs.java
+++ b/lucene/src/test/org/apache/lucene/util/fst/TestFSTs.java
@ -963,7 +963,7 @@ public class TestFSTs extends LuceneTestCase {
  @Nightly
  public void testBigSet() throws IOException {
-    testRandomWords(atLeast(50000), atLeast(1));
+    testRandomWords(_TestUtil.nextInt(random, 50000, 60000), atLeast(1));
  }
  private static String inputToString(int inputMode, IntsRef term) {
--- a/solr/CHANGES.txt
+++ b/solr/CHANGES.txt
@ -65,28 +65,11 @@ New Features
  the cache when warming happens. 
  (Tomas Fernandez Lobbe and hossman)
 * SOLR-1915: DebugComponent now supports using a NamedList to model
  Explanation objects in it's responses instead of
  Explanation.toString  (hossman) 
 * SOLR-1932: New relevancy function queries: termfreq, tf, docfreq, idf
  norm, maxdoc, numdocs. (yonik)
 * SOLR-1682: (SOLR-236, SOLR-237, SOLR-1773, SOLR-1311) Search grouping / Field collapsing.
  (Martijn van Groningen, Emmanuel Keller, Shalin Shekhar Mangar,
   Koji Sekiguchi, Iván de Prado, Ryan McKinley, Marc Sturlese, Peter Karich,
   Bojan Smid, Charles Hornberger, Dieter Grad, Dmitry Lihachev, Doug Steigerwald,
   Karsten Sperling, Michael Gundlach, Oleg Gnatovskiy, Thomas Traeger,
   Harish Agarwal, yonik)
  SOLR-2564: Integrate grouping module into Solr. Also adds the ability to return number of
  groups that have match a query.
 * SOLR-1665: Add debug component options for timings, results and query info only (gsingers, hossman, yonik)
 * SOLR-2113: Add TermQParserPlugin, registered as "term".  This is useful
  when generating filter queries from terms returned from field faceting or
  the terms component. Example: fq={!term f=weight}1.5   (hossman, yonik) 
 * SOLR-2001: The query component will substitute an empty query that matches
  no documents if the query parser returns null.  This also prevents an
  exception from being thrown by the default parser if "q" is missing. (yonik)
@ -210,15 +193,6 @@ Bug Fixes
 * SOLR-2275: fix DisMax 'mm' parsing to be tolerant of whitespace
  (Erick Erickson via hossman)
 * SOLR-309: Fix FieldType so setting an analyzer on a FieldType that
  doesn't expect it will generate an error.  Practically speaking this
  means that Solr will now correctly generate an error on
  initialization if the schema.xml contains an analyzer configuration
  for a fieldType that does not use TextField.  (hossman) 
 * SOLR-2467: Fix <analyzer class="..." /> initialization so any errors 
  are logged properly.  (hossman)
 Other Changes
 ----------------------
@ -252,18 +226,9 @@ Other Changes
  Conversion from SolrInputDocument > Object > Fieldable is now managed
  by FieldType rather then DocumentBuilder.  (ryan)
 * SOLR-2061: Pull base tests out into a new Solr Test Framework module,
  and publish binary, javadoc, and source test-framework jars. 
  (Drew Farris, Robert Muir, Steve Rowe)
 * SOLR-2461: QuerySenderListener and AbstractSolrEventListener are 
  now public (hossman)
 * SOLR-2451: Enhance assertJQ to allow individual tests to specify the 
  tolerance delta used in numeric equalities.  This allows for slight 
  variance in asserting score comparisons in unit tests.
  (David Smiley, Chris Hostetter)
 * LUCENE-2995: Moved some spellchecker and suggest APIs to modules/suggest:
  HighFrequencyDictionary, SortedIterator, TermFreqIterator, and the
  suggester APIs and implementations. (rmuir)
@ -271,15 +236,6 @@ Other Changes
 * SOLR-2576: Remove deprecated SpellingResult.add(Token, int).
  (James Dyer via rmuir)
 * LUCENE-3204: The maven-ant-tasks jar is now included in the source tree;
  users of the generate-maven-artifacts target no longer have to manually
  place this jar in the Ant classpath.  NOTE: when Ant looks for the 
  maven-ant-tasks jar, it looks first in its pre-existing classpath, so
  any copies it finds will be used instead of the copy included in the 
  Lucene/Solr source tree.  For this reason, it is recommeded to remove
  any copies of the maven-ant-tasks jar in the Ant classpath, e.g. under
  ~/.ant/lib/ or under the Ant installation's lib/ directory. (Steve Rowe)
 Documentation
 ----------------------
@ -302,6 +258,14 @@ New Features
  previous Tokenizers/TokenFilters (called "positionHistory").
  (Uwe Schindler)
 * SOLR-2524: (SOLR-236, SOLR-237, SOLR-1773, SOLR-1311) Grouping / Field collapsing
  using the Lucene grouping contrib. The search result can be grouped by field and query. 
  (Martijn van Groningen, Emmanuel Keller, Shalin Shekhar Mangar, Koji Sekiguchi, 
   Iván de Prado, Ryan McKinley, Marc Sturlese, Peter Karich, Bojan Smid, 
   Charles Hornberger, Dieter Grad, Dmitry Lihachev, Doug Steigerwald,
   Karsten Sperling, Michael Gundlach, Oleg Gnatovskiy, Thomas Traeger,
   Harish Agarwal, yonik, Michael McCandless, Bill Bell)
 Optimizations
 ----------------------
@ -332,6 +296,17 @@ Other Changes
  SpellingResult.addFrequency(Token token, int docFreq) instead.
  (James Dyer via rmuir)
 * SOLR-2574: Upgrade slf4j to v1.6.1 (shalin)
 * LUCENE-3204: The maven-ant-tasks jar is now included in the source tree;
  users of the generate-maven-artifacts target no longer have to manually
  place this jar in the Ant classpath.  NOTE: when Ant looks for the 
  maven-ant-tasks jar, it looks first in its pre-existing classpath, so
  any copies it finds will be used instead of the copy included in the 
  Lucene/Solr source tree.  For this reason, it is recommeded to remove
  any copies of the maven-ant-tasks jar in the Ant classpath, e.g. under
  ~/.ant/lib/ or under the Ant installation's lib/ directory. (Steve Rowe)
 ==================  3.2.0  ==================
 Versions of Major Components
 ---------------------
@ -359,6 +334,14 @@ New Features
  Example: [{"id":"doc1"},{"id":"doc2"}] 
  (yonik)
 * SOLR-2113: Add TermQParserPlugin, registered as "term".  This is useful
  when generating filter queries from terms returned from field faceting or
  the terms component. Example: fq={!term f=weight}1.5   (hossman, yonik) 
 * SOLR-1915: DebugComponent now supports using a NamedList to model
  Explanation objects in it's responses instead of
  Explanation.toString  (hossman)
 Optimizations
 ----------------------
@ -401,6 +384,9 @@ Bug Fixes
  did not clear all attributes so they displayed incorrect attribute values for tokens
  in later filter stages. (uschindler, rmuir, yonik)
 * SOLR-2467: Fix <analyzer class="..." /> initialization so any errors 
  are logged properly.  (hossman)
 * SOLR-2493: SolrQueryParser was fixed to not parse the SolrConfig DOM tree on each
  instantiation which is a huge slowdown.  (Stephane Bailliez via uschindler)
@ -418,12 +404,27 @@ Bug Fixes
 * SOLR-2539: VectorValueSource.floatVal incorrectly used byteVal on sub-sources.
  (Tom Liu via yonik)
 * SOLR-2554: RandomSortField didn't work when used in a function query. (yonik)
 Other Changes
 ----------------------
 * SOLR-2061: Pull base tests out into a new Solr Test Framework module,
  and publish binary, javadoc, and source test-framework jars. 
  (Drew Farris, Robert Muir, Steve Rowe)
 * SOLR-2105: Rename RequestHandler param 'update.processor' to 'update.chain'.
 	(Jan Høydahl via Mark Miller)
 * SOLR-2485: Deprecate BaseResponseWriter, GenericBinaryResponseWriter, and 
  GenericTextResponseWriter.  These classes will be removed in 4.0.  (ryan)
 * SOLR-2451: Enhance assertJQ to allow individual tests to specify the 
  tolerance delta used in numeric equalities.  This allows for slight 
  variance in asserting score comparisons in unit tests.
  (David Smiley, Chris Hostetter)
 * SOLR-2528: Remove default="true" from HtmlEncoder in example solrconfig.xml,
  because html encoding confuses non-ascii users. (koji)