SOLR-1296: Add support for termInfosIndexDivisor and termIndexInterval

git-svn-id: https://svn.apache.org/repos/asf/lucene/solr/trunk@814160 13f79535-47bb-0310-9956-ffa450edef68
2009-09-12 12:27:42 +00:00 · 2009-09-12 12:27:42 +00:00 · 9b936ce650
parent fc1892279f
commit 9b936ce650
9 changed files with 602 additions and 15 deletions
--- a/CHANGES.txt
+++ b/CHANGES.txt
@ -350,7 +350,7 @@ Optimizations
 11. SOLR-1169: SortedIntDocSet - a new small set implementation
    that saves memory over HashDocSet, is faster to construct, 
-    is ordered for easier impelemntation of skipTo, and is faster
+    is ordered for easier implementation of skipTo, and is faster
    in the general case. (yonik)
 12. SOLR-1165: Use Lucene Filters and pass them down to the Lucene
@ -367,6 +367,8 @@ Optimizations
 16. SOLR-1353: Implement and use reusable token streams for analysis. (yonik)
 17. SOLR-1296: Enables setting IndexReader's termInfosIndexDivisor via a new attribute to StandardIndexReaderFactory.  Enables
    setting termIndexInterval to IndexWriter via SolrIndexConfig. (Jason Rutherglen, gsingers)
 Bug Fixes
 ----------------------
--- a/example/solr/conf/solrconfig.xml
+++ b/example/solr/conf/solrconfig.xml
@ -99,6 +99,10 @@
       if not specified.)
    -->
    <lockType>native</lockType>
    <!--
     Expert:
    Controls how often Lucene loads terms into memory -->
    <!--<termIndexInterval>256</termIndexInterval>-->
  </indexDefaults>
  <mainIndex>
@ -122,7 +126,12 @@
    <!-- If true, IndexReaders will be reopened (often more efficient) instead
         of closed and then opened.  -->
    <reopenReaders>true</reopenReaders>
-	  
+
    <!--
     Expert:
    Controls how often Lucene loads terms into memory.  Default is 128 and is likely good for most everyone. -->
    <!--<termIndexInterval>256</termIndexInterval>-->
    <!--
        Custom deletion policies can be specified here. The class must
        implement org.apache.lucene.index.IndexDeletionPolicy.
@ -218,6 +227,10 @@
    Parameters as required by the implementation
  </indexReaderFactory >
  -->
  <!-- To set the termInfosIndexDivisor, do this: -->
  <!--<indexReaderFactory name="IndexReaderFactory" class="org.apache.solr.core.StandardIndexReaderFactory">
    <int name="termInfosIndexDivisor">12</int>
  </indexReaderFactory >-->
  <query>
--- a/src/java/org/apache/solr/core/IndexReaderFactory.java
+++ b/src/java/org/apache/solr/core/IndexReaderFactory.java
@ -27,15 +27,30 @@ import org.apache.solr.util.plugin.NamedListInitializedPlugin;
 * Factory used to build a new IndexReader instance.
 */
 public abstract class IndexReaderFactory implements NamedListInitializedPlugin {
-
+  protected int termInfosIndexDivisor = 1;//IndexReader.DEFAULT_TERMS_INDEX_DIVISOR;  Set this once Lucene makes this public.
  /**
   * Potentially initializes {@link #termInfosIndexDivisor}.  Overriding classes should call super.init() in order
   * to make sure termInfosIndexDivisor is set.
   * <p>
   * <code>init</code> will be called just once, immediately after creation.
   * <p>
   * The args are user-level initialization parameters that may be specified
   * when declaring an indexReaderFactory in solrconfig.xml
   *
   */
  public void init(NamedList args) {
-    /* :NOOP: */
+    Integer v = (Integer)args.get("termInfosIndexDivisor");
    if (v != null) {
      termInfosIndexDivisor = v.intValue();
    }
  }
  /**
   * Returns the current value of {@link #termInfosIndexDivisor}.
   * <p>
   * The field starts out as 1 and is only changed when {@link #init(NamedList)}
   * is given a <code>termInfosIndexDivisor</code> argument.
   *
   * @return the configured terms index divisor
   */
  public int getTermInfosIndexDivisor() {
    return this.termInfosIndexDivisor;
  }
  /**
--- a/src/java/org/apache/solr/core/StandardIndexReaderFactory.java
+++ b/src/java/org/apache/solr/core/StandardIndexReaderFactory.java
@ -20,6 +20,7 @@ import java.io.IOException;
 import org.apache.lucene.index.IndexReader;
 import org.apache.lucene.store.Directory;
 import org.apache.solr.common.util.NamedList;
 /**
 * Default IndexReaderFactory implementation. Returns a standard Lucene
@ -28,12 +29,12 @@ import org.apache.lucene.store.Directory;
 * @see IndexReader#open(Directory)
 */
 public class StandardIndexReaderFactory extends IndexReaderFactory {
-
+  
  /* (non-Javadoc)
   * @see org.apache.solr.core.IndexReaderFactory#newReader(org.apache.lucene.store.Directory, boolean)
   */
  public IndexReader newReader(Directory indexDir, boolean readOnly)
      throws IOException {
-    return IndexReader.open(indexDir, readOnly);
+    return IndexReader.open(indexDir, null, readOnly, termInfosIndexDivisor);
  }
 }
--- a/src/java/org/apache/solr/update/SolrIndexConfig.java
+++ b/src/java/org/apache/solr/update/SolrIndexConfig.java
@ -20,6 +20,7 @@ package org.apache.solr.update;
 import org.apache.solr.core.SolrConfig;
 import org.apache.lucene.index.LogByteSizeMergePolicy;
 import org.apache.lucene.index.ConcurrentMergeScheduler;
 import org.apache.lucene.index.IndexWriter;
 import org.slf4j.Logger;
 import org.slf4j.LoggerFactory;
@ -53,6 +54,7 @@ public class SolrIndexConfig {
    mergePolicyClassName = DEFAULT_MERGE_POLICY_CLASSNAME;
    mergeSchedulerClassname = DEFAULT_MERGE_SCHEDULER_CLASSNAME;
    luceneAutoCommit = false;
    termIndexInterval = IndexWriter.DEFAULT_TERM_INDEX_INTERVAL;
  }
  public final boolean useCompoundFile;
@ -69,6 +71,7 @@ public class SolrIndexConfig {
  public final String mergePolicyClassName;
  public final String mergeSchedulerClassname;
  public final boolean luceneAutoCommit;
  public final int termIndexInterval;
  public String infoStreamFile = null;
@ -90,6 +93,7 @@ public class SolrIndexConfig {
    mergePolicyClassName = solrConfig.get(prefix + "/mergePolicy", def.mergePolicyClassName);
    mergeSchedulerClassname = solrConfig.get(prefix + "/mergeScheduler", def.mergeSchedulerClassname);
    luceneAutoCommit = solrConfig.getBool(prefix + "/luceneAutoCommit", def.luceneAutoCommit);
    termIndexInterval = solrConfig.getInt(prefix + "/termIndexInterval", def.termIndexInterval);
    boolean infoStreamEnabled = solrConfig.getBool(prefix + "/infoStream", false);
    if(infoStreamEnabled) {
--- a/src/java/org/apache/solr/update/SolrIndexWriter.java
+++ b/src/java/org/apache/solr/update/SolrIndexWriter.java
@ -69,6 +69,10 @@ public class SolrIndexWriter extends IndexWriter {
      if (config.ramBufferSizeMB != -1) {
        setRAMBufferSizeMB(config.ramBufferSizeMB);
      }
      if (config.termIndexInterval != -1) {
        setTermIndexInterval(config.termIndexInterval);
      }
      if (config.maxMergeDocs != -1) setMaxMergeDocs(config.maxMergeDocs);
      if (config.maxFieldLength != -1) setMaxFieldLength(config.maxFieldLength);
      if (config.mergePolicyClassName != null && SolrIndexConfig.DEFAULT_MERGE_POLICY_CLASSNAME.equals(config.mergePolicyClassName) == false) {
--- a/src/test/org/apache/solr/core/IndexReaderFactoryTest.java
+++ b/src/test/org/apache/solr/core/IndexReaderFactoryTest.java
@ -0,0 +1,48 @@
 package org.apache.solr.core;
 /**
 * Licensed to the Apache Software Foundation (ASF) under one or more
 * contributor license agreements.  See the NOTICE file distributed with
 * this work for additional information regarding copyright ownership.
 * The ASF licenses this file to You under the Apache License, Version 2.0
 * (the "License"); you may not use this file except in compliance with
 * the License.  You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
 import org.apache.lucene.index.IndexReader;
 import org.apache.lucene.store.Directory;
 import org.apache.solr.util.AbstractSolrTestCase;
 import java.io.IOException;
 /**
  * Checks that the <code>indexReaderFactory</code> declared in
  * <code>solrconfig-termindex.xml</code> is loaded by the core and that its
  * <code>termInfosIndexDivisor</code> init argument is picked up.
  */
 public class IndexReaderFactoryTest extends AbstractSolrTestCase {

  /** @return the schema file used to start the test core */
  public String getSchemaFile() {
    return "schema.xml";
  }

  /** @return the config file that declares the factory with termInfosIndexDivisor=12 */
  public String getSolrConfigFile() {
    return "solrconfig-termindex.xml";
  }

  /**
   * Ensures the core is using a {@link StandardIndexReaderFactory} and that the
   * factory reports the divisor configured in solrconfig-termindex.xml (12).
   *
   * @throws Exception if the core or its reader factory cannot be obtained
   */
  public void testAltReaderUsed() throws Exception {
    IndexReaderFactory readerFactory = h.getCore().getIndexReaderFactory();
    assertNotNull("Factory is null", readerFactory);
    // The failure message names the class that is actually being checked.
    assertTrue("readerFactory is not an instanceof " + StandardIndexReaderFactory.class,
        readerFactory instanceof StandardIndexReaderFactory);
    // assertEquals reports the actual value on failure, unlike assertTrue(a == b).
    assertEquals("termInfosIndexDivisor not set to 12", 12, readerFactory.getTermInfosIndexDivisor());
  }
 }
--- a/src/test/org/apache/solr/core/TestConfig.java
+++ b/src/test/org/apache/solr/core/TestConfig.java
@ -17,18 +17,30 @@
 package org.apache.solr.core;
 import org.apache.lucene.index.IndexWriter;
 import org.apache.solr.handler.admin.ShowFileRequestHandler;
-import org.apache.solr.util.AbstractSolrTestCase;
+import org.apache.solr.search.SolrIndexReader;
 import org.apache.solr.search.SolrIndexSearcher;
 import org.apache.solr.update.DirectUpdateHandler2;
 import org.apache.solr.update.SolrIndexConfig;
 import org.apache.solr.util.AbstractSolrTestCase;
 import org.apache.solr.util.RefCounted;
 import org.w3c.dom.Node;
 import org.w3c.dom.NodeList;
 import javax.xml.xpath.XPathConstants;
 import java.io.IOException;
 public class TestConfig extends AbstractSolrTestCase {
-  public String getSchemaFile() { return "schema.xml"; }
+  public String getSchemaFile() {
-  public String getSolrConfigFile() { return "solrconfig.xml"; }
+    return "schema.xml";
  }
  //public String getSolrConfigFile() { return "solrconfig.xml"; }
  public String getSolrConfigFile() {
    return "solrconfig-termindex.xml";
  }
  public void testJavaProperty() {
    // property values defined in build.xml
@ -65,15 +77,44 @@ public class TestConfig extends AbstractSolrTestCase {
  }
  // sometimes the config refers to old things, which must be replaced with new stuff
-  public void testAutomaticDeprecationSupport()
+  public void testAutomaticDeprecationSupport() {
  {
    // make sure the "admin/file" handler is registered
-    ShowFileRequestHandler handler = (ShowFileRequestHandler) h.getCore().getRequestHandler( "/admin/file" );
+    ShowFileRequestHandler handler = (ShowFileRequestHandler) h.getCore().getRequestHandler("/admin/file");
-    assertTrue( "file handler should have been automatically registered", handler!=null );
+    assertTrue("file handler should have been automatically registered", handler != null);
    //System.out.println( handler.getHiddenFiles() );
    // should not contain: <gettableFiles>solrconfig.xml scheam.xml admin-extra.html</gettableFiles>
-    assertFalse( handler.getHiddenFiles().contains( "scheam.xml".toUpperCase() ) );
+    assertFalse(handler.getHiddenFiles().contains("scheam.xml".toUpperCase()));
-    assertTrue( handler.getHiddenFiles().contains( "PROTWORDS.TXT" ) );
+    assertTrue(handler.getHiddenFiles().contains("PROTWORDS.TXT"));
  }
  /**
   * Verifies that the <code>termIndexInterval</code> of 256 configured in
   * solrconfig-termindex.xml is applied to the IndexWriter opened by the
   * update handler.
   *
   * @throws Exception if the update handler or its writer cannot be opened
   */
  public void testTermIndexInterval() throws Exception {
    // Local subclass used only to reach the handler's writer from the test.
    class ExposeWriterHandler extends DirectUpdateHandler2 {
      public ExposeWriterHandler() throws IOException {
        super(h.getCore());
      }

      public IndexWriter getWriter() throws IOException {
        forceOpenWriter();
        return writer;
      }
    }

    ExposeWriterHandler handler = new ExposeWriterHandler();
    try {
      IndexWriter writer = handler.getWriter();
      assertEquals(256, writer.getTermIndexInterval());
    } finally {
      // Close the handler so the writer opened above is not leaked,
      // even when the assertion fails.
      handler.close();
    }
  }
  /**
   * Verifies that the <code>termInfosIndexDivisor</code> of 12 configured on the
   * indexReaderFactory in solrconfig-termindex.xml is visible both on the
   * factory and on the reader of the core's current searcher.
   *
   * @throws Exception if the searcher or its reader cannot be obtained
   */
  public void testTermIndexDivisor() throws Exception {
    IndexReaderFactory irf = h.getCore().getIndexReaderFactory();
    StandardIndexReaderFactory sirf = (StandardIndexReaderFactory) irf;
    assertEquals(12, sirf.getTermInfosIndexDivisor());

    RefCounted<SolrIndexSearcher> refCounted = h.getCore().getSearcher();
    try {
      SolrIndexReader solrReader = refCounted.get().getReader();
      assertEquals(12, solrReader.getTermInfosIndexDivisor());
    } finally {
      // Give back the reference taken by getSearcher() so the searcher can be released.
      refCounted.decref();
    }
  }
 }
--- a/src/test/test-files/solr/conf/solrconfig-termindex.xml
+++ b/src/test/test-files/solr/conf/solrconfig-termindex.xml
@ -0,0 +1,459 @@
 <?xml version="1.0" ?>
 <!--
 Licensed to the Apache Software Foundation (ASF) under one or more
 contributor license agreements.  See the NOTICE file distributed with
 this work for additional information regarding copyright ownership.
 The ASF licenses this file to You under the Apache License, Version 2.0
 (the "License"); you may not use this file except in compliance with
 the License.  You may obtain a copy of the License at
     http://www.apache.org/licenses/LICENSE-2.0
 Unless required by applicable law or agreed to in writing, software
 distributed under the License is distributed on an "AS IS" BASIS,
 WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 See the License for the specific language governing permissions and
 limitations under the License.
 -->
 <!-- $Id: solrconfig.xml 382610 2006-03-03 01:43:03Z yonik $
     $Source$
     $Name$
  -->
 <config>
  <jmx />
  <!-- Used to specify an alternate directory to hold all index data.
       It defaults to "index" if not present, and should probably
       not be changed if replication is in use. -->
  <dataDir>${solr.data.dir:./solr/data}</dataDir>
  <indexDefaults>
   <!-- Values here affect all index writers and act as a default
   unless overridden. -->
    <!-- Values here affect all index writers and act as a default unless overridden. -->
    <useCompoundFile>false</useCompoundFile>
    <mergeFactor>10</mergeFactor>
    <!-- If both ramBufferSizeMB and maxBufferedDocs are set, then Lucene will flush based on whichever limit is hit first.
     -->
    <!--<maxBufferedDocs>1000</maxBufferedDocs>-->
    <!-- Tell Lucene when to flush documents to disk.
    Giving Lucene more memory for indexing means faster indexing at the cost of more RAM.
    If both ramBufferSizeMB and maxBufferedDocs are set, then Lucene will flush based on whichever limit is hit first.
    -->
    <ramBufferSizeMB>32</ramBufferSizeMB>
    <maxMergeDocs>2147483647</maxMergeDocs>
    <maxFieldLength>10000</maxFieldLength>
    <writeLockTimeout>1000</writeLockTimeout>
    <commitLockTimeout>10000</commitLockTimeout>
    <!-- 
     Expert: Turn on Lucene's auto commit capability.
     NOTE: Despite the name, this value does not have any relation to Solr's autoCommit functionality
     -->
    <luceneAutoCommit>false</luceneAutoCommit>
    <!--
     Expert:
     The Merge Policy in Lucene controls how merging is handled by Lucene.  The default in 2.3 is the LogByteSizeMergePolicy, previous
     versions used LogDocMergePolicy.
     LogByteSizeMergePolicy chooses segments to merge based on their size.  The Lucene 2.2 default, LogDocMergePolicy chose when
     to merge based on number of documents
     Other implementations of MergePolicy must have a no-argument constructor
     -->
    <mergePolicy>org.apache.lucene.index.LogByteSizeMergePolicy</mergePolicy>
    <!--
     Expert:
     The Merge Scheduler in Lucene controls how merges are performed.  The ConcurrentMergeScheduler (Lucene 2.3 default)
      can perform merges in the background using separate threads.  The SerialMergeScheduler (Lucene 2.2 default) does not.
     -->
    <mergeScheduler>org.apache.lucene.index.ConcurrentMergeScheduler</mergeScheduler>
    <!-- these are global... can't currently override per index -->
    <writeLockTimeout>1000</writeLockTimeout>
    <commitLockTimeout>10000</commitLockTimeout>
    <!-- Controls how often Lucene loads terms into memory -->
    <termIndexInterval>256</termIndexInterval>
    <lockType>single</lockType>
  </indexDefaults>
  <mainIndex>
    <!-- lucene options specific to the main on-disk lucene index -->
    <useCompoundFile>false</useCompoundFile>
    <mergeFactor>10</mergeFactor>
    <!-- for better multi-segment testing, we are using slower
    indexing properties of maxBufferedDocs=10 and LogDocMergePolicy.
    -->
    <maxBufferedDocs>10</maxBufferedDocs>
    <termIndexInterval>256</termIndexInterval>
    <maxMergeDocs>2147483647</maxMergeDocs>
    <maxFieldLength>10000</maxFieldLength>
    <mergePolicy>org.apache.lucene.index.LogDocMergePolicy</mergePolicy>
    <unlockOnStartup>true</unlockOnStartup>
  </mainIndex>
  <updateHandler class="solr.DirectUpdateHandler2">
    <!-- autocommit pending docs if certain criteria are met 
    <autoCommit> 
      <maxDocs>10000</maxDocs>
      <maxTime>3600000</maxTime> 
    </autoCommit>
    -->
    <!-- represents a lower bound on the frequency that commits may
    occur (in seconds). NOTE: not yet implemented
    <commitIntervalLowerBound>0</commitIntervalLowerBound>
    -->
    <!-- The RunExecutableListener executes an external command.
         exe - the name of the executable to run
         dir - dir to use as the current working directory. default="."
         wait - the calling thread waits until the executable returns. default="true"
         args - the arguments to pass to the program.  default=nothing
         env - environment variables to set.  default=nothing
      -->
    <!-- A postCommit event is fired after every commit
    <listener event="postCommit" class="solr.RunExecutableListener">
      <str name="exe">/var/opt/resin3/__PORT__/scripts/solr/snapshooter</str>
      <str name="dir">/var/opt/resin3/__PORT__</str>
      <bool name="wait">true</bool>
      <arr name="args"> <str>arg1</str> <str>arg2</str> </arr>
      <arr name="env"> <str>MYVAR=val1</str> </arr>
    </listener>
    -->
  </updateHandler>
  <indexReaderFactory name="IndexReaderFactory" class="org.apache.solr.core.StandardIndexReaderFactory">
    <int name="termInfosIndexDivisor">12</int>
  </indexReaderFactory >
  <query>
    <!-- Maximum number of clauses in a boolean query... can affect
        range or wildcard queries that expand to big boolean
        queries.  An exception is thrown if exceeded.
    -->
    <maxBooleanClauses>1024</maxBooleanClauses>
    <!-- Cache specification for Filters or DocSets - unordered set of *all* documents
         that match a particular query.
      -->
    <filterCache
      class="solr.search.FastLRUCache"
      size="512"
      initialSize="512"
      autowarmCount="256"/>
    <queryResultCache
      class="solr.search.LRUCache"
      size="512"
      initialSize="512"
      autowarmCount="1024"/>
    <documentCache
      class="solr.search.LRUCache"
      size="512"
      initialSize="512"
      autowarmCount="0"/>
    <!-- If true, stored fields that are not requested will be loaded lazily.
    -->
    <enableLazyFieldLoading>true</enableLazyFieldLoading>
    <!--
    <cache name="myUserCache"
      class="solr.search.LRUCache"
      size="4096"
      initialSize="1024"
      autowarmCount="1024"
      regenerator="MyRegenerator"
      />
    -->
    <!--
    <useFilterForSortedQuery>true</useFilterForSortedQuery>
    -->
    <queryResultWindowSize>10</queryResultWindowSize>
    <!-- set maxSize artificially low to exercise both types of sets -->
    <HashDocSet maxSize="3" loadFactor="0.75"/>
    <!-- boolToFilterOptimizer converts boolean clauses with zero boost
         into cached filters if the number of docs selected by the clause exceeds
         the threshold (represented as a fraction of the total index)
    -->
    <boolTofilterOptimizer enabled="false" cacheSize="32" threshold=".05"/>
    <!-- a newSearcher event is fired whenever a new searcher is being prepared
         and there is a current searcher handling requests (aka registered). -->
    <!-- QuerySenderListener takes an array of NamedList and executes a
         local query request for each NamedList in sequence. -->
    <!--
    <listener event="newSearcher" class="solr.QuerySenderListener">
      <arr name="queries">
        <lst> <str name="q">solr</str> <str name="start">0</str> <str name="rows">10</str> </lst>
        <lst> <str name="q">rocks</str> <str name="start">0</str> <str name="rows">10</str> </lst>
      </arr>
    </listener>
    -->
    <!-- a firstSearcher event is fired whenever a new searcher is being
         prepared but there is no current registered searcher to handle
         requests or to gain prewarming data from. -->
    <!--
    <listener event="firstSearcher" class="solr.QuerySenderListener">
      <arr name="queries">
        <lst> <str name="q">fast_warm</str> <str name="start">0</str> <str name="rows">10</str> </lst>
      </arr>
    </listener>
    -->
  </query>
  <!-- An alternate set representation that uses an integer hash to store filters (sets of docids).
       If the set cardinality <= maxSize elements, then HashDocSet will be used instead of the bitset
       based HashBitset. -->
  <!-- requestHandler plugins... incoming queries will be dispatched to the
     correct handler based on the qt (query type) param matching the
     name of registered handlers.
      The "standard" request handler is the default and will be used if qt
     is not specified in the request.
  -->
  <requestHandler name="standard" class="solr.StandardRequestHandler">
  	<bool name="httpCaching">true</bool>
  </requestHandler>
  <requestHandler name="dismaxOldStyleDefaults"
                  class="solr.DisMaxRequestHandler" >
     <!-- for historic reasons, DisMaxRequestHandler will use all of
          its init params as "defaults" if there is no "defaults" list
          specified
     -->
     <float name="tie">0.01</float>
     <str name="qf">
        text^0.5 features_t^1.0 subject^1.4 title_stemmed^2.0
     </str>
     <str name="pf">
        text^0.2 features_t^1.1 subject^1.4 title_stemmed^2.0 title^1.5
     </str>
     <str name="bf">
        ord(weight)^0.5 recip(rord(iind),1,1000,1000)^0.3
     </str>
     <str name="mm">
        3&lt;-1 5&lt;-2 6&lt;90%
     </str>
     <int name="ps">100</int>
  </requestHandler>
  <requestHandler name="dismax" class="solr.DisMaxRequestHandler" >
    <lst name="defaults">
     <str name="q.alt">*:*</str>
     <float name="tie">0.01</float>
     <str name="qf">
        text^0.5 features_t^1.0 subject^1.4 title_stemmed^2.0
     </str>
     <str name="pf">
        text^0.2 features_t^1.1 subject^1.4 title_stemmed^2.0 title^1.5
     </str>
     <str name="bf">
        ord(weight)^0.5 recip(rord(iind),1,1000,1000)^0.3
     </str>
     <str name="mm">
        3&lt;-1 5&lt;-2 6&lt;90%
     </str>
     <int name="ps">100</int>
    </lst>
  </requestHandler>
  <requestHandler name="old" class="solr.tst.OldRequestHandler" >
    <int name="myparam">1000</int>
    <float name="ratio">1.4142135</float>
    <arr name="myarr"><int>1</int><int>2</int></arr>
    <str>foo</str>
  </requestHandler>
  <requestHandler name="oldagain" class="solr.tst.OldRequestHandler" >
    <lst name="lst1"> <str name="op">sqrt</str> <int name="val">2</int> </lst>
    <lst name="lst2"> <str name="op">log</str> <float name="val">10</float> </lst>
  </requestHandler>
  <requestHandler name="test" class="solr.tst.TestRequestHandler" />
  <!-- test query parameter defaults -->
  <requestHandler name="defaults" class="solr.StandardRequestHandler">
    <lst name="defaults">
      <int name="rows">4</int>
      <bool name="hl">true</bool>
      <str name="hl.fl">text,name,subject,title,whitetok</str>
    </lst>
  </requestHandler>
  <!-- test query parameter defaults -->
  <requestHandler name="lazy" class="solr.StandardRequestHandler" startup="lazy">
    <lst name="defaults">
      <int name="rows">4</int>
      <bool name="hl">true</bool>
      <str name="hl.fl">text,name,subject,title,whitetok</str>
    </lst>
  </requestHandler>
  <requestHandler name="/update"     class="solr.XmlUpdateRequestHandler"          />
  <requestHandler name="/update/csv" class="solr.CSVRequestHandler" startup="lazy">
  	<bool name="httpCaching">false</bool>
  </requestHandler>
  <!-- test elevation -->
  <searchComponent name="elevate" class="org.apache.solr.handler.component.QueryElevationComponent" >
    <str name="queryFieldType">string</str>
    <str name="config-file">elevate.xml</str>
  </searchComponent>
  <requestHandler name="/elevate" class="org.apache.solr.handler.component.SearchHandler">
    <lst name="defaults">
      <str name="echoParams">explicit</str>
    </lst>
    <arr name="last-components">
      <str>elevate</str>
    </arr>
  </requestHandler>
  <searchComponent name="spellcheck" class="org.apache.solr.handler.component.SpellCheckComponent">
    <str name="queryAnalyzerFieldType">lowerfilt</str>
    <lst name="spellchecker">
      <str name="name">default</str>
      <str name="field">lowerfilt</str>
      <str name="spellcheckIndexDir">spellchecker1</str>
      <str name="buildOnCommit">true</str>
    </lst>
    <!-- Example of using different distance measure -->
    <lst name="spellchecker">
      <str name="name">jarowinkler</str>
      <str name="field">lowerfilt</str>
      <!-- Use a different Distance Measure -->
      <str name="distanceMeasure">org.apache.lucene.search.spell.JaroWinklerDistance</str>
      <str name="spellcheckIndexDir">spellchecker2</str>
    </lst>
    <lst name="spellchecker">
      <str name="classname">solr.FileBasedSpellChecker</str>
      <str name="name">external</str>
      <str name="sourceLocation">spellings.txt</str>
      <str name="characterEncoding">UTF-8</str>
      <str name="spellcheckIndexDir">spellchecker3</str>
    </lst>
  </searchComponent>
  <searchComponent name="termsComp" class="org.apache.solr.handler.component.TermsComponent"/>
  <requestHandler name="/terms" class="org.apache.solr.handler.component.SearchHandler">
    <arr name="components">
      <str>termsComp</str>
    </arr>
  </requestHandler>
  <!--
  The SpellingQueryConverter to convert raw (CommonParams.Q) queries into tokens.  Uses a simple regular expression
   to strip off field markup, boosts, ranges, etc. but it is not guaranteed to match an exact parse from the query parser.
   -->
  <queryConverter name="queryConverter" class="org.apache.solr.spelling.SpellingQueryConverter"/>
  <requestHandler name="spellCheckCompRH" class="org.apache.solr.handler.component.SearchHandler">
    <lst name="defaults">
      <!-- omp = Only More Popular -->
      <str name="spellcheck.onlyMorePopular">false</str>
      <!-- exr = Extended Results -->
      <str name="spellcheck.extendedResults">false</str>
      <!--  The number of suggestions to return -->
      <str name="spellcheck.count">1</str>
    </lst>
    <arr name="last-components">
      <str>spellcheck</str>
    </arr>
  </requestHandler>
  <searchComponent name="tvComponent" class="org.apache.solr.handler.component.TermVectorComponent"/>
  <requestHandler name="tvrh" class="org.apache.solr.handler.component.SearchHandler">
    <lst name="defaults">
    </lst>
    <arr name="last-components">
      <str>tvComponent</str>
    </arr>
  </requestHandler>
  <highlighting>
   <!-- Configure the standard fragmenter -->
   <fragmenter name="gap" class="org.apache.solr.highlight.GapFragmenter" default="true">
    <lst name="defaults">
     <int name="hl.fragsize">100</int>
    </lst>
   </fragmenter>
   <fragmenter name="regex" class="org.apache.solr.highlight.RegexFragmenter">
    <lst name="defaults">
     <int name="hl.fragsize">70</int>
    </lst>
   </fragmenter>
   <!-- Configure the standard formatter -->
   <formatter name="html" class="org.apache.solr.highlight.HtmlFormatter" default="true">
    <lst name="defaults">
     <str name="hl.simple.pre"><![CDATA[<em>]]></str>
     <str name="hl.simple.post"><![CDATA[</em>]]></str>
    </lst>
   </formatter>
  </highlighting>
  <!-- enable streaming for testing... -->
  <requestDispatcher handleSelect="true" >
    <requestParsers enableRemoteStreaming="true" multipartUploadLimitInKB="2048" />
    <httpCaching lastModifiedFrom="openTime" etagSeed="Solr" never304="false">
      <cacheControl>max-age=30, public</cacheControl>
    </httpCaching>
  </requestDispatcher>
  <admin>
    <defaultQuery>solr</defaultQuery>
    <gettableFiles>solrconfig.xml scheam.xml admin-extra.html</gettableFiles>
  </admin>
  <!-- test getting system property -->
  <propTest attr1="${solr.test.sys.prop1}-$${literal}"
            attr2="${non.existent.sys.prop:default-from-config}">prefix-${solr.test.sys.prop2}-suffix</propTest>
  <queryParser name="foo" class="FooQParserPlugin"/>
  <updateRequestProcessorChain name="dedupe">
    <processor class="org.apache.solr.update.processor.SignatureUpdateProcessorFactory">
      <bool name="enabled">false</bool>
      <bool name="overwriteDupes">true</bool>
      <str name="fields">v_t,t_field</str>
      <str name="signatureClass">org.apache.solr.update.processor.TextProfileSignature</str>
    </processor>
    <processor class="solr.RunUpdateProcessorFactory" />
  </updateRequestProcessorChain>
 </config>