mirror of https://github.com/apache/lucene.git
526 lines
22 KiB
XML
Executable File
526 lines
22 KiB
XML
Executable File
<?xml version="1.0" encoding="UTF-8" ?>
|
|
<!--
|
|
Licensed to the Apache Software Foundation (ASF) under one or more
|
|
contributor license agreements. See the NOTICE file distributed with
|
|
this work for additional information regarding copyright ownership.
|
|
The ASF licenses this file to You under the Apache License, Version 2.0
|
|
(the "License"); you may not use this file except in compliance with
|
|
the License. You may obtain a copy of the License at
|
|
|
|
http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
Unless required by applicable law or agreed to in writing, software
|
|
distributed under the License is distributed on an "AS IS" BASIS,
|
|
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
See the License for the specific language governing permissions and
|
|
limitations under the License.
|
|
-->
|
|
|
|
<config>
|
|
<!-- Set this to 'false' if you want solr to continue working after it has
|
|
encountered an severe configuration error. In a production environment,
|
|
you may want solr to keep working even if one handler is mis-configured.
|
|
|
|
You may also set this to false using by setting the system property:
|
|
-Dsolr.abortOnConfigurationError=false
|
|
-->
|
|
<abortOnConfigurationError>${solr.abortOnConfigurationError:true}</abortOnConfigurationError>
|
|
|
|
<!-- Used to specify an alternate directory to hold all index data
|
|
other than the default ./data under the Solr home.
|
|
If replication is in use, this should match the replication configuration. -->
|
|
<dataDir>${solr.data.dir:./solr/data}</dataDir>
|
|
|
|
|
|
<indexDefaults>
|
|
<!-- Values here affect all index writers and act as a default unless overridden. -->
|
|
<useCompoundFile>false</useCompoundFile>
|
|
<mergeFactor>10</mergeFactor>
|
|
<maxBufferedDocs>1000</maxBufferedDocs>
|
|
<maxMergeDocs>2147483647</maxMergeDocs>
|
|
<maxFieldLength>10000</maxFieldLength>
|
|
<writeLockTimeout>1000</writeLockTimeout>
|
|
<commitLockTimeout>10000</commitLockTimeout>
|
|
<!--
|
|
As long as Solr is the only process modifying your index, it is
|
|
safe to use Lucene's in process locking mechanism. But you may
|
|
specify one of the other Lucene LockFactory implementations in
|
|
the event that you have a custom situation.
|
|
|
|
none = NoLockFactory (typically only used with read only indexes)
|
|
single = SingleInstanceLockFactory (suggested)
|
|
native = NativeFSLockFactory
|
|
simple = SimpleFSLockFactory
|
|
|
|
('simple' is the default for backwards compatibility with Solr 1.2)
|
|
-->
|
|
<lockType>single</lockType>
|
|
</indexDefaults>
|
|
|
|
<mainIndex>
|
|
<!-- options specific to the main on-disk lucene index -->
|
|
<useCompoundFile>false</useCompoundFile>
|
|
<mergeFactor>10</mergeFactor>
|
|
<maxBufferedDocs>1000</maxBufferedDocs>
|
|
<maxMergeDocs>2147483647</maxMergeDocs>
|
|
<maxFieldLength>10000</maxFieldLength>
|
|
|
|
<!-- If true, unlock any held write or commit locks on startup.
|
|
This defeats the locking mechanism that allows multiple
|
|
processes to safely access a lucene index, and should be
|
|
used with care.
|
|
This is not needed if lock type is 'none' or 'single'
|
|
-->
|
|
<unlockOnStartup>false</unlockOnStartup>
|
|
</mainIndex>
|
|
|
|
<!-- the default high-performance update handler -->
|
|
<updateHandler class="solr.DirectUpdateHandler2">
|
|
|
|
<!-- A prefix of "solr." for class names is an alias that
|
|
causes solr to search appropriate packages, including
|
|
org.apache.solr.(search|update|request|core|analysis)
|
|
-->
|
|
|
|
<!-- autocommit pending docs if certain criteria are met
|
|
<autoCommit>
|
|
<maxDocs>10000</maxDocs>
|
|
<maxTime>1000</maxTime>
|
|
</autoCommit>
|
|
-->
|
|
|
|
<!-- The RunExecutableListener executes an external command.
|
|
exe - the name of the executable to run
|
|
dir - dir to use as the current working directory. default="."
|
|
wait - the calling thread waits until the executable returns. default="true"
|
|
args - the arguments to pass to the program. default=nothing
|
|
env - environment variables to set. default=nothing
|
|
-->
|
|
<!-- A postCommit event is fired after every commit or optimize command
|
|
<listener event="postCommit" class="solr.RunExecutableListener">
|
|
<str name="exe">snapshooter</str>
|
|
<str name="dir">solr/bin</str>
|
|
<bool name="wait">true</bool>
|
|
<arr name="args"> <str>arg1</str> <str>arg2</str> </arr>
|
|
<arr name="env"> <str>MYVAR=val1</str> </arr>
|
|
</listener>
|
|
-->
|
|
<!-- A postOptimize event is fired only after every optimize command, useful
|
|
in conjunction with index distribution to only distribute optimized indicies
|
|
<listener event="postOptimize" class="solr.RunExecutableListener">
|
|
<str name="exe">snapshooter</str>
|
|
<str name="dir">solr/bin</str>
|
|
<bool name="wait">true</bool>
|
|
</listener>
|
|
-->
|
|
|
|
</updateHandler>
|
|
|
|
|
|
<query>
|
|
<!-- Maximum number of clauses in a boolean query... can affect
|
|
range or prefix queries that expand to big boolean
|
|
queries. An exception is thrown if exceeded. -->
|
|
<maxBooleanClauses>1024</maxBooleanClauses>
|
|
|
|
|
|
<!-- Cache used by SolrIndexSearcher for filters (DocSets),
|
|
unordered sets of *all* documents that match a query.
|
|
When a new searcher is opened, its caches may be prepopulated
|
|
or "autowarmed" using data from caches in the old searcher.
|
|
autowarmCount is the number of items to prepopulate. For LRUCache,
|
|
the autowarmed items will be the most recently accessed items.
|
|
Parameters:
|
|
class - the SolrCache implementation (currently only LRUCache)
|
|
size - the maximum number of entries in the cache
|
|
initialSize - the initial capacity (number of entries) of
|
|
the cache. (seel java.util.HashMap)
|
|
autowarmCount - the number of entries to prepopulate from
|
|
and old cache.
|
|
-->
|
|
<filterCache
|
|
class="solr.LRUCache"
|
|
size="512"
|
|
initialSize="512"
|
|
autowarmCount="256"/>
|
|
|
|
<!-- queryResultCache caches results of searches - ordered lists of
|
|
document ids (DocList) based on a query, a sort, and the range
|
|
of documents requested. -->
|
|
<queryResultCache
|
|
class="solr.LRUCache"
|
|
size="512"
|
|
initialSize="512"
|
|
autowarmCount="256"/>
|
|
|
|
<!-- documentCache caches Lucene Document objects (the stored fields for each document).
|
|
Since Lucene internal document ids are transient, this cache will not be autowarmed. -->
|
|
<documentCache
|
|
class="solr.LRUCache"
|
|
size="512"
|
|
initialSize="512"
|
|
autowarmCount="0"/>
|
|
|
|
<!-- If true, stored fields that are not requested will be loaded lazily.
|
|
|
|
This can result in a significant speed improvement if the usual case is to
|
|
not load all stored fields, especially if the skipped fields are large compressed
|
|
text fields.
|
|
-->
|
|
<enableLazyFieldLoading>true</enableLazyFieldLoading>
|
|
|
|
<!-- Example of a generic cache. These caches may be accessed by name
|
|
through SolrIndexSearcher.getCache(),cacheLookup(), and cacheInsert().
|
|
The purpose is to enable easy caching of user/application level data.
|
|
The regenerator argument should be specified as an implementation
|
|
of solr.search.CacheRegenerator if autowarming is desired. -->
|
|
<!--
|
|
<cache name="myUserCache"
|
|
class="solr.LRUCache"
|
|
size="4096"
|
|
initialSize="1024"
|
|
autowarmCount="1024"
|
|
regenerator="org.mycompany.mypackage.MyRegenerator"
|
|
/>
|
|
-->
|
|
|
|
<!-- An optimization that attempts to use a filter to satisfy a search.
|
|
If the requested sort does not include score, then the filterCache
|
|
will be checked for a filter matching the query. If found, the filter
|
|
will be used as the source of document ids, and then the sort will be
|
|
applied to that.
|
|
<useFilterForSortedQuery>true</useFilterForSortedQuery>
|
|
-->
|
|
|
|
<!-- An optimization for use with the queryResultCache. When a search
|
|
is requested, a superset of the requested number of document ids
|
|
are collected. For example, if a search for a particular query
|
|
requests matching documents 10 through 19, and queryWindowSize is 50,
|
|
then documents 0 through 49 will be collected and cached. Any further
|
|
requests in that range can be satisfied via the cache. -->
|
|
<queryResultWindowSize>50</queryResultWindowSize>
|
|
|
|
<!-- Maximum number of documents to cache for any entry in the
|
|
queryResultCache. -->
|
|
<queryResultMaxDocsCached>200</queryResultMaxDocsCached>
|
|
|
|
<!-- This entry enables an int hash representation for filters (DocSets)
|
|
when the number of items in the set is less than maxSize. For smaller
|
|
sets, this representation is more memory efficient, more efficient to
|
|
iterate over, and faster to take intersections. -->
|
|
<HashDocSet maxSize="3000" loadFactor="0.75"/>
|
|
|
|
|
|
<!-- boolToFilterOptimizer converts boolean clauses with zero boost
|
|
into cached filters if the number of docs selected by the clause exceeds
|
|
the threshold (represented as a fraction of the total index) -->
|
|
<boolTofilterOptimizer enabled="true" cacheSize="32" threshold=".05"/>
|
|
|
|
|
|
<!-- a newSearcher event is fired whenever a new searcher is being prepared
|
|
and there is a current searcher handling requests (aka registered). -->
|
|
<!-- QuerySenderListener takes an array of NamedList and executes a
|
|
local query request for each NamedList in sequence. -->
|
|
<!--
|
|
<listener event="newSearcher" class="solr.QuerySenderListener">
|
|
<arr name="queries">
|
|
<lst> <str name="q">solr</str> <str name="start">0</str> <str name="rows">10</str> </lst>
|
|
<lst> <str name="q">rocks</str> <str name="start">0</str> <str name="rows">10</str> </lst>
|
|
</arr>
|
|
</listener>
|
|
-->
|
|
|
|
<!-- a firstSearcher event is fired whenever a new searcher is being
|
|
prepared but there is no current registered searcher to handle
|
|
requests or to gain autowarming data from. -->
|
|
<!--
|
|
<listener event="firstSearcher" class="solr.QuerySenderListener">
|
|
<arr name="queries">
|
|
<lst> <str name="q">fast_warm</str> <str name="start">0</str> <str name="rows">10</str> </lst>
|
|
</arr>
|
|
</listener>
|
|
-->
|
|
|
|
<!-- If a search request comes in and there is no current registered searcher,
|
|
then immediately register the still warming searcher and use it. If
|
|
"false" then all requests will block until the first searcher is done
|
|
warming. -->
|
|
<useColdSearcher>false</useColdSearcher>
|
|
|
|
<!-- Maximum number of searchers that may be warming in the background
|
|
concurrently. An error is returned if this limit is exceeded. Recommend
|
|
1-2 for read-only slaves, higher for masters w/o cache warming. -->
|
|
<maxWarmingSearchers>4</maxWarmingSearchers>
|
|
|
|
</query>
|
|
|
|
<!--
|
|
Let the dispatch filter handler /select?qt=XXX
|
|
handleSelect=true will use consistent error handling for /select and /update
|
|
handleSelect=false will use solr1.1 style error formatting
|
|
-->
|
|
<requestDispatcher handleSelect="true" >
|
|
<!--Make sure your system has some authentication before enabling remote streaming! -->
|
|
<requestParsers enableRemoteStreaming="false" multipartUploadLimitInKB="2048" />
|
|
</requestDispatcher>
|
|
|
|
|
|
<!-- requestHandler plugins... incoming queries will be dispatched to the
|
|
correct handler based on the path or the qt (query type) param.
|
|
Names starting with a '/' are accessed with the a path equal to the
|
|
registered name. Names without a leading '/' are accessed with:
|
|
http://host/app/select?qt=name
|
|
If no qt is defined, the requestHandlere that declares default="true"
|
|
will be used.
|
|
-->
|
|
<requestHandler name="standard" class="solr.StandardRequestHandler" default="true">
|
|
<!-- default values for query parameters -->
|
|
<lst name="defaults">
|
|
<str name="echoParams">explicit</str>
|
|
<!--
|
|
<int name="rows">10</int>
|
|
<str name="fl">*</str>
|
|
<str name="version">2.1</str>
|
|
-->
|
|
</lst>
|
|
</requestHandler>
|
|
|
|
<!-- DisMaxRequestHandler allows easy searching across multiple fields
|
|
for simple user-entered phrases.
|
|
see http://wiki.apache.org/solr/DisMaxRequestHandler
|
|
-->
|
|
<requestHandler name="dismax" class="solr.DisMaxRequestHandler" >
|
|
<lst name="defaults">
|
|
<str name="echoParams">explicit</str>
|
|
<float name="tie">0.01</float>
|
|
<str name="qf">
|
|
text^0.5 features^1.0 name^1.2 sku^1.5 id^10.0 manu^1.1 cat^1.4
|
|
</str>
|
|
<str name="pf">
|
|
text^0.2 features^1.1 name^1.5 manu^1.4 manu_exact^1.9
|
|
</str>
|
|
<str name="bf">
|
|
ord(poplarity)^0.5 recip(rord(price),1,1000,1000)^0.3
|
|
</str>
|
|
<str name="fl">
|
|
id,name,price,score
|
|
</str>
|
|
<str name="mm">
|
|
2<-1 5<-2 6<90%
|
|
</str>
|
|
<int name="ps">100</int>
|
|
<str name="q.alt">*:*</str>
|
|
</lst>
|
|
</requestHandler>
|
|
|
|
<!-- Note how you can register the same handler multiple times with
|
|
different names (and different init parameters)
|
|
-->
|
|
<requestHandler name="partitioned" class="solr.DisMaxRequestHandler" >
|
|
<lst name="defaults">
|
|
<str name="echoParams">explicit</str>
|
|
<str name="qf">text^0.5 features^1.0 name^1.2 sku^1.5 id^10.0</str>
|
|
<str name="mm">2<-1 5<-2 6<90%</str>
|
|
<!-- This is an example of using Date Math to specify a constantly
|
|
moving date range in a config...
|
|
-->
|
|
<str name="bq">incubationdate_dt:[* TO NOW/DAY-1MONTH]^2.2</str>
|
|
</lst>
|
|
<!-- In addition to defaults, "appends" params can be specified
|
|
to identify values which should be appended to the list of
|
|
multi-val params from the query (or the existing "defaults").
|
|
|
|
In this example, the param "fq=instock:true" will be appended to
|
|
any query time fq params the user may specify, as a mechanism for
|
|
partitioning the index, independent of any user selected filtering
|
|
that may also be desired (perhaps as a result of faceted searching).
|
|
|
|
NOTE: there is *absolutely* nothing a client can do to prevent these
|
|
"appends" values from being used, so don't use this mechanism
|
|
unless you are sure you always want it.
|
|
-->
|
|
<lst name="appends">
|
|
<str name="fq">inStock:true</str>
|
|
</lst>
|
|
<!-- "invariants" are a way of letting the Solr maintainer lock down
|
|
the options available to Solr clients. Any params values
|
|
specified here are used regardless of what values may be specified
|
|
in either the query, the "defaults", or the "appends" params.
|
|
|
|
In this example, the facet.field and facet.query params are fixed,
|
|
limiting the facets clients can use. Faceting is not turned on by
|
|
default - but if the client does specify facet=true in the request,
|
|
these are the only facets they will be able to see counts for;
|
|
regardless of what other facet.field or facet.query params they
|
|
may specify.
|
|
|
|
NOTE: there is *absolutely* nothing a client can do to prevent these
|
|
"invariants" values from being used, so don't use this mechanism
|
|
unless you are sure you always want it.
|
|
-->
|
|
<lst name="invariants">
|
|
<str name="facet.field">cat</str>
|
|
<str name="facet.field">manu_exact</str>
|
|
<str name="facet.query">price:[* TO 500]</str>
|
|
<str name="facet.query">price:[500 TO *]</str>
|
|
</lst>
|
|
</requestHandler>
|
|
|
|
<requestHandler name="instock" class="solr.DisMaxRequestHandler" >
|
|
<!-- for legacy reasons, DisMaxRequestHandler will assume all init
|
|
params are "defaults" if you don't explicitly specify any defaults.
|
|
-->
|
|
<str name="fq">
|
|
inStock:true
|
|
</str>
|
|
<str name="qf">
|
|
text^0.5 features^1.0 name^1.2 sku^1.5 id^10.0 manu^1.1 cat^1.4
|
|
</str>
|
|
<str name="mm">
|
|
2<-1 5<-2 6<90%
|
|
</str>
|
|
</requestHandler>
|
|
|
|
|
|
<!-- SpellCheckerRequestHandler takes in a word (or several words) as the
|
|
value of the "q" parameter and returns a list of alternative spelling
|
|
suggestions. If invoked with a ...&cmd=rebuild, it will rebuild the
|
|
spellchecker index.
|
|
-->
|
|
<requestHandler name="spellchecker" class="solr.SpellCheckerRequestHandler" startup="lazy">
|
|
<!-- default values for query parameters -->
|
|
<lst name="defaults">
|
|
<int name="suggestionCount">1</int>
|
|
<float name="accuracy">0.5</float>
|
|
</lst>
|
|
|
|
<!-- Main init params for handler -->
|
|
|
|
<!-- The directory where your SpellChecker Index should live. -->
|
|
<!-- May be absolute, or relative to the Solr "dataDir" directory. -->
|
|
<!-- If this option is not specified, a RAM directory will be used -->
|
|
<str name="spellcheckerIndexDir">spell</str>
|
|
|
|
<!-- the field in your schema that you want to be able to build -->
|
|
<!-- your spell index on. This should be a field that uses a very -->
|
|
<!-- simple FieldType without a lot of Analysis (ie: string) -->
|
|
<str name="termSourceField">word</str>
|
|
|
|
</requestHandler>
|
|
|
|
<requestHandler name="/mlt" class="solr.MoreLikeThisHandler">
|
|
<lst name="defaults">
|
|
<str name="mlt.fl">manu,cat</str>
|
|
<int name="mlt.mindf">1</int>
|
|
</lst>
|
|
</requestHandler>
|
|
|
|
<!-- Update request handler.
|
|
|
|
Note: Since solr1.1 requestHandlers requires a valid content type header if posted in
|
|
the body. For example, curl now requires: -H 'Content-type:text/xml; charset=utf-8'
|
|
The response format differs from solr1.1 formatting and returns a standard error code.
|
|
|
|
To enable solr1.1 behavior, remove the /update handler or change its path
|
|
|
|
"update.processor.class" is the class name for the UpdateRequestProcessor. It is initalized
|
|
only once. This can not be changed for each request.
|
|
-->
|
|
<requestHandler name="/update" class="solr.XmlUpdateRequestHandler" >
|
|
<!--
|
|
<str name="update.processor.class">org.apache.solr.handler.UpdateRequestProcessor</str>
|
|
-->
|
|
</requestHandler>
|
|
<!-- this will be removed before solr 1.3 -->
|
|
<requestHandler name="/update/xpp" class="solr.XppUpdateRequestHandler" />
|
|
|
|
<!-- CSV update handler, loaded on demand -->
|
|
<requestHandler name="/update/csv" class="solr.CSVRequestHandler" startup="lazy" />
|
|
|
|
|
|
<!-- Admin Handlers. TODO? There could be a single handler that loads them all... -->
|
|
<requestHandler name="/admin/luke" class="org.apache.solr.handler.admin.LukeRequestHandler" />
|
|
<requestHandler name="/admin/system" class="org.apache.solr.handler.admin.SystemInfoHandler" />
|
|
<requestHandler name="/admin/plugins" class="org.apache.solr.handler.admin.PluginInfoHandler" />
|
|
<requestHandler name="/admin/threads" class="org.apache.solr.handler.admin.ThreadDumpHandler" />
|
|
<requestHandler name="/admin/properties" class="org.apache.solr.handler.admin.PropertiesRequestHandler" />
|
|
|
|
<!-- Echo the request contents back to the client -->
|
|
<requestHandler name="/debug/dump" class="solr.DumpRequestHandler" >
|
|
<lst name="defaults">
|
|
<str name="echoParams">explicit</str> <!-- for all params (including the default etc) use: 'all' -->
|
|
<str name="echoHandler">true</str>
|
|
</lst>
|
|
</requestHandler>
|
|
|
|
<highlighting>
|
|
<!-- Configure the standard fragmenter -->
|
|
<!-- This could most likely be commented out in the "default" case -->
|
|
<fragmenter name="gap" class="org.apache.solr.highlight.GapFragmenter" default="true">
|
|
<lst name="defaults">
|
|
<int name="hl.fragsize">100</int>
|
|
</lst>
|
|
</fragmenter>
|
|
|
|
<!-- A regular-expression-based fragmenter (f.i., for sentence extraction) -->
|
|
<fragmenter name="regex" class="org.apache.solr.highlight.RegexFragmenter">
|
|
<lst name="defaults">
|
|
<!-- slightly smaller fragsizes work better because of slop -->
|
|
<int name="hl.fragsize">70</int>
|
|
<!-- allow 50% slop on fragment sizes -->
|
|
<float name="hl.regex.slop">0.5</float>
|
|
<!-- a basic sentence pattern -->
|
|
<str name="hl.regex.pattern">[-\w ,/\n\"']{20,200}</str>
|
|
</lst>
|
|
</fragmenter>
|
|
|
|
<!-- Configure the standard formatter -->
|
|
<formatter name="html" class="org.apache.solr.highlight.HtmlFormatter" default="true">
|
|
<lst name="defaults">
|
|
<str name="hl.simple.pre"><![CDATA[<em>]]></str>
|
|
<str name="hl.simple.post"><![CDATA[</em>]]></str>
|
|
</lst>
|
|
</formatter>
|
|
</highlighting>
|
|
|
|
|
|
<!-- queryResponseWriter plugins... query responses will be written using the
|
|
writer specified by the 'wt' request parameter matching the name of a registered
|
|
writer.
|
|
The "default" writer is the default and will be used if 'wt' is not specified
|
|
in the request. XMLResponseWriter will be used if nothing is specified here.
|
|
The json, python, and ruby writers are also available by default.
|
|
|
|
<queryResponseWriter name="xml" class="org.apache.solr.request.XMLResponseWriter" default="true"/>
|
|
<queryResponseWriter name="json" class="org.apache.solr.request.JSONResponseWriter"/>
|
|
<queryResponseWriter name="python" class="org.apache.solr.request.PythonResponseWriter"/>
|
|
<queryResponseWriter name="ruby" class="org.apache.solr.request.RubyResponseWriter"/>
|
|
|
|
<queryResponseWriter name="custom" class="com.example.MyResponseWriter"/>
|
|
-->
|
|
|
|
<!-- XSLT response writer transforms the XML output by any xslt file found
|
|
in Solr's conf/xslt directory. Changes to xslt files are checked for
|
|
every xsltCacheLifetimeSeconds.
|
|
-->
|
|
<queryResponseWriter name="xslt" class="org.apache.solr.request.XSLTResponseWriter">
|
|
<int name="xsltCacheLifetimeSeconds">5</int>
|
|
</queryResponseWriter>
|
|
|
|
<!-- config for the admin interface -->
|
|
<admin>
|
|
<defaultQuery>solr</defaultQuery>
|
|
<gettableFiles>solrconfig.xml schema.xml admin-extra.html</gettableFiles>
|
|
<!-- pingQuery should be "URLish" ...
|
|
& separated key=val pairs ... but there shouldn't be any
|
|
URL escaping of the values -->
|
|
<pingQuery>
|
|
qt=standard&q=solrpingquery
|
|
</pingQuery>
|
|
<!-- configure a healthcheck file for servers behind a loadbalancer
|
|
<healthcheck type="file">server-enabled</healthcheck>
|
|
-->
|
|
</admin>
|
|
|
|
</config>
|