SOLR-3441: ElisionFilterFactory is now MultiTermAware

git-svn-id: https://svn.apache.org/repos/asf/lucene/dev/trunk@1379275 13f79535-47bb-0310-9956-ffa450edef68
This commit is contained in:
Chris M. Hostetter 2012-08-31 03:44:05 +00:00
parent 562af97e39
commit adc8db0353
4 changed files with 72 additions and 1 deletions

View File

@ -29,6 +29,9 @@ New Features
as the default Codec on IndexWriter, because it cannot write new segments.
(Mike McCandless, Robert Muir)
* SOLR-3441: ElisionFilterFactory is now MultiTermAware
(Jack Krupansky via hossman)
API Changes
* LUCENE-4299: Added Terms.hasPositions() and Terms.hasOffsets().

View File

@ -34,7 +34,7 @@ import org.apache.lucene.analysis.fr.FrenchAnalyzer;
* &lt;/fieldType&gt;</pre>
*
*/
public class ElisionFilterFactory extends TokenFilterFactory implements ResourceLoaderAware {
public class ElisionFilterFactory extends TokenFilterFactory implements ResourceLoaderAware, MultiTermAwareComponent {
private CharArraySet articles;
@ -53,5 +53,10 @@ public class ElisionFilterFactory extends TokenFilterFactory implements Resource
/**
 * Wraps the given token stream in a new {@link ElisionFilter} that uses this
 * factory's {@code articles} set.
 *
 * @param input the token stream to be filtered
 * @return a new {@link ElisionFilter} over {@code input}
 */
public ElisionFilter create(TokenStream input) {
return new ElisionFilter(input, articles);
}
/**
 * Returns this factory itself as its multi-term component; no separate or
 * reduced factory is created.
 *
 * @return this instance
 */
@Override
public AbstractAnalysisFactory getMultiTermComponent() {
return this;
}
}

View File

@ -206,6 +206,16 @@
</analyzer>
</fieldType>
<!-- French text type: standard tokenization, followed in order by elision
     removal (case-insensitive), lower-casing and light French stemming. -->
<fieldType name="text_fr" class="solr.TextField" positionIncrementGap="100">
<analyzer>
<tokenizer class="solr.StandardTokenizerFactory"/>
<!-- removes l', etc -->
<filter class="solr.ElisionFilterFactory" ignoreCase="true" />
<filter class="solr.LowerCaseFilterFactory"/>
<filter class="solr.FrenchLightStemFilterFactory"/>
</analyzer>
</fieldType>
<fieldType name="int" class="solr.TrieIntField" precisionStep="4" omitNorms="true" positionIncrementGap="0"/>
<fieldType name="float" class="solr.TrieFloatField" precisionStep="4" omitNorms="true" positionIncrementGap="0"/>
@ -250,6 +260,7 @@
<dynamicField name="*_folding" type="text_folding" indexed="true" stored="true"/>
<dynamicField name="*_stemming" type="text_stemming" indexed="true" stored="true"/>
<dynamicField name="*_keyword" type="text_keyword" indexed="true" stored="true"/>
<dynamicField name="*_fr" type="text_fr" indexed="true" stored="true"/>
</fields>

View File

@ -0,0 +1,52 @@
package org.apache.solr.search;
import org.apache.solr.SolrTestCaseJ4;
import org.junit.BeforeClass;
import org.junit.Test;
/**
* Licensed to the Apache Software Foundation (ASF) under one or more
* contributor license agreements. See the NOTICE file distributed with
* this work for additional information regarding copyright ownership.
* The ASF licenses this file to You under the Apache License, Version 2.0
* (the "License"); you may not use this file except in compliance with
* the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
/**
 * Checks that plain term queries and prefix queries on the {@code text_fr}
 * field return the same number of hits regardless of whether the query text
 * carries a leading {@code l'} or an upper-case first letter.
 */
public class TestElisionMultitermQuery extends SolrTestCaseJ4 {

  /** XPath expectation shared by every query: the result reports exactly two hits. */
  private static final String TWO_HITS = "//result[@numFound='2']";

  /** Name of the Solr core used by this test. */
  public String getCoreName() {
    return "basic";
  }

  /**
   * Starts the core and indexes three documents into {@code text_fr}, two of
   * which contain "Auberge" (one of them with an elided article), then commits.
   */
  @BeforeClass
  public static void beforeTests() throws Exception {
    initCore("solrconfig-basic.xml", "schema-folding.xml");

    // Each row is { id, text_fr value }, indexed in this order.
    final String[][] docs = {
      {"1", "l'Auberge"},
      {"2", "Auberge"},
      {"3", "other"},
    };
    for (String[] doc : docs) {
      assertU(adoc("id", doc[0], "text_fr", doc[1]));
    }
    assertU(commit());
  }

  /**
   * Runs term queries first, then prefix queries, each with and without the
   * elided article and in both cases; every one must report two hits.
   */
  @Test
  public void testElisionMultitermQuery() {
    final String[] queries = {
      // single-term queries
      "text_fr:auberge",
      "text_fr:Auberge",
      "text_fr:l'auberge",
      "text_fr:l'Auberge",
      // prefix (multi-term) queries
      "text_fr:aub*",
      "text_fr:Aub*",
      "text_fr:l'aub*",
      "text_fr:l'Aub*",
    };
    for (String query : queries) {
      assertQ(req("q", query), TWO_HITS);
    }
  }
}