mirror of https://github.com/apache/lucene.git
Convert to UTF-8
git-svn-id: https://svn.apache.org/repos/asf/lucene/java/trunk@151002 13f79535-47bb-0310-9956-ffa450edef68
This commit is contained in:
parent
22a19287ea
commit
1b5eb6c40c
|
@ -66,7 +66,7 @@ import org.apache.lucene.analysis.TokenStream;
|
|||
/**
|
||||
* Test case for FrenchAnalyzer.
|
||||
*
|
||||
* @author Jean-François Halleux
|
||||
* @author Jean-François Halleux
|
||||
* @version $version$
|
||||
*/
|
||||
|
||||
|
@ -140,25 +140,25 @@ public class TestFrenchAnalyzer extends TestCase {
|
|||
sign is often used for composing words */
|
||||
assertAnalyzesTo(
|
||||
fa,
|
||||
"Jean-François",
|
||||
new String[] { "jean", "françois" });
|
||||
"Jean-François",
|
||||
new String[] { "jean", "françois" });
|
||||
|
||||
// 2. stopwords
|
||||
assertAnalyzesTo(
|
||||
fa,
|
||||
"le la chien les aux chat du des à cheval",
|
||||
"le la chien les aux chat du des à cheval",
|
||||
new String[] { "chien", "chat", "cheval" });
|
||||
|
||||
// some nouns and adjectives
|
||||
assertAnalyzesTo(
|
||||
fa,
|
||||
"lances chismes habitable chiste éléments captifs",
|
||||
"lances chismes habitable chiste éléments captifs",
|
||||
new String[] {
|
||||
"lanc",
|
||||
"chism",
|
||||
"habit",
|
||||
"chist",
|
||||
"élément",
|
||||
"élément",
|
||||
"captif" });
|
||||
|
||||
// some verbs
|
||||
|
@ -171,12 +171,12 @@ public class TestFrenchAnalyzer extends TestCase {
|
|||
// aujourd'hui stays one term which is OK
|
||||
assertAnalyzesTo(
|
||||
fa,
|
||||
"C3PO aujourd'hui oeuf ïâöûàä anticonstitutionnellement Java++ ",
|
||||
"C3PO aujourd'hui oeuf ïâöûàä anticonstitutionnellement Java++ ",
|
||||
new String[] {
|
||||
"c3po",
|
||||
"aujourd'hui",
|
||||
"oeuf",
|
||||
"ïâöûàä",
|
||||
"ïâöûàä",
|
||||
"anticonstitutionnel",
|
||||
"jav" });
|
||||
|
||||
|
|
Loading…
Reference in New Issue