mirror of https://github.com/apache/lucene.git
#23505 - Hani's patch to fix RussianAnalyzer test
git-svn-id: https://svn.apache.org/repos/asf/lucene/java/trunk@150069 13f79535-47bb-0310-9956-ffa450edef68
This commit is contained in:
parent
dc4e35c080
commit
99ffd3cf27
|
@ -56,11 +56,7 @@ package org.apache.lucene.analysis.ru;
|
||||||
|
|
||||||
import junit.framework.TestCase;
|
import junit.framework.TestCase;
|
||||||
|
|
||||||
import java.io.FileReader;
|
import java.io.*;
|
||||||
|
|
||||||
import java.io.InputStreamReader;
|
|
||||||
import java.io.FileInputStream;
|
|
||||||
import java.io.IOException;
|
|
||||||
|
|
||||||
import org.apache.lucene.analysis.TokenStream;
|
import org.apache.lucene.analysis.TokenStream;
|
||||||
import org.apache.lucene.analysis.Token;
|
import org.apache.lucene.analysis.Token;
|
||||||
|
@ -78,13 +74,13 @@ public class TestRussianAnalyzer extends TestCase
|
||||||
|
|
||||||
private InputStreamReader sampleUnicode;
|
private InputStreamReader sampleUnicode;
|
||||||
|
|
||||||
private FileReader inWordsKOI8;
|
private Reader inWordsKOI8;
|
||||||
|
|
||||||
private FileReader sampleKOI8;
|
private Reader sampleKOI8;
|
||||||
|
|
||||||
private FileReader inWords1251;
|
private Reader inWords1251;
|
||||||
|
|
||||||
private FileReader sample1251;
|
private Reader sample1251;
|
||||||
|
|
||||||
public TestRussianAnalyzer(String name)
|
public TestRussianAnalyzer(String name)
|
||||||
{
|
{
|
||||||
|
@ -155,9 +151,9 @@ public class TestRussianAnalyzer extends TestCase
|
||||||
//System.out.println(new java.util.Date());
|
//System.out.println(new java.util.Date());
|
||||||
RussianAnalyzer ra = new RussianAnalyzer(RussianCharsets.KOI8);
|
RussianAnalyzer ra = new RussianAnalyzer(RussianCharsets.KOI8);
|
||||||
// KOI8
|
// KOI8
|
||||||
inWordsKOI8 = new FileReader("src/test/org/apache/lucene/analysis/ru/testKOI8.txt");
|
inWordsKOI8 = new InputStreamReader(new FileInputStream("src/test/org/apache/lucene/analysis/ru/testKOI8.txt"), "iso-8859-1");
|
||||||
|
|
||||||
sampleKOI8 = new FileReader("src/test/org/apache/lucene/analysis/ru/resKOI8.htm");
|
sampleKOI8 = new InputStreamReader(new FileInputStream("src/test/org/apache/lucene/analysis/ru/resKOI8.htm"), "iso-8859-1");
|
||||||
|
|
||||||
TokenStream in = ra.tokenStream("all", inWordsKOI8);
|
TokenStream in = ra.tokenStream("all", inWordsKOI8);
|
||||||
RussianLetterTokenizer sample =
|
RussianLetterTokenizer sample =
|
||||||
|
@ -191,9 +187,9 @@ public class TestRussianAnalyzer extends TestCase
|
||||||
public void test1251() throws IOException
|
public void test1251() throws IOException
|
||||||
{
|
{
|
||||||
// 1251
|
// 1251
|
||||||
inWords1251 = new FileReader("src/test/org/apache/lucene/analysis/ru/test1251.txt");
|
inWords1251 = new InputStreamReader(new FileInputStream("src/test/org/apache/lucene/analysis/ru/test1251.txt"), "iso-8859-1");
|
||||||
|
|
||||||
sample1251 = new FileReader("src/test/org/apache/lucene/analysis/ru/res1251.htm");
|
sample1251 = new InputStreamReader(new FileInputStream("src/test/org/apache/lucene/analysis/ru/res1251.htm"), "iso-8859-1");
|
||||||
|
|
||||||
RussianAnalyzer ra = new RussianAnalyzer(RussianCharsets.CP1251);
|
RussianAnalyzer ra = new RussianAnalyzer(RussianCharsets.CP1251);
|
||||||
TokenStream in = ra.tokenStream("", inWords1251);
|
TokenStream in = ra.tokenStream("", inWords1251);
|
||||||
|
|
Loading…
Reference in New Issue