mirror of https://github.com/apache/lucene.git
LUCENE-8784: Restore the Korean part-of-speech tag for NGRAM.
The part-of-speech tag for unigrams was inadvertently changed in a previous (unreleased) commit. This change restores the original value, which is also the value set in the serialized unknown dictionary.
This commit is contained in:
parent
04d781db8b
commit
bf0d6fad42
|
@ -32,7 +32,7 @@ import java.util.List;
|
|||
import org.apache.lucene.analysis.ko.dict.CharacterDefinition;
|
||||
|
||||
public class UnknownDictionaryBuilder {
|
||||
private static final String NGRAM_DICTIONARY_ENTRY = "NGRAM,1798,3559,3677,UNKNOWN,*,*,*,*,*,*,*";
|
||||
private static final String NGRAM_DICTIONARY_ENTRY = "NGRAM,1798,3559,3677,SY,*,*,*,*,*,*,*";
|
||||
|
||||
private String encoding = "utf-8";
|
||||
|
||||
|
|
Loading…
Reference in New Issue