/*
 * IK 中文分词  版本 8.2.0
 * IK Analyzer release 8.2.0
 *
 * Licensed to the Apache Software Foundation (ASF) under one or more
 * contributor license agreements. See the NOTICE file distributed with
 * this work for additional information regarding copyright ownership.
 * The ASF licenses this file to You under the Apache License, Version 2.0
 * (the "License"); you may not use this file except in compliance with
 * the License. You may obtain a copy of the License at
 *
 * http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 *
 * 源代码由林良益(linliangyi2005@gmail.com)提供
 * 版权声明 2012,乌龙茶工作室
 * provided by Linliangyi and copyright 2012 by Oolong studio
 *
 * 8.2.0版本 由 Magese (magese@live.cn) 更新
 * release 8.2.0 update by Magese(magese@live.cn)
 *
 */
|
|
|
|
|
package org.wltea.analyzer.lucene;
|
|
|
|
|
|
|
|
|
|
import org.apache.lucene.analysis.Analyzer;
|
|
|
|
|
import org.apache.lucene.analysis.Tokenizer;
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* IK分词器,Lucene Analyzer接口实现
|
|
|
|
|
*/
|
|
|
|
|
@SuppressWarnings("unused")
|
|
|
|
|
public final class IKAnalyzer extends Analyzer{
|
|
|
|
|
|
|
|
|
|
private boolean useSmart;
|
|
|
|
|
|
|
|
|
|
private boolean useSmart() {
|
|
|
|
|
return useSmart;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
public void setUseSmart(boolean useSmart) {
|
|
|
|
|
this.useSmart = useSmart;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* IK分词器Lucene Analyzer接口实现类
|
|
|
|
|
*
|
|
|
|
|
* 默认细粒度切分算法
|
|
|
|
|
*/
|
|
|
|
|
public IKAnalyzer(){
|
|
|
|
|
this(false);
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* IK分词器Lucene Analyzer接口实现类
|
|
|
|
|
*
|
|
|
|
|
* @param useSmart 当为true时,分词器进行智能切分
|
|
|
|
|
*/
|
|
|
|
|
public IKAnalyzer(boolean useSmart){
|
|
|
|
|
super();
|
|
|
|
|
this.useSmart = useSmart;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* 重载Analyzer接口,构造分词组件
|
|
|
|
|
*/
|
|
|
|
|
@Override
|
|
|
|
|
protected TokenStreamComponents createComponents(String fieldName) {
|
|
|
|
|
Tokenizer _IKTokenizer = new IKTokenizer(this.useSmart());
|
|
|
|
|
return new TokenStreamComponents(_IKTokenizer);
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
}
|