/**
 * @author YangXin
 * @info A Lucene Analyzer that wraps StandardTokenizer:
 * MyAnalyzer with a lowercase filter.
 */
package unitTen;
import java.io.Reader;
import org.apache.lucene.analysis.Analyzer;
import org.apache.lucene.analysis.LengthFilter;
import org.apache.lucene.analysis.LowerCaseFilter;
import org.apache.lucene.analysis.PorterStemFilter;
import org.apache.lucene.analysis.StopFilter;
import org.apache.lucene.analysis.TokenStream;
import org.apache.lucene.analysis.standard.StandardAnalyzer;
import org.apache.lucene.analysis.standard.StandardTokenizer;
import org.apache.lucene.util.Version;
public class MyAnalyzer extends Analyzer {
@SuppressWarnings("deprecation")
@Override
一个封装了StandardTokenizer的自定义Lucene Analyzer
最新推荐文章于 2024-05-30 10:19:23 发布
本文介绍了一个由YangXin编写的自定义Lucene Analyzer,名为MyAnalyzer。这个Analyzer封装了StandardTokenizer,并结合了LowerCaseFilter、LengthFilter、StopFilter和PorterStemFilter,用于对输入文本进行标准化处理,包括转换为小写、长度限制、停用词过滤和词干提取等操作。
摘要由CSDN通过智能技术生成