一、不包含原有分词器 StopAnalyzer 的信息
Code 1:
public class MyStopAnalyzer extends Analyzer {
//一组数组产生分词对象
private CharArraySet stopWordsSet;//自己要屏蔽的一些单词
//构造函数
public MyStopAnalyzer(String[] stopWords) {
//将String数组转换为<span style="font-family: Arial, Helvetica, sans-serif;">CharArraySet</span>
stopWordsSet = StopFilter.makeStopSet(stopWords, true); //CharArraySet
}
@Override
protected TokenStreamComponents createComponents(String arg0) {
//创建一个分词器
LetterTokenizer letterTokenizer = new LetterTokenizer();
//创建一系列分词过滤器
LowerCaseFilter lowerCaseFilter = new LowerCaseFilter(letterTokenizer);
StopFilte