Lucene分词器（搜索关键字解析器）

最新推荐文章于 2022-01-24 13:51:28 发布

置顶 feixiangdexin123087

最新推荐文章于 2022-01-24 13:51:28 发布

阅读量3.1k

点赞数

分类专栏： java 网站 Web前端 LuceneSearch 文章标签： lucene string exception date import

本文链接：https://blog.csdn.net/feixiangdexin123087/article/details/8001292

版权

java 同时被 3 个专栏收录

55 篇文章 0 订阅

订阅专栏

Web前端

27 篇文章 0 订阅

订阅专栏

网站

23 篇文章 0 订阅

订阅专栏

import java.io.StringReader;
import java.text.SimpleDateFormat;
import java.util.Date;

import org.apache.lucene.analysis.Analyzer;
import org.apache.lucene.analysis.KeywordAnalyzer;
import org.apache.lucene.analysis.SimpleAnalyzer;
import org.apache.lucene.analysis.StopAnalyzer;
import org.apache.lucene.analysis.TokenStream;
import org.apache.lucene.analysis.WhitespaceAnalyzer;
import org.apache.lucene.analysis.standard.StandardAnalyzer;
import org.apache.lucene.analysis.tokenattributes.TermAttribute;
import org.apache.lucene.util.Version;

/**
 * Small demo that runs the same sample strings through several Lucene
 * analyzers and prints every token each analyzer produces, so the
 * tokenization strategies can be compared side by side on the console.
 */
public class luncens {

    /**
     * Tokenizes {@code text} with {@code analyzer} and prints one token per line,
     * preceded by a header line naming the analyzer class.
     *
     * <p>The stream is consumed following the TokenStream consumer workflow
     * (reset, incrementToken loop, end, close) and is always closed, even when
     * tokenization fails part-way through.
     *
     * @param analyzer the analyzer used to build the token stream
     * @param text     the text to tokenize
     * @throws Exception if the underlying token stream fails while reading
     */
    public static void analyze(Analyzer analyzer, String text) throws Exception {
        System.out.println("分词器：" + analyzer.getClass());
        TokenStream tokenStream = analyzer.tokenStream("content", new StringReader(text));
        try {
            // addAttribute returns the attribute instance; it is updated in place on
            // every incrementToken(), so it only needs to be looked up once.
            TermAttribute termAttribute = tokenStream.addAttribute(TermAttribute.class);
            tokenStream.reset();
            while (tokenStream.incrementToken()) {
                System.out.println(termAttribute.term());
            }
            tokenStream.end();
        } finally {
            // Releases the stream and the reader it wraps.
            tokenStream.close();
        }
    }

    /**
     * Runs an English-flavoured and a Chinese-flavoured sample string through
     * each analyzer in turn, then prints the current hour of day.
     *
     * @param args unused
     * @throws Exception if any analyzer fails while tokenizing
     */
    public static void main(String[] args) throws Exception {
        String enText = "China is a great country!JC-46C(16tt)dd";
        String chText = "SICAO新潮半导体电子酒柜JC-46C（16支）";

        // Order matters only for the console output: each analyzer processes the
        // English sample first, then the Chinese one.
        // Per the original author's note, StandardAnalyzer splits the Chinese
        // sample character by character.
        Analyzer[] analyzers = {
            new SimpleAnalyzer(),
            new StopAnalyzer(Version.LUCENE_CURRENT),
            new StandardAnalyzer(Version.LUCENE_CURRENT),
            new WhitespaceAnalyzer(),
            new KeywordAnalyzer()
        };
        for (Analyzer analyzer : analyzers) {
            analyze(analyzer, enText);
            analyze(analyzer, chText);
        }

        // Current hour of day (00-23), formatted directly instead of slicing it
        // out of a full timestamp string by character offsets.
        String endtime = new SimpleDateFormat("HH").format(new Date());
        System.out.println("时间=" + endtime);
    }

}

feixiangdexin123087

关注

0
点赞
踩
1

收藏

觉得还不错? 一键收藏
0
评论
Lucene分词器（搜索关键字解析器）

import java.io.StringReader;import java.text.SimpleDateFormat;import java.util.Date;import org.apache.lucene.analysis.Analyzer;import org.apache.lucene.analysis.KeywordAnalyzer;import or
复制链接

扫一扫