Lucene本身做的是模糊匹配(按分词后的词项匹配,而不是整字段精确匹配):先对字段内容分词,再基于分词结果建立倒排索引。
建立索引
建立索引时使用KeywordAnalyzer:此分词器不做切分,而是将源字段的全部内容当成一个token进行存储,因此查询时必须与整个字段内容完全匹配才能命中。
// Index-writer setup. The chosen analyzer is passed to the IndexWriter through
// IndexWriterConfig. The two commented-out analyzers below are alternatives kept
// for reference.
//Analyzer analyzer = new StandardAnalyzer();
//IKAnalyzer analyzer = new IKAnalyzer();
// KeywordAnalyzer treats the entire field value as one token, so a query only hits
// when it matches the whole field exactly.
KeywordAnalyzer analyzer = new KeywordAnalyzer();
IndexWriterConfig config = new IndexWriterConfig(analyzer);
// NOTE(review): `dir` is defined outside this excerpt — presumably a Lucene Directory; confirm.
IndexWriter indexWriter = new IndexWriter(dir, config);
搜索时用PhraseQuery(只包含一个Term,用查询串与"key"字段中作为单个token存储的整字段内容做精确匹配):
{
    // Exact-match lookup: finds documents whose "key" field equals `query` and
    // collects their stored "value" fields into `ans`.
    // Returns null from the enclosing method when nothing matches.
    //
    // `query` and `searcher` are defined outside this excerpt.

    // Alternative kept for reference: building the query through QueryParser.
    //QueryParser parser = new QueryParser("key", analyzer);
    //Query Query;
    /*
    Term term = new Term("entity", query);
    System.out.println("term:" + term);
    Query = parser.parse(query);
    System.out.println(Query);
    */

    // A phrase consisting of a single term at position 0: the query string is
    // matched as one token against the "key" field.
    PhraseQuery.Builder builder = new PhraseQuery.Builder();
    builder.add(new Term("key", query), 0);
    PhraseQuery pq = builder.build();

    // Retrieve at most the 50 top-scoring hits. (The legacy `Hits`-returning
    // search(Query) call was dropped: that API no longer exists in Lucene
    // versions that provide PhraseQuery.Builder, and its result was unused.)
    TopDocs topDocs = searcher.search(pq, 50);
    ScoreDoc[] hits = topDocs.scoreDocs;
    System.out.println(topDocs.totalHits);
    System.out.println(hits.length);

    if (hits.length == 0) {
        return null;
    }

    // Collect the stored "value" field of every matching document.
    ArrayList<String> ans = new ArrayList<>();
    for (ScoreDoc scoreDoc : hits) {
        Document document = searcher.doc(scoreDoc.doc);
        ans.add(document.get("value"));
    }
    // NOTE(review): `ans` is neither returned nor used before this block ends in
    // the visible excerpt — confirm how the caller is supposed to receive it.
}