/**
* Demo for simple use of lucene
*/
package Test;
import java.io.File;
import java.io.FileReader;
import java.io.Reader;
import java.util.Date;
import org.apache.lucene.analysis.Analyzer;
import org.apache.lucene.analysis.standard.StandardAnalyzer;
import org.apache.lucene.document.Document;
import org.apache.lucene.document.Field;
import org.apache.lucene.index.IndexWriter;
import org.apache.lucene.search.*;
import org.apache.lucene.queryParser.QueryParser;
/**
* @author sxch
*
*/
public class LuceneTest {
/**
* @param args
*/
public static void main(String[] args)throws Exception {
// TODO Auto-generated method stub
//被索引文件所在目录
File fileDir = new File("F:\\Works\\JWork\\LuceneTest\\soucefile");
//索引文件存放目录
File indexDir = new File("indexfile");
Analyzer luceneAnalyzer = new StandardAnalyzer();
IndexWriter indexWriter = new IndexWriter(indexDir,luceneAnalyzer,true);
File[] textFiles = fileDir.listFiles();
long startTime = new Date().getTime();
for(int i =0 ; i < textFiles.length; i++)
{
if(textFiles[i].isFile() && textFiles[i].getName().endsWith(".txt"))
{
System.out.println("File "+ textFiles[i].getCanonicalPath() + " is being indexed !");
Reader textReader = new FileReader(textFiles[i]);
//新建一个文档
Document document = new Document();
//文档中放入内容字段
document.add(new Field("content",textReader));;
//文档中放入路径字段
document.add(new Field("path",textFiles[i].getPath(),Field.Store.YES,Field.Index.TOKENIZED));
//添加索引
indexWriter.addDocument(document);
}
}
//优化索引
indexWriter.optimize();
indexWriter.close();
//索引完成,查询
//Query query = new TermQuery(new Term("content","world"));
IndexSearcher searcher = new IndexSearcher("indexfile");
Hits hits = null;
Query query = null;
//查询解析器,建立在content字段
QueryParser qp = new QueryParser("content",new StandardAnalyzer());
//在content字段查询关键字hello
query =qp.parse("hello");
//查询
hits = searcher.search(query);
//输出查询结果综述
System.out.println(hits.length());
//输出查询结果的路径及文件名
for (int i = 0; i < hits.length(); i++) {
System.out.println(hits.doc(i).getField("path"));
}
}
}
lucene 使用示例
最新推荐文章于 2024-08-29 06:57:42 发布