一、创建Directory
/**
 * Opens the file-system directory that holds the index.
 *
 * @throws IllegalStateException if the index directory cannot be opened
 */
public IndexUtil() {
    try {
        directory = FSDirectory.open(new File("F:/LuceneTest/inedx02"));
    } catch (IOException e) {
        // Fail fast: continuing with a null directory would only surface
        // later as an uninformative NullPointerException.
        throw new IllegalStateException(
                "Cannot open index directory F:/LuceneTest/inedx02", e);
    }
}
二、创建IndexWriter
IndexWriter writer = null;
try {
writer = new IndexWriter(directory, new IndexWriterConfig(
Version.LUCENE_35, new StandardAnalyzer(Version.LUCENE_35)));
三、创建文档并添加索引
文档(Document)和域(Field)的概念很重要:文档相当于数据库表中的一条记录,域相当于表中的一个字段。
Document doc=null;
for (int i = 0; i < ids.length; i++) {
doc=new Document();
doc.add(new Field("id", ids[i], Field.Store.YES, Field.Index.NOT_ANALYZED));
doc.add(new Field("email", emails[i], Field.Store.YES, Field.Index.NOT_ANALYZED));
doc.add(new Field("Content", Contents[i], Field.Store.NO, Field.Index.NOT_ANALYZED_NO_NORMS));
doc.add(new Field("name", names[i], Field.Store.YES, Field.Index.NOT_ANALYZED_NO_NORMS));
writer.addDocument(doc);
四、查询索引的基本信息
使用IndexReader进行查询
IndexReader reader=IndexReader.open(directory);
try {
    // The reader exposes the document counts of the index.
    System.out.println("numDocs:"+reader.numDocs());
    System.out.println("maxDocs:"+reader.maxDoc());
} finally {
    // Always release the reader, even if reading the counts fails.
    reader.close();
}
五、删除和更新索引
1.删除-delete()
IndexWriter writer = null;
try {
writer = new IndexWriter(directory, new IndexWriterConfig(
Version.LUCENE_35, new StandardAnalyzer(Version.LUCENE_35)));
// 参数是一个选项,可以是一个Query,也可以是一个Term,Term是一个精确的查找值
// 此时删除的文档并不会被完全删除,而是存储在一个回收站中,可以恢复
writer.deleteDocuments(new Term("id", "1"));
2.恢复-unDelete()
// 使用IndexReader进行恢复
try {
// 恢复时,必须把IndexReader的只读(readOnly)状态设置为false
IndexReader reader = IndexReader.open(directory, false);
reader.undeleteAll();
reader.close();
3.强制删除-forceDelete()
IndexWriter writer = null;
try {
writer = new IndexWriter(directory, new IndexWriterConfig(
Version.LUCENE_35, new StandardAnalyzer(Version.LUCENE_35)));
writer.forceMergeDeletes();
4.优化和合并-marge()(不建议使用)
IndexWriter writer = null;
try {
writer = new IndexWriter(directory, new IndexWriterConfig(
Version.LUCENE_35, new StandardAnalyzer(Version.LUCENE_35)));
// 会将索引合并为两段,这两段中被删除的数据会被清空
// 特别注意,此处在Lucene3.5之后不建议使用,因为会消耗大量开销,Lucene会根据情况自动处理
writer.forceMerge(2);
5.更新索引-updata()
IndexWriter writer = null;
try {
writer = new IndexWriter(directory, new IndexWriterConfig(
Version.LUCENE_35, new StandardAnalyzer(Version.LUCENE_35)));
/*
*Lucene并不提供更新功能,这里的更新操作实际上是以下两个操作的合集
*先删除再添加
*/
Document doc=new Document();
doc.add(new Field("id", "11", Field.Store.YES,
Field.Index.NOT_ANALYZED_NO_NORMS));
doc.add(new Field("email", emails[0], Field.Store.YES,
Field.Index.NOT_ANALYZED));
doc.add(new Field("Content", Contents[0], Field.Store.NO,
Field.Index.NOT_ANALYZED_NO_NORMS));
doc.add(new Field("name", names[0], Field.Store.YES,
Field.Index.NOT_ANALYZED_NO_NORMS));
writer.updateDocument(new Term("id", "1"), doc);
附--java代码段
package org.itat.index;
import java.io.File;
import java.io.IOException;
import org.apache.lucene.analysis.standard.StandardAnalyzer;
import org.apache.lucene.document.Document;
import org.apache.lucene.document.Field;
import org.apache.lucene.index.CorruptIndexException;
import org.apache.lucene.index.IndexReader;
import org.apache.lucene.index.IndexWriter;
import org.apache.lucene.index.IndexWriterConfig;
import org.apache.lucene.index.Term;
import org.apache.lucene.store.Directory;
import org.apache.lucene.store.FSDirectory;
import org.apache.lucene.store.LockObtainFailedException;
import org.apache.lucene.util.Version;
/**
 * Demonstrates basic index maintenance with the Lucene 3.5 API: building an
 * index from a small in-memory data set, printing document counts, deleting,
 * undeleting, purging deletions, merging segments and updating a document.
 *
 * <p>Every operation opens its own {@link IndexWriter} or {@link IndexReader}
 * on the shared {@link Directory} and closes it before returning. I/O failures
 * inside an operation are reported with {@code printStackTrace()} and are not
 * propagated to the caller.
 */
public class IndexUtil {
    /** Location of the index on disk. */
    private static final String INDEX_PATH = "F:/LuceneTest/inedx02";

    // Sample data: element i of every array belongs to the same document.
    private final String[] ids = { "1", "2", "3", "4", "5", "6" };
    private final String[] emails = { "aa@sian.com", "bb@qq.com", "cc@yeah.net",
            "dd@gmail.com", "ee@sina.cn", "ff@hust.edu.cn" };
    private final String[] Contents = { "I'm a boy.", "I love basketball.",
            "Boston Celtics", "Kvein Garnett", "Ray Allen", "Pual Priers" };
    // private int[] attachs = { 2, 3, 4, 4, 5, 2 };
    private final String[] names = { "ZhangSan", "LiSi", "WangEr", "MaZi", "KG", "PP" };

    /** Directory shared by every reader and writer this class opens. */
    private final Directory directory;

    /**
     * Opens the file-system directory that holds the index.
     *
     * @throws IllegalStateException if the index directory cannot be opened
     */
    public IndexUtil() {
        try {
            directory = FSDirectory.open(new File(INDEX_PATH));
        } catch (IOException e) {
            // Fail fast: with a null directory every later operation would
            // only die with an uninformative NullPointerException.
            throw new IllegalStateException(
                    "Cannot open index directory " + INDEX_PATH, e);
        }
    }

    /**
     * Rebuilds the index: removes all existing documents, then adds one
     * document per entry of the sample arrays.
     */
    public void index() {
        IndexWriter writer = null;
        try {
            writer = openWriter();
            writer.deleteAll();
            for (int i = 0; i < ids.length; i++) {
                writer.addDocument(buildDocument(ids[i], i));
            }
        } catch (IOException e) {
            e.printStackTrace();
        } finally {
            closeWriter(writer);
        }
    }

    /**
     * Prints the values of {@code numDocs()}, {@code maxDoc()} and
     * {@code numDeletedDocs()} reported by a reader on the index.
     */
    public void query() {
        IndexReader reader = null;
        try {
            reader = IndexReader.open(directory);
            System.out.println("numDocs:" + reader.numDocs());
            System.out.println("maxDocs:" + reader.maxDoc());
            System.out.println("deleteDocs:" + reader.numDeletedDocs());
        } catch (IOException e) {
            e.printStackTrace();
        } finally {
            // Close in finally so the reader is released even on failure.
            closeReader(reader);
        }
    }

    /**
     * Deletes the documents whose {@code id} term is exactly {@code "1"}.
     *
     * <p>{@code deleteDocuments} accepts either a Query or a Term; a Term is
     * an exact-match value. Per the original author's note, documents deleted
     * this way are not removed completely yet and can still be restored with
     * {@link #unDelete()}.
     */
    public void delete() {
        IndexWriter writer = null;
        try {
            writer = openWriter();
            writer.deleteDocuments(new Term("id", "1"));
        } catch (IOException e) {
            e.printStackTrace();
        } finally {
            closeWriter(writer);
        }
    }

    /** Restores all deleted documents through an {@link IndexReader}. */
    public void unDelete() {
        IndexReader reader = null;
        try {
            // Restoring requires the reader to be opened with readOnly = false.
            reader = IndexReader.open(directory, false);
            reader.undeleteAll();
        } catch (IOException e) {
            e.printStackTrace();
        } finally {
            closeReader(reader);
        }
    }

    /** Calls {@code forceMergeDeletes()} on a writer to purge deleted documents. */
    public void forceDelete() {
        IndexWriter writer = null;
        try {
            writer = openWriter();
            writer.forceMergeDeletes();
        } catch (IOException e) {
            e.printStackTrace();
        } finally {
            closeWriter(writer);
        }
    }

    /**
     * Merges the index down to two segments; deleted data in those segments
     * is purged.
     *
     * <p>Per the original author's note, this is discouraged since Lucene 3.5
     * because it is expensive and Lucene merges automatically as needed.
     */
    public void marge() {
        IndexWriter writer = null;
        try {
            writer = openWriter();
            writer.forceMerge(2);
        } catch (IOException e) {
            e.printStackTrace();
        } finally {
            closeWriter(writer);
        }
    }

    /**
     * Replaces the documents whose {@code id} term is {@code "1"} with a new
     * document that has id {@code "11"} and the first sample entry's fields.
     *
     * <p>Per the original author's note, Lucene has no in-place update; an
     * update is a delete followed by an add.
     */
    public void updata() {
        IndexWriter writer = null;
        try {
            writer = openWriter();
            writer.updateDocument(new Term("id", "1"), buildDocument("11", 0));
        } catch (IOException e) {
            e.printStackTrace();
        } finally {
            closeWriter(writer);
        }
    }

    /** Opens a writer on the shared directory with the Lucene 3.5 standard analyzer. */
    private IndexWriter openWriter() throws IOException {
        return new IndexWriter(directory, new IndexWriterConfig(
                Version.LUCENE_35, new StandardAnalyzer(Version.LUCENE_35)));
    }

    /** Builds a document with the given id and the sample fields at {@code dataIndex}. */
    private Document buildDocument(String id, int dataIndex) {
        Document doc = new Document();
        doc.add(new Field("id", id, Field.Store.YES,
                Field.Index.NOT_ANALYZED_NO_NORMS));
        doc.add(new Field("email", emails[dataIndex], Field.Store.YES,
                Field.Index.NOT_ANALYZED));
        // NOTE(review): "Content" is indexed without analysis, so it is
        // indexed as a single un-tokenized term - confirm this is intended.
        doc.add(new Field("Content", Contents[dataIndex], Field.Store.NO,
                Field.Index.NOT_ANALYZED_NO_NORMS));
        doc.add(new Field("name", names[dataIndex], Field.Store.YES,
                Field.Index.NOT_ANALYZED_NO_NORMS));
        return doc;
    }

    /** Closes the writer if it was opened, reporting (not propagating) any failure. */
    private static void closeWriter(IndexWriter writer) {
        if (writer == null) {
            return;
        }
        try {
            writer.close();
        } catch (IOException e) {
            e.printStackTrace();
        }
    }

    /** Closes the reader if it was opened, reporting (not propagating) any failure. */
    private static void closeReader(IndexReader reader) {
        if (reader == null) {
            return;
        }
        try {
            reader.close();
        } catch (IOException e) {
            e.printStackTrace();
        }
    }
}
package org.itat.test;
import org.itat.index.IndexUtil;
import org.junit.Test;
/**
 * JUnit drivers for {@link IndexUtil}. Each test creates a fresh
 * {@code IndexUtil} and invokes exactly one of its operations; the tests make
 * no assertions.
 */
public class TestIndex {

    /** Runs {@code IndexUtil.index()}. */
    @Test
    public void testIndex() {
        new IndexUtil().index();
    }

    /** Runs {@code IndexUtil.query()}. */
    @Test
    public void testQuery() {
        new IndexUtil().query();
    }

    /** Runs {@code IndexUtil.delete()}. */
    @Test
    public void testDelete() {
        new IndexUtil().delete();
    }

    /** Runs {@code IndexUtil.unDelete()}. */
    @Test
    public void testunDelete() {
        new IndexUtil().unDelete();
    }

    /** Runs {@code IndexUtil.forceDelete()}. */
    @Test
    public void testforceDelete() {
        new IndexUtil().forceDelete();
    }

    /** Runs {@code IndexUtil.marge()}. */
    @Test
    public void testMarge() {
        new IndexUtil().marge();
    }

    /** Runs {@code IndexUtil.updata()}. */
    @Test
    public void testUpdata() {
        new IndexUtil().updata();
    }
}