先取出文件夹下的所有File,然后给这些File创建索引,最后根据条件查询
1.pom.xml:
xsi:schemaLocation="http://maven.apache.org/POM/4.0.0 http://maven.apache.org/xsd/maven-4.0.0.xsd">
4.0.0
hui
Lucene
0.0.1-SNAPSHOT
jar
Lucene
http://maven.apache.org
UTF-8
junit
junit
4.12
org.apache.lucene
lucene-core
6.0.0
org.apache.lucene
lucene-analyzers-common
6.0.0
org.apache.lucene
lucene-queryparser
6.0.0
org.apache.lucene
lucene-highlighter
6.0.0
2.递归取出文件夹下的所有文件ListFiles.java:
package luceneTest;
import java.io.File;
import java.util.ArrayList;
import java.util.List;
public class ListFiles {
private static List filesResult = new ArrayList<>();
public static void main(String[] args) {
List files = listFiles("e:/eclipse/OOP");
System.out.println(files.size());
for (File f : files) {
System.out.println(f.getName());
}
}
public static List listFiles(String srcPath) {
File file = new File(srcPath);
File[] files = file.listFiles();
for (File f : files) {
if (f.isDirectory()) {
listFiles(f.getAbsolutePath());
} else {
filesResult.add(f);
}
}
return filesResult;
}
}
3.根据自己的条件创建索引+查询:FilesTest.java:
package luceneTest;
import java.io.File;
import java.io.FileReader;
import java.io.IOException;
import java.nio.file.Paths;
import java.util.List;
import org.apache.lucene.analysis.Analyzer;
import org.apache.lucene.analysis.standard.StandardAnalyzer;
import org.apache.lucene.document.Document;
import org.apache.lucene.document.Field;
import org.apache.lucene.document.TextField;
import org.apache.lucene.index.DirectoryReader;
import org.apache.lucene.index.IndexWriter;
import org.apache.lucene.index.IndexWriterConfig;
import org.apache.lucene.queryparser.classic.ParseException;
import org.apache.lucene.queryparser.classic.QueryParser;
import org.apache.lucene.search.IndexSearcher;
import org.apache.lucene.search.Query;
import org.apache.lucene.search.ScoreDoc;
import org.apache.lucene.store.Directory;
import org.apache.lucene.store.FSDirectory;
public class FilesTest {
public static void main(String[] args) throws ParseException, IOException {
String srcPath = "E:/eclipse/OOP";
String destPath = "e:/test/index";
// createIndexTo(srcPath, destPath);
read(destPath, "fileContent", "string");
}
public static void read(String indexPath, String fieldName, String parseString)
throws IOException, ParseException {
Analyzer analyzer = new StandardAnalyzer();
Directory directory = FSDirectory.open(Paths.get(indexPath));
// Now search the index:
DirectoryReader reader = DirectoryReader.open(directory);
IndexSearcher searcher = new IndexSearcher(reader);
process(searcher, analyzer, fieldName, parseString);
reader.close();
directory.close();
}
private static void process(IndexSearcher searcher, Analyzer analyzer,
String fieldName, String parseString) throws ParseException, IOException {
QueryParser parser = new QueryParser(fieldName, analyzer);
Query query = parser.parse(parseString);
ScoreDoc[] hits = searcher.search(query, 1000).scoreDocs;
System.out.println(hits.length);
for (int i = 0; i
Document hitDoc = searcher.doc(hits[i].doc);
System.out.println(hitDoc.get("filePath"));
}
}
public static void createIndexTo(String srcPath, String destPath) throws IOException {
Analyzer analyzer = new StandardAnalyzer();
Directory directory = FSDirectory.open(Paths.get(destPath));
IndexWriterConfig config = new IndexWriterConfig(analyzer);
IndexWriter writer = new IndexWriter(directory, config);
List files = ListFiles.listFiles(srcPath);
FileReader fileReader = null;
for (File temp : files) {
if (temp.isFile()) {
fileReader = new FileReader(temp);
Document doc = new Document();
doc.add(new Field("fileName", temp.getName(), TextField.TYPE_STORED));
doc.add(new Field("fileContent", fileReader, TextField.TYPE_NOT_STORED));
doc.add(new Field("filePath", temp.getAbsolutePath(),
TextField.TYPE_STORED));
System.out.println(temp.getAbsolutePath() + " indexed");
writer.addDocument(doc);
}
}
writer.close();
}
}