java代码查询索引文件实例,Lucene6.0 查询File实例

weixin_36365795

于 2021-03-15 01:23:27 发布

阅读量90

点赞数

文章标签： java代码查询索引文件实例

先取出文件夹下的所有File，然后给这些File创建索引，最后根据条件查询

1.pom.xml:

xsi:schemaLocation="http://maven.apache.org/POM/4.0.0 http://maven.apache.org/xsd/maven-4.0.0.xsd">

4.0.0

hui

Lucene

0.0.1-SNAPSHOT

jar

Lucene

http://maven.apache.org

UTF-8

junit

4.12

org.apache.lucene

lucene-core

6.0.0

org.apache.lucene

lucene-analyzers-common

6.0.0

org.apache.lucene

lucene-queryparser

6.0.0

org.apache.lucene

lucene-highlighter

6.0.0

2.递归取出文件夹下的所有文件ListFiles.java:

package luceneTest;

import java.io.File;

import java.util.ArrayList;

import java.util.List;

public class ListFiles {

private static List filesResult = new ArrayList<>();

public static void main(String[] args) {

List files = listFiles("e:/eclipse/OOP");

System.out.println(files.size());

for (File f : files) {

System.out.println(f.getName());

}

public static List listFiles(String srcPath) {

File file = new File(srcPath);

File[] files = file.listFiles();

for (File f : files) {

if (f.isDirectory()) {

listFiles(f.getAbsolutePath());

} else {

filesResult.add(f);

}

return filesResult;

}

3.根据自己的条件创建索引+查询：FilesTest.java:

package luceneTest;

import java.io.File;

import java.io.FileReader;

import java.io.IOException;

import java.nio.file.Paths;

import java.util.List;

import org.apache.lucene.analysis.Analyzer;

import org.apache.lucene.analysis.standard.StandardAnalyzer;

import org.apache.lucene.document.Document;

import org.apache.lucene.document.Field;

import org.apache.lucene.document.TextField;

import org.apache.lucene.index.DirectoryReader;

import org.apache.lucene.index.IndexWriter;

import org.apache.lucene.index.IndexWriterConfig;

import org.apache.lucene.queryparser.classic.ParseException;

import org.apache.lucene.queryparser.classic.QueryParser;

import org.apache.lucene.search.IndexSearcher;

import org.apache.lucene.search.Query;

import org.apache.lucene.search.ScoreDoc;

import org.apache.lucene.store.Directory;

import org.apache.lucene.store.FSDirectory;

public class FilesTest {

public static void main(String[] args) throws ParseException, IOException {

String srcPath = "E:/eclipse/OOP";

String destPath = "e:/test/index";

// createIndexTo(srcPath, destPath);

read(destPath, "fileContent", "string");

}

public static void read(String indexPath, String fieldName, String parseString)

throws IOException, ParseException {

Analyzer analyzer = new StandardAnalyzer();

Directory directory = FSDirectory.open(Paths.get(indexPath));

// Now search the index:

DirectoryReader reader = DirectoryReader.open(directory);

IndexSearcher searcher = new IndexSearcher(reader);

process(searcher, analyzer, fieldName, parseString);

reader.close();

directory.close();

}

private static void process(IndexSearcher searcher, Analyzer analyzer,

String fieldName, String parseString) throws ParseException, IOException {

QueryParser parser = new QueryParser(fieldName, analyzer);

Query query = parser.parse(parseString);

ScoreDoc[] hits = searcher.search(query, 1000).scoreDocs;

System.out.println(hits.length);

for (int i = 0; i

Document hitDoc = searcher.doc(hits[i].doc);

System.out.println(hitDoc.get("filePath"));

}

public static void createIndexTo(String srcPath, String destPath) throws IOException {

Analyzer analyzer = new StandardAnalyzer();

Directory directory = FSDirectory.open(Paths.get(destPath));

IndexWriterConfig config = new IndexWriterConfig(analyzer);

IndexWriter writer = new IndexWriter(directory, config);

List files = ListFiles.listFiles(srcPath);

FileReader fileReader = null;

for (File temp : files) {

if (temp.isFile()) {

fileReader = new FileReader(temp);

Document doc = new Document();

doc.add(new Field("fileName", temp.getName(), TextField.TYPE_STORED));

doc.add(new Field("fileContent", fileReader, TextField.TYPE_NOT_STORED));

doc.add(new Field("filePath", temp.getAbsolutePath(),

TextField.TYPE_STORED));

System.out.println(temp.getAbsolutePath() + " indexed");

writer.addDocument(doc);

}

writer.close();

}

weixin_36365795

关注

0
点赞
踩
0

收藏

觉得还不错? 一键收藏
0
评论
复制链接

分享到 QQ

分享到新浪微博

扫一扫