Spring-Boot使用IK分词器

1.Maven依赖

1.1Spring-Boot版本

<parent>
        <groupId>org.springframework.boot</groupId>
        <artifactId>spring-boot-starter-parent</artifactId>
        <version>3.3.1</version>
        <relativePath/>
    </parent>

1.2Lucene版本

 <dependency>
            <groupId>org.apache.lucene</groupId>
            <artifactId>lucene-core</artifactId>
            <version>8.11.1</version>
 </dependency>
 <dependency>
            <groupId>org.apache.lucene</groupId>
            <artifactId>lucene-analyzers-common</artifactId>
            <version>8.11.1</version>
 </dependency>

1.3 ik-analyzer

<dependency>
            <groupId>com.github.magese</groupId>
            <artifactId>ik-analyzer</artifactId>
            <version>8.5.0</version>
        </dependency>
</dependencies>

2. 启动器

import org.apache.lucene.analysis.Analyzer;
import org.springframework.boot.SpringApplication;
import org.springframework.boot.autoconfigure.SpringBootApplication;
import org.springframework.context.annotation.Bean;
import org.wltea.analyzer.lucene.IKAnalyzer;


@SpringBootApplication
public class ikApplication {

    public static void main(String[] args) {
        SpringApplication.run(ikApplication.class, args);
    }

    @Bean
    public Analyzer ikAnalyzer() {
        return new IKAnalyzer();
    }
}

3.项目结构

项目结构配置文件说明icon-default.png?t=N7T8https://github.com/magese/ik-analyzer-solr/tree/master?tab=readme-ov-file

4.测试类


import org.apache.lucene.analysis.Analyzer;
import org.apache.lucene.document.Document;
import org.apache.lucene.document.Field;
import org.apache.lucene.document.StringField;
import org.apache.lucene.document.TextField;
import org.apache.lucene.index.DirectoryReader;
import org.apache.lucene.index.IndexReader;
import org.apache.lucene.index.IndexWriterConfig;
import org.apache.lucene.index.Term;
import org.apache.lucene.search.IndexSearcher;
import org.apache.lucene.search.Query;
import org.apache.lucene.search.TermQuery;
import org.apache.lucene.search.TopDocs;
import org.apache.lucene.store.Directory;
import org.apache.lucene.store.FSDirectory;
import org.junit.jupiter.api.Test;
import org.springframework.beans.factory.annotation.Autowired;
import org.springframework.boot.test.context.SpringBootTest;
import org.wltea.analyzer.lucene.IKAnalyzer;

import java.io.File;
import java.io.IOException;
import java.util.List;

@SpringBootTest
class IKApplicationTests {

    @Autowired
    JobInfoService jobInfoService;

    //注入ik分词器
    @Autowired
    Analyzer ikAnalyzer;

    //创建索引
    @Test
    void contextLoads() throws IOException {
        // 1.指定索引文件的存储位置
        Directory directory = FSDirectory.open(new File("E:/class/index").toPath());
        // 2.配置(IK)分词器
        Analyzer analyzer = new IKAnalyzer();
        
        IndexWriterConfig config = new IndexWriterConfig(analyzer);
        // 3.创建IndexWrite对象,作用是创建索引
        org.apache.lucene.index.IndexWriter indexWriter = new org.apache.lucene.index.IndexWriter(directory, config);
        // 删除已经存在的索引库
        indexWriter.deleteAll();
        // 4.获得索引源/原始数据(需要自己写查询数据库)
        List<JobInfo> jobInfos = jobInfoService.selectAllJobInfo();
        // 5.遍历,创建Document对象
        for (JobInfo jobInfo : jobInfos) {
            // 每次循环都创建一个新的Document对象
            Document document = new Document();
            // 创建Field对象并添加到Document
            document.add(new StringField("id", jobInfo.getId().toString(), Field.Store.YES));
            document.add(new TextField("companyName", jobInfo.getCompanyName(), Field.Store.YES));
            document.add(new org.apache.lucene.document.IntPoint("salaryMin", jobInfo.getSalaryMin()));
            document.add(new org.apache.lucene.document.StoredField("salaryMinStored", jobInfo.getSalaryMin()));
 jobInfo.getSalaryMax()));
            document.add(new StringField("url", jobInfo.getUrl(), Field.Store.YES));
            indexWriter.addDocument(document);
        }
        // 关闭资源
        indexWriter.close();
    }
    //测试查询结果
    @Test
    public void query() throws IOException {
        //1.指定索引文件的存储位置
        Directory directory=FSDirectory.open(new File("E:/class/index").toPath());

        //2.IndexReader对象
        IndexReader indexReader= DirectoryReader.open(directory);
        //3.创建查询对象
        IndexSearcher indexSearcher=new IndexSearcher(indexReader);
        //4.使用term
        Query query=new TermQuery(new Term("companyName","有限公司"));
        TopDocs topDocs = indexSearcher.search(query, 100);
        //5.获取符合查询的文档数
        org.apache.lucene.search.TotalHits totalHits = topDocs.totalHits;
        System.out.println(totalHits);
        org.apache.lucene.search.ScoreDoc[] scoreDocs = topDocs.scoreDocs;
        for (org.apache.lucene.search.ScoreDoc scoreDoc:scoreDocs){
            int id = scoreDoc.doc;
            Document doc = indexSearcher.doc(id);
            System.out.println("id:"+doc.get("id"));
            System.out.println("companyName"+doc.get("companyName"));
            System.out.println("========================================");
        }
        indexReader.close();
    }

}

  • 7
    点赞
  • 7
    收藏
    觉得还不错? 一键收藏
  • 1
    评论
评论 1
添加红包

请填写红包祝福语或标题

红包个数最小为10个

红包金额最低5元

当前余额3.43前往充值 >
需支付:10.00
成就一亿技术人!
领取后你会自动成为博主和红包主的粉丝 规则
hope_wisdom
发出的红包
实付
使用余额支付
点击重新获取
扫码支付
钱包余额 0

抵扣说明:

1.余额是钱包充值的虚拟货币,按照1:1的比例进行支付金额的抵扣。
2.余额无法直接购买下载,可以购买VIP、付费专栏及课程。

余额充值