Lucene.Net v2.9.x + 盘古分词版

using System;
using System.Collections.Generic;
using System.Linq;
using System.Text;
using System.IO;


using Lucene.Net;
using Lucene.Net.Analysis;
using Lucene.Net.Analysis.Standard;
using Lucene.Net.Index;
using Lucene.Net.Store;
using Lucene.Net.Documents;
using Lucene.Net.Search;
using Lucene.Net.QueryParsers;


// Demo 1: index a text file line by line with StandardAnalyzer, then run a
// parsed query against the "content" field and print the stored text of the hits.
StandardAnalyzer standardAnalyzer = new StandardAnalyzer(Lucene.Net.Util.Version.LUCENE_29);

FSDirectory fsDirectory = FSDirectory.Open(new DirectoryInfo(@"d:\search\"), new NoLockFactory());

// The third argument (true) asks IndexWriter to create the index rather than append to one.
IndexWriter indexWriter = new IndexWriter(fsDirectory, standardAnalyzer, true, IndexWriter.MaxFieldLength.LIMITED);
try
{
    FileInfo fileInfo = new FileInfo(@"d:\search\射雕英雄传.txt");

    using (StreamReader streamReader = new StreamReader(fileInfo.FullName, Encoding.Default))
    {
        string content;
        while ((content = streamReader.ReadLine()) != null)
        {
            // Blank lines carry nothing to index; skip them.
            if (content.Length == 0)
            {
                continue;
            }

            // One document per non-empty line; the text is both stored and analyzed.
            Document document = new Document();
            document.Add(new Field("content", content, Field.Store.YES, Field.Index.ANALYZED));
            indexWriter.AddDocument(document);
        }
    }

    indexWriter.Optimize();
}
finally
{
    // Close the writer even when reading or indexing fails, so it is not left open.
    indexWriter.Close();
}

IndexSearcher indexSearcher = new IndexSearcher(fsDirectory, true);
try
{
    Query query = new QueryParser(Lucene.Net.Util.Version.LUCENE_29, "content", standardAnalyzer).Parse("欧阳锋");
    TopDocs topDocs = indexSearcher.Search(query, 10);

    // ScoreDocs holds only the hits actually returned (at most 10 here), so
    // iterate over the array itself instead of assuming a fixed count of 10;
    // indexing past its length would throw IndexOutOfRangeException.
    foreach (ScoreDoc scoreDoc in topDocs.ScoreDocs)
    {
        Document hit = indexSearcher.Doc(scoreDoc.doc);
        Console.WriteLine(hit.GetField("content").StringValue());
    }
}
finally
{
    indexSearcher.Close();
}


以下为使用盘古分词(PanGu)的版本:


// Demo 2: same indexing flow as the StandardAnalyzer version, but using the
// PanGu analyzer, followed by a timed TermQuery on the "content" field.
Segment.Init();
PanGuAnalyzer analyzer = new PanGuAnalyzer();
// To compare against the stock analyzer, use instead:
//   StandardAnalyzer analyzer = new StandardAnalyzer(Lucene.Net.Util.Version.LUCENE_29);
FSDirectory fsDirectory = FSDirectory.Open(new DirectoryInfo(@"d:\search\"), new NoLockFactory());

// The third argument (true) asks IndexWriter to create the index rather than append to one.
IndexWriter indexWriter = new IndexWriter(fsDirectory, analyzer, true, IndexWriter.MaxFieldLength.LIMITED);
try
{
    FileInfo fileInfo = new FileInfo(@"d:\search\射雕英雄传.txt");

    using (StreamReader streamReader = new StreamReader(fileInfo.FullName, Encoding.Default))
    {
        string content;
        while ((content = streamReader.ReadLine()) != null)
        {
            // Blank lines carry nothing to index; skip them.
            if (content.Length == 0)
            {
                continue;
            }

            // One document per non-empty line; the text is both stored and analyzed.
            Document document = new Document();
            document.Add(new Field("content", content, Field.Store.YES, Field.Index.ANALYZED));
            indexWriter.AddDocument(document);
        }
    }

    indexWriter.Optimize();
}
finally
{
    // Close the writer even when reading or indexing fails, so it is not left open.
    indexWriter.Close();
}

IndexSearcher indexSearcher = new IndexSearcher(fsDirectory, true);
try
{
    // Fully qualified because the file's using directives do not import System.Diagnostics.
    System.Diagnostics.Stopwatch stopwatch = System.Diagnostics.Stopwatch.StartNew();

    // A TermQuery is not run through the analyzer: it matches only if the index
    // contains exactly this term (presumably PanGu emits the name as one token — verify).
    Term t = new Term("content", "欧阳锋");
    Query query = new TermQuery(t);
    TopDocs topDocs = indexSearcher.Search(query, 100);

    stopwatch.Stop();
    Console.WriteLine(stopwatch.Elapsed.ToString());
}
finally
{
    indexSearcher.Close();
}

  • 0
    点赞
  • 0
    收藏
    觉得还不错? 一键收藏
  • 0
    评论

“相关推荐”对你有帮助么?

  • 非常没帮助
  • 没帮助
  • 一般
  • 有帮助
  • 非常有帮助
提交
评论
添加红包

请填写红包祝福语或标题

红包个数最小为10个

红包金额最低5元

当前余额3.43前往充值 >
需支付:10.00
成就一亿技术人!
领取后你会自动成为博主和红包主的粉丝 规则
hope_wisdom
发出的红包
实付
使用余额支付
点击重新获取
扫码支付
钱包余额 0

抵扣说明:

1.余额是钱包充值的虚拟货币,按照1:1的比例进行支付金额的抵扣。
2.余额无法直接购买下载,可以购买VIP、付费专栏及课程。

余额充值