lucene入门简单实现

作者：袖梨 2022-06-25

面对数据库的龟速查找，我们必须另辟蹊径，这时lucene就可以大显身手了。

首先我们做一个demo，向数据库中插入10w条数据，总共778M。

接下来，我们搜索下新闻内容中包含“流行”的记录。

mmd，检索一下要78s，是谁都要砸了面前的破机子。

下面我们来看看lucene的效果怎么样。下载地址：http://incubator.apache.org/lucene.net/download.html

代码如下

复制代码

using System;
using System.Collections.Generic;
using System.Linq;
using System.Text;
using Lucene.Net.Index;
using Lucene.Net.Store;
using Lucene.Net.Analysis.Standard;
using Lucene.Net.Documents;
using System.Data;
using System.Diagnostics;
using Lucene.Net.Search;

using Lucene.Net.QueryParsers;

namespace First
{
    /// <summary>
    /// Minimal Lucene.Net demo: builds a full-text index from the News table,
    /// then runs a single term query against the Content field and prints a
    /// short preview of every hit together with the elapsed search time.
    /// </summary>
    class Program
    {
        // Location of the on-disk index. The backslash is required: "D:Sample"
        // would be resolved relative to the current directory of drive D:.
        static string path = @"D:\Sample";

        // Maximum number of characters of the Content field echoed per hit.
        const int PreviewLength = 20;

        /// <summary>
        /// Entry point: rebuilds the index, then times a search for documents
        /// whose Content field matches the query and prints each hit.
        /// </summary>
        /// <param name="args">Command-line arguments (unused).</param>
        static void Main(string[] args)
        {
            // Build the index first; indexing time is deliberately not measured.
            CreateIndex();

            var watch = Stopwatch.StartNew();

            // Open the index for searching.
            IndexSearcher search = new IndexSearcher(path);

            try
            {
                // Query parser with no default field; the field name is given
                // explicitly inside the query string below.
                QueryParser query = new QueryParser(string.Empty, new StandardAnalyzer());

                // Parse the query text and execute it.
                var hits = search.Search(query.Parse("Content:流行"));

                for (int i = 0; i < hits.Length(); i++)
                {
                    // Content is stored in the index (Field.Store.YES), so it can be read back.
                    string content = hits.Doc(i).Get("Content") ?? string.Empty;

                    // Clamp the preview length: Substring(0, 20) would throw on
                    // documents whose content is shorter than 20 characters.
                    string preview = content.Substring(0, Math.Min(PreviewLength, content.Length));

                    Console.WriteLine("当前内容:{0}", preview + "...");
                }
            }
            finally
            {
                // Release the index files even if parsing or searching fails.
                search.Close();
            }

            watch.Stop();

            Console.WriteLine("搜索耗费时间:{0}", watch.ElapsedMilliseconds);
        }

        /// <summary>
        /// Reads every row of the News table and adds it to the Lucene index
        /// stored at <see cref="path"/>, then optimizes and closes the index.
        /// </summary>
        static void CreateIndex()
        {
            // Open the index directory. NOTE(review): the `true` argument presumably
            // asks Lucene to create the directory, replacing any existing index -
            // confirm against the Lucene.Net version in use.
            var directory = FSDirectory.GetDirectory(path, true);

            // Writer that tokenizes analyzed fields with StandardAnalyzer.
            IndexWriter indexWriter = new IndexWriter(directory, new StandardAnalyzer());

            try
            {
                var reader = DbHelperSQL.ExecuteReader("select * from News");

                try
                {
                    while (reader.Read())
                    {
                        // A Document is a collection of fields, comparable to a table row.
                        Document doc = new Document();

                        // ID: stored, indexed as a single un-analyzed term.
                        doc.Add(new Field("ID", reader["ID"].ToString(), Field.Store.YES, Field.Index.NOT_ANALYZED));
                        // Title: analyzed for searching but not stored.
                        doc.Add(new Field("Title", reader["Title"].ToString(), Field.Store.NO, Field.Index.ANALYZED));
                        // Content: analyzed and stored so Main can print a preview.
                        doc.Add(new Field("Content", reader["Content"].ToString(), Field.Store.YES, Field.Index.ANALYZED));

                        indexWriter.AddDocument(doc);
                    }
                }
                finally
                {
                    // Always release the database reader, even if indexing fails.
                    reader.Close();
                }

                // Optimize the index files once all documents have been added.
                indexWriter.Optimize();
            }
            finally
            {
                // Always close the writer so it is not left open if an exception occurs.
                indexWriter.Close();
            }
        }
    }
}