最近研究了一下使用.netcore的Lucene.Net应用,整理一下研究内容。

一、研究原因

1、系统环境:多终端、多服务、达梦数据库8、.netcore7.0、多机负载。

2、业务数量:单表约1000万条数据,共有7张业务表或功能表达到千万级数据量。

3、问题描述:业务表的字段较多,后台管理系统上,对数据查询的准确度与速度有要求,查询的组合字段较多,数据表上创建的索引无法完全覆盖所有的组合情况。


 

二、预期目标

1、有效提高查询速度。

2、持久化数据库与索引库保持一致。

3、减少对当前系统结构的影响,尽量降低改造的工作量。

4、可以进行索引库的数据量、待入索引库的数据、索引库查询速度等监控。


 

三、应用结构

1、同一索引库同一时刻只能有一个写入者(IndexWriter),但可以多线程并发查询。因此在系统外新增独立的索引写入服务,把多业务的并发写入汇总为串行处理;根据业务表的类型,可以创建多个线程分别写入不同的索引库,同一索引库只由一个服务写入。

2、数据库增加触发器,当业务表发生增、删、改时,自动将业务表记录的ID及操作类型写入队列表。使用触发器可以避免在多终端、多服务中分别处理数据同步,保证业务表和索引库的数据一致。


 

四、实验结果

1、使用“存储、不分词”的索引方式导入1000万条数据后,实测多条件组合查询耗时在1秒以内。

2、业务表数据和索引库的数据可以保持一致。


 

五、代码样例

1、添加NuGet

1、达梦数据库 FreeSql.Provider.Dameng 3.5.213
2、索引 Lucene.Net 3.0.3
3、配置 System.Configuration.ConfigurationManager 9.0.9

2、写入索引库

using Lucene.Net.Analysis;
using Lucene.Net.Analysis.Standard;
using Lucene.Net.Documents;
using Lucene.Net.Index;
using Lucene.Net.Store;
using Lucene.Net.Util;
using System;
using System.Collections.Generic;
using System.Data;
using System.Data.Common;
using System.IO;
using System.Reflection.Metadata;
using System.Data;
using Dm;
using static FreeSql.Internal.GlobalFilter;
using Lucene.Net.Search;
using Lucene.Net.QueryParsers;
using System.Runtime.ConstrainedExecution;
using System.Reflection.PortableExecutable;

/// <summary>
/// Console program that imports the rows of the <c>reg_infor</c> table from a Dameng
/// database into the Lucene index stored at <c>D:\LuceneIndex</c>.
/// </summary>
class Program
{
    /// <summary>
    /// Number of documents written between two commits. Committing after every single
    /// document forces a flush/sync per row and makes a multi-million-row import
    /// impractically slow, so commits are batched.
    /// </summary>
    private const int CommitBatchSize = 10000;

    /// <summary>
    /// Opens (or creates) the index, streams every row of <c>reg_infor</c> into it and
    /// commits in batches. Exceptions propagate to the caller after resources are released.
    /// </summary>
    /// <param name="args">Command-line arguments (unused).</param>
    static void Main(string[] args)
    {
        Analyzer analyzer = null;
        IndexWriter writer = null;
        Lucene.Net.Store.Directory indexDirectory = null;

        try
        {
            indexDirectory = FSDirectory.Open(new System.IO.DirectoryInfo("D:\\LuceneIndex"));
            analyzer = new StandardAnalyzer(Lucene.Net.Util.Version.LUCENE_30);

            // Create a fresh index only when none exists yet; otherwise open the existing one.
            bool iscreate = !Lucene.Net.Index.IndexReader.IndexExists(indexDirectory);

            writer = new IndexWriter(indexDirectory, analyzer, iscreate, IndexWriter.MaxFieldLength.UNLIMITED);

            // NOTE(review): credentials are hard-coded in this sample; load them from configuration in real use.
            string connectionString = "Server=LOCALHOST;Database=SYSDBA;User Id=SYSDBA;Password=123456;";

            using (DmConnection connection = new DmConnection(connectionString))
            {
                connection.Open();

                using (DmCommand command = new DmCommand("SELECT reg_id,reg_name,reg_sex,reg_datetime,reg_status FROM reg_infor", connection))
                using (var reader = command.ExecuteReader())
                {
                    // Stream rows instead of materializing the whole table in a DataTable,
                    // which would hold every row in memory at once.
                    int pending = 0;
                    while (reader.Read())
                    {
                        Lucene.Net.Documents.Document doc = BuildDocument(reader);

                        if (iscreate)
                        {
                            // Brand-new index: nothing to replace, plain add is the fastest path.
                            writer.AddDocument(doc);
                        }
                        else
                        {
                            // Existing index: replace any document with the same reg_id so that
                            // re-running the import does not create duplicates.
                            writer.UpdateDocument(new Term("reg_id", doc.Get("reg_id")), doc);
                        }

                        pending++;
                        if (pending >= CommitBatchSize)
                        {
                            writer.Commit();
                            pending = 0;
                        }
                    }

                    // Commit the final partial batch.
                    if (pending > 0)
                    {
                        writer.Commit();
                    }
                }
            }
        }
        finally
        {
            // Release the writer first: it depends on both the analyzer and the directory.
            if (writer != null)
                writer.Dispose(); // previously: writer.Close();
            if (analyzer != null)
                analyzer.Close();
            if (indexDirectory != null)
                indexDirectory.Dispose(); // previously: Close();
        }

        Console.WriteLine("索引创建成功!");
        Console.ReadLine();
    }

    /// <summary>
    /// Converts the current database record into a Lucene document. Every column is
    /// stored and indexed as a single un-analyzed term (exact-match lookup).
    /// </summary>
    /// <param name="record">The current row; must expose the five selected columns by name.</param>
    /// <returns>The document ready to be written to the index.</returns>
    private static Lucene.Net.Documents.Document BuildDocument(System.Data.IDataRecord record)
    {
        Lucene.Net.Documents.Document doc = new Lucene.Net.Documents.Document();
        // Stored, indexed without analysis (exact-match terms).
        doc.Add(new Field("reg_id", record["reg_id"].ToString(), Field.Store.YES, Field.Index.NOT_ANALYZED));
        doc.Add(new Field("reg_name", record["reg_name"].ToString(), Field.Store.YES, Field.Index.NOT_ANALYZED));
        doc.Add(new Field("reg_sex", record["reg_sex"].ToString(), Field.Store.YES, Field.Index.NOT_ANALYZED));
        doc.Add(new Field("reg_datetime", record["reg_datetime"].ToString(), Field.Store.YES, Field.Index.NOT_ANALYZED));
        doc.Add(new Field("reg_status", record["reg_status"].ToString(), Field.Store.YES, Field.Index.NOT_ANALYZED));
        return doc;
    }
}

3、数据查询

using Lucene.Net.Analysis;
using Lucene.Net.Analysis.Standard;
using Lucene.Net.Documents;
using Lucene.Net.Index;
using Lucene.Net.Store;
using Lucene.Net.Util;
using System;
using System.Collections.Generic;
using System.Data;
using System.Data.Common;
using System.IO;
using System.Reflection.Metadata;
using System.Data;
using Dm;
using static FreeSql.Internal.GlobalFilter;
using Lucene.Net.Search;
using Lucene.Net.QueryParsers;
using System.Runtime.ConstrainedExecution;
using System.Reflection.PortableExecutable;

/// <summary>
/// Console program that queries the Lucene index stored at <c>D:\LuceneIndex</c> and
/// prints the id and name of the matching records.
/// </summary>
class Program
{
    /// <summary>
    /// Opens the index read-only, runs a combined exact-match query
    /// (<c>reg_status = "1"</c> AND <c>reg_sex = "1"</c>) and prints up to 10 hits.
    /// Exceptions propagate to the caller after all index resources are released.
    /// </summary>
    /// <param name="args">Command-line arguments (unused).</param>
    static void Main(string[] args)
    {
        // The directory is opened once and shared by the reader; reader and searcher are
        // disposed deterministically so file handles on the index are not leaked.
        using (Lucene.Net.Store.Directory indexDirectory = FSDirectory.Open(new System.IO.DirectoryInfo("D:\\LuceneIndex")))
        using (var reader = IndexReader.Open(indexDirectory, true)) // true = read-only reader
        using (var searcher = new IndexSearcher(reader))
        {
            // Both clauses are mandatory, i.e. the query is a logical AND of the two terms.
            var booleanQuery = new BooleanQuery();
            booleanQuery.Add(new TermQuery(new Term("reg_status", "1")), Occur.MUST);
            booleanQuery.Add(new TermQuery(new Term("reg_sex", "1")), Occur.MUST);

            var hits = searcher.Search(booleanQuery, 10);

            foreach (var hit in hits.ScoreDocs)
            {
                var doc = searcher.Doc(hit.Doc);
                Console.WriteLine($"ID: {doc.Get("reg_id")}, Name: {doc.Get("reg_name")}");
            }
        }

        Console.WriteLine("索引查询成功!");
        Console.ReadLine();
    }
}

4、触发器

-- Insert trigger: after each row inserted into reg_infor, queue a log entry in
-- SYSDBA.ACTION_LOG carrying the new row's reg_id with ACTION_TYPE = 1.
-- ACTION_STATUS is written as 0 and ACTION_TIME as an empty string
-- (presumably "not yet processed" -- confirm against the consumer of ACTION_LOG).
CREATE TRIGGER trg_after_insert_reginfor
AFTER INSERT ON reg_infor
FOR EACH ROW
BEGIN
    INSERT INTO SYSDBA.ACTION_LOG (
        "LOG_ID", "BIN_ID", "ACTION_TYPE", "ACTION_STATUS", "CREATE_TIME", "ACTION_TIME"
    ) VALUES (
        REPLACE(SYS_GUID(), '-', ''),
        NEW."reg_id",
        1,
        0,
        TO_CHAR(SYSDATE, 'YYYY-MM-DD HH24:MI:SS'),
        ''
    );
END;
-- Update trigger: after each row updated in reg_infor, queue a log entry in
-- SYSDBA.ACTION_LOG carrying the row's reg_id with ACTION_TYPE = 2.
-- ACTION_STATUS is written as 0 and ACTION_TIME as an empty string
-- (presumably "not yet processed" -- confirm against the consumer of ACTION_LOG).
-- NOTE(review): no AFTER DELETE trigger is shown here; deletions would need their own
-- trigger (reading OLD."reg_id") for the index to follow deletes.
CREATE TRIGGER trg_after_update_reginfor
AFTER UPDATE ON reg_infor
FOR EACH ROW
BEGIN
    INSERT INTO SYSDBA.ACTION_LOG (
        "LOG_ID", "BIN_ID", "ACTION_TYPE", "ACTION_STATUS", "CREATE_TIME", "ACTION_TIME"
    ) VALUES (
        REPLACE(SYS_GUID(), '-', ''),
        NEW."reg_id",
        2,
        0,
        TO_CHAR(SYSDATE, 'YYYY-MM-DD HH24:MI:SS'),
        ''
    );
END;

 

posted on 2025-09-20 16:06  开源包容  阅读(27)  评论(0)    收藏  举报