// Lucene.Net
using System;
using System.Data;
using System.Configuration;
using System.Web;
using System.Web.Security;
using System.Web.UI;
using System.Web.UI.WebControls;
using System.Web.UI.WebControls.WebParts;
using System.Web.UI.HtmlControls;
using Lucene.Net.Index;
using Lucene.Net.Analysis.Standard;
using Lucene.Net.Documents;
using Lucene.Net.Search;
using Lucene.Net.QueryParsers;
using System.Data.OleDb;
/// <summary>
/// Helper that loads rows from an Excel worksheet through OLE DB, writes them
/// into a Lucene.Net index, and queries that index.
/// Derives from <see cref="Page"/> so that <c>Server.MapPath</c> is available
/// for resolving the index directory.
/// </summary>
public class LuceneHelper: Page
{
    // Source workbook read by CreateIndex.
    // NOTE(review): this is a verbatim string, so the value contains two
    // consecutive backslashes after "d:". Kept byte-for-byte as in the
    // original; confirm whether a single separator was intended.
    private const string ExcelSourcePath = @"d:\\水库.xls";

    /// <summary>
    /// Creates a new helper instance. No initialization is performed.
    /// </summary>
    public LuceneHelper()
    {
    }

    /// <summary>
    /// Resolves the directory in which the index is stored
    /// (<c>Server.MapPath("index")</c>).
    /// </summary>
    private string GetIndexStorePath()
    {
        return Server.MapPath("index");
    }

    /// <summary>
    /// Reads every row of worksheet <c>Sheet1</c> from the Excel file at
    /// <paramref name="Path"/> using the Jet OLE DB provider.
    /// </summary>
    /// <param name="Path">File path placed in the connection string's Data Source.</param>
    /// <returns>A <see cref="DataSet"/> whose table "table1" holds the worksheet rows.</returns>
    public DataSet ExecuteQuery(string Path)
    {
        string connectionString = "Provider=Microsoft.Jet.OLEDB.4.0;" + "Data Source=" + Path + ";" + "Extended Properties=Excel 8.0;";
        DataSet result = new DataSet();

        // The adapter now shares the single opened connection, and both are
        // disposed even when Open or Fill throws.
        using (OleDbConnection connection = new OleDbConnection(connectionString))
        using (OleDbDataAdapter adapter = new OleDbDataAdapter("select * from [Sheet1$]", connection))
        {
            connection.Open();
            adapter.Fill(result, "table1");
        }

        return result;
    }

    /// <summary>
    /// Rebuilds the index from the Excel source: one document per row with the
    /// fields NAME, pinyin and OBJECTID.
    /// </summary>
    /// <returns>
    /// The writer that was used, already closed; <c>null</c> when the build
    /// failed before the writer could be created.
    /// </returns>
    /// <remarks>
    /// Failures while reading the source or writing the index are not rethrown
    /// (the original swallowed them silently); they are now reported through
    /// <c>System.Diagnostics.Trace</c>.
    /// </remarks>
    public IndexWriter CreateIndex()
    {
        string indexPath = GetIndexStorePath();
        IndexWriter writer = null;
        try
        {
            // Read the spreadsheet before opening the writer so that a failure
            // to read it happens before the index directory is touched.
            DataSet source = ExecuteQuery(ExcelSourcePath);

            // Third argument 'true' asks the writer to create the index.
            writer = new IndexWriter(indexPath, new StandardAnalyzer(), true);
            try
            {
                foreach (DataRow row in source.Tables[0].Rows)
                {
                    Document doc = new Document();
                    // NAME and OBJECTID: stored, indexed without tokenizing.
                    doc.Add(new Field("NAME", row["NAME"].ToString(), Field.Store.YES, Field.Index.UN_TOKENIZED));
                    // pinyin: stored and tokenized; this is the field serach() queries.
                    doc.Add(new Field("pinyin", row["pinyin"].ToString(), Field.Store.YES, Field.Index.TOKENIZED));
                    doc.Add(new Field("OBJECTID", row["OBJECTID"].ToString(), Field.Store.YES, Field.Index.UN_TOKENIZED));
                    writer.AddDocument(doc);
                }
                writer.Optimize();
            }
            finally
            {
                // Close on every path so a failed build does not leave the
                // writer open.
                writer.Close();
            }
        }
        catch (Exception ex)
        {
            // Keep the original "never throws" contract, but make the failure visible.
            System.Diagnostics.Trace.TraceError("LuceneHelper.CreateIndex failed: " + ex);
        }
        return writer;
    }

    /// <summary>
    /// Searches the index: the upper-cased <paramref name="keyword"/> followed
    /// by <c>*</c> is parsed by <see cref="QueryParser"/> with "pinyin" as the
    /// default field.
    /// </summary>
    /// <param name="keyword">Text to search for.</param>
    /// <returns>
    /// A table named "resultTable" with the string columns pinyin, NAME and
    /// OBJECTID, one row per hit; <c>null</c> if the searcher returns no hits object.
    /// </returns>
    /// <remarks>
    /// The method name is misspelled but is kept because it is part of the public interface.
    /// NOTE(review): <paramref name="keyword"/> is passed to the query parser
    /// unescaped, so query-syntax characters in it are interpreted by the parser.
    /// </remarks>
    public DataTable serach(string keyword)
    {
        string indexPath = GetIndexStorePath();
        // Built before the searcher is opened, as in the original, so a null
        // keyword fails before any resource is acquired.
        string queryText = keyword.ToUpper() + "*";

        IndexSearcher searcher = new IndexSearcher(indexPath);
        try
        {
            QueryParser parser = new QueryParser("pinyin", new StandardAnalyzer());
            Query query = parser.Parse(queryText);
            Hits hits = searcher.Search(query);
            if (hits == null)
            {
                return null;
            }

            DataTable results = new DataTable("resultTable");
            results.Columns.Add("pinyin");
            results.Columns.Add("NAME");
            results.Columns.Add("OBJECTID");

            // Hits are read while the searcher is still open.
            for (int i = 0; i < hits.Length(); i++)
            {
                Document doc = hits.Doc(i);
                DataRow row = results.NewRow();
                row[0] = doc.Get("pinyin").ToString();
                row[1] = doc.Get("NAME").ToString();
                row[2] = doc.Get("OBJECTID").ToString();
                results.Rows.Add(row);
                row.AcceptChanges();
            }
            return results;
        }
        finally
        {
            // Close the searcher even when parsing or searching throws.
            searcher.Close();
        }
    }
}