bwlang

萝卜辣椒

导航

最近项目中要用到模糊查询,开始研究lucene,期间走了好多弯路,总算实现了一个简单的demo。

使用的lucene jar包是3.6版本.

一:建立数据库表,并加上测试数据。数据库表:UserInfo

 

二:新建java project,并引入lucene jar包。http://lucene.apache.org/

 

三:为数据库表建立索引及利用索引查数据:

 

import java.io.File;


import java.io.IOException;
import java.sql.Connection;
import java.sql.PreparedStatement;
import java.sql.ResultSet;
import java.sql.SQLException;


import org.apache.lucene.analysis.Analyzer;
import org.apache.lucene.analysis.standard.StandardAnalyzer;
import org.apache.lucene.document.Document;
import org.apache.lucene.document.Field;
import org.apache.lucene.index.IndexReader;
import org.apache.lucene.index.IndexWriter;
import org.apache.lucene.index.IndexWriterConfig;
import org.apache.lucene.index.IndexWriterConfig.OpenMode;
import org.apache.lucene.queryParser.QueryParser;
import org.apache.lucene.search.IndexSearcher;
import org.apache.lucene.search.Query;
import org.apache.lucene.search.ScoreDoc;
import org.apache.lucene.search.TopDocs;
import org.apache.lucene.store.Directory;
import org.apache.lucene.util.Version;
import org.apache.lucene.store.SimpleFSDirectory;
import com.test.dbc.DBConnection;


public class MakeTableIndex {
public static void main(String[] args) throws IOException, SQLException {
String indexDir = "d:\\lucene\\index";
Connection conn;
DBConnection conn1 = new DBConnection();
conn = conn1.getConnection();
PreparedStatement pstmt = conn
.prepareStatement("SELECT * FROM UserInfo");


ResultSet rs = pstmt.executeQuery();
// 为表字段建立索引
Directory dir = new SimpleFSDirectory(new File(indexDir));
// 分词
Analyzer luceneAnalyzer = new StandardAnalyzer(Version.LUCENE_36);
IndexWriterConfig iwc = new IndexWriterConfig(Version.LUCENE_36,
luceneAnalyzer);
iwc.setOpenMode(OpenMode.CREATE);
IndexWriter indexWriter = new IndexWriter(dir, iwc);


while (rs.next()) {
System.out.println("username***" + rs.getString(2));
Document doc = new Document();
doc.add(new Field("ID", rs.getString(1), Field.Store.YES,
Field.Index.ANALYZED));
doc.add(new Field("UserName", rs.getString(2), Field.Store.YES,
Field.Index.ANALYZED));
doc.add(new Field("Hobby", rs.getString(5), Field.Store.YES,
Field.Index.ANALYZED));
indexWriter.addDocument(doc);
}
System.out.println("numDocs" + indexWriter.numDocs());
indexWriter.close();
try {
search();
} catch (Exception e) {
// TODO: handle exception
System.out.println(e);
}

}


// ------------------Search
public static void search() throws Exception {
String  dirPathString="d:\\lucene\\index";
System.out.println(dirPathString);
Directory dir = new SimpleFSDirectory(new File(dirPathString));//查询分析器  路径
IndexReader reader = IndexReader.open(dir);
IndexSearcher searcher = new IndexSearcher(reader);
QueryParser parser = new QueryParser(Version.LUCENE_35, "UserName", new StandardAnalyzer(Version.LUCENE_36));
Query q = parser.parse("张丽");
TopDocs tds = searcher.search(q, 5);
ScoreDoc[] sds = tds.scoreDocs;
for (ScoreDoc sd : sds) {
System.out.println(sd.score);
int docName = sd.doc;
Document doc = searcher.doc(docName);
String UserName = doc.get("UserName");
String Hobby = doc.get("Hobby");
System.out.println("UserName:"+UserName+"---Hobby:"+Hobby);
}
}
}

package com.test.dbc;

import java.sql.Connection;
import java.sql.DriverManager;

public class DBConnection {
    public static final String DBDRIVER= "com.microsoft.sqlserver.jdbc.SQLServerDriver"; ;
    public static final String DBURL = "jdbc:sqlserver://localhost:1433; DatabaseName=Wang;" ;
    public static final String DBUSER = "sa" ;
    public static final String DBPASS = "sa" ;
    private Connection conn = null ;
    public DBConnection(){        //在构造方法中进行数据库连接
        try{
            Class.forName(DBDRIVER) ;     //加载驱动程序
            conn = DriverManager.getConnection(DBURL,DBUSER,DBPASS) ;
        }catch(Exception e){
            e.printStackTrace() ;
        }
    }
    public Connection getConnection(){     //取得数据库连接
        System.out.println("数据库链接");
        return this.conn ;
    }
    public void close(){
        if(this.conn!=null){                  //数据库关闭操作,避免空指针异常。
            try{
                this.conn.close() ;
            }catch(Exception e){}
        }
    }
}

 

有几点问题需要注意:

1.建立索引的分词器和查询用的分词器必须一致

2.建立索引的字段名和查询的字段名需保持一致,才能找到结果

个人认为,lucene查询相比在数据库里查询表只是多了建立索引这一步,达到的目的都是从数据库了检索出我们需要的数据。

以上仅代表个人观点,欢迎大家拍砖