Lucene 學習之一:源碼環境搭建

一直想抽點時間系統的學習下Lucene ,今天把Lucene 源碼學習環境搭建了一下。下面描述一下環境搭建過程。html

開發環境的配置(lucene-4.10.2 + Eclipse):java

1:下載最新源碼:把jar包lucene-4.10.2,和java源碼lucene-4.10.2-src 都下載下來。apache

     下載地址:http://mirror.bit.edu.cn/apache/lucene/java/4.10.2/ide

2:在Eclipse 安裝lucene-4.10.2 java源碼。學習

    新建JAVA 項目,把「使用缺省位置的勾去掉」。選擇源碼文件目錄。ui

項目加載進來後會有不少錯誤提示,這是由於還有不少依賴包沒有引用到。spa

解決辦法,把jar包lucene-4.10.2 各文件夾下面的lib 文件下面的jar 包都拷貝出來。code

在項目中建一個lib 文件夾。把因此的jar 包複製過來。而後,把因此jar 包添加到構建路徑。竟然有這麼多包。htm

lucene-4.10.2-src\lucene-4.10.2\demo\src\java\org\apache\lucene\demo 這個目錄下有兩個簡單實例,分別是建索引 和 查詢 。blog

新建一個JAVA 項目,並在構建項目中添加lucene-4.10.2的引用。

下面能夠本身嘗試寫demo了。

下面是一個建索引的例子:

package index.demo;

import java.io.File;
import java.io.IOException;
import java.util.*;

import org.apache.lucene.analysis.Analyzer;
import org.apache.lucene.analysis.standard.StandardAnalyzer;
import org.apache.lucene.document.Document;
import org.apache.lucene.document.Field;
import org.apache.lucene.document.LongField;
import org.apache.lucene.document.StringField;
import org.apache.lucene.index.IndexWriter;
import org.apache.lucene.index.IndexWriterConfig;
import org.apache.lucene.index.IndexWriterConfig.OpenMode;
import org.apache.lucene.store.Directory;
import org.apache.lucene.store.FSDirectory;
import org.apache.lucene.util.Version;

import index.bean.*;

/**
 * @author zhangrh 索引構建類
 */
public class IndexBuilder {

    private IndexBuilder() {
    }

    /**
     * 索引初始化
     */
    public static void initIndex() {
        try {

            String indexPath = "D://lucene/index";

            Directory dir = FSDirectory.open(new File(indexPath));

            Analyzer analyzer = new StandardAnalyzer();

            IndexWriterConfig iwc = new IndexWriterConfig(
                    Version.LUCENE_4_10_2, analyzer);

            iwc.setOpenMode(OpenMode.CREATE);

            IndexWriter writer = new IndexWriter(dir, iwc);

            ArrayList<Hotel> hotelList = getContentData();

            if (hotelList != null) {

                for (Hotel h : hotelList) {

                    Document doc = new Document();
      
                    LongField idField = new LongField("id", h.getId(),
                            Field.Store.YES);
                    
                    doc.add(idField);

                    Field nameCNField = new StringField("name", h.getNameCN(),
                            Field.Store.YES);
                    
                    doc.add(nameCNField);
                    
                    Field nameENField = new StringField("ename", h.getNameEN(),
                            Field.Store.YES);
                    
                    doc.add(nameENField);
                    
                    writer.addDocument(doc);
                }

            }
            
            writer.close();

        } catch (IOException e) {

            // TODO 自動生成的 catch 塊
            e.printStackTrace();

        }

    }

    /**
     * 返回 {@link Hotel} 內容數據
     * 
     * @return An ArrayList of Hotel
     */
    private static ArrayList<Hotel> getContentData() {

        ArrayList<Hotel> list = new ArrayList<Hotel>();
        return list;
    }

}

 查詢例子

package index.demo;

import java.io.File;
import java.io.IOException;

import org.apache.lucene.document.Document;
import org.apache.lucene.index.DirectoryReader;
import org.apache.lucene.index.IndexReader;
import org.apache.lucene.index.Term;
import org.apache.lucene.search.IndexSearcher;
import org.apache.lucene.search.Query;
import org.apache.lucene.search.ScoreDoc;
import org.apache.lucene.search.TermQuery;
import org.apache.lucene.search.TopDocs;
import org.apache.lucene.store.Directory;
import org.apache.lucene.store.FSDirectory;

/**
 * @author zhangrh 索引查找Demo
 *
 */
public class SearchDemo {
    
    private SearchDemo(){
    }
    
    
    /**
     * 查詢酒店
     */
    public static void SearchHotel(String hotelname) {

        try {
            String indexPath = "D://lucene/index";
            
            Directory dir = FSDirectory.open(new File(indexPath));
            
            IndexReader reader = DirectoryReader.open(dir);
            
            IndexSearcher searcher = new IndexSearcher(reader);
            
            Term term = new Term("name", hotelname);
            
            Query query = new TermQuery(term);
            // Do the search
            TopDocs docs = searcher.search(query, 10);
            
            System.out.println("查詢結果總數:" + docs.totalHits);  
            
            for (ScoreDoc sd : docs.scoreDocs) {
                
                Document document= searcher.doc(sd.doc);
                
                System.out.println("酒店id:" + document.get("id"));  
                
                System.out.println("酒店name:" + document.get("name"));  
            }
            reader.close();
            
        } catch (IOException e) {
            // TODO 自動生成的 catch 塊
            e.printStackTrace();
        }
    }
}
View Code

 

官方API說明:http://lucene.apache.org/core/4_10_2/index.html

相關文章
相關標籤/搜索