基于lucene的案例开发：创建索引

浏览数：22 / 时间：2015年06月09日

转载请注明出处：http://blog.csdn.net/xiaojimanman/article/details/42872711

从这篇博客开始，不论是 API 介绍还是后面的案例开发，都基于 Lucene 4.3.1 这个版本。Lucene 4.3.1 下载请点击这里，Lucene 其他版本下载请点击这里，Lucene 4.3.1 官方 API 文档请点击这里。

创建索引demo

在开始介绍之前，先看一个简单的索引创建demo程序：

 /**  
 *@Description:   索引创建demo
 */ 
package com.lulei.lucene.study;  

import java.io.File;

import org.apache.lucene.analysis.Analyzer;
import org.apache.lucene.analysis.standard.StandardAnalyzer;
import org.apache.lucene.document.Document;
import org.apache.lucene.document.Field.Store;
import org.apache.lucene.document.TextField;
import org.apache.lucene.index.IndexWriter;
import org.apache.lucene.index.IndexWriterConfig;
import org.apache.lucene.index.IndexWriterConfig.OpenMode;
import org.apache.lucene.store.Directory;
import org.apache.lucene.store.FSDirectory;
import org.apache.lucene.util.Version;
  
/**
 * Demo that writes two sample documents into a Lucene index stored on disk.
 *
 * <p>Each document carries two stored text fields, {@code name} and {@code content}.
 */
public class IndexCreate {

	/**
	 * Opens the index (creating it when absent), adds the two sample documents,
	 * commits, and always releases the writer and the directory.
	 *
	 * <p>Failures are reported with a stack trace instead of being propagated,
	 * matching the best-effort nature of the demo.
	 *
	 * @param args command-line arguments; not used
	 */
	public static void main(String[] args) {
		// Analyzer used to tokenize field text; the standard analyzer is used here.
		Analyzer analyzer = new StandardAnalyzer(Version.LUCENE_43);
		// Writer configuration: create the index if it is missing, append otherwise.
		IndexWriterConfig indexWriterConfig = new IndexWriterConfig(Version.LUCENE_43, analyzer);
		indexWriterConfig.setOpenMode(OpenMode.CREATE_OR_APPEND);

		Directory directory = null;
		IndexWriter indexWrite = null;
		try {
			// Location of the index on disk.
			directory = FSDirectory.open(new File("D://study/index/testindex"));
			// Clear a lock left on the index directory.
			// NOTE(review): forcibly unlocking is only safe when no other writer is
			// using this index; acceptable for a single-process demo.
			if (IndexWriter.isLocked(directory)) {
				IndexWriter.unlock(directory);
			}
			indexWrite = new IndexWriter(directory, indexWriterConfig);

			// Everything below runs only when the writer was opened successfully,
			// so a failed open no longer cascades into NullPointerExceptions.
			addDocument(indexWrite, createDocument("测试标题", "测试内容"));
			addDocument(indexWrite, createDocument(
					"基于lucene的案例开发：索引数学模型",
					"lucene将一篇文档分成若干个域，每个域又分成若干个词元，通过词元在文档中的重要程度，将文档转化为N维的空间向量，通过计算两个向量之间的夹角余弦值来计算两个文档的相似程度"));

			// Commit makes the additions durable. It is an expensive operation, so
			// real applications need a deliberate commit strategy.
			indexWrite.commit();
		} catch (Exception e) {
			e.printStackTrace();
		} finally {
			// Release resources even when opening, adding, or committing failed.
			if (indexWrite != null) {
				try {
					indexWrite.close();
				} catch (Exception e) {
					e.printStackTrace();
				}
			}
			if (directory != null) {
				try {
					directory.close();
				} catch (Exception e) {
					e.printStackTrace();
				}
			}
		}
	}

	/**
	 * Builds a document with stored {@code name} and {@code content} text fields.
	 *
	 * @param name    value of the {@code name} field
	 * @param content value of the {@code content} field
	 * @return the populated document
	 */
	private static Document createDocument(String name, String content) {
		Document doc = new Document();
		doc.add(new TextField("name", name, Store.YES));
		doc.add(new TextField("content", content, Store.YES));
		return doc;
	}

	/**
	 * Adds one document to the index, reporting a failure without propagating it
	 * so that the remaining documents are still attempted.
	 *
	 * @param writer open index writer
	 * @param doc    document to add
	 */
	private static void addDocument(IndexWriter writer, Document doc) {
		try {
			writer.addDocument(doc);
		} catch (Exception e) {
			e.printStackTrace();
		}
	}
}

上述程序中已经做了详细的注释，这里不再逐条介绍每条语句的作用。下面看一下执行这个 main 函数之后创建的索引文件，如下图：

技术分享