Lucene4.3入门-白红宇

强烈建议你试试无所不能的chatGPT，快点击我

Lucene4.3入门

阅读量：7224 次

发布时间：2019-06-29

本文共 5397 字，大约阅读时间需要 17 分钟。

辞职交接期间无聊看了一下搜索引擎，java社区比较火的当然是Lucene,想写一个简单的小例子，在网上找了些资料，不过都不是4.3的，自己看了一下。

下载地址：http://lucene.apache.org/core/

项目结构

constans.java 是常量类

LuceneIndex.java 建立索引类

LuceneSearch.java 搜索类

数据文件：

package com.xin;public class Constants {     public final static String INDEX_FILE_PATH = "e:\\lucene\\test"; //索引的文件的存放路径     public final static String INDEX_STORE_PATH = "e:\\lucene\\index"; //索引的存放位置 }

package com.xin;import java.io.BufferedReader;import java.io.File;import java.io.FileInputStream;import java.io.InputStreamReader;import java.io.Reader;import java.util.Date;import org.apache.lucene.analysis.Analyzer;import org.apache.lucene.analysis.standard.StandardAnalyzer;import org.apache.lucene.document.Document;import org.apache.lucene.document.Field;import org.apache.lucene.document.StringField;import org.apache.lucene.document.TextField;import org.apache.lucene.index.IndexWriter;import org.apache.lucene.index.IndexWriterConfig;import org.apache.lucene.index.IndexWriterConfig.OpenMode;import org.apache.lucene.store.Directory;import org.apache.lucene.store.FSDirectory;import org.apache.lucene.util.Version;/** * @author chongxin * @since 2013/6/19 * @version Lucene 4.3.1 * */public class LuceneIndex {	// 索引器	private IndexWriter writer = null;	public LuceneIndex() {		try {			//索引文件的保存位置			Directory dir = FSDirectory.open(new File(Constants.INDEX_STORE_PATH));			//分析器			Analyzer analyzer = new StandardAnalyzer(Version.LUCENE_40);			//配置类			IndexWriterConfig iwc = new IndexWriterConfig(Version.LUCENE_40,analyzer);			iwc.setOpenMode(OpenMode.CREATE);//创建模式 OpenMode.CREATE_OR_APPEND 添加模式						writer = new IndexWriter(dir, iwc);		} catch (Exception e) {			e.printStackTrace();		}	}	// 将要建立索引的文件构造成一个Document对象，并添加一个域"content"	private Document getDocument(File f) throws Exception {		Document doc = new Document();		FileInputStream is = new FileInputStream(f);		Reader reader = new BufferedReader(new InputStreamReader(is));		//字符串 StringField LongField TextField		Field pathField = new StringField("path", f.getAbsolutePath(),Field.Store.YES);		Field contenField = new TextField("contents", reader);		//添加字段		doc.add(contenField);		doc.add(pathField);		return doc;	}	public void writeToIndex() throws Exception {		File folder = new File(Constants.INDEX_FILE_PATH);				if (folder.isDirectory()) {			String[] files = folder.list();			for (int i = 0; i < files.length; i++) {				File file = new File(folder, files[i]);				Document doc = getDocument(file);				System.out.println("正在建立索引 : " + file + "");				writer.addDocument(doc);			}		}	}	public void close() throws Exception {		writer.close();	}	public static void main(String[] args) throws Exception {		// 声明一个对象		LuceneIndex indexer = new LuceneIndex();		// 建立索引		Date start = new Date();		indexer.writeToIndex();		Date end = new Date();		System.out.println("建立索引用时" + (end.getTime() - start.getTime()) + "毫秒");		indexer.close();	}}

执行结果：

正在建立索引 : e:\lucene\test\a.txt正在建立索引 : e:\lucene\test\b.txt正在建立索引 : e:\lucene\test\c.txt正在建立索引 : e:\lucene\test\d.txt建立索引用时109毫秒

生成的索引文件：

查找：

package com.xin;import java.io.File;import java.util.Date;import org.apache.lucene.analysis.Analyzer;import org.apache.lucene.analysis.standard.StandardAnalyzer;import org.apache.lucene.document.Document;import org.apache.lucene.index.DirectoryReader;import org.apache.lucene.index.IndexReader;import org.apache.lucene.queryparser.classic.QueryParser;import org.apache.lucene.search.IndexSearcher;import org.apache.lucene.search.Query;import org.apache.lucene.search.ScoreDoc;import org.apache.lucene.search.TopDocs;import org.apache.lucene.store.FSDirectory;import org.apache.lucene.util.Version;/** * @author chongxin * @since 2013/6/19 * @version Lucene 4.3.1 * */public class LuceneSearch {	// 声明一个IndexSearcher对象	private IndexSearcher searcher = null;	// 声明一个Query对象	private Query query = null;	private String field = "contents";	public LuceneSearch() {		try {			IndexReader reader = DirectoryReader.open(FSDirectory.open(new File(Constants.INDEX_STORE_PATH)));			searcher = new IndexSearcher(reader);		} catch (Exception e) {			e.printStackTrace();		}	}    //返回查询结果 	public final TopDocs search(String keyword) {		System.out.println("正在检索关键字 : " + keyword);		try {			Analyzer analyzer = new StandardAnalyzer(Version.LUCENE_40);			QueryParser parser = new QueryParser(Version.LUCENE_40, field,analyzer);			// 将关键字包装成Query对象			query = parser.parse(keyword);			Date start = new Date();			TopDocs results = searcher.search(query, 5 * 2);			Date end = new Date();			System.out.println("检索完成，用时" + (end.getTime() - start.getTime())					+ "毫秒");			return results;		} catch (Exception e) {			e.printStackTrace();			return null;		}	}      //打印结果	public void printResult(TopDocs results) {		ScoreDoc[] h = results.scoreDocs;		if (h.length == 0) {			System.out.println("对不起，没有找到您要的结果。");		} else {			for (int i = 0; i < h.length; i++) {				try {					Document doc = searcher.doc(h[i].doc);					System.out.print("这是第" + i + "个检索到的结果，文件名为：");					System.out.println(doc.get("path"));				} catch (Exception e) {					e.printStackTrace();				}			}		}		System.out.println("--------------------------");	}	public static void main(String[] args) throws Exception {		LuceneSearch test = new LuceneSearch();		TopDocs h = null;		h = test.search("中国");		test.printResult(h);		h = test.search("人民");		test.printResult(h);		h = test.search("共和国");		test.printResult(h);	}}

你可能感兴趣的文章

CPU 超线程、多核

用ASCII码显示string.xml中的特殊字符

网站301跳转到新域名

codewars020: The Clockwise Spiral 数字顺时针螺旋矩阵

ios 下拉刷新

Django在Windows系统下的安装配置

懒到极致：对mybatis的进一步精简

Android学习之OTA Update

Maven Multi-environment package

JMM-java内存模型

iOS的soap应用(webservice) 开发

Delphi listview 点击列头排序

android preference page

mysql索引挑选

关于冰岛足球的段子

在 Windows 中安装 Laravel 5.1.X

TeamViewer 9发布－在Linux下安装运行

Centos7 Gitea安装教程 - 一款易搭建，运行快的Git服务器

CentOS minimal 网络配置

喝酒易醉，品茶养心，人生如梦，品茶悟道，何以解忧？唯有杜康！-- 愿君每日到此一游！

当前时间: 2025-02-12 17:02:49 当前IP: 18.118.252.210 联系邮箱:javaeecc@qq.com Copyright © 2020 - 2022 baihongyu.com 京ICP备2021015314号-2

强烈建议你试试无所不能的CHAT-GPT，快点击我

强烈建议你试试无所不能的CHAT-GPT，快点击我