创建检索索引的搜索类

来源:互联网 发布:阿格里奇 知乎 编辑:程序博客网 时间:2024/06/05 21:17

对于创建索引之后的步骤,首先是创建搜索;

代码如下:

package ch2.lucenedemo.process;


import java.io.BufferedReader;
import java.io.File;
import java.io.FileReader;
import java.io.IOException;
import java.util.Date;
import java.util.Iterator;
import java.util.LinkedHashMap;
import java.util.Map;






import org.apache.lucene.index.Term;
import org.apache.lucene.index.TermDocs;
import org.apache.lucene.search.IndexSearcher;
import org.apache.lucene.search.Query;
import org.apache.lucene.search.TermQuery;


public class Search {
private String INDEX_STORE_PATH = "E:\\Lucene\\项目index";

//利用Lucene的搜索
public void indexSearch(String searchType, String searchKey){
try{
System.out.println("++使用索引方式索引++");
System.out.println("---------------------------------------");

//根据索引位置建立IndexSearcher
IndexSearcher searcher = new IndexSearcher(INDEX_STORE_PATH);


//建立搜索单元, SearchType代表要搜索的Filed, searchKey代表关键字
Term t = new Term(searchType, searchKey);

//由Term生成一个Query
Query q = new TermQuery(t);

//搜索开始时间
Date beginTime = new Date();

//获取一个<document, frequency>的枚举类对象TermDocs
TermDocs termDocs = searcher.getIndexReader().termDocs(t);
while(termDocs.next()){
//输出在文档中出现关键字的次数
System.out.println("find " + termDocs.freq() + " matches in");

//输出搜索到关键词的文档
System.out.println(searcher.getIndexReader().document(termDocs.doc()).getField("filename").stringValue());
}

//搜索完成时间
Date endTime = new Date();

//搜索所消耗的时间
long timeOfSearch = endTime.getTime() - beginTime.getTime();
System.out.println("使用搜音方式搜索的总耗时 " + timeOfSearch + " ms");

}catch(IOException e){
e.printStackTrace();
 }

}
//利用String的搜索
public void stringSearch(String keyword, String searchDir){
System.out.println("++使用字符串匹方式搜索++");
System.out.println("---------------------------------------------------");

File fileDir = new File(searchDir);

//返回目录文件夹所有数组
File[] files = fileDir.listFiles();

//HashMap保存文件所偶有文件名和匹配次数对
Map rs = new  LinkedHashMap();

//记录搜索开始时间
Date beginTime = new Date();

//遍历所有文件
for(int i = 0; i < files.length; i++){
//初始化匹配次数
int hits = 0;
try{
BufferedReader br = new BufferedReader(new FileReader(files[i]));
StringBuffer sb = new StringBuffer();
String line =br.readLine();
while(line != null){
sb.append(line);
line = br.readLine();
}
br.close();
//讲StringBuffer转化成为String,以便于搜索
String stringToSearch = sb.toString();

//初始化fromIndex
int fromIndex = -keyword.length();

//逐个匹配关键词
while((fromIndex = stringToSearch.indexOf(keyword, fromIndex + keyword.length())) != -1){
hits++;
}


//将文件名和匹配次数加入HashMap
rs.put(files[i].getName(), new Integer(hits));

}catch(IOException e){
e.printStackTrace();
}
}


//输出查询结果
Iterator it = rs.keySet().iterator();
while(it.hasNext()){
String fileName = (String) it.next();
Integer hits = (Integer) rs.get(fileName);
System.out.println("find " + hits.intValue() + " matches in " + fileName);

}

//记录结束时间
Date endTime = new Date();

//得到搜索消耗的时间
long timeOfSearch = endTime.getTime() - beginTime.getDate();
System.out.println("使用字符串匹配方法总消耗 " +  timeOfSearch + " ms");
}


public static void main(String[] args){
Search search = new Search();

//通过索引搜索关键词
search.indexSearch("contant", "保尔");

//插入一个分隔符
System.out.println();

//通过String的API搜索关键词
search.stringSearch("保尔", "E:\\Lucene项目\\testFolder");

}
}


下图是结果:


0 0
原创粉丝点击