lucene5.3.1 索引增删改查

来源:互联网 发布:淘宝买iphone7靠谱吗 编辑:程序博客网 时间:2024/04/30 18:41

项目下载地址:

点击下载


增删改查工具类:


import java.io.IOException;import java.nio.file.Paths;import java.util.ArrayList;import java.util.List;import org.apache.lucene.analysis.Analyzer;import org.apache.lucene.analysis.standard.StandardAnalyzer;import org.apache.lucene.document.Document;import org.apache.lucene.document.Field;import org.apache.lucene.document.IntField;import org.apache.lucene.document.StringField;import org.apache.lucene.document.TextField;import org.apache.lucene.index.DirectoryReader;import org.apache.lucene.index.IndexReader;import org.apache.lucene.index.IndexWriter;import org.apache.lucene.index.IndexWriterConfig;import org.apache.lucene.index.Term;import org.apache.lucene.queryparser.classic.ParseException;import org.apache.lucene.queryparser.classic.QueryParser;import org.apache.lucene.search.IndexSearcher;import org.apache.lucene.search.Query;import org.apache.lucene.search.ScoreDoc;import org.apache.lucene.search.TopDocs;import org.apache.lucene.store.Directory;import org.apache.lucene.store.FSDirectory;public class IndexCrud {String[] ids = {"1","2","3","4","5","6"};String[] names = {"zs","ls","ww","hl","wq","bb"};String[] emails = {"zs@qq.com","zs@baidu.com","zs@126.com","zs@sina.com","zs@163.com","zs@google.com"};String[] contents = {   "She had been shopping with her Mom in Wal-Mart. She must have been 6 years old, this beautiful brown haired, freckle-faced image of innocence. It was pouring outside. The kind of rain that gushes over the top of rain gutters, so much in a hurry to hit the Earth, it has no time to flow down the spout."   ,"We all stood there under the awning and just inside the door of the Wal-Mart. We all waited, some patiently, others irritated, because nature messed up their hurried day. I am always mesmerized by rainfall. I get lost in the sound and sight of the heavens washing away the dirt and dust of the world. Memories of running, splashing so carefree as a child come pouring in as a welcome reprieve from the worries of my day."   ,"Her voice was so sweet as it broke the hypnotic trance we were all caught in, Mom, let's run through the rain. she said."   ,"The entire crowd stopped dead silent. I swear you couldn't hear anything but the rain. We all stood silently. No one came or left in the next few minutes. Mom paused and thought for a moment about what she would say."   ,"Now some would laugh it off and scold her for being silly. Some might even ignore what was said. But this was a moment of affirmation in a young child's life. Time when innocent trust can be nurtured so that it will bloom into faith."   ,"To everything there is a season and a time to every purpose under heaven. I hope you still take the time to run through the rain."};int[] fileSizes = {1,2,5,3,6,3};private Directory directory;private Analyzer analyzer;private IndexWriterConfig config;  private IndexWriter writer;    private IndexReader reader;public IndexCrud() { try {   //本地存储      directory = FSDirectory.open(Paths.get("E:\\project\\bigdata\\lucene\\index"));      //内存存储      //directory = new RAMDirectory();      //初始化分词器      analyzer = new StandardAnalyzer();      //config      config = new IndexWriterConfig(analyzer);      //index writer      writer = new IndexWriter(directory, config);      //      //createIndex();      //index reader      reader = DirectoryReader.open(directory);    } catch (IOException e) {      e.printStackTrace();    }  }/*** 索引更新*/public void updateIndex(){ try {      Term term = new Term("id", "2");      Document doc = new Document();      doc.add(new StringField("id", ids[1], Field.Store.YES));      doc.add(new StringField("name", "lsup", Field.Store.YES));      doc.add(new StringField("email", emails[1], Field.Store.YES));      doc.add(new IntField("fileSize", fileSizes[1], Field.Store.YES));      doc.add(new TextField("content", contents[1], Field.Store.NO));            //更新的时候,会把原来那个索引删掉,重新生成一个索引      writer.updateDocument(term, doc);            writer.commit();    } catch (IOException e) {      e.printStackTrace();    }}/*** 索引全部删除*/public void deleteAllIndex(){ try {      writer.deleteAll();      writer.commit();    } catch (IOException e) {      e.printStackTrace();    }}/*** 索引删除*/public void deleteIndex(){ try {      Term[] terms = new Term[2];      Term term = new Term("id", "1");      terms[0] = term;      term = new Term("id", "3");      terms[1] = term;      //将id为 1和3的索引删除。      //也可以传一个Query数组对象,将Query查找的结果删除。      writer.deleteDocuments(terms);      //deleteDocuments      writer.commit();    } catch (IOException e) {      e.printStackTrace();    }}public IndexSearcher getSearcher(){ try {      IndexReader newReader = DirectoryReader.openIfChanged((DirectoryReader)reader);      if(newReader != null){        reader.close();        reader = newReader;      }    } catch (IOException e) {      e.printStackTrace();    } return new IndexSearcher(reader);}/*** 根据条件查找索引*/public void queryIndex(){ try {      //搜索器      IndexSearcher searcher = getSearcher();      //查询哪个字段      QueryParser parse = new QueryParser("email", analyzer);      //查询关键字      Query query = parse.parse("zs");      TopDocs topDocs = searcher.search(query, 1000);            //碰撞结果      ScoreDoc[] hits = topDocs.scoreDocs;            for (int i = 0; i < hits.length; i++) {        ScoreDoc hit = hits[i];        Document hitDoc = searcher.doc(hit.doc);        //结果按照得分来排序。主要由 关键字的个数和权值来决定        System.out.println("("+hit.doc+"-"+hit.score+")"+"id:"+hitDoc.get("id")+" name:"+hitDoc.get("name")+" email:"+hitDoc.get("email"));      }    } catch (IOException e) {      e.printStackTrace();    } catch (ParseException e) {      e.printStackTrace();    }}/*** 读取索引*/public void readIndex(){    System.out.println("max num:"+reader.maxDoc());    System.out.println("index num:"+reader.numDocs());    //删除了的索引数    System.out.println("delete index num:"+reader.numDeletedDocs());  }/*** 创建索引*/public void createIndex(){  try {   //创建writer      List<Document> docs = new ArrayList<Document>();      for(int i = 0; i < ids.length; i++){        Document doc = new Document();        doc.add(new StringField("id", ids[i], Field.Store.YES));        doc.add(new StringField("name", names[i], Field.Store.YES));        Field field = new TextField("email", emails[i], Field.Store.YES);        doc.add(field);                //加权操作。qq邮箱2.0  新浪有限1.5  其他默认1.0 谷歌0.5        //1.权值越高,查询结果越靠前。        //2.lucene4.0以后不能对doc加权        //3.只能对TextField加权        if(emails[i].indexOf("qq.com")!=-1){          field.setBoost(2.0f);        }else if(emails[i].indexOf("sina.com")!=-1){          field.setBoost(1.5f);        }else if(emails[i].indexOf("google")!=-1){          field.setBoost(0.5f);        }                doc.add(new IntField("fileSize", fileSizes[i], Field.Store.YES));        //对于内容只索引不存储        doc.add(new TextField("content", contents[i], Field.Store.NO));        writer.addDocument(doc);      }      writer.commit();    } catch (IOException e) {      e.printStackTrace();    }}}




0 0
原创粉丝点击