Lucene 4.4 环境测试

来源:互联网 发布:windows 网络编程 编辑:程序博客网 时间:2024/09/21 06:34

package com.zsj.test;

import java.io.IOException;

import org.apache.lucene.analysis.Analyzer;
import org.apache.lucene.analysis.TokenStream;
import org.apache.lucene.analysis.standard.StandardAnalyzer;
import org.apache.lucene.analysis.tokenattributes.CharTermAttribute;
import org.apache.lucene.util.Version;
/**
 * Lu
 * @author hadoop
 *
 */
public class FirstLucene {
 public static void main(String[] args) throws IOException {
  /**
   * 标准分析器是Lucene内置的分析器,会将语汇单元转成小写形式,
   * 并去除停用词及标点符号,很明显也是不适合于中文环境
   */
  Analyzer analyzer = new StandardAnalyzer(Version.LUCENE_44);
  TokenStream tokenStream = analyzer.tokenStream("",
    "this is my first lucene");
  CharTermAttribute charTermAttribute = tokenStream
    .addAttribute(CharTermAttribute.class);
  tokenStream.reset();
  while (tokenStream.incrementToken()) {
   System.out.println(charTermAttribute.toString());
  }
  tokenStream.end();
  tokenStream.close();
 }
}

原创粉丝点击