Package org.wltea.analyzer.solr

Source Code of org.wltea.analyzer.solr.IKTokenizerFactory

/**
*
*/
package org.wltea.analyzer.solr;

import java.io.Reader;
import java.util.Map;

import org.apache.lucene.analysis.Tokenizer;
import org.apache.solr.analysis.BaseTokenizerFactory;
import org.wltea.analyzer.lucene.IKTokenizer;

/**
* 实现Solr1.4分词器接口
* 基于IKTokenizer的实现
*
* @author 林良益、李良杰
*
*/
public final class IKTokenizerFactory extends BaseTokenizerFactory{
 
  private boolean isMaxWordLength = false;
 
  /**
   * IK分词器Solr TokenizerFactory接口实现类
   * 默认最细粒度切分算法
   */
  public IKTokenizerFactory(){
  }
 
  /*
   * (non-Javadoc)
   * @see org.apache.solr.analysis.BaseTokenizerFactory#init(java.util.Map)
   */
  public void init(Map<String,String> args){
    String _arg = args.get("isMaxWordLength");
    isMaxWordLength = Boolean.parseBoolean(_arg);
  }
 
  /*
   * (non-Javadoc)
   * @see org.apache.solr.analysis.TokenizerFactory#create(java.io.Reader)
   */
  public Tokenizer create(Reader reader) {
    return new IKTokenizer(reader , isMaxWordLength());
  }

  public void setMaxWordLength(boolean isMaxWordLength) {
    this.isMaxWordLength = isMaxWordLength;
  }

  public boolean isMaxWordLength() {
    return isMaxWordLength;
  }

}
TOP

Related Classes of org.wltea.analyzer.solr.IKTokenizerFactory

TOP
Copyright © 2018 www.massapi.com. All rights reserved.
All source code is the property of its respective owners. Java is a trademark of Sun Microsystems, Inc. and is owned by Oracle Inc. Contact coftware#gmail.com.