Package com.chenlb.mmseg4j

Source Code of com.chenlb.mmseg4j.ComplexSegTest

package com.chenlb.mmseg4j;

import java.io.IOException;

import junit.framework.TestCase;

import com.chenlb.mmseg4j.example.Complex;

public class ComplexSegTest extends TestCase {

  Complex segW;
  protected void setUp() throws Exception {
    segW = new Complex();
    //ComplexSeg.setShowChunk(true);
  }

  /*public void testSeg() {
    String txt = "";
    txt = "各人发表关于受一股来自中西伯利亚的强冷空气影响";
    ComplexSeg.setShowChunk(true);
    ComplexSeg seg = new ComplexSeg(new Dictionary("dic"));  //sogou
    Sentence sen = new Sentence(txt.toCharArray(), 0);
    System.out.println();
    while(!sen.isFinish()) {
      Chunk chunk = seg.seg(sen);
      System.out.println(chunk+" -> "+chunk.getStartOffset());
    }
  }*/

  public void testEffect() throws IOException {
    String words = segW.segWords("研究生命起源", "|");
    assertEquals("研究|生命|起源", words);
  }
 
  public void testEffect1() throws IOException {
    String words = segW.segWords("为首要考虑", "|");
    assertEquals("为首|要|考虑", words);
  }
 
  public void testEffect2() throws IOException {
    String words = segW.segWords("眼看就要来了", "|");
    assertEquals("眼看|就要|来了", words);
  }
 
  public void testEffect3() throws IOException {
    String words = segW.segWords("中西伯利亚", "|");
    assertEquals("中|西伯利亚", words);
  }
 
  public void testEffect4() throws IOException {
    String words = segW.segWords("国际化", "|");
    assertEquals("国际化", words);
  }
 
  public void testEffect5() throws IOException {
    String words = segW.segWords("化装和服装", "|");
    assertEquals("化装|和|服装", words);
  }
 
  public void testEffect6() throws IOException {
    String words = segW.segWords("中国人民银行", "|");
    assertEquals("中国人民银行", words);
  }
 
  /**
   * 自扩展的词库文件
   */
  public void testEffect7() throws IOException {
    String words = segW.segWords("白云山", "|");
    assertEquals("白云山", words);
  }
 
  public void testEffect10() throws IOException {
    String words = segW.segWords("清华大学", "|");
    assertEquals("清华大学", words);
  }
 
  public void testEffect11() throws IOException {
    String words = segW.segWords("华南理工大学", "|");
    assertEquals("华南理工大学", words);
  }
 
  public void testEffect12() throws IOException {
    String words = segW.segWords("广东工业大学", "|");
    assertEquals("广东工业大学", words);
  }
  public void testUnitEffect() throws IOException {
    String words = segW.segWords("2008年底发了资金吗", "|");
    assertEquals("2008|年|底|发了|资金|吗", words);
  }
 
  public void testUnitEffect1() throws IOException {
    String words = segW.segWords("20分钟能完成", "|");
    assertEquals("20|分钟|能|完成", words);
  }
}
TOP

Related Classes of com.chenlb.mmseg4j.ComplexSegTest

TOP
Copyright © 2018 www.massapi.com. All rights reserved.
All source code are property of their respective owners. Java is a trademark of Sun Microsystems, Inc and owned by ORACLE Inc. Contact coftware#gmail.com.