Package opennlp.tools.sentdetect

Examples of opennlp.tools.sentdetect.SentenceSampleStream


    FileInputStream sampleDataIn = CmdLineUtil.openInFile(sampleDataFile);

    ObjectStream<String> lineStream = new PlainTextByLineStream(sampleDataIn
        .getChannel(), encoding);

    return new SentenceSampleStream(lineStream);
  }
View Full Code Here


    FileInputStream sampleDataIn = CmdLineUtil.openInFile(params.getData());

    ObjectStream<String> lineStream = new PlainTextByLineStream(sampleDataIn.getChannel(),
        params.getEncoding());

    return new SentenceSampleStream(lineStream);
  }
View Full Code Here

    Charset charset = Charset.forName("UTF-8");
    SentenceModel mod = null;
   
    try(FileInputStream inStream = new FileInputStream(inFile)){
      ObjectStream<String> lineStream = new PlainTextByLineStream(inStream, charset);
      ObjectStream<SentenceSample> sampleStream = new SentenceSampleStream(lineStream);

      // Training Parameters
      TrainingParameters mlParams = new TrainingParameters();
      mlParams.put(TrainingParameters.ALGORITHM_PARAM, "MAXENT");
      mlParams.put(TrainingParameters.ITERATIONS_PARAM, Integer.toString(iters));
      mlParams.put(TrainingParameters.CUTOFF_PARAM, Integer.toString(cut));

      // Abbreviations dictionary
      // TODO: Actually import a Dictionary of abbreviations
      Dictionary dict = new Dictionary();

      try {
        mod = SentenceDetectorME.train("en", sampleStream, true, dict, mlParams);
      } finally {
        sampleStream.close();
      }
    }
   
    try(FileOutputStream outStream = new FileOutputStream(outFile)){
      logger.info("Saving the model as: " + outFile.getAbsolutePath());
View Full Code Here

        if ((lang == null) || (encoding == null)) {
          usage();
        }

       
        SentenceModel model = train(lang, new SentenceSampleStream(new PlainTextByLineStream(
            new InputStreamReader(new FileInputStream(inFile), encoding))), true, null, cutoff, iters);

        // TODO: add support for iterations and cutoff settings

//        if (args.length > ai)
View Full Code Here

      lineStream = new PlainTextByLineStream(sampleDataIn, params.getEncoding());
    } catch (IOException ex) {
      CmdLineUtil.handleCreateObjectStreamError(ex);
    }

    return new SentenceSampleStream(lineStream);
  }
View Full Code Here

    FileInputStream sampleDataIn = CmdLineUtil.openInFile(sampleDataFile);

    ObjectStream<String> lineStream = new PlainTextByLineStream(sampleDataIn
        .getChannel(), encoding);

    return new SentenceSampleStream(lineStream);
  }
View Full Code Here

TOP

Related Classes of opennlp.tools.sentdetect.SentenceSampleStream

Copyright © 2018 www.massapi.com. All rights reserved.
All source code is the property of its respective owners. Java is a trademark of Sun Microsystems, Inc. and owned by ORACLE Inc. Contact coftware#gmail.com.