Package opennlp.tools.formats.convert

Examples of opennlp.tools.formats.convert.FileToStringSampleStream


    Parameters params = ArgumentParser.parse(args, Parameters.class);

    TokenizerModel tokenizerModel = new TokenizerModelLoader().load(params.getTokenizerModel());
    Tokenizer tokenizer = new TokenizerME(tokenizerModel);

    ObjectStream<String> mucDocStream = new FileToStringSampleStream(
        new DirectorySampleStream(params.getData(), new FileFilter() {

          public boolean accept(File file) {
            return file.getName().toLowerCase().endsWith(".sgm");
          }
View Full Code Here


    Parser parser =  ParserFactory.create(parserModel);
   
    TokenizerModel tokenizerModel = new TokenizerModelLoader().load(params.getTokenizerModel());
    Tokenizer tokenizer = new TokenizerME(tokenizerModel);
   
    ObjectStream<String> mucDocStream = new FileToStringSampleStream(
        new DirectorySampleStream(params.getData(), new FileFilter() {
         
          public boolean accept(File file) {
            return file.getName().toLowerCase().endsWith(".sgm");
          }
View Full Code Here

    Parameters params = ArgumentParser.parse(args, Parameters.class);

    TokenizerModel tokenizerModel = new TokenizerModelLoader().load(params.getTokenizerModel());
    Tokenizer tokenizer = new TokenizerME(tokenizerModel);

    ObjectStream<String> mucDocStream = new FileToStringSampleStream(
        new DirectorySampleStream(params.getData(), new FileFilter() {

          public boolean accept(File file) {
            return StringUtil.toLowerCase(file.getName()).endsWith(".sgm");
          }
View Full Code Here

    // We need file to line here ... and that is probably best done with the plain text stream
    // let's copy it over here, refactor it, and then at some point we replace the current version
    // with the refactored version

    return new OntoNotesParseSampleStream(new DocumentToLineStream(new FileToStringSampleStream(
        documentStream, Charset.forName("UTF-8"))));
  }
View Full Code Here

        return file.isDirectory();
      }
    }, true);

    return new OntoNotesNameSampleStream(new FileToStringSampleStream(
        documentStream, Charset.forName("UTF-8")));
  }
View Full Code Here

TOP

Related Classes of opennlp.tools.formats.convert.FileToStringSampleStream

Copyright © 2018 www.massapicom. All rights reserved.
All source code is the property of its respective owners. Java is a trademark of Sun Microsystems, Inc. and owned by ORACLE Inc. Contact coftware#gmail.com.