Package it.unimi.dsi.parser.callback

Examples of it.unimi.dsi.parser.callback.ComposedCallbackBuilder.compose()


    this.parser = new BulletParser();
   
    ComposedCallbackBuilder composedBuilder = new ComposedCallbackBuilder();
    composedBuilder.add( this.textExtractor = new TextExtractor() );
    composedBuilder.add( this.anchorExtractor = new AnchorExtractor( maxPreAnchor, maxAnchor, maxPostAnchor ) );
    parser.setCallback( composedBuilder.compose() );

    Object o;
    try {
      o = defaultMetadata.get( PropertyBasedDocumentFactory.MetadataKeys.WORDREADER );
      wordReader = o == null ? new FastBufferedReader() : ObjectParser.fromSpec( o.toString(), WordReader.class, MG4JClassParser.PACKAGE );
View Full Code Here


    ComposedCallbackBuilder composedBuilder = new ComposedCallbackBuilder();

    composedBuilder
        .add(this.textExtractor = new StructuredTextExtractor());
    parser.setCallback(composedBuilder.compose());

    this.wordReader = new FastBufferedReader();
    text = new char[DEFAULT_BUFFER_SIZE];

    if (collectionType == null)
View Full Code Here

                    // See what the parsed content looks like
                    BulletParser parser = new BulletParser(TRECParsingFactory.INSTANCE);
                    ComposedCallbackBuilder composedBuilder = new ComposedCallbackBuilder();
                    StructuredTextExtractor textExtractor = new StructuredTextExtractor();
                    composedBuilder.add(textExtractor);
                    parser.setCallback(composedBuilder.compose());
                    parser.parse(w.getHTMLContent().toCharArray());
                    System.out.println(textExtractor.getText());
                }
            }
            in.close();
View Full Code Here

                TRECParsingFactory.ELEMENT_DOCNO,
                TRECParsingFactory.ELEMENT_FILEID,
                TRECParsingFactory.ELEMENT_FIRST,
                TRECParsingFactory.ELEMENT_SECOND
        );
        parser.setCallback(composedBuilder.compose());

        this.wordReader = new FastBufferedReader();
        text = new char[DEFAULT_BUFFER_SIZE];
    }
View Full Code Here

TOP
Copyright © 2018 www.massapi.com. All rights reserved.
All source code is the property of its respective owners. Java is a trademark of Sun Microsystems, Inc. and is owned by Oracle, Inc. Contact coftware#gmail.com.