Package org.htmlparser

Examples of org.htmlparser.Parser.reset()


    if (isContentCutted) {
      // This means a new parser run which is expensive but necessary
      htmlPage = new Page(rawDocument.getContentAsString(), "UTF-8");
      parser = new Parser(new Lexer(htmlPage));
    } else {
      parser.reset();
    }

    try {
      // Parse the content
      parser.visitAllNodesWith(linkVisitor);
View Full Code Here


          urlFilm = tmpRecherche;
        }
      }

      if(urlFilm == null){
        parser.reset();
        parser.setResource(tmpRecherche);       
        listUrlNode = parser.extractAllNodesThatMatch (new NodeClassFilter (LinkTag.class));
        //On détecte d'abord les liens
        for (i = 0; i < listUrlNode.size(); i++){
          tmpString = listUrlNode.elementAt(i).toHtml();
View Full Code Here

     
      System.out.println("Page Downloaded: " + _url.toString());
     
      setContent(sb.toString());
     
      par.reset();
      _links.clear();
     
      NodeFilter filter = new OrFilter( new NodeFilter[] {
          new TagNameFilter("A"),
          new TagNameFilter("META")
View Full Code Here

        for (NodeIterator e = parser.elements();e.hasMoreNodes();)
        {
            node[i++] = e.nextNode();
        }
        int cnt = i;
        parser.reset ();
        // Now try getting the elements again
        i = 0;
        for (NodeIterator e = parser.elements();e.hasMoreNodes();)
        {
            node[i++] = e.nextNode();
View Full Code Here

                list.add (iterator.nextNode ());
          }
          catch (EncodingChangeException ece)
          {
              list.removeAll ();
              parser.reset ();
            for (NodeIterator iterator = parser.elements (); iterator.hasMoreNodes (); )
                list.add (iterator.nextNode ());
          }
        }
        catch (ParserException pe)
View Full Code Here

            while (iterator.hasMoreNodes ())
                checkTagNames (iterator.nextNode ());
        }
        catch (EncodingChangeException ece)
        {
            parser.reset ();
            iterator = parser.elements ();
            while (iterator.hasMoreNodes ())
                checkTagNames (iterator.nextNode ());
        }
    }
View Full Code Here

TOP
Copyright © 2018 www.massapi.com. All rights reserved.
All source code is the property of its respective owners. Java is a trademark of Sun Microsystems, Inc. and owned by ORACLE Inc. Contact coftware#gmail.com.