Examples of HtmlCleaner


Examples of org.apache.wookie.util.html.HtmlCleaner

  /**
   * tests that user scripts are placed after injected scripts
   */
  @Test
  public void injectScriptWithUserScript(){
    HtmlCleaner cleaner = new HtmlCleaner();
    String content = "<head><script type=\"text/javascript\" src=\"user.js\"></script></head>";
    String out = "";
    StringWriter writer = new StringWriter();
    try {
      cleaner.setReader(new StringReader(content));
      cleaner.injectScript("inject.js");
      cleaner.process(writer);
      out = writer.getBuffer().toString();
      assertEquals("<html><head><script type=\"text/javascript\" src=\"inject.js\"></script><script type=\"text/javascript\" src=\"user.js\"></script></head><body></body></html>", out);
    } catch (IOException e) {
      fail();
    }
View Full Code Here

Examples of org.apache.wookie.util.html.HtmlCleaner

  /**
   * tests that user scripts are placed after injected scripts and are not reordered
   */
  @Test
  public void injectScriptWithUserScriptNoReorder(){
    HtmlCleaner cleaner = new HtmlCleaner();
    String content = "<head><script type=\"text/javascript\" src=\"user.js\"></script><script type=\"text/javascript\">google.load(\"dojo\", \"1.4.1\");</script></head>";
    String out = "";
    StringWriter writer = new StringWriter();
    try {
      cleaner.setReader(new StringReader(content));
      cleaner.injectScript("inject.js");
      cleaner.process(writer);
      out = writer.getBuffer().toString();
      assertEquals("<html><head><script type=\"text/javascript\" src=\"inject.js\"></script><script type=\"text/javascript\" src=\"user.js\"></script><script type=\"text/javascript\">google.load(\"dojo\", \"1.4.1\");</script></head><body></body></html>", out);
    } catch (IOException e) {
      fail();
    }
View Full Code Here

Examples of org.apache.wookie.util.html.HtmlCleaner

  /**
   * tests injecting stylesheet
   */
  @Test
  public void injectStylesheet(){
    HtmlCleaner cleaner = new HtmlCleaner();
    String content = "";
    String out = "";
    StringWriter writer = new StringWriter();
    try {
      cleaner.setReader(new StringReader(content));
      cleaner.injectStylesheet("test.css");
      cleaner.process(writer);
      out = writer.getBuffer().toString();
      assertEquals("<html><head><link type=\"text/css\" rel=\"stylesheet\" href=\"test.css\" /></head><body></body></html>", out);
    } catch (IOException e) {
      fail();
    }
View Full Code Here

Examples of org.apache.wookie.util.html.HtmlCleaner

    }
  }

  @Test (expected = IOException.class)
  public void nullReader() throws IOException{
    HtmlCleaner cleaner = new HtmlCleaner();
    StringWriter writer = new StringWriter();
    cleaner.setReader(null);
    cleaner.injectStylesheet("test.css");
    cleaner.process(writer);
    fail();
  }
View Full Code Here

Examples of org.apache.wookie.util.html.HtmlCleaner

    cleaner.process(writer);
    fail();
  }
  @Test (expected = IOException.class)
  public void nullContentInReader() throws IOException{
    HtmlCleaner cleaner = new HtmlCleaner();
    StringWriter writer = new StringWriter();
    cleaner.setReader(new FileReader("bogus.html"));
    cleaner.injectStylesheet("test.css");
    cleaner.process(writer);
  }
View Full Code Here

Examples of org.apache.wookie.util.html.HtmlCleaner

    cleaner.process(writer);
  }

  @Test  (expected = IOException.class)
  public void nullWriter() throws IOException{
    HtmlCleaner cleaner = new HtmlCleaner();
    FileWriter writer = null;
    cleaner.setReader(new StringReader("test"));
    cleaner.injectStylesheet("test.css");
    cleaner.process(writer);
  }
View Full Code Here

Examples of org.htmlcleaner.HtmlCleaner

  }
 
  public static Collection<String> findAllLinkHref(String html, String hostUrl) throws Exception{
    Collection<String> urls = new ArrayList<String>();
   
    HtmlCleaner cleaner = new HtmlCleaner();
    TagNode node = cleaner.clean(html);
    Object[] ns = node.evaluateXPath("//a[@href]");
    for (Object object : ns) {
      TagNode node2=(TagNode) object;
      String href = node2.getAttributeByName("href");
      if (href == null || href.trim().length() == 0)
View Full Code Here

Examples of org.htmlcleaner.HtmlCleaner

   
    return map;
  }
 
  private List<Map<String, Object>> parseHtml(Page page) throws Exception{
    HtmlCleaner cleaner = new HtmlCleaner();
    cleaner.getProperties().setTreatUnknownTagsAsContent(true);
    String html = page.getContent();
    TagNode rootNode = cleaner.clean(html);
    fel.getContext().set("$page_content", html);
        final List<Field> fields = target.getModel().getField();
    String isModelArray = target.getModel().getIsArray();
    String modelXpath = target.getModel().getXpath();
    List<Map<String, Object>> list = new ArrayList<Map<String, Object>>();
View Full Code Here

Examples of org.htmlcleaner.HtmlCleaner

    System.out.println(objs);
  }
 
  public static Object evalXpath(String html, String xpath, String attribute){
    List<Object> result = new ArrayList<Object>();
    HtmlCleaner cleaner = new HtmlCleaner();
    try {
      TagNode tagNode = cleaner.clean(html);
      Object[] nodeVals = tagNode.evaluateXPath(xpath);
      for (Object tag : nodeVals){
        TagNode _tag = (TagNode)tag;
        Object val = null;
        if (attribute != null)
View Full Code Here

Examples of org.htmlcleaner.HtmlCleaner

        xml = CommonUtil.toXml((Node)node, keepHeader);
        return CommonUtil.toHTML(xml);
      }else if (node instanceof TagNode){
        StringWriter sw = new StringWriter();
        //TODO load this CleanerProperties from a configuration file
        CleanerProperties prop = new HtmlCleaner().getProperties();
        SimpleXmlSerializer ser = new SimpleXmlSerializer(prop);
        ser.write((TagNode)node, sw, "UTF-8");
          String html = sw.getBuffer().toString();
          if (keepHeader)
            xml = html;
View Full Code Here
TOP
Copyright © 2018 www.massapi.com. All rights reserved.
All source code is the property of its respective owners. Java is a trademark of Sun Microsystems, Inc and owned by ORACLE Inc. Contact coftware#gmail.com.