// Package org.apache.shindig.gadgets.rewrite

// Source Code of org.apache.shindig.gadgets.rewrite.LexerVsDomRewriteBenchmark

/*
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements.  See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership.  The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License.  You may obtain a copy of the License at
*
*   http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing,
* software distributed under the License is distributed on an
* "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
* KIND, either express or implied.  See the License for the
* specific language governing permissions and limitations
* under the License.
*/
package org.apache.shindig.gadgets.rewrite;

import org.apache.shindig.common.PropertiesModule;
import org.apache.shindig.common.uri.Uri;
import org.apache.shindig.gadgets.DefaultGuiceModule;
import org.apache.shindig.gadgets.Gadget;
import org.apache.shindig.gadgets.GadgetContext;
import org.apache.shindig.gadgets.oauth.OAuthModule;
import org.apache.shindig.gadgets.parse.GadgetHtmlParser;
import org.apache.shindig.gadgets.parse.ParseModule;
import org.apache.shindig.gadgets.parse.caja.CajaHtmlParser;
import org.apache.shindig.gadgets.parse.nekohtml.NekoHtmlParser;
import org.apache.shindig.gadgets.parse.nekohtml.NekoSimplifiedHtmlParser;
import org.apache.shindig.gadgets.rewrite.lexer.DefaultContentRewriter;
import org.apache.shindig.gadgets.rewrite.lexer.HtmlTagTransformer;
import org.apache.shindig.gadgets.spec.GadgetSpec;

import com.google.inject.Guice;
import com.google.inject.Injector;

import org.apache.commons.io.IOUtils;

import java.io.File;
import java.io.FileInputStream;
import java.net.URI;
import java.util.Map;

/**
* Compare performance of lexer rewriter and dom rewriter.
*/
public class LexerVsDomRewriteBenchmark {

  private int numRuns;
  private String content;

  private GadgetHtmlParser cajaParser = new CajaHtmlParser(
      new ParseModule.DOMImplementationProvider().get());

  private GadgetHtmlParser nekoParser = new NekoHtmlParser(
      new ParseModule.DOMImplementationProvider().get());

  private GadgetHtmlParser nekoSimpleParser = new NekoSimplifiedHtmlParser(
      new ParseModule.DOMImplementationProvider().get());

  // Caja lexer
  private Map<String, HtmlTagTransformer> defaultTransformerMap;

  private HTMLContentRewriter htmlRewriter;
  private boolean warmup;
  private ContentRewriterFeatureFactory factory;
  private DefaultContentRewriter lexerRewriter;
  private Gadget gadget;

  private LexerVsDomRewriteBenchmark(String file, int numRuns) throws Exception {
    File inputFile = new File(file);
    if (!inputFile.exists() || !inputFile.canRead()) {
      System.err.println("Input file: " + file + " not found or can't be read.");
      System.exit(1);
    }

    Injector injector = Guice.createInjector(new PropertiesModule(), new OAuthModule(),
        new DefaultGuiceModule());

    // Lexer setup
    lexerRewriter = injector.getInstance(DefaultContentRewriter.class);
    // End lexer setup

    // DOM setup
    this.htmlRewriter = injector.getInstance(HTMLContentRewriter.class);
    factory = injector.getInstance(ContentRewriterFeatureFactory.class);
    // End DOM setup

    final Uri url = Uri.parse("http://www.example.org/dummy.xml");
    GadgetSpec spec = new GadgetSpec(url,
        "<Module><ModulePrefs title=''/><Content><![CDATA[]]></Content></Module>");

    GadgetContext context = new GadgetContext() {
      @Override
      public URI getUrl() {
        return url.toJavaUri();
      }
    };

    gadget = new Gadget()
        .setContext(context)
        .setSpec(spec);

    content = new String(IOUtils.toByteArray(new FileInputStream(file)));
    this.numRuns = numRuns;

    warmup = true;
    runLexer();
    //run(cajaParser);
    run(nekoParser);
    run(nekoSimpleParser);
    Thread.sleep(5000L);
    warmup = false;
    System.out.println("Lexer------");
    runLexer();
    //System.out.println("Caja-------");
    //run(cajaParser);
    System.out.println("Neko-------");
    run(nekoParser);
    System.out.println("NekoSimple-------");
    run(nekoSimpleParser);
  }

  private void output(String content) {
    if (!warmup) {
      System.out.println(content);
    }
  }

  private void runLexer() throws Exception {
   long startTime = System.currentTimeMillis();
    for (int i = 0; i < numRuns; i++) {
      MutableContent mc = new MutableContent(null, content);
      lexerRewriter.rewrite(gadget, mc);
      mc.getContent();
    }
    long time = System.currentTimeMillis() - startTime;
    output("Lexer Rewrite [" + time + " ms total: " +
          ((double)time)/numRuns + "ms/run]");
  }

  private void run(GadgetHtmlParser parser) throws Exception {
    long startTime = System.currentTimeMillis();
    for (int i = 0; i < numRuns; i++) {
      MutableContent mc = new MutableContent(parser, content);
      //linkRewriter.rewrite(gadget, mc);
      //jsConcatRewriter.rewrite(gadget, mc);
      //styleLinksRewriter.rewrite(gadget, mc);
      htmlRewriter.rewrite(gadget, mc);
      mc.getContent();
    }
    long time = System.currentTimeMillis() - startTime;
    output("DOM Rewrite [" + time + " ms total: " +
          ((double)time)/numRuns + "ms/run]");

  }

  public static void main(String[] args) {
    // Test can be run as standalone program to test out serialization and parsing
    // performance numbers, using Caja as a parser.
    if (args.length != 2) {
      System.err.println("Args: <input-file> <num-runs>");
      System.exit(1);
    }

    String fileArg = args[0];
    String runsArg = args[1];
    int numRuns = -1;
    try {
      numRuns = Integer.parseInt(runsArg);
    } catch (Exception e) {
      System.err.println("Invalid num-runs argument: " + runsArg + ", reason: " + e);
    }
    try {
      new LexerVsDomRewriteBenchmark(fileArg, numRuns);
    } catch (Exception e) {
      e.printStackTrace();
    }
  }

}
// TOP
//
// Related Classes of org.apache.shindig.gadgets.rewrite.LexerVsDomRewriteBenchmark
//
// TOP
// Copyright © 2018 www.massapi.com. All rights reserved.
// All source code is the property of its respective owners. Java is a trademark of Sun Microsystems, Inc. and is owned by ORACLE Inc. Contact coftware#gmail.com.