Package com.crawljax.core.configuration.CrawljaxConfiguration

Examples of com.crawljax.core.configuration.CrawljaxConfiguration.CrawljaxConfigurationBuilder


  private EmbeddedBrowser browser;


  @Test
  public void testExtract() throws InterruptedException, CrawljaxException {
    CrawljaxConfigurationBuilder builder =
            CrawljaxConfiguration.builderFor(DEMO_SITE_SERVER.getSiteUrl());
    builder.crawlRules().click("a");
    builder.crawlRules().clickOnce(true);
    CrawljaxConfiguration config = builder.build();

    CandidateElementExtractor extractor = newElementExtractor(config);
    browser.goToUrl(DEMO_SITE_SERVER.getSiteUrl());
    List<CandidateElement> candidates = extractor.extract(DUMMY_STATE);
View Full Code Here


    return extractor;
  }

  @Test
  public void testExtractExclude() throws Exception {
    CrawljaxConfigurationBuilder builder =
            CrawljaxConfiguration.builderFor(DEMO_SITE_SERVER.getSiteUrl());
    builder.crawlRules().click("a");
    builder.crawlRules().dontClick("div").withAttribute("id", "menubar");
    builder.crawlRules().clickOnce(true);
    CrawljaxConfiguration config = builder.build();

    CandidateElementExtractor extractor = newElementExtractor(config);
    browser.goToUrl(DEMO_SITE_SERVER.getSiteUrl());

    List<CandidateElement> candidates = extractor.extract(DUMMY_STATE);
View Full Code Here

  @Test
  public void testExtractIframeContents() throws Exception {
    RunWithWebServer server = new RunWithWebServer("/site");
    server.before();
    CrawljaxConfigurationBuilder builder = CrawljaxConfiguration
            .builderFor(server.getSiteUrl().resolve("iframe/"));
    builder.crawlRules().click("a");
    CrawljaxConfiguration config = builder.build();

    CandidateElementExtractor extractor = newElementExtractor(config);
    browser.goToUrl(server.getSiteUrl().resolve("iframe/"));
    List<CandidateElement> candidates = extractor.extract(DUMMY_STATE);
View Full Code Here

  }

  @Test
  public void whenNoFollowExternalUrlDoNotFollow() throws IOException, URISyntaxException {
    CrawljaxConfigurationBuilder builder =
            CrawljaxConfiguration.builderFor("http://example.com");
    builder.crawlRules().click("a");
    CrawljaxConfiguration config = builder.build();
    CandidateElementExtractor extractor = newElementExtractor(config);

    List<CandidateElement> extract = extractFromTestFile(extractor);

    assertThat(config.getCrawlRules().followExternalLinks(), is(false));
View Full Code Here

    assertThat(extract, hasSize(2));
  }

  @Test
  public void whenFollowExternalUrlDoFollow() throws IOException, URISyntaxException {
    CrawljaxConfigurationBuilder builder =
            CrawljaxConfiguration.builderFor("http://example.com");
    builder.crawlRules().click("a");
    builder.crawlRules().followExternalLinks(true);
    CrawljaxConfiguration config = builder.build();
    CandidateElementExtractor extractor = newElementExtractor(config);

    List<CandidateElement> extract = extractFromTestFile(extractor);

    assertThat(config.getCrawlRules().followExternalLinks(), is(true));
View Full Code Here

    return new Statistics("1 hour", 1, "2KB", 1, new Date(), stateStats, 2);
  }

  @Test
  public void testConfigSerializibility() throws IOException {
    CrawljaxConfigurationBuilder builder =
            CrawljaxConfiguration.builderFor("http://example.com")
                    .addPlugin(new CrawlOverview())
                    .setOutputDirectory(tmpFolder.getRoot());

    builder.crawlRules().addCrawlCondition(
            new CrawlCondition("kers", new RegexCondition("test")));

    builder.crawlRules().addOracleComparator(
            new OracleComparator("tes", new SimpleComparator()));

    Serializer.toPrettyJson(builder.build());
  }
View Full Code Here

   * Make sure InvariantViolationPlugin executed.
   */
  @Test
  public void testInvariantFailurePlugin() {
    hit = false;
    CrawljaxConfigurationBuilder builder = CrawljaxConfiguration.builderFor(
            "http://localhost").addPlugin(new OnInvariantViolationPlugin() {
      @Override
      public void onInvariantViolation(Invariant invariant, CrawlerContext context) {
        hit = true;
      }
    });
    builder.crawlRules().addInvariant(new Invariant("Test123", new Condition() {

      @Override
      public boolean check(EmbeddedBrowser browser) {
        return false;
      }
    }));
    setStateMachineForConfig(builder.build());

    // state2.equals(state3)
    StateVertex state2 = new StateVertexImpl(2, "state2", "<table><div>state2</div></table>");
    StateVertex state3 = new StateVertexImpl(3, "state3", "<table><div>state2</div></table>");

View Full Code Here

  /**
   * Class-level JUnit rule holding a {@code RunWithWebServer} constructed with
   * {@code "/site"}.
   * NOTE(review): presumably serves the test site under "/site" for every test in this
   * class — confirm against RunWithWebServer.
   */
  @ClassRule
  public static final RunWithWebServer SERVER = new RunWithWebServer("/site");

  @Test
  public void maximumDepthIsOblidged() throws Exception {
    CrawljaxConfigurationBuilder builder = SERVER.newConfigBuilder("infinite.html");
    int depth = 3;

    CrawljaxRunner runner = new CrawljaxRunner(builder.setMaximumDepth(depth).build());
    CrawlSession session = runner.call();

    assertThat(session.getStateFlowGraph(), hasStates(depth + 1));
    assertThat(runner.getReason(), is(ExitStatus.EXHAUSTED));
  }
View Full Code Here

    assertThat(runner.getReason(), is(ExitStatus.EXHAUSTED));
  }

  @Test(timeout = 60_000)
  public void maximumTimeIsObliged() throws Exception {
    CrawljaxConfigurationBuilder builder = SERVER.newConfigBuilder("infinite.html");

    CrawljaxRunner runner = new CrawljaxRunner(builder.setUnlimitedCrawlDepth()
            .setMaximumRunTime(25, TimeUnit.SECONDS)
            .build());
    runner.call();
    assertThat(runner.getReason(), is(ExitStatus.MAX_TIME));
View Full Code Here

  }

  @Test(timeout = 60_000)
  public void maximumStatesIsObliged() throws Exception {
    CrawljaxConfigurationBuilder builder = SERVER.newConfigBuilder("infinite.html");

    CrawljaxRunner runner = new CrawljaxRunner(builder.setUnlimitedCrawlDepth()
            .setMaximumStates(3)
            .build());
    CrawlSession session = runner.call();
    assertThat(session.getStateFlowGraph(), hasStates(3));
    assertThat(runner.getReason(), is(ExitStatus.MAX_STATES));
View Full Code Here

TOP

Related Classes of com.crawljax.core.configuration.CrawljaxConfiguration.CrawljaxConfigurationBuilder

Copyright © 2018 www.massapi.com. All rights reserved.
All source code is the property of its respective owners. Java is a trademark of Sun Microsystems, Inc and owned by ORACLE Inc. Contact coftware#gmail.com.