Package org.apache.droids.helper.factories

Examples of org.apache.droids.helper.factories.URLFiltersFactory


    protocolFactory.getMap().put("http", httpProtocol);
    return protocolFactory;
  }
 
  public static URLFiltersFactory createDefaultURLFiltersFactory() {
    URLFiltersFactory filtersFactory = new URLFiltersFactory();
    URLFilter defaultURLFilter = new URLFilter() {

      public String filter(String urlString) {
        return urlString;
      }
     
    };
    filtersFactory.setMap(new HashMap<String, Object>());
    filtersFactory.getMap().put("default", defaultURLFilter);
    return filtersFactory;
  }
View Full Code Here


 
  public static Droid<Link> createSimpleSaveCrawlingDroid(
      String targetURI) {
    ParserFactory parserFactory = createDefaultParserFactory();
    ProtocolFactory protocolFactory = createDefaultProtocolFactory();
    URLFiltersFactory filtersFactory = createDefaultURLFiltersFactory();

    SimpleDelayTimer simpleDelayTimer = new SimpleDelayTimer();
    simpleDelayTimer.setDelayMillis(100);
   
    SimpleTaskQueueWithHistory<Link> simpleQueue = new SimpleTaskQueueWithHistory<Link>();
View Full Code Here

 
  public static Droid<Link> createSimpleReportCrawlingDroid(
      String targetURI) {
    ParserFactory parserFactory = createDefaultParserFactory();
    ProtocolFactory protocolFactory = createDefaultProtocolFactory();
    URLFiltersFactory filtersFactory = createDefaultURLFiltersFactory();

    SimpleDelayTimer simpleDelayTimer = new SimpleDelayTimer();
    simpleDelayTimer.setDelayMillis(100);

    SequentialTaskMaster<Link> taskMaster = new SequentialTaskMaster<Link>();
View Full Code Here

 
  public static Droid<Link> createSimpleExceptionCrawlingDroid(
      String targetURI) {
    ParserFactory parserFactory = createDefaultParserFactory();
    ProtocolFactory protocolFactory = createDefaultProtocolFactory();
    URLFiltersFactory filtersFactory = createDefaultURLFiltersFactory();

    SimpleDelayTimer simpleDelayTimer = new SimpleDelayTimer();
    simpleDelayTimer.setDelayMillis(100);
   
    Queue<Link> queue = new LinkedList<Link>();
View Full Code Here

    protocolFactory.setMap(new HashMap<String, Object>());
    protocolFactory.getMap().put("http", httpProtocol);
    protocolFactory.getMap().put("https", httpProtocol);
   
    // Create URL filter factory.
    URLFiltersFactory filtersFactory = new URLFiltersFactory();
    RegexURLFilter defaultURLFilter = new RegexURLFilter();
    defaultURLFilter.setFile("classpath:/regex-urlfilter.txt");
    filtersFactory.setMap(new HashMap<String, Object>());
    filtersFactory.getMap().put("default", defaultURLFilter);
   
    // Create handler factory. Provide sysout handler only.
    HandlerFactory handlerFactory = new HandlerFactory();
    SysoutHandler defaultHandler = new SysoutHandler();
    handlerFactory.setMap(new HashMap<String, Object>());
View Full Code Here

    getHandlerFactory().handle(link.getURI(), entity);
  }
 
  protected Collection<Link> getFilteredOutlinks( Parse parse )
  {
    URLFiltersFactory filters = droid.getFiltersFactory();
    TaskValidator< Link > linkValidator = droid.getLinkValidator();
  
    // TODO -- make the hashvalue for Outlink...
    Map<String,Link> filtered = new LinkedHashMap<String,Link>();
    for( Link outlink : parse.getOutlinks() ) {
      String id = outlink.getId();
      if (filters.accept(id) && !filtered.containsKey(id)) {
      if( linkValidator == null ){
        filtered.put(id,outlink);
      }
      else if( linkValidator.validate( outlink ) ){
        filtered.put(id,outlink);
View Full Code Here

    protocolFactory.getMap().put("http", httpProtocol);
    return protocolFactory;
  }
 
  public static URLFiltersFactory createDefaultURLFiltersFactory() {
    URLFiltersFactory filtersFactory = new URLFiltersFactory();
    URLFilter defaultURLFilter = new URLFilter() {

      public String filter(String urlString) {
        return urlString;
      }
     
    };
    filtersFactory.getMap().put("default", defaultURLFilter);
    return filtersFactory;
  }
View Full Code Here

 
  public static Droid<Link> createSimpleSaveCrawlingDroid(
      String targetURI) {
    ParserFactory parserFactory = createDefaultParserFactory();
    ProtocolFactory protocolFactory = createDefaultProtocolFactory();
    URLFiltersFactory filtersFactory = createDefaultURLFiltersFactory();

    SimpleDelayTimer simpleDelayTimer = new SimpleDelayTimer();
    simpleDelayTimer.setDelayMillis(100);
   
    SimpleTaskQueueWithHistory<Link> simpleQueue = new SimpleTaskQueueWithHistory<Link>();
View Full Code Here

 
  public static Droid<Link> createSimpleReportCrawlingDroid(
      String targetURI) {
    ParserFactory parserFactory = createDefaultParserFactory();
    ProtocolFactory protocolFactory = createDefaultProtocolFactory();
    URLFiltersFactory filtersFactory = createDefaultURLFiltersFactory();

    SimpleDelayTimer simpleDelayTimer = new SimpleDelayTimer();
    simpleDelayTimer.setDelayMillis(100);

    SequentialTaskMaster<Link> taskMaster = new SequentialTaskMaster<Link>();
View Full Code Here

 
  public static Droid<Link> createSimpleExceptionCrawlingDroid(
      String targetURI) {
    ParserFactory parserFactory = createDefaultParserFactory();
    ProtocolFactory protocolFactory = createDefaultProtocolFactory();
    URLFiltersFactory filtersFactory = createDefaultURLFiltersFactory();

    SimpleDelayTimer simpleDelayTimer = new SimpleDelayTimer();
    simpleDelayTimer.setDelayMillis(100);
   
    Queue<Link> queue = new LinkedList<Link>();
View Full Code Here

TOP

Related Classes of org.apache.droids.helper.factories.URLFiltersFactory

Copyright © 2018 www.massapicom. All rights reserved.
All source code is the property of its respective owners. Java is a trademark of Sun Microsystems, Inc. and is owned by ORACLE Inc. Contact coftware#gmail.com.