Package org.data2semantics.exp

Source Code of org.data2semantics.exp.FullThemeExperiment

package org.data2semantics.exp;

import java.util.ArrayList;
import java.util.HashMap;
import java.util.List;
import java.util.Map;
import java.util.Random;

import org.data2semantics.exp.utils.KernelExperiment;
import org.data2semantics.exp.utils.RDFLinearKernelExperiment;
import org.data2semantics.exp.utils.Result;
import org.data2semantics.exp.utils.ResultsTable;
import org.data2semantics.proppred.kernels.rdfgraphkernels.RDFFeatureVectorKernel;
import org.data2semantics.proppred.kernels.rdfgraphkernels.RDFIntersectionTreeEdgeVertexPathKernel;
import org.data2semantics.proppred.kernels.rdfgraphkernels.RDFWLSubTreeKernel;
import org.data2semantics.proppred.learners.evaluation.Accuracy;
import org.data2semantics.proppred.learners.evaluation.EvaluationFunction;
import org.data2semantics.proppred.learners.evaluation.EvaluationUtils;
import org.data2semantics.proppred.learners.evaluation.F1;
import org.data2semantics.proppred.learners.liblinear.LibLINEARParameters;
import org.data2semantics.proppred.learners.libsvm.LibSVM;
import org.data2semantics.tools.rdf.RDFFileDataSet;
import org.openrdf.model.Resource;
import org.openrdf.model.Statement;
import org.openrdf.model.Value;
import org.openrdf.rio.RDFFormat;

public class FullThemeExperiment extends RDFMLExperiment {

  /**
   * @param args
   */
  public static void main(String[] args) {
    String dataDir = "C:\\Users\\Gerben\\Dropbox\\data_bgs_ac_uk_ALL";
    long seed = 1;
    double[] fractions = {0.1};

    for (int i = 0; i < args.length; i++) {
      if (args[i].equals("-dir")) {
        i++;
        dataDir = args[i];
      }
      if (args[i].equals("-seed")) {
        i++;
        seed = Long.parseLong(args[i]);
      }
      if (args[i].equals("-frac")) {
        i++;
        String[] fracs = args[i].split(",");
        fractions = new double[fracs.length];
        for (int j = 0; j < fracs.length; j++) {
          fractions[j] = Double.parseDouble(fracs[j]);
        }
      }
    }

    long[] seeds = {11, 21, 31, 41, 51, 61, 71, 81, 91, 101};
    double[] cs = {0.001, 0.01, 0.1, 1, 10, 100, 1000}

    int[] depths = {1, 2, 3};
    int[] iterations = {0, 2, 4, 6};
    dataset = new RDFFileDataSet(dataDir, RDFFormat.NTRIPLES);

    ResultsTable resTable = new ResultsTable();
    resTable.setManWU(0.05);

    boolean inference = false;
         

    List<EvaluationFunction> evalFuncs = new ArrayList<EvaluationFunction>();
    evalFuncs.add(new Accuracy());
    evalFuncs.add(new F1());

    for (double frac : fractions) {
      createGeoDataSet((int)(1000 * frac), frac, seed, "http://data.bgs.ac.uk/ref/Lexicon/hasTheme");
      List<Double> target = EvaluationUtils.createTarget(labels);
     
      LibLINEARParameters linParms = new LibLINEARParameters(LibLINEARParameters.SVC_DUAL, cs);
      linParms.setDoCrossValidation(false);
      linParms.setNumFolds(0);
      linParms.setSplitFraction((float) 0.7);
     
      Map<Double, Double> counts = EvaluationUtils.computeClassCounts(target);
      int[] wLabels = new int[counts.size()];
      double[] weights = new double[counts.size()];

      for (double label : counts.keySet()) {
        wLabels[(int) label - 1] = (int) label;
        weights[(int) label - 1] = 1 / counts.get(label);
      }
      linParms.setWeightLabels(wLabels);
      linParms.setWeights(weights);
     

      System.out.println("Running fraction: " + frac);

     
      for (int i : depths) {     
        for (int it : iterations) {
          resTable.newRow("")

          KernelExperiment<RDFFeatureVectorKernel> exp = new RDFLinearKernelExperiment(new RDFWLSubTreeKernel(it, i, inference, true), seeds, linParms, dataset, instances, target, blackList, evalFuncs);
       
          System.out.println("Running WL RDF: " + i + " " + it);
          exp.run();

          for (Result res : exp.getResults()) {
            resTable.addResult(res);
         
        }
      }
     

      for (int i : depths) {     
        //for (int it : iterations) {
          resTable.newRow("")

          //KernelExperiment<RDFFeatureVectorKernel> exp = new RDFLinearKernelExperiment(new RDFWLSubTreeKernel(it, i, inference, true), seeds, linParms, dataset, instances, target, blackList, evalFuncs);

          KernelExperiment<RDFFeatureVectorKernel> exp = new RDFLinearKernelExperiment(new RDFIntersectionTreeEdgeVertexPathKernel(i, false, inference, true), seeds, linParms, dataset, instances, target, blackList, evalFuncs);

         
          System.out.println("Running EVP: " + i);
          //System.out.println("Running WL RDF: " + i + " " + it);
          exp.run();

          for (Result res : exp.getResults()) {
            resTable.addResult(res);
         
        }
      //}
    }

    saveResults(resTable, "geo_theme_" + seed + ".ser");

    resTable.addCompResults(resTable.getBestResults());
    System.out.println(resTable);
    saveResults(resTable.toString(), "geo_theme_full_" + seed + ".txt");
  }



  protected static void createGeoDataSet(int minSize, double frac, long seed, String property) {
    Random rand = new Random(seed);

    List<Statement> stmts = dataset.getStatementsFromStrings(null, "http://www.w3.org/2000/01/rdf-schema#isDefinedBy", "http://data.bgs.ac.uk/ref/Lexicon/NamedRockUnit");
    instances = new ArrayList<Resource>();
    labels = new ArrayList<Value>();
    blackList = new ArrayList<Statement>();

    for(Statement stmt: stmts) {
      List<Statement> stmts2 = dataset.getStatementsFromStrings(stmt.getSubject().toString(), property, null);

      for (Statement stmt2 : stmts2) {


        if (rand.nextDouble() < frac) {
          instances.add(stmt2.getSubject());
          labels.add(stmt2.getObject());
        }
      }
    }

    removeSmallClasses(minSize);
    createBlackList();

    Map<Value, Integer> labelMap = new HashMap<Value, Integer>();

    System.out.println(LibSVM.computeClassCounts(LibSVM.createTargets(labels, labelMap)));
  }

}
TOP

Related Classes of org.data2semantics.exp.FullThemeExperiment

TOP
Copyright © 2018 www.massapi.com. All rights reserved.
All source code are property of their respective owners. Java is a trademark of Sun Microsystems, Inc and owned by ORACLE Inc. Contact coftware#gmail.com.