package org.data2semantics.exp.old;
import java.io.File;
import java.io.FileOutputStream;
import java.io.PrintWriter;
import java.util.ArrayList;
import java.util.List;
import org.data2semantics.exp.old.utils.Experimenter;
import org.data2semantics.exp.old.utils.PropertyPredictionExperiment;
import org.data2semantics.exp.old.utils.datasets.BinaryPropertyPredictionDataSetParameters;
import org.data2semantics.exp.old.utils.datasets.DataSetFactory;
import org.data2semantics.exp.old.utils.datasets.PropertyPredictionDataSet;
import org.data2semantics.exp.utils.Result;
import org.data2semantics.exp.utils.ResultsTable;
import org.data2semantics.proppred.kernels.graphkernels.IntersectionGraphPathKernel;
import org.data2semantics.proppred.kernels.graphkernels.IntersectionGraphWalkKernel;
import org.data2semantics.proppred.kernels.graphkernels.IntersectionPartialSubTreeKernel;
import org.data2semantics.proppred.kernels.graphkernels.IntersectionSubTreeKernel;
import org.data2semantics.proppred.kernels.graphkernels.WLSubTreeKernel;
import org.data2semantics.tools.rdf.RDFFileDataSet;
import org.openrdf.model.Statement;
import org.openrdf.model.URI;
import org.openrdf.rio.RDFFormat;
public class CommitteeMemberPredictionExperiment {
private final static String DATA_DIR = "C:\\eclipse\\workspace\\datasets\\";
private final static int NUMBER_OF_PROC = 6;
public static void main(String[] args) {
RDFFileDataSet testSetA = new RDFFileDataSet(DATA_DIR + "eswc-2011-complete.rdf", RDFFormat.RDFXML);
testSetA.addFile(DATA_DIR + "eswc-2010-complete.rdf", RDFFormat.RDFXML);
//testSetA.addFile(DATA_DIR + "eswc-2011-complete.rdf", RDFFormat.RDFXML);
//testSetA.addFile(DATA_DIR + "eswc-2010-complete.rdf", RDFFormat.RDFXML);
RDFFileDataSet testSetB = new RDFFileDataSet(DATA_DIR + "eswc-2012-complete.rdf", RDFFormat.RDFXML);
List<URI> instances = new ArrayList<URI>();
List<URI> instancesB = new ArrayList<URI>();
List<String> labels = new ArrayList<String>();
List<Statement> stmts = testSetA.getStatementsFromStrings(null, "http://www.w3.org/1999/02/22-rdf-syntax-ns#type", "http://xmlns.com/foaf/0.1/Person");
for (Statement stmt : stmts) {
if (stmt.getSubject() instanceof URI) {
instances.add((URI) stmt.getSubject());
}
}
int pos = 0, neg = 0;
for (URI instance : instances) {
if (!testSetB.getStatements(instance, null, null).isEmpty()) {
instancesB.add(instance);
if (testSetB.getStatementsFromStrings(instance.toString(), "http://data.semanticweb.org/ns/swc/ontology#holdsRole", "http://data.semanticweb.org/conference/eswc/2012/research-track-committee-member", false).size() > 0) {
labels.add("true");
pos++;
} else {
labels.add("false");
neg++;
}
}
}
System.out.println("Pos and Neg: " + pos + " " + neg);
List<BinaryPropertyPredictionDataSetParameters> dataSetsParams = new ArrayList<BinaryPropertyPredictionDataSetParameters>();
long[] seeds = {11,21,31,41,51,61,71,81,91,101};
double[] cs = {0.001, 0.01, 0.1, 1, 10, 100, 1000};
int maxClassSize = 50;
///*
dataSetsParams.add(new BinaryPropertyPredictionDataSetParameters(testSetA, "http://data.semanticweb.org/ns/swc/ontology#holdsRole", "http://data.semanticweb.org/ns/swc/ontology#heldBy", "http://data.semanticweb.org/conference/eswc/2012/research-track-committee-member", instancesB, 1, false, false));
dataSetsParams.add(new BinaryPropertyPredictionDataSetParameters(testSetA, "http://data.semanticweb.org/ns/swc/ontology#holdsRole", "http://data.semanticweb.org/ns/swc/ontology#heldBy", "http://data.semanticweb.org/conference/eswc/2012/research-track-committee-member", instancesB, 2, false, false));
//dataSetsParams.add(new BinaryPropertyPredictionDataSetParameters(testSetA, "http://data.semanticweb.org/ns/swc/ontology#holdsRole", "http://data.semanticweb.org/ns/swc/ontology#heldBy", "http://data.semanticweb.org/conference/eswc/2012/research-track-committee-member", instancesB, 3, false, false));
//dataSetsParams.add(new BinaryPropertyPredictionDataSetParameters(testSetA, "http://data.semanticweb.org/ns/swc/ontology#holdsRole", "http://data.semanticweb.org/ns/swc/ontology#heldBy", "http://data.semanticweb.org/conference/eswc/2012/research-track-committee-member", instancesB, 4, false, false));
dataSetsParams.add(new BinaryPropertyPredictionDataSetParameters(testSetA, "http://data.semanticweb.org/ns/swc/ontology#holdsRole", "http://data.semanticweb.org/ns/swc/ontology#heldBy", "http://data.semanticweb.org/conference/eswc/2012/research-track-committee-member", instancesB, 1, false, true));
dataSetsParams.add(new BinaryPropertyPredictionDataSetParameters(testSetA, "http://data.semanticweb.org/ns/swc/ontology#holdsRole", "http://data.semanticweb.org/ns/swc/ontology#heldBy", "http://data.semanticweb.org/conference/eswc/2012/research-track-committee-member", instancesB, 2, false, true));
//dataSetsParams.add(new BinaryPropertyPredictionDataSetParameters(testSetA, "http://data.semanticweb.org/ns/swc/ontology#holdsRole", "http://data.semanticweb.org/ns/swc/ontology#heldBy", "http://data.semanticweb.org/conference/eswc/2012/research-track-committee-member", instancesB, 3, false, true));
//*/
dataSetsParams.add(new BinaryPropertyPredictionDataSetParameters(testSetA, "http://data.semanticweb.org/ns/swc/ontology#holdsRole", "http://data.semanticweb.org/ns/swc/ontology#heldBy", "http://data.semanticweb.org/conference/eswc/2012/research-track-committee-member", "http://www.w3.org/1999/02/22-rdf-syntax-ns#type", "http://xmlns.com/foaf/0.1/Person", 1, true, false));
dataSetsParams.add(new BinaryPropertyPredictionDataSetParameters(testSetA, "http://data.semanticweb.org/ns/swc/ontology#holdsRole", "http://data.semanticweb.org/ns/swc/ontology#heldBy", "http://data.semanticweb.org/conference/eswc/2012/research-track-committee-member", "http://www.w3.org/1999/02/22-rdf-syntax-ns#type", "http://xmlns.com/foaf/0.1/Person", 2, true, false));
dataSetsParams.add(new BinaryPropertyPredictionDataSetParameters(testSetA, "http://data.semanticweb.org/ns/swc/ontology#holdsRole", "http://data.semanticweb.org/ns/swc/ontology#heldBy", "http://data.semanticweb.org/conference/eswc/2012/research-track-committee-member", "http://www.w3.org/1999/02/22-rdf-syntax-ns#type", "http://xmlns.com/foaf/0.1/Person", 1, true, true));
dataSetsParams.add(new BinaryPropertyPredictionDataSetParameters(testSetA, "http://data.semanticweb.org/ns/swc/ontology#holdsRole", "http://data.semanticweb.org/ns/swc/ontology#heldBy", "http://data.semanticweb.org/conference/eswc/2012/research-track-committee-member", "http://www.w3.org/1999/02/22-rdf-syntax-ns#type", "http://xmlns.com/foaf/0.1/Person", 2, true, true));
//*/
PropertyPredictionDataSet dataset;
PropertyPredictionExperiment exp;
ResultsTable resultsWL = new ResultsTable();
ResultsTable resultsSTF = new ResultsTable();
ResultsTable resultsSTP = new ResultsTable();
ResultsTable resultsIGW = new ResultsTable();
ResultsTable resultsIGP = new ResultsTable();
Experimenter experimenter = new Experimenter(NUMBER_OF_PROC);
Thread expT = new Thread(experimenter);
expT.setDaemon(true);
expT.start();
try {
for (BinaryPropertyPredictionDataSetParameters params : dataSetsParams) {
dataset = DataSetFactory.createPropertyPredictionDataSet(params);
dataset.removeSmallClasses(5);
dataset.setLabels(labels);
//dataset.removeVertexAndEdgeLabels();
resultsWL.newRow(dataset.getLabel() + " WLSubTreeKernel");
for (int i = 0; i < 4; i++) {
if (experimenter.hasSpace()) {
int fileId = (int) (Math.random() * 100000000);
File file = new File(DATA_DIR + fileId + "_" + "WL" + "_" + i + ".txt");
exp = new PropertyPredictionExperiment(new PropertyPredictionDataSet(dataset), new WLSubTreeKernel(i), seeds, cs, maxClassSize, new FileOutputStream(file));
experimenter.addExperiment(exp);
resultsWL.addResult(exp.getResults().getAccuracy());
resultsWL.addResult(exp.getResults().getF1());
System.out.println("Running WL, it " + i + " on " + dataset.getLabel());
}
}
resultsSTF.newRow(dataset.getLabel() + " IntersectionFullSubTree");
for (int i = 0; i < 3; i++) {
if (experimenter.hasSpace()) {
int fileId = (int) (Math.random() * 100000000);
File file = new File(DATA_DIR + fileId + "_" + "IntersectionFullSubTree" + "_" + i + ".txt");
exp = new PropertyPredictionExperiment(new PropertyPredictionDataSet(dataset), new IntersectionSubTreeKernel(i, 1), seeds, cs, maxClassSize, new FileOutputStream(file));
experimenter.addExperiment(exp);
resultsSTF.addResult(exp.getResults().getAccuracy());
resultsSTF.addResult(exp.getResults().getF1());
System.out.println("Running STF, it " + i + " on " + dataset.getLabel());
}
}
resultsSTP.newRow(dataset.getLabel() + " IntersectionPartialSubTree");
for (int i = 0; i < 3; i++) {
if (experimenter.hasSpace()) {
int fileId = (int) (Math.random() * 100000000);
File file = new File(DATA_DIR + fileId + "_" + "IntersectionPartialSubTree" + "_" + i + ".txt");
exp = new PropertyPredictionExperiment(new PropertyPredictionDataSet(dataset), new IntersectionPartialSubTreeKernel(i, 0.01), seeds, cs, maxClassSize, new FileOutputStream(file));
experimenter.addExperiment(exp);
resultsSTP.addResult(exp.getResults().getAccuracy());
resultsSTP.addResult(exp.getResults().getF1());
System.out.println("Running STP, it " + i + " on " + dataset.getLabel());
}
}
resultsIGP.newRow(dataset.getLabel() + " IntersectionGraphPath");
for (int i = 1; i < 3; i++) {
if (experimenter.hasSpace()) {
int fileId = (int) (Math.random() * 100000000);
File file = new File(DATA_DIR + fileId + "_" + "IntersectionGraphPath" + "_" + i + ".txt");
exp = new PropertyPredictionExperiment(new PropertyPredictionDataSet(dataset), new IntersectionGraphPathKernel(i, 1), seeds, cs, maxClassSize, new FileOutputStream(file));
experimenter.addExperiment(exp);
resultsIGP.addResult(exp.getResults().getAccuracy());
resultsIGP.addResult(exp.getResults().getF1());
System.out.println("Running IGP, it " + i + " on " + dataset.getLabel());
}
}
resultsIGW.newRow(dataset.getLabel() + " IntersectionGraphWalk");
for (int i = 1; i < 3; i++) {
if (experimenter.hasSpace()) {
int fileId = (int) (Math.random() * 100000000);
File file = new File(DATA_DIR + fileId + "_" + "IntersectionGraphWalk" + "_" + i + ".txt");
exp = new PropertyPredictionExperiment(new PropertyPredictionDataSet(dataset), new IntersectionGraphWalkKernel(i, 1), seeds, cs, maxClassSize, new FileOutputStream(file));
experimenter.addExperiment(exp);
resultsIGW.addResult(exp.getResults().getAccuracy());
resultsIGW.addResult(exp.getResults().getF1());
System.out.println("Running IGW, it " + i + " on " + dataset.getLabel());
}
}
//*/
}
} catch (Exception e) {
e.printStackTrace();
}
experimenter.stop();
while (expT.isAlive()) {
try {
Thread.sleep(1000);
} catch (Exception e) {
e.printStackTrace();
}
}
try {
int fileId = (int) (Math.random() * 100000000);
File file = new File(DATA_DIR + fileId + "_" + "all_results" + ".txt");
PrintWriter fileOut = new PrintWriter(new FileOutputStream(file));
List<Result> bestResults = new ArrayList<Result>();
bestResults = resultsWL.getBestResults(bestResults);
bestResults = resultsSTF.getBestResults(bestResults);
bestResults = resultsSTP.getBestResults(bestResults);
bestResults = resultsIGW.getBestResults(bestResults);
bestResults = resultsIGP.getBestResults(bestResults);
resultsWL.addCompResults(bestResults);
resultsSTF.addCompResults(bestResults);
resultsSTP.addCompResults(bestResults);
resultsIGW.addCompResults(bestResults);
resultsIGP.addCompResults(bestResults);
fileOut.println(resultsWL);
fileOut.println(resultsSTF);
fileOut.println(resultsSTP);
fileOut.println(resultsIGW);
fileOut.println(resultsIGP);
fileOut.println(resultsWL.allScoresToString());
fileOut.println(resultsSTF.allScoresToString());
fileOut.println(resultsSTP.allScoresToString());
fileOut.println(resultsIGW.allScoresToString());
fileOut.println(resultsIGP.allScoresToString());
System.out.println(resultsWL);
System.out.println(resultsSTF);
System.out.println(resultsSTP);
System.out.println(resultsIGW);
System.out.println(resultsIGP);
System.out.println(resultsWL.allScoresToString());
System.out.println(resultsSTF.allScoresToString());
System.out.println(resultsSTP.allScoresToString());
System.out.println(resultsIGW.allScoresToString());
System.out.println(resultsIGP.allScoresToString());
} catch (Exception e) {
e.printStackTrace();
}
}
}