[DL-Learner SVN] SF.net SVN: dl-learner: [370] trunk

SourceForge Headquarters 225 Broadway Suite 1600 San Diego, CA 92101 +1 (858) 422-6466

Revision: 370
          http://dl-learner.svn.sourceforge.net/dl-learner/?rev=370&view=rev
Author:   jenslehmann
Date:     2008-01-14 03:54:55 -0800 (Mon, 14 Jan 2008)

Log Message:
-----------
- continued merge of SPARQL components
- added example for SPARQL queries using Jena in org.dllearner.kb.sparql.SparqlQuery
- updated and added Jena libraries

@developers: Please update your classpath by adding the new jars in lib!

Modified Paths:
--------------
    trunk/lib/jena/iri.jar
    trunk/lib/jena/jena.jar
    trunk/src/dl-learner/org/dllearner/cli/Start.java
    trunk/src/dl-learner/org/dllearner/server/ClientState.java
    trunk/src/dl-learner/org/dllearner/server/DLLearnerWS.java

Added Paths:
-----------
    trunk/lib/jena/arq.jar
    trunk/lib/jena/commons-logging-1.1.jar
    trunk/src/dl-learner/org/dllearner/kb/sparql/SparqlEndpoint.java
    trunk/src/dl-learner/org/dllearner/kb/sparql/SparqlQuery.java

Removed Paths:
-------------
    trunk/lib/jena/commons-logging.jar
    trunk/src/dl-learner/org/dllearner/kb/SparqlEndpoint.java

Added: trunk/lib/jena/arq.jar
===================================================================
(Binary files differ)


Property changes on: trunk/lib/jena/arq.jar
___________________________________________________________________
Name: svn:mime-type
   + application/octet-stream

Added: trunk/lib/jena/commons-logging-1.1.jar
===================================================================
(Binary files differ)


Property changes on: trunk/lib/jena/commons-logging-1.1.jar
___________________________________________________________________
Name: svn:mime-type
   + application/octet-stream

Deleted: trunk/lib/jena/commons-logging.jar
===================================================================
(Binary files differ)

Modified: trunk/lib/jena/iri.jar
===================================================================
(Binary files differ)

Modified: trunk/lib/jena/jena.jar
===================================================================
(Binary files differ)

Modified: trunk/src/dl-learner/org/dllearner/cli/Start.java
===================================================================

--- trunk/src/dl-learner/org/dllearner/cli/Start.java	2008-01-14 08:56:17 UTC (rev 369)
+++ trunk/src/dl-learner/org/dllearner/cli/Start.java	2008-01-14 11:54:55 UTC (rev 370)
@@ -60,7 +60,7 @@
 import org.dllearner.core.dl.Individual;
 import org.dllearner.kb.KBFile;
 import org.dllearner.kb.OWLFile;
-import org.dllearner.kb.SparqlEndpoint;
+import org.dllearner.kb.sparql.SparqlEndpoint;
 import org.dllearner.learningproblems.PosNegDefinitionLP;
 import org.dllearner.learningproblems.PosNegInclusionLP;
 import org.dllearner.learningproblems.PosOnlyDefinitionLP;

Deleted: trunk/src/dl-learner/org/dllearner/kb/SparqlEndpoint.java
===================================================================
--- trunk/src/dl-learner/org/dllearner/kb/SparqlEndpoint.java	2008-01-14 08:56:17 UTC (rev 369)
+++ trunk/src/dl-learner/org/dllearner/kb/SparqlEndpoint.java	2008-01-14 11:54:55 UTC (rev 370)
@@ -1,510 +0,0 @@
-/**
- * Copyright (C) 2007, Jens Lehmann
- *
- * This file is part of DL-Learner.
- * 
- * DL-Learner is free software; you can redistribute it and/or modify
- * it under the terms of the GNU General Public License as published by
- * the Free Software Foundation; either version 3 of the License, or
- * (at your option) any later version.
- *
- * DL-Learner is distributed in the hope that it will be useful,
- * but WITHOUT ANY WARRANTY; without even the implied warranty of
- * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
- * GNU General Public License for more details.
- *
- * You should have received a copy of the GNU General Public License
- * along with this program.  If not, see <http://www.gnu.org/licenses/>.
- *
- */
-package org.dllearner.kb;
-
-import java.io.File;
-import java.io.FileWriter;
-import java.io.IOException;
-import java.net.MalformedURLException;
-import java.net.URI;
-import java.net.URL;
-import java.util.Collection;
-import java.util.HashMap;
-import java.util.HashSet;
-import java.util.LinkedList;
-import java.util.Set;
-
-import org.dllearner.core.KnowledgeSource;
-import org.dllearner.core.OntologyFormat;
-import org.dllearner.core.OntologyFormatUnsupportedException;
-import org.dllearner.core.config.BooleanConfigOption;
-import org.dllearner.core.config.ConfigEntry;
-import org.dllearner.core.config.ConfigOption;
-import org.dllearner.core.config.IntegerConfigOption;
-import org.dllearner.core.config.InvalidConfigOptionValueException;
-import org.dllearner.core.config.StringConfigOption;
-import org.dllearner.core.config.StringSetConfigOption;
-import org.dllearner.core.config.StringTupleListConfigOption;
-import org.dllearner.core.dl.KB;
-import org.dllearner.kb.sparql.Manager;
-import org.dllearner.kb.sparql.Manipulator;
-import org.dllearner.kb.sparql.PredefinedEndpoint;
-import org.dllearner.kb.sparql.PredefinedFilter;
-import org.dllearner.kb.sparql.SparqlOntologyCollector;
-import org.dllearner.kb.sparql.SparqlQueryType;
-import org.dllearner.kb.sparql.SpecificSparqlEndpoint;
-import org.dllearner.parser.KBParser;
-import org.dllearner.reasoning.DIGConverter;
-import org.dllearner.reasoning.JenaOWLDIGConverter;
-import org.dllearner.utilities.StringTuple;
-
-/**
- * Represents a SPARQL Endpoint.
- * 
- * @author Jens Lehmann
- * @author Sebastian Knappe
- * @author Sebastian Hellmann
- */
-public class SparqlEndpoint extends KnowledgeSource {
-
-	// ConfigOptions
-	private URL url;
-	String host;
-	private Set<String> instances=new HashSet<String>();;
-	private URL dumpFile;
-	private int recursionDepth = 1;
-	private int predefinedFilter = 0;
-	private int predefinedEndpoint = 0;
-	private Set<String> predList=new HashSet<String>();
-	private Set<String> objList=new HashSet<String>();
-	// private Set<String> classList;
-	private String format = "N-TRIPLES";
-	private boolean dumpToFile = true;
-	private boolean useLits = false;
-	private boolean getAllSuperClasses = true;
-	private boolean closeAfterRecursion = true;
-	private int breakSuperClassRetrievalAfter = 200;
-
-	private boolean learnDomain = false;
-	private boolean learnRange = false;
-	private int numberOfInstancesUsedForRoleLearning=40;
-	private String role="";
-	private String blankNodeIdentifier = "bnode";
-	
-	LinkedList<StringTuple> URIParameters = new LinkedList<StringTuple>();
-	LinkedList<StringTuple> replacePredicate = new LinkedList<StringTuple>();
-	LinkedList<StringTuple> replaceObject = new LinkedList<StringTuple>();
-
-	/**
-	 * Holds the results of the calculateSubjects method
-	 */
-	private String[] subjects;
-
-	/**
-	 * Holds the results of the calculateTriples method
-	 */
-	private String[] triples;
-
-	/**
-	 * Holds the results of the calculateConceptSubjects method
-	 */
-	private String[] conceptSubjects;
-
-	/**
-	 * if a method is running this becomes true
-	 */
-	private boolean subjectThreadRunning = false;
-
-	private boolean triplesThreadRunning = false;
-
-	private boolean conceptThreadRunning = false;
-
-	/**
-	 * the Thread that is running a method
-	 */
-	private Thread subjectThread;
-
-	private Thread triplesThread;
-
-	private Thread conceptThread;
-
-	// received ontology as array, used if format=Array(an element of the
-	// array consists of the subject, predicate and object separated by '<'
-	private String[] ontArray;
-
-	// received ontology as KB, the internal format
-	private KB kb;
-
-	public static String getName() {
-		return "SPARQL Endpoint Restructured";
-	}
-
-	/**
-	 * sets the ConfigOptions for this KnowledgeSource
-	 * 
-	 * @return
-	 */
-	public static Collection<ConfigOption<?>> createConfigOptions() {
-		Collection<ConfigOption<?>> options = new LinkedList<ConfigOption<?>>();
-		options.add(new StringConfigOption("url", "URL of SPARQL Endpoint"));
-		options.add(new StringConfigOption("host", "host of SPARQL Endpoint"));
-		options.add(new StringSetConfigOption("instances",
-				"relevant instances e.g. positive and negative examples in a learning problem"));
-		options.add(new IntegerConfigOption("recursionDepth",
-				"recursion depth of KB fragment selection", 2));
-		options.add(new IntegerConfigOption("predefinedFilter", "the mode of the SPARQL Filter"));
-		options.add(new IntegerConfigOption("predefinedEndpoint", "the mode of the SPARQL Filter"));
-
-		options.add(new StringSetConfigOption("predList", "list of all ignored roles"));
-		options.add(new StringSetConfigOption("objList", "list of all ignored objects"));
-		options.add(new StringSetConfigOption("classList", "list of all ignored classes"));
-		options.add(new StringConfigOption("format", "N-TRIPLES or KB format", "N-TRIPLES"));
-		options.add(new BooleanConfigOption("dumpToFile",
-				"Specifies whether the extracted ontology is written to a file or not.", true));
-		options.add(new BooleanConfigOption("useLits", "use Literals in SPARQL query"));
-		options.add(new BooleanConfigOption("getAllSuperClasses", "If true then all superclasses are retrieved until the most general class (owl:Thing) is reached.", true));
-
-		options.add(new BooleanConfigOption("learnDomain", "learns the Domain for a Role"));
-		options.add(new BooleanConfigOption("learnRange", "learns the Range for a Role"));
-		options.add(new StringConfigOption("role", "role to learn Domain/Range from"));
-		options.add(new StringConfigOption("blankNodeIdentifier",
-				"used to identify blanknodes in Tripels"));
-
-		options.add(new StringTupleListConfigOption("example", "example"));
-		options.add(new StringTupleListConfigOption("replacePredicate", "rule for replacing predicates"));
-		options.add(new StringTupleListConfigOption("replaceObject", "rule for replacing predicates"));
-		options.add(new IntegerConfigOption("breakSuperClassRetrievalAfter", "stops a cyclic hierarchy after specified number of classes"));
-		options.add(new IntegerConfigOption("numberOfInstancesUsedForRoleLearning", ""));
-		options.add(new BooleanConfigOption("closeAfterRecursion", "gets all classes for all instances"));
-		
-		
-		
-		return options;
-	}
-
-	/*
-	 * @see org.dllearner.core.Component#applyConfigEntry(org.dllearner.core.ConfigEntry)
-	 */
-	@Override
-	@SuppressWarnings( { "unchecked" })
-	public <T> void applyConfigEntry(ConfigEntry<T> entry) throws InvalidConfigOptionValueException {
-		String option = entry.getOptionName();
-		if (option.equals("url")) {
-			String s = (String) entry.getValue();
-			try {
-				url = new URL(s);
-			} catch (MalformedURLException e) {
-				throw new InvalidConfigOptionValueException(entry.getOption(), entry.getValue(),
-						"malformed URL " + s);
-			}
-		} else if (option.equals("host")) {
-			host = (String) entry.getValue();
-		} else if (option.equals("instances")) {
-			instances = (Set<String>) entry.getValue();
-		} else if (option.equals("recursionDepth")) {
-			recursionDepth = (Integer) entry.getValue();
-		} else if (option.equals("predList")) {
-			predList = (Set<String>) entry.getValue();
-		} else if (option.equals("objList")) {
-			objList = (Set<String>) entry.getValue();
-		//} else if (option.equals("classList")) {
-		//	classList = (Set<String>) entry.getValue();
-		} else if (option.equals("predefinedEndpoint")) {
-			predefinedEndpoint = (Integer) entry.getValue();
-		} else if (option.equals("predefinedFilter")) {
-			predefinedFilter = (Integer) entry.getValue();
-		} else if (option.equals("format")) {
-			format = (String) entry.getValue();
-		} else if (option.equals("dumpToFile")) {
-			dumpToFile = (Boolean) entry.getValue();
-		} else if (option.equals("useLits")) {
-			useLits = (Boolean) entry.getValue();
-		} else if (option.equals("getAllSuperClasses")) {
-			getAllSuperClasses = (Boolean) entry.getValue();
-		} else if (option.equals("learnDomain")) {
-			learnDomain = (Boolean) entry.getValue();
-		}else if (option.equals("learnRange")) {
-			learnRange = (Boolean) entry.getValue();
-		} else if (option.equals("role")) {
-			role = (String) entry.getValue();
-		} else if (option.equals("blankNodeIdentifier")) {
-			blankNodeIdentifier = (String) entry.getValue();
-		} else if (option.equals("example")) {
-			//System.out.println(entry.getValue());
-		}else if (option.equals("replacePredicate")) {
-			replacePredicate = (LinkedList)entry.getValue();
-		}else if (option.equals("replaceObject")) {
-			replaceObject = (LinkedList)entry.getValue();
-		}else if (option.equals("breakSuperClassRetrievalAfter")) {
-			breakSuperClassRetrievalAfter = (Integer) entry.getValue();
-		}else if (option.equals("numberOfInstancesUsedForRoleLearning")) {
-			numberOfInstancesUsedForRoleLearning = (Integer) entry.getValue();
-		}else if (option.equals("closeAfterRecursion")) {
-			closeAfterRecursion = (Boolean) entry.getValue();
-		} 
-		
-	}
-
-	/*
-	 * (non-Javadoc)
-	 * 
-	 * @see org.dllearner.core.Component#init()
-	 */
-	@Override
-	public void init() {
-		System.out.println("SparqlModul: Collecting Ontology");
-		// SparqlOntologyCollector oc=
-		// new SparqlOntologyCollector(Datastructures.setToArray(instances),
-		// numberOfRecursions, filterMode,
-		// Datastructures.setToArray(predList),Datastructures.setToArray(
-		// objList),Datastructures.setToArray(classList),format,url,useLits);
-		Manager m = new Manager();
-		SpecificSparqlEndpoint sse = null;
-		SparqlQueryType sqt = null;
-		// get Options for Manipulator
-		Manipulator man = new Manipulator(blankNodeIdentifier,breakSuperClassRetrievalAfter,replacePredicate,replaceObject);
-		HashMap<String, String> parameters = new HashMap<String, String>();
-		parameters.put("default-graph-uri", "http://dbpedia.org");
-		parameters.put("format", "application/sparql-results.xml");
-
-		// get Options for endpoints
-		if (predefinedEndpoint >= 1) {
-			sse = PredefinedEndpoint.getEndpoint(predefinedEndpoint);
-		} else {
-			sse = new SpecificSparqlEndpoint(url, host, parameters);
-		}
-
-		// get Options for Filters
-		
-		if (predefinedFilter >= 1) {
-			sqt = PredefinedFilter.getFilter(predefinedFilter);
-
-		} else {
-			sqt = new SparqlQueryType("forbid", objList, predList, useLits + "");
-			
-		}
-		// give everything to the manager
-		m.useConfiguration(sqt, sse, man, recursionDepth, getAllSuperClasses,closeAfterRecursion);
-		try {
-			String ont = "";
-			//System.out.println(learnDomain);
-			// used to learn a domain of a role
-			if (learnDomain || learnRange) {
-				Set<String> pos=new HashSet<String>();
-				Set<String> neg=new HashSet<String>();
-				if(learnDomain){
-					pos = m.getDomainInstancesForRole(role);
-					neg = m.getRangeInstancesForRole(role);
-				}else if(learnRange){
-					neg = m.getDomainInstancesForRole(role);
-					pos = m.getRangeInstancesForRole(role);
-				}
-				//choose 30
-				
-				
-					Set<String> tmp=new HashSet<String>();
-					for(String one:pos){
-						tmp.add(one);
-						if(tmp.size()>=numberOfInstancesUsedForRoleLearning)break;
-					}
-					pos=tmp;
-					System.out.println("Instances used: "+pos.size());
-					
-					tmp=new HashSet<String>();
-					for(String one:neg){
-						tmp.add(one);
-						if(tmp.size()>=numberOfInstancesUsedForRoleLearning)break;
-					}
-					neg=tmp;
-					
-					instances=new HashSet<String>();
-					instances.addAll(pos);
-					
-					instances.addAll(neg);
-					
-					for(String one:pos){
-						System.out.println("+\""+one+"\"");
-					}
-					for(String one:neg){
-						System.out.println("-\""+one+"\"");
-					}
-				
-				/*Random r= new Random();
-				
-				
-				Object[] arr=instances.toArray();
-					while(instances.size()>=30){
-					
-					}*/
-				// add the role to the filter(a solution is always EXISTS
-				// role.TOP)
-				m.addPredicateFilter(role);
-				//System.out.println(instances);
-				// THIS is a workaround 
-				
-			}
-			// the actual extraction is started here
-			ont = m.extract(instances);
-			System.out.println("Number of cached SPARQL queries: "+m.getConfiguration().numberOfCachedSparqlQueries);
-			System.out.println("Number of uncached SPARQL queries: "+m.getConfiguration().numberOfUncachedSparqlQueries);
-			
-			System.out.println("Finished collecting Fragment");
-
-			if (dumpToFile) {
-				String filename = System.currentTimeMillis() + ".nt";
-				String basedir = "cache" + File.separator;
-				try {
-					if (!new File(basedir).exists())
-						new File(basedir).mkdir();
-
-					FileWriter fw = new FileWriter(new File(basedir + filename), true);
-					fw.write(ont);
-					fw.flush();
-					fw.close();
-
-					dumpFile = (new File(basedir + filename)).toURI().toURL();
-				} catch (Exception e) {
-					e.printStackTrace();
-				}
-			}
-			if (format.equals("KB")) {
-				try {
-					//kb = KBParser.parseKBFile(new StringReader(ont));
-					kb=KBParser.parseKBFile(dumpFile);
-				} catch (Exception e) {
-					e.printStackTrace();
-				}
-			}
-		} catch (Exception e) {
-			e.printStackTrace();
-		}
-		System.out.println("SparqlModul: ****Finished");
-	}
-
-	/*
-	 * (non-Javadoc)
-	 * 
-	 * @see org.dllearner.core.KnowledgeSource#toDIG()
-	 */
-	@Override
-	public String toDIG(URI kbURI) {
-		if (format.equals("N-TRIPLES"))
-			return JenaOWLDIGConverter.getTellsString(dumpFile, OntologyFormat.N_TRIPLES, kbURI);
-		else
-			return DIGConverter.getDIGString(kb, kbURI).toString();
-	}
-
-	/*
-	 * (non-Javadoc)
-	 * 
-	 * @see org.dllearner.core.KnowledgeSource#export(java.io.File,
-	 *      org.dllearner.core.OntologyFormat)
-	 */
-	@Override
-	public void export(File file, OntologyFormat format) throws OntologyFormatUnsupportedException {
-		// currently no export functions implemented, so we just throw an
-		// exception
-		throw new OntologyFormatUnsupportedException("export", format);
-	}
-
-	public URL getURL() {
-		return url;
-	}
-
-	public String[] getOntArray() {
-		return ontArray;
-	}
-
-	public void calculateSubjects(String label, int limit) {
-		System.out.println("SparqlModul: Collecting Subjects");
-		SparqlOntologyCollector oc = new SparqlOntologyCollector(url);
-		try {
-			subjects = oc.getSubjectsFromLabel(label, limit);
-		} catch (IOException e) {
-			subjects = new String[1];
-			subjects[0] = "[Error]Sparql Endpoint could not be reached.";
-		}
-		System.out.println("SparqlModul: ****Finished");
-	}
-
-	public void calculateTriples(String subject) {
-		System.out.println("SparqlModul: Collecting Triples");
-		SparqlOntologyCollector oc = new SparqlOntologyCollector(url);
-		try {
-			triples = oc.collectTriples(subject);
-		} catch (IOException e) {
-			triples = new String[1];
-			triples[0] = "[Error]Sparql Endpoint could not be reached.";
-		}
-		System.out.println("SparqlModul: ****Finished");
-	}
-
-	public void calculateConceptSubjects(String concept) {
-		System.out.println("SparqlModul: Collecting Subjects");
-		SparqlOntologyCollector oc = new SparqlOntologyCollector(url);
-		try {
-			conceptSubjects = oc.getSubjectsFromConcept(concept);
-		} catch (IOException e) {
-			conceptSubjects = new String[1];
-			conceptSubjects[0] = "[Error]Sparql Endpoint could not be reached.";
-		}
-		System.out.println("SparqlModul: ****Finished");
-	}
-
-	public boolean subjectThreadIsRunning() {
-		return subjectThreadRunning;
-	}
-
-	public void setSubjectThreadRunning(boolean bool) {
-		subjectThreadRunning = bool;
-	}
-
-	public boolean triplesThreadIsRunning() {
-		return triplesThreadRunning;
-	}
-
-	public void setTriplesThreadRunning(boolean bool) {
-		triplesThreadRunning = bool;
-	}
-
-	public boolean conceptThreadIsRunning() {
-		return conceptThreadRunning;
-	}
-
-	public void setConceptThreadRunning(boolean bool) {
-		conceptThreadRunning = bool;
-	}
-
-	public String[] getSubjects() {
-		return subjects;
-	}
-
-	public Thread getSubjectThread() {
-		return subjectThread;
-	}
-
-	public void setSubjectThread(Thread subjectThread) {
-		this.subjectThread = subjectThread;
-	}
-
-	public Thread getTriplesThread() {
-		return triplesThread;
-	}
-
-	public void setTriplesThread(Thread triplesThread) {
-		this.triplesThread = triplesThread;
-	}
-
-	public Thread getConceptThread() {
-		return conceptThread;
-	}
-
-	public void setConceptThread(Thread conceptThread) {
-		this.conceptThread = conceptThread;
-	}
-
-	public String[] getTriples() {
-		return triples;
-	}
-
-	public String[] getConceptSubjects() {
-		return conceptSubjects;
-	}
-}

Copied: trunk/src/dl-learner/org/dllearner/kb/sparql/SparqlEndpoint.java (from rev 369, trunk/src/dl-learner/org/dllearner/kb/SparqlEndpoint.java)
===================================================================
--- trunk/src/dl-learner/org/dllearner/kb/sparql/SparqlEndpoint.java	                        (rev 0)
+++ trunk/src/dl-learner/org/dllearner/kb/sparql/SparqlEndpoint.java	2008-01-14 11:54:55 UTC (rev 370)
@@ -0,0 +1,503 @@
+/**
+ * Copyright (C) 2007, Jens Lehmann
+ *
+ * This file is part of DL-Learner.
+ * 
+ * DL-Learner is free software; you can redistribute it and/or modify
+ * it under the terms of the GNU General Public License as published by
+ * the Free Software Foundation; either version 3 of the License, or
+ * (at your option) any later version.
+ *
+ * DL-Learner is distributed in the hope that it will be useful,
+ * but WITHOUT ANY WARRANTY; without even the implied warranty of
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ * GNU General Public License for more details.
+ *
+ * You should have received a copy of the GNU General Public License
+ * along with this program.  If not, see <http://www.gnu.org/licenses/>.
+ *
+ */
+package org.dllearner.kb.sparql;
+
+import java.io.File;
+import java.io.FileWriter;
+import java.io.IOException;
+import java.net.MalformedURLException;
+import java.net.URI;
+import java.net.URL;
+import java.util.Collection;
+import java.util.HashMap;
+import java.util.HashSet;
+import java.util.LinkedList;
+import java.util.Set;
+
+import org.dllearner.core.KnowledgeSource;
+import org.dllearner.core.OntologyFormat;
+import org.dllearner.core.OntologyFormatUnsupportedException;
+import org.dllearner.core.config.BooleanConfigOption;
+import org.dllearner.core.config.ConfigEntry;
+import org.dllearner.core.config.ConfigOption;
+import org.dllearner.core.config.IntegerConfigOption;
+import org.dllearner.core.config.InvalidConfigOptionValueException;
+import org.dllearner.core.config.StringConfigOption;
+import org.dllearner.core.config.StringSetConfigOption;
+import org.dllearner.core.config.StringTupleListConfigOption;
+import org.dllearner.core.dl.KB;
+import org.dllearner.parser.KBParser;
+import org.dllearner.reasoning.DIGConverter;
+import org.dllearner.reasoning.JenaOWLDIGConverter;
+import org.dllearner.utilities.StringTuple;
+
+/**
+ * Represents a SPARQL Endpoint.
+ * 
+ * @author Jens Lehmann
+ * @author Sebastian Knappe
+ * @author Sebastian Hellmann
+ */
+public class SparqlEndpoint extends KnowledgeSource {
+
+	// ConfigOptions
+	private URL url;
+	String host;
+	private Set<String> instances=new HashSet<String>();;
+	private URL dumpFile;
+	private int recursionDepth = 1;
+	private int predefinedFilter = 0;
+	private int predefinedEndpoint = 0;
+	private Set<String> predList=new HashSet<String>();
+	private Set<String> objList=new HashSet<String>();
+	// private Set<String> classList;
+	private String format = "N-TRIPLES";
+	private boolean dumpToFile = true;
+	private boolean useLits = false;
+	private boolean getAllSuperClasses = true;
+	private boolean closeAfterRecursion = true;
+	private int breakSuperClassRetrievalAfter = 200;
+
+	private boolean learnDomain = false;
+	private boolean learnRange = false;
+	private int numberOfInstancesUsedForRoleLearning=40;
+	private String role="";
+	private String blankNodeIdentifier = "bnode";
+	
+	LinkedList<StringTuple> URIParameters = new LinkedList<StringTuple>();
+	LinkedList<StringTuple> replacePredicate = new LinkedList<StringTuple>();
+	LinkedList<StringTuple> replaceObject = new LinkedList<StringTuple>();
+
+	/**
+	 * Holds the results of the calculateSubjects method
+	 */
+	private String[] subjects;
+
+	/**
+	 * Holds the results of the calculateTriples method
+	 */
+	private String[] triples;
+
+	/**
+	 * Holds the results of the calculateConceptSubjects method
+	 */
+	private String[] conceptSubjects;
+
+	/**
+	 * if a method is running this becomes true
+	 */
+	private boolean subjectThreadRunning = false;
+
+	private boolean triplesThreadRunning = false;
+
+	private boolean conceptThreadRunning = false;
+
+	/**
+	 * the Thread that is running a method
+	 */
+	private Thread subjectThread;
+
+	private Thread triplesThread;
+
+	private Thread conceptThread;
+
+	// received ontology as array, used if format=Array(an element of the
+	// array consists of the subject, predicate and object separated by '<'
+	private String[] ontArray;
+
+	// received ontology as KB, the internal format
+	private KB kb;
+
+	public static String getName() {
+		return "SPARQL Endpoint Restructured";
+	}
+
+	/**
+	 * sets the ConfigOptions for this KnowledgeSource
+	 * 
+	 * @return
+	 */
+	public static Collection<ConfigOption<?>> createConfigOptions() {
+		Collection<ConfigOption<?>> options = new LinkedList<ConfigOption<?>>();
+		options.add(new StringConfigOption("url", "URL of SPARQL Endpoint"));
+		options.add(new StringConfigOption("host", "host of SPARQL Endpoint"));
+		options.add(new StringSetConfigOption("instances",
+				"relevant instances e.g. positive and negative examples in a learning problem"));
+		options.add(new IntegerConfigOption("recursionDepth",
+				"recursion depth of KB fragment selection", 2));
+		options.add(new IntegerConfigOption("predefinedFilter", "the mode of the SPARQL Filter"));
+		options.add(new IntegerConfigOption("predefinedEndpoint", "the mode of the SPARQL Filter"));
+
+		options.add(new StringSetConfigOption("predList", "list of all ignored roles"));
+		options.add(new StringSetConfigOption("objList", "list of all ignored objects"));
+		options.add(new StringSetConfigOption("classList", "list of all ignored classes"));
+		options.add(new StringConfigOption("format", "N-TRIPLES or KB format", "N-TRIPLES"));
+		options.add(new BooleanConfigOption("dumpToFile",
+				"Specifies whether the extracted ontology is written to a file or not.", true));
+		options.add(new BooleanConfigOption("useLits", "use Literals in SPARQL query"));
+		options.add(new BooleanConfigOption("getAllSuperClasses", "If true then all superclasses are retrieved until the most general class (owl:Thing) is reached.", true));
+
+		options.add(new BooleanConfigOption("learnDomain", "learns the Domain for a Role"));
+		options.add(new BooleanConfigOption("learnRange", "learns the Range for a Role"));
+		options.add(new StringConfigOption("role", "role to learn Domain/Range from"));
+		options.add(new StringConfigOption("blankNodeIdentifier",
+				"used to identify blanknodes in Tripels"));
+
+		options.add(new StringTupleListConfigOption("example", "example"));
+		options.add(new StringTupleListConfigOption("replacePredicate", "rule for replacing predicates"));
+		options.add(new StringTupleListConfigOption("replaceObject", "rule for replacing predicates"));
+		options.add(new IntegerConfigOption("breakSuperClassRetrievalAfter", "stops a cyclic hierarchy after specified number of classes"));
+		options.add(new IntegerConfigOption("numberOfInstancesUsedForRoleLearning", ""));
+		options.add(new BooleanConfigOption("closeAfterRecursion", "gets all classes for all instances"));
+		
+		
+		
+		return options;
+	}
+
+	/*
+	 * @see org.dllearner.core.Component#applyConfigEntry(org.dllearner.core.ConfigEntry)
+	 */
+	@Override
+	@SuppressWarnings( { "unchecked" })
+	public <T> void applyConfigEntry(ConfigEntry<T> entry) throws InvalidConfigOptionValueException {
+		String option = entry.getOptionName();
+		if (option.equals("url")) {
+			String s = (String) entry.getValue();
+			try {
+				url = new URL(s);
+			} catch (MalformedURLException e) {
+				throw new InvalidConfigOptionValueException(entry.getOption(), entry.getValue(),
+						"malformed URL " + s);
+			}
+		} else if (option.equals("host")) {
+			host = (String) entry.getValue();
+		} else if (option.equals("instances")) {
+			instances = (Set<String>) entry.getValue();
+		} else if (option.equals("recursionDepth")) {
+			recursionDepth = (Integer) entry.getValue();
+		} else if (option.equals("predList")) {
+			predList = (Set<String>) entry.getValue();
+		} else if (option.equals("objList")) {
+			objList = (Set<String>) entry.getValue();
+		//} else if (option.equals("classList")) {
+		//	classList = (Set<String>) entry.getValue();
+		} else if (option.equals("predefinedEndpoint")) {
+			predefinedEndpoint = (Integer) entry.getValue();
+		} else if (option.equals("predefinedFilter")) {
+			predefinedFilter = (Integer) entry.getValue();
+		} else if (option.equals("format")) {
+			format = (String) entry.getValue();
+		} else if (option.equals("dumpToFile")) {
+			dumpToFile = (Boolean) entry.getValue();
+		} else if (option.equals("useLits")) {
+			useLits = (Boolean) entry.getValue();
+		} else if (option.equals("getAllSuperClasses")) {
+			getAllSuperClasses = (Boolean) entry.getValue();
+		} else if (option.equals("learnDomain")) {
+			learnDomain = (Boolean) entry.getValue();
+		}else if (option.equals("learnRange")) {
+			learnRange = (Boolean) entry.getValue();
+		} else if (option.equals("role")) {
+			role = (String) entry.getValue();
+		} else if (option.equals("blankNodeIdentifier")) {
+			blankNodeIdentifier = (String) entry.getValue();
+		} else if (option.equals("example")) {
+			//System.out.println(entry.getValue());
+		}else if (option.equals("replacePredicate")) {
+			replacePredicate = (LinkedList)entry.getValue();
+		}else if (option.equals("replaceObject")) {
+			replaceObject = (LinkedList)entry.getValue();
+		}else if (option.equals("breakSuperClassRetrievalAfter")) {
+			breakSuperClassRetrievalAfter = (Integer) entry.getValue();
+		}else if (option.equals("numberOfInstancesUsedForRoleLearning")) {
+			numberOfInstancesUsedForRoleLearning = (Integer) entry.getValue();
+		}else if (option.equals("closeAfterRecursion")) {
+			closeAfterRecursion = (Boolean) entry.getValue();
+		} 
+		
+	}
+
+	/*
+	 * (non-Javadoc)
+	 * 
+	 * @see org.dllearner.core.Component#init()
+	 */
+	@Override
+	public void init() {
+		System.out.println("SparqlModul: Collecting Ontology");
+		// SparqlOntologyCollector oc=
+		// new SparqlOntologyCollector(Datastructures.setToArray(instances),
+		// numberOfRecursions, filterMode,
+		// Datastructures.setToArray(predList),Datastructures.setToArray(
+		// objList),Datastructures.setToArray(classList),format,url,useLits);
+		Manager m = new Manager();
+		SpecificSparqlEndpoint sse = null;
+		SparqlQueryType sqt = null;
+		// get Options for Manipulator
+		Manipulator man = new Manipulator(blankNodeIdentifier,breakSuperClassRetrievalAfter,replacePredicate,replaceObject);
+		HashMap<String, String> parameters = new HashMap<String, String>();
+		parameters.put("default-graph-uri", "http://dbpedia.org");
+		parameters.put("format", "application/sparql-results.xml");
+
+		// get Options for endpoints
+		if (predefinedEndpoint >= 1) {
+			sse = PredefinedEndpoint.getEndpoint(predefinedEndpoint);
+		} else {
+			sse = new SpecificSparqlEndpoint(url, host, parameters);
+		}
+
+		// get Options for Filters
+		
+		if (predefinedFilter >= 1) {
+			sqt = PredefinedFilter.getFilter(predefinedFilter);
+
+		} else {
+			sqt = new SparqlQueryType("forbid", objList, predList, useLits + "");
+			
+		}
+		// give everything to the manager
+		m.useConfiguration(sqt, sse, man, recursionDepth, getAllSuperClasses,closeAfterRecursion);
+		try {
+			String ont = "";
+			//System.out.println(learnDomain);
+			// used to learn a domain of a role
+			if (learnDomain || learnRange) {
+				Set<String> pos=new HashSet<String>();
+				Set<String> neg=new HashSet<String>();
+				if(learnDomain){
+					pos = m.getDomainInstancesForRole(role);
+					neg = m.getRangeInstancesForRole(role);
+				}else if(learnRange){
+					neg = m.getDomainInstancesForRole(role);
+					pos = m.getRangeInstancesForRole(role);
+				}
+				// keep at most numberOfInstancesUsedForRoleLearning instances per set
+				
+				
+					Set<String> tmp=new HashSet<String>();
+					for(String one:pos){
+						tmp.add(one);
+						if(tmp.size()>=numberOfInstancesUsedForRoleLearning)break;
+					}
+					pos=tmp;
+					System.out.println("Instances used: "+pos.size());
+					
+					tmp=new HashSet<String>();
+					for(String one:neg){
+						tmp.add(one);
+						if(tmp.size()>=numberOfInstancesUsedForRoleLearning)break;
+					}
+					neg=tmp;
+					
+					instances=new HashSet<String>();
+					instances.addAll(pos);
+					
+					instances.addAll(neg);
+					
+					for(String one:pos){
+						System.out.println("+\""+one+"\"");
+					}
+					for(String one:neg){
+						System.out.println("-\""+one+"\"");
+					}
+				
+				/*Random r= new Random();
+				
+				
+				Object[] arr=instances.toArray();
+					while(instances.size()>=30){
+					
+					}*/
+				// add the role to the predicate filter (EXISTS role.TOP is
+				// always a solution)
+				m.addPredicateFilter(role);
+				//System.out.println(instances);
+				// THIS is a workaround 
+				
+			}
+			// the actual extraction is started here
+			ont = m.extract(instances);
+			System.out.println("Number of cached SPARQL queries: "+m.getConfiguration().numberOfCachedSparqlQueries);
+			System.out.println("Number of uncached SPARQL queries: "+m.getConfiguration().numberOfUncachedSparqlQueries);
+			
+			System.out.println("Finished collecting Fragment");
+
+			if (dumpToFile) {
+				String filename = System.currentTimeMillis() + ".nt";
+				String basedir = "cache" + File.separator;
+				try {
+					if (!new File(basedir).exists())
+						new File(basedir).mkdir();
+
+					FileWriter fw = new FileWriter(new File(basedir + filename), true);
+					fw.write(ont);
+					fw.flush();
+					fw.close();
+
+					dumpFile = (new File(basedir + filename)).toURI().toURL();
+				} catch (Exception e) {
+					e.printStackTrace();
+				}
+			}
+			if (format.equals("KB")) {
+				try {
+					//kb = KBParser.parseKBFile(new StringReader(ont));
+					kb=KBParser.parseKBFile(dumpFile);
+				} catch (Exception e) {
+					e.printStackTrace();
+				}
+			}
+		} catch (Exception e) {
+			e.printStackTrace();
+		}
+		System.out.println("SparqlModul: ****Finished");
+	}
+
+	/*
+	 * (non-Javadoc)
+	 * 
+	 * @see org.dllearner.core.KnowledgeSource#toDIG()
+	 */
+	@Override
+	public String toDIG(URI kbURI) {
+		if (format.equals("N-TRIPLES"))
+			return JenaOWLDIGConverter.getTellsString(dumpFile, OntologyFormat.N_TRIPLES, kbURI);
+		else
+			return DIGConverter.getDIGString(kb, kbURI).toString();
+	}
+
+	/*
+	 * (non-Javadoc)
+	 * 
+	 * @see org.dllearner.core.KnowledgeSource#export(java.io.File,
+	 *      org.dllearner.core.OntologyFormat)
+	 */
+	@Override
+	public void export(File file, OntologyFormat format) throws OntologyFormatUnsupportedException {
+		// currently no export functions implemented, so we just throw an
+		// exception
+		throw new OntologyFormatUnsupportedException("export", format);
+	}
+
+	public URL getURL() {
+		return url;
+	}
+
+	public String[] getOntArray() {
+		return ontArray;
+	}
+
+	public void calculateSubjects(String label, int limit) {
+		System.out.println("SparqlModul: Collecting Subjects");
+		SparqlOntologyCollector oc = new SparqlOntologyCollector(url);
+		try {
+			subjects = oc.getSubjectsFromLabel(label, limit);
+		} catch (IOException e) {
+			subjects = new String[1];
+			subjects[0] = "[Error]Sparql Endpoint could not be reached.";
+		}
+		System.out.println("SparqlModul: ****Finished");
+	}
+
+	public void calculateTriples(String subject) {
+		System.out.println("SparqlModul: Collecting Triples");
+		SparqlOntologyCollector oc = new SparqlOntologyCollector(url);
+		try {
+			triples = oc.collectTriples(subject);
+		} catch (IOException e) {
+			triples = new String[1];
+			triples[0] = "[Error]Sparql Endpoint could not be reached.";
+		}
+		System.out.println("SparqlModul: ****Finished");
+	}
+
+	public void calculateConceptSubjects(String concept) {
+		System.out.println("SparqlModul: Collecting Subjects");
+		SparqlOntologyCollector oc = new SparqlOntologyCollector(url);
+		try {
+			conceptSubjects = oc.getSubjectsFromConcept(concept);
+		} catch (IOException e) {
+			conceptSubjects = new String[1];
+			conceptSubjects[0] = "[Error]Sparql Endpoint could not be reached.";
+		}
+		System.out.println("SparqlModul: ****Finished");
+	}
+
+	public boolean subjectThreadIsRunning() {
+		return subjectThreadRunning;
+	}
+
+	public void setSubjectThreadRunning(boolean bool) {
+		subjectThreadRunning = bool;
+	}
+
+	public boolean triplesThreadIsRunning() {
+		return triplesThreadRunning;
+	}
+
+	public void setTriplesThreadRunning(boolean bool) {
+		triplesThreadRunning = bool;
+	}
+
+	public boolean conceptThreadIsRunning() {
+		return conceptThreadRunning;
+	}
+
+	public void setConceptThreadRunning(boolean bool) {
+		conceptThreadRunning = bool;
+	}
+
+	public String[] getSubjects() {
+		return subjects;
+	}
+
+	public Thread getSubjectThread() {
+		return subjectThread;
+	}
+
+	public void setSubjectThread(Thread subjectThread) {
+		this.subjectThread = subjectThread;
+	}
+
+	public Thread getTriplesThread() {
+		return triplesThread;
+	}
+
+	public void setTriplesThread(Thread triplesThread) {
+		this.triplesThread = triplesThread;
+	}
+
+	public Thread getConceptThread() {
+		return conceptThread;
+	}
+
+	public void setConceptThread(Thread conceptThread) {
+		this.conceptThread = conceptThread;
+	}
+
+	public String[] getTriples() {
+		return triples;
+	}
+
+	public String[] getConceptSubjects() {
+		return conceptSubjects;
+	}
+}

Added: trunk/src/dl-learner/org/dllearner/kb/sparql/SparqlQuery.java
===================================================================
--- trunk/src/dl-learner/org/dllearner/kb/sparql/SparqlQuery.java	                        (rev 0)
+++ trunk/src/dl-learner/org/dllearner/kb/sparql/SparqlQuery.java	2008-01-14 11:54:55 UTC (rev 370)
@@ -0,0 +1,89 @@
+/**
+ * Copyright (C) 2007-2008, Jens Lehmann
+ *
+ * This file is part of DL-Learner.
+ * 
+ * DL-Learner is free software; you can redistribute it and/or modify
+ * it under the terms of the GNU General Public License as published by
+ * the Free Software Foundation; either version 3 of the License, or
+ * (at your option) any later version.
+ *
+ * DL-Learner is distributed in the hope that it will be useful,
+ * but WITHOUT ANY WARRANTY; without even the implied warranty of
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ * GNU General Public License for more details.
+ *
+ * You should have received a copy of the GNU General Public License
+ * along with this program.  If not, see <http://www.gnu.org/licenses/>.
+ *
+ */
+package org.dllearner.kb.sparql;
+
+import com.hp.hpl.jena.query.Query;
+import com.hp.hpl.jena.query.QueryExecution;
+import com.hp.hpl.jena.query.QueryExecutionFactory;
+import com.hp.hpl.jena.query.QueryFactory;
+import com.hp.hpl.jena.query.ResultSet;
+import com.hp.hpl.jena.query.ResultSetFormatter;
+
+/**
+ * Represents a SPARQL query. It includes support for stopping the SPARQL
+ * query (which may be necessary if a timeout is reached).
+ * 
+ * TODO: It is probably good to change all SPARQL query calls to use only
+ * this class.
+ * 
+ * TODO: Could we use Jena as a solid foundation here? (com.hp.hpl.jena.query)
+ * 
+ * @author Jens Lehmann
+ *
+ */
+public class SparqlQuery {
+	
+	private boolean isRunning = false;
+	
+	public SparqlQuery(SpecificSparqlEndpoint endpoint, String query) {
+		
+	}
+	
+	public void send() {
+		isRunning = true;
+		
+		// ... send query 
+		// ... check periodically whether isRunning is still true, if not
+		// abort the query
+	}
+	
+	public void stop() {
+		isRunning = false;
+	}
+
+	public boolean isRunning() {
+		return isRunning;
+	}
+	
+	// this is a working Jena script
+	// TODO: query runtime seems to be much too high (compared to running it in http://dbpedia.org/sparql)
+	// verify whether our SPARQL query implementation is faster and why;
+	// TODO: check whether Jena works with the other endpoints in PredefinedEndpoint; if not
+	// check whether it can be configured to run with these
+	public static void main(String[] args) {
+		
+		String queryString = "PREFIX dbpedia2: <http://dbpedia.org/property/> " +
+				"PREFIX skos: <http://www.w3.org/2004/02/skos/core#>" +
+				"SELECT ?episode ?chalkboard_gag WHERE {   ?episode skos:subject" +
+				"    <http://dbpedia.org/resource/Category:The_Simpsons_episodes%2C_season_12>." +
+				"  ?episode dbpedia2:blackboard ?chalkboard_gag }";
+		
+		System.out.println(queryString);
+		// create a query and parse it into Jena
+		Query query = QueryFactory.create(queryString);
+		query.validate();
+		// Jena access to DBpedia SPARQL endpoint
+		QueryExecution queryExecution = QueryExecutionFactory.sparqlService("http://dbpedia.org/sparql", query);
+		System.out.println("query SPARQL server");		
+		ResultSet rs = queryExecution.execSelect();
+		ResultSetFormatter.out(System.out, rs, query) ;
+	}
+	
+}

Modified: trunk/src/dl-learner/org/dllearner/server/ClientState.java
===================================================================
--- trunk/src/dl-learner/org/dllearner/server/ClientState.java	2008-01-14 08:56:17 UTC (rev 369)
+++ trunk/src/dl-learner/org/dllearner/server/ClientState.java	2008-01-14 11:54:55 UTC (rev 370)
@@ -33,7 +33,7 @@
 import org.dllearner.core.ReasonerComponent;
 import org.dllearner.core.ReasoningService;
 import org.dllearner.kb.OWLFile;
-import org.dllearner.kb.SparqlEndpoint;
+import org.dllearner.kb.sparql.SparqlEndpoint;
 
 /**
  * Stores the state of a DL-Learner client session.

Modified: trunk/src/dl-learner/org/dllearner/server/DLLearnerWS.java
===================================================================
--- trunk/src/dl-learner/org/dllearner/server/DLLearnerWS.java	2008-01-14 08:56:17 UTC (rev 369)
+++ trunk/src/dl-learner/org/dllearner/server/DLLearnerWS.java	2008-01-14 11:54:55 UTC (rev 370)
@@ -46,7 +46,7 @@
 import org.dllearner.core.dl.Concept;
 import org.dllearner.core.dl.Individual;
 import org.dllearner.kb.OWLFile;
-import org.dllearner.kb.SparqlEndpoint;
+import org.dllearner.kb.sparql.SparqlEndpoint;
 import org.dllearner.learningproblems.PosNegDefinitionLP;
 import org.dllearner.learningproblems.PosNegInclusionLP;
 import org.dllearner.learningproblems.PosOnlyDefinitionLP;


This was sent by the SourceForge.net collaborative development platform, the world's largest Open Source development site.