From: <and...@us...> - 2013-09-04 15:58:25
|
Revision: 4069 http://sourceforge.net/p/dl-learner/code/4069 Author: andremelo Date: 2013-09-04 15:58:20 +0000 (Wed, 04 Sep 2013) Log Message: ----------- Adding the buildTrie method Modified Paths: -------------- trunk/components-core/src/main/java/org/dllearner/algorithms/isle/index/SimpleEntityCandidatesTrie.java Modified: trunk/components-core/src/main/java/org/dllearner/algorithms/isle/index/SimpleEntityCandidatesTrie.java =================================================================== --- trunk/components-core/src/main/java/org/dllearner/algorithms/isle/index/SimpleEntityCandidatesTrie.java 2013-09-04 15:39:08 UTC (rev 4068) +++ trunk/components-core/src/main/java/org/dllearner/algorithms/isle/index/SimpleEntityCandidatesTrie.java 2013-09-04 15:58:20 UTC (rev 4069) @@ -1,23 +1,43 @@ package org.dllearner.algorithms.isle.index; import java.util.HashSet; +import java.util.Map; import java.util.Map.Entry; import java.util.Set; +import org.dllearner.algorithms.isle.textretrieval.AnnotationEntityTextRetriever; +import org.dllearner.algorithms.isle.textretrieval.EntityTextRetriever; import org.dllearner.core.owl.Entity; import org.dllearner.utilities.datastructures.PrefixTrie; +import org.semanticweb.owlapi.model.OWLEntity; import org.semanticweb.owlapi.model.OWLOntology; public class SimpleEntityCandidatesTrie implements EntityCandidatesTrie { PrefixTrie<Set<Entity>> trie; - OWLOntology ontology; + EntityTextRetriever entityTextRetriever; - public SimpleEntityCandidatesTrie(OWLOntology ontology) { - this.ontology = ontology; + public SimpleEntityCandidatesTrie(EntityTextRetriever entityTextRetriever) { + this.entityTextRetriever = entityTextRetriever; this.trie = new PrefixTrie<Set<Entity>>(); } + public void buildTrie(OWLOntology ontology) { + Map<Entity, Set<String>> relevantText = entityTextRetriever.getRelevantText(ontology); + + for (Entity entity : relevantText.keySet()) { + for (String text : relevantText.get(entity)) { + addEntry(text, entity); + // 
Adds also composing words, e.g. for "has child", "has" and "child" are also added + if (text.contains(" ")) { + for (String subtext : text.split(" ")) { + addEntry(subtext, entity); + } + } + } + } + } + @Override public void addEntry(String s, Entity e) { Set<Entity> candidates = trie.get(s); @@ -25,12 +45,13 @@ candidates = new HashSet<Entity>(); candidates.add(e); + + trie.put(s, candidates); } @Override public Set<Entity> getCandidateEntities(String s) { - // TODO Auto-generated method stub - return null; + return trie.get(s); } @Override @@ -38,12 +59,4 @@ return trie.getLongestMatch(s).toString(); } - /** - * @param args - */ - public static void main(String[] args) { - // TODO Auto-generated method stub - - } - } This was sent by the SourceForge.net collaborative development platform, the world's largest Open Source development site. |
From: <and...@us...> - 2013-09-04 16:22:37
|
Revision: 4074 http://sourceforge.net/p/dl-learner/code/4074 Author: andremelo Date: 2013-09-04 16:22:34 +0000 (Wed, 04 Sep 2013) Log Message: ----------- Add constructor with buildTrie Modified Paths: -------------- trunk/components-core/src/main/java/org/dllearner/algorithms/isle/index/SimpleEntityCandidatesTrie.java Modified: trunk/components-core/src/main/java/org/dllearner/algorithms/isle/index/SimpleEntityCandidatesTrie.java =================================================================== --- trunk/components-core/src/main/java/org/dllearner/algorithms/isle/index/SimpleEntityCandidatesTrie.java 2013-09-04 16:14:38 UTC (rev 4073) +++ trunk/components-core/src/main/java/org/dllearner/algorithms/isle/index/SimpleEntityCandidatesTrie.java 2013-09-04 16:22:34 UTC (rev 4074) @@ -22,6 +22,11 @@ this.trie = new PrefixTrie<Set<Entity>>(); } + public SimpleEntityCandidatesTrie(EntityTextRetriever entityTextRetriever, OWLOntology ontology) { + this(entityTextRetriever); + buildTrie(ontology); + } + public void buildTrie(OWLOntology ontology) { Map<Entity, Set<String>> relevantText = entityTextRetriever.getRelevantText(ontology); @@ -32,6 +37,7 @@ if (text.contains(" ")) { for (String subtext : text.split(" ")) { addEntry(subtext, entity); + //System.out.println("trie.add("+subtext+","++")"); } } } This was sent by the SourceForge.net collaborative development platform, the world's largest Open Source development site. |
From: <and...@us...> - 2013-09-04 16:25:27
|
Revision: 4075 http://sourceforge.net/p/dl-learner/code/4075 Author: andremelo Date: 2013-09-04 16:25:24 +0000 (Wed, 04 Sep 2013) Log Message: ----------- Remove constructor without ontology Modified Paths: -------------- trunk/components-core/src/main/java/org/dllearner/algorithms/isle/index/SimpleEntityCandidatesTrie.java Modified: trunk/components-core/src/main/java/org/dllearner/algorithms/isle/index/SimpleEntityCandidatesTrie.java =================================================================== --- trunk/components-core/src/main/java/org/dllearner/algorithms/isle/index/SimpleEntityCandidatesTrie.java 2013-09-04 16:22:34 UTC (rev 4074) +++ trunk/components-core/src/main/java/org/dllearner/algorithms/isle/index/SimpleEntityCandidatesTrie.java 2013-09-04 16:25:24 UTC (rev 4075) @@ -17,17 +17,13 @@ PrefixTrie<Set<Entity>> trie; EntityTextRetriever entityTextRetriever; - public SimpleEntityCandidatesTrie(EntityTextRetriever entityTextRetriever) { + public SimpleEntityCandidatesTrie(EntityTextRetriever entityTextRetriever, OWLOntology ontology) { this.entityTextRetriever = entityTextRetriever; - this.trie = new PrefixTrie<Set<Entity>>(); - } - - public SimpleEntityCandidatesTrie(EntityTextRetriever entityTextRetriever, OWLOntology ontology) { - this(entityTextRetriever); buildTrie(ontology); } - public void buildTrie(OWLOntology ontology) { + public void buildTrie(OWLOntology ontology) { + this.trie = new PrefixTrie<Set<Entity>>(); Map<Entity, Set<String>> relevantText = entityTextRetriever.getRelevantText(ontology); for (Entity entity : relevantText.keySet()) { This was sent by the SourceForge.net collaborative development platform, the world's largest Open Source development site. |
From: <and...@us...> - 2013-09-04 16:26:28
|
Revision: 4076 http://sourceforge.net/p/dl-learner/code/4076 Author: andremelo Date: 2013-09-04 16:26:24 +0000 (Wed, 04 Sep 2013) Log Message: ----------- Remove constructor without ontology Modified Paths: -------------- trunk/components-core/src/main/java/org/dllearner/algorithms/isle/index/SimpleEntityCandidatesTrie.java Modified: trunk/components-core/src/main/java/org/dllearner/algorithms/isle/index/SimpleEntityCandidatesTrie.java =================================================================== --- trunk/components-core/src/main/java/org/dllearner/algorithms/isle/index/SimpleEntityCandidatesTrie.java 2013-09-04 16:25:24 UTC (rev 4075) +++ trunk/components-core/src/main/java/org/dllearner/algorithms/isle/index/SimpleEntityCandidatesTrie.java 2013-09-04 16:26:24 UTC (rev 4076) @@ -2,14 +2,11 @@ import java.util.HashSet; import java.util.Map; -import java.util.Map.Entry; import java.util.Set; -import org.dllearner.algorithms.isle.textretrieval.AnnotationEntityTextRetriever; import org.dllearner.algorithms.isle.textretrieval.EntityTextRetriever; import org.dllearner.core.owl.Entity; import org.dllearner.utilities.datastructures.PrefixTrie; -import org.semanticweb.owlapi.model.OWLEntity; import org.semanticweb.owlapi.model.OWLOntology; public class SimpleEntityCandidatesTrie implements EntityCandidatesTrie { This was sent by the SourceForge.net collaborative development platform, the world's largest Open Source development site. |
From: <and...@us...> - 2013-09-05 08:43:01
|
Revision: 4085 http://sourceforge.net/p/dl-learner/code/4085 Author: andremelo Date: 2013-09-05 08:42:59 +0000 (Thu, 05 Sep 2013) Log Message: ----------- Adding printTrie Modified Paths: -------------- trunk/components-core/src/main/java/org/dllearner/algorithms/isle/index/SimpleEntityCandidatesTrie.java Modified: trunk/components-core/src/main/java/org/dllearner/algorithms/isle/index/SimpleEntityCandidatesTrie.java =================================================================== --- trunk/components-core/src/main/java/org/dllearner/algorithms/isle/index/SimpleEntityCandidatesTrie.java 2013-09-05 08:32:57 UTC (rev 4084) +++ trunk/components-core/src/main/java/org/dllearner/algorithms/isle/index/SimpleEntityCandidatesTrie.java 2013-09-05 08:42:59 UTC (rev 4085) @@ -1,6 +1,10 @@ package org.dllearner.algorithms.isle.index; +import java.util.ArrayList; +import java.util.Collection; +import java.util.Collections; import java.util.HashSet; +import java.util.List; import java.util.Map; import java.util.Set; @@ -58,5 +62,18 @@ CharSequence match = trie.getLongestMatch(s); return (match!=null) ? trie.getLongestMatch(s).toString() : null; } + + public void printTrie() { + System.out.println("Printing tree content:"); + Map<String,Set<Entity>> trieMap = trie.toMap(); + List<String> termsList = new ArrayList(trieMap.keySet()); + Collections.sort(termsList); + for (String key : termsList) { + System.out.println(key); + for (Entity candidate: trieMap.get(key)) { + System.out.println("\t"+candidate); + } + } + } } This was sent by the SourceForge.net collaborative development platform, the world's largest Open Source development site. |
From: <dfl...@us...> - 2013-09-05 13:59:50
|
Revision: 4091 http://sourceforge.net/p/dl-learner/code/4091 Author: dfleischhacker Date: 2013-09-05 13:59:47 +0000 (Thu, 05 Sep 2013) Log Message: ----------- Reuse computed match instead of recomputing it Modified Paths: -------------- trunk/components-core/src/main/java/org/dllearner/algorithms/isle/index/SimpleEntityCandidatesTrie.java Modified: trunk/components-core/src/main/java/org/dllearner/algorithms/isle/index/SimpleEntityCandidatesTrie.java =================================================================== --- trunk/components-core/src/main/java/org/dllearner/algorithms/isle/index/SimpleEntityCandidatesTrie.java 2013-09-05 10:17:34 UTC (rev 4090) +++ trunk/components-core/src/main/java/org/dllearner/algorithms/isle/index/SimpleEntityCandidatesTrie.java 2013-09-05 13:59:47 UTC (rev 4091) @@ -1,18 +1,12 @@ package org.dllearner.algorithms.isle.index; -import java.util.ArrayList; -import java.util.Collection; -import java.util.Collections; -import java.util.HashSet; -import java.util.List; -import java.util.Map; -import java.util.Set; - import org.dllearner.algorithms.isle.textretrieval.EntityTextRetriever; import org.dllearner.core.owl.Entity; import org.dllearner.utilities.datastructures.PrefixTrie; import org.semanticweb.owlapi.model.OWLOntology; +import java.util.*; + public class SimpleEntityCandidatesTrie implements EntityCandidatesTrie { PrefixTrie<Set<Entity>> trie; @@ -62,7 +56,7 @@ @Override public String getLongestMatch(String s) { CharSequence match = trie.getLongestMatch(s); - return (match!=null) ? trie.getLongestMatch(s).toString() : null; + return (match!=null) ? match.toString() : null; } public String toString() { This was sent by the SourceForge.net collaborative development platform, the world's largest Open Source development site. |
From: <dfl...@us...> - 2013-09-06 14:10:46
|
Revision: 4096 http://sourceforge.net/p/dl-learner/code/4096 Author: dfleischhacker Date: 2013-09-06 14:10:41 +0000 (Fri, 06 Sep 2013) Log Message: ----------- Remove debugging output Modified Paths: -------------- trunk/components-core/src/main/java/org/dllearner/algorithms/isle/index/SimpleEntityCandidatesTrie.java Modified: trunk/components-core/src/main/java/org/dllearner/algorithms/isle/index/SimpleEntityCandidatesTrie.java =================================================================== --- trunk/components-core/src/main/java/org/dllearner/algorithms/isle/index/SimpleEntityCandidatesTrie.java 2013-09-06 13:31:43 UTC (rev 4095) +++ trunk/components-core/src/main/java/org/dllearner/algorithms/isle/index/SimpleEntityCandidatesTrie.java 2013-09-06 14:10:41 UTC (rev 4096) @@ -52,7 +52,6 @@ } addEntry(text, entity); for (String alternativeText : nameGenerator.getAlternativeText(text)) { - System.out.println("New alternative text for " + text + " --> " + alternativeText); addEntry(alternativeText, entity); } // Adds also composing words, e.g. 
for "has child", "has" and "child" are also added @@ -60,7 +59,6 @@ for (String subtext : text.split(" ")) { addEntry(subtext, entity); for (String alternativeText : nameGenerator.getAlternativeText(subtext)) { - System.out.println("New alternative text for " + subtext + " --> " + alternativeText); addEntry(alternativeText, entity); } //System.out.println("trie.add("+subtext+","++")"); @@ -169,8 +167,8 @@ ArrayList<String> res = new ArrayList<String>(); res.add(LinguisticUtil.getInstance().getNormalizedForm(word)); - for (String w : LinguisticUtil.getInstance() - .getTopSynonymsForWord(LinguisticUtil.getInstance().getNormalizedForm(word), maxNumberOfSenses)) { + for (String w : LinguisticUtil.getInstance().getTopSynonymsForWord( + LinguisticUtil.getInstance().getNormalizedForm(word), maxNumberOfSenses)) { res.add(w.replaceAll("_", " ")); } This was sent by the SourceForge.net collaborative development platform, the world's largest Open Source development site. |
From: <dfl...@us...> - 2013-09-09 10:19:00
|
Revision: 4101 http://sourceforge.net/p/dl-learner/code/4101 Author: dfleischhacker Date: 2013-09-09 10:18:57 +0000 (Mon, 09 Sep 2013) Log Message: ----------- Remove constructor defaulting to DummyNameGenerator Modified Paths: -------------- trunk/components-core/src/main/java/org/dllearner/algorithms/isle/index/SimpleEntityCandidatesTrie.java Modified: trunk/components-core/src/main/java/org/dllearner/algorithms/isle/index/SimpleEntityCandidatesTrie.java =================================================================== --- trunk/components-core/src/main/java/org/dllearner/algorithms/isle/index/SimpleEntityCandidatesTrie.java 2013-09-09 10:12:56 UTC (rev 4100) +++ trunk/components-core/src/main/java/org/dllearner/algorithms/isle/index/SimpleEntityCandidatesTrie.java 2013-09-09 10:18:57 UTC (rev 4101) @@ -13,16 +13,16 @@ PrefixTrie<Set<Entity>> trie; EntityTextRetriever entityTextRetriever; - /** - * Initialize the trie with strings from the provided ontology using a no-op name generator, i.e., only the - * actual ontology strings are added and no expansion is done. - * - * @param entityTextRetriever the text retriever to use - * @param ontology the ontology to get strings from - */ - public SimpleEntityCandidatesTrie(EntityTextRetriever entityTextRetriever, OWLOntology ontology) { - this(entityTextRetriever, ontology, new DummyNameGenerator()); - } +// /** +// * Initialize the trie with strings from the provided ontology using a no-op name generator, i.e., only the +// * actual ontology strings are added and no expansion is done. 
+// * +// * @param entityTextRetriever the text retriever to use +// * @param ontology the ontology to get strings from +// */ +// public SimpleEntityCandidatesTrie(EntityTextRetriever entityTextRetriever, OWLOntology ontology) { +// this(entityTextRetriever, ontology, new DummyNameGenerator()); +// } /** * Initialize the trie with strings from the provided ontology and use the given entity name generator This was sent by the SourceForge.net collaborative development platform, the world's largest Open Source development site. |
From: <and...@us...> - 2013-09-20 09:58:49
|
Revision: 4111 http://sourceforge.net/p/dl-learner/code/4111 Author: andremelo Date: 2013-09-20 09:58:45 +0000 (Fri, 20 Sep 2013) Log Message: ----------- Changing buildTrie to add all subsequences of an entity's text, instead of only composing tokens Modified Paths: -------------- trunk/components-core/src/main/java/org/dllearner/algorithms/isle/index/SimpleEntityCandidatesTrie.java Modified: trunk/components-core/src/main/java/org/dllearner/algorithms/isle/index/SimpleEntityCandidatesTrie.java =================================================================== --- trunk/components-core/src/main/java/org/dllearner/algorithms/isle/index/SimpleEntityCandidatesTrie.java 2013-09-16 00:14:34 UTC (rev 4110) +++ trunk/components-core/src/main/java/org/dllearner/algorithms/isle/index/SimpleEntityCandidatesTrie.java 2013-09-20 09:58:45 UTC (rev 4111) @@ -50,24 +50,43 @@ if (text.trim().isEmpty()) { continue; } + addEntry(text, entity); + addSubsequences(entity, text); + for (String alternativeText : nameGenerator.getAlternativeText(text)) { addEntry(alternativeText, entity); } - // Adds also composing words, e.g. 
for "has child", "has" and "child" are also added - if (text.contains(" ")) { - for (String subtext : text.split(" ")) { - addEntry(subtext, entity); - for (String alternativeText : nameGenerator.getAlternativeText(subtext)) { - addEntry(alternativeText, entity); - } - //System.out.println("trie.add("+subtext+","++")"); - } - } + + } } } + /** + * Adds the subsequences of a test + * @param entity + * @param text + */ + private void addSubsequences(Entity entity, String text) { + if (text.contains(" ")) { + String[] tokens = text.split(" "); + for (int size=1; size<tokens.length; size++) { + + for (int start=0; start<tokens.length-size+1; start++) { + String subsequence = ""; + for (int i=0; i<size; i++) { + subsequence += tokens[start+i] + " "; + } + subsequence = subsequence.trim(); + + addEntry(subsequence, entity); + } + + } + } + } + @Override public void addEntry(String s, Entity e) { Set<Entity> candidates; This was sent by the SourceForge.net collaborative development platform, the world's largest Open Source development site. |
From: <dfl...@us...> - 2013-09-23 12:22:33
|
Revision: 4112 http://sourceforge.net/p/dl-learner/code/4112 Author: dfleischhacker Date: 2013-09-23 12:22:30 +0000 (Mon, 23 Sep 2013) Log Message: ----------- Use WordNet expansion and lemmatizing also for subsequences Modified Paths: -------------- trunk/components-core/src/main/java/org/dllearner/algorithms/isle/index/SimpleEntityCandidatesTrie.java Modified: trunk/components-core/src/main/java/org/dllearner/algorithms/isle/index/SimpleEntityCandidatesTrie.java =================================================================== --- trunk/components-core/src/main/java/org/dllearner/algorithms/isle/index/SimpleEntityCandidatesTrie.java 2013-09-20 09:58:45 UTC (rev 4111) +++ trunk/components-core/src/main/java/org/dllearner/algorithms/isle/index/SimpleEntityCandidatesTrie.java 2013-09-23 12:22:30 UTC (rev 4112) @@ -52,13 +52,11 @@ } addEntry(text, entity); - addSubsequences(entity, text); + addSubsequencesWordNet(entity, text); for (String alternativeText : nameGenerator.getAlternativeText(text)) { addEntry(alternativeText, entity); } - - } } } @@ -86,8 +84,57 @@ } } } - - @Override + + private void addSubsequencesWordNet(Entity entity, String text) { + if (text.contains(" ")) { + String[] tokens = text.split(" "); + + List<String>[] wordnetTokens = (ArrayList<String>[]) new ArrayList[tokens.length]; + + // generate list of lemmatized wordnet synonyms for each token + for (int i = 0; i < tokens.length; i++) { + wordnetTokens[i] = new ArrayList<String>(); + wordnetTokens[i].add(LinguisticUtil.getInstance().getNormalizedForm(tokens[i].toLowerCase())); + for (String w : LinguisticUtil.getInstance().getTopSynonymsForWord(tokens[i], 5)) { + wordnetTokens[i].add(LinguisticUtil.getInstance().getNormalizedForm(w).toLowerCase()); + } + } + + // generate subsequences starting at the given start index of the given size + Set<String> allPossibleSubsequences = getAllPossibleSubsequences(wordnetTokens); + + for (String s : allPossibleSubsequences) { + addEntry(s, entity); + } + 
} + } + + private static Set<String> getAllPossibleSubsequences(List<String>[] wordnetTokens) { + ArrayList<String> res = new ArrayList<String>(); + + for (int size = 1; size < wordnetTokens.length + 1; size++) { + for (int start = 0; start < wordnetTokens.length - size + 1; start++) { + getPossibleSubsequencesRec(res, new ArrayList<String>(), wordnetTokens, 0, size); + } + } + + return new HashSet<String>(res); + } + + private static void getPossibleSubsequencesRec(List<String> allSubsequences, List<String> currentSubsequence, List<String>[] wordnetTokens, + int curStart, int maxLength) { + if (currentSubsequence.size() == maxLength) { + allSubsequences.add(StringUtils.join(currentSubsequence, " ")); + return; + } + for (String w : wordnetTokens[curStart]) { + ArrayList<String> tmpSequence = new ArrayList<String>(currentSubsequence); + tmpSequence.add(w); + getPossibleSubsequencesRec(allSubsequences, tmpSequence, wordnetTokens, curStart + 1, maxLength); + } + } + + @Override public void addEntry(String s, Entity e) { Set<Entity> candidates; if (trie.contains(s)) @@ -124,8 +171,31 @@ } return output; } - - public void printTrie() { + + public static void main(String[] args) { + String[] tokens = "this is a long and very complex text".split(" "); + + List<String>[] wordnetTokens = (ArrayList<String>[]) new ArrayList[tokens.length]; + + // generate list of lemmatized wordnet synonyms for each token + for (int i = 0; i < tokens.length; i++) { + wordnetTokens[i] = new ArrayList<String>(); + wordnetTokens[i].add(LinguisticUtil.getInstance().getNormalizedForm(tokens[i])); + for (String w : LinguisticUtil.getInstance().getTopSynonymsForWord(tokens[i], 5)) { + System.out.println("Adding: " + LinguisticUtil.getInstance().getNormalizedForm(w)); + wordnetTokens[i].add(LinguisticUtil.getInstance().getNormalizedForm(w).replaceAll("_", " ")); + } + } + + // generate subsequences starting at the given start index of the given size + Set<String> allPossibleSubsequences = 
getAllPossibleSubsequences(wordnetTokens); + + for (String s : allPossibleSubsequences) { + System.out.println(s); + } + } + + public void printTrie() { System.out.println(this.toString()); } @@ -186,9 +256,8 @@ ArrayList<String> res = new ArrayList<String>(); res.add(LinguisticUtil.getInstance().getNormalizedForm(word)); - for (String w : LinguisticUtil.getInstance().getTopSynonymsForWord( - LinguisticUtil.getInstance().getNormalizedForm(word), maxNumberOfSenses)) { - res.add(w.replaceAll("_", " ")); + for (String w : LinguisticUtil.getInstance().getTopSynonymsForWord(word, maxNumberOfSenses)) { + res.add(LinguisticUtil.getInstance().getNormalizedForm(w.replaceAll("_", " "))); } return res; This was sent by the SourceForge.net collaborative development platform, the world's largest Open Source development site. |
From: <lor...@us...> - 2013-11-12 13:41:08
|
Revision: 4145 http://sourceforge.net/p/dl-learner/code/4145 Author: lorenz_b Date: 2013-11-12 13:41:05 +0000 (Tue, 12 Nov 2013) Log Message: ----------- Fixed bug caused by leading/trailing spaces in trie. Modified Paths: -------------- trunk/components-core/src/main/java/org/dllearner/algorithms/isle/index/SimpleEntityCandidatesTrie.java Modified: trunk/components-core/src/main/java/org/dllearner/algorithms/isle/index/SimpleEntityCandidatesTrie.java =================================================================== --- trunk/components-core/src/main/java/org/dllearner/algorithms/isle/index/SimpleEntityCandidatesTrie.java 2013-11-11 15:35:44 UTC (rev 4144) +++ trunk/components-core/src/main/java/org/dllearner/algorithms/isle/index/SimpleEntityCandidatesTrie.java 2013-11-12 13:41:05 UTC (rev 4145) @@ -52,7 +52,6 @@ if (text.trim().isEmpty()) { continue; } - text = text.trim(); addEntry(text, entity); addSubsequencesWordNet(entity, text); @@ -150,6 +149,7 @@ @Override public void addEntry(String s, Entity e) { + s = s.trim(); FullTokenEntitySetPair candidates; if (trie.contains(s)) candidates = trie.get(s); @@ -162,6 +162,7 @@ } public void addEntry(String s, Entity e, String originalString) { + s = s.trim(); FullTokenEntitySetPair candidates; if (trie.contains(s)) candidates = trie.get(s); This was sent by the SourceForge.net collaborative development platform, the world's largest Open Source development site. |