From: <lor...@us...> - 2013-09-04 16:04:23
|
Revision: 4071
          http://sourceforge.net/p/dl-learner/code/4071
Author:   lorenz_b
Date:     2013-09-04 16:04:20 +0000 (Wed, 04 Sep 2013)
Log Message:
-----------
Added text normalization.

Modified Paths:
--------------
    trunk/components-core/src/main/java/org/dllearner/algorithms/isle/textretrieval/AnnotationEntityTextRetriever.java

Modified: trunk/components-core/src/main/java/org/dllearner/algorithms/isle/textretrieval/AnnotationEntityTextRetriever.java
===================================================================
--- trunk/components-core/src/main/java/org/dllearner/algorithms/isle/textretrieval/AnnotationEntityTextRetriever.java	2013-09-04 15:59:46 UTC (rev 4070)
+++ trunk/components-core/src/main/java/org/dllearner/algorithms/isle/textretrieval/AnnotationEntityTextRetriever.java	2013-09-04 16:04:20 UTC (rev 4071)
@@ -8,6 +8,8 @@
 import java.util.Map;
 import java.util.Set;
 
+import org.dllearner.algorithms.isle.index.LinguisticAnnotator;
+import org.dllearner.algorithms.isle.index.LinguisticUtil;
 import org.dllearner.core.owl.Entity;
 import org.dllearner.kb.OWLAPIOntology;
 import org.dllearner.utilities.owl.OWLAPIConverter;
@@ -21,7 +23,9 @@
 import org.semanticweb.owlapi.util.IRIShortFormProvider;
 import org.semanticweb.owlapi.util.SimpleIRIShortFormProvider;
 
+import com.google.common.base.Joiner;
 
+
 /**
  * @author Lorenz Buehmann
  *
@@ -86,7 +90,10 @@
 		}
 		
 		if(textWithWeight.isEmpty() && useShortFormFallback){
-			textWithWeight.put(sfp.getShortForm(IRI.create(entity.getURI())), weight);
+			String shortForm = sfp.getShortForm(IRI.create(entity.getURI()));
+			shortForm = Joiner.on(" ").join(LinguisticUtil.getWordsFromCamelCase(shortForm));
+			shortForm = Joiner.on(" ").join(LinguisticUtil.getWordsFromUnderscored(shortForm));
+			textWithWeight.put(shortForm, weight);
 		}
 		
 		return textWithWeight;

This was sent by the SourceForge.net collaborative development platform, the world's largest Open Source development site.
|