package org.molgenis.data.semanticsearch.string; import org.tartarus.snowball.ext.PorterStemmer; import org.testng.annotations.Test; import static org.testng.Assert.assertEquals; public class StemmerTest { private final Stemmer customPorterStemmer = new Stemmer(); @Test public void replaceIllegalCharacter() { assertEquals(customPorterStemmer.replaceIllegalCharacter("Hello__world!"), "hello world"); assertEquals(customPorterStemmer.replaceIllegalCharacter("Hello__world! 1234"), "hello world 1234"); assertEquals(customPorterStemmer.replaceIllegalCharacter("Hello_#45_world! 1234"), "hello 45 world 1234"); } @Test public void stemPhrase() { assertEquals(customPorterStemmer.cleanStemPhrase("i like smoking!"), "i like smoke"); assertEquals(customPorterStemmer.cleanStemPhrase("it`s not possibilities!"), "it not possibl"); } @Test public void stem() { assertEquals(customPorterStemmer.stem("use"), "us"); assertEquals(customPorterStemmer.stem("hypertension"), "hypertens"); PorterStemmer porterStemmer = new PorterStemmer(); porterStemmer.setCurrent("use"); porterStemmer.stem(); assertEquals(porterStemmer.getCurrent(), "us"); } }