package de.tudarmstadt.ukp.dkpro.core.decompounding.web1t;

/*
 * Copyright 2010
 * Ubiquitous Knowledge Processing (UKP) Lab
 * Technische Universität Darmstadt
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 * http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 **/

import java.io.File;
import java.util.List;

import junit.framework.Assert;

import org.junit.Test;

/**
 * Tests {@link Finder} queries against a Lucene index that each test builds from the n-gram
 * test resources and removes again afterwards.
 */
public class FinderTest
{
    /** Directory with the n-gram files handed to {@link LuceneIndexer}. */
    File source = new File("src/test/resources/n-grams");

    /** Directory the index is written to; created and deleted by every test. */
    File index = new File("src/test/resources/LuceneIndexer");

    /** Second constructor argument of {@link Finder}. */
    File jWeb1T = new File("src/test/resources/web1t/de");

    /**
     * Builds the index with the two-argument {@link LuceneIndexer} constructor and checks the
     * query results.
     *
     * @throws Exception
     *             if indexing or searching fails.
     */
    @Test
    public void testFinder1()
        throws Exception
    {
        index.mkdirs();
        try {
            // Create index
            LuceneIndexer indexer = new LuceneIndexer(source, index);
            indexer.index();

            assertFinderResults(new Finder(index, jWeb1T));
        }
        finally {
            // Always remove the index, even if an assertion failed, so that a broken run does
            // not leave stale data behind for the next test.
            deleteRecursively(index);
        }
    }

    /**
     * Builds the index with the three-argument {@link LuceneIndexer} constructor (third argument
     * {@code 2}) and checks that the query results are the same as in {@link #testFinder1()}.
     *
     * @throws Exception
     *             if indexing or searching fails.
     */
    @Test
    public void testFinder2()
        throws Exception
    {
        index.mkdirs();
        try {
            // Create index
            // NOTE(review): the third argument presumably sets how many sub-indexes are
            // written - confirm against LuceneIndexer.
            LuceneIndexer indexer = new LuceneIndexer(source, index, 2);
            indexer.index();

            assertFinderResults(new Finder(index, jWeb1T));
        }
        finally {
            // Always remove the index, even if an assertion failed.
            deleteRecursively(index);
        }
    }

    /**
     * Runs the queries shared by both tests and checks the returned n-grams.
     *
     * @param f
     *            the finder under test.
     * @throws Exception
     *             if a query fails.
     */
    private void assertFinderResults(Finder f)
        throws Exception
    {
        // Search and check if data is correct
        List<NGramModel> result = f.find("couch");
        assertSingleCouchGram(result);

        result = f.find("relax couch");
        assertSingleCouchGram(result);

        result = f.find("relax");
        Assert.assertEquals(3, result.size());

        // The same query is issued a second time and must yield the same number of hits.
        result = f.find("relax");
        Assert.assertEquals(3, result.size());
    }

    /**
     * Checks that the result consists of exactly the 4-gram "relax on the couch" with
     * frequency 100.
     *
     * @param result
     *            the query result to verify.
     */
    private void assertSingleCouchGram(List<NGramModel> result)
    {
        Assert.assertEquals(1, result.size());
        Assert.assertEquals("relax on the couch", result.get(0).getGram());
        Assert.assertEquals(4, result.get(0).getN());
        Assert.assertEquals(100, result.get(0).getFreq());
    }

    /**
     * Deletes a file or a directory including everything below it. Deletion is best effort:
     * entries that cannot be removed are skipped silently.
     *
     * @param file
     *            the file or directory to delete.
     */
    private static void deleteRecursively(File file)
    {
        // listFiles() returns null for regular files, missing paths and on I/O errors.
        File[] children = file.listFiles();
        if (children != null) {
            for (File child : children) {
                deleteRecursively(child);
            }
        }
        file.delete();
    }
}