/*
* Licensed to the Apache Software Foundation (ASF) under one or more
* contributor license agreements. See the NOTICE file distributed with
* this work for additional information regarding copyright ownership.
* The ASF licenses this file to You under the Apache License, Version 2.0
* (the "License"); you may not use this file except in compliance with
* the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.lucene.analysis.uima;
import org.apache.lucene.analysis.Analyzer;
import org.apache.lucene.analysis.BaseTokenStreamTestCase;
import org.apache.lucene.analysis.TokenStream;
import org.junit.After;
import org.junit.Before;
import org.junit.Test;
/**
 * Testcase for {@link UIMATypeAwareAnalyzer}.
 * <p>
 * Checks the terms and token types emitted for a fixed English sentence and
 * (once the referenced issue is fixed) runs the analyzer against random input.
 */
public class UIMATypeAwareAnalyzerTest extends BaseTokenStreamTestCase {

  /** Analyzer shared by the tests; created in {@link #setUp()} and closed in {@link #tearDown()}. */
  private UIMATypeAwareAnalyzer analyzer;

  /**
   * Creates the analyzer under test from the {@code /uima/AggregateSentenceAE.xml} descriptor.
   *
   * @throws Exception if the parent set-up or the analyzer construction fails
   */
  @Override
  @Before
  public void setUp() throws Exception {
    super.setUp();
    analyzer = new UIMATypeAwareAnalyzer("/uima/AggregateSentenceAE.xml",
        "org.apache.uima.TokenAnnotation", "posTag", null);
  }

  /**
   * Closes the analyzer created in {@link #setUp()} and then runs the parent tear-down.
   *
   * @throws Exception if closing the analyzer or the parent tear-down fails
   */
  @Override
  @After
  public void tearDown() throws Exception {
    try {
      // The field is still null when setUp() did not get as far as creating the analyzer;
      // skipping close() in that case avoids a NullPointerException hiding the real failure.
      if (analyzer != null) {
        analyzer.close();
      }
    } finally {
      // Always give the base class its tear-down, even when close() throws.
      super.tearDown();
    }
  }

  /**
   * Analyzes a fixed sentence and verifies both the emitted terms and their token types.
   *
   * @throws Exception if the token stream cannot be created or consumed
   */
  @Test
  public void baseUIMATypeAwareAnalyzerStreamTest() throws Exception {
    // create a token stream
    TokenStream ts = analyzer.tokenStream("text", "the big brown fox jumped on the wood");
    // check that 'the big brown fox jumped on the wood' tokens have the expected PoS types
    assertTokenStreamContents(ts,
        new String[]{"the", "big", "brown", "fox", "jumped", "on", "the", "wood"},
        new String[]{"at", "jj", "jj", "nn", "vbd", "in", "at", "nn"});
  }

  /**
   * Feeds random data through a separately configured analyzer
   * (descriptor {@code /uima/TestAggregateSentenceAE.xml}).
   *
   * @throws Exception if the analyzer cannot be created or the random-data check fails
   */
  @Test @AwaitsFix(bugUrl = "https://issues.apache.org/jira/browse/LUCENE-3869")
  public void testRandomStrings() throws Exception {
    // Named differently from the 'analyzer' field so the field is not shadowed.
    Analyzer randomDataAnalyzer = new UIMATypeAwareAnalyzer("/uima/TestAggregateSentenceAE.xml",
        "org.apache.lucene.uima.ts.TokenAnnotation", "pos", null);
    try {
      checkRandomData(random(), randomDataAnalyzer, 100 * RANDOM_MULTIPLIER);
    } finally {
      // Release the analyzer even when the random-data check fails.
      randomDataAnalyzer.close();
    }
  }
}