/**
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.hadoop.hive.ql.udf.generic;
import junit.framework.TestCase;
import org.apache.hadoop.hive.ql.metadata.HiveException;
import org.apache.hadoop.hive.ql.udf.generic.GenericUDF.DeferredJavaObject;
import org.apache.hadoop.hive.ql.udf.generic.GenericUDF.DeferredObject;
import org.apache.hadoop.hive.serde2.objectinspector.ObjectInspector;
import org.apache.hadoop.hive.serde2.objectinspector.primitive.PrimitiveObjectInspectorFactory;
import org.apache.hadoop.hive.serde2.typeinfo.TypeInfoFactory;
import org.apache.hadoop.io.BooleanWritable;
import org.apache.hadoop.io.Text;
/**
 * Tests for {@link GenericUDFRegExp}. The regex argument is supplied either
 * through a constant object inspector or as an ordinary per-row value, and in
 * both cases the test checks the returned {@link BooleanWritable} (or the
 * absence of one).
 */
public class TestGenericUDFRegexp extends TestCase {

  /** Constant regex {@code ^fo} checked against several subjects and a null subject. */
  public void testConstant() throws HiveException {
    Text pattern = new Text("^fo");
    GenericUDFRegExp regexp = newUdfWithConstantRegex(pattern);

    runAndVerifyConst("fofo", pattern, true, regexp);
    runAndVerifyConst("fofofo", pattern, true, regexp);
    runAndVerifyConst("fobar", pattern, true, regexp);
    runAndVerifyConst("barfobar", pattern, false, regexp);

    // A null subject is expected to yield a null result.
    runAndVerifyConst(null, pattern, null, regexp);
  }

  /** Constant empty regex: every non-null subject is expected to evaluate to false. */
  public void testEmptyConstant() throws HiveException {
    Text pattern = new Text("");
    GenericUDFRegExp regexp = newUdfWithConstantRegex(pattern);

    // empty regex (should be one WARN message)
    runAndVerifyConst("foo", pattern, false, regexp);
    runAndVerifyConst("bar", pattern, false, regexp);

    // A null subject is expected to yield a null result.
    runAndVerifyConst(null, pattern, null, regexp);
  }

  /** Constant null regex: every evaluation is expected to return null. */
  public void testNullConstant() throws HiveException {
    Text pattern = null;
    GenericUDFRegExp regexp = newUdfWithConstantRegex(pattern);

    runAndVerifyConst("fofo", pattern, null, regexp);
    runAndVerifyConst("fofofo", pattern, null, regexp);
    runAndVerifyConst("fobar", pattern, null, regexp);
    runAndVerifyConst(null, pattern, null, regexp);
  }

  /** Both arguments use the plain writable string inspector; the regex varies per call. */
  public void testNonConstant() throws HiveException {
    ObjectInspector subjectOI = PrimitiveObjectInspectorFactory.writableStringObjectInspector;
    ObjectInspector patternOI = PrimitiveObjectInspectorFactory.writableStringObjectInspector;
    GenericUDFRegExp regexp = new GenericUDFRegExp();
    regexp.initialize(new ObjectInspector[] { subjectOI, patternOI });

    // Cases expected to evaluate to true.
    runAndVerify("fofo", "^fo", true, regexp);
    runAndVerify("fo\no", "^fo\no$", true, regexp);
    runAndVerify("Bn", "^Ba*n", true, regexp);
    runAndVerify("afofo", "fo", true, regexp);

    // Cases expected to evaluate to false.
    runAndVerify("afofo", "^fo", false, regexp);
    runAndVerify("Baan", "^Ba?n", false, regexp);
    runAndVerify("axe", "pi|apa", false, regexp);
    runAndVerify("pip", "^(pi)*$", false, regexp);

    // empty regex (should be one WARN message)
    runAndVerify("bar", "", false, regexp);
    runAndVerify("foo", "", false, regexp);

    // A null on either side is expected to yield a null result.
    runAndVerify(null, "^fo", null, regexp);
    runAndVerify("fofo", null, null, regexp);
  }

  /**
   * Evaluates {@code udf} with the given subject and the already-built regex
   * {@link Text}, then checks the outcome.
   *
   * @param str subject string, or null to pass a null first argument
   * @param regexText regex value handed to the UDF as-is (may be null)
   * @param expResult expected boolean, or null when a null result is expected
   * @param udf initialized UDF under test
   */
  private void runAndVerifyConst(String str, Text regexText, Boolean expResult, GenericUDF udf)
      throws HiveException {
    evaluateAndCheck("regexp() const test ", udf, asText(str), regexText, expResult);
  }

  /**
   * Evaluates {@code udf} with the given subject and regex strings, then
   * checks the outcome.
   *
   * @param str subject string, or null to pass a null first argument
   * @param regex regex string, or null to pass a null second argument
   * @param expResult expected boolean, or null when a null result is expected
   * @param udf initialized UDF under test
   */
  private void runAndVerify(String str, String regex, Boolean expResult, GenericUDF udf)
      throws HiveException {
    evaluateAndCheck("regexp() test ", udf, asText(str), asText(regex), expResult);
  }

  /**
   * Creates a {@link GenericUDFRegExp} initialized with a writable string
   * inspector for the subject and a constant string inspector wrapping
   * {@code pattern} for the regex.
   */
  private GenericUDFRegExp newUdfWithConstantRegex(Text pattern) throws HiveException {
    ObjectInspector subjectOI = PrimitiveObjectInspectorFactory.writableStringObjectInspector;
    ObjectInspector patternOI = PrimitiveObjectInspectorFactory
        .getPrimitiveWritableConstantObjectInspector(TypeInfoFactory.stringTypeInfo, pattern);
    GenericUDFRegExp regexp = new GenericUDFRegExp();
    regexp.initialize(new ObjectInspector[] { subjectOI, patternOI });
    return regexp;
  }

  /** Wraps a string in a {@link Text}; a null string stays null. */
  private static Text asText(String value) {
    if (value == null) {
      return null;
    }
    return new Text(value);
  }

  /**
   * Calls {@code udf.evaluate} with the two arguments and asserts either a
   * null result (when {@code expected} is null) or a non-null result equal to
   * {@code expected}.
   */
  private void evaluateAndCheck(String label, GenericUDF udf, Text subject, Text pattern,
      Boolean expected) throws HiveException {
    DeferredObject subjectArg = new DeferredJavaObject(subject);
    DeferredObject patternArg = new DeferredJavaObject(pattern);
    BooleanWritable actual =
        (BooleanWritable) udf.evaluate(new DeferredObject[] { subjectArg, patternArg });

    if (expected == null) {
      assertNull(actual);
      return;
    }
    assertNotNull(actual);
    assertEquals(label, expected.booleanValue(), actual.get());
  }
}