/**
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.hadoop.hive.common.type;
import static org.junit.Assert.assertEquals;
import static org.junit.Assert.assertFalse;
import static org.junit.Assert.assertTrue;
import java.util.Random;
import org.junit.Rule;
import org.junit.Test;
import com.google.code.tempusfugit.concurrency.ConcurrentRule;
import com.google.code.tempusfugit.concurrency.RepeatingRule;
import com.google.code.tempusfugit.concurrency.annotations.Concurrent;
import com.google.code.tempusfugit.concurrency.annotations.Repeating;
public class TestHiveVarchar {
@Rule public ConcurrentRule concurrentRule = new ConcurrentRule();
@Rule public RepeatingRule repeatingRule = new RepeatingRule();
public TestHiveVarchar() {
super();
}
static Random rnd = new Random();
public static int getRandomSupplementaryChar() {
int lowSurrogate = 0xDC00 + rnd.nextInt(1024);
//return 0xD8000000 + lowSurrogate;
int highSurrogate = 0xD800;
return Character.toCodePoint((char)highSurrogate, (char)lowSurrogate);
}
public static int getRandomCodePoint() {
int codePoint;
if (rnd.nextDouble() < 0.50) {
codePoint = 32 + rnd.nextInt(90);
} else {
codePoint = getRandomSupplementaryChar();
}
if (!Character.isValidCodePoint(codePoint)) {
System.out.println(Integer.toHexString(codePoint) + " is not a valid code point");
}
return codePoint;
}
public static int getRandomCodePoint(int excludeChar) {
while (true) {
int codePoint = getRandomCodePoint();
if (codePoint != excludeChar) {
return codePoint;
}
}
}
@Test
@Concurrent(count=4)
@Repeating(repetition=100)
public void testStringLength() throws Exception {
int strLen = 20;
int[] lengths = { 15, 20, 25 };
// Try with supplementary characters
for (int idx1 = 0; idx1 < lengths.length; ++idx1) {
// Create random test string
StringBuilder sb = new StringBuilder();
int curLen = lengths[idx1];
for (int idx2 = 0; idx2 < curLen; ++idx2) {
sb.appendCodePoint(getRandomCodePoint(' '));
}
String testString = sb.toString();
assertEquals(curLen, testString.codePointCount(0, testString.length()));
String enforcedString = HiveBaseChar.enforceMaxLength(testString, strLen);
if (curLen <= strLen) {
// No truncation needed
assertEquals(testString, enforcedString);
} else {
// String should have been truncated.
assertEquals(strLen, enforcedString.codePointCount(0, enforcedString.length()));
}
}
// Try with ascii chars
String[] testStrings = {
"abcdefg",
"abcdefghijklmnopqrst",
"abcdefghijklmnopqrstuvwxyz"
};
for (String testString : testStrings) {
int curLen = testString.length();
assertEquals(curLen, testString.codePointCount(0, testString.length()));
String enforcedString = HiveBaseChar.enforceMaxLength(testString, strLen);
if (curLen <= strLen) {
// No truncation needed
assertEquals(testString, enforcedString);
} else {
// String should have been truncated.
assertEquals(strLen, enforcedString.codePointCount(0, enforcedString.length()));
}
}
HiveVarchar vc1 = new HiveVarchar("0123456789", 10);
assertEquals(10, vc1.getCharacterLength());
// Changing string value; getCharacterLength() should update accordingly
vc1.setValue("012345678901234");
assertEquals(15, vc1.getCharacterLength());
vc1.setValue("01234", -1);
assertEquals(5, vc1.getCharacterLength());
vc1.setValue(new HiveVarchar("0123456789", -1));
assertEquals(10, vc1.getCharacterLength());
vc1.setValue(new HiveVarchar("01234", -1), -1);
assertEquals(5, vc1.getCharacterLength());
}
@Test
@Concurrent(count=4)
@Repeating(repetition=100)
public void testComparison() throws Exception {
HiveVarchar hc1 = new HiveVarchar("abcd", 20);
HiveVarchar hc2 = new HiveVarchar("abcd", 20);
// Identical strings should be equal
assertTrue(hc1.equals(hc2));
assertTrue(hc2.equals(hc1));
assertEquals(0, hc1.compareTo(hc2));
assertEquals(0, hc2.compareTo(hc1));
// Unequal strings
hc2 = new HiveVarchar("abcde", 20);
assertFalse(hc1.equals(hc2));
assertFalse(hc2.equals(hc1));
assertFalse(0 == hc1.compareTo(hc2));
assertFalse(0 == hc2.compareTo(hc1));
// Trailing spaces are significant
hc2 = new HiveVarchar("abcd ", 30);
assertFalse(hc1.equals(hc2));
assertFalse(hc2.equals(hc1));
assertFalse(0 == hc1.compareTo(hc2));
assertFalse(0 == hc2.compareTo(hc1));
// Leading spaces are significant
hc2 = new HiveVarchar(" abcd", 20);
assertFalse(hc1.equals(hc2));
assertFalse(hc2.equals(hc1));
assertFalse(0 == hc1.compareTo(hc2));
assertFalse(0 == hc2.compareTo(hc1));
}
}