/*
* Licensed to the Apache Software Foundation (ASF) under one or more
* contributor license agreements. See the NOTICE file distributed with
* this work for additional information regarding copyright ownership.
* The ASF licenses this file to You under the Apache License, Version 2.0
* (the "License"); you may not use this file except in compliance with
* the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.commons.io.input;
import static org.junit.Assert.*;
import java.io.File;
import java.io.IOException;
import java.io.UnsupportedEncodingException;
import java.net.URISyntaxException;
import java.util.Arrays;
import java.util.Collection;
import org.junit.After;
import org.junit.Test;
import org.junit.runner.RunWith;
import org.junit.runners.Parameterized;
import org.junit.runners.Parameterized.Parameters;
@RunWith(Parameterized.class)
public class ReversedLinesFileReaderTestParamBlockSize {
private static final String UTF_8 = "UTF-8";
private static final String ISO_8859_1 = "ISO-8859-1";
@SuppressWarnings("boxing")
// small and uneven block sizes are not used in reality but are good to show that the algorithm is solid
@Parameters(name = "BlockSize={0}")
public static Collection<Integer[]> blockSizes() {
return Arrays.asList(new Integer[][]{{1}, {3}, {8}, {256}, {4096}});
}
private ReversedLinesFileReader reversedLinesFileReader;
private final int testParamBlockSize;
public ReversedLinesFileReaderTestParamBlockSize(final Integer testWithBlockSize) {
testParamBlockSize = testWithBlockSize;
}
// Strings are escaped in constants to avoid java source encoding issues (source file enc is UTF-8):
// "A Test Line. Special chars: ÄäÜüÖöß ÃáéÃïçñ ©µ¥£±²®"
private static final String TEST_LINE = "A Test Line. Special chars: \u00C4\u00E4\u00DC\u00FC\u00D6\u00F6\u00DF \u00C3\u00E1\u00E9\u00ED\u00EF\u00E7\u00F1\u00C2 \u00A9\u00B5\u00A5\u00A3\u00B1\u00B2\u00AE";
// Hiragana letters: �����
private static final String TEST_LINE_SHIFT_JIS1 = "Hiragana letters: \u3041\u3042\u3043\u3044\u3045";
// Kanji letters: 明輸å�京
private static final String TEST_LINE_SHIFT_JIS2 = "Kanji letters: \u660E\u8F38\u5B50\u4EAC";
// windows-31j characters
private static final String TEST_LINE_WINDOWS_31J_1 = "\u3041\u3042\u3043\u3044\u3045";
private static final String TEST_LINE_WINDOWS_31J_2 = "\u660E\u8F38\u5B50\u4EAC";
// gbk characters (Simplified Chinese)
private static final String TEST_LINE_GBK_1 = "\u660E\u8F38\u5B50\u4EAC";
private static final String TEST_LINE_GBK_2 = "\u7B80\u4F53\u4E2D\u6587";
// x-windows-949 characters (Korean)
private static final String TEST_LINE_X_WINDOWS_949_1 = "\uD55C\uAD6D\uC5B4";
private static final String TEST_LINE_X_WINDOWS_949_2 = "\uB300\uD55C\uBBFC\uAD6D";
// x-windows-950 characters (Traditional Chinese)
private static final String TEST_LINE_X_WINDOWS_950_1 = "\u660E\u8F38\u5B50\u4EAC";
private static final String TEST_LINE_X_WINDOWS_950_2 = "\u7E41\u9AD4\u4E2D\u6587";
@After
public void closeReader() {
try {
reversedLinesFileReader.close();
} catch (final Exception e) {
// ignore
}
}
@Test
public void testIsoFileDefaults() throws URISyntaxException, IOException {
final File testFileIso = new File(this.getClass().getResource("/test-file-iso8859-1.bin").toURI());
reversedLinesFileReader = new ReversedLinesFileReader(testFileIso, testParamBlockSize, ISO_8859_1);
assertFileWithShrinkingTestLines(reversedLinesFileReader);
}
@Test
public void testUTF8FileWindowsBreaks() throws URISyntaxException, IOException {
final File testFileIso = new File(this.getClass().getResource("/test-file-utf8-win-linebr.bin").toURI());
reversedLinesFileReader = new ReversedLinesFileReader(testFileIso, testParamBlockSize, UTF_8);
assertFileWithShrinkingTestLines(reversedLinesFileReader);
}
@Test
public void testUTF8FileCRBreaks() throws URISyntaxException, IOException {
final File testFileIso = new File(this.getClass().getResource("/test-file-utf8-cr-only.bin").toURI());
reversedLinesFileReader = new ReversedLinesFileReader(testFileIso, testParamBlockSize, UTF_8);
assertFileWithShrinkingTestLines(reversedLinesFileReader);
}
@Test
public void testUTF8File() throws URISyntaxException, IOException {
final File testFileIso = new File(this.getClass().getResource("/test-file-utf8.bin").toURI());
reversedLinesFileReader = new ReversedLinesFileReader(testFileIso, testParamBlockSize, UTF_8);
assertFileWithShrinkingTestLines(reversedLinesFileReader);
}
@Test
public void testEmptyFile() throws URISyntaxException, IOException {
final File testFileEmpty = new File(this.getClass().getResource("/test-file-empty.bin").toURI());
reversedLinesFileReader = new ReversedLinesFileReader(testFileEmpty, testParamBlockSize, UTF_8);
assertNull(reversedLinesFileReader.readLine());
}
@Test
public void testUTF16BEFile() throws URISyntaxException, IOException {
final File testFileUTF16BE = new File(this.getClass().getResource("/test-file-utf16be.bin").toURI());
reversedLinesFileReader = new ReversedLinesFileReader(testFileUTF16BE, testParamBlockSize, "UTF-16BE");
assertFileWithShrinkingTestLines(reversedLinesFileReader);
}
@Test
public void testUTF16LEFile() throws URISyntaxException, IOException {
final File testFileUTF16LE = new File(this.getClass().getResource("/test-file-utf16le.bin").toURI());
reversedLinesFileReader = new ReversedLinesFileReader(testFileUTF16LE, testParamBlockSize, "UTF-16LE");
assertFileWithShrinkingTestLines(reversedLinesFileReader);
}
@Test
public void testShiftJISFile() throws URISyntaxException, IOException {
final File testFileShiftJIS = new File(this.getClass().getResource("/test-file-shiftjis.bin").toURI());
reversedLinesFileReader = new ReversedLinesFileReader(testFileShiftJIS, testParamBlockSize, "Shift_JIS");
assertEqualsAndNoLineBreaks(TEST_LINE_SHIFT_JIS2, reversedLinesFileReader.readLine());
assertEqualsAndNoLineBreaks(TEST_LINE_SHIFT_JIS1, reversedLinesFileReader.readLine());
}
@Test
public void testWindows31jFile() throws URISyntaxException, IOException {
final File testFileWindows31J = new File(this.getClass().getResource("/test-file-windows-31j.bin").toURI());
reversedLinesFileReader = new ReversedLinesFileReader(testFileWindows31J, testParamBlockSize, "windows-31j");
assertEqualsAndNoLineBreaks(TEST_LINE_WINDOWS_31J_2, reversedLinesFileReader.readLine());
assertEqualsAndNoLineBreaks(TEST_LINE_WINDOWS_31J_1, reversedLinesFileReader.readLine());
}
@Test
public void testGBK() throws URISyntaxException, IOException {
final File testFileGBK = new File(this.getClass().getResource("/test-file-gbk.bin").toURI());
reversedLinesFileReader = new ReversedLinesFileReader(testFileGBK, testParamBlockSize, "GBK");
assertEqualsAndNoLineBreaks(TEST_LINE_GBK_2, reversedLinesFileReader.readLine());
assertEqualsAndNoLineBreaks(TEST_LINE_GBK_1, reversedLinesFileReader.readLine());
}
@Test
public void testxWindows949File() throws URISyntaxException, IOException {
final File testFilexWindows949 = new File(this.getClass().getResource("/test-file-x-windows-949.bin").toURI());
reversedLinesFileReader = new ReversedLinesFileReader(testFilexWindows949, testParamBlockSize, "x-windows-949");
assertEqualsAndNoLineBreaks(TEST_LINE_X_WINDOWS_949_2, reversedLinesFileReader.readLine());
assertEqualsAndNoLineBreaks(TEST_LINE_X_WINDOWS_949_1, reversedLinesFileReader.readLine());
}
@Test
public void testxWindows950File() throws URISyntaxException, IOException {
final File testFilexWindows950 = new File(this.getClass().getResource("/test-file-x-windows-950.bin").toURI());
reversedLinesFileReader = new ReversedLinesFileReader(testFilexWindows950, testParamBlockSize, "x-windows-950");
assertEqualsAndNoLineBreaks(TEST_LINE_X_WINDOWS_950_2, reversedLinesFileReader.readLine());
assertEqualsAndNoLineBreaks(TEST_LINE_X_WINDOWS_950_1, reversedLinesFileReader.readLine());
}
@Test // this test is run 3x for same block size as we want to test with 10
public void testFileSizeIsExactMultipleOfBlockSize() throws URISyntaxException, IOException {
final int blockSize = 10;
final File testFile20Bytes = new File(this.getClass().getResource("/test-file-20byteslength.bin").toURI());
reversedLinesFileReader = new ReversedLinesFileReader(testFile20Bytes, blockSize, ISO_8859_1);
final String testLine = "123456789";
assertEqualsAndNoLineBreaks(testLine, reversedLinesFileReader.readLine());
assertEqualsAndNoLineBreaks(testLine, reversedLinesFileReader.readLine());
}
@Test
public void testUTF8FileWindowsBreaksSmallBlockSize2VerifyBlockSpanningNewLines() throws URISyntaxException, IOException {
final File testFileUtf8 = new File(this.getClass().getResource("/test-file-utf8-win-linebr.bin").toURI());
reversedLinesFileReader = new ReversedLinesFileReader(testFileUtf8, testParamBlockSize, UTF_8);
assertFileWithShrinkingTestLines(reversedLinesFileReader);
}
@Test
public void testIsoFileManyWindowsBreaksSmallBlockSize2VerifyBlockSpanningNewLines() throws URISyntaxException, IOException {
final File testFileIso = new File(this.getClass().getResource("/test-file-iso8859-1-shortlines-win-linebr.bin").toURI());
reversedLinesFileReader = new ReversedLinesFileReader(testFileIso, testParamBlockSize, ISO_8859_1);
for (int i = 3; i > 0; i--) {
for (int j = 1; j <= 3; j++) {
assertEqualsAndNoLineBreaks("", reversedLinesFileReader.readLine());
}
assertEqualsAndNoLineBreaks("" + i, reversedLinesFileReader.readLine());
}
}
@Test(expected = UnsupportedEncodingException.class)
public void testUnsupportedEncodingUTF16() throws URISyntaxException, IOException {
final File testFileEmpty = new File(this.getClass().getResource("/test-file-empty.bin").toURI());
new ReversedLinesFileReader(testFileEmpty, testParamBlockSize, "UTF-16").close();
}
@Test(expected = UnsupportedEncodingException.class)
public void testUnsupportedEncodingBig5() throws URISyntaxException, IOException {
final File testFileEncodingBig5 = new File(this.getClass().getResource("/test-file-empty.bin").toURI());
new ReversedLinesFileReader(testFileEncodingBig5, testParamBlockSize, "Big5").close();
}
private void assertFileWithShrinkingTestLines(final ReversedLinesFileReader reversedLinesFileReader) throws IOException {
String line = null;
int lineCount = 0;
while ((line = reversedLinesFileReader.readLine()) != null) {
lineCount++;
assertEqualsAndNoLineBreaks("Line " + lineCount + " is not matching", TEST_LINE.substring(0, lineCount), line);
}
}
static void assertEqualsAndNoLineBreaks(final String msg, final String expected, final String actual) {
if (actual != null) {
assertFalse("Line contains \\n: line=" + actual, actual.contains("\n"));
assertFalse("Line contains \\r: line=" + actual, actual.contains("\r"));
}
assertEquals(msg, expected, actual);
}
static void assertEqualsAndNoLineBreaks(final String expected, final String actual) {
assertEqualsAndNoLineBreaks(null, expected, actual);
}
}