/**
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
* <p/>
* http://www.apache.org/licenses/LICENSE-2.0
* <p/>
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.ambari.view.hive20.resources.upload;
import org.apache.ambari.view.hive20.client.Row;
import org.apache.ambari.view.hive20.resources.uploads.parsers.ParseOptions;
import org.apache.ambari.view.hive20.resources.uploads.parsers.csv.opencsv.OpenCSVParser;
import org.junit.Assert;
import org.junit.Test;
import java.io.IOException;
import java.io.StringReader;
import java.util.Iterator;
/**
 * Unit tests for {@link OpenCSVParser}: row iteration over empty, single-row and
 * multi-row input, plus quote, escape and delimiter handling configured through
 * {@link ParseOptions}.
 */
public class OpenCSVParserTest {

  /**
   * Asserts that the iterator reports another row and that this row equals a
   * {@link Row} built from the expected values.
   *
   * @param ordinal  label of the row used in the failure messages (for example "1st")
   * @param rows     iterator obtained from the parser under test
   * @param expected expected column values of the next row, in order
   */
  private static void assertNextRow(String ordinal, Iterator<Row> rows, Object... expected) {
    Assert.assertTrue("Failed to detect " + ordinal + " row!", rows.hasNext());
    Assert.assertEquals("Failed to match " + ordinal + " row!", new Row(expected), rows.next());
  }

  /**
   * Creating a parser over an empty stream must not fail, and the parser must
   * report no rows.
   */
  @Test
  public void testEmptyStream() throws Exception {
    String csv = "";

    try (
      StringReader reader = new StringReader(csv);
      OpenCSVParser parser = new OpenCSVParser(reader, new ParseOptions())
    ) {
      Assert.assertFalse("There should not be any rows.", parser.iterator().hasNext());
    }
  }

  /**
   * Input consisting of a single blank is still reported as one row whose only
   * value is that blank.
   */
  @Test
  public void testEmptyRow() throws Exception {
    String csv = " ";

    try (
      StringReader reader = new StringReader(csv);
      OpenCSVParser parser = new OpenCSVParser(reader, new ParseOptions())
    ) {
      Iterator<Row> rows = parser.iterator();

      Assert.assertTrue("Iterator should not be empty", rows.hasNext());
      Assert.assertArrayEquals("Row should not be empty", new Object[]{" "}, rows.next().getRow());
    }
  }

  /**
   * A single line without a trailing newline yields exactly one row.
   */
  @Test
  public void testParse1Row() throws Exception {
    String csv = "value1,c,10,10.1";

    try (
      StringReader reader = new StringReader(csv);
      OpenCSVParser parser = new OpenCSVParser(reader, new ParseOptions())
    ) {
      Iterator<Row> rows = parser.iterator();

      assertNextRow("1st", rows, "value1", "c", "10", "10.1");
      Assert.assertFalse("Should report no more rows!", rows.hasNext());
    }
  }

  /**
   * Two newline-separated lines yield two rows; all values are returned as strings
   * and {@code hasNext()} keeps returning {@code false} once the input is exhausted.
   */
  @Test
  public void testParseMultipleRow() throws Exception {
    String csv = "value1,c,10,10.1\n" +
      "value2,c2,102,true";

    try (
      StringReader reader = new StringReader(csv);
      OpenCSVParser parser = new OpenCSVParser(reader, new ParseOptions())
    ) {
      Iterator<Row> rows = parser.iterator();

      assertNextRow("1st", rows, "value1", "c", "10", "10.1");
      assertNextRow("2nd", rows, "value2", "c2", "102", Boolean.TRUE.toString());

      // hasNext() is checked twice on purpose: it must stay false on repeated calls.
      Assert.assertFalse("Failed to detect end of rows!", rows.hasNext());
      Assert.assertFalse("Failed to detect end of rows 2nd time!", rows.hasNext());
    }
  }

  /**
   * A newline inside a quoted field is kept as part of the value, both when it is
   * plain and when it is preceded by the default escape character (backslash).
   */
  @Test
  public void testQuotedAndEscapedEndline() throws Exception {
    String csv = "\"row1-\ncol1\",1,1.1\n\"row2-\\\ncol1\",2,2.2\n";
    ParseOptions po = new ParseOptions();

    try (
      StringReader reader = new StringReader(csv);
      OpenCSVParser parser = new OpenCSVParser(reader, po)
    ) {
      Iterator<Row> rows = parser.iterator();

      assertNextRow("1st", rows, "row1-\ncol1", "1", "1.1");
      assertNextRow("2nd", rows, "row2-\ncol1", "2", "2.2");
    }
  }

  /**
   * A doubled quote inside a quoted field is read as one literal quote.
   */
  @Test
  public void testQuotedDoubleQuote() throws Exception {
    String csv = "\"aaa\",\"b\"\"bb\",\"ccc\"";
    ParseOptions po = new ParseOptions();

    try (
      StringReader reader = new StringReader(csv);
      OpenCSVParser parser = new OpenCSVParser(reader, po)
    ) {
      assertNextRow("1st", parser.iterator(), "aaa", "b\"bb", "ccc");
    }
  }

  /**
   * A backslash-escaped quote inside a quoted field is read as one literal quote.
   */
  @Test
  public void testEscapedDoubleQuote() throws Exception {
    String csv = "\"aaa\",\"b\\\"bb\",\"ccc\"";
    ParseOptions po = new ParseOptions();

    try (
      StringReader reader = new StringReader(csv);
      OpenCSVParser parser = new OpenCSVParser(reader, po)
    ) {
      assertNextRow("1st", parser.iterator(), "aaa", "b\"bb", "ccc");
    }
  }

  /**
   * With '$' configured as escape character, "$" followed by a quote inside a
   * quoted field is read as one literal quote.
   */
  @Test
  public void testSpecialEscape() throws Exception {
    String csv = "\"aaa\",\"b$\"bb\",\"ccc\"";
    ParseOptions po = new ParseOptions();
    po.setOption(ParseOptions.OPTIONS_CSV_ESCAPE_CHAR, '$');

    try (
      StringReader reader = new StringReader(csv);
      OpenCSVParser parser = new OpenCSVParser(reader, po)
    ) {
      assertNextRow("1st", parser.iterator(), "aaa", "b\"bb", "ccc");
    }
  }

  /**
   * With '$' configured as escape character, a doubled "$$" is read as one
   * literal '$'.
   */
  @Test
  public void testSpecialEscapedEscape() throws Exception {
    String csv = "aaa,b$$bb,ccc";
    ParseOptions po = new ParseOptions();
    po.setOption(ParseOptions.OPTIONS_CSV_ESCAPE_CHAR, '$');

    try (
      StringReader reader = new StringReader(csv);
      OpenCSVParser parser = new OpenCSVParser(reader, po)
    ) {
      assertNextRow("1st", parser.iterator(), "aaa", "b$bb", "ccc");
    }
  }

  /**
   * With '$' configured as escape character, a single '$' in front of an ordinary
   * character is dropped from the value.
   */
  @Test
  public void testSpecialUnEscapedEscape() throws Exception {
    String csv = "aaa,b$bb,ccc";
    ParseOptions po = new ParseOptions();
    po.setOption(ParseOptions.OPTIONS_CSV_ESCAPE_CHAR, '$');

    try (
      StringReader reader = new StringReader(csv);
      OpenCSVParser parser = new OpenCSVParser(reader, po)
    ) {
      assertNextRow("1st", parser.iterator(), "aaa", "bbb", "ccc");
    }
  }

  /**
   * The control character '\001' can be used as escape character: in an unquoted
   * field, '\001' followed by a quote is read as one literal quote.
   */
  @Test
  public void test001Escape() throws Exception {
    String csv = "aaa,b\001\"bb,ccc";
    ParseOptions po = new ParseOptions();
    po.setOption(ParseOptions.OPTIONS_CSV_ESCAPE_CHAR, '\001');

    try (
      StringReader reader = new StringReader(csv);
      OpenCSVParser parser = new OpenCSVParser(reader, po)
    ) {
      assertNextRow("1st", parser.iterator(), "aaa", "b\"bb", "ccc");
    }
  }

  /**
   * The control character '\001' can be used as quote character: fields wrapped in
   * it are unwrapped, and a doubled '\001' inside a field is read as one literal '\001'.
   */
  @Test
  public void testSpecialQuote() throws Exception {
    String csv = "\001aaa\001,\001b\001\001bb\001,\001ccc\001";
    ParseOptions po = new ParseOptions();
    po.setOption(ParseOptions.OPTIONS_CSV_QUOTE, '\001');

    try (
      StringReader reader = new StringReader(csv);
      OpenCSVParser parser = new OpenCSVParser(reader, po)
    ) {
      assertNextRow("1st", parser.iterator(), "aaa", "b\001bb", "ccc");
    }
  }

  /**
   * With a blank configured as delimiter, blanks inside quoted fields are kept as
   * part of the value while unquoted blanks separate the fields.
   */
  @Test
  public void testSpaceAsDelimiterAndQuoted() throws Exception {
    String csv = "aaa \"b bb\" ccc\naaa2 bbb2 \"c cc2\"";
    ParseOptions po = new ParseOptions();
    po.setOption(ParseOptions.OPTIONS_CSV_DELIMITER, ' ');

    try (
      StringReader reader = new StringReader(csv);
      OpenCSVParser parser = new OpenCSVParser(reader, po)
    ) {
      Iterator<Row> rows = parser.iterator();

      assertNextRow("1st", rows, "aaa", "b bb", "ccc");
      assertNextRow("2nd", rows, "aaa2", "bbb2", "c cc2");
    }
  }

  /**
   * With default options, a backslash in front of a delimiter in an unquoted field
   * does not protect the delimiter: the field is still split in two.
   */
  @Test
  public void testFailedDelimiterEscaped() throws Exception {
    String csv = "aaa,b\\,bb,ccc";
    ParseOptions po = new ParseOptions();

    try (
      StringReader reader = new StringReader(csv);
      OpenCSVParser parser = new OpenCSVParser(reader, po)
    ) {
      // different from Common CSVParser
      assertNextRow("1st", parser.iterator(), "aaa", "b", "bb", "ccc");
    }
  }
}