/*
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
package com.qubole.presto.kinesis.decoder.csv;

import static com.google.common.base.Preconditions.checkState;

import java.nio.charset.StandardCharsets;
import java.util.List;
import java.util.Map;
import java.util.Set;

import au.com.bytecode.opencsv.CSVParser;

import com.qubole.presto.kinesis.KinesisColumnHandle;
import com.qubole.presto.kinesis.KinesisFieldValueProvider;
import com.qubole.presto.kinesis.decoder.KinesisFieldDecoder;
import com.qubole.presto.kinesis.decoder.KinesisRowDecoder;
import com.google.inject.Inject;

/**
 * Row decoder that treats a record payload as one line of CSV text.
 *
 * <p>The payload bytes are read as UTF-8, split into fields with a default-configured
 * {@link CSVParser}, and each non-internal column picks its field by the integer
 * position stored in the column handle's mapping.
 */
public class CsvKinesisRowDecoder implements KinesisRowDecoder {
    /** Name returned by {@link #getName()}. */
    public static final String NAME = "csv";

    /** Parser instance reused for every call to {@code decodeRow}. */
    private final CSVParser parser = new CSVParser();

    @Inject
    CsvKinesisRowDecoder() {
    }

    /**
     * @return the constant {@link #NAME}
     */
    @Override
    public String getName() {
        return NAME;
    }

    /**
     * Splits the payload into CSV fields and appends one value provider per decodable column
     * to {@code fieldValueProviders}.
     *
     * <p>A column contributes nothing when it is internal, when its position lies at or beyond
     * the number of parsed fields, or when {@code fieldDecoders} holds no decoder for it.
     *
     * @param data raw record bytes, interpreted as UTF-8 text
     * @param fieldValueProviders output set that receives the decoded value providers
     * @param columnHandles columns to populate, visited in iteration order
     * @param fieldDecoders decoder lookup keyed by column handle
     * @return {@code false} if converting or parsing the payload threw any exception,
     *         {@code true} once all columns have been visited
     * @throws IllegalStateException if a non-internal column has a {@code null} mapping
     * @throws NumberFormatException if a non-internal column's mapping is not a parseable integer
     */
    @Override
    public boolean decodeRow(byte[] data,
            Set<KinesisFieldValueProvider> fieldValueProviders,
            List<KinesisColumnHandle> columnHandles,
            Map<KinesisColumnHandle, KinesisFieldDecoder<?>> fieldDecoders) {
        String[] tokens;
        try {
            // TODO - A per-row formatHint could be used to choose the charset here instead of
            // always assuming UTF-8.
            tokens = parser.parseLine(new String(data, StandardCharsets.UTF_8));
        } catch (Exception e) {
            // Any failure while turning the bytes into fields is reported through the return value.
            return false;
        }

        for (KinesisColumnHandle handle : columnHandles) {
            if (!handle.isInternal()) {
                String mapping = handle.getMapping();
                checkState(mapping != null, "No mapping for column handle %s!", handle);

                // NOTE(review): only the upper bound is checked below; a negative mapping would
                // reach the array access unguarded - confirm mappings are validated upstream.
                int position = Integer.parseInt(mapping);
                if (position < tokens.length) {
                    @SuppressWarnings("unchecked")
                    KinesisFieldDecoder<String> stringDecoder =
                            (KinesisFieldDecoder<String>) fieldDecoders.get(handle);
                    if (stringDecoder != null) {
                        fieldValueProviders.add(stringDecoder.decode(tokens[position], handle));
                    }
                }
            }
        }

        return true;
    }
}