/* * Licensed under the Apache License, Version 2.0 (the "License"); * you may not use this file except in compliance with the License. * You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. */ package com.facebook.presto.decoder.csv; import au.com.bytecode.opencsv.CSVParser; import com.facebook.presto.decoder.DecoderColumnHandle; import com.facebook.presto.decoder.FieldDecoder; import com.facebook.presto.decoder.FieldValueProvider; import com.facebook.presto.decoder.RowDecoder; import javax.inject.Inject; import java.nio.charset.StandardCharsets; import java.util.List; import java.util.Map; import java.util.Set; import static com.google.common.base.Preconditions.checkState; /** * Decode row as CSV. This is an extremely primitive CSV decoder using {@link au.com.bytecode.opencsv.CSVParser]}. */ public class CsvRowDecoder implements RowDecoder { public static final String NAME = "csv"; private final CSVParser parser = new CSVParser(); @Inject CsvRowDecoder() { } @Override public String getName() { return NAME; } @Override public boolean decodeRow(byte[] data, Map<String, String> dataMap, Set<FieldValueProvider> fieldValueProviders, List<DecoderColumnHandle> columnHandles, Map<DecoderColumnHandle, FieldDecoder<?>> fieldDecoders) { String[] fields; try { // TODO - There is no reason why the row can't have a formatHint and it could be used // to set the charset here. String line = new String(data, StandardCharsets.UTF_8); fields = parser.parseLine(line); } catch (Exception e) { return true; } for (DecoderColumnHandle columnHandle : columnHandles) { if (columnHandle.isInternal()) { continue; } String mapping = columnHandle.getMapping(); checkState(mapping != null, "No mapping for column handle %s!", columnHandle); int columnIndex = Integer.parseInt(mapping); if (columnIndex >= fields.length) { continue; } @SuppressWarnings("unchecked") FieldDecoder<String> decoder = (FieldDecoder<String>) fieldDecoders.get(columnHandle); if (decoder != null) { fieldValueProviders.add(decoder.decode(fields[columnIndex], columnHandle)); } } return false; } }