/** * Licensed to the Apache Software Foundation (ASF) under one or more * contributor license agreements. See the NOTICE file distributed with * this work for additional information regarding copyright ownership. * The ASF licenses this file to You under the Apache License, Version 2.0 * (the "License"); you may not use this file except in compliance with * the License. You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. */ package org.apache.camel.dataformat.bindy.csv; import java.io.IOException; import java.io.InputStream; import java.io.InputStreamReader; import java.io.OutputStream; import java.util.ArrayList; import java.util.Arrays; import java.util.HashMap; import java.util.Iterator; import java.util.List; import java.util.Map; import java.util.Scanner; import org.apache.camel.Exchange; import org.apache.camel.dataformat.bindy.BindyAbstractDataFormat; import org.apache.camel.dataformat.bindy.BindyAbstractFactory; import org.apache.camel.dataformat.bindy.BindyCsvFactory; import org.apache.camel.dataformat.bindy.FormatFactory; import org.apache.camel.dataformat.bindy.util.ConverterUtils; import org.apache.camel.spi.DataFormat; import org.apache.camel.util.IOHelper; import org.apache.camel.util.ObjectHelper; import org.slf4j.Logger; import org.slf4j.LoggerFactory; /** * A <a href="http://camel.apache.org/data-format.html">data format</a> ( * {@link DataFormat}) using Bindy to marshal to and from CSV files */ public class BindyCsvDataFormat extends BindyAbstractDataFormat { private static final Logger LOG = LoggerFactory.getLogger(BindyCsvDataFormat.class); public BindyCsvDataFormat() { } public BindyCsvDataFormat(Class<?> type) { super(type); } @Override public String getDataFormatName() { return "bindy-csv"; } @SuppressWarnings("unchecked") public void marshal(Exchange exchange, Object body, OutputStream outputStream) throws Exception { BindyCsvFactory factory = (BindyCsvFactory)getFactory(); ObjectHelper.notNull(factory, "not instantiated"); // Get CRLF byte[] bytesCRLF = ConverterUtils.getByteReturn(factory.getCarriageReturn()); if (factory.getGenerateHeaderColumnNames()) { String result = factory.generateHeader(); byte[] bytes = exchange.getContext().getTypeConverter().convertTo(byte[].class, exchange, result); outputStream.write(bytes); // Add a carriage return outputStream.write(bytesCRLF); } List<Map<String, Object>> models = new ArrayList<Map<String, Object>>(); // the body is not a prepared list of map that bindy expects so help a bit here and create one for us Iterator<Object> it = ObjectHelper.createIterator(body); while (it.hasNext()) { Object model = it.next(); if (model instanceof Map) { models.add((Map<String, Object>) model); } else { String name = model.getClass().getName(); Map<String, Object> row = new HashMap<String, Object>(1); row.put(name, model); row.putAll(createLinkedFieldsModel(model)); models.add(row); } } for (Map<String, Object> model : models) { String result = factory.unbind(model); byte[] bytes = exchange.getContext().getTypeConverter().convertTo(byte[].class, exchange, result); outputStream.write(bytes); // Add a carriage return outputStream.write(bytesCRLF); } } /** * check emptyStream and if CVSRecord is allow to process emptyStreams * avoid IllegalArgumentException and return empty list when unmarshalling */ private boolean checkEmptyStream(BindyCsvFactory factory, InputStream inputStream) throws IOException { boolean allowEmptyStream = factory.isAllowEmptyStream(); boolean isStreamEmpty = false; boolean canReturnEmptyListOfModels = false; if (inputStream == null || inputStream.available() == 0) { isStreamEmpty = true; } if (isStreamEmpty && allowEmptyStream) { canReturnEmptyListOfModels = true; } return canReturnEmptyListOfModels; } public Object unmarshal(Exchange exchange, InputStream inputStream) throws Exception { BindyCsvFactory factory = (BindyCsvFactory)getFactory(); ObjectHelper.notNull(factory, "not instantiated"); // List of Pojos List<Map<String, Object>> models = new ArrayList<Map<String, Object>>(); // Pojos of the model Map<String, Object> model; InputStreamReader in = null; Scanner scanner = null; try { if (checkEmptyStream(factory, inputStream)) { return models; } in = new InputStreamReader(inputStream, IOHelper.getCharsetName(exchange)); // Scanner is used to read big file scanner = new Scanner(in); // Retrieve the separator defined to split the record String separator = factory.getSeparator(); String quote = factory .getQuote(); ObjectHelper.notNull(separator, "The separator has not been defined in the annotation @CsvRecord or not instantiated during initModel."); int count = 0; // If the first line of the CSV file contains columns name, then we // skip this line if (factory.getSkipFirstLine()) { // Check if scanner is empty if (scanner.hasNextLine()) { scanner.nextLine(); } } while (scanner.hasNextLine()) { // Read the line String line = scanner.nextLine().trim(); if (ObjectHelper.isEmpty(line)) { // skip if line is empty continue; } // Increment counter count++; // Create POJO where CSV data will be stored model = factory.factory(); // Split the CSV record according to the separator defined in // annotated class @CSVRecord String[] tokens = line.split(separator, factory.getAutospanLine() ? factory.getMaxpos() : -1); List<String> result = Arrays.asList(tokens); // must unquote tokens before use result = unquoteTokens(result, separator, quote); if (result.size() == 0 || result.isEmpty()) { throw new java.lang.IllegalArgumentException("No records have been defined in the CSV"); } else { if (LOG.isDebugEnabled()) { LOG.debug("Size of the record splitted : {}", result.size()); } // Bind data from CSV record with model classes factory.bind(result, model, count); // Link objects together factory.link(model); // Add objects graph to the list models.add(model); LOG.debug("Graph of objects created: {}", model); } } // BigIntegerFormatFactory if models list is empty or not // If this is the case (correspond to an empty stream, ...) if (models.size() == 0) { throw new java.lang.IllegalArgumentException("No records have been defined in the CSV"); } else { return extractUnmarshalResult(models); } } finally { if (scanner != null) { scanner.close(); } if (in != null) { IOHelper.close(in, "in", LOG); } } } /** * Unquote the tokens, by removing leading and trailing quote chars, * as will handling fixing broken tokens which may have been split * by a separator inside a quote. */ private List<String> unquoteTokens(List<String> result, String separator, String quote) { // a current quoted token which we assemble from the broken pieces // we need to do this as we use the split method on the String class // to split the line using regular expression, and it does not handle // if the separator char is also inside a quoted token, therefore we need // to fix this afterwards StringBuilder current = new StringBuilder(); boolean inProgress = false; List<String> answer = new ArrayList<String>(); //parsing assumes matching close and end quotes for (String s : result) { boolean canStart = false; boolean canClose = false; boolean cutStart = false; boolean cutEnd = false; if (s.startsWith(quote)) { //token is just a quote if (s.length() == 1) { s = ""; //if token is a quote then it can only close processing if it has begun if (inProgress) { canClose = true; } else { canStart = true; } } else { //quote+"not empty" cutStart = true; canStart = true; } } //"not empty"+quote if (s.endsWith(quote)) { cutEnd = true; canClose = true; } //optimize to only substring once if (cutEnd || cutStart) { s = s.substring(cutStart ? 1 : 0, cutEnd ? s.length() - 1 : s.length()); } // are we in progress of rebuilding a broken token if (inProgress) { current.append(separator); current.append(s); if (canClose) { answer.add(current.toString()); current.setLength(0); inProgress = false; } } else { if (canStart && !canClose) { current.append(s); inProgress = true; } else { //case where no quotes answer.add(s); } } } // any left over from current? if (current.length() > 0) { answer.add(current.toString()); current.setLength(0); } return answer; } @Override protected BindyAbstractFactory createModelFactory(FormatFactory formatFactory) throws Exception { BindyCsvFactory bindyCsvFactory = new BindyCsvFactory(getClassType()); bindyCsvFactory.setFormatFactory(formatFactory); return bindyCsvFactory; } }