/* * Copyright 2013 Cloudera Inc. * * Licensed under the Apache License, Version 2.0 (the "License"); * you may not use this file except in compliance with the License. * You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. */ package org.kitesdk.morphline.avro; import java.io.IOException; import java.io.InputStream; import java.util.Collection; import java.util.Collections; import java.util.HashMap; import java.util.Map; import org.apache.avro.Schema; import org.apache.avro.Schema.Field; import org.apache.avro.generic.GenericData; import org.apache.avro.generic.IndexedRecord; import org.kitesdk.morphline.api.Command; import org.kitesdk.morphline.api.CommandBuilder; import org.kitesdk.morphline.api.MorphlineCompilationException; import org.kitesdk.morphline.api.MorphlineContext; import org.kitesdk.morphline.api.Record; import org.kitesdk.morphline.base.AbstractCommand; import org.kitesdk.morphline.base.Fields; import org.kitesdk.morphline.shaded.com.google.common.io.Closeables; import org.kitesdk.morphline.stdio.AbstractParser; import com.google.common.annotations.Beta; import com.typesafe.config.Config; /** * Command that converts a morphline record to an Avro record that contains a Map with string keys * and array values where the array values can be null, boolean, int, long, float, double, string, * bytes. */ @Beta public final class ToAvroMapBuilder implements CommandBuilder { @Override public Collection<String> getNames() { return Collections.singletonList("toAvroMap"); } @Override public Command build(Config config, Command parent, Command child, MorphlineContext context) { return new ToAvroMap(this, config, parent, child, context); } /////////////////////////////////////////////////////////////////////////////// // Nested classes: /////////////////////////////////////////////////////////////////////////////// private static final class ToAvroMap extends AbstractCommand { private final Schema schema; public ToAvroMap(CommandBuilder builder, Config config, Command parent, Command child, MorphlineContext context) { super(builder, config, parent, child, context); InputStream in = null; try { in = getClass().getResourceAsStream("morphlineRecord.avsc"); this.schema = new Schema.Parser().parse(in); } catch (IOException e) { throw new MorphlineCompilationException("Cannot parse morphlineRecord schema", config, e, builder); } finally { Closeables.closeQuietly(in); } validateArguments(); } @Override protected boolean doProcess(Record inputRecord) { Record outputRecord = inputRecord.copy(); AbstractParser.removeAttachments(outputRecord); Map<String, Collection<Object>> map = inputRecord.getFields().asMap(); map = new HashMap<String, Collection<Object>>(map); // make it mutable Field field = schema.getFields().get(0); Object avroResult = AvroConversions.toAvro(map, field.schema()); if (avroResult == AvroConversions.ERROR) { LOG.debug("Cannot convert record: {} to schema: {}", inputRecord, schema); return false; } IndexedRecord avroRecord = new GenericData.Record(schema); avroRecord.put(field.pos(), avroResult); outputRecord.put(Fields.ATTACHMENT_BODY, avroRecord); // pass record to next command in chain: return super.doProcess(outputRecord); } } }