/*******************************************************************************
* Copyright 2017 Capital One Services, LLC and Bitwise, Inc.
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
* http://www.apache.org/licenses/LICENSE-2.0
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License
*******************************************************************************/
package hydrograph.engine.cascading.assembly;
import cascading.flow.Flow;
import cascading.flow.FlowDef;
import cascading.flow.hadoop2.Hadoop2MR1FlowConnector;
import cascading.tuple.Fields;
import hydrograph.engine.cascading.assembly.InputFileParquetAssembly;
import hydrograph.engine.cascading.assembly.infra.ComponentParameters;
import hydrograph.engine.core.component.entity.InputFileParquetEntity;
import hydrograph.engine.core.component.entity.elements.OutSocket;
import hydrograph.engine.core.component.entity.elements.SchemaField;
import hydrograph.engine.utilites.AssemblyBuildHelper;
import hydrograph.engine.utilites.CascadingTestCase;
import org.junit.Test;
import java.io.IOException;
import java.util.ArrayList;
import java.util.List;
import java.util.Properties;
import static data.InputData.inputFileParquet;
/**
 * Integration-style test for {@link InputFileParquetAssembly}.
 *
 * <p>The test configures an {@link InputFileParquetEntity} that reads from the
 * path exposed as {@code data.InputData.inputFileParquet}, wires the assembly's
 * out link to an output location through {@link AssemblyBuildHelper}, runs the
 * resulting flow, and passes the sink to
 * {@link CascadingTestCase#validateFieldLength} with an expected value of 5.
 */
public class InputFileParquetFileTest {

    /** Schema column names, in declaration order; every column is typed as a String. */
    private static final String[] COLUMN_NAMES = { "name", "surname", "city", "val", "date" };

    /** Fully qualified Java type assigned to every schema column. */
    private static final String COLUMN_TYPE = "java.lang.String";

    /**
     * Builds the Parquet input assembly, connects it to an output sink, runs the
     * flow to completion and validates the sink contents.
     *
     * @throws IOException declared because opening the flow sink may fail with an I/O error
     */
    @Test
    public void itShouldTestParquetInputFileAssembly() throws IOException {
        Fields outputFields = new Fields("name", "surname", "city", "val", "date");
        InputFileParquetEntity parquetEntity = buildParquetEntity();

        // The assembly registers itself against the flow definition carried by the parameters.
        FlowDef definition = FlowDef.flowDef();
        ComponentParameters parameters = new ComponentParameters();
        parameters.setFlowDef(definition);
        InputFileParquetAssembly assembly = new InputFileParquetAssembly(parquetEntity, parameters);

        // Attach the assembly's "outSocket" out link to the output location.
        AssemblyBuildHelper.generateOutputPipes(
                outputFields,
                assembly.getOutLink("out", "outSocket", parquetEntity.getComponentId()),
                "testData/component/output/parquetIPFile",
                definition);

        Flow<?> parquetFlow = new Hadoop2MR1FlowConnector().connect(definition);
        parquetFlow.complete();

        CascadingTestCase.validateFieldLength(parquetFlow.openSink(), 5);
    }

    /**
     * Creates the entity describing the Parquet input component: source path,
     * component id, schema, runtime properties and a single out socket.
     *
     * @return the fully populated entity used by the test
     */
    private static InputFileParquetEntity buildParquetEntity() {
        InputFileParquetEntity parquetEntity = new InputFileParquetEntity();
        parquetEntity.setPath(inputFileParquet);
        parquetEntity.setComponentId("input");

        List<SchemaField> schema = new ArrayList<SchemaField>();
        for (String column : COLUMN_NAMES) {
            schema.add(new SchemaField(column, COLUMN_TYPE));
        }
        parquetEntity.setFieldsList(schema);

        Properties runtimeProperties = new Properties();
        runtimeProperties.setProperty("prop", "propValue");
        parquetEntity.setRuntimeProperties(runtimeProperties);

        List<OutSocket> sockets = new ArrayList<OutSocket>();
        sockets.add(new OutSocket("outSocket"));
        parquetEntity.setOutSocketList(sockets);

        return parquetEntity;
    }
}