/******************************************************************************* * Copyright 2017 Capital One Services, LLC and Bitwise, Inc. * Licensed under the Apache License, Version 2.0 (the "License"); * you may not use this file except in compliance with the License. * You may obtain a copy of the License at * http://www.apache.org/licenses/LICENSE-2.0 * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License *******************************************************************************/ package hydrograph.engine.cascading.assembly; import cascading.flow.Flow; import cascading.flow.FlowDef; import cascading.flow.hadoop2.Hadoop2MR1FlowConnector; import hydrograph.engine.cascading.assembly.InputFileDelimitedAssembly; import hydrograph.engine.cascading.assembly.infra.ComponentParameters; import hydrograph.engine.core.component.entity.InputFileDelimitedEntity; import hydrograph.engine.core.component.entity.elements.OutSocket; import hydrograph.engine.core.component.entity.elements.SchemaField; import hydrograph.engine.utilites.AssemblyBuildHelper; import hydrograph.engine.utilites.CascadingTestCase; import org.junit.Test; import java.io.IOException; import java.util.ArrayList; import java.util.List; import static data.InputData.inputFileDelimited; public class InputFileDelimitedTest { @Test public void itShouldCheckFieldLengthOfDelimitedInputFile() throws IOException { String outPath = "testData/component/input/output/file1_input"; FlowDef flowDef = FlowDef.flowDef(); ComponentParameters cpInput = new ComponentParameters(); cpInput.setFlowDef(flowDef); InputFileDelimitedEntity inputFileDelimitedEntity = new InputFileDelimitedEntity(); inputFileDelimitedEntity.setComponentId("input"); inputFileDelimitedEntity.setPath(inputFileDelimited); inputFileDelimitedEntity.setDelimiter(","); List<SchemaField> fieldList = new ArrayList<SchemaField>(); SchemaField sf1 = new SchemaField("name", "java.lang.String"); SchemaField sf2 = new SchemaField("surname", "java.lang.String"); SchemaField sf3 = new SchemaField("city", "java.lang.String"); SchemaField sf4 = new SchemaField("val", "java.math.BigDecimal"); sf4.setFieldScale(3); sf4.setFieldScaleType("explicit"); SchemaField sf5 = new SchemaField("date", "java.util.Date"); sf5.setFieldFormat("yyyy-MM-dd"); fieldList.add(sf1); fieldList.add(sf2); fieldList.add(sf3); fieldList.add(sf4); fieldList.add(sf5); List<OutSocket> outSockets = new ArrayList<OutSocket>(); outSockets.add(new OutSocket("outSocket")); inputFileDelimitedEntity.setFieldsList(fieldList); inputFileDelimitedEntity.setOutSocketList(outSockets); InputFileDelimitedAssembly inputFile = new InputFileDelimitedAssembly( inputFileDelimitedEntity, cpInput); AssemblyBuildHelper.generateOutputPipes(inputFile.getOutLink("out", "outSocket", inputFileDelimitedEntity.getComponentId()), outPath, flowDef); Flow<?> flow = new Hadoop2MR1FlowConnector().connect(flowDef); flow.complete(); CascadingTestCase.validateFieldLength(flow.openSink(), 5); } }