package org.apache.blur.mapreduce.lib;

/**
 * Licensed to the Apache Software Foundation (ASF) under one or more
 * contributor license agreements. See the NOTICE file distributed with
 * this work for additional information regarding copyright ownership.
 * The ASF licenses this file to You under the Apache License, Version 2.0
 * (the "License"); you may not use this file except in compliance with
 * the License. You may obtain a copy of the License at
 *
 * http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
import java.io.IOException;

import org.apache.blur.mapreduce.lib.BlurMutate.MUTATE_TYPE;
import org.apache.hadoop.conf.Configuration;
import org.apache.hadoop.fs.Path;
import org.apache.hadoop.io.LongWritable;
import org.apache.hadoop.io.Text;
import org.apache.hadoop.io.Writable;
import org.apache.hadoop.mrunit.mapreduce.MapDriver;
import org.junit.Before;
import org.junit.Test;

/**
 * MRUnit tests for {@link CsvBlurMapper}.
 *
 * <p>Every test feeds a single CSV line through the mapper and verifies that
 * exactly one {@link BlurMutate} of type {@code REPLACE} is emitted for family
 * {@code cf1} carrying {@code col1=value1} and {@code col2=value2}. The tests
 * differ in which leading fields (row id, record id, family) are present in
 * the CSV line and which ones the mapper is configured to supply itself.
 */
public class CsvBlurMapperTest {

  /** Column layout handed to the mapper in every test. */
  private static final String COLUMN_DEFINITIONS = "cf1:col1,col2|cf2:col1,col2,col3";

  /** The only column family the tests expect in the mapper output. */
  private static final String FAMILY = "cf1";

  private MapDriver<Writable, Text, Text, BlurMutate> _mapDriver;
  private CsvBlurMapper _mapper;

  /** Builds a fresh mapper and MRUnit driver before each test. */
  @Before
  public void setUp() throws IOException {
    _mapper = new CsvBlurMapper();
    _mapDriver = MapDriver.newMapDriver(_mapper);
  }

  /** The CSV line carries row id, record id and family ahead of the values. */
  @Test
  public void testMapperWithFamilyInData() {
    CsvBlurMapper.setColumns(_mapDriver.getConfiguration(), COLUMN_DEFINITIONS);

    runAndExpect("rowid1,record1,cf1,value1,value2", "rowid1", "record1");
  }

  /** The family is taken from the registered path instead of the CSV line. */
  @Test
  public void testMapperFamilyPerPath() {
    configureFamilyFromPath(_mapDriver.getConfiguration());

    runAndExpect("rowid1,record1,value1,value2", "rowid1", "record1");
  }

  /** The CSV line has no record id; the mapper is told to generate it. */
  @Test
  public void testMapperAutoGenerateRecordId() {
    Configuration conf = _mapDriver.getConfiguration();
    CsvBlurMapper.setAutoGenerateRecordIdAsHashOfData(conf, true);
    configureFamilyFromPath(conf);

    runAndExpect("rowid1,value1,value2", "rowid1", "-25nqln3n2vb4cayex9y9tpxx3");
  }

  /** The CSV line has no row id; the mapper is told to generate it. */
  @Test
  public void testMapperAutoGenerateRowId() {
    Configuration conf = _mapDriver.getConfiguration();
    CsvBlurMapper.setAutoGenerateRowIdAsHashOfData(conf, true);
    configureFamilyFromPath(conf);

    runAndExpect("record1,value1,value2", "-50b4uzohynr7j7s9pve7ytz66", "record1");
  }

  /** The CSV line has values only; both ids are generated by the mapper. */
  @Test
  public void testMapperAutoGenerateRowIdAndRecordId() {
    Configuration conf = _mapDriver.getConfiguration();
    CsvBlurMapper.setAutoGenerateRecordIdAsHashOfData(conf, true);
    CsvBlurMapper.setAutoGenerateRowIdAsHashOfData(conf, true);
    configureFamilyFromPath(conf);

    runAndExpect("value1,value2", "5q0tme15ph3h5pns8sv3u5wy2", "5q0tme15ph3h5pns8sv3u5wy2");
  }

  /**
   * Sets the column layout, registers the root path for {@link #FAMILY} and
   * points the mapper at that family.
   *
   * @param conf the driver configuration to populate
   */
  private void configureFamilyFromPath(Configuration conf) {
    CsvBlurMapper.setColumns(conf, COLUMN_DEFINITIONS);
    CsvBlurMapper.addFamilyPath(conf, FAMILY, new Path("/"));
    _mapper.setFamilyFromPath(FAMILY);
  }

  /**
   * Feeds one CSV line to the driver and verifies the single expected mutate.
   *
   * @param csvLine the raw input line handed to the mapper
   * @param rowId the row id expected both as output key and inside the mutate
   * @param recordId the record id expected inside the mutate
   */
  private void runAndExpect(String csvLine, String rowId, String recordId) {
    BlurMutate expected = new BlurMutate(MUTATE_TYPE.REPLACE, rowId, recordId, FAMILY)
        .addColumn("col1", "value1")
        .addColumn("col2", "value2");

    _mapDriver.withInput(new LongWritable(), new Text(csvLine));
    _mapDriver.withOutput(new Text(rowId), expected);
    _mapDriver.runTest();
  }
}