/* * Licensed to the Apache Software Foundation (ASF) under one * or more contributor license agreements. See the NOTICE file * distributed with this work for additional information * regarding copyright ownership. The ASF licenses this file * to you under the Apache License, Version 2.0 (the * "License"); you may not use this file except in compliance * with the License. You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. */ package org.apache.pig.test; import static org.apache.pig.ExecType.MAPREDUCE; import java.io.File; import java.io.FileOutputStream; import java.io.IOException; import java.io.PrintStream; import java.io.PrintWriter; import java.util.ArrayList; import java.util.HashMap; import java.util.HashSet; import java.util.Iterator; import java.util.List; import java.util.Map; import java.util.Random; import java.util.StringTokenizer; import org.junit.AfterClass; import org.junit.Before; import org.junit.Test; import org.junit.runner.RunWith; import org.junit.runners.JUnit4; import org.apache.pig.ComparisonFunc; import org.apache.pig.EvalFunc; import org.apache.pig.ExecType; import org.apache.pig.PigServer; import org.apache.pig.backend.executionengine.ExecException; import org.apache.pig.builtin.BinStorage; import org.apache.pig.builtin.Distinct; import org.apache.pig.builtin.PigStorage; import org.apache.pig.builtin.TextLoader; import org.apache.pig.data.*; import org.apache.pig.impl.io.FileLocalizer; import org.apache.pig.impl.io.PigFile; import org.apache.pig.impl.logicalLayer.schema.Schema; import org.apache.pig.impl.logicalLayer.FrontendException; import org.apache.pig.impl.util.Pair; import 
org.apache.pig.test.utils.GenRandomData;
import org.apache.pig.test.utils.Identity;

import junit.framework.TestCase;

/**
 * Check-in smoke tests: each test writes small input files to a shared
 * {@link MiniCluster}, runs a short Pig Latin script through a
 * {@link PigServer} in map-reduce mode, and verifies the resulting tuples.
 */
@RunWith(JUnit4.class)
public class TestCommit extends TestCase {

    private static final String STUDENT_FILE = "student";
    private static final String VOTER_FILE = "voter";
    private static final String CHECKIN2_INPUT = "testCheckin2-input.txt";
    private static final String CHECKIN2_OUTPUT = "testCheckin2-output.txt";

    /** Cluster shared by every test in this class; shut down once in {@link #oneTimeTearDown()}. */
    static MiniCluster cluster = MiniCluster.buildCluster();

    private PigServer pigServer;

    TupleFactory mTf = TupleFactory.getInstance();

    /** Creates a fresh {@link PigServer} bound to the shared cluster before each test. */
    @Before
    @Override
    public void setUp() throws Exception {
        pigServer = new PigServer(ExecType.MAPREDUCE, cluster.getProperties());
    }

    /** Shuts the shared cluster down after all tests in this class have run. */
    @AfterClass
    public static void oneTimeTearDown() throws Exception {
        cluster.shutDown();
    }

    /**
     * Filters, cogroups and flattens the student/voter inputs, sums the
     * contributions per registration, orders by that sum and checks the two
     * resulting rows.
     */
    @Test
    public void testCheckin1() throws Exception {
        Tuple expected1 = mTf.newTuple(2);
        expected1.set(0, "independent");
        expected1.set(1, 50.0);

        Tuple expected2 = mTf.newTuple(2);
        expected2.set(0, "democrat");
        expected2.set(1, 125.5);

        Util.createInputFile(cluster, STUDENT_FILE,
                new String[]{"joe smith:18:3.5", "amy brown:25:2.5", "jim fox:20:4.0", "leo fu:55:3.0"});
        Util.createInputFile(cluster, VOTER_FILE,
                new String[]{"amy brown,25,democrat,25.50", "amy brown,25,democrat,100",
                             "jim fox,20,independent,50.0"});
        try {
            pigServer.registerQuery("a = load 'student' using " + PigStorage.class.getName()
                    + "(':') as (name, age, gpa);");
            pigServer.registerQuery("b = load 'voter' using " + PigStorage.class.getName()
                    + "(',') as (name, age, registration, contributions);");
            pigServer.registerQuery("c = filter a by age < 50;");
            pigServer.registerQuery("d = filter b by age < 50;");
            pigServer.registerQuery("e = cogroup c by (name, age), d by (name, age);");
            pigServer.registerQuery("f = foreach e generate flatten(c), flatten(d);");
            pigServer.registerQuery("g = group f by registration;");
            pigServer.registerQuery("h = foreach g generate (chararray)group, SUM(f.d::contributions);");
            pigServer.registerQuery("i = order h by $1;");

            assertResult(pigServer.openIterator("i"), expected1, expected2);
        } finally {
            // Clean up even when the script or an assertion fails, so the
            // shared cluster is not left with stale inputs.
            Util.deleteFile(cluster, STUDENT_FILE);
            Util.deleteFile(cluster, VOTER_FILE);
        }
    }

    /**
     * Runs a nested foreach (filter, order, distinct) over a grouped relation,
     * stores the first two rows ordered by count, reloads the stored output and
     * checks both rows.
     */
    @Test
    public void testCheckin2() throws Exception {
        Tuple expected1 = mTf.newTuple(4);
        expected1.set(0, 18);
        expected1.set(1, 1L);
        expected1.set(2, "joe smith");
        expected1.set(3, 18);

        Tuple expected2 = mTf.newTuple(4);
        expected2.set(0, 55);
        expected2.set(1, 1L);
        expected2.set(2, "leo fu");
        expected2.set(3, 55);

        Util.createInputFile(cluster, CHECKIN2_INPUT,
                new String[]{"joe smith:18:3.5", "amy brown:18:2.5", "jim fox:20:4.0", "leo fu:55:3.0",
                             "amy smith:20:3.0"});
        try {
            pigServer.registerQuery("a = load 'testCheckin2-input.txt' using " + PigStorage.class.getName()
                    + "(':') as (name: chararray, age: int, gpa: float);");
            pigServer.registerQuery("b = group a by age;");
            pigServer.registerQuery("c = foreach b { d = filter a by gpa > 2.5; "
                    + "e = order a by name; f = a.age; g = distinct f; "
                    + " generate group, COUNT(d), MAX (e.name), MIN(g.$0);};");
            pigServer.registerQuery("h = order c by $1;");
            pigServer.registerQuery("i = limit h 2;");
            pigServer.store("i", CHECKIN2_OUTPUT);

            pigServer.registerQuery(
                    "x = load 'testCheckin2-output.txt' as (age: int, cnt: long, max: chararray, min: int);");
            pigServer.registerQuery("y = foreach x generate age, cnt, max, min;");

            assertResult(pigServer.openIterator("y"), expected1, expected2);
        } finally {
            Util.deleteFile(cluster, CHECKIN2_INPUT);
            // The stored output was previously never removed.
            // NOTE(review): assumes Util.deleteFile deletes recursively and
            // tolerates a path that does not exist (store may not have run) - confirm.
            Util.deleteFile(cluster, CHECKIN2_OUTPUT);
        }
    }

    /**
     * Drains {@code actual} and compares it row by row against {@code expected}.
     * For each expected row, every field of the expected tuple is compared with
     * the field at the same position of the actual tuple; finally the number of
     * rows produced must equal the number of expected rows.
     *
     * @param actual   iterator over the tuples produced by the script
     * @param expected expected tuples, in the order they must be produced
     * @throws Exception if a tuple field cannot be read
     */
    private static void assertResult(Iterator<Tuple> actual, Tuple... expected) throws Exception {
        int row = 0;
        while (actual.hasNext()) {
            Tuple produced = actual.next();
            // Rows beyond the expected ones are not inspected; they are
            // reported by the row-count assertion below.
            if (row < expected.length) {
                Tuple wanted = expected[row];
                for (int col = 0; col < wanted.size(); col++) {
                    assertEquals("row " + row + ", column " + col, wanted.get(col), produced.get(col));
                }
            }
            row++;
        }
        assertEquals("number of result tuples", expected.length, row);
    }
}