/*
* Copyright (c) 2007-2010 Concurrent, Inc. All Rights Reserved.
*
* Project and contact information: http://www.cascading.org/
*
* This file is part of the Cascading project.
*
* Cascading is free software: you can redistribute it and/or modify
* it under the terms of the GNU General Public License as published by
* the Free Software Foundation, either version 3 of the License, or
* (at your option) any later version.
*
* Cascading is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU General Public License for more details.
*
* You should have received a copy of the GNU General Public License
* along with Cascading. If not, see <http://www.gnu.org/licenses/>.
*/
package cascading;
import java.util.HashMap;
import java.util.Map;
import cascading.flow.FlowConnector;
import cascading.operation.aggregator.Count;
import cascading.operation.regex.RegexParser;
import cascading.pipe.Each;
import cascading.pipe.Every;
import cascading.pipe.GroupBy;
import cascading.pipe.Pipe;
import cascading.scheme.TextLine;
import cascading.tap.Hfs;
import cascading.tap.Tap;
import cascading.tuple.Fields;
/**
 * Checks how trap names given to {@link FlowConnector} are matched against the
 * pipe names of an assembly.
 * <p>
 * Every test only builds an assembly and calls {@code connect(...)}; the value
 * returned by {@code connect(...)} is discarded and nothing is started here.
 */
public class BasicTrapTest extends CascadingTestCase
{
  String inputFileApache = "build/test/data/apache.10.txt";
  String outputPath = "build/test/output/traps/";

  public BasicTrapTest()
  {
    super( "trap tests" );
  }

  /** Returns a fresh map containing only the binding {@code name -> tap}. */
  private static Map<String, Tap> singleTap( String name, Tap tap )
  {
    Map<String, Tap> taps = new HashMap<String, Tap>();

    taps.put( name, tap );

    return taps;
  }

  /** Creates the source tap over {@link #inputFileApache} declaring the fields "offset" and "line". */
  private Tap apacheSource()
  {
    return new Hfs( new TextLine( new Fields( "offset", "line" ) ), inputFileApache );
  }

  /** Creates a tap located at {@code child} beneath {@link #outputPath}; used for both sinks and traps. */
  private Tap outputTap( String child )
  {
    return new Hfs( new TextLine(), outputPath + child, true );
  }

  /** Starts a new head pipe called {@code name} and parses the "ip" field out of "line". */
  private Pipe ipParser( String name )
  {
    Pipe head = new Pipe( name );

    return new Each( head, new Fields( "line" ), new RegexParser( new Fields( "ip" ), "^[^ ]*" ), new Fields( "ip" ) );
  }

  /**
   * Appends the {@code TestFunction} step, constructed with a null value.
   * NOTE(review): the original comments describe this step as "always fail" -- confirm against TestFunction.
   */
  private Pipe withTestFunction( Pipe previous )
  {
    return new Each( previous, new Fields( "ip" ), new TestFunction( new Fields( "test" ), null ), Fields.ALL );
  }

  /** A trap registered under a name ("nada") that no pipe in the assembly carries must be rejected. */
  public void testTrapNamesFail() throws Exception
  {
    Tap apache = apacheSource();

    Pipe assembly = withTestFunction( ipParser( "test" ) );
    assembly = new GroupBy( assembly, new Fields( "ip" ) );
    assembly = new Every( assembly, new Count(), new Fields( "ip", "count" ) );

    Tap output = outputTap( "all/tap" );
    Tap failures = outputTap( "all/trap" );

    // everything is bound before the try block so only connect() can satisfy the expectation
    Map<String, Tap> sourceTaps = singleTap( "test", apache );
    Map<String, Tap> sinkTaps = singleTap( "test", output );
    Map<String, Tap> trapTaps = singleTap( "nada", failures );

    try
    {
      new FlowConnector().connect( "trap test", sourceTaps, sinkTaps, trapTaps, assembly );
      fail( "did not fail on missing pipe name" );
    }
    catch( Exception expected )
    {
      // expected: connect() is supposed to reject the unknown trap name
    }
  }

  /** A trap may be bound to the head pipe name ("map") while the sink is bound to the named GroupBy ("reduce"). */
  public void testTrapNamesPass() throws Exception
  {
    Tap apache = apacheSource();

    Pipe assembly = withTestFunction( ipParser( "map" ) );
    assembly = new GroupBy( "reduce", assembly, new Fields( "ip" ) );
    assembly = new Every( assembly, new Count(), new Fields( "ip", "count" ) );

    Tap output = outputTap( "all/tap" );
    Tap failures = outputTap( "all/trap" );

    Map<String, Tap> sourceTaps = singleTap( "map", apache );
    Map<String, Tap> sinkTaps = singleTap( "reduce", output );
    Map<String, Tap> trapTaps = singleTap( "map", failures );

    new FlowConnector().connect( "trap test", sourceTaps, sinkTaps, trapTaps, assembly );
  }

  /** A trap may be bound to a pipe name ("middle") introduced part-way through the assembly. */
  public void testTrapNamesPass2() throws Exception
  {
    Tap apache = apacheSource();

    Pipe assembly = new Pipe( "middle", ipParser( "map" ) );
    assembly = withTestFunction( assembly );
    assembly = new GroupBy( "reduce", assembly, new Fields( "ip" ) );
    assembly = new Every( assembly, new Count(), new Fields( "ip", "count" ) );

    Tap output = outputTap( "all/tap" );
    Tap failures = outputTap( "all/trap" );

    Map<String, Tap> sourceTaps = singleTap( "map", apache );
    Map<String, Tap> sinkTaps = singleTap( "reduce", output );
    Map<String, Tap> trapTaps = singleTap( "middle", failures );

    new FlowConnector().connect( "trap test", sourceTaps, sinkTaps, trapTaps, assembly );
  }

  /** A trap may be bound to a pipe name ("first") introduced after the GroupBy, with the sink on a later name ("second"). */
  public void testTrapNamesPass3() throws Exception
  {
    Tap apache = apacheSource();

    Pipe assembly = withTestFunction( ipParser( "test" ) );
    assembly = new GroupBy( assembly, new Fields( "ip" ) );

    // two renamed segments after the grouping, each followed by its own aggregation
    assembly = new Pipe( "first", assembly );
    assembly = new Every( assembly, new Count(), new Fields( "ip", "count" ) );
    assembly = new Pipe( "second", assembly );
    assembly = new Every( assembly, new Count( new Fields( "count2" ) ), new Fields( "ip", "count", "count2" ) );

    Tap output = outputTap( "all/tap" );
    Tap failures = outputTap( "all/trap" );

    Map<String, Tap> sourceTaps = singleTap( "test", apache );
    Map<String, Tap> sinkTaps = singleTap( "second", output );
    Map<String, Tap> trapTaps = singleTap( "first", failures );

    new FlowConnector().connect( "trap test", sourceTaps, sinkTaps, trapTaps, assembly );
  }
}