/*
* Copyright (c) 2007-2010 Concurrent, Inc. All Rights Reserved.
*
* Project and contact information: http://www.cascading.org/
*
* This file is part of the Cascading project.
*
* Cascading is free software: you can redistribute it and/or modify
* it under the terms of the GNU General Public License as published by
* the Free Software Foundation, either version 3 of the License, or
* (at your option) any later version.
*
* Cascading is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU General Public License for more details.
*
* You should have received a copy of the GNU General Public License
* along with Cascading. If not, see <http://www.gnu.org/licenses/>.
*/
package cascading.operation.assertion;
import java.io.File;
import java.io.IOException;
import java.util.Map;
import cascading.ClusterTestCase;
import cascading.TestConstants;
import cascading.flow.Flow;
import cascading.flow.FlowConnector;
import cascading.operation.AssertionLevel;
import cascading.operation.aggregator.Count;
import cascading.operation.regex.RegexFilter;
import cascading.operation.regex.RegexParser;
import cascading.pipe.Each;
import cascading.pipe.Every;
import cascading.pipe.GroupBy;
import cascading.pipe.Pipe;
import cascading.scheme.TextLine;
import cascading.tap.Hfs;
import cascading.tap.Tap;
import cascading.tuple.Fields;
/**
 * Runs value and group assertions against a small pipe assembly that parses
 * Apache log lines, keeps the records whose method matches {@code ^POST},
 * groups them by method and counts them.
 * <p/>
 * The "pass" tests expect a count / group size of seven, the "fail" tests assert
 * a count / group size of zero and expect the flow to throw. The "removal" tests
 * run the failing assembly under different planner assertion levels and check
 * whether the assertions still fire.
 */
public class AppliedAssertionsTest extends ClusterTestCase
  {
  String inputFileApache = "build/test/data/apache.10.txt";
  String outputPath = "build/test/output/assertions/";

  private String apacheCommonRegex = TestConstants.APACHE_COMMON_REGEX;
  private RegexParser apacheCommonParser = new RegexParser( new Fields( "ip", "time", "method", "event", "status", "size" ), apacheCommonRegex, new int[]{
    1, 2, 3, 4, 5, 6} );

  public AppliedAssertionsTest()
    {
    super( "applied assertions", false );
    }

  /** A STRICT value assertion that holds (count equals 7) must let the flow complete with one result line. */
  public void testValueAssertionsPass() throws Exception
    {
    Tap source = prepareSource();
    Tap sink = createSink( "value/pass" );
    Pipe pipe = createValueAssertionPipe( AssertionLevel.STRICT, 7L );

    Flow flow = new FlowConnector( getProperties() ).connect( source, sink, pipe );

    flow.complete();

    validateLength( flow, 1, null );
    }

  /** A STRICT value assertion that does not hold (count equals 0) must make the flow throw. */
  public void testValueAssertionsFail() throws Exception
    {
    Tap source = prepareSource();
    Tap sink = createSink( "value/fail" );
    Pipe pipe = createValueAssertionPipe( AssertionLevel.STRICT, 0L );

    Flow flow = new FlowConnector( getProperties() ).connect( source, sink, pipe );

    assertFlowFails( flow );
    }

  /**
   * Runs the failing value assertion under several planner levels; the boolean
   * states whether the flow is expected to complete without an assertion firing.
   */
  public void testValueAssertionsRemoval() throws Exception
    {
    runValueAssertions( AssertionLevel.NONE, AssertionLevel.STRICT, true );
    runValueAssertions( AssertionLevel.VALID, AssertionLevel.STRICT, true );
    runValueAssertions( AssertionLevel.STRICT, AssertionLevel.STRICT, false );

    runValueAssertions( AssertionLevel.NONE, AssertionLevel.VALID, true );
    runValueAssertions( AssertionLevel.VALID, AssertionLevel.VALID, false );
    }

  /**
   * Builds the value assertion assembly with every assertion set at {@code setLevel},
   * plans it with {@code planLevel} and verifies the outcome.
   *
   * @param planLevel assertion level handed to the {@link FlowConnector} properties
   * @param setLevel  assertion level attached to each assertion in the assembly
   * @param pass      true if the flow is expected to complete, false if it must throw
   * @throws IOException if preparing the input or validating the output fails
   */
  private void runValueAssertions( AssertionLevel planLevel, AssertionLevel setLevel, boolean pass ) throws IOException
    {
    Tap source = prepareSource();
    Tap sink = createSink( "value/" + planLevel + "/" + setLevel );
    Pipe pipe = createValueAssertionPipe( setLevel, 0L );

    Map<Object, Object> properties = getProperties();

    FlowConnector.setAssertionLevel( properties, planLevel );

    Flow flow = new FlowConnector( properties ).connect( source, sink, pipe );

    completeAndVerify( flow, pass, "value, plan=" + planLevel + ", set=" + setLevel );
    }

  /** A STRICT group assertion that holds (group size equals 7) must let the flow complete with one result line. */
  public void testGroupAssertionsPass() throws Exception
    {
    Tap source = prepareSource();
    // kept under "group/" so the output mirrors the "value/pass" layout of the value tests
    Tap sink = createSink( "group/pass" );
    Pipe pipe = createGroupAssertionPipe( AssertionLevel.STRICT, 7L );

    Flow flow = new FlowConnector( getProperties() ).connect( source, sink, pipe );

    flow.complete();

    validateLength( flow, 1, null );
    }

  /** A STRICT group assertion that does not hold (group size equals 0) must make the flow throw. */
  public void testGroupAssertionsFail() throws Exception
    {
    Tap source = prepareSource();
    Tap sink = createSink( "group/fail" );
    Pipe pipe = createGroupAssertionPipe( AssertionLevel.STRICT, 0L );

    Flow flow = new FlowConnector( getProperties() ).connect( source, sink, pipe );

    assertFlowFails( flow );
    }

  /**
   * Runs the failing group assertion under several planner levels; the boolean
   * states whether the flow is expected to complete without an assertion firing.
   */
  public void testGroupAssertionsRemoval() throws Exception
    {
    runGroupAssertions( AssertionLevel.NONE, AssertionLevel.STRICT, true );
    runGroupAssertions( AssertionLevel.VALID, AssertionLevel.STRICT, true );
    runGroupAssertions( AssertionLevel.STRICT, AssertionLevel.STRICT, false );

    runGroupAssertions( AssertionLevel.NONE, AssertionLevel.VALID, true );
    runGroupAssertions( AssertionLevel.VALID, AssertionLevel.VALID, false );
    }

  /**
   * Builds the group assertion assembly with every assertion set at {@code setLevel},
   * plans it with {@code planLevel} and verifies the outcome.
   *
   * @param planLevel assertion level handed to the {@link FlowConnector} properties
   * @param setLevel  assertion level attached to each assertion in the assembly
   * @param pass      true if the flow is expected to complete, false if it must throw
   * @throws IOException if preparing the input or validating the output fails
   */
  private void runGroupAssertions( AssertionLevel planLevel, AssertionLevel setLevel, boolean pass ) throws IOException
    {
    Tap source = prepareSource();
    // "group/" rather than "value/": the group runs must not overwrite the value runs' output
    Tap sink = createSink( "group/" + planLevel + "/" + setLevel );
    Pipe pipe = createGroupAssertionPipe( setLevel, 0L );

    Map<Object, Object> properties = getProperties();

    FlowConnector.setAssertionLevel( properties, planLevel );

    Flow flow = new FlowConnector( properties ).connect( source, sink, pipe );

    completeAndVerify( flow, pass, "group, plan=" + planLevel + ", set=" + setLevel );
    }

  /**
   * Fails the test if the local data file is missing, copies it via
   * {@code copyFromLocal} and returns a text line source tap over it.
   */
  private Tap prepareSource() throws IOException
    {
    if( !new File( inputFileApache ).exists() )
      fail( "data file not found" );

    copyFromLocal( inputFileApache );

    return new Hfs( new TextLine( new Fields( "offset", "line" ) ), inputFileApache );
    }

  /** Returns a text line sink tap at {@code outputPath + relativePath}, created with the replace flag set. */
  private Tap createSink( String relativePath )
    {
    return new Hfs( new TextLine(), outputPath + relativePath, true );
    }

  /**
   * Builds the part of the assembly shared by all tests: parse the line, assert
   * no nulls, keep {@code ^POST} methods, assert the match, group by method and count.
   *
   * @param level assertion level attached to the two value assertions in this prefix
   */
  private Pipe createCountByMethodPipe( AssertionLevel level )
    {
    Pipe pipe = new Pipe( "test" );

    pipe = new Each( pipe, new Fields( "line" ), apacheCommonParser );
    pipe = new Each( pipe, level, new AssertNotNull() );
    pipe = new Each( pipe, new Fields( "method" ), new RegexFilter( "^POST" ) );
    pipe = new Each( pipe, new Fields( "method" ), level, new AssertMatches( "^POST" ) );
    pipe = new GroupBy( pipe, new Fields( "method" ) );
    pipe = new Every( pipe, new Count(), new Fields( "method", "count" ) ); // count is a long value

    return pipe;
    }

  /** Appends a value assertion on the "count" field to the shared assembly. */
  private Pipe createValueAssertionPipe( AssertionLevel level, long expectedCount )
    {
    Pipe pipe = createCountByMethodPipe( level );

    return new Each( pipe, new Fields( "count" ), level, new AssertEquals( expectedCount ) );
    }

  /** Appends a group size assertion to the shared assembly. */
  private Pipe createGroupAssertionPipe( AssertionLevel level, long expectedSize )
    {
    Pipe pipe = createCountByMethodPipe( level );

    return new Every( pipe, level, new AssertGroupSizeEquals( expectedSize ) );
    }

  /** Completes the flow and fails the test unless completing it throws an exception. */
  private void assertFlowFails( Flow flow )
    {
    try
      {
      flow.complete();
      }
    catch( Exception ignored )
      {
      // expected: the failing assertion aborts the flow
      return;
      }

    fail( "no assertions thrown" );
    }

  /**
   * Completes the flow and checks the outcome against the expectation. When the
   * flow is expected to pass, the sink must hold exactly one line.
   *
   * @param flow    flow to run
   * @param pass    true if the flow must complete, false if it must throw
   * @param context description of the run, included in failure messages
   * @throws IOException if validating the output fails
   */
  private void completeAndVerify( Flow flow, boolean pass, String context ) throws IOException
    {
    try
      {
      flow.complete();
      }
    catch( Exception exception )
      {
      // report the caught exception so an unexpected failure can be diagnosed
      if( pass )
        fail( "assertion thrown (" + context + "): " + exception );

      return;
      }

    if( !pass )
      fail( "no assertions thrown (" + context + ")" );

    validateLength( flow, 1, null );
    }
  }