/*
* Copyright (c) 2011-2015 EPFL DATA Laboratory
* Copyright (c) 2014-2015 The Squall Collaboration (see NOTICE)
*
* All rights reserved.
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package ch.epfl.data.squall.examples.imperative.theta;
import java.util.Arrays;
import java.util.Date;
import java.util.List;
import java.util.Map;
import org.apache.log4j.Logger;
import ch.epfl.data.squall.components.Component;
import ch.epfl.data.squall.components.DataSourceComponent;
import ch.epfl.data.squall.components.theta.ThetaJoinComponentFactory;
import ch.epfl.data.squall.expressions.ColumnReference;
import ch.epfl.data.squall.expressions.IntegerYearFromDate;
import ch.epfl.data.squall.expressions.Multiplication;
import ch.epfl.data.squall.expressions.Subtraction;
import ch.epfl.data.squall.expressions.ValueExpression;
import ch.epfl.data.squall.expressions.ValueSpecification;
import ch.epfl.data.squall.operators.AggregateOperator;
import ch.epfl.data.squall.operators.AggregateSumOperator;
import ch.epfl.data.squall.operators.ProjectOperator;
import ch.epfl.data.squall.operators.SelectOperator;
import ch.epfl.data.squall.predicates.AndPredicate;
import ch.epfl.data.squall.predicates.ComparisonPredicate;
import ch.epfl.data.squall.predicates.LikePredicate;
import ch.epfl.data.squall.query_plans.QueryBuilder;
import ch.epfl.data.squall.query_plans.QueryPlan;
import ch.epfl.data.squall.query_plans.ThetaQueryPlansParameters;
import ch.epfl.data.squall.types.DateType;
import ch.epfl.data.squall.types.DoubleType;
import ch.epfl.data.squall.types.IntegerType;
import ch.epfl.data.squall.types.NumericType;
import ch.epfl.data.squall.types.StringType;
import ch.epfl.data.squall.types.Type;
/**
 * Imperative query plan, named after TPC-H query 9, in which every join is
 * created through {@link ThetaJoinComponentFactory}.
 *
 * <p>
 * The plan reads six relations (PART, LINEITEM, PARTSUPP, ORDERS, SUPPLIER and
 * NATION), chains them with equality join predicates and finally sums
 * {@code extendedPrice * (1 - discount) - ps_supplycost * l_quantity}, grouped
 * by columns 5 and 4 of the last projection.
 *
 * <p>
 * All column indexes below are positional. A join predicate addresses the
 * columns of its left and right input separately, while the projection added
 * to a join addresses the concatenation "left columns followed by right
 * columns". NOTE(review): the attribute names in the stage comments assume the
 * standard TPC-H column order of the input files - confirm against the data.
 */
public class ThetaTPCH9Plan extends QueryPlan {
    // Not referenced anywhere in this class.
    private static final Logger LOG = Logger.getLogger(ThetaTPCH9Plan.class);

    private static final NumericType<Double> _doubleConv = new DoubleType();
    private static final Type<Date> _dateConv = new DateType();
    private static final StringType _sc = new StringType();
    private static final IntegerType _ic = new IntegerType();

    /** LIKE pattern applied to column 1 of PART. */
    private static final String COLOR = "%green%";

    /** Collects every component of the plan; handed out by {@link #getQueryPlan()}. */
    private final QueryBuilder _queryBuilder = new QueryBuilder();

    /**
     * Builds the complete plan and registers its components in the query
     * builder.
     *
     * @param dataPath
     *            prefix prepended to each table file name (e.g. "part")
     * @param extension
     *            suffix appended to each table file name
     * @param conf
     *            configuration map; it supplies the theta join type and is
     *            passed on to the aggregation operator
     */
    public ThetaTPCH9Plan(String dataPath, String extension, Map conf) {
        final int thetaJoinType = ThetaQueryPlansParameters.getThetaJoinType(conf);

        // ---- PART: keep rows whose column 1 matches COLOR, output column 0 ----
        final List<Integer> hashPart = Arrays.asList(0);
        final SelectOperator selectionPart = new SelectOperator(
                new LikePredicate(new ColumnReference(_sc, 1),
                        new ValueSpecification(_sc, COLOR)));
        final ProjectOperator projectionPart = new ProjectOperator(new int[] { 0 });
        final DataSourceComponent relationPart = new DataSourceComponent("PART",
                dataPath + "part" + extension)
                .setOutputPartKey(hashPart)
                .add(selectionPart)
                .add(projectionPart);
        _queryBuilder.add(relationPart);

        // ---- LINEITEM: output columns 0, 1, 2, 4, 5, 6 ----
        final List<Integer> hashLineitem = Arrays.asList(1);
        final ProjectOperator projectionLineitem = new ProjectOperator(
                new int[] { 0, 1, 2, 4, 5, 6 });
        final DataSourceComponent relationLineitem = new DataSourceComponent(
                "LINEITEM", dataPath + "lineitem" + extension)
                .setOutputPartKey(hashLineitem)
                .add(projectionLineitem);
        _queryBuilder.add(relationLineitem);

        // ---- PART x LINEITEM on PART[0] = LINEITEM[1] ----
        final ComparisonPredicate partLineitemPredicate = new ComparisonPredicate(
                ComparisonPredicate.EQUAL_OP,
                new ColumnReference(_ic, 0),
                new ColumnReference(_ic, 1));
        // The projection drops column 2 of the concatenated tuple, i.e. the
        // LINEITEM copy of the join column. The partition key (0, 2) names the
        // two columns read by the following join predicate.
        final Component partLineitemJoin = ThetaJoinComponentFactory
                .createThetaJoinOperator(thetaJoinType, relationPart,
                        relationLineitem, _queryBuilder)
                .setOutputPartKey(Arrays.asList(0, 2))
                .setJoinPredicate(partLineitemPredicate)
                .add(new ProjectOperator(new int[] { 0, 1, 3, 4, 5, 6 }));

        // ---- PARTSUPP: output columns 0, 1, 3 ----
        final List<Integer> hashPartsupp = Arrays.asList(0, 1);
        final ProjectOperator projectionPartsupp = new ProjectOperator(
                new int[] { 0, 1, 3 });
        final DataSourceComponent relationPartsupp = new DataSourceComponent(
                "PARTSUPP", dataPath + "partsupp" + extension)
                .setOutputPartKey(hashPartsupp)
                .add(projectionPartsupp);
        _queryBuilder.add(relationPartsupp);

        // ---- (PART x LINEITEM) x PARTSUPP on left[0] = right[0] AND left[2] = right[1] ----
        final ComparisonPredicate firstKeyPredicate = new ComparisonPredicate(
                ComparisonPredicate.EQUAL_OP,
                new ColumnReference(_ic, 0),
                new ColumnReference(_ic, 0));
        final ComparisonPredicate secondKeyPredicate = new ComparisonPredicate(
                ComparisonPredicate.EQUAL_OP,
                new ColumnReference(_ic, 2),
                new ColumnReference(_ic, 1));
        final AndPredicate partsuppPredicate = new AndPredicate(
                firstKeyPredicate, secondKeyPredicate);
        // Only column 8 (the third PARTSUPP column) survives from the right side.
        final Component partsuppJoin = ThetaJoinComponentFactory
                .createThetaJoinOperator(thetaJoinType, partLineitemJoin,
                        relationPartsupp, _queryBuilder)
                .setOutputPartKey(Arrays.asList(0))
                .add(new ProjectOperator(new int[] { 1, 2, 3, 4, 5, 8 }))
                .setJoinPredicate(partsuppPredicate);

        // ---- ORDERS: output column 0 and the year extracted from date column 4 ----
        final List<Integer> hashOrders = Arrays.asList(0);
        final ProjectOperator projectionOrders = new ProjectOperator(
                new ColumnReference(_sc, 0),
                new IntegerYearFromDate(new ColumnReference(_dateConv, 4)));
        final DataSourceComponent relationOrders = new DataSourceComponent("ORDERS",
                dataPath + "orders" + extension)
                .setOutputPartKey(hashOrders)
                .add(projectionOrders);
        _queryBuilder.add(relationOrders);

        // ---- (... x PARTSUPP) x ORDERS on left[0] = right[0] ----
        final ComparisonPredicate ordersPredicate = new ComparisonPredicate(
                ComparisonPredicate.EQUAL_OP,
                new ColumnReference(_ic, 0),
                new ColumnReference(_ic, 0));
        // The partition key is declared here as on every other intermediate
        // join: it names the column (0) read by the following join predicate.
        final Component ordersJoin = ThetaJoinComponentFactory
                .createThetaJoinOperator(thetaJoinType, partsuppJoin,
                        relationOrders, _queryBuilder)
                .setOutputPartKey(Arrays.asList(0))
                .add(new ProjectOperator(new int[] { 1, 2, 3, 4, 5, 7 }))
                .setJoinPredicate(ordersPredicate);

        // ---- SUPPLIER: output columns 0 and 3 ----
        final List<Integer> hashSupplier = Arrays.asList(0);
        final ProjectOperator projectionSupplier = new ProjectOperator(
                new int[] { 0, 3 });
        final DataSourceComponent relationSupplier = new DataSourceComponent(
                "SUPPLIER", dataPath + "supplier" + extension)
                .setOutputPartKey(hashSupplier)
                .add(projectionSupplier);
        _queryBuilder.add(relationSupplier);

        // ---- (... x ORDERS) x SUPPLIER on left[0] = right[0] ----
        final ComparisonPredicate supplierPredicate = new ComparisonPredicate(
                ComparisonPredicate.EQUAL_OP,
                new ColumnReference(_ic, 0),
                new ColumnReference(_ic, 0));
        // Column 5 of the projected output is the second SUPPLIER column; it is
        // the column compared against NATION[0] in the last join.
        final Component supplierJoin = ThetaJoinComponentFactory
                .createThetaJoinOperator(thetaJoinType, ordersJoin,
                        relationSupplier, _queryBuilder)
                .setOutputPartKey(Arrays.asList(5))
                .add(new ProjectOperator(new int[] { 1, 2, 3, 4, 5, 7 }))
                .setJoinPredicate(supplierPredicate);

        // ---- NATION: output columns 0 and 1 ----
        final List<Integer> hashNation = Arrays.asList(0);
        final ProjectOperator projectionNation = new ProjectOperator(
                new int[] { 0, 1 });
        final DataSourceComponent relationNation = new DataSourceComponent("NATION",
                dataPath + "nation" + extension)
                .setOutputPartKey(hashNation)
                .add(projectionNation);
        _queryBuilder.add(relationNation);

        // ---- Aggregation, evaluated on the component that performs the last join ----
        // Column indexes refer to the output of the final projection below.
        // 1 - discount
        final ValueExpression<Double> oneMinusDiscount = new Subtraction(
                new ValueSpecification(_doubleConv, 1.0),
                new ColumnReference(_doubleConv, 2));
        // extendedPrice * (1 - discount)
        final ValueExpression<Double> discountedPrice = new Multiplication(
                new ColumnReference(_doubleConv, 1), oneMinusDiscount);
        // ps_supplycost * l_quantity
        final ValueExpression<Double> supplyCost = new Multiplication(
                new ColumnReference(_doubleConv, 3),
                new ColumnReference(_doubleConv, 0));
        // extendedPrice * (1 - discount) - ps_supplycost * l_quantity
        final ValueExpression<Double> amount = new Subtraction(
                discountedPrice, supplyCost);
        final AggregateOperator agg = new AggregateSumOperator(amount, conf)
                .setGroupByColumns(Arrays.asList(5, 4));

        // ---- (... x SUPPLIER) x NATION on left[5] = right[0] ----
        final ComparisonPredicate nationPredicate = new ComparisonPredicate(
                ComparisonPredicate.EQUAL_OP,
                new ColumnReference(_ic, 5),
                new ColumnReference(_ic, 0));
        // Last component of the plan: nothing consumes the returned component,
        // so the chain is invoked only for its effect on the query builder.
        ThetaJoinComponentFactory
                .createThetaJoinOperator(thetaJoinType, supplierJoin,
                        relationNation, _queryBuilder)
                .add(new ProjectOperator(new int[] { 0, 1, 2, 3, 4, 7 }))
                .add(agg)
                .setJoinPredicate(nationPredicate);
    }

    /**
     * Returns the query builder populated by the constructor.
     *
     * @return the builder holding all components of this plan
     */
    @Override
    public QueryBuilder getQueryPlan() {
        return _queryBuilder;
    }
}