/*
* Copyright (c) 2011-2015 EPFL DATA Laboratory
* Copyright (c) 2014-2015 The Squall Collaboration (see NOTICE)
*
* All rights reserved.
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package ch.epfl.data.squall.examples.imperative.debug;
import java.util.ArrayList;
import java.util.Arrays;
import java.util.Date;
import java.util.Map;
import org.apache.log4j.Logger;
import ch.epfl.data.squall.components.Component;
import ch.epfl.data.squall.components.DataSourceComponent;
import ch.epfl.data.squall.components.theta.ThetaJoinComponentFactory;
import ch.epfl.data.squall.expressions.ColumnReference;
import ch.epfl.data.squall.expressions.IntegerYearFromDate;
import ch.epfl.data.squall.expressions.Multiplication;
import ch.epfl.data.squall.expressions.Subtraction;
import ch.epfl.data.squall.expressions.ValueExpression;
import ch.epfl.data.squall.expressions.ValueSpecification;
import ch.epfl.data.squall.operators.AggregateOperator;
import ch.epfl.data.squall.operators.AggregateSumOperator;
import ch.epfl.data.squall.operators.ProjectOperator;
import ch.epfl.data.squall.operators.SelectOperator;
import ch.epfl.data.squall.predicates.AndPredicate;
import ch.epfl.data.squall.predicates.BetweenPredicate;
import ch.epfl.data.squall.predicates.ComparisonPredicate;
import ch.epfl.data.squall.predicates.OrPredicate;
import ch.epfl.data.squall.query_plans.QueryBuilder;
import ch.epfl.data.squall.query_plans.QueryPlan;
import ch.epfl.data.squall.query_plans.ThetaQueryPlansParameters;
import ch.epfl.data.squall.types.DateType;
import ch.epfl.data.squall.types.DoubleType;
import ch.epfl.data.squall.types.IntegerType;
import ch.epfl.data.squall.types.NumericType;
import ch.epfl.data.squall.types.StringType;
import ch.epfl.data.squall.types.Type;
public class ThetaTPCH7_CustomPlan extends QueryPlan {
private static Logger LOG = Logger.getLogger(ThetaTPCH7_CustomPlan.class);
private QueryBuilder _queryBuilder = new QueryBuilder();
private static final IntegerType _ic = new IntegerType();
private static final String _date1Str = "1995-01-01";
private static final String _date2Str = "1996-12-31";
// private static final String _firstCountryName = "FRANCE";
// private static final String _secondCountryName = "GERMANY";
private static final String _firstCountryName = "PERU";
private static final String _secondCountryName = "ETHIOPIA";
private static final Type<Date> _dateConv = new DateType();
private static final NumericType<Double> _doubleConv = new DoubleType();
private static final Type<String> _sc = new StringType();
private static final Date _date1 = _dateConv.fromString(_date1Str);
private static final Date _date2 = _dateConv.fromString(_date2Str);
public ThetaTPCH7_CustomPlan(String dataPath, String extension, Map conf) {
int Theta_JoinType = ThetaQueryPlansParameters.getThetaJoinType(conf);
// -------------------------------------------------------------------------------------
ArrayList<Integer> hashNation2 = new ArrayList<Integer>(
Arrays.asList(1));
SelectOperator selectionNation2 = new SelectOperator(new OrPredicate(
new ComparisonPredicate(new ColumnReference(_sc, 1),
new ValueSpecification(_sc, _firstCountryName)),
new ComparisonPredicate(new ColumnReference(_sc, 1),
new ValueSpecification(_sc, _secondCountryName))));
ProjectOperator projectionNation2 = new ProjectOperator(new int[] { 1,
0 });
DataSourceComponent relationNation2 = new DataSourceComponent(
"NATION2", dataPath + "nation" + extension)
.setOutputPartKey(hashNation2).add(selectionNation2)
.add(projectionNation2);
_queryBuilder.add(relationNation2);
// -------------------------------------------------------------------------------------
ArrayList<Integer> hashCustomer = new ArrayList<Integer>(
Arrays.asList(1));
ProjectOperator projectionCustomer = new ProjectOperator(new int[] { 0,
3 });
DataSourceComponent relationCustomer = new DataSourceComponent(
"CUSTOMER", dataPath + "customer" + extension)
.setOutputPartKey(hashCustomer).add(projectionCustomer);
_queryBuilder.add(relationCustomer);
// -------------------------------------------------------------------------------------
ColumnReference colN = new ColumnReference(_ic, 1);
ColumnReference colC = new ColumnReference(_ic, 1);
ComparisonPredicate N_C_comp = new ComparisonPredicate(
ComparisonPredicate.EQUAL_OP, colN, colC);
Component N_Cjoin = ThetaJoinComponentFactory
.createThetaJoinOperator(Theta_JoinType, relationNation2,
relationCustomer, _queryBuilder)
.add(new ProjectOperator(new int[] { 0, 2 }))
.setJoinPredicate(N_C_comp);
// -------------------------------------------------------------------------------------
ArrayList<Integer> hashOrders = new ArrayList<Integer>(Arrays.asList(1));
ProjectOperator projectionOrders = new ProjectOperator(
new int[] { 0, 1 });
DataSourceComponent relationOrders = new DataSourceComponent("ORDERS",
dataPath + "orders" + extension).setOutputPartKey(hashOrders)
.add(projectionOrders);
_queryBuilder.add(relationOrders);
// -------------------------------------------------------------------------------------
ColumnReference colN_C = new ColumnReference(_ic, 1);
ColumnReference colO = new ColumnReference(_ic, 1);
ComparisonPredicate N_C_O_comp = new ComparisonPredicate(
ComparisonPredicate.EQUAL_OP, colN_C, colO);
Component N_C_Ojoin = ThetaJoinComponentFactory
.createThetaJoinOperator(Theta_JoinType, N_Cjoin,
relationOrders, _queryBuilder)
.add(new ProjectOperator(new int[] { 0, 2 }))
.setJoinPredicate(N_C_O_comp)
.setOutputPartKey(Arrays.asList(1));
// -------------------------------------------------------------------------------------
ArrayList<Integer> hashSupplier = new ArrayList<Integer>(
Arrays.asList(1));
ProjectOperator projectionSupplier = new ProjectOperator(new int[] { 0,
3 });
DataSourceComponent relationSupplier = new DataSourceComponent(
"SUPPLIER", dataPath + "supplier" + extension)
.setOutputPartKey(hashSupplier).add(projectionSupplier);
_queryBuilder.add(relationSupplier);
// -------------------------------------------------------------------------------------
ArrayList<Integer> hashNation1 = new ArrayList<Integer>(
Arrays.asList(1));
ProjectOperator projectionNation1 = new ProjectOperator(new int[] { 1,
0 });
DataSourceComponent relationNation1 = new DataSourceComponent(
"NATION1", dataPath + "nation" + extension)
.setOutputPartKey(hashNation1).add(selectionNation2)
.add(projectionNation1);
_queryBuilder.add(relationNation1);
// -------------------------------------------------------------------------------------
ColumnReference colS = new ColumnReference(_ic, 1);
ColumnReference colN2 = new ColumnReference(_ic, 1);
ComparisonPredicate S_N_comp = new ComparisonPredicate(
ComparisonPredicate.EQUAL_OP, colS, colN2);
Component S_Njoin = ThetaJoinComponentFactory
.createThetaJoinOperator(Theta_JoinType, relationSupplier,
relationNation1, _queryBuilder)
.add(new ProjectOperator(new int[] { 0, 2 }))
.setJoinPredicate(S_N_comp);
// .setHashIndexes(new ArrayList<Integer>(Arrays.asList(0)));
// -------------------------------------------------------------------------------------
ArrayList<Integer> hashLineitem = new ArrayList<Integer>(
Arrays.asList(2));
SelectOperator selectionLineitem = new SelectOperator(
new BetweenPredicate(new ColumnReference(_dateConv, 10), true,
new ValueSpecification(_dateConv, _date1), true,
new ValueSpecification(_dateConv, _date2)));
// first field in projection
ValueExpression extractYear = new IntegerYearFromDate(
new ColumnReference<Date>(_dateConv, 10));
// second field in projection
// 1 - discount
ValueExpression<Double> substract = new Subtraction(
new ValueSpecification(_doubleConv, 1.0), new ColumnReference(
_doubleConv, 6));
// extendedPrice*(1-discount)
ValueExpression<Double> product = new Multiplication(
new ColumnReference(_doubleConv, 5), substract);
// third field in projection
ColumnReference supplierKey = new ColumnReference(_sc, 2);
// forth field in projection
ColumnReference orderKey = new ColumnReference(_sc, 0);
ProjectOperator projectionLineitem = new ProjectOperator(extractYear,
product, supplierKey, orderKey);
DataSourceComponent relationLineitem = new DataSourceComponent(
"LINEITEM", dataPath + "lineitem" + extension)
.setOutputPartKey(hashLineitem).add(selectionLineitem)
.add(projectionLineitem);
_queryBuilder.add(relationLineitem);
// -------------------------------------------------------------------------------------
ColumnReference colL = new ColumnReference(_ic, 2);
ColumnReference colS_N = new ColumnReference(_ic, 0);
ComparisonPredicate L_S_N_comp = new ComparisonPredicate(
ComparisonPredicate.EQUAL_OP, colL, colS_N);
// AggregateCountOperator agg= new AggregateCountOperator(conf);
Component L_S_Njoin = ThetaJoinComponentFactory
.createThetaJoinOperator(Theta_JoinType, relationLineitem,
S_Njoin, _queryBuilder)
.add(new ProjectOperator(new int[] { 5, 0, 1, 3 }))
.setJoinPredicate(L_S_N_comp)
.setOutputPartKey(Arrays.asList(3))
// .addOperator(agg)
;
// -------------------------------------------------------------------------------------
// set up aggregation function on the same StormComponent(Bolt) where
// the last join is
SelectOperator so = new SelectOperator(
new OrPredicate(
new AndPredicate(
new ComparisonPredicate(new ColumnReference(
_sc, 0), new ValueSpecification(_sc,
_firstCountryName)),
new ComparisonPredicate(new ColumnReference(
_sc, 2), new ValueSpecification(_sc,
_secondCountryName))),
new AndPredicate(
new ComparisonPredicate(new ColumnReference(
_sc, 0), new ValueSpecification(_sc,
_secondCountryName)),
new ComparisonPredicate(new ColumnReference(
_sc, 2), new ValueSpecification(_sc,
_firstCountryName)))));
AggregateOperator agg = new AggregateSumOperator(new ColumnReference(
_doubleConv, 4), conf)
.setGroupByColumns(new ArrayList<Integer>(Arrays
.asList(2, 0, 3)));
ColumnReference colN_C_O = new ColumnReference(_ic, 1);
ColumnReference colL_S_N = new ColumnReference(_ic, 3);
ComparisonPredicate N_C_O_L_S_N_comp = new ComparisonPredicate(
ComparisonPredicate.EQUAL_OP, colN_C_O, colL_S_N);
Component N_C_O_L_S_Njoin = ThetaJoinComponentFactory
.createThetaJoinOperator(Theta_JoinType, N_C_Ojoin, L_S_Njoin,
_queryBuilder).add(so).add(agg)
.setJoinPredicate(N_C_O_L_S_N_comp)
.setContentSensitiveThetaJoinWrapper(_ic);
// -------------------------------------------------------------------------------------
}
@Override
public QueryBuilder getQueryPlan() {
return _queryBuilder;
}
}