/*
* Copyright (c) 2011-2015 EPFL DATA Laboratory
* Copyright (c) 2014-2015 The Squall Collaboration (see NOTICE)
*
* All rights reserved.
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package ch.epfl.data.squall.examples.imperative.shj;
import java.util.Arrays;
import java.util.Calendar;
import java.util.Date;
import java.util.List;
import java.util.Map;
import org.apache.log4j.Logger;
import ch.epfl.data.squall.components.DataSourceComponent;
import ch.epfl.data.squall.components.EquiJoinComponent;
import ch.epfl.data.squall.components.OperatorComponent;
import ch.epfl.data.squall.expressions.ColumnReference;
import ch.epfl.data.squall.expressions.DateSum;
import ch.epfl.data.squall.expressions.ValueExpression;
import ch.epfl.data.squall.expressions.ValueSpecification;
import ch.epfl.data.squall.operators.AggregateCountOperator;
import ch.epfl.data.squall.operators.AggregateOperator;
import ch.epfl.data.squall.operators.DistinctOperator;
import ch.epfl.data.squall.operators.ProjectOperator;
import ch.epfl.data.squall.operators.SelectOperator;
import ch.epfl.data.squall.predicates.BetweenPredicate;
import ch.epfl.data.squall.predicates.ComparisonPredicate;
import ch.epfl.data.squall.query_plans.QueryBuilder;
import ch.epfl.data.squall.query_plans.QueryPlan;
import ch.epfl.data.squall.types.DateType;
import ch.epfl.data.squall.types.IntegerType;
import ch.epfl.data.squall.types.Type;
/* TPC-H Query 4 - Order Priority Checking
SELECT O_ORDERPRIORITY, COUNT(*) AS ORDER_COUNT FROM ORDERS
WHERE O_ORDERDATE >= '1993-07-01' AND O_ORDERDATE < dateadd(mm,3, cast('1993-07-01' as date))
AND EXISTS (SELECT * FROM LINEITEM WHERE L_ORDERKEY = O_ORDERKEY AND L_COMMITDATE < L_RECEIPTDATE)
GROUP BY O_ORDERPRIORITY
ORDER BY O_ORDERPRIORITY
*/
/**
 * Query plan for TPC-H Query 4 (Order Priority Checking).
 * <p>
 * The constructor registers four components with a {@link QueryBuilder}:
 * <ol>
 * <li>a {@code LINEITEM} source that keeps rows where date column 11 is
 * strictly less than date column 12 and projects column 0;</li>
 * <li>an {@code ORDERS} source that keeps rows whose date column 4 lies in
 * {@code [1993-07-01, 1993-07-01 + 3 months)} and projects columns 0 and 5;</li>
 * <li>an equi-join of ORDERS with LINEITEM, partitioned on output column 1;</li>
 * <li>a {@code FINAL_RESULT} operator component that counts rows grouped by
 * column 1, with a distinct operator on column 0.</li>
 * </ol>
 * In the standard TPC-H schema these indices correspond to L_ORDERKEY (0),
 * L_COMMITDATE (11), L_RECEIPTDATE (12), O_ORDERKEY (0), O_ORDERDATE (4) and
 * O_ORDERPRIORITY (5); NOTE(review): confirm against the input files' layout.
 */
public class TPCH4Plan extends QueryPlan {
    private static final Logger LOG = Logger.getLogger(TPCH4Plan.class);

    private static final Type<Date> _dc = new DateType();
    private static final IntegerType _ic = new IntegerType();

    /** Inclusive lower bound of the order-date window. */
    private static final String START_DATE = "1993-07-01";
    /** Calendar field in which the window length is expressed. */
    private static final int WINDOW_UNIT = Calendar.MONTH;
    /** Window length, in {@link #WINDOW_UNIT}s; the upper bound is exclusive. */
    private static final int WINDOW_LENGTH = 3;

    private final QueryBuilder _queryBuilder = new QueryBuilder();

    /**
     * Builds the complete plan.
     *
     * @param dataPath
     *            prefix prepended to each relation's file name
     *            ({@code dataPath + "lineitem" + extension})
     * @param extension
     *            suffix appended to each relation's file name
     * @param conf
     *            configuration map handed to the distinct and aggregate
     *            operators
     */
    public TPCH4Plan(String dataPath, String extension, Map conf) {
        // The window bounds are plain locals: they are needed only while the
        // plan is being assembled, so no state is shared between instances.
        final Date windowStart = _dc.fromString(START_DATE);
        final Date windowEnd = shiftDate(windowStart, WINDOW_UNIT,
                WINDOW_LENGTH);

        // -------------------------------------------------------------------------------------
        // LINEITEM: column 11 < column 12, keep only column 0
        final List<Integer> hashLineitem = Arrays.asList(0);
        final SelectOperator selectionLineitem = new SelectOperator(
                new ComparisonPredicate(ComparisonPredicate.LESS_OP,
                        new ColumnReference(_dc, 11),
                        new ColumnReference(_dc, 12)));
        final ProjectOperator projectionLineitem = new ProjectOperator(
                new int[] { 0 });
        final DataSourceComponent relationLineitem = new DataSourceComponent(
                "LINEITEM", dataPath + "lineitem" + extension)
                .setOutputPartKey(hashLineitem).add(selectionLineitem)
                .add(projectionLineitem);
        _queryBuilder.add(relationLineitem);

        // -------------------------------------------------------------------------------------
        // ORDERS: windowStart <= column 4 < windowEnd, keep columns 0 and 5
        final List<Integer> hashOrders = Arrays.asList(0);
        final SelectOperator selectionOrders = new SelectOperator(
                new BetweenPredicate(new ColumnReference(_dc, 4), true,
                        new ValueSpecification(_dc, windowStart), false,
                        new ValueSpecification(_dc, windowEnd)));
        final ProjectOperator projectionOrders = new ProjectOperator(
                new int[] { 0, 5 });
        final DataSourceComponent relationOrders = new DataSourceComponent(
                "ORDERS", dataPath + "orders" + extension)
                .setOutputPartKey(hashOrders).add(selectionOrders)
                .add(projectionOrders);
        _queryBuilder.add(relationOrders);

        // -------------------------------------------------------------------------------------
        // ORDERS join LINEITEM; output is partitioned on column 1, the same
        // column the aggregation below groups by
        final EquiJoinComponent O_Ljoin = new EquiJoinComponent(relationOrders,
                relationLineitem).setOutputPartKey(Arrays.asList(1));
        _queryBuilder.add(O_Ljoin);

        // -------------------------------------------------------------------------------------
        // set up aggregation function on a separate StormComponent(Bolt):
        // count grouped by column 1, with a distinct operator on column 0
        // (presumably so each order is counted once, mirroring EXISTS)
        final DistinctOperator distinctOp = new DistinctOperator(conf,
                new int[] { 0 });
        final AggregateOperator aggOp = new AggregateCountOperator(conf)
                .setGroupByColumns(Arrays.asList(1)).setDistinct(distinctOp);
        final OperatorComponent oc = new OperatorComponent(O_Ljoin,
                "FINAL_RESULT").add(aggOp);
        _queryBuilder.add(oc);
        // -------------------------------------------------------------------------------------
    }

    /**
     * Evaluates {@code base + amount} in the given calendar unit by building a
     * {@link DateSum} over a constant expression.
     *
     * @param base
     *            date to start from
     * @param unit
     *            calendar field constant passed to {@link DateSum}
     * @param amount
     *            number of units to add
     * @return the value produced by evaluating the {@link DateSum}
     */
    private static Date shiftDate(Date base, int unit, int amount) {
        final ValueExpression<Date> baseVe = new ValueSpecification<Date>(_dc,
                base);
        final ValueExpression<Date> shiftedVe = new DateSum(baseVe, unit,
                amount);
        // tuple is set to null since we are computing based on constants
        return shiftedVe.eval(null);
    }

    /**
     * @return the builder holding every component registered by the
     *         constructor
     */
    @Override
    public QueryBuilder getQueryPlan() {
        return _queryBuilder;
    }
}