/* * Licensed to the Apache Software Foundation (ASF) under one * or more contributor license agreements. See the NOTICE file * distributed with this work for additional information * regarding copyright ownership. The ASF licenses this file * to you under the Apache License, Version 2.0 (the * "License"); you may not use this file except in compliance * with the License. You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. */ package org.apache.flink.optimizer.util; import java.util.ArrayList; import java.util.HashMap; import java.util.Iterator; import java.util.List; import java.util.Map; import org.apache.flink.api.common.Plan; import org.apache.flink.api.common.functions.Function; import org.apache.flink.api.common.io.FileInputFormat.FileBaseStatistics; import org.apache.flink.api.common.operators.GenericDataSourceBase; import org.apache.flink.api.common.operators.Operator; import org.apache.flink.api.common.operators.base.BulkIterationBase; import org.apache.flink.configuration.Configuration; import org.apache.flink.optimizer.DataStatistics; import org.apache.flink.optimizer.Optimizer; import org.apache.flink.optimizer.costs.DefaultCostEstimator; import org.apache.flink.optimizer.plan.OptimizedPlan; import org.apache.flink.optimizer.plan.PlanNode; import org.apache.flink.optimizer.plan.SingleInputPlanNode; import org.apache.flink.util.OperatingSystem; import org.apache.flink.util.TestLogger; import org.apache.flink.util.Visitor; import org.junit.Before; /** * Base class for Optimizer tests. Offers utility methods to trigger optimization * of a program and to fetch the nodes in an optimizer plan that correspond * the the node in the program plan. */ public abstract class CompilerTestBase extends TestLogger implements java.io.Serializable { private static final long serialVersionUID = 1L; protected static final String IN_FILE = OperatingSystem.isWindows() ? "file:/c:/" : "file:///dev/random"; protected static final String OUT_FILE = OperatingSystem.isWindows() ? "file:/c:/" : "file:///dev/null"; protected static final int DEFAULT_PARALLELISM = 8; protected static final String DEFAULT_PARALLELISM_STRING = String.valueOf(DEFAULT_PARALLELISM); private static final String CACHE_KEY = "cachekey"; // ------------------------------------------------------------------------ protected transient DataStatistics dataStats; protected transient Optimizer withStatsCompiler; protected transient Optimizer noStatsCompiler; private transient int statCounter; // ------------------------------------------------------------------------ @Before public void setup() { Configuration flinkConf = new Configuration(); this.dataStats = new DataStatistics(); this.withStatsCompiler = new Optimizer(this.dataStats, new DefaultCostEstimator(), flinkConf); this.withStatsCompiler.setDefaultParallelism(DEFAULT_PARALLELISM); this.noStatsCompiler = new Optimizer(null, new DefaultCostEstimator(), flinkConf); this.noStatsCompiler.setDefaultParallelism(DEFAULT_PARALLELISM); } // ------------------------------------------------------------------------ public OptimizedPlan compileWithStats(Plan p) { return this.withStatsCompiler.compile(p); } public OptimizedPlan compileNoStats(Plan p) { return this.noStatsCompiler.compile(p); } public static OperatorResolver getContractResolver(Plan plan) { return new OperatorResolver(plan); } public void setSourceStatistics(GenericDataSourceBase<?, ?> source, long size, float recordWidth) { setSourceStatistics(source, new FileBaseStatistics(Long.MAX_VALUE, size, recordWidth)); } public void setSourceStatistics(GenericDataSourceBase<?, ?> source, FileBaseStatistics stats) { final String key = CACHE_KEY + this.statCounter++; this.dataStats.cacheBaseStatistics(stats, key); source.setStatisticsKey(key); } public static OptimizerPlanNodeResolver getOptimizerPlanNodeResolver(OptimizedPlan plan) { return new OptimizerPlanNodeResolver(plan); } // ------------------------------------------------------------------------ public static final class OptimizerPlanNodeResolver { private final Map<String, ArrayList<PlanNode>> map; public OptimizerPlanNodeResolver(OptimizedPlan p) { HashMap<String, ArrayList<PlanNode>> map = new HashMap<String, ArrayList<PlanNode>>(); for (PlanNode n : p.getAllNodes()) { Operator<?> c = n.getOriginalOptimizerNode().getOperator(); String name = c.getName(); ArrayList<PlanNode> list = map.get(name); if (list == null) { list = new ArrayList<PlanNode>(2); map.put(name, list); } // check whether this node is a child of a node with the same contract (aka combiner) boolean shouldAdd = true; for (Iterator<PlanNode> iter = list.iterator(); iter.hasNext();) { PlanNode in = iter.next(); if (in.getOriginalOptimizerNode().getOperator() == c) { // is this the child or is our node the child if (in instanceof SingleInputPlanNode && n instanceof SingleInputPlanNode) { SingleInputPlanNode thisNode = (SingleInputPlanNode) n; SingleInputPlanNode otherNode = (SingleInputPlanNode) in; if (thisNode.getPredecessor() == otherNode) { // other node is child, remove it iter.remove(); } else if (otherNode.getPredecessor() == thisNode) { shouldAdd = false; } } else { throw new RuntimeException("Unrecodnized case in test."); } } } if (shouldAdd) { list.add(n); } } this.map = map; } @SuppressWarnings("unchecked") public <T extends PlanNode> T getNode(String name) { List<PlanNode> nodes = this.map.get(name); if (nodes == null || nodes.isEmpty()) { throw new RuntimeException("No node found with the given name."); } else if (nodes.size() != 1) { throw new RuntimeException("Multiple nodes found with the given name."); } else { return (T) nodes.get(0); } } @SuppressWarnings("unchecked") public <T extends PlanNode> T getNode(String name, Class<? extends Function> stubClass) { List<PlanNode> nodes = this.map.get(name); if (nodes == null || nodes.isEmpty()) { throw new RuntimeException("No node found with the given name and stub class."); } else { PlanNode found = null; for (PlanNode node : nodes) { if (node.getClass() == stubClass) { if (found == null) { found = node; } else { throw new RuntimeException("Multiple nodes found with the given name and stub class."); } } } if (found == null) { throw new RuntimeException("No node found with the given name and stub class."); } else { return (T) found; } } } public List<PlanNode> getNodes(String name) { List<PlanNode> nodes = this.map.get(name); if (nodes == null || nodes.isEmpty()) { throw new RuntimeException("No node found with the given name."); } else { return new ArrayList<PlanNode>(nodes); } } } /** * Collects all DataSources of a plan to add statistics * */ public static class SourceCollectorVisitor implements Visitor<Operator<?>> { protected final List<GenericDataSourceBase<?, ?>> sources = new ArrayList<GenericDataSourceBase<?, ?>>(4); @Override public boolean preVisit(Operator<?> visitable) { if(visitable instanceof GenericDataSourceBase) { sources.add((GenericDataSourceBase<?, ?>) visitable); } else if(visitable instanceof BulkIterationBase) { ((BulkIterationBase<?>) visitable).getNextPartialSolution().accept(this); } return true; } @Override public void postVisit(Operator<?> visitable) {} public List<GenericDataSourceBase<?, ?>> getSources() { return this.sources; } } }