/* * Licensed to the Apache Software Foundation (ASF) under one * or more contributor license agreements. See the NOTICE file * distributed with this work for additional information * regarding copyright ownership. The ASF licenses this file * to you under the Apache License, Version 2.0 (the * "License"); you may not use this file except in compliance * with the License. You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. */ package org.apache.flink.api.java.operators; import org.apache.flink.annotation.Internal; import org.apache.flink.annotation.Public; import org.apache.flink.api.common.InvalidProgramException; import org.apache.flink.api.common.functions.Partitioner; import org.apache.flink.api.common.operators.Keys; import org.apache.flink.api.java.DataSet; /** * Grouping is an intermediate step for a transformation on a grouped DataSet.<br> * The following transformation can be applied on Grouping: * <ul> * <li>{@link UnsortedGrouping#reduce(org.apache.flink.api.common.functions.ReduceFunction)},</li> * <li>{@link UnsortedGrouping#reduceGroup(org.apache.flink.api.common.functions.GroupReduceFunction)}, and</li> * <li>{@link UnsortedGrouping#aggregate(org.apache.flink.api.java.aggregation.Aggregations, int)}.</li> * </ul> * * @param <T> The type of the elements of the grouped DataSet. * * @see DataSet */ @Public public abstract class Grouping<T> { protected final DataSet<T> inputDataSet; protected final Keys<T> keys; protected Partitioner<?> customPartitioner; public Grouping(DataSet<T> set, Keys<T> keys) { if (set == null || keys == null) { throw new NullPointerException(); } if (keys.isEmpty()) { throw new InvalidProgramException("The grouping keys must not be empty."); } this.inputDataSet = set; this.keys = keys; } /** * Returns the input DataSet of a grouping operation, that is the one before the grouping. This means that * if it is applied directly to the result of a grouping operation, it will cancel its effect. As an example, in the * following snippet: * <pre><code> * DataSet<X> notGrouped = input.groupBy().getDataSet(); * DataSet<Y> allReduced = notGrouped.reduce() * </pre></code> * the <code>groupBy()</code> is as if it never happened, as the <code>notGrouped</code> DataSet corresponds * to the input of the <code>groupBy()</code> (because of the <code>getDataset()</code>). * */ @Internal public DataSet<T> getInputDataSet() { return this.inputDataSet; } @Internal public Keys<T> getKeys() { return this.keys; } /** * Gets the custom partitioner to be used for this grouping, or {@code null}, if * none was defined. * * @return The custom partitioner to be used for this grouping. */ @Internal public Partitioner<?> getCustomPartitioner() { return this.customPartitioner; } }