/* * Copyright (C) 2014 The Calrissian Authors * * Licensed under the Apache License, Version 2.0 (the "License"); * you may not use this file except in compliance with the License. * You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. */ package org.calrissian.flowmix.api; import java.io.Serializable; import java.util.List; import java.util.Map; import org.calrissian.flowmix.core.model.event.AggregatedEvent; import org.calrissian.flowmix.core.support.window.WindowItem; import org.calrissian.flowmix.exceptions.FlowmixException; /** * An aggregator over a progressive/tumbling window allows aggregate values like * sums and averages to be maintained for some window at some point in time * without the whole window being available at any point in time. * * This is very useful for associative algorithms that can be implemented * without the entire dataset being available. Often this is good for reduce * functions that can summarize a dataset without the need to see each * individual point. * * Multiple events can be returned as the aggregate if necessary, this means * multiple aggregates could be maintained inside and emitted separately (i.e. * sum and count and sumsqaure, and average). */ public interface Aggregator extends Serializable { public static final String GROUP_BY = "groupBy"; public static final String GROUP_BY_DELIM = "\u0000"; void configure(Map<String, String> configuration); void added(WindowItem item); void evicted(WindowItem item); List<AggregatedEvent> aggregate(); }