/*
 * Copyright (c) 2008-2017, Hazelcast, Inc. All Rights Reserved.
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 * http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

package com.hazelcast.mapreduce;

/**
 * Describes a mapreduce Job that is built by {@link JobTracker#newJob(KeyValueSource)}.
 * <p>
 * It is used to execute mappings and calculations on the different cluster nodes and reduce or collate these mapped
 * values to results.
 * <p>
 * Implementations returned by the JobTracker are fully threadsafe and can be used concurrently and multiple
 * times <b>once the configuration is finished</b>.
 * <p>
 * <b>Caution: The generic types of Jobs change depending on the used methods, which can make it necessary to use
 * different assignment variables when used over multiple source lines.</b>
 * <p>
 * An example of how to use it:
 * <pre>{@code
 * HazelcastInstance hz = getHazelcastInstance();
 * IMap<Integer, Integer> map = (...) hz.getMap( "default" );
 * JobTracker tracker = hz.getJobTracker( "default" );
 * Job<Integer, Integer> job = tracker.newJob( KeyValueSource.fromMap( map ) );
 * ICompletableFuture<Map<String, Integer>> future = job
 *      .mapper( buildMapper() ).reducer( buildReducer() ).submit();
 * Map<String, Integer> results = future.get();
 * }</pre>
 *
 * @param <KeyIn>   type of key used as input key type
 * @param <ValueIn> type of value used as input value type
 * @since 3.2
 * @deprecated MapReduce is deprecated and will be removed in 4.0.
 * For map aggregations, you can use {@link com.hazelcast.aggregation.Aggregator} on IMap.
 * For general data processing, it is superseded by <a href="http://jet.hazelcast.org">Hazelcast Jet</a>.
 */
@Deprecated
public interface Job<KeyIn, ValueIn> {

    /**
     * Defines the keys to execute the mapper and a possibly defined reducer against. If the keys are known before
     * submitting the task, setting them can improve execution speed.
     *
     * @param keys keys to be executed against
     * @return instance of this Job with generics changed on usage
     */
    Job<KeyIn, ValueIn> onKeys(Iterable<? extends KeyIn> keys);

    /**
     * Defines the keys to execute the mapper and a possibly defined reducer against. If the keys are known before
     * submitting the task, setting them can improve execution speed.
     *
     * @param keys keys to be executed against
     * @return instance of this Job with generics changed on usage
     */
    Job<KeyIn, ValueIn> onKeys(KeyIn... keys);

    /**
     * Defines the number of elements per chunk. Whenever the chunk size is reached and a
     * {@link com.hazelcast.mapreduce.ReducerFactory} is defined, the chunk will be sent to the nodes that
     * are responsible for the emitted keys.<br>
     * <b>Please note that chunks are deactivated when no ReducerFactory is defined.</b>
     *
     * @param chunkSize the number of elements per chunk
     * @return instance of this Job with generics changed on usage
     */
    Job<KeyIn, ValueIn> chunkSize(int chunkSize);

    /**
     * Defines the strategy to handle topology changes while executing the map reduce job. For further
     * information see {@link com.hazelcast.mapreduce.TopologyChangedStrategy}.
     *
     * @param topologyChangedStrategy strategy to handle topology changes while executing the map reduce job
     * @return instance of this Job with generics changed on usage
     */
    Job<KeyIn, ValueIn> topologyChangedStrategy(TopologyChangedStrategy topologyChangedStrategy);

    /**
     * Defines the {@link KeyPredicate} implementation to preselect keys the MapReduce task will be executed on.
     * Preselecting keys can speed up the job massively.<br>
     * This method can be used in conjunction with {@link #onKeys(Iterable)} or {@link #onKeys(Object...)} to define a
     * range of known and evaluated keys.
     *
     * @param predicate predicate implementation to be used to evaluate keys
     * @return instance of this Job with generics changed on usage
     */
    Job<KeyIn, ValueIn> keyPredicate(KeyPredicate<? super KeyIn> predicate);

    /**
     * Defines the mapper for this task. This method is not idempotent and can be called only once. Further
     * calls result in an {@link IllegalStateException} being thrown, telling you not to change the internal state.
     *
     * @param mapper     the task's mapper
     * @param <KeyOut>   type of the emitted key
     * @param <ValueOut> type of the emitted value
     * @return instance of this Job with generics changed on usage
     * @throws IllegalStateException if this method is called more than once
     */
    <KeyOut, ValueOut> MappingJob<KeyIn, KeyOut, ValueOut> mapper(Mapper<KeyIn, ValueIn, KeyOut, ValueOut> mapper);
}