/* * Licensed to the Apache Software Foundation (ASF) under one or more * contributor license agreements. See the NOTICE file distributed with * this work for additional information regarding copyright ownership. * The ASF licenses this file to You under the Apache License, Version 2.0 * (the "License"); you may not use this file except in compliance with * the License. You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. */ package gobblin.util; import org.apache.hadoop.fs.Path; import com.google.common.base.Preconditions; import com.google.common.base.Strings; import gobblin.configuration.ConfigurationKeys; import gobblin.configuration.State; import gobblin.configuration.WorkUnitState; /** * Utility class for use with the {@link gobblin.fork.ForkOperator} class. * * @author Yinan Li */ public class ForkOperatorUtils { /** * Get a new property key from an original one with branch index (if applicable). * * @param key property key * @param numBranches number of branches (non-negative) * @param branchId branch id (non-negative) * @return a new property key */ public static String getPropertyNameForBranch(String key, int numBranches, int branchId) { Preconditions.checkArgument(numBranches >= 0, "The number of branches is expected to be non-negative"); Preconditions.checkArgument(branchId >= 0, "The branchId is expected to be non-negative"); return numBranches > 1 ? key + "." + branchId : key; } /** * Get a new property key from an original one with branch index (if applicable). * * @param key property key * @param branch branch index * @return a new property key */ public static String getPropertyNameForBranch(String key, int branch) { // A branch index of -1 means there is no fork and branching return branch >= 0 ? key + "." + branch : key; } /** * Get a new property key from an original one based on the branch id. The method assumes the branch id specified by * the {@link ConfigurationKeys#FORK_BRANCH_ID_KEY} parameter in the given WorkUnitState. The fork id key specifies * which fork this parameter belongs to. Note this method will only provide the aforementioned functionality for * {@link gobblin.converter.Converter}s. To get the same functionality in {@link gobblin.writer.DataWriter}s use * the {@link gobblin.writer.DataWriterBuilder#forBranch(int)} to construct a writer with a specific branch id. * * @param workUnitState contains the fork id key * @param key property key * @return a new property key */ public static String getPropertyNameForBranch(WorkUnitState workUnitState, String key) { Preconditions.checkNotNull(workUnitState, "Cannot get a property from a null WorkUnit"); Preconditions.checkNotNull(key, "Cannot get a the value for a null key"); if (!workUnitState.contains(ConfigurationKeys.FORK_BRANCH_ID_KEY)) { return key; } return workUnitState.getPropAsInt(ConfigurationKeys.FORK_BRANCH_ID_KEY) >= 0 ? key + "." + workUnitState.getPropAsInt(ConfigurationKeys.FORK_BRANCH_ID_KEY) : key; } /** * Get a new path with the given branch name as a sub directory. * * @param numBranches number of branches (non-negative) * @param branchId branch id (non-negative) * @return a new path */ public static String getPathForBranch(State state, String path, int numBranches, int branchId) { Preconditions.checkNotNull(state); Preconditions.checkNotNull(path); Preconditions.checkArgument(numBranches >= 0, "The number of branches is expected to be non-negative"); Preconditions.checkArgument(branchId >= 0, "The branch id is expected to be non-negative"); return numBranches > 1 ? path + Path.SEPARATOR + state.getProp(ConfigurationKeys.FORK_BRANCH_NAME_KEY + "." + branchId, ConfigurationKeys.DEFAULT_FORK_BRANCH_NAME + branchId) : path; } /** * Get the fork branch ID of a branch of a given task. * * @param taskId task ID * @param index branch index * @return a fork branch ID */ public static String getForkId(String taskId, int index) { return taskId + "." + index; } }