/** * Licensed to the Apache Software Foundation (ASF) under one * or more contributor license agreements. See the NOTICE file * distributed with this work for additional information * regarding copyright ownership. The ASF licenses this file * to you under the Apache License, Version 2.0 (the * "License"); you may not use this file except in compliance * with the License. You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. */ package com.alibaba.jstorm.task.group; import backtype.storm.tuple.Fields; import com.alibaba.jstorm.task.execute.MsgInfo; import com.alibaba.jstorm.utils.JStormUtils; import java.util.ArrayList; import java.util.Iterator; import java.util.List; import java.util.Map; /** * fields grouping * * @author yannian */ public class MkFieldsGrouper { protected Fields outFields; protected Fields groupFields; protected List<Integer> groupFieldIndex; protected List<Integer> outTasks; public MkFieldsGrouper(Fields _out_fields, Fields _group_fields, List<Integer> _out_tasks) { for (Iterator<String> it = _group_fields.iterator(); it.hasNext(); ) { String groupField = it.next(); // if groupField isn't in _out_fields, it would throw Exception _out_fields.fieldIndex(groupField); } this.outFields = _out_fields; this.groupFields = _group_fields; this.groupFieldIndex = new ArrayList<>(); for (String fieldStr : groupFields.toList()) { groupFieldIndex.add(outFields.fieldIndex(fieldStr)); } this.outTasks = _out_tasks; } public List<Integer> grouper(List<Object> values) { int hashcode = getHashCode(values); int group = Math.abs(hashcode % this.outTasks.size()); return JStormUtils.mk_list(outTasks.get(group)); } public void batchGrouper(List<MsgInfo> batch, Map<Object, List<MsgInfo>> ret) { for (MsgInfo msg : batch) { int hashcode = getHashCode(msg.values); int target = outTasks.get(Math.abs(hashcode % this.outTasks.size())); List<MsgInfo> targetBatch = ret.get(target); if (targetBatch == null) { targetBatch = new ArrayList<>(); ret.put(target, targetBatch); } targetBatch.add(msg); } } protected int getHashCode(List<Object> tuple) { if (groupFieldIndex.size() == 1) { return tuple.get(groupFieldIndex.get(0)).hashCode(); } else { List<Object> groupFieldValues = new ArrayList<>(groupFields.size()); for (Integer index : groupFieldIndex) { groupFieldValues.add(tuple.get(index)); } return groupFieldValues.hashCode(); } } }