/** * This software is licensed to you under the Apache License, Version 2.0 (the * "Apache License"). * * LinkedIn's contributions are made under the Apache License. If you contribute * to the Software, the contributions will be deemed to have been made under the * Apache License, unless you expressly indicate otherwise. Please do not make any * contributions that would be inconsistent with the Apache License. * * You may obtain a copy of the Apache License at http://www.apache.org/licenses/LICENSE-2.0 * Unless required by applicable law or agreed to in writing, this software * distributed under the Apache License is distributed on an "AS IS" BASIS, WITHOUT * WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the Apache * License for the specific language governing permissions and limitations for the * software governed under the Apache License. * * © 2012 LinkedIn Corp. All Rights Reserved. */ package com.senseidb.search.req.mapred.functions; import java.io.Serializable; import java.util.List; import org.json.JSONException; import org.json.JSONObject; import com.senseidb.search.req.mapred.CombinerStage; import com.senseidb.search.req.mapred.FacetCountAccessor; import com.senseidb.search.req.mapred.FieldAccessor; import com.senseidb.search.req.mapred.SenseiMapReduce; import com.senseidb.util.JSONUtil.FastJSONArray; import com.senseidb.util.JSONUtil.FastJSONObject; public class AvgMapReduce implements SenseiMapReduce<AvgResult, AvgResult> { private String column; @Override public void init(JSONObject params) { column = params.optString("column"); if (column == null) { throw new IllegalStateException("Column parameter shouldn't be null"); } } @Override public AvgResult map(int[] docId, int docIdCount, long[] uids, FieldAccessor accessor, FacetCountAccessor facetCountAccessor) { double ret = 0; for (int i = 0; i < docIdCount; i++) { ret+= accessor.getDouble(column, docId[i]); } return new AvgResult(ret / docIdCount, docIdCount); } @Override public List<AvgResult> combine(List<AvgResult> mapResults, CombinerStage combinerStage) { AvgResult avgResult = reduce(mapResults); mapResults.clear(); mapResults.add(avgResult); return mapResults; } @Override public AvgResult reduce(List<AvgResult> combineResults) { if (combineResults.isEmpty()) { return null; } int minCount = Integer.MAX_VALUE; for (AvgResult avgResult : combineResults) { if (avgResult == null || avgResult.count == 0) { continue; } if (minCount > avgResult.count) { minCount = avgResult.count; } } if (minCount == Integer.MAX_VALUE) { return null; } double accumulatedValue = 0; int accumulatedCount = 0; for (AvgResult avgResult : combineResults) { if (avgResult == null || avgResult.count == 0) { continue; } accumulatedValue += avgResult.value / minCount * avgResult.count; accumulatedCount += avgResult.count; } double ret = accumulatedValue / ((double) accumulatedCount / minCount); return new AvgResult(ret, accumulatedCount); } @Override public JSONObject render(AvgResult reduceResult) { try { return new FastJSONObject().put("avg", reduceResult.value).put("count", reduceResult.count); } catch (JSONException e) { throw new RuntimeException(e); } } @Override public String[] getColumns() { return new String[]{column}; } } class AvgResult implements Serializable { public double value; public int count; public AvgResult(double value, int count) { super(); this.value = value; this.count = count; } }