/**
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package com.aliyun.odps.mapred.example.local.lib.aggregate;
import java.io.IOException;
import java.util.ArrayList;
import java.util.Iterator;
import java.util.Map.Entry;
import com.aliyun.odps.data.Record;
import com.aliyun.odps.mapred.MapperBase;
import com.aliyun.odps.mapred.conf.JobConf;
/**
* This class implements the generic mapper of Aggregate.
*/
public class ValueAggregatorMapper extends MapperBase {

  /** Prefix of the job configuration keys that describe the aggregator descriptors. */
  private static final String DESCRIPTOR_KEY_PREFIX = "aggregator.descriptor";

  /** Type tag (matched case-insensitively) of a spec that names a descriptor class. */
  private static final String USER_DEFINED_TYPE = "UserDefined";

  /**
   * Descriptors consulted for every input record. Remains {@code null} until
   * {@code setup} has run.
   */
  protected ArrayList<ValueAggregatorDescriptor> aggregatorDescriptorList = null;

  /** Output key record, created once in {@code setup} and overwritten for each emitted pair. */
  private Record columnK;

  /** Output value record, created once in {@code setup} and overwritten for each emitted pair. */
  private Record columnV;

  /**
   * Builds the descriptor list from the job configuration, calls {@link #logSpec()} and
   * creates the reusable map output key/value records.
   *
   * @param context task context supplying the job configuration and the output records
   * @throws IOException declared by the overridden method
   * @throws IllegalArgumentException if a configured "UserDefined" spec has no class name
   */
  @Override
  public void setup(TaskContext context) throws IOException {
    JobConf job = context.getJobConf();
    this.initializeMySpec(job);
    this.logSpec();
    columnK = context.createMapOutputKeyRecord();
    columnV = context.createMapOutputValueRecord();
  }

  /**
   * Turns one descriptor spec into a descriptor instance.
   *
   * <p>A spec is a comma-separated string whose first segment is the type. Only the
   * "UserDefined" type is recognised; its second segment is passed on as the class name.
   *
   * @param spec the spec string read from the job configuration, may be {@code null}
   * @param job the job configuration handed to the created descriptor
   * @return the descriptor, or {@code null} when {@code spec} is {@code null} or its type
   *         is not "UserDefined"
   * @throws IllegalArgumentException if the type is "UserDefined" but no class name
   *         segment follows it
   */
  private static ValueAggregatorDescriptor getValueAggregatorDescriptor(
      String spec, JobConf job) {
    if (spec == null) {
      return null;
    }
    // Limit -1 keeps trailing empty segments, so "UserDefined," still has two segments.
    String[] segments = spec.split(",", -1);
    if (!USER_DEFINED_TYPE.equalsIgnoreCase(segments[0])) {
      return null;
    }
    if (segments.length < 2) {
      // Fail with a message naming the offending spec rather than an index error.
      throw new IllegalArgumentException("Aggregator descriptor spec '" + spec
          + "' is missing the class name; expected 'UserDefined,<class name>'");
    }
    return new UserDefinedValueAggregatorDescriptor(segments[1], job);
  }

  /**
   * Reads "aggregator.descriptor.num" (default 0) and then the specs stored under
   * "aggregator.descriptor.0" .. "aggregator.descriptor.(num-1)", keeping every spec
   * that yields a descriptor.
   *
   * @param job the job configuration to read from
   * @return the descriptors that could be created, possibly empty, never {@code null}
   */
  private static ArrayList<ValueAggregatorDescriptor> getAggregatorDescriptors(
      JobConf job) {
    int num = job.getInt(DESCRIPTOR_KEY_PREFIX + ".num", 0);
    ArrayList<ValueAggregatorDescriptor> descriptors =
        new ArrayList<ValueAggregatorDescriptor>(num);
    for (int i = 0; i < num; i++) {
      String spec = job.get(DESCRIPTOR_KEY_PREFIX + "." + i);
      ValueAggregatorDescriptor descriptor = getValueAggregatorDescriptor(spec, job);
      if (descriptor != null) {
        descriptors.add(descriptor);
      }
    }
    return descriptors;
  }

  /**
   * Populates {@link #aggregatorDescriptorList} from the job configuration. When the
   * configuration yields no descriptor, a single user-defined descriptor wrapping
   * {@code ValueAggregatorBaseDescriptor} is used instead.
   *
   * @param job the job configuration to read from
   */
  private void initializeMySpec(JobConf job) {
    this.aggregatorDescriptorList = getAggregatorDescriptors(job);
    if (this.aggregatorDescriptorList.isEmpty()) {
      this.aggregatorDescriptorList.add(new UserDefinedValueAggregatorDescriptor(
          ValueAggregatorBaseDescriptor.class.getCanonicalName(), job));
    }
  }

  /**
   * Hook called from {@code setup} after the descriptor list has been built. This
   * implementation does nothing.
   */
  protected void logSpec() {
  }

  /**
   * Does nothing.
   *
   * @param context task context (unused)
   * @throws IOException declared by the overridden method; never thrown here
   */
  @Override
  public void cleanup(TaskContext context) throws IOException {
  }

  /**
   * The map function. It iterates through the value aggregator descriptor list
   * to generate aggregation id/value pairs and emits each of them.
   *
   * @param recordNum number of the input record, passed to each descriptor
   * @param record the input record, passed to each descriptor
   * @param context task context used to write the output pairs
   * @throws IOException if writing an output pair fails
   */
  @Override
  public void map(long recordNum, Record record, TaskContext context)
      throws IOException {
    for (ValueAggregatorDescriptor descriptor : this.aggregatorDescriptorList) {
      Iterator<Entry<String, String>> pairs =
          descriptor.generateKeyValPairs(recordNum, record).iterator();
      while (pairs.hasNext()) {
        Entry<String, String> pair = pairs.next();
        // The same two records are reused for every pair; only their contents change.
        columnK.set(new Object[]{pair.getKey()});
        columnV.set(new Object[]{pair.getValue()});
        context.write(columnK, columnV);
      }
    }
  }
}