/*
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.flink.test.hadoopcompatibility.mapred;
import java.util.ArrayList;
import java.util.Collections;
import java.util.List;
import org.apache.flink.api.java.DataSet;
import org.apache.flink.api.java.ExecutionEnvironment;
import org.apache.flink.api.java.tuple.Tuple2;
import org.apache.hadoop.io.IntWritable;
import org.apache.hadoop.io.Text;
public class HadoopTestData {
public static DataSet<Tuple2<IntWritable, Text>> getKVPairDataSet(ExecutionEnvironment env) {
List<Tuple2<IntWritable, Text>> data = new ArrayList<Tuple2<IntWritable, Text>>();
data.add(new Tuple2<IntWritable, Text>(new IntWritable(1),new Text("Hi")));
data.add(new Tuple2<IntWritable, Text>(new IntWritable(2),new Text("Hello")));
data.add(new Tuple2<IntWritable, Text>(new IntWritable(3),new Text("Hello world")));
data.add(new Tuple2<IntWritable, Text>(new IntWritable(4),new Text("Hello world, how are you?")));
data.add(new Tuple2<IntWritable, Text>(new IntWritable(5),new Text("I am fine.")));
data.add(new Tuple2<IntWritable, Text>(new IntWritable(6),new Text("Luke Skywalker")));
data.add(new Tuple2<IntWritable, Text>(new IntWritable(7),new Text("Comment#1")));
data.add(new Tuple2<IntWritable, Text>(new IntWritable(8),new Text("Comment#2")));
data.add(new Tuple2<IntWritable, Text>(new IntWritable(9),new Text("Comment#3")));
data.add(new Tuple2<IntWritable, Text>(new IntWritable(10),new Text("Comment#4")));
data.add(new Tuple2<IntWritable, Text>(new IntWritable(11),new Text("Comment#5")));
data.add(new Tuple2<IntWritable, Text>(new IntWritable(12),new Text("Comment#6")));
data.add(new Tuple2<IntWritable, Text>(new IntWritable(13),new Text("Comment#7")));
data.add(new Tuple2<IntWritable, Text>(new IntWritable(14),new Text("Comment#8")));
data.add(new Tuple2<IntWritable, Text>(new IntWritable(15),new Text("Comment#9")));
data.add(new Tuple2<IntWritable, Text>(new IntWritable(16),new Text("Comment#10")));
data.add(new Tuple2<IntWritable, Text>(new IntWritable(17),new Text("Comment#11")));
data.add(new Tuple2<IntWritable, Text>(new IntWritable(18),new Text("Comment#12")));
data.add(new Tuple2<IntWritable, Text>(new IntWritable(19),new Text("Comment#13")));
data.add(new Tuple2<IntWritable, Text>(new IntWritable(20),new Text("Comment#14")));
data.add(new Tuple2<IntWritable, Text>(new IntWritable(21),new Text("Comment#15")));
Collections.shuffle(data);
return env.fromCollection(data);
}
}