/*
* Licensed to the Apache Software Foundation (ASF) under one or more
* contributor license agreements. See the NOTICE file distributed with
* this work for additional information regarding copyright ownership.
* The ASF licenses this file to You under the Apache License, Version 2.0
* (the "License"); you may not use this file except in compliance with
* the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package demo;
import org.apache.geode.spark.connector.GeodeConnectionConf;
import org.apache.spark.SparkConf;
import org.apache.spark.api.java.JavaPairRDD;
import org.apache.spark.api.java.JavaRDD;
import org.apache.spark.api.java.JavaSparkContext;
import scala.Tuple2;
import java.util.*;
import static org.apache.geode.spark.connector.javaapi.GeodeJavaUtil.*;
/**
* This Spark application demonstrates how to save an RDD to Geode using the Geode Spark
* Connector with Java.
* <p>
* In order to run it, you will need to start a Geode cluster and create the following region
* with GFSH:
* <pre>{@code
* gfsh> create region --name=str_str_region --type=REPLICATE \
* --key-constraint=java.lang.String --value-constraint=java.lang.String
* }</pre>
*
* Once you compile and package the demo, the jar file basic-demos_2.10-0.5.0.jar
* should be generated under geode-spark-demos/basic-demos/target/scala-2.10/.
* Then run the following command to start a Spark job:
* <pre>{@code
* <path to spark>/bin/spark-submit --master=local[2] --class demo.PairRDDSaveJavaDemo \
* <path to>/basic-demos_2.10-0.5.0.jar <locator host>:<port>
* }</pre>
*
* Verify the data was saved to Geode with GFSH:
* <pre>{@code gfsh> query --query="select * from /str_str_region.entrySet"}</pre>
*/
public class PairRDDSaveJavaDemo {

  /** Name of the Geode region that both save operations write to. */
  private static final String REGION_NAME = "str_str_region";

  /**
   * Saves two small sets of string key/value pairs to the {@code str_str_region} Geode region:
   * once from a {@link JavaPairRDD} created directly, and once from a {@link JavaRDD} of
   * {@link Tuple2} that is converted to a pair RDD first.
   *
   * @param argv must contain exactly one element, which is stored in the Spark configuration
   *        under {@code GeodeLocatorPropKey}; with any other argument count a usage message is
   *        printed to standard error and the method returns before a Spark context is created
   */
  public static void main(String[] argv) {
    if (argv.length != 1) {
      System.err.printf("Usage: PairRDDSaveJavaDemo <locators>\n");
      return;
    }

    SparkConf conf = new SparkConf().setAppName("PairRDDSaveJavaDemo");
    conf.set(GeodeLocatorPropKey, argv[0]);

    JavaSparkContext sc = new JavaSparkContext(conf);
    try {
      GeodeConnectionConf connConf = GeodeConnectionConf.apply(conf);

      List<Tuple2<String, String>> data = new ArrayList<>();
      data.add(new Tuple2<>("7", "seven"));
      data.add(new Tuple2<>("8", "eight"));
      data.add(new Tuple2<>("9", "nine"));

      List<Tuple2<String, String>> data2 = new ArrayList<>();
      data2.add(new Tuple2<>("11", "eleven"));
      data2.add(new Tuple2<>("12", "twelve"));
      data2.add(new Tuple2<>("13", "thirteen"));

      // method 1: generate JavaPairRDD directly
      JavaPairRDD<String, String> rdd1 = sc.parallelizePairs(data);
      javaFunctions(rdd1).saveToGeode(REGION_NAME, connConf);

      // method 2: convert JavaRDD<Tuple2<K,V>> to JavaPairRDD<K, V>
      JavaRDD<Tuple2<String, String>> rdd2 = sc.parallelize(data2);
      javaFunctions(toJavaPairRDD(rdd2)).saveToGeode(REGION_NAME, connConf);
    } finally {
      // Stop the context even if building the connection config or a save throws,
      // so a failed run does not leave the Spark context running.
      sc.stop();
    }
  }
}