/* * Licensed to the Apache Software Foundation (ASF) under one or more * contributor license agreements. See the NOTICE file distributed with * this work for additional information regarding copyright ownership. * The ASF licenses this file to You under the Apache License, Version 2.0 * (the "License"); you may not use this file except in compliance with * the License. You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. */ package demo; import org.apache.geode.spark.connector.GeodeConnectionConf; import org.apache.spark.SparkConf; import org.apache.spark.api.java.JavaPairRDD; import org.apache.spark.api.java.JavaRDD; import org.apache.spark.api.java.JavaSparkContext; import scala.Tuple2; import java.util.*; import static org.apache.geode.spark.connector.javaapi.GeodeJavaUtil.*; /** * This Spark application demonstrates how to save a RDD to Geode using Geode Spark * Connector with Java. * <p/> * In order to run it, you will need to start Geode cluster, and create the following region * with GFSH: * <pre> * gfsh> create region --name=str_str_region --type=REPLICATE \ * --key-constraint=java.lang.String --value-constraint=java.lang.String * </pre> * * Once you compile and package the demo, the jar file basic-demos_2.10-0.5.0.jar * should be generated under geode-spark-demos/basic-demos/target/scala-2.10/. * Then run the following command to start a Spark job: * <pre> * <path to spark>/bin/spark-submit --master=local[2] --class demo.PairRDDSaveJavaDemo \ * <path to>/basic-demos_2.10-0.5.0.jar <locator host>:<port> * </pre> * * Verify the data was saved to Geode with GFSH: * <pre>gfsh> query --query="select * from /str_str_region.entrySet" </pre> */ public class PairRDDSaveJavaDemo { public static void main(String[] argv) { if (argv.length != 1) { System.err.printf("Usage: PairRDDSaveJavaDemo <locators>\n"); return; } SparkConf conf = new SparkConf().setAppName("PairRDDSaveJavaDemo"); conf.set(GeodeLocatorPropKey, argv[0]); JavaSparkContext sc = new JavaSparkContext(conf); GeodeConnectionConf connConf = GeodeConnectionConf.apply(conf); List<Tuple2<String, String>> data = new ArrayList<>(); data.add(new Tuple2<>("7", "seven")); data.add(new Tuple2<>("8", "eight")); data.add(new Tuple2<>("9", "nine")); List<Tuple2<String, String>> data2 = new ArrayList<Tuple2<String, String>>(); data2.add(new Tuple2<>("11", "eleven")); data2.add(new Tuple2<>("12", "twelve")); data2.add(new Tuple2<>("13", "thirteen")); // method 1: generate JavaPairRDD directly JavaPairRDD<String, String> rdd1 = sc.parallelizePairs(data); javaFunctions(rdd1).saveToGeode("str_str_region", connConf); // method 2: convert JavaRDD<Tuple2<K,V>> to JavaPairRDD<K, V> JavaRDD<Tuple2<String, String>> rdd2 = sc.parallelize(data2); javaFunctions(toJavaPairRDD(rdd2)).saveToGeode("str_str_region", connConf); sc.stop(); } }