/*
 * Licensed to the Apache Software Foundation (ASF) under one or more
 * contributor license agreements.  See the NOTICE file distributed with
 * this work for additional information regarding copyright ownership.
 * The ASF licenses this file to You under the Apache License, Version 2.0
 * (the "License"); you may not use this file except in compliance with
 * the License.  You may obtain a copy of the License at
 *
 *      http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
package demo;

import org.apache.geode.spark.connector.GeodeConnectionConf;
import org.apache.spark.SparkConf;
import org.apache.spark.api.java.JavaRDD;
import org.apache.spark.api.java.JavaSparkContext;
import org.apache.spark.api.java.function.PairFunction;
import scala.Tuple2;

import java.util.ArrayList;
import java.util.List;

import static org.apache.geode.spark.connector.javaapi.GeodeJavaUtil.*;

/**
 * This Spark application demonstrates how to save an RDD to Geode using the Geode Spark
 * Connector with Java.
 * <p/>
 * In order to run it, you will need to start a Geode cluster and create the following region
 * with GFSH:
 * <pre>
 * gfsh> create region --name=str_int_region --type=REPLICATE \
 *         --key-constraint=java.lang.String --value-constraint=java.lang.Integer
 * </pre>
 *
 * Once you compile and package the demo, the jar file basic-demos_2.10-0.5.0.jar
 * should be generated under geode-spark-demos/basic-demos/target/scala-2.10/.
 * Then run the following command to start a Spark job:
 * <pre>
 *   <path to spark>/bin/spark-submit --master=local[2] --class demo.RDDSaveJavaDemo \
 *       <path to>/basic-demos_2.10-0.5.0.jar <locator host>:<port>
 * </pre>
 *
 * Verify that the data was saved to Geode with GFSH:
 * <pre>gfsh> query --query="select * from /str_int_region.entrySet" </pre>
 */
public class RDDSaveJavaDemo {

  public static void main(String[] argv) {

    if (argv.length != 1) {
      System.err.printf("Usage: RDDSaveJavaDemo <locators>\n");
      return;
    }

    SparkConf conf = new SparkConf().setAppName("RDDSaveJavaDemo");
    conf.set(GeodeLocatorPropKey, argv[0]);
    JavaSparkContext sc = new JavaSparkContext(conf);

    // Build a small RDD of strings to save to Geode.
    List<String> data = new ArrayList<String>();
    data.add("abcdefg");
    data.add("abcdefgh");
    data.add("abcdefghi");
    JavaRDD<String> rdd = sc.parallelize(data);

    // Connection configuration is derived from the SparkConf (locator host:port).
    GeodeConnectionConf connConf = GeodeConnectionConf.apply(conf);

    // Map each string to a (string, length) pair; the pair becomes the key/value
    // of an entry in the Geode region.
    PairFunction<String, String, Integer> func = new PairFunction<String, String, Integer>() {
      @Override
      public Tuple2<String, Integer> call(String s) throws Exception {
        return new Tuple2<String, Integer>(s, s.length());
      }
    };

    // Save the RDD to the pre-created region.
    javaFunctions(rdd).saveToGeode("str_int_region", func, connConf);

    sc.stop();
  }
}