package com.thinkbiganalytics.nifi.pyspark.utils; /*- * #%L * thinkbig-nifi-spark-processors * %% * Copyright (C) 2017 ThinkBig Analytics * %% * Licensed under the Apache License, Version 2.0 (the "License"); * you may not use this file except in compliance with the License. * You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. * #L% */ import javax.annotation.Nonnull; /** * Helper utilities for ExecutePySpark processor */ public class PySparkUtils { private final static String CSV_DELIMITER = ","; private final static String PAIR_DELIMITER = "="; /** * Basic validation to check that a string is for the form value1,value2,value3 and so on * * @param appArgs String containing value to check * @return true/false result of validation */ public boolean validateCsvArgs(@Nonnull String appArgs) { if (appArgs.isEmpty()) { return false; } if ((appArgs.charAt(0) == CSV_DELIMITER.charAt(0)) || (appArgs.charAt(appArgs.length() - 1) == CSV_DELIMITER.charAt(0))) { return false; } String[] providedArgs; try { providedArgs = appArgs.split(","); } catch (Exception e) { return false; } return (providedArgs.length > 0); } /** * Get an array of values that are separated by commas in a single string * * @param appArgs String containing comma-separated values * @return String array of the values */ public String[] getCsvValuesAsArray(@Nonnull String appArgs) { if (!validateCsvArgs(appArgs)) { return new String[]{}; } return appArgs.split(CSV_DELIMITER); } /** * Get a string of values separated by comma from an array of values * * @param values Array of string values * @return String containing values separated by comma */ public String getCsvStringFromArray(@Nonnull String[] values) { if (values.length == 0) { return ""; } StringBuilder retVal = new StringBuilder(); for (int i = 0; i < values.length; i++) { retVal.append(values[i]); if (i != values.length - 1) { retVal.append(","); } } return retVal.toString(); } /** * Basic validation to check that a string is in the form key1=value1,key2=value2,key3=value3 and so on * * @param args String containing value to check * @return true/false result of validation */ public boolean validateKeyValueArgs(String args) { String[] keyValueArgsAsList = getCsvValuesAsArray(args); if (keyValueArgsAsList.length == 0) { return false; } for (String keyValuePair : keyValueArgsAsList) { if (!validateKeyValuePair(keyValuePair)) { return false; } } return true; } /** * Basic validation to check that a string is in the form key=value * * @param keyValuePair String containing value to check * @return true/false result of validation */ public boolean validateKeyValuePair(String keyValuePair) { if ((keyValuePair == null) || (keyValuePair.isEmpty())) { return false; } if (keyValuePair.charAt(0) == PAIR_DELIMITER.charAt(0) || (keyValuePair.charAt(keyValuePair.length() - 1) == PAIR_DELIMITER.charAt(0))) { return false; } int equalCount = 0; for (int i = 0; i < keyValuePair.length(); i++) { if (keyValuePair.charAt(i) == PAIR_DELIMITER.charAt(0)) { equalCount++; } if (equalCount > 1) { return false; } } return (equalCount == 1); } }