/* * Licensed to the Apache Software Foundation (ASF) under one * or more contributor license agreements. See the NOTICE file * distributed with this work for additional information * regarding copyright ownership. The ASF licenses this file * to you under the Apache License, Version 2.0 (the * "License"); you may not use this file except in compliance * with the License. You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. */ package org.apache.pig.piggybank.evaluation.string; import java.io.IOException; import org.apache.pig.EvalFunc; import org.apache.pig.PigWarning; import org.apache.pig.data.DataType; import org.apache.pig.data.Tuple; import org.apache.pig.impl.logicalLayer.schema.Schema; /** * Given a string, this UDF replaces a substring given its starting index and * length with the given replacement string. If the the last argument is null, the specified * part of the string gets deleted. * * B = FOREACH A GENERATE Stuff($0, 10, 4, 'Pie') * If $0 is "Chocolate Cake" then the UDF will return "Chocolate Pie" * **/ public class Stuff extends EvalFunc<String> { public String exec(Tuple input) throws IOException { int inputSize = input.size(); if (input == null || inputSize == 0 || input.get(0) == null) { warn("Null input", PigWarning.UDF_WARNING_1); return null; } if (inputSize != 4) { throw new IOException("Stuff requires 4 arguments"); } String inString = (String) input.get(0); Integer startIndex = null; Object inStartIndex = input.get(1); //handle Double and Float if(inStartIndex instanceof Number){ startIndex = ((Number)inStartIndex).intValue(); }else{ warn("Specified startIndex is of type " + inStartIndex.getClass().getName() + ", only Numbers are supported", PigWarning.UDF_WARNING_1); return null; } Integer length = null; Object inLength = input.get(2); //handle Double and Float if(inLength instanceof Number){ length = ((Number)inLength).intValue(); }else{ warn("Specified length is of type " + inLength.getClass().getName() + ", only Numbers are supported", PigWarning.UDF_WARNING_1); return null; } String replacementString = (String) input.get(3); int strLength = inString.length(); if (startIndex < 0 || startIndex >= strLength) { throw new IOException("Given startIndex " + startIndex + " is out of bounds: [0," + strLength + ")"); } if (length < 0) { throw new IOException( "The number of characters to delete cannot be negative"); } StringBuffer result = new StringBuffer(); int upperBound = (startIndex + length > strLength) ? strLength : startIndex + length; for (int i = 0; i < strLength;) { // need to replace these characters if (i >= startIndex && i < upperBound) { if(replacementString != null) result.append(replacementString); i += length; } else { result.append(inString.charAt(i)); i++; } } return result.toString(); } /** * @param input * , schema of the input data * @return output schema */ @Override public Schema outputSchema(Schema input) { return new Schema(new Schema.FieldSchema(null, DataType.CHARARRAY)); } }