/*! ******************************************************************************
 *
 * Pentaho Data Integration
 *
 * Copyright (C) 2002-2016 by Pentaho : http://www.pentaho.com
 *
 *******************************************************************************
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with
 * the License. You may obtain a copy of the License at
 *
 *    http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 *
 ******************************************************************************/

package org.pentaho.di.www;

import org.apache.commons.lang.StringUtils;

import java.util.regex.Matcher;
import java.util.regex.Pattern;

/**
 * Static helpers for servlet tests that check whether text has been escaped for HTML/XML output.
 */
public class ServletTestUtils {

  /** Characters that must not appear literally in escaped output. */
  public static final char[] BAD_CHARACTERS_TO_ESCAPE = { '<', '>', '\'', '\"' };

  /** Sample input containing every character that escaping is expected to neutralise. */
  public static final String BAD_STRING_TO_TEST = "!@#$%\"\'^&*()<>&/test string&";

  // Pattern to check that ampersand character '&' was successfully escaped.
  // Eg search excluding '&amp;', '&lt;', '&gt;', '&quot;', '&apos;', and numeric references '&#...;' / '&#x...;'.
  //
  // A match means a bare '&' was found, i.e. one that does not start any of the references listed above.
  // Group 1 captures that ampersand.
  public static final Pattern PATTERN = Pattern.compile(
    "(&(?!amp;|lt;|gt;|quot;|apos;|#[0-9a-f]{1,5};|#[xX][0-9a-fA-F]{1,6};))" );

  /**
   * Returns the text between the first {@code <tag>} and the first {@code </tag>} that follows it.
   *
   * @param tag    tag name without angle brackets; only the exact attribute-less form {@code <tag>} is matched
   * @param string text to search
   * @return the content between the opening and the closing tag (may be empty)
   * @throws StringIndexOutOfBoundsException if the opening tag is absent, or no closing tag follows it
   */
  public static String getInsideOfTag( String tag, String string ) {
    String open = "<" + tag + ">";
    String close = "</" + tag + ">";

    int openIndex = string.indexOf( open );
    if ( openIndex < 0 ) {
      // Without this check the -1 from indexOf would be turned into a bogus start offset
      // and an unrelated substring would be returned silently.
      throw new StringIndexOutOfBoundsException( "Opening tag " + open + " not found" );
    }

    int contentStart = openIndex + open.length();
    // Look for the closing tag only after the opening one, so an earlier stray closing tag is ignored.
    int closeIndex = string.indexOf( close, contentStart );
    if ( closeIndex < 0 ) {
      throw new StringIndexOutOfBoundsException( "Closing tag " + close + " not found after " + open );
    }

    return string.substring( contentStart, closeIndex );
  }

  /**
   * Tells whether the given text still contains unescaped markup-significant characters.
   *
   * @param value text to inspect; must not be {@code null}
   * @return {@code true} if {@code value} contains an ampersand that does not start one of the references accepted
   *         by {@link #PATTERN}, or any of {@link #BAD_CHARACTERS_TO_ESCAPE}; {@code false} otherwise
   */
  public static boolean hasBadText( String value ) {
    Matcher matcher = PATTERN.matcher( value );
    if ( matcher.find() ) {
      return true;
    }
    return StringUtils.containsAny( value, BAD_CHARACTERS_TO_ESCAPE );
  }
}