Java tutorial
/*! ******************************************************************************
 *
 * Pentaho Data Integration
 *
 * Copyright (C) 2002-2016 by Pentaho : http://www.pentaho.com
 *
 *******************************************************************************
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with
 * the License. You may obtain a copy of the License at
 *
 *    http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 *
 ******************************************************************************/

package org.pentaho.di.www;

import org.apache.commons.lang.StringUtils;

import java.util.regex.Matcher;
import java.util.regex.Pattern;

/**
 * Static helpers for checking whether a piece of text still contains
 * characters that should have been HTML-escaped.
 */
public class ServletTestUtils {

    /** Characters that must not appear literally in escaped text. */
    public static final char[] BAD_CHARACTERS_TO_ESCAPE = { '<', '>', '\'', '\"' };

    /**
     * Sample input that contains every character of {@link #BAD_CHARACTERS_TO_ESCAPE}
     * as well as several bare ampersands.
     */
    public static final String BAD_STRING_TO_TEST = "!@#$%\"\'^&*()<>&/test string&";

    /**
     * Finds an ampersand that was <em>not</em> escaped, i.e. a {@code &} that does not
     * start one of the recognised character references:
     * {@code &amp;}, {@code &lt;}, {@code &gt;}, {@code &quot;}, {@code &apos;},
     * or a numeric reference such as {@code &#39;} or {@code &#x27;}.
     *
     * <p>The misspelling {@code &quote;} and the un-prefixed form {@code &#[0-9a-f]{1,5};}
     * are still tolerated so that inputs accepted by earlier versions of this pattern
     * remain accepted. Group 1 is the offending ampersand.
     */
    public static final Pattern PATTERN = Pattern.compile(
            "(&(?!amp;|lt;|gt;|quote?;|apos;"
                    + "|#[0-9a-f]{1,5};"
                    + "|#[xX][0-9a-fA-F]{1,6};))");

    /**
     * Returns the text between the first {@code <tag>} and the first
     * {@code </tag>} that follows it.
     *
     * @param tag    element name without angle brackets, e.g. {@code "H1"}
     * @param string text to search
     * @return the characters between the opening tag and its closing tag
     * @throws StringIndexOutOfBoundsException if the opening tag is absent, or no
     *         closing tag follows it
     */
    public static String getInsideOfTag(String tag, String string) {
        String open = "<" + tag + ">";
        String close = "</" + tag + ">";

        int openIndex = string.indexOf(open);
        if (openIndex < 0) {
            // Previously -1 + open.length() silently produced a wrong slice.
            throw new StringIndexOutOfBoundsException(
                    "Opening tag " + open + " not found in: " + string);
        }

        int contentStart = openIndex + open.length();
        // Search only after the opening tag so an earlier stray closing tag is ignored.
        int closeIndex = string.indexOf(close, contentStart);
        if (closeIndex < 0) {
            throw new StringIndexOutOfBoundsException(
                    "Closing tag " + close + " not found after " + open + " in: " + string);
        }

        return string.substring(contentStart, closeIndex);
    }

    /**
     * Reports whether {@code value} still contains text that should have been escaped:
     * either a bare ampersand (see {@link #PATTERN}) or any character listed in
     * {@link #BAD_CHARACTERS_TO_ESCAPE}.
     *
     * @param value text to inspect; must not be {@code null}
     * @return {@code true} if an unescaped ampersand or bad character is present
     */
    public static boolean hasBadText(String value) {
        Matcher matcher = PATTERN.matcher(value);
        if (matcher.find()) {
            return true;
        }
        return StringUtils.containsAny(value, BAD_CHARACTERS_TO_ESCAPE);
    }
}