Here you can find the source of removeTags(String input, List<String> knownTagList)
private static String removeTags(String input, List<String> knownTagList)
//package com.java2s;
/*
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 * http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

import java.util.List;
import java.util.regex.Matcher;
import java.util.regex.Pattern;

import static java.util.regex.Pattern.*;

/**
 * String helpers for stripping markup-like tags from text.
 */
public class Main {

    /**
     * Matches an opening or closing tag such as {@code <b>}, {@code </b>} or
     * {@code <a href="x">}. Group 1 captures everything between the leading
     * {@code <} (or {@code </}) and the first whitespace character or {@code >}.
     * The pattern contains no literal letters, so {@code CASE_INSENSITIVE} does
     * not influence what it matches; the flag is kept from the original code.
     */
    private static final Pattern TAG_PATTERN =
            compile("</?([^\\s>]*)\\s*[^>]*>", CASE_INSENSITIVE);

    /**
     * Removes every tag whose name is not contained in {@code knownTagList}.
     *
     * <p>Tags are located in the original {@code input}; for each tag with an
     * unknown name, all literal occurrences of that tag's exact text are deleted
     * from the result. Text between tags is left in place.
     *
     * <p>Notes on matching, all following from the pattern and the
     * {@code List.contains} lookup:
     * <ul>
     *   <li>Names are compared case-sensitively ({@code "B"} is not {@code "b"}).</li>
     *   <li>A self-closing tag written without a space, e.g. {@code <br/>},
     *       yields the name {@code "br/"}, so listing {@code "br"} does not keep it.</li>
     * </ul>
     *
     * @param input        the text to clean; must not be {@code null}
     * @param knownTagList tag names that must be preserved; must not be {@code null}
     * @return {@code input} with all unknown tags removed
     */
    private static String removeTags(String input, List<String> knownTagList) {
        // The matcher keeps scanning the original text even though `input` is
        // reassigned below, because String instances are immutable.
        Matcher matches = TAG_PATTERN.matcher(input);
        while (matches.find()) {
            if (!knownTagList.contains(matches.group(1))) {
                // Literal replacement: same result as replaceAll(quote(tag), "").
                input = input.replace(matches.group(), "");
            }
        }
        return input;
    }

    /**
     * Removes every region that starts with {@code startTag} and ends with the
     * next {@code endTag}, delimiters included.
     *
     * <p>If a {@code startTag} has no following {@code endTag}, everything from
     * that {@code startTag} to the end of the text is dropped. After each removal
     * the text is searched again from the beginning, so a {@code startTag} formed
     * by joining the text on either side of a removed region is processed too.
     *
     * <p>An empty {@code startTag} designates nothing to remove and returns
     * {@code input} unchanged (previously this case looped forever).
     *
     * @param input    the text to clean
     * @param startTag the literal text that opens a region to remove; must not be {@code null}
     * @param endTag   the literal text that closes a region to remove; must not be {@code null}
     * @return {@code input} with all delimited regions removed
     */
    private static String removeTags(String input, String startTag, String endTag) {
        if (startTag.isEmpty()) {
            // contains("") is always true, so the loop below would never end.
            return input;
        }

        int start = input.indexOf(startTag);
        while (start != -1) {
            int contentStart = start + startTag.length();
            int end = input.indexOf(endTag, contentStart);
            if (end == -1) {
                // Unterminated region: cut to the end. The remaining prefix
                // cannot contain startTag because `start` was its first occurrence.
                return input.substring(0, start);
            }
            input = input.substring(0, start) + input.substring(end + endTag.length());
            start = input.indexOf(startTag);
        }
        return input;
    }
}