com.switchfly.inputvalidation.sanitizer.StripHtmlSanitizer.java Source code

Java tutorial

Introduction

Here is the source code for com.switchfly.inputvalidation.sanitizer.StripHtmlSanitizer.java

Source

/*
 * Copyright 2012 Switchfly
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

package com.switchfly.inputvalidation.sanitizer;

import org.apache.commons.lang.StringUtils;
import org.jsoup.Jsoup;
import org.jsoup.nodes.Document;
import org.jsoup.nodes.Element;
import org.jsoup.nodes.Entities;

/**
 * A {@link Sanitizer} for strings that parses its input as HTML with jsoup and returns the
 * text of the parsed document, after removing every {@code script}, {@code link},
 * {@code iframe} and {@code style} element from it.
 */
public class StripHtmlSanitizer implements Sanitizer<String> {

    /** Selector for the elements that are dropped from the document before its text is read. */
    private static final String REMOVED_ELEMENTS_SELECTOR = "script,link,iframe,style";

    /**
     * Reduces {@code content} to the text of its parsed HTML document.
     *
     * @param content the raw input to sanitize
     * @return {@code content} itself when {@code StringUtils.isBlank(content)} is true;
     *         otherwise the result of {@code Document.text()} on the parsed input once the
     *         unwanted elements have been removed
     */
    @Override
    public String execute(String content) {
        if (!StringUtils.isBlank(content)) {
            Document parsed = Jsoup.parse(content);
            // NOTE(review): this sets the escape mode on the document's output settings;
            // confirm whether it has any effect on the text() call below.
            parsed.outputSettings().escapeMode(Entities.EscapeMode.xhtml);
            // Detach every matching element from the document in one call.
            parsed.select(REMOVED_ELEMENTS_SELECTOR).remove();
            // NOTE(review): presumably text() yields unescaped text, so entity-encoded markup
            // in the input may come back as literal markup — verify callers encode on output.
            return parsed.text();
        }
        // Blank input is handed back untouched.
        return content;
    }
}