no.get.cms.plugin.resourcecompressor.ContentLoader.java Source code

Java tutorial

Introduction

Here is the source code for no.get.cms.plugin.resourcecompressor.ContentLoader.java

Source

/*
Copyright 2012 Get AS
    
Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at
    
http://www.apache.org/licenses/LICENSE-2.0
    
Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
 */
package no.get.cms.plugin.resourcecompressor;

import org.apache.commons.io.IOUtils;

import java.io.IOException;
import java.io.InputStream;
import java.net.MalformedURLException;
import java.net.URL;
import java.net.URLConnection;
import java.nio.charset.Charset;
import java.util.regex.Matcher;
import java.util.regex.Pattern;

/**
 * Fetches the textual content behind a URL and returns it as a {@link String}.
 *
 * <p>The response body is decoded with the charset announced in the response's
 * {@code Content-Type} header; when no usable charset is announced, UTF-8 is used.
 */
public class ContentLoader {

    /** Charset used when the response does not declare a usable one. */
    private static final String DEFAULT_CHARSET = "UTF-8";

    /** Connect timeout in milliseconds. */
    private static final int CONNECT_TIMEOUT_MILLIS = 2000;

    /** Read timeout in milliseconds. */
    private static final int READ_TIMEOUT_MILLIS = 10000;

    /**
     * Matches the {@code charset} parameter of a Content-Type value, e.g.
     * {@code text/css; charset=ISO-8859-1} or {@code text/css;charset="utf-8"}.
     * Group 1 captures the charset name without surrounding quotes.
     */
    private static final Pattern CHARSET_PATTERN =
            Pattern.compile("\\bcharset\\s*=\\s*\"?([^\\s;\"]+)", Pattern.CASE_INSENSITIVE);

    /**
     * Downloads the resource at {@code srcUrl} and returns its body as text.
     *
     * @param srcUrl the URL to load
     * @return the response body decoded with the charset declared by the server,
     *         or with UTF-8 when none is declared or the declared one is unsupported
     * @throws RuntimeException wrapping the underlying {@link IOException}
     *         (including {@link java.net.MalformedURLException}) when the URL is
     *         invalid or the content cannot be read
     */
    public String load(String srcUrl) {
        URLConnection connection = null;
        InputStream inputStream = null;
        try {
            connection = new URL(srcUrl).openConnection();
            connection.setRequestProperty("Accept-Charset", DEFAULT_CHARSET);
            connection.setConnectTimeout(CONNECT_TIMEOUT_MILLIS);
            connection.setReadTimeout(READ_TIMEOUT_MILLIS);
            connection.connect();
            inputStream = connection.getInputStream();
            String charset = extractCharsetFromContentType(connection.getContentType());
            return IOUtils.toString(inputStream, charset);
        } catch (IOException e) {
            // MalformedURLException is an IOException, so this covers both failure modes.
            throw new RuntimeException("Failed to load content from " + srcUrl, e);
        } finally {
            // Release the stream and the connection on success and on failure alike.
            IOUtils.closeQuietly(inputStream);
            IOUtils.close(connection);
        }
    }

    /**
     * Extracts the charset name from a Content-Type header value.
     *
     * @param contentType the raw Content-Type value; may be {@code null} when the
     *        response carries no such header
     * @return the declared charset name if present and supported by this JVM,
     *         otherwise {@code "UTF-8"}
     */
    private String extractCharsetFromContentType(String contentType) {
        if (contentType == null) {
            return DEFAULT_CHARSET;
        }
        Matcher matcher = CHARSET_PATTERN.matcher(contentType);
        if (!matcher.find()) {
            return DEFAULT_CHARSET;
        }
        String declared = matcher.group(1);
        try {
            return Charset.isSupported(declared) ? declared : DEFAULT_CHARSET;
        } catch (IllegalArgumentException e) {
            // Syntactically illegal charset name sent by the server: fall back to the default.
            return DEFAULT_CHARSET;
        }
    }
}