com.gu.logback.appender.kinesis.KinesisAppender.java Source code

Java tutorial

Introduction

Here is the source code for com.gu.logback.appender.kinesis.KinesisAppender.java

Source

/*******************************************************************************
 * Copyright 2014 Amazon.com, Inc. or its affiliates. All Rights Reserved.
 * 
 * Licensed under the Apache License, Version 2.0 (the "License").
 * You may not use this file except in compliance with the License.
 * A copy of the License is located at
 * 
 *  http://aws.amazon.com/apache2.0
 * 
 * or in the "license" file accompanying this file. This file is distributed
 * on an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either
 * express or implied. See the License for the specific language governing
 * permissions and limitations under the License.
 ******************************************************************************/

package com.gu.logback.appender.kinesis;

import java.nio.ByteBuffer;
import java.util.UUID;
import java.util.concurrent.BlockingQueue;
import java.util.concurrent.LinkedBlockingDeque;
import java.util.concurrent.ThreadPoolExecutor;
import java.util.concurrent.TimeUnit;
import com.amazonaws.ClientConfiguration;
import com.amazonaws.auth.AWSCredentialsProvider;
import com.amazonaws.auth.STSAssumeRoleSessionCredentialsProvider;
import com.amazonaws.regions.Region;
import com.amazonaws.regions.Regions;
import com.amazonaws.retry.PredefinedRetryPolicies;
import com.amazonaws.retry.RetryPolicy;
import com.amazonaws.services.kinesis.AmazonKinesisAsyncClient;
import com.amazonaws.services.kinesis.model.DescribeStreamResult;
import com.amazonaws.services.kinesis.model.PutRecordRequest;
import com.amazonaws.services.kinesis.model.ResourceNotFoundException;
import com.amazonaws.services.kinesis.model.StreamStatus;
import com.gu.logback.appender.kinesis.helpers.AsyncPutCallStatsReporter;
import com.gu.logback.appender.kinesis.helpers.BlockFastProducerPolicy;
import com.gu.logback.appender.kinesis.helpers.CustomCredentialsProviderChain;
import com.gu.logback.appender.kinesis.helpers.Validator;
import ch.qos.logback.core.AppenderBase;
import ch.qos.logback.core.LayoutBase;
import ch.qos.logback.core.spi.DeferredProcessingAware;

/**
 * LOGBack Appender implementation to support sending data from java applications
 * directly into a Kinesis stream.
 * 
 * More details are available <a
 * href="https://github.com/guardian/kinesis-logback-appender">here</a>
 */
public class KinesisAppender<Event extends DeferredProcessingAware> extends AppenderBase<Event> {

    private String encoding = AppenderConstants.DEFAULT_ENCODING;
    private int maxRetries = AppenderConstants.DEFAULT_MAX_RETRY_COUNT;
    private int bufferSize = AppenderConstants.DEFAULT_BUFFER_SIZE;
    private int threadCount = AppenderConstants.DEFAULT_THREAD_COUNT;
    private int shutdownTimeout = AppenderConstants.DEFAULT_SHUTDOWN_TIMEOUT_SEC;

    private String endpoint;
    private String region;
    private String streamName;
    private String roleToAssumeArn;

    private boolean initializationFailed = false;
    private BlockingQueue<Runnable> taskBuffer;
    private AmazonKinesisAsyncClient kinesisClient;
    private AsyncPutCallStatsReporter asyncCallHander;
    private LayoutBase<Event> layout;
    private AWSCredentialsProvider credentials = new CustomCredentialsProviderChain();

    public LayoutBase<Event> getLayout() {
        return layout;
    }

    public void setLayout(LayoutBase<Event> layout) {
        this.layout = layout;
    }

    /**
     * Configures this appender instance and makes it ready for use by the
     * consumers. It validates mandatory parameters and confirms if the configured
     * stream is ready for publishing data yet.
     * 
     * Error details are made available through the fallback handler for this
     * appender
     * 
     * @throws IllegalStateException
     *           if we encounter issues configuring this appender instance
     */
    @Override
    public void start() {
        if (layout == null) {
            initializationFailed = true;
            addError("Invalid configuration - No layout for appender: " + name);
            return;
        }

        if (streamName == null) {
            initializationFailed = true;
            addError("Invalid configuration - streamName cannot be null for appender: " + name);
            return;
        }

        ClientConfiguration clientConfiguration = new ClientConfiguration();
        clientConfiguration.setMaxErrorRetry(maxRetries);
        clientConfiguration.setRetryPolicy(new RetryPolicy(PredefinedRetryPolicies.DEFAULT_RETRY_CONDITION,
                PredefinedRetryPolicies.DEFAULT_BACKOFF_STRATEGY, maxRetries, true));
        clientConfiguration.setUserAgent(AppenderConstants.USER_AGENT_STRING);

        BlockingQueue<Runnable> taskBuffer = new LinkedBlockingDeque<Runnable>(bufferSize);
        ThreadPoolExecutor threadPoolExecutor = new ThreadPoolExecutor(threadCount, threadCount,
                AppenderConstants.DEFAULT_THREAD_KEEP_ALIVE_SEC, TimeUnit.SECONDS, taskBuffer,
                new BlockFastProducerPolicy());
        threadPoolExecutor.prestartAllCoreThreads();
        kinesisClient = new AmazonKinesisAsyncClient(credentials, clientConfiguration, threadPoolExecutor);

        boolean regionProvided = !Validator.isBlank(region);
        if (!regionProvided) {
            region = AppenderConstants.DEFAULT_REGION;
        }
        kinesisClient.setRegion(Region.getRegion(Regions.fromName(region)));
        if (!Validator.isBlank(endpoint)) {
            if (regionProvided) {
                addError("Received configuration for both region as well as Amazon Kinesis endpoint. (" + endpoint
                        + ") will be used as endpoint instead of default endpoint for region (" + region + ")");
            }
            kinesisClient.setEndpoint(endpoint);
        }

        DescribeStreamResult describeResult = null;
        try {
            describeResult = kinesisClient.describeStream(streamName);
            String streamStatus = describeResult.getStreamDescription().getStreamStatus();
            if (!StreamStatus.ACTIVE.name().equals(streamStatus)
                    && !StreamStatus.UPDATING.name().equals(streamStatus)) {
                initializationFailed = true;
                addError(
                        "Stream " + streamName + " is not ready (in active/updating status) for appender: " + name);
            }
        } catch (ResourceNotFoundException rnfe) {
            initializationFailed = true;
            addError("Stream " + streamName + " doesn't exist for appender: " + name, rnfe);
        }

        asyncCallHander = new AsyncPutCallStatsReporter(this);

        super.start();
    }

    /**
     * Closes this appender instance. Before exiting, the implementation tries to
     * flush out buffered log events within configured shutdownTimeout seconds. If
     * that doesn't finish within configured shutdownTimeout, it would drop all
     * the buffered log events.
     */
    @Override
    public void stop() {
        ThreadPoolExecutor threadpool = (ThreadPoolExecutor) kinesisClient.getExecutorService();
        threadpool.shutdown();
        BlockingQueue<Runnable> taskQueue = threadpool.getQueue();
        int bufferSizeBeforeShutdown = threadpool.getQueue().size();
        boolean gracefulShutdown = true;
        try {
            gracefulShutdown = threadpool.awaitTermination(shutdownTimeout, TimeUnit.SECONDS);
        } catch (InterruptedException e) {
            // we are anyways cleaning up
        } finally {
            int bufferSizeAfterShutdown = taskQueue.size();
            if (!gracefulShutdown || bufferSizeAfterShutdown > 0) {
                String errorMsg = "Kinesis Log4J Appender (" + name + ") waited for " + shutdownTimeout
                        + " seconds before terminating but could send only "
                        + (bufferSizeAfterShutdown - bufferSizeBeforeShutdown) + " logevents, it failed to send "
                        + bufferSizeAfterShutdown + " pending log events from it's processing queue";
                addError(errorMsg);
            }
        }
        kinesisClient.shutdown();
    }

    /**
     * This method is called whenever a logging happens via logger.log(..) API
     * calls. Implementation for this appender will take in log events instantly
     * as long as the buffer is not full (as per user configuration). This call
     * will block if internal buffer is full until internal threads create some
     * space by publishing some of the records.
     * 
     * If there is any error in parsing logevents, those logevents would be
     * dropped.
     */
    @Override
    protected void append(Event logEvent) {
        if (initializationFailed) {
            addError("Check the configuration and whether the configured stream " + streamName
                    + " exists and is active. Failed to initialize kinesis logback appender: " + name);
            return;
        }
        try {
            String message = this.layout.doLayout(logEvent);

            putMessage(message);
        } catch (Exception e) {
            addError("Failed to schedule log entry for publishing into Kinesis stream: " + streamName, e);
        }
    }

    private void putMessage(String message) throws Exception {
        ByteBuffer data = ByteBuffer.wrap(message.getBytes(encoding));
        kinesisClient.putRecordAsync(new PutRecordRequest().withPartitionKey(UUID.randomUUID().toString())
                .withStreamName(streamName).withData(data), asyncCallHander);
    }

    /**
     * Returns configured stream name
     * 
     * @return configured stream name
     */
    public String getStreamName() {
        return streamName;
    }

    /**
     * Sets streamName for the kinesis stream to which data is to be published.
     * 
     * @param streamName
     *          name of the kinesis stream to which data is to be published.
     */
    public void setStreamName(String streamName) {
        Validator.validate(!Validator.isBlank(streamName), "streamName cannot be blank");
        this.streamName = streamName.trim();
    }

    /**
     * Configured encoding for the data to be published. If none specified,
     * default is UTF-8
     * 
     * @return encoding for the data to be published. If none specified, default
     *         is UTF-8
     */
    public String getEncoding() {
        return this.encoding;
    }

    /**
     * Sets encoding for the data to be published. If none specified, default is
     * UTF-8
     * 
     * @param charset
     *          encoding for expected log messages
     */
    public void setEncoding(String charset) {
        Validator.validate(!Validator.isBlank(charset), "encoding cannot be blank");
        this.encoding = charset.trim();
    }

    /**
     * Returns configured maximum number of retries between API failures while
     * communicating with Kinesis. This is used in AWS SDK's default retries for
     * HTTP exceptions, throttling errors etc.
     * 
     * @return configured maximum number of retries between API failures while
     *         communicating with Kinesis
     */
    public int getMaxRetries() {
        return maxRetries;
    }

    /**
     * Configures maximum number of retries between API failures while
     * communicating with Kinesis. This is used in AWS SDK's default retries for
     * HTTP exceptions, throttling errors etc.
     * 
     * @param maxRetries 
     *       the number of retries between API failures               
     */
    public void setMaxRetries(int maxRetries) {
        Validator.validate(maxRetries > 0, "maxRetries must be > 0");
        this.maxRetries = maxRetries;
    }

    /**
     * Returns configured buffer size for this appender. This implementation would
     * buffer these many log events in memory while parallel threads are trying to
     * publish them to Kinesis.
     * 
     * @return configured buffer size for this appender.
     */
    public int getBufferSize() {
        return bufferSize;
    }

    /**
     * Configures buffer size for this appender. This implementation would buffer
     * these many log events in memory while parallel threads are trying to
     * publish them to Kinesis.
     *
     * @param bufferSize
     *       buffer size for this appender   
     *
     */
    public void setBufferSize(int bufferSize) {
        Validator.validate(bufferSize > 0, "bufferSize must be >0");
        this.bufferSize = bufferSize;
    }

    /**
     * Returns configured number of parallel thread count that would work on
     * publishing buffered events to Kinesis
     * 
     * @return configured number of parallel thread count that would work on
     *         publishing buffered events to Kinesis
     */
    public int getThreadCount() {
        return threadCount;
    }

    /**
     * Configures number of parallel thread count that would work on publishing
     * buffered events to Kinesis
     *
     * @param parallelCount 
     *       number of parallel thread count 
     *
     */
    public void setThreadCount(int parallelCount) {
        Validator.validate(parallelCount > 0, "threadCount must be >0");
        this.threadCount = parallelCount;
    }

    /**
     * Returns configured timeout between shutdown and clean up. When this
     * appender is asked to close/stop, it would wait for at most these many
     * seconds and try to send all buffered records to Kinesis. However if it
     * fails to publish them before timeout, it would drop those records and exit
     * immediately after timeout.
     * 
     * @return configured timeout for shutdown and clean up.
     */
    public int getShutdownTimeout() {
        return shutdownTimeout;
    }

    /**
     * Configures timeout between shutdown and clean up. When this appender is
     * asked to close/stop, it would wait for at most these many seconds and try
     * to send all buffered records to Kinesis. However if it fails to publish
     * them before timeout, it would drop those records and exit immediately after
     * timeout.
     *
     * @param shutdownTimeout 
     *       timeout between shutdown and clean up   
     *
     */
    public void setShutdownTimeout(int shutdownTimeout) {
        Validator.validate(shutdownTimeout > 0, "shutdownTimeout must be >0");
        this.shutdownTimeout = shutdownTimeout;
    }

    /**
     * Returns count of tasks scheduled to send records to Kinesis. Since
     * currently each task maps to sending one record, it is equivalent to number
     * of records in the buffer scheduled to be sent to Kinesis.
     * 
     * @return count of tasks scheduled to send records to Kinesis.
     */
    public int getTaskBufferSize() {
        return taskBuffer.size();
    }

    public String getRoleToAssumeArn() {
        return roleToAssumeArn;
    }

    public void setRoleToAssumeArn(String roleToAssumeArn) {
        this.roleToAssumeArn = roleToAssumeArn;
        if (!Validator.isBlank(roleToAssumeArn)) {
            String sessionId = "session" + Math.random();
            STSAssumeRoleSessionCredentialsProvider remoteAccountCredentials = new STSAssumeRoleSessionCredentialsProvider(
                    credentials, roleToAssumeArn, sessionId);

            credentials = remoteAccountCredentials;
        }
    }

    public void setCredentialsProvider(AWSCredentialsProvider credentialsProvider) {
        this.credentials = credentialsProvider;
    }

    /**
     * Returns configured Kinesis endpoint.
     * 
     * @return configured kinesis endpoint
     */
    public String getEndpoint() {
        return endpoint;
    }

    /**
     * Set kinesis endpoint. If set, it overrides the default kinesis endpoint in
     * the configured region
     * 
     * @param endpoint
     *          kinesis endpoint to which requests should be made.
     */
    public void setEndpoint(String endpoint) {
        this.endpoint = endpoint;
    }

    /**
     * Returns configured region for Kinesis.
     * 
     * @return configured region for Kinesis
     */
    public String getRegion() {
        return region;
    }

    /**
     * Configures the region and default endpoint for all Kinesis calls. If not
     * overridden by {@link #setEndpoint(String)}, all Kinesis requests are made
     * to the default endpoint in this region.
     * 
     * @param region
     *          the Kinesis region whose endpoint should be used for kinesis
     *          requests
     */
    public void setRegion(String region) {
        this.region = region;
    }
}