org.apache.gobblin.util.test.RetentionTestHelper.java Source code

Java tutorial

Introduction

Here is the source code for org.apache.gobblin.util.test.RetentionTestHelper.java

Source

/*
 * Licensed to the Apache Software Foundation (ASF) under one or more
 * contributor license agreements.  See the NOTICE file distributed with
 * this work for additional information regarding copyright ownership.
 * The ASF licenses this file to You under the Apache License, Version 2.0
 * (the "License"); you may not use this file except in compliance with
 * the License.  You may obtain a copy of the License at
 *
 *    http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
package org.apache.gobblin.util.test;

import static org.mockito.Matchers.any;
import static org.mockito.Mockito.mock;
import static org.mockito.Mockito.when;

import java.io.InputStream;
import java.util.Map.Entry;
import java.util.Properties;

import org.apache.commons.lang3.StringUtils;
import org.apache.commons.lang3.reflect.ConstructorUtils;
import org.apache.hadoop.fs.FileSystem;
import org.apache.hadoop.fs.Path;

import com.google.common.base.Optional;
import com.google.common.collect.ImmutableList;
import com.google.common.collect.ImmutableMap;
import com.typesafe.config.Config;
import com.typesafe.config.ConfigFactory;

import org.apache.gobblin.config.client.ConfigClient;
import org.apache.gobblin.configuration.ConfigurationKeys;
import org.apache.gobblin.data.management.retention.DatasetCleaner;
import org.apache.gobblin.data.management.retention.dataset.CleanableDataset;
import org.apache.gobblin.data.management.retention.dataset.CleanableDatasetBase;
import org.apache.gobblin.data.management.retention.profile.MultiCleanableDatasetFinder;
import org.apache.gobblin.dataset.Dataset;
import org.apache.gobblin.dataset.DatasetsFinder;
import org.apache.gobblin.util.PathUtils;
import org.apache.gobblin.util.reflection.GobblinConstructorUtils;

/**
 * Helper methods for Retention integration tests.
 */
public class RetentionTestHelper {

    /**
     * Does gobblin retention for test data.
     *
     * <p>{@link DatasetCleaner}, which does retention in production, can not be called directly because some
     * runtime properties like ${testNameTempPath} need to be resolved first. That directory contains all the
     * setup data created for a test by {@link RetentionTestDataGenerator#setup()} and is unique for each test.
     * The default {@link ConfigClient} used by {@link DatasetCleaner} connects to config store configs, so a
     * mock {@link ConfigClient} is provided here since the configs are on the classpath and not on a config store.
     *
     * <p>Two kinds of retention config are supported, selected by the resource name:
     * <ul>
     *   <li>Name ending in <code>.job</code>: the resource is loaded as a properties file, every occurrence of
     *       ${testNameTempPath} in its values is replaced with {@code testNameTempPath.toString()}, and the
     *       datasets found by a {@link MultiCleanableDatasetFinder} are cleaned. The additional job properties
     *       are loaded (and validated) but are NOT applied in this mode.</li>
     *   <li>Anything else: the resource is parsed as a typesafe {@link Config} with <code>testNameTempPath</code>
     *       (scheme and authority stripped) available for substitution. The finder class named by
     *       {@link MultiCleanableDatasetFinder#DATASET_FINDER_CLASS_KEY} is instantiated reflectively and the
     *       datasets it finds are cleaned. The additional job properties are merged into the job properties
     *       in this mode.</li>
     * </ul>
     *
     * @param fs file system handed to the dataset finder
     * @param retentionConfigClasspathResource this is the same jobProps/config files used while running a real
     *        retention job
     * @param additionalJobPropsClasspathResource optional classpath properties file with extra job properties
     * @param testNameTempPath temp path for this test where test data is generated
     * @throws IllegalArgumentException if the additional job properties resource, or a <code>.job</code>
     *         retention config resource, can not be found on the classpath
     * @throws Exception if loading the configuration, finding the datasets or cleaning them fails
     */
    public static void clean(FileSystem fs, Path retentionConfigClasspathResource,
            Optional<Path> additionalJobPropsClasspathResource, Path testNameTempPath) throws Exception {

        // Loaded up front (before choosing a mode) so that a bad resource path fails in both modes.
        Properties additionalJobProps = additionalJobPropsClasspathResource.isPresent()
                ? loadClasspathProperties(additionalJobPropsClasspathResource.get())
                : new Properties();

        if (retentionConfigClasspathResource.getName().endsWith(".job")) {
            cleanUsingJobFile(fs, retentionConfigClasspathResource, testNameTempPath);
        } else {
            cleanUsingConfig(fs, retentionConfigClasspathResource, additionalJobProps, testNameTempPath);
        }
    }

    /**
     * Same as {@link #clean(FileSystem, Path, Optional, Path)} without any additional job properties.
     *
     * @param fs file system handed to the dataset finder
     * @param retentionConfigClasspathResource this is the same jobProps/config files used while running a real
     *        retention job
     * @param testNameTempPath temp path for this test where test data is generated
     * @throws Exception if loading the configuration, finding the datasets or cleaning them fails
     */
    public static void clean(FileSystem fs, Path retentionConfigClasspathResource, Path testNameTempPath)
            throws Exception {
        clean(fs, retentionConfigClasspathResource, Optional.<Path>absent(), testNameTempPath);
    }

    /** Runs retention driven by a <code>.job</code> properties file found on the classpath. */
    private static void cleanUsingJobFile(FileSystem fs, Path jobFileClasspathResource, Path testNameTempPath)
            throws Exception {

        Properties jobProps = loadClasspathProperties(jobFileClasspathResource);
        String tempPath = testNameTempPath.toString();
        for (Entry<Object, Object> entry : jobProps.entrySet()) {
            // Update through the entry instead of put() so the map is never modified behind the iterator.
            entry.setValue(StringUtils.replace((String) entry.getValue(), "${testNameTempPath}", tempPath));
        }

        MultiCleanableDatasetFinder finder = new MultiCleanableDatasetFinder(fs, jobProps);
        for (Dataset dataset : finder.findDatasets()) {
            ((CleanableDataset) dataset).clean();
        }
    }

    /** Runs retention driven by a typesafe config resource, served to the finder through a mock config client. */
    private static void cleanUsingConfig(FileSystem fs, Path configClasspathResource, Properties additionalJobProps,
            Path testNameTempPath) throws Exception {

        // The fallback supplies the value for ${testNameTempPath} substitutions when the config is resolved.
        Config testConfig = ConfigFactory.parseResources(configClasspathResource.toString())
                .withFallback(ConfigFactory.parseMap(ImmutableMap.of("testNameTempPath",
                        PathUtils.getPathWithoutSchemeAndAuthority(testNameTempPath).toString())))
                .resolve();

        // Stand-in for the config store client: getConfig is stubbed to return the test config.
        ConfigClient client = mock(ConfigClient.class);
        when(client.getConfig(any(String.class))).thenReturn(testConfig);

        Properties jobProps = new Properties();
        jobProps.setProperty(CleanableDatasetBase.SKIP_TRASH_KEY, Boolean.toString(true));
        jobProps.setProperty(ConfigurationKeys.CONFIG_MANAGEMENT_STORE_URI, "dummy");
        jobProps.setProperty(ConfigurationKeys.CONFIG_MANAGEMENT_STORE_ENABLED, "true");

        // Added last so the additional properties win over the values set above.
        jobProps.putAll(additionalJobProps);

        // Two candidate argument lists are offered to the reflective constructor lookup.
        @SuppressWarnings("unchecked")
        DatasetsFinder<CleanableDataset> finder = (DatasetsFinder<CleanableDataset>) GobblinConstructorUtils
                .invokeFirstConstructor(
                        Class.forName(
                                testConfig.getString(MultiCleanableDatasetFinder.DATASET_FINDER_CLASS_KEY)),
                        ImmutableList.of(fs, jobProps, testConfig, client),
                        ImmutableList.of(fs, jobProps, client));

        for (CleanableDataset dataset : finder.findDatasets()) {
            dataset.clean();
        }
    }

    /**
     * Loads a properties file through this class' class loader.
     *
     * @throws IllegalArgumentException if the resource does not exist on the classpath
     */
    private static Properties loadClasspathProperties(Path classpathResource) throws Exception {
        String resourceName = classpathResource.toString();
        try (InputStream stream = RetentionTestHelper.class.getClassLoader().getResourceAsStream(resourceName)) {
            // getResourceAsStream signals "not found" with null; fail with the resource name instead of
            // letting Properties.load(null) throw an uninformative NullPointerException.
            if (stream == null) {
                throw new IllegalArgumentException("Classpath resource not found: " + resourceName);
            }
            Properties props = new Properties();
            props.load(stream);
            return props;
        }
    }

}