io.hops.erasure_coding.MapReduceEncodingManager.java Source code

Introduction

Here is the source code for io.hops.erasure_coding.MapReduceEncodingManager.java, an implementation of BaseEncodingManager that submits MapReduce jobs to raid (erasure-code) files in HopsFS, tracks them until they finish, fail, or exceed their execution limit, and persists running jobs so they can be recovered after a crash.
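
Before the listing itself, here is a minimal sketch of how the class might be driven. It is illustrative only: the EncodingPolicy constructor arguments and the codec id "rs" are assumptions, while MapReduceEncodingManager, encodeFile and computeReports are used exactly as the listing below defines them.

package io.hops.erasure_coding;

import io.hops.metadata.hdfs.entity.EncodingPolicy;
import org.apache.hadoop.conf.Configuration;
import org.apache.hadoop.fs.Path;

import java.io.IOException;
import java.util.List;

public class EncodingManagerExample {
    public static void main(String[] args) throws IOException, InterruptedException {
        Configuration conf = new Configuration();
        MapReduceEncodingManager manager = new MapReduceEncodingManager(conf);

        // Submit one encoding job: source file, parity target, copy = false.
        // The EncodingPolicy constructor and the "rs" codec id are assumed
        // here; the manager only reads getCodec() and getTargetReplication().
        EncodingPolicy policy = new EncodingPolicy("rs", (short) 1);
        manager.encodeFile(policy, new Path("/user/data/file"),
                new Path("/parity/file"), false);

        // Poll until the job leaves the ACTIVE state. computeReports() both
        // reports and garbage-collects: FINISHED, FAILED and CANCELED jobs
        // are returned once and then moved out of the active set.
        List<Report> reports;
        do {
            Thread.sleep(10000);
            reports = manager.computeReports();
        } while (!reports.isEmpty()
                && reports.get(0).getStatus() == Report.Status.ACTIVE);
    }
}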

Source

/**
 * Licensed to the Apache Software Foundation (ASF) under one
 * or more contributor license agreements.  See the NOTICE file
 * distributed with this work for additional information
 * regarding copyright ownership.  The ASF licenses this file
 * to you under the Apache License, Version 2.0 (the
 * "License"); you may not use this file except in compliance
 * with the License.  You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

package io.hops.erasure_coding;

import io.hops.metadata.HdfsStorageFactory;
import io.hops.metadata.hdfs.dal.EncodingJobsDataAccess;
import io.hops.metadata.hdfs.entity.EncodingJob;
import io.hops.metadata.hdfs.entity.EncodingPolicy;
import io.hops.transaction.handler.HDFSOperationType;
import io.hops.transaction.handler.LightWeightRequestHandler;
import org.apache.commons.logging.Log;
import org.apache.commons.logging.LogFactory;
import org.apache.hadoop.conf.Configuration;
import org.apache.hadoop.fs.Path;
import org.apache.hadoop.mapred.JobID;

import java.io.IOException;
import java.util.ArrayList;
import java.util.Collection;
import java.util.HashMap;
import java.util.Iterator;
import java.util.List;
import java.util.Map;

/**
 * Implementation of {@link BaseEncodingManager} that uses MapReduce jobs to
 * raid (erasure-code) files.
 */
public class MapReduceEncodingManager extends BaseEncodingManager {

    public static final Log LOG = LogFactory.getLog(MapReduceEncodingManager.class);

    public static final String ENCODING_JOB_EXECUTION_LIMIT = "io.hops.erasure_coding.encoding_job_execution_limit";
    public static final long DEFAULT_ENCODING_JOB_EXECUTION_LIMIT = 24L * 3600L * 1000L;

    private final long executionLimit;
    // Source file path -> currently running encoding job.
    private Map<String, MapReduceEncoder> currentJobs = new HashMap<String, MapReduceEncoder>();
    // Finished jobs whose persisted recovery records still need deletion.
    private Collection<MapReduceEncoder> completedJobs = new ArrayList<MapReduceEncoder>();

    private boolean initialized = false;

    public MapReduceEncodingManager(Configuration conf) throws IOException {
        super(conf);
        executionLimit = conf.getLong(ENCODING_JOB_EXECUTION_LIMIT, DEFAULT_ENCODING_JOB_EXECUTION_LIMIT);
        LOG.info("created");
    }

    @Override
    public void encodeFile(EncodingPolicy policy, Path sourceFile, Path parityFile, boolean copy) {
        initialize();

        Codec codec = Codec.getCodec(policy.getCodec());
        LOG.info("Start encoding with policy: " + policy + " for source file " + sourceFile.toUri().getPath()
                + " and parity file " + parityFile + " copy " + copy);
        PolicyInfo policyInfo = new PolicyInfo();
        try {
            policyInfo.setSrcPath(sourceFile.toUri().getPath());
            policyInfo.setCodecId(codec.getId());
            policyInfo.setProperty(PolicyInfo.PROPERTY_PARITY_PATH, parityFile.toUri().getPath());
            policyInfo.setProperty(PolicyInfo.PROPERTY_REPLICATION, String.valueOf(policy.getTargetReplication()));
            policyInfo.setProperty(PolicyInfo.PROPERTY_PARITY_REPLICATION, String.valueOf(1));
            policyInfo.setProperty(PolicyInfo.PROPERTY_COPY, String.valueOf(copy));
            raidFiles(policyInfo);
        } catch (IOException e) {
            LOG.error("Exception", e);
        }
    }

    /**
     * Submits a {@link MapReduceEncoder} job for the given policy and, if it
     * starts successfully, persists it so that it can be recovered after a
     * crash.
     */
    public void raidFiles(PolicyInfo info) throws IOException {
        MapReduceEncoder dr = new MapReduceEncoder(conf);
        boolean started = dr.startDistRaid(info);
        if (started) {
            String path = info.getSrcPath().toUri().getPath();
            // There is a risk of crashing before the job is persisted for
            // recovery. In that case the ErasureCodingManager should restart
            // the job, as it does not set the file's state to active until
            // this call has succeeded.
            persistActiveJob(path, dr.getJobID(), dr.getConf().get(MapReduceEncoder.JOB_DIR_LABEL));
            currentJobs.put(path, dr);
        }
    }

    @Override
    public List<Report> computeReports() throws IOException {
        initialize();
        cleanRecovery();

        List<Report> reports = new ArrayList<Report>(currentJobs.size());
        for (Map.Entry<String, MapReduceEncoder> entry : currentJobs.entrySet()) {
            String fileName = entry.getKey();
            MapReduceEncoder job = entry.getValue();
            try {
                // checkComplete() may query the job tracker, so call it only
                // once per report cycle.
                boolean complete = job.checkComplete();
                if (complete && job.successful()) {
                    reports.add(new Report(fileName, Report.Status.FINISHED));
                    LOG.info("Encoding successful for job " + job.getJobID());
                } else if (complete) {
                    reports.add(new Report(fileName, Report.Status.FAILED));
                    LOG.info("Encoding failed for job " + job.getJobID());
                } else if (System.currentTimeMillis() - job.getStartTime() > executionLimit) {
                    job.killJob();
                    reports.add(new Report(fileName, Report.Status.CANCELED));
                    LOG.info("Encoding canceled for job " + job.getJobID());
                } else {
                    reports.add(new Report(fileName, Report.Status.ACTIVE));
                    LOG.info("Encoding active for job " + job.getJobID());
                }
            } catch (IOException e) {
                LOG.error("Exception during completeness check", e);
                try {
                    job.killJob();
                } catch (IOException e1) {
                    // Don't swallow the failure silently; the report below
                    // still marks the job as FAILED.
                    LOG.warn("Failed to kill job " + job.getJobID(), e1);
                }
                reports.add(new Report(fileName, Report.Status.FAILED));
            }
        }

        for (Report report : reports) {
            Report.Status status = report.getStatus();
            if (status == Report.Status.FINISHED || status == Report.Status.FAILED
                    || status == Report.Status.CANCELED) {
                MapReduceEncoder job = currentJobs.remove(report.getFilePath());
                completedJobs.add(job);
            }
        }

        return reports;
    }

    /**
     * Stores a recovery record for the started job in the metadata store so
     * that it can be found again by {@link #recoverActiveJobs()} after a
     * restart.
     */
    private void persistActiveJob(final String path, final JobID jobId, final String jobDir) throws IOException {
        new LightWeightRequestHandler(HDFSOperationType.PERSIST_ENCODING_JOB) {
            @Override
            public Object performTask() throws IOException {
                EncodingJobsDataAccess da = (EncodingJobsDataAccess) HdfsStorageFactory
                        .getDataAccess(EncodingJobsDataAccess.class);
                da.add(new EncodingJob(jobId.getJtIdentifier(), jobId.getId(), path, jobDir));
                return null;
            }
        }.handle();
    }

    /**
     * Deletes the recovery records of all completed jobs from the metadata
     * store and clears the completed-jobs list.
     */
    private void cleanRecovery() throws IOException {
        new LightWeightRequestHandler(HDFSOperationType.DELETE_ENCODING_JOBS) {
            @Override
            public Object performTask() throws IOException {
                EncodingJobsDataAccess da = (EncodingJobsDataAccess) HdfsStorageFactory
                        .getDataAccess(EncodingJobsDataAccess.class);
                Iterator<MapReduceEncoder> it = completedJobs.iterator();
                while (it.hasNext()) {
                    MapReduceEncoder job = it.next();
                    JobID jobId = job.getJobID();
                    da.delete(new EncodingJob(jobId.getJtIdentifier(), jobId.getId()));
                    it.remove();
                }
                return null;
            }
        }.handle();
    }

    @Override
    public void cancelAll() {
        initialize();
        for (MapReduceEncoder job : currentJobs.values()) {
            try {
                job.killJob();
            } catch (IOException e) {
                LOG.error("Exception", e);
            }
        }
        currentJobs.clear();
    }

    @Override
    public void cancel(String toCancel) {
        initialize();
        MapReduceEncoder job = currentJobs.remove(toCancel);
        if (job == null) {
            // Guard against a NullPointerException when no job is tracked
            // for this path.
            LOG.warn("No active encoding job found for " + toCancel);
            return;
        }
        try {
            job.killJob();
        } catch (IOException e) {
            LOG.error("Exception", e);
        }
    }

    /**
     * Lazily recovers persisted encoding jobs on first use so that jobs
     * submitted before a restart are tracked again.
     */
    private void initialize() {
        if (initialized) {
            return;
        }

        try {
            for (EncodingJob job : recoverActiveJobs()) {
                MapReduceEncoder recovered = new MapReduceEncoder(conf, job);
                currentJobs.put(job.getPath(), recovered);
            }
        } catch (IOException e) {
            LOG.error("Encoding job recovery failed", e);
            throw new RuntimeException(e);
        }

        initialized = true;
    }

    private Collection<EncodingJob> recoverActiveJobs() throws IOException {
        LightWeightRequestHandler handler = new LightWeightRequestHandler(HDFSOperationType.RECOVER_ENCODING_JOBS) {
            @Override
            public Object performTask() throws IOException {
                EncodingJobsDataAccess da = (EncodingJobsDataAccess) HdfsStorageFactory
                        .getDataAccess(EncodingJobsDataAccess.class);
                return da.findAll();
            }
        };

        return (Collection<EncodingJob>) handler.handle();
    }
}
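
The three LightWeightRequestHandler blocks in the class implement a small crash-recovery lifecycle: persistActiveJob writes a record when a job starts, recoverActiveJobs reads all records back so that initialize() can re-attach to jobs submitted before a restart, and cleanRecovery deletes the records of completed jobs. The sketch below condenses that round trip; the identifier and path values are placeholders, and the types and calls mirror the handlers above.

package io.hops.erasure_coding;

import io.hops.metadata.HdfsStorageFactory;
import io.hops.metadata.hdfs.dal.EncodingJobsDataAccess;
import io.hops.metadata.hdfs.entity.EncodingJob;
import io.hops.transaction.handler.HDFSOperationType;
import io.hops.transaction.handler.LightWeightRequestHandler;

import java.io.IOException;

public class EncodingJobRecoveryExample {
    public static void main(String[] args) throws IOException {
        // 1. Job started: persist a recovery record (cf. persistActiveJob).
        //    The jobtracker identifier, id, and paths are placeholders.
        final EncodingJob record =
                new EncodingJob("jt-1", 1, "/user/data/file", "/tmp/raid-job");
        new LightWeightRequestHandler(HDFSOperationType.PERSIST_ENCODING_JOB) {
            @Override
            public Object performTask() throws IOException {
                EncodingJobsDataAccess da = (EncodingJobsDataAccess) HdfsStorageFactory
                        .getDataAccess(EncodingJobsDataAccess.class);
                da.add(record);
                return null;
            }
        }.handle();

        // 2. After a restart: recoverActiveJobs() runs da.findAll() and
        //    initialize() rebuilds one MapReduceEncoder per record.
        // 3. Job finished: cleanRecovery() removes the record again via
        //    da.delete(new EncodingJob("jt-1", 1)).
    }
}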