// Licensed to the Apache Software Foundation (ASF) under one
// or more contributor license agreements. See the NOTICE file
// distributed with this work for additional information
// regarding copyright ownership. The ASF licenses this file
// to you under the Apache License, Version 2.0 (the
// "License"); you may not use this file except in compliance
// with the License. You may obtain a copy of the License at
//
//   http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing,
// software distributed under the License is distributed on an
// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
// KIND, either express or implied. See the License for the
// specific language governing permissions and limitations
// under the License.

package org.apache.impala.catalog;

import java.util.ArrayList;
import java.util.Arrays;
import java.util.Collection;
import java.util.List;
import java.util.Map;
import java.util.concurrent.atomic.AtomicLong;

import org.apache.commons.lang.ArrayUtils;
import org.apache.hadoop.fs.Path;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;

import org.apache.impala.analysis.Expr;
import org.apache.impala.analysis.LiteralExpr;
import org.apache.impala.analysis.NullLiteral;
import org.apache.impala.analysis.PartitionKeyValue;
import org.apache.impala.analysis.ToSqlUtils;
import org.apache.impala.common.FileSystemUtil;
import org.apache.impala.common.ImpalaException;
import org.apache.impala.thrift.ImpalaInternalServiceConstants;
import org.apache.impala.thrift.TAccessLevel;
import org.apache.impala.thrift.TExpr;
import org.apache.impala.thrift.TExprNode;
import org.apache.impala.thrift.THdfsCompression;
import org.apache.impala.thrift.THdfsFileBlock;
import org.apache.impala.thrift.THdfsFileDesc;
import org.apache.impala.thrift.THdfsPartition;
import org.apache.impala.thrift.TNetworkAddress;
import org.apache.impala.thrift.TPartitionStats;
import org.apache.impala.thrift.TTableStats;
import org.apache.impala.util.HdfsCachingUtil;

import com.google.common.annotations.VisibleForTesting;
import com.google.common.base.Joiner;
import com.google.common.base.Objects;
import com.google.common.base.Preconditions;
import com.google.common.base.Predicate;
import com.google.common.collect.ImmutableList;
import com.google.common.collect.ImmutableMap;
import com.google.common.collect.Lists;
import com.google.common.collect.Maps;

/**
 * Query-relevant information for one table partition. Partitions are comparable
 * based on their partition-key values. The comparison orders partitions in ascending
 * order with NULLs sorting last. The ordering is useful for displaying partitions
 * in SHOW statements.
 */
public class HdfsPartition implements Comparable<HdfsPartition> {
  /**
   * Metadata for a single file in this partition.
   * TODO: Do we even need this class? Just get rid of it and use the Thrift version?
   */
  static public class FileDescriptor implements Comparable<FileDescriptor> {
    private final THdfsFileDesc fileDescriptor_;

    public String getFileName() { return fileDescriptor_.getFile_name(); }
    public long getFileLength() { return fileDescriptor_.getLength(); }
    public THdfsCompression getFileCompression() {
      return fileDescriptor_.getCompression();
    }
    public long getModificationTime() {
      return fileDescriptor_.getLast_modification_time();
    }
    public List<THdfsFileBlock> getFileBlocks() {
      return fileDescriptor_.getFile_blocks();
    }
    public THdfsFileDesc toThrift() { return fileDescriptor_; }

    public FileDescriptor(String fileName, long fileLength, long modificationTime) {
      Preconditions.checkNotNull(fileName);
      Preconditions.checkArgument(fileLength >= 0);
      fileDescriptor_ = new THdfsFileDesc();
      fileDescriptor_.setFile_name(fileName);
      fileDescriptor_.setLength(fileLength);
      fileDescriptor_.setLast_modification_time(modificationTime);
      fileDescriptor_.setCompression(
          HdfsCompression.fromFileName(fileName).toThrift());
      List<THdfsFileBlock> emptyFileBlockList = Lists.newArrayList();
      fileDescriptor_.setFile_blocks(emptyFileBlockList);
    }

    private FileDescriptor(THdfsFileDesc fileDesc) {
      this(fileDesc.getFile_name(), fileDesc.length, fileDesc.last_modification_time);
      for (THdfsFileBlock block : fileDesc.getFile_blocks()) {
        fileDescriptor_.addToFile_blocks(block);
      }
    }

    public void addFileBlock(FileBlock blockMd) {
      addThriftFileBlock(blockMd.toThrift());
    }

    public void addThriftFileBlock(THdfsFileBlock block) {
      fileDescriptor_.addToFile_blocks(block);
    }

    public static FileDescriptor fromThrift(THdfsFileDesc desc) {
      return new FileDescriptor(desc);
    }

    @Override
    public String toString() {
      return Objects.toStringHelper(this)
          .add("FileName", getFileName())
          .add("Length", getFileLength())
          .toString();
    }

    /**
     * Orders file descriptors lexicographically by file name.
     */
    @Override
    public int compareTo(FileDescriptor otherFd) {
      return getFileName().compareTo(otherFd.getFileName());
    }
  }

  /**
   * Represents metadata of a single block replica.
   */
  public static class BlockReplica {
    private final boolean isCached_;
    private final int hostIdx_;

    /**
     * Creates a BlockReplica given a host ID/index and a flag specifying whether this
     * replica is cached. Host IDs are assigned when loading the block metadata in
     * HdfsTable.
     */
    public BlockReplica(int hostIdx, boolean isCached) {
      hostIdx_ = hostIdx;
      isCached_ = isCached;
    }

    /**
     * Parses the location (an ip address:port string) of the replica and returns a
     * TNetworkAddress with this information, or null if parsing fails.
     */
    public static TNetworkAddress parseLocation(String location) {
      Preconditions.checkNotNull(location);
      String[] ip_port = location.split(":");
      if (ip_port.length != 2) return null;
      try {
        return new TNetworkAddress(ip_port[0], Integer.parseInt(ip_port[1]));
      } catch (NumberFormatException e) {
        return null;
      }
    }

    public boolean isCached() { return isCached_; }
    public int getHostIdx() { return hostIdx_; }
  }

  /**
   * File Block metadata
   */
  public static class FileBlock {
    private final THdfsFileBlock fileBlock_;
    private boolean isCached_; // Set to true if there is at least one cached replica.

    private FileBlock(THdfsFileBlock fileBlock) {
      fileBlock_ = fileBlock;
      isCached_ = false;
      for (boolean isCached : fileBlock.getIs_replica_cached()) {
        isCached_ |= isCached;
      }
    }

    /**
     * Construct a FileBlock given the start offset (in bytes) of the file associated
     * with this block, the length of the block (in bytes), and a list of
     * BlockReplicas. Does not fill diskIds.
     */
    public FileBlock(long offset, long blockLength, List<BlockReplica> replicaHostIdxs) {
      Preconditions.checkNotNull(replicaHostIdxs);
      fileBlock_ = new THdfsFileBlock();
      fileBlock_.setOffset(offset);
      fileBlock_.setLength(blockLength);
      fileBlock_.setReplica_host_idxs(new ArrayList<Integer>(replicaHostIdxs.size()));
      fileBlock_.setIs_replica_cached(new ArrayList<Boolean>(replicaHostIdxs.size()));
      isCached_ = false;
      for (BlockReplica replica : replicaHostIdxs) {
        fileBlock_.addToReplica_host_idxs(replica.getHostIdx());
        fileBlock_.addToIs_replica_cached(replica.isCached());
        isCached_ |= replica.isCached();
      }
    }

    public long getOffset() { return fileBlock_.getOffset(); }
    public long getLength() { return fileBlock_.getLength(); }
    public List<Integer> getReplicaHostIdxs() {
      return fileBlock_.getReplica_host_idxs();
    }

    /**
     * Populates the given THdfsFileBlock's list of disk ids with the given disk id
     * values. The number of disk ids must match the number of network addresses
     * set in the file block.
     */
    public static void setDiskIds(int[] diskIds, THdfsFileBlock fileBlock) {
      Preconditions.checkArgument(
          diskIds.length == fileBlock.getReplica_host_idxs().size());
      fileBlock.setDisk_ids(Arrays.asList(ArrayUtils.toObject(diskIds)));
    }

    /**
     * Return the disk id of the block in BlockLocation.getNames()[hostIndex]; -1 if
     * disk id is not supported.
     */
    public int getDiskId(int hostIndex) {
      if (fileBlock_.disk_ids == null) return -1;
      return fileBlock_.getDisk_ids().get(hostIndex);
    }

    public boolean isCached(int hostIndex) {
      return fileBlock_.getIs_replica_cached().get(hostIndex);
    }

    public THdfsFileBlock toThrift() { return fileBlock_; }

    public static FileBlock fromThrift(THdfsFileBlock thriftFileBlock) {
      return new FileBlock(thriftFileBlock);
    }

    @Override
    public String toString() {
      return Objects.toStringHelper(this)
          .add("offset", fileBlock_.offset)
          .add("length", fileBlock_.length)
          .add("#disks", fileBlock_.getDisk_idsSize())
          .toString();
    }
  }
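  // Illustrative sketch only (not part of the original class): shows how the nested
  // classes above typically fit together when block metadata is assembled. The file
  // name, sizes, and host indexes below are hypothetical; real values come from the
  // file-system listing performed in HdfsTable.
  private static FileDescriptor exampleFileDescriptor() {
    // A 128MB file with a single block replicated on hosts 0 and 1; the replica on
    // host 1 is HDFS-cached.
    FileDescriptor fd = new FileDescriptor("000000_0", 128L * 1024 * 1024, 0L);
    List<BlockReplica> replicas = Lists.newArrayList(
        new BlockReplica(0, false), new BlockReplica(1, true));
    fd.addFileBlock(new FileBlock(0, 128L * 1024 * 1024, replicas));
    return fd;
  }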
  private final HdfsTable table_;
  private final List<LiteralExpr> partitionKeyValues_;

  // estimated number of rows in partition; -1: unknown
  private long numRows_ = -1;

  private static AtomicLong partitionIdCounter_ = new AtomicLong();

  // A unique ID for each partition, used to identify a partition in the thrift
  // representation of a table.
  private final long id_;

  /*
   * Note: Although you can write multiple formats to a single partition (by changing
   * the format before each write), Hive won't let you read that data and neither
   * should we. We should therefore treat mixing formats inside one partition as user
   * error. It's easy to add per-file metadata to FileDescriptor if this changes.
   */
  private final HdfsStorageDescriptor fileFormatDescriptor_;
  private List<FileDescriptor> fileDescriptors_;
  private HdfsPartitionLocationCompressor.Location location_;
  private final static Logger LOG = LoggerFactory.getLogger(HdfsPartition.class);
  private boolean isDirty_ = false;

  // True if this partition is marked as cached. Does not necessarily mean the data is
  // cached.
  private boolean isMarkedCached_ = false;

  private final TAccessLevel accessLevel_;

  // (k,v) pairs of parameters for this partition, stored in the HMS. Used by Impala to
  // store intermediate state for statistics computations.
  private Map<String, String> hmsParameters_;

  public HdfsStorageDescriptor getInputFormatDescriptor() {
    return fileFormatDescriptor_;
  }

  public boolean isDefaultPartition() {
    return id_ == ImpalaInternalServiceConstants.DEFAULT_PARTITION_ID;
  }

  /**
   * Returns true if the partition resides at a location which can be cached
   * (e.g. HDFS).
   */
  public boolean isCacheable() {
    return FileSystemUtil.isPathCacheable(new Path(getLocation()));
  }

  /**
   * Return a partition name formed by concatenating partition keys and their values,
   * compatible with the way Hive names partitions. Reuses Hive's
   * org.apache.hadoop.hive.common.FileUtils.makePartName() function to build the name
   * string because there are a number of special cases for how partition names are URL
   * escaped.
   * TODO: Consider storing the PartitionKeyValue in HdfsPartition. It would simplify
   * this code and would be useful in other places, such as fromThrift().
   */
  public String getPartitionName() {
    List<String> partitionCols = Lists.newArrayList();
    for (int i = 0; i < getTable().getNumClusteringCols(); ++i) {
      partitionCols.add(getTable().getColumns().get(i).getName());
    }
    return org.apache.hadoop.hive.common.FileUtils.makePartName(
        partitionCols, getPartitionValuesAsStrings(true));
  }

  /**
   * Returns a list of partition values as strings. If mapNullsToHiveKey is true, any
   * NULL value is returned as the table's default null partition key string value,
   * otherwise they are returned as 'NULL'.
   */
  public List<String> getPartitionValuesAsStrings(boolean mapNullsToHiveKey) {
    List<String> ret = Lists.newArrayList();
    for (LiteralExpr partValue : getPartitionValues()) {
      if (mapNullsToHiveKey) {
        ret.add(PartitionKeyValue.getPartitionKeyValueString(
            partValue, getTable().getNullPartitionKeyValue()));
      } else {
        ret.add(partValue.getStringValue());
      }
    }
    return ret;
  }

  /**
   * Utility method which returns a string of conjuncts of equality exprs to exactly
   * select this partition (e.g. ((month=2009) AND (year=2012))).
   * TODO: Remove this when the TODO elsewhere in this file to save and expose the
   * list of TPartitionKeyValues has been resolved.
   */
  public String getConjunctSql() {
    List<String> partColSql = Lists.newArrayList();
    for (Column partCol : getTable().getClusteringColumns()) {
      partColSql.add(ToSqlUtils.getIdentSql(partCol.getName()));
    }
    List<String> conjuncts = Lists.newArrayList();
    for (int i = 0; i < partColSql.size(); ++i) {
      LiteralExpr partVal = getPartitionValues().get(i);
      String partValSql = partVal.toSql();
      if (partVal instanceof NullLiteral || partValSql.isEmpty()) {
        conjuncts.add(partColSql.get(i) + " IS NULL");
      } else {
        conjuncts.add(partColSql.get(i) + "=" + partValSql);
      }
    }
    return "(" + Joiner.on(" AND ").join(conjuncts) + ")";
  }

  /**
   * Returns a string of the form part_key1=value1/part_key2=value2...
   */
  public String getValuesAsString() {
    StringBuilder partDescription = new StringBuilder();
    for (int i = 0; i < getTable().getNumClusteringCols(); ++i) {
      String columnName = getTable().getColumns().get(i).getName();
      String value = PartitionKeyValue.getPartitionKeyValueString(
          getPartitionValues().get(i), getTable().getNullPartitionKeyValue());
      partDescription.append(columnName + "=" + value);
      if (i != getTable().getNumClusteringCols() - 1) partDescription.append("/");
    }
    return partDescription.toString();
  }
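  // Illustrative example (hypothetical partition keys, not from the original source):
  // for a partition with clustering columns (year, month) and values (2012, 1),
  // getValuesAsString() yields "year=2012/month=1" and getConjunctSql() yields a
  // conjunct string of the form "(year=2012 AND month=1)"; a NULL key value appears
  // as "<col> IS NULL" instead of an equality predicate.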
  /**
   * Returns the storage location (HDFS path) of this partition. Should only be called
   * for partitioned tables.
   */
  public String getLocation() {
    return (location_ != null) ? location_.toString() : null;
  }

  public Path getLocationPath() { return new Path(getLocation()); }
  public long getId() { return id_; }
  public HdfsTable getTable() { return table_; }
  public void setNumRows(long numRows) { numRows_ = numRows; }
  public long getNumRows() { return numRows_; }
  public boolean isMarkedCached() { return isMarkedCached_; }
  void markCached() { isMarkedCached_ = true; }

  /**
   * Updates the file format of this partition and sets the corresponding input/output
   * format classes.
   */
  public void setFileFormat(HdfsFileFormat fileFormat) {
    fileFormatDescriptor_.setFileFormat(fileFormat);
    cachedMsPartitionDescriptor_.sdInputFormat = fileFormat.inputFormat();
    cachedMsPartitionDescriptor_.sdOutputFormat = fileFormat.outputFormat();
    cachedMsPartitionDescriptor_.sdSerdeInfo.setSerializationLib(
        fileFormatDescriptor_.getFileFormat().serializationLib());
  }

  public HdfsFileFormat getFileFormat() {
    return fileFormatDescriptor_.getFileFormat();
  }

  public void setLocation(String place) {
    location_ = table_.getPartitionLocationCompressor().new Location(place);
  }

  public org.apache.hadoop.hive.metastore.api.SerDeInfo getSerdeInfo() {
    return cachedMsPartitionDescriptor_.sdSerdeInfo;
  }

  // May return null if no per-partition stats were recorded, or if the per-partition
  // stats could not be deserialised from the parameter map.
  public TPartitionStats getPartitionStats() {
    try {
      return PartitionStatsUtil.partStatsFromParameters(hmsParameters_);
    } catch (ImpalaException e) {
      LOG.warn("Could not deserialise incremental stats state for " + getPartitionName()
          + ", consider DROP INCREMENTAL STATS ... PARTITION ... and recomputing "
          + "incremental stats for this table.");
      return null;
    }
  }

  public boolean hasIncrementalStats() {
    TPartitionStats partStats = getPartitionStats();
    return partStats != null && partStats.intermediate_col_stats != null;
  }

  /**
   * Returns the HDFS permissions Impala has to this partition's directory - READ_ONLY,
   * READ_WRITE, etc.
   */
  public TAccessLevel getAccessLevel() { return accessLevel_; }
  public Map<String, String> getParameters() { return hmsParameters_; }
  public void putToParameters(String k, String v) { hmsParameters_.put(k, v); }

  /**
   * Marks this partition's metadata as "dirty" indicating that changes have been
   * made and this partition's metadata should not be reused during the next
   * incremental metadata refresh.
   */
  public void markDirty() { isDirty_ = true; }
  public boolean isDirty() { return isDirty_; }

  /**
   * Returns an immutable list of partition key expressions
   */
  public List<LiteralExpr> getPartitionValues() { return partitionKeyValues_; }
  public LiteralExpr getPartitionValue(int i) { return partitionKeyValues_.get(i); }

  public List<HdfsPartition.FileDescriptor> getFileDescriptors() {
    return fileDescriptors_;
  }

  public void setFileDescriptors(List<FileDescriptor> descriptors) {
    fileDescriptors_ = descriptors;
  }

  public long getNumFileDescriptors() {
    return fileDescriptors_ == null ? 0 : fileDescriptors_.size();
  }

  public boolean hasFileDescriptors() { return !fileDescriptors_.isEmpty(); }
  // Struct-style class for caching all the information we need to reconstruct an
  // HMS-compatible Partition object, for use in RPCs to the metastore. We do this
  // rather than cache the Thrift partition object itself as the latter can be large -
  // thanks mostly to the inclusion of the full FieldSchema list. This class is
  // read-only - if any field can be mutated by Impala it should belong to
  // HdfsPartition itself (see HdfsPartition.location_ for an example).
  //
  // TODO: Cache this descriptor in HdfsTable so that identical descriptors are shared
  // between HdfsPartition instances.
  // TODO: sdInputFormat and sdOutputFormat can be mutated by Impala when the file
  // format of a partition changes; move these fields to HdfsPartition.
  private static class CachedHmsPartitionDescriptor {
    public String sdInputFormat;
    public String sdOutputFormat;
    public final boolean sdCompressed;
    public final int sdNumBuckets;
    public final org.apache.hadoop.hive.metastore.api.SerDeInfo sdSerdeInfo;
    public final List<String> sdBucketCols;
    public final List<org.apache.hadoop.hive.metastore.api.Order> sdSortCols;
    public final Map<String, String> sdParameters;
    public final int msCreateTime;
    public final int msLastAccessTime;

    public CachedHmsPartitionDescriptor(
        org.apache.hadoop.hive.metastore.api.Partition msPartition) {
      org.apache.hadoop.hive.metastore.api.StorageDescriptor sd = null;
      if (msPartition != null) {
        sd = msPartition.getSd();
        msCreateTime = msPartition.getCreateTime();
        msLastAccessTime = msPartition.getLastAccessTime();
      } else {
        msCreateTime = msLastAccessTime = 0;
      }
      if (sd != null) {
        sdInputFormat = sd.getInputFormat();
        sdOutputFormat = sd.getOutputFormat();
        sdCompressed = sd.isCompressed();
        sdNumBuckets = sd.getNumBuckets();
        sdSerdeInfo = sd.getSerdeInfo();
        sdBucketCols = ImmutableList.copyOf(sd.getBucketCols());
        sdSortCols = ImmutableList.copyOf(sd.getSortCols());
        sdParameters = ImmutableMap.copyOf(sd.getParameters());
      } else {
        sdInputFormat = "";
        sdOutputFormat = "";
        sdCompressed = false;
        sdNumBuckets = 0;
        sdSerdeInfo = null;
        sdBucketCols = ImmutableList.of();
        sdSortCols = ImmutableList.of();
        sdParameters = ImmutableMap.of();
      }
    }
  }

  private final CachedHmsPartitionDescriptor cachedMsPartitionDescriptor_;

  public CachedHmsPartitionDescriptor getCachedMsPartitionDescriptor() {
    return cachedMsPartitionDescriptor_;
  }
  /**
   * Returns a Hive-compatible partition object that may be used in calls to the
   * metastore.
   */
  public org.apache.hadoop.hive.metastore.api.Partition toHmsPartition() {
    if (cachedMsPartitionDescriptor_ == null) return null;
    Preconditions.checkNotNull(table_.getNonPartitionFieldSchemas());
    // Update the serde library class based on the currently used file format.
    org.apache.hadoop.hive.metastore.api.StorageDescriptor storageDescriptor =
        new org.apache.hadoop.hive.metastore.api.StorageDescriptor(
            table_.getNonPartitionFieldSchemas(),
            getLocation(),
            cachedMsPartitionDescriptor_.sdInputFormat,
            cachedMsPartitionDescriptor_.sdOutputFormat,
            cachedMsPartitionDescriptor_.sdCompressed,
            cachedMsPartitionDescriptor_.sdNumBuckets,
            cachedMsPartitionDescriptor_.sdSerdeInfo,
            cachedMsPartitionDescriptor_.sdBucketCols,
            cachedMsPartitionDescriptor_.sdSortCols,
            cachedMsPartitionDescriptor_.sdParameters);
    org.apache.hadoop.hive.metastore.api.Partition partition =
        new org.apache.hadoop.hive.metastore.api.Partition(
            getPartitionValuesAsStrings(true),
            getTable().getDb().getName(),
            getTable().getName(),
            cachedMsPartitionDescriptor_.msCreateTime,
            cachedMsPartitionDescriptor_.msLastAccessTime,
            storageDescriptor,
            getParameters());
    return partition;
  }

  private HdfsPartition(HdfsTable table,
      org.apache.hadoop.hive.metastore.api.Partition msPartition,
      List<LiteralExpr> partitionKeyValues,
      HdfsStorageDescriptor fileFormatDescriptor,
      Collection<HdfsPartition.FileDescriptor> fileDescriptors, long id,
      HdfsPartitionLocationCompressor.Location location, TAccessLevel accessLevel) {
    table_ = table;
    if (msPartition == null) {
      cachedMsPartitionDescriptor_ = null;
    } else {
      cachedMsPartitionDescriptor_ = new CachedHmsPartitionDescriptor(msPartition);
    }
    location_ = location;
    partitionKeyValues_ = ImmutableList.copyOf(partitionKeyValues);
    fileDescriptors_ = ImmutableList.copyOf(fileDescriptors);
    fileFormatDescriptor_ = fileFormatDescriptor;
    id_ = id;
    accessLevel_ = accessLevel;
    if (msPartition != null && msPartition.getParameters() != null) {
      isMarkedCached_ =
          HdfsCachingUtil.getCacheDirectiveId(msPartition.getParameters()) != null;
      hmsParameters_ = msPartition.getParameters();
    } else {
      hmsParameters_ = Maps.newHashMap();
    }

    // TODO: instead of raising an exception, we should consider marking this partition
    // invalid and moving on, so that table loading won't fail and user can query other
    // partitions.
    for (FileDescriptor fileDescriptor : fileDescriptors_) {
      StringBuilder errorMsg = new StringBuilder();
      if (!getInputFormatDescriptor().getFileFormat()
          .isFileCompressionTypeSupported(fileDescriptor.getFileName(), errorMsg)) {
        throw new RuntimeException(errorMsg.toString());
      }
    }
  }

  public HdfsPartition(HdfsTable table,
      org.apache.hadoop.hive.metastore.api.Partition msPartition,
      List<LiteralExpr> partitionKeyValues,
      HdfsStorageDescriptor fileFormatDescriptor,
      Collection<HdfsPartition.FileDescriptor> fileDescriptors,
      TAccessLevel accessLevel) {
    this(table, msPartition, partitionKeyValues, fileFormatDescriptor, fileDescriptors,
        partitionIdCounter_.getAndIncrement(),
        table.getPartitionLocationCompressor().new Location(msPartition != null
            ? msPartition.getSd().getLocation()
            : table.getLocation()),
        accessLevel);
  }
  public static HdfsPartition defaultPartition(
      HdfsTable table, HdfsStorageDescriptor storageDescriptor) {
    List<LiteralExpr> emptyExprList = Lists.newArrayList();
    List<FileDescriptor> emptyFileDescriptorList = Lists.newArrayList();
    return new HdfsPartition(table, null, emptyExprList, storageDescriptor,
        emptyFileDescriptorList, ImpalaInternalServiceConstants.DEFAULT_PARTITION_ID,
        null, TAccessLevel.READ_WRITE);
  }

  /**
   * Return the size (in bytes) of all the files inside this partition
   */
  public long getSize() {
    long result = 0;
    for (HdfsPartition.FileDescriptor fileDescriptor : fileDescriptors_) {
      result += fileDescriptor.getFileLength();
    }
    return result;
  }

  @Override
  public String toString() {
    return Objects.toStringHelper(this)
        .add("fileDescriptors", fileDescriptors_)
        .toString();
  }

  // Returns true for hmsParameters_ keys that are NOT incremental-stats keys, so that
  // Maps.filterKeys() below keeps only the non-stats parameters.
  private static Predicate<String> isIncrementalStatsKey = new Predicate<String>() {
    @Override
    public boolean apply(String key) {
      return !(key.startsWith(PartitionStatsUtil.INCREMENTAL_STATS_NUM_CHUNKS)
          || key.startsWith(PartitionStatsUtil.INCREMENTAL_STATS_CHUNK_PREFIX));
    }
  };

  /**
   * Returns hmsParameters_ after filtering out all the partition
   * incremental stats information.
   */
  private Map<String, String> getFilteredHmsParameters() {
    return Maps.filterKeys(hmsParameters_, isIncrementalStatsKey);
  }
  public static HdfsPartition fromThrift(HdfsTable table,
      long id, THdfsPartition thriftPartition) {
    HdfsStorageDescriptor storageDesc = new HdfsStorageDescriptor(table.getName(),
        HdfsFileFormat.fromThrift(thriftPartition.getFileFormat()),
        thriftPartition.lineDelim,
        thriftPartition.fieldDelim,
        thriftPartition.collectionDelim,
        thriftPartition.mapKeyDelim,
        thriftPartition.escapeChar,
        (byte) '"', // TODO: We should probably add quoteChar to THdfsPartition.
        thriftPartition.blockSize);

    List<LiteralExpr> literalExpr = Lists.newArrayList();
    if (id != ImpalaInternalServiceConstants.DEFAULT_PARTITION_ID) {
      List<Column> clusterCols = Lists.newArrayList();
      for (int i = 0; i < table.getNumClusteringCols(); ++i) {
        clusterCols.add(table.getColumns().get(i));
      }

      List<TExprNode> exprNodes = Lists.newArrayList();
      for (TExpr expr : thriftPartition.getPartitionKeyExprs()) {
        for (TExprNode node : expr.getNodes()) {
          exprNodes.add(node);
        }
      }
      Preconditions.checkState(clusterCols.size() == exprNodes.size(),
          String.format("Number of partition columns (%d) does not match number " +
              "of partition key expressions (%d)",
              clusterCols.size(), exprNodes.size()));

      for (int i = 0; i < exprNodes.size(); ++i) {
        literalExpr.add(LiteralExpr.fromThrift(exprNodes.get(i),
            clusterCols.get(i).getType()));
      }
    }

    List<HdfsPartition.FileDescriptor> fileDescriptors = Lists.newArrayList();
    if (thriftPartition.isSetFile_desc()) {
      for (THdfsFileDesc desc : thriftPartition.getFile_desc()) {
        fileDescriptors.add(HdfsPartition.FileDescriptor.fromThrift(desc));
      }
    }

    TAccessLevel accessLevel = thriftPartition.isSetAccess_level()
        ? thriftPartition.getAccess_level() : TAccessLevel.READ_WRITE;
    HdfsPartitionLocationCompressor.Location location = thriftPartition.isSetLocation()
        ? table.getPartitionLocationCompressor().new Location(
            thriftPartition.getLocation())
        : null;
    HdfsPartition partition = new HdfsPartition(table, null, literalExpr, storageDesc,
        fileDescriptors, id, location, accessLevel);
    if (thriftPartition.isSetStats()) {
      partition.setNumRows(thriftPartition.getStats().getNum_rows());
    }
    if (thriftPartition.isSetIs_marked_cached()) {
      partition.isMarkedCached_ = thriftPartition.isIs_marked_cached();
    }

    if (thriftPartition.isSetHms_parameters()) {
      partition.hmsParameters_ = thriftPartition.getHms_parameters();
    } else {
      partition.hmsParameters_ = Maps.newHashMap();
    }

    return partition;
  }

  /**
   * Checks that this partition's metadata is well formed. This does not necessarily
   * mean the partition is supported by Impala.
   * Throws a CatalogException if there are any errors in the partition metadata.
   */
  public void checkWellFormed() throws CatalogException {
    try {
      // Validate all the partition key/values to ensure you can convert them toThrift()
      Expr.treesToThrift(getPartitionValues());
    } catch (Exception e) {
      throw new CatalogException("Partition (" + getPartitionName() +
          ") has invalid partition column values: ", e);
    }
  }

  public THdfsPartition toThrift(boolean includeFileDesc,
      boolean includeIncrementalStats) {
    List<TExpr> thriftExprs = Expr.treesToThrift(getPartitionValues());

    THdfsPartition thriftHdfsPart = new THdfsPartition(
        fileFormatDescriptor_.getLineDelim(),
        fileFormatDescriptor_.getFieldDelim(),
        fileFormatDescriptor_.getCollectionDelim(),
        fileFormatDescriptor_.getMapKeyDelim(),
        fileFormatDescriptor_.getEscapeChar(),
        fileFormatDescriptor_.getFileFormat().toThrift(), thriftExprs,
        fileFormatDescriptor_.getBlockSize());
    if (location_ != null) thriftHdfsPart.setLocation(location_.toThrift());
    thriftHdfsPart.setStats(new TTableStats(numRows_));
    thriftHdfsPart.setAccess_level(accessLevel_);
    thriftHdfsPart.setIs_marked_cached(isMarkedCached_);
    thriftHdfsPart.setId(getId());
    // IMPALA-4902: Shallow-clone the map to avoid concurrent modifications. One thread
    // may try to serialize the returned THdfsPartition after releasing the table's
    // lock, and another thread doing DDL may modify the map.
    thriftHdfsPart.setHms_parameters(Maps.newHashMap(
        includeIncrementalStats ? hmsParameters_ : getFilteredHmsParameters()));
    if (includeFileDesc) {
      // Add block location information
      for (FileDescriptor fd : fileDescriptors_) {
        thriftHdfsPart.addToFile_desc(fd.toThrift());
      }
    }
    return thriftHdfsPart;
  }

  /**
   * Comparison method to allow ordering of HdfsPartitions by their partition-key
   * values.
   */
  @Override
  public int compareTo(HdfsPartition o) {
    return comparePartitionKeyValues(partitionKeyValues_, o.getPartitionValues());
  }

  @VisibleForTesting
  public static int comparePartitionKeyValues(List<LiteralExpr> lhs,
      List<LiteralExpr> rhs) {
    int sizeDiff = lhs.size() - rhs.size();
    if (sizeDiff != 0) return sizeDiff;
    for (int i = 0; i < lhs.size(); ++i) {
      int cmp = lhs.get(i).compareTo(rhs.get(i));
      if (cmp != 0) return cmp;
    }
    return 0;
  }
}
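// Illustrative note (not part of the original source): comparePartitionKeyValues()
// orders partitions first by the number of partition-key values and then by comparing
// the LiteralExprs element-wise, so a List<HdfsPartition> can be sorted with
// Collections.sort(partitions) to obtain the ascending, NULLs-last ordering described
// in the class comment. For example, hypothetical partitions (year=2011) and
// (year=2012) sort in that order, and a partition whose year value is NULL sorts
// after both.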