com.facebook.hive.orc.RecordReaderImpl.java Source code

Introduction

Here is the source code for com.facebook.hive.orc.RecordReaderImpl.java
Source

//  Copyright (c) 2013, Facebook, Inc.  All rights reserved.

/**
 * Licensed to the Apache Software Foundation (ASF) under one
 * or more contributor license agreements.  See the NOTICE file
 * distributed with this work for additional information
 * regarding copyright ownership.  The ASF licenses this file
 * to you under the Apache License, Version 2.0 (the
 * "License"); you may not use this file except in compliance
 * with the License.  You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
package com.facebook.hive.orc;

import com.facebook.hive.orc.compression.CompressionCodec;
import com.facebook.hive.orc.lazy.LazyBinaryTreeReader;
import com.facebook.hive.orc.lazy.LazyBooleanTreeReader;
import com.facebook.hive.orc.lazy.LazyByteTreeReader;
import com.facebook.hive.orc.lazy.LazyDoubleTreeReader;
import com.facebook.hive.orc.lazy.LazyFloatTreeReader;
import com.facebook.hive.orc.lazy.LazyIntTreeReader;
import com.facebook.hive.orc.lazy.LazyListTreeReader;
import com.facebook.hive.orc.lazy.LazyLongTreeReader;
import com.facebook.hive.orc.lazy.LazyMapTreeReader;
import com.facebook.hive.orc.lazy.LazyShortTreeReader;
import com.facebook.hive.orc.lazy.LazyStringTreeReader;
import com.facebook.hive.orc.lazy.LazyStructTreeReader;
import com.facebook.hive.orc.lazy.LazyTimestampTreeReader;
import com.facebook.hive.orc.lazy.LazyTreeReader;
import com.facebook.hive.orc.lazy.LazyUnionTreeReader;
import com.facebook.hive.orc.lazy.OrcLazyBinary;
import com.facebook.hive.orc.lazy.OrcLazyBoolean;
import com.facebook.hive.orc.lazy.OrcLazyByte;
import com.facebook.hive.orc.lazy.OrcLazyDouble;
import com.facebook.hive.orc.lazy.OrcLazyFloat;
import com.facebook.hive.orc.lazy.OrcLazyInt;
import com.facebook.hive.orc.lazy.OrcLazyList;
import com.facebook.hive.orc.lazy.OrcLazyLong;
import com.facebook.hive.orc.lazy.OrcLazyMap;
import com.facebook.hive.orc.lazy.OrcLazyObject;
import com.facebook.hive.orc.lazy.OrcLazyRow;
import com.facebook.hive.orc.lazy.OrcLazyShort;
import com.facebook.hive.orc.lazy.OrcLazyString;
import com.facebook.hive.orc.lazy.OrcLazyStruct;
import com.facebook.hive.orc.lazy.OrcLazyTimestamp;
import com.facebook.hive.orc.lazy.OrcLazyUnion;
import org.apache.hadoop.conf.Configuration;
import org.apache.hadoop.fs.FSDataInputStream;
import org.apache.hadoop.fs.FileSystem;
import org.apache.hadoop.fs.Path;
import org.apache.hadoop.hive.serde2.ReaderWriterProfiler;

import java.io.IOException;
import java.nio.ByteBuffer;
import java.util.ArrayList;
import java.util.HashMap;
import java.util.List;
import java.util.Map;

class RecordReaderImpl implements RecordReader {
    private final FSDataInputStream file;
    private final long firstRow;
    private final List<StripeInformation> stripes = new ArrayList<StripeInformation>();
    private OrcProto.StripeFooter stripeFooter;
    private final long totalRowCount;
    private final CompressionCodec codec;
    private final int bufferSize;
    private final boolean[] included;
    private final long rowIndexStride;
    private long rowInStripe = 0;
    private int currentStripe = 0;
    private long rowBaseInStripe = 0;
    private long rowCountInStripe = 0;
    private final Map<StreamName, InStream> streams = new HashMap<StreamName, InStream>();
    private OrcLazyRow reader;
    private final OrcProto.RowIndex[] indexes;
    private final int readStrides;
    private final boolean readEagerlyFromHdfs;
    private final long readEagerlyFromHdfsBytes;

    RecordReaderImpl(Iterable<StripeInformation> stripes, FileSystem fileSystem, Path path, long offset,
            long length, List<OrcProto.Type> types, CompressionCodec codec, int bufferSize, boolean[] included,
            long strideRate, Configuration conf) throws IOException {
        this.file = fileSystem.open(path);
        this.codec = codec;
        this.bufferSize = bufferSize;
        this.included = included;
        this.readStrides = OrcConf.getIntVar(conf, OrcConf.ConfVars.HIVE_ORC_READ_COMPRESSION_STRIDES);
        this.readEagerlyFromHdfs = OrcConf.getBoolVar(conf, OrcConf.ConfVars.HIVE_ORC_EAGER_HDFS_READ);
        this.readEagerlyFromHdfsBytes = OrcConf.getLongVar(conf, OrcConf.ConfVars.HIVE_ORC_EAGER_HDFS_READ_BYTES);
        long rows = 0;
        long skippedRows = 0;
        for (StripeInformation stripe : stripes) {
            long stripeStart = stripe.getOffset();
            if (offset > stripeStart) {
                skippedRows += stripe.getNumberOfRows();
            } else if (stripeStart < offset + length) {
                this.stripes.add(stripe);
                rows += stripe.getNumberOfRows();
            }
        }
        firstRow = skippedRows;
        totalRowCount = rows;
        indexes = new OrcProto.RowIndex[types.size()];
        rowIndexStride = strideRate;
        reader = createLazyRow(types, included);
        if (this.stripes.size() > 0) {
            readStripe();
        }
    }

    OrcLazyRow createLazyRow(List<OrcProto.Type> types, boolean[] included) throws IOException {
        OrcProto.Type type = types.get(0);
        int structFieldCount = type.getFieldNamesCount();
        OrcLazyObject[] structFields = new OrcLazyObject[structFieldCount];
        for (int i = 0; i < structFieldCount; i++) {
            int subtype = type.getSubtypes(i);
            if (included == null || included[subtype]) {
                structFields[i] = createLazyObject(subtype, types, included);
            }
        }
        return new OrcLazyRow(structFields, type.getFieldNamesList());
    }

    LazyTreeReader createLazyTreeReader(int columnId, List<OrcProto.Type> types, boolean[] included)
            throws IOException {
        OrcProto.Type type = types.get(columnId);
        switch (type.getKind()) {
        case BOOLEAN:
            return new LazyBooleanTreeReader(columnId, rowIndexStride);
        case BYTE:
            return new LazyByteTreeReader(columnId, rowIndexStride);
        case DOUBLE:
            return new LazyDoubleTreeReader(columnId, rowIndexStride);
        case FLOAT:
            return new LazyFloatTreeReader(columnId, rowIndexStride);
        case SHORT:
            return new LazyShortTreeReader(columnId, rowIndexStride);
        case LONG:
            return new LazyLongTreeReader(columnId, rowIndexStride);
        case INT:
            return new LazyIntTreeReader(columnId, rowIndexStride);
        case STRING:
            return new LazyStringTreeReader(columnId, rowIndexStride);
        case BINARY:
            return new LazyBinaryTreeReader(columnId, rowIndexStride);
        case TIMESTAMP:
            return new LazyTimestampTreeReader(columnId, rowIndexStride);
        case STRUCT:
            int structFieldCount = type.getFieldNamesCount();
            LazyTreeReader[] structFields = new LazyTreeReader[structFieldCount];
            for (int i = 0; i < structFieldCount; i++) {
                int subtype = type.getSubtypes(i);
                if (included == null || included[subtype]) {
                    structFields[i] = createLazyTreeReader(subtype, types, included);
                }
            }
            return new LazyStructTreeReader(columnId, rowIndexStride, structFields, type.getFieldNamesList());
        case LIST:
            LazyTreeReader elementReader = createLazyTreeReader(type.getSubtypes(0), types, included);
            return new LazyListTreeReader(columnId, rowIndexStride, elementReader);
        case MAP:
            LazyTreeReader keyReader = createLazyTreeReader(type.getSubtypes(0), types, included);
            LazyTreeReader valueReader = createLazyTreeReader(type.getSubtypes(1), types, included);
            return new LazyMapTreeReader(columnId, rowIndexStride, keyReader, valueReader);
        case UNION:
            int unionFieldCount = type.getSubtypesCount();
            LazyTreeReader[] unionFields = new LazyTreeReader[unionFieldCount];
            for (int i = 0; i < unionFieldCount; ++i) {
                unionFields[i] = createLazyTreeReader(type.getSubtypes(i), types, included);
            }
            return new LazyUnionTreeReader(columnId, rowIndexStride, unionFields);
        default:
            throw new IllegalArgumentException("Unsupported type " + type.getKind());
        }
    }

    OrcLazyObject createLazyObject(int columnId, List<OrcProto.Type> types, boolean[] included) throws IOException {
        OrcProto.Type type = types.get(columnId);
        switch (type.getKind()) {
        case BOOLEAN:
            return new OrcLazyBoolean((LazyBooleanTreeReader) createLazyTreeReader(columnId, types, included));
        case BYTE:
            return new OrcLazyByte((LazyByteTreeReader) createLazyTreeReader(columnId, types, included));
        case DOUBLE:
            return new OrcLazyDouble((LazyDoubleTreeReader) createLazyTreeReader(columnId, types, included));
        case FLOAT:
            return new OrcLazyFloat((LazyFloatTreeReader) createLazyTreeReader(columnId, types, included));
        case SHORT:
            return new OrcLazyShort((LazyShortTreeReader) createLazyTreeReader(columnId, types, included));
        case LONG:
            return new OrcLazyLong((LazyLongTreeReader) createLazyTreeReader(columnId, types, included));
        case INT:
            return new OrcLazyInt((LazyIntTreeReader) createLazyTreeReader(columnId, types, included));
        case STRING:
            return new OrcLazyString((LazyStringTreeReader) createLazyTreeReader(columnId, types, included));
        case BINARY:
            return new OrcLazyBinary((LazyBinaryTreeReader) createLazyTreeReader(columnId, types, included));
        case TIMESTAMP:
            return new OrcLazyTimestamp((LazyTimestampTreeReader) createLazyTreeReader(columnId, types, included));
        case STRUCT:
            return new OrcLazyStruct((LazyStructTreeReader) createLazyTreeReader(columnId, types, included));
        case LIST:
            return new OrcLazyList((LazyListTreeReader) createLazyTreeReader(columnId, types, included));
        case MAP:
            return new OrcLazyMap((LazyMapTreeReader) createLazyTreeReader(columnId, types, included));
        case UNION:
            return new OrcLazyUnion((LazyUnionTreeReader) createLazyTreeReader(columnId, types, included));
        default:
            throw new IllegalArgumentException("Unsupported type " + type.getKind());
        }
    }

    OrcProto.StripeFooter readStripeFooter(StripeInformation stripe) throws IOException {
        long offset = stripe.getOffset() + stripe.getIndexLength() + stripe.getDataLength();
        int tailLength = (int) stripe.getFooterLength();

        return OrcProto.StripeFooter
                .parseFrom(InStream.create("footer", file, offset, tailLength, codec, bufferSize));
    }

    private void readEntireStripeEagerly(StripeInformation stripe, long offset) throws IOException {
        byte[] buffer = new byte[(int) (stripe.getDataLength())];
        file.seek(offset + stripe.getIndexLength());
        file.readFully(buffer, 0, buffer.length);
        int sectionOffset = 0;
        for (OrcProto.Stream section : stripeFooter.getStreamsList()) {
            if (StreamName.getArea(section.getKind()) == StreamName.Area.DATA
                    || StreamName.getArea(section.getKind()) == StreamName.Area.DICTIONARY) {
                int sectionLength = (int) section.getLength();
                StreamName name = new StreamName(section.getColumn(), section.getKind());
                ByteBuffer sectionBuffer = ByteBuffer.wrap(buffer, sectionOffset, sectionLength);
                streams.put(name,
                        InStream.create(name.toString(), sectionBuffer, codec, bufferSize, section.getUseVInts()));
                sectionOffset += sectionLength;
            }
        }
    }

    private void readEntireStripeLazily(StripeInformation stripe, long offset) throws IOException {
        int sectionOffset = 0;
        for (OrcProto.Stream section : stripeFooter.getStreamsList()) {
            if (StreamName.getArea(section.getKind()) == StreamName.Area.DATA
                    || StreamName.getArea(section.getKind()) == StreamName.Area.DICTIONARY) {
                int sectionLength = (int) section.getLength();
                StreamName name = new StreamName(section.getColumn(), section.getKind());
                streams.put(name,
                        InStream.create(name.toString(), file, offset + stripe.getIndexLength() + sectionOffset,
                                sectionLength, codec, bufferSize, section.getUseVInts(), readStrides));
                sectionOffset += sectionLength;
            }
        }
    }

    private void readIncludedStreamsEagerly(StripeInformation stripe, List<OrcProto.Stream> streamList, long offset,
            int currentSection) throws IOException {
        long sectionOffset = stripe.getIndexLength();
        while (currentSection < streamList.size()) {
            int bytes = 0;

            // find the first section that shouldn't be read
            int excluded = currentSection;
            while (excluded < streamList.size() && included[streamList.get(excluded).getColumn()]) {
                bytes += streamList.get(excluded++).getLength();
            }

            // actually read the bytes as a big chunk
            if (currentSection < excluded) {
                byte[] buffer = new byte[bytes];
                file.seek(offset + sectionOffset);
                file.readFully(buffer, 0, bytes);
                sectionOffset += bytes;

                // create the streams for the sections we just read
                bytes = 0;
                while (currentSection < excluded) {
                    OrcProto.Stream section = streamList.get(currentSection);
                    StreamName name = new StreamName(section.getColumn(), section.getKind());
                    this.streams.put(name,
                            InStream.create(name.toString(),
                                    ByteBuffer.wrap(buffer, bytes, (int) section.getLength()), codec, bufferSize,
                                    section.getUseVInts()));
                    currentSection++;
                    bytes += section.getLength();
                }
            }

            // skip forward until we get back to a section that we need
            while (currentSection < streamList.size() && !included[streamList.get(currentSection).getColumn()]) {
                sectionOffset += streamList.get(currentSection).getLength();
                currentSection++;
            }
        }
    }

    private void readIncludedStreamsLazily(StripeInformation stripe, List<OrcProto.Stream> streamList, long offset,
            int currentSection) throws IOException {
        long sectionOffset = stripe.getIndexLength();
        while (currentSection < streamList.size()) {
            if (included[streamList.get(currentSection).getColumn()]) {
                OrcProto.Stream section = streamList.get(currentSection);
                StreamName name = new StreamName(section.getColumn(), section.getKind());
                this.streams.put(name, InStream.create(name.toString(), file, offset + sectionOffset,
                        (int) section.getLength(), codec, bufferSize, section.getUseVInts(), readStrides));
            }
            sectionOffset += streamList.get(currentSection).getLength();
            currentSection += 1;
        }
    }

    protected boolean shouldReadEagerly(StripeInformation stripe, int currentSection) {
        if (readEagerlyFromHdfsBytes <= 0) {
            return readEagerlyFromHdfs;
        }

        long inputBytes = 0;
        if (included == null) {
            inputBytes = stripe.getDataLength();
        } else {
            List<OrcProto.Stream> streamList = stripeFooter.getStreamsList();
            for (int i = currentSection; i < streamList.size(); i++) {
                if (included[streamList.get(i).getColumn()]) {
                    inputBytes += streamList.get(i).getLength();
                }
            }
        }

        return inputBytes <= readEagerlyFromHdfsBytes;
    }

    private void readStripe() throws IOException {
        StripeInformation stripe = stripes.get(currentStripe);
        stripeFooter = readStripeFooter(stripe);
        long offset = stripe.getOffset();
        streams.clear();

        // if we aren't projecting columns, just read the whole stripe
        if (included == null) {
            if (shouldReadEagerly(stripe, 0)) {
                readEntireStripeEagerly(stripe, offset);
            } else {
                readEntireStripeLazily(stripe, offset);
            }
        } else {
            List<OrcProto.Stream> streamList = stripeFooter.getStreamsList();
            // the index of the current section
            int currentSection = 0;
            while (currentSection < streamList.size()
                    && StreamName.getArea(streamList.get(currentSection).getKind()) != StreamName.Area.DATA
                    && StreamName.getArea(streamList.get(currentSection).getKind()) != StreamName.Area.DICTIONARY) {
                currentSection += 1;
            }

            if (shouldReadEagerly(stripe, currentSection)) {
                readIncludedStreamsEagerly(stripe, streamList, offset, currentSection);
            } else {
                readIncludedStreamsLazily(stripe, streamList, offset, currentSection);
            }
        }

        rowInStripe = 0;
        rowCountInStripe = stripe.getNumberOfRows();
        rowBaseInStripe = 0;
        for (int i = 0; i < currentStripe; ++i) {
            rowBaseInStripe += stripes.get(i).getNumberOfRows();
        }
        readRowIndex();
        ReaderWriterProfiler.start(ReaderWriterProfiler.Counter.DESERIALIZATION_TIME);
        reader.startStripe(streams, stripeFooter.getColumnsList(), indexes, rowBaseInStripe);
        ReaderWriterProfiler.end(ReaderWriterProfiler.Counter.DESERIALIZATION_TIME);

        // We don't need the indices anymore, so free them
        for (int i = 0; i < indexes.length; ++i) {
            indexes[i] = null;
        }
    }

    @Override
    public boolean hasNext() throws IOException {
        return rowInStripe < rowCountInStripe || currentStripe < stripes.size() - 1;
    }

    @Override
    public Object next(Object previous) throws IOException {
        if (rowInStripe >= rowCountInStripe) {
            reader.close();
            currentStripe += 1;
            readStripe();
        }
        rowInStripe += 1;

        if (previous == null) {
            previous = reader;
        } else if (previous != reader) {
            ((OrcLazyRow) previous).reset(reader);
            reader = (OrcLazyRow) previous;
        }

        ((OrcLazyObject) previous).next();
        return previous;
    }

    @Override
    public void close() throws IOException {
        file.close();
        reader.close();
    }

    @Override
    public long getRowNumber() {
        return rowInStripe + rowBaseInStripe + firstRow;
    }

    /**
     * Return the fraction of rows that have been read from the selected.
     * section of the file
     * @return fraction between 0.0 and 1.0 of rows consumed
     */
    @Override
    public float getProgress() {
        return ((float) rowBaseInStripe + rowInStripe) / totalRowCount;
    }

    private int findStripe(long rowNumber) {
        if (rowNumber < 0) {
            throw new IllegalArgumentException("Seek to a negative row number " + rowNumber);
        } else if (rowNumber < firstRow) {
            throw new IllegalArgumentException("Seek before reader range " + rowNumber);
        }
        rowNumber -= firstRow;
        for (int i = 0; i < stripes.size(); i++) {
            StripeInformation stripe = stripes.get(i);
            if (stripe.getNumberOfRows() > rowNumber) {
                return i;
            }
            rowNumber -= stripe.getNumberOfRows();
        }
        throw new IllegalArgumentException("Seek after the end of reader range");
    }

    private void readRowIndex() throws IOException {
        long offset = stripes.get(currentStripe).getOffset();
        for (OrcProto.Stream stream : stripeFooter.getStreamsList()) {
            if (stream.getKind() == OrcProto.Stream.Kind.ROW_INDEX) {
                int col = stream.getColumn();
                if ((included == null || included[col]) && indexes[col] == null) {
                    indexes[col] = OrcProto.RowIndex.parseFrom(InStream.create("index", file, offset,
                            (int) stream.getLength(), codec, bufferSize, stream.getUseVInts(), readStrides));
                }
            }
            offset += stream.getLength();
        }
    }

    @Override
    public void seekToRow(long rowNumber) throws IOException {
        // Update the stripe
        int rightStripe = findStripe(rowNumber);
        if (rightStripe != this.currentStripe) {
            this.currentStripe = rightStripe;
            readStripe();
        }

        // Update the row number within the stripe
        this.rowInStripe = rowNumber - this.rowBaseInStripe - this.firstRow;

        // Update the reader
        this.reader.seekToRow(rowNumber);
    }

    @Override
    public OrcLazyRow getReader() {
        return reader;
    }
}