org.apache.hadoop.hdfs.server.datanode.TestDataNodeVolumeFailure.java Source code

Introduction

Here is the source code for org.apache.hadoop.hdfs.server.datanode.TestDataNodeVolumeFailure.java, a JUnit test that checks HDFS block files and NameNode block locations after a DataNode volume failure.
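
The test brings up a two-DataNode MiniDFSCluster, deletes the block files under one storage directory and marks it read-only to simulate a failed volume, then verifies that the NameNode's view of block locations matches the block files remaining on disk and that a new file can still be replicated to both nodes. Before the listing, here is a minimal sketch of the configuration the test depends on, assuming hadoop-hdfs and its test jars are on the classpath; it is an illustration, not part of the source below.

    Configuration conf = new HdfsConfiguration();
    // tolerate one failed volume per datanode; at the default of 0, the first
    // volume failure would take the whole datanode out of service
    conf.setInt(DFSConfigKeys.DFS_DATANODE_FAILED_VOLUMES_TOLERATED_KEY, 1);
    MiniDFSCluster cluster = new MiniDFSCluster.Builder(conf).numDataNodes(2).build();
    cluster.waitActive(); // wait until the cluster is fully up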

Source

/**
 * Licensed to the Apache Software Foundation (ASF) under one
 * or more contributor license agreements.  See the NOTICE file
 * distributed with this work for additional information
 * regarding copyright ownership.  The ASF licenses this file
 * to you under the Apache License, Version 2.0 (the
 * "License"); you may not use this file except in compliance
 * with the License.  You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
package org.apache.hadoop.hdfs.server.datanode;

import java.io.File;
import java.io.FilenameFilter;
import java.io.IOException;
import java.net.InetSocketAddress;
import java.net.Socket;
import java.util.HashMap;
import java.util.List;
import java.util.Map;
import org.apache.commons.logging.Log;
import org.apache.commons.logging.LogFactory;

import org.apache.hadoop.conf.Configuration;
import org.apache.hadoop.fs.FileSystem;
import org.apache.hadoop.fs.Path;
import org.apache.hadoop.hdfs.BlockReader;
import org.apache.hadoop.hdfs.BlockReaderFactory;
import org.apache.hadoop.hdfs.DFSTestUtil;
import org.apache.hadoop.hdfs.HdfsConfiguration;
import org.apache.hadoop.hdfs.MiniDFSCluster;
import org.apache.hadoop.hdfs.protocol.DatanodeInfo;
import org.apache.hadoop.hdfs.protocol.ExtendedBlock;
import org.apache.hadoop.hdfs.protocol.LocatedBlock;
import org.apache.hadoop.hdfs.server.blockmanagement.BlockManagerTestUtil;
import org.apache.hadoop.hdfs.server.common.HdfsServerConstants;
import org.apache.hadoop.hdfs.server.namenode.FSNamesystem;
import org.apache.hadoop.hdfs.server.protocol.DatanodeRegistration;
import org.apache.hadoop.hdfs.server.protocol.NamenodeProtocols;
import org.apache.hadoop.hdfs.DFSConfigKeys;
import org.apache.hadoop.net.NetUtils;

import org.junit.After;
import org.junit.Before;
import org.junit.Test;
import static org.junit.Assert.*;

/**
 * Fine-grained testing of block files and locations after volume failure.
 */
public class TestDataNodeVolumeFailure {
    static final Log LOG = LogFactory.getLog(TestDataNodeVolumeFailure.class);
    final private int block_size = 512;
    MiniDFSCluster cluster = null;
    int dn_num = 2;
    int blocks_num = 30;
    short repl = 2;
    File dataDir = null;
    File data_fail = null;
    File failedDir = null;

    // maps a block to its meta files (physical files) and locs (NameNode locations)
    private class BlockLocs {
        public int num_files = 0;
        public int num_locs = 0;
    }

    // block id to BlockLocs
    Map<String, BlockLocs> block_map = new HashMap<String, BlockLocs>();

    @Before
    public void setUp() throws Exception {
        // bring up a cluster of 2
        Configuration conf = new HdfsConfiguration();
        conf.setLong(DFSConfigKeys.DFS_BLOCK_SIZE_KEY, block_size);
        // Allow a single volume failure (there are two volumes)
        conf.setInt(DFSConfigKeys.DFS_DATANODE_FAILED_VOLUMES_TOLERATED_KEY, 1);
        cluster = new MiniDFSCluster.Builder(conf).numDataNodes(dn_num).build();
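        // block until the cluster is up and both datanodes have registered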
        cluster.waitActive();
    }

    @After
    public void tearDown() throws Exception {
        if (data_fail != null) {
            data_fail.setWritable(true);
        }
        if (failedDir != null) {
            failedDir.setWritable(true);
        }
        if (cluster != null) {
            cluster.shutdown();
        }
    }

    /*
     * Verify that the number of blocks and files is correct after a volume
     * failure, and that we can still replicate to both datanodes after a
     * single volume failure if the configuration allows it.
     */
    @Test
    public void testVolumeFailure() throws IOException {
        FileSystem fs = cluster.getFileSystem();
        dataDir = new File(cluster.getDataDirectory());
        LOG.info("Data dir: is " + dataDir.getPath());

        // Data dir structure is dataDir/data[1-4]/[current,tmp...]
        // data1,2 belong to datanode 1; data3,4 to datanode 2
        String filename = "/test.txt";
        Path filePath = new Path(filename);

        // use only a small number of blocks to avoid creating subdirectories in the data dir
        int filesize = block_size * blocks_num;
        DFSTestUtil.createFile(fs, filePath, filesize, repl, 1L);
        DFSTestUtil.waitReplication(fs, filePath, repl);
        LOG.info("file " + filename + "(size " + filesize + ") is created and replicated");

        // fail the volume: delete its block files and make the directory non-writable
        data_fail = new File(dataDir, "data3");
        failedDir = MiniDFSCluster.getFinalizedDir(dataDir, cluster.getNamesystem().getBlockPoolId());
        if (failedDir.exists() &&
        //!FileUtil.fullyDelete(failedDir)
                !deteteBlocks(failedDir)) {
            throw new IOException("Could not delete hdfs directory '" + failedDir + "'");
        }
        data_fail.setReadOnly();
        failedDir.setReadOnly();
        LOG.info("Deleteing " + failedDir.getPath() + "; exist=" + failedDir.exists());

        // access all the blocks on the "failed" DataNode, 
        // we need to make sure that the "failed" volume is being accessed - 
        // and that will cause failure, blocks removal, "emergency" block report
        triggerFailure(filename, filesize);

        // make sure a block report is sent 
        DataNode dn = cluster.getDataNodes().get(1); //corresponds to dir data3
        String bpid = cluster.getNamesystem().getBlockPoolId();
        DatanodeRegistration dnR = dn.getDNRegistrationForBP(bpid);
        long[] bReport = dn.getFSDataset().getBlockReport(bpid).getBlockListAsLongs();
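        // send the report over RPC so the NameNode learns about the lost
        // replicas immediately, rather than waiting for the next periodic report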
        cluster.getNameNodeRpc().blockReport(dnR, bpid, bReport);

        // verify number of blocks and files...
        verify(filename, filesize);

        // create another file (with one volume failed).
        LOG.info("creating file test1.txt");
        Path fileName1 = new Path("/test1.txt");
        DFSTestUtil.createFile(fs, fileName1, filesize, repl, 1L);

        // should be able to replicate to both nodes (2 DN, repl=2)
        DFSTestUtil.waitReplication(fs, fileName1, repl);
        LOG.info("file " + fileName1.getName() + " is created and replicated");
    }

    /**
     * Verifies two things:
     *  1. the number of locations the NameNode holds for each block
     *     matches the number of actual block files
     *  2. block files plus pending replications equal the total number of
     *     blocks the file has, including replication (the HDFS file has 30
     *     blocks, repl=2, so 60 in total)
     * @param fn file name
     * @param fs file size
     * @throws IOException
     */
    private void verify(String fn, int fs) throws IOException {
        // now count how many physical blocks are there
        int totalReal = countRealBlocks(block_map);
        LOG.info("countRealBlocks counted " + totalReal + " blocks");

        // count how many blocks are stored in NN structures
        int totalNN = countNNBlocks(block_map, fn, fs);
        LOG.info("countNNBlocks counted " + totalNN + " blocks");

        for (String bid : block_map.keySet()) {
            BlockLocs bl = block_map.get(bid);
            // LOG.info(bid + "->" + bl.num_files + "vs." + bl.num_locs);
            // the number of physical files (1 or 2) should equal the number
            // of datanodes in the block's location list
            assertEquals("Num files should match num locations", bl.num_files, bl.num_locs);
        }
        assertEquals("Num physical blocks should match num stored in the NN", totalReal, totalNN);

        // now check the number of under-replicated blocks
        FSNamesystem fsn = cluster.getNamesystem();
        // force update of all the metric counts by calling computeDatanodeWork
        BlockManagerTestUtil.getComputedDatanodeWork(fsn.getBlockManager());
        // get all the counts 
        long underRepl = fsn.getUnderReplicatedBlocks();
        long pendRepl = fsn.getPendingReplicationBlocks();
        long totalRepl = underRepl + pendRepl;
        LOG.info("underreplicated after = " + underRepl + " and pending repl =" + pendRepl + "; total underRepl = "
                + totalRepl);

        LOG.info("total blocks (real and replicating):" + (totalReal + totalRepl) + " vs. all files blocks "
                + blocks_num * 2);

        // all blocks of the file should be accounted for: real replicas plus those still replicating
        assertEquals("Incorrect total block count", totalReal + totalRepl, blocks_num * repl);
    }

    /**
     * Access each block of the file on the 2nd DataNode until one access
     * fails, triggering the volume failure handling.
     * @param path file path
     * @param size file size
     * @throws IOException
     */
    private void triggerFailure(String path, long size) throws IOException {
        NamenodeProtocols nn = cluster.getNameNodeRpc();
        List<LocatedBlock> locatedBlocks = nn.getBlockLocations(path, 0, size).getLocatedBlocks();

        for (LocatedBlock lb : locatedBlocks) {
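            // read the replica at index 1 of the NameNode's location list;
            // the test expects this to be the datanode with the disabled volume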
            DatanodeInfo dinfo = lb.getLocations()[1];
            ExtendedBlock b = lb.getBlock();
            try {
                accessBlock(dinfo, lb);
            } catch (IOException e) {
                LOG.info("Failure triggered, on block: " + b.getBlockId()
                        + "; corresponding volume should be removed by now");
                break;
            }
        }
    }

    /**
     * Simulate a volume failure by deleting all the block files in the directory.
     * @param dir directory whose block files are deleted
     * @return true if all block files were deleted
     */
    private boolean deleteBlocks(File dir) {
        File[] fileList = dir.listFiles();
        if (fileList == null) {
            // listFiles() returns null if dir is not a directory or cannot be read
            return false;
        }
        for (File f : fileList) {
            if (f.getName().startsWith("blk_")) {
                if (!f.delete()) {
                    return false;
                }
            }
        }
        return true;
    }

    /**
     * Try to read a block from a datanode; throws an IOException if the read fails.
     * @param datanode datanode to read from
     * @param lblock block to read
     * @throws IOException
     */
    private void accessBlock(DatanodeInfo datanode, LocatedBlock lblock) throws IOException {
        ExtendedBlock block = lblock.getBlock();
        InetSocketAddress targetAddr = NetUtils.createSocketAddr(datanode.getName());

        Socket s = new Socket();
        s.connect(targetAddr, HdfsServerConstants.READ_TIMEOUT);
        s.setSoTimeout(HdfsServerConstants.READ_TIMEOUT);

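        // open a block reader the way a DFS client would; the trailing
        // arguments 0, -1, 4096 are start offset, length, and buffer size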
        String file = BlockReaderFactory.getFileName(targetAddr, "test-blockpoolid", block.getBlockId());
        BlockReader blockReader = BlockReaderFactory.newBlockReader(s, file, block, lblock.getBlockToken(), 0, -1,
                4096);

        // nothing more to do: if the block is gone, newBlockReader throws an IOException
    }

    /**
     * Count the datanode locations the NameNode reports for each block of a
     * file and record them in the map.
     * @param map block id to BlockLocs
     * @param path file path
     * @param size file size
     * @return total number of block locations
     * @throws IOException
     */
    private int countNNBlocks(Map<String, BlockLocs> map, String path, long size) throws IOException {
        int total = 0;

        NamenodeProtocols nn = cluster.getNameNodeRpc();
        List<LocatedBlock> locatedBlocks = nn.getBlockLocations(path, 0, size).getLocatedBlocks();
        //LOG.info("Number of blocks: " + locatedBlocks.size()); 

        for (LocatedBlock lb : locatedBlocks) {
            String blockId = "" + lb.getBlock().getBlockId();
            //System.out.print(blockId + ": ");
            DatanodeInfo[] dn_locs = lb.getLocations();
            BlockLocs bl = map.get(blockId);
            if (bl == null) {
                bl = new BlockLocs();
            }
            total += dn_locs.length;
            bl.num_locs += dn_locs.length;
            map.put(blockId, bl);
        }
        return total;
    }

    /**
     * Count real blocks by counting *.meta files in all the storage dirs.
     * @param map block id to BlockLocs
     * @return total number of meta files found (one per block replica)
     */
    private int countRealBlocks(Map<String, BlockLocs> map) {
        int total = 0;
        final String bpid = cluster.getNamesystem().getBlockPoolId();
        for (int i = 0; i < dn_num; i++) {
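            // each datanode has two storage directories (volumes), indexed 0 and 1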
            for (int j = 0; j <= 1; j++) {
                File storageDir = MiniDFSCluster.getStorageDir(i, j);
                File dir = MiniDFSCluster.getFinalizedDir(storageDir, bpid);
                if (dir == null) {
                    LOG.info("dir is null for dn=" + i + " and data_dir=" + j);
                    continue;
                }

                String[] res = metaFilesInDir(dir);
                if (res == null) {
                    LOG.info("res is null for dir = " + dir + " i=" + i + " and j=" + j);
                    continue;
                }
                //LOG.info("for dn" + i + "." + j + ": " + dir + "=" + res.length+ " files");

                //int ii = 0;
                for (String s : res) {
                    // meta file names look like blk_<blockId>_<genStamp>.meta;
                    // the block id is the substring between the first and last '_'
                    assertNotNull("Block file name should not be null", s);
                    String bid = s.substring(s.indexOf("_") + 1, s.lastIndexOf("_"));
                    //LOG.info(ii++ + ". block " + s + "; id=" + bid);
                    BlockLocs val = map.get(bid);
                    if (val == null) {
                        val = new BlockLocs();
                    }
                    val.num_files++; // one more file for the block
                    map.put(bid, val);

                }
                //LOG.info("dir1="+dir.getPath() + "blocks=" + res.length);
                //LOG.info("dir2="+dir2.getPath() + "blocks=" + res2.length);

                total += res.length;
            }
        }
        return total;
    }

    /*
     * list the names of the *.meta files in the dir
     */
    private String[] metaFilesInDir(File dir) {
        String[] res = dir.list(new FilenameFilter() {
            public boolean accept(File dir, String name) {
                return name.startsWith("blk_") && name.endsWith(FSDataset.METADATA_EXTENSION);
            }
        });
        return res;
    }
}