PerformanceEvaluation.java Source code

Introduction

Here is the source code for PerformanceEvaluation.java
Source

/**
 * Copyright 2007 The Apache Software Foundation
 *
 * Licensed to the Apache Software Foundation (ASF) under one
 * or more contributor license agreements.  See the NOTICE file
 * distributed with this work for additional information
 * regarding copyright ownership.  The ASF licenses this file
 * to you under the Apache License, Version 2.0 (the
 * "License"); you may not use this file except in compliance
 * with the License.  You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
import org.apache.hadoop.hbase.*;
import java.io.DataInput;
import java.io.DataOutput;
import java.io.IOException;
import java.io.PrintStream;
import java.io.File;
import java.text.SimpleDateFormat;
import java.util.ArrayList;
import java.util.Date;
import java.util.List;
import java.util.Map;
import java.util.Random;
import java.util.TreeMap;
import java.util.Arrays;
import java.util.regex.Matcher;
import java.util.regex.Pattern;
import java.lang.reflect.Constructor;

import org.apache.commons.logging.Log;
import org.apache.commons.logging.LogFactory;
import org.apache.hadoop.conf.Configuration;
import org.apache.hadoop.fs.FSDataInputStream;
import org.apache.hadoop.fs.FileStatus;
import org.apache.hadoop.fs.FileSystem;
import org.apache.hadoop.fs.Path;
import org.apache.hadoop.hbase.client.Get;
import org.apache.hadoop.hbase.client.HBaseAdmin;
import org.apache.hadoop.hbase.client.HTable;
import org.apache.hadoop.hbase.client.Put;
import org.apache.hadoop.hbase.client.Result;
import org.apache.hadoop.hbase.client.ResultScanner;
import org.apache.hadoop.hbase.client.Scan;
import org.apache.hadoop.hbase.filter.PageFilter;
import org.apache.hadoop.hbase.filter.WhileMatchFilter;
import org.apache.hadoop.hbase.filter.Filter;
import org.apache.hadoop.hbase.filter.SingleColumnValueFilter;
import org.apache.hadoop.hbase.filter.CompareFilter;
import org.apache.hadoop.hbase.filter.BinaryComparator;
import org.apache.hadoop.hbase.mapreduce.TableMapReduceUtil;
import org.apache.hadoop.hbase.util.Bytes;
import org.apache.hadoop.hbase.util.FSUtils;
import org.apache.hadoop.hbase.util.Hash;
import org.apache.hadoop.hbase.util.MurmurHash;
import org.apache.hadoop.hbase.util.Pair;
import org.apache.hadoop.hbase.zookeeper.MiniZooKeeperCluster;
import org.apache.hadoop.hdfs.MiniDFSCluster;
import org.apache.hadoop.io.LongWritable;
import org.apache.hadoop.io.NullWritable;
import org.apache.hadoop.io.Text;
import org.apache.hadoop.io.Writable;
import org.apache.hadoop.mapreduce.InputSplit;
import org.apache.hadoop.mapreduce.Job;
import org.apache.hadoop.mapreduce.JobContext;
import org.apache.hadoop.mapreduce.Mapper;
import org.apache.hadoop.mapreduce.RecordReader;
import org.apache.hadoop.mapreduce.TaskAttemptContext;
import org.apache.hadoop.mapreduce.lib.input.FileInputFormat;
import org.apache.hadoop.mapreduce.lib.output.TextOutputFormat;
import org.apache.hadoop.mapreduce.lib.reduce.LongSumReducer;
import org.apache.hadoop.util.LineReader;

/**
 * Script used evaluating HBase performance and scalability.  Runs a HBase
 * client that steps through one of a set of hardcoded tests or 'experiments'
 * (e.g. a random reads test, a random writes test, etc.). Pass on the
 * command-line which test to run and how many clients are participating in
 * this experiment. Run <code>java PerformanceEvaluation --help</code> to
 * obtain usage.
 *
 * <p>This class sets up and runs the evaluation programs described in
 * Section 7, <i>Performance Evaluation</i>, of the <a
 * href="http://labs.google.com/papers/bigtable.html">Bigtable</a>
 * paper, pages 8-10.
 *
 * <p>If number of clients > 1, we start up a MapReduce job. Each map task
 * runs an individual client. Each client does about 1GB of data.
 */
public class PerformanceEvaluation {
    protected static final Log LOG = LogFactory.getLog(PerformanceEvaluation.class.getName());

    private static final int ROW_LENGTH = 1000;
    private static final int ONE_GB = 1024 * 1024 * 1000;
    private static final int ROWS_PER_GB = ONE_GB / ROW_LENGTH;

    public static final byte[] TABLE_NAME = Bytes.toBytes("TestTable");
    public static final byte[] FAMILY_NAME = Bytes.toBytes("info");
    public static final byte[] QUALIFIER_NAME = Bytes.toBytes("data");

    public static int SCANNER_CACHING = 30;

    protected static final HTableDescriptor TABLE_DESCRIPTOR;
    static {
        TABLE_DESCRIPTOR = new HTableDescriptor(TABLE_NAME);
        TABLE_DESCRIPTOR.addFamily(new HColumnDescriptor(FAMILY_NAME));
    }

    protected Map<String, CmdDescriptor> commands = new TreeMap<String, CmdDescriptor>();

    volatile Configuration conf;
    private boolean miniCluster = false;
    private boolean nomapred = false;
    private int N = 1;
    private int R = ROWS_PER_GB;
    private int S = SCANNER_CACHING;
    private boolean flushCommits = true;
    private boolean writeToWAL = true;

    private static final Path PERF_EVAL_DIR = new Path("performance_evaluation");
    /**
     * Regex to parse lines in input file passed to mapreduce task.
     */
    public static final Pattern LINE_PATTERN = Pattern.compile("startRow=(\\d+),\\s+"
            + "perClientRunRows=(\\d+),\\s+" + "totalRows=(\\d+),\\s+" + "clients=(\\d+),\\s+"
            + "flushCommits=(\\w+),\\s+" + "writeToWAL=(\\w+),\\s+" + "scanCache=(\\d+)");

    /**
     * Enum for map metrics.  Keep it out here rather than inside in the Map
     * inner-class so we can find associated properties.
     */
    protected static enum Counter {
        /** elapsed time */
        ELAPSED_TIME,
        /** number of rows */
        ROWS
    }

    /**
     * Constructor
     * @param c Configuration object
     */
    public PerformanceEvaluation(final Configuration c) {
        this.conf = c;

        addCommandDescriptor(RandomReadTest.class, "randomRead", "Run random read test");
        addCommandDescriptor(RandomSeekScanTest.class, "randomSeekScan", "Run random seek and scan 100 test");
        addCommandDescriptor(RandomScanWithRange10Test.class, "scanRange10",
                "Run random seek scan with both start and stop row (max 10 rows)");
        addCommandDescriptor(RandomScanWithRange100Test.class, "scanRange100",
                "Run random seek scan with both start and stop row (max 100 rows)");
        addCommandDescriptor(RandomScanWithRange1000Test.class, "scanRange1000",
                "Run random seek scan with both start and stop row (max 1000 rows)");
        addCommandDescriptor(RandomScanWithRange10000Test.class, "scanRange10000",
                "Run random seek scan with both start and stop row (max 10000 rows)");
        addCommandDescriptor(RandomWriteTest.class, "randomWrite", "Run random write test");
        addCommandDescriptor(SequentialReadTest.class, "sequentialRead", "Run sequential read test");
        addCommandDescriptor(SequentialWriteTest.class, "sequentialWrite", "Run sequential write test");
        addCommandDescriptor(ScanTest.class, "scan", "Run scan test (read every row)");
        addCommandDescriptor(FilteredScanTest.class, "filterScan",
                "Run scan test using a filter to find a specific row based on it's value (make sure to use --rows=20)");
    }

    protected void addCommandDescriptor(Class<? extends Test> cmdClass, String name, String description) {
        CmdDescriptor cmdDescriptor = new CmdDescriptor(cmdClass, name, description);
        commands.put(name, cmdDescriptor);
    }

    /**
     * Implementations can have their status set.
     */
    static interface Status {
        /**
         * Sets status
         * @param msg status message
         * @throws IOException
         */
        void setStatus(final String msg) throws IOException;
    }

    /**
     *  This class works as the InputSplit of Performance Evaluation
     *  MapReduce InputFormat, and the Record Value of RecordReader.
     *  Each map task will only read one record from a PeInputSplit,
     *  the record value is the PeInputSplit itself.
     */
    public static class PeInputSplit extends InputSplit implements Writable {
        private int startRow = 0;
        private int rows = 0;
        private int scanCache = 0;
        private int totalRows = 0;
        private int clients = 0;
        private boolean flushCommits = false;
        private boolean writeToWAL = true;

        public PeInputSplit() {
            this.startRow = 0;
            this.rows = 0;
            this.totalRows = 0;
            this.clients = 0;
            this.scanCache = 0;
            this.flushCommits = false;
            this.writeToWAL = true;
        }

        public PeInputSplit(int startRow, int rows, int totalRows, int clients, boolean flushCommits,
                boolean writeToWAL, int scanCache) {
            this.startRow = startRow;
            this.rows = rows;
            this.totalRows = totalRows;
            this.clients = clients;
            this.flushCommits = flushCommits;
            this.writeToWAL = writeToWAL;
            this.scanCache = scanCache;
        }

        @Override
        public void readFields(DataInput in) throws IOException {
            this.startRow = in.readInt();
            this.rows = in.readInt();
            this.totalRows = in.readInt();
            this.clients = in.readInt();
            this.flushCommits = in.readBoolean();
            this.writeToWAL = in.readBoolean();
            this.scanCache = in.readInt();
        }

        @Override
        public void write(DataOutput out) throws IOException {
            out.writeInt(startRow);
            out.writeInt(rows);
            out.writeInt(totalRows);
            out.writeInt(clients);
            out.writeBoolean(flushCommits);
            out.writeBoolean(writeToWAL);
            out.writeInt(scanCache);
        }

        @Override
        public long getLength() throws IOException, InterruptedException {
            return 0;
        }

        @Override
        public String[] getLocations() throws IOException, InterruptedException {
            return new String[0];
        }

        public int getStartRow() {
            return startRow;
        }

        public int getRows() {
            return rows;
        }

        public int getScanCache() {
            return scanCache;
        }

        public int getTotalRows() {
            return totalRows;
        }

        public int getClients() {
            return clients;
        }

        public boolean isFlushCommits() {
            return flushCommits;
        }

        public boolean isWriteToWAL() {
            return writeToWAL;
        }
    }

    /**
     *  InputFormat of Performance Evaluation MapReduce job.
     *  It extends from FileInputFormat, want to use it's methods such as setInputPaths().
     */
    public static class PeInputFormat extends FileInputFormat<NullWritable, PeInputSplit> {

        @Override
        public List<InputSplit> getSplits(JobContext job) throws IOException {
            // generate splits
            List<InputSplit> splitList = new ArrayList<InputSplit>();

            for (FileStatus file : listStatus(job)) {
                Path path = file.getPath();
                FileSystem fs = path.getFileSystem(job.getConfiguration());
                FSDataInputStream fileIn = fs.open(path);
                LineReader in = new LineReader(fileIn, job.getConfiguration());
                int lineLen = 0;
                while (true) {
                    Text lineText = new Text();
                    lineLen = in.readLine(lineText);
                    if (lineLen <= 0) {
                        break;
                    }
                    Matcher m = LINE_PATTERN.matcher(lineText.toString());
                    if ((m != null) && m.matches()) {
                        int startRow = Integer.parseInt(m.group(1));
                        int rows = Integer.parseInt(m.group(2));
                        int totalRows = Integer.parseInt(m.group(3));
                        int clients = Integer.parseInt(m.group(4));
                        boolean flushCommits = Boolean.parseBoolean(m.group(5));
                        boolean writeToWAL = Boolean.parseBoolean(m.group(6));
                        int scanCache = Integer.parseInt(m.group(7));

                        LOG.debug("split[" + splitList.size() + "] " + " startRow=" + startRow + " rows=" + rows
                                + " totalRows=" + totalRows + " clients=" + clients + " flushCommits="
                                + flushCommits + " writeToWAL=" + writeToWAL);

                        PeInputSplit newSplit = new PeInputSplit(startRow, rows, totalRows, clients, flushCommits,
                                writeToWAL, scanCache);
                        splitList.add(newSplit);
                    }
                }
                in.close();
            }

            LOG.info("Total # of splits: " + splitList.size());
            return splitList;
        }

        @Override
        public RecordReader<NullWritable, PeInputSplit> createRecordReader(InputSplit split,
                TaskAttemptContext context) {
            return new PeRecordReader();
        }

        public static class PeRecordReader extends RecordReader<NullWritable, PeInputSplit> {
            private boolean readOver = false;
            private PeInputSplit split = null;
            private NullWritable key = null;
            private PeInputSplit value = null;

            @Override
            public void initialize(InputSplit split, TaskAttemptContext context)
                    throws IOException, InterruptedException {
                this.readOver = false;
                this.split = (PeInputSplit) split;
            }

            @Override
            public boolean nextKeyValue() throws IOException, InterruptedException {
                if (readOver) {
                    return false;
                }

                key = NullWritable.get();
                value = (PeInputSplit) split;

                readOver = true;
                return true;
            }

            @Override
            public NullWritable getCurrentKey() throws IOException, InterruptedException {
                return key;
            }

            @Override
            public PeInputSplit getCurrentValue() throws IOException, InterruptedException {
                return value;
            }

            @Override
            public float getProgress() throws IOException, InterruptedException {
                if (readOver) {
                    return 1.0f;
                } else {
                    return 0.0f;
                }
            }

            @Override
            public void close() throws IOException {
                // do nothing
            }
        }
    }

    /**
     * MapReduce job that runs a performance evaluation client in each map task.
     */
    public static class EvaluationMapTask extends Mapper<NullWritable, PeInputSplit, LongWritable, LongWritable> {

        /** configuration parameter name that contains the command */
        public final static String CMD_KEY = "EvaluationMapTask.command";
        /** configuration parameter name that contains the PE impl */
        public static final String PE_KEY = "EvaluationMapTask.performanceEvalImpl";

        private Class<? extends Test> cmd;
        private PerformanceEvaluation pe;

        @Override
        protected void setup(Context context) throws IOException, InterruptedException {
            this.cmd = forName(context.getConfiguration().get(CMD_KEY), Test.class);

            // this is required so that extensions of PE are instantiated within the
            // map reduce task...
            Class<? extends PerformanceEvaluation> peClass = forName(context.getConfiguration().get(PE_KEY),
                    PerformanceEvaluation.class);
            try {
                this.pe = peClass.getConstructor(Configuration.class).newInstance(context.getConfiguration());
            } catch (Exception e) {
                throw new IllegalStateException("Could not instantiate PE instance", e);
            }
        }

        private <Type> Class<? extends Type> forName(String className, Class<Type> type) {
            Class<? extends Type> clazz = null;
            try {
                clazz = Class.forName(className).asSubclass(type);
            } catch (ClassNotFoundException e) {
                throw new IllegalStateException("Could not find class for name: " + className, e);
            }
            return clazz;
        }

        protected void map(NullWritable key, PeInputSplit value, final Context context)
                throws IOException, InterruptedException {

            Status status = new Status() {
                public void setStatus(String msg) {
                    context.setStatus(msg);
                }
            };

            // Evaluation task
            long elapsedTime = this.pe.runOneClient(this.cmd, value.getStartRow(), value.getRows(),
                    value.getTotalRows(), value.isFlushCommits(), value.isWriteToWAL(), status,
                    value.getScanCache());
            // Collect how much time the thing took. Report as map output and
            // to the ELAPSED_TIME counter.
            context.getCounter(Counter.ELAPSED_TIME).increment(elapsedTime);
            context.getCounter(Counter.ROWS).increment(value.rows);
            context.write(new LongWritable(value.startRow), new LongWritable(elapsedTime));
            context.progress();
        }
    }

    /*
     * If table does not already exist, create.
     * @param c Client to use checking.
     * @return True if we created the table.
     * @throws IOException
     */
    private boolean checkTable(HBaseAdmin admin) throws IOException {
        HTableDescriptor tableDescriptor = getTableDescriptor();
        boolean tableExists = admin.tableExists(tableDescriptor.getName());
        if (!tableExists) {
            admin.createTable(tableDescriptor);
            LOG.info("Table " + tableDescriptor + " created");
        }
        return !tableExists;
    }

    protected HTableDescriptor getTableDescriptor() {
        return TABLE_DESCRIPTOR;
    }

    /*
     * We're to run multiple clients concurrently.  Setup a mapreduce job.  Run
     * one map per client.  Then run a single reduce to sum the elapsed times.
     * @param cmd Command to run.
     * @throws IOException
     */
    private void runNIsMoreThanOne(final Class<? extends Test> cmd)
            throws IOException, InterruptedException, ClassNotFoundException {
        checkTable(new HBaseAdmin(conf));
        if (this.nomapred) {
            doMultipleClients(cmd);
        } else {
            doMapReduce(cmd);
        }
    }

    /*
     * Run all clients in this vm each to its own thread.
     * @param cmd Command to run.
     * @throws IOException
     */
    private void doMultipleClients(final Class<? extends Test> cmd) throws IOException {
        final List<Thread> threads = new ArrayList<Thread>(this.N);
        final int perClientRows = R / N;
        for (int i = 0; i < this.N; i++) {
            Thread t = new Thread(Integer.toString(i)) {
                @Override
                public void run() {
                    super.run();
                    PerformanceEvaluation pe = new PerformanceEvaluation(conf);
                    int index = Integer.parseInt(getName());
                    try {
                        long elapsedTime = pe.runOneClient(cmd, index * perClientRows, perClientRows, R,
                                flushCommits, writeToWAL, new Status() {
                                    public void setStatus(final String msg) throws IOException {
                                        LOG.info("client-" + getName() + " " + msg);
                                    }
                                }, S);
                        LOG.info("Finished " + getName() + " in " + elapsedTime + "ms writing " + perClientRows
                                + " rows");
                    } catch (IOException e) {
                        throw new RuntimeException(e);
                    }
                }
            };
            threads.add(t);
        }
        for (Thread t : threads) {
            t.start();
        }
        for (Thread t : threads) {
            while (t.isAlive()) {
                try {
                    t.join();
                } catch (InterruptedException e) {
                    LOG.debug("Interrupted, continuing" + e.toString());
                }
            }
        }
    }

    /*
     * Run a mapreduce job.  Run as many maps as asked-for clients.
     * Before we start up the job, write out an input file with instruction
     * per client regards which row they are to start on.
     * @param cmd Command to run.
     * @throws IOException
     */
    private void doMapReduce(final Class<? extends Test> cmd)
            throws IOException, InterruptedException, ClassNotFoundException {
        Path inputDir = writeInputFile(this.conf);
        this.conf.set(EvaluationMapTask.CMD_KEY, cmd.getName());
        this.conf.set(EvaluationMapTask.PE_KEY, getClass().getName());
        Job job = new Job(this.conf);
        job.setJarByClass(PerformanceEvaluation.class);
        job.setJobName("HBase Performance Evaluation");

        job.setInputFormatClass(PeInputFormat.class);
        PeInputFormat.setInputPaths(job, inputDir);

        job.setOutputKeyClass(LongWritable.class);
        job.setOutputValueClass(LongWritable.class);

        job.setMapperClass(EvaluationMapTask.class);
        job.setReducerClass(LongSumReducer.class);

        job.setNumReduceTasks(1);

        job.setOutputFormatClass(TextOutputFormat.class);
        TextOutputFormat.setOutputPath(job, new Path(inputDir, "outputs"));

        TableMapReduceUtil.addDependencyJars(job);
        job.waitForCompletion(true);
    }

    /*
     * Write input file of offsets-per-client for the mapreduce job.
     * @param c Configuration
     * @return Directory that contains file written.
     * @throws IOException
     */
    private Path writeInputFile(final Configuration c) throws IOException {
        FileSystem fs = FileSystem.get(c);
        if (!fs.exists(PERF_EVAL_DIR)) {
            fs.mkdirs(PERF_EVAL_DIR);
        }
        SimpleDateFormat formatter = new SimpleDateFormat("yyyyMMddHHmmss");
        Path subdir = new Path(PERF_EVAL_DIR, formatter.format(new Date()));
        fs.mkdirs(subdir);
        Path inputFile = new Path(subdir, "input.txt");
        PrintStream out = new PrintStream(fs.create(inputFile));
        // Make input random.
        Map<Integer, String> m = new TreeMap<Integer, String>();
        Hash h = MurmurHash.getInstance();
        int perClientRows = (this.R / this.N);
        try {
            for (int i = 0; i < 10; i++) {
                for (int j = 0; j < N; j++) {
                    String s = "startRow=" + ((j * perClientRows) + (i * (perClientRows / 10)))
                            + ", perClientRunRows=" + (perClientRows / 10) + ", totalRows=" + this.R + ", clients="
                            + this.N + ", flushCommits=" + this.flushCommits + ", writeToWAL=" + this.writeToWAL
                            + ", scanCache=" + this.S;
                    int hash = h.hash(Bytes.toBytes(s));
                    m.put(hash, s);
                }
            }
            for (Map.Entry<Integer, String> e : m.entrySet()) {
                out.println(e.getValue());
            }
        } finally {
            out.close();
        }
        return subdir;
    }

    /**
     * Describes a command.
     */
    static class CmdDescriptor {
        private Class<? extends Test> cmdClass;
        private String name;
        private String description;

        CmdDescriptor(Class<? extends Test> cmdClass, String name, String description) {
            this.cmdClass = cmdClass;
            this.name = name;
            this.description = description;
        }

        public Class<? extends Test> getCmdClass() {
            return cmdClass;
        }

        public String getName() {
            return name;
        }

        public String getDescription() {
            return description;
        }
    }

    /**
     * Wraps up options passed to {@link org.apache.hadoop.hbase.PerformanceEvaluation.Test
     * tests}.  This makes the reflection logic a little easier to understand...
     */
    static class TestOptions {
        private int startRow;
        private int perClientRunRows;
        private int totalRows;
        private int scanCache;
        private byte[] tableName;
        private boolean flushCommits;
        private boolean writeToWAL = true;

        TestOptions() {
        }

        TestOptions(int startRow, int perClientRunRows, int totalRows, byte[] tableName, boolean flushCommits,
                boolean writeToWAL, int scanCache) {
            this.startRow = startRow;
            this.perClientRunRows = perClientRunRows;
            this.totalRows = totalRows;
            this.tableName = tableName;
            this.flushCommits = flushCommits;
            this.writeToWAL = writeToWAL;
            this.scanCache = scanCache;
        }

        public int getStartRow() {
            return startRow;
        }

        public int getPerClientRunRows() {
            return perClientRunRows;
        }

        public int getTotalRows() {
            return totalRows;
        }

        public byte[] getTableName() {
            return tableName;
        }

        public boolean isFlushCommits() {
            return flushCommits;
        }

        public boolean isWriteToWAL() {
            return writeToWAL;
        }

        public int getScanCache() {
            return scanCache;
        }

    }

    /*
     * A test.
     * Subclass to particularize what happens per row.
     */
    static abstract class Test {
        // Below is make it so when Tests are all running in the one
        // jvm, that they each have a differently seeded Random.
        private static final Random randomSeed = new Random(System.currentTimeMillis());

        private static long nextRandomSeed() {
            return randomSeed.nextLong();
        }

        protected final Random rand = new Random(nextRandomSeed());

        protected final int startRow;
        protected final int perClientRunRows;
        protected final int totalRows;
        private final Status status;
        protected byte[] tableName;
        protected HBaseAdmin admin;
        protected HTable table;
        protected volatile Configuration conf;
        protected boolean flushCommits;
        protected boolean writeToWAL;
        protected final int scanCache;

        /**
         * Note that all subclasses of this class must provide a public contructor
         * that has the exact same list of arguments.
         */
        Test(final Configuration conf, final TestOptions options, final Status status) {
            super();
            this.startRow = options.getStartRow();
            this.scanCache = options.getScanCache();
            this.perClientRunRows = options.getPerClientRunRows();
            this.totalRows = options.getTotalRows();
            this.status = status;
            this.tableName = options.getTableName();
            this.table = null;
            this.conf = conf;
            this.flushCommits = options.isFlushCommits();
            this.writeToWAL = options.isWriteToWAL();
        }

        private String generateStatus(final int sr, final int i, final int lr) {
            return sr + "/" + i + "/" + lr;
        }

        protected int getReportingPeriod() {
            int period = this.perClientRunRows / 10;
            return period == 0 ? this.perClientRunRows : period;
        }

        void testSetup() throws IOException {
            this.admin = new HBaseAdmin(conf);
            this.table = new HTable(conf, tableName);
            this.table.setAutoFlush(false);
            System.out.println("Setting scanner caching to " + this.scanCache);
            this.table.setScannerCaching(this.scanCache);
        }

        void testTakedown() throws IOException {
            if (flushCommits) {
                this.table.flushCommits();
            }
        }

        /*
         * Run test
         * @return Elapsed time.
         * @throws IOException
         */
        long test() throws IOException {
            long elapsedTime;
            testSetup();
            long startTime = System.currentTimeMillis();
            try {
                testTimed();
                elapsedTime = System.currentTimeMillis() - startTime;
            } finally {
                testTakedown();
            }
            return elapsedTime;
        }

        /**
         * Provides an extension point for tests that don't want a per row invocation.
         */
        void testTimed() throws IOException {
            int lastRow = this.startRow + this.perClientRunRows;
            // Report on completion of 1/10th of total.
            for (int i = this.startRow; i < lastRow; i++) {
                testRow(i);
                if (status != null && i > 0 && (i % getReportingPeriod()) == 0) {
                    status.setStatus(generateStatus(this.startRow, i, lastRow));
                }
            }
        }

        /*
        * Test for individual row.
        * @param i Row index.
        */
        void testRow(final int i) throws IOException {
        }
    }

    @SuppressWarnings("unused")
    static class RandomSeekScanTest extends Test {
        RandomSeekScanTest(Configuration conf, TestOptions options, Status status) {
            super(conf, options, status);
        }

        @Override
        void testRow(final int i) throws IOException {
            Scan scan = new Scan(getRandomRow(this.rand, this.totalRows));
            scan.addColumn(FAMILY_NAME, QUALIFIER_NAME);
            scan.setFilter(new WhileMatchFilter(new PageFilter(120)));
            ResultScanner s = this.table.getScanner(scan);
            //int count = 0;
            for (Result rr = null; (rr = s.next()) != null;) {
                // LOG.info("" + count++ + " " + rr.toString());
            }
            s.close();
        }

        @Override
        protected int getReportingPeriod() {
            int period = this.perClientRunRows / 100;
            return period == 0 ? this.perClientRunRows : period;
        }

    }

    @SuppressWarnings("unused")
    static abstract class RandomScanWithRangeTest extends Test {
        RandomScanWithRangeTest(Configuration conf, TestOptions options, Status status) {
            super(conf, options, status);
        }

        @Override
        void testRow(final int i) throws IOException {
            Pair<byte[], byte[]> startAndStopRow = getStartAndStopRow();
            Scan scan = new Scan(startAndStopRow.getFirst(), startAndStopRow.getSecond());
            scan.addColumn(FAMILY_NAME, QUALIFIER_NAME);
            ResultScanner s = this.table.getScanner(scan);
            int count = 0;
            for (Result rr = null; (rr = s.next()) != null;) {
                count++;
            }

            if (i % 100 == 0) {
                LOG.info(String.format("Scan for key range %s - %s returned %s rows",
                        Bytes.toString(startAndStopRow.getFirst()), Bytes.toString(startAndStopRow.getSecond()),
                        count));
            }

            s.close();
        }

        protected abstract Pair<byte[], byte[]> getStartAndStopRow();

        protected Pair<byte[], byte[]> generateStartAndStopRows(int maxRange) {
            int start = this.rand.nextInt(Integer.MAX_VALUE) % totalRows;
            int stop = start + maxRange;
            return new Pair<byte[], byte[]>(format(start), format(stop));
        }

        @Override
        protected int getReportingPeriod() {
            int period = this.perClientRunRows / 100;
            return period == 0 ? this.perClientRunRows : period;
        }
    }

    static class RandomScanWithRange10Test extends RandomScanWithRangeTest {
        RandomScanWithRange10Test(Configuration conf, TestOptions options, Status status) {
            super(conf, options, status);
        }

        @Override
        protected Pair<byte[], byte[]> getStartAndStopRow() {
            return generateStartAndStopRows(10);
        }
    }

    static class RandomScanWithRange100Test extends RandomScanWithRangeTest {
        RandomScanWithRange100Test(Configuration conf, TestOptions options, Status status) {
            super(conf, options, status);
        }

        @Override
        protected Pair<byte[], byte[]> getStartAndStopRow() {
            return generateStartAndStopRows(100);
        }
    }

    static class RandomScanWithRange1000Test extends RandomScanWithRangeTest {
        RandomScanWithRange1000Test(Configuration conf, TestOptions options, Status status) {
            super(conf, options, status);
        }

        @Override
        protected Pair<byte[], byte[]> getStartAndStopRow() {
            return generateStartAndStopRows(1000);
        }
    }

    static class RandomScanWithRange10000Test extends RandomScanWithRangeTest {
        RandomScanWithRange10000Test(Configuration conf, TestOptions options, Status status) {
            super(conf, options, status);
        }

        @Override
        protected Pair<byte[], byte[]> getStartAndStopRow() {
            return generateStartAndStopRows(10000);
        }
    }

    static class RandomReadTest extends Test {
        RandomReadTest(Configuration conf, TestOptions options, Status status) {
            super(conf, options, status);
        }

        @Override
        void testRow(final int i) throws IOException {
            Get get = new Get(getRandomRow(this.rand, this.totalRows));
            get.addColumn(FAMILY_NAME, QUALIFIER_NAME);
            this.table.get(get);
        }

        @Override
        protected int getReportingPeriod() {
            int period = this.perClientRunRows / 100;
            return period == 0 ? this.perClientRunRows : period;
        }

    }

    static class RandomWriteTest extends Test {
        RandomWriteTest(Configuration conf, TestOptions options, Status status) {
            super(conf, options, status);
        }

        @Override
        void testRow(final int i) throws IOException {
            byte[] row = getRandomRow(this.rand, this.totalRows);
            Put put = new Put(row);
            byte[] value = generateValue(this.rand);
            put.add(FAMILY_NAME, QUALIFIER_NAME, value);
            put.setWriteToWAL(writeToWAL);
            table.put(put);
        }
    }

    static class ScanTest extends Test {
        private ResultScanner testScanner;

        ScanTest(Configuration conf, TestOptions options, Status status) {
            super(conf, options, status);
        }

        @Override
        void testSetup() throws IOException {
            super.testSetup();
        }

        @Override
        void testTakedown() throws IOException {
            if (this.testScanner != null) {
                this.testScanner.close();
            }
            super.testTakedown();
        }

        @Override
        void testRow(final int i) throws IOException {
            if (this.testScanner == null) {
                Scan scan = new Scan(format(this.startRow));
                scan.addColumn(FAMILY_NAME, QUALIFIER_NAME);
                this.testScanner = table.getScanner(scan);
            }
            testScanner.next();
        }

    }

    static class SequentialReadTest extends Test {
        SequentialReadTest(Configuration conf, TestOptions options, Status status) {
            super(conf, options, status);
        }

        @Override
        void testRow(final int i) throws IOException {
            Get get = new Get(format(i));
            get.addColumn(FAMILY_NAME, QUALIFIER_NAME);
            table.get(get);
        }

    }

    static class SequentialWriteTest extends Test {
        SequentialWriteTest(Configuration conf, TestOptions options, Status status) {
            super(conf, options, status);
        }

        @Override
        void testRow(final int i) throws IOException {
            Put put = new Put(format(i));
            byte[] value = generateValue(this.rand);
            put.add(FAMILY_NAME, QUALIFIER_NAME, value);
            put.setWriteToWAL(writeToWAL);
            table.put(put);
        }

    }

    static class FilteredScanTest extends Test {
        protected static final Log LOG = LogFactory.getLog(FilteredScanTest.class.getName());

        FilteredScanTest(Configuration conf, TestOptions options, Status status) {
            super(conf, options, status);
        }

        @Override
        void testRow(int i) throws IOException {
            byte[] value = generateValue(this.rand);
            Scan scan = constructScan(value);
            ResultScanner scanner = null;
            try {
                scanner = this.table.getScanner(scan);
                while (scanner.next() != null) {
                }
            } finally {
                if (scanner != null)
                    scanner.close();
            }
        }

        protected Scan constructScan(byte[] valuePrefix) throws IOException {
            Filter filter = new SingleColumnValueFilter(FAMILY_NAME, QUALIFIER_NAME, CompareFilter.CompareOp.EQUAL,
                    new BinaryComparator(valuePrefix));
            Scan scan = new Scan();
            scan.addColumn(FAMILY_NAME, QUALIFIER_NAME);
            scan.setFilter(filter);
            return scan;
        }
    }

    /*
     * Format passed integer.
     * @param number
     * @return Returns zero-prefixed 10-byte wide decimal version of passed
     * number (Does absolute in case number is negative).
     */
    public static byte[] format(final int number) {
        byte[] b = new byte[10];
        int d = Math.abs(number);
        for (int i = b.length - 1; i >= 0; i--) {
            b[i] = (byte) ((d % 10) + '0');
            d /= 10;
        }
        return b;
    }

    /*
     * This method takes some time and is done inline uploading data.  For
     * example, doing the mapfile test, generation of the key and value
     * consumes about 30% of CPU time.
     * @return Generated random value to insert into a table cell.
     */
    public static byte[] generateValue(final Random r) {
        byte[] b = new byte[ROW_LENGTH];
        r.nextBytes(b);
        return b;
    }

    static byte[] getRandomRow(final Random random, final int totalRows) {
        return format(random.nextInt(Integer.MAX_VALUE) % totalRows);
    }

    long runOneClient(final Class<? extends Test> cmd, final int startRow, final int perClientRunRows,
            final int totalRows, boolean flushCommits, boolean writeToWAL, final Status status, final int scanCache)
            throws IOException {
        status.setStatus("Start " + cmd + " at offset " + startRow + " for " + perClientRunRows + " rows");
        long totalElapsedTime = 0;

        Test t = null;
        TestOptions options = new TestOptions(startRow, perClientRunRows, totalRows, getTableDescriptor().getName(),
                flushCommits, writeToWAL, scanCache);
        try {
            Constructor<? extends Test> constructor = cmd.getDeclaredConstructor(Configuration.class,
                    TestOptions.class, Status.class);
            t = constructor.newInstance(this.conf, options, status);
        } catch (NoSuchMethodException e) {
            throw new IllegalArgumentException("Invalid command class: " + cmd.getName()
                    + ".  It does not provide a constructor as described by"
                    + "the javadoc comment.  Available constructors are: "
                    + Arrays.toString(cmd.getConstructors()));
        } catch (Exception e) {
            throw new IllegalStateException("Failed to construct command class", e);
        }
        totalElapsedTime = t.test();

        status.setStatus("Finished " + cmd + " in " + totalElapsedTime + "ms at offset " + startRow + " for "
                + perClientRunRows + " rows");
        return totalElapsedTime;
    }

    private void runNIsOne(final Class<? extends Test> cmd) {
        Status status = new Status() {
            public void setStatus(String msg) throws IOException {
                LOG.info(msg);
            }
        };

        HBaseAdmin admin = null;
        try {
            admin = new HBaseAdmin(this.conf);
            checkTable(admin);
            runOneClient(cmd, 0, this.R, this.R, this.flushCommits, this.writeToWAL, status, this.S);
        } catch (Exception e) {
            LOG.error("Failed", e);
        }
    }

    private void runTest(final Class<? extends Test> cmd)
            throws IOException, InterruptedException, ClassNotFoundException {
        MiniHBaseCluster hbaseMiniCluster = null;
        MiniDFSCluster dfsCluster = null;
        MiniZooKeeperCluster zooKeeperCluster = null;
        if (this.miniCluster) {
            dfsCluster = new MiniDFSCluster(conf, 2, true, (String[]) null);
            zooKeeperCluster = new MiniZooKeeperCluster();
            int zooKeeperPort = zooKeeperCluster.startup(new File(System.getProperty("java.io.tmpdir")));

            // mangle the conf so that the fs parameter points to the minidfs we
            // just started up
            FileSystem fs = dfsCluster.getFileSystem();
            conf.set("fs.default.name", fs.getUri().toString());
            conf.set("hbase.zookeeper.property.clientPort", Integer.toString(zooKeeperPort));
            Path parentdir = fs.getHomeDirectory();
            conf.set(HConstants.HBASE_DIR, parentdir.toString());
            fs.mkdirs(parentdir);
            FSUtils.setVersion(fs, parentdir);
            hbaseMiniCluster = new MiniHBaseCluster(this.conf, N);
        }

        try {
            if (N == 1) {
                // If there is only one client and one HRegionServer, we assume nothing
                // has been set up at all.
                runNIsOne(cmd);
            } else {
                // Else, run
                runNIsMoreThanOne(cmd);
            }
        } finally {
            if (this.miniCluster) {
                if (hbaseMiniCluster != null)
                    hbaseMiniCluster.shutdown();
                if (zooKeeperCluster != null)
                    zooKeeperCluster.shutdown();
                HBaseTestCase.shutdownDfs(dfsCluster);
            }
        }
    }

    protected void printUsage() {
        printUsage(null);
    }

    protected void printUsage(final String message) {
        if (message != null && message.length() > 0) {
            System.err.println(message);
        }
        System.err.println("Usage: java " + this.getClass().getName() + " \\");
        System.err.println("  [--miniCluster] [--nomapred] [--rows=ROWS] <command> <nclients>");
        System.err.println();
        System.err.println("Options:");
        System.err.println(" miniCluster     Run the test on an HBaseMiniCluster");
        System.err.println(" nomapred        Run multiple clients using threads " + "(rather than use mapreduce)");
        System.err.println(" rows            Rows each client runs. Default: One million");
        System.err
                .println(" flushCommits    Used to determine if the test should flush the table.  Default: false");
        System.err.println(" writeToWAL      Set writeToWAL on puts. Default: True");
        System.err.println();
        System.err.println("Command:");
        for (CmdDescriptor command : commands.values()) {
            System.err.println(String.format(" %-15s %s", command.getName(), command.getDescription()));
        }
        System.err.println();
        System.err.println("Args:");
        System.err.println(" nclients        Integer. Required. Total number of " + "clients (and HRegionServers)");
        System.err.println("                 running: 1 <= value <= 500");
        System.err.println("Examples:");
        System.err.println(" To run a single evaluation client:");
        System.err.println(" $ bin/hbase " + this.getClass().getName() + " sequentialWrite 1");
    }

    private void getArgs(final int start, final String[] args) {
        if (start + 1 > args.length) {
            throw new IllegalArgumentException("must supply the number of clients");
        }
        N = Integer.parseInt(args[start]);
        if (N < 1) {
            throw new IllegalArgumentException("Number of clients must be > 1");
        }
        // Set total number of rows to write.
        this.R = this.R * N;
    }

    public int doCommandLine(final String[] args) {
        // Process command-line args. TODO: Better cmd-line processing
        // (but hopefully something not as painful as cli options).
        int errCode = -1;
        if (args.length < 1) {
            printUsage();
            return errCode;
        }

        try {
            for (int i = 0; i < args.length; i++) {
                String cmd = args[i];
                if (cmd.equals("-h") || cmd.startsWith("--h")) {
                    printUsage();
                    errCode = 0;
                    break;
                }

                final String miniClusterArgKey = "--miniCluster";
                if (cmd.startsWith(miniClusterArgKey)) {
                    this.miniCluster = true;
                    continue;
                }

                final String nmr = "--nomapred";
                if (cmd.startsWith(nmr)) {
                    this.nomapred = true;
                    continue;
                }

                final String rows = "--rows=";
                if (cmd.startsWith(rows)) {
                    this.R = Integer.parseInt(cmd.substring(rows.length()));
                    continue;
                }

                final String scanCache = "--scanCache=";
                if (cmd.startsWith(scanCache)) {
                    this.S = Integer.parseInt(cmd.substring(scanCache.length()));
                    continue;
                }

                final String flushCommits = "--flushCommits=";
                if (cmd.startsWith(flushCommits)) {
                    this.flushCommits = Boolean.parseBoolean(cmd.substring(flushCommits.length()));
                    continue;
                }

                final String writeToWAL = "--writeToWAL=";
                if (cmd.startsWith(writeToWAL)) {
                    this.writeToWAL = Boolean.parseBoolean(cmd.substring(writeToWAL.length()));
                    continue;
                }

                Class<? extends Test> cmdClass = determineCommandClass(cmd);
                if (cmdClass != null) {
                    getArgs(i + 1, args);
                    runTest(cmdClass);
                    errCode = 0;
                    break;
                }

                printUsage();
                break;
            }
        } catch (Exception e) {
            e.printStackTrace();
        }

        return errCode;
    }

    private Class<? extends Test> determineCommandClass(String cmd) {
        CmdDescriptor descriptor = commands.get(cmd);
        return descriptor != null ? descriptor.getCmdClass() : null;
    }

    /**
     * @param args
     */
    public static void main(final String[] args) {
        Configuration c = HBaseConfiguration.create();
        System.exit(new PerformanceEvaluation(c).doCommandLine(args));
    }
}