com.cloudera.sqoop.manager.NetezzaImportManualTest.java Source code

Java tutorial

Introduction

Here is the source code for com.cloudera.sqoop.manager.NetezzaImportManualTest.java

Source

/**
 * Licensed to the Apache Software Foundation (ASF) under one
 * or more contributor license agreements.  See the NOTICE file
 * distributed with this work for additional information
 * regarding copyright ownership.  The ASF licenses this file
 * to you under the Apache License, Version 2.0 (the
 * "License"); you may not use this file except in compliance
 * with the License.  You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
package com.cloudera.sqoop.manager;

import java.io.BufferedReader;
import java.io.File;
import java.io.FileInputStream;
import java.io.IOException;
import java.io.InputStreamReader;
import java.sql.Connection;
import java.sql.PreparedStatement;
import java.sql.ResultSet;
import java.sql.SQLException;
import java.sql.Statement;
import java.util.ArrayList;
import java.util.Arrays;

import org.apache.commons.logging.Log;
import org.apache.commons.logging.LogFactory;
import org.apache.hadoop.fs.Path;
import org.apache.hadoop.io.IOUtils;
import org.apache.sqoop.manager.NetezzaManager;
import org.junit.After;
import org.junit.Before;
import org.junit.Test;

import com.cloudera.sqoop.SqoopOptions;
import com.cloudera.sqoop.testutil.CommonArgs;
import com.cloudera.sqoop.testutil.ImportJobTestCase;
import com.cloudera.sqoop.util.FileListing;

/**
 * Test the Netezza implementation.
 *
 * This uses both JDBC and external tables to import data from a Netezza
 * database into HDFS.
 *
 * Since this requires a Netezza Server installation, this class is named in
 * such a way that Sqoop's default QA process does not run it. You need to run
 * this manually with -Dtestcase=NetezzaImportManualTest.
 *
 */
public class NetezzaImportManualTest extends ImportJobTestCase {

    /** Logger for this test class, looked up by the class's fully qualified name. */
    public static final Log LOG = LogFactory.getLog(NetezzaImportManualTest.class.getName());

    // instance variables populated during setUp, used during tests
    /** Connection manager created in {@code setUpData()} and closed in {@code tearDown()}. */
    private NetezzaManager manager;
    /** JDBC connection obtained from {@code manager}; used to create and populate the test tables. */
    private Connection conn;

    /**
     * Always answers {@code false}.
     *
     * NOTE(review): presumably this tells the base test case not to start its
     * HSQLDB test server because these tests target Netezza -- confirm against
     * the parent class.
     *
     * @return {@code false}
     */
    @Override
    protected boolean useHsqldbTestServer() {
        return false;
    }

    /**
     * Returns the name of the main table used by these tests.
     *
     * @return {@code NetezzaTestUtils.TABLE_NAME} with the suffix {@code "_IMP_"} appended
     */
    @Override
    protected String getTableName() {
        return NetezzaTestUtils.TABLE_NAME + "_IMP_";
    }

    /**
     * Drops (best effort) and then creates the employee-style test table.
     *
     * The table always has the columns id, name, start_date, Salary, Fired and
     * dept; every name in {@code extraColumns} is appended as an additional
     * INTEGER column, in the order given.
     *
     * @param tableName name of the table to (re)create
     * @param extraColumns names of extra INTEGER columns to append; may be empty
     * @throws SQLException if preparing a statement, rolling back the failed
     *         drop, or creating the table fails
     */
    private void createTable(String tableName, String... extraColumns) throws SQLException {
        // Step 1: try to drop any existing table. A failing DROP is not treated
        // as an error (presumably the table may simply not exist yet); the
        // transaction is rolled back and creation proceeds.
        PreparedStatement dropStmt = conn.prepareStatement("DROP TABLE " + tableName,
                ResultSet.TYPE_FORWARD_ONLY, ResultSet.CONCUR_READ_ONLY);
        try {
            dropStmt.executeUpdate();
            conn.commit();
        } catch (SQLException dropFailure) {
            conn.rollback();
        } finally {
            dropStmt.close();
        }

        // Step 2: assemble the CREATE TABLE statement.
        StringBuilder ddl = new StringBuilder("CREATE TABLE ")
                .append(tableName)
                .append(" (")
                .append("id INT NOT NULL PRIMARY KEY, ")
                .append("name VARCHAR(24) NOT NULL, ")
                .append("start_date DATE, ")
                .append("Salary FLOAT, ")
                .append("Fired BOOL, ")
                .append("dept VARCHAR(32) ");
        for (String extraColumn : extraColumns) {
            ddl.append(", ").append(extraColumn).append("  INTEGER");
        }
        ddl.append(")");

        // Step 3: execute it and commit.
        PreparedStatement createStmt = conn.prepareStatement(ddl.toString(),
                ResultSet.TYPE_FORWARD_ONLY, ResultSet.CONCUR_READ_ONLY);
        try {
            createStmt.executeUpdate();
            conn.commit();
        } finally {
            createStmt.close();
        }
    }

    /**
     * Inserts the three fixed sample rows (Aaron, Bob, Fred) into the given
     * table and commits.
     *
     * @param tableName table to insert into; must have the six base columns
     * @throws SQLException if creating the statement, an insert, or the commit fails
     */
    private void populateTable(String tableName) throws SQLException {
        // Column values of each row, in insertion order.
        final String[] rowValues = {
            "1,'Aaron','2009-05-14',1000000.00,TRUE,'engineering'",
            "2,'Bob','2009-04-20',400.00,TRUE,'sales'",
            "3,'Fred','2009-01-23',15.00,FALSE,'marketing'",
        };

        Statement insertStmt = conn.createStatement();
        try {
            for (String values : rowValues) {
                insertStmt.executeUpdate("INSERT INTO " + tableName + " VALUES(" + values + ")");
            }
            conn.commit();
        } finally {
            insertStmt.close();
        }
    }

    /**
     * Inserts the three fixed sample rows into a table that has two extra
     * columns, storing NULL in the first extra column and the row id in the
     * second, then commits.
     *
     * @param tableName table to insert into; must have the six base columns
     *        plus two extra columns
     * @throws SQLException if creating the statement, an insert, or the commit fails
     */
    private void populateTableWithNull(String tableName) throws SQLException {
        // Column values of each row, in insertion order.
        final String[] rowValues = {
            "1,'Aaron','2009-05-14',1000000.00,TRUE,'engineering',NULL,1",
            "2,'Bob','2009-04-20',400.00,TRUE,'sales',NULL,2",
            "3,'Fred','2009-01-23',15.00,FALSE,'marketing',NULL,3",
        };

        Statement insertStmt = conn.createStatement();
        try {
            for (String values : rowValues) {
                insertStmt.executeUpdate("INSERT INTO " + tableName + " VALUES(" + values + ")");
            }
            conn.commit();
        } finally {
            insertStmt.close();
        }
    }

    /**
     * Connects to Netezza and prepares the two tables used by the tests: the
     * main table ({@code getTableName()}) and a second table with the suffix
     * {@code "_W_N"} that carries two extra columns, {@code col0} and
     * {@code col1}.
     *
     * Any {@link SQLException} raised along the way fails the test.
     */
    public void setUpData() {
        final String mainTable = getTableName();
        final String tableWithNulls = mainTable + "_W_N";

        SqoopOptions opts = new SqoopOptions(NetezzaTestUtils.getNZConnectString(), mainTable);
        opts.setUsername(NetezzaTestUtils.getNZUser());
        opts.setPassword(NetezzaTestUtils.getNZPassword());

        try {
            manager = new NetezzaManager(opts);
            conn = manager.getConnection();

            // Main table: base columns only.
            createTable(mainTable);
            populateTable(mainTable);

            // Second table: base columns plus col0 / col1.
            createTable(tableWithNulls, "col0", "col1");
            populateTableWithNull(tableWithNulls);
        } catch (SQLException sqlE) {
            fail("Setup failed with SQLException " + sqlE);
        }
    }

    /**
     * Per-test fixture setup: runs the parent class's {@code setUp()} first and
     * then {@code setUpData()}, which connects to the database and (re)creates
     * and populates the test tables.
     */
    @Before
    public void setUp() {
        super.setUp();
        setUpData();
    }

    /**
     * Per-test cleanup: runs the parent class's {@code tearDown()} and then
     * closes the connection manager opened by {@code setUpData()}.
     *
     * The manager is closed even when the parent tear-down throws, so the
     * database connection is not leaked. If setup never got as far as creating
     * the manager, closing is skipped instead of raising a
     * {@link NullPointerException} that would hide the original failure.
     * A {@link SQLException} from closing the manager fails the test, unless
     * the parent tear-down already threw (in which case that exception wins
     * and the close failure is only logged).
     */
    @After
    public void tearDown() {
        SQLException closeFailure = null;
        try {
            super.tearDown();
        } finally {
            if (manager != null) {
                try {
                    manager.close();
                } catch (SQLException sqlE) {
                    LOG.error("Got SQLException: " + sqlE.toString());
                    // Remember it; failing from inside finally would mask an
                    // exception thrown by super.tearDown().
                    closeFailure = sqlE;
                }
            }
        }
        if (closeFailure != null) {
            fail("Got SQLException: " + closeFailure.toString());
        }
    }

    /**
     * Expected output lines, in sorted order, for a non-direct import of the
     * main test table.
     *
     * @return a new three-element array, one comma-separated line per row
     */
    private String[] getExpectedResults() {
        return new String[] {
            "1,Aaron,2009-05-14,1000000.0,true,engineering",
            "2,Bob,2009-04-20,400.0,true,sales",
            "3,Fred,2009-01-23,15.0,false,marketing",
        };
    }

    /**
     * Expected output lines, in sorted order, for a direct-mode import of the
     * main test table. Compared with the non-direct expectations, salaries
     * have no fractional part and booleans are written as {@code T}/{@code F}.
     *
     * @return a new three-element array, one comma-separated line per row
     */
    private String[] getDirectModeExpectedResults() {
        return new String[] {
            "1,Aaron,2009-05-14,1000000,T,engineering",
            "2,Bob,2009-04-20,400,T,sales",
            "3,Fred,2009-01-23,15,F,marketing",
        };
    }

    /**
     * Expected output lines, in sorted order, for a non-direct import of the
     * table with two extra columns, where the first extra column is rendered
     * as a backslash followed by {@code N} and the second holds the row id.
     *
     * @return a new three-element array, one comma-separated line per row
     */
    private String[] getExpectedResultsWithNulls() {
        return new String[] {
            "1,Aaron,2009-05-14,1000000.0,true,engineering,\\N,1",
            "2,Bob,2009-04-20,400.0,true,sales,\\N,2",
            "3,Fred,2009-01-23,15.0,false,marketing,\\N,3",
        };
    }

    /**
     * Direct-mode counterpart of the expected lines for the table with two
     * extra columns: integer-style salaries, {@code T}/{@code F} booleans, a
     * backslash followed by {@code N} in the first extra column and the row id
     * in the second.
     *
     * @return a new three-element array, one comma-separated line per row
     */
    private String[] getDirectModeExpectedResultsWithNulls() {
        return new String[] {
            "1,Aaron,2009-05-14,1000000,T,engineering,\\N,1",
            "2,Bob,2009-04-20,400,T,sales,\\N,2",
            "3,Fred,2009-01-23,15,F,marketing,\\N,3",
        };
    }

    /**
     * Builds the command-line argument array for an import run.
     *
     * The result starts with whatever {@code CommonArgs.addHadoopFlags} adds,
     * followed by the table, warehouse directory, connection string, user
     * name, password and a single mapper; then {@code --direct} when
     * requested; then {@code extraArgs} in the order given.
     *
     * @param isDirect whether to append the {@code --direct} flag
     * @param tableName value for the {@code --table} argument
     * @param extraArgs additional arguments appended verbatim at the end
     * @return the assembled argument array
     */
    private String[] getArgv(boolean isDirect, String tableName, String... extraArgs) {
        ArrayList<String> argList = new ArrayList<String>();
        CommonArgs.addHadoopFlags(argList);

        // Fixed option/value pairs, one pair per line.
        argList.addAll(Arrays.asList(
                "--table", tableName,
                "--warehouse-dir", getWarehouseDir(),
                "--connect", NetezzaTestUtils.getNZConnectString(),
                "--username", NetezzaTestUtils.getNZUser(),
                "--password", NetezzaTestUtils.getNZPassword(),
                "--num-mappers", "1"));

        if (isDirect) {
            argList.add("--direct");
        }
        argList.addAll(Arrays.asList(extraArgs));

        return argList.toArray(new String[argList.size()]);
    }

    /**
     * Runs an import of {@code tableName} and checks the produced data file.
     *
     * Steps: remove any existing output directory for the table under the
     * warehouse directory, run the import with the arguments from
     * {@code getArgv}, then read every line of {@code part-m-00000}, sort the
     * lines and compare the first {@code expectedResults.length} of them with
     * {@code expectedResults}.
     *
     * All lines of the file are read (rather than a fixed number), so a file
     * with fewer lines than expected produces a descriptive assertion failure
     * instead of a {@link NullPointerException} from sorting {@code null}
     * entries, and expectation arrays of any length are supported. An empty
     * {@code expectedResults} only verifies that the import ran and the file
     * exists.
     *
     * @param isDirect whether to run the import with {@code --direct}
     * @param tableName table to import; also the name of the output directory
     * @param expectedResults expected lines, in sorted order
     * @param extraArgs additional import arguments, appended verbatim
     * @throws IOException if removing a previous output directory fails
     */
    private void runNetezzaTest(boolean isDirect, String tableName, String[] expectedResults, String... extraArgs)
            throws IOException {

        Path warehousePath = new Path(this.getWarehouseDir());
        Path tablePath = new Path(warehousePath, tableName);
        Path filePath = new Path(tablePath, "part-m-00000");

        File tableFile = new File(tablePath.toString());
        if (tableFile.exists() && tableFile.isDirectory()) {
            // remove the directory before running the import.
            FileListing.recursiveDeleteDir(tableFile);
        }

        String[] argv = getArgv(isDirect, tableName, extraArgs);
        try {
            runImport(argv);
        } catch (IOException ioe) {
            // Pass the exception to the logger so the stack trace lands in the
            // test log rather than on stderr.
            LOG.error("Got IOException during import: " + ioe.toString(), ioe);
            fail(ioe.toString());
        }

        File f = new File(filePath.toString());
        assertTrue("Could not find imported data file : " + f, f.exists());
        BufferedReader r = null;
        try {
            // Read through the file and make sure it's all there.
            r = new BufferedReader(new InputStreamReader(new FileInputStream(f)));
            ArrayList<String> lines = new ArrayList<String>();
            String line;
            while ((line = r.readLine()) != null) {
                LOG.info("Line read from file = " + line);
                lines.add(line);
            }

            assertTrue("Expected at least " + expectedResults.length + " line(s) in " + f
                    + " but found " + lines.size(), lines.size() >= expectedResults.length);

            // Row order in the file is not relied upon; compare in sorted order.
            String[] s = lines.toArray(new String[lines.size()]);
            Arrays.sort(s);
            for (int i = 0; i < expectedResults.length; ++i) {
                assertEquals(expectedResults[i], s[i]);
            }
        } catch (IOException ioe) {
            LOG.error("Got IOException verifying results: " + ioe.toString(), ioe);
            fail(ioe.toString());
        } finally {
            IOUtils.closeStream(r);
        }
    }

    /**
     * Imports the main test table without {@code --direct} and checks the
     * output against the non-direct expected lines.
     *
     * @throws IOException if the import run reports one
     */
    @Test
    public void testNetezzaImport() throws IOException {
        final String table = getTableName();
        final String[] expected = getExpectedResults();
        runNetezzaTest(false, table, expected);
    }

    /**
     * Imports the main test table with {@code --direct} and checks the output
     * against the direct-mode expected lines.
     *
     * @throws IOException if the import run reports one
     */
    @Test
    public void testDirectImport() throws IOException {
        final String table = getTableName();
        final String[] expected = getDirectModeExpectedResults();
        runNetezzaTest(true, table, expected);
    }

    /**
     * Verifies that the main test table appears in the list of tables reported
     * by a freshly created Netezza connection manager.
     *
     * The manager created here is separate from the one opened during setup,
     * so it is closed in a {@code finally} block to avoid leaking its
     * connection. A failure while closing is logged but does not override the
     * test outcome. A {@code null} table list is reported as an assertion
     * failure rather than surfacing as a {@link NullPointerException} from
     * sorting.
     *
     * @throws IOException declared for consistency with the other tests
     */
    @Test
    public void testListTables() throws IOException {
        SqoopOptions options = new SqoopOptions(NetezzaTestUtils.getNZConnectString(), getTableName());
        options.setUsername(NetezzaTestUtils.getNZUser());
        options.setPassword(NetezzaTestUtils.getNZPassword());

        ConnManager mgr = new NetezzaManager(options);
        try {
            String[] tables = mgr.listTables();
            assertTrue("listTables() returned null", tables != null);
            // binarySearch requires sorted input.
            Arrays.sort(tables);
            assertTrue(getTableName() + " is not found!", Arrays.binarySearch(tables, getTableName()) >= 0);
        } finally {
            try {
                mgr.close();
            } catch (SQLException sqlE) {
                LOG.error("Got SQLException: " + sqlE.toString(), sqlE);
            }
        }
    }

    /**
     * Runs a non-direct import in {@code lastmodified} incremental mode with
     * {@code START_DATE} as the check column.
     *
     * The expected-results array is empty, so no line contents are compared.
     *
     * @throws IOException if the import run reports one
     */
    @Test
    public void testIncrementalImport() throws IOException {
        final String[] nothingToCompare = new String[0];

        runNetezzaTest(false, getTableName(), nothingToCompare,
                "--incremental", "lastmodified",
                "--check-column", "START_DATE");
    }

    /**
     * Imports the table with the {@code "_W_N"} suffix without
     * {@code --direct}, passing the same replacement value for
     * {@code --null-string} and {@code --null-non-string}, and checks the
     * output against the expected lines containing null markers.
     *
     * @throws Exception if the import run fails
     */
    @Test
    public void testNullStringValue() throws Exception {
        final String nullsTable = getTableName() + "_W_N";
        final String[] nullHandlingArgs = {
            "--null-string", "\\\\N",
            "--null-non-string", "\\\\N",
        };

        runNetezzaTest(false, nullsTable, getExpectedResultsWithNulls(), nullHandlingArgs);
    }

    /**
     * Runs a direct-mode import of the main test table with additional
     * arguments after a {@code --} separator ({@code --log-dir /tmp} and
     * {@code --max-errors 2}) and checks the output against the direct-mode
     * expected lines.
     *
     * @throws Exception if the import run fails
     */
    @Test
    public void testValidExtraArgs() throws Exception {
        final String[] passThroughArgs = {
            "--",
            "--log-dir", "/tmp",
            "--max-errors", "2",
        };

        runNetezzaTest(true, getTableName(), getDirectModeExpectedResults(), passThroughArgs);
    }

}