Java tutorial
/** * Licensed to Cloudera, Inc. under one * or more contributor license agreements. See the NOTICE file * distributed with this work for additional information * regarding copyright ownership. Cloudera, Inc. licenses this file * to you under the Apache License, Version 2.0 (the * "License"); you may not use this file except in compliance * with the License. You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. */ package com.cloudera.sqoop.manager; import java.io.BufferedReader; import java.io.IOException; import java.io.InputStreamReader; import java.io.FileInputStream; import java.io.File; import java.sql.Connection; import java.sql.SQLException; import java.sql.Statement; import java.util.ArrayList; import org.apache.commons.logging.Log; import org.apache.commons.logging.LogFactory; import org.junit.After; import org.junit.Before; import org.junit.Test; import org.apache.hadoop.fs.Path; import org.apache.hadoop.io.IOUtils; import com.cloudera.sqoop.SqoopOptions; import com.cloudera.sqoop.testutil.CommonArgs; import com.cloudera.sqoop.testutil.ImportJobTestCase; import com.cloudera.sqoop.util.FileListing; /** * Test the DirectMySQLManager implementation. * This differs from MySQLManager only in its importTable() method, which * uses mysqldump instead of mapreduce+DBInputFormat. * * Since this requires a MySQL installation on your local machine to use, this * class is named in such a way that Hadoop's default QA process does not run * it. You need to run this manually with -Dtestcase=DirectMySQLTest. * * You need to put MySQL's Connector/J JDBC driver library into a location * where Hadoop will be able to access it (since this library cannot be checked * into Apache's tree for licensing reasons). * * You should also create a database named 'sqooptestdb' and authorize yourself: * * CREATE DATABASE sqooptestdb; * use mysql; * GRANT ALL PRIVILEGES ON sqooptestdb.* TO 'yourusername'@'localhost'; * flush privileges; * */ public class DirectMySQLTest extends ImportJobTestCase { public static final Log LOG = LogFactory.getLog(DirectMySQLTest.class.getName()); static final String TABLE_PREFIX = "EMPLOYEES_MYSQL_"; // instance variables populated during setUp, used during tests private DirectMySQLManager manager; @Override protected String getTablePrefix() { return TABLE_PREFIX; } @Before public void setUp() { super.setUp(); SqoopOptions options = new SqoopOptions(MySQLTestUtils.CONNECT_STRING, getTableName()); options.setUsername(MySQLTestUtils.getCurrentUser()); LOG.debug("Setting up another DirectMySQLTest: " + MySQLTestUtils.CONNECT_STRING); manager = new DirectMySQLManager(options); Connection connection = null; Statement st = null; try { connection = manager.getConnection(); connection.setAutoCommit(false); st = connection.createStatement(); // create the database table and populate it with data. st.executeUpdate("DROP TABLE IF EXISTS " + getTableName()); st.executeUpdate("CREATE TABLE " + getTableName() + " (" + "id INT NOT NULL PRIMARY KEY AUTO_INCREMENT, " + "name VARCHAR(24) NOT NULL, " + "start_date DATE, " + "salary FLOAT, " + "dept VARCHAR(32))"); st.executeUpdate("INSERT INTO " + getTableName() + " VALUES(" + "NULL,'Aaron','2009-05-14',1000000.00,'engineering')"); st.executeUpdate( "INSERT INTO " + getTableName() + " VALUES(" + "NULL,'Bob','2009-04-20',400.00,'sales')"); st.executeUpdate( "INSERT INTO " + getTableName() + " VALUES(" + "NULL,'Fred','2009-01-23',15.00,'marketing')"); connection.commit(); } catch (SQLException sqlE) { LOG.error("Encountered SQL Exception: " + sqlE); sqlE.printStackTrace(); fail("SQLException when running test setUp(): " + sqlE); } finally { try { if (null != st) { st.close(); } if (null != connection) { connection.close(); } } catch (SQLException sqlE) { LOG.warn("Got SQLException when closing connection: " + sqlE); } } } @After public void tearDown() { super.tearDown(); if (null != manager) { try { manager.close(); manager = null; } catch (SQLException sqlE) { LOG.error("Got SQLException: " + sqlE.toString()); fail("Got SQLException: " + sqlE.toString()); } } } private String[] getArgv(boolean mysqlOutputDelims, boolean isDirect, String tableName, String... extraArgs) { ArrayList<String> args = new ArrayList<String>(); CommonArgs.addHadoopFlags(args); args.add("--table"); args.add(tableName); args.add("--warehouse-dir"); args.add(getWarehouseDir()); args.add("--connect"); args.add(MySQLTestUtils.CONNECT_STRING); if (isDirect) { args.add("--direct"); } args.add("--username"); args.add(MySQLTestUtils.getCurrentUser()); args.add("--where"); args.add("id > 1"); args.add("--num-mappers"); args.add("1"); if (mysqlOutputDelims) { args.add("--mysql-delimiters"); } if (null != extraArgs) { for (String arg : extraArgs) { args.add(arg); } } return args.toArray(new String[0]); } private void doImport(boolean mysqlOutputDelims, boolean isDirect, String tableName, String[] expectedResults, String[] extraArgs) throws IOException { Path warehousePath = new Path(this.getWarehouseDir()); Path tablePath = new Path(warehousePath, tableName); Path filePath = new Path(tablePath, "part-m-00000"); File tableFile = new File(tablePath.toString()); if (tableFile.exists() && tableFile.isDirectory()) { // remove the directory before running the import. FileListing.recursiveDeleteDir(tableFile); } String[] argv = getArgv(mysqlOutputDelims, isDirect, tableName, extraArgs); try { runImport(argv); } catch (IOException ioe) { LOG.error("Got IOException during import: " + ioe.toString()); ioe.printStackTrace(); fail(ioe.toString()); } File f = new File(filePath.toString()); assertTrue("Could not find imported data file: " + f, f.exists()); BufferedReader r = null; try { // Read through the file and make sure it's all there. r = new BufferedReader(new InputStreamReader(new FileInputStream(f))); for (String expectedLine : expectedResults) { assertEquals(expectedLine, r.readLine()); } } catch (IOException ioe) { LOG.error("Got IOException verifying results: " + ioe.toString()); ioe.printStackTrace(); fail(ioe.toString()); } finally { IOUtils.closeStream(r); } } @Test public void testDirectBulkImportWithDefaultDelims() throws IOException { // no quoting of strings allowed. String[] expectedResults = { "2,Bob,2009-04-20,400,sales", "3,Fred,2009-01-23,15,marketing", }; doImport(false, true, getTableName(), expectedResults, null); } @Test public void testWithExtraParams() throws IOException { // no quoting of strings allowed. String[] expectedResults = { "2,Bob,2009-04-20,400,sales", "3,Fred,2009-01-23,15,marketing", }; String[] extraArgs = { "--", "--lock-tables" }; doImport(false, true, getTableName(), expectedResults, extraArgs); } @Test public void testMultiMappers() throws IOException { // no quoting of strings allowed. String[] expectedResults = { "2,Bob,2009-04-20,400,sales", "3,Fred,2009-01-23,15,marketing", }; String[] extraArgs = { "-m", "2" }; doImport(false, true, getTableName(), expectedResults, extraArgs); } @Test public void testJdbcColumnSubset() throws IOException { // Test that column subsets work in JDBC mode. LOG.info("Starting JDBC Column Subset test."); String[] expectedResults = { "2,Bob,400.0", "3,Fred,15.0", }; String[] extraArgs = { "--columns", "id,name,salary" }; doImport(false, false, getTableName(), expectedResults, extraArgs); } @Test public void testDirectColumnSubset() throws IOException { // Using a column subset should actually force direct mode off, but this // should just warn the user and do a normal import. LOG.info("Starting Direct Column Subset test."); String[] expectedResults = { "2,Bob,400.0", "3,Fred,15.0", }; String[] extraArgs = { "--columns", "id,name,salary" }; doImport(false, true, getTableName(), expectedResults, extraArgs); } @Test public void testDirectBulkImportWithMySQLQuotes() throws IOException { // mysql quotes all string-based output. String[] expectedResults = { "2,'Bob','2009-04-20',400,'sales'", "3,'Fred','2009-01-23',15,'marketing'", }; doImport(true, true, getTableName(), expectedResults, null); } @Test public void testMySQLJdbcImport() throws IOException { String[] expectedResults = { "2,Bob,2009-04-20,400.0,sales", "3,Fred,2009-01-23,15.0,marketing", }; doImport(false, false, getTableName(), expectedResults, null); } @Test public void testJdbcEscapedTableName() throws Exception { // Test a JDBC-based import of a table whose name is // a reserved sql keyword (and is thus `quoted`) final String RESERVED_TABLE_NAME = "TABLE"; SqoopOptions options = new SqoopOptions(MySQLTestUtils.CONNECT_STRING, RESERVED_TABLE_NAME); options.setUsername(MySQLTestUtils.getCurrentUser()); ConnManager mgr = new MySQLManager(options); Connection connection = null; Statement st = null; try { connection = mgr.getConnection(); connection.setAutoCommit(false); st = connection.createStatement(); // create the database table and populate it with data. st.executeUpdate("DROP TABLE IF EXISTS `" + RESERVED_TABLE_NAME + "`"); st.executeUpdate("CREATE TABLE `" + RESERVED_TABLE_NAME + "` (" + "id INT NOT NULL PRIMARY KEY AUTO_INCREMENT, " + "name VARCHAR(24) NOT NULL, " + "start_date DATE, " + "salary FLOAT, " + "dept VARCHAR(32))"); st.executeUpdate("INSERT INTO `" + RESERVED_TABLE_NAME + "` VALUES(" + "2,'Aaron','2009-05-14',1000000.00,'engineering')"); connection.commit(); } finally { if (null != st) { st.close(); } if (null != connection) { connection.close(); } } String[] expectedResults = { "2,Aaron,2009-05-14,1000000.0,engineering", }; doImport(false, false, RESERVED_TABLE_NAME, expectedResults, null); } @Test public void testJdbcEscapedColumnName() throws Exception { // Test a JDBC-based import of a table with a column whose name is // a reserved sql keyword (and is thus `quoted`). final String TABLE_NAME = "mysql_escaped_col_table"; setCurTableName(TABLE_NAME); SqoopOptions options = new SqoopOptions(MySQLTestUtils.CONNECT_STRING, TABLE_NAME); options.setUsername(MySQLTestUtils.getCurrentUser()); ConnManager mgr = new MySQLManager(options); Connection connection = null; Statement st = null; try { connection = mgr.getConnection(); connection.setAutoCommit(false); st = connection.createStatement(); // create the database table and populate it with data. st.executeUpdate("DROP TABLE IF EXISTS " + TABLE_NAME); st.executeUpdate("CREATE TABLE " + TABLE_NAME + " (" + "id INT NOT NULL PRIMARY KEY AUTO_INCREMENT, " + "`table` VARCHAR(24) NOT NULL, " + "`CREATE` DATE, " + "salary FLOAT, " + "dept VARCHAR(32))"); st.executeUpdate( "INSERT INTO " + TABLE_NAME + " VALUES(" + "2,'Aaron','2009-05-14',1000000.00,'engineering')"); connection.commit(); } finally { if (null != st) { st.close(); } if (null != connection) { connection.close(); } } String[] expectedResults = { "2,Aaron,2009-05-14,1000000.0,engineering", }; doImport(false, false, TABLE_NAME, expectedResults, null); } }