core.DatabaseSaverEx.java Source code

Java tutorial

Introduction

Here is the source code for core.DatabaseSaverEx.java

Source

/*
 *    This program is free software; you can redistribute it and/or modify
 *    it under the terms of the GNU General Public License as published by
 *    the Free Software Foundation; either version 2 of the License, or
 *    (at your option) any later version.
 *
 *    This program is distributed in the hope that it will be useful,
 *    but WITHOUT ANY WARRANTY; without even the implied warranty of
 *    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 *    GNU General Public License for more details.
 *
 *    You should have received a copy of the GNU General Public License
 *    along with this program; if not, write to the Free Software
 *    Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
 */

/*
 *    DatabaseSaver.java
 *    Copyright (C) 2004 University of Waikato, Hamilton, New Zealand
 *
 */

package core;

import weka.core.Attribute;
import weka.core.Capabilities;
import weka.core.FastVector;
import weka.core.Instance;
import weka.core.Instances;
import weka.core.Option;
import weka.core.OptionHandler;
import weka.core.RevisionUtils;
import weka.core.Utils;
import weka.core.Capabilities.Capability;
import weka.core.converters.*;
import java.io.File;
import java.io.IOException;
import java.sql.SQLException;
import java.text.SimpleDateFormat;
import java.util.Enumeration;
import java.util.Properties;
import java.util.Vector;

/**
 <!-- globalinfo-start -->
 * Writes to a database (tested with MySQL, InstantDB, HSQLDB).
 * <p/>
 <!-- globalinfo-end -->
 *
 <!-- options-start -->
 * Valid options are: <p/>
 * 
 * <pre> -url &lt;JDBC URL&gt;
 *  The JDBC URL to connect to.
 *  (default: from DatabaseUtils.props file)</pre>
 * 
 * <pre> -user &lt;name&gt;
 *  The user to connect with to the database.
 *  (default: none)</pre>
 * 
 * <pre> -password &lt;password&gt;
 *  The password to connect with to the database.
 *  (default: none)</pre>
 * 
 * <pre> -T &lt;table name&gt;
 *  The name of the table.
 *  (default: the relation name)</pre>
 * 
 * <pre> -P
 *  Add an ID column as primary key. The name is specified
 *  in the DatabaseUtils file ('idColumn'). The DatabaseLoader
 *  won't load this column.</pre>
 * 
 * <pre> -i &lt;input file name&gt;
 *  Input file in arff format that should be saved in database.</pre>
 * 
 <!-- options-end -->
 *
 * @author Stefan Mutter (mutter@cs.waikato.ac.nz)
 * @version $Revision: 7499 $
 */
public class DatabaseSaverEx extends AbstractSaver
        implements BatchConverter, IncrementalConverter, DatabaseConverter, OptionHandler {

    /** for serialization. */
    static final long serialVersionUID = 863971733782624956L;

    /** The database connection used for all statements issued by this saver. */
    private DatabaseConnection m_DataBaseConnection;

    /** The name of the table in which the instances should be stored. */
    private String m_tableName;

    /** An input arff file (for command line use, set via the -i option). */
    private String m_inputFile;

    /** The database specific type for a string (property CREATE_STRING). */
    private String m_createText;

    /** The database specific type for a double (property CREATE_DOUBLE). */
    private String m_createDouble;

    /** The database specific type for an int (property CREATE_INT). */
    private String m_createInt;

    /** The database specific type for a date (property CREATE_DATE, default DATETIME). */
    private String m_createDate;

    /** For converting the date value into a database string (property DateFormat). */
    private SimpleDateFormat m_DateFormat;

    /** The name of the primary key column that will be automatically generated (if enabled). The name is read from the property idColumn. */
    private String m_idColumn;

    /** Counts the rows; its value is used as the primary key value of the next inserted row. */
    private int m_count;

    /** Flag indicating if a primary key column should be added. */
    private boolean m_id;

    /** Flag indicating whether the relation name is used as the name of the table. */
    private boolean m_tabName;

    /** The user name for the database; applied to connections created by the setDestination variants without credentials. */
    private String m_Username;

    /** The password for the database; applied to connections created by the setDestination variants without credentials. */
    private String m_Password;

    /** The property file for the database connection. */
    protected static String PROPERTY_FILE = DatabaseConnection.PROPERTY_FILE;

    /** Properties associated with the database connection; stays null if the property file could not be read. */
    protected static Properties PROPERTIES;

    // Loads the database properties once, when the class is initialized.
    static {
        try {
            PROPERTIES = Utils.readProperties(PROPERTY_FILE);
        } catch (Exception e) {
            // Only reported here: PROPERTIES keeps its default value (null) in this case.
            System.err.println("Problem reading properties. Fix before continuing.");
            System.err.println(e);
        }
    }

    /**
     * Creates a saver with default options and reads the database specific
     * column types, the date format and the name of the id column from the
     * database properties.
     *
     * @throws Exception if the saver cannot be set up; in particular an
     *         IllegalStateException is thrown when the property file could
     *         not be read during class initialization
     */
    public DatabaseSaverEx() throws Exception {

        // The static initializer only prints a message when reading fails and
        // leaves PROPERTIES null. Fail here with a clear message instead of an
        // anonymous NullPointerException on the first getProperty call.
        if (PROPERTIES == null) {
            throw new IllegalStateException("Database properties could not be read from " + PROPERTY_FILE);
        }

        resetOptions();
        m_createText = PROPERTIES.getProperty("CREATE_STRING");
        m_createDouble = PROPERTIES.getProperty("CREATE_DOUBLE");
        m_createInt = PROPERTIES.getProperty("CREATE_INT");
        // unlike the other types, the date type and the date format have built-in defaults
        m_createDate = PROPERTIES.getProperty("CREATE_DATE", "DATETIME");
        m_DateFormat = new SimpleDateFormat(PROPERTIES.getProperty("DateFormat", "yyyy-MM-dd HH:mm:ss"));
        m_idColumn = PROPERTIES.getProperty("idColumn");
    }

    /**
     * Puts the saver back into its initial state: no retrieval mode, empty
     * table name and credentials, row counter at 1, no id column, relation
     * name used as table name, and a fresh (unconnected) database connection.
     */
    public void resetOptions() {

        super.resetOptions();
        setRetrieval(NONE);

        // plain option defaults
        m_tableName = "";
        m_Username = "";
        m_Password = "";
        m_count = 1;
        m_id = false;
        m_tabName = true;

        // drop an existing connection (if any) and start with a new one
        try {
            boolean connected = (m_DataBaseConnection != null) && m_DataBaseConnection.isConnected();
            if (connected) {
                m_DataBaseConnection.disconnectFromDatabase();
            }
            m_DataBaseConnection = new DatabaseConnection();
        } catch (Exception e) {
            printException(e);
        }
    }

    /**
     * Aborts incremental saving. Only acts when the write mode is CANCEL:
     * the table is dropped (a message is printed if it still exists
     * afterwards) and the options are reset.
     */
    public void cancel() {

        if (getWriteMode() != CANCEL) {
            return;
        }

        try {
            m_DataBaseConnection.update("DROP TABLE " + m_tableName);
            boolean stillThere = m_DataBaseConnection.tableExists(m_tableName);
            if (stillThere) {
                System.err.println("Table cannot be dropped.");
            }
        } catch (Exception e) {
            printException(e);
        }
        // reset happens regardless of whether dropping the table worked
        resetOptions();
    }

    /**
     * Provides a short description of this saver.
     *
     * @return the description, suitable for displaying in the
     * explorer/experimenter gui
     */
    public String globalInfo() {
        String description = "Writes to a database (tested with MySQL, InstantDB, HSQLDB).";
        return description;
    }

    /**
     * Stores the name of the table the instances are written to.
     *
     * @param tn the name of the table
     */
    public void setTableName(String tn) {
        this.m_tableName = tn;
    }

    /**
     * Returns the table name currently stored in this saver.
     *
     * @return the table's name
     */
    public String getTableName() {
        return this.m_tableName;
    }

    /**
     * Tip text for the tableName property.
     *
     * @return the tip text for this property
     */
    public String tableNameTipText() {
        String tip = "Sets the name of the table.";
        return tip;
    }

    /**
     * Switches the automatic generation of a primary key column on or off.
     *
     * @param flag true if a primary key column should be generated
     */
    public void setAutoKeyGeneration(boolean flag) {
        this.m_id = flag;
    }

    /**
     * Tells whether a primary key column is generated automatically.
     *
     * @return true if a primary key column will be generated, false otherwise
     */
    public boolean getAutoKeyGeneration() {
        return this.m_id;
    }

    /**
     * Tip text for the autoKeyGeneration property.
     *
     * @return tip text for this property
     */
    public String autoKeyGenerationTipText() {
        String tip = "If set to true, a primary key column is generated automatically (containing the row number as INTEGER). The name of the key is read from DatabaseUtils (idColumn)"
                + " This primary key can be used for incremental loading (requires an unique key). This primary key will not be loaded as an attribute.";
        return tip;
    }

    /**
     * Switches the use of the relation name as table name on or off
     * (resetOptions() turns it on).
     *
     * @param flag if true the relation name is used as table name
     */
    public void setRelationForTableName(boolean flag) {
        this.m_tabName = flag;
    }

    /**
     * Tells whether the relation name is used as the name of the table.
     *
     * @return true if the relation name is used as the name of the table, false otherwise
     */
    public boolean getRelationForTableName() {
        return this.m_tabName;
    }

    /**
     * Tip text for the relationForTableName property.
     *
     * @return the tip text for this property
     */
    public String relationForTableNameTipText() {
        String tip = "If set to true, the relation name will be used as name for the database table. Otherwise the user has to provide a table name.";
        return tip;
    }

    /**
     * Passes the database URL on to the current database connection.
     *
     * @param url the URL
     */
    public void setUrl(String url) {
        this.m_DataBaseConnection.setDatabaseURL(url);
    }

    /**
     * Returns the database URL held by the current database connection.
     *
     * @return the URL
     */
    public String getUrl() {
        String url = m_DataBaseConnection.getDatabaseURL();
        return url;
    }

    /**
     * Tip text for the url property.
     *
     * @return the tip text for this property
     */
    public String urlTipText() {
        String tip = "The URL of the database";
        return tip;
    }

    /**
     * Remembers the database user in this saver and passes it on to the
     * current database connection.
     *
     * @param user the user name
     */
    public void setUser(String user) {
        // remembered so that a later setDestination() can re-apply it
        this.m_Username = user;
        this.m_DataBaseConnection.setUsername(user);
    }

    /**
     * Returns the user name held by the current database connection.
     *
     * @return the user name
     */
    public String getUser() {
        String user = m_DataBaseConnection.getUsername();
        return user;
    }

    /**
     * Tip text for the user property.
     *
     * @return the tip text for this property
     */
    public String userTipText() {
        String tip = "The user name for the database";
        return tip;
    }

    /**
     * Remembers the database password in this saver and passes it on to the
     * current database connection.
     *
     * @param password the password
     */
    public void setPassword(String password) {
        // remembered so that a later setDestination() can re-apply it
        this.m_Password = password;
        this.m_DataBaseConnection.setPassword(password);
    }

    /**
     * Returns the password held by the current database connection.
     *
     * @return the database password
     */
    public String getPassword() {
        String password = m_DataBaseConnection.getPassword();
        return password;
    }

    /**
     * Tip text for the password property.
     *
     * @return the tip text for this property
     */
    public String passwordTipText() {
        String tip = "The database password";
        return tip;
    }

    /**
     * Replaces the database connection by a new one that uses the given URL
     * and credentials. Problems are printed, not thrown.
     *
     * @param url the database url
     * @param userName the user name
     * @param password the password
     */
    public void setDestination(String url, String userName, String password) {

        try {
            DatabaseConnection connection = new DatabaseConnection();
            m_DataBaseConnection = connection;
            connection.setDatabaseURL(url);
            connection.setUsername(userName);
            connection.setPassword(password);
        } catch (Exception e) {
            printException(e);
        }
    }

    /**
     * Replaces the database connection by a new one that uses the given URL
     * together with the user name and password stored in this saver.
     * Problems are printed, not thrown.
     *
     * @param url the database url
     */
    public void setDestination(String url) {

        try {
            DatabaseConnection connection = new DatabaseConnection();
            m_DataBaseConnection = connection;
            connection.setDatabaseURL(url);
            connection.setUsername(m_Username);
            connection.setPassword(m_Password);
        } catch (Exception e) {
            printException(e);
        }
    }

    /**
     * Replaces the database connection by a new one without setting a URL
     * explicitly; only the user name and password stored in this saver are
     * applied. Problems are printed, not thrown.
     */
    public void setDestination() {

        try {
            DatabaseConnection connection = new DatabaseConnection();
            m_DataBaseConnection = connection;
            connection.setUsername(m_Username);
            connection.setPassword(m_Password);
        } catch (Exception e) {
            printException(e);
        }
    }

    /**
     * Returns the Capabilities of this saver: the capabilities of the super
     * class plus nominal, numeric, date and string attributes and classes,
     * missing values, missing class values and data without a class.
     *
     * @return            the capabilities of this object
     * @see               Capabilities
     */
    public Capabilities getCapabilities() {
        Capabilities caps = super.getCapabilities();

        // enabled in this order: attribute capabilities first, then class capabilities
        Capability[] supported = new Capability[] {
                Capability.NOMINAL_ATTRIBUTES,
                Capability.NUMERIC_ATTRIBUTES,
                Capability.DATE_ATTRIBUTES,
                Capability.STRING_ATTRIBUTES,
                Capability.MISSING_VALUES,
                Capability.NOMINAL_CLASS,
                Capability.NUMERIC_CLASS,
                Capability.DATE_CLASS,
                Capability.STRING_CLASS,
                Capability.NO_CLASS,
                Capability.MISSING_CLASS_VALUES
        };
        for (int i = 0; i < supported.length; i++) {
            caps.enable(supported[i]);
        }

        return caps;
    }

    /**
     * Connects to the database unless the connection is already open.
     * Problems are printed, not thrown.
     */
    public void connectToDatabase() {

        try {
            boolean alreadyConnected = m_DataBaseConnection.isConnected();
            if (!alreadyConnected) {
                m_DataBaseConnection.connectToDatabase();
            }
        } catch (Exception e) {
            printException(e);
        }
    }

    /**
     * Creates the table for the current header: builds a CREATE TABLE
     * statement with one column per attribute (plus the optional primary key
     * column), executes it and verifies that the table exists afterwards.
     * The table name and, for upper-case databases, the column types stored
     * in this saver are updated as a side effect.
     *
     * @throws Exception if the header has no attributes, the statement fails
     *         or the table does not exist after executing it
     */
    private void writeStructure() throws Exception {

        Instances header = getInstances();
        StringBuffer sql = new StringBuffer("CREATE TABLE ");

        // decide on the table name
        boolean useRelationName = m_tabName || m_tableName.equals("");
        if (useRelationName) {
            m_tableName = m_DataBaseConnection.maskKeyword(header.relationName());
        }
        if (m_DataBaseConnection.getUpperCase()) {
            m_tableName = m_tableName.toUpperCase();
            m_createInt = m_createInt.toUpperCase();
            m_createDouble = m_createDouble.toUpperCase();
            m_createText = m_createText.toUpperCase();
            m_createDate = m_createDate.toUpperCase();
        }
        // everything that is not a word character becomes an underscore
        m_tableName = m_tableName.replaceAll("[^\\w]", "_");
        m_tableName = m_DataBaseConnection.maskKeyword(m_tableName);
        sql.append(m_tableName);

        int numAtts = header.numAttributes();
        if (numAtts == 0) {
            throw new Exception("Instances have no attribute.");
        }
        sql.append(" ( ");

        // optional primary key column comes first
        if (m_id) {
            if (m_DataBaseConnection.getUpperCase()) {
                m_idColumn = m_idColumn.toUpperCase();
            }
            sql.append(m_DataBaseConnection.maskKeyword(m_idColumn)).append(" ").append(m_createInt)
                    .append(" PRIMARY KEY,");
        }

        // one column per attribute
        int last = numAtts - 1;
        for (int i = 0; i < numAtts; i++) {
            Attribute att = header.attribute(i);
            String column = att.name().replaceAll("[^\\w]", "_");
            column = m_DataBaseConnection.maskKeyword(column);
            sql.append(m_DataBaseConnection.getUpperCase() ? column.toUpperCase() : column);

            // date is tested first; every other non-numeric attribute is stored as text
            String columnType;
            if (att.isDate()) {
                columnType = m_createDate;
            } else if (att.isNumeric()) {
                columnType = m_createDouble;
            } else {
                columnType = m_createText;
            }
            sql.append(" " + columnType);

            if (i < last) {
                sql.append(", ");
            }
        }
        sql.append(" )");

        m_DataBaseConnection.update(sql.toString());
        m_DataBaseConnection.close();
        boolean created = m_DataBaseConnection.tableExists(m_tableName);
        if (!created) {
            throw new IOException("Table cannot be built.");
        }
    }

    /**
     * Inserts the given instance into the table by building and executing an
     * INSERT statement. Missing values are written as NULL, dates are
     * formatted with the configured date format, numeric values are written
     * as they are and all other values are written as quoted SQL strings.
     * If the primary key column is enabled, the current row counter is
     * written first and then incremented.
     *
     * @param inst the instance to insert
     * @throws Exception if the statement fails or no row was inserted
     */
    public void writeInstance(Instance inst) throws Exception {

        StringBuffer insert = new StringBuffer();
        insert.append("INSERT INTO ");
        insert.append(m_tableName);
        insert.append(" VALUES ( ");
        if (m_id) {
            insert.append(m_count);
            insert.append(", ");
            m_count++;
        }
        int numAtts = inst.numAttributes();
        for (int j = 0; j < numAtts; j++) {
            if (inst.isMissing(j)) {
                insert.append("NULL");
            } else if (inst.attribute(j).isDate()) {
                insert.append("'" + m_DateFormat.format((long) inst.value(j)) + "'");
            } else if (inst.attribute(j).isNumeric()) {
                insert.append(inst.value(j));
            } else {
                insert.append(quoteSqlString(inst.stringValue(j)));
            }
            if (j != numAtts - 1) {
                insert.append(", ");
            }
        }
        insert.append(" )");

        if (m_DataBaseConnection.update(insert.toString()) < 1) {
            throw new IOException("Tuple cannot be inserted.");
        } else {
            m_DataBaseConnection.close();
        }
    }

    /**
     * Turns a value into a single-quoted SQL string literal. Embedded single
     * quotes are doubled so that values containing apostrophes produce a
     * valid statement instead of terminating the literal early.
     *
     * @param value the raw value
     * @return the quoted and escaped literal
     */
    private static String quoteSqlString(String value) {

        String text = value;
        // Kept from the previous implementation: a value that already carries its
        // own surrounding single quotes is not quoted a second time.
        // NOTE(review): this drops literal outer quotes from the stored data -
        // confirm that this is still wanted.
        if (text.length() >= 2 && text.startsWith("'") && text.endsWith("'")) {
            text = text.substring(1, text.length() - 1);
        }
        return "'" + text.replace("'", "''") + "'";
    }

    /**
     * Saves one instance incrementally. The header has to be available
     * before the first call; the table is created when the first call finds
     * it. Passing null as instance ends the incremental saving: the
     * connection is closed, the structure reset and the row counter set
     * back to 1. Exceptions raised while talking to the database are
     * printed, not thrown.
     *
     * @param inst the instance to save, or null to finish
     * @throws IOException if no database connection object exists or batch
     *         saving is already in progress
     */
    public void writeIncremental(Instance inst) throws IOException {

        int mode = getWriteMode();
        Instances header = getInstances();

        if (m_DataBaseConnection == null) {
            throw new IOException("No database has been set up.");
        }
        if (getRetrieval() == BATCH) {
            throw new IOException("Batch and incremental saving cannot be mixed.");
        }
        setRetrieval(INCREMENTAL);

        try {
            if (!m_DataBaseConnection.isConnected()) {
                connectToDatabase();
            }

            // WAIT: decide whether we can start (header present) or have to cancel
            if (mode == WAIT) {
                if (header != null) {
                    setWriteMode(STRUCTURE_READY);
                } else {
                    setWriteMode(CANCEL);
                    if (inst != null) {
                        throw new Exception("Structure(Header Information) has to be set in advance");
                    }
                }
                mode = getWriteMode();
            }

            if (mode == CANCEL) {
                cancel();
            }

            // STRUCTURE_READY: create the table, then continue in WRITE mode
            if (mode == STRUCTURE_READY) {
                setWriteMode(WRITE);
                writeStructure();
                mode = getWriteMode();
            }

            if (mode == WRITE) {
                if (header == null) {
                    throw new IOException("No instances information available.");
                }
                if (inst == null) {
                    // end of data: close everything down
                    m_DataBaseConnection.disconnectFromDatabase();
                    resetStructure();
                    m_count = 1;
                } else {
                    writeInstance(inst);
                }
            }
        } catch (Exception e) {
            printException(e);
        }
    }

    /**
     * Writes all instances in one go: connects if necessary, creates the
     * table, inserts every instance, disconnects and puts the saver back
     * into WAIT mode with the structure reset and the row counter at 1.
     * Exceptions raised while talking to the database are printed, not
     * thrown.
     *
     * @throws IOException if there are no instances, incremental saving is
     *         already in progress or no database connection object exists
     */
    public void writeBatch() throws IOException {

        Instances data = getInstances();
        if (data == null) {
            throw new IOException("No instances to save");
        }
        if (getRetrieval() == INCREMENTAL) {
            throw new IOException("Batch and incremental saving cannot be mixed.");
        }
        if (m_DataBaseConnection == null) {
            throw new IOException("No database has been set up.");
        }
        setRetrieval(BATCH);

        try {
            if (!m_DataBaseConnection.isConnected()) {
                connectToDatabase();
            }
            setWriteMode(WRITE);
            writeStructure();

            int row = 0;
            while (row < data.numInstances()) {
                writeInstance(data.instance(row));
                row++;
            }

            m_DataBaseConnection.disconnectFromDatabase();
            setWriteMode(WAIT);
            resetStructure();
            m_count = 1;
        } catch (Exception e) {
            printException(e);
        }
    }

    /**
     * Prints the message of an exception to standard out. For an
     * SQLException the SQL state and error code are printed as well and the
     * chain of next exceptions is followed.
     *
     * @param ex the exception to print
     */
    private void printException(Exception ex) {

        System.out.println("\n--- Exception caught ---\n");

        Exception current = ex;
        while (current != null) {
            System.out.println("Message:   " + current.getMessage());

            // only SQL exceptions carry a chain that is followed
            Exception next = null;
            if (current instanceof SQLException) {
                SQLException sqlEx = (SQLException) current;
                System.out.println("SQLState:  " + sqlEx.getSQLState());
                System.out.println("ErrorCode: " + sqlEx.getErrorCode());
                next = sqlEx.getNextException();
            }
            System.out.println("");
            current = next;
        }

    }

    /**
     * Returns the current settings as an option array. URL, user, password,
     * table name and input file are only included when they are non-empty;
     * -P is included when the primary key column is enabled.
     *
     * @return the current setting
     */
    public String[] getOptions() {
        Vector<String> result = new Vector<String>();

        String url = getUrl();
        if (url != null && url.length() != 0) {
            result.add("-url");
            result.add(getUrl());
        }

        String user = getUser();
        if (user != null && user.length() != 0) {
            result.add("-user");
            result.add(getUser());
        }

        String password = getPassword();
        if (password != null && password.length() != 0) {
            result.add("-password");
            result.add(getPassword());
        }

        if (m_tableName != null && m_tableName.length() != 0) {
            result.add("-T");
            result.add(m_tableName);
        }

        if (m_id) {
            result.add("-P");
        }

        if (m_inputFile != null && m_inputFile.length() != 0) {
            result.add("-i");
            result.add(m_inputFile);
        }

        return result.toArray(new String[result.size()]);
    }

    /**
     * Describes the command line options understood by this saver
     * (-url, -user, -password, -T, -P and -i).
     *
     * @return an enumeration of the available options
     */
    public java.util.Enumeration listOptions() {

        FastVector available = new FastVector();

        available.addElement(new Option(
                "\tThe JDBC URL to connect to.\n\t(default: from DatabaseUtils.props file)",
                "url", 1, "-url <JDBC URL>"));

        available.addElement(new Option(
                "\tThe user to connect with to the database.\n\t(default: none)",
                "user", 1, "-user <name>"));

        available.addElement(new Option(
                "\tThe password to connect with to the database.\n\t(default: none)",
                "password", 1, "-password <password>"));

        available.addElement(new Option(
                "\tThe name of the table.\n\t(default: the relation name)",
                "T", 1, "-T <table name>"));

        available.addElement(new Option(
                "\tAdd an ID column as primary key. The name is specified\n"
                        + "\tin the DatabaseUtils file ('idColumn'). The DatabaseLoader\n"
                        + "\twon't load this column.",
                "P", 0, "-P"));

        available.addElement(new Option(
                "\tInput file in arff format that should be saved in database.",
                "i", 1, "-i <input file name>"));

        return available.elements();
    }

    /**
     * Resets the saver and then applies the given options. If an input file
     * is given, it is loaded as the data to save; problems while loading it
     * are printed, not thrown. <p/>
     *
     <!-- options-start -->
     * Valid options are: <p/>
     * 
     * <pre> -url &lt;JDBC URL&gt;
     *  The JDBC URL to connect to.
     *  (default: from DatabaseUtils.props file)</pre>
     * 
     * <pre> -user &lt;name&gt;
     *  The user to connect with to the database.
     *  (default: none)</pre>
     * 
     * <pre> -password &lt;password&gt;
     *  The password to connect with to the database.
     *  (default: none)</pre>
     * 
     * <pre> -T &lt;table name&gt;
     *  The name of the table.
     *  (default: the relation name)</pre>
     * 
     * <pre> -P
     *  Add an ID column as primary key. The name is specified
     *  in the DatabaseUtils file ('idColumn'). The DatabaseLoader
     *  won't load this column.</pre>
     * 
     * <pre> -i &lt;input file name&gt;
     *  Input file in arff format that should be saved in database.</pre>
     * 
     <!-- options-end -->
     *
     * @param options the options
     * @throws Exception if options cannot be set
     */
    public void setOptions(String[] options) throws Exception {

        resetOptions();

        // connection settings are only applied when given
        String value = Utils.getOption("url", options);
        if (value.length() != 0) {
            setUrl(value);
        }

        value = Utils.getOption("user", options);
        if (value.length() != 0) {
            setUser(value);
        }

        value = Utils.getOption("password", options);
        if (value.length() != 0) {
            setPassword(value);
        }

        String table = Utils.getOption('T', options);
        String input = Utils.getOption('i', options);

        // an explicit table name switches off the use of the relation name
        boolean tableGiven = table.length() != 0;
        if (tableGiven) {
            m_tableName = table;
            m_tabName = false;
        }

        m_id = Utils.getFlag('P', options);

        if (input.length() == 0) {
            return;
        }

        try {
            m_inputFile = input;
            ArffLoader loader = new ArffLoader();
            File source = new File(input);
            loader.setSource(source);
            setInstances(loader.getDataSet());
            if (!tableGiven) {
                m_tableName = getInstances().relationName();
            }
        } catch (Exception e) {
            printException(e);
            e.printStackTrace();
        }
    }

    /**
     * Returns the revision string extracted from the revision keyword.
     *
     * @return      the revision
     */
    public String getRevision() {
        String revision = RevisionUtils.extract("$Revision: 7499 $");
        return revision;
    }

    /**
     * Inserts every instance of the given data set into the table, one
     * after the other, by calling writeInstance for each of them.
     *
     * @param inst the instances to insert
     * @throws Exception if inserting an instance fails
     */
    public void writeInstances(Instances inst) throws Exception {
        int row = 0;
        while (row < inst.numInstances()) {
            writeInstance(inst.instance(row));
            row++;
        }
    }

    /**
     * Main method: creates a saver, applies the given options, sets the
     * destination from the stored settings and writes the data in batch
     * mode. If that fails, the stack trace and the list of options are
     * printed.
     *
     * @param options should contain the options of a Saver.
     */
    public static void main(String[] options) {

        StringBuffer text = new StringBuffer();
        text.append("\n\nDatabaseSaver options:\n");
        try {
            // Instantiate this class rather than the stock weka DatabaseSaver, so
            // that running this main method exercises the code in this file.
            DatabaseSaverEx asv = new DatabaseSaverEx();
            try {
                // collect the option descriptions for the error output below
                Enumeration enumi = asv.listOptions();
                while (enumi.hasMoreElements()) {
                    Option option = (Option) enumi.nextElement();
                    text.append(option.synopsis() + '\n');
                    text.append(option.description() + '\n');
                }
                asv.setOptions(options);
                asv.setDestination();
            } catch (Exception ex) {
                ex.printStackTrace();
            }

            // batch mode; incremental saving would use writeIncremental instead
            asv.writeBatch();
        } catch (Exception ex) {
            ex.printStackTrace();
            System.out.println(text);
        }

    }
}