it.unibas.spicy.persistence.csv.ExportCSVInstances.java Source code

Introduction

Here is the source code for it.unibas.spicy.persistence.csv.ExportCSVInstances.java, a class from the MIPMap project that exports the target instance of a mapping task to CSV files.

Source

/* Copyright 2015-2016 by the Athens University of Economics and Business (AUEB).
    
   This file is part of MIPMap.
    
   MIPMap is free software: you can redistribute it and/or modify
it under the terms of the GNU General Public License as published by
the Free Software Foundation, either version 3 of the License, or
(at your option) any later version.
    
MIPMap is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
GNU General Public License for more details.
    
You should have received a copy of the GNU General Public License
along with MIPMap.  If not, see <http://www.gnu.org/licenses/>.
 */

package it.unibas.spicy.persistence.csv;

import au.com.bytecode.opencsv.CSVReader;
import au.com.bytecode.opencsv.CSVWriter;
import it.unibas.spicy.model.datasource.INode;
import it.unibas.spicy.model.mapping.IDataSourceProxy;
import it.unibas.spicy.model.mapping.MappingTask;
import it.unibas.spicy.persistence.AccessConfiguration;
import it.unibas.spicy.persistence.DAOException;
import it.unibas.spicy.persistence.relational.IConnectionFactory;
import it.unibas.spicy.persistence.relational.SimpleDbConnectionFactory;
import it.unibas.spicy.utility.SpicyEngineConstants;
import java.io.BufferedWriter;
import java.io.File;
import java.io.FileReader;
import java.io.FileWriter;
import java.io.IOException;
import java.sql.Connection;
import java.sql.DatabaseMetaData;
import java.sql.ResultSet;
import java.sql.ResultSetMetaData;
import java.sql.SQLException;
import java.sql.Statement;
import java.util.HashMap;
import java.util.HashSet;
import org.apache.commons.logging.Log;
import org.apache.commons.logging.LogFactory;

//giannisk
public class ExportCSVInstances {
    private static final Log logger = LogFactory.getLog(ExportCSVInstances.class);

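    /**
     * Opens a connection to the internal Postgres mapping-task database,
     * using the driver, URI, login and password constants of the engine.
     */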
    private Connection getConnectionToPostgres(IConnectionFactory connectionFactory) throws DAOException {
        AccessConfiguration accessConfiguration = new AccessConfiguration();
        accessConfiguration.setDriver(SpicyEngineConstants.ACCESS_CONFIGURATION_DRIVER);
        accessConfiguration
                .setUri(SpicyEngineConstants.ACCESS_CONFIGURATION_URI + SpicyEngineConstants.MAPPING_TASK_DB_NAME);
        accessConfiguration.setLogin(SpicyEngineConstants.ACCESS_CONFIGURATION_LOGIN);
        accessConfiguration.setPassword(SpicyEngineConstants.ACCESS_CONFIGURATION_PASS);

        return connectionFactory.getConnection(accessConfiguration);
    }

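    /**
     * Exports every table of the target schema of the given scenario to a
     * separate csv file inside a newly created folder under directoryPath.
     */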
    public void exportCSVInstances(MappingTask mappingTask, String directoryPath, String suffix, int scenarioNo)
            throws DAOException, SQLException, IOException {
        IDataSourceProxy dataSourceTarget = mappingTask.getTargetProxy();
        String folderPath = generateFolderPath(dataSourceTarget.getIntermediateSchema(), directoryPath, suffix, 0);
        //create CSV Folder
        new File(folderPath).mkdir();
        //connection to Postgres
        IConnectionFactory connectionFactory = new SimpleDbConnectionFactory();
        Connection connection = getConnectionToPostgres(connectionFactory);
        try (Statement statement = connection.createStatement()) {
            //get table names from the target database
            DatabaseMetaData databaseMetaData = connection.getMetaData();
            String[] tableTypes = new String[] { "TABLE" };

            ResultSet tableResultSet = databaseMetaData.getTables(SpicyEngineConstants.MAPPING_TASK_DB_NAME,
                    SpicyEngineConstants.TARGET_SCHEMA_NAME + scenarioNo, null, tableTypes);
            while (tableResultSet.next()) {
                String tableName = tableResultSet.getString("TABLE_NAME");
                createCSVDocument(tableName, SpicyEngineConstants.TARGET_SCHEMA_NAME + scenarioNo, dataSourceTarget,
                        folderPath, statement, null);
            }
            tableResultSet.close();
        } finally {
            //close connection
            if (connection != null)
                connectionFactory.close(connection);
        }
    }

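    /**
     * Builds the export folder path from the directory path, the label of the
     * schema root node, the suffix and the counter i, inserting a file
     * separator when the directory path does not already end with one.
     */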
    private String generateFolderPath(INode rootNode, String directoryPath, String suffix, int i) {
        String folderPath = "";
        if (directoryPath.endsWith(File.separator)) {
            folderPath = directoryPath + rootNode.getLabel() + suffix + i;
        } else {
            folderPath = directoryPath + File.separator + rootNode.getLabel() + suffix + i;
        }
        return folderPath;
    }

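    /**
     * Convenience overload of
     * {@link #createCSVDocument(String, String, IDataSourceProxy, String, Statement, String[], boolean)}
     * that sets the unpivot flag to false.
     */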
    public void createCSVDocument(String tableName, String schema, IDataSourceProxy dataSourceTarget,
            String folderPath, Statement statement, String[] columnNames) throws SQLException, IOException {
        createCSVDocument(tableName, schema, dataSourceTarget, folderPath, statement, columnNames, false);
    }

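    /**
     * Writes all rows of the given table to folderPath/tableName.csv. When
     * columnNames is null, the header is taken from the target schema
     * (honouring renamed columns); string values are double-quoted and nulls
     * become empty fields.
     */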
    public void createCSVDocument(String tableName, String schema, IDataSourceProxy dataSourceTarget,
            String folderPath, Statement statement, String[] columnNames, boolean unpivot)
            throws SQLException, IOException {
        File file = new File(folderPath + File.separator + tableName + ".csv");
        ResultSet allRows = statement.executeQuery("SELECT * FROM " + schema + ".\"" + tableName + "\";");
        ResultSetMetaData metaData = allRows.getMetaData();
        int columnCount = metaData.getColumnCount();

        if (columnNames == null) {
            //first write column names
            columnNames = new String[columnCount];
            int i = 0;
            //datasource is null when exporting the unpivoted csv table
            if (dataSourceTarget != null) {
                INode tableNode = dataSourceTarget.getIntermediateSchema().getChild(tableName);
                //get column names from the first table tuple only           
                for (INode column : tableNode.getChild(0).getChildren()) {
                    String columnLabel = column.getLabel();
                    String oldValue = dataSourceTarget.getChangedValue(tableName + "." + columnLabel);
                    if (oldValue != null) {
                        columnNames[i] = oldValue;
                    } else {
                        columnNames[i] = columnLabel;
                    }
                    i++;
                }
            }
        }
        CSVWriter csvWriter = new CSVWriter(new FileWriter(file), CSVWriter.DEFAULT_SEPARATOR,
                CSVWriter.NO_QUOTE_CHARACTER, CSVWriter.NO_ESCAPE_CHARACTER);
        try {
            //first write the header row with the column names
            csvWriter.writeNext(columnNames, false);
            //then write the data
            while (allRows.next()) {
                String[] row = new String[columnCount];
                for (int j = 1; j <= columnCount; j++) {
                    String dataType = metaData.getColumnTypeName(j);
                    String value = allRows.getString(j);
                    //null values are written to the csv file as empty fields
                    if (value == null) {
                        //avenet 20170721 - we could export either the literal "null" or an empty field; Postgres
                        //treats them the same, and the empty field (,,) is the more correct csv form
                        //avenet 20170215 - null values in Postgres csv mode correspond to ,,
                        value = "";
                    }
                    //if the type is a string/text type, put the non-null value between double quotes
                    else if (dataType.toLowerCase().startsWith("varchar")
                            || dataType.toLowerCase().startsWith("char")
                            || dataType.toLowerCase().startsWith("text") || dataType.equalsIgnoreCase("bpchar")
                            || dataType.equalsIgnoreCase("bit") || dataType.equalsIgnoreCase("mediumtext")
                            || dataType.equalsIgnoreCase("longtext") || dataType.equalsIgnoreCase("serial")
                            || dataType.equalsIgnoreCase("enum")) {
                        //avenet 20170724 - with these double quotes, string values are stored as ,"value", and nulls as ,,
                        //embedded double quotes are doubled so the resulting csv stays well-formed
                        value = "\"" + value.replace("\"", "\"\"") + "\"";
                    }
                    row[j - 1] = value;
                }
                //pass false so that no extra quotes are added; double quotes were already added around string values
                csvWriter.writeNext(row, false);
            }
        } finally {
            csvWriter.close();
            allRows.close();
        }
    }

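    /**
     * Appends the rows of every target-schema table to an existing csv file,
     * whose path is looked up by table name in directoryPaths; the csv header
     * must match the table columns.
     */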
    public void appendCSVInstances(MappingTask mappingTask, HashMap<String, String> directoryPaths, int scenarioNo)
            throws SQLException, DAOException, IOException {
        //connection to Postgres
        IConnectionFactory connectionFactory = new SimpleDbConnectionFactory();
        Connection connection = getConnectionToPostgres(connectionFactory);
        try (Statement statement = connection.createStatement()) {
            //get table names from the target database
            DatabaseMetaData databaseMetaData = connection.getMetaData();
            String[] tableTypes = new String[] { "TABLE" };
            ResultSet tableResultSet = databaseMetaData.getTables(SpicyEngineConstants.MAPPING_TASK_DB_NAME,
                    SpicyEngineConstants.TARGET_SCHEMA_NAME + scenarioNo, null, tableTypes);
            //for each table
            while (tableResultSet.next()) {
                String tableName = tableResultSet.getString("TABLE_NAME");
                String filePath = directoryPaths.get(tableName);

                if ((filePath != null) && (!filePath.equals(""))) {
                    ResultSet allRows = statement.executeQuery("SELECT * FROM "
                            + SpicyEngineConstants.TARGET_SCHEMA_NAME + scenarioNo + ".\"" + tableName + "\";");
                    try {
                        //number of columns
                        int columnCount = allRows.getMetaData().getColumnCount();
                        //column names
                        String[] columnNames = new String[columnCount];
                        for (int i = 1; i <= columnCount; i++) {
                            columnNames[i - 1] = allRows.getMetaData().getColumnName(i);
                        }
                        if (checkDocForCSVColumns(columnCount, columnNames, filePath)) {
                            appendToCSVDocument(allRows, columnCount, filePath);
                        } else {
                            throw new DAOException("Column names do not match those of the csv file");
                        }
                    } finally {
                        allRows.close();
                    }
                } else {
                    //throw instead of calling System.exit, so that the connection is still closed properly
                    throw new DAOException("The csv file for table " + tableName + " cannot be found!");
                }
            }
        } finally {
            //close connection
            if (connection != null)
                connectionFactory.close(connection);
        }
    }

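    /**
     * Returns true if the first line of the csv file holds exactly the given
     * column names, ignoring case and surrounding double quotes.
     */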
    private boolean checkDocForCSVColumns(int columnCount, String[] columnNames, String filePath) {
        try (CSVReader reader = new CSVReader(new FileReader(filePath))) {
            //read only the first line, which holds the csv column names
            String[] nextLine = reader.readNext();

            //an empty file, or one with a different number of columns, cannot match
            if (nextLine == null || nextLine.length != columnCount) {
                return false;
            }

            int i = 0;
            //check that the table columns are the same -and in the same order- as those of the csv file
            for (String columnName : columnNames) {
                String csvColumnName = nextLine[i].replace("\"", "");
                if (!columnName.equalsIgnoreCase(csvColumnName)) {
                    return false;
                }
                i++;
            }
            return true;
        } catch (IOException ex) {
            //FileNotFoundException is a subclass of IOException, so a single catch block covers both
            logger.error("Error reading csv file " + filePath, ex);
            return false;
        }
    }

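    /**
     * Appends the result set rows to the end of the csv file, using the same
     * null and string-quoting conventions as createCSVDocument.
     */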
    private void appendToCSVDocument(ResultSet allRows, int columnCount, String filePath)
            throws SQLException, IOException {
        //the flag 'true' means that the writer will go to the end of the file and append the new data
        BufferedWriter bfout = new BufferedWriter(new FileWriter(filePath, true));
        try {
            //fetch the metadata once instead of once per value
            ResultSetMetaData metaData = allRows.getMetaData();
            while (allRows.next()) {
                String row = "";
                for (int j = 1; j <= columnCount; j++) {
                    String dataType = metaData.getColumnTypeName(j);
                    String value = allRows.getString(j);
                    //null values are written to the csv file as empty fields
                    if (value == null) {
                        //avenet 20170215 - an empty field is the copy csv format for null in Postgres
                        value = "";
                    }
                    //if the type is a string/text type, put the non-null value between double quotes
                    else if (dataType.toLowerCase().startsWith("varchar")
                            || dataType.toLowerCase().startsWith("char")
                            || dataType.toLowerCase().startsWith("text") || dataType.equalsIgnoreCase("bpchar")
                            || dataType.equalsIgnoreCase("bit") || dataType.equalsIgnoreCase("mediumtext")
                            || dataType.equalsIgnoreCase("longtext") || dataType.equalsIgnoreCase("serial")
                            || dataType.equalsIgnoreCase("enum")) {
                        //embedded double quotes are doubled so the resulting csv stays well-formed
                        value = "\"" + value.replace("\"", "\"\"") + "\"";
                    }
                    row = row + value + ",";
                }
                //take out the last ',' character
                row = row.substring(0, row.length() - 1);
                bfout.write(row);
                bfout.newLine();
            }
        } finally {
            bfout.close();
        }
    }

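    /**
     * Exports each table in tableNames from the work schema to a csv file
     * inside a newly created folder under directoryPath.
     */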
    public void exportPKConstraintCSVInstances(MappingTask mappingTask, String directoryPath,
            HashSet<String> tableNames, String suffix, int scenarioNo)
            throws DAOException, SQLException, IOException {
        IDataSourceProxy dataSourceTarget = mappingTask.getTargetProxy();
        String folderPath = generateFolderPath(dataSourceTarget.getIntermediateSchema(), directoryPath, suffix, 0);
        //create Folder
        new File(folderPath).mkdir();
        //connection to Postgres
        IConnectionFactory connectionFactory = new SimpleDbConnectionFactory();
        Connection connection = getConnectionToPostgres(connectionFactory);

        try (Statement statement = connection.createStatement()) {
            for (String tableName : tableNames) {
                createCSVDocument(tableName, SpicyEngineConstants.WORK_SCHEMA_NAME, dataSourceTarget, folderPath,
                        statement, null);
            }
        } finally {
            //close connection
            if (connection != null)
                connectionFactory.close(connection);
        }
    }

}
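
Usage

The following sketch shows how the exporter might be called from application code. It is a minimal, hypothetical example: the MappingTask instance would come from the surrounding MIPMap application, and the wrapper class name, the "_export" suffix, and the scenario number 0 are illustrative placeholders, not part of the class above.

import it.unibas.spicy.model.mapping.MappingTask;
import it.unibas.spicy.persistence.csv.ExportCSVInstances;
import java.util.HashMap;

public class ExportCSVInstancesExample {

    //export the target instance of scenario 0, one csv file per table,
    //into a folder created under outputDir
    public static void exportTarget(MappingTask task, String outputDir) throws Exception {
        ExportCSVInstances exporter = new ExportCSVInstances();
        exporter.exportCSVInstances(task, outputDir, "_export", 0);
    }

    //append the rows of each target table to an existing csv file;
    //csvPaths maps every table name to the file that should be extended
    public static void appendTarget(MappingTask task, HashMap<String, String> csvPaths) throws Exception {
        ExportCSVInstances exporter = new ExportCSVInstances();
        exporter.appendCSVInstances(task, csvPaths, 0);
    }
}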