eu.stratosphere.pact.test.contracts.MatchITCase.java Source code

Java tutorial

Introduction

Here is the source code for eu.stratosphere.pact.test.contracts.MatchITCase.java, a parameterized JUnit integration test for the Match contract.

Source

/***********************************************************************************************************************
 *
 * Copyright (C) 2010 by the Stratosphere project (http://stratosphere.eu)
 *
 * Licensed under the Apache License, Version 2.0 (the "License"); you may not use this file except in compliance with
 * the License. You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software distributed under the License is distributed on
 * an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the License for the
 * specific language governing permissions and limitations under the License.
 *
 **********************************************************************************************************************/

package eu.stratosphere.pact.test.contracts;

import java.io.FileNotFoundException;
import java.io.IOException;
import java.util.Collection;
import java.util.LinkedList;

import org.apache.commons.logging.Log;
import org.apache.commons.logging.LogFactory;
import org.junit.runner.RunWith;
import org.junit.runners.Parameterized;
import org.junit.runners.Parameterized.Parameters;

import eu.stratosphere.nephele.configuration.Configuration;
import eu.stratosphere.nephele.jobgraph.JobGraph;
import eu.stratosphere.pact.common.contract.FileDataSink;
import eu.stratosphere.pact.common.contract.FileDataSource;
import eu.stratosphere.pact.common.contract.MatchContract;
import eu.stratosphere.pact.common.io.DelimitedInputFormat;
import eu.stratosphere.pact.common.plan.Plan;
import eu.stratosphere.pact.common.stubs.Collector;
import eu.stratosphere.pact.common.stubs.MatchStub;
import eu.stratosphere.pact.common.type.PactRecord;
import eu.stratosphere.pact.common.type.base.PactInteger;
import eu.stratosphere.pact.common.type.base.PactString;
import eu.stratosphere.pact.compiler.DataStatistics;
import eu.stratosphere.pact.compiler.PactCompiler;
import eu.stratosphere.pact.compiler.plan.candidate.OptimizedPlan;
import eu.stratosphere.pact.compiler.plantranslate.NepheleJobGraphGenerator;
import eu.stratosphere.pact.test.contracts.io.ContractITCaseIOFormats.ContractITCaseInputFormat;
import eu.stratosphere.pact.test.contracts.io.ContractITCaseIOFormats.ContractITCaseOutputFormat;
import eu.stratosphere.pact.test.util.TestBase;

/**
 * Integration test for the PACT Match contract.
 * <p>
 * The test writes four small input files for each of the two match inputs, runs a job that matches both inputs on
 * field 0 using {@link TestMatcher}, and compares the job output line by line against {@code MATCH_RESULT}. It is
 * executed once for every combination of local strategy and ship strategy hint produced by
 * {@link #getConfigurations()}.
 *
 * @author Fabian Hueske
 */
@RunWith(Parameterized.class)
public class MatchITCase extends TestBase {

    private static final Log LOG = LogFactory.getLog(MatchITCase.class);

    /** Configuration key holding the local strategy hint passed to the compiler. */
    private static final String CONFIG_LOCAL_STRATEGY = "MatchTest#LocalStrategy";

    /** Configuration key holding the ship strategy (a compiler hint or one of the BROADCAST_* markers below). */
    private static final String CONFIG_SHIP_STRATEGY = "MatchTest#ShipStrategy";

    /** Configuration key holding the degree of parallelism used for the sources and the match. */
    private static final String CONFIG_NO_SUBTASKS = "MatchTest#NoSubtasks";

    /** Test-local marker: broadcast the first input, forward the second. */
    private static final String BROADCAST_FIRST = "BROADCAST_FIRST";

    /** Test-local marker: forward the first input, broadcast the second. */
    private static final String BROADCAST_SECOND = "BROADCAST_SECOND";

    /** Locations of the test data, relative to the temp directory of the file system provider. */
    private static final String LEFT_DIR = "/match_left";

    private static final String RIGHT_DIR = "/match_right";

    private static final String RESULT_FILE = "/result.txt";

    /** Contents of the files written to the first (left) input directory, one entry per file. */
    private static final String[] MATCH_LEFT_INPUTS = {
        "1 1\n2 2\n3 3\n4 4\n",
        "1 2\n2 3\n3 4\n4 5\n",
        "1 3\n2 4\n3 5\n4 6\n",
        "1 4\n2 5\n3 6\n4 7\n" };

    /** Contents of the files written to the second (right) input directory, one entry per file. */
    private static final String[] MATCH_RIGHT_INPUTS = {
        "1 1\n2 2\n3 3\n5 1\n",
        "1 1\n2 2\n3 3\n6 1\n",
        "1 1\n2 2\n2 2\n7 1\n",
        "1 1\n2 2\n2 2\n8 1\n" };

    // Expected output. For every pair of records with equal key, TestMatcher emits (key + 1) together with
    // (leftValue + 2) - (rightValue + 1):
    //   key 1: 4 left x 4 right records -> 16 lines with key 2
    //   key 3: 4 left x 2 right records ->  8 lines with key 4
    //   key 2: 4 left x 6 right records -> 24 lines with key 3
    // Keys 4 (left only) and 5-8 (right only) have no partner and produce no output.
    private static final String MATCH_RESULT = "2 1\n2 1\n2 1\n2 1\n2 2\n2 2\n2 2\n2 2\n2 3\n2 3\n2 3\n2 3\n2 4\n2 4\n2 4\n2 4\n"
            + "4 1\n4 1\n4 2\n4 2\n4 3\n4 3\n4 4\n4 4\n"
            + "3 1\n3 2\n3 3\n3 4\n3 1\n3 2\n3 3\n3 4\n3 1\n3 2\n3 3\n3 4\n3 1\n3 2\n3 3\n3 4\n3 1\n3 2\n3 3\n3 4\n3 1\n3 2\n3 3\n3 4\n";

    /**
     * Creates the test case for one parameter combination.
     *
     * @param clusterConfig
     *        the cluster configuration, handed to {@link TestBase}
     * @param testConfig
     *        the test configuration holding the strategy hints and the number of subtasks
     */
    public MatchITCase(String clusterConfig, Configuration testConfig) {
        super(testConfig, clusterConfig);
    }

    /**
     * Writes the input files for both match inputs into the temp directory.
     */
    @Override
    protected void preSubmit() throws Exception {
        final String tempPath = getFilesystemProvider().getTempDirPath();

        createInputFiles(tempPath + LEFT_DIR, MATCH_LEFT_INPUTS);
        createInputFiles(tempPath + RIGHT_DIR, MATCH_RIGHT_INPUTS);
    }

    /**
     * Creates the directory {@code dir} and writes one file {@code matchTest_<i>.txt} (1-based) per entry of
     * {@code contents} into it.
     */
    private void createInputFiles(String dir, String[] contents) throws Exception {
        getFilesystemProvider().createDir(dir);

        for (int i = 0; i < contents.length; i++) {
            getFilesystemProvider().createFile(dir + "/matchTest_" + (i + 1) + ".txt", contents[i]);
        }
    }

    /**
     * Match stub under test. Reads fields 0 and 1 of both records as strings holding integers and emits the first
     * record with field 0 replaced by {@code key + 1} and field 1 replaced by
     * {@code (value1 + 2) - (value2 + 1)}.
     */
    public static class TestMatcher extends MatchStub {

        // reused across invocations as deserialization targets
        private PactString keyString = new PactString();
        private PactString valueString = new PactString();

        @Override
        public void match(PactRecord value1, PactRecord value2, Collector<PactRecord> out) throws Exception {
            // increment the key of the first record in place
            keyString = value1.getField(0, keyString);
            keyString.setValue(Integer.toString(Integer.parseInt(keyString.getValue()) + 1));
            value1.setField(0, keyString);

            // valueString is shared, so each value is parsed before the next field is read into it
            valueString = value1.getField(1, valueString);
            int val1 = Integer.parseInt(valueString.getValue()) + 2;
            valueString = value2.getField(1, valueString);
            int val2 = Integer.parseInt(valueString.getValue()) + 1;

            value1.setField(1, new PactInteger(val1 - val2));

            out.collect(value1);

            if (LOG.isDebugEnabled()) {
                // note: the key printed here is the already incremented one
                LOG.debug("Processed: [" + keyString.toString() + "," + val1 + "] + [" + keyString.toString()
                        + "," + val2 + "]");
            }
        }

    }

    /**
     * Builds the test plan (two file sources, one match, one file sink), compiles it with the {@link PactCompiler}
     * and translates the optimized plan into a Nephele job graph.
     * <p>
     * The local strategy and ship strategy of the match are set as compiler hints taken from the test configuration.
     */
    @Override
    protected JobGraph getJobGraph() throws Exception {

        final String pathPrefix = getFilesystemProvider().getURIPrefix() + getFilesystemProvider().getTempDirPath();
        final int noSubtasks = config.getInteger(CONFIG_NO_SUBTASKS, 1);
        final String shipStrategy = config.getString(CONFIG_SHIP_STRATEGY, "");

        FileDataSource input_left = createSource(pathPrefix + LEFT_DIR, noSubtasks);
        FileDataSource input_right = createSource(pathPrefix + RIGHT_DIR, noSubtasks);

        // match on field 0 of both inputs, keys are strings
        MatchContract testMatcher = MatchContract.builder(TestMatcher.class, PactString.class, 0, 0).build();
        testMatcher.setDegreeOfParallelism(noSubtasks);
        testMatcher.getParameters().setString(PactCompiler.HINT_LOCAL_STRATEGY,
                config.getString(CONFIG_LOCAL_STRATEGY, ""));

        if (BROADCAST_FIRST.equals(shipStrategy)) {
            testMatcher.getParameters().setString(PactCompiler.HINT_SHIP_STRATEGY_FIRST_INPUT,
                    PactCompiler.HINT_SHIP_STRATEGY_BROADCAST);
            testMatcher.getParameters().setString(PactCompiler.HINT_SHIP_STRATEGY_SECOND_INPUT,
                    PactCompiler.HINT_SHIP_STRATEGY_FORWARD);
        } else if (BROADCAST_SECOND.equals(shipStrategy)) {
            testMatcher.getParameters().setString(PactCompiler.HINT_SHIP_STRATEGY_FIRST_INPUT,
                    PactCompiler.HINT_SHIP_STRATEGY_FORWARD);
            testMatcher.getParameters().setString(PactCompiler.HINT_SHIP_STRATEGY_SECOND_INPUT,
                    PactCompiler.HINT_SHIP_STRATEGY_BROADCAST);
        } else {
            // any other value is passed through as a hint for both inputs
            testMatcher.getParameters().setString(PactCompiler.HINT_SHIP_STRATEGY, shipStrategy);
        }

        FileDataSink output = new FileDataSink(ContractITCaseOutputFormat.class, pathPrefix + RESULT_FILE);
        output.setDegreeOfParallelism(1);

        output.addInput(testMatcher);
        testMatcher.addFirstInput(input_left);
        testMatcher.addSecondInput(input_right);

        Plan plan = new Plan(output);

        PactCompiler pc = new PactCompiler(new DataStatistics());
        OptimizedPlan op = pc.compile(plan);

        NepheleJobGraphGenerator jgg = new NepheleJobGraphGenerator();
        return jgg.compileJobGraph(op);

    }

    /**
     * Creates a newline-delimited file source reading {@code path} with the given degree of parallelism.
     */
    private static FileDataSource createSource(String path, int degreeOfParallelism) throws Exception {
        FileDataSource source = new FileDataSource(ContractITCaseInputFormat.class, path);
        DelimitedInputFormat.configureDelimitedFormat(source).recordDelimiter('\n');
        source.setDegreeOfParallelism(degreeOfParallelism);
        return source;
    }

    /**
     * Compares the job output against the expected result and removes all files created by this test.
     * <p>
     * The cleanup runs in a {@code finally} block so that a failed comparison does not leave the input directories
     * and the result file behind for the remaining parameterized runs.
     */
    @Override
    protected void postSubmit() throws Exception {
        final String tempPath = getFilesystemProvider().getTempDirPath();

        try {
            compareResultsByLinesInMemory(MATCH_RESULT, tempPath + RESULT_FILE);
        } finally {
            getFilesystemProvider().delete(tempPath + RESULT_FILE, true);
            getFilesystemProvider().delete(tempPath + LEFT_DIR, true);
            getFilesystemProvider().delete(tempPath + RIGHT_DIR, true);
        }

    }

    /**
     * Produces the test parameters: one configuration for each of the three local strategies combined with each of
     * the three ship strategies, all using four subtasks.
     *
     * @return the parameter list built by {@code toParameterList} from the nine configurations
     */
    @Parameters
    public static Collection<Object[]> getConfigurations() throws FileNotFoundException, IOException {

        LinkedList<Configuration> tConfigs = new LinkedList<Configuration>();

        String[] localStrategies = { PactCompiler.HINT_LOCAL_STRATEGY_SORT_BOTH_MERGE,
                PactCompiler.HINT_LOCAL_STRATEGY_HASH_BUILD_FIRST,
                PactCompiler.HINT_LOCAL_STRATEGY_HASH_BUILD_SECOND };

        String[] shipStrategies = { PactCompiler.HINT_SHIP_STRATEGY_REPARTITION_HASH, BROADCAST_FIRST,
                BROADCAST_SECOND };

        for (String localStrategy : localStrategies) {
            for (String shipStrategy : shipStrategies) {

                Configuration config = new Configuration();
                config.setString(CONFIG_LOCAL_STRATEGY, localStrategy);
                config.setString(CONFIG_SHIP_STRATEGY, shipStrategy);
                config.setInteger(CONFIG_NO_SUBTASKS, 4);

                tConfigs.add(config);
            }
        }

        return toParameterList(MatchITCase.class, tConfigs);
    }

}