eu.stratosphere.pact.runtime.task.CoGroupTaskExternalITCase.java Source code

Java tutorial

Introduction

Here is the source code for eu.stratosphere.pact.runtime.task.CoGroupTaskExternalITCase.java

Source

/***********************************************************************************************************************
 *
 * Copyright (C) 2010 by the Stratosphere project (http://stratosphere.eu)
 *
 * Licensed under the Apache License, Version 2.0 (the "License"); you may not use this file except in compliance with
 * the License. You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software distributed under the License is distributed on
 * an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the License for the
 * specific language governing permissions and limitations under the License.
 *
 **********************************************************************************************************************/

package eu.stratosphere.pact.runtime.task;

import java.util.ArrayList;
import java.util.Iterator;
import java.util.List;

import junit.framework.Assert;

import org.apache.commons.logging.Log;
import org.apache.commons.logging.LogFactory;
import org.junit.Test;

import eu.stratosphere.pact.common.stubs.CoGroupStub;
import eu.stratosphere.pact.common.stubs.Collector;
import eu.stratosphere.pact.common.type.Key;
import eu.stratosphere.pact.common.type.PactRecord;
import eu.stratosphere.pact.common.type.base.PactInteger;
import eu.stratosphere.pact.runtime.plugable.PactRecordComparatorFactory;
import eu.stratosphere.pact.runtime.task.util.TaskConfig.LocalStrategy;
import eu.stratosphere.pact.runtime.test.util.UniformPactRecordGenerator;
import eu.stratosphere.pact.runtime.test.util.TaskTestBase;

/**
 * Integration test that runs a {@link CoGroupTask} with the {@code SORT_BOTH_MERGE} local strategy over two
 * generated inputs and checks the number of records emitted by {@link MockCoGroupStub}.
 * <p>
 * NOTE(review): judging by the class name and the small memory budget relative to the input sizes, the intent
 * appears to be to force the sort to spill to disk - confirm against the sorter implementation.
 */
public class CoGroupTaskExternalITCase extends TaskTestBase {
    private static final Log LOG = LogFactory.getLog(CoGroupTaskExternalITCase.class);

    /** Sink registered as the task output; collects every record the stub emits. */
    private final List<PactRecord> outList = new ArrayList<PactRecord>();

    /**
     * Runs the co-group task over two generated inputs and verifies the size of the result set.
     * <p>
     * The expected count assumes that every key of the smaller input also occurs in the larger one and that
     * the second input has the larger key range (presumably what {@code UniformPactRecordGenerator} produces
     * for these arguments - verify against the generator). Under that assumption, {@link MockCoGroupStub}
     * emits {@code valCnt1 * valCnt2} records per shared key and one record per key that exists only in the
     * second input.
     */
    @Test
    public void testExternalSortCoGroupTask() {

        final int keyCnt1 = 16384;
        final int valCnt1 = 4 * 2;

        final int keyCnt2 = 65536 * 2;
        final int valCnt2 = 1;

        // Same budget is used for the test environment and for the task configuration.
        final int memorySize = 6 * 1024 * 1024;

        super.initEnvironment(memorySize);
        super.addInput(new UniformPactRecordGenerator(keyCnt1, valCnt1, false), 1);
        super.addInput(new UniformPactRecordGenerator(keyCnt2, valCnt2, false), 2);
        super.addOutput(this.outList);

        final CoGroupTask<PactRecord, PactRecord, PactRecord> testTask =
                new CoGroupTask<PactRecord, PactRecord, PactRecord>();
        super.getTaskConfig().setLocalStrategy(LocalStrategy.SORT_BOTH_MERGE);
        super.getTaskConfig().setMemorySize(memorySize);
        super.getTaskConfig().setNumFilehandles(4);

        // Both inputs are compared on field 0, typed as PactInteger.
        final int[] keyPos1 = new int[] { 0 };
        final int[] keyPos2 = new int[] { 0 };
        @SuppressWarnings("unchecked")
        final Class<? extends Key>[] keyClasses = (Class<? extends Key>[]) new Class[] { PactInteger.class };

        PactRecordComparatorFactory.writeComparatorSetupToConfig(super.getTaskConfig().getConfiguration(),
                super.getTaskConfig().getPrefixForInputParameters(0), keyPos1, keyClasses);
        PactRecordComparatorFactory.writeComparatorSetupToConfig(super.getTaskConfig().getConfiguration(),
                super.getTaskConfig().getPrefixForInputParameters(1), keyPos2, keyClasses);

        super.registerTask(testTask, MockCoGroupStub.class);

        try {
            testTask.invoke();
        } catch (Exception e) {
            // Log with the stack trace at error level and surface the cause in the failure message, so a
            // failing run can be diagnosed without enabling debug logging.
            LOG.error("Invoke method caused exception.", e);
            Assert.fail("Invoke method caused exception: " + e);
        }

        final int sharedKeys = Math.min(keyCnt1, keyCnt2);
        final int unmatchedKeys = Math.max(keyCnt1, keyCnt2) - sharedKeys;
        final int expCnt = valCnt1 * valCnt2 * sharedKeys + unmatchedKeys;

        Assert.assertEquals("Resultset size was " + this.outList.size() + ". Expected was " + expCnt,
                expCnt, this.outList.size());

        this.outList.clear();

    }

    /**
     * Stub that counts the records of the first input and then emits every record of the second input once
     * per counted record, or exactly once when the first input is empty. Nothing is emitted when the second
     * input is empty.
     */
    public static class MockCoGroupStub extends CoGroupStub {

        /**
         * @param records1 records of the first input for the current key; fully consumed, only counted
         * @param records2 records of the second input for the current key; each one is forwarded
         * @param out collector receiving the forwarded records
         */
        @Override
        public void coGroup(Iterator<PactRecord> records1, Iterator<PactRecord> records2,
                Collector<PactRecord> out) {
            int val1Cnt = 0;

            while (records1.hasNext()) {
                val1Cnt++;
                records1.next();
            }

            // An empty first input still forwards each second-input record once.
            final int copies = Math.max(1, val1Cnt);

            while (records2.hasNext()) {
                final PactRecord record2 = records2.next();
                for (int i = 0; i < copies; i++) {
                    out.collect(record2);
                }
            }
        }
    }
}