Java tutorial
/* * Licensed to the Apache Software Foundation (ASF) under one * or more contributor license agreements. See the NOTICE file * distributed with this work for additional information * regarding copyright ownership. The ASF licenses this file * to you under the Apache License, Version 2.0 (the * "License"); you may not use this file except in compliance * with the License. You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. */ package org.apache.giraph.partition; import java.net.InetSocketAddress; import java.util.ArrayList; import java.util.Collection; import org.apache.giraph.conf.GiraphConstants; import org.apache.giraph.conf.ImmutableClassesGiraphConfiguration; import org.apache.giraph.partition.PartitionOwner; import org.apache.giraph.partition.WorkerGraphPartitioner; import org.apache.giraph.worker.WorkerInfo; import org.apache.hadoop.conf.Configuration; import org.apache.hadoop.io.LongWritable; import org.apache.hadoop.io.Writable; import org.junit.Test; import static org.junit.Assert.assertTrue; import static org.junit.Assert.assertEquals; /** Test {@link org.apache.giraph.partition.SimpleLongRangePartitionerFactory}. */ public class SimpleRangePartitionFactoryTest { private void testRange(int numWorkers, int keySpaceSize, int allowedWorkerDiff, boolean emptyWorkers) { Configuration conf = new Configuration(); conf.setLong(GiraphConstants.PARTITION_VERTEX_KEY_SPACE_SIZE, keySpaceSize); SimpleLongRangePartitionerFactory<Writable, Writable> factory = new SimpleLongRangePartitionerFactory<Writable, Writable>(); factory.setConf(new ImmutableClassesGiraphConfiguration(conf)); ArrayList<WorkerInfo> infos = new ArrayList<WorkerInfo>(); for (int i = 0; i < numWorkers; i++) { WorkerInfo info = new WorkerInfo(); info.setInetSocketAddress(new InetSocketAddress(8080)); info.setTaskId(i); infos.add(info); } Collection<PartitionOwner> owners = factory.createMasterGraphPartitioner() .createInitialPartitionOwners(infos, -1); int[] tasks = new int[owners.size()]; for (PartitionOwner owner : owners) { WorkerInfo worker = owner.getWorkerInfo(); assertEquals(0, tasks[owner.getPartitionId()]); tasks[owner.getPartitionId()] = worker.getTaskId() + 1; } checkMapping(tasks, allowedWorkerDiff, emptyWorkers); WorkerGraphPartitioner<LongWritable, Writable, Writable> workerPartitioner = factory .createWorkerGraphPartitioner(); workerPartitioner.updatePartitionOwners(null, owners); LongWritable longWritable = new LongWritable(); int[] partitions = new int[keySpaceSize]; for (int i = 0; i < keySpaceSize; i++) { longWritable.set(i); PartitionOwner owner = workerPartitioner.getPartitionOwner(longWritable); partitions[i] = owner.getPartitionId(); } checkMapping(partitions, 1, emptyWorkers); } private void checkMapping(int[] mapping, int allowedDiff, boolean emptyWorkers) { int prev = -1; int max = 0; int min = Integer.MAX_VALUE; int cur = 0; for (int value : mapping) { if (value != prev) { if (prev != -1) { min = Math.min(cur, min); max = Math.max(cur, max); assertTrue(prev < value); if (!emptyWorkers) { assertEquals(prev + 1, value); } } cur = 1; } else { cur++; } prev = value; } assertTrue(min + allowedDiff >= max); } @Test public void testLongRangePartitionerFactory() { // perfect distribution testRange(10, 100000, 0, false); testRange(1000, 100000, 0, false); // perfect distribution even when max is hit, and max is not divisible by #workers testRange(8949, 100023, 0, false); testRange(1949, 211111, 0, false); // imperfect distribution - because there are more workers than max partitions. testRange(194942, 211111, 1, true); } }