DijikstraAlgo.java Source code

Introduction

Here is the source code for DijikstraAlgo.java
Source

/*
Description: The code given below implements parallel BFS
   using the MapReduce paradigm.
author : https://github.com/himank/Graph-Algorithm-MapReduce 
The code is available under the GNU license. 
modified by : prateek and sagar.
Date created: 1 june, 2016
Date modified: 8 june 2016
*/

import java.io.IOException;
import java.net.URI;
import java.util.*;
import java.io.*;
import org.apache.hadoop.conf.Configuration;
import org.apache.hadoop.fs.FileSystem;
import org.apache.hadoop.fs.Path;
import org.apache.hadoop.io.*;
import org.apache.hadoop.mapred.*;
import org.apache.hadoop.mapred.Reducer;

/*
 * This class will responsible for taking the input from a file and
 * running the iterative Map-Reduce functionality to perform Dijikstra Algorithm
 *
 */
public class DijikstraAlgo {

    public static String OUT = "outfile";
    public static String IN = "inputlarger";

    public static class Map extends MapReduceBase implements Mapper<LongWritable, Text, LongWritable, Text> {

        /*
         * Overriding the map function
         */
        @Override
        public void map(LongWritable key, Text value, OutputCollector<LongWritable, Text> output, Reporter reporter)
                throws IOException {
            Text word = new Text();
            String line = value.toString(); // looks like 1 0 2:3:
            String[] sp = line.split("\t| "); // splits on space
            int distanceadd = Integer.parseInt(sp[1]) + 1;
            String[] PointsTo = sp[2].split(":");
            for (int i = 0; i < PointsTo.length; i++) {
                word.set("VALUE " + distanceadd); // tells me to look at
                // distance value
                output.collect(new LongWritable(Integer.parseInt(PointsTo[i])), word);
                word.clear();
            }

            // pass in current node's distance (if it is the lowest distance)
            word.set("VALUE " + sp[1]);
            output.collect(new LongWritable(Integer.parseInt(sp[0])), word);
            word.clear();

            word.set("NODES " + sp[2]);
            output.collect(new LongWritable(Integer.parseInt(sp[0])), word);
            word.clear();
        }
    }

    public static class Reduce extends MapReduceBase implements Reducer<LongWritable, Text, LongWritable, Text> {
        /*
         * Overriding the reduce function
         */
        @Override
        public void reduce(LongWritable key, Iterator<Text> values, OutputCollector<LongWritable, Text> output,
                Reporter reporter) throws IOException {
            String nodes = "UNMODED";
            Text word = new Text();
            int lowest = 125; // In this 125 is considered as infinite distance
            while (values.hasNext()) { // looks like NODES/VALUES 1 0 2:3:, we
                // need to use the first as a key
                String[] sp = values.next().toString().split(" "); // splits on
                // space
                // look at first value
                if (sp[0].equalsIgnoreCase("NODES")) {
                    nodes = null;
                    nodes = sp[1];
                } else if (sp[0].equalsIgnoreCase("VALUE")) {
                    int distance = Integer.parseInt(sp[1]);
                    lowest = Math.min(distance, lowest);
                }
            }
            word.set(lowest + " " + nodes);
            output.collect(key, word);
            word.clear();
        }
    }

    public static void main(String[] args) throws Exception {
        run(args);
    }

    public static void run(String[] args) throws Exception {
        IN = "hdfs://10.8.3.161:9000/user/sagar/input/";
        OUT = "hdfs://10.8.3.161:9000/user/sagar/output/";
        String input = IN;
        String output = OUT + System.nanoTime();
        String MAX_SPLIT_SIZE = args[0];
        boolean isdone = false;

        // Reiteration again and again till the convergence
        while (isdone == false) {
            JobConf conf = new JobConf(DijikstraAlgo.class);
            conf.setJobName("Dijikstra");
            // conf.set("mapred.max.split.size", MAX_SPLIT_SIZE);
            conf.setOutputKeyClass(LongWritable.class);
            conf.setOutputValueClass(Text.class);
            conf.setMapperClass(Map.class);
            conf.setReducerClass(Reduce.class);
            conf.setInputFormat(TextInputFormat.class);
            conf.setOutputFormat(TextOutputFormat.class);

            FileInputFormat.setInputPaths(conf, new Path(input));
            FileOutputFormat.setOutputPath(conf, new Path(output));

            JobClient.runJob(conf);

            input = output + "/part-00000";
            isdone = true;// set the job to NOT run again!
            Path ofile = new Path(input);
            FileSystem fs = FileSystem.get(new URI("hdfs://10.8.3.165:9000"), conf);
            //FileSystem fs = FileSystem.get(new Configuration());
            BufferedReader br = new BufferedReader(new InputStreamReader(fs.open(ofile)));
            HashMap<Integer, Integer> imap = new HashMap<Integer, Integer>();
            String line = br.readLine();
            // Read the current output file and put it into HashMap
            while (line != null) {
                String[] sp = line.split("\t| ");
                int node = Integer.parseInt(sp[0]);
                int distance = Integer.parseInt(sp[1]);
                imap.put(node, distance);
                line = br.readLine();
            }
            br.close();

            // Check for convergence condition if any node is still left then
            // continue else stop
            Iterator<Integer> itr = imap.keySet().iterator();
            while (itr.hasNext()) {
                int key = itr.next();
                int value = imap.get(key);
                if (value >= 125) {
                    isdone = false;
                }
            }
            input = output;
            output = OUT + System.nanoTime();
        }
    }
}