Java tutorial
/* * This file is part of Gradoop. * * Gradoop is free software: you can redistribute it and/or modify * it under the terms of the GNU General Public License as published by * the Free Software Foundation, either version 3 of the License, or * (at your option) any later version. * * Gradoop is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the * GNU General Public License for more details. * * You should have received a copy of the GNU General Public License * along with Gradoop. If not, see <http://www.gnu.org/licenses/>. */ package org.gradoop.flink.algorithms.fsm.functions; import com.google.common.collect.Lists; import com.google.common.collect.Maps; import org.apache.flink.api.common.functions.FlatMapFunction; import org.apache.flink.util.Collector; import org.gradoop.flink.algorithms.fsm.canonicalization.CanonicalLabeler; import org.gradoop.flink.algorithms.fsm.config.FSMConfig; import org.gradoop.flink.algorithms.fsm.pojos.Embedding; import org.gradoop.flink.algorithms.fsm.pojos.FSMEdge; import org.gradoop.flink.algorithms.fsm.tuples.FSMGraph; import org.gradoop.flink.algorithms.fsm.tuples.SubgraphEmbeddings; import java.util.Collection; import java.util.Map; /** * graph => embedding(k=1),.. */ public class SingleEdgeEmbeddings implements FlatMapFunction<FSMGraph, SubgraphEmbeddings> { /** * reuse tuple to avoid instantiations */ private final SubgraphEmbeddings reuseTuple = new SubgraphEmbeddings(); /** * graph labeler */ private final CanonicalLabeler canonicalLabeler; /** * Constructor. * * @param fsmConfig FSM configuration */ public SingleEdgeEmbeddings(FSMConfig fsmConfig) { canonicalLabeler = fsmConfig.getCanonicalLabeler(); } @Override public void flatMap(FSMGraph graph, Collector<SubgraphEmbeddings> out) throws Exception { Map<Integer, String> vertices = graph.getVertices(); Map<String, Collection<Embedding>> subgraphEmbeddings = Maps.newHashMap(); for (Map.Entry<Integer, FSMEdge> entry : graph.getEdges().entrySet()) { FSMEdge edge = entry.getValue(); int sourceId = edge.getSourceId(); int targetId = edge.getTargetId(); Map<Integer, String> incidentVertices = Maps.newHashMapWithExpectedSize(2); incidentVertices.put(sourceId, vertices.get(sourceId)); if (sourceId != targetId) { incidentVertices.put(targetId, vertices.get(targetId)); } Map<Integer, FSMEdge> singleEdge = Maps.newHashMapWithExpectedSize(1); singleEdge.put(entry.getKey(), edge); Embedding embedding = new Embedding(incidentVertices, singleEdge); String subgraph = canonicalLabeler.label(embedding); Collection<Embedding> embeddings = subgraphEmbeddings.get(subgraph); if (embeddings == null) { subgraphEmbeddings.put(subgraph, Lists.newArrayList(embedding)); } else { embeddings.add(embedding); } } reuseTuple.setGraphId(graph.getId()); reuseTuple.setSize(1); for (Map.Entry<String, Collection<Embedding>> entry : subgraphEmbeddings.entrySet()) { reuseTuple.setSubgraph(entry.getKey()); reuseTuple.setEmbeddings(entry.getValue()); out.collect(reuseTuple); } } }