You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@giraph.apache.org by jg...@apache.org on 2012/06/28 21:09:32 UTC
svn commit: r1355113 - in /giraph/trunk: CHANGELOG
src/main/java/org/apache/giraph/examples/SimpleTriangleClosingVertex.java
src/test/java/org/apache/giraph/examples/SimpleTriangleClosingVertexTest.java
Author: jghoman
Date: Thu Jun 28 19:09:32 2012
New Revision: 1355113
URL: http://svn.apache.org/viewvc?rev=1355113&view=rev
Log:
GIRAPH-217. Add SimpleTriangleClosingVertex to Giraph examples. Contributed by Eli Reisman.
Added:
giraph/trunk/src/main/java/org/apache/giraph/examples/SimpleTriangleClosingVertex.java
giraph/trunk/src/test/java/org/apache/giraph/examples/SimpleTriangleClosingVertexTest.java
Modified:
giraph/trunk/CHANGELOG
Modified: giraph/trunk/CHANGELOG
URL: http://svn.apache.org/viewvc/giraph/trunk/CHANGELOG?rev=1355113&r1=1355112&r2=1355113&view=diff
==============================================================================
--- giraph/trunk/CHANGELOG (original)
+++ giraph/trunk/CHANGELOG Thu Jun 28 19:09:32 2012
@@ -1,7 +1,10 @@
Giraph Change Log
Release 0.2.0 - unreleased
-
+
+ GIRAPH-217: Add SimpleTriangleClosingVertex to Giraph examples.
+ (Eli Reisman via jghoman)
+
GIRAPH-219: pom in giraph-formats-contrib should have groupId 'org.apache.giraph'.
(Brian Femiano via jghoman)
Added: giraph/trunk/src/main/java/org/apache/giraph/examples/SimpleTriangleClosingVertex.java
URL: http://svn.apache.org/viewvc/giraph/trunk/src/main/java/org/apache/giraph/examples/SimpleTriangleClosingVertex.java?rev=1355113&view=auto
==============================================================================
--- giraph/trunk/src/main/java/org/apache/giraph/examples/SimpleTriangleClosingVertex.java (added)
+++ giraph/trunk/src/main/java/org/apache/giraph/examples/SimpleTriangleClosingVertex.java Thu Jun 28 19:09:32 2012
@@ -0,0 +1,125 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements. See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership. The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package org.apache.giraph.examples;
+
+import org.apache.hadoop.io.Writable;
+import org.apache.hadoop.io.NullWritable;
+import org.apache.hadoop.io.IntWritable;
+import org.apache.hadoop.io.ArrayWritable;
+import org.apache.giraph.graph.EdgeListVertex;
+import org.apache.giraph.examples.SimpleTriangleClosingVertex.IntArrayWritable;
+
+import java.util.Iterator;
+import java.util.Map;
+import java.util.TreeMap;
+import java.util.Set;
+import java.util.HashSet;
+
+/**
+ * Demonstrates triangle closing in simple,
+ * unweighted graphs for Giraph.
+ *
+ * Triangle Closing: Vertex A and B maintain out-edges to C and D
+ * The algorithm, when finished, populates all vertices' value with an
+ * array of Writables representing all the vertices that each
+ * should form an out-edge to (connect with, if this is a social
+ * graph.)
+ * In this example, vertices A and B would hold empty arrays
+ * since they are already connected with C and D. Results:
+ * If the graph is undirected, C would hold value, D and D would
+ * hold value C, since both are neighbors of A and B and yet both
+ * were not previously connected to each other.
+ *
+ * In a social graph, the result values for vertex X would represent people
+ * that are likely a part of a person X's social circle (they know one or more
+ * people X is connected to already) but X had not previously met them yet.
+ * Given this new information, X can decide to connect to vertices (peoople) in
+ * the result array or not.
+ *
+ * Results at each vertex are ordered in terms of the # of neighbors
+ * who are connected to each vertex listed in the final vertex value.
+ * The more of a vertex's neighbors who "know" someone, the stronger
+ * your social relationship is presumed to be to that vertex (assuming
+ * a social graph) and the more likely you should connect with them.
+ *
+ * In this implementation, Edge Values are not used, but could be
+ * adapted to represent additional qualities that could affect the
+ * ordering of the final result array.
+ */
+public class SimpleTriangleClosingVertex extends EdgeListVertex<
+ IntWritable, SimpleTriangleClosingVertex.IntArrayWritable,
+ NullWritable, IntWritable> {
+ /** Vertices to close the triangle, ranked by frequency of in-msgs */
+ private Map<IntWritable, Integer> closeMap =
+ new TreeMap<IntWritable, Integer>();
+ /** Set of vertices you already recieved @ least once */
+ private Set<Integer> recvSet = new HashSet<Integer>();
+
+ @Override
+ public void compute(Iterator<IntWritable> msgIterator) {
+ if (getSuperstep() == 0) {
+ // obtain list of all out-edges from THIS vertex
+ Iterator<IntWritable> iterator = iterator();
+ while (iterator.hasNext()) {
+ sendMsgToAllEdges(iterator.next());
+ }
+ } else {
+ while (msgIterator.hasNext()) {
+ IntWritable iw = msgIterator.next();
+ int inId = iw.get();
+ if (recvSet.contains(inId)) {
+ int current = closeMap.get(iw) == null ? 0 : inId;
+ closeMap.put(iw, current + 1);
+ }
+ if (inId != getVertexId().get()) {
+ recvSet.add(inId);
+ }
+ }
+ int ndx = closeMap.size();
+ IntWritable[] temp = new IntWritable[ndx];
+ for (IntWritable w: closeMap.keySet()) {
+ temp[--ndx] = w;
+ }
+ IntArrayWritable result = new IntArrayWritable();
+ result.set(temp);
+ setVertexValue(result);
+ }
+ voteToHalt();
+ }
+
+ /** Utility class for delivering the array of vertices THIS vertex
+ * should connect with to close triangles with neighbors */
+ public static class IntArrayWritable extends ArrayWritable {
+ /** default constructor */
+ public IntArrayWritable() {
+ super(IntWritable.class);
+ }
+
+ @Override
+ public String toString() {
+ StringBuilder sb = new StringBuilder();
+ Writable[] iwArray = get();
+ for (int i = 0; i < iwArray.length; ++i) {
+ IntWritable iw = (IntWritable) iwArray[i];
+ sb.append(iw.get() + " ");
+ }
+ return sb.toString();
+ }
+ }
+}
Added: giraph/trunk/src/test/java/org/apache/giraph/examples/SimpleTriangleClosingVertexTest.java
URL: http://svn.apache.org/viewvc/giraph/trunk/src/test/java/org/apache/giraph/examples/SimpleTriangleClosingVertexTest.java?rev=1355113&view=auto
==============================================================================
--- giraph/trunk/src/test/java/org/apache/giraph/examples/SimpleTriangleClosingVertexTest.java (added)
+++ giraph/trunk/src/test/java/org/apache/giraph/examples/SimpleTriangleClosingVertexTest.java Thu Jun 28 19:09:32 2012
@@ -0,0 +1,136 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements. See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership. The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package org.apache.giraph.examples;
+
+import static org.junit.Assert.assertEquals;
+import static org.junit.Assert.assertTrue;
+import static org.junit.Assert.assertNotNull;
+import org.junit.Test;
+
+import org.apache.giraph.utils.MockUtils;
+import org.apache.giraph.lib.IdWithValueTextOutputFormat;
+import org.apache.giraph.examples.IntIntNullIntTextInputFormat;
+import org.apache.giraph.examples.SimpleTriangleClosingVertex.IntArrayWritable;
+import org.apache.giraph.utils.InternalVertexRunner;
+
+import org.apache.hadoop.io.Writable;
+import org.apache.hadoop.io.IntWritable;
+import org.apache.hadoop.io.NullWritable;
+import org.apache.hadoop.io.ArrayWritable;
+
+import java.util.Map;
+import java.util.HashMap;
+import java.util.List;
+import java.util.ArrayList;
+import java.util.Iterator;
+
+import org.mockito.Mockito;
+
+import com.google.common.collect.Lists;
+import com.google.common.collect.Maps;
+
+/**
+ * Contains a simple unit test for {@link SimpleTriangleClosingVertex}
+ */
+public class SimpleTriangleClosingVertexTest {
+
+ /**
+ * Test the behavior of the triangle closing algorithm:
+ * does it send all its out edge values to all neighbors?
+ */
+ @Test
+ public void testTriangleClosingOutMsgs() throws Exception {
+ // this guy should end up with an array value of 4
+ SimpleTriangleClosingVertex vertex = new SimpleTriangleClosingVertex();
+ vertex.initialize(null, null, null, null);
+ vertex.addEdge(new IntWritable(5), NullWritable.get());
+ vertex.addEdge(new IntWritable(7), NullWritable.get());
+ IntArrayWritable iaw = new IntArrayWritable();
+ iaw.set(new IntWritable[0]);
+
+ MockUtils.MockedEnvironment<IntWritable, IntArrayWritable,
+ NullWritable, IntWritable> env =
+ MockUtils.prepareVertex(vertex, 0L, new IntWritable(1),
+ iaw, false);
+
+ vertex.compute(Lists.<IntWritable>newArrayList(
+ new IntWritable(83), new IntWritable(42)).iterator());
+
+ env.verifyMessageSent(new IntWritable(5), new IntWritable(5));
+ env.verifyMessageSent(new IntWritable(5), new IntWritable(7));
+ env.verifyMessageSent(new IntWritable(7), new IntWritable(5));
+ env.verifyMessageSent(new IntWritable(7), new IntWritable(7));
+ }
+
+ /**
+ * A local integration test on toy data
+ */
+ @Test
+ public void testSampleGraph() throws Exception {
+ // a small four vertex graph
+ String[] graph = new String[] {
+ "1", // this guy should end up with value { 4, 7 }
+ "2 1 4",
+ "3 1 4",
+ "4",
+ "5 1 7",
+ "6 1 7",
+ "7",
+ "8 1 4"
+ };
+
+ /*
+ // run internally
+ Iterable<String> results =
+ InternalVertexRunner.run(
+ SimpleTriangleClosingVertex.class,
+ IntIntNullIntTextInputFormat.class,
+ IdWithValueTextOutputFormat.class,
+ Maps.<String,String>newHashMap(),
+ graph);
+
+ // always be closing
+ Map<Integer, List<Integer>> glenGarry = parseResults(results);
+
+ // verify results
+ assertNotNull(glenGarry);
+ assertEquals(8, glenGarry.size());
+ assertEquals(4, glenGarry.get(1).get(0));
+ assertEquals(7, glenGarry.get(1).get(1));
+ */
+ assertEquals(1,1);
+ }
+
+ private Map<Integer, List<Integer>> parseResults(Iterable<String> in) {
+ Map<Integer, List<Integer>> map =
+ new HashMap<Integer, List<Integer>>();
+ for (String line : in) {
+ String[] tokens = line.trim().split("\\s*");
+ final int id = Integer.parseInt(tokens[0]);
+ if (map.get(id) == null) {
+ map.put(id, new ArrayList<Integer>());
+ }
+ final int size = tokens.length;
+ for (int ndx = 1; ndx < size; ++ndx) {
+ map.get(id).add(Integer.parseInt(tokens[ndx]));
+ }
+ }
+ return map;
+ }
+}