You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@mahout.apache.org by sm...@apache.org on 2013/06/28 02:10:00 UTC
svn commit: r1497615 - in /mahout/trunk/core/src:
main/java/org/apache/mahout/clustering/kmeans/
main/java/org/apache/mahout/clustering/spectral/kmeans/
test/java/org/apache/mahout/clustering/kmeans/
Author: smarthi
Date: Fri Jun 28 00:10:00 2013
New Revision: 1497615
URL: http://svn.apache.org/r1497615
Log:
MAHOUT-1214: Improve the accuracy of the Spectral KMeans Method - minor code cleanup
Modified:
mahout/trunk/core/src/main/java/org/apache/mahout/clustering/kmeans/EigenSeedGenerator.java
mahout/trunk/core/src/main/java/org/apache/mahout/clustering/spectral/kmeans/SpectralKMeansDriver.java
mahout/trunk/core/src/test/java/org/apache/mahout/clustering/kmeans/TestEigenSeedGenerator.java
Modified: mahout/trunk/core/src/main/java/org/apache/mahout/clustering/kmeans/EigenSeedGenerator.java
URL: http://svn.apache.org/viewvc/mahout/trunk/core/src/main/java/org/apache/mahout/clustering/kmeans/EigenSeedGenerator.java?rev=1497615&r1=1497614&r2=1497615&view=diff
==============================================================================
--- mahout/trunk/core/src/main/java/org/apache/mahout/clustering/kmeans/EigenSeedGenerator.java (original)
+++ mahout/trunk/core/src/main/java/org/apache/mahout/clustering/kmeans/EigenSeedGenerator.java Fri Jun 28 00:10:00 2013
@@ -18,7 +18,6 @@
package org.apache.mahout.clustering.kmeans;
import java.io.IOException;
-import java.util.Iterator;
import java.util.Map;
import org.apache.hadoop.conf.Configuration;
@@ -90,10 +89,8 @@ public final class EigenSeedGenerator {
fileStatus.getPath(), true, conf)) {
Writable key = record.getFirst();
VectorWritable value = record.getSecond();
- Iterator<Vector.Element> nonZeroElements = value.get().nonZeroes().iterator();
- while (nonZeroElements.hasNext()) {
- Vector.Element e = nonZeroElements.next();
+ for (Vector.Element e : value.get().nonZeroes()) {
int index = e.index();
double v = Math.abs(e.get());
@@ -112,9 +109,7 @@ public final class EigenSeedGenerator {
}
try {
- Iterator<Integer> iter = maxEigens.keySet().iterator();
- while (iter.hasNext()) {
- int key = iter.next();
+ for (Integer key : maxEigens.keySet()) {
writer.append(chosenTexts.get(key), chosenClusters.get(key));
}
log.info("EigenSeedGenerator:: Wrote {} Klusters to {}", chosenTexts.size(), outFile);
Modified: mahout/trunk/core/src/main/java/org/apache/mahout/clustering/spectral/kmeans/SpectralKMeansDriver.java
URL: http://svn.apache.org/viewvc/mahout/trunk/core/src/main/java/org/apache/mahout/clustering/spectral/kmeans/SpectralKMeansDriver.java?rev=1497615&r1=1497614&r2=1497615&view=diff
==============================================================================
--- mahout/trunk/core/src/main/java/org/apache/mahout/clustering/spectral/kmeans/SpectralKMeansDriver.java (original)
+++ mahout/trunk/core/src/main/java/org/apache/mahout/clustering/spectral/kmeans/SpectralKMeansDriver.java Fri Jun 28 00:10:00 2013
@@ -255,7 +255,7 @@ public class SpectralKMeansDriver extends
Text mappingValue = new Text();
IntWritable mappingIndex = new IntWritable();
while (reader.next(mappingIndex, mappingValue)) {
- String s = new String(mappingValue.toString());
+ String s = mappingValue.toString();
mapping.add(s);
}
HadoopUtil.delete(conf, mappingPath);
Modified: mahout/trunk/core/src/test/java/org/apache/mahout/clustering/kmeans/TestEigenSeedGenerator.java
URL: http://svn.apache.org/viewvc/mahout/trunk/core/src/test/java/org/apache/mahout/clustering/kmeans/TestEigenSeedGenerator.java?rev=1497615&r1=1497614&r2=1497615&view=diff
==============================================================================
--- mahout/trunk/core/src/test/java/org/apache/mahout/clustering/kmeans/TestEigenSeedGenerator.java (original)
+++ mahout/trunk/core/src/test/java/org/apache/mahout/clustering/kmeans/TestEigenSeedGenerator.java Fri Jun 28 00:10:00 2013
@@ -65,7 +65,6 @@ public final class TestEigenSeedGenerator
fs = FileSystem.get(conf);
}
- /** Story: test eigen seed generation generates 3 clusters with proper ids and data */
@Test
public void testEigenSeedGenerator() throws Exception {
List<VectorWritable> points = getPoints();