You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@mahout.apache.org by df...@apache.org on 2013/06/02 21:48:43 UTC

svn commit: r1488777 - in /mahout/trunk: CHANGELOG core/src/main/java/org/apache/mahout/clustering/ClusteringUtils.java

Author: dfilimon
Date: Sun Jun  2 19:48:43 2013
New Revision: 1488777

URL: http://svn.apache.org/r1488777
Log:
MAHOUT-1237: Fixed total clustering cost computation


Modified:
    mahout/trunk/CHANGELOG
    mahout/trunk/core/src/main/java/org/apache/mahout/clustering/ClusteringUtils.java

Modified: mahout/trunk/CHANGELOG
URL: http://svn.apache.org/viewvc/mahout/trunk/CHANGELOG?rev=1488777&r1=1488776&r2=1488777&view=diff
==============================================================================
--- mahout/trunk/CHANGELOG (original)
+++ mahout/trunk/CHANGELOG Sun Jun  2 19:48:43 2013
@@ -2,6 +2,8 @@ Mahout Change Log
 
 Release 0.8 - unreleased
 
+__MAHOUT-1237: Total cluster cost isn't computed properly (dfilimon)
+
   MAHOUT-1196: LogisticModelParameters uses csv.getTargetCategories() even if csv is not used. (Vineet Krishnan via ssc)
 
 __MAHOUT-1224: Add the option of running a StreamingKMeans pass in the Reducer before BallKMeans (dfilimon)

Modified: mahout/trunk/core/src/main/java/org/apache/mahout/clustering/ClusteringUtils.java
URL: http://svn.apache.org/viewvc/mahout/trunk/core/src/main/java/org/apache/mahout/clustering/ClusteringUtils.java?rev=1488777&r1=1488776&r2=1488777&view=diff
==============================================================================
--- mahout/trunk/core/src/main/java/org/apache/mahout/clustering/ClusteringUtils.java (original)
+++ mahout/trunk/core/src/main/java/org/apache/mahout/clustering/ClusteringUtils.java Sun Jun  2 19:48:43 2013
@@ -69,8 +69,7 @@ public class ClusteringUtils {
   public static double totalClusterCost(Iterable<? extends Vector> datapoints, Searcher centroids) {
     double totalCost = 0;
     for (Vector vector : datapoints) {
-      Centroid closest = (Centroid) centroids.searchFirst(vector, false).getValue();
-      totalCost += closest.getWeight();
+      totalCost += centroids.searchFirst(vector, false).getWeight();
     }
     return totalCost;
   }