You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@mahout.apache.org by sr...@apache.org on 2012/04/06 14:41:16 UTC

svn commit: r1310302 - /mahout/trunk/core/src/main/java/org/apache/mahout/vectorizer/tfidf/TFIDFPartialVectorReducer.java

Author: srowen
Date: Fri Apr  6 12:41:15 2012
New Revision: 1310302

URL: http://svn.apache.org/viewvc?rev=1310302&view=rev
Log:
MAHOUT-973: Fix treatment of the maxDf value as a percentage (compare 100 * df / vectorCount against maxDf rather than the raw df)

Modified:
    mahout/trunk/core/src/main/java/org/apache/mahout/vectorizer/tfidf/TFIDFPartialVectorReducer.java

Modified: mahout/trunk/core/src/main/java/org/apache/mahout/vectorizer/tfidf/TFIDFPartialVectorReducer.java
URL: http://svn.apache.org/viewvc/mahout/trunk/core/src/main/java/org/apache/mahout/vectorizer/tfidf/TFIDFPartialVectorReducer.java?rev=1310302&r1=1310301&r2=1310302&view=diff
==============================================================================
--- mahout/trunk/core/src/main/java/org/apache/mahout/vectorizer/tfidf/TFIDFPartialVectorReducer.java (original)
+++ mahout/trunk/core/src/main/java/org/apache/mahout/vectorizer/tfidf/TFIDFPartialVectorReducer.java Fri Apr  6 12:41:15 2012
@@ -78,7 +78,7 @@ public class TFIDFPartialVectorReducer e
         continue;
       }
       long df = dictionary.get(e.index());
-      if (maxDf > -1 && df > maxDf) {
+      if (maxDf > -1 && (100.0 * df) / vectorCount > maxDf) {
         continue;
       }
       if (df < minDf) {