You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@mahout.apache.org by je...@apache.org on 2010/05/18 23:53:53 UTC

svn commit: r945913 - in /mahout/trunk: conf/lda.props examples/bin/ examples/bin/build-reuters.sh

Author: jeastman
Date: Tue May 18 21:53:52 2010
New Revision: 945913

URL: http://svn.apache.org/viewvc?rev=945913&view=rev
Log:
added clusterdump and ldatopics to build-reuters.sh

Modified:
    mahout/trunk/conf/lda.props
    mahout/trunk/examples/bin/   (props changed)
    mahout/trunk/examples/bin/build-reuters.sh

Modified: mahout/trunk/conf/lda.props
URL: http://svn.apache.org/viewvc/mahout/trunk/conf/lda.props?rev=945913&r1=945912&r2=945913&view=diff
==============================================================================
--- mahout/trunk/conf/lda.props (original)
+++ mahout/trunk/conf/lda.props Tue May 18 21:53:52 2010
@@ -6,6 +6,6 @@
 
 # The following parameters all have default values if not specified
 #a|topicSmoothing = <topic smoothing. Default: 50/numTopics>
-#maxIter|maxIter = <maximum number of iterations. Default: -1 (until converged)>
-#numReducers|numReducers = <the number of reducers. Default: 2>
+#x|maxIter = <maximum number of iterations. Default: -1 (until converged)>
+#r|numReducers = <the number of reducers. Default: 2>
 

Propchange: mahout/trunk/examples/bin/
------------------------------------------------------------------------------
--- svn:ignore (added)
+++ svn:ignore Tue May 18 21:53:52 2010
@@ -0,0 +1 @@
+work

Modified: mahout/trunk/examples/bin/build-reuters.sh
URL: http://svn.apache.org/viewvc/mahout/trunk/examples/bin/build-reuters.sh?rev=945913&r1=945912&r2=945913&view=diff
==============================================================================
--- mahout/trunk/examples/bin/build-reuters.sh (original)
+++ mahout/trunk/examples/bin/build-reuters.sh Tue May 18 21:53:52 2010
@@ -40,6 +40,12 @@ cd ../..
 ./bin/mahout org.apache.lucene.benchmark.utils.ExtractReuters ./examples/bin/work/reuters-sgm/ ./examples/bin/work/reuters-out/
 ./bin/mahout seqdirectory -i ./examples/bin/work/reuters-out/ -o ./examples/bin/work/reuters-out-seqdir -c UTF-8
 ./bin/mahout seq2sparse -i ./examples/bin/work/reuters-out-seqdir/ -o ./examples/bin/work/reuters-out-seqdir-sparse
-#./bin/mahout kmeans -i ./examples/bin/work/reuters-out-seqdir-sparse/tfidf/vectors/ -c ./examples/bin/work/clusters -o ./examples/bin/work/reuters-kmeans -k 20 -ow
+
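+# To use k-Means clustering, uncomment the next two lines. The clusterdump step reads clusters-10, which pairs with the -x 10 passed to kmeans; adjust the directory name if the run writes a different final clusters-N.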
+#./bin/mahout kmeans -i ./examples/bin/work/reuters-out-seqdir-sparse/tfidf/vectors/ -c ./examples/bin/work/clusters -o ./examples/bin/work/reuters-kmeans -x 10 -k 20 -ow
+#./bin/mahout clusterdump -s examples/bin/work/reuters-kmeans/clusters-10 -d examples/bin/work/reuters-out-seqdir-sparse/dictionary.file-0 -dt sequencefile -b 100 -n 20
+
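+# To use LDA, uncomment the next two lines. The ldatopics step reads state-9, but the lda command sets no iteration limit (-x); point -i at whichever state-N directory the lda run actually wrote last.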
 #./bin/mahout lda -i ./examples/bin/work/reuters-out-seqdir-sparse/tfidf/vectors -o ./examples/bin/work/reuters-lda -k 20 -v 50000 -ow
+#./bin/mahout ldatopics -i ./examples/bin/work/reuters-lda/state-9 -d ./examples/bin/work/reuters-out-seqdir-sparse/dictionary.file-0 -dt sequencefile