You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@mahout.apache.org by je...@apache.org on 2010/05/18 23:53:53 UTC
svn commit: r945913 - in /mahout/trunk: conf/lda.props examples/bin/ examples/bin/build-reuters.sh
Author: jeastman
Date: Tue May 18 21:53:52 2010
New Revision: 945913
URL: http://svn.apache.org/viewvc?rev=945913&view=rev
Log:
added clusterdump and ldatopics to build-reuters.sh
Modified:
mahout/trunk/conf/lda.props
mahout/trunk/examples/bin/ (props changed)
mahout/trunk/examples/bin/build-reuters.sh
Modified: mahout/trunk/conf/lda.props
URL: http://svn.apache.org/viewvc/mahout/trunk/conf/lda.props?rev=945913&r1=945912&r2=945913&view=diff
==============================================================================
--- mahout/trunk/conf/lda.props (original)
+++ mahout/trunk/conf/lda.props Tue May 18 21:53:52 2010
@@ -6,6 +6,6 @@
# The following parameters all have default values if not specified
#a|topicSmoothing = <topic smoothing. Default: 50/numTopics>
-#maxIter|maxIter = <maximum number of iterations. Default: -1 (until converged)>
-#numReducers|numReducers = <the number of reducers. Default: 2>
+#x|maxIter = <maximum number of iterations. Default: -1 (until converged)>
+#r|numReducers = <the number of reducers. Default: 2>
Propchange: mahout/trunk/examples/bin/
------------------------------------------------------------------------------
--- svn:ignore (added)
+++ svn:ignore Tue May 18 21:53:52 2010
@@ -0,0 +1 @@
+work
Modified: mahout/trunk/examples/bin/build-reuters.sh
URL: http://svn.apache.org/viewvc/mahout/trunk/examples/bin/build-reuters.sh?rev=945913&r1=945912&r2=945913&view=diff
==============================================================================
--- mahout/trunk/examples/bin/build-reuters.sh (original)
+++ mahout/trunk/examples/bin/build-reuters.sh Tue May 18 21:53:52 2010
@@ -40,6 +40,12 @@ cd ../..
./bin/mahout org.apache.lucene.benchmark.utils.ExtractReuters ./examples/bin/work/reuters-sgm/ ./examples/bin/work/reuters-out/
./bin/mahout seqdirectory -i ./examples/bin/work/reuters-out/ -o ./examples/bin/work/reuters-out-seqdir -c UTF-8
./bin/mahout seq2sparse -i ./examples/bin/work/reuters-out-seqdir/ -o ./examples/bin/work/reuters-out-seqdir-sparse
-#./bin/mahout kmeans -i ./examples/bin/work/reuters-out-seqdir-sparse/tfidf/vectors/ -c ./examples/bin/work/clusters -o ./examples/bin/work/reuters-kmeans -k 20 -ow
+
+# to use k-Means clustering, uncomment the next two lines
+#./bin/mahout kmeans -i ./examples/bin/work/reuters-out-seqdir-sparse/tfidf/vectors/ -c ./examples/bin/work/clusters -o ./examples/bin/work/reuters-kmeans -x 10 -k 20 -ow
+#./bin/mahout clusterdump -s examples/bin/work/reuters-kmeans/clusters-10 -d examples/bin/work/reuters-out-seqdir-sparse/dictionary.file-0 -dt sequencefile -b 100 -n 20
+
+# to use LDA clustering, uncomment the next two lines
#./bin/mahout lda -i ./examples/bin/work/reuters-out-seqdir-sparse/tfidf/vectors -o ./examples/bin/work/reuters-lda -k 20 -v 50000 -ow
+#./bin/mahout ldatopics -i ./examples/bin/work/reuters-lda/state-9 -d ./examples/bin/work/reuters-out-seqdir-sparse/dictionary.file-0 -dt sequencefile